Epoch: 0, step: 0, loss: 1.1638894081115723, mean loss: 1.1638894081115723
Epoch: 0, step: 1, loss: 0.9553995132446289, mean loss: 1.0596444606781006
Epoch: 0, step: 2, loss: 0.9755326509475708, mean loss: 1.031607190767924
Epoch: 0, step: 3, loss: 1.146655797958374, mean loss: 1.0603693425655365
Epoch: 0, step: 4, loss: 0.8968734741210938, mean loss: 1.0276701688766479
Epoch: 0, step: 5, loss: 0.8691169023513794, mean loss: 1.0012446244557698
Epoch: 0, step: 6, loss: 0.7992992401123047, mean loss: 0.9723952838352747
Epoch: 0, step: 7, loss: 1.0544853210449219, mean loss: 0.9826565384864806
Epoch: 0, step: 8, loss: 0.7345256805419922, mean loss: 0.9550864431593152
Epoch: 0, step: 9, loss: 0.8906333446502686, mean loss: 0.9486411333084106
Epoch: 0, step: 10, loss: 0.927553653717041, mean loss: 0.9467240897091952
Epoch: 0, step: 11, loss: 1.1294214725494385, mean loss: 0.9619488716125488
Epoch: 0, step: 12, loss: 0.9107316732406616, mean loss: 0.9580090871224036
Epoch: 0, step: 13, loss: 0.9129786491394043, mean loss: 0.9547926272664751
Epoch: 0, step: 14, loss: 0.9530107975006104, mean loss: 0.9546738386154174
Epoch: 0, step: 15, loss: 0.8807125687599182, mean loss: 0.9500512592494488
Epoch: 0, step: 16, loss: 0.8830963373184204, mean loss: 0.9461127344299766
Epoch: 0, step: 17, loss: 0.848498523235321, mean loss: 0.9406897226969402
Epoch: 0, step: 18, loss: 0.8076579570770264, mean loss: 0.9336880508222078
Epoch: 0, step: 19, loss: 0.7507230639457703, mean loss: 0.924539801478386
Epoch: 0, step: 20, loss: 0.91470867395401, mean loss: 0.9240716525486538
Epoch: 0, step: 21, loss: 0.8898685574531555, mean loss: 0.9225169664079493
Epoch: 0, step: 22, loss: 0.7834203243255615, mean loss: 0.9164692863174108
Epoch: 0, step: 23, loss: 0.7508494853973389, mean loss: 0.9095684612790744
Epoch: 0, step: 24, loss: 0.7760809063911438, mean loss: 0.9042289590835572
Epoch: 0, step: 25, loss: 0.7471703290939331, mean loss: 0.8981882425454947
Epoch: 0, step: 26, loss: 0.9646943211555481, mean loss: 0.9006514306421634
Epoch: 0, step: 27, loss: 0.7100625038146973, mean loss: 0.8938446832554682
Epoch: 0, step: 28, loss: 0.8879171013832092, mean loss: 0.8936402838805627
Epoch: 0, step: 29, loss: 0.76289302110672, mean loss: 0.8892820417881013
Epoch: 0, step: 30, loss: 0.8545520305633545, mean loss: 0.8881617188453675
Epoch: 0, step: 31, loss: 0.7978349328041077, mean loss: 0.8853390067815782
Epoch: 0, step: 32, loss: 0.8012599349021912, mean loss: 0.8827911561185664
Epoch: 0, step: 33, loss: 0.7513855695724487, mean loss: 0.8789262859260335
Epoch: 0, step: 34, loss: 0.8435215353965759, mean loss: 0.8779147216251919
Epoch: 0, step: 35, loss: 0.8201726675033569, mean loss: 0.8763107756773632
Epoch: 0, step: 36, loss: 0.6606957912445068, mean loss: 0.8704833436656644
Epoch: 0, step: 37, loss: 0.8042402267456055, mean loss: 0.8687401037467155
Epoch: 0, step: 38, loss: 0.6547872424125671, mean loss: 0.8632541329432758
Epoch: 0, step: 39, loss: 0.7064419984817505, mean loss: 0.8593338295817377
Epoch: 0, step: 40, loss: 0.7404818534851074, mean loss: 0.856435000896454
Epoch: 0, step: 41, loss: 0.682525634765625, mean loss: 0.8522943017028628
Epoch: 0, step: 42, loss: 0.6804389953613281, mean loss: 0.8482976666716643
Epoch: 0, step: 43, loss: 0.684424102306366, mean loss: 0.8445732674815438
Epoch: 0, step: 44, loss: 0.6478545069694519, mean loss: 0.840201739470164
Epoch: 0, step: 45, loss: 0.706439197063446, mean loss: 0.8372938581134962
Epoch: 0, step: 46, loss: 0.6846575140953064, mean loss: 0.8340462763258751
Epoch: 0, step: 47, loss: 0.8585658669471741, mean loss: 0.8345571011304855
Epoch: 0, step: 48, loss: 0.6501793265342712, mean loss: 0.8307942894040322
Epoch: 0, step: 49, loss: 0.7207923531532288, mean loss: 0.8285942506790162
Epoch: 0, step: 50, loss: 0.671491265296936, mean loss: 0.8255137999852499
Epoch: 0, step: 51, loss: 0.6999425888061523, mean loss: 0.8230989690010364
Epoch: 0, step: 52, loss: 0.6477469801902771, mean loss: 0.8197904409102673
Epoch: 0, step: 53, loss: 0.6235356330871582, mean loss: 0.8161560926172468
Epoch: 0, step: 54, loss: 0.6614269614219666, mean loss: 0.8133428356864235
Epoch: 0, step: 55, loss: 0.7725139260292053, mean loss: 0.8126137480139732
Epoch: 0, step: 56, loss: 0.7527450323104858, mean loss: 0.811563419668298
Epoch: 0, step: 57, loss: 0.7128615379333496, mean loss: 0.809861663086661
Epoch: 0, step: 58, loss: 0.6206385493278503, mean loss: 0.8066544916670201
Epoch: 0, step: 59, loss: 0.7192602157592773, mean loss: 0.8051979204018911
Epoch: 0, step: 60, loss: 0.6545922160148621, mean loss: 0.8027289744283332
Epoch: 0, step: 61, loss: 0.5992737412452698, mean loss: 0.7994474384092516
Epoch: 0, step: 62, loss: 0.6248669028282166, mean loss: 0.7966763187968542
Epoch: 0, step: 63, loss: 0.5701197385787964, mean loss: 0.793136372230947
Epoch: 0, step: 64, loss: 0.7350955605506897, mean loss: 0.7922434366666353
Epoch: 0, step: 65, loss: 0.6070762276649475, mean loss: 0.7894378728938825
Epoch: 0, step: 66, loss: 0.6891947984695435, mean loss: 0.787941707603967
Epoch: 0, step: 67, loss: 0.7905483245849609, mean loss: 0.7879800402066287
Epoch: 0, step: 68, loss: 0.6278472542762756, mean loss: 0.7856592751931454
Epoch: 0, step: 69, loss: 0.953527569770813, mean loss: 0.788057393687112
Epoch: 0, step: 70, loss: 0.7231031060218811, mean loss: 0.7871425445650665
Epoch: 0, step: 71, loss: 0.7085049152374268, mean loss: 0.7860503552688493
Epoch: 0, step: 72, loss: 0.6627025604248047, mean loss: 0.7843606594490679
Epoch: 0, step: 73, loss: 0.7195305228233337, mean loss: 0.7834845765216931
Epoch: 0, step: 74, loss: 0.593020498752594, mean loss: 0.7809450554847718
Epoch: 0, step: 75, loss: 0.7247958183288574, mean loss: 0.7802062497327202
Epoch: 0, step: 76, loss: 0.633760929107666, mean loss: 0.7783043624518754
Epoch: 0, step: 77, loss: 0.7282317280769348, mean loss: 0.7776624056009146
Epoch: 0, step: 78, loss: 0.554481029510498, mean loss: 0.7748373248909093
Epoch: 0, step: 79, loss: 0.7817375659942627, mean loss: 0.7749235779047012
Epoch: 0, step: 80, loss: 0.6729843020439148, mean loss: 0.773665068326173
Epoch: 0, step: 81, loss: 0.645117461681366, mean loss: 0.7720974145866022
Epoch: 0, step: 82, loss: 0.5843460559844971, mean loss: 0.769835350025131
Epoch: 0, step: 83, loss: 0.6350879073143005, mean loss: 0.768231213802383
Epoch: 0, step: 84, loss: 0.5633720755577087, mean loss: 0.7658211062936221
Epoch: 0, step: 85, loss: 0.6324207782745361, mean loss: 0.764269939688749
Epoch: 0, step: 86, loss: 0.7082880735397339, mean loss: 0.7636264699628983
Epoch: 0, step: 87, loss: 0.6709017753601074, mean loss: 0.762572780251503
Epoch: 0, step: 88, loss: 0.7395465970039368, mean loss: 0.762314059091418
Epoch: 0, step: 89, loss: 0.6053422689437866, mean loss: 0.7605699280897776
Epoch: 0, step: 90, loss: 0.5482318997383118, mean loss: 0.7582365431628385
Epoch: 0, step: 91, loss: 0.6534765362739563, mean loss: 0.7570978474357855
Epoch: 0, step: 92, loss: 0.6124739050865173, mean loss: 0.7555427512814923
Epoch: 0, step: 93, loss: 0.6361672878265381, mean loss: 0.7542727995426098
Epoch: 0, step: 94, loss: 0.5870407223701477, mean loss: 0.7525124618881629
Epoch: 0, step: 95, loss: 0.633165717124939, mean loss: 0.7512692666302127
Epoch: 0, step: 96, loss: 0.6273614764213562, mean loss: 0.7499918667311523
Epoch: 0, step: 97, loss: 0.5955002307891846, mean loss: 0.7484154214664382
Epoch: 0, step: 98, loss: 0.641704261302948, mean loss: 0.7473375309597363
Epoch: 0, step: 99, loss: 0.6829594969749451, mean loss: 0.7466937506198884
Epoch: 0, step: 100, loss: 0.6650400161743164, mean loss: 0.7458852978035956
Epoch: 0, step: 101, loss: 0.6049938201904297, mean loss: 0.7445040088073881
Epoch: 0, step: 102, loss: 0.5483745336532593, mean loss: 0.7425998391456975
Epoch: 0, step: 103, loss: 0.6317673325538635, mean loss: 0.7415341419669299
Epoch: 0, step: 104, loss: 0.6409972906112671, mean loss: 0.740576648144495
Epoch: 0, step: 105, loss: 0.5515583157539368, mean loss: 0.7387934563294897
Epoch: 0, step: 106, loss: 0.7067016363143921, mean loss: 0.7384935327779467
Epoch: 0, step: 107, loss: 0.7167412638664246, mean loss: 0.7382921228806179
Epoch: 0, step: 108, loss: 0.5812868475914001, mean loss: 0.736851707510992
Epoch: 0, step: 109, loss: 0.6634315252304077, mean loss: 0.7361842513084412
Epoch: 0, step: 110, loss: 0.5771923065185547, mean loss: 0.7347518914454693
Epoch: 0, step: 111, loss: 0.6381315588951111, mean loss: 0.7338892099048411
Epoch: 0, step: 112, loss: 0.639965295791626, mean loss: 0.7330580248241931
Epoch: 0, step: 113, loss: 0.6205725073814392, mean loss: 0.7320713097589058
Epoch: 0, step: 114, loss: 0.5883920788764954, mean loss: 0.730821925142537
Epoch: 0, step: 115, loss: 0.6321128606796265, mean loss: 0.7299709849316498
Epoch: 0, step: 116, loss: 0.665238618850708, mean loss: 0.729417716845488
Epoch: 0, step: 117, loss: 0.5798978805541992, mean loss: 0.7281505995887821
Epoch: 0, step: 118, loss: 0.5369054675102234, mean loss: 0.7265434976385422
Epoch: 0, step: 119, loss: 0.6065517067909241, mean loss: 0.7255435660481454
Epoch: 0, step: 120, loss: 0.7342929244041443, mean loss: 0.7256158747948892
Epoch: 0, step: 121, loss: 0.6575655937194824, mean loss: 0.7250580856057465
Epoch: 0, step: 122, loss: 0.5446503162384033, mean loss: 0.7235913557734917
Epoch: 0, step: 123, loss: 0.6174830794334412, mean loss: 0.7227356438675235
Epoch: 0, step: 124, loss: 0.5080816745758057, mean loss: 0.7210184121131898
Epoch: 0, step: 125, loss: 0.6073914766311646, mean loss: 0.7201166110379357
Epoch: 0, step: 126, loss: 0.5572855472564697, mean loss: 0.7188344766774517
Epoch: 0, step: 127, loss: 0.6023832559585571, mean loss: 0.7179247015155853
Epoch: 0, step: 128, loss: 0.5283045768737793, mean loss: 0.7164547780687496
Epoch: 0, step: 129, loss: 0.6129440069198608, mean loss: 0.7156585413676043
Epoch: 0, step: 130, loss: 0.5725684762001038, mean loss: 0.7145662507938066
Epoch: 0, step: 131, loss: 0.6608913540840149, mean loss: 0.7141596227884295
Epoch: 0, step: 132, loss: 0.5834540128707886, mean loss: 0.7131768738416803
Epoch: 0, step: 133, loss: 0.5571823716163635, mean loss: 0.7120127357653719
Epoch: 0, step: 134, loss: 0.49806687235832214, mean loss: 0.7104279515919864
Epoch: 0, step: 135, loss: 0.55550217628479, mean loss: 0.7092887914794335
Epoch: 0, step: 136, loss: 0.6029496192932129, mean loss: 0.7085125931423077
Epoch: 0, step: 137, loss: 0.5561036467552185, mean loss: 0.7074081804873288
Epoch: 0, step: 138, loss: 0.6896644234657288, mean loss: 0.7072805275591159
Epoch: 0, step: 139, loss: 0.6837083101272583, mean loss: 0.7071121545774597
Epoch: 0, step: 140, loss: 0.6139639616012573, mean loss: 0.7064515290953589
Epoch: 0, step: 141, loss: 0.5802630186080933, mean loss: 0.7055628776130543
Epoch: 0, step: 142, loss: 0.537249743938446, mean loss: 0.7043858626922528
Epoch: 0, step: 143, loss: 0.5472269654273987, mean loss: 0.7032944814612468
Epoch: 0, step: 144, loss: 0.8010542988777161, mean loss: 0.7039686870986018
Epoch: 0, step: 145, loss: 0.519896388053894, mean loss: 0.7027079179270628
Epoch: 0, step: 146, loss: 0.5362956523895264, mean loss: 0.7015758616989163
Epoch: 0, step: 147, loss: 0.6138589382171631, mean loss: 0.700983179783499
Epoch: 0, step: 148, loss: 0.6009321212768555, mean loss: 0.7003116961693604
Epoch: 0, step: 149, loss: 0.5289856195449829, mean loss: 0.6991695223251979
Epoch: 0, step: 150, loss: 0.5751463770866394, mean loss: 0.6983481769924922
Epoch: 0, step: 151, loss: 0.6283420324325562, mean loss: 0.6978876102519663
Epoch: 0, step: 152, loss: 0.5070878267288208, mean loss: 0.6966405528433183
Epoch: 0, step: 153, loss: 0.4877279996871948, mean loss: 0.6952839778228239
Epoch: 0, step: 154, loss: 0.6579147577285767, mean loss: 0.6950428860802804
Epoch: 0, step: 155, loss: 0.5210188627243042, mean loss: 0.6939273474690242
Epoch: 0, step: 156, loss: 0.604405403137207, mean loss: 0.6933571440019426
Epoch: 0, step: 157, loss: 0.6275365352630615, mean loss: 0.6929405578706839
Epoch: 0, step: 158, loss: 0.5115058422088623, mean loss: 0.6917994590300435
Epoch: 0, step: 159, loss: 0.5235850811004639, mean loss: 0.6907481191679836
Epoch: 0, step: 160, loss: 0.5692417025566101, mean loss: 0.6899934209281614
Epoch: 0, step: 161, loss: 0.5696674585342407, mean loss: 0.6892506680738779
Epoch: 0, step: 162, loss: 0.5494279265403748, mean loss: 0.688392859843611
Epoch: 0, step: 163, loss: 0.6102181673049927, mean loss: 0.6879161848891072
Epoch: 0, step: 164, loss: 0.6022596955299377, mean loss: 0.6873970546505668
Epoch: 0, step: 165, loss: 0.4970073997974396, mean loss: 0.6862501290189215
Epoch: 0, step: 166, loss: 0.5498227477073669, mean loss: 0.6854331985919062
Epoch: 0, step: 167, loss: 0.5079062581062317, mean loss: 0.6843764906128248
Epoch: 0, step: 168, loss: 0.5554112195968628, mean loss: 0.6836133825003043
Epoch: 0, step: 169, loss: 0.6100161075592041, mean loss: 0.683180457353592
Epoch: 0, step: 170, loss: 0.6207928657531738, mean loss: 0.6828156176366305
Epoch: 0, step: 171, loss: 0.5686418414115906, mean loss: 0.6821518166120663
Epoch: 0, step: 172, loss: 0.5811365246772766, mean loss: 0.6815679131904778
Epoch: 0, step: 173, loss: 0.4654940664768219, mean loss: 0.6803261094737327
Epoch: 0, step: 174, loss: 0.5819791555404663, mean loss: 0.6797641268798283
Epoch: 0, step: 175, loss: 0.6254109144210815, mean loss: 0.67945530180904
Epoch: 0, step: 176, loss: 0.5459550023078918, mean loss: 0.6787010628288075
Epoch: 0, step: 177, loss: 0.5634518265724182, mean loss: 0.6780535952093896
Epoch: 0, step: 178, loss: 0.5084499716758728, mean loss: 0.677106088932666
Epoch: 0, step: 179, loss: 0.4866146445274353, mean loss: 0.6760478031304147
Epoch: 0, step: 180, loss: 0.6148279309272766, mean loss: 0.6757095717922758
Epoch: 0, step: 181, loss: 0.5367759466171265, mean loss: 0.6749462002253793
Epoch: 0, step: 182, loss: 0.6005659699440002, mean loss: 0.6745397508795794
Epoch: 0, step: 183, loss: 0.5389605164527893, mean loss: 0.6738029072142164
Epoch: 0, step: 184, loss: 0.5133253931999207, mean loss: 0.6729354611925176
Epoch: 0, step: 185, loss: 0.5178577899932861, mean loss: 0.6721017102720916
Epoch: 0, step: 186, loss: 0.6004090309143066, mean loss: 0.6717183269600179
Epoch: 0, step: 187, loss: 0.5036156177520752, mean loss: 0.6708241636131671
Epoch: 0, step: 188, loss: 0.5744686126708984, mean loss: 0.6703143458833138
Epoch: 0, step: 189, loss: 0.5101205706596375, mean loss: 0.6694712207505576
Epoch: 0, step: 190, loss: 0.5321003198623657, mean loss: 0.6687520013741797
Epoch: 0, step: 191, loss: 0.5638724565505981, mean loss: 0.6682057537448902
Epoch: 0, step: 192, loss: 0.5535389184951782, mean loss: 0.6676116250648398
Epoch: 0, step: 193, loss: 0.49378034472465515, mean loss: 0.6667155875373131
Epoch: 0, step: 194, loss: 0.506625235080719, mean loss: 0.665894611370869
Epoch: 0, step: 195, loss: 0.5146822333335876, mean loss: 0.665123119646189
Epoch: 0, step: 196, loss: 0.5208650827407837, mean loss: 0.6643908453471767
Epoch: 0, step: 197, loss: 0.5790799856185913, mean loss: 0.6639599824192546
Epoch: 0, step: 198, loss: 0.5932356119155884, mean loss: 0.6636045835725025
Epoch: 0, step: 199, loss: 0.5158122181892395, mean loss: 0.6628656217455862
Epoch: 0, step: 200, loss: 0.4768831729888916, mean loss: 0.6619403359308762
Epoch: 0, step: 201, loss: 0.5025132894515991, mean loss: 0.6611510931265233
Epoch: 0, step: 202, loss: 0.5579531788825989, mean loss: 0.6606427290169473
Epoch: 0, step: 203, loss: 0.4821799397468567, mean loss: 0.6597679114224861
Epoch: 0, step: 204, loss: 0.5954304337501526, mean loss: 0.659454070067987
Epoch: 0, step: 205, loss: 0.5070923566818237, mean loss: 0.658714450100093
Epoch: 0, step: 206, loss: 0.5477649569511414, mean loss: 0.6581784622104845
Epoch: 0, step: 207, loss: 0.5204585790634155, mean loss: 0.6575163473876621
Epoch: 0, step: 208, loss: 0.5041348934173584, mean loss: 0.6567824648327802
Epoch: 0, step: 209, loss: 0.5104902982711792, mean loss: 0.6560858354682012
Epoch: 0, step: 210, loss: 0.5666165947914124, mean loss: 0.6556618106308705
Epoch: 0, step: 211, loss: 0.5337876677513123, mean loss: 0.6550869325984198
Epoch: 0, step: 212, loss: 0.578034520149231, mean loss: 0.6547251841831654
Epoch: 0, step: 213, loss: 0.5286397337913513, mean loss: 0.65413599983554
Epoch: 0, step: 214, loss: 0.5839055776596069, mean loss: 0.6538093467091404
Epoch: 0, step: 215, loss: 0.5357722043991089, mean loss: 0.653262878457705
Epoch: 0, step: 216, loss: 0.5399452447891235, mean loss: 0.6527406773808913
Epoch: 0, step: 217, loss: 0.4898613393306732, mean loss: 0.6519935244540553
Epoch: 0, step: 218, loss: 0.5261816382408142, mean loss: 0.6514190409553647
Epoch: 0, step: 219, loss: 0.5021575093269348, mean loss: 0.6507405794479628
Epoch: 0, step: 220, loss: 0.5421568155288696, mean loss: 0.6502492501994601
Epoch: 0, step: 221, loss: 0.4729160964488983, mean loss: 0.6494504522095927
Epoch: 0, step: 222, loss: 0.5688917636871338, mean loss: 0.6490892024852768
Epoch: 0, step: 223, loss: 0.5574254989624023, mean loss: 0.6486799895231211
Epoch: 0, step: 224, loss: 0.5758495926856995, mean loss: 0.6483562988705104
Epoch: 0, step: 225, loss: 0.45397472381591797, mean loss: 0.647496203405667
Epoch: 0, step: 226, loss: 0.5033833980560303, mean loss: 0.6468613452323206
Epoch: 0, step: 227, loss: 0.5654218792915344, mean loss: 0.6465041545922294
Epoch: 0, step: 228, loss: 0.5074887871742249, mean loss: 0.6458971005860372
Epoch: 0, step: 229, loss: 0.5814615488052368, mean loss: 0.6456169460130772
Epoch: 0, step: 230, loss: 0.5559998750686646, mean loss: 0.6452289933250062
Epoch: 0, step: 231, loss: 0.4580981731414795, mean loss: 0.6444223949621462
Epoch: 0, step: 232, loss: 0.5198214650154114, mean loss: 0.6438876270224606
Epoch: 0, step: 233, loss: 0.5352623462677002, mean loss: 0.6434234164209446
Epoch: 0, step: 234, loss: 0.4563051760196686, mean loss: 0.6426271685894498
Epoch: 0, step: 235, loss: 0.46070975065231323, mean loss: 0.641856332072767
Epoch: 0, step: 236, loss: 0.4807007908821106, mean loss: 0.6411763508863085
Epoch: 0, step: 237, loss: 0.5234236717224121, mean loss: 0.6406815917301577
Epoch: 0, step: 238, loss: 0.5039430856704712, mean loss: 0.6401094640897406
Epoch: 0, step: 239, loss: 0.4730340540409088, mean loss: 0.6394133165478705
Epoch: 0, step: 240, loss: 0.5189664959907532, mean loss: 0.6389135372094592
Epoch: 0, step: 241, loss: 0.4736194312572479, mean loss: 0.6382305037137889
Epoch: 0, step: 242, loss: 0.5373628735542297, mean loss: 0.6378154105855602
Epoch: 0, step: 243, loss: 0.4640880227088928, mean loss: 0.6371034130942624
Epoch: 0, step: 244, loss: 0.54061359167099, mean loss: 0.6367095770884532
Epoch: 0, step: 245, loss: 0.48187410831451416, mean loss: 0.6360801646137624
Epoch: 0, step: 246, loss: 0.5005093216896057, mean loss: 0.6355312948043529
Epoch: 0, step: 247, loss: 0.4959070682525635, mean loss: 0.6349682938908376
Epoch: 0, step: 248, loss: 0.4747489094734192, mean loss: 0.6343248425477958
Epoch: 0, step: 249, loss: 0.49197396636009216, mean loss: 0.633755439043045
Epoch: 0, step: 250, loss: 0.5216343402862549, mean loss: 0.6333087414384363
Epoch: 0, step: 251, loss: 0.6038126945495605, mean loss: 0.6331916936333217
Epoch: 0, step: 252, loss: 0.5415919423103333, mean loss: 0.6328296392802665
Epoch: 0, step: 253, loss: 0.4994257092475891, mean loss: 0.6323044269573032
Epoch: 0, step: 254, loss: 0.4489893913269043, mean loss: 0.6315855444646349
Epoch: 0, step: 255, loss: 0.529657781124115, mean loss: 0.631187389139086
Epoch: 0, step: 256, loss: 0.4232092499732971, mean loss: 0.6303781356792969
Epoch: 0, step: 257, loss: 0.4921625852584839, mean loss: 0.6298424164916193
Epoch: 0, step: 258, loss: 0.5225826501846313, mean loss: 0.6294282861197776
Epoch: 0, step: 259, loss: 0.5269293785095215, mean loss: 0.6290340595520458
Epoch: 0, step: 260, loss: 0.5424551367759705, mean loss: 0.6287023395414095
Epoch: 0, step: 261, loss: 0.5412905216217041, mean loss: 0.6283687066485862
Epoch: 0, step: 262, loss: 0.5190451145172119, mean loss: 0.6279530275910525
Epoch: 0, step: 263, loss: 0.6248671412467957, mean loss: 0.6279413386276274
Epoch: 0, step: 264, loss: 0.5095261931419373, mean loss: 0.627494489022021
Epoch: 0, step: 265, loss: 0.4905413091182709, mean loss: 0.6269796274434355
Epoch: 0, step: 266, loss: 0.5977596640586853, mean loss: 0.6268701893783241
Epoch: 0, step: 267, loss: 0.5752169489860535, mean loss: 0.6266774534067111
Epoch: 0, step: 268, loss: 0.6269355416297913, mean loss: 0.6266784128424846
Epoch: 0, step: 269, loss: 0.4999677240848541, mean loss: 0.6262091139952342
Epoch: 0, step: 270, loss: 0.4937088191509247, mean loss: 0.6257201830179488
Epoch: 0, step: 271, loss: 0.4524227976799011, mean loss: 0.6250830602777354
Epoch: 0, step: 272, loss: 0.5171245336532593, mean loss: 0.6246876077992575
Epoch: 0, step: 273, loss: 0.5453667640686035, mean loss: 0.6243981156688536
Epoch: 0, step: 274, loss: 0.4582478702068329, mean loss: 0.6237939329580826
Epoch: 0, step: 275, loss: 0.5348421931266785, mean loss: 0.62347164404565
Epoch: 0, step: 276, loss: 0.5205299258232117, mean loss: 0.6231000132939445
Epoch: 0, step: 277, loss: 0.4932638108730316, mean loss: 0.6226329765945887
Epoch: 0, step: 278, loss: 0.4772791564464569, mean loss: 0.622111995160366
Epoch: 0, step: 279, loss: 0.47581666707992554, mean loss: 0.6215895118457929
Epoch: 0, step: 280, loss: 0.5501254796981812, mean loss: 0.6213351914466911
Epoch: 0, step: 281, loss: 0.5273979902267456, mean loss: 0.6210020808040673
Epoch: 0, step: 282, loss: 0.5586431622505188, mean loss: 0.6207817312685424
Epoch: 0, step: 283, loss: 0.5270110964775085, mean loss: 0.6204515529770247
Epoch: 0, step: 284, loss: 0.5483667254447937, mean loss: 0.6201986237576134
Epoch: 0, step: 285, loss: 0.5620232820510864, mean loss: 0.6199952134719262
Epoch: 0, step: 286, loss: 0.5121587514877319, mean loss: 0.6196194766705876
Epoch: 0, step: 287, loss: 0.4247109293937683, mean loss: 0.6189427108814319
Epoch: 0, step: 288, loss: 0.5064342021942139, mean loss: 0.6185534080832062
Epoch: 0, step: 289, loss: 0.4826045334339142, mean loss: 0.6180846188602777
Epoch: 0, step: 290, loss: 0.47133585810661316, mean loss: 0.6175803275862101
Epoch: 0, step: 291, loss: 0.5538028478622437, mean loss: 0.6173619115597582
Epoch: 0, step: 292, loss: 0.5074450969696045, mean loss: 0.6169867688478464
Epoch: 0, step: 293, loss: 0.46498072147369385, mean loss: 0.6164697414758255
Epoch: 0, step: 294, loss: 0.47918614745140076, mean loss: 0.6160043733604884
Epoch: 0, step: 295, loss: 0.523289680480957, mean loss: 0.6156911480467062
Epoch: 0, step: 296, loss: 0.4311845600605011, mean loss: 0.6150699137437223
Epoch: 0, step: 297, loss: 0.5053440928459167, mean loss: 0.6147017062910451
Epoch: 0, step: 298, loss: 0.5390363931655884, mean loss: 0.6144486450431339
Epoch: 0, step: 299, loss: 0.5460255146026611, mean loss: 0.6142205679416657
Epoch: 0, step: 300, loss: 0.5488355159759521, mean loss: 0.6140033418554008
Epoch: 0, step: 301, loss: 0.6016528606414795, mean loss: 0.6139624462222422
Epoch: 0, step: 302, loss: 0.47532182931900024, mean loss: 0.6135048864304823
Epoch: 0, step: 303, loss: 0.5165820717811584, mean loss: 0.6131860613822937
Epoch: 0, step: 304, loss: 0.5766047835350037, mean loss: 0.6130661227664009
Epoch: 0, step: 305, loss: 0.5440959334373474, mean loss: 0.6128407299908158
Epoch: 0, step: 306, loss: 0.47404009103775024, mean loss: 0.6123886106456918
Epoch: 0, step: 307, loss: 0.558301568031311, mean loss: 0.6122130033644763
Epoch: 0, step: 308, loss: 0.5089102983474731, mean loss: 0.6118786904032562
Epoch: 0, step: 309, loss: 0.5482245683670044, mean loss: 0.6116733545257198
Epoch: 0, step: 310, loss: 0.46375811100006104, mean loss: 0.6111977428102032
Epoch: 0, step: 311, loss: 0.537634551525116, mean loss: 0.6109619633509562
Epoch: 0, step: 312, loss: 0.42725691199302673, mean loss: 0.610375046253966
Epoch: 0, step: 313, loss: 0.4723648726940155, mean loss: 0.6099355234082336
Epoch: 0, step: 314, loss: 0.43596771359443665, mean loss: 0.60938324464692
Epoch: 0, step: 315, loss: 0.4354851245880127, mean loss: 0.6088329341404044
Epoch: 0, step: 316, loss: 0.47930335998535156, mean loss: 0.6084243234963822
Epoch: 0, step: 317, loss: 0.4717998206615448, mean loss: 0.6079946866950148
Epoch: 0, step: 318, loss: 0.4730182886123657, mean loss: 0.6075715631900535
Epoch: 0, step: 319, loss: 0.4904382526874542, mean loss: 0.6072055215947328
Epoch: 0, step: 320, loss: 0.5060541033744812, mean loss: 0.6068904081423333
Epoch: 0, step: 321, loss: 0.4722887873649597, mean loss: 0.6064723906865029
Epoch: 0, step: 322, loss: 0.5029953718185425, mean loss: 0.6061520283989861
Epoch: 0, step: 323, loss: 0.4591042995452881, mean loss: 0.6056981773840056
Epoch: 0, step: 324, loss: 0.40747734904289246, mean loss: 0.6050882671429559
Epoch: 0, step: 325, loss: 0.44609275460243225, mean loss: 0.6046005508468194
Epoch: 0, step: 326, loss: 0.48767974972724915, mean loss: 0.6042429948800929
Epoch: 0, step: 327, loss: 0.4799630045890808, mean loss: 0.6038640924706691
Epoch: 0, step: 328, loss: 0.51359623670578, mean loss: 0.603589722088405
Epoch: 0, step: 329, loss: 0.4735408127307892, mean loss: 0.603195634484291
Epoch: 0, step: 330, loss: 0.446956604719162, mean loss: 0.60272361324633
Epoch: 0, step: 331, loss: 0.4545069932937622, mean loss: 0.6022771776440632
Epoch: 0, step: 332, loss: 0.49590539932250977, mean loss: 0.6019577428743288
Epoch: 0, step: 333, loss: 0.46348240971565247, mean loss: 0.6015431460684645
Epoch: 0, step: 334, loss: 0.44905951619148254, mean loss: 0.6010879710539063
Epoch: 0, step: 335, loss: 0.5214101672172546, mean loss: 0.6008508347329639
Epoch: 0, step: 336, loss: 0.45928117632865906, mean loss: 0.6004307467258294
Epoch: 0, step: 337, loss: 0.42198050022125244, mean loss: 0.5999027874166443
Epoch: 0, step: 338, loss: 0.465876042842865, mean loss: 0.599507428288108
Epoch: 0, step: 339, loss: 0.48996642231941223, mean loss: 0.5991852488587883
Epoch: 0, step: 340, loss: 0.5021087527275085, mean loss: 0.5989005670519517
Epoch: 0, step: 341, loss: 0.47846558690071106, mean loss: 0.5985484179871821
Epoch: 0, step: 342, loss: 0.490369975566864, mean loss: 0.5982330289422249
Epoch: 0, step: 343, loss: 0.45486366748809814, mean loss: 0.5978162575426489
Epoch: 0, step: 344, loss: 0.5057859420776367, mean loss: 0.5975495030050691
Epoch: 0, step: 345, loss: 0.5138381123542786, mean loss: 0.5973075625696622
Epoch: 0, step: 346, loss: 0.4817448556423187, mean loss: 0.5969745288321194
Epoch: 0, step: 347, loss: 0.4716620147228241, mean loss: 0.5966144354007709
Epoch: 0, step: 348, loss: 0.5365014672279358, mean loss: 0.5964421919389575
Epoch: 0, step: 349, loss: 0.4454195499420166, mean loss: 0.5960106986761091
Epoch: 0, step: 350, loss: 0.5286690592765808, mean loss: 0.5958188421536034
Epoch: 0, step: 351, loss: 0.5309527516365051, mean loss: 0.5956345634873617
Epoch: 0, step: 352, loss: 0.45318201184272766, mean loss: 0.5952310151824194
Epoch: 0, step: 353, loss: 0.4838423430919647, mean loss: 0.5949163579166271
Epoch: 0, step: 354, loss: 0.5409753918647766, mean loss: 0.5947644115333824
Epoch: 0, step: 355, loss: 0.44306010007858276, mean loss: 0.5943382758270488
Epoch: 0, step: 356, loss: 0.49707460403442383, mean loss: 0.5940658285671254
Epoch: 0, step: 357, loss: 0.5150816440582275, mean loss: 0.5938452023534134
Epoch: 0, step: 358, loss: 0.5171788930892944, mean loss: 0.5936316471744048
Epoch: 0, step: 359, loss: 0.4938920736312866, mean loss: 0.5933545928034516
Epoch: 0, step: 360, loss: 0.43053504824638367, mean loss: 0.5929035691343184
Epoch: 0, step: 361, loss: 0.5850845575332642, mean loss: 0.5928819696547575
Epoch: 0, step: 362, loss: 0.46066948771476746, mean loss: 0.5925177479414242
Epoch: 0, step: 363, loss: 0.5275635123252869, mean loss: 0.5923393022391821
Epoch: 0, step: 364, loss: 0.5190779566764832, mean loss: 0.5921385862239418
Epoch: 0, step: 365, loss: 0.4475935101509094, mean loss: 0.5917436543221029
Epoch: 0, step: 366, loss: 0.5072135925292969, mean loss: 0.5915133271782532
Epoch: 0, step: 367, loss: 0.484892338514328, mean loss: 0.5912235962307969
Epoch: 0, step: 368, loss: 0.44969916343688965, mean loss: 0.5908400611825749
Epoch: 0, step: 369, loss: 0.5097461342811584, mean loss: 0.5906208884071656
Epoch: 0, step: 370, loss: 0.5411682724952698, mean loss: 0.5904875929464867
Epoch: 0, step: 371, loss: 0.5097852349281311, mean loss: 0.5902706511238567
Epoch: 0, step: 372, loss: 0.46172577142715454, mean loss: 0.5899260267815063
Epoch: 0, step: 373, loss: 0.585888683795929, mean loss: 0.5899152317467855
Epoch: 0, step: 374, loss: 0.4387296736240387, mean loss: 0.5895120702584582
Epoch: 0, step: 375, loss: 0.5553013682365417, mean loss: 0.5894210843488255
Epoch: 0, step: 376, loss: 0.45821237564086914, mean loss: 0.5890730506387247
Epoch: 0, step: 377, loss: 0.4767226576805115, mean loss: 0.5887758273769305
Epoch: 0, step: 378, loss: 0.5807727575302124, mean loss: 0.5887547110976515
Epoch: 0, step: 379, loss: 0.4679974615573883, mean loss: 0.5884369288620193
Epoch: 0, step: 380, loss: 0.46114328503608704, mean loss: 0.5881028248099827
Epoch: 0, step: 381, loss: 0.44559788703918457, mean loss: 0.5877297752346664
Epoch: 0, step: 382, loss: 0.5217133164405823, mean loss: 0.5875574085015226
Epoch: 0, step: 383, loss: 0.4543638527393341, mean loss: 0.5872105502833919
Epoch: 0, step: 384, loss: 0.49067628383636475, mean loss: 0.586959811928984
Epoch: 0, step: 385, loss: 0.6093793511390686, mean loss: 0.5870178936367823
Epoch: 0, step: 386, loss: 0.47771960496902466, mean loss: 0.5867354691182609
Epoch: 0, step: 387, loss: 0.48744791746139526, mean loss: 0.586479573366568
Epoch: 0, step: 388, loss: 0.4461006224155426, mean loss: 0.5861187020273623
Epoch: 0, step: 389, loss: 0.47880467772483826, mean loss: 0.585843537862484
Epoch: 0, step: 390, loss: 0.46882542967796326, mean loss: 0.5855442588134188
Epoch: 0, step: 391, loss: 0.538993239402771, mean loss: 0.5854255062128814
Epoch: 0, step: 392, loss: 0.4588741362094879, mean loss: 0.5851034925487506
Epoch: 0, step: 393, loss: 0.473688006401062, mean loss: 0.584820712127056
Epoch: 0, step: 394, loss: 0.4344346821308136, mean loss: 0.5844399880004832
Epoch: 0, step: 395, loss: 0.49667003750801086, mean loss: 0.5842183467113609
Epoch: 0, step: 396, loss: 0.5330381989479065, mean loss: 0.5840894294625865
Epoch: 0, step: 397, loss: 0.4706043004989624, mean loss: 0.5838042909476024
Epoch: 0, step: 398, loss: 0.5129736661911011, mean loss: 0.5836267705848042
Epoch: 0, step: 399, loss: 0.447098970413208, mean loss: 0.5832854510843751
Epoch: 0, step: 400, loss: 0.4770409166812897, mean loss: 0.5830205021207764
Epoch: 0, step: 401, loss: 0.47108811140060425, mean loss: 0.5827420633378904
Epoch: 0, step: 402, loss: 0.5345972776412964, mean loss: 0.5826225973684199
Epoch: 0, step: 403, loss: 0.47658154368400574, mean loss: 0.5823601195127655
Epoch: 0, step: 404, loss: 0.5282221436500549, mean loss: 0.5822264454982896
Epoch: 0, step: 405, loss: 0.5613946318626404, mean loss: 0.5821751356124876
Epoch: 0, step: 406, loss: 0.5260971784591675, mean loss: 0.5820373519339782
Epoch: 0, step: 407, loss: 0.4608560800552368, mean loss: 0.5817403390127068
Epoch: 0, step: 408, loss: 0.48322778940200806, mean loss: 0.5814994770332186
Epoch: 0, step: 409, loss: 0.4994422197341919, mean loss: 0.5812993373812697
Epoch: 0, step: 410, loss: 0.5315456986427307, mean loss: 0.5811782822991808
Epoch: 0, step: 411, loss: 0.4725518524646759, mean loss: 0.5809146259160873
Epoch: 0, step: 412, loss: 0.46344029903411865, mean loss: 0.5806301844466395
Epoch: 0, step: 413, loss: 0.47943589091300964, mean loss: 0.5803857537859303
Epoch: 0, step: 414, loss: 0.4832703471183777, mean loss: 0.5801517407578157
Epoch: 0, step: 415, loss: 0.4647846519947052, mean loss: 0.5798744160252121
Epoch: 0, step: 416, loss: 0.6213459372520447, mean loss: 0.579973868114485
Epoch: 0, step: 417, loss: 0.48078176379203796, mean loss: 0.5797365664295031
Epoch: 0, step: 418, loss: 0.5045295357704163, mean loss: 0.579557074709553
Epoch: 0, step: 419, loss: 0.41834819316864014, mean loss: 0.5791732440392174
Epoch: 0, step: 420, loss: 0.43276309967041016, mean loss: 0.5788254764753961
Epoch: 0, step: 421, loss: 0.5005587935447693, mean loss: 0.5786400104021008
Epoch: 0, step: 422, loss: 0.4741881787776947, mean loss: 0.5783930793580715
Epoch: 0, step: 423, loss: 0.40637215971946716, mean loss: 0.5779873696419427
Epoch: 0, step: 424, loss: 0.5086257457733154, mean loss: 0.5778241658210754
Epoch: 0, step: 425, loss: 0.5044779181480408, mean loss: 0.5776519915307632
Epoch: 0, step: 426, loss: 0.4224618375301361, mean loss: 0.5772885485471552
Epoch: 0, step: 427, loss: 0.5480555295944214, mean loss: 0.577220247101004
Epoch: 0, step: 428, loss: 0.5525090098381042, mean loss: 0.5771626451493421
Epoch: 0, step: 429, loss: 0.4979928433895111, mean loss: 0.576978529331296
Epoch: 0, step: 430, loss: 0.478740394115448, mean loss: 0.5767505986231386
Epoch: 0, step: 431, loss: 0.4446752667427063, mean loss: 0.5764448686882302
Epoch: 0, step: 432, loss: 0.47436225414276123, mean loss: 0.5762091120726518
Epoch: 0, step: 433, loss: 0.4958757162094116, mean loss: 0.5760240120821835
Epoch: 0, step: 434, loss: 0.4610123038291931, mean loss: 0.5757596173505674
Epoch: 0, step: 435, loss: 0.43343350291252136, mean loss: 0.5754331813082783
Epoch: 0, step: 436, loss: 0.4713312089443207, mean loss: 0.5751949616918848
Epoch: 0, step: 437, loss: 0.4848329722881317, mean loss: 0.574988655780004
Epoch: 0, step: 438, loss: 0.49950161576271057, mean loss: 0.5748167035248394
Epoch: 0, step: 439, loss: 0.5034106969833374, mean loss: 0.5746544171463359
Epoch: 0, step: 440, loss: 0.519891083240509, mean loss: 0.5745302372508578
Epoch: 0, step: 441, loss: 0.4969745874404907, mean loss: 0.5743547719797937
Epoch: 0, step: 442, loss: 0.45757338404655457, mean loss: 0.5740911571086126
Epoch: 0, step: 443, loss: 0.45938771963119507, mean loss: 0.573832816033213
Epoch: 0, step: 444, loss: 0.42631182074546814, mean loss: 0.5735013081786338
Epoch: 0, step: 445, loss: 0.49103909730911255, mean loss: 0.5733164153291506
Epoch: 0, step: 446, loss: 0.42607489228248596, mean loss: 0.572987015948733
Epoch: 0, step: 447, loss: 0.5153131484985352, mean loss: 0.5728582796374603
Epoch: 0, step: 448, loss: 0.4660259783267975, mean loss: 0.5726203457815345
Epoch: 0, step: 449, loss: 0.5306980609893799, mean loss: 0.5725271851486631
Epoch: 0, step: 450, loss: 0.5568492412567139, mean loss: 0.5724924225236255
Epoch: 0, step: 451, loss: 0.4095105528831482, mean loss: 0.5721318431660138
Epoch: 0, step: 452, loss: 0.532845139503479, mean loss: 0.5720451175508647
Epoch: 0, step: 453, loss: 0.5338507294654846, mean loss: 0.5719609889427472
Epoch: 0, step: 454, loss: 0.4052383303642273, mean loss: 0.5715945655172998
Epoch: 0, step: 455, loss: 0.4750882387161255, mean loss: 0.5713829288357183
Epoch: 0, step: 456, loss: 0.5102924704551697, mean loss: 0.5712492516839008
Epoch: 0, step: 457, loss: 0.4588852822780609, mean loss: 0.5710039155061588
Epoch: 0, step: 458, loss: 0.49255916476249695, mean loss: 0.5708330119097674
Epoch: 0, step: 459, loss: 0.45216283202171326, mean loss: 0.5705750332578369
Epoch: 0, step: 460, loss: 0.4423506259918213, mean loss: 0.5702968892073683
Epoch: 0, step: 461, loss: 0.42609289288520813, mean loss: 0.5699847593451991
Epoch: 0, step: 462, loss: 0.42881372570991516, mean loss: 0.56967985430495
Epoch: 0, step: 463, loss: 0.47259822487831116, mean loss: 0.5694706266553237
Epoch: 0, step: 464, loss: 0.4426373541355133, mean loss: 0.5691978669294746
Epoch: 0, step: 465, loss: 0.5174790024757385, mean loss: 0.5690868822418056
Epoch: 0, step: 466, loss: 0.4773270785808563, mean loss: 0.5688903944395337
Epoch: 0, step: 467, loss: 0.49083787202835083, mean loss: 0.5687236155454927
Epoch: 0, step: 468, loss: 0.4589560627937317, mean loss: 0.5684895695907981
Epoch: 0, step: 469, loss: 0.49279162287712097, mean loss: 0.5683285101297052
Epoch: 0, step: 470, loss: 0.48687344789505005, mean loss: 0.5681555694455552
Epoch: 0, step: 471, loss: 0.45130354166030884, mean loss: 0.567908001590078
Epoch: 0, step: 472, loss: 0.5123452544212341, mean loss: 0.5677905327799959
Epoch: 0, step: 473, loss: 0.42792069911956787, mean loss: 0.5674954487427376
Epoch: 0, step: 474, loss: 0.4570155143737793, mean loss: 0.567262859407224
Epoch: 0, step: 475, loss: 0.411443293094635, mean loss: 0.5669355073771555
Epoch: 0, step: 476, loss: 0.46760043501853943, mean loss: 0.5667272577495693
Epoch: 0, step: 477, loss: 0.45631054043769836, mean loss: 0.5664962604330173
Epoch: 0, step: 478, loss: 0.46118542551994324, mean loss: 0.5662764048277708
Epoch: 0, step: 479, loss: 0.4575344920158386, mean loss: 0.5660498591760792
Epoch: 0, step: 480, loss: 0.5204192399978638, mean loss: 0.5659549930239416
Epoch: 0, step: 481, loss: 0.6342304944992065, mean loss: 0.5660966434419401
Epoch: 0, step: 482, loss: 0.42464420199394226, mean loss: 0.5658037812443252
Epoch: 0, step: 483, loss: 0.4681638181209564, mean loss: 0.5656020457833265
Epoch: 0, step: 484, loss: 0.3802269995212555, mean loss: 0.5652198291930954
Epoch: 0, step: 485, loss: 0.49718642234802246, mean loss: 0.5650798427592578
Epoch: 0, step: 486, loss: 0.5062694549560547, mean loss: 0.5649590822093539
Epoch: 0, step: 487, loss: 0.46754732728004456, mean loss: 0.5647594679574496
Epoch: 0, step: 488, loss: 0.4645722210407257, mean loss: 0.5645545860619143
Epoch: 0, step: 489, loss: 0.4302176535129547, mean loss: 0.5642804290567124
Epoch: 0, step: 490, loss: 0.47738879919052124, mean loss: 0.5641034603604472
Epoch: 0, step: 491, loss: 0.4324842095375061, mean loss: 0.5638359415579616
Epoch: 0, step: 492, loss: 0.4724816679954529, mean loss: 0.5636506387718307
Epoch: 0, step: 493, loss: 0.5049123167991638, mean loss: 0.5635317352860562
Epoch: 0, step: 494, loss: 0.4906409978866577, mean loss: 0.5633844812711079
Epoch: 0, step: 495, loss: 0.41010016202926636, mean loss: 0.5630754403048944
Epoch: 0, step: 496, loss: 0.4880549907684326, mean loss: 0.5629244937263502
Epoch: 0, step: 497, loss: 0.44858431816101074, mean loss: 0.5626948949802351
Epoch: 0, step: 498, loss: 0.4615040719509125, mean loss: 0.5624921077597355
Epoch: 0, step: 499, loss: 0.5068670511245728, mean loss: 0.5623808576464652
Epoch: 0, step: 500, loss: 0.49430158734321594, mean loss: 0.5622449708793928
Epoch: 0, step: 501, loss: 0.5032212138175964, mean loss: 0.5621273936740905
Epoch: 0, step: 502, loss: 0.5242226719856262, mean loss: 0.5620520363745111
Epoch: 0, step: 503, loss: 0.4940255880355835, mean loss: 0.5619170632627275
Epoch: 0, step: 504, loss: 0.5036541819572449, mean loss: 0.5618016912205385
Epoch: 0, step: 505, loss: 0.5216696262359619, mean loss: 0.561722378839146
Epoch: 0, step: 506, loss: 0.4584524929523468, mean loss: 0.5615186907013022
Epoch: 0, step: 507, loss: 0.42911186814308167, mean loss: 0.5612580473498097
Epoch: 0, step: 508, loss: 0.42759969830513, mean loss: 0.5609954572731011
Epoch: 0, step: 509, loss: 0.47097277641296387, mean loss: 0.560818942212591
Epoch: 0, step: 510, loss: 0.4879809319972992, mean loss: 0.5606764020751833
Epoch: 0, step: 511, loss: 0.45401275157928467, mean loss: 0.5604680746328086
Epoch: 0, step: 512, loss: 0.5659003853797913, mean loss: 0.5604786639325103
Epoch: 0, step: 513, loss: 0.49801358580589294, mean loss: 0.5603571365431589
Epoch: 0, step: 514, loss: 0.43910470604896545, mean loss: 0.5601216949305488
Epoch: 0, step: 515, loss: 0.4759124517440796, mean loss: 0.559958498722823
Epoch: 0, step: 516, loss: 0.48213741183280945, mean loss: 0.5598079743768075
Epoch: 0, step: 517, loss: 0.43664175271987915, mean loss: 0.5595702017481262
Epoch: 0, step: 518, loss: 0.40841901302337646, mean loss: 0.5592789663170573
Epoch: 0, step: 519, loss: 0.4320375323295593, mean loss: 0.5590342712516967
Epoch: 0, step: 520, loss: 0.5224766731262207, mean loss: 0.5589641031170989
Epoch: 0, step: 521, loss: 0.44622868299484253, mean loss: 0.5587481348793167
Epoch: 0, step: 522, loss: 0.44174274802207947, mean loss: 0.5585244152103737
Epoch: 0, step: 523, loss: 0.45742982625961304, mean loss: 0.5583314866055058
Epoch: 0, step: 524, loss: 0.47106996178627014, mean loss: 0.5581652741772787
Epoch: 0, step: 525, loss: 0.43757423758506775, mean loss: 0.557936013651438
Epoch: 0, step: 526, loss: 0.42292869091033936, mean loss: 0.5576798327733714
Epoch: 0, step: 527, loss: 0.45298129320144653, mean loss: 0.5574815400847882
Epoch: 0, step: 528, loss: 0.4635623097419739, mean loss: 0.5573039990066354
Epoch: 0, step: 529, loss: 0.5101476311683655, mean loss: 0.5572150247276952
Epoch: 0, step: 530, loss: 0.46164804697036743, mean loss: 0.5570350492516928
Epoch: 0, step: 531, loss: 0.4795099198818207, mean loss: 0.5568893253243058
Epoch: 0, step: 532, loss: 0.4321102797985077, mean loss: 0.5566552182970529
Epoch: 0, step: 533, loss: 0.4449057877063751, mean loss: 0.5564459497004411
Epoch: 0, step: 534, loss: 0.45722389221191406, mean loss: 0.556260487910743
Epoch: 0, step: 535, loss: 0.4413088262081146, mean loss: 0.5560460258553277
Epoch: 0, step: 536, loss: 0.46434804797172546, mean loss: 0.5558752661199765
Epoch: 0, step: 537, loss: 0.45989662408828735, mean loss: 0.5556968671570923
Epoch: 0, step: 538, loss: 0.4159158766269684, mean loss: 0.5554375332228991
Epoch: 0, step: 539, loss: 0.49281686544418335, mean loss: 0.5553215690233089
Epoch: 0, step: 540, loss: 0.4682330787181854, mean loss: 0.5551605921465896
Epoch: 0, step: 541, loss: 0.46833711862564087, mean loss: 0.5550004012360343
Epoch: 0, step: 542, loss: 0.4781433641910553, mean loss: 0.5548588597313474
Epoch: 0, step: 543, loss: 0.4304448068141937, mean loss: 0.5546301574281909
Epoch: 0, step: 544, loss: 0.47463956475257874, mean loss: 0.5544833856985109
Epoch: 0, step: 545, loss: 0.4612085223197937, mean loss: 0.5543125526153997
Epoch: 0, step: 546, loss: 0.4742072820663452, mean loss: 0.5541661078794782
Epoch: 0, step: 547, loss: 0.5327316522598267, mean loss: 0.5541269939093694
Epoch: 0, step: 548, loss: 0.4081707298755646, mean loss: 0.5538611355049362
Epoch: 0, step: 549, loss: 0.44015511870384216, mean loss: 0.5536543972925706
Epoch: 0, step: 550, loss: 0.490753173828125, mean loss: 0.5535402389922721
Epoch: 0, step: 551, loss: 0.47271928191185, mean loss: 0.5533938242149525
Epoch: 0, step: 552, loss: 0.5370109677314758, mean loss: 0.5533641987963568
Epoch: 0, step: 553, loss: 0.44368138909339905, mean loss: 0.5531662153853406
Epoch: 0, step: 554, loss: 0.4557715356349945, mean loss: 0.5529907294758806
Epoch: 0, step: 555, loss: 0.4251192808151245, mean loss: 0.5527607448559871
Epoch: 0, step: 556, loss: 0.4689579904079437, mean loss: 0.5526102910778039
Epoch: 0, step: 557, loss: 0.4457128643989563, mean loss: 0.5524187186285586
Epoch: 0, step: 558, loss: 0.45675650238990784, mean loss: 0.5522475876513875
Epoch: 0, step: 559, loss: 0.5044009685516357, mean loss: 0.5521621472601379
Epoch: 0, step: 560, loss: 0.5051411986351013, mean loss: 0.5520783309524284
Epoch: 0, step: 561, loss: 0.467588871717453, mean loss: 0.5519279938363519
Epoch: 0, step: 562, loss: 0.39719441533088684, mean loss: 0.5516531562191131
Epoch: 0, step: 563, loss: 0.5260212421417236, mean loss: 0.5516077095629476
Epoch: 0, step: 564, loss: 0.470064640045166, mean loss: 0.551463385546102
Epoch: 0, step: 565, loss: 0.4936014711856842, mean loss: 0.5513611560154299
Epoch: 0, step: 566, loss: 0.4960518777370453, mean loss: 0.5512636087874256
Epoch: 0, step: 567, loss: 0.4571160674095154, mean loss: 0.5510978560737322
Epoch: 0, step: 568, loss: 0.49500730633735657, mean loss: 0.5509992786576753
Epoch: 0, step: 569, loss: 0.472277969121933, mean loss: 0.5508611710970862
Epoch: 0, step: 570, loss: 0.5370633006095886, mean loss: 0.5508370067004356
Epoch: 0, step: 571, loss: 0.43898335099220276, mean loss: 0.5506414583512953
Epoch: 0, step: 572, loss: 0.4430959224700928, mean loss: 0.550453769807
Epoch: 0, step: 573, loss: 0.4260686933994293, mean loss: 0.550237071067614
Epoch: 0, step: 574, loss: 0.42415985465049744, mean loss: 0.5500178063434104
Epoch: 0, step: 575, loss: 0.4396541118621826, mean loss: 0.5498262027071582
Epoch: 0, step: 576, loss: 0.4301604628562927, mean loss: 0.5496188097438118
Epoch: 0, step: 577, loss: 0.4714822471141815, mean loss: 0.5494836253794007
Epoch: 0, step: 578, loss: 0.48214125633239746, mean loss: 0.5493673173154162
Epoch: 0, step: 579, loss: 0.49697619676589966, mean loss: 0.5492769877972274
Epoch: 0, step: 580, loss: 0.4796127378940582, mean loss: 0.5491570837526437
Epoch: 0, step: 581, loss: 0.4327163100242615, mean loss: 0.5489570136946912
Epoch: 0, step: 582, loss: 0.5033524632453918, mean loss: 0.5488787897659617
Epoch: 0, step: 583, loss: 0.4041348695755005, mean loss: 0.5486309405875534
Epoch: 0, step: 584, loss: 0.40440869331359863, mean loss: 0.5483844068315294
Epoch: 0, step: 585, loss: 0.4398115873336792, mean loss: 0.548199128982557
Epoch: 0, step: 586, loss: 0.4805402457714081, mean loss: 0.5480838668305789
Epoch: 0, step: 587, loss: 0.4730871915817261, mean loss: 0.5479563214645093
Epoch: 0, step: 588, loss: 0.47650811076164246, mean loss: 0.5478350172018559
Epoch: 0, step: 589, loss: 0.4611668288707733, mean loss: 0.5476881219673965
Epoch: 0, step: 590, loss: 0.456705778837204, mean loss: 0.54753417553232
Epoch: 0, step: 591, loss: 0.5174865126609802, mean loss: 0.5474834193450373
Epoch: 0, step: 592, loss: 0.5466675758361816, mean loss: 0.5474820435549718
Epoch: 0, step: 593, loss: 0.5007116198539734, mean loss: 0.547403305467933
Epoch: 0, step: 594, loss: 0.4735231101512909, mean loss: 0.5472791370724429
Epoch: 0, step: 595, loss: 0.49285441637039185, mean loss: 0.5471878204269697
Epoch: 0, step: 596, loss: 0.38027244806289673, mean loss: 0.5469082301885039
Epoch: 0, step: 597, loss: 0.4295472502708435, mean loss: 0.5467119743692436
Epoch: 0, step: 598, loss: 0.47210177779197693, mean loss: 0.5465874164450745
Epoch: 0, step: 599, loss: 0.4368517994880676, mean loss: 0.5464045237501461
Epoch: 0, step: 600, loss: 0.38130441308021545, mean loss: 0.5461298147473675
Epoch: 0, step: 601, loss: 0.5066381692886353, mean loss: 0.5460642140074029
Epoch: 0, step: 602, loss: 0.4176488220691681, mean loss: 0.5458512531584174
Epoch: 0, step: 603, loss: 0.45162642002105713, mean loss: 0.545695251779051
Epoch: 0, step: 604, loss: 0.4456428289413452, mean loss: 0.5455298758735341
Epoch: 0, step: 605, loss: 0.45834624767303467, mean loss: 0.545386008500266
Epoch: 0, step: 606, loss: 0.44337233901023865, mean loss: 0.5452179464417981
Epoch: 0, step: 607, loss: 0.4497545063495636, mean loss: 0.5450609342048043
Epoch: 0, step: 608, loss: 0.461138516664505, mean loss: 0.544923130563523
Epoch: 0, step: 609, loss: 0.4096122682094574, mean loss: 0.5447013094776967
Epoch: 0, step: 610, loss: 0.4544086456298828, mean loss: 0.5445535309771274
Epoch: 0, step: 611, loss: 0.49485188722610474, mean loss: 0.544472319140933
Epoch: 0, step: 612, loss: 0.45790693163871765, mean loss: 0.5443311031743714
Epoch: 0, step: 613, loss: 0.4536304473876953, mean loss: 0.5441833822366081
Epoch: 0, step: 614, loss: 0.41875091195106506, mean loss: 0.5439794270003715
Epoch: 0, step: 615, loss: 0.46298912167549133, mean loss: 0.543847949231987
Epoch: 0, step: 616, loss: 0.5101224780082703, mean loss: 0.5437932888248173
Epoch: 0, step: 617, loss: 0.4306982755661011, mean loss: 0.5436102871852401
Epoch: 0, step: 618, loss: 0.41482725739479065, mean loss: 0.5434022370563379
Epoch: 0, step: 619, loss: 0.48848748207092285, mean loss: 0.5433136648708776
Epoch: 0, step: 620, loss: 0.44367992877960205, mean loss: 0.5431532240720189
Epoch: 0, step: 621, loss: 0.45070934295654297, mean loss: 0.5430046004689394
Epoch: 0, step: 622, loss: 0.4494321644306183, mean loss: 0.5428544039423931
Epoch: 0, step: 623, loss: 0.41636866331100464, mean loss: 0.5426517024349711
Epoch: 0, step: 624, loss: 0.5164380669593811, mean loss: 0.5426097606182101
Epoch: 0, step: 625, loss: 0.5056918263435364, mean loss: 0.542550786282308
Epoch: 0, step: 626, loss: 0.4603904187679291, mean loss: 0.5424197490135451
Epoch: 0, step: 627, loss: 0.42196211218833923, mean loss: 0.542227937489938
Epoch: 0, step: 628, loss: 0.4473951458930969, mean loss: 0.54207716993573
Epoch: 0, step: 629, loss: 0.3961501717567444, mean loss: 0.5418455397798903
Epoch: 0, step: 630, loss: 0.3836016058921814, mean loss: 0.5415947570003534
Epoch: 0, step: 631, loss: 0.4884340465068817, mean loss: 0.5415106419521043
Epoch: 0, step: 632, loss: 0.4787815809249878, mean loss: 0.5414115439094074
Epoch: 0, step: 633, loss: 0.5432913303375244, mean loss: 0.5414145088722278
Epoch: 0, step: 634, loss: 0.4214310050010681, mean loss: 0.5412255584724307
Epoch: 0, step: 635, loss: 0.48455384373664856, mean loss: 0.5411364520027203
Epoch: 0, step: 636, loss: 0.49128440022468567, mean loss: 0.5410581913248899
Epoch: 0, step: 637, loss: 0.4520461857318878, mean loss: 0.540918674074744
Epoch: 0, step: 638, loss: 0.41655653715133667, mean loss: 0.5407240541421565
Epoch: 0, step: 639, loss: 0.42046260833740234, mean loss: 0.5405361456330866
Epoch: 0, step: 640, loss: 0.4531622529029846, mean loss: 0.5403998369080787
Epoch: 0, step: 641, loss: 0.4526653289794922, mean loss: 0.5402631787960404
Epoch: 0, step: 642, loss: 0.44981738924980164, mean loss: 0.5401225166039
Epoch: 0, step: 643, loss: 0.41024279594421387, mean loss: 0.5399208400190247
Epoch: 0, step: 644, loss: 0.4488462507724762, mean loss: 0.5397796391054642
Epoch: 0, step: 645, loss: 0.44981279969215393, mean loss: 0.5396403715521928
Epoch: 0, step: 646, loss: 0.43474993109703064, mean loss: 0.5394782534062034
Epoch: 0, step: 647, loss: 0.4206429719924927, mean loss: 0.539294865626244
Epoch: 0, step: 648, loss: 0.4898488521575928, mean loss: 0.539218677623981
Epoch: 0, step: 649, loss: 0.5025273561477661, mean loss: 0.5391622294370946
Epoch: 0, step: 650, loss: 0.4246862232685089, mean loss: 0.5389863830374501
Epoch: 0, step: 651, loss: 0.4445969760417938, mean loss: 0.5388416140083157
Epoch: 0, step: 652, loss: 0.48320192098617554, mean loss: 0.5387564077402879
Epoch: 0, step: 653, loss: 0.43409234285354614, mean loss: 0.538596370943825
Epoch: 0, step: 654, loss: 0.49263912439346313, mean loss: 0.5385262072086335
Epoch: 0, step: 655, loss: 0.5056370496749878, mean loss: 0.5384760712977591
Epoch: 0, step: 656, loss: 0.4369773268699646, mean loss: 0.538321583102283
Epoch: 0, step: 657, loss: 0.4797612726688385, mean loss: 0.5382325856700133
Epoch: 0, step: 658, loss: 0.4796614646911621, mean loss: 0.5381437068824885
Epoch: 0, step: 659, loss: 0.5270745158195496, mean loss: 0.538126935380878
Epoch: 0, step: 660, loss: 0.4349311888217926, mean loss: 0.5379708147355541
Epoch: 0, step: 661, loss: 0.5356647372245789, mean loss: 0.5379673312347822
Epoch: 0, step: 662, loss: 0.48165348172187805, mean loss: 0.5378823933018819
Epoch: 0, step: 663, loss: 0.4530061185359955, mean loss: 0.537754567586873
Epoch: 0, step: 664, loss: 0.43409207463264465, mean loss: 0.5375986841388215
Epoch: 0, step: 665, loss: 0.3894251883029938, mean loss: 0.5373762014123413
Epoch: 0, step: 666, loss: 0.44068625569343567, mean loss: 0.5372312389749816
Epoch: 0, step: 667, loss: 0.4446343183517456, mean loss: 0.537092620830336
Epoch: 0, step: 668, loss: 0.40271565318107605, mean loss: 0.5368917583973775
Epoch: 0, step: 669, loss: 0.41518476605415344, mean loss: 0.5367101061699995
Epoch: 0, step: 670, loss: 0.47027909755706787, mean loss: 0.5366111031765376
Epoch: 0, step: 671, loss: 0.461009681224823, mean loss: 0.536498601060538
Epoch: 0, step: 672, loss: 0.411605566740036, mean loss: 0.5363130244865105
Epoch: 0, step: 673, loss: 0.46766138076782227, mean loss: 0.5362111674483523
Epoch: 0, step: 674, loss: 0.4318601191043854, mean loss: 0.5360565733026575
Epoch: 0, step: 675, loss: 0.4553872048854828, mean loss: 0.535937239917425
Epoch: 0, step: 676, loss: 0.4422995150089264, mean loss: 0.5357989271775306
Epoch: 0, step: 677, loss: 0.40826302766799927, mean loss: 0.5356108211310564
Epoch: 0, step: 678, loss: 0.4752216339111328, mean loss: 0.5355218827109977
Epoch: 0, step: 679, loss: 0.45253774523735046, mean loss: 0.5353998472147129
Epoch: 0, step: 680, loss: 0.42888790369033813, mean loss: 0.5352434420112997
Epoch: 0, step: 681, loss: 0.536665141582489, mean loss: 0.5352455266147765
Epoch: 0, step: 682, loss: 0.4266565144062042, mean loss: 0.5350865383099324
Epoch: 0, step: 683, loss: 0.45019641518592834, mean loss: 0.534962429942792
Epoch: 0, step: 684, loss: 0.4125862419605255, mean loss: 0.5347837785734748
Epoch: 0, step: 685, loss: 0.5103561878204346, mean loss: 0.5347481698405987
Epoch: 0, step: 686, loss: 0.43357935547828674, mean loss: 0.53460090810208
Epoch: 0, step: 687, loss: 0.48107460141181946, mean loss: 0.5345231082377047
Epoch: 0, step: 688, loss: 0.4738706648349762, mean loss: 0.5344350785665831
Epoch: 0, step: 689, loss: 0.4569888114929199, mean loss: 0.5343228375998097
Epoch: 0, step: 690, loss: 0.426130473613739, mean loss: 0.5341662639905679
Epoch: 0, step: 691, loss: 0.4281660318374634, mean loss: 0.534013084464335
Epoch: 0, step: 692, loss: 0.46246176958084106, mean loss: 0.5339098358137095
Epoch: 0, step: 693, loss: 0.452808678150177, mean loss: 0.5337929753559811
Epoch: 0, step: 694, loss: 0.429116815328598, mean loss: 0.5336423621760856
Epoch: 0, step: 695, loss: 0.46185362339019775, mean loss: 0.5335392174364507
Epoch: 0, step: 696, loss: 0.4498583674430847, mean loss: 0.5334191588281388
Epoch: 0, step: 697, loss: 0.4720015823841095, mean loss: 0.533331168030941
Epoch: 0, step: 698, loss: 0.45838576555252075, mean loss: 0.5332239500016444
Epoch: 0, step: 699, loss: 0.4802827835083008, mean loss: 0.5331483197637967
Epoch: 0, step: 700, loss: 0.4846675395965576, mean loss: 0.5330791603056408
Epoch: 0, step: 701, loss: 0.4401789903640747, mean loss: 0.5329468238812226
Epoch: 0, step: 702, loss: 0.45972806215286255, mean loss: 0.5328426720153217
Epoch: 0, step: 703, loss: 0.3746773302555084, mean loss: 0.5326180053366856
Epoch: 0, step: 704, loss: 0.4264312982559204, mean loss: 0.5324673858940179
Epoch: 0, step: 705, loss: 0.4188652038574219, mean loss: 0.5323064762877338
Epoch: 0, step: 706, loss: 0.4328145980834961, mean loss: 0.5321657522733007
Epoch: 0, step: 707, loss: 0.4003821611404419, mean loss: 0.5319796172575763
Epoch: 0, step: 708, loss: 0.42823854088783264, mean loss: 0.5318332969806091
Epoch: 0, step: 709, loss: 0.4234091639518738, mean loss: 0.5316805869340897
Epoch: 0, step: 710, loss: 0.4139626622200012, mean loss: 0.5315150202326634
Epoch: 0, step: 711, loss: 0.43392229080200195, mean loss: 0.5313779517924518
Epoch: 0, step: 712, loss: 0.5309868454933167, mean loss: 0.5313774032562679
Epoch: 0, step: 713, loss: 0.43757084012031555, mean loss: 0.5312460215151812
Epoch: 0, step: 714, loss: 0.43931955099105835, mean loss: 0.5311174530249376
Epoch: 0, step: 715, loss: 0.5032444596290588, mean loss: 0.5310785242632116
Epoch: 0, step: 716, loss: 0.44084882736206055, mean loss: 0.5309526808923591
Epoch: 0, step: 717, loss: 0.4819871187210083, mean loss: 0.5308844837305606
Epoch: 0, step: 718, loss: 0.37864792346954346, mean loss: 0.5306727499888902
Epoch: 0, step: 719, loss: 0.4637211859226227, mean loss: 0.5305797617054648
Epoch: 0, step: 720, loss: 0.42393600940704346, mean loss: 0.530431850814621
Epoch: 0, step: 721, loss: 0.4216334819793701, mean loss: 0.5302811605530763
Epoch: 0, step: 722, loss: 0.35632002353668213, mean loss: 0.5300405504050592
Epoch: 0, step: 723, loss: 0.496103972196579, mean loss: 0.5299936766782518
Epoch: 0, step: 724, loss: 0.41568639874458313, mean loss: 0.5298360114673089
Epoch: 0, step: 725, loss: 0.4962146580219269, mean loss: 0.5297897010631141
Epoch: 0, step: 726, loss: 0.4032246470451355, mean loss: 0.5296156088292516
Epoch: 0, step: 727, loss: 0.5235971808433533, mean loss: 0.5296073417578424
Epoch: 0, step: 728, loss: 0.43193185329437256, mean loss: 0.5294733561769598
Epoch: 0, step: 729, loss: 0.455972284078598, mean loss: 0.5293726697768251
Epoch: 0, step: 730, loss: 0.3959146738052368, mean loss: 0.5291901006988886
Epoch: 0, step: 731, loss: 0.4911922514438629, mean loss: 0.5291381910687588
Epoch: 0, step: 732, loss: 0.4610444903373718, mean loss: 0.529045293796274
Epoch: 0, step: 733, loss: 0.45106467604637146, mean loss: 0.5289390531726365
Epoch: 0, step: 734, loss: 0.4727506935596466, mean loss: 0.5288626064248637
Epoch: 0, step: 735, loss: 0.5081589221954346, mean loss: 0.5288344764191172
Epoch: 0, step: 736, loss: 0.49530816078186035, mean loss: 0.5287889861672349
Epoch: 0, step: 737, loss: 0.48378464579582214, mean loss: 0.5287280046762167
Epoch: 0, step: 738, loss: 0.4384830594062805, mean loss: 0.5286058870236187
Epoch: 0, step: 739, loss: 0.39840811491012573, mean loss: 0.5284299440883301
Epoch: 0, step: 740, loss: 0.46787571907043457, mean loss: 0.5283482244864166
Epoch: 0, step: 741, loss: 0.41493234038352966, mean loss: 0.5281953728905906
Epoch: 0, step: 742, loss: 0.3906908631324768, mean loss: 0.5280103062556537
Epoch: 0, step: 743, loss: 0.4544667899608612, mean loss: 0.5279114574434295
Epoch: 0, step: 744, loss: 0.4301326870918274, mean loss: 0.5277802107718166
Epoch: 0, step: 745, loss: 0.4321499764919281, mean loss: 0.5276520201092431
Epoch: 0, step: 746, loss: 0.4277159869670868, mean loss: 0.5275182369323459
Epoch: 0, step: 747, loss: 0.4777733385562897, mean loss: 0.5274517330575116
Epoch: 0, step: 748, loss: 0.4096031188964844, mean loss: 0.5272943917835984
Epoch: 0, step: 749, loss: 0.4507099986076355, mean loss: 0.5271922792593637
Epoch: 0, step: 750, loss: 0.4574829936027527, mean loss: 0.5270994573077571
Epoch: 0, step: 751, loss: 0.3989178240299225, mean loss: 0.5269290030081855
Epoch: 0, step: 752, loss: 0.4392407536506653, mean loss: 0.526812551149809
Epoch: 0, step: 753, loss: 0.5120478868484497, mean loss: 0.5267929693669159
Epoch: 0, step: 754, loss: 0.5038197636604309, mean loss: 0.5267625412798874
Epoch: 0, step: 755, loss: 0.4418400228023529, mean loss: 0.5266502099062399
Epoch: 0, step: 756, loss: 0.4270000457763672, mean loss: 0.5265185716445095
Epoch: 0, step: 757, loss: 0.444392591714859, mean loss: 0.5264102260245496
Epoch: 0, step: 758, loss: 0.45658573508262634, mean loss: 0.5263182306478145
Epoch: 0, step: 759, loss: 0.40809381008148193, mean loss: 0.5261626721997009
Epoch: 0, step: 760, loss: 0.41516202688217163, mean loss: 0.526016810642122
Epoch: 0, step: 761, loss: 0.5151282548904419, mean loss: 0.5260025211988784
Epoch: 0, step: 762, loss: 0.44521430134773254, mean loss: 0.525896638866177
Epoch: 0, step: 763, loss: 0.5074212551116943, mean loss: 0.5258724564267078
Epoch: 0, step: 764, loss: 0.47760626673698425, mean loss: 0.5258093633682899
Epoch: 0, step: 765, loss: 0.446150004863739, mean loss: 0.5257053694276834
Epoch: 0, step: 766, loss: 0.41455984115600586, mean loss: 0.5255604600036003
Epoch: 0, step: 767, loss: 0.4219017028808594, mean loss: 0.5254254876635968
Epoch: 0, step: 768, loss: 0.4310252070426941, mean loss: 0.525302730471632
Epoch: 0, step: 769, loss: 0.44979774951934814, mean loss: 0.5252046720548108
Epoch: 0, step: 770, loss: 0.49324798583984375, mean loss: 0.5251632236939613
Epoch: 0, step: 771, loss: 0.40180596709251404, mean loss: 0.5250034345014724
Epoch: 0, step: 772, loss: 0.4508236050605774, mean loss: 0.5249074709446278
Epoch: 0, step: 773, loss: 0.46496298909187317, mean loss: 0.5248300232936552
Epoch: 0, step: 774, loss: 0.38430166244506836, mean loss: 0.5246486963764313
Epoch: 0, step: 775, loss: 0.41631942987442017, mean loss: 0.5245090968061967
Epoch: 0, step: 776, loss: 0.46699580550193787, mean loss: 0.5244350771262685
Epoch: 0, step: 777, loss: 0.3978629410266876, mean loss: 0.5242723880053178
Epoch: 0, step: 778, loss: 0.45492252707481384, mean loss: 0.524183363793597
Epoch: 0, step: 779, loss: 0.4513951241970062, mean loss: 0.5240900455377039
Epoch: 0, step: 780, loss: 0.3837200999259949, mean loss: 0.5239103144933868
Epoch: 0, step: 781, loss: 0.42086562514305115, mean loss: 0.5237785437908927
Epoch: 0, step: 782, loss: 0.44756829738616943, mean loss: 0.5236812126971446
Epoch: 0, step: 783, loss: 0.4857145845890045, mean loss: 0.5236327858755782
Epoch: 0, step: 784, loss: 0.49428585171699524, mean loss: 0.5235954012460767
Epoch: 0, step: 785, loss: 0.44225120544433594, mean loss: 0.5234919099028175
Epoch: 0, step: 786, loss: 0.4351733326911926, mean loss: 0.5233796880766274
Epoch: 0, step: 787, loss: 0.42819562554359436, mean loss: 0.5232588961190981
Epoch: 0, step: 788, loss: 0.49222999811172485, mean loss: 0.5232195692521686
Epoch: 0, step: 789, loss: 0.4019184112548828, mean loss: 0.5230660234825518
Epoch: 0, step: 790, loss: 0.41852495074272156, mean loss: 0.5229338603058896
Epoch: 0, step: 791, loss: 0.4771440625190735, mean loss: 0.5228760449046437
Epoch: 0, step: 792, loss: 0.4244590997695923, mean loss: 0.5227519377859362
Epoch: 0, step: 793, loss: 0.4223613739013672, mean loss: 0.5226255013074922
Epoch: 0, step: 794, loss: 0.42947500944137573, mean loss: 0.522508330877472
Epoch: 0, step: 795, loss: 0.4598310887813568, mean loss: 0.5224295906235824
Epoch: 0, step: 796, loss: 0.4274047017097473, mean loss: 0.5223103624066265
Epoch: 0, step: 797, loss: 0.3649291396141052, mean loss: 0.5221131428291923
Epoch: 0, step: 798, loss: 0.45960307121276855, mean loss: 0.5220349074454421
Epoch: 0, step: 799, loss: 0.4188150465488434, mean loss: 0.5219058826193214
Epoch: 0, step: 800, loss: 0.44045454263687134, mean loss: 0.521804195553176
Epoch: 0, step: 801, loss: 0.4361955523490906, mean loss: 0.5216974516090312
Epoch: 0, step: 802, loss: 0.4120788872241974, mean loss: 0.5215609403208807
Epoch: 0, step: 803, loss: 0.47003838419914246, mean loss: 0.5214968575396348
Epoch: 0, step: 804, loss: 0.4578680992126465, mean loss: 0.5214178156038249
Epoch: 0, step: 805, loss: 0.4611610472202301, mean loss: 0.5213430553452845
Epoch: 0, step: 806, loss: 0.44037896394729614, mean loss: 0.5212427280944815
Epoch: 0, step: 807, loss: 0.456299364566803, mean loss: 0.521162352644571
Epoch: 0, step: 808, loss: 0.39116156101226807, mean loss: 0.5210016594534309
Epoch: 0, step: 809, loss: 0.44274213910102844, mean loss: 0.5209050427616378
Epoch: 0, step: 810, loss: 0.4790993332862854, mean loss: 0.5208534944145659
Epoch: 0, step: 811, loss: 0.5781908631324768, mean loss: 0.5209241069376175
Epoch: 0, step: 812, loss: 0.40607738494873047, mean loss: 0.5207828440569423
Epoch: 0, step: 813, loss: 0.4527879059314728, mean loss: 0.5206993121919233
Epoch: 0, step: 814, loss: 0.4230421781539917, mean loss: 0.5205794874875823
Epoch: 0, step: 815, loss: 0.455733984708786, mean loss: 0.5205000199596671
Epoch: 0, step: 816, loss: 0.42922842502593994, mean loss: 0.5203883044211925
Epoch: 0, step: 817, loss: 0.4555043876171112, mean loss: 0.5203089842295006
Epoch: 0, step: 818, loss: 0.4702616333961487, mean loss: 0.5202478763530252
Epoch: 0, step: 819, loss: 0.4639279842376709, mean loss: 0.5201791935577625
Epoch: 0, step: 820, loss: 0.45158326625823975, mean loss: 0.5200956418801748
Epoch: 0, step: 821, loss: 0.40458229184150696, mean loss: 0.5199551146903467
Epoch: 0, step: 822, loss: 0.41263866424560547, mean loss: 0.5198247180312401
Epoch: 0, step: 823, loss: 0.4579631984233856, mean loss: 0.5197496433715219
Epoch: 0, step: 824, loss: 0.47505810856819153, mean loss: 0.5196954718141845
Epoch: 0, step: 825, loss: 0.45435112714767456, mean loss: 0.519616362438075
Epoch: 0, step: 826, loss: 0.4357379674911499, mean loss: 0.5195149375348743
Epoch: 0, step: 827, loss: 0.43598806858062744, mean loss: 0.5194140596738185
Epoch: 0, step: 828, loss: 0.427869975566864, mean loss: 0.519303632551856
Epoch: 0, step: 829, loss: 0.4758049547672272, mean loss: 0.5192512245063323
Epoch: 0, step: 830, loss: 0.38562896847724915, mean loss: 0.5190904275676692
Epoch: 0, step: 831, loss: 0.4398229420185089, mean loss: 0.518995154147538
Epoch: 0, step: 832, loss: 0.40853145718574524, mean loss: 0.5188625446673918
Epoch: 0, step: 833, loss: 0.4414864182472229, mean loss: 0.5187697675373916
Epoch: 0, step: 834, loss: 0.3719477951526642, mean loss: 0.5185939328399248
Epoch: 0, step: 835, loss: 0.5625428557395935, mean loss: 0.5186465033218622
Epoch: 0, step: 836, loss: 0.5279368758201599, mean loss: 0.5186576029305818
Epoch: 0, step: 837, loss: 0.409189909696579, mean loss: 0.518526973225052
Epoch: 0, step: 838, loss: 0.4519416093826294, mean loss: 0.5184476104552757
Epoch: 0, step: 839, loss: 0.43422070145606995, mean loss: 0.5183473403255147
Epoch: 0, step: 840, loss: 0.41357290744781494, mean loss: 0.5182227571710822
Epoch: 0, step: 841, loss: 0.4431624114513397, mean loss: 0.518133611867377
Epoch: 0, step: 842, loss: 0.5382653474807739, mean loss: 0.5181574929297892
Epoch: 0, step: 843, loss: 0.41071897745132446, mean loss: 0.5180301961105019
Epoch: 0, step: 844, loss: 0.48591095209121704, mean loss: 0.5179921851708341
Epoch: 0, step: 845, loss: 0.42579251527786255, mean loss: 0.5178832021094949
Epoch: 0, step: 846, loss: 0.4118437170982361, mean loss: 0.5177580079123152
Epoch: 0, step: 847, loss: 0.4266493320465088, mean loss: 0.5176505684360584
Epoch: 0, step: 848, loss: 0.46957293152809143, mean loss: 0.5175939398884636
Epoch: 0, step: 849, loss: 0.4106735587120056, mean loss: 0.5174681512047266
Epoch: 0, step: 850, loss: 0.376137375831604, mean loss: 0.5173020750879543
Epoch: 0, step: 851, loss: 0.4674241840839386, mean loss: 0.5172435329623628
Epoch: 0, step: 852, loss: 0.4269179105758667, mean loss: 0.5171376412596823
Epoch: 0, step: 853, loss: 0.43308326601982117, mean loss: 0.5170392169327036
Epoch: 0, step: 854, loss: 0.4375513195991516, mean loss: 0.5169462486317287
Epoch: 0, step: 855, loss: 0.4415307641029358, mean loss: 0.5168581464301764
Epoch: 0, step: 856, loss: 0.42425423860549927, mean loss: 0.5167500905283973
Epoch: 0, step: 857, loss: 0.43763187527656555, mean loss: 0.5166578781563089
Epoch: 0, step: 858, loss: 0.46091607213020325, mean loss: 0.5165929866475475
Epoch: 0, step: 859, loss: 0.4707511067390442, mean loss: 0.516539682136026
Epoch: 0, step: 860, loss: 0.4780372977256775, mean loss: 0.5164949639195215
Epoch: 0, step: 861, loss: 0.39553970098495483, mean loss: 0.516354644588971
Epoch: 0, step: 862, loss: 0.4745107889175415, mean loss: 0.5163061580818198
Epoch: 0, step: 863, loss: 0.40482422709465027, mean loss: 0.5161771280691032
Epoch: 0, step: 864, loss: 0.43610823154449463, mean loss: 0.5160845628708088
Epoch: 0, step: 865, loss: 0.4155225157737732, mean loss: 0.5159684404145767
Epoch: 0, step: 866, loss: 0.36901000142097473, mean loss: 0.5157989381781365
Epoch: 0, step: 867, loss: 0.39831098914146423, mean loss: 0.5156635833981403
Epoch: 0, step: 868, loss: 0.5174552798271179, mean loss: 0.5156656451891979
Epoch: 0, step: 869, loss: 0.4130542576313019, mean loss: 0.5155477010655681
Epoch: 0, step: 870, loss: 0.3895239233970642, mean loss: 0.5154030124574528
Epoch: 0, step: 871, loss: 0.4076665937900543, mean loss: 0.515279461518614
Epoch: 0, step: 872, loss: 0.4103708863258362, mean loss: 0.5151592913293898
Epoch: 0, step: 873, loss: 0.4458124339580536, mean loss: 0.5150799470989877
Epoch: 0, step: 874, loss: 0.3817741274833679, mean loss: 0.5149275975908556
Epoch: 0, step: 875, loss: 0.46830931305885315, mean loss: 0.5148743803710703
Epoch: 0, step: 876, loss: 0.42635029554367065, mean loss: 0.5147734407076411
Epoch: 0, step: 877, loss: 0.46134617924690247, mean loss: 0.5147125896125833
Epoch: 0, step: 878, loss: 0.44102901220321655, mean loss: 0.5146287630171232
Epoch: 0, step: 879, loss: 0.4366893768310547, mean loss: 0.5145401955328209
Epoch: 0, step: 880, loss: 0.4381033182144165, mean loss: 0.5144534340375674
Epoch: 0, step: 881, loss: 0.3938333988189697, mean loss: 0.5143166766280225
Epoch: 0, step: 882, loss: 0.4305206537246704, mean loss: 0.5142217773948363
Epoch: 0, step: 883, loss: 0.395170658826828, mean loss: 0.5140871041837866
Epoch: 0, step: 884, loss: 0.43159160017967224, mean loss: 0.5139938889250248
Epoch: 0, step: 885, loss: 0.45614340901374817, mean loss: 0.5139285949296396
Epoch: 0, step: 886, loss: 0.397317111492157, mean loss: 0.5137971276427878
Epoch: 0, step: 887, loss: 0.4642446041107178, mean loss: 0.5137413252514229
Epoch: 0, step: 888, loss: 0.5224241018295288, mean loss: 0.5137510921542104
Epoch: 0, step: 889, loss: 0.47814780473709106, mean loss: 0.5137110884604833
Epoch: 0, step: 890, loss: 0.417129784822464, mean loss: 0.513602691935637
Epoch: 0, step: 891, loss: 0.4907889664173126, mean loss: 0.5135771160101681
Epoch: 0, step: 892, loss: 0.4334093928337097, mean loss: 0.5134873425239682
Epoch: 0, step: 893, loss: 0.42318272590637207, mean loss: 0.513386330648557
Epoch: 0, step: 894, loss: 0.4254522919654846, mean loss: 0.513288080326006
Epoch: 0, step: 895, loss: 0.45379942655563354, mean loss: 0.5132216867392088
Epoch: 0, step: 896, loss: 0.4225609600543976, mean loss: 0.513120615694967
Epoch: 0, step: 897, loss: 0.4109099507331848, mean loss: 0.513006795355366
Epoch: 0, step: 898, loss: 0.46536192297935486, mean loss: 0.5129537977220222
Epoch: 0, step: 899, loss: 0.4409099221229553, mean loss: 0.5128737489713566
Epoch: 0, step: 900, loss: 0.49839258193969727, mean loss: 0.5128576766439075
Epoch: 0, step: 901, loss: 0.42935603857040405, mean loss: 0.5127651027657772
Epoch: 0, step: 902, loss: 0.46069878339767456, mean loss: 0.5127074434973741
Epoch: 0, step: 903, loss: 0.4747229516506195, mean loss: 0.5126654252541808
Epoch: 0, step: 904, loss: 0.40844911336898804, mean loss: 0.5125502691084513
Epoch: 0, step: 905, loss: 0.37210676074028015, mean loss: 0.5123952541985526
Epoch: 0, step: 906, loss: 0.4810463786125183, mean loss: 0.5123606909399131
Epoch: 0, step: 907, loss: 0.43286216259002686, mean loss: 0.5122731374945938
Epoch: 0, step: 908, loss: 0.4026799201965332, mean loss: 0.5121525728991064
Epoch: 0, step: 909, loss: 0.456412672996521, mean loss: 0.5120913202618509
Epoch: 0, step: 910, loss: 0.36862725019454956, mean loss: 0.511933840492293
Epoch: 0, step: 911, loss: 0.5014106035232544, mean loss: 0.5119223018552655
Epoch: 0, step: 912, loss: 0.43132856488227844, mean loss: 0.5118340283207935
Epoch: 0, step: 913, loss: 0.45742249488830566, mean loss: 0.511774497102596
Epoch: 0, step: 914, loss: 0.45987316966056824, mean loss: 0.5117177743403644
Epoch: 0, step: 915, loss: 0.48919931054115295, mean loss: 0.5116931908646011
Epoch: 0, step: 916, loss: 0.44327980279922485, mean loss: 0.5116185852069507
Epoch: 0, step: 917, loss: 0.40427589416503906, mean loss: 0.5115016541709573
Epoch: 0, step: 918, loss: 0.47451648116111755, mean loss: 0.5114614091513601
Epoch: 0, step: 919, loss: 0.41156694293022156, mean loss: 0.5113528282098153
Epoch: 0, step: 920, loss: 0.43716585636138916, mean loss: 0.5112722777517823
Epoch: 0, step: 921, loss: 0.4470132291316986, mean loss: 0.5112025824712833
Epoch: 0, step: 922, loss: 0.36575260758399963, mean loss: 0.5110449985331605
Epoch: 0, step: 923, loss: 0.4776155352592468, mean loss: 0.5110088194603533
Epoch: 0, step: 924, loss: 0.3819584846496582, mean loss: 0.5108693055848822
Epoch: 0, step: 925, loss: 0.49775463342666626, mean loss: 0.5108551428719683
Epoch: 0, step: 926, loss: 0.4309815764427185, mean loss: 0.5107689793698872
Epoch: 0, step: 927, loss: 0.3841436505317688, mean loss: 0.5106325296620875
Epoch: 0, step: 928, loss: 0.48325222730636597, mean loss: 0.5106030567854936
Epoch: 0, step: 929, loss: 0.4099592864513397, mean loss: 0.5104948376776074
Epoch: 0, step: 930, loss: 0.401462197303772, mean loss: 0.5103777242078181
Epoch: 0, step: 931, loss: 0.5159047842025757, mean loss: 0.5103836545297009
Epoch: 0, step: 932, loss: 0.4023551046848297, mean loss: 0.5102678683026431
Epoch: 0, step: 933, loss: 0.4591376483440399, mean loss: 0.5102131250264562
Epoch: 0, step: 934, loss: 0.4493332505226135, mean loss: 0.5101480128612115
Epoch: 0, step: 935, loss: 0.44654613733291626, mean loss: 0.5100800621394932
Epoch: 0, step: 936, loss: 0.4511271119117737, mean loss: 0.5100171454370089
Epoch: 0, step: 937, loss: 0.396725058555603, mean loss: 0.5098963649605895
Epoch: 0, step: 938, loss: 0.48648393154144287, mean loss: 0.509871431591666
Epoch: 0, step: 939, loss: 0.45755353569984436, mean loss: 0.5098157742556109
Epoch: 0, step: 940, loss: 0.42257994413375854, mean loss: 0.5097230688038342
Epoch: 0, step: 941, loss: 0.430657297372818, mean loss: 0.5096391348638862
Epoch: 0, step: 942, loss: 0.4198382794857025, mean loss: 0.5095439059610462
Epoch: 0, step: 943, loss: 0.4170229434967041, mean loss: 0.5094458964669102
Epoch: 0, step: 944, loss: 0.3819727599620819, mean loss: 0.5093110042589686
Epoch: 0, step: 945, loss: 0.5088077187538147, mean loss: 0.5093104722446925
Epoch: 0, step: 946, loss: 0.40087905526161194, mean loss: 0.5091959723323556
Epoch: 0, step: 947, loss: 0.42553234100341797, mean loss: 0.5091077195566921
Epoch: 0, step: 948, loss: 0.44972726702690125, mean loss: 0.5090451479523403
Epoch: 0, step: 949, loss: 0.484375923871994, mean loss: 0.5090191803480453
Epoch: 0, step: 950, loss: 0.41821733117103577, mean loss: 0.5089236999598465
Epoch: 0, step: 951, loss: 0.3984891176223755, mean loss: 0.5088076972473072
Epoch: 0, step: 952, loss: 0.40795189142227173, mean loss: 0.5087018674405653
Epoch: 0, step: 953, loss: 0.4299817979335785, mean loss: 0.5086193516444364
Epoch: 0, step: 954, loss: 0.41806870698928833, mean loss: 0.5085245342154782
Epoch: 0, step: 955, loss: 0.4515022933483124, mean loss: 0.5084648875200104
Epoch: 0, step: 956, loss: 0.46234580874443054, mean loss: 0.5084166962151248
Epoch: 0, step: 957, loss: 0.5030819773674011, mean loss: 0.5084111276150749
Epoch: 0, step: 958, loss: 0.386311799287796, mean loss: 0.5082838081903333
Epoch: 0, step: 959, loss: 0.37824082374572754, mean loss: 0.5081483467482034
Epoch: 0, step: 960, loss: 0.47943630814552307, mean loss: 0.5081184694967958
Epoch: 0, step: 961, loss: 0.4332367777824402, mean loss: 0.5080406299004192
Epoch: 0, step: 962, loss: 0.4468504786491394, mean loss: 0.5079770887257035
Epoch: 0, step: 963, loss: 0.4352703392505646, mean loss: 0.5079016667864139
Epoch: 0, step: 964, loss: 0.4668801426887512, mean loss: 0.5078591574350174
Epoch: 0, step: 965, loss: 0.5199026465415955, mean loss: 0.5078716248150449
Epoch: 0, step: 966, loss: 0.42474114894866943, mean loss: 0.5077856574149763
Epoch: 0, step: 967, loss: 0.3713127672672272, mean loss: 0.5076446730243278
Epoch: 0, step: 968, loss: 0.4168882966041565, mean loss: 0.5075510131931409
Epoch: 0, step: 969, loss: 0.41856446862220764, mean loss: 0.5074592744873977
Epoch: 0, step: 970, loss: 0.45568928122520447, mean loss: 0.5074059583254387
Epoch: 0, step: 971, loss: 0.402208536863327, mean loss: 0.5072977305255806
Epoch: 0, step: 972, loss: 0.4134458601474762, mean loss: 0.5072012743381417
Epoch: 0, step: 973, loss: 0.4224950671195984, mean loss: 0.507114306979601
Epoch: 0, step: 974, loss: 0.4037643373012543, mean loss: 0.5070083070107002
Epoch: 0, step: 975, loss: 0.4185047745704651, mean loss: 0.5069176271618885
Epoch: 0, step: 976, loss: 0.4003117084503174, mean loss: 0.5068085115849064
Epoch: 0, step: 977, loss: 0.4438450336456299, mean loss: 0.5067441317506126
Epoch: 0, step: 978, loss: 0.4661239981651306, mean loss: 0.5067026402964906
Epoch: 0, step: 979, loss: 0.428143709897995, mean loss: 0.5066224781226146
Epoch: 0, step: 980, loss: 0.4254802465438843, mean loss: 0.5065397643289564
Epoch: 0, step: 981, loss: 0.4209343492984772, mean loss: 0.5064525897718989
Epoch: 0, step: 982, loss: 0.4140048921108246, mean loss: 0.5063585432839426
Epoch: 0, step: 983, loss: 0.4290499985218048, mean loss: 0.5062799776896721
Epoch: 0, step: 984, loss: 0.5239299535751343, mean loss: 0.5062978964469163
Epoch: 0, step: 985, loss: 0.41461601853370667, mean loss: 0.506204912797917
Epoch: 0, step: 986, loss: 0.4485239088535309, mean loss: 0.5061464720644374
Epoch: 0, step: 987, loss: 0.39120781421661377, mean loss: 0.5060301373905024
Epoch: 0, step: 988, loss: 0.40177831053733826, mean loss: 0.5059247260387802
Epoch: 0, step: 989, loss: 0.4330889582633972, mean loss: 0.5058511545561789
Epoch: 0, step: 990, loss: 0.4224748909473419, mean loss: 0.5057670210913869
Epoch: 0, step: 991, loss: 0.4547428488731384, mean loss: 0.5057155854339088
Epoch: 0, step: 992, loss: 0.3857755661010742, mean loss: 0.5055947999159502
Epoch: 0, step: 993, loss: 0.4315962791442871, mean loss: 0.505520354724027
Epoch: 0, step: 994, loss: 0.37699654698371887, mean loss: 0.5053911850680066
Epoch: 0, step: 995, loss: 0.4372221529483795, mean loss: 0.5053227422646737
Epoch: 0, step: 996, loss: 0.43166035413742065, mean loss: 0.5052488582244257
Epoch: 0, step: 997, loss: 0.41719314455986023, mean loss: 0.5051606260464051
Epoch: 0, step: 998, loss: 0.41922932863235474, mean loss: 0.5050746087316763
Epoch: 0, step: 999, loss: 0.42461666464805603, mean loss: 0.5049941507875927
Epoch: 0, step: 1000, loss: 0.4684116542339325, mean loss: 0.5049576048369896
Epoch: 0, step: 1001, loss: 0.4663093686103821, mean loss: 0.5049190337429511
Epoch: 0, step: 1002, loss: 0.4556124210357666, mean loss: 0.5048698746076499
Epoch: 0, step: 1003, loss: 0.4371650218963623, mean loss: 0.5048024394953876
Epoch: 0, step: 1004, loss: 0.3765803277492523, mean loss: 0.5046748553045954
Epoch: 0, step: 1005, loss: 0.42811235785484314, mean loss: 0.5045987494423193
Epoch: 0, step: 1006, loss: 0.44665420055389404, mean loss: 0.5045412076857271
Epoch: 0, step: 1007, loss: 0.4350011348724365, mean loss: 0.5044722195182536
Epoch: 0, step: 1008, loss: 0.4511239528656006, mean loss: 0.5044193471033352
Epoch: 0, step: 1009, loss: 0.468121200799942, mean loss: 0.504383408344619
Epoch: 0, step: 1010, loss: 0.4121406078338623, mean loss: 0.5042921691749743
Epoch: 0, step: 1011, loss: 0.4746067523956299, mean loss: 0.5042628357591845
Epoch: 0, step: 1012, loss: 0.4232470989227295, mean loss: 0.5041828597109748
Epoch: 0, step: 1013, loss: 0.4524545967578888, mean loss: 0.5041318456449461
Epoch: 0, step: 1014, loss: 0.37443405389785767, mean loss: 0.5040040645693332
Epoch: 0, step: 1015, loss: 0.40859273076057434, mean loss: 0.5039101557762143
Epoch: 0, step: 1016, loss: 0.44961193203926086, mean loss: 0.5038567651924022
Epoch: 0, step: 1017, loss: 0.42414727807044983, mean loss: 0.5037784651068207
Epoch: 0, step: 1018, loss: 0.38133591413497925, mean loss: 0.5036583055867305
Epoch: 0, step: 1019, loss: 0.4815773367881775, mean loss: 0.5036366575781045
Epoch: 0, step: 1020, loss: 0.3996681869029999, mean loss: 0.503534827538266
Epoch: 0, step: 1021, loss: 0.4322008788585663, mean loss: 0.5034650291540392
Epoch: 0, step: 1022, loss: 0.39183416962623596, mean loss: 0.503355908079232
Epoch: 0, step: 1023, loss: 0.4294310510158539, mean loss: 0.5032837158360061
Epoch: 0, step: 1024, loss: 0.4426174759864807, mean loss: 0.5032245292605431
Epoch: 0, step: 1025, loss: 0.4510799050331116, mean loss: 0.5031737060400485
Epoch: 0, step: 1026, loss: 0.4590003192424774, mean loss: 0.5031306939789019
Epoch: 0, step: 1027, loss: 0.4299224019050598, mean loss: 0.5030594796870013
Epoch: 0, step: 1028, loss: 0.4685482084751129, mean loss: 0.5030259410366495
Epoch: 0, step: 1029, loss: 0.42395031452178955, mean loss: 0.5029491685837225
Epoch: 0, step: 1030, loss: 0.4581846296787262, mean loss: 0.5029057500202841
Epoch: 0, step: 1031, loss: 0.4176814556121826, mean loss: 0.5028231683396561
Epoch: 0, step: 1032, loss: 0.4125785231590271, mean loss: 0.5027358066308656
Epoch: 0, step: 1033, loss: 0.40709245204925537, mean loss: 0.5026433082221793
Epoch: 0, step: 1034, loss: 0.3829103410243988, mean loss: 0.5025276241959012
Epoch: 0, step: 1035, loss: 0.39442911744117737, mean loss: 0.5024232820079141
Epoch: 0, step: 1036, loss: 0.5054261088371277, mean loss: 0.5024261776943454
Epoch: 0, step: 1037, loss: 0.46061640977859497, mean loss: 0.5023858985345037
Epoch: 0, step: 1038, loss: 0.39004284143447876, mean loss: 0.5022777723967751
Epoch: 0, step: 1039, loss: 0.4001862108707428, mean loss: 0.5021796074337692
Epoch: 0, step: 1040, loss: 0.4240018129348755, mean loss: 0.5021045086878528
Epoch: 0, step: 1041, loss: 0.4217274785041809, mean loss: 0.5020273714228013
Epoch: 0, step: 1042, loss: 0.40912824869155884, mean loss: 0.5019383022734905
Epoch: 0, step: 1043, loss: 0.4167667031288147, mean loss: 0.5018567202819726
Epoch: 0, step: 1044, loss: 0.401640921831131, mean loss: 0.5017608199963737
Epoch: 0, step: 1045, loss: 0.42584899067878723, mean loss: 0.5016882465457833
Epoch: 0, step: 1046, loss: 0.4239281415939331, mean loss: 0.5016139771045685
Epoch: 0, step: 1047, loss: 0.40140703320503235, mean loss: 0.5015183597916872
Epoch: 0, step: 1048, loss: 0.45998871326446533, mean loss: 0.5014787700428529
Epoch: 0, step: 1049, loss: 0.4839681386947632, mean loss: 0.5014620932510928
Epoch: 0, step: 1050, loss: 0.39269208908081055, mean loss: 0.5013586013346606
Epoch: 0, step: 1051, loss: 0.39778366684913635, mean loss: 0.5012601460737428
Epoch: 0, step: 1052, loss: 0.4628959894180298, mean loss: 0.5012237128765389
Epoch: 0, step: 1053, loss: 0.43127018213272095, mean loss: 0.5011573433027782
Epoch: 0, step: 1054, loss: 0.4196156859397888, mean loss: 0.5010800526322919
Epoch: 0, step: 1055, loss: 0.5046887397766113, mean loss: 0.5010834699496635
Epoch: 0, step: 1056, loss: 0.434916615486145, mean loss: 0.5010208712226403
Epoch: 0, step: 1057, loss: 0.417738676071167, mean loss: 0.5009421545920624
Epoch: 0, step: 1058, loss: 0.4506722390651703, mean loss: 0.5008946853611588
Epoch: 0, step: 1059, loss: 0.4416087865829468, mean loss: 0.5008387552679718
Epoch: 0, step: 1060, loss: 0.3768889605998993, mean loss: 0.5007219317103205
Epoch: 0, step: 1061, loss: 0.40985164046287537, mean loss: 0.5006363664643249
Epoch: 0, step: 1062, loss: 0.40810373425483704, mean loss: 0.5005493178921616
Epoch: 0, step: 1063, loss: 0.4321187436580658, mean loss: 0.5004850034426935
Epoch: 0, step: 1064, loss: 0.40231144428253174, mean loss: 0.5003928216970033
Epoch: 0, step: 1065, loss: 0.4535180926322937, mean loss: 0.5003488491556668
Epoch: 0, step: 1066, loss: 0.37493258714675903, mean loss: 0.5002313081416003
Epoch: 0, step: 1067, loss: 0.4120796024799347, mean loss: 0.5001487690913553
Epoch: 0, step: 1068, loss: 0.46001365780830383, mean loss: 0.5001112245532047
Epoch: 0, step: 1069, loss: 0.5034394264221191, mean loss: 0.500114335022241
Epoch: 0, step: 1070, loss: 0.40636253356933594, mean loss: 0.5000267983262066
Epoch: 0, step: 1071, loss: 0.412396103143692, mean loss: 0.4999450532747303
Epoch: 0, step: 1072, loss: 0.4444192349910736, mean loss: 0.49989330507502516
Epoch: 0, step: 1073, loss: 0.4122403562068939, mean loss: 0.499811691528593
Epoch: 0, step: 1074, loss: 0.4079369902610779, mean loss: 0.4997262266902046
Epoch: 0, step: 1075, loss: 0.4250872731208801, mean loss: 0.49965685963298406
Epoch: 0, step: 1076, loss: 0.4428533613681793, mean loss: 0.49960411729476234
Epoch: 0, step: 1077, loss: 0.38587626814842224, mean loss: 0.4994986183623446
Epoch: 0, step: 1078, loss: 0.4285779595375061, mean loss: 0.4994328902262697
Epoch: 0, step: 1079, loss: 0.3907665014266968, mean loss: 0.49933227319960344
Epoch: 0, step: 1080, loss: 0.44237613677978516, mean loss: 0.49927958482178675
Epoch: 0, step: 1081, loss: 0.4876398742198944, mean loss: 0.4992688272334301
Epoch: 0, step: 1082, loss: 0.41702038049697876, mean loss: 0.4991928822225931
Epoch: 0, step: 1083, loss: 0.4130030572414398, mean loss: 0.4991133713139389
Epoch: 0, step: 1084, loss: 0.48460716009140015, mean loss: 0.4991000015340103
Epoch: 0, step: 1085, loss: 0.38171249628067017, mean loss: 0.4989919099085468
Epoch: 0, step: 1086, loss: 0.4314725399017334, mean loss: 0.498929794572754
Epoch: 0, step: 1087, loss: 0.3727540969848633, mean loss: 0.498813824262471
Epoch: 0, step: 1088, loss: 0.48275020718574524, mean loss: 0.4987990734662573
Epoch: 0, step: 1089, loss: 0.42227885127067566, mean loss: 0.49872887142754574
Epoch: 0, step: 1090, loss: 0.42349791526794434, mean loss: 0.4986599154640631
Epoch: 0, step: 1091, loss: 0.42586493492126465, mean loss: 0.4985932533939689
Epoch: 0, step: 1092, loss: 0.4162074327468872, mean loss: 0.498517877528784
Epoch: 0, step: 1093, loss: 0.39847224950790405, mean loss: 0.4984264281430245
Epoch: 0, step: 1094, loss: 0.39792102575302124, mean loss: 0.4983346423874172
Epoch: 0, step: 1095, loss: 0.4189850687980652, mean loss: 0.4982622431414415
Epoch: 0, step: 1096, loss: 0.4518212676048279, mean loss: 0.4982199086149724
Epoch: 0, step: 1097, loss: 0.4415934085845947, mean loss: 0.49816833621057316
Epoch: 0, step: 1098, loss: 0.395755410194397, mean loss: 0.4980751488347623
Epoch: 0, step: 1099, loss: 0.3953121602535248, mean loss: 0.49798172793605205
Epoch: 0, step: 1100, loss: 0.3879249095916748, mean loss: 0.4978817671564477
Epoch: 0, step: 1101, loss: 0.39658546447753906, mean loss: 0.4977898467365939
Epoch: 0, step: 1102, loss: 0.40089118480682373, mean loss: 0.4977019966351163
Epoch: 0, step: 1103, loss: 0.4660532474517822, mean loss: 0.49767332928984154
Epoch: 0, step: 1104, loss: 0.44632232189178467, mean loss: 0.4976268577899338
Epoch: 0, step: 1105, loss: 0.5324363708496094, mean loss: 0.49765833112904745
Epoch: 0, step: 1106, loss: 0.3646092712879181, mean loss: 0.4975381422764358
Epoch: 0, step: 1107, loss: 0.41035276651382446, mean loss: 0.49745945511419515
Epoch: 0, step: 1108, loss: 0.39391544461250305, mean loss: 0.49736608810743077
Epoch: 0, step: 1109, loss: 0.4323618710041046, mean loss: 0.49730752574968
Epoch: 0, step: 1110, loss: 0.41873255372047424, mean loss: 0.497236801202399
Epoch: 0, step: 1111, loss: 0.42923781275749207, mean loss: 0.49717565103293415
Epoch: 0, step: 1112, loss: 0.3725700080394745, mean loss: 0.49706369627732455
Epoch: 0, step: 1113, loss: 0.4130809009075165, mean loss: 0.4969883077716066
Epoch: 0, step: 1114, loss: 0.43255913257598877, mean loss: 0.4969305237579782
Epoch: 0, step: 1115, loss: 0.3822113573551178, mean loss: 0.4968277288060043
Epoch: 0, step: 1116, loss: 0.38175973296165466, mean loss: 0.49672471359038717
Epoch: 0, step: 1117, loss: 0.4018023610115051, mean loss: 0.4966398098760948
Epoch: 0, step: 1118, loss: 0.4813726246356964, mean loss: 0.49662616627891837
Epoch: 0, step: 1119, loss: 0.43204715847969055, mean loss: 0.4965685064505262
Epoch: 0, step: 1120, loss: 0.41176366806030273, mean loss: 0.49649285539041005
Epoch: 0, step: 1121, loss: 0.4093721807003021, mean loss: 0.49641520773025843
Epoch: 0, step: 1122, loss: 0.4252023696899414, mean loss: 0.4963517946954941
Epoch: 0, step: 1123, loss: 0.4351554214954376, mean loss: 0.49629734952360793
Epoch: 0, step: 1124, loss: 0.4672568142414093, mean loss: 0.4962715357144682
Epoch: 0, step: 1125, loss: 0.4520912766456604, mean loss: 0.49623229924993106
Epoch: 0, step: 1126, loss: 0.4433305859565735, mean loss: 0.4961853589541961
Epoch: 0, step: 1127, loss: 0.4381507933139801, mean loss: 0.4961339098711817
Epoch: 0, step: 1128, loss: 0.37576961517333984, mean loss: 0.4960272984498373
Epoch: 0, step: 1129, loss: 0.46603819727897644, mean loss: 0.49600075942225247
Epoch: 0, step: 1130, loss: 0.3994775414466858, mean loss: 0.4959154161702847
Epoch: 0, step: 1131, loss: 0.44685742259025574, mean loss: 0.4958720787201256
Epoch: 0, step: 1132, loss: 0.4284290373325348, mean loss: 0.4958125526465267
Epoch: 0, step: 1133, loss: 0.3606484830379486, mean loss: 0.49569336034528455
Epoch: 0, step: 1134, loss: 0.46111783385276794, mean loss: 0.49566289732634844
Epoch: 0, step: 1135, loss: 0.43103650212287903, mean loss: 0.49560600789395104
Epoch: 0, step: 1136, loss: 0.4370534121990204, mean loss: 0.49555451044830906
Epoch: 0, step: 1137, loss: 0.43002834916114807, mean loss: 0.4954969303417298
Epoch: 0, step: 1138, loss: 0.46939581632614136, mean loss: 0.49547401452608836
Epoch: 0, step: 1139, loss: 0.41304370760917664, mean loss: 0.49540170723931914
Epoch: 0, step: 1140, loss: 0.3588293492794037, mean loss: 0.4952820119212123
Epoch: 0, step: 1141, loss: 0.4660890996456146, mean loss: 0.4952564489507433
Epoch: 0, step: 1142, loss: 0.41439858078956604, mean loss: 0.49518570715882626
Epoch: 0, step: 1143, loss: 0.38546285033226013, mean loss: 0.49508979557069116
Epoch: 0, step: 1144, loss: 0.3571186065673828, mean loss: 0.4949692967156664
Epoch: 0, step: 1145, loss: 0.46776336431503296, mean loss: 0.49494555680955765
Epoch: 0, step: 1146, loss: 0.4126320481300354, mean loss: 0.4948737926345973
Epoch: 0, step: 1147, loss: 0.4372466504573822, mean loss: 0.49482359477555793
Epoch: 0, step: 1148, loss: 0.4740549325942993, mean loss: 0.49480551935155337
Epoch: 0, step: 1149, loss: 0.43211856484413147, mean loss: 0.4947510089563295
Epoch: 0, step: 1150, loss: 0.39067691564559937, mean loss: 0.4946605883713506
Epoch: 0, step: 1151, loss: 0.4137953817844391, mean loss: 0.49459039287952167
Epoch: 0, step: 1152, loss: 0.39365339279174805, mean loss: 0.49450284994796245
Epoch: 0, step: 1153, loss: 0.43949058651924133, mean loss: 0.49445517900911606
Epoch: 0, step: 1154, loss: 0.3886675238609314, mean loss: 0.49436358796569774
Epoch: 0, step: 1155, loss: 0.4061948359012604, mean loss: 0.4942873174189292
Epoch: 0, step: 1156, loss: 0.4266904294490814, mean loss: 0.4942288931423779
Epoch: 0, step: 1157, loss: 0.42082342505455017, mean loss: 0.49416550327356284
Epoch: 0, step: 1158, loss: 0.38766512274742126, mean loss: 0.49407361338527456
Epoch: 0, step: 1159, loss: 0.419668972492218, mean loss: 0.4940094714534702
Epoch: 0, step: 1160, loss: 0.3769288957118988, mean loss: 0.49390862685765485
Epoch: 0, step: 1161, loss: 0.49321335554122925, mean loss: 0.4939080285174514
Epoch: 0, step: 1162, loss: 0.38370969891548157, mean loss: 0.49381327500962513
Epoch: 0, step: 1163, loss: 0.4022506773471832, mean loss: 0.49373461298414195
Epoch: 0, step: 1164, loss: 0.4299967885017395, mean loss: 0.4936799024051871
Epoch: 0, step: 1165, loss: 0.4123099446296692, mean loss: 0.4936101168496335
Epoch: 0, step: 1166, loss: 0.41133904457092285, mean loss: 0.4935396189299431
Epoch: 0, step: 1167, loss: 0.4516339600086212, mean loss: 0.49350374079730497
Epoch: 0, step: 1168, loss: 0.41789355874061584, mean loss: 0.4934390614285653
Epoch: 0, step: 1169, loss: 0.4444659352302551, mean loss: 0.4933972040557462
Epoch: 0, step: 1170, loss: 0.40557044744491577, mean loss: 0.49332220255565157
Epoch: 0, step: 1171, loss: 0.441820353269577, mean loss: 0.49327825899824024
Epoch: 0, step: 1172, loss: 0.45531612634658813, mean loss: 0.49324589571379723
Epoch: 0, step: 1173, loss: 0.3819485604763031, mean loss: 0.4931510938950259
Epoch: 0, step: 1174, loss: 0.3475370705127716, mean loss: 0.4930271670666155
Epoch: 0, step: 1175, loss: 0.3964439332485199, mean loss: 0.49294503846643
Epoch: 0, step: 1176, loss: 0.45936161279678345, mean loss: 0.49291650539449317
Epoch: 0, step: 1177, loss: 0.40832656621932983, mean loss: 0.49284469729672137
Epoch: 0, step: 1178, loss: 0.389262318611145, mean loss: 0.4927568411655207
Epoch: 0, step: 1179, loss: 0.39522525668144226, mean loss: 0.4926741872803647
Epoch: 0, step: 1180, loss: 0.41205164790153503, mean loss: 0.4926059209472751
Epoch: 0, step: 1181, loss: 0.3987201452255249, mean loss: 0.492526491356986
Epoch: 0, step: 1182, loss: 0.5306121110916138, mean loss: 0.4925586854565081
Epoch: 0, step: 1183, loss: 0.4399460554122925, mean loss: 0.49251424911356534
Epoch: 0, step: 1184, loss: 0.488192617893219, mean loss: 0.49251060216738785
Epoch: 0, step: 1185, loss: 0.49020087718963623, mean loss: 0.4925086546758383
Epoch: 0, step: 1186, loss: 0.4306171238422394, mean loss: 0.49245651353781505
Epoch: 0, step: 1187, loss: 0.4321978986263275, mean loss: 0.4924057907979906
Epoch: 0, step: 1188, loss: 0.4540536105632782, mean loss: 0.4923735349693659
Epoch: 0, step: 1189, loss: 0.3911310136318207, mean loss: 0.49228845722034276
Epoch: 0, step: 1190, loss: 0.40429240465164185, mean loss: 0.4922145730452221
Epoch: 0, step: 1191, loss: 0.4013150930404663, mean loss: 0.49213831509219796
Epoch: 0, step: 1192, loss: 0.3989828824996948, mean loss: 0.4920602300690693
Epoch: 0, step: 1193, loss: 0.4572877883911133, mean loss: 0.4920311074210978
Epoch: 0, step: 1194, loss: 0.3909556269645691, mean loss: 0.49194652542908396
Epoch: 0, step: 1195, loss: 0.4446350634098053, mean loss: 0.4919069673504725
Epoch: 0, step: 1196, loss: 0.43766963481903076, mean loss: 0.4918616562957261
Epoch: 0, step: 1197, loss: 0.3556543290615082, mean loss: 0.4917479606970331
Epoch: 0, step: 1198, loss: 0.44199544191360474, mean loss: 0.49170646568553733
Epoch: 0, step: 1199, loss: 0.44697538018226624, mean loss: 0.49166918978095125
Epoch: 0, step: 1200, loss: 0.46624788641929626, mean loss: 0.49164802300046695
Epoch: 0, step: 1201, loss: 0.4527766704559326, mean loss: 0.4916156841048392
Epoch: 0, step: 1202, loss: 0.4153147041797638, mean loss: 0.4915522585188666
Epoch: 0, step: 1203, loss: 0.590568482875824, mean loss: 0.4916344979078674
Epoch: 0, step: 1204, loss: 0.40234166383743286, mean loss: 0.49156039597087947
Epoch: 0, step: 1205, loss: 0.3898107707500458, mean loss: 0.49147602646406285
Epoch: 0, step: 1206, loss: 0.394771546125412, mean loss: 0.4913959067620424
Epoch: 0, step: 1207, loss: 0.4536864757537842, mean loss: 0.49136469034564484
Epoch: 0, step: 1208, loss: 0.4280819296836853, mean loss: 0.49131234728471684
Epoch: 0, step: 1209, loss: 0.40246883034706116, mean loss: 0.4912389228905535
Epoch: 0, step: 1210, loss: 0.42199358344078064, mean loss: 0.4911817425937329
Epoch: 0, step: 1211, loss: 0.3501049280166626, mean loss: 0.4910653425817056
Epoch: 0, step: 1212, loss: 0.39088207483291626, mean loss: 0.4909827512645178
Epoch: 0, step: 1213, loss: 0.4592128098011017, mean loss: 0.49095658162575057
Epoch: 0, step: 1214, loss: 0.4500584304332733, mean loss: 0.49092292059596254
Epoch: 0, step: 1215, loss: 0.42758724093437195, mean loss: 0.49087083533308296
Epoch: 0, step: 1216, loss: 0.46022123098373413, mean loss: 0.49084565077733167
Epoch: 0, step: 1217, loss: 0.4678153991699219, mean loss: 0.4908267425247804
Epoch: 0, step: 1218, loss: 0.4363655149936676, mean loss: 0.49078206555387716
Epoch: 0, step: 1219, loss: 0.36354130506515503, mean loss: 0.49067776984855854
Epoch: 0, step: 1220, loss: 0.4157492518424988, mean loss: 0.4906164033309451
Epoch: 0, step: 1221, loss: 0.43822482228279114, mean loss: 0.4905735296966995
Epoch: 0, step: 1222, loss: 0.4195692241191864, mean loss: 0.4905154722105364
Epoch: 0, step: 1223, loss: 0.45256301760673523, mean loss: 0.49048446530318035
Epoch: 0, step: 1224, loss: 0.3855818212032318, mean loss: 0.4903988304916702
Epoch: 0, step: 1225, loss: 0.43131664395332336, mean loss: 0.4903506394749179
Epoch: 0, step: 1226, loss: 0.47603100538253784, mean loss: 0.49033896903148483
Epoch: 0, step: 1227, loss: 0.4117245376110077, mean loss: 0.4902749507648558
Epoch: 0, step: 1228, loss: 0.38333889842033386, mean loss: 0.4901879401445592
Epoch: 0, step: 1229, loss: 0.4069605767726898, mean loss: 0.49012027562149263
Epoch: 0, step: 1230, loss: 0.38395780324935913, mean loss: 0.4900340347828475
Epoch: 0, step: 1231, loss: 0.43460339307785034, mean loss: 0.4899890423788662
Epoch: 0, step: 1232, loss: 0.3883604109287262, mean loss: 0.48990661850907696
Epoch: 0, step: 1233, loss: 0.35357487201690674, mean loss: 0.4897961389738321
Epoch: 0, step: 1234, loss: 0.4288899302482605, mean loss: 0.48974682220563326
Epoch: 0, step: 1235, loss: 0.4867122173309326, mean loss: 0.4897443670236958
Epoch: 0, step: 1236, loss: 0.40351077914237976, mean loss: 0.48967465514990327
Epoch: 0, step: 1237, loss: 0.42292216420173645, mean loss: 0.489620735528782
Epoch: 0, step: 1238, loss: 0.41753503680229187, mean loss: 0.48956255498098017
Epoch: 0, step: 1239, loss: 0.4661661684513092, mean loss: 0.4895436869273272
Epoch: 0, step: 1240, loss: 0.45152318477630615, mean loss: 0.4895130499392925
Epoch: 0, step: 1241, loss: 0.40108129382133484, mean loss: 0.4894418488474101
Epoch: 0, step: 1242, loss: 0.4059518873691559, mean loss: 0.4893746807368081
Epoch: 0, step: 1243, loss: 0.4606421887874603, mean loss: 0.48935158387832794
Epoch: 0, step: 1244, loss: 0.4164353013038635, mean loss: 0.48929301658308744
Epoch: 0, step: 1245, loss: 0.4021753668785095, mean loss: 0.4892230987261817
Epoch: 0, step: 1246, loss: 0.3695319890975952, mean loss: 0.4891271154786848
Epoch: 0, step: 1247, loss: 0.43346062302589417, mean loss: 0.48908251091742455
Epoch: 0, step: 1248, loss: 0.414429634809494, mean loss: 0.4890227408004446
Epoch: 0, step: 1249, loss: 0.3670639097690582, mean loss: 0.4889251737356195
Epoch: 0, step: 1250, loss: 0.41780126094818115, mean loss: 0.4888683200883074
Epoch: 0, step: 1251, loss: 0.4146125018596649, mean loss: 0.4888090103293388
Epoch: 0, step: 1252, loss: 0.3690114915370941, mean loss: 0.48871340177483585
Epoch: 0, step: 1253, loss: 0.4421427845954895, mean loss: 0.48867626412158277
Epoch: 0, step: 1254, loss: 0.3995465338230133, mean loss: 0.4886052444161656
Epoch: 0, step: 1255, loss: 0.4300414025783539, mean loss: 0.48855861715355586
Epoch: 0, step: 1256, loss: 0.39002054929733276, mean loss: 0.4884802256914586
Epoch: 0, step: 1257, loss: 0.39794695377349854, mean loss: 0.48840825965654766
Epoch: 0, step: 1258, loss: 0.41570475697517395, mean loss: 0.4883505126329723
Epoch: 0, step: 1259, loss: 0.4069528877735138, mean loss: 0.4882859113434013
Epoch: 0, step: 1260, loss: 0.45402151346206665, mean loss: 0.4882587389422266
Epoch: 0, step: 1261, loss: 0.3572050631046295, mean loss: 0.48815489292333786
Epoch: 0, step: 1262, loss: 0.4212532341480255, mean loss: 0.48810192248883644
Epoch: 0, step: 1263, loss: 0.40175431966781616, mean loss: 0.4880336095119211
Epoch: 0, step: 1264, loss: 0.37755632400512695, mean loss: 0.4879462756893861
Epoch: 0, step: 1265, loss: 0.4485943913459778, mean loss: 0.487915192052464
Epoch: 0, step: 1266, loss: 0.4039710462093353, mean loss: 0.4878489377937085
Epoch: 0, step: 1267, loss: 0.4136713445186615, mean loss: 0.48779043811446954
Epoch: 0, step: 1268, loss: 0.38332968950271606, mean loss: 0.487708120739677
Epoch: 0, step: 1269, loss: 0.46461164951324463, mean loss: 0.48768993454186094
Epoch: 0, step: 1270, loss: 0.41850584745407104, mean loss: 0.4876355017432081
Epoch: 0, step: 1271, loss: 0.383604496717453, mean loss: 0.48755371636189854
Epoch: 0, step: 1272, loss: 0.4905830919742584, mean loss: 0.4875560960756553
Epoch: 0, step: 1273, loss: 0.3884390592575073, mean loss: 0.48747829620374156
Epoch: 0, step: 1274, loss: 0.3999272286891937, mean loss: 0.4874096286998086
Epoch: 0, step: 1275, loss: 0.39080315828323364, mean loss: 0.4873339182997956
Epoch: 0, step: 1276, loss: 0.4091905951499939, mean loss: 0.4872727254077441
Epoch: 0, step: 1277, loss: 0.5056304931640625, mean loss: 0.48728708985825764
Epoch: 0, step: 1278, loss: 0.40400922298431396, mean loss: 0.4872219781562452
Epoch: 0, step: 1279, loss: 0.40901464223861694, mean loss: 0.4871608786750595
Epoch: 0, step: 1280, loss: 0.3851962685585022, mean loss: 0.4870812810090825
Epoch: 0, step: 1281, loss: 0.3790670931339264, mean loss: 0.4869970265723624
Epoch: 0, step: 1282, loss: 0.40403419733047485, mean loss: 0.4869323634162892
Epoch: 0, step: 1283, loss: 0.3976551592350006, mean loss: 0.48686283288343774
Epoch: 0, step: 1284, loss: 0.44388723373413086, mean loss: 0.4868293888374072
Epoch: 0, step: 1285, loss: 0.4211304187774658, mean loss: 0.48677830099132635
Epoch: 0, step: 1286, loss: 0.42019838094711304, mean loss: 0.48672656834171935
Epoch: 0, step: 1287, loss: 0.4164043962955475, mean loss: 0.4866719703820562
Epoch: 0, step: 1288, loss: 0.42425113916397095, mean loss: 0.48662354460143703
Epoch: 0, step: 1289, loss: 0.435001015663147, mean loss: 0.48658352713714376
Epoch: 0, step: 1290, loss: 0.37504181265830994, mean loss: 0.4864971276681439
Epoch: 0, step: 1291, loss: 0.4561922252178192, mean loss: 0.4864736718612938
Epoch: 0, step: 1292, loss: 0.3881986141204834, mean loss: 0.4863976664028709
Epoch: 0, step: 1293, loss: 0.4437567889690399, mean loss: 0.4863647136382389
Epoch: 0, step: 1294, loss: 0.4100762605667114, mean loss: 0.48630580363586706
Epoch: 0, step: 1295, loss: 0.39906829595565796, mean loss: 0.4862384907441385
Epoch: 0, step: 1296, loss: 0.42548438906669617, mean loss: 0.4861916487227989
Epoch: 0, step: 1297, loss: 0.4295918345451355, mean loss: 0.48614804331896405
Epoch: 0, step: 1298, loss: 0.516811192035675, mean loss: 0.486171648514281
Epoch: 0, step: 1299, loss: 0.47447848320007324, mean loss: 0.4861626537717316
Epoch: 0, step: 1300, loss: 0.3986642360687256, mean loss: 0.4860953990309914
Epoch: 0, step: 1301, loss: 0.4112248420715332, mean loss: 0.4860378947629734
Epoch: 0, step: 1302, loss: 0.42156872153282166, mean loss: 0.4859884172700876
Epoch: 0, step: 1303, loss: 0.4354506731033325, mean loss: 0.48594966133130946
Epoch: 0, step: 1304, loss: 0.45274585485458374, mean loss: 0.48592421780144224
Epoch: 0, step: 1305, loss: 0.4530971944332123, mean loss: 0.4858990822552185
Epoch: 0, step: 1306, loss: 0.3638090491294861, mean loss: 0.4858056698350764
Epoch: 0, step: 1307, loss: 0.44416579604148865, mean loss: 0.48577383506917915
Epoch: 0, step: 1308, loss: 0.3809357285499573, mean loss: 0.4856937448426557
Epoch: 0, step: 1309, loss: 0.37474438548088074, mean loss: 0.485609050675204
Epoch: 0, step: 1310, loss: 0.38370639085769653, mean loss: 0.485531321720347
Epoch: 0, step: 1311, loss: 0.4355021119117737, mean loss: 0.48549318970067584
Epoch: 0, step: 1312, loss: 0.40860626101493835, mean loss: 0.48543463149147115
Epoch: 0, step: 1313, loss: 0.39246079325675964, mean loss: 0.4853638751457826
Epoch: 0, step: 1314, loss: 0.435576856136322, mean loss: 0.48532601429482486
Epoch: 0, step: 1315, loss: 0.40146321058273315, mean loss: 0.4852622887600892
Epoch: 0, step: 1316, loss: 0.3888746201992035, mean loss: 0.48518910146429506
Epoch: 0, step: 1317, loss: 0.38654810190200806, mean loss: 0.4851142600382235
Epoch: 0, step: 1318, loss: 0.4083670973777771, mean loss: 0.48505607416812463
Epoch: 0, step: 1319, loss: 0.3951539695262909, mean loss: 0.48498796651309295
Epoch: 0, step: 1320, loss: 0.46204236149787903, mean loss: 0.4849705966379868
Epoch: 0, step: 1321, loss: 0.4264816641807556, mean loss: 0.48492635387515987
Epoch: 0, step: 1322, loss: 0.5395148992538452, mean loss: 0.4849676150583637
Epoch: 0, step: 1323, loss: 0.4520052969455719, mean loss: 0.48494271904770453
Epoch: 0, step: 1324, loss: 0.3916710615158081, mean loss: 0.4848723253439069
Epoch: 0, step: 1325, loss: 0.39467886090278625, mean loss: 0.4848043061399543
Epoch: 0, step: 1326, loss: 0.40367576479911804, mean loss: 0.4847431693341209
Epoch: 0, step: 1327, loss: 0.4709790349006653, mean loss: 0.4847328047750596
Epoch: 0, step: 1328, loss: 0.38548991084098816, mean loss: 0.4846581299113018
Epoch: 0, step: 1329, loss: 0.4053748846054077, mean loss: 0.4845985184486658
Epoch: 0, step: 1330, loss: 0.4454640746116638, mean loss: 0.484569116161786
Epoch: 0, step: 1331, loss: 0.4511288106441498, mean loss: 0.4845440108273133
Epoch: 0, step: 1332, loss: 0.4925256669521332, mean loss: 0.4845499985663417
Epoch: 0, step: 1333, loss: 0.4627654552459717, mean loss: 0.4845336683239726
Epoch: 0, step: 1334, loss: 0.4043603837490082, mean loss: 0.4844736134291599
Epoch: 0, step: 1335, loss: 0.41368263959884644, mean loss: 0.4844206261732989
Epoch: 0, step: 1336, loss: 0.3760069012641907, mean loss: 0.48433953886970194
Epoch: 0, step: 1337, loss: 0.4199666976928711, mean loss: 0.4842914276281647
Epoch: 0, step: 1338, loss: 0.3989393413066864, mean loss: 0.48422768447183795
Epoch: 0, step: 1339, loss: 0.41196638345718384, mean loss: 0.48417375812779717
Epoch: 0, step: 1340, loss: 0.4608372747898102, mean loss: 0.4841563558285146
Epoch: 0, step: 1341, loss: 0.4088411331176758, mean loss: 0.48410023420205345
Epoch: 0, step: 1342, loss: 0.4550837278366089, mean loss: 0.4840786284638811
Epoch: 0, step: 1343, loss: 0.43540051579475403, mean loss: 0.4840424096300499
Epoch: 0, step: 1344, loss: 0.4510769844055176, mean loss: 0.48401790002021755
Epoch: 0, step: 1345, loss: 0.40669679641723633, mean loss: 0.4839604549209583
Epoch: 0, step: 1346, loss: 0.4069015681743622, mean loss: 0.48390324713569727
Epoch: 0, step: 1347, loss: 0.4040869176387787, mean loss: 0.48384403620877076
Epoch: 0, step: 1348, loss: 0.39568808674812317, mean loss: 0.4837786870987184
Epoch: 0, step: 1349, loss: 0.3618173897266388, mean loss: 0.4836883453969613
Epoch: 0, step: 1350, loss: 0.4333842694759369, mean loss: 0.48365111069975847
Epoch: 0, step: 1351, loss: 0.4609470069408417, mean loss: 0.48363431772360543
Epoch: 0, step: 1352, loss: 0.398896187543869, mean loss: 0.48357168791563815
Epoch: 0, step: 1353, loss: 0.3858197033405304, mean loss: 0.4834994929491868
Epoch: 0, step: 1354, loss: 0.5031869411468506, mean loss: 0.4835140224312515
Epoch: 0, step: 1355, loss: 0.41704314947128296, mean loss: 0.48346500261343445
Epoch: 0, step: 1356, loss: 0.375497430562973, mean loss: 0.48338543918524696
Epoch: 0, step: 1357, loss: 0.46110019087791443, mean loss: 0.4833690288403962
Epoch: 0, step: 1358, loss: 0.46122828125953674, mean loss: 0.4833527368995714
Epoch: 0, step: 1359, loss: 0.39618945121765137, mean loss: 0.48328864624833473
Epoch: 0, step: 1360, loss: 0.4611119031906128, mean loss: 0.4832723518008272
Epoch: 0, step: 1361, loss: 0.39658820629119873, mean loss: 0.483208707053757
Epoch: 0, step: 1362, loss: 0.45046359300613403, mean loss: 0.48318468275878446
Epoch: 0, step: 1363, loss: 0.42564013600349426, mean loss: 0.48314249467465303
Epoch: 0, step: 1364, loss: 0.4020114541053772, mean loss: 0.4830830580148953
Epoch: 0, step: 1365, loss: 0.4076160490512848, mean loss: 0.4830278113026233
Epoch: 0, step: 1366, loss: 0.3509708046913147, mean loss: 0.4829312077864482
Epoch: 0, step: 1367, loss: 0.44771134853363037, mean loss: 0.4829054622752985
Epoch: 0, step: 1368, loss: 0.3945778012275696, mean loss: 0.48284094243523445
Epoch: 0, step: 1369, loss: 0.39040428400039673, mean loss: 0.4827734704217784
Epoch: 0, step: 1370, loss: 0.3760058581829071, mean loss: 0.48269559470169165
Epoch: 0, step: 1371, loss: 0.3721800148487091, mean loss: 0.4826150439875131
Epoch: 0, step: 1372, loss: 0.3934035301208496, mean loss: 0.4825500683765396
Epoch: 0, step: 1373, loss: 0.44936636090278625, mean loss: 0.4825259172066169
Epoch: 0, step: 1374, loss: 0.4479501247406006, mean loss: 0.48250077117573253
Epoch: 0, step: 1375, loss: 0.4132830798625946, mean loss: 0.48245046762099913
Epoch: 0, step: 1376, loss: 0.45229241251945496, mean loss: 0.48242856634641557
Epoch: 0, step: 1377, loss: 0.4688023328781128, mean loss: 0.48241867793315846
Epoch: 0, step: 1378, loss: 0.3816850483417511, mean loss: 0.48234562961583327
Epoch: 0, step: 1379, loss: 0.4316003918647766, mean loss: 0.48230885770441945
Epoch: 0, step: 1380, loss: 0.4718027412891388, mean loss: 0.4823012500893468
Epoch: 0, step: 1381, loss: 0.4102567136287689, mean loss: 0.4822491194551496
Epoch: 0, step: 1382, loss: 0.3828926384449005, mean loss: 0.4821772781818233
Epoch: 0, step: 1383, loss: 0.40893134474754333, mean loss: 0.4821243548195153
Epoch: 0, step: 1384, loss: 0.40415701270103455, mean loss: 0.4820680607096825
Epoch: 0, step: 1385, loss: 0.46452486515045166, mean loss: 0.4820554032814291
Epoch: 0, step: 1386, loss: 0.3904937207698822, mean loss: 0.4819893890907214
Epoch: 0, step: 1387, loss: 0.4358829855918884, mean loss: 0.4819561712207655
Epoch: 0, step: 1388, loss: 0.3854728937149048, mean loss: 0.48188670881795354
Epoch: 0, step: 1389, loss: 0.3636798560619354, mean loss: 0.4818016679166902
Epoch: 0, step: 1390, loss: 0.3977838456630707, mean loss: 0.48174126689422175
Epoch: 0, step: 1391, loss: 0.4495396614074707, mean loss: 0.4817181335569468
Epoch: 0, step: 1392, loss: 0.4910847842693329, mean loss: 0.4817248576421675
Epoch: 0, step: 1393, loss: 0.4190262258052826, mean loss: 0.4816798801444366
Epoch: 0, step: 1394, loss: 0.3758997917175293, mean loss: 0.4816040521240589
Epoch: 0, step: 1395, loss: 0.4627954363822937, mean loss: 0.4815905789036135
Epoch: 0, step: 1396, loss: 0.40726330876350403, mean loss: 0.48153737398583246
Epoch: 0, step: 1397, loss: 0.4505331814289093, mean loss: 0.4815151964518146
Epoch: 0, step: 1398, loss: 0.4635330140590668, mean loss: 0.48150234285467897
Epoch: 0, step: 1399, loss: 0.4638291597366333, mean loss: 0.4814897191524518
Epoch: 0, step: 1400, loss: 0.4505840837955475, mean loss: 0.4814676594555518
Epoch: 0, step: 1401, loss: 0.3899047374725342, mean loss: 0.4814023506666909
Epoch: 0, step: 1402, loss: 0.37502825260162354, mean loss: 0.48132653163742145
Epoch: 0, step: 1403, loss: 0.43115246295928955, mean loss: 0.48129079512126893
Epoch: 0, step: 1404, loss: 0.44490283727645874, mean loss: 0.4812648962188883
Epoch: 0, step: 1405, loss: 0.40381667017936707, mean loss: 0.4812098121320892
Epoch: 0, step: 1406, loss: 0.5313630104064941, mean loss: 0.4812454576177142
Epoch: 0, step: 1407, loss: 0.40186265110969543, mean loss: 0.4811890777835466
Epoch: 0, step: 1408, loss: 0.4354543089866638, mean loss: 0.4811566187567213
Epoch: 0, step: 1409, loss: 0.4481010138988495, mean loss: 0.4811331750653327
Epoch: 0, step: 1410, loss: 0.39459556341171265, mean loss: 0.48107184436961786
Epoch: 0, step: 1411, loss: 0.40487128496170044, mean loss: 0.4810178779677709
Epoch: 0, step: 1412, loss: 0.3670579791069031, mean loss: 0.48093722694239166
Epoch: 0, step: 1413, loss: 0.4279511868953705, mean loss: 0.4808997544953994
Epoch: 0, step: 1414, loss: 0.46305230259895325, mean loss: 0.4808871414551899
Epoch: 0, step: 1415, loss: 0.4645228683948517, mean loss: 0.48087558476517556
Epoch: 0, step: 1416, loss: 0.513188898563385, mean loss: 0.4808983887974961
Epoch: 0, step: 1417, loss: 0.4156876802444458, mean loss: 0.4808524009917464
Epoch: 0, step: 1418, loss: 0.41014546155929565, mean loss: 0.48080257228178697
Epoch: 0, step: 1419, loss: 0.45519179105758667, mean loss: 0.48078453652036146
Epoch: 0, step: 1420, loss: 0.45508602261543274, mean loss: 0.48076645171113913
Epoch: 0, step: 1421, loss: 0.4243136942386627, mean loss: 0.4807267521629869
Epoch: 0, step: 1422, loss: 0.4224386513233185, mean loss: 0.4806857907428606
Epoch: 0, step: 1423, loss: 0.4328901171684265, mean loss: 0.4806522263653505
Epoch: 0, step: 1424, loss: 0.42185041308403015, mean loss: 0.48061096193497765
Epoch: 0, step: 1425, loss: 0.43771278858184814, mean loss: 0.48058087906446356
Epoch: 0, step: 1426, loss: 0.41194674372673035, mean loss: 0.4805327822632458
Epoch: 0, step: 1427, loss: 0.37032538652420044, mean loss: 0.4804556062158095
Epoch: 0, step: 1428, loss: 0.4449878931045532, mean loss: 0.4804307862626176
Epoch: 0, step: 1429, loss: 0.3699286878108978, mean loss: 0.4803535120678961
Epoch: 0, step: 1430, loss: 0.42071396112442017, mean loss: 0.48031183523285526
Epoch: 0, step: 1431, loss: 0.4276922941207886, mean loss: 0.48027508974325184
Epoch: 0, step: 1432, loss: 0.37763625383377075, mean loss: 0.48020346459607144
Epoch: 0, step: 1433, loss: 0.41504746675491333, mean loss: 0.48015802805643326
Epoch: 0, step: 1434, loss: 0.4674062728881836, mean loss: 0.4801491418158979
Epoch: 0, step: 1435, loss: 0.4265941381454468, mean loss: 0.48011184724509676
Epoch: 0, step: 1436, loss: 0.4114669859409332, mean loss: 0.48006407768260256
Epoch: 0, step: 1437, loss: 0.4293433129787445, mean loss: 0.4800288059408057
Epoch: 0, step: 1438, loss: 0.4325304329395294, mean loss: 0.47999579803739967
Epoch: 0, step: 1439, loss: 0.40372732281684875, mean loss: 0.4799428338184965
Epoch: 0, step: 1440, loss: 0.41238629817962646, mean loss: 0.47989595211437514
Epoch: 0, step: 1441, loss: 0.4601987898349762, mean loss: 0.47988229250114395
Epoch: 0, step: 1442, loss: 0.5283278822898865, mean loss: 0.4799158653284404
Epoch: 0, step: 1443, loss: 0.4577213227748871, mean loss: 0.4799004951466166
Valid: 0, mean loss: 0.26723238329092663
Epoch: 1, step: 0, loss: 0.40746042132377625, mean loss: 0.47985036360763883
Epoch: 1, step: 1, loss: 0.38926222920417786, mean loss: 0.47978771621178584
Epoch: 1, step: 2, loss: 0.4075525403022766, mean loss: 0.4797377955649928
Epoch: 1, step: 3, loss: 0.36705127358436584, mean loss: 0.4796599733813045
Epoch: 1, step: 4, loss: 0.46956634521484375, mean loss: 0.4796530074543435
Epoch: 1, step: 5, loss: 0.3999726176261902, mean loss: 0.4795980554613586
Epoch: 1, step: 6, loss: 0.42170920968055725, mean loss: 0.4795581596338046
Epoch: 1, step: 7, loss: 0.47606566548347473, mean loss: 0.479555754334803
Epoch: 1, step: 8, loss: 0.45293736457824707, mean loss: 0.4795374347272624
Epoch: 1, step: 9, loss: 0.3735721707344055, mean loss: 0.47946455627884915
Epoch: 1, step: 10, loss: 0.3845205307006836, mean loss: 0.4793993026530222
Epoch: 1, step: 11, loss: 0.4881264865398407, mean loss: 0.4794052965979994
Epoch: 1, step: 12, loss: 0.40548741817474365, mean loss: 0.4793545636684021
Epoch: 1, step: 13, loss: 0.4472314119338989, mean loss: 0.47933253132839215
Epoch: 1, step: 14, loss: 0.4038909375667572, mean loss: 0.4792808235876371
Epoch: 1, step: 15, loss: 0.4343468248844147, mean loss: 0.4792500468761965
Epoch: 1, step: 16, loss: 0.4418950378894806, mean loss: 0.4792244787660071
Epoch: 1, step: 17, loss: 0.39560532569885254, mean loss: 0.4791672837228695
Epoch: 1, step: 18, loss: 0.40520036220550537, mean loss: 0.47911672533495603
Epoch: 1, step: 19, loss: 0.4111998975276947, mean loss: 0.4790703340591314
Epoch: 1, step: 20, loss: 0.4064754843711853, mean loss: 0.4790207812607096
Epoch: 1, step: 21, loss: 0.38895341753959656, mean loss: 0.47895934376840327
Epoch: 1, step: 22, loss: 0.3907333314418793, mean loss: 0.4788992033373695
Epoch: 1, step: 23, loss: 0.3934948742389679, mean loss: 0.47884102600147144
Epoch: 1, step: 24, loss: 0.41100212931632996, mean loss: 0.4787948456769751
Epoch: 1, step: 25, loss: 0.42083704471588135, mean loss: 0.4787554186014914
Epoch: 1, step: 26, loss: 0.38762366771698, mean loss: 0.47869346635751825
Epoch: 1, step: 27, loss: 0.3844437003135681, mean loss: 0.4786294379838471
Epoch: 1, step: 28, loss: 0.3905898630619049, mean loss: 0.4785696690938797
Epoch: 1, step: 29, loss: 0.4364601969718933, mean loss: 0.4785411009309747
Epoch: 1, step: 30, loss: 0.4170965254306793, mean loss: 0.4784994435916525
Epoch: 1, step: 31, loss: 0.4655422866344452, mean loss: 0.47849066503002835
Epoch: 1, step: 32, loss: 0.4770185649394989, mean loss: 0.4784896683475026
Epoch: 1, step: 33, loss: 0.40829527378082275, mean loss: 0.4784421755230326
Epoch: 1, step: 34, loss: 0.41451528668403625, mean loss: 0.4783989524744599
Epoch: 1, step: 35, loss: 0.41217726469039917, mean loss: 0.478354208090822
Epoch: 1, step: 36, loss: 0.40265411138534546, mean loss: 0.47830309391343817
Epoch: 1, step: 37, loss: 0.4171501696109772, mean loss: 0.4782618301318576
Epoch: 1, step: 38, loss: 0.4316183030605316, mean loss: 0.47823037798953033
Epoch: 1, step: 39, loss: 0.3904074430465698, mean loss: 0.47817119811423187
Epoch: 1, step: 40, loss: 0.435442179441452, mean loss: 0.4781424243642839
Epoch: 1, step: 41, loss: 0.38556382060050964, mean loss: 0.47808012382339304
Epoch: 1, step: 42, loss: 0.4778831899166107, mean loss: 0.478079991386334
Epoch: 1, step: 43, loss: 0.4582444131374359, mean loss: 0.4780666610246076
Epoch: 1, step: 44, loss: 0.37097492814064026, mean loss: 0.4779947391086345
Epoch: 1, step: 45, loss: 0.39483577013015747, mean loss: 0.47793892772005836
Epoch: 1, step: 46, loss: 0.38941389322280884, mean loss: 0.4778795547928302
Epoch: 1, step: 47, loss: 0.44601625204086304, mean loss: 0.47785819869178997
Epoch: 1, step: 48, loss: 0.40019914507865906, mean loss: 0.47780618325065594
Epoch: 1, step: 49, loss: 0.40452390909194946, mean loss: 0.47775713219700217
Epoch: 1, step: 50, loss: 0.4368656873703003, mean loss: 0.47772978005999434
Epoch: 1, step: 51, loss: 0.3642805218696594, mean loss: 0.4776539449943591
Epoch: 1, step: 52, loss: 0.4649079740047455, mean loss: 0.47764543065168064
Epoch: 1, step: 53, loss: 0.4363737106323242, mean loss: 0.47761787943671447
Epoch: 1, step: 54, loss: 0.41630879044532776, mean loss: 0.4775769794440584
Epoch: 1, step: 55, loss: 0.42212826013565063, mean loss: 0.47754001363118614
Epoch: 1, step: 56, loss: 0.43296146392822266, mean loss: 0.47751031439753994
Epoch: 1, step: 57, loss: 0.41600361466407776, mean loss: 0.4774693645308732
Epoch: 1, step: 58, loss: 0.4180888235569, mean loss: 0.4774298565195798
Epoch: 1, step: 59, loss: 0.4000340402126312, mean loss: 0.47737839653533315
Epoch: 1, step: 60, loss: 0.37604179978370667, mean loss: 0.477311063248455
Epoch: 1, step: 61, loss: 0.35651031136512756, mean loss: 0.47723085026579676
Epoch: 1, step: 62, loss: 0.3723280131816864, mean loss: 0.47716123988949677
Epoch: 1, step: 63, loss: 0.44538241624832153, mean loss: 0.4771401663990185
Epoch: 1, step: 64, loss: 0.395577996969223, mean loss: 0.4770861159222592
Epoch: 1, step: 65, loss: 0.4089314639568329, mean loss: 0.4770409803911563
Epoch: 1, step: 66, loss: 0.3983970582485199, mean loss: 0.4769889327921208
Epoch: 1, step: 67, loss: 0.3946968615055084, mean loss: 0.47693450681904764
Epoch: 1, step: 68, loss: 0.4352404773235321, mean loss: 0.4769069496283698
Epoch: 1, step: 69, loss: 0.38502001762390137, mean loss: 0.47684625812770637
Epoch: 1, step: 70, loss: 0.44932132959365845, mean loss: 0.4768280898580469
Epoch: 1, step: 71, loss: 0.41662582755088806, mean loss: 0.47678837860322687
Epoch: 1, step: 72, loss: 0.42269134521484375, mean loss: 0.47675271806704467
Epoch: 1, step: 73, loss: 0.4106493890285492, mean loss: 0.4767091717369798
Epoch: 1, step: 74, loss: 0.4662388861179352, mean loss: 0.47670227885638794
Epoch: 1, step: 75, loss: 0.44935137033462524, mean loss: 0.4766842848376236
Epoch: 1, step: 76, loss: 0.39867621660232544, mean loss: 0.47663299748178184
Epoch: 1, step: 77, loss: 0.3986891806125641, mean loss: 0.47658178603837237
Epoch: 1, step: 78, loss: 0.3685171604156494, mean loss: 0.4765108309329077
Epoch: 1, step: 79, loss: 0.4002649188041687, mean loss: 0.47646080080683895
Epoch: 1, step: 80, loss: 0.4347488284111023, mean loss: 0.47643344869379256
Epoch: 1, step: 81, loss: 0.4135095179080963, mean loss: 0.4763922141388871
Epoch: 1, step: 82, loss: 0.45118799805641174, mean loss: 0.47637570843090904
Epoch: 1, step: 83, loss: 0.3918917775154114, mean loss: 0.4763204179002052
Epoch: 1, step: 84, loss: 0.3826330006122589, mean loss: 0.47625914424599464
Epoch: 1, step: 85, loss: 0.4036642014980316, mean loss: 0.476211696570996
Epoch: 1, step: 86, loss: 0.38058263063430786, mean loss: 0.47614923473824833
Epoch: 1, step: 87, loss: 0.4111109673976898, mean loss: 0.47610678156113306
Epoch: 1, step: 88, loss: 0.40814417600631714, mean loss: 0.47606244848510254
Epoch: 1, step: 89, loss: 0.42439085245132446, mean loss: 0.47602876426343776
Epoch: 1, step: 90, loss: 0.4198741018772125, mean loss: 0.47599218142149236
Epoch: 1, step: 91, loss: 0.4103260338306427, mean loss: 0.47594943002332124
Epoch: 1, step: 92, loss: 0.3947126865386963, mean loss: 0.4758965759286663
Epoch: 1, step: 93, loss: 0.39340442419052124, mean loss: 0.47584293993923965
Epoch: 1, step: 94, loss: 0.4470408260822296, mean loss: 0.47582422511542094
Epoch: 1, step: 95, loss: 0.4254840910434723, mean loss: 0.4757915367166729
Epoch: 1, step: 96, loss: 0.3952869772911072, mean loss: 0.47573929495195805
Epoch: 1, step: 97, loss: 0.4047001302242279, mean loss: 0.47569322545472864
Epoch: 1, step: 98, loss: 0.3936297595500946, mean loss: 0.47564004109574964
Epoch: 1, step: 99, loss: 0.3931829631328583, mean loss: 0.4755866362525094
Epoch: 1, step: 100, loss: 0.37293264269828796, mean loss: 0.4755201935382348
Epoch: 1, step: 101, loss: 0.3705675005912781, mean loss: 0.47545230693218893
Epoch: 1, step: 102, loss: 0.40000447630882263, mean loss: 0.47540353651808204
Epoch: 1, step: 103, loss: 0.4249819219112396, mean loss: 0.4753709644156228
Epoch: 1, step: 104, loss: 0.427608460187912, mean loss: 0.4753401300035972
Epoch: 1, step: 105, loss: 0.43148285150527954, mean loss: 0.4753118349852112
Epoch: 1, step: 106, loss: 0.4104037582874298, mean loss: 0.4752699858061668
Epoch: 1, step: 107, loss: 0.40693044662475586, mean loss: 0.4752259525979314
Epoch: 1, step: 108, loss: 0.4435659646987915, mean loss: 0.4752055662567214
Epoch: 1, step: 109, loss: 0.40182632207870483, mean loss: 0.47515834666587325
Epoch: 1, step: 110, loss: 0.411612331867218, mean loss: 0.47511748106150115
Epoch: 1, step: 111, loss: 0.4432726204395294, mean loss: 0.47509701521277237
Epoch: 1, step: 112, loss: 0.3931591510772705, mean loss: 0.47504438973805463
Epoch: 1, step: 113, loss: 0.34203043580055237, mean loss: 0.4749590149280819
Epoch: 1, step: 114, loss: 0.4478129744529724, mean loss: 0.4749416024582454
Epoch: 1, step: 115, loss: 0.38049402832984924, mean loss: 0.4748810591414964
Epoch: 1, step: 116, loss: 0.3668740391731262, mean loss: 0.47481186822543725
Epoch: 1, step: 117, loss: 0.3884090185165405, mean loss: 0.47475655270065564
Epoch: 1, step: 118, loss: 0.3955523669719696, mean loss: 0.47470587823761745
Epoch: 1, step: 119, loss: 0.38014480471611023, mean loss: 0.4746454171931664
Epoch: 1, step: 120, loss: 0.3676868975162506, mean loss: 0.4745770730911364
Epoch: 1, step: 121, loss: 0.45350226759910583, mean loss: 0.47456361536093716
Epoch: 1, step: 122, loss: 0.4758075475692749, mean loss: 0.474564409191319
Epoch: 1, step: 123, loss: 0.41542649269104004, mean loss: 0.4745266936833469
Epoch: 1, step: 124, loss: 0.3418673276901245, mean loss: 0.47444214341821417
Epoch: 1, step: 125, loss: 0.4002477526664734, mean loss: 0.47439488584448697
Epoch: 1, step: 126, loss: 0.3609415292739868, mean loss: 0.4743226685583186
Epoch: 1, step: 127, loss: 0.36825263500213623, mean loss: 0.47425519398226507
Epoch: 1, step: 128, loss: 0.41852396726608276, mean loss: 0.47421976408606914
Epoch: 1, step: 129, loss: 0.4222733974456787, mean loss: 0.4741867613118376
Epoch: 1, step: 130, loss: 0.44171562790870667, mean loss: 0.4741661447192007
Epoch: 1, step: 131, loss: 0.4090772569179535, mean loss: 0.47412484466348925
Epoch: 1, step: 132, loss: 0.4118366241455078, mean loss: 0.47408534674305935
Epoch: 1, step: 133, loss: 0.389838844537735, mean loss: 0.4740319585921054
Epoch: 1, step: 134, loss: 0.4194105863571167, mean loss: 0.473997366209436
Epoch: 1, step: 135, loss: 0.4211236834526062, mean loss: 0.4739639018532608
Epoch: 1, step: 136, loss: 0.4884565770626068, mean loss: 0.47397306863074934
Epoch: 1, step: 137, loss: 0.36547765135765076, mean loss: 0.4739044874567461
Epoch: 1, step: 138, loss: 0.3822636008262634, mean loss: 0.4738465968145285
Epoch: 1, step: 139, loss: 0.3808754086494446, mean loss: 0.4737879028826061
Epoch: 1, step: 140, loss: 0.4170820116996765, mean loss: 0.473752126295109
Epoch: 1, step: 141, loss: 0.3668777048587799, mean loss: 0.4736847401529675
Epoch: 1, step: 142, loss: 0.42709314823150635, mean loss: 0.47365538187198364
Epoch: 1, step: 143, loss: 0.38961008191108704, mean loss: 0.47360245662011907
Epoch: 1, step: 144, loss: 0.44022268056869507, mean loss: 0.47358144983846306
Epoch: 1, step: 145, loss: 0.42121315002441406, mean loss: 0.4735485138008442
Epoch: 1, step: 146, loss: 0.4339493215084076, mean loss: 0.4735236243022317
Epoch: 1, step: 147, loss: 0.45106565952301025, mean loss: 0.47350951754043574
Epoch: 1, step: 148, loss: 0.3571743369102478, mean loss: 0.47343648855071185
Epoch: 1, step: 149, loss: 0.4054745137691498, mean loss: 0.47339385243102455
Epoch: 1, step: 150, loss: 0.38247618079185486, mean loss: 0.47333685075601567
Epoch: 1, step: 151, loss: 0.4998560845851898, mean loss: 0.47335346681731216
Epoch: 1, step: 152, loss: 0.44798463582992554, mean loss: 0.4733375815129995
Epoch: 1, step: 153, loss: 0.4864794909954071, mean loss: 0.4733458054863927
Epoch: 1, step: 154, loss: 0.37515702843666077, mean loss: 0.47328439912175874
Epoch: 1, step: 155, loss: 0.46066588163375854, mean loss: 0.47327651254832875
Epoch: 1, step: 156, loss: 0.3904932141304016, mean loss: 0.47322480530384536
Epoch: 1, step: 157, loss: 0.38597598671913147, mean loss: 0.4731703428702719
Epoch: 1, step: 158, loss: 0.41350361704826355, mean loss: 0.47313312095771914
Epoch: 1, step: 159, loss: 0.40841540694236755, mean loss: 0.4730927732557146
Epoch: 1, step: 160, loss: 0.393716424703598, mean loss: 0.47304331758683477
Epoch: 1, step: 161, loss: 0.4320780634880066, mean loss: 0.4730178099566362
Epoch: 1, step: 162, loss: 0.43769365549087524, mean loss: 0.4729958285288417
Epoch: 1, step: 163, loss: 0.3687753677368164, mean loss: 0.47293101480944366
Epoch: 1, step: 164, loss: 0.3779134154319763, mean loss: 0.4728719609875807
Epoch: 1, step: 165, loss: 0.4205515384674072, mean loss: 0.4728394638307359
Epoch: 1, step: 166, loss: 0.3814050257205963, mean loss: 0.4727827075066452
Epoch: 1, step: 167, loss: 0.35974541306495667, mean loss: 0.4727125851155523
Epoch: 1, step: 168, loss: 0.47423985600471497, mean loss: 0.4727135319666925
Epoch: 1, step: 169, loss: 0.4095548391342163, mean loss: 0.4726744001867468
Epoch: 1, step: 170, loss: 0.3766206204891205, mean loss: 0.4726149241621662
Epoch: 1, step: 171, loss: 0.4246697425842285, mean loss: 0.47258525511416005
Epoch: 1, step: 172, loss: 0.3729425072669983, mean loss: 0.47252363313033374
Epoch: 1, step: 173, loss: 0.37980592250823975, mean loss: 0.47246632923007287
Epoch: 1, step: 174, loss: 0.3991399109363556, mean loss: 0.4724210380513862
Epoch: 1, step: 175, loss: 0.4083612561225891, mean loss: 0.4723814949761215
Epoch: 1, step: 176, loss: 0.3694002330303192, mean loss: 0.47231796551162686
Epoch: 1, step: 177, loss: 0.38267356157302856, mean loss: 0.4722626976916894
Epoch: 1, step: 178, loss: 0.3927030861377716, mean loss: 0.4722136775983105
Epoch: 1, step: 179, loss: 0.4524730145931244, mean loss: 0.4722015220176423
Epoch: 1, step: 180, loss: 0.37682682275772095, mean loss: 0.4721428298950208
Epoch: 1, step: 181, loss: 0.4035024046897888, mean loss: 0.4721006156113768
Epoch: 1, step: 182, loss: 0.36313095688819885, mean loss: 0.472033639791633
Epoch: 1, step: 183, loss: 0.3695286512374878, mean loss: 0.47197067603944987
Epoch: 1, step: 184, loss: 0.38774845004081726, mean loss: 0.47191897424325674
Epoch: 1, step: 185, loss: 0.458848237991333, mean loss: 0.47191095538666045
Epoch: 1, step: 186, loss: 0.4635787308216095, mean loss: 0.471905846726596
Epoch: 1, step: 187, loss: 0.37756580114364624, mean loss: 0.47184804032611627
Epoch: 1, step: 188, loss: 0.44350090622901917, mean loss: 0.4718306813952546
Epoch: 1, step: 189, loss: 0.41031432151794434, mean loss: 0.47179303368419134
Epoch: 1, step: 190, loss: 0.3798883557319641, mean loss: 0.47173682287198815
Epoch: 1, step: 191, loss: 0.3576769530773163, mean loss: 0.4716671041251699
Epoch: 1, step: 192, loss: 0.3956509530544281, mean loss: 0.4716206678691707
Epoch: 1, step: 193, loss: 0.4216202199459076, mean loss: 0.4715901425651882
Epoch: 1, step: 194, loss: 0.3698604702949524, mean loss: 0.47152807443079514
Epoch: 1, step: 195, loss: 0.40646669268608093, mean loss: 0.4714884028565606
Epoch: 1, step: 196, loss: 0.4369598925113678, mean loss: 0.47146736171680115
Epoch: 1, step: 197, loss: 0.4229540228843689, mean loss: 0.47143781644345617
Epoch: 1, step: 198, loss: 0.3841843605041504, mean loss: 0.4713847102621176
Epoch: 1, step: 199, loss: 0.4288730025291443, mean loss: 0.471358851559117
Epoch: 1, step: 200, loss: 0.38967135548591614, mean loss: 0.47130919350679285
Epoch: 1, step: 201, loss: 0.40614190697669983, mean loss: 0.4712696022027041
Epoch: 1, step: 202, loss: 0.36156561970710754, mean loss: 0.47120299383446146
Epoch: 1, step: 203, loss: 0.4357944130897522, mean loss: 0.4711815080451746
Epoch: 1, step: 204, loss: 0.3946596086025238, mean loss: 0.47113510301215905
Epoch: 1, step: 205, loss: 0.39744701981544495, mean loss: 0.4710904435677974
Epoch: 1, step: 206, loss: 0.4204344153404236, mean loss: 0.4710597615397978
Epoch: 1, step: 207, loss: 0.4423593580722809, mean loss: 0.47104238841421214
Epoch: 1, step: 208, loss: 0.40224897861480713, mean loss: 0.47100077110640853
Epoch: 1, step: 209, loss: 0.3963298201560974, mean loss: 0.4709556254286877
Epoch: 1, step: 210, loss: 0.425597220659256, mean loss: 0.4709282185375883
Epoch: 1, step: 211, loss: 0.4138953685760498, mean loss: 0.47089377841079993
Epoch: 1, step: 212, loss: 0.42676326632499695, mean loss: 0.4708671456334398
Epoch: 1, step: 213, loss: 0.4200747609138489, mean loss: 0.47083651090200457
Epoch: 1, step: 214, loss: 0.429629385471344, mean loss: 0.4708116723694966
Epoch: 1, step: 215, loss: 0.3791607916355133, mean loss: 0.47075646099556046
Epoch: 1, step: 216, loss: 0.3952895700931549, mean loss: 0.47071102638333745
Epoch: 1, step: 217, loss: 0.3828394114971161, mean loss: 0.47065815537558403
Epoch: 1, step: 218, loss: 0.42270389199256897, mean loss: 0.47062931937836033
Epoch: 1, step: 219, loss: 0.441049188375473, mean loss: 0.4706115428573249
Epoch: 1, step: 220, loss: 0.4122018814086914, mean loss: 0.470576461979578
Epoch: 1, step: 221, loss: 0.40180546045303345, mean loss: 0.470535182867017
Epoch: 1, step: 222, loss: 0.47154492139816284, mean loss: 0.4705357885889913
Epoch: 1, step: 223, loss: 0.42317670583724976, mean loss: 0.47050739585352863
Epoch: 1, step: 224, loss: 0.38983872532844543, mean loss: 0.4704590623181631
Epoch: 1, step: 225, loss: 0.4324636161327362, mean loss: 0.4704363105539802
Epoch: 1, step: 226, loss: 0.47044873237609863, mean loss: 0.4704363179877457
Epoch: 1, step: 227, loss: 0.4163857400417328, mean loss: 0.47040399108706027
Epoch: 1, step: 228, loss: 0.3738795220851898, mean loss: 0.47034629564832636
Epoch: 1, step: 229, loss: 0.41519230604171753, mean loss: 0.4703133482232328
Epoch: 1, step: 230, loss: 0.3523145616054535, mean loss: 0.47024290118644607
Epoch: 1, step: 231, loss: 0.4434072971343994, mean loss: 0.47022688948951763
Epoch: 1, step: 232, loss: 0.38306811451911926, mean loss: 0.47017491645733495
Epoch: 1, step: 233, loss: 0.35945144295692444, mean loss: 0.47010893107384244
Epoch: 1, step: 234, loss: 0.46894291043281555, mean loss: 0.4701082366005601
Epoch: 1, step: 235, loss: 0.3637658655643463, mean loss: 0.4700449375701814
Epoch: 1, step: 236, loss: 0.4005715250968933, mean loss: 0.47000360894884097
Epoch: 1, step: 237, loss: 0.41887128353118896, mean loss: 0.46997320923099456
Epoch: 1, step: 238, loss: 0.3520669639110565, mean loss: 0.4699031520442329
Epoch: 1, step: 239, loss: 0.3514116108417511, mean loss: 0.4698327888962504
Epoch: 1, step: 240, loss: 0.4421105980873108, mean loss: 0.4698163365574914
Epoch: 1, step: 241, loss: 0.4354687035083771, mean loss: 0.46979596429589643
Epoch: 1, step: 242, loss: 0.38804513216018677, mean loss: 0.46974750500002466
Epoch: 1, step: 243, loss: 0.41946929693222046, mean loss: 0.46971771933173806
Epoch: 1, step: 244, loss: 0.40380963683128357, mean loss: 0.4696786973764388
Epoch: 1, step: 245, loss: 0.41239726543426514, mean loss: 0.4696448030380115
Epoch: 1, step: 246, loss: 0.44553178548812866, mean loss: 0.4696305434179347
Epoch: 1, step: 247, loss: 0.43136078119277954, mean loss: 0.4696079253551539
Epoch: 1, step: 248, loss: 0.41515010595321655, mean loss: 0.4695757588936052
Epoch: 1, step: 249, loss: 0.3745229244232178, mean loss: 0.4695196474210725
Epoch: 1, step: 250, loss: 0.3811846971511841, mean loss: 0.469467532406164
Epoch: 1, step: 251, loss: 0.4081898629665375, mean loss: 0.4694314017048435
Epoch: 1, step: 252, loss: 0.43844571709632874, mean loss: 0.4694131426096116
Epoch: 1, step: 253, loss: 0.37810277938842773, mean loss: 0.469359367366254
Epoch: 1, step: 254, loss: 0.4293680787086487, mean loss: 0.4693358292328475
Epoch: 1, step: 255, loss: 0.3928113877773285, mean loss: 0.4692908148555207
Epoch: 1, step: 256, loss: 0.45500218868255615, mean loss: 0.469282414722556
Epoch: 1, step: 257, loss: 0.5200023651123047, mean loss: 0.4693122149284254
Epoch: 1, step: 258, loss: 0.3852948248386383, mean loss: 0.46926287999590055
Epoch: 1, step: 259, loss: 0.3597237765789032, mean loss: 0.4691985964845056
Epoch: 1, step: 260, loss: 0.39244040846824646, mean loss: 0.4691535770193935
Epoch: 1, step: 261, loss: 0.3723650574684143, mean loss: 0.4690968428344281
Epoch: 1, step: 262, loss: 0.3832634389400482, mean loss: 0.4690465596452691
Epoch: 1, step: 263, loss: 0.3769988715648651, mean loss: 0.46899266755622904
Epoch: 1, step: 264, loss: 0.39591294527053833, mean loss: 0.4689499058696956
Epoch: 1, step: 265, loss: 0.4138244390487671, mean loss: 0.4689176687545956
Epoch: 1, step: 266, loss: 0.43562033772468567, mean loss: 0.4688982080117377
Epoch: 1, step: 267, loss: 0.4263652265071869, mean loss: 0.46887336398048507
Epoch: 1, step: 268, loss: 0.39309123158454895, mean loss: 0.46882912455701986
Epoch: 1, step: 269, loss: 0.4095456898212433, mean loss: 0.46879453678879596
Epoch: 1, step: 270, loss: 0.41517630219459534, mean loss: 0.4687632725120646
Epoch: 1, step: 271, loss: 0.3948676586151123, mean loss: 0.46872020980000345
Epoch: 1, step: 272, loss: 0.411836713552475, mean loss: 0.4686870802157009
Epoch: 1, step: 273, loss: 0.3876035809516907, mean loss: 0.46863988376676957
Epoch: 1, step: 274, loss: 0.3549202084541321, mean loss: 0.46857372921452256
Epoch: 1, step: 275, loss: 0.4306270480155945, mean loss: 0.4685516671905697
Epoch: 1, step: 276, loss: 0.38101527094841003, mean loss: 0.4685008035088485
Epoch: 1, step: 277, loss: 0.3739899694919586, mean loss: 0.46844591916853673
Epoch: 1, step: 278, loss: 0.39328861236572266, mean loss: 0.46840229914137316
Epoch: 1, step: 279, loss: 0.410936564207077, mean loss: 0.46836896634848785
Epoch: 1, step: 280, loss: 0.4038926959037781, mean loss: 0.46833158880040393
Epoch: 1, step: 281, loss: 0.37883609533309937, mean loss: 0.46827973741369056
Epoch: 1, step: 282, loss: 0.3517608046531677, mean loss: 0.4682122684312004
Epoch: 1, step: 283, loss: 0.40393179655075073, mean loss: 0.4681750690840474
Epoch: 1, step: 284, loss: 0.46401020884513855, mean loss: 0.46817266025799825
Epoch: 1, step: 285, loss: 0.38245800137519836, mean loss: 0.46812311421240127
Epoch: 1, step: 286, loss: 0.3958861827850342, mean loss: 0.46808138288286494
Epoch: 1, step: 287, loss: 0.37051862478256226, mean loss: 0.46802505334585554
Epoch: 1, step: 288, loss: 0.4610530734062195, mean loss: 0.4680210302760692
Epoch: 1, step: 289, loss: 0.42413827776908875, mean loss: 0.4679957230370225
Epoch: 1, step: 290, loss: 0.3923139274120331, mean loss: 0.46795210240553836
Epoch: 1, step: 291, loss: 0.4589628279209137, mean loss: 0.4679469242520334
Epoch: 1, step: 292, loss: 0.3843269348144531, mean loss: 0.46789878378603594
Epoch: 1, step: 293, loss: 0.4124526083469391, mean loss: 0.46786688149867167
Epoch: 1, step: 294, loss: 0.3832559287548065, mean loss: 0.46781822655172295
Epoch: 1, step: 295, loss: 0.44355395436286926, mean loss: 0.46780428156770637
Epoch: 1, step: 296, loss: 0.422662615776062, mean loss: 0.4677783529831046
Epoch: 1, step: 297, loss: 0.3773876130580902, mean loss: 0.46772646392459427
Epoch: 1, step: 298, loss: 0.4302341341972351, mean loss: 0.4677049536952613
Epoch: 1, step: 299, loss: 0.3753071129322052, mean loss: 0.46765197328197977
Epoch: 1, step: 300, loss: 0.3902710974216461, mean loss: 0.46760762894051255
Epoch: 1, step: 301, loss: 0.4092084765434265, mean loss: 0.4675741815450961
Epoch: 1, step: 302, loss: 0.39257726073265076, mean loss: 0.46753125256924466
Epoch: 1, step: 303, loss: 0.36718374490737915, mean loss: 0.46747384552824817
Epoch: 1, step: 304, loss: 0.39846882224082947, mean loss: 0.46743439154123423
Epoch: 1, step: 305, loss: 0.4387364983558655, mean loss: 0.4674179927451283
Epoch: 1, step: 306, loss: 0.42040225863456726, mean loss: 0.4673911419546597
Epoch: 1, step: 307, loss: 0.37844476103782654, mean loss: 0.4673403734724012
Epoch: 1, step: 308, loss: 0.3788773715496063, mean loss: 0.467289909694921
Epoch: 1, step: 309, loss: 0.42194655537605286, mean loss: 0.46726405829565143
Epoch: 1, step: 310, loss: 0.3584526777267456, mean loss: 0.46720205750900246
Epoch: 1, step: 311, loss: 0.44551435112953186, mean loss: 0.4671897068789458
Epoch: 1, step: 312, loss: 0.38670942187309265, mean loss: 0.4671439013667057
Epoch: 1, step: 313, loss: 0.38737109303474426, mean loss: 0.46709852434262605
Epoch: 1, step: 314, loss: 0.42828959226608276, mean loss: 0.4670764612772045
Epoch: 1, step: 315, loss: 0.4363843500614166, mean loss: 0.46705902257765003
Epoch: 1, step: 316, loss: 0.3669193983078003, mean loss: 0.4670021573736354
Epoch: 1, step: 317, loss: 0.485770046710968, mean loss: 0.4670128088431798
Epoch: 1, step: 318, loss: 0.3937234580516815, mean loss: 0.4669712380259413
Epoch: 1, step: 319, loss: 0.3964208960533142, mean loss: 0.4669312435010135
Epoch: 1, step: 320, loss: 0.3821701407432556, mean loss: 0.46688322021333206
Epoch: 1, step: 321, loss: 0.41773363947868347, mean loss: 0.46685538919366354
Epoch: 1, step: 322, loss: 0.3680045008659363, mean loss: 0.46679944641588894
Epoch: 1, step: 323, loss: 0.3843410015106201, mean loss: 0.4667528070239742
Epoch: 1, step: 324, loss: 0.3990447223186493, mean loss: 0.4667145322446043
Epoch: 1, step: 325, loss: 0.3711616098880768, mean loss: 0.46666054754270797
Epoch: 1, step: 326, loss: 0.40292203426361084, mean loss: 0.46662455741663283
Epoch: 1, step: 327, loss: 0.4505220353603363, mean loss: 0.46661547021456945
Epoch: 1, step: 328, loss: 0.41002506017684937, mean loss: 0.4665835523296074
Epoch: 1, step: 329, loss: 0.45903027057647705, mean loss: 0.46657929456086267
Epoch: 1, step: 330, loss: 0.405770868062973, mean loss: 0.4665450362924132
Epoch: 1, step: 331, loss: 0.3947488069534302, mean loss: 0.46650461048760516
Epoch: 1, step: 332, loss: 0.3935748040676117, mean loss: 0.4664635695160689
Epoch: 1, step: 333, loss: 0.45085132122039795, mean loss: 0.4664547887240016
Epoch: 1, step: 334, loss: 0.4237143099308014, mean loss: 0.46643076372186937
Epoch: 1, step: 335, loss: 0.36677661538124084, mean loss: 0.4663747782452735
Epoch: 1, step: 336, loss: 0.410248726606369, mean loss: 0.4663432644599625
Epoch: 1, step: 337, loss: 0.45821163058280945, mean loss: 0.4663387012535219
Epoch: 1, step: 338, loss: 0.36063069105148315, mean loss: 0.4662794146521747
Epoch: 1, step: 339, loss: 0.3678593635559082, mean loss: 0.4662242464620983
Epoch: 1, step: 340, loss: 0.40961018204689026, mean loss: 0.46619252989940074
Epoch: 1, step: 341, loss: 0.39662668108940125, mean loss: 0.46615357925617007
Epoch: 1, step: 342, loss: 0.38712242245674133, mean loss: 0.46610935365079825
Epoch: 1, step: 343, loss: 0.3677719831466675, mean loss: 0.4660543551214335
Epoch: 1, step: 344, loss: 0.4088604152202606, mean loss: 0.46602238533948764
Epoch: 1, step: 345, loss: 0.38206666707992554, mean loss: 0.46597548270358846
Epoch: 1, step: 346, loss: 0.3982302248477936, mean loss: 0.4659376573223178
Epoch: 1, step: 347, loss: 0.42969101667404175, mean loss: 0.46591743040231315
Epoch: 1, step: 348, loss: 0.37680643796920776, mean loss: 0.4658677310200303
Epoch: 1, step: 349, loss: 0.4033806025981903, mean loss: 0.46583289984476733
Epoch: 1, step: 350, loss: 0.38399043679237366, mean loss: 0.46578730515783007
Epoch: 1, step: 351, loss: 0.41146886348724365, mean loss: 0.4657570610366326
Epoch: 1, step: 352, loss: 0.4365268051624298, mean loss: 0.4657407948953559
Epoch: 1, step: 353, loss: 0.40475431084632874, mean loss: 0.4657068758274755
Epoch: 1, step: 354, loss: 0.4246816635131836, mean loss: 0.4656840713737155
Epoch: 1, step: 355, loss: 0.42558467388153076, mean loss: 0.46566179393066426
Epoch: 1, step: 356, loss: 0.397586464881897, mean loss: 0.46562399530265275
Epoch: 1, step: 357, loss: 0.42117831110954285, mean loss: 0.46559933066103615
Epoch: 1, step: 358, loss: 0.4791489839553833, mean loss: 0.46560684572109956
Epoch: 1, step: 359, loss: 0.38769063353538513, mean loss: 0.46556365491611856
Epoch: 1, step: 360, loss: 0.35793402791023254, mean loss: 0.46550402631389926
Epoch: 1, step: 361, loss: 0.3744141757488251, mean loss: 0.4654535889658566
Epoch: 1, step: 362, loss: 0.40437981486320496, mean loss: 0.4654197905297179
Epoch: 1, step: 363, loss: 0.3728439509868622, mean loss: 0.4653685870786433
Epoch: 1, step: 364, loss: 0.37907034158706665, mean loss: 0.46532088213365075
Epoch: 1, step: 365, loss: 0.3690418601036072, mean loss: 0.4652676893037999
Epoch: 1, step: 366, loss: 0.35829827189445496, mean loss: 0.4652086228115805
Epoch: 1, step: 367, loss: 0.4495374262332916, mean loss: 0.4651999742483474
Epoch: 1, step: 368, loss: 0.4192148447036743, mean loss: 0.4651746101393873
Epoch: 1, step: 369, loss: 0.43683022260665894, mean loss: 0.465158984787936
Epoch: 1, step: 370, loss: 0.395026832818985, mean loss: 0.4651203444838209
Epoch: 1, step: 371, loss: 0.4288674294948578, mean loss: 0.4651003814249063
Epoch: 1, step: 372, loss: 0.3806612491607666, mean loss: 0.4650539096955369
Epoch: 1, step: 373, loss: 0.4071544408798218, mean loss: 0.465022061802899
Epoch: 1, step: 374, loss: 0.3813167214393616, mean loss: 0.4649760445734523
Epoch: 1, step: 375, loss: 0.3919282853603363, mean loss: 0.46493590844201654
Epoch: 1, step: 376, loss: 0.4319763779640198, mean loss: 0.4649178087547689
Epoch: 1, step: 377, loss: 0.464901864528656, mean loss: 0.46491780000382155
Epoch: 1, step: 378, loss: 0.3813858926296234, mean loss: 0.4648719788807419
Epoch: 1, step: 379, loss: 0.423554003238678, mean loss: 0.4648493264818153
Epoch: 1, step: 380, loss: 0.3815600275993347, mean loss: 0.4648036885098249
Epoch: 1, step: 381, loss: 0.41703230142593384, mean loss: 0.46477752674252815
Epoch: 1, step: 382, loss: 0.36735981702804565, mean loss: 0.4647242056096795
Epoch: 1, step: 383, loss: 0.3713560700416565, mean loss: 0.4646731289490843
Epoch: 1, step: 384, loss: 0.357284814119339, mean loss: 0.4646144147255579
Epoch: 1, step: 385, loss: 0.45700618624687195, mean loss: 0.464610257223657
Epoch: 1, step: 386, loss: 0.38917407393455505, mean loss: 0.4645690577789333
Epoch: 1, step: 387, loss: 0.4639550745487213, mean loss: 0.4645687226352487
Epoch: 1, step: 388, loss: 0.39493992924690247, mean loss: 0.46453073638680986
Epoch: 1, step: 389, loss: 0.48599886894226074, mean loss: 0.4645424420207005
Epoch: 1, step: 390, loss: 0.36335861682891846, mean loss: 0.46448730097154967
Epoch: 1, step: 391, loss: 0.44521674513816833, mean loss: 0.46447680502610666
Epoch: 1, step: 392, loss: 0.3448117971420288, mean loss: 0.46441166348670326
Epoch: 1, step: 393, loss: 0.38918229937553406, mean loss: 0.4643707334735851
Epoch: 1, step: 394, loss: 0.40050143003463745, mean loss: 0.46433600302038286
Epoch: 1, step: 395, loss: 0.3833039700984955, mean loss: 0.46429196387205574
Epoch: 1, step: 396, loss: 0.38915151357650757, mean loss: 0.46425114885288377
Epoch: 1, step: 397, loss: 0.380634605884552, mean loss: 0.46420575442130485
Epoch: 1, step: 398, loss: 0.4048856794834137, mean loss: 0.46417356772844653
Epoch: 1, step: 399, loss: 0.42778152227401733, mean loss: 0.46415383234587904
Epoch: 1, step: 400, loss: 0.42203396558761597, mean loss: 0.4641310031498041
Epoch: 1, step: 401, loss: 0.3523617386817932, mean loss: 0.46407045641932304
Epoch: 1, step: 402, loss: 0.38101503252983093, mean loss: 0.46402548867493243
Epoch: 1, step: 403, loss: 0.3715458810329437, mean loss: 0.4639754455972041
Epoch: 1, step: 404, loss: 0.45523372292518616, mean loss: 0.4639707177861322
Epoch: 1, step: 405, loss: 0.3989826440811157, mean loss: 0.463935589097643
Epoch: 1, step: 406, loss: 0.40498268604278564, mean loss: 0.46390373987935296
Epoch: 1, step: 407, loss: 0.35704532265663147, mean loss: 0.46384604094996706
Epoch: 1, step: 408, loss: 0.3560677766799927, mean loss: 0.46378787674906585
Epoch: 1, step: 409, loss: 0.45583081245422363, mean loss: 0.46378358491287663
Epoch: 1, step: 410, loss: 0.37485137581825256, mean loss: 0.4637356430211814
Epoch: 1, step: 411, loss: 0.4058821201324463, mean loss: 0.4637044719420388
Epoch: 1, step: 412, loss: 0.3844882845878601, mean loss: 0.46366181379052873
Epoch: 1, step: 413, loss: 0.4338836967945099, mean loss: 0.4636457868169033
Epoch: 1, step: 414, loss: 0.387041836977005, mean loss: 0.4636045797432939
Epoch: 1, step: 415, loss: 0.4320284128189087, mean loss: 0.4635876033094636
Epoch: 1, step: 416, loss: 0.3929818868637085, mean loss: 0.46354966364452765
Epoch: 1, step: 417, loss: 0.38551032543182373, mean loss: 0.4635077520772813
Epoch: 1, step: 418, loss: 0.39292797446250916, mean loss: 0.46346986706514237
Epoch: 1, step: 419, loss: 0.39013034105300903, mean loss: 0.46343052182586547
Epoch: 1, step: 420, loss: 0.4031226933002472, mean loss: 0.46339818518858633
Epoch: 1, step: 421, loss: 0.4075471758842468, mean loss: 0.4633682543154329
Epoch: 1, step: 422, loss: 0.395084023475647, mean loss: 0.4633316800086092
Epoch: 1, step: 423, loss: 0.37526458501815796, mean loss: 0.4632845348828113
Epoch: 1, step: 424, loss: 0.3648105561733246, mean loss: 0.4632318468257169
Epoch: 1, step: 425, loss: 0.3609391748905182, mean loss: 0.4631771448621152
Epoch: 1, step: 426, loss: 0.4441288113594055, mean loss: 0.4631669640318091
Epoch: 1, step: 427, loss: 0.44557708501815796, mean loss: 0.4631575677289172
Epoch: 1, step: 428, loss: 0.4170076251029968, mean loss: 0.4631329281439594
Epoch: 1, step: 429, loss: 0.475882351398468, mean loss: 0.4631397314647996
Epoch: 1, step: 430, loss: 0.40669625997543335, mean loss: 0.46310962828000524
Epoch: 1, step: 431, loss: 0.422354131937027, mean loss: 0.46308790360178403
Epoch: 1, step: 432, loss: 0.39620789885520935, mean loss: 0.46305227227267026
Epoch: 1, step: 433, loss: 0.4173157811164856, mean loss: 0.4630279184435136
Epoch: 1, step: 434, loss: 0.4316917955875397, mean loss: 0.4630112414223023
Epoch: 1, step: 435, loss: 0.4475979804992676, mean loss: 0.46300304287925814
Epoch: 1, step: 436, loss: 0.4100329279899597, mean loss: 0.4629748822652819
Epoch: 1, step: 437, loss: 0.3655928373336792, mean loss: 0.4629231383519282
Epoch: 1, step: 438, loss: 0.3619280755519867, mean loss: 0.46286950316191233
Epoch: 1, step: 439, loss: 0.39115700125694275, mean loss: 0.4628314392012409
Epoch: 1, step: 440, loss: 0.3769771456718445, mean loss: 0.46278589315692825
Epoch: 1, step: 441, loss: 0.4101604223251343, mean loss: 0.46275798993803546
Epoch: 1, step: 442, loss: 0.4232265055179596, mean loss: 0.4627370405557249
Epoch: 1, step: 443, loss: 0.4284270107746124, mean loss: 0.46271886787045946
Epoch: 1, step: 444, loss: 0.4334779679775238, mean loss: 0.4627033883046083
Epoch: 1, step: 445, loss: 0.3628326952457428, mean loss: 0.4626505466680692
Epoch: 1, step: 446, loss: 0.3722696006298065, mean loss: 0.4626027513502277
Epoch: 1, step: 447, loss: 0.3862878084182739, mean loss: 0.46256241575671186
Epoch: 1, step: 448, loss: 0.3760768175125122, mean loss: 0.46251672870005883
Epoch: 1, step: 449, loss: 0.40064510703086853, mean loss: 0.462484061529167
Epoch: 1, step: 450, loss: 0.4420475959777832, mean loss: 0.462473277114628
Epoch: 1, step: 451, loss: 0.34845444560050964, mean loss: 0.46241314060011635
Epoch: 1, step: 452, loss: 0.3983596861362457, mean loss: 0.4623793749414638
Epoch: 1, step: 453, loss: 0.4339580535888672, mean loss: 0.46236440058880174
Epoch: 1, step: 454, loss: 0.440888911485672, mean loss: 0.4623530917477785
Epoch: 1, step: 455, loss: 0.44544368982315063, mean loss: 0.462344192062555
Epoch: 1, step: 456, loss: 0.4385371506214142, mean loss: 0.46233166863202313
Epoch: 1, step: 457, loss: 0.36046847701072693, mean loss: 0.4622781128004662
Epoch: 1, step: 458, loss: 0.38988518714904785, mean loss: 0.4622400713261355
Epoch: 1, step: 459, loss: 0.4138485789299011, mean loss: 0.46221465562634756
Epoch: 1, step: 460, loss: 0.40428754687309265, mean loss: 0.46218424769524347
Epoch: 1, step: 461, loss: 0.4061991274356842, mean loss: 0.46215487459961935
Epoch: 1, step: 462, loss: 0.3735564649105072, mean loss: 0.4621084150245333
Epoch: 1, step: 463, loss: 0.3516160845756531, mean loss: 0.4620505049980926
Epoch: 1, step: 464, loss: 0.4531486928462982, mean loss: 0.46204584192205705
Epoch: 1, step: 465, loss: 0.3904992341995239, mean loss: 0.46200838296513425
Epoch: 1, step: 466, loss: 0.41139522194862366, mean loss: 0.4619818977945343
Epoch: 1, step: 467, loss: 0.37869006395339966, mean loss: 0.4619383351199312
Epoch: 1, step: 468, loss: 0.44219017028808594, mean loss: 0.4619280119809705
Epoch: 1, step: 469, loss: 0.4168214499950409, mean loss: 0.4619044453341649
Epoch: 1, step: 470, loss: 0.3900240957736969, mean loss: 0.46186690990358503
Epoch: 1, step: 471, loss: 0.3815702497959137, mean loss: 0.46182500141709876
Epoch: 1, step: 472, loss: 0.42075783014297485, mean loss: 0.46180357879254263
Epoch: 1, step: 473, loss: 0.40835464000701904, mean loss: 0.461775711775449
Epoch: 1, step: 474, loss: 0.38568824529647827, mean loss: 0.461736062235856
Epoch: 1, step: 475, loss: 0.45359155535697937, mean loss: 0.46173182030518994
Epoch: 1, step: 476, loss: 0.3918764591217041, mean loss: 0.4616954562441887
Epoch: 1, step: 477, loss: 0.45135024189949036, mean loss: 0.46169007371851506
Epoch: 1, step: 478, loss: 0.4395159184932709, mean loss: 0.46167854269655706
Epoch: 1, step: 479, loss: 0.36139681935310364, mean loss: 0.4616264212187278
Epoch: 1, step: 480, loss: 0.38877758383750916, mean loss: 0.46158857766684147
Epoch: 1, step: 481, loss: 0.41623544692993164, mean loss: 0.4615650298315679
Epoch: 1, step: 482, loss: 0.3756807744503021, mean loss: 0.4615204609393098
Epoch: 1, step: 483, loss: 0.37329724431037903, mean loss: 0.461474702009523
Epoch: 1, step: 484, loss: 0.451509952545166, mean loss: 0.4614695362503398
Epoch: 1, step: 485, loss: 0.3866223096847534, mean loss: 0.4614307553039328
Epoch: 1, step: 486, loss: 0.37699201703071594, mean loss: 0.4613870273193273
Epoch: 1, step: 487, loss: 0.3751603364944458, mean loss: 0.4613423965269749
Epoch: 1, step: 488, loss: 0.3948567807674408, mean loss: 0.4613080014851955
Epoch: 1, step: 489, loss: 0.39599114656448364, mean loss: 0.46127422855090355
Epoch: 1, step: 490, loss: 0.4178083837032318, mean loss: 0.46125176558199005
Epoch: 1, step: 491, loss: 0.3725001811981201, mean loss: 0.46120592282146117
Epoch: 1, step: 492, loss: 0.4360811710357666, mean loss: 0.46119295186029147
Epoch: 1, step: 493, loss: 0.3950072228908539, mean loss: 0.46115880029735573
Epoch: 1, step: 494, loss: 0.45764994621276855, mean loss: 0.4611569906768892
Epoch: 1, step: 495, loss: 0.35514670610427856, mean loss: 0.4611023462003054
Epoch: 1, step: 496, loss: 0.39836177229881287, mean loss: 0.4610700223600676
Epoch: 1, step: 497, loss: 0.407177597284317, mean loss: 0.46104227136878245
Epoch: 1, step: 498, loss: 0.3884527087211609, mean loss: 0.4610049118409144
Epoch: 1, step: 499, loss: 0.43775931000709534, mean loss: 0.46099295422680237
Epoch: 1, step: 500, loss: 0.38459858298301697, mean loss: 0.4609536769151089
Epoch: 1, step: 501, loss: 0.39044055342674255, mean loss: 0.4609174420109525
Epoch: 1, step: 502, loss: 0.3480850160121918, mean loss: 0.46085949007155924
Epoch: 1, step: 503, loss: 0.36109495162963867, mean loss: 0.4608082762427903
Epoch: 1, step: 504, loss: 0.40247058868408203, mean loss: 0.46077834413013835
Epoch: 1, step: 505, loss: 0.39059317111968994, mean loss: 0.46074235173372274
Epoch: 1, step: 506, loss: 0.4673936367034912, mean loss: 0.46074576090080105
Epoch: 1, step: 507, loss: 0.4161863923072815, mean loss: 0.46072293335541503
Epoch: 1, step: 508, loss: 0.3552379310131073, mean loss: 0.460668921577462
Epoch: 1, step: 509, loss: 0.38685423135757446, mean loss: 0.46063114537980593
Epoch: 1, step: 510, loss: 0.39316844940185547, mean loss: 0.4605966376069272
Epoch: 1, step: 511, loss: 0.45237648487091064, mean loss: 0.4605924350748536
Epoch: 1, step: 512, loss: 0.40349531173706055, mean loss: 0.46056325923257574
Epoch: 1, step: 513, loss: 0.38511931896209717, mean loss: 0.4605247281088421
Epoch: 1, step: 514, loss: 0.3620641231536865, mean loss: 0.46047446746312737
Epoch: 1, step: 515, loss: 0.3772710859775543, mean loss: 0.46043201675828777
Epoch: 1, step: 516, loss: 0.40745097398757935, mean loss: 0.4604049993983843
Epoch: 1, step: 517, loss: 0.3795981705188751, mean loss: 0.4603638134509432
Epoch: 1, step: 518, loss: 0.4282948076725006, mean loss: 0.46034747671850385
Epoch: 1, step: 519, loss: 0.4390708804130554, mean loss: 0.460336643420996
Epoch: 1, step: 520, loss: 0.41570377349853516, mean loss: 0.4603139294922823
Epoch: 1, step: 521, loss: 0.4612344801425934, mean loss: 0.46031439772760796
Epoch: 1, step: 522, loss: 0.4012378454208374, mean loss: 0.4602843638931866
Epoch: 1, step: 523, loss: 0.40272679924964905, mean loss: 0.4602551171631848
Epoch: 1, step: 524, loss: 0.3716599941253662, mean loss: 0.4602101221794175
Epoch: 1, step: 525, loss: 0.3698067367076874, mean loss: 0.4601642321360308
Epoch: 1, step: 526, loss: 0.37857571244239807, mean loss: 0.46012283765622686
Epoch: 1, step: 527, loss: 0.3362827003002167, mean loss: 0.46006003839793275
Epoch: 1, step: 528, loss: 0.40559500455856323, mean loss: 0.4600324332109893
Epoch: 1, step: 529, loss: 0.43179288506507874, mean loss: 0.46001812746218185
Epoch: 1, step: 530, loss: 0.3679547607898712, mean loss: 0.4599715130993098
Epoch: 1, step: 531, loss: 0.4154350161552429, mean loss: 0.4599489743862814
Epoch: 1, step: 532, loss: 0.3622319996356964, mean loss: 0.4598995474895942
Epoch: 1, step: 533, loss: 0.3991248607635498, mean loss: 0.45986882216769026
Epoch: 1, step: 534, loss: 0.37676095962524414, mean loss: 0.45982682729020546
Epoch: 1, step: 535, loss: 0.3748571276664734, mean loss: 0.4597839133004965
Epoch: 1, step: 536, loss: 0.37227529287338257, mean loss: 0.4597397393376358
Epoch: 1, step: 537, loss: 0.4026604890823364, mean loss: 0.459710940523178
Epoch: 1, step: 538, loss: 0.42607396841049194, mean loss: 0.4596939778544374
Epoch: 1, step: 539, loss: 0.410687655210495, mean loss: 0.45966927708697575
Epoch: 1, step: 540, loss: 0.4200533330440521, mean loss: 0.45964931943254606
Epoch: 1, step: 541, loss: 0.4143444895744324, mean loss: 0.4596265073329196
Epoch: 1, step: 542, loss: 0.3938508629798889, mean loss: 0.45959340434129753
Epoch: 1, step: 543, loss: 0.429512083530426, mean loss: 0.4595782728921975
Epoch: 1, step: 544, loss: 0.4122105538845062, mean loss: 0.4595544580510674
Epoch: 1, step: 545, loss: 0.39371567964553833, mean loss: 0.4595213732377983
Epoch: 1, step: 546, loss: 0.3806372880935669, mean loss: 0.45948175290372284
Epoch: 1, step: 547, loss: 0.38508984446525574, mean loss: 0.45944440756816135
Epoch: 1, step: 548, loss: 0.38484981656074524, mean loss: 0.4594069792736268
Epoch: 1, step: 549, loss: 0.42409399151802063, mean loss: 0.4593892696508807
Epoch: 1, step: 550, loss: 0.4203348457813263, mean loss: 0.45936969349856516
Epoch: 1, step: 551, loss: 0.3399292528629303, mean loss: 0.4593098535984471
Epoch: 1, step: 552, loss: 0.41173282265663147, mean loss: 0.45928602934659846
Epoch: 1, step: 553, loss: 0.4597107470035553, mean loss: 0.45928624191799833
Epoch: 1, step: 554, loss: 0.4390774071216583, mean loss: 0.45927613244586407
Epoch: 1, step: 555, loss: 0.3864191770553589, mean loss: 0.4592397039681688
Epoch: 1, step: 556, loss: 0.41485437750816345, mean loss: 0.45921752239572505
Epoch: 1, step: 557, loss: 0.44157272577285767, mean loss: 0.45920870881099835
Epoch: 1, step: 558, loss: 0.3502061069011688, mean loss: 0.4591542891395506
Epoch: 1, step: 559, loss: 0.4173625409603119, mean loss: 0.4591334349737925
Epoch: 1, step: 560, loss: 0.40082645416259766, mean loss: 0.459104354185358
Epoch: 1, step: 561, loss: 0.3705484867095947, mean loss: 0.45906020868811187
Epoch: 1, step: 562, loss: 0.3885897099971771, mean loss: 0.45902509633201277
Epoch: 1, step: 563, loss: 0.38163435459136963, mean loss: 0.45898655512596664
Epoch: 1, step: 564, loss: 0.4539119303226471, mean loss: 0.4589840291803204
Epoch: 1, step: 565, loss: 0.3900579512119293, mean loss: 0.45894973759924157
Epoch: 1, step: 566, loss: 0.3606637120246887, mean loss: 0.4589008633945799
Epoch: 1, step: 567, loss: 0.38498252630233765, mean loss: 0.45886412465845056
Epoch: 1, step: 568, loss: 0.4267376661300659, mean loss: 0.458848165165888
Epoch: 1, step: 569, loss: 0.36179086565971375, mean loss: 0.45879997385530896
Epoch: 1, step: 570, loss: 0.38546451926231384, mean loss: 0.4587635790887616
Epoch: 1, step: 571, loss: 0.37961000204086304, mean loss: 0.45872431640173383
Epoch: 1, step: 572, loss: 0.3878611922264099, mean loss: 0.45868918346956955
Epoch: 1, step: 573, loss: 0.42625242471694946, mean loss: 0.4586731097536366
Epoch: 1, step: 574, loss: 0.41013532876968384, mean loss: 0.4586490692479487
Epoch: 1, step: 575, loss: 0.38250797986984253, mean loss: 0.4586113756393457
Epoch: 1, step: 576, loss: 0.3566569983959198, mean loss: 0.4585609281493687
Epoch: 1, step: 577, loss: 0.38721320033073425, mean loss: 0.45852564242839017
Epoch: 1, step: 578, loss: 0.4252111613750458, mean loss: 0.4585091745682551
Epoch: 1, step: 579, loss: 0.4000040292739868, mean loss: 0.4584802688640583
Epoch: 1, step: 580, loss: 0.3949166536331177, mean loss: 0.45844887942443807
Epoch: 1, step: 581, loss: 0.40122559666633606, mean loss: 0.45842063496108265
Epoch: 1, step: 582, loss: 0.4374871850013733, mean loss: 0.45841030765473845
Epoch: 1, step: 583, loss: 0.36976736783981323, mean loss: 0.4583665981183406
Epoch: 1, step: 584, loss: 0.4172039031982422, mean loss: 0.4583463109350384
Epoch: 1, step: 585, loss: 0.3930298984050751, mean loss: 0.45831413536236354
Epoch: 1, step: 586, loss: 0.35422801971435547, mean loss: 0.45826288665943493
Epoch: 1, step: 587, loss: 0.4028763771057129, mean loss: 0.4582356295189065
Epoch: 1, step: 588, loss: 0.4311491847038269, mean loss: 0.4582223061323767
Epoch: 1, step: 589, loss: 0.3849703073501587, mean loss: 0.45818629236699704
Epoch: 1, step: 590, loss: 0.41161173582077026, mean loss: 0.45816340560702346
Epoch: 1, step: 591, loss: 0.37500619888305664, mean loss: 0.4581225621852533
Epoch: 1, step: 592, loss: 0.37529128789901733, mean loss: 0.4580818988203607
Epoch: 1, step: 593, loss: 0.4261159896850586, mean loss: 0.45806621387966623
Epoch: 1, step: 594, loss: 0.45368948578834534, mean loss: 0.4580640673725101
Epoch: 1, step: 595, loss: 0.4053098261356354, mean loss: 0.45803820745033513
Epoch: 1, step: 596, loss: 0.42236006259918213, mean loss: 0.4580207267326227
Epoch: 1, step: 597, loss: 0.41727927327156067, mean loss: 0.4580007749924361
Epoch: 1, step: 598, loss: 0.4504188895225525, mean loss: 0.45799706383948946
Epoch: 1, step: 599, loss: 0.3950168490409851, mean loss: 0.4579662516013297
Epoch: 1, step: 600, loss: 0.4183945953845978, mean loss: 0.4579469011581919
Epoch: 1, step: 601, loss: 0.3948257565498352, mean loss: 0.4579160501588721
Epoch: 1, step: 602, loss: 0.38886138796806335, mean loss: 0.45788231559014186
Epoch: 1, step: 603, loss: 0.36642172932624817, mean loss: 0.4578376571007552
Epoch: 1, step: 604, loss: 0.4483688473701477, mean loss: 0.4578330359149423
Epoch: 1, step: 605, loss: 0.40507960319519043, mean loss: 0.4578073025331278
Epoch: 1, step: 606, loss: 0.39669013023376465, mean loss: 0.45777750381430804
Epoch: 1, step: 607, loss: 0.39548709988594055, mean loss: 0.4577471478669745
Epoch: 1, step: 608, loss: 0.4151080250740051, mean loss: 0.4577263786887997
Epoch: 1, step: 609, loss: 0.39204880595207214, mean loss: 0.4576944032395608
Epoch: 1, step: 610, loss: 0.41512152552604675, mean loss: 0.4576736865107464
Epoch: 1, step: 611, loss: 0.3912038803100586, mean loss: 0.4576413568384698
Epoch: 1, step: 612, loss: 0.4088716506958008, mean loss: 0.45761764769596
Epoch: 1, step: 613, loss: 0.43644043803215027, mean loss: 0.45760735750661896
Epoch: 1, step: 614, loss: 0.4176415801048279, mean loss: 0.45758794722133395
Epoch: 1, step: 615, loss: 0.3941296935081482, mean loss: 0.4575571422438033
Epoch: 1, step: 616, loss: 0.4371398985385895, mean loss: 0.45754723576941936
Epoch: 1, step: 617, loss: 0.3747307360172272, mean loss: 0.4575070725784629
Epoch: 1, step: 618, loss: 0.41405007243156433, mean loss: 0.45748600762444114
Epoch: 1, step: 619, loss: 0.37415266036987305, mean loss: 0.4574456329406938
Epoch: 1, step: 620, loss: 0.38904869556427, mean loss: 0.45741251093712165
Epoch: 1, step: 621, loss: 0.3568001091480255, mean loss: 0.45736381180750446
Epoch: 1, step: 622, loss: 0.4376726448535919, mean loss: 0.45735428536001826
Epoch: 1, step: 623, loss: 0.4355500042438507, mean loss: 0.4573437417037725
Epoch: 1, step: 624, loss: 0.3650537431240082, mean loss: 0.4572991356145604
Epoch: 1, step: 625, loss: 0.3756166398525238, mean loss: 0.4572596754716802
Epoch: 1, step: 626, loss: 0.3779526352882385, mean loss: 0.45722138139143714
Epoch: 1, step: 627, loss: 0.4164617955684662, mean loss: 0.4572017097766577
Epoch: 1, step: 628, loss: 0.3910306394100189, mean loss: 0.4571697893375035
Epoch: 1, step: 629, loss: 0.36312156915664673, mean loss: 0.4571244430404057
Epoch: 1, step: 630, loss: 0.4067580997943878, mean loss: 0.45710017010390164
Epoch: 1, step: 631, loss: 0.42739665508270264, mean loss: 0.45708586205235
Epoch: 1, step: 632, loss: 0.4148280918598175, mean loss: 0.45706551647209365
Epoch: 1, step: 633, loss: 0.38806360960006714, mean loss: 0.45703231054963356
Epoch: 1, step: 634, loss: 0.38277843594551086, mean loss: 0.4569965944002328
Epoch: 1, step: 635, loss: 0.4140874147415161, mean loss: 0.4569759649869354
Epoch: 1, step: 636, loss: 0.35445234179496765, mean loss: 0.4569266984693035
Epoch: 1, step: 637, loss: 0.3914088308811188, mean loss: 0.45689522975288266
Epoch: 1, step: 638, loss: 0.3833167850971222, mean loss: 0.45685990644771907
Epoch: 1, step: 639, loss: 0.38462546467781067, mean loss: 0.45682524500733046
Epoch: 1, step: 640, loss: 0.4000193476676941, mean loss: 0.4567979999726352
Epoch: 1, step: 641, loss: 0.3398911654949188, mean loss: 0.4567419564278233
Epoch: 1, step: 642, loss: 0.3721196949481964, mean loss: 0.4567014091056002
Epoch: 1, step: 643, loss: 0.381706565618515, mean loss: 0.4566654920349646
Epoch: 1, step: 644, loss: 0.37790974974632263, mean loss: 0.4566277918232419
Epoch: 1, step: 645, loss: 0.42884621024131775, mean loss: 0.4566144992004755
Epoch: 1, step: 646, loss: 0.3736589252948761, mean loss: 0.4565748265204632
Epoch: 1, step: 647, loss: 0.38648396730422974, mean loss: 0.45654132228565625
Epoch: 1, step: 648, loss: 0.4739971160888672, mean loss: 0.4565496623686965
Epoch: 1, step: 649, loss: 0.41733628511428833, mean loss: 0.45653093582750526
Epoch: 1, step: 650, loss: 0.38282546401023865, mean loss: 0.45649575421804595
Epoch: 1, step: 651, loss: 0.47955697774887085, mean loss: 0.45650675671018853
Epoch: 1, step: 652, loss: 0.35325077176094055, mean loss: 0.45645751685088987
Epoch: 1, step: 653, loss: 0.374502569437027, mean loss: 0.45641845348224647
Epoch: 1, step: 654, loss: 0.3855946362018585, mean loss: 0.4563847117874964
Epoch: 1, step: 655, loss: 0.4520362317562103, mean loss: 0.4563826410827196
Epoch: 1, step: 656, loss: 0.4274584949016571, mean loss: 0.4563688742354178
Epoch: 1, step: 657, loss: 0.43313100934028625, mean loss: 0.45635781911415463
Epoch: 1, step: 658, loss: 0.4765177071094513, mean loss: 0.4563674053661733
Epoch: 1, step: 659, loss: 0.37824320793151855, mean loss: 0.4563302740936283
Epoch: 1, step: 660, loss: 0.4458147883415222, mean loss: 0.45632527861346106
Epoch: 1, step: 661, loss: 0.3931521475315094, mean loss: 0.4562952818750556
Epoch: 1, step: 662, loss: 0.39771637320518494, mean loss: 0.45626747983012444
Epoch: 1, step: 663, loss: 0.35357820987701416, mean loss: 0.4562187657551941
Epoch: 1, step: 664, loss: 0.3797530233860016, mean loss: 0.45618250888351597
Epoch: 1, step: 665, loss: 0.3972143530845642, mean loss: 0.45615456189024634
Epoch: 1, step: 666, loss: 0.45522141456604004, mean loss: 0.45615411984982746
Epoch: 1, step: 667, loss: 0.379215270280838, mean loss: 0.4561176904702967
Epoch: 1, step: 668, loss: 0.37500131130218506, mean loss: 0.4560793012705011
Epoch: 1, step: 669, loss: 0.4472941756248474, mean loss: 0.456075145581927
Epoch: 1, step: 670, loss: 0.4034329354763031, mean loss: 0.45605025564807095
Epoch: 1, step: 671, loss: 0.4005478620529175, mean loss: 0.45602402578342294
Epoch: 1, step: 672, loss: 0.4119448959827423, mean loss: 0.4560032042766678
Epoch: 1, step: 673, loss: 0.4038996696472168, mean loss: 0.45597860392981726
Epoch: 1, step: 674, loss: 0.40477454662323, mean loss: 0.45595443967436344
Epoch: 1, step: 675, loss: 0.4507765471935272, mean loss: 0.45595199727224983
Epoch: 1, step: 676, loss: 0.355333149433136, mean loss: 0.4559045579286199
Epoch: 1, step: 677, loss: 0.41025546193122864, mean loss: 0.4558830456307889
Epoch: 1, step: 678, loss: 0.3991604447364807, mean loss: 0.45585632749565264
Epoch: 1, step: 679, loss: 0.44397613406181335, mean loss: 0.4558507341842431
Epoch: 1, step: 680, loss: 0.4339010715484619, mean loss: 0.455840404931238
Epoch: 1, step: 681, loss: 0.41577044129371643, mean loss: 0.45582155734721286
Epoch: 1, step: 682, loss: 0.4110882878303528, mean loss: 0.45580052619088146
Epoch: 1, step: 683, loss: 0.40633857250213623, mean loss: 0.45577728279159163
Epoch: 1, step: 684, loss: 0.3424089550971985, mean loss: 0.4557240332248023
Epoch: 1, step: 685, loss: 0.39044907689094543, mean loss: 0.45569338770539675
Epoch: 1, step: 686, loss: 0.3991281986236572, mean loss: 0.4556668437405531
Epoch: 1, step: 687, loss: 0.3641524612903595, mean loss: 0.4556239195461581
Epoch: 1, step: 688, loss: 0.3781679570674896, mean loss: 0.45558760638981555
Epoch: 1, step: 689, loss: 0.44524678587913513, mean loss: 0.4555827606444966
Epoch: 1, step: 690, loss: 0.4043131470680237, mean loss: 0.45555874677396896
Epoch: 1, step: 691, loss: 0.4367130696773529, mean loss: 0.4555499238914331
Epoch: 1, step: 692, loss: 0.3881359100341797, mean loss: 0.4555183777922954
Epoch: 1, step: 693, loss: 0.40052497386932373, mean loss: 0.4554926559008441
Epoch: 1, step: 694, loss: 0.38340887427330017, mean loss: 0.45545895614318743
Epoch: 1, step: 695, loss: 0.4162250757217407, mean loss: 0.4554406225542054
Epoch: 1, step: 696, loss: 0.4100673794746399, mean loss: 0.45541943000722757
Epoch: 1, step: 697, loss: 0.3866339325904846, mean loss: 0.45538731726333553
Epoch: 1, step: 698, loss: 0.4240765869617462, mean loss: 0.45537270656324147
Epoch: 1, step: 699, loss: 0.4114772081375122, mean loss: 0.45535223291658766
Epoch: 1, step: 700, loss: 0.4309009313583374, mean loss: 0.455340833708402
Epoch: 1, step: 701, loss: 0.38188034296035767, mean loss: 0.45530660235204223
Epoch: 1, step: 702, loss: 0.39909952878952026, mean loss: 0.4552804229977979
Epoch: 1, step: 703, loss: 0.3612591028213501, mean loss: 0.45523665143347
Epoch: 1, step: 704, loss: 0.39209577441215515, mean loss: 0.4552072699178714
Epoch: 1, step: 705, loss: 0.3867988884449005, mean loss: 0.4551754520660235
Epoch: 1, step: 706, loss: 0.38546428084373474, mean loss: 0.4551430433392814
Epoch: 1, step: 707, loss: 0.38382282853126526, mean loss: 0.45510990197552303
Epoch: 1, step: 708, loss: 0.39611873030662537, mean loss: 0.45508250245315013
Epoch: 1, step: 709, loss: 0.4466279149055481, mean loss: 0.4550785773892933
Epoch: 1, step: 710, loss: 0.41896265745162964, mean loss: 0.45506181826171205
Epoch: 1, step: 711, loss: 0.4158092439174652, mean loss: 0.4550436120583984
Epoch: 1, step: 712, loss: 0.4247686266899109, mean loss: 0.45502957636745334
Epoch: 1, step: 713, loss: 0.4475548565387726, mean loss: 0.4550261126418608
Epoch: 1, step: 714, loss: 0.37281185388565063, mean loss: 0.45498803285549855
Epoch: 1, step: 715, loss: 0.3720795810222626, mean loss: 0.45494964931298315
Epoch: 1, step: 716, loss: 0.41619396209716797, mean loss: 0.4549317151680429
Epoch: 1, step: 717, loss: 0.433518648147583, mean loss: 0.4549218108817245
Epoch: 1, step: 718, loss: 0.3814789056777954, mean loss: 0.45488785669531495
Epoch: 1, step: 719, loss: 0.414047509431839, mean loss: 0.45486898407643167
Epoch: 1, step: 720, loss: 0.3634887635707855, mean loss: 0.4548267761223875
Epoch: 1, step: 721, loss: 0.4467645585536957, mean loss: 0.45482305395361156
Epoch: 1, step: 722, loss: 0.3862771689891815, mean loss: 0.45479142225773506
Epoch: 1, step: 723, loss: 0.4178199768066406, mean loss: 0.45477436900798823
Epoch: 1, step: 724, loss: 0.41395002603530884, mean loss: 0.45475554727309997
Epoch: 1, step: 725, loss: 0.37865716218948364, mean loss: 0.4547204788928771
Epoch: 1, step: 726, loss: 0.47148609161376953, mean loss: 0.454728201422919
Epoch: 1, step: 727, loss: 0.3725794851779938, mean loss: 0.45469037973035686
Epoch: 1, step: 728, loss: 0.4162846505641937, mean loss: 0.4546727056718359
Epoch: 1, step: 729, loss: 0.39446958899497986, mean loss: 0.45464501334585755
Epoch: 1, step: 730, loss: 0.3830121159553528, mean loss: 0.45461207868039066
Epoch: 1, step: 731, loss: 0.4135564863681793, mean loss: 0.45459321122068835
Epoch: 1, step: 732, loss: 0.3990565836429596, mean loss: 0.4545677005970881
Epoch: 1, step: 733, loss: 0.4409627914428711, mean loss: 0.45456145408232496
Epoch: 1, step: 734, loss: 0.43224483728408813, mean loss: 0.45455121240412477
Epoch: 1, step: 735, loss: 0.38826730847358704, mean loss: 0.4545208069436062
Epoch: 1, step: 736, loss: 0.4537314176559448, mean loss: 0.4545204450044555
Epoch: 1, step: 737, loss: 0.40794965624809265, mean loss: 0.454499101838206
Epoch: 1, step: 738, loss: 0.42353320121765137, mean loss: 0.4544849168173079
Epoch: 1, step: 739, loss: 0.4363839328289032, mean loss: 0.4544766288209762
Epoch: 1, step: 740, loss: 0.3967752754688263, mean loss: 0.4544502208789386
Epoch: 1, step: 741, loss: 0.44847774505615234, mean loss: 0.45444748873080376
Epoch: 1, step: 742, loss: 0.39912909269332886, mean loss: 0.4544221945396572
Epoch: 1, step: 743, loss: 0.407492995262146, mean loss: 0.45440074609391795
Epoch: 1, step: 744, loss: 0.47613272070884705, mean loss: 0.4544106739032441
Epoch: 1, step: 745, loss: 0.42650195956230164, mean loss: 0.45439793019806557
Epoch: 1, step: 746, loss: 0.406232625246048, mean loss: 0.4543759469461477
Epoch: 1, step: 747, loss: 0.4058291018009186, mean loss: 0.4543537996627785
Epoch: 1, step: 748, loss: 0.3779827058315277, mean loss: 0.454318974722591
Epoch: 1, step: 749, loss: 0.3698909282684326, mean loss: 0.45428049338874676
Epoch: 1, step: 750, loss: 0.39316681027412415, mean loss: 0.4542526511640932
Epoch: 1, step: 751, loss: 0.4023955464363098, mean loss: 0.454229036817678
Epoch: 1, step: 752, loss: 0.3795608580112457, mean loss: 0.45419505039127545
Epoch: 1, step: 753, loss: 0.3301282823085785, mean loss: 0.45413860509187476
Epoch: 1, step: 754, loss: 0.43976446986198425, mean loss: 0.45413206842282977
Epoch: 1, step: 755, loss: 0.3656797707080841, mean loss: 0.45409186283295944
Epoch: 1, step: 756, loss: 0.394305944442749, mean loss: 0.45406469976235964
Epoch: 1, step: 757, loss: 0.3637024462223053, mean loss: 0.4540236633166103
Epoch: 1, step: 758, loss: 0.3757762312889099, mean loss: 0.4539881447364797
Epoch: 1, step: 759, loss: 0.4415760040283203, mean loss: 0.45398251309369014
Epoch: 1, step: 760, loss: 0.4882103204727173, mean loss: 0.45399803590882803
Epoch: 1, step: 761, loss: 0.3729158341884613, mean loss: 0.45396128060433105
Epoch: 1, step: 762, loss: 0.39820337295532227, mean loss: 0.45393601648668314
Epoch: 1, step: 763, loss: 0.37852343916893005, mean loss: 0.4539018622397095
Epoch: 1, step: 764, loss: 0.4157407879829407, mean loss: 0.45388458696842987
Epoch: 1, step: 765, loss: 0.35084348917007446, mean loss: 0.45383796203729937
Epoch: 1, step: 766, loss: 0.40889525413513184, mean loss: 0.4538176351680537
Epoch: 1, step: 767, loss: 0.38447389006614685, mean loss: 0.45378628627786294
Epoch: 1, step: 768, loss: 0.38727787137031555, mean loss: 0.45375623276909316
Epoch: 1, step: 769, loss: 0.4715177118778229, mean loss: 0.4537642551173808
Epoch: 1, step: 770, loss: 0.40807172656059265, mean loss: 0.45374362643631677
Epoch: 1, step: 771, loss: 0.4315226972103119, mean loss: 0.4537335989411787
Epoch: 1, step: 772, loss: 0.3487062156200409, mean loss: 0.45368622529060537
Epoch: 1, step: 773, loss: 0.4213981032371521, mean loss: 0.45367166797678504
Epoch: 1, step: 774, loss: 0.45076751708984375, mean loss: 0.45367035921117577
Epoch: 1, step: 775, loss: 0.367690771818161, mean loss: 0.453631629667305
Epoch: 1, step: 776, loss: 0.38478392362594604, mean loss: 0.4536006311504021
Epoch: 1, step: 777, loss: 0.3587741255760193, mean loss: 0.4535579549552741
Epoch: 1, step: 778, loss: 0.41563931107521057, mean loss: 0.453540897535625
Epoch: 1, step: 779, loss: 0.3943590521812439, mean loss: 0.4535142869936491
Epoch: 1, step: 780, loss: 0.3728562295436859, mean loss: 0.45347803618131205
Epoch: 1, step: 781, loss: 0.3725053668022156, mean loss: 0.4534416603190573
Epoch: 1, step: 782, loss: 0.3803090751171112, mean loss: 0.45340882125969406
Epoch: 1, step: 783, loss: 0.4043653607368469, mean loss: 0.4533868089345043
Epoch: 1, step: 784, loss: 0.39155590534210205, mean loss: 0.453359069632758
Epoch: 1, step: 785, loss: 0.39593270421028137, mean loss: 0.4533333178993847
Epoch: 1, step: 786, loss: 0.44398045539855957, mean loss: 0.45332912567056316
Epoch: 1, step: 787, loss: 0.4239021837711334, mean loss: 0.45331594155680893
Epoch: 1, step: 788, loss: 0.39092883467674255, mean loss: 0.4532880028613857
Epoch: 1, step: 789, loss: 0.36890146136283875, mean loss: 0.4532502291185484
Epoch: 1, step: 790, loss: 0.3699074387550354, mean loss: 0.4532129392794596
Epoch: 1, step: 791, loss: 0.43267786502838135, mean loss: 0.4532037554358768
Epoch: 1, step: 792, loss: 0.36955419182777405, mean loss: 0.4531663617999322
Epoch: 1, step: 793, loss: 0.3530315160751343, mean loss: 0.4531216187946932
Epoch: 1, step: 794, loss: 0.40898507833480835, mean loss: 0.45310190618171425
Epoch: 1, step: 795, loss: 0.3750130534172058, mean loss: 0.4530670450867301
Epoch: 1, step: 796, loss: 0.36004531383514404, mean loss: 0.45302553605895163
Epoch: 1, step: 797, loss: 0.3732580244541168, mean loss: 0.45298995732942227
Epoch: 1, step: 798, loss: 0.37510305643081665, mean loss: 0.45295523289745676
Epoch: 1, step: 799, loss: 0.3997240364551544, mean loss: 0.45293151133041476
Epoch: 1, step: 800, loss: 0.3995528221130371, mean loss: 0.4529077346314315
Epoch: 1, step: 801, loss: 0.40900129079818726, mean loss: 0.4528881859030997
Epoch: 1, step: 802, loss: 0.37778958678245544, mean loss: 0.452854764185645
Epoch: 1, step: 803, loss: 0.4286574721336365, mean loss: 0.45284400026569305
Epoch: 1, step: 804, loss: 0.38536974787712097, mean loss: 0.4528139983749022
Epoch: 1, step: 805, loss: 0.4094984829425812, mean loss: 0.45279474703471007
Epoch: 1, step: 806, loss: 0.3829464614391327, mean loss: 0.452763717143286
Epoch: 1, step: 807, loss: 0.40371477603912354, mean loss: 0.4527419369740568
Epoch: 1, step: 808, loss: 0.3758496642112732, mean loss: 0.4527078081357244
Epoch: 1, step: 809, loss: 0.37390047311782837, mean loss: 0.45267284481051684
Epoch: 1, step: 810, loss: 0.3845919072628021, mean loss: 0.4526426537073915
Epoch: 1, step: 811, loss: 0.37862491607666016, mean loss: 0.4526098444265268
Epoch: 1, step: 812, loss: 0.35674089193344116, mean loss: 0.4525673681516074
Epoch: 1, step: 813, loss: 0.3949742019176483, mean loss: 0.45254186187781026
Epoch: 1, step: 814, loss: 0.3985913395881653, mean loss: 0.4525179793978237
Epoch: 1, step: 815, loss: 0.42912259697914124, mean loss: 0.4525076274587004
Epoch: 1, step: 816, loss: 0.3781110644340515, mean loss: 0.4524747231849168
Epoch: 1, step: 817, loss: 0.3710430860519409, mean loss: 0.45243872334533547
Epoch: 1, step: 818, loss: 0.4320790469646454, mean loss: 0.4524297265815791
Epoch: 1, step: 819, loss: 0.34094664454460144, mean loss: 0.4523804849375698
Epoch: 1, step: 820, loss: 0.36254948377609253, mean loss: 0.45234082445140583
Epoch: 1, step: 821, loss: 0.34756389260292053, mean loss: 0.4522945857347913
Epoch: 1, step: 822, loss: 0.37904059886932373, mean loss: 0.4522622725513482
Epoch: 1, step: 823, loss: 0.3738456964492798, mean loss: 0.45222769734142665
Epoch: 1, step: 824, loss: 0.39504751563072205, mean loss: 0.45220249673247526
Epoch: 1, step: 825, loss: 0.38301563262939453, mean loss: 0.45217201793771616
Epoch: 1, step: 826, loss: 0.38480618596076965, mean loss: 0.45214235442737843
Epoch: 1, step: 827, loss: 0.3758564293384552, mean loss: 0.4521087778758428
Epoch: 1, step: 828, loss: 0.3737391531467438, mean loss: 0.45207429937838167
Epoch: 1, step: 829, loss: 0.40665891766548157, mean loss: 0.452054327794515
Epoch: 1, step: 830, loss: 0.3943440020084381, mean loss: 0.4520289606183453
Epoch: 1, step: 831, loss: 0.38905060291290283, mean loss: 0.4520012899866645
Epoch: 1, step: 832, loss: 0.42912808060646057, mean loss: 0.4519912446597518
Epoch: 1, step: 833, loss: 0.3738691210746765, mean loss: 0.45195695048785317
Epoch: 1, step: 834, loss: 0.46866610646247864, mean loss: 0.45196428228073365
Epoch: 1, step: 835, loss: 0.44836872816085815, mean loss: 0.45196270528331267
Epoch: 1, step: 836, loss: 0.40990301966667175, mean loss: 0.45194426614012256
Epoch: 1, step: 837, loss: 0.3991699814796448, mean loss: 0.45192113981029763
Epoch: 1, step: 838, loss: 0.36139145493507385, mean loss: 0.45188148598424627
Epoch: 1, step: 839, loss: 0.3762262463569641, mean loss: 0.45184836197390155
Epoch: 1, step: 840, loss: 0.3663784861564636, mean loss: 0.451810957214244
Epoch: 1, step: 841, loss: 0.4334559440612793, mean loss: 0.4518029278996539
Epoch: 1, step: 842, loss: 0.4236334264278412, mean loss: 0.451790610671201
Epoch: 1, step: 843, loss: 0.37079426646232605, mean loss: 0.45175521017110976
Epoch: 1, step: 844, loss: 0.39723432064056396, mean loss: 0.4517313915212493
Epoch: 1, step: 845, loss: 0.3940669894218445, mean loss: 0.45170621055963384
Epoch: 1, step: 846, loss: 0.4061666429042816, mean loss: 0.4516863329657205
Epoch: 1, step: 847, loss: 0.39443108439445496, mean loss: 0.4516613524907767
Epoch: 1, step: 848, loss: 0.37305930256843567, mean loss: 0.4516270733586693
Epoch: 1, step: 849, loss: 0.3903191387653351, mean loss: 0.45160034801664956
Epoch: 1, step: 850, loss: 0.4562373459339142, mean loss: 0.45160236849504487
Epoch: 1, step: 851, loss: 0.3749307692050934, mean loss: 0.4515689749413472
Epoch: 1, step: 852, loss: 0.3795151114463806, mean loss: 0.4515376062589375
Epoch: 1, step: 853, loss: 0.3906736373901367, mean loss: 0.4515111206327979
Epoch: 1, step: 854, loss: 0.40110090374946594, mean loss: 0.4514891936137099
Epoch: 1, step: 855, loss: 0.41917818784713745, mean loss: 0.4514751453503332
Epoch: 1, step: 856, loss: 0.425823837518692, mean loss: 0.45146399745470883
Epoch: 1, step: 857, loss: 0.3949308395385742, mean loss: 0.4514394391758573
Epoch: 1, step: 858, loss: 0.48394501209259033, mean loss: 0.4514535536234981
Epoch: 1, step: 859, loss: 0.45663461089134216, mean loss: 0.4514558023462706
Epoch: 1, step: 860, loss: 0.35980865359306335, mean loss: 0.45141604219496767
Epoch: 1, step: 861, loss: 0.45536091923713684, mean loss: 0.4514177528962002
Epoch: 1, step: 862, loss: 0.39598456025123596, mean loss: 0.45139372463757643
Epoch: 1, step: 863, loss: 0.3550114333629608, mean loss: 0.4513519645460363
Epoch: 1, step: 864, loss: 0.3977702558040619, mean loss: 0.45132875895541613
Epoch: 1, step: 865, loss: 0.36380982398986816, mean loss: 0.45129087197058254
Epoch: 1, step: 866, loss: 0.3458499014377594, mean loss: 0.4512452462801746
Epoch: 1, step: 867, loss: 0.4278302490711212, mean loss: 0.45123511868622607
Epoch: 1, step: 868, loss: 0.36759182810783386, mean loss: 0.45119895643349006
Epoch: 1, step: 869, loss: 0.41791123151779175, mean loss: 0.45118457107267945
Epoch: 1, step: 870, loss: 0.38436582684516907, mean loss: 0.45115570768424423
Epoch: 1, step: 871, loss: 0.3663580119609833, mean loss: 0.4511190938259872
Epoch: 1, step: 872, loss: 0.3735169470310211, mean loss: 0.4510856013155017
Epoch: 1, step: 873, loss: 0.3521835505962372, mean loss: 0.45104293433935017
Epoch: 1, step: 874, loss: 0.4341903030872345, mean loss: 0.45103566714174254
Epoch: 1, step: 875, loss: 0.3891106843948364, mean loss: 0.4510089753388344
Epoch: 1, step: 876, loss: 0.3641658127307892, mean loss: 0.45097155906886105
Epoch: 1, step: 877, loss: 0.4078456163406372, mean loss: 0.4509529863114415
Epoch: 1, step: 878, loss: 0.3786805272102356, mean loss: 0.4509218746200505
Epoch: 1, step: 879, loss: 0.41280868649482727, mean loss: 0.45090547479727716
Epoch: 1, step: 880, loss: 0.39315637946128845, mean loss: 0.45088063647670257
Epoch: 1, step: 881, loss: 0.4096244275569916, mean loss: 0.45086289949952296
Epoch: 1, step: 882, loss: 0.3769586980342865, mean loss: 0.4508311400661473
Epoch: 1, step: 883, loss: 0.44426262378692627, mean loss: 0.45082831853853594
Epoch: 1, step: 884, loss: 0.3868406414985657, mean loss: 0.45080084422465017
Epoch: 1, step: 885, loss: 0.36717915534973145, mean loss: 0.45076495508779396
Epoch: 1, step: 886, loss: 0.38332611322402954, mean loss: 0.4507360237957031
Epoch: 1, step: 887, loss: 0.40644264221191406, mean loss: 0.4507170300643207
Epoch: 1, step: 888, loss: 0.3641248047351837, mean loss: 0.4506799138082859
Epoch: 1, step: 889, loss: 0.4505653977394104, mean loss: 0.4506798647439891
Epoch: 1, step: 890, loss: 0.3999321758747101, mean loss: 0.45065813125839194
Epoch: 1, step: 891, loss: 0.3879062533378601, mean loss: 0.4506312682969534
Epoch: 1, step: 892, loss: 0.387943297624588, mean loss: 0.45060444417599815
Epoch: 1, step: 893, loss: 0.37026503682136536, mean loss: 0.45057008172631696
Epoch: 1, step: 894, loss: 0.438065767288208, mean loss: 0.450564735717579
Epoch: 1, step: 895, loss: 0.35715219378471375, mean loss: 0.4505248158278641
Epoch: 1, step: 896, loss: 0.3655398190021515, mean loss: 0.4504885129671953
Epoch: 1, step: 897, loss: 0.40066513419151306, mean loss: 0.45046723910776926
Epoch: 1, step: 898, loss: 0.41813209652900696, mean loss: 0.450453438364031
Epoch: 1, step: 899, loss: 0.37444180250167847, mean loss: 0.4504210101917348
Epoch: 1, step: 900, loss: 0.36548152565956116, mean loss: 0.4503847886631497
Epoch: 1, step: 901, loss: 0.37510383129119873, mean loss: 0.45035269959351115
Epoch: 1, step: 902, loss: 0.3771696388721466, mean loss: 0.4503215180593308
Epoch: 1, step: 903, loss: 0.3909902572631836, mean loss: 0.45029624920890654
Epoch: 1, step: 904, loss: 0.3573845624923706, mean loss: 0.45025669548957215
Epoch: 1, step: 905, loss: 0.3818874955177307, mean loss: 0.4502276022129884
Epoch: 1, step: 906, loss: 0.43214261531829834, mean loss: 0.45021990974727394
Epoch: 1, step: 907, loss: 0.3402129113674164, mean loss: 0.4501731380642893
Epoch: 1, step: 908, loss: 0.3551507592201233, mean loss: 0.4501327545628681
Epoch: 1, step: 909, loss: 0.3882104158401489, mean loss: 0.45010644940623146
Epoch: 1, step: 910, loss: 0.3643191158771515, mean loss: 0.45007002166375626
Epoch: 1, step: 911, loss: 0.34524810314178467, mean loss: 0.4500255301873038
Epoch: 1, step: 912, loss: 0.3990907669067383, mean loss: 0.4500039201901546
Epoch: 1, step: 913, loss: 0.37859880924224854, mean loss: 0.449973638124443
Epoch: 1, step: 914, loss: 0.3830784559249878, mean loss: 0.44994528069239575
Epoch: 1, step: 915, loss: 0.3891008496284485, mean loss: 0.44991949915380935
Epoch: 1, step: 916, loss: 0.37136268615722656, mean loss: 0.4498862264672373
Epoch: 1, step: 917, loss: 0.3901708722114563, mean loss: 0.44986094477618915
Epoch: 1, step: 918, loss: 0.4106771945953369, mean loss: 0.44984436257128824
Epoch: 1, step: 919, loss: 0.3590506911277771, mean loss: 0.4498059557728773
Epoch: 1, step: 920, loss: 0.3859812021255493, mean loss: 0.44977896856203275
Epoch: 1, step: 921, loss: 0.38934922218322754, mean loss: 0.44975342767176274
Epoch: 1, step: 922, loss: 0.3881203234195709, mean loss: 0.4497273891824293
Epoch: 1, step: 923, loss: 0.4058210849761963, mean loss: 0.44970884766882874
Epoch: 1, step: 924, loss: 0.39047539234161377, mean loss: 0.44968384409967416
Epoch: 1, step: 925, loss: 0.4556351602077484, mean loss: 0.44968635520351724
Epoch: 1, step: 926, loss: 0.3802908658981323, mean loss: 0.44965708675589794
Epoch: 1, step: 927, loss: 0.34854039549827576, mean loss: 0.449614457459415
Epoch: 1, step: 928, loss: 0.3828059732913971, mean loss: 0.44958630386305254
Epoch: 1, step: 929, loss: 0.4442567527294159, mean loss: 0.4495840588962734
Epoch: 1, step: 930, loss: 0.42415839433670044, mean loss: 0.44957335335330095
Epoch: 1, step: 931, loss: 0.3868895471096039, mean loss: 0.44954697127996607
Epoch: 1, step: 932, loss: 0.4015164375305176, mean loss: 0.4495267649132225
Epoch: 1, step: 933, loss: 0.38022899627685547, mean loss: 0.4494976237153098
Epoch: 1, step: 934, loss: 0.434122234582901, mean loss: 0.4494911607522445
Epoch: 1, step: 935, loss: 0.3694666922092438, mean loss: 0.4494575370259659
Epoch: 1, step: 936, loss: 0.4258802533149719, mean loss: 0.4494476347648525
Epoch: 1, step: 937, loss: 0.387082576751709, mean loss: 0.4494214529604809
Epoch: 1, step: 938, loss: 0.40105587244033813, mean loss: 0.44940115687129917
Epoch: 1, step: 939, loss: 0.4626600742340088, mean loss: 0.4494067184977097
Epoch: 1, step: 940, loss: 0.35373544692993164, mean loss: 0.4493666047570104
Epoch: 1, step: 941, loss: 0.4246479272842407, mean loss: 0.4493562448754208
Epoch: 1, step: 942, loss: 0.32748258113861084, mean loss: 0.44930518762207483
Epoch: 1, step: 943, loss: 0.40624701976776123, mean loss: 0.44928715656350937
Epoch: 1, step: 944, loss: 0.3498861789703369, mean loss: 0.44924554878720413
Epoch: 1, step: 945, loss: 0.37826403975486755, mean loss: 0.44921584941104
Epoch: 1, step: 946, loss: 0.36398857831954956, mean loss: 0.44918020437921585
Epoch: 1, step: 947, loss: 0.34572455286979675, mean loss: 0.4491369536887855
Epoch: 1, step: 948, loss: 0.3604865074157715, mean loss: 0.44909990795277505
Epoch: 1, step: 949, loss: 0.4092176854610443, mean loss: 0.44908324871196814
Epoch: 1, step: 950, loss: 0.3858838379383087, mean loss: 0.4490568606490146
Epoch: 1, step: 951, loss: 0.3934955894947052, mean loss: 0.44903367147073653
Epoch: 1, step: 952, loss: 0.3960936367511749, mean loss: 0.44901158551549264
Epoch: 1, step: 953, loss: 0.40852877497673035, mean loss: 0.44899470360951316
Epoch: 1, step: 954, loss: 0.4041270911693573, mean loss: 0.44897600097823337
Epoch: 1, step: 955, loss: 0.3527054190635681, mean loss: 0.4489358882357689
Epoch: 1, step: 956, loss: 0.39467576146125793, mean loss: 0.44891328926585033
Epoch: 1, step: 957, loss: 0.38059303164482117, mean loss: 0.4488848461944011
Epoch: 1, step: 958, loss: 0.45058131217956543, mean loss: 0.44888555217275533
Epoch: 1, step: 959, loss: 0.34977635741233826, mean loss: 0.44884432538624935
Epoch: 1, step: 960, loss: 0.36366915702819824, mean loss: 0.4488089095158302
Epoch: 1, step: 961, loss: 0.3544551730155945, mean loss: 0.4487696934989972
Epoch: 1, step: 962, loss: 0.4286399185657501, mean loss: 0.44876133048489947
Epoch: 1, step: 963, loss: 0.4190822243690491, mean loss: 0.44874900527471845
Epoch: 1, step: 964, loss: 0.37122225761413574, mean loss: 0.4487168231461752
Epoch: 1, step: 965, loss: 0.380240261554718, mean loss: 0.44868840963514145
Epoch: 1, step: 966, loss: 0.3894565999507904, mean loss: 0.4486638423146585
Epoch: 1, step: 967, loss: 0.44304999709129333, mean loss: 0.4486615148498064
Epoch: 1, step: 968, loss: 0.3838977515697479, mean loss: 0.44863467532917645
Epoch: 1, step: 969, loss: 0.40202781558036804, mean loss: 0.44861536842787203
Epoch: 1, step: 970, loss: 0.397895872592926, mean loss: 0.44859436656624263
Epoch: 1, step: 971, loss: 0.3720695674419403, mean loss: 0.44856269239441965
Epoch: 1, step: 972, loss: 0.40279510617256165, mean loss: 0.4485437566947002
Epoch: 1, step: 973, loss: 0.3637343645095825, mean loss: 0.44850868250438375
Epoch: 1, step: 974, loss: 0.3333912193775177, mean loss: 0.44846109363992454
Epoch: 1, step: 975, loss: 0.391777366399765, mean loss: 0.44843767061213935
Epoch: 1, step: 976, loss: 0.3745124340057373, mean loss: 0.4484071356114758
Epoch: 1, step: 977, loss: 0.3477703332901001, mean loss: 0.4483655844957362
Epoch: 1, step: 978, loss: 0.41495561599731445, mean loss: 0.44835179581703277
Epoch: 1, step: 979, loss: 0.3390042185783386, mean loss: 0.44830668543038316
Epoch: 1, step: 980, loss: 0.3648728132247925, mean loss: 0.448272279709886
Epoch: 1, step: 981, loss: 0.385431706905365, mean loss: 0.4482463767532477
Epoch: 1, step: 982, loss: 0.3943067789077759, mean loss: 0.44822415194985027
Epoch: 1, step: 983, loss: 0.46656617522239685, mean loss: 0.44823170632516846
Epoch: 1, step: 984, loss: 0.38564327359199524, mean loss: 0.4482059391647184
Epoch: 1, step: 985, loss: 0.4566976726055145, mean loss: 0.44820943370522903
Epoch: 1, step: 986, loss: 0.4280320703983307, mean loss: 0.4482011336791875
Epoch: 1, step: 987, loss: 0.34221115708351135, mean loss: 0.44815755227433735
Epoch: 1, step: 988, loss: 0.38682273030281067, mean loss: 0.4481323427297539
Epoch: 1, step: 989, loss: 0.44741085171699524, mean loss: 0.44813204630780945
Epoch: 1, step: 990, loss: 0.405666708946228, mean loss: 0.4481146067442113
Epoch: 1, step: 991, loss: 0.39867183566093445, mean loss: 0.4480943100401541
Epoch: 1, step: 992, loss: 0.3583557903766632, mean loss: 0.4480574866837062
Epoch: 1, step: 993, loss: 0.3947189748287201, mean loss: 0.4480356087050946
Epoch: 1, step: 994, loss: 0.411476194858551, mean loss: 0.44802061919552244
Epoch: 1, step: 995, loss: 0.39158761501312256, mean loss: 0.4479974909151198
Epoch: 1, step: 996, loss: 0.33523842692375183, mean loss: 0.44795129711586074
Epoch: 1, step: 997, loss: 0.3843247592449188, mean loss: 0.44792524202254747
Epoch: 1, step: 998, loss: 0.36479452252388, mean loss: 0.44789121389340353
Epoch: 1, step: 999, loss: 0.4351930022239685, mean loss: 0.447886018225781
Epoch: 1, step: 1000, loss: 0.3848203122615814, mean loss: 0.44786022448101037
Epoch: 1, step: 1001, loss: 0.3948809802532196, mean loss: 0.44783856493717233
Epoch: 1, step: 1002, loss: 0.44440340995788574, mean loss: 0.4478371611141322
Epoch: 1, step: 1003, loss: 0.48881036043167114, mean loss: 0.44785389853215407
Epoch: 1, step: 1004, loss: 0.38756099343299866, mean loss: 0.44782927913440024
Epoch: 1, step: 1005, loss: 0.37893161177635193, mean loss: 0.4478011576375194
Epoch: 1, step: 1006, loss: 0.48145946860313416, mean loss: 0.4478148901185335
Epoch: 1, step: 1007, loss: 0.3653441071510315, mean loss: 0.4477812560308632
Epoch: 1, step: 1008, loss: 0.4027967154979706, mean loss: 0.447762917449317
Epoch: 1, step: 1009, loss: 0.3804231882095337, mean loss: 0.4477354766468558
Epoch: 1, step: 1010, loss: 0.42990848422050476, mean loss: 0.44772821514281247
Epoch: 1, step: 1011, loss: 0.3783929944038391, mean loss: 0.44769998418974283
Epoch: 1, step: 1012, loss: 0.38088762760162354, mean loss: 0.4476727915334188
Epoch: 1, step: 1013, loss: 0.3786679208278656, mean loss: 0.44764471794891697
Epoch: 1, step: 1014, loss: 0.4032979905605316, mean loss: 0.44762668349288265
Epoch: 1, step: 1015, loss: 0.38226014375686646, mean loss: 0.4476001117287623
Epoch: 1, step: 1016, loss: 0.4059624969959259, mean loss: 0.4475831927467498
Epoch: 1, step: 1017, loss: 0.36438632011413574, mean loss: 0.4475494003533166
Epoch: 1, step: 1018, loss: 0.42204225063323975, mean loss: 0.44753904422269536
Epoch: 1, step: 1019, loss: 0.47158539295196533, mean loss: 0.4475488032927965
Epoch: 1, step: 1020, loss: 0.360740065574646, mean loss: 0.44751358676633884
Epoch: 1, step: 1021, loss: 0.34510233998298645, mean loss: 0.4474720574691842
Epoch: 1, step: 1022, loss: 0.4085468649864197, mean loss: 0.4474562791179549
Epoch: 1, step: 1023, loss: 0.42497366666793823, mean loss: 0.4474471694694743
Epoch: 1, step: 1024, loss: 0.3925457298755646, mean loss: 0.44742493316344195
Epoch: 1, step: 1025, loss: 0.3872855305671692, mean loss: 0.44740058522716813
Epoch: 1, step: 1026, loss: 0.3673570454120636, mean loss: 0.44736819205039147
Epoch: 1, step: 1027, loss: 0.3691066801548004, mean loss: 0.44733653286273145
Epoch: 1, step: 1028, loss: 0.3975071609020233, mean loss: 0.44731638350083874
Epoch: 1, step: 1029, loss: 0.35233286023139954, mean loss: 0.44727799080752045
Epoch: 1, step: 1030, loss: 0.37603476643562317, mean loss: 0.4472492056663601
Epoch: 1, step: 1031, loss: 0.3575500249862671, mean loss: 0.4472129782105119
Epoch: 1, step: 1032, loss: 0.34457927942276, mean loss: 0.4471715435319541
Epoch: 1, step: 1033, loss: 0.3687891960144043, mean loss: 0.4471399122375564
Epoch: 1, step: 1034, loss: 0.35404518246650696, mean loss: 0.44710235889759226
Epoch: 1, step: 1035, loss: 0.3613970875740051, mean loss: 0.44706780032044563
Epoch: 1, step: 1036, loss: 0.3531554341316223, mean loss: 0.44702994769400917
Epoch: 1, step: 1037, loss: 0.4007832705974579, mean loss: 0.4470113148668147
Epoch: 1, step: 1038, loss: 0.37522435188293457, mean loss: 0.4469824034842195
Epoch: 1, step: 1039, loss: 0.41251012682914734, mean loss: 0.4469685257560975
Epoch: 1, step: 1040, loss: 0.36187583208084106, mean loss: 0.44693428322343143
Epoch: 1, step: 1041, loss: 0.41802316904067993, mean loss: 0.4469226536521592
Epoch: 1, step: 1042, loss: 0.3494414687156677, mean loss: 0.44688345735745216
Epoch: 1, step: 1043, loss: 0.3787879943847656, mean loss: 0.44685608779837954
Epoch: 1, step: 1044, loss: 0.34792980551719666, mean loss: 0.4468163424057395
Epoch: 1, step: 1045, loss: 0.40773847699165344, mean loss: 0.44680064848388645
Epoch: 1, step: 1046, loss: 0.41069263219833374, mean loss: 0.4467861530939685
Epoch: 1, step: 1047, loss: 0.4235808849334717, mean loss: 0.44677684118860717
Epoch: 1, step: 1048, loss: 0.3836578130722046, mean loss: 0.44675152268555207
Epoch: 1, step: 1049, loss: 0.40198707580566406, mean loss: 0.4467335738295457
Epoch: 1, step: 1050, loss: 0.3809444010257721, mean loss: 0.4467072054236123
Epoch: 1, step: 1051, loss: 0.3517611026763916, mean loss: 0.44666916611962704
Epoch: 1, step: 1052, loss: 0.3929538130760193, mean loss: 0.44664765416406293
Epoch: 1, step: 1053, loss: 0.36230048537254333, mean loss: 0.44661388828384213
Epoch: 1, step: 1054, loss: 0.3987671434879303, mean loss: 0.4465947419273812
Epoch: 1, step: 1055, loss: 0.3391788899898529, mean loss: 0.4465517755866062
Epoch: 1, step: 1056, loss: 0.3686973452568054, mean loss: 0.4465206462662024
Epoch: 1, step: 1057, loss: 0.3921400308609009, mean loss: 0.4464989114079269
Epoch: 1, step: 1058, loss: 0.4397713243961334, mean loss: 0.4464962235984935
Epoch: 1, step: 1059, loss: 0.37627556920051575, mean loss: 0.446468180206162
Epoch: 1, step: 1060, loss: 0.3569079339504242, mean loss: 0.44643242761284635
Epoch: 1, step: 1061, loss: 0.4400988519191742, mean loss: 0.4464299002482439
Epoch: 1, step: 1062, loss: 0.3845577836036682, mean loss: 0.44640522050486753
Epoch: 1, step: 1063, loss: 0.37420469522476196, mean loss: 0.4463764324166378
Epoch: 1, step: 1064, loss: 0.42015671730041504, mean loss: 0.44636598215154566
Epoch: 1, step: 1065, loss: 0.4026722013950348, mean loss: 0.4463485742707662
Epoch: 1, step: 1066, loss: 0.34077978134155273, mean loss: 0.44630653174072665
Epoch: 1, step: 1067, loss: 0.37598973512649536, mean loss: 0.4462785393853866
Epoch: 1, step: 1068, loss: 0.35527685284614563, mean loss: 0.4462423270150964
Epoch: 1, step: 1069, loss: 0.4003337323665619, mean loss: 0.44622406583981855
Epoch: 1, step: 1070, loss: 0.361585795879364, mean loss: 0.44619041245216035
Epoch: 1, step: 1071, loss: 0.36375150084495544, mean loss: 0.44615764658904145
Epoch: 1, step: 1072, loss: 0.3440787196159363, mean loss: 0.4461170907976338
Epoch: 1, step: 1073, loss: 0.35587868094444275, mean loss: 0.44608125346250543
Epoch: 1, step: 1074, loss: 0.3919176459312439, mean loss: 0.44605975143490273
Epoch: 1, step: 1075, loss: 0.44134432077407837, mean loss: 0.44605788023225956
Epoch: 1, step: 1076, loss: 0.3885042071342468, mean loss: 0.44603505053249837
Epoch: 1, step: 1077, loss: 0.3732927441596985, mean loss: 0.4460062074292578
Epoch: 1, step: 1078, loss: 0.40977153182029724, mean loss: 0.4459918456870426
Epoch: 1, step: 1079, loss: 0.35499411821365356, mean loss: 0.4459557927046839
Epoch: 1, step: 1080, loss: 0.36766448616981506, mean loss: 0.4459247862466503
Epoch: 1, step: 1081, loss: 0.34796515107154846, mean loss: 0.44588600571015974
Epoch: 1, step: 1082, loss: 0.41132214665412903, mean loss: 0.44587232788702713
Epoch: 1, step: 1083, loss: 0.3668934404850006, mean loss: 0.44584108623852947
Epoch: 1, step: 1084, loss: 0.33430513739585876, mean loss: 0.445796983451324
Epoch: 1, step: 1085, loss: 0.39314842224121094, mean loss: 0.44577617374333584
Epoch: 1, step: 1086, loss: 0.39163050055503845, mean loss: 0.4457547807472124
Epoch: 1, step: 1087, loss: 0.36528700590133667, mean loss: 0.44572300042539337
Epoch: 1, step: 1088, loss: 0.37384894490242004, mean loss: 0.4456946253541249
Epoch: 1, step: 1089, loss: 0.3818279504776001, mean loss: 0.44566942145717287
Epoch: 1, step: 1090, loss: 0.3776358664035797, mean loss: 0.44564258376287164
Epoch: 1, step: 1091, loss: 0.44830068945884705, mean loss: 0.4456436319118054
Epoch: 1, step: 1092, loss: 0.36680054664611816, mean loss: 0.44561255462159427
Epoch: 1, step: 1093, loss: 0.4243258237838745, mean loss: 0.4456041674148024
Epoch: 1, step: 1094, loss: 0.3898215591907501, mean loss: 0.44558219710829433
Epoch: 1, step: 1095, loss: 0.41391226649284363, mean loss: 0.4455697286316741
Epoch: 1, step: 1096, loss: 0.35491448640823364, mean loss: 0.4455340516374894
Epoch: 1, step: 1097, loss: 0.3462041914463043, mean loss: 0.44549497616141104
Epoch: 1, step: 1098, loss: 0.36323100328445435, mean loss: 0.4454626269782113
Epoch: 1, step: 1099, loss: 0.4120078980922699, mean loss: 0.44544947653446687
Epoch: 1, step: 1100, loss: 0.3976233899593353, mean loss: 0.4454306843589953
Epoch: 1, step: 1101, loss: 0.41172918677330017, mean loss: 0.44541744732145183
Epoch: 1, step: 1102, loss: 0.42870861291885376, mean loss: 0.44541088711948773
Epoch: 1, step: 1103, loss: 0.3558051586151123, mean loss: 0.4453757200360873
Epoch: 1, step: 1104, loss: 0.3967680335044861, mean loss: 0.4453566507200686
Epoch: 1, step: 1105, loss: 0.4174273610115051, mean loss: 0.4453456980574378
Epoch: 1, step: 1106, loss: 0.40602150559425354, mean loss: 0.44533028285067056
Epoch: 1, step: 1107, loss: 0.3794892430305481, mean loss: 0.4453044830701768
Epoch: 1, step: 1108, loss: 0.4466177225112915, mean loss: 0.44530499746087054
Epoch: 1, step: 1109, loss: 0.3654192090034485, mean loss: 0.44527371876531163
Epoch: 1, step: 1110, loss: 0.4167862832546234, mean loss: 0.4452625690840941
Epoch: 1, step: 1111, loss: 0.3704755902290344, mean loss: 0.4452333097026954
Epoch: 1, step: 1112, loss: 0.37052521109580994, mean loss: 0.4452040926129
Epoch: 1, step: 1113, loss: 0.3746435046195984, mean loss: 0.44517650833299643
Epoch: 1, step: 1114, loss: 0.3483772873878479, mean loss: 0.44513868136115387
Epoch: 1, step: 1115, loss: 0.3698890209197998, mean loss: 0.445109286962544
Epoch: 1, step: 1116, loss: 0.3284357786178589, mean loss: 0.4450637291693598
Epoch: 1, step: 1117, loss: 0.3981517553329468, mean loss: 0.4450454184848023
Epoch: 1, step: 1118, loss: 0.35666167736053467, mean loss: 0.44501093399743424
Epoch: 1, step: 1119, loss: 0.3737674951553345, mean loss: 0.4449831479448437
Epoch: 1, step: 1120, loss: 0.40732911229133606, mean loss: 0.44496846800891643
Epoch: 1, step: 1121, loss: 0.37212127447128296, mean loss: 0.4449400786115908
Epoch: 1, step: 1122, loss: 0.44255366921424866, mean loss: 0.44493914896242936
Epoch: 1, step: 1123, loss: 0.354961633682251, mean loss: 0.4449041109891894
Epoch: 1, step: 1124, loss: 0.3756563365459442, mean loss: 0.4448771558414887
Epoch: 1, step: 1125, loss: 0.3750046491622925, mean loss: 0.4448499680956991
Epoch: 1, step: 1126, loss: 0.42946895956993103, mean loss: 0.44484398559530014
Epoch: 1, step: 1127, loss: 0.4391716718673706, mean loss: 0.4448417801856081
Epoch: 1, step: 1128, loss: 0.3655594289302826, mean loss: 0.4448109669904059
Epoch: 1, step: 1129, loss: 0.37970077991485596, mean loss: 0.4447856716574317
Epoch: 1, step: 1130, loss: 0.3796592056751251, mean loss: 0.44476037982598227
Epoch: 1, step: 1131, loss: 0.38131552934646606, mean loss: 0.4447357506138396
Epoch: 1, step: 1132, loss: 0.43216511607170105, mean loss: 0.44473087260276384
Epoch: 1, step: 1133, loss: 0.37182316184043884, mean loss: 0.44470259187709965
Epoch: 1, step: 1134, loss: 0.3739878237247467, mean loss: 0.44467517242453963
Epoch: 1, step: 1135, loss: 0.44927793741226196, mean loss: 0.44467695644197675
Epoch: 1, step: 1136, loss: 0.37990570068359375, mean loss: 0.44465186103098936
Epoch: 1, step: 1137, loss: 0.4614463150501251, mean loss: 0.4446583654670928
Epoch: 1, step: 1138, loss: 0.3884982764720917, mean loss: 0.4446366232723599
Epoch: 1, step: 1139, loss: 0.47705385088920593, mean loss: 0.4446491686390847
Epoch: 1, step: 1140, loss: 0.43240633606910706, mean loss: 0.4446444325336418
Epoch: 1, step: 1141, loss: 0.39387282729148865, mean loss: 0.4446247992756208
Epoch: 1, step: 1142, loss: 0.37689340114593506, mean loss: 0.4445986178306538
Epoch: 1, step: 1143, loss: 0.4046739339828491, mean loss: 0.4445831909821809
Epoch: 1, step: 1144, loss: 0.4766881763935089, mean loss: 0.4445955915172954
Epoch: 1, step: 1145, loss: 0.37043991684913635, mean loss: 0.4445669599826745
Epoch: 1, step: 1146, loss: 0.41964152455329895, mean loss: 0.4445573399767195
Epoch: 1, step: 1147, loss: 0.43771782517433167, mean loss: 0.444554701275021
Epoch: 1, step: 1148, loss: 0.41359615325927734, mean loss: 0.44454276199695864
Epoch: 1, step: 1149, loss: 0.37991535663604736, mean loss: 0.44451784780830755
Epoch: 1, step: 1150, loss: 0.4551943838596344, mean loss: 0.44452196208038897
Epoch: 1, step: 1151, loss: 0.38749513030052185, mean loss: 0.44449999488786973
Epoch: 1, step: 1152, loss: 0.42757973074913025, mean loss: 0.44449347957630303
Epoch: 1, step: 1153, loss: 0.40647709369659424, mean loss: 0.4444788466333162
Epoch: 1, step: 1154, loss: 0.3890342712402344, mean loss: 0.4444575135916105
Epoch: 1, step: 1155, loss: 0.41457223892211914, mean loss: 0.44444601925519917
Epoch: 1, step: 1156, loss: 0.3473201394081116, mean loss: 0.4444086775097755
Epoch: 1, step: 1157, loss: 0.41394034028053284, mean loss: 0.44439696792590566
Epoch: 1, step: 1158, loss: 0.35446640849113464, mean loss: 0.4443624191132146
Epoch: 1, step: 1159, loss: 0.4038711190223694, mean loss: 0.44434686945880186
Epoch: 1, step: 1160, loss: 0.3823058009147644, mean loss: 0.44432305330964866
Epoch: 1, step: 1161, loss: 0.3899174630641937, mean loss: 0.44430217626043705
Epoch: 1, step: 1162, loss: 0.39256343245506287, mean loss: 0.44428233017535634
Epoch: 1, step: 1163, loss: 0.3858008086681366, mean loss: 0.4442599062790729
Epoch: 1, step: 1164, loss: 0.44936075806617737, mean loss: 0.4442618613774965
Epoch: 1, step: 1165, loss: 0.34713518619537354, mean loss: 0.44422464809198614
Epoch: 1, step: 1166, loss: 0.39636000990867615, mean loss: 0.44420631617387685
Epoch: 1, step: 1167, loss: 0.3876418471336365, mean loss: 0.4441846605578584
Epoch: 1, step: 1168, loss: 0.40410861372947693, mean loss: 0.444169323379585
Epoch: 1, step: 1169, loss: 0.3940635621547699, mean loss: 0.4441501551465227
Epoch: 1, step: 1170, loss: 0.36009085178375244, mean loss: 0.44411801009743557
Epoch: 1, step: 1171, loss: 0.4166351556777954, mean loss: 0.4441075044191406
Epoch: 1, step: 1172, loss: 0.393302857875824, mean loss: 0.4440880911036865
Epoch: 1, step: 1173, loss: 0.35277995467185974, mean loss: 0.44405321404622594
Epoch: 1, step: 1174, loss: 0.38547325134277344, mean loss: 0.44403084674469734
Epoch: 1, step: 1175, loss: 0.35539716482162476, mean loss: 0.44399701709510836
Epoch: 1, step: 1176, loss: 0.34070706367492676, mean loss: 0.44395760849021704
Epoch: 1, step: 1177, loss: 0.41175758838653564, mean loss: 0.4439453277807953
Epoch: 1, step: 1178, loss: 0.4046040177345276, mean loss: 0.4439303291875638
Epoch: 1, step: 1179, loss: 0.4016019403934479, mean loss: 0.44391419794183434
Epoch: 1, step: 1180, loss: 0.4088255763053894, mean loss: 0.4439008308478776
Epoch: 1, step: 1181, loss: 0.38290250301361084, mean loss: 0.443877602238649
Epoch: 1, step: 1182, loss: 0.3871975243091583, mean loss: 0.4438560262668449
Epoch: 1, step: 1183, loss: 0.3816390335559845, mean loss: 0.4438323516120843
Epoch: 1, step: 1184, loss: 0.40796563029289246, mean loss: 0.4438187088881135
Epoch: 1, step: 1185, loss: 0.41747575998306274, mean loss: 0.4438086925577313
Epoch: 1, step: 1186, loss: 0.40239331126213074, mean loss: 0.4437929512497512
Epoch: 1, step: 1187, loss: 0.3526214361190796, mean loss: 0.4437583116163429
Epoch: 1, step: 1188, loss: 0.4096221625804901, mean loss: 0.4437453468806665
Epoch: 1, step: 1189, loss: 0.3380114436149597, mean loss: 0.443705204928022
Epoch: 1, step: 1190, loss: 0.37103667855262756, mean loss: 0.4436776267396442
Epoch: 1, step: 1191, loss: 0.43786701560020447, mean loss: 0.4436754224106839
Epoch: 1, step: 1192, loss: 0.3788830637931824, mean loss: 0.4436508519296003
Epoch: 1, step: 1193, loss: 0.3869782090187073, mean loss: 0.4436293687442664
Epoch: 1, step: 1194, loss: 0.3611072599887848, mean loss: 0.44359809852495774
Epoch: 1, step: 1195, loss: 0.3750983476638794, mean loss: 0.4435721516496316
Epoch: 1, step: 1196, loss: 0.4119347631931305, mean loss: 0.4435601723279896
Epoch: 1, step: 1197, loss: 0.4229918122291565, mean loss: 0.44355238718033674
Epoch: 1, step: 1198, loss: 0.37393367290496826, mean loss: 0.44352604638795107
Epoch: 1, step: 1199, loss: 0.4287380874156952, mean loss: 0.4435204533626212
Epoch: 1, step: 1200, loss: 0.4077152907848358, mean loss: 0.44350691643915136
Epoch: 1, step: 1201, loss: 0.41884636878967285, mean loss: 0.4434975965042876
Epoch: 1, step: 1202, loss: 0.3774679899215698, mean loss: 0.4434726514319103
Epoch: 1, step: 1203, loss: 0.34808945655822754, mean loss: 0.44343663058792476
Epoch: 1, step: 1204, loss: 0.3695183992385864, mean loss: 0.4434087263858299
Epoch: 1, step: 1205, loss: 0.3864978849887848, mean loss: 0.4433872505966235
Epoch: 1, step: 1206, loss: 0.3952880799770355, mean loss: 0.4433691068129118
Epoch: 1, step: 1207, loss: 0.39136824011802673, mean loss: 0.4433494986429665
Epoch: 1, step: 1208, loss: 0.37077024579048157, mean loss: 0.44332214121633534
Epoch: 1, step: 1209, loss: 0.41535329818725586, mean loss: 0.44331160284292576
Epoch: 1, step: 1210, loss: 0.4039033055305481, mean loss: 0.4432967597930906
Epoch: 1, step: 1211, loss: 0.41229209303855896, mean loss: 0.4432850863492824
Epoch: 1, step: 1212, loss: 0.37951788306236267, mean loss: 0.44326108664913677
Epoch: 1, step: 1213, loss: 0.39656972885131836, mean loss: 0.4432435202993257
Epoch: 1, step: 1214, loss: 0.4379546344280243, mean loss: 0.4432415312486031
Epoch: 1, step: 1215, loss: 0.38050952553749084, mean loss: 0.44321794778780943
Epoch: 1, step: 1216, loss: 0.3704613745212555, mean loss: 0.44319060597147475
Epoch: 1, step: 1217, loss: 0.34172335267066956, mean loss: 0.4431524890468689
Epoch: 1, step: 1218, loss: 0.36616426706314087, mean loss: 0.44312357871191443
Epoch: 1, step: 1219, loss: 0.3393646478652954, mean loss: 0.44308463016429933
Epoch: 1, step: 1220, loss: 0.3568926453590393, mean loss: 0.44305228795611723
Epoch: 1, step: 1221, loss: 0.36504799127578735, mean loss: 0.44302302903013063
Epoch: 1, step: 1222, loss: 0.36382290720939636, mean loss: 0.44299333269648955
Epoch: 1, step: 1223, loss: 0.36700233817100525, mean loss: 0.44296485031473337
Epoch: 1, step: 1224, loss: 0.4221937358379364, mean loss: 0.44295706795636813
Epoch: 1, step: 1225, loss: 0.3619290590286255, mean loss: 0.4429267203874813
Epoch: 1, step: 1226, loss: 0.3494971692562103, mean loss: 0.44289174114707275
Epoch: 1, step: 1227, loss: 0.4225062131881714, mean loss: 0.44288411183271686
Epoch: 1, step: 1228, loss: 0.39850080013275146, mean loss: 0.4428675075260577
Epoch: 1, step: 1229, loss: 0.4321792423725128, mean loss: 0.44286351041867045
Epoch: 1, step: 1230, loss: 0.35376691818237305, mean loss: 0.44283020328138584
Epoch: 1, step: 1231, loss: 0.42889338731765747, mean loss: 0.4428249952036714
Epoch: 1, step: 1232, loss: 0.3833335340023041, mean loss: 0.44280277202055546
Epoch: 1, step: 1233, loss: 0.40228140354156494, mean loss: 0.44278764081499944
Epoch: 1, step: 1234, loss: 0.38432425260543823, mean loss: 0.4427658179750556
Epoch: 1, step: 1235, loss: 0.3920861482620239, mean loss: 0.4427469076505358
Epoch: 1, step: 1236, loss: 0.3823688328266144, mean loss: 0.442724386921396
Epoch: 1, step: 1237, loss: 0.37607428431510925, mean loss: 0.4426995360255696
Epoch: 1, step: 1238, loss: 0.4467090666294098, mean loss: 0.44270103044621956
Epoch: 1, step: 1239, loss: 0.3582679331302643, mean loss: 0.442669572511303
Epoch: 1, step: 1240, loss: 0.36474931240081787, mean loss: 0.44264055193025625
Epoch: 1, step: 1241, loss: 0.41948068141937256, mean loss: 0.4426319294914957
Epoch: 1, step: 1242, loss: 0.3704618811607361, mean loss: 0.4426050705230064
Epoch: 1, step: 1243, loss: 0.4107419550418854, mean loss: 0.4425932166854018
Epoch: 1, step: 1244, loss: 0.3888883590698242, mean loss: 0.44257324462976194
Epoch: 1, step: 1245, loss: 0.3677369952201843, mean loss: 0.4425454244626952
Epoch: 1, step: 1246, loss: 0.422220379114151, mean loss: 0.44253787149155116
Epoch: 1, step: 1247, loss: 0.3763646185398102, mean loss: 0.4425132900454324
Epoch: 1, step: 1248, loss: 0.36635372042655945, mean loss: 0.4424850094774343
Epoch: 1, step: 1249, loss: 0.35845187306404114, mean loss: 0.4424538167764642
Epoch: 1, step: 1250, loss: 0.34981727600097656, mean loss: 0.44241944329194643
Epoch: 1, step: 1251, loss: 0.40019363164901733, mean loss: 0.4424037808989038
Epoch: 1, step: 1252, loss: 0.3665587902069092, mean loss: 0.44237565891496167
Epoch: 1, step: 1253, loss: 0.37371790409088135, mean loss: 0.4423502112667689
Epoch: 1, step: 1254, loss: 0.3639122247695923, mean loss: 0.44232114939700334
Epoch: 1, step: 1255, loss: 0.41686323285102844, mean loss: 0.44231172053902335
Epoch: 1, step: 1256, loss: 0.3615664541721344, mean loss: 0.44228182595688087
Epoch: 1, step: 1257, loss: 0.3695066273212433, mean loss: 0.4422548921305908
Epoch: 1, step: 1258, loss: 0.38961443305015564, mean loss: 0.4422354173029621
Epoch: 1, step: 1259, loss: 0.3629459738731384, mean loss: 0.4422060942839422
Epoch: 1, step: 1260, loss: 0.34485283493995667, mean loss: 0.44217010416958213
Epoch: 1, step: 1261, loss: 0.43075311183929443, mean loss: 0.4421658850297705
Epoch: 1, step: 1262, loss: 0.37858089804649353, mean loss: 0.44214239593225174
Epoch: 1, step: 1263, loss: 0.4109264612197876, mean loss: 0.4421308686299207
Epoch: 1, step: 1264, loss: 0.34620365500450134, mean loss: 0.44209545806748973
Epoch: 1, step: 1265, loss: 0.4091402590274811, mean loss: 0.4420832974774381
Epoch: 1, step: 1266, loss: 0.3441801965236664, mean loss: 0.4420471841978535
Epoch: 1, step: 1267, loss: 0.3543446362018585, mean loss: 0.44201484550021486
Epoch: 1, step: 1268, loss: 0.3888172209262848, mean loss: 0.4419952370871762
Epoch: 1, step: 1269, loss: 0.3796636760234833, mean loss: 0.441972270410292
Epoch: 1, step: 1270, loss: 0.36156904697418213, mean loss: 0.44194265596335425
Epoch: 1, step: 1271, loss: 0.3480726480484009, mean loss: 0.44190809410476994
Epoch: 1, step: 1272, loss: 0.35955262184143066, mean loss: 0.4418777829261673
Epoch: 1, step: 1273, loss: 0.4127194583415985, mean loss: 0.4418670550657609
Epoch: 1, step: 1274, loss: 0.40711748600006104, mean loss: 0.44185427479026784
Epoch: 1, step: 1275, loss: 0.39594244956970215, mean loss: 0.4418373954427603
Epoch: 1, step: 1276, loss: 0.36619216203689575, mean loss: 0.4418095949159665
Epoch: 1, step: 1277, loss: 0.40451082587242126, mean loss: 0.44179589220874993
Epoch: 1, step: 1278, loss: 0.3753564953804016, mean loss: 0.4417714928709503
Epoch: 1, step: 1279, loss: 0.3827088475227356, mean loss: 0.44174981054886947
Epoch: 1, step: 1280, loss: 0.39564740657806396, mean loss: 0.4417328922354857
Epoch: 1, step: 1281, loss: 0.3815576434135437, mean loss: 0.44171081767612325
Epoch: 1, step: 1282, loss: 0.35640957951545715, mean loss: 0.4416795374274395
Epoch: 1, step: 1283, loss: 0.3570495843887329, mean loss: 0.4416485147173813
Epoch: 1, step: 1284, loss: 0.44125252962112427, mean loss: 0.44164836961474435
Epoch: 1, step: 1285, loss: 0.4131332337856293, mean loss: 0.441637924510045
Epoch: 1, step: 1286, loss: 0.35908564925193787, mean loss: 0.44160769665385385
Epoch: 1, step: 1287, loss: 0.3564651310443878, mean loss: 0.4415765317323277
Epoch: 1, step: 1288, loss: 0.41272345185279846, mean loss: 0.44156597444001905
Epoch: 1, step: 1289, loss: 0.3715616464614868, mean loss: 0.44154036934565966
Epoch: 1, step: 1290, loss: 0.33843594789505005, mean loss: 0.4415026712025333
Epoch: 1, step: 1291, loss: 0.3599417507648468, mean loss: 0.44147286092459553
Epoch: 1, step: 1292, loss: 0.38802939653396606, mean loss: 0.44145333463143127
Epoch: 1, step: 1293, loss: 0.3921988904476166, mean loss: 0.4414353454261048
Epoch: 1, step: 1294, loss: 0.3680054545402527, mean loss: 0.4414085364115426
Epoch: 1, step: 1295, loss: 0.4259549081325531, mean loss: 0.4414028964012218
Epoch: 1, step: 1296, loss: 0.3963538110256195, mean loss: 0.44138646112746205
Epoch: 1, step: 1297, loss: 0.4108758866786957, mean loss: 0.4413753340033013
Epoch: 1, step: 1298, loss: 0.34859710931777954, mean loss: 0.44134151037053226
Epoch: 1, step: 1299, loss: 0.3639625012874603, mean loss: 0.44131331102319876
Epoch: 1, step: 1300, loss: 0.36031031608581543, mean loss: 0.4412838017354256
Epoch: 1, step: 1301, loss: 0.38902008533477783, mean loss: 0.44126476906375744
Epoch: 1, step: 1302, loss: 0.3815899193286896, mean loss: 0.44124304541987863
Epoch: 1, step: 1303, loss: 0.3706887662410736, mean loss: 0.4412173706457961
Epoch: 1, step: 1304, loss: 0.36371910572052, mean loss: 0.44118917920711825
Epoch: 1, step: 1305, loss: 0.3851805329322815, mean loss: 0.4411688124266547
Epoch: 1, step: 1306, loss: 0.3487682044506073, mean loss: 0.4411352244193933
Epoch: 1, step: 1307, loss: 0.3767106235027313, mean loss: 0.441111814317316
Epoch: 1, step: 1308, loss: 0.3511667251586914, mean loss: 0.44107914265398196
Epoch: 1, step: 1309, loss: 0.35927650332450867, mean loss: 0.4410494394443489
Epoch: 1, step: 1310, loss: 0.3909871280193329, mean loss: 0.44103126800644504
Epoch: 1, step: 1311, loss: 0.3721129596233368, mean loss: 0.4410062613633452
Epoch: 1, step: 1312, loss: 0.36902663111686707, mean loss: 0.44098015340895763
Epoch: 1, step: 1313, loss: 0.36113977432250977, mean loss: 0.44095120475809235
Epoch: 1, step: 1314, loss: 0.3870527446269989, mean loss: 0.4409316692524269
Epoch: 1, step: 1315, loss: 0.4158281981945038, mean loss: 0.44092257379189864
Epoch: 1, step: 1316, loss: 0.3845284581184387, mean loss: 0.44090214854174525
Epoch: 1, step: 1317, loss: 0.39424169063568115, mean loss: 0.44088525482056273
Epoch: 1, step: 1318, loss: 0.4017500579357147, mean loss: 0.44087109079707926
Epoch: 1, step: 1319, loss: 0.42710354924201965, mean loss: 0.4408661097762562
Epoch: 1, step: 1320, loss: 0.37314918637275696, mean loss: 0.44084161902638147
Epoch: 1, step: 1321, loss: 0.34860703349113464, mean loss: 0.4408082731892393
Epoch: 1, step: 1322, loss: 0.39802131056785583, mean loss: 0.44079280988507547
Epoch: 1, step: 1323, loss: 0.5039310455322266, mean loss: 0.44081561994130636
Epoch: 1, step: 1324, loss: 0.3944694697856903, mean loss: 0.4407988824367359
Epoch: 1, step: 1325, loss: 0.3789574205875397, mean loss: 0.4407765569992452
Epoch: 1, step: 1326, loss: 0.40640974044799805, mean loss: 0.44076415468363667
Epoch: 1, step: 1327, loss: 0.3695978820323944, mean loss: 0.44073848142510447
Epoch: 1, step: 1328, loss: 0.42674118280410767, mean loss: 0.44073343371554047
Epoch: 1, step: 1329, loss: 0.38099464774131775, mean loss: 0.44071189846464853
Epoch: 1, step: 1330, loss: 0.3767356872558594, mean loss: 0.44068884397412283
Epoch: 1, step: 1331, loss: 0.3956669270992279, mean loss: 0.4406726257043552
Epoch: 1, step: 1332, loss: 0.3675909638404846, mean loss: 0.4406463089373895
Epoch: 1, step: 1333, loss: 0.36009082198143005, mean loss: 0.4406173112818978
Epoch: 1, step: 1334, loss: 0.3910527527332306, mean loss: 0.44059947588839343
Epoch: 1, step: 1335, loss: 0.3982716500759125, mean loss: 0.44058425005177027
Epoch: 1, step: 1336, loss: 0.3983524441719055, mean loss: 0.4405690642172216
Epoch: 1, step: 1337, loss: 0.39564716815948486, mean loss: 0.4405529168785955
Epoch: 1, step: 1338, loss: 0.3875754475593567, mean loss: 0.4405338807775106
Epoch: 1, step: 1339, loss: 0.4189550578594208, mean loss: 0.4405261297635314
Epoch: 1, step: 1340, loss: 0.3851128816604614, mean loss: 0.4405062327265105
Epoch: 1, step: 1341, loss: 0.3546334207057953, mean loss: 0.44047540975019295
Epoch: 1, step: 1342, loss: 0.3547959327697754, mean loss: 0.44044466720373426
Epoch: 1, step: 1343, loss: 0.38022419810295105, mean loss: 0.4404230673224212
Epoch: 1, step: 1344, loss: 0.382598340511322, mean loss: 0.44040233418265384
Epoch: 1, step: 1345, loss: 0.3694765865802765, mean loss: 0.4403769127677426
Epoch: 1, step: 1346, loss: 0.40524017810821533, mean loss: 0.4403643234683304
Epoch: 1, step: 1347, loss: 0.4221360683441162, mean loss: 0.4403577947236584
Epoch: 1, step: 1348, loss: 0.38166382908821106, mean loss: 0.44033678005640614
Epoch: 1, step: 1349, loss: 0.38005146384239197, mean loss: 0.4403152033505314
Epoch: 1, step: 1350, loss: 0.4617246985435486, mean loss: 0.4403228632772552
Epoch: 1, step: 1351, loss: 0.4205210506916046, mean loss: 0.4403157810839127
Epoch: 1, step: 1352, loss: 0.36044761538505554, mean loss: 0.44028722614444227
Epoch: 1, step: 1353, loss: 0.4061974585056305, mean loss: 0.44027504252484295
Epoch: 1, step: 1354, loss: 0.37316903471946716, mean loss: 0.4402510675309861
Epoch: 1, step: 1355, loss: 0.47325828671455383, mean loss: 0.4402628558235516
Epoch: 1, step: 1356, loss: 0.4397875666618347, mean loss: 0.44026268613802444
Epoch: 1, step: 1357, loss: 0.36158737540245056, mean loss: 0.4402346078686684
Epoch: 1, step: 1358, loss: 0.4158538579940796, mean loss: 0.44022590977738246
Epoch: 1, step: 1359, loss: 0.36008164286613464, mean loss: 0.4401973276565154
Epoch: 1, step: 1360, loss: 0.40913504362106323, mean loss: 0.4401862537584636
Epoch: 1, step: 1361, loss: 0.38996970653533936, mean loss: 0.4401683576261674
Epoch: 1, step: 1362, loss: 0.3722754716873169, mean loss: 0.440144170634383
Epoch: 1, step: 1363, loss: 0.3583035171031952, mean loss: 0.44011502510249867
Epoch: 1, step: 1364, loss: 0.47874733805656433, mean loss: 0.4401287781508981
Epoch: 1, step: 1365, loss: 0.3910253643989563, mean loss: 0.44011130362643125
Epoch: 1, step: 1366, loss: 0.3672681152820587, mean loss: 0.4400853900055332
Epoch: 1, step: 1367, loss: 0.3794833719730377, mean loss: 0.44006383879001665
Epoch: 1, step: 1368, loss: 0.4040990173816681, mean loss: 0.4400510535708882
Epoch: 1, step: 1369, loss: 0.3586592376232147, mean loss: 0.4400221296846239
Epoch: 1, step: 1370, loss: 0.39506420493125916, mean loss: 0.440006158841017
Epoch: 1, step: 1371, loss: 0.376346230506897, mean loss: 0.4399835523323756
Epoch: 1, step: 1372, loss: 0.37259069085121155, mean loss: 0.43995962870387684
Epoch: 1, step: 1373, loss: 0.41484132409095764, mean loss: 0.4399507151820128
Epoch: 1, step: 1374, loss: 0.44321393966674805, mean loss: 0.4399518727643061
Epoch: 1, step: 1375, loss: 0.38839617371559143, mean loss: 0.4399335906015229
Epoch: 1, step: 1376, loss: 0.38377517461776733, mean loss: 0.43991368332893027
Epoch: 1, step: 1377, loss: 0.336443156003952, mean loss: 0.4398770176565968
Epoch: 1, step: 1378, loss: 0.41626691818237305, mean loss: 0.43986865417821414
Epoch: 1, step: 1379, loss: 0.3932929039001465, mean loss: 0.43985216134879557
Epoch: 1, step: 1380, loss: 0.40634703636169434, mean loss: 0.4398403011275612
Epoch: 1, step: 1381, loss: 0.3685583174228668, mean loss: 0.439815077495677
Epoch: 1, step: 1382, loss: 0.37992075085639954, mean loss: 0.4397938909634381
Epoch: 1, step: 1383, loss: 0.34800633788108826, mean loss: 0.43976143426149955
Epoch: 1, step: 1384, loss: 0.43968358635902405, mean loss: 0.4397614067436832
Epoch: 1, step: 1385, loss: 0.42698895931243896, mean loss: 0.4397568935113753
Epoch: 1, step: 1386, loss: 0.36310097575187683, mean loss: 0.4397298161826012
Epoch: 1, step: 1387, loss: 0.3653744161128998, mean loss: 0.4397035607447235
Epoch: 1, step: 1388, loss: 0.39116331934928894, mean loss: 0.43968642687907034
Epoch: 1, step: 1389, loss: 0.3958588242530823, mean loss: 0.4396709619522439
Epoch: 1, step: 1390, loss: 0.3779892325401306, mean loss: 0.4396492047284654
Epoch: 1, step: 1391, loss: 0.35907265543937683, mean loss: 0.4396207926871082
Epoch: 1, step: 1392, loss: 0.4414421319961548, mean loss: 0.4396214346819298
Epoch: 1, step: 1393, loss: 0.3668699562549591, mean loss: 0.43959579991151865
Epoch: 1, step: 1394, loss: 0.392939954996109, mean loss: 0.43957936601052694
Epoch: 1, step: 1395, loss: 0.42694327235221863, mean loss: 0.439574916681774
Epoch: 1, step: 1396, loss: 0.351759672164917, mean loss: 0.43954400670482335
Epoch: 1, step: 1397, loss: 0.4330277144908905, mean loss: 0.4395417138504201
Epoch: 1, step: 1398, loss: 0.35079172253608704, mean loss: 0.43951049682920507
Epoch: 1, step: 1399, loss: 0.34928029775619507, mean loss: 0.43947877031757604
Epoch: 1, step: 1400, loss: 0.40286725759506226, mean loss: 0.4394659015960567
Epoch: 1, step: 1401, loss: 0.3793959319591522, mean loss: 0.4394447947901407
Epoch: 1, step: 1402, loss: 0.3754386007785797, mean loss: 0.43942231281121147
Epoch: 1, step: 1403, loss: 0.35412880778312683, mean loss: 0.43939236424905276
Epoch: 1, step: 1404, loss: 0.3953493535518646, mean loss: 0.4393769051368389
Epoch: 1, step: 1405, loss: 0.3496696650981903, mean loss: 0.43934542891226397
Epoch: 1, step: 1406, loss: 0.39692869782447815, mean loss: 0.43933055106902025
Epoch: 1, step: 1407, loss: 0.35827159881591797, mean loss: 0.43930212927650514
Epoch: 1, step: 1408, loss: 0.39057835936546326, mean loss: 0.4392850511938164
Epoch: 1, step: 1409, loss: 0.3700660467147827, mean loss: 0.43926079786358546
Epoch: 1, step: 1410, loss: 0.41848132014274597, mean loss: 0.4392535195876762
Epoch: 1, step: 1411, loss: 0.41054853796958923, mean loss: 0.43924346882380433
Epoch: 1, step: 1412, loss: 0.38658076524734497, mean loss: 0.43922503595590917
Epoch: 1, step: 1413, loss: 0.36728236079216003, mean loss: 0.43919986357131724
Epoch: 1, step: 1414, loss: 0.4212620258331299, mean loss: 0.43919358940631614
Epoch: 1, step: 1415, loss: 0.44470465183258057, mean loss: 0.43919551635122045
Epoch: 1, step: 1416, loss: 0.3559734523296356, mean loss: 0.43916642789822447
Epoch: 1, step: 1417, loss: 0.4157072603702545, mean loss: 0.4391582311241057
Epoch: 1, step: 1418, loss: 0.35740575194358826, mean loss: 0.4391296762937946
Epoch: 1, step: 1419, loss: 0.37929749488830566, mean loss: 0.4391087851690022
Epoch: 1, step: 1420, loss: 0.38273343443870544, mean loss: 0.4390891079087124
Epoch: 1, step: 1421, loss: 0.3849892020225525, mean loss: 0.4390702314586475
Epoch: 1, step: 1422, loss: 0.39385876059532166, mean loss: 0.4390544618489986
Epoch: 1, step: 1423, loss: 0.4133661985397339, mean loss: 0.4390455049928936
Epoch: 1, step: 1424, loss: 0.36954474449157715, mean loss: 0.43902128025936227
Epoch: 1, step: 1425, loss: 0.42550143599510193, mean loss: 0.43901656951223184
Epoch: 1, step: 1426, loss: 0.38199925422668457, mean loss: 0.43899670977162386
Epoch: 1, step: 1427, loss: 0.37797680497169495, mean loss: 0.43897546328666565
Epoch: 1, step: 1428, loss: 0.4139550030231476, mean loss: 0.43896675445956385
Epoch: 1, step: 1429, loss: 0.4353088140487671, mean loss: 0.4389654816897619
Epoch: 1, step: 1430, loss: 0.38060882687568665, mean loss: 0.43894518372287006
Epoch: 1, step: 1431, loss: 0.39037221670150757, mean loss: 0.4389282946522785
Epoch: 1, step: 1432, loss: 0.3611300587654114, mean loss: 0.4389012532077575
Epoch: 1, step: 1433, loss: 0.3732679486274719, mean loss: 0.43887844802895964
Epoch: 1, step: 1434, loss: 0.3653847873210907, mean loss: 0.4388529205330556
Epoch: 1, step: 1435, loss: 0.4274373948574066, mean loss: 0.43884895680886266
Epoch: 1, step: 1436, loss: 0.3604269027709961, mean loss: 0.438821736380526
Epoch: 1, step: 1437, loss: 0.38038092851638794, mean loss: 0.4388014585152019
Epoch: 1, step: 1438, loss: 0.33537405729293823, mean loss: 0.43876558359282164
Epoch: 1, step: 1439, loss: 0.377123087644577, mean loss: 0.43874420963444843
Epoch: 1, step: 1440, loss: 0.3739260137081146, mean loss: 0.43872174232216893
Epoch: 1, step: 1441, loss: 0.38672494888305664, mean loss: 0.43870372541522534
Epoch: 1, step: 1442, loss: 0.3667431175708771, mean loss: 0.43867879967645
Epoch: 1, step: 1443, loss: 0.40042707324028015, mean loss: 0.4386655546188198
Valid: 1, mean loss: 0.25337474048137665
Epoch: 2, step: 0, loss: 0.39636358618736267, mean loss: 0.4386509121929176
Epoch: 2, step: 1, loss: 0.40299350023269653, mean loss: 0.43863857398808703
Epoch: 2, step: 2, loss: 0.3842960000038147, mean loss: 0.4386197768334747
Epoch: 2, step: 3, loss: 0.34633100032806396, mean loss: 0.43858786508502884
Epoch: 2, step: 4, loss: 0.4134473502635956, mean loss: 0.4385791749658372
Epoch: 2, step: 5, loss: 0.4083612561225891, mean loss: 0.4385687333905631
Epoch: 2, step: 6, loss: 0.3559975326061249, mean loss: 0.4385402113868379
Epoch: 2, step: 7, loss: 0.3670979142189026, mean loss: 0.43851554208532967
Epoch: 2, step: 8, loss: 0.41555967926979065, mean loss: 0.4385076180733119
Epoch: 2, step: 9, loss: 0.39533036947250366, mean loss: 0.43849271909173815
Epoch: 2, step: 10, loss: 0.3816137909889221, mean loss: 0.438473098902672
Epoch: 2, step: 11, loss: 0.4424259662628174, mean loss: 0.43847446196038237
Epoch: 2, step: 12, loss: 0.3952575623989105, mean loss: 0.4384595647182033
Epoch: 2, step: 13, loss: 0.3677902817726135, mean loss: 0.4384352127943764
Epoch: 2, step: 14, loss: 0.38900163769721985, mean loss: 0.4384181843496306
Epoch: 2, step: 15, loss: 0.4196925163269043, mean loss: 0.4384117361168404
Epoch: 2, step: 16, loss: 0.37416872382164, mean loss: 0.43838962148265964
Epoch: 2, step: 17, loss: 0.3788583278656006, mean loss: 0.43836913583447756
Epoch: 2, step: 18, loss: 0.3711008131504059, mean loss: 0.43834599571659516
Epoch: 2, step: 19, loss: 0.35986462235450745, mean loss: 0.4383190076239672
Epoch: 2, step: 20, loss: 0.4013804793357849, mean loss: 0.4383063096080551
Epoch: 2, step: 21, loss: 0.38601386547088623, mean loss: 0.43828833969598047
Epoch: 2, step: 22, loss: 0.45973846316337585, mean loss: 0.43829570834024956
Epoch: 2, step: 23, loss: 0.37183764576911926, mean loss: 0.4382728862033776
Epoch: 2, step: 24, loss: 0.3757774531841278, mean loss: 0.4382514322270579
Epoch: 2, step: 25, loss: 0.3638010621070862, mean loss: 0.4382258830266049
Epoch: 2, step: 26, loss: 0.46161434054374695, mean loss: 0.4382339065111734
Epoch: 2, step: 27, loss: 0.3905092775821686, mean loss: 0.43821754004034724
Epoch: 2, step: 28, loss: 0.4256846606731415, mean loss: 0.43821324354416374
Epoch: 2, step: 29, loss: 0.36231210827827454, mean loss: 0.4381872321886922
Epoch: 2, step: 30, loss: 0.4105781614780426, mean loss: 0.43817777378831174
Epoch: 2, step: 31, loss: 0.35068750381469727, mean loss: 0.4381478113670879
Epoch: 2, step: 32, loss: 0.40705645084381104, mean loss: 0.4381371672861145
Epoch: 2, step: 33, loss: 0.3711233139038086, mean loss: 0.4381142330447106
Epoch: 2, step: 34, loss: 0.3876303732395172, mean loss: 0.43809696179606017
Epoch: 2, step: 35, loss: 0.3919042646884918, mean loss: 0.4380811640200316
Epoch: 2, step: 36, loss: 0.36092913150787354, mean loss: 0.4380547872567796
Epoch: 2, step: 37, loss: 0.3819321095943451, mean loss: 0.4380356065740515
Epoch: 2, step: 38, loss: 0.40815407037734985, mean loss: 0.43802539764470516
Epoch: 2, step: 39, loss: 0.37137463688850403, mean loss: 0.438002634406742
Epoch: 2, step: 40, loss: 0.3421685993671417, mean loss: 0.43796991537804975
Epoch: 2, step: 41, loss: 0.4381093680858612, mean loss: 0.4379699629728306
Epoch: 2, step: 42, loss: 0.3768565356731415, mean loss: 0.4379491122640965
Epoch: 2, step: 43, loss: 0.4224224090576172, mean loss: 0.43794381666273
Epoch: 2, step: 44, loss: 0.38769596815109253, mean loss: 0.4379266847675675
Epoch: 2, step: 45, loss: 0.36918914318084717, mean loss: 0.437903256839283
Epoch: 2, step: 46, loss: 0.357915997505188, mean loss: 0.43787600394002096
Epoch: 2, step: 47, loss: 0.4000018537044525, mean loss: 0.4378631040250906
Epoch: 2, step: 48, loss: 0.38653454184532166, mean loss: 0.43784562749728
Epoch: 2, step: 49, loss: 0.3450320065021515, mean loss: 0.4378140367481326
Epoch: 2, step: 50, loss: 0.36770254373550415, mean loss: 0.4377901811873933
Epoch: 2, step: 51, loss: 0.424882709980011, mean loss: 0.4377857908910643
Epoch: 2, step: 52, loss: 0.36626920104026794, mean loss: 0.43776147379148905
Epoch: 2, step: 53, loss: 0.39707595109939575, mean loss: 0.4377476445859513
Epoch: 2, step: 54, loss: 0.41212713718414307, mean loss: 0.4377389390108912
Epoch: 2, step: 55, loss: 0.4048454463481903, mean loss: 0.43772776594952484
Epoch: 2, step: 56, loss: 0.3292236626148224, mean loss: 0.4376909224509392
Epoch: 2, step: 57, loss: 0.37572380900382996, mean loss: 0.43766988812865576
Epoch: 2, step: 58, loss: 0.3971104025840759, mean loss: 0.4376561251542599
Epoch: 2, step: 59, loss: 0.37450283765792847, mean loss: 0.4376347027365203
Epoch: 2, step: 60, loss: 0.36740967631340027, mean loss: 0.4376108895705579
Epoch: 2, step: 61, loss: 0.38266775012016296, mean loss: 0.43759226477752383
Epoch: 2, step: 62, loss: 0.4139636754989624, mean loss: 0.4375842578004725
Epoch: 2, step: 63, loss: 0.3814835846424103, mean loss: 0.4375652535073973
Epoch: 2, step: 64, loss: 0.3802998661994934, mean loss: 0.43754586123265704
Epoch: 2, step: 65, loss: 0.3491087853908539, mean loss: 0.4375159231568812
Epoch: 2, step: 66, loss: 0.36346638202667236, mean loss: 0.43749086409050886
Epoch: 2, step: 67, loss: 0.4193061888217926, mean loss: 0.43748471230591185
Epoch: 2, step: 68, loss: 0.3866674304008484, mean loss: 0.4374675268876146
Epoch: 2, step: 69, loss: 0.4006785452365875, mean loss: 0.4374550897741423
Epoch: 2, step: 70, loss: 0.4433848559856415, mean loss: 0.43745709375055714
Epoch: 2, step: 71, loss: 0.3510567247867584, mean loss: 0.43742790443671803
Epoch: 2, step: 72, loss: 0.38173359632492065, mean loss: 0.43740909514657556
Epoch: 2, step: 73, loss: 0.42229539155960083, mean loss: 0.43740399261329166
Epoch: 2, step: 74, loss: 0.39630335569381714, mean loss: 0.4373901213217225
Epoch: 2, step: 75, loss: 0.3633936047554016, mean loss: 0.43736515623516165
Epoch: 2, step: 76, loss: 0.3976714015007019, mean loss: 0.43735176879680265
Epoch: 2, step: 77, loss: 0.3789384365081787, mean loss: 0.43733207448382605
Epoch: 2, step: 78, loss: 0.3532961905002594, mean loss: 0.43730375096377766
Epoch: 2, step: 79, loss: 0.44126901030540466, mean loss: 0.43730508696759895
Epoch: 2, step: 80, loss: 0.37780311703681946, mean loss: 0.4372850458864502
Epoch: 2, step: 81, loss: 0.40676867961883545, mean loss: 0.437274771015653
Epoch: 2, step: 82, loss: 0.35388070344924927, mean loss: 0.4372467016559874
Epoch: 2, step: 83, loss: 0.4115908145904541, mean loss: 0.4372380691233274
Epoch: 2, step: 84, loss: 0.39946699142456055, mean loss: 0.43722536442178056
Epoch: 2, step: 85, loss: 0.3577369451522827, mean loss: 0.4371986366412595
Epoch: 2, step: 86, loss: 0.3937147557735443, mean loss: 0.43718402021071573
Epoch: 2, step: 87, loss: 0.3792586624622345, mean loss: 0.43716455604480564
Epoch: 2, step: 88, loss: 0.3669447898864746, mean loss: 0.43714096861915624
Epoch: 2, step: 89, loss: 0.4443984627723694, mean loss: 0.43714340565547366
Epoch: 2, step: 90, loss: 0.37123364210128784, mean loss: 0.4371212808607257
Epoch: 2, step: 91, loss: 0.41410866379737854, mean loss: 0.43711355850600647
Epoch: 2, step: 92, loss: 0.34906771779060364, mean loss: 0.4370840228331734
Epoch: 2, step: 93, loss: 0.3690793514251709, mean loss: 0.43706121777904594
Epoch: 2, step: 94, loss: 0.36955106258392334, mean loss: 0.43703858614807206
Epoch: 2, step: 95, loss: 0.3565656840801239, mean loss: 0.4370116180173522
Epoch: 2, step: 96, loss: 0.36228954792022705, mean loss: 0.4369865854980567
Epoch: 2, step: 97, loss: 0.4390549659729004, mean loss: 0.43698727819078104
Epoch: 2, step: 98, loss: 0.3663908541202545, mean loss: 0.43696364363300716
Epoch: 2, step: 99, loss: 0.39135807752609253, mean loss: 0.4369483807260102
Epoch: 2, step: 100, loss: 0.3355581760406494, mean loss: 0.4369144596137033
Epoch: 2, step: 101, loss: 0.34474536776542664, mean loss: 0.43688363383047646
Epoch: 2, step: 102, loss: 0.3409024775028229, mean loss: 0.43685154384173436
Epoch: 2, step: 103, loss: 0.3647254407405853, mean loss: 0.43682743752385295
Epoch: 2, step: 104, loss: 0.38403305411338806, mean loss: 0.43680979823771515
Epoch: 2, step: 105, loss: 0.39198797941207886, mean loss: 0.4367948276903452
Epoch: 2, step: 106, loss: 0.37500476837158203, mean loss: 0.43677419661878636
Epoch: 2, step: 107, loss: 0.377583384513855, mean loss: 0.4367544400059342
Epoch: 2, step: 108, loss: 0.3654176890850067, mean loss: 0.4367306372862409
Epoch: 2, step: 109, loss: 0.3947688341140747, mean loss: 0.436716640687451
Epoch: 2, step: 110, loss: 0.43042051792144775, mean loss: 0.4367145412800598
Epoch: 2, step: 111, loss: 0.4039420783519745, mean loss: 0.43670361712575045
Epoch: 2, step: 112, loss: 0.4842870831489563, mean loss: 0.4367194729958015
Epoch: 2, step: 113, loss: 0.4508180022239685, mean loss: 0.436724169374625
Epoch: 2, step: 114, loss: 0.36692318320274353, mean loss: 0.436700925622986
Epoch: 2, step: 115, loss: 0.3569345474243164, mean loss: 0.43667437223477074
Epoch: 2, step: 116, loss: 0.377297580242157, mean loss: 0.43665461290299284
Epoch: 2, step: 117, loss: 0.42214569449424744, mean loss: 0.43664978625016226
Epoch: 2, step: 118, loss: 0.44105514883995056, mean loss: 0.43665125128594207
Epoch: 2, step: 119, loss: 0.4095993936061859, mean loss: 0.43664225798219214
Epoch: 2, step: 120, loss: 0.35353827476501465, mean loss: 0.43661463950987006
Epoch: 2, step: 121, loss: 0.35134631395339966, mean loss: 0.4365863111625091
Epoch: 2, step: 122, loss: 0.35239914059638977, mean loss: 0.43655835129184617
Epoch: 2, step: 123, loss: 0.3544652760028839, mean loss: 0.43653109595476486
Epoch: 2, step: 124, loss: 0.4383316934108734, mean loss: 0.4365316935642757
Epoch: 2, step: 125, loss: 0.3613067865371704, mean loss: 0.4365067350682481
Epoch: 2, step: 126, loss: 0.37079790234565735, mean loss: 0.4364849410938791
Epoch: 2, step: 127, loss: 0.36035895347595215, mean loss: 0.43645970038180415
Epoch: 2, step: 128, loss: 0.3753010332584381, mean loss: 0.4364394290304209
Epoch: 2, step: 129, loss: 0.38188689947128296, mean loss: 0.4364213533082343
Epoch: 2, step: 130, loss: 0.38268953561782837, mean loss: 0.4364035554222818
Epoch: 2, step: 131, loss: 0.3827655017375946, mean loss: 0.4363857944773531
Epoch: 2, step: 132, loss: 0.4165896475315094, mean loss: 0.43637924163162456
Epoch: 2, step: 133, loss: 0.35986313223838806, mean loss: 0.43635392193956857
Epoch: 2, step: 134, loss: 0.367948055267334, mean loss: 0.43633129346895255
Epoch: 2, step: 135, loss: 0.3900204002857208, mean loss: 0.43631597902014857
Epoch: 2, step: 136, loss: 0.3633767068386078, mean loss: 0.4362918668640555
Epoch: 2, step: 137, loss: 0.3895324468612671, mean loss: 0.4362764143128319
Epoch: 2, step: 138, loss: 0.42548227310180664, mean loss: 0.43627284835934294
Epoch: 2, step: 139, loss: 0.3727959990501404, mean loss: 0.4362518850669687
Epoch: 2, step: 140, loss: 0.3397446572780609, mean loss: 0.43622002398153165
Epoch: 2, step: 141, loss: 0.37027281522750854, mean loss: 0.4361982592261673
Epoch: 2, step: 142, loss: 0.36758938431739807, mean loss: 0.43617562350366357
Epoch: 2, step: 143, loss: 0.3830569386482239, mean loss: 0.43615810414850015
Epoch: 2, step: 144, loss: 0.3944012224674225, mean loss: 0.4361443366306363
Epoch: 2, step: 145, loss: 0.3899643123149872, mean loss: 0.4361291157920352
Epoch: 2, step: 146, loss: 0.3923642933368683, mean loss: 0.43611469575168754
Epoch: 2, step: 147, loss: 0.41930878162384033, mean loss: 0.43610916020684964
Epoch: 2, step: 148, loss: 0.3691595792770386, mean loss: 0.4360871155638039
Epoch: 2, step: 149, loss: 0.323593407869339, mean loss: 0.4360500866935951
Epoch: 2, step: 150, loss: 0.4359268546104431, mean loss: 0.4360500461433867
Epoch: 2, step: 151, loss: 0.3939233124256134, mean loss: 0.43603618866519006
Epoch: 2, step: 152, loss: 0.37694740295410156, mean loss: 0.43601675795630773
Epoch: 2, step: 153, loss: 0.44479089975357056, mean loss: 0.4360196422895744
Epoch: 2, step: 154, loss: 0.4282453954219818, mean loss: 0.43601708749270696
Epoch: 2, step: 155, loss: 0.3782314956188202, mean loss: 0.43599810405253814
Epoch: 2, step: 156, loss: 0.40624940395355225, mean loss: 0.43598833436449247
Epoch: 2, step: 157, loss: 0.3824506402015686, mean loss: 0.43597075797113627
Epoch: 2, step: 158, loss: 0.34847068786621094, mean loss: 0.4359420411775344
Epoch: 2, step: 159, loss: 0.3807234466075897, mean loss: 0.4359239248407332
Epoch: 2, step: 160, loss: 0.37125763297080994, mean loss: 0.4359027158240491
Epoch: 2, step: 161, loss: 0.38037607073783875, mean loss: 0.4358845103666438
Epoch: 2, step: 162, loss: 0.4214765429496765, mean loss: 0.4358797879912203
Epoch: 2, step: 163, loss: 0.39084360003471375, mean loss: 0.43586503170420965
Epoch: 2, step: 164, loss: 0.3817330598831177, mean loss: 0.43584730095680674
Epoch: 2, step: 165, loss: 0.40195345878601074, mean loss: 0.43583620277665913
Epoch: 2, step: 166, loss: 0.4258873760700226, mean loss: 0.43583294620490576
Epoch: 2, step: 167, loss: 0.38808196783065796, mean loss: 0.4358173208847571
Epoch: 2, step: 168, loss: 0.3835318684577942, mean loss: 0.43580021736744373
Epoch: 2, step: 169, loss: 0.3641471564769745, mean loss: 0.43577678601986675
Epoch: 2, step: 170, loss: 0.35994163155555725, mean loss: 0.4357519951880706
Epoch: 2, step: 171, loss: 0.3702569901943207, mean loss: 0.43573059159166744
Epoch: 2, step: 172, loss: 0.40904152393341064, mean loss: 0.43572187252350075
Epoch: 2, step: 173, loss: 0.37036994099617004, mean loss: 0.43570052963273415
Epoch: 2, step: 174, loss: 0.40155941247940063, mean loss: 0.43568938333265145
Epoch: 2, step: 175, loss: 0.4138548672199249, mean loss: 0.43568225718509507
Epoch: 2, step: 176, loss: 0.42025911808013916, mean loss: 0.43567722516581125
Epoch: 2, step: 177, loss: 0.4014430344104767, mean loss: 0.4356660594154018
Epoch: 2, step: 178, loss: 0.37944352626800537, mean loss: 0.4356477279732279
Epoch: 2, step: 179, loss: 0.360101580619812, mean loss: 0.4356231040660071
Epoch: 2, step: 180, loss: 0.3763144910335541, mean loss: 0.4356037790047388
Epoch: 2, step: 181, loss: 0.332987904548645, mean loss: 0.43557035363846647
Epoch: 2, step: 182, loss: 0.38429781794548035, mean loss: 0.4355536579251181
Epoch: 2, step: 183, loss: 0.37082740664482117, mean loss: 0.43553258818186275
Epoch: 2, step: 184, loss: 0.3815734386444092, mean loss: 0.43551502907039596
Epoch: 2, step: 185, loss: 0.34823524951934814, mean loss: 0.43548663616878536
Epoch: 2, step: 186, loss: 0.38153281807899475, mean loss: 0.435469090211683
Epoch: 2, step: 187, loss: 0.3437570333480835, mean loss: 0.4354392748485934
Epoch: 2, step: 188, loss: 0.35575583577156067, mean loss: 0.4354133783783051
Epoch: 2, step: 189, loss: 0.3558137118816376, mean loss: 0.4353875175379878
Epoch: 2, step: 190, loss: 0.3830357491970062, mean loss: 0.4353705146901993
Epoch: 2, step: 191, loss: 0.35210078954696655, mean loss: 0.43534347906515275
Epoch: 2, step: 192, loss: 0.4208700358867645, mean loss: 0.4353387814204989
Epoch: 2, step: 193, loss: 0.3948342502117157, mean loss: 0.43532563913263106
Epoch: 2, step: 194, loss: 0.3689446747303009, mean loss: 0.4353041078434963
Epoch: 2, step: 195, loss: 0.35727229714393616, mean loss: 0.43527880569994915
Epoch: 2, step: 196, loss: 0.3571334779262543, mean loss: 0.4352534749616108
Epoch: 2, step: 197, loss: 0.36092326045036316, mean loss: 0.4352293886963771
Epoch: 2, step: 198, loss: 0.40806853771209717, mean loss: 0.435220590234769
Epoch: 2, step: 199, loss: 0.3760714530944824, mean loss: 0.4352014357214464
Epoch: 2, step: 200, loss: 0.3474571108818054, mean loss: 0.4351730303071247
Epoch: 2, step: 201, loss: 0.35789623856544495, mean loss: 0.4351480216366581
Epoch: 2, step: 202, loss: 0.450613796710968, mean loss: 0.43515302512260906
Epoch: 2, step: 203, loss: 0.38031846284866333, mean loss: 0.4351352907881091
Epoch: 2, step: 204, loss: 0.39301732182502747, mean loss: 0.43512167359801435
Epoch: 2, step: 205, loss: 0.4671907126903534, mean loss: 0.4351320385104553
Epoch: 2, step: 206, loss: 0.3844850957393646, mean loss: 0.4351156743932433
Epoch: 2, step: 207, loss: 0.38576892018318176, mean loss: 0.43509973551914444
Epoch: 2, step: 208, loss: 0.35844656825065613, mean loss: 0.43507498473862505
Epoch: 2, step: 209, loss: 0.41446706652641296, mean loss: 0.4350683327314552
Epoch: 2, step: 210, loss: 0.3921123147010803, mean loss: 0.435054471480074
Epoch: 2, step: 211, loss: 0.38425007462501526, mean loss: 0.43503808296495944
Epoch: 2, step: 212, loss: 0.36634668707847595, mean loss: 0.4350159315957603
Epoch: 2, step: 213, loss: 0.3841581344604492, mean loss: 0.43499953643227374
Epoch: 2, step: 214, loss: 0.38937807083129883, mean loss: 0.4349848340585706
Epoch: 2, step: 215, loss: 0.38258326053619385, mean loss: 0.43496795210833783
Epoch: 2, step: 216, loss: 0.37674736976623535, mean loss: 0.43494920151821154
Epoch: 2, step: 217, loss: 0.395298570394516, mean loss: 0.43493643570007773
Epoch: 2, step: 218, loss: 0.37830284237861633, mean loss: 0.43491820795842295
Epoch: 2, step: 219, loss: 0.40325114130973816, mean loss: 0.43490801906953985
Epoch: 2, step: 220, loss: 0.3661949336528778, mean loss: 0.43488591772331386
Epoch: 2, step: 221, loss: 0.38189730048179626, mean loss: 0.43486887958272175
Epoch: 2, step: 222, loss: 0.3915384113788605, mean loss: 0.4348549514347938
Epoch: 2, step: 223, loss: 0.3777683675289154, mean loss: 0.43483660741682917
Epoch: 2, step: 224, loss: 0.3906722962856293, mean loss: 0.434822420358965
Epoch: 2, step: 225, loss: 0.39157840609550476, mean loss: 0.434808533392278
Epoch: 2, step: 226, loss: 0.436123788356781, mean loss: 0.4348089556250114
Epoch: 2, step: 227, loss: 0.39922234416007996, mean loss: 0.4347975350179944
Epoch: 2, step: 228, loss: 0.40236467123031616, mean loss: 0.4347871298643891
Epoch: 2, step: 229, loss: 0.3655734956264496, mean loss: 0.43476493177771885
Epoch: 2, step: 230, loss: 0.44391629099845886, mean loss: 0.43476786584608074
Epoch: 2, step: 231, loss: 0.3540887236595154, mean loss: 0.43474200714666195
Epoch: 2, step: 232, loss: 0.4101846218109131, mean loss: 0.4347341387117578
Epoch: 2, step: 233, loss: 0.34114691615104675, mean loss: 0.4347041620229171
Epoch: 2, step: 234, loss: 0.4027608633041382, mean loss: 0.43469393362115
Epoch: 2, step: 235, loss: 0.3391254246234894, mean loss: 0.4346633419089228
Epoch: 2, step: 236, loss: 0.3617557883262634, mean loss: 0.43464001149177633
Epoch: 2, step: 237, loss: 0.3329974412918091, mean loss: 0.434607496274182
Epoch: 2, step: 238, loss: 0.36830776929855347, mean loss: 0.4345862939310494
Epoch: 2, step: 239, loss: 0.38136178255081177, mean loss: 0.43456927842229615
Epoch: 2, step: 240, loss: 0.46078822016716003, mean loss: 0.43457765775810464
Epoch: 2, step: 241, loss: 0.39112961292266846, mean loss: 0.4345637765936205
Epoch: 2, step: 242, loss: 0.43707454204559326, mean loss: 0.434564578498907
Epoch: 2, step: 243, loss: 0.4046674966812134, mean loss: 0.43455503281505714
Epoch: 2, step: 244, loss: 0.36896073818206787, mean loss: 0.43453409623841077
Epoch: 2, step: 245, loss: 0.4167221188545227, mean loss: 0.4345284127740254
Epoch: 2, step: 246, loss: 0.4016667306423187, mean loss: 0.43451793057876803
Epoch: 2, step: 247, loss: 0.40989401936531067, mean loss: 0.4345100785662637
Epoch: 2, step: 248, loss: 0.368431955575943, mean loss: 0.43448901445310134
Epoch: 2, step: 249, loss: 0.3920806646347046, mean loss: 0.43447550000127905
Epoch: 2, step: 250, loss: 0.3725517690181732, mean loss: 0.43445577278529207
Epoch: 2, step: 251, loss: 0.3976903259754181, mean loss: 0.43444406404426983
Epoch: 2, step: 252, loss: 0.4020380973815918, mean loss: 0.43443374695841735
Epoch: 2, step: 253, loss: 0.3858972191810608, mean loss: 0.4344182993047645
Epoch: 2, step: 254, loss: 0.3876163363456726, mean loss: 0.43440340844795283
Epoch: 2, step: 255, loss: 0.39674901962280273, mean loss: 0.4343914318611764
Epoch: 2, step: 256, loss: 0.41954490542411804, mean loss: 0.4343867111850438
Epoch: 2, step: 257, loss: 0.37474966049194336, mean loss: 0.434367754716292
Epoch: 2, step: 258, loss: 0.36259135603904724, mean loss: 0.43434494683619124
Epoch: 2, step: 259, loss: 0.3842054009437561, mean loss: 0.4343290194073817
Epoch: 2, step: 260, loss: 0.3667067289352417, mean loss: 0.4343075451963712
Epoch: 2, step: 261, loss: 0.35458284616470337, mean loss: 0.4342822357681072
Epoch: 2, step: 262, loss: 0.3345406651496887, mean loss: 0.4342505818263051
Epoch: 2, step: 263, loss: 0.32869598269462585, mean loss: 0.4342170936920628
Epoch: 2, step: 264, loss: 0.3398747444152832, mean loss: 0.43418717223653575
Epoch: 2, step: 265, loss: 0.4144698977470398, mean loss: 0.43418092072274705
Epoch: 2, step: 266, loss: 0.4053907096385956, mean loss: 0.43417179545774415
Epoch: 2, step: 267, loss: 0.3669764995574951, mean loss: 0.43415050417260465
Epoch: 2, step: 268, loss: 0.39766398072242737, mean loss: 0.43413894683226567
Epoch: 2, step: 269, loss: 0.36883750557899475, mean loss: 0.4341182687318055
Epoch: 2, step: 270, loss: 0.36964595317840576, mean loss: 0.4340978596417284
Epoch: 2, step: 271, loss: 0.4022595286369324, mean loss: 0.43408778422052435
Epoch: 2, step: 272, loss: 0.4077318608760834, mean loss: 0.4340794463770114
Epoch: 2, step: 273, loss: 0.3907596170902252, mean loss: 0.43406574624124705
Epoch: 2, step: 274, loss: 0.403030127286911, mean loss: 0.43405593415811256
Epoch: 2, step: 275, loss: 0.39826735854148865, mean loss: 0.4340446229774499
Epoch: 2, step: 276, loss: 0.37049099802970886, mean loss: 0.4340245428431852
Epoch: 2, step: 277, loss: 0.3841227889060974, mean loss: 0.4340087810763068
Epoch: 2, step: 278, loss: 0.36098286509513855, mean loss: 0.43398572268793256
Epoch: 2, step: 279, loss: 0.3405955731868744, mean loss: 0.4339562434740749
Epoch: 2, step: 280, loss: 0.3776627480983734, mean loss: 0.4339384796699172
Epoch: 2, step: 281, loss: 0.38159963488578796, mean loss: 0.4339219689933292
Epoch: 2, step: 282, loss: 0.37920916080474854, mean loss: 0.43390471487532584
Epoch: 2, step: 283, loss: 0.37462374567985535, mean loss: 0.43388602604518856
Epoch: 2, step: 284, loss: 0.4646037817001343, mean loss: 0.4338957070271157
Epoch: 2, step: 285, loss: 0.41700658202171326, mean loss: 0.4338903859417328
Epoch: 2, step: 286, loss: 0.3695391118526459, mean loss: 0.43387011782390944
Epoch: 2, step: 287, loss: 0.4067797362804413, mean loss: 0.43386158810679876
Epoch: 2, step: 288, loss: 0.3831939697265625, mean loss: 0.43384563984794444
Epoch: 2, step: 289, loss: 0.34606093168258667, mean loss: 0.4338180172210831
Epoch: 2, step: 290, loss: 0.35059067606925964, mean loss: 0.4337918368684087
Epoch: 2, step: 291, loss: 0.42894837260246277, mean loss: 0.4337903137664383
Epoch: 2, step: 292, loss: 0.3447096645832062, mean loss: 0.43376230978995817
Epoch: 2, step: 293, loss: 0.3586162328720093, mean loss: 0.43373869380098334
Epoch: 2, step: 294, loss: 0.38717159628868103, mean loss: 0.433724063861457
Epoch: 2, step: 295, loss: 0.4154207408428192, mean loss: 0.4337183153303582
Epoch: 2, step: 296, loss: 0.44562605023384094, mean loss: 0.4337220540226356
Epoch: 2, step: 297, loss: 0.3809654116630554, mean loss: 0.4337054951267286
Epoch: 2, step: 298, loss: 0.37005308270454407, mean loss: 0.43368552260949544
Epoch: 2, step: 299, loss: 0.34973040223121643, mean loss: 0.4336591878791384
Epoch: 2, step: 300, loss: 0.36892226338386536, mean loss: 0.4336388878087416
Epoch: 2, step: 301, loss: 0.41385728120803833, mean loss: 0.43363268667814575
Epoch: 2, step: 302, loss: 0.3534851372241974, mean loss: 0.43360756992808186
Epoch: 2, step: 303, loss: 0.38222238421440125, mean loss: 0.43359147181225677
Epoch: 2, step: 304, loss: 0.38129696249961853, mean loss: 0.4335750939515262
Epoch: 2, step: 305, loss: 0.4624496102333069, mean loss: 0.4335841341883082
Epoch: 2, step: 306, loss: 0.35414496064186096, mean loss: 0.4335592705972139
Epoch: 2, step: 307, loss: 0.36825883388519287, mean loss: 0.4335388386708334
Epoch: 2, step: 308, loss: 0.3415290415287018, mean loss: 0.4335100586279363
Epoch: 2, step: 309, loss: 0.3775445818901062, mean loss: 0.43349255847886253
Epoch: 2, step: 310, loss: 0.3674832582473755, mean loss: 0.4334719241243044
Epoch: 2, step: 311, loss: 0.35648393630981445, mean loss: 0.43344786537811236
Epoch: 2, step: 312, loss: 0.38457903265953064, mean loss: 0.43343259863874384
Epoch: 2, step: 313, loss: 0.4114239513874054, mean loss: 0.4334257252323568
Epoch: 2, step: 314, loss: 0.3693675696849823, mean loss: 0.43340572580820835
Epoch: 2, step: 315, loss: 0.3927287757396698, mean loss: 0.4333930301309086
Epoch: 2, step: 316, loss: 0.3681361675262451, mean loss: 0.4333726691753377
Epoch: 2, step: 317, loss: 0.3580969572067261, mean loss: 0.4333491895396644
Epoch: 2, step: 318, loss: 0.349884569644928, mean loss: 0.43332316377730246
Epoch: 2, step: 319, loss: 0.3887750804424286, mean loss: 0.43330927721765944
Epoch: 2, step: 320, loss: 0.4415335953235626, mean loss: 0.4333118401089358
Epoch: 2, step: 321, loss: 0.3706037104129791, mean loss: 0.43329230486603987
Epoch: 2, step: 322, loss: 0.33168408274650574, mean loss: 0.43326066107216893
Epoch: 2, step: 323, loss: 0.37871187925338745, mean loss: 0.4332436782633835
Epoch: 2, step: 324, loss: 0.3702322840690613, mean loss: 0.4332240668739673
Epoch: 2, step: 325, loss: 0.3756677210330963, mean loss: 0.4332061588634381
Epoch: 2, step: 326, loss: 0.45956864953041077, mean loss: 0.4332143587050141
Epoch: 2, step: 327, loss: 0.3427751660346985, mean loss: 0.4331862370655022
Epoch: 2, step: 328, loss: 0.4156607389450073, mean loss: 0.43318078928865406
Epoch: 2, step: 329, loss: 0.3390905559062958, mean loss: 0.43315155055857874
Epoch: 2, step: 330, loss: 0.36738309264183044, mean loss: 0.43313111922651387
Epoch: 2, step: 331, loss: 0.3548958897590637, mean loss: 0.43310682257139976
Epoch: 2, step: 332, loss: 0.4538570046424866, mean loss: 0.4331132647266531
Epoch: 2, step: 333, loss: 0.39714953303337097, mean loss: 0.4331021027987533
Epoch: 2, step: 334, loss: 0.34181728959083557, mean loss: 0.43307377986570705
Epoch: 2, step: 335, loss: 0.42434370517730713, mean loss: 0.4330710720261635
Epoch: 2, step: 336, loss: 0.36068812012672424, mean loss: 0.43304862769999314
Epoch: 2, step: 337, loss: 0.3708434998989105, mean loss: 0.4330293452673208
Epoch: 2, step: 338, loss: 0.39373502135276794, mean loss: 0.4330171685322992
Epoch: 2, step: 339, loss: 0.3939228951931, mean loss: 0.43300505754303675
Epoch: 2, step: 340, loss: 0.408477783203125, mean loss: 0.4329974616079671
Epoch: 2, step: 341, loss: 0.4221455156803131, mean loss: 0.4329941018723858
Epoch: 2, step: 342, loss: 0.40079009532928467, mean loss: 0.43298413467754115
Epoch: 2, step: 343, loss: 0.387365460395813, mean loss: 0.43297001998871637
Epoch: 2, step: 344, loss: 0.3706205189228058, mean loss: 0.43295073464969197
Epoch: 2, step: 345, loss: 0.417756587266922, mean loss: 0.43294603639756374
Epoch: 2, step: 346, loss: 0.419541597366333, mean loss: 0.43294189283062984
Epoch: 2, step: 347, loss: 0.351433128118515, mean loss: 0.4329167047080365
Epoch: 2, step: 348, loss: 0.364362895488739, mean loss: 0.4328955265155066
Epoch: 2, step: 349, loss: 0.3643219769001007, mean loss: 0.43287434876701514
Epoch: 2, step: 350, loss: 0.34898996353149414, mean loss: 0.4328484505313759
Epoch: 2, step: 351, loss: 0.4002227187156677, mean loss: 0.4328383808610624
Epoch: 2, step: 352, loss: 0.3958900570869446, mean loss: 0.4328269805760349
Epoch: 2, step: 353, loss: 0.36162376403808594, mean loss: 0.4328050178318838
Epoch: 2, step: 354, loss: 0.3583928942680359, mean loss: 0.4327820723728755
Epoch: 2, step: 355, loss: 0.3672122061252594, mean loss: 0.4327618597137363
Epoch: 2, step: 356, loss: 0.36946842074394226, mean loss: 0.4327423548018812
Epoch: 2, step: 357, loss: 0.3747466504573822, mean loss: 0.4327244879798404
Epoch: 2, step: 358, loss: 0.33533918857574463, mean loss: 0.4326944955870458
Epoch: 2, step: 359, loss: 0.4109087884426117, mean loss: 0.43268778816489545
Epoch: 2, step: 360, loss: 0.3783271908760071, mean loss: 0.43267105667911865
Epoch: 2, step: 361, loss: 0.3612743318080902, mean loss: 0.4326490884560814
Epoch: 2, step: 362, loss: 0.37824171781539917, mean loss: 0.4326323528760627
Epoch: 2, step: 363, loss: 0.4234081208705902, mean loss: 0.4326295163963562
Epoch: 2, step: 364, loss: 0.3649649918079376, mean loss: 0.43260871574323956
Epoch: 2, step: 365, loss: 0.378726989030838, mean loss: 0.43259215713023635
Epoch: 2, step: 366, loss: 0.3874814212322235, mean loss: 0.43257829822519855
Epoch: 2, step: 367, loss: 0.3827682435512543, mean loss: 0.4325630002968589
Epoch: 2, step: 368, loss: 0.3544154167175293, mean loss: 0.4325390065653332
Epoch: 2, step: 369, loss: 0.34868741035461426, mean loss: 0.43251326942714696
Epoch: 2, step: 370, loss: 0.3626425862312317, mean loss: 0.4324918301257674
Epoch: 2, step: 371, loss: 0.342942476272583, mean loss: 0.4324643609988186
Epoch: 2, step: 372, loss: 0.36877796053886414, mean loss: 0.4324448312838661
Epoch: 2, step: 373, loss: 0.46456897258758545, mean loss: 0.4324546792732296
Epoch: 2, step: 374, loss: 0.3583095371723175, mean loss: 0.432431956275344
Epoch: 2, step: 375, loss: 0.42477771639823914, mean loss: 0.43242961122636203
Epoch: 2, step: 376, loss: 0.34812596440315247, mean loss: 0.43240379081385877
Epoch: 2, step: 377, loss: 0.3590780198574066, mean loss: 0.4323813395673932
Epoch: 2, step: 378, loss: 0.37825435400009155, mean loss: 0.4323647717726068
Epoch: 2, step: 379, loss: 0.334744393825531, mean loss: 0.43233490017592774
Epoch: 2, step: 380, loss: 0.35034385323524475, mean loss: 0.43230981879111874
Epoch: 2, step: 381, loss: 0.37901508808135986, mean loss: 0.4322935207083329
Epoch: 2, step: 382, loss: 0.3939038813114166, mean loss: 0.43228178434654846
Epoch: 2, step: 383, loss: 0.3914434313774109, mean loss: 0.43226930318732804
Epoch: 2, step: 384, loss: 0.38986262679100037, mean loss: 0.43225634667147217
Epoch: 2, step: 385, loss: 0.3622627258300781, mean loss: 0.4322349680456807
Epoch: 2, step: 386, loss: 0.40956932306289673, mean loss: 0.43222804723805236
Epoch: 2, step: 387, loss: 0.37042737007141113, mean loss: 0.4322091825624826
Epoch: 2, step: 388, loss: 0.379244327545166, mean loss: 0.432193019957961
Epoch: 2, step: 389, loss: 0.3459204435348511, mean loss: 0.43216670129523277
Epoch: 2, step: 390, loss: 0.3802570104598999, mean loss: 0.4321508703434684
Epoch: 2, step: 391, loss: 0.3728405833244324, mean loss: 0.43213278793888943
Epoch: 2, step: 392, loss: 0.3534013330936432, mean loss: 0.432108791762466
Epoch: 2, step: 393, loss: 0.39583921432495117, mean loss: 0.43209774070291773
Epoch: 2, step: 394, loss: 0.3663853108882904, mean loss: 0.43207772473282496
Epoch: 2, step: 395, loss: 0.3923490047454834, mean loss: 0.43206562707144025
Epoch: 2, step: 396, loss: 0.3899918496608734, mean loss: 0.4320528192244355
Epoch: 2, step: 397, loss: 0.3954431116580963, mean loss: 0.43204167810831673
Epoch: 2, step: 398, loss: 0.36416640877723694, mean loss: 0.43202102849793306
Epoch: 2, step: 399, loss: 0.4012448489665985, mean loss: 0.43201166834600746
Epoch: 2, step: 400, loss: 0.33752864599227905, mean loss: 0.43198294137052745
Epoch: 2, step: 401, loss: 0.4221208095550537, mean loss: 0.4319799437620729
Epoch: 2, step: 402, loss: 0.36618244647979736, mean loss: 0.4319599505997264
Epoch: 2, step: 403, loss: 0.3573324978351593, mean loss: 0.4319372812641357
Epoch: 2, step: 404, loss: 0.4218912720680237, mean loss: 0.43193423054770813
Epoch: 2, step: 405, loss: 0.3386785387992859, mean loss: 0.43190591977304255
Epoch: 2, step: 406, loss: 0.3681256175041199, mean loss: 0.4318865630803964
Epoch: 2, step: 407, loss: 0.40563443303108215, mean loss: 0.4318785982351145
Epoch: 2, step: 408, loss: 0.38655346632003784, mean loss: 0.43186485084903165
Epoch: 2, step: 409, loss: 0.3721238672733307, mean loss: 0.43184673654230765
Epoch: 2, step: 410, loss: 0.3463350832462311, mean loss: 0.43182081606540673
Epoch: 2, step: 411, loss: 0.3842019736766815, mean loss: 0.43180638611316774
Epoch: 2, step: 412, loss: 0.35320231318473816, mean loss: 0.43178257391294705
Epoch: 2, step: 413, loss: 0.36858391761779785, mean loss: 0.4317634344046808
Epoch: 2, step: 414, loss: 0.44590768218040466, mean loss: 0.4317677166474225
Epoch: 2, step: 415, loss: 0.37447312474250793, mean loss: 0.431750375669243
Epoch: 2, step: 416, loss: 0.417379766702652, mean loss: 0.4317460275273469
Epoch: 2, step: 417, loss: 0.33938297629356384, mean loss: 0.43171808952031915
Epoch: 2, step: 418, loss: 0.3778470754623413, mean loss: 0.4317017995251398
Epoch: 2, step: 419, loss: 0.39333581924438477, mean loss: 0.4316902015867236
Epoch: 2, step: 420, loss: 0.3886319100856781, mean loss: 0.4316771891081799
Epoch: 2, step: 421, loss: 0.40933284163475037, mean loss: 0.43167043855003084
Epoch: 2, step: 422, loss: 0.32303401827812195, mean loss: 0.4316376277918696
Epoch: 2, step: 423, loss: 0.34433019161224365, mean loss: 0.4316112668509941
Epoch: 2, step: 424, loss: 0.3921665549278259, mean loss: 0.43159936081057054
Epoch: 2, step: 425, loss: 0.3792605400085449, mean loss: 0.4315835675634969
Epoch: 2, step: 426, loss: 0.4290345311164856, mean loss: 0.4315827986233922
Epoch: 2, step: 427, loss: 0.356787770986557, mean loss: 0.43156024282494926
Epoch: 2, step: 428, loss: 0.4213296175003052, mean loss: 0.43155715852427856
Epoch: 2, step: 429, loss: 0.3752860426902771, mean loss: 0.4315401991765287
Epoch: 2, step: 430, loss: 0.41303905844688416, mean loss: 0.43153462486476923
Epoch: 2, step: 431, loss: 0.3440002501010895, mean loss: 0.431508259089238
Epoch: 2, step: 432, loss: 0.37511494755744934, mean loss: 0.4314912782667352
Epoch: 2, step: 433, loss: 0.3691670298576355, mean loss: 0.4314725172046012
Epoch: 2, step: 434, loss: 0.327812522649765, mean loss: 0.43144132250265876
Epoch: 2, step: 435, loss: 0.34611180424690247, mean loss: 0.43141565176912816
Epoch: 2, step: 436, loss: 0.40379783511161804, mean loss: 0.43140734565885525
Epoch: 2, step: 437, loss: 0.3740677833557129, mean loss: 0.43139010586261256
Epoch: 2, step: 438, loss: 0.4029228985309601, mean loss: 0.4313815494432162
Epoch: 2, step: 439, loss: 0.3492544889450073, mean loss: 0.43135687184090304
Epoch: 2, step: 440, loss: 0.4365464448928833, mean loss: 0.4313584307393867
Epoch: 2, step: 441, loss: 0.38121339678764343, mean loss: 0.4313433721706324
Epoch: 2, step: 442, loss: 0.3536975681781769, mean loss: 0.4313200621123939
Epoch: 2, step: 443, loss: 0.36004212498664856, mean loss: 0.431298670174481
Epoch: 2, step: 444, loss: 0.38780829310417175, mean loss: 0.4312856217565181
Epoch: 2, step: 445, loss: 0.42537468671798706, mean loss: 0.43128384883059173
Epoch: 2, step: 446, loss: 0.3694706857204437, mean loss: 0.4312653141489995
Epoch: 2, step: 447, loss: 0.4179582893848419, mean loss: 0.4312613252327033
Epoch: 2, step: 448, loss: 0.39235445857048035, mean loss: 0.4312496659978629
Epoch: 2, step: 449, loss: 0.416708767414093, mean loss: 0.4312453098269271
Epoch: 2, step: 450, loss: 0.41798388957977295, mean loss: 0.43124133815269916
Epoch: 2, step: 451, loss: 0.40042272210121155, mean loss: 0.4312321110221448
Epoch: 2, step: 452, loss: 0.3706722855567932, mean loss: 0.43121398476489686
Epoch: 2, step: 453, loss: 0.38115188479423523, mean loss: 0.431199005082081
Epoch: 2, step: 454, loss: 0.34272751212120056, mean loss: 0.43117254038182345
Epoch: 2, step: 455, loss: 0.3540448546409607, mean loss: 0.431149475882499
Epoch: 2, step: 456, loss: 0.3967621326446533, mean loss: 0.43113919566030534
Epoch: 2, step: 457, loss: 0.3587408661842346, mean loss: 0.43111755838311583
Epoch: 2, step: 458, loss: 0.4157375395298004, mean loss: 0.4311129632176383
Epoch: 2, step: 459, loss: 0.3728916049003601, mean loss: 0.4310955733256678
Epoch: 2, step: 460, loss: 0.38939979672431946, mean loss: 0.4310831231087071
Epoch: 2, step: 461, loss: 0.3739233613014221, mean loss: 0.43106606049324225
Epoch: 2, step: 462, loss: 0.39480942487716675, mean loss: 0.4310552408466842
Epoch: 2, step: 463, loss: 0.4210129678249359, mean loss: 0.43105224494184474
Epoch: 2, step: 464, loss: 0.36473897099494934, mean loss: 0.4310324676457079
Epoch: 2, step: 465, loss: 0.3525811433792114, mean loss: 0.43100907726876503
Epoch: 2, step: 466, loss: 0.3759098947048187, mean loss: 0.4309926542635299
Epoch: 2, step: 467, loss: 0.376396507024765, mean loss: 0.4309763860432561
Epoch: 2, step: 468, loss: 0.39733609557151794, mean loss: 0.43096636510477776
Epoch: 2, step: 469, loss: 0.34887397289276123, mean loss: 0.43094191829351747
Epoch: 2, step: 470, loss: 0.37400323152542114, mean loss: 0.4309249672108238
Epoch: 2, step: 471, loss: 0.32284995913505554, mean loss: 0.43089280202984886
Epoch: 2, step: 472, loss: 0.3673480749130249, mean loss: 0.43087389553561595
Epoch: 2, step: 473, loss: 0.3567546606063843, mean loss: 0.4308518493622283
Epoch: 2, step: 474, loss: 0.3908320665359497, mean loss: 0.4308399493375996
Epoch: 2, step: 475, loss: 0.3885353207588196, mean loss: 0.43082737364539425
Epoch: 2, step: 476, loss: 0.41272225975990295, mean loss: 0.43082199322522025
Epoch: 2, step: 477, loss: 0.4008452892303467, mean loss: 0.43081308749022473
Epoch: 2, step: 478, loss: 0.37549030780792236, mean loss: 0.4307966566082282
Epoch: 2, step: 479, loss: 0.35747626423835754, mean loss: 0.4307748868955293
Epoch: 2, step: 480, loss: 0.38683757185935974, mean loss: 0.43076184524666133
Epoch: 2, step: 481, loss: 0.34431204199790955, mean loss: 0.4307361924860534
Epoch: 2, step: 482, loss: 0.3605765104293823, mean loss: 0.4307153797651822
Epoch: 2, step: 483, loss: 0.4238903820514679, mean loss: 0.4307133557445079
Epoch: 2, step: 484, loss: 0.37842273712158203, mean loss: 0.4306978530410917
Epoch: 2, step: 485, loss: 0.3968512713909149, mean loss: 0.43068782145198375
Epoch: 2, step: 486, loss: 0.34308117628097534, mean loss: 0.4306618639274886
Epoch: 2, step: 487, loss: 0.3821139633655548, mean loss: 0.43064748362518945
Epoch: 2, step: 488, loss: 0.3486427962779999, mean loss: 0.43062320033015034
Epoch: 2, step: 489, loss: 0.37492865324020386, mean loss: 0.43060671289761926
Epoch: 2, step: 490, loss: 0.375238299369812, mean loss: 0.4305903268622455
Epoch: 2, step: 491, loss: 0.3689076602458954, mean loss: 0.4305720775525957
Epoch: 2, step: 492, loss: 0.33368319272994995, mean loss: 0.430543420680421
Epoch: 2, step: 493, loss: 0.37079936265945435, mean loss: 0.43052575537645266
Epoch: 2, step: 494, loss: 0.4516872465610504, mean loss: 0.4305320106206692
Epoch: 2, step: 495, loss: 0.35279524326324463, mean loss: 0.4305090387627031
Epoch: 2, step: 496, loss: 0.39312607049942017, mean loss: 0.4304979950497745
Epoch: 2, step: 497, loss: 0.37879568338394165, mean loss: 0.4304827256133699
Epoch: 2, step: 498, loss: 0.387144535779953, mean loss: 0.43046993016316815
Epoch: 2, step: 499, loss: 0.4244943857192993, mean loss: 0.4304681664251387
Epoch: 2, step: 500, loss: 0.41366755962371826, mean loss: 0.43046320903157087
Epoch: 2, step: 501, loss: 0.3789125680923462, mean loss: 0.43044800235282776
Epoch: 2, step: 502, loss: 0.3410702645778656, mean loss: 0.43042164501346625
Epoch: 2, step: 503, loss: 0.38443395495414734, mean loss: 0.4304080873218214
Epoch: 2, step: 504, loss: 0.39029204845428467, mean loss: 0.4303962641450258
Epoch: 2, step: 505, loss: 0.36043262481689453, mean loss: 0.4303756502265437
Epoch: 2, step: 506, loss: 0.37879735231399536, mean loss: 0.4303604577971144
Epoch: 2, step: 507, loss: 0.3803156018257141, mean loss: 0.43034572138487315
Epoch: 2, step: 508, loss: 0.38851144909858704, mean loss: 0.430333406320909
Epoch: 2, step: 509, loss: 0.3693135678768158, mean loss: 0.4303154487463227
Epoch: 2, step: 510, loss: 0.34555014967918396, mean loss: 0.43029051044121325
Epoch: 2, step: 511, loss: 0.3929496705532074, mean loss: 0.4302795278412462
Epoch: 2, step: 512, loss: 0.37866753339767456, mean loss: 0.4302643523062731
Epoch: 2, step: 513, loss: 0.3574706017971039, mean loss: 0.4302429549663233
Epoch: 2, step: 514, loss: 0.368038535118103, mean loss: 0.43022467567750516
Epoch: 2, step: 515, loss: 0.35994136333465576, mean loss: 0.43020402840595906
Epoch: 2, step: 516, loss: 0.46675899624824524, mean loss: 0.4302147640793342
Epoch: 2, step: 517, loss: 0.3819248378276825, mean loss: 0.43020058617967133
Epoch: 2, step: 518, loss: 0.3388062119483948, mean loss: 0.4301737607102756
Epoch: 2, step: 519, loss: 0.34298449754714966, mean loss: 0.43014817700629576
Epoch: 2, step: 520, loss: 0.40103664994239807, mean loss: 0.43013963739730077
Epoch: 2, step: 521, loss: 0.4271606504917145, mean loss: 0.43013876379410265
Epoch: 2, step: 522, loss: 0.3864792585372925, mean loss: 0.43012596417368143
Epoch: 2, step: 523, loss: 0.3832463324069977, mean loss: 0.4301122245395177
Epoch: 2, step: 524, loss: 0.36817115545272827, mean loss: 0.4300940759696124
Epoch: 2, step: 525, loss: 0.34138184785842896, mean loss: 0.43006809113419614
Epoch: 2, step: 526, loss: 0.3589976727962494, mean loss: 0.4300472798843168
Epoch: 2, step: 527, loss: 0.3600039482116699, mean loss: 0.4300267753961222
Epoch: 2, step: 528, loss: 0.375078946352005, mean loss: 0.43001069467354563
Epoch: 2, step: 529, loss: 0.39098209142684937, mean loss: 0.4299992761237368
Epoch: 2, step: 530, loss: 0.38404110074043274, mean loss: 0.4299858341303518
Epoch: 2, step: 531, loss: 0.3434160053730011, mean loss: 0.4299605213149257
Epoch: 2, step: 532, loss: 0.34708142280578613, mean loss: 0.42993629474418343
Epoch: 2, step: 533, loss: 0.34357091784477234, mean loss: 0.42991105646922745
Epoch: 2, step: 534, loss: 0.3625810742378235, mean loss: 0.42989138659419635
Epoch: 2, step: 535, loss: 0.37405067682266235, mean loss: 0.4298750779756883
Epoch: 2, step: 536, loss: 0.44909510016441345, mean loss: 0.4298806896609989
Epoch: 2, step: 537, loss: 0.4207965135574341, mean loss: 0.42987803812098035
Epoch: 2, step: 538, loss: 0.3742804229259491, mean loss: 0.4298618147141537
Epoch: 2, step: 539, loss: 0.37339362502098083, mean loss: 0.42984534208005415
Epoch: 2, step: 540, loss: 0.3635445833206177, mean loss: 0.42982600677566235
Epoch: 2, step: 541, loss: 0.3316974937915802, mean loss: 0.42979739787974863
Epoch: 2, step: 542, loss: 0.3792625367641449, mean loss: 0.4297826689782285
Epoch: 2, step: 543, loss: 0.3339652121067047, mean loss: 0.4297547501388137
Epoch: 2, step: 544, loss: 0.3437718451023102, mean loss: 0.4297297041425898
Epoch: 2, step: 545, loss: 0.36438265442848206, mean loss: 0.4297106747163481
Epoch: 2, step: 546, loss: 0.3674624264240265, mean loss: 0.4296925529555643
Epoch: 2, step: 547, loss: 0.351600706577301, mean loss: 0.4296698254100526
Epoch: 2, step: 548, loss: 0.32479289174079895, mean loss: 0.4296393113182082
Epoch: 2, step: 549, loss: 0.38518550992012024, mean loss: 0.4296263811840028
Epoch: 2, step: 550, loss: 0.4097345173358917, mean loss: 0.4296205969839888
Epoch: 2, step: 551, loss: 0.41180741786956787, mean loss: 0.42961541873424625
Epoch: 2, step: 552, loss: 0.3963635265827179, mean loss: 0.4296057552956669
Epoch: 2, step: 553, loss: 0.3574526309967041, mean loss: 0.42958479273776484
Epoch: 2, step: 554, loss: 0.40368780493736267, mean loss: 0.4295772711032018
Epoch: 2, step: 555, loss: 0.37736988067626953, mean loss: 0.42956211216289203
Epoch: 2, step: 556, loss: 0.3232555389404297, mean loss: 0.42953125394134706
Epoch: 2, step: 557, loss: 0.4163926839828491, mean loss: 0.429527441239676
Epoch: 2, step: 558, loss: 0.371896356344223, mean loss: 0.4295107220389521
Epoch: 2, step: 559, loss: 0.37316200137138367, mean loss: 0.4294943796025636
Epoch: 2, step: 560, loss: 0.3670981526374817, mean loss: 0.4294762884958761
Epoch: 2, step: 561, loss: 0.35701340436935425, mean loss: 0.4294552847613467
Epoch: 2, step: 562, loss: 0.34852463006973267, mean loss: 0.4294318333980631
Epoch: 2, step: 563, loss: 0.4232955276966095, mean loss: 0.42943005578922727
Epoch: 2, step: 564, loss: 0.4341985881328583, mean loss: 0.429431436771661
Epoch: 2, step: 565, loss: 0.4149912893772125, mean loss: 0.4294272560688832
Epoch: 2, step: 566, loss: 0.37013334035873413, mean loss: 0.42941009429877897
Epoch: 2, step: 567, loss: 0.4560866355895996, mean loss: 0.42941781320540245
Epoch: 2, step: 568, loss: 0.35133376717567444, mean loss: 0.4293952259777398
Epoch: 2, step: 569, loss: 0.35938888788223267, mean loss: 0.4293749812298811
Epoch: 2, step: 570, loss: 0.3858117461204529, mean loss: 0.42936238705956903
Epoch: 2, step: 571, loss: 0.35306546092033386, mean loss: 0.4293403359248467
Epoch: 2, step: 572, loss: 0.38365647196769714, mean loss: 0.4293271363108747
Epoch: 2, step: 573, loss: 0.426945298910141, mean loss: 0.4293264483162471
Epoch: 2, step: 574, loss: 0.39856815338134766, mean loss: 0.4293175663367684
Epoch: 2, step: 575, loss: 0.3739253282546997, mean loss: 0.42930157550591325
Epoch: 2, step: 576, loss: 0.3632088601589203, mean loss: 0.42928250112918975
Epoch: 2, step: 577, loss: 0.37927666306495667, mean loss: 0.42926807359368363
Epoch: 2, step: 578, loss: 0.37608081102371216, mean loss: 0.4292527325891927
Epoch: 2, step: 579, loss: 0.39071768522262573, mean loss: 0.42924162098383906
Epoch: 2, step: 580, loss: 0.35098007321357727, mean loss: 0.4292190607221584
Epoch: 2, step: 581, loss: 0.38487929105758667, mean loss: 0.4292062826905548
Epoch: 2, step: 582, loss: 0.36996495723724365, mean loss: 0.4291892151810609
Epoch: 2, step: 583, loss: 0.374291330575943, mean loss: 0.42917340357835204
Epoch: 2, step: 584, loss: 0.3501138389110565, mean loss: 0.4291506395228763
Epoch: 2, step: 585, loss: 0.3654900789260864, mean loss: 0.4291323146637523
Epoch: 2, step: 586, loss: 0.3822097182273865, mean loss: 0.42911881175830296
Epoch: 2, step: 587, loss: 0.3820168077945709, mean loss: 0.42910526112425124
Epoch: 2, step: 588, loss: 0.41106969118118286, mean loss: 0.42910007401756645
Epoch: 2, step: 589, loss: 0.3660971224308014, mean loss: 0.42908195931038223
Epoch: 2, step: 590, loss: 0.36139631271362305, mean loss: 0.4290625038212771
Epoch: 2, step: 591, loss: 0.3934556245803833, mean loss: 0.42905227195942625
Epoch: 2, step: 592, loss: 0.38051697611808777, mean loss: 0.4290383290419194
Epoch: 2, step: 593, loss: 0.4037635326385498, mean loss: 0.42903107034105686
Epoch: 2, step: 594, loss: 0.3589875102043152, mean loss: 0.4290109602175608
Epoch: 2, step: 595, loss: 0.3859208822250366, mean loss: 0.42899859222732184
Epoch: 2, step: 596, loss: 0.3540891110897064, mean loss: 0.4289770973977271
Epoch: 2, step: 597, loss: 0.36700841784477234, mean loss: 0.4289593209549408
Epoch: 2, step: 598, loss: 0.3651334345340729, mean loss: 0.4289410170012784
Epoch: 2, step: 599, loss: 0.37766772508621216, mean loss: 0.4289263170896055
Epoch: 2, step: 600, loss: 0.3978835642337799, mean loss: 0.42891741976863795
Epoch: 2, step: 601, loss: 0.421418696641922, mean loss: 0.42891527113736955
Epoch: 2, step: 602, loss: 0.4255312383174896, mean loss: 0.42891430177821177
Epoch: 2, step: 603, loss: 0.3496335744857788, mean loss: 0.4288915982480593
Epoch: 2, step: 604, loss: 0.37507158517837524, mean loss: 0.4288761902855429
Epoch: 2, step: 605, loss: 0.36104467511177063, mean loss: 0.4288567765719843
Epoch: 2, step: 606, loss: 0.35132747888565063, mean loss: 0.42883459365419135
Epoch: 2, step: 607, loss: 0.3735973834991455, mean loss: 0.42881879353687014
Epoch: 2, step: 608, loss: 0.4514097273349762, mean loss: 0.4288252536266037
Epoch: 2, step: 609, loss: 0.3752354085445404, mean loss: 0.42880993348792956
Epoch: 2, step: 610, loss: 0.386593759059906, mean loss: 0.42879786827660404
Epoch: 2, step: 611, loss: 0.34433579444885254, mean loss: 0.4287737362555104
Epoch: 2, step: 612, loss: 0.3765151798725128, mean loss: 0.42875880950418704
Epoch: 2, step: 613, loss: 0.34568923711776733, mean loss: 0.4287350888952817
Epoch: 2, step: 614, loss: 0.36232659220695496, mean loss: 0.4287161312884623
Epoch: 2, step: 615, loss: 0.4604772925376892, mean loss: 0.4287251955468097
Epoch: 2, step: 616, loss: 0.40349552035331726, mean loss: 0.42871799735131944
Epoch: 2, step: 617, loss: 0.3521764576435089, mean loss: 0.42869616576555
Epoch: 2, step: 618, loss: 0.3873480260372162, mean loss: 0.4286843755916896
Epoch: 2, step: 619, loss: 0.3431863486766815, mean loss: 0.4286600032921129
Epoch: 2, step: 620, loss: 0.3532036542892456, mean loss: 0.4286384996303851
Epoch: 2, step: 621, loss: 0.3942889869213104, mean loss: 0.4286287134444281
Epoch: 2, step: 622, loss: 0.3436852693557739, mean loss: 0.4286045199257472
Epoch: 2, step: 623, loss: 0.3494453728199005, mean loss: 0.4285819803052729
Epoch: 2, step: 624, loss: 0.4038369655609131, mean loss: 0.4285749364638996
Epoch: 2, step: 625, loss: 0.3438906669616699, mean loss: 0.42855083735476407
Epoch: 2, step: 626, loss: 0.3843635320663452, mean loss: 0.42853826628640324
Epoch: 2, step: 627, loss: 0.38548311591148376, mean loss: 0.4285260207942602
Epoch: 2, step: 628, loss: 0.3631468415260315, mean loss: 0.4285074313204848
Epoch: 2, step: 629, loss: 0.3737885653972626, mean loss: 0.4284918773506374
Epoch: 2, step: 630, loss: 0.35479339957237244, mean loss: 0.4284709343333659
Epoch: 2, step: 631, loss: 0.34973379969596863, mean loss: 0.42844856582920754
Epoch: 2, step: 632, loss: 0.37433236837387085, mean loss: 0.4284331962758263
Epoch: 2, step: 633, loss: 0.4190514087677002, mean loss: 0.42843053250878826
Epoch: 2, step: 634, loss: 0.36115115880966187, mean loss: 0.4284114353263588
Epoch: 2, step: 635, loss: 0.35137709975242615, mean loss: 0.4283895754127453
Epoch: 2, step: 636, loss: 0.38883358240127563, mean loss: 0.42837835385444417
Epoch: 2, step: 637, loss: 0.3490583002567291, mean loss: 0.42835585809335575
Epoch: 2, step: 638, loss: 0.36544883251190186, mean loss: 0.4283380222482802
Epoch: 2, step: 639, loss: 0.4502347707748413, mean loss: 0.42834422880965395
Epoch: 2, step: 640, loss: 0.34483450651168823, mean loss: 0.42832056496088716
Epoch: 2, step: 641, loss: 0.3410773277282715, mean loss: 0.42829585016280425
Epoch: 2, step: 642, loss: 0.4133130609989166, mean loss: 0.4282916069486542
Epoch: 2, step: 643, loss: 0.3933665454387665, mean loss: 0.42828171876589377
Epoch: 2, step: 644, loss: 0.37057527899742126, mean loss: 0.4282653852137374
Epoch: 2, step: 645, loss: 0.3840062618255615, mean loss: 0.42825286140972263
Epoch: 2, step: 646, loss: 0.34887629747390747, mean loss: 0.4282304069361906
Epoch: 2, step: 647, loss: 0.3611811399459839, mean loss: 0.4282114450394173
Epoch: 2, step: 648, loss: 0.3690823018550873, mean loss: 0.42819472772440903
Epoch: 2, step: 649, loss: 0.35228630900382996, mean loss: 0.42817327254670395
Epoch: 2, step: 650, loss: 0.40607380867004395, mean loss: 0.42816702799630085
Epoch: 2, step: 651, loss: 0.3659457564353943, mean loss: 0.4281494513659164
Epoch: 2, step: 652, loss: 0.3724481165409088, mean loss: 0.4281337209691853
Epoch: 2, step: 653, loss: 0.3564774990081787, mean loss: 0.4281134905282025
Epoch: 2, step: 654, loss: 0.3690541386604309, mean loss: 0.4280968212220022
Epoch: 2, step: 655, loss: 0.3236420750617981, mean loss: 0.4280673475351624
Epoch: 2, step: 656, loss: 0.3304811716079712, mean loss: 0.428039819699922
Epoch: 2, step: 657, loss: 0.3763224184513092, mean loss: 0.4280252349843979
Epoch: 2, step: 658, loss: 0.354420006275177, mean loss: 0.4280044835807584
Epoch: 2, step: 659, loss: 0.4121025800704956, mean loss: 0.4280000016462854
Epoch: 2, step: 660, loss: 0.35164299607276917, mean loss: 0.427978486570046
Epoch: 2, step: 661, loss: 0.3515472114086151, mean loss: 0.4279569566333808
Epoch: 2, step: 662, loss: 0.43359729647636414, mean loss: 0.4279585450140744
Epoch: 2, step: 663, loss: 0.32907262444496155, mean loss: 0.42793070550940965
Epoch: 2, step: 664, loss: 0.3599945604801178, mean loss: 0.4279115847255568
Epoch: 2, step: 665, loss: 0.35284098982810974, mean loss: 0.42789046187949675
Epoch: 2, step: 666, loss: 0.34963753819465637, mean loss: 0.4278684498053238
Epoch: 2, step: 667, loss: 0.3469008207321167, mean loss: 0.4278456805058094
Epoch: 2, step: 668, loss: 0.4481540322303772, mean loss: 0.4278513899102864
Epoch: 2, step: 669, loss: 0.3600119948387146, mean loss: 0.4278323231887935
Epoch: 2, step: 670, loss: 0.3921346664428711, mean loss: 0.4278222929396376
Epoch: 2, step: 671, loss: 0.34791308641433716, mean loss: 0.42779984653331027
Epoch: 2, step: 672, loss: 0.37443801760673523, mean loss: 0.4277848614648108
Epoch: 2, step: 673, loss: 0.4040515422821045, mean loss: 0.4277781985453322
Epoch: 2, step: 674, loss: 0.39677730202674866, mean loss: 0.4277694977604547
Epoch: 2, step: 675, loss: 0.38764694333076477, mean loss: 0.42775824002913326
Epoch: 2, step: 676, loss: 0.3507111966609955, mean loss: 0.4277366279552572
Epoch: 2, step: 677, loss: 0.3806029260158539, mean loss: 0.4277234104280728
Epoch: 2, step: 678, loss: 0.34320375323295593, mean loss: 0.42769971554239994
Epoch: 2, step: 679, loss: 0.363978773355484, mean loss: 0.4276818565339395
Epoch: 2, step: 680, loss: 0.3772088587284088, mean loss: 0.4276677144779559
Epoch: 2, step: 681, loss: 0.4021201729774475, mean loss: 0.4276605583038661
Epoch: 2, step: 682, loss: 0.36442193388938904, mean loss: 0.4276428493639573
Epoch: 2, step: 683, loss: 0.3934735357761383, mean loss: 0.42763328348669305
Epoch: 2, step: 684, loss: 0.35721540451049805, mean loss: 0.42761357515224685
Epoch: 2, step: 685, loss: 0.40261489152908325, mean loss: 0.427606580556941
Epoch: 2, step: 686, loss: 0.38062167167663574, mean loss: 0.42759343792508636
Epoch: 2, step: 687, loss: 0.37644311785697937, mean loss: 0.4275791341443067
Epoch: 2, step: 688, loss: 0.40661296248435974, mean loss: 0.42757327276000145
Epoch: 2, step: 689, loss: 0.3657098710536957, mean loss: 0.4275559828210114
Epoch: 2, step: 690, loss: 0.3619273900985718, mean loss: 0.4275376456897674
Epoch: 2, step: 691, loss: 0.35218459367752075, mean loss: 0.42751659735121644
Epoch: 2, step: 692, loss: 0.42976370453834534, mean loss: 0.4275172248595066
Epoch: 2, step: 693, loss: 0.34713393449783325, mean loss: 0.42749478396325824
Epoch: 2, step: 694, loss: 0.3744106590747833, mean loss: 0.4274799684106798
Epoch: 2, step: 695, loss: 0.36519506573677063, mean loss: 0.42746258981060337
Epoch: 2, step: 696, loss: 0.4030593931674957, mean loss: 0.42745578278225105
Epoch: 2, step: 697, loss: 0.37717628479003906, mean loss: 0.4274417617287117
Epoch: 2, step: 698, loss: 0.37822508811950684, mean loss: 0.42742804088298847
Epoch: 2, step: 699, loss: 0.4083598256111145, mean loss: 0.42742272644171986
Epoch: 2, step: 700, loss: 0.3477090001106262, mean loss: 0.4274005158743387
Epoch: 2, step: 701, loss: 0.4181950092315674, mean loss: 0.4273979516663602
Epoch: 2, step: 702, loss: 0.31517985463142395, mean loss: 0.427366701848194
Epoch: 2, step: 703, loss: 0.388794481754303, mean loss: 0.42735596347957094
Epoch: 2, step: 704, loss: 0.3885160982608795, mean loss: 0.4273451536089284
Epoch: 2, step: 705, loss: 0.36238235235214233, mean loss: 0.4273270782607768
Epoch: 2, step: 706, loss: 0.3566778302192688, mean loss: 0.4273074261750907
Epoch: 2, step: 707, loss: 0.3756249248981476, mean loss: 0.42729305395560324
Epoch: 2, step: 708, loss: 0.3591582775115967, mean loss: 0.42727411184372
Epoch: 2, step: 709, loss: 0.3874935507774353, mean loss: 0.42726305554548033
Epoch: 2, step: 710, loss: 0.43830037117004395, mean loss: 0.4272661223183685
Epoch: 2, step: 711, loss: 0.4131517708301544, mean loss: 0.42726220166517737
Epoch: 2, step: 712, loss: 0.39063093066215515, mean loss: 0.427252029137823
Epoch: 2, step: 713, loss: 0.3701895773410797, mean loss: 0.4272361872578128
Epoch: 2, step: 714, loss: 0.4054506719112396, mean loss: 0.42723014076451654
Epoch: 2, step: 715, loss: 0.4038405120372772, mean loss: 0.4272236508564346
Epoch: 2, step: 716, loss: 0.4093589186668396, mean loss: 0.42721869531352485
Epoch: 2, step: 717, loss: 0.3708116412162781, mean loss: 0.4272030527583121
Epoch: 2, step: 718, loss: 0.38852450251579285, mean loss: 0.4271923295672274
Epoch: 2, step: 719, loss: 0.3810735046863556, mean loss: 0.42717954718782586
Epoch: 2, step: 720, loss: 0.378834992647171, mean loss: 0.427166151633783
Epoch: 2, step: 721, loss: 0.37495848536491394, mean loss: 0.4271516896763678
Epoch: 2, step: 722, loss: 0.34618237614631653, mean loss: 0.4271292667149914
Epoch: 2, step: 723, loss: 0.4618397355079651, mean loss: 0.4271388764793305
Epoch: 2, step: 724, loss: 0.4021415412425995, mean loss: 0.42713195775936463
Epoch: 2, step: 725, loss: 0.3512164056301117, mean loss: 0.4271109517958535
Epoch: 2, step: 726, loss: 0.37300682067871094, mean loss: 0.4270959852312291
Epoch: 2, step: 727, loss: 0.36219322681427, mean loss: 0.427078036459543
Epoch: 2, step: 728, loss: 0.35612714290618896, mean loss: 0.42705842050887854
Epoch: 2, step: 729, loss: 0.3562304973602295, mean loss: 0.4270388439684837
Epoch: 2, step: 730, loss: 0.3570631146430969, mean loss: 0.42701950831517466
Epoch: 2, step: 731, loss: 0.3661300241947174, mean loss: 0.42700268801569385
Epoch: 2, step: 732, loss: 0.36657851934432983, mean loss: 0.4269860008661022
Epoch: 2, step: 733, loss: 0.3474087715148926, mean loss: 0.42696403034447017
Epoch: 2, step: 734, loss: 0.3520899713039398, mean loss: 0.4269433640295266
Epoch: 2, step: 735, loss: 0.3933078944683075, mean loss: 0.4269340827189413
Epoch: 2, step: 736, loss: 0.32759779691696167, mean loss: 0.4269066796056166
Epoch: 2, step: 737, loss: 0.3614201545715332, mean loss: 0.42688861933947375
Epoch: 2, step: 738, loss: 0.38332313299179077, mean loss: 0.4268766079012748
Epoch: 2, step: 739, loss: 0.3328208923339844, mean loss: 0.4268506829521107
Epoch: 2, step: 740, loss: 0.38916951417922974, mean loss: 0.4268402996044191
Epoch: 2, step: 741, loss: 0.47527119517326355, mean loss: 0.4268536414489284
Epoch: 2, step: 742, loss: 0.3308570384979248, mean loss: 0.4268272033869755
Epoch: 2, step: 743, loss: 0.3529732823371887, mean loss: 0.42680686915761157
Epoch: 2, step: 744, loss: 0.3812659978866577, mean loss: 0.4267943338228274
Epoch: 2, step: 745, loss: 0.40987956523895264, mean loss: 0.4267896792359854
Epoch: 2, step: 746, loss: 0.43478551506996155, mean loss: 0.4267918789157196
Epoch: 2, step: 747, loss: 0.39058631658554077, mean loss: 0.4267819213903263
Epoch: 2, step: 748, loss: 0.3613748848438263, mean loss: 0.42676393760243886
Epoch: 2, step: 749, loss: 0.37803196907043457, mean loss: 0.42675054233896115
Epoch: 2, step: 750, loss: 0.36246877908706665, mean loss: 0.4267328776609584
Epoch: 2, step: 751, loss: 0.3740215301513672, mean loss: 0.4267183965215327
Epoch: 2, step: 752, loss: 0.34057530760765076, mean loss: 0.426694737337541
Epoch: 2, step: 753, loss: 0.4243100583553314, mean loss: 0.4266940825657172
Epoch: 2, step: 754, loss: 0.4148796796798706, mean loss: 0.4266908395234757
Epoch: 2, step: 755, loss: 0.3734069764614105, mean loss: 0.42667621716807996
Epoch: 2, step: 756, loss: 0.3669118285179138, mean loss: 0.42665982090233234
Epoch: 2, step: 757, loss: 0.38162410259246826, mean loss: 0.4266474688128343
Epoch: 2, step: 758, loss: 0.37919703125953674, mean loss: 0.4266344579991372
Epoch: 2, step: 759, loss: 0.3604587912559509, mean loss: 0.4266163177396133
Epoch: 2, step: 760, loss: 0.3589780628681183, mean loss: 0.42659778163249584
Epoch: 2, step: 761, loss: 0.3724018335342407, mean loss: 0.4265829334275374
Epoch: 2, step: 762, loss: 0.35598278045654297, mean loss: 0.4265635962177398
Epoch: 2, step: 763, loss: 0.33478185534477234, mean loss: 0.4265384643062193
Epoch: 2, step: 764, loss: 0.391015887260437, mean loss: 0.4265287400858399
Epoch: 2, step: 765, loss: 0.4073597192764282, mean loss: 0.4265234940483989
Epoch: 2, step: 766, loss: 0.39060449600219727, mean loss: 0.42651366668915236
Epoch: 2, step: 767, loss: 0.3712097108364105, mean loss: 0.4264985397865668
Epoch: 2, step: 768, loss: 0.3903425931930542, mean loss: 0.4264886530087179
Epoch: 2, step: 769, loss: 0.3816867172718048, mean loss: 0.4264764053499599
Epoch: 2, step: 770, loss: 0.36450135707855225, mean loss: 0.4264594676488745
Epoch: 2, step: 771, loss: 0.3843165636062622, mean loss: 0.426447953194218
Epoch: 2, step: 772, loss: 0.3658580183982849, mean loss: 0.42643140308911126
Epoch: 2, step: 773, loss: 0.40978625416755676, mean loss: 0.426426857718024
Epoch: 2, step: 774, loss: 0.3892357647418976, mean loss: 0.4264167045394884
Epoch: 2, step: 775, loss: 0.3464517295360565, mean loss: 0.426394880037577
Epoch: 2, step: 776, loss: 0.3835597634315491, mean loss: 0.4263831924204948
Epoch: 2, step: 777, loss: 0.3893515169620514, mean loss: 0.42637309103602716
Epoch: 2, step: 778, loss: 0.38061803579330444, mean loss: 0.4263606135189171
Epoch: 2, step: 779, loss: 0.3535163402557373, mean loss: 0.4263407541205356
Epoch: 2, step: 780, loss: 0.40785786509513855, mean loss: 0.4263357165383537
Epoch: 2, step: 781, loss: 0.35911402106285095, mean loss: 0.426317400000077
Epoch: 2, step: 782, loss: 0.38098660111427307, mean loss: 0.4263050516484328
Epoch: 2, step: 783, loss: 0.33626627922058105, mean loss: 0.4262805312855712
Epoch: 2, step: 784, loss: 0.3799283504486084, mean loss: 0.4262679115793809
Epoch: 2, step: 785, loss: 0.36461544036865234, mean loss: 0.42625113083054833
Epoch: 2, step: 786, loss: 0.36190134286880493, mean loss: 0.4262336206841642
Epoch: 2, step: 787, loss: 0.3481423258781433, mean loss: 0.4262123771328024
Epoch: 2, step: 788, loss: 0.3708246946334839, mean loss: 0.426197313852275
Epoch: 2, step: 789, loss: 0.3677496314048767, mean loss: 0.4261814226933714
Epoch: 2, step: 790, loss: 0.3918797969818115, mean loss: 0.4261720990658336
Epoch: 2, step: 791, loss: 0.37247058749198914, mean loss: 0.42615750626377547
Epoch: 2, step: 792, loss: 0.3603389263153076, mean loss: 0.42613962563895924
Epoch: 2, step: 793, loss: 0.3602082431316376, mean loss: 0.4261217192341501
Epoch: 2, step: 794, loss: 0.4400728940963745, mean loss: 0.42612550722623865
Epoch: 2, step: 795, loss: 0.3602028787136078, mean loss: 0.4261076129188248
Epoch: 2, step: 796, loss: 0.39405661821365356, mean loss: 0.42609891522691024
Epoch: 2, step: 797, loss: 0.41624969244003296, mean loss: 0.4260962431642985
Epoch: 2, step: 798, loss: 0.35948145389556885, mean loss: 0.4260781756868728
Epoch: 2, step: 799, loss: 0.34290528297424316, mean loss: 0.42605562338407654
Epoch: 2, step: 800, loss: 0.3899356424808502, mean loss: 0.426045832117906
Epoch: 2, step: 801, loss: 0.3929453194141388, mean loss: 0.42603686178926
Epoch: 2, step: 802, loss: 0.35676315426826477, mean loss: 0.4260180935130419
Epoch: 2, step: 803, loss: 0.41314423084259033, mean loss: 0.42601460655132184
Epoch: 2, step: 804, loss: 0.376430869102478, mean loss: 0.4260011801398816
Epoch: 2, step: 805, loss: 0.3246282637119293, mean loss: 0.42597373755286805
Epoch: 2, step: 806, loss: 0.3448139727115631, mean loss: 0.4259517727991898
Epoch: 2, step: 807, loss: 0.3410223126411438, mean loss: 0.425928794049147
Epoch: 2, step: 808, loss: 0.3924664855003357, mean loss: 0.425919742843156
Epoch: 2, step: 809, loss: 0.4756616950035095, mean loss: 0.42593319388484346
Epoch: 2, step: 810, loss: 0.38918858766555786, mean loss: 0.42592326022541677
Epoch: 2, step: 811, loss: 0.3642704486846924, mean loss: 0.4259065973033787
Epoch: 2, step: 812, loss: 0.34542974829673767, mean loss: 0.42588485268057225
Epoch: 2, step: 813, loss: 0.3636573553085327, mean loss: 0.4258680435240698
Epoch: 2, step: 814, loss: 0.34425976872444153, mean loss: 0.4258460051025738
Epoch: 2, step: 815, loss: 0.3513045310974121, mean loss: 0.42582588051455944
Epoch: 2, step: 816, loss: 0.32540982961654663, mean loss: 0.4257987776668137
Epoch: 2, step: 817, loss: 0.33581438660621643, mean loss: 0.42577449693528086
Epoch: 2, step: 818, loss: 0.41582199931144714, mean loss: 0.42577181215038096
Epoch: 2, step: 819, loss: 0.3538096249103546, mean loss: 0.4257524048722688
Epoch: 2, step: 820, loss: 0.40292832255363464, mean loss: 0.4257462511698372
Epoch: 2, step: 821, loss: 0.4311519265174866, mean loss: 0.425747708225187
Epoch: 2, step: 822, loss: 0.3669070601463318, mean loss: 0.42573185248601186
Epoch: 2, step: 823, loss: 0.3798385560512543, mean loss: 0.42571948899020506
Epoch: 2, step: 824, loss: 0.3649205267429352, mean loss: 0.4257031143706933
Epoch: 2, step: 825, loss: 0.34054532647132874, mean loss: 0.42568018551019265
Epoch: 2, step: 826, loss: 0.37932178378105164, mean loss: 0.42566770680178645
Epoch: 2, step: 827, loss: 0.36797988414764404, mean loss: 0.42565218262992044
Epoch: 2, step: 828, loss: 0.41239693760871887, mean loss: 0.4256486165161133
Epoch: 2, step: 829, loss: 0.43805620074272156, mean loss: 0.42565195368239267
Epoch: 2, step: 830, loss: 0.3333171010017395, mean loss: 0.4256271258112766
Epoch: 2, step: 831, loss: 0.3610951006412506, mean loss: 0.4256097784926825
Epoch: 2, step: 832, loss: 0.358333021402359, mean loss: 0.4255916982032199
Epoch: 2, step: 833, loss: 0.41755199432373047, mean loss: 0.4255895381538165
Epoch: 2, step: 834, loss: 0.3546799123287201, mean loss: 0.42557049178641787
Epoch: 2, step: 835, loss: 0.3890184462070465, mean loss: 0.42556067652176177
Epoch: 2, step: 836, loss: 0.44785940647125244, mean loss: 0.4255666627579898
Epoch: 2, step: 837, loss: 0.4027408957481384, mean loss: 0.42556053667988736
Epoch: 2, step: 838, loss: 0.3569158613681793, mean loss: 0.4255421184681053
Epoch: 2, step: 839, loss: 0.39307308197021484, mean loss: 0.42553340896260694
Epoch: 2, step: 840, loss: 0.3831494450569153, mean loss: 0.425522042922407
Epoch: 2, step: 841, loss: 0.35060712695121765, mean loss: 0.42550195849453265
Epoch: 2, step: 842, loss: 0.34337007999420166, mean loss: 0.4254799451258646
Epoch: 2, step: 843, loss: 0.3788406550884247, mean loss: 0.4254674479956295
Epoch: 2, step: 844, loss: 0.409633994102478, mean loss: 0.42546320651320435
Epoch: 2, step: 845, loss: 0.4367051124572754, mean loss: 0.4254662172003881
Epoch: 2, step: 846, loss: 0.3737640678882599, mean loss: 0.42545237459013047
Epoch: 2, step: 847, loss: 0.32711923122406006, mean loss: 0.42542605415561063
Epoch: 2, step: 848, loss: 0.3672252595424652, mean loss: 0.42541047995314524
Epoch: 2, step: 849, loss: 0.3971586525440216, mean loss: 0.4254029219468828
Epoch: 2, step: 850, loss: 0.39672261476516724, mean loss: 0.42539525136459294
Epoch: 2, step: 851, loss: 0.42781662940979004, mean loss: 0.4253958987918778
Epoch: 2, step: 852, loss: 0.363111287355423, mean loss: 0.4253792496041108
Epoch: 2, step: 853, loss: 0.3272513449192047, mean loss: 0.4253530262196413
Epoch: 2, step: 854, loss: 0.40278276801109314, mean loss: 0.4253469962281348
Epoch: 2, step: 855, loss: 0.3177585005760193, mean loss: 0.425318259984638
Epoch: 2, step: 856, loss: 0.3998059332370758, mean loss: 0.4253114476143449
Epoch: 2, step: 857, loss: 0.35870954394340515, mean loss: 0.42529366814192876
Epoch: 2, step: 858, loss: 0.35295477509498596, mean loss: 0.4252743623257967
Epoch: 2, step: 859, loss: 0.37091776728630066, mean loss: 0.4252598594989452
Epoch: 2, step: 860, loss: 0.3769717216491699, mean loss: 0.4252469792274462
Epoch: 2, step: 861, loss: 0.36415258049964905, mean loss: 0.42523068738778547
Epoch: 2, step: 862, loss: 0.3766961991786957, mean loss: 0.4252177483080177
Epoch: 2, step: 863, loss: 0.4077133238315582, mean loss: 0.42521308294968174
Epoch: 2, step: 864, loss: 0.39054837822914124, mean loss: 0.4252038464176486
Epoch: 2, step: 865, loss: 0.3939881920814514, mean loss: 0.42519553111281744
Epoch: 2, step: 866, loss: 0.36908695101737976, mean loss: 0.4251805887479452
Epoch: 2, step: 867, loss: 0.37801259756088257, mean loss: 0.42516803070982295
Epoch: 2, step: 868, loss: 0.3303090035915375, mean loss: 0.4251427820999964
Epoch: 2, step: 869, loss: 0.3453764319419861, mean loss: 0.4251215563548772
Epoch: 2, step: 870, loss: 0.40155747532844543, mean loss: 0.4251152876448409
Epoch: 2, step: 871, loss: 0.44039836525917053, mean loss: 0.42511935229314257
Epoch: 2, step: 872, loss: 0.34730106592178345, mean loss: 0.42509866144326985
Epoch: 2, step: 873, loss: 0.40643492341041565, mean loss: 0.425093700322049
Epoch: 2, step: 874, loss: 0.3576602041721344, mean loss: 0.42507578017956965
Epoch: 2, step: 875, loss: 0.4160568118095398, mean loss: 0.4250733840668252
Epoch: 2, step: 876, loss: 0.3827384114265442, mean loss: 0.42506213971818235
Epoch: 2, step: 877, loss: 0.3635903596878052, mean loss: 0.4250458168875848
Epoch: 2, step: 878, loss: 0.39657604694366455, mean loss: 0.425038259210403
Epoch: 2, step: 879, loss: 0.4082295894622803, mean loss: 0.4250337983107883
Epoch: 2, step: 880, loss: 0.3616717755794525, mean loss: 0.4250169869489599
Epoch: 2, step: 881, loss: 0.4343019127845764, mean loss: 0.42501944979400913
Epoch: 2, step: 882, loss: 0.35842403769493103, mean loss: 0.42500178991278426
Epoch: 2, step: 883, loss: 0.4317540228366852, mean loss: 0.4250035800063484
Epoch: 2, step: 884, loss: 0.38565459847450256, mean loss: 0.4249931509097325
Epoch: 2, step: 885, loss: 0.38342252373695374, mean loss: 0.4249821359051822
Epoch: 2, step: 886, loss: 0.3864526152610779, mean loss: 0.42497192940964734
Epoch: 2, step: 887, loss: 0.40377864241600037, mean loss: 0.4249663167806766
Epoch: 2, step: 888, loss: 0.46024999022483826, mean loss: 0.4249756584998834
Epoch: 2, step: 889, loss: 0.34257984161376953, mean loss: 0.42495384912537676
Epoch: 2, step: 890, loss: 0.4150077700614929, mean loss: 0.4249512171912503
Epoch: 2, step: 891, loss: 0.3378674387931824, mean loss: 0.42492817915463704
Epoch: 2, step: 892, loss: 0.3880856931209564, mean loss: 0.42491843504301746
Epoch: 2, step: 893, loss: 0.3693658411502838, mean loss: 0.4249037463613959
Epoch: 2, step: 894, loss: 0.3525290787220001, mean loss: 0.4248846148076979
Epoch: 2, step: 895, loss: 0.3904312551021576, mean loss: 0.4248755097972049
Epoch: 2, step: 896, loss: 0.39504215121269226, mean loss: 0.42486762780022086
Epoch: 2, step: 897, loss: 0.36307594180107117, mean loss: 0.4248513066998513
Epoch: 2, step: 898, loss: 0.363461434841156, mean loss: 0.4248350960128012
Epoch: 2, step: 899, loss: 0.34968993067741394, mean loss: 0.4248152583239587
Epoch: 2, step: 900, loss: 0.3688296377658844, mean loss: 0.4248004824937771
Epoch: 2, step: 901, loss: 0.3768921196460724, mean loss: 0.42478784176479356
Epoch: 2, step: 902, loss: 0.38049325346946716, mean loss: 0.4247761576212179
Epoch: 2, step: 903, loss: 0.4040370285511017, mean loss: 0.4247706884416108
Epoch: 2, step: 904, loss: 0.4284888803958893, mean loss: 0.4247716687189518
Epoch: 2, step: 905, loss: 0.4030822217464447, mean loss: 0.42476595194326056
Epoch: 2, step: 906, loss: 0.36474496126174927, mean loss: 0.4247501361354393
Epoch: 2, step: 907, loss: 0.34578755497932434, mean loss: 0.42472933461247936
Epoch: 2, step: 908, loss: 0.37624379992485046, mean loss: 0.42471656518011497
Epoch: 2, step: 909, loss: 0.39451131224632263, mean loss: 0.42470861224358686
Epoch: 2, step: 910, loss: 0.3506806492805481, mean loss: 0.42468912607276216
Epoch: 2, step: 911, loss: 0.4168221056461334, mean loss: 0.42468705580422883
Epoch: 2, step: 912, loss: 0.33351048827171326, mean loss: 0.4246630682831732
Epoch: 2, step: 913, loss: 0.377072274684906, mean loss: 0.4246505509781763
Epoch: 2, step: 914, loss: 0.39731326699256897, mean loss: 0.42464336263108565
Epoch: 2, step: 915, loss: 0.34645503759384155, mean loss: 0.42462280839211686
Epoch: 2, step: 916, loss: 0.36223646998405457, mean loss: 0.42460641250817255
Epoch: 2, step: 917, loss: 0.40359094738960266, mean loss: 0.4246008908410368
Epoch: 2, step: 918, loss: 0.3611466884613037, mean loss: 0.42458422307051413
Epoch: 2, step: 919, loss: 0.3257264792919159, mean loss: 0.42455826252855544
Epoch: 2, step: 920, loss: 0.3825763165950775, mean loss: 0.42454724075225364
Epoch: 2, step: 921, loss: 0.4103296399116516, mean loss: 0.4245435090984897
Epoch: 2, step: 922, loss: 0.336652010679245, mean loss: 0.424520446516905
Epoch: 2, step: 923, loss: 0.35989895462989807, mean loss: 0.42450349439416446
Epoch: 2, step: 924, loss: 0.4856385588645935, mean loss: 0.4245195277181798
Epoch: 2, step: 925, loss: 0.3870682120323181, mean loss: 0.4245097082856455
Epoch: 2, step: 926, loss: 0.41644129157066345, mean loss: 0.42450759336645416
Epoch: 2, step: 927, loss: 0.3715914189815521, mean loss: 0.42449372644444555
Epoch: 2, step: 928, loss: 0.36909523606300354, mean loss: 0.42447921282370116
Epoch: 2, step: 929, loss: 0.3848976194858551, mean loss: 0.4244688457222507
Epoch: 2, step: 930, loss: 0.3186241686344147, mean loss: 0.42444113043628895
Epoch: 2, step: 931, loss: 0.3755069971084595, mean loss: 0.4244283204537424
Epoch: 2, step: 932, loss: 0.33591848611831665, mean loss: 0.4244051564039294
Epoch: 2, step: 933, loss: 0.3788008391857147, mean loss: 0.4243932243481423
Epoch: 2, step: 934, loss: 0.3570432960987091, mean loss: 0.42437560731224133
Epoch: 2, step: 935, loss: 0.46229293942451477, mean loss: 0.4243855229325636
Epoch: 2, step: 936, loss: 0.36577609181404114, mean loss: 0.4243702002054738
Epoch: 2, step: 937, loss: 0.39997681975364685, mean loss: 0.4243638245179537
Epoch: 2, step: 938, loss: 0.35437139868736267, mean loss: 0.4243455354074675
Epoch: 2, step: 939, loss: 0.3550572395324707, mean loss: 0.42432743501669556
Epoch: 2, step: 940, loss: 0.38890039920806885, mean loss: 0.42431818272215166
Epoch: 2, step: 941, loss: 0.3624863624572754, mean loss: 0.42430203864375354
Epoch: 2, step: 942, loss: 0.36201104521751404, mean loss: 0.42428577892215963
Epoch: 2, step: 943, loss: 0.34312981367111206, mean loss: 0.42426460043435926
Epoch: 2, step: 944, loss: 0.35162442922592163, mean loss: 0.42424564917654334
Epoch: 2, step: 945, loss: 0.36021867394447327, mean loss: 0.4242289493916628
Epoch: 2, step: 946, loss: 0.37205255031585693, mean loss: 0.4242153440724774
Epoch: 2, step: 947, loss: 0.36532869935035706, mean loss: 0.424199993018066
Epoch: 2, step: 948, loss: 0.3721332252025604, mean loss: 0.42418642336265405
Epoch: 2, step: 949, loss: 0.36926406621932983, mean loss: 0.424172113212278
Epoch: 2, step: 950, loss: 0.37634146213531494, mean loss: 0.4241596540689915
Epoch: 2, step: 951, loss: 0.349765807390213, mean loss: 0.4241402806714189
Epoch: 2, step: 952, loss: 0.3914865553379059, mean loss: 0.42413177931100926
Epoch: 2, step: 953, loss: 0.35775598883628845, mean loss: 0.4241145029470127
Epoch: 2, step: 954, loss: 0.40717166662216187, mean loss: 0.4241100941943911
Epoch: 2, step: 955, loss: 0.384906530380249, mean loss: 0.42409989555656225
Epoch: 2, step: 956, loss: 0.35177138447761536, mean loss: 0.42408108450036486
Epoch: 2, step: 957, loss: 0.3451140522956848, mean loss: 0.42406055225070166
Epoch: 2, step: 958, loss: 0.37272146344184875, mean loss: 0.42404720702356136
Epoch: 2, step: 959, loss: 0.3631361424922943, mean loss: 0.424031377744837
Epoch: 2, step: 960, loss: 0.3525022566318512, mean loss: 0.42401279392537405
Epoch: 2, step: 961, loss: 0.38591355085372925, mean loss: 0.4240028980180827
Epoch: 2, step: 962, loss: 0.40213972330093384, mean loss: 0.4239972207460191
Epoch: 2, step: 963, loss: 0.35456743836402893, mean loss: 0.4239791963996063
Epoch: 2, step: 964, loss: 0.40264567732810974, mean loss: 0.42397365954025734
Epoch: 2, step: 965, loss: 0.36146584153175354, mean loss: 0.423957440594225
Epoch: 2, step: 966, loss: 0.3952796459197998, mean loss: 0.42395000147757794
Epoch: 2, step: 967, loss: 0.40388229489326477, mean loss: 0.42394479719682476
Epoch: 2, step: 968, loss: 0.338567852973938, mean loss: 0.4239226616136713
Epoch: 2, step: 969, loss: 0.37728437781333923, mean loss: 0.42391057289314243
Epoch: 2, step: 970, loss: 0.39733508229255676, mean loss: 0.4239036862669179
Epoch: 2, step: 971, loss: 0.36117443442344666, mean loss: 0.423887435165404
Epoch: 2, step: 972, loss: 0.3402469754219055, mean loss: 0.42386577226466754
Epoch: 2, step: 973, loss: 0.3590169847011566, mean loss: 0.42384898076089655
Epoch: 2, step: 974, loss: 0.3716450333595276, mean loss: 0.42383546692517265
Epoch: 2, step: 975, loss: 0.34867990016937256, mean loss: 0.4238160167267369
Epoch: 2, step: 976, loss: 0.42216989398002625, mean loss: 0.4238155908217572
Epoch: 2, step: 977, loss: 0.34229394793510437, mean loss: 0.42379450400259355
Epoch: 2, step: 978, loss: 0.3659314513206482, mean loss: 0.4237795407099424
Epoch: 2, step: 979, loss: 0.3316342532634735, mean loss: 0.423755718246797
Epoch: 2, step: 980, loss: 0.3383563160896301, mean loss: 0.42373364551426734
Epoch: 2, step: 981, loss: 0.39200741052627563, mean loss: 0.4237254475207304
Epoch: 2, step: 982, loss: 0.43276554346084595, mean loss: 0.4237277828593871
Epoch: 2, step: 983, loss: 0.38248738646507263, mean loss: 0.42371713193056626
Epoch: 2, step: 984, loss: 0.39965885877609253, mean loss: 0.4237109201378592
Epoch: 2, step: 985, loss: 0.34937572479248047, mean loss: 0.4236917319098403
Epoch: 2, step: 986, loss: 0.40511876344680786, mean loss: 0.4236869388857208
Epoch: 2, step: 987, loss: 0.37763741612434387, mean loss: 0.4236750582038938
Epoch: 2, step: 988, loss: 0.3741389513015747, mean loss: 0.42366228128697286
Epoch: 2, step: 989, loss: 0.3677219748497009, mean loss: 0.4236478562466332
Epoch: 2, step: 990, loss: 0.43181365728378296, mean loss: 0.42364996137708877
Epoch: 2, step: 991, loss: 0.3378031253814697, mean loss: 0.423627835903894
Epoch: 2, step: 992, loss: 0.3926694989204407, mean loss: 0.4236198590069645
Epoch: 2, step: 993, loss: 0.3434486389160156, mean loss: 0.4235992069667556
Epoch: 2, step: 994, loss: 0.38236457109451294, mean loss: 0.42358858769406127
Epoch: 2, step: 995, loss: 0.37133070826530457, mean loss: 0.4235751330392135
Epoch: 2, step: 996, loss: 0.41675931215286255, mean loss: 0.423573378645163
Epoch: 2, step: 997, loss: 0.37895527482032776, mean loss: 0.4235618968891607
Epoch: 2, step: 998, loss: 0.3703315854072571, mean loss: 0.4235482024431916
Epoch: 2, step: 999, loss: 0.39157480001449585, mean loss: 0.4235399788314558
Epoch: 2, step: 1000, loss: 0.40173396468162537, mean loss: 0.42353437173087727
Epoch: 2, step: 1001, loss: 0.3937850892543793, mean loss: 0.4235267241004206
Epoch: 2, step: 1002, loss: 0.3286769986152649, mean loss: 0.42350234740407383
Epoch: 2, step: 1003, loss: 0.406328946352005, mean loss: 0.4234979349166504
Epoch: 2, step: 1004, loss: 0.36969611048698425, mean loss: 0.4234841147716646
Epoch: 2, step: 1005, loss: 0.36288052797317505, mean loss: 0.4234685514468576
Epoch: 2, step: 1006, loss: 0.36014991998672485, mean loss: 0.4234522950588062
Epoch: 2, step: 1007, loss: 0.3341221809387207, mean loss: 0.42342936638475076
Epoch: 2, step: 1008, loss: 0.4313797652721405, mean loss: 0.42343140651790123
Epoch: 2, step: 1009, loss: 0.37483489513397217, mean loss: 0.42341893948060416
Epoch: 2, step: 1010, loss: 0.3631777763366699, mean loss: 0.4234034890668714
Epoch: 2, step: 1011, loss: 0.3475584089756012, mean loss: 0.42338404161043774
Epoch: 2, step: 1012, loss: 0.4107408821582794, mean loss: 0.42338080060570765
Epoch: 2, step: 1013, loss: 0.38737785816192627, mean loss: 0.42337157381369234
Epoch: 2, step: 1014, loss: 0.35270267724990845, mean loss: 0.42335346751172875
Epoch: 2, step: 1015, loss: 0.3555413484573364, mean loss: 0.42333609760418406
Epoch: 2, step: 1016, loss: 0.4278985261917114, mean loss: 0.4233372659597763
Epoch: 2, step: 1017, loss: 0.3833068907260895, mean loss: 0.4233270175278168
Epoch: 2, step: 1018, loss: 0.3570845425128937, mean loss: 0.4233100627095381
Epoch: 2, step: 1019, loss: 0.38874560594558716, mean loss: 0.4233012181709598
Epoch: 2, step: 1020, loss: 0.3571723401546478, mean loss: 0.4232843010878141
Epoch: 2, step: 1021, loss: 0.3818571865558624, mean loss: 0.4232737059178571
Epoch: 2, step: 1022, loss: 0.3710440695285797, mean loss: 0.42326035137007156
Epoch: 2, step: 1023, loss: 0.3439072072505951, mean loss: 0.42324006682402876
Epoch: 2, step: 1024, loss: 0.3435989320278168, mean loss: 0.4232197138634368
Epoch: 2, step: 1025, loss: 0.40532171726226807, mean loss: 0.4232151410487712
Epoch: 2, step: 1026, loss: 0.37928342819213867, mean loss: 0.42320391966617693
Epoch: 2, step: 1027, loss: 0.3950379192829132, mean loss: 0.4231967271226674
Epoch: 2, step: 1028, loss: 0.34785744547843933, mean loss: 0.4231774931983263
Epoch: 2, step: 1029, loss: 0.38532018661499023, mean loss: 0.42316783079235815
Epoch: 2, step: 1030, loss: 0.5117371678352356, mean loss: 0.42319043077629354
Epoch: 2, step: 1031, loss: 0.33300432562828064, mean loss: 0.423167424116817
Epoch: 2, step: 1032, loss: 0.4034878611564636, mean loss: 0.42316240510050473
Epoch: 2, step: 1033, loss: 0.3497976064682007, mean loss: 0.4231436991345098
Epoch: 2, step: 1034, loss: 0.354198694229126, mean loss: 0.4231261245729739
Epoch: 2, step: 1035, loss: 0.3623763918876648, mean loss: 0.42311064298972073
Epoch: 2, step: 1036, loss: 0.36094382405281067, mean loss: 0.4230948043097368
Epoch: 2, step: 1037, loss: 0.37693774700164795, mean loss: 0.42308304754526704
Epoch: 2, step: 1038, loss: 0.34487655758857727, mean loss: 0.4230631324727036
Epoch: 2, step: 1039, loss: 0.390793114900589, mean loss: 0.423054917091448
Epoch: 2, step: 1040, loss: 0.36668696999549866, mean loss: 0.42304057045182064
Epoch: 2, step: 1041, loss: 0.3502323031425476, mean loss: 0.4230220441751516
Epoch: 2, step: 1042, loss: 0.37604600191116333, mean loss: 0.42301009402448664
Epoch: 2, step: 1043, loss: 0.355803906917572, mean loss: 0.4229930019117941
Epoch: 2, step: 1044, loss: 0.3485119342803955, mean loss: 0.42297406444227176
Epoch: 2, step: 1045, loss: 0.36676639318466187, mean loss: 0.42295977677799684
Epoch: 2, step: 1046, loss: 0.3752794861793518, mean loss: 0.4229476598045283
Epoch: 2, step: 1047, loss: 0.34103086590766907, mean loss: 0.42292684761095695
Epoch: 2, step: 1048, loss: 0.35612672567367554, mean loss: 0.42290988034605037
Epoch: 2, step: 1049, loss: 0.36137646436691284, mean loss: 0.42289425479603027
Epoch: 2, step: 1050, loss: 0.39425569772720337, mean loss: 0.4228869842814152
Epoch: 2, step: 1051, loss: 0.38399195671081543, mean loss: 0.42287711244700643
Epoch: 2, step: 1052, loss: 0.4044497609138489, mean loss: 0.42287243664098434
Epoch: 2, step: 1053, loss: 0.3991774618625641, mean loss: 0.42286642573921407
Epoch: 2, step: 1054, loss: 0.3795301020145416, mean loss: 0.42285543504083095
Epoch: 2, step: 1055, loss: 0.36182209849357605, mean loss: 0.4228399600569194
Epoch: 2, step: 1056, loss: 0.4079185724258423, mean loss: 0.42283617770264026
Epoch: 2, step: 1057, loss: 0.3618767559528351, mean loss: 0.42282072929368186
Epoch: 2, step: 1058, loss: 0.3352554142475128, mean loss: 0.42279854400991035
Epoch: 2, step: 1059, loss: 0.4330461919307709, mean loss: 0.4228011396654121
Epoch: 2, step: 1060, loss: 0.3809073567390442, mean loss: 0.42279053095866953
Epoch: 2, step: 1061, loss: 0.3430359959602356, mean loss: 0.42277033993715096
Epoch: 2, step: 1062, loss: 0.45756885409355164, mean loss: 0.42277914745781825
Epoch: 2, step: 1063, loss: 0.3815253674983978, mean loss: 0.42276870874831435
Epoch: 2, step: 1064, loss: 0.3967741131782532, mean loss: 0.42276213283240993
Epoch: 2, step: 1065, loss: 0.4106202721595764, mean loss: 0.42275906205328173
Epoch: 2, step: 1066, loss: 0.38214778900146484, mean loss: 0.4227487937162269
Epoch: 2, step: 1067, loss: 0.352105051279068, mean loss: 0.4227309363495846
Epoch: 2, step: 1068, loss: 0.33367717266082764, mean loss: 0.4227084309758952
Epoch: 2, step: 1069, loss: 0.39914631843566895, mean loss: 0.42270247794089266
Epoch: 2, step: 1070, loss: 0.4187026917934418, mean loss: 0.42270146763875893
Epoch: 2, step: 1071, loss: 0.3411569595336914, mean loss: 0.42268087559125767
Epoch: 2, step: 1072, loss: 0.38356268405914307, mean loss: 0.422670999753961
Epoch: 2, step: 1073, loss: 0.37493419647216797, mean loss: 0.4226589510908409
Epoch: 2, step: 1074, loss: 0.3841988444328308, mean loss: 0.42264924629481315
Epoch: 2, step: 1075, loss: 0.3696267008781433, mean loss: 0.42263587027427413
Epoch: 2, step: 1076, loss: 0.38964858651161194, mean loss: 0.4226275506566795
Epoch: 2, step: 1077, loss: 0.41461724042892456, mean loss: 0.42262553091128674
Epoch: 2, step: 1078, loss: 0.4279934763908386, mean loss: 0.42262688406114296
Epoch: 2, step: 1079, loss: 0.3439244329929352, mean loss: 0.4226070497740794
Epoch: 2, step: 1080, loss: 0.36832308769226074, mean loss: 0.4225933727869084
Epoch: 2, step: 1081, loss: 0.39198270440101624, mean loss: 0.4225856622910933
Epoch: 2, step: 1082, loss: 0.37045520544052124, mean loss: 0.4225725345003981
Epoch: 2, step: 1083, loss: 0.3385426998138428, mean loss: 0.42255137895289396
Epoch: 2, step: 1084, loss: 0.35340026021003723, mean loss: 0.422533973687668
Epoch: 2, step: 1085, loss: 0.351754367351532, mean loss: 0.4225161630167228
Epoch: 2, step: 1086, loss: 0.37510988116264343, mean loss: 0.42250423690808026
Epoch: 2, step: 1087, loss: 0.37881070375442505, mean loss: 0.42249324758887663
Epoch: 2, step: 1088, loss: 0.4158329665660858, mean loss: 0.4224915728890972
Epoch: 2, step: 1089, loss: 0.35470789670944214, mean loss: 0.42247453325204853
Epoch: 2, step: 1090, loss: 0.3823096454143524, mean loss: 0.422464439035452
Epoch: 2, step: 1091, loss: 0.3754889965057373, mean loss: 0.42245263616044454
Epoch: 2, step: 1092, loss: 0.36100608110427856, mean loss: 0.4224372012056452
Epoch: 2, step: 1093, loss: 0.41447949409484863, mean loss: 0.422435202785979
Epoch: 2, step: 1094, loss: 0.3781159520149231, mean loss: 0.42242407568309903
Epoch: 2, step: 1095, loss: 0.3165474236011505, mean loss: 0.42239750021821904
Epoch: 2, step: 1096, loss: 0.4095076322555542, mean loss: 0.4223942656214906
Epoch: 2, step: 1097, loss: 0.3833426237106323, mean loss: 0.4223844684208105
Epoch: 2, step: 1098, loss: 0.35090214014053345, mean loss: 0.4223665395699752
Epoch: 2, step: 1099, loss: 0.370653361082077, mean loss: 0.4223535723737646
Epoch: 2, step: 1100, loss: 0.3162200450897217, mean loss: 0.42232696582393153
Epoch: 2, step: 1101, loss: 0.36160382628440857, mean loss: 0.4223117469919667
Epoch: 2, step: 1102, loss: 0.35579389333724976, mean loss: 0.42229508002788385
Epoch: 2, step: 1103, loss: 0.3387099504470825, mean loss: 0.4222741418691712
Epoch: 2, step: 1104, loss: 0.36719441413879395, mean loss: 0.4222603477976134
Epoch: 2, step: 1105, loss: 0.45783159136772156, mean loss: 0.42226925396776116
Epoch: 2, step: 1106, loss: 0.37160488963127136, mean loss: 0.42225657202424766
Epoch: 2, step: 1107, loss: 0.35629838705062866, mean loss: 0.42224006597195196
Epoch: 2, step: 1108, loss: 0.40173086524009705, mean loss: 0.42223493482340757
Epoch: 2, step: 1109, loss: 0.36394166946411133, mean loss: 0.4222203542167644
Epoch: 2, step: 1110, loss: 0.3230096101760864, mean loss: 0.42219554532853215
Epoch: 2, step: 1111, loss: 0.3628712296485901, mean loss: 0.4221807142496122
Epoch: 2, step: 1112, loss: 0.3553105890750885, mean loss: 0.4221640008966568
Epoch: 2, step: 1113, loss: 0.3702146112918854, mean loss: 0.4221510200396841
Epoch: 2, step: 1114, loss: 0.3529670536518097, mean loss: 0.4221337370103591
Epoch: 2, step: 1115, loss: 0.4253259599208832, mean loss: 0.4221345342688283
Epoch: 2, step: 1116, loss: 0.39208000898361206, mean loss: 0.42212703001782076
Epoch: 2, step: 1117, loss: 0.3419581353664398, mean loss: 0.42210701781246596
Epoch: 2, step: 1118, loss: 0.35062697529792786, mean loss: 0.4220891790197246
Epoch: 2, step: 1119, loss: 0.3605920374393463, mean loss: 0.4220738354215259
Epoch: 2, step: 1120, loss: 0.35371091961860657, mean loss: 0.4220567830603877
Epoch: 2, step: 1121, loss: 0.368940144777298, mean loss: 0.42204353701592806
Epoch: 2, step: 1122, loss: 0.38916558027267456, mean loss: 0.4220353400683481
Epoch: 2, step: 1123, loss: 0.38960593938827515, mean loss: 0.42202725696748067
Epoch: 2, step: 1124, loss: 0.4229314625263214, mean loss: 0.4220274822865833
Epoch: 2, step: 1125, loss: 0.38976964354515076, mean loss: 0.42201944595406177
Epoch: 2, step: 1126, loss: 0.35507088899612427, mean loss: 0.42200277134460773
Epoch: 2, step: 1127, loss: 0.36595892906188965, mean loss: 0.4219888162045971
Epoch: 2, step: 1128, loss: 0.38092923164367676, mean loss: 0.42197859474964045
Epoch: 2, step: 1129, loss: 0.42847132682800293, mean loss: 0.4219802106610587
Epoch: 2, step: 1130, loss: 0.38463449478149414, mean loss: 0.4219709183704691
Epoch: 2, step: 1131, loss: 0.4146518409252167, mean loss: 0.4219690977044379
Epoch: 2, step: 1132, loss: 0.436511367559433, mean loss: 0.4219727142848545
Epoch: 2, step: 1133, loss: 0.38962849974632263, mean loss: 0.4219646724612497
Epoch: 2, step: 1134, loss: 0.3882755935192108, mean loss: 0.4219562983426959
Epoch: 2, step: 1135, loss: 0.46287548542022705, mean loss: 0.4219664671267609
Epoch: 2, step: 1136, loss: 0.3595849573612213, mean loss: 0.4219509686150179
Epoch: 2, step: 1137, loss: 0.3853762745857239, mean loss: 0.421941883991563
Epoch: 2, step: 1138, loss: 0.36057305335998535, mean loss: 0.4219266446494643
Epoch: 2, step: 1139, loss: 0.3993537127971649, mean loss: 0.4219210406445357
Epoch: 2, step: 1140, loss: 0.34379297494888306, mean loss: 0.4219016492159689
Epoch: 2, step: 1141, loss: 0.39193832874298096, mean loss: 0.42189421414885403
Epoch: 2, step: 1142, loss: 0.40062540769577026, mean loss: 0.4218889378386449
Epoch: 2, step: 1143, loss: 0.4347071349620819, mean loss: 0.42189211695499496
Epoch: 2, step: 1144, loss: 0.37680497765541077, mean loss: 0.4218809374014865
Epoch: 2, step: 1145, loss: 0.3925100862979889, mean loss: 0.42187365657572956
Epoch: 2, step: 1146, loss: 0.33812442421913147, mean loss: 0.42185290087997823
Epoch: 2, step: 1147, loss: 0.3922649323940277, mean loss: 0.4218455698669738
Epoch: 2, step: 1148, loss: 0.36425724625587463, mean loss: 0.4218313047385093
Epoch: 2, step: 1149, loss: 0.3970393240451813, mean loss: 0.4218251650701851
Epoch: 2, step: 1150, loss: 0.34255796670913696, mean loss: 0.42180553961874634
Epoch: 2, step: 1151, loss: 0.37128570675849915, mean loss: 0.42179303470962254
Epoch: 2, step: 1152, loss: 0.391095370054245, mean loss: 0.4217854381581117
Epoch: 2, step: 1153, loss: 0.3727765679359436, mean loss: 0.4217733132520696
Epoch: 2, step: 1154, loss: 0.3558645248413086, mean loss: 0.42175701130094156
Epoch: 2, step: 1155, loss: 0.3757082521915436, mean loss: 0.4217456243674328
Epoch: 2, step: 1156, loss: 0.3569414019584656, mean loss: 0.42172960354607086
Epoch: 2, step: 1157, loss: 0.3507023751735687, mean loss: 0.4217120486206204
Epoch: 2, step: 1158, loss: 0.34714552760124207, mean loss: 0.42169362348570083
Epoch: 2, step: 1159, loss: 0.36242008209228516, mean loss: 0.4216789808124317
Epoch: 2, step: 1160, loss: 0.3544754981994629, mean loss: 0.421662383261774
Epoch: 2, step: 1161, loss: 0.4003511369228363, mean loss: 0.421657121225641
Epoch: 2, step: 1162, loss: 0.3555915653705597, mean loss: 0.4216408127694931
Epoch: 2, step: 1163, loss: 0.3623465299606323, mean loss: 0.421626179432176
Epoch: 2, step: 1164, loss: 0.3678737282752991, mean loss: 0.42161291704600357
Epoch: 2, step: 1165, loss: 0.3514983654022217, mean loss: 0.4215956218926627
Epoch: 2, step: 1166, loss: 0.3486529588699341, mean loss: 0.4215776335663932
Epoch: 2, step: 1167, loss: 0.37321737408638, mean loss: 0.4215657104254958
Epoch: 2, step: 1168, loss: 0.39824333786964417, mean loss: 0.4215599617509688
Epoch: 2, step: 1169, loss: 0.3703378140926361, mean loss: 0.4215473392404567
Epoch: 2, step: 1170, loss: 0.3727951645851135, mean loss: 0.4215353283573191
Epoch: 2, step: 1171, loss: 0.39245253801345825, mean loss: 0.4215281651084659
Epoch: 2, step: 1172, loss: 0.3480777144432068, mean loss: 0.42151007831933385
Epoch: 2, step: 1173, loss: 0.3440980315208435, mean loss: 0.4214910207007227
Epoch: 2, step: 1174, loss: 0.39070412516593933, mean loss: 0.4214834433205763
Epoch: 2, step: 1175, loss: 0.3772541582584381, mean loss: 0.42147256013035433
Epoch: 2, step: 1176, loss: 0.3412553668022156, mean loss: 0.42145282650345933
Epoch: 2, step: 1177, loss: 0.3617618978023529, mean loss: 0.4214381459995978
Epoch: 2, step: 1178, loss: 0.35991623997688293, mean loss: 0.42142301890197725
Epoch: 2, step: 1179, loss: 0.3807404935359955, mean loss: 0.42141301828118916
Epoch: 2, step: 1180, loss: 0.32927846908569336, mean loss: 0.42139037523641265
Epoch: 2, step: 1181, loss: 0.363020122051239, mean loss: 0.42137603365086346
Epoch: 2, step: 1182, loss: 0.3520711660385132, mean loss: 0.42135900961067374
Epoch: 2, step: 1183, loss: 0.40076568722724915, mean loss: 0.42135395231146366
Epoch: 2, step: 1184, loss: 0.34028321504592896, mean loss: 0.42133404788296736
Epoch: 2, step: 1185, loss: 0.4331260621547699, mean loss: 0.4213369423390969
Epoch: 2, step: 1186, loss: 0.38861754536628723, mean loss: 0.42132891303922626
Epoch: 2, step: 1187, loss: 0.3680713176727295, mean loss: 0.4213158468970853
Epoch: 2, step: 1188, loss: 0.3277171552181244, mean loss: 0.42129288916059304
Epoch: 2, step: 1189, loss: 0.4021252691745758, mean loss: 0.42128818891047387
Epoch: 2, step: 1190, loss: 0.35189712047576904, mean loss: 0.42127117712610646
Epoch: 2, step: 1191, loss: 0.3417942225933075, mean loss: 0.42125169748038765
Epoch: 2, step: 1192, loss: 0.34094831347465515, mean loss: 0.4212320201013125
Epoch: 2, step: 1193, loss: 0.3487480580806732, mean loss: 0.421214263128745
Epoch: 2, step: 1194, loss: 0.32865244150161743, mean loss: 0.42119159307691373
Epoch: 2, step: 1195, loss: 0.39278391003608704, mean loss: 0.42118463722896055
Epoch: 2, step: 1196, loss: 0.43923085927963257, mean loss: 0.4211890549087771
Epoch: 2, step: 1197, loss: 0.39993032813072205, mean loss: 0.421183852087735
Epoch: 2, step: 1198, loss: 0.3619246780872345, mean loss: 0.4211693526568565
Epoch: 2, step: 1199, loss: 0.35720348358154297, mean loss: 0.42115370542860914
Epoch: 2, step: 1200, loss: 0.38931795954704285, mean loss: 0.42114591972406484
Epoch: 2, step: 1201, loss: 0.3565109670162201, mean loss: 0.4211301165571436
Epoch: 2, step: 1202, loss: 0.3611813187599182, mean loss: 0.4211154627322115
Epoch: 2, step: 1203, loss: 0.37321144342422485, mean loss: 0.421103755982625
Epoch: 2, step: 1204, loss: 0.31904301047325134, mean loss: 0.42107882054516854
Epoch: 2, step: 1205, loss: 0.3867432773113251, mean loss: 0.42107043374906844
Epoch: 2, step: 1206, loss: 0.3949657082557678, mean loss: 0.42106405896872817
Epoch: 2, step: 1207, loss: 0.4277327358722687, mean loss: 0.4210656870636753
Epoch: 2, step: 1208, loss: 0.36772415041923523, mean loss: 0.4210526674062078
Epoch: 2, step: 1209, loss: 0.37083956599235535, mean loss: 0.4210404143311922
Epoch: 2, step: 1210, loss: 0.38345417380332947, mean loss: 0.4210312447189629
Epoch: 2, step: 1211, loss: 0.4092291593551636, mean loss: 0.4210283661615571
Epoch: 2, step: 1212, loss: 0.346085786819458, mean loss: 0.4210100919407958
Epoch: 2, step: 1213, loss: 0.35553380846977234, mean loss: 0.4209941299019194
Epoch: 2, step: 1214, loss: 0.4168853759765625, mean loss: 0.4209931284995491
Epoch: 2, step: 1215, loss: 0.347974956035614, mean loss: 0.4209753365471944
Epoch: 2, step: 1216, loss: 0.367367684841156, mean loss: 0.42096227743593834
Epoch: 2, step: 1217, loss: 0.3839578330516815, mean loss: 0.4209532651504088
Epoch: 2, step: 1218, loss: 0.3695997893810272, mean loss: 0.420940761260521
Epoch: 2, step: 1219, loss: 0.440937876701355, mean loss: 0.42094562910751243
Epoch: 2, step: 1220, loss: 0.3901057243347168, mean loss: 0.42093812365490285
Epoch: 2, step: 1221, loss: 0.36917421221733093, mean loss: 0.42092552902924896
Epoch: 2, step: 1222, loss: 0.42798250913619995, mean loss: 0.4209272456383725
Epoch: 2, step: 1223, loss: 0.3783717453479767, mean loss: 0.4209168965381074
Epoch: 2, step: 1224, loss: 0.40756934881210327, mean loss: 0.42091365132835146
Epoch: 2, step: 1225, loss: 0.3482450246810913, mean loss: 0.4208959875882816
Epoch: 2, step: 1226, loss: 0.3619956374168396, mean loss: 0.42088167401594345
Epoch: 2, step: 1227, loss: 0.38251838088035583, mean loss: 0.42087235348797075
Epoch: 2, step: 1228, loss: 0.39778468012809753, mean loss: 0.4208667456003439
Epoch: 2, step: 1229, loss: 0.37190040946006775, mean loss: 0.42085485479506457
Epoch: 2, step: 1230, loss: 0.42071789503097534, mean loss: 0.4208548215443328
Epoch: 2, step: 1231, loss: 0.3778952658176422, mean loss: 0.4208443944677001
Epoch: 2, step: 1232, loss: 0.3716805577278137, mean loss: 0.42083246439326677
Epoch: 2, step: 1233, loss: 0.32443180680274963, mean loss: 0.4208090775282521
Epoch: 2, step: 1234, loss: 0.4122365117073059, mean loss: 0.4208069983223775
Epoch: 2, step: 1235, loss: 0.3982360064983368, mean loss: 0.42080152523997594
Epoch: 2, step: 1236, loss: 0.392309308052063, mean loss: 0.4207946180358092
Epoch: 2, step: 1237, loss: 0.3545852601528168, mean loss: 0.4207785711725317
Epoch: 2, step: 1238, loss: 0.36126887798309326, mean loss: 0.42076415157156505
Epoch: 2, step: 1239, loss: 0.4365933835506439, mean loss: 0.4207679861723352
Epoch: 2, step: 1240, loss: 0.38045090436935425, mean loss: 0.42075822180280187
Epoch: 2, step: 1241, loss: 0.33725425601005554, mean loss: 0.42073800292488595
Epoch: 2, step: 1242, loss: 0.3418993055820465, mean loss: 0.4207189182729027
Epoch: 2, step: 1243, loss: 0.41086238622665405, mean loss: 0.4207165328585643
Epoch: 2, step: 1244, loss: 0.41653871536254883, mean loss: 0.4207155220147472
Epoch: 2, step: 1245, loss: 0.3961416482925415, mean loss: 0.4207095776814811
Epoch: 2, step: 1246, loss: 0.3387453556060791, mean loss: 0.4206897556205197
Epoch: 2, step: 1247, loss: 0.3691275119781494, mean loss: 0.42067728892718254
Epoch: 2, step: 1248, loss: 0.3578055500984192, mean loss: 0.4206620915042121
Epoch: 2, step: 1249, loss: 0.3486294448375702, mean loss: 0.42064468390472765
Epoch: 2, step: 1250, loss: 0.36870524287223816, mean loss: 0.4206321351149155
Epoch: 2, step: 1251, loss: 0.35981377959251404, mean loss: 0.42061744469087625
Epoch: 2, step: 1252, loss: 0.3812549412250519, mean loss: 0.42060793913582534
Epoch: 2, step: 1253, loss: 0.4421774446964264, mean loss: 0.42061314664561783
Epoch: 2, step: 1254, loss: 0.35730352997779846, mean loss: 0.42059786554094303
Epoch: 2, step: 1255, loss: 0.35503697395324707, mean loss: 0.4205820448624711
Epoch: 2, step: 1256, loss: 0.38159051537513733, mean loss: 0.4205726379796032
Epoch: 2, step: 1257, loss: 0.36002466082572937, mean loss: 0.4205580340294937
Epoch: 2, step: 1258, loss: 0.3555225133895874, mean loss: 0.4205423514829203
Epoch: 2, step: 1259, loss: 0.35443785786628723, mean loss: 0.42052641500904936
Epoch: 2, step: 1260, loss: 0.35029441118240356, mean loss: 0.42050948755572887
Epoch: 2, step: 1261, loss: 0.3778792917728424, mean loss: 0.42049921521939565
Epoch: 2, step: 1262, loss: 0.36841022968292236, mean loss: 0.4204866666803601
Epoch: 2, step: 1263, loss: 0.3858882784843445, mean loss: 0.4204783337352262
Epoch: 2, step: 1264, loss: 0.36547303199768066, mean loss: 0.42046508902014373
Epoch: 2, step: 1265, loss: 0.386122465133667, mean loss: 0.42045682165762893
Epoch: 2, step: 1266, loss: 0.33768460154533386, mean loss: 0.42043690054568855
Epoch: 2, step: 1267, loss: 0.3761454224586487, mean loss: 0.42042624330842027
Epoch: 2, step: 1268, loss: 0.3685530722141266, mean loss: 0.42041376479721165
Epoch: 2, step: 1269, loss: 0.33046072721481323, mean loss: 0.42039213107003937
Epoch: 2, step: 1270, loss: 0.3593847155570984, mean loss: 0.42037746229977896
Epoch: 2, step: 1271, loss: 0.3585473597049713, mean loss: 0.4203625992943475
Epoch: 2, step: 1272, loss: 0.3928491473197937, mean loss: 0.4203559870732529
Epoch: 2, step: 1273, loss: 0.34733375906944275, mean loss: 0.42033844208814863
Epoch: 2, step: 1274, loss: 0.4057725965976715, mean loss: 0.42033494320621484
Epoch: 2, step: 1275, loss: 0.3678063154220581, mean loss: 0.42032232826198235
Epoch: 2, step: 1276, loss: 0.38982969522476196, mean loss: 0.42031500710158926
Epoch: 2, step: 1277, loss: 0.34833866357803345, mean loss: 0.4202977300148097
Epoch: 2, step: 1278, loss: 0.38355591893196106, mean loss: 0.42028891268553614
Epoch: 2, step: 1279, loss: 0.3566148281097412, mean loss: 0.4202736357938433
Epoch: 2, step: 1280, loss: 0.3454447090625763, mean loss: 0.4202556869028068
Epoch: 2, step: 1281, loss: 0.35285118222236633, mean loss: 0.4202395227530033
Epoch: 2, step: 1282, loss: 0.3489508330821991, mean loss: 0.42022243124265307
Epoch: 2, step: 1283, loss: 0.3664451837539673, mean loss: 0.4202095412025072
Epoch: 2, step: 1284, loss: 0.3475862741470337, mean loss: 0.4201921380711735
Epoch: 2, step: 1285, loss: 0.3470913767814636, mean loss: 0.42017462471197614
Epoch: 2, step: 1286, loss: 0.3366221487522125, mean loss: 0.42015461214288397
Epoch: 2, step: 1287, loss: 0.40589138865470886, mean loss: 0.42015119662001804
Epoch: 2, step: 1288, loss: 0.3673963248729706, mean loss: 0.4201385667728198
Epoch: 2, step: 1289, loss: 0.3624284863471985, mean loss: 0.4201247539244652
Epoch: 2, step: 1290, loss: 0.38991013169288635, mean loss: 0.42011752381624995
Epoch: 2, step: 1291, loss: 0.34235596656799316, mean loss: 0.4200989205728891
Epoch: 2, step: 1292, loss: 0.3699042499065399, mean loss: 0.42008691515058194
Epoch: 2, step: 1293, loss: 0.3697023391723633, mean loss: 0.42007486718884635
Epoch: 2, step: 1294, loss: 0.3922275900840759, mean loss: 0.42006820993876154
Epoch: 2, step: 1295, loss: 0.351498544216156, mean loss: 0.4200518213953288
Epoch: 2, step: 1296, loss: 0.43654119968414307, mean loss: 0.42005576150961527
Epoch: 2, step: 1297, loss: 0.3530328571796417, mean loss: 0.42003975030456747
Epoch: 2, step: 1298, loss: 0.39182108640670776, mean loss: 0.42003301071443183
Epoch: 2, step: 1299, loss: 0.4447265863418579, mean loss: 0.42003890698368385
Epoch: 2, step: 1300, loss: 0.3669038414955139, mean loss: 0.4200262225564964
Epoch: 2, step: 1301, loss: 0.37589678168296814, mean loss: 0.4200156904703691
Epoch: 2, step: 1302, loss: 0.34184178709983826, mean loss: 0.41999703766593804
Epoch: 2, step: 1303, loss: 0.33145520091056824, mean loss: 0.4199759160445746
Epoch: 2, step: 1304, loss: 0.3673460781574249, mean loss: 0.41996336421106945
Epoch: 2, step: 1305, loss: 0.4214661717414856, mean loss: 0.4199637225342765
Epoch: 2, step: 1306, loss: 0.34651994705200195, mean loss: 0.4199462150788576
Epoch: 2, step: 1307, loss: 0.36222025752067566, mean loss: 0.41993245770098386
Epoch: 2, step: 1308, loss: 0.38658541440963745, mean loss: 0.41992451225345195
Epoch: 2, step: 1309, loss: 0.36091870069503784, mean loss: 0.4199104565575114
Epoch: 2, step: 1310, loss: 0.3581443130970001, mean loss: 0.419895746830562
Epoch: 2, step: 1311, loss: 0.3573745787143707, mean loss: 0.4198808608381534
Epoch: 2, step: 1312, loss: 0.354988157749176, mean loss: 0.4198654138724098
Epoch: 2, step: 1313, loss: 0.36571890115737915, mean loss: 0.4198525279817113
Epoch: 2, step: 1314, loss: 0.3460853397846222, mean loss: 0.4198349769019594
Epoch: 2, step: 1315, loss: 0.33701199293136597, mean loss: 0.4198152759067238
Epoch: 2, step: 1316, loss: 0.3944876194000244, mean loss: 0.4198092526828221
Epoch: 2, step: 1317, loss: 0.40072792768478394, mean loss: 0.41980471599119157
Epoch: 2, step: 1318, loss: 0.3399251401424408, mean loss: 0.4197857286900628
Epoch: 2, step: 1319, loss: 0.3756483793258667, mean loss: 0.41977523977624054
Epoch: 2, step: 1320, loss: 0.3586917817592621, mean loss: 0.4197607271941505
Epoch: 2, step: 1321, loss: 0.4060170650482178, mean loss: 0.41975746266632485
Epoch: 2, step: 1322, loss: 0.3598363399505615, mean loss: 0.41974323300051725
Epoch: 2, step: 1323, loss: 0.37822669744491577, mean loss: 0.41973337627317736
Epoch: 2, step: 1324, loss: 0.38938912749290466, mean loss: 0.419726173745577
Epoch: 2, step: 1325, loss: 0.3921942114830017, mean loss: 0.4197196402946367
Epoch: 2, step: 1326, loss: 0.459152489900589, mean loss: 0.4197289956563463
Epoch: 2, step: 1327, loss: 0.3687255382537842, mean loss: 0.41971689806208573
Epoch: 2, step: 1328, loss: 0.3672836124897003, mean loss: 0.41970446427371194
Epoch: 2, step: 1329, loss: 0.3858202397823334, mean loss: 0.4196964310294039
Epoch: 2, step: 1330, loss: 0.35386455059051514, mean loss: 0.419680827360184
Epoch: 2, step: 1331, loss: 0.3334157168865204, mean loss: 0.4196603853908774
Epoch: 2, step: 1332, loss: 0.37493541836738586, mean loss: 0.41964978956831794
Epoch: 2, step: 1333, loss: 0.37417882680892944, mean loss: 0.41963901956292726
Epoch: 2, step: 1334, loss: 0.38410598039627075, mean loss: 0.41963060539310326
Epoch: 2, step: 1335, loss: 0.3868016302585602, mean loss: 0.4196228333819445
Epoch: 2, step: 1336, loss: 0.35124537348747253, mean loss: 0.4196066493677683
Epoch: 2, step: 1337, loss: 0.3554977476596832, mean loss: 0.41959147925378154
Epoch: 2, step: 1338, loss: 0.40610840916633606, mean loss: 0.4195882895045297
Epoch: 2, step: 1339, loss: 0.3741937577724457, mean loss: 0.41957755286031684
Epoch: 2, step: 1340, loss: 0.37890809774398804, mean loss: 0.41956793605844495
Epoch: 2, step: 1341, loss: 0.3885340690612793, mean loss: 0.4195605994468617
Epoch: 2, step: 1342, loss: 0.37208622694015503, mean loss: 0.41954937884357485
Epoch: 2, step: 1343, loss: 0.37632840871810913, mean loss: 0.4195391659489327
Epoch: 2, step: 1344, loss: 0.3309188187122345, mean loss: 0.419518230360169
Epoch: 2, step: 1345, loss: 0.3568021059036255, mean loss: 0.4195034178602974
Epoch: 2, step: 1346, loss: 0.4011697471141815, mean loss: 0.41949908877629594
Epoch: 2, step: 1347, loss: 0.3662014603614807, mean loss: 0.4194865067110422
Epoch: 2, step: 1348, loss: 0.37150970101356506, mean loss: 0.41947518341491347
Epoch: 2, step: 1349, loss: 0.3879666030406952, mean loss: 0.4194677486389875
Epoch: 2, step: 1350, loss: 0.30849751830101013, mean loss: 0.41944157024070067
Epoch: 2, step: 1351, loss: 0.3503634035587311, mean loss: 0.4194252782202568
Epoch: 2, step: 1352, loss: 0.42376795411109924, mean loss: 0.4194263021947654
Epoch: 2, step: 1353, loss: 0.4501948654651642, mean loss: 0.41943355551001066
Epoch: 2, step: 1354, loss: 0.37602999806404114, mean loss: 0.41942332605975235
Epoch: 2, step: 1355, loss: 0.3628264367580414, mean loss: 0.41940999031769255
Epoch: 2, step: 1356, loss: 0.4101170599460602, mean loss: 0.41940780117037296
Epoch: 2, step: 1357, loss: 0.38897860050201416, mean loss: 0.4194006346134562
Epoch: 2, step: 1358, loss: 0.36803218722343445, mean loss: 0.4193885393821424
Epoch: 2, step: 1359, loss: 0.3604678809642792, mean loss: 0.4193746691706504
Epoch: 2, step: 1360, loss: 0.3587794601917267, mean loss: 0.4193604081188785
Epoch: 2, step: 1361, loss: 0.38522347807884216, mean loss: 0.41935237590004554
Epoch: 2, step: 1362, loss: 0.3980071544647217, mean loss: 0.4193473546764663
Epoch: 2, step: 1363, loss: 0.4001196324825287, mean loss: 0.419342832634558
Epoch: 2, step: 1364, loss: 0.35612955689430237, mean loss: 0.419327969414304
Epoch: 2, step: 1365, loss: 0.3396579325199127, mean loss: 0.41930924114987184
Epoch: 2, step: 1366, loss: 0.37009501457214355, mean loss: 0.41929767493916026
Epoch: 2, step: 1367, loss: 0.3682747781276703, mean loss: 0.41928568647656356
Epoch: 2, step: 1368, loss: 0.36582279205322266, mean loss: 0.4192731276571078
Epoch: 2, step: 1369, loss: 0.3931056559085846, mean loss: 0.4192669821729019
Epoch: 2, step: 1370, loss: 0.3747437596321106, mean loss: 0.419256528258241
Epoch: 2, step: 1371, loss: 0.42061617970466614, mean loss: 0.4192568474252472
Epoch: 2, step: 1372, loss: 0.36765116453170776, mean loss: 0.41924473625817527
Epoch: 2, step: 1373, loss: 0.3766815960407257, mean loss: 0.41923474959927864
Epoch: 2, step: 1374, loss: 0.3507753908634186, mean loss: 0.4192186906364037
Epoch: 2, step: 1375, loss: 0.35540035367012024, mean loss: 0.41920372385944166
Epoch: 2, step: 1376, loss: 0.36032769083976746, mean loss: 0.4191899193968345
Epoch: 2, step: 1377, loss: 0.37686827778816223, mean loss: 0.4191799987119754
Epoch: 2, step: 1378, loss: 0.3546130657196045, mean loss: 0.41916486701921885
Epoch: 2, step: 1379, loss: 0.3515814244747162, mean loss: 0.41914903209828525
Epoch: 2, step: 1380, loss: 0.4113101661205292, mean loss: 0.41914719586826
Epoch: 2, step: 1381, loss: 0.3722173869609833, mean loss: 0.4191362052806939
Epoch: 2, step: 1382, loss: 0.3829692304134369, mean loss: 0.4191277372463068
Epoch: 2, step: 1383, loss: 0.35071903467178345, mean loss: 0.41911172397323226
Epoch: 2, step: 1384, loss: 0.3391166627407074, mean loss: 0.41909300291981955
Epoch: 2, step: 1385, loss: 0.36855071783065796, mean loss: 0.41908117739686934
Epoch: 2, step: 1386, loss: 0.36574095487594604, mean loss: 0.4190687001518352
Epoch: 2, step: 1387, loss: 0.3417019248008728, mean loss: 0.41905060689286633
Epoch: 2, step: 1388, loss: 0.4376209080219269, mean loss: 0.41905494879165733
Epoch: 2, step: 1389, loss: 0.3765013515949249, mean loss: 0.41904500171423875
Epoch: 2, step: 1390, loss: 0.37164756655693054, mean loss: 0.419033924959119
Epoch: 2, step: 1391, loss: 0.3950234651565552, mean loss: 0.4190283150386044
Epoch: 2, step: 1392, loss: 0.3723151385784149, mean loss: 0.4190174032945118
Epoch: 2, step: 1393, loss: 0.4409497380256653, mean loss: 0.41902252527833506
Epoch: 2, step: 1394, loss: 0.3951067328453064, mean loss: 0.41901694139030493
Epoch: 2, step: 1395, loss: 0.3284435570240021, mean loss: 0.4189957991437208
Epoch: 2, step: 1396, loss: 0.3346533477306366, mean loss: 0.4189761159578601
Epoch: 2, step: 1397, loss: 0.3763597905635834, mean loss: 0.41896617281147785
Epoch: 2, step: 1398, loss: 0.3724321126937866, mean loss: 0.41895531812052433
Epoch: 2, step: 1399, loss: 0.36222872138023376, mean loss: 0.4189420889701651
Epoch: 2, step: 1400, loss: 0.43064600229263306, mean loss: 0.4189448177911776
Epoch: 2, step: 1401, loss: 0.47188737988471985, mean loss: 0.41895715871474254
Epoch: 2, step: 1402, loss: 0.4001522958278656, mean loss: 0.4189527763183578
Epoch: 2, step: 1403, loss: 0.4020577073097229, mean loss: 0.4189488399089895
Epoch: 2, step: 1404, loss: 0.3570170998573303, mean loss: 0.41893441369420925
Epoch: 2, step: 1405, loss: 0.3840802311897278, mean loss: 0.4189262967443945
Epoch: 2, step: 1406, loss: 0.3682517409324646, mean loss: 0.41891449824478755
Epoch: 2, step: 1407, loss: 0.3500646650791168, mean loss: 0.4188984717473095
Epoch: 2, step: 1408, loss: 0.3601290285587311, mean loss: 0.4188847948929486
Epoch: 2, step: 1409, loss: 0.3611987233161926, mean loss: 0.41887137328485724
Epoch: 2, step: 1410, loss: 0.3451194763183594, mean loss: 0.4188542176912386
Epoch: 2, step: 1411, loss: 0.35253196954727173, mean loss: 0.4188387939126005
Epoch: 2, step: 1412, loss: 0.3807540535926819, mean loss: 0.4188299390555161
Epoch: 2, step: 1413, loss: 0.35541683435440063, mean loss: 0.4188151986778543
Epoch: 2, step: 1414, loss: 0.3679673671722412, mean loss: 0.4188033818450619
Epoch: 2, step: 1415, loss: 0.3969949781894684, mean loss: 0.4187983148367776
Epoch: 2, step: 1416, loss: 0.32706964015960693, mean loss: 0.418777007362985
Epoch: 2, step: 1417, loss: 0.3507000803947449, mean loss: 0.4187611975796668
Epoch: 2, step: 1418, loss: 0.4083501398563385, mean loss: 0.41875878033849584
Epoch: 2, step: 1419, loss: 0.3289790451526642, mean loss: 0.41873794010284454
Epoch: 2, step: 1420, loss: 0.35523220896720886, mean loss: 0.4187232021749876
Epoch: 2, step: 1421, loss: 0.34804531931877136, mean loss: 0.4187068035942785
Epoch: 2, step: 1422, loss: 0.370032399892807, mean loss: 0.41869551284881307
Epoch: 2, step: 1423, loss: 0.346953809261322, mean loss: 0.41867887516245234
Epoch: 2, step: 1424, loss: 0.43050616979599, mean loss: 0.41868161740558557
Epoch: 2, step: 1425, loss: 0.3551592230796814, mean loss: 0.41866689269665514
Epoch: 2, step: 1426, loss: 0.39620381593704224, mean loss: 0.41866168688512334
Epoch: 2, step: 1427, loss: 0.3481349050998688, mean loss: 0.41864534611084503
Epoch: 2, step: 1428, loss: 0.3959003984928131, mean loss: 0.41864007741785964
Epoch: 2, step: 1429, loss: 0.3869872987270355, mean loss: 0.4186327469920396
Epoch: 2, step: 1430, loss: 0.4017290771007538, mean loss: 0.4186288331995202
Epoch: 2, step: 1431, loss: 0.37371504306793213, mean loss: 0.4186184364888416
Epoch: 2, step: 1432, loss: 0.32786476612091064, mean loss: 0.41859743355656487
Epoch: 2, step: 1433, loss: 0.3734174072742462, mean loss: 0.4185869800567309
Epoch: 2, step: 1434, loss: 0.4046545922756195, mean loss: 0.4185837572050582
Epoch: 2, step: 1435, loss: 0.3837437033653259, mean loss: 0.4185756998383052
Epoch: 2, step: 1436, loss: 0.3207937479019165, mean loss: 0.4185530912945049
Epoch: 2, step: 1437, loss: 0.39415305852890015, mean loss: 0.41854745097255264
Epoch: 2, step: 1438, loss: 0.3457306921482086, mean loss: 0.4185306225096859
Epoch: 2, step: 1439, loss: 0.3316960036754608, mean loss: 0.41851055905801443
Epoch: 2, step: 1440, loss: 0.43081721663475037, mean loss: 0.4185134018987575
Epoch: 2, step: 1441, loss: 0.3931286633014679, mean loss: 0.4185075393725226
Epoch: 2, step: 1442, loss: 0.36914321780204773, mean loss: 0.4184961414686735
Epoch: 2, step: 1443, loss: 0.38974231481552124, mean loss: 0.4184895039278948
Valid: 2, mean loss: 0.24181667466958362
Epoch: 3, step: 0, loss: 0.39977434277534485, mean loss: 0.41848518471230456
Epoch: 3, step: 1, loss: 0.35455453395843506, mean loss: 0.41847043375458565
Epoch: 3, step: 2, loss: 0.4036181569099426, mean loss: 0.41846700762382566
Epoch: 3, step: 3, loss: 0.3774506747722626, mean loss: 0.4184575481374669
Epoch: 3, step: 4, loss: 0.390663206577301, mean loss: 0.4184511394813543
Epoch: 3, step: 5, loss: 0.3770810663700104, mean loss: 0.4184416028116652
Epoch: 3, step: 6, loss: 0.3425777554512024, mean loss: 0.4184241186338914
Epoch: 3, step: 7, loss: 0.3582899868488312, mean loss: 0.4184102628431575
Epoch: 3, step: 8, loss: 0.40059220790863037, mean loss: 0.4184061582463055
Epoch: 3, step: 9, loss: 0.3882419764995575, mean loss: 0.4183992111754288
Epoch: 3, step: 10, loss: 0.3487702012062073, mean loss: 0.418383178707096
Epoch: 3, step: 11, loss: 0.38513490557670593, mean loss: 0.4183755248688984
Epoch: 3, step: 12, loss: 0.4406558573246002, mean loss: 0.41838065267843944
Epoch: 3, step: 13, loss: 0.40516695380210876, mean loss: 0.41837761225071823
Epoch: 3, step: 14, loss: 0.3428831696510315, mean loss: 0.4183602452291862
Epoch: 3, step: 15, loss: 0.3976447284221649, mean loss: 0.4183554808508957
Epoch: 3, step: 16, loss: 0.34199652075767517, mean loss: 0.41833792303068573
Epoch: 3, step: 17, loss: 0.39595460891723633, mean loss: 0.41833277744123437
Epoch: 3, step: 18, loss: 0.4202790856361389, mean loss: 0.41833322476557244
Epoch: 3, step: 19, loss: 0.3817688524723053, mean loss: 0.41832482302561536
Epoch: 3, step: 20, loss: 0.40958449244499207, mean loss: 0.4183228151389669
Epoch: 3, step: 21, loss: 0.3508538603782654, mean loss: 0.41830731928348674
Epoch: 3, step: 22, loss: 0.3466910123825073, mean loss: 0.41829087466651754
Epoch: 3, step: 23, loss: 0.3625316023826599, mean loss: 0.4182780740989593
Epoch: 3, step: 24, loss: 0.36044108867645264, mean loss: 0.41826479960150176
Epoch: 3, step: 25, loss: 0.3708035945892334, mean loss: 0.4182539090083369
Epoch: 3, step: 26, loss: 0.3991449773311615, mean loss: 0.4182495252203862
Epoch: 3, step: 27, loss: 0.3463068902492523, mean loss: 0.41823302461603507
Epoch: 3, step: 28, loss: 0.3616551160812378, mean loss: 0.41822005100710713
Epoch: 3, step: 29, loss: 0.3576759696006775, mean loss: 0.41820617111682595
Epoch: 3, step: 30, loss: 0.3897642195224762, mean loss: 0.418199652218913
Epoch: 3, step: 31, loss: 0.4072369635105133, mean loss: 0.4181971401454234
Epoch: 3, step: 32, loss: 0.39220550656318665, mean loss: 0.41819118559019264
Epoch: 3, step: 33, loss: 0.37393876910209656, mean loss: 0.4181810499015788
Epoch: 3, step: 34, loss: 0.34567779302597046, mean loss: 0.41816444736966313
Epoch: 3, step: 35, loss: 0.3455297648906708, mean loss: 0.4181478185504143
Epoch: 3, step: 36, loss: 0.3620050847530365, mean loss: 0.418134968302349
Epoch: 3, step: 37, loss: 0.3880157470703125, mean loss: 0.41812807603204416
Epoch: 3, step: 38, loss: 0.35833069682121277, mean loss: 0.4181143955517854
Epoch: 3, step: 39, loss: 0.32641273736953735, mean loss: 0.4180934207900786
Epoch: 3, step: 40, loss: 0.35291460156440735, mean loss: 0.4180785159606193
Epoch: 3, step: 41, loss: 0.3391822278499603, mean loss: 0.41806047840046595
Epoch: 3, step: 42, loss: 0.34765228629112244, mean loss: 0.4180443850994124
Epoch: 3, step: 43, loss: 0.3893123269081116, mean loss: 0.4180378192725862
Epoch: 3, step: 44, loss: 0.37171506881713867, mean loss: 0.4180272360533823
Epoch: 3, step: 45, loss: 0.4003989100456238, mean loss: 0.41802320948280036
Epoch: 3, step: 46, loss: 0.38310593366622925, mean loss: 0.41801523568151777
Epoch: 3, step: 47, loss: 0.3801797330379486, mean loss: 0.41800659743890506
Epoch: 3, step: 48, loss: 0.42357128858566284, mean loss: 0.4180078676263387
Epoch: 3, step: 49, loss: 0.41766658425331116, mean loss: 0.41800778974332337
Epoch: 3, step: 50, loss: 0.3633852005004883, mean loss: 0.41799532736841055
Epoch: 3, step: 51, loss: 0.3874662220478058, mean loss: 0.41798836361263486
Epoch: 3, step: 52, loss: 0.3661436140537262, mean loss: 0.4179765404086305
Epoch: 3, step: 53, loss: 0.3464653789997101, mean loss: 0.41796023599426463
Epoch: 3, step: 54, loss: 0.3552798628807068, mean loss: 0.4179459482411045
Epoch: 3, step: 55, loss: 0.3856344223022461, mean loss: 0.417938584629906
Epoch: 3, step: 56, loss: 0.3645663559436798, mean loss: 0.4179264241767991
Epoch: 3, step: 57, loss: 0.34459346532821655, mean loss: 0.41790971963036433
Epoch: 3, step: 58, loss: 0.37122800946235657, mean loss: 0.41789908840509266
Epoch: 3, step: 59, loss: 0.37240469455718994, mean loss: 0.4178887299365481
Epoch: 3, step: 60, loss: 0.36638176441192627, mean loss: 0.4178770051549581
Epoch: 3, step: 61, loss: 0.4199278652667999, mean loss: 0.41787747189599406
Epoch: 3, step: 62, loss: 0.3763849437236786, mean loss: 0.4178680310477182
Epoch: 3, step: 63, loss: 0.4148242771625519, mean loss: 0.41786733865602455
Epoch: 3, step: 64, loss: 0.36744043231010437, mean loss: 0.41785587017607323
Epoch: 3, step: 65, loss: 0.3508477807044983, mean loss: 0.41784063413935846
Epoch: 3, step: 66, loss: 0.3919045031070709, mean loss: 0.41783473822414313
Epoch: 3, step: 67, loss: 0.3448234796524048, mean loss: 0.4178181447562859
Epoch: 3, step: 68, loss: 0.3168448507785797, mean loss: 0.4177952014947595
Epoch: 3, step: 69, loss: 0.3588672876358032, mean loss: 0.41778181487189286
Epoch: 3, step: 70, loss: 0.36631888151168823, mean loss: 0.4177701267198692
Epoch: 3, step: 71, loss: 0.3477185070514679, mean loss: 0.41775422035754667
Epoch: 3, step: 72, loss: 0.36668696999549866, mean loss: 0.41774262733816825
Epoch: 3, step: 73, loss: 0.42303162813186646, mean loss: 0.4177438277468822
Epoch: 3, step: 74, loss: 0.36638447642326355, mean loss: 0.417732173707553
Epoch: 3, step: 75, loss: 0.3445226550102234, mean loss: 0.41771556537754
Epoch: 3, step: 76, loss: 0.3728026747703552, mean loss: 0.4177053787387087
Epoch: 3, step: 77, loss: 0.3643384575843811, mean loss: 0.41769327739604334
Epoch: 3, step: 78, loss: 0.38358354568481445, mean loss: 0.41768554451648965
Epoch: 3, step: 79, loss: 0.3842758536338806, mean loss: 0.4176779720570874
Epoch: 3, step: 80, loss: 0.37735581398010254, mean loss: 0.4176688349263199
Epoch: 3, step: 81, loss: 0.3708841800689697, mean loss: 0.417658235774789
Epoch: 3, step: 82, loss: 0.35567060112953186, mean loss: 0.41764419554044124
Epoch: 3, step: 83, loss: 0.34652695059776306, mean loss: 0.4176280910918582
Epoch: 3, step: 84, loss: 0.3598053455352783, mean loss: 0.4176150001374646
Epoch: 3, step: 85, loss: 0.35947945713996887, mean loss: 0.41760184134547784
Epoch: 3, step: 86, loss: 0.36313894391059875, mean loss: 0.41758951663458516
Epoch: 3, step: 87, loss: 0.3531301021575928, mean loss: 0.41757493305664917
Epoch: 3, step: 88, loss: 0.3768382966518402, mean loss: 0.4175657187077677
Epoch: 3, step: 89, loss: 0.3864319920539856, mean loss: 0.4175586780640197
Epoch: 3, step: 90, loss: 0.34730279445648193, mean loss: 0.4175427938488699
Epoch: 3, step: 91, loss: 0.3675802946090698, mean loss: 0.4175315003363835
Epoch: 3, step: 92, loss: 0.3939206302165985, mean loss: 0.4175261645465259
Epoch: 3, step: 93, loss: 0.3716903030872345, mean loss: 0.41751580850010495
Epoch: 3, step: 94, loss: 0.34869810938835144, mean loss: 0.4175002635036939
Epoch: 3, step: 95, loss: 0.385661780834198, mean loss: 0.4174930732411217
Epoch: 3, step: 96, loss: 0.3493414521217346, mean loss: 0.4174776856545064
Epoch: 3, step: 97, loss: 0.410305380821228, mean loss: 0.41747606662407
Epoch: 3, step: 98, loss: 0.4296906292438507, mean loss: 0.41747882323942087
Epoch: 3, step: 99, loss: 0.42755621671676636, mean loss: 0.4174810970195376
Epoch: 3, step: 100, loss: 0.36908280849456787, mean loss: 0.41747017929146973
Epoch: 3, step: 101, loss: 0.3673238754272461, mean loss: 0.41745886979578545
Epoch: 3, step: 102, loss: 0.37082430720329285, mean loss: 0.41744835467456953
Epoch: 3, step: 103, loss: 0.37817901372909546, mean loss: 0.4174395022532563
Epoch: 3, step: 104, loss: 0.39153844118118286, mean loss: 0.4174336647366748
Epoch: 3, step: 105, loss: 0.3652801215648651, mean loss: 0.41742191314966
Epoch: 3, step: 106, loss: 0.34874022006988525, mean loss: 0.4174064408151072
Epoch: 3, step: 107, loss: 0.3721228837966919, mean loss: 0.4173962418157787
Epoch: 3, step: 108, loss: 0.33440908789634705, mean loss: 0.41737755522403824
Epoch: 3, step: 109, loss: 0.3469211757183075, mean loss: 0.4173616938148744
Epoch: 3, step: 110, loss: 0.34007564187049866, mean loss: 0.41734429879980706
Epoch: 3, step: 111, loss: 0.3533041179180145, mean loss: 0.4173298883180605
Epoch: 3, step: 112, loss: 0.35885128378868103, mean loss: 0.4173167322765466
Epoch: 3, step: 113, loss: 0.3799588084220886, mean loss: 0.41730832968458653
Epoch: 3, step: 114, loss: 0.37620022892951965, mean loss: 0.4172990856772209
Epoch: 3, step: 115, loss: 0.3570997714996338, mean loss: 0.4172855516587457
Epoch: 3, step: 116, loss: 0.35985174775123596, mean loss: 0.4172726422849746
Epoch: 3, step: 117, loss: 0.3341505825519562, mean loss: 0.4172539631704279
Epoch: 3, step: 118, loss: 0.3723869323730469, mean loss: 0.4172438829568136
Epoch: 3, step: 119, loss: 0.35835614800453186, mean loss: 0.4172306557027812
Epoch: 3, step: 120, loss: 0.35998550057411194, mean loss: 0.4172178002895477
Epoch: 3, step: 121, loss: 0.35460343956947327, mean loss: 0.41720374228309953
Epoch: 3, step: 122, loss: 0.34619373083114624, mean loss: 0.4171878028865896
Epoch: 3, step: 123, loss: 0.3841956555843353, mean loss: 0.4171803989038018
Epoch: 3, step: 124, loss: 0.38292089104652405, mean loss: 0.4171727122293891
Epoch: 3, step: 125, loss: 0.32890772819519043, mean loss: 0.41715291299564433
Epoch: 3, step: 126, loss: 0.3923591375350952, mean loss: 0.41714735260644037
Epoch: 3, step: 127, loss: 0.34041473269462585, mean loss: 0.41713014798314174
Epoch: 3, step: 128, loss: 0.38821735978126526, mean loss: 0.41712366674839574
Epoch: 3, step: 129, loss: 0.3687012195587158, mean loss: 0.4171128145639068
Epoch: 3, step: 130, loss: 0.38329899311065674, mean loss: 0.41710523808587563
Epoch: 3, step: 131, loss: 0.40054628252983093, mean loss: 0.4171015286424267
Epoch: 3, step: 132, loss: 0.33420005440711975, mean loss: 0.41708296168291153
Epoch: 3, step: 133, loss: 0.3724459409713745, mean loss: 0.4170729668282963
Epoch: 3, step: 134, loss: 0.38254767656326294, mean loss: 0.41706523786248817
Epoch: 3, step: 135, loss: 0.41513344645500183, mean loss: 0.4170648055009377
Epoch: 3, step: 136, loss: 0.382887601852417, mean loss: 0.4170571578832048
Epoch: 3, step: 137, loss: 0.34238219261169434, mean loss: 0.4170404520744192
Epoch: 3, step: 138, loss: 0.401189923286438, mean loss: 0.41703690688793116
Epoch: 3, step: 139, loss: 0.35450971126556396, mean loss: 0.4170229249568886
Epoch: 3, step: 140, loss: 0.3830622136592865, mean loss: 0.41701533257788176
Epoch: 3, step: 141, loss: 0.43052324652671814, mean loss: 0.4170183517808207
Epoch: 3, step: 142, loss: 0.35487210750579834, mean loss: 0.41700446435193245
Epoch: 3, step: 143, loss: 0.40042227506637573, mean loss: 0.41700075966263717
Epoch: 3, step: 144, loss: 0.40621140599250793, mean loss: 0.41699834971095745
Epoch: 3, step: 145, loss: 0.36457741260528564, mean loss: 0.4169866433828856
Epoch: 3, step: 146, loss: 0.34045282006263733, mean loss: 0.41696955612606035
Epoch: 3, step: 147, loss: 0.3097701370716095, mean loss: 0.4169456276843071
Epoch: 3, step: 148, loss: 0.38454779982566833, mean loss: 0.41693839764015206
Epoch: 3, step: 149, loss: 0.3928561806678772, mean loss: 0.41693302454399583
Epoch: 3, step: 150, loss: 0.34195998311042786, mean loss: 0.4169163006891144
Epoch: 3, step: 151, loss: 0.3428841531276703, mean loss: 0.41689979039750835
Epoch: 3, step: 152, loss: 0.42583057284355164, mean loss: 0.4169017816533492
Epoch: 3, step: 153, loss: 0.39380499720573425, mean loss: 0.41689663301660207
Epoch: 3, step: 154, loss: 0.3604241609573364, mean loss: 0.416884047219397
Epoch: 3, step: 155, loss: 0.37187710404396057, mean loss: 0.4168740189343757
Epoch: 3, step: 156, loss: 0.36250394582748413, mean loss: 0.4168619070891748
Epoch: 3, step: 157, loss: 0.40752092003822327, mean loss: 0.4168598266911679
Epoch: 3, step: 158, loss: 0.3968394100666046, mean loss: 0.4168553687939012
Epoch: 3, step: 159, loss: 0.3359638750553131, mean loss: 0.41683736089235657
Epoch: 3, step: 160, loss: 0.37470921874046326, mean loss: 0.41682798449748637
Epoch: 3, step: 161, loss: 0.3761892020702362, mean loss: 0.41681894159975
Epoch: 3, step: 162, loss: 0.3678579032421112, mean loss: 0.4168080492664113
Epoch: 3, step: 163, loss: 0.4089767038822174, mean loss: 0.41680630741912833
Epoch: 3, step: 164, loss: 0.3833562135696411, mean loss: 0.4167988691060642
Epoch: 3, step: 165, loss: 0.33586278557777405, mean loss: 0.416780875312483
Epoch: 3, step: 166, loss: 0.3999425172805786, mean loss: 0.41677713262343385
Epoch: 3, step: 167, loss: 0.35806748270988464, mean loss: 0.41676408603456416
Epoch: 3, step: 168, loss: 0.4131224751472473, mean loss: 0.416763276967493
Epoch: 3, step: 169, loss: 0.35277819633483887, mean loss: 0.41674906437739245
Epoch: 3, step: 170, loss: 0.3346753716468811, mean loss: 0.41673083792997284
Epoch: 3, step: 171, loss: 0.3527047336101532, mean loss: 0.4167166225426905
Epoch: 3, step: 172, loss: 0.3699779808521271, mean loss: 0.41670624770546727
Epoch: 3, step: 173, loss: 0.3481753468513489, mean loss: 0.4166910388948028
Epoch: 3, step: 174, loss: 0.3638870120048523, mean loss: 0.41667932289149906
Epoch: 3, step: 175, loss: 0.3450266122817993, mean loss: 0.41666342832392816
Epoch: 3, step: 176, loss: 0.3919994831085205, mean loss: 0.4166579583870873
Epoch: 3, step: 177, loss: 0.39515969157218933, mean loss: 0.4166531915873501
Epoch: 3, step: 178, loss: 0.36970338225364685, mean loss: 0.41664278373779706
Epoch: 3, step: 179, loss: 0.36718448996543884, mean loss: 0.41663182223651773
Epoch: 3, step: 180, loss: 0.364297091960907, mean loss: 0.416620225797281
Epoch: 3, step: 181, loss: 0.358751118183136, mean loss: 0.41660740587977674
Epoch: 3, step: 182, loss: 0.3837796151638031, mean loss: 0.4166001350512682
Epoch: 3, step: 183, loss: 0.33160120248794556, mean loss: 0.41658131332129406
Epoch: 3, step: 184, loss: 0.35511624813079834, mean loss: 0.4165677058240192
Epoch: 3, step: 185, loss: 0.3351669907569885, mean loss: 0.416549688844146
Epoch: 3, step: 186, loss: 0.3444191515445709, mean loss: 0.41653372722934195
Epoch: 3, step: 187, loss: 0.3688240945339203, mean loss: 0.4165231720008695
Epoch: 3, step: 188, loss: 0.38442787528038025, mean loss: 0.41651607284211695
Epoch: 3, step: 189, loss: 0.3772611618041992, mean loss: 0.4165073919683801
Epoch: 3, step: 190, loss: 0.39329540729522705, mean loss: 0.41650225997972806
Epoch: 3, step: 191, loss: 0.42881372570991516, mean loss: 0.41650498134704245
Epoch: 3, step: 192, loss: 0.36581316590309143, mean loss: 0.4164937787358946
Epoch: 3, step: 193, loss: 0.3506013751029968, mean loss: 0.4164792200961171
Epoch: 3, step: 194, loss: 0.40966424345970154, mean loss: 0.41647771468930544
Epoch: 3, step: 195, loss: 0.37744903564453125, mean loss: 0.4164690952813892
Epoch: 3, step: 196, loss: 0.3448044955730438, mean loss: 0.4164532717884088
Epoch: 3, step: 197, loss: 0.40761280059814453, mean loss: 0.4164513202495147
Epoch: 3, step: 198, loss: 0.37160608172416687, mean loss: 0.4164414228232235
Epoch: 3, step: 199, loss: 0.35687124729156494, mean loss: 0.4164282784773427
Epoch: 3, step: 200, loss: 0.3382187783718109, mean loss: 0.41641102511310146
Epoch: 3, step: 201, loss: 0.4097234606742859, mean loss: 0.4164095501319725
Epoch: 3, step: 202, loss: 0.3663756847381592, mean loss: 0.41639851730608635
Epoch: 3, step: 203, loss: 0.35228949785232544, mean loss: 0.41638438392437255
Epoch: 3, step: 204, loss: 0.34490302205085754, mean loss: 0.4163686287200804
Epoch: 3, step: 205, loss: 0.3405270278453827, mean loss: 0.4163519161592883
Epoch: 3, step: 206, loss: 0.3609423041343689, mean loss: 0.4163397087100649
Epoch: 3, step: 207, loss: 0.37918397784233093, mean loss: 0.41633152462837597
Epoch: 3, step: 208, loss: 0.408132404088974, mean loss: 0.41632971905239285
Epoch: 3, step: 209, loss: 0.4233892858028412, mean loss: 0.41633127333833525
Epoch: 3, step: 210, loss: 0.36202937364578247, mean loss: 0.41631932046585174
Epoch: 3, step: 211, loss: 0.32844677567481995, mean loss: 0.4162999823177903
Epoch: 3, step: 212, loss: 0.39696893095970154, mean loss: 0.41629572906116585
Epoch: 3, step: 213, loss: 0.36419546604156494, mean loss: 0.41628426837858346
Epoch: 3, step: 214, loss: 0.3483923375606537, mean loss: 0.4162693372303939
Epoch: 3, step: 215, loss: 0.359254390001297, mean loss: 0.4162568009623136
Epoch: 3, step: 216, loss: 0.32631340622901917, mean loss: 0.41623702883772945
Epoch: 3, step: 217, loss: 0.3694380223751068, mean loss: 0.4162267433418036
Epoch: 3, step: 218, loss: 0.36431610584259033, mean loss: 0.41621533691739154
Epoch: 3, step: 219, loss: 0.3715200126171112, mean loss: 0.4162055180851639
Epoch: 3, step: 220, loss: 0.38989657163619995, mean loss: 0.41619973970904944
Epoch: 3, step: 221, loss: 0.38197582960128784, mean loss: 0.41619222457727345
Epoch: 3, step: 222, loss: 0.3590194284915924, mean loss: 0.4161796729206136
Epoch: 3, step: 223, loss: 0.3765999376773834, mean loss: 0.41617098553359794
Epoch: 3, step: 224, loss: 0.39204442501068115, mean loss: 0.4161656911380476
Epoch: 3, step: 225, loss: 0.33408719301223755, mean loss: 0.4161476835693495
Epoch: 3, step: 226, loss: 0.43728941679000854, mean loss: 0.4161523209313194
Epoch: 3, step: 227, loss: 0.3978605568408966, mean loss: 0.4161483095795452
Epoch: 3, step: 228, loss: 0.417883962392807, mean loss: 0.4161486901217099
Epoch: 3, step: 229, loss: 0.4102689325809479, mean loss: 0.416147401266484
Epoch: 3, step: 230, loss: 0.3647580146789551, mean loss: 0.4161361390734996
Epoch: 3, step: 231, loss: 0.40762704610824585, mean loss: 0.41613427467977365
Epoch: 3, step: 232, loss: 0.352908194065094, mean loss: 0.41612042449782083
Epoch: 3, step: 233, loss: 0.3637980818748474, mean loss: 0.4161089653776669
Epoch: 3, step: 234, loss: 0.3361659049987793, mean loss: 0.41609146087572274
Epoch: 3, step: 235, loss: 0.37459659576416016, mean loss: 0.4160823770611186
Epoch: 3, step: 236, loss: 0.3871406018733978, mean loss: 0.41607604268265774
Epoch: 3, step: 237, loss: 0.45885908603668213, mean loss: 0.41608540439892777
Epoch: 3, step: 238, loss: 0.3356303870677948, mean loss: 0.41606780321377546
Epoch: 3, step: 239, loss: 0.37154218554496765, mean loss: 0.41605806445225557
Epoch: 3, step: 240, loss: 0.3726469576358795, mean loss: 0.4160485715358295
Epoch: 3, step: 241, loss: 0.35183951258659363, mean loss: 0.4160345337004668
Epoch: 3, step: 242, loss: 0.38360923528671265, mean loss: 0.41602744620354576
Epoch: 3, step: 243, loss: 0.3673172891139984, mean loss: 0.4160168015013846
Epoch: 3, step: 244, loss: 0.37844955921173096, mean loss: 0.4160085936704277
Epoch: 3, step: 245, loss: 0.34954139590263367, mean loss: 0.41599407484173223
Epoch: 3, step: 246, loss: 0.3636762201786041, mean loss: 0.41598264923468636
Epoch: 3, step: 247, loss: 0.361192524433136, mean loss: 0.41597068632534107
Epoch: 3, step: 248, loss: 0.36652839183807373, mean loss: 0.4159598934210653
Epoch: 3, step: 249, loss: 0.3454798758029938, mean loss: 0.4159445114879317
Epoch: 3, step: 250, loss: 0.39765071868896484, mean loss: 0.41594051982465463
Epoch: 3, step: 251, loss: 0.32749202847480774, mean loss: 0.41592122477854865
Epoch: 3, step: 252, loss: 0.320314884185791, mean loss: 0.41590037279586756
Epoch: 3, step: 253, loss: 0.3698524236679077, mean loss: 0.4158903318126299
Epoch: 3, step: 254, loss: 0.3820273280143738, mean loss: 0.41588294942680076
Epoch: 3, step: 255, loss: 0.34451472759246826, mean loss: 0.41586739401663636
Epoch: 3, step: 256, loss: 0.39686816930770874, mean loss: 0.4158632538499968
Epoch: 3, step: 257, loss: 0.4187832474708557, mean loss: 0.41586389001418433
Epoch: 3, step: 258, loss: 0.4003492295742035, mean loss: 0.41586051065011553
Epoch: 3, step: 259, loss: 0.3654923737049103, mean loss: 0.415849541979178
Epoch: 3, step: 260, loss: 0.32542744278907776, mean loss: 0.41582985504271164
Epoch: 3, step: 261, loss: 0.35665959119796753, mean loss: 0.41581697514200533
Epoch: 3, step: 262, loss: 0.42448610067367554, mean loss: 0.4158188617852113
Epoch: 3, step: 263, loss: 0.3590452969074249, mean loss: 0.41580650896430665
Epoch: 3, step: 264, loss: 0.4147757589817047, mean loss: 0.41580628474199155
Epoch: 3, step: 265, loss: 0.3876206576824188, mean loss: 0.4158001547665545
Epoch: 3, step: 266, loss: 0.3559558689594269, mean loss: 0.4157871423104103
Epoch: 3, step: 267, loss: 0.3544604778289795, mean loss: 0.4157738104268274
Epoch: 3, step: 268, loss: 0.37282419204711914, mean loss: 0.4157644755825805
Epoch: 3, step: 269, loss: 0.4071526527404785, mean loss: 0.4157626042607982
Epoch: 3, step: 270, loss: 0.34320226311683655, mean loss: 0.41574684055427114
Epoch: 3, step: 271, loss: 0.3168083727359772, mean loss: 0.41572535087837664
Epoch: 3, step: 272, loss: 0.37100791931152344, mean loss: 0.41571564025262925
Epoch: 3, step: 273, loss: 0.3814498484134674, mean loss: 0.4157082008709881
Epoch: 3, step: 274, loss: 0.3327224552631378, mean loss: 0.415690187902547
Epoch: 3, step: 275, loss: 0.35919782519340515, mean loss: 0.415677928275223
Epoch: 3, step: 276, loss: 0.3757534623146057, mean loss: 0.41566926599143894
Epoch: 3, step: 277, loss: 0.34239357709884644, mean loss: 0.4156533710480783
Epoch: 3, step: 278, loss: 0.3630610406398773, mean loss: 0.4156419652076081
Epoch: 3, step: 279, loss: 0.3758706748485565, mean loss: 0.4156333417708433
Epoch: 3, step: 280, loss: 0.3627927899360657, mean loss: 0.41562188706634845
Epoch: 3, step: 281, loss: 0.3677842319011688, mean loss: 0.41561151913068195
Epoch: 3, step: 282, loss: 0.3781965970993042, mean loss: 0.4156034118886383
Epoch: 3, step: 283, loss: 0.32656779885292053, mean loss: 0.41558412341094425
Epoch: 3, step: 284, loss: 0.3281717598438263, mean loss: 0.41556519069195635
Epoch: 3, step: 285, loss: 0.37579798698425293, mean loss: 0.41555657934425005
Epoch: 3, step: 286, loss: 0.36094456911087036, mean loss: 0.41554475600364965
Epoch: 3, step: 287, loss: 0.3622882068157196, mean loss: 0.41553322861205055
Epoch: 3, step: 288, loss: 0.3263813555240631, mean loss: 0.41551393584574714
Epoch: 3, step: 289, loss: 0.371470183134079, mean loss: 0.4155044066911146
Epoch: 3, step: 290, loss: 0.3712845742702484, mean loss: 0.4154948415099723
Epoch: 3, step: 291, loss: 0.36012476682662964, mean loss: 0.4154828670128522
Epoch: 3, step: 292, loss: 0.387320876121521, mean loss: 0.41547677793374055
Epoch: 3, step: 293, loss: 0.3116428256034851, mean loss: 0.415454332202584
Epoch: 3, step: 294, loss: 0.35756370425224304, mean loss: 0.41544182072042485
Epoch: 3, step: 295, loss: 0.3877881169319153, mean loss: 0.41543584541709977
Epoch: 3, step: 296, loss: 0.40267136693000793, mean loss: 0.4154330879147262
Epoch: 3, step: 297, loss: 0.33244815468788147, mean loss: 0.41541516460301414
Epoch: 3, step: 298, loss: 0.33531659841537476, mean loss: 0.41539786843238413
Epoch: 3, step: 299, loss: 0.3570861220359802, mean loss: 0.41538527954067506
Epoch: 3, step: 300, loss: 0.3753405213356018, mean loss: 0.41537663616528003
Epoch: 3, step: 301, loss: 0.4038853943347931, mean loss: 0.415374156397945
Epoch: 3, step: 302, loss: 0.37938717007637024, mean loss: 0.4153663922153514
Epoch: 3, step: 303, loss: 0.3892439901828766, mean loss: 0.41536075752983964
Epoch: 3, step: 304, loss: 0.37814438343048096, mean loss: 0.4153527315703617
Epoch: 3, step: 305, loss: 0.37317660450935364, mean loss: 0.4153436379681493
Epoch: 3, step: 306, loss: 0.40074583888053894, mean loss: 0.41534049121257965
Epoch: 3, step: 307, loss: 0.37122026085853577, mean loss: 0.4153309825422447
Epoch: 3, step: 308, loss: 0.34445109963417053, mean loss: 0.4153157099969079
Epoch: 3, step: 309, loss: 0.3379451036453247, mean loss: 0.41529904248153704
Epoch: 3, step: 310, loss: 0.37696075439453125, mean loss: 0.4152907852581713
Epoch: 3, step: 311, loss: 0.40153923630714417, mean loss: 0.4152878241149863
Epoch: 3, step: 312, loss: 0.3537997603416443, mean loss: 0.41527458664162287
Epoch: 3, step: 313, loss: 0.3873279392719269, mean loss: 0.4152685714355597
Epoch: 3, step: 314, loss: 0.33645495772361755, mean loss: 0.41525161132931654
Epoch: 3, step: 315, loss: 0.32475724816322327, mean loss: 0.4152321418019572
Epoch: 3, step: 316, loss: 0.33879753947257996, mean loss: 0.4152157007173521
Epoch: 3, step: 317, loss: 0.3767315447330475, mean loss: 0.41520742455477483
Epoch: 3, step: 318, loss: 0.3801085650920868, mean loss: 0.41519987803586217
Epoch: 3, step: 319, loss: 0.3537388741970062, mean loss: 0.4151866662981496
Epoch: 3, step: 320, loss: 0.3735430836677551, mean loss: 0.41517771646306895
Epoch: 3, step: 321, loss: 0.3663868308067322, mean loss: 0.41516723281767653
Epoch: 3, step: 322, loss: 0.356107622385025, mean loss: 0.41515454546849656
Epoch: 3, step: 323, loss: 0.37804269790649414, mean loss: 0.4151465747108587
Epoch: 3, step: 324, loss: 0.3799859285354614, mean loss: 0.4151390246472608
Epoch: 3, step: 325, loss: 0.34951671957969666, mean loss: 0.41512493656115784
Epoch: 3, step: 326, loss: 0.3723936975002289, mean loss: 0.41511576479917867
Epoch: 3, step: 327, loss: 0.38355058431625366, mean loss: 0.4151089911552982
Epoch: 3, step: 328, loss: 0.3522450923919678, mean loss: 0.4150955039425191
Epoch: 3, step: 329, loss: 0.4101729989051819, mean loss: 0.4150944480641327
Epoch: 3, step: 330, loss: 0.34885191917419434, mean loss: 0.41508024207466454
Epoch: 3, step: 331, loss: 0.367984414100647, mean loss: 0.41507014434139394
Epoch: 3, step: 332, loss: 0.3825957179069519, mean loss: 0.41506318304955375
Epoch: 3, step: 333, loss: 0.3958730399608612, mean loss: 0.4150590702884975
Epoch: 3, step: 334, loss: 0.4105675220489502, mean loss: 0.415058107882618
Epoch: 3, step: 335, loss: 0.3745698034763336, mean loss: 0.4150494342955558
Epoch: 3, step: 336, loss: 0.33037328720092773, mean loss: 0.415031298474803
Epoch: 3, step: 337, loss: 0.35148680210113525, mean loss: 0.4150176915162648
Epoch: 3, step: 338, loss: 0.3368576765060425, mean loss: 0.41500095847943963
Epoch: 3, step: 339, loss: 0.3449741303920746, mean loss: 0.4149859698604141
Epoch: 3, step: 340, loss: 0.3972514867782593, mean loss: 0.4149821747645266
Epoch: 3, step: 341, loss: 0.37318453192710876, mean loss: 0.41497323217940946
Epoch: 3, step: 342, loss: 0.36461809277534485, mean loss: 0.41496246102659573
Epoch: 3, step: 343, loss: 0.3555556535720825, mean loss: 0.4149497564056688
Epoch: 3, step: 344, loss: 0.3518812358379364, mean loss: 0.4149362715819425
Epoch: 3, step: 345, loss: 0.34867793321609497, mean loss: 0.41492210776442096
Epoch: 3, step: 346, loss: 0.41041064262390137, mean loss: 0.41492114357011867
Epoch: 3, step: 347, loss: 0.4048061966896057, mean loss: 0.41491898225668267
Epoch: 3, step: 348, loss: 0.3380855321884155, mean loss: 0.4149025683600648
Epoch: 3, step: 349, loss: 0.3552899956703186, mean loss: 0.4148898360720063
Epoch: 3, step: 350, loss: 0.35970714688301086, mean loss: 0.41487805245270476
Epoch: 3, step: 351, loss: 0.37581005692481995, mean loss: 0.41486971171924447
Epoch: 3, step: 352, loss: 0.3463789224624634, mean loss: 0.41485509255398156
Epoch: 3, step: 353, loss: 0.34684547781944275, mean loss: 0.41484057919189565
Epoch: 3, step: 354, loss: 0.3450503647327423, mean loss: 0.4148256890245265
Epoch: 3, step: 355, loss: 0.343029648065567, mean loss: 0.4148103741693731
Epoch: 3, step: 356, loss: 0.35418379306793213, mean loss: 0.41479744463618873
Epoch: 3, step: 357, loss: 0.4247695803642273, mean loss: 0.4147995708911414
Epoch: 3, step: 358, loss: 0.39487209916114807, mean loss: 0.4147953228690288
Epoch: 3, step: 359, loss: 0.3815017342567444, mean loss: 0.414788227048779
Epoch: 3, step: 360, loss: 0.3470848500728607, mean loss: 0.41477380058873725
Epoch: 3, step: 361, loss: 0.36001861095428467, mean loss: 0.4147621356569873
Epoch: 3, step: 362, loss: 0.36623725295066833, mean loss: 0.41475180021871116
Epoch: 3, step: 363, loss: 0.32592809200286865, mean loss: 0.4147328854597214
Epoch: 3, step: 364, loss: 0.3509974777698517, mean loss: 0.4147193160733706
Epoch: 3, step: 365, loss: 0.40088900923728943, mean loss: 0.4147163722021837
Epoch: 3, step: 366, loss: 0.34778061509132385, mean loss: 0.41470212752095137
Epoch: 3, step: 367, loss: 0.3938151001930237, mean loss: 0.41469768347258373
Epoch: 3, step: 368, loss: 0.36921384930610657, mean loss: 0.4146880081196447
Epoch: 3, step: 369, loss: 0.36008381843566895, mean loss: 0.41467639514863575
Epoch: 3, step: 370, loss: 0.3469049036502838, mean loss: 0.41466198488040307
Epoch: 3, step: 371, loss: 0.3705134987831116, mean loss: 0.41465259957298445
Epoch: 3, step: 372, loss: 0.3344217538833618, mean loss: 0.4146355473209781
Epoch: 3, step: 373, loss: 0.34074223041534424, mean loss: 0.4146198453836841
Epoch: 3, step: 374, loss: 0.3744807243347168, mean loss: 0.4146113178457515
Epoch: 3, step: 375, loss: 0.32450783252716064, mean loss: 0.4145921794673916
Epoch: 3, step: 376, loss: 0.3652361333370209, mean loss: 0.41458169825139446
Epoch: 3, step: 377, loss: 0.3456982374191284, mean loss: 0.41456707331278886
Epoch: 3, step: 378, loss: 0.37177774310112, mean loss: 0.41455799045772374
Epoch: 3, step: 379, loss: 0.36308473348617554, mean loss: 0.4145470665916432
Epoch: 3, step: 380, loss: 0.3449009954929352, mean loss: 0.4145322891524116
Epoch: 3, step: 381, loss: 0.38434702157974243, mean loss: 0.41452588582878563
Epoch: 3, step: 382, loss: 0.37833401560783386, mean loss: 0.41451820992842064
Epoch: 3, step: 383, loss: 0.4045542776584625, mean loss: 0.41451609713531845
Epoch: 3, step: 384, loss: 0.3707776963710785, mean loss: 0.41450682463144645
Epoch: 3, step: 385, loss: 0.31915003061294556, mean loss: 0.41448661335674986
Epoch: 3, step: 386, loss: 0.35833850502967834, mean loss: 0.4144747150502597
Epoch: 3, step: 387, loss: 0.3673311769962311, mean loss: 0.4144647270125364
Epoch: 3, step: 388, loss: 0.348106324672699, mean loss: 0.4144506710069571
Epoch: 3, step: 389, loss: 0.36070117354393005, mean loss: 0.41443928822477516
Epoch: 3, step: 390, loss: 0.3709781765937805, mean loss: 0.4144300862108791
Epoch: 3, step: 391, loss: 0.3794388771057129, mean loss: 0.4144226790963353
Epoch: 3, step: 392, loss: 0.33868280053138733, mean loss: 0.4144066494924062
Epoch: 3, step: 393, loss: 0.3784463405609131, mean loss: 0.4143990404553915
Epoch: 3, step: 394, loss: 0.3898180425167084, mean loss: 0.41439384032889715
Epoch: 3, step: 395, loss: 0.3431119918823242, mean loss: 0.4143787637958078
Epoch: 3, step: 396, loss: 0.38036519289016724, mean loss: 0.41437157124539425
Epoch: 3, step: 397, loss: 0.3225098252296448, mean loss: 0.41435215015744165
Epoch: 3, step: 398, loss: 0.35701099038124084, mean loss: 0.4143400298531136
Epoch: 3, step: 399, loss: 0.3544003963470459, mean loss: 0.4143273629821275
Epoch: 3, step: 400, loss: 0.3753756880760193, mean loss: 0.4143191331754708
Epoch: 3, step: 401, loss: 0.32336461544036865, mean loss: 0.41429992013834893
Epoch: 3, step: 402, loss: 0.3810764253139496, mean loss: 0.4142929035607725
Epoch: 3, step: 403, loss: 0.4139346480369568, mean loss: 0.41429282791560273
Epoch: 3, step: 404, loss: 0.36131924390792847, mean loss: 0.41428164497618797
Epoch: 3, step: 405, loss: 0.3575510084629059, mean loss: 0.41426967143534515
Epoch: 3, step: 406, loss: 0.37216541171073914, mean loss: 0.4142607868057346
Epoch: 3, step: 407, loss: 0.35898780822753906, mean loss: 0.4142491258397898
Epoch: 3, step: 408, loss: 0.3410223722457886, mean loss: 0.4142336804161252
Epoch: 3, step: 409, loss: 0.3549545407295227, mean loss: 0.4142211795431419
Epoch: 3, step: 410, loss: 0.4030318558216095, mean loss: 0.4142188204194393
Epoch: 3, step: 411, loss: 0.3452255427837372, mean loss: 0.41420427714843683
Epoch: 3, step: 412, loss: 0.3653024733066559, mean loss: 0.41419397118345436
Epoch: 3, step: 413, loss: 0.38951733708381653, mean loss: 0.4141887717240992
Epoch: 3, step: 414, loss: 0.4195769727230072, mean loss: 0.4141899067990937
Epoch: 3, step: 415, loss: 0.37437471747398376, mean loss: 0.4141815211231617
Epoch: 3, step: 416, loss: 0.44081589579582214, mean loss: 0.41418712954065434
Epoch: 3, step: 417, loss: 0.3638477027416229, mean loss: 0.41417653176659136
Epoch: 3, step: 418, loss: 0.4441852867603302, mean loss: 0.41418284806947364
Epoch: 3, step: 419, loss: 0.3602498471736908, mean loss: 0.4141714985322481
Epoch: 3, step: 420, loss: 0.34688645601272583, mean loss: 0.41415734220097955
Epoch: 3, step: 421, loss: 0.30858761072158813, mean loss: 0.4141351356945682
Epoch: 3, step: 422, loss: 0.3533592224121094, mean loss: 0.4141223542196403
Epoch: 3, step: 423, loss: 0.40600255131721497, mean loss: 0.41412064694400896
Epoch: 3, step: 424, loss: 0.37333643436431885, mean loss: 0.4141120734286464
Epoch: 3, step: 425, loss: 0.3809661567211151, mean loss: 0.41410510707372683
Epoch: 3, step: 426, loss: 0.3606553077697754, mean loss: 0.4140938757647745
Epoch: 3, step: 427, loss: 0.34387364983558655, mean loss: 0.4140791236164701
Epoch: 3, step: 428, loss: 0.3554474115371704, mean loss: 0.41406680861708356
Epoch: 3, step: 429, loss: 0.37093091011047363, mean loss: 0.4140577502595643
Epoch: 3, step: 430, loss: 0.3366146683692932, mean loss: 0.4140414909520081
Epoch: 3, step: 431, loss: 0.35722842812538147, mean loss: 0.41402956545603276
Epoch: 3, step: 432, loss: 0.34331291913986206, mean loss: 0.41401472460685834
Epoch: 3, step: 433, loss: 0.3234306871891022, mean loss: 0.4139957183044207
Epoch: 3, step: 434, loss: 0.3734300434589386, mean loss: 0.4139872086180676
Epoch: 3, step: 435, loss: 0.39114683866500854, mean loss: 0.41398241827202037
Epoch: 3, step: 436, loss: 0.34071382880210876, mean loss: 0.4139670547598648
Epoch: 3, step: 437, loss: 0.40060341358184814, mean loss: 0.41396425315794066
Epoch: 3, step: 438, loss: 0.3353384733200073, mean loss: 0.4139477732208545
Epoch: 3, step: 439, loss: 0.38684558868408203, mean loss: 0.41394209380246877
Epoch: 3, step: 440, loss: 0.3774977922439575, mean loss: 0.4139344582898858
Epoch: 3, step: 441, loss: 0.3746611475944519, mean loss: 0.4139262317899496
Epoch: 3, step: 442, loss: 0.3902476131916046, mean loss: 0.4139212729169447
Epoch: 3, step: 443, loss: 0.36419421434402466, mean loss: 0.4139108610537594
Epoch: 3, step: 444, loss: 0.35470664501190186, mean loss: 0.4138984674560952
Epoch: 3, step: 445, loss: 0.4131626486778259, mean loss: 0.4138983134546766
Epoch: 3, step: 446, loss: 0.3589366376399994, mean loss: 0.41388681279014117
Epoch: 3, step: 447, loss: 0.3854461908340454, mean loss: 0.41388086286922987
Epoch: 3, step: 448, loss: 0.3483532965183258, mean loss: 0.41386715704066873
Epoch: 3, step: 449, loss: 0.35754355788230896, mean loss: 0.41385537878906725
Epoch: 3, step: 450, loss: 0.3862917423248291, mean loss: 0.4138496159547657
Epoch: 3, step: 451, loss: 0.37911662459373474, mean loss: 0.4138423557140966
Epoch: 3, step: 452, loss: 0.37843337655067444, mean loss: 0.4138349557184512
Epoch: 3, step: 453, loss: 0.3576027750968933, mean loss: 0.41382320641201126
Epoch: 3, step: 454, loss: 0.38791871070861816, mean loss: 0.413817794986128
Epoch: 3, step: 455, loss: 0.4005057215690613, mean loss: 0.41381501468675097
Epoch: 3, step: 456, loss: 0.3698037266731262, mean loss: 0.41380582460781723
Epoch: 3, step: 457, loss: 0.37760263681411743, mean loss: 0.4137982665310336
Epoch: 3, step: 458, loss: 0.36449167132377625, mean loss: 0.4137879750271289
Epoch: 3, step: 459, loss: 0.3441569209098816, mean loss: 0.41377344433970875
Epoch: 3, step: 460, loss: 0.4212905764579773, mean loss: 0.41377501269608646
Epoch: 3, step: 461, loss: 0.3445068299770355, mean loss: 0.41376056376352094
Epoch: 3, step: 462, loss: 0.38624662160873413, mean loss: 0.4137548257151049
Epoch: 3, step: 463, loss: 0.33785051107406616, mean loss: 0.41373899912739825
Epoch: 3, step: 464, loss: 0.34448447823524475, mean loss: 0.41372456207905717
Epoch: 3, step: 465, loss: 0.37216493487358093, mean loss: 0.413715900214279
Epoch: 3, step: 466, loss: 0.36321255564689636, mean loss: 0.4137053764917186
Epoch: 3, step: 467, loss: 0.3343352675437927, mean loss: 0.4136888410523545
Epoch: 3, step: 468, loss: 0.3879322409629822, mean loss: 0.41368347621167767
Epoch: 3, step: 469, loss: 0.3320521414279938, mean loss: 0.4136664767666998
Epoch: 3, step: 470, loss: 0.4112453758716583, mean loss: 0.41366597268573063
Epoch: 3, step: 471, loss: 0.3629322052001953, mean loss: 0.4136554119514497
Epoch: 3, step: 472, loss: 0.3743327856063843, mean loss: 0.41364722826230405
Epoch: 3, step: 473, loss: 0.3611049950122833, mean loss: 0.41363629562950127
Epoch: 3, step: 474, loss: 0.34921202063560486, mean loss: 0.4136228934503888
Epoch: 3, step: 475, loss: 0.37553074955940247, mean loss: 0.4136149707915096
Epoch: 3, step: 476, loss: 0.3292634189128876, mean loss: 0.41359743043969455
Epoch: 3, step: 477, loss: 0.35395970940589905, mean loss: 0.4135850317450929
Epoch: 3, step: 478, loss: 0.3665790557861328, mean loss: 0.41357526122421184
Epoch: 3, step: 479, loss: 0.3300216794013977, mean loss: 0.4135578976369669
Epoch: 3, step: 480, loss: 0.3470429480075836, mean loss: 0.41354407778456104
Epoch: 3, step: 481, loss: 0.3778931498527527, mean loss: 0.41353667210779915
Epoch: 3, step: 482, loss: 0.3841937184333801, mean loss: 0.41353057803642335
Epoch: 3, step: 483, loss: 0.3842546343803406, mean loss: 0.4135244991444682
Epoch: 3, step: 484, loss: 0.3472673296928406, mean loss: 0.4135107442826348
Epoch: 3, step: 485, loss: 0.36791202425956726, mean loss: 0.41350128004020575
Epoch: 3, step: 486, loss: 0.3607785105705261, mean loss: 0.4134903394364561
Epoch: 3, step: 487, loss: 0.3466007113456726, mean loss: 0.41347646192025467
Epoch: 3, step: 488, loss: 0.38792604207992554, mean loss: 0.41347116210282253
Epoch: 3, step: 489, loss: 0.40732496976852417, mean loss: 0.4134698874880705
Epoch: 3, step: 490, loss: 0.3297387659549713, mean loss: 0.4134525266915677
Epoch: 3, step: 491, loss: 0.3724958300590515, mean loss: 0.4134440364974067
Epoch: 3, step: 492, loss: 0.374636173248291, mean loss: 0.41343599341694054
Epoch: 3, step: 493, loss: 0.42268598079681396, mean loss: 0.41343791011552733
Epoch: 3, step: 494, loss: 0.35553187131881714, mean loss: 0.4134259138365141
Epoch: 3, step: 495, loss: 0.37709662318229675, mean loss: 0.413418389128425
Epoch: 3, step: 496, loss: 0.3858574628829956, mean loss: 0.4134126817508633
Epoch: 3, step: 497, loss: 0.3814389705657959, mean loss: 0.413406061934883
Epoch: 3, step: 498, loss: 0.3418169617652893, mean loss: 0.41339124324306564
Epoch: 3, step: 499, loss: 0.37901541590690613, mean loss: 0.41338412904038846
Epoch: 3, step: 500, loss: 0.35838308930397034, mean loss: 0.4133727487300768
Epoch: 3, step: 501, loss: 0.3669404685497284, mean loss: 0.41336314337629515
Epoch: 3, step: 502, loss: 0.41708314418792725, mean loss: 0.41336391276632856
Epoch: 3, step: 503, loss: 0.35736581683158875, mean loss: 0.4133523333420244
Epoch: 3, step: 504, loss: 0.3712210953235626, mean loss: 0.41334362314189654
Epoch: 3, step: 505, loss: 0.32745161652565, mean loss: 0.4133258695233318
Epoch: 3, step: 506, loss: 0.331630676984787, mean loss: 0.41330898686316675
Epoch: 3, step: 507, loss: 0.3619668781757355, mean loss: 0.413298378989471
Epoch: 3, step: 508, loss: 0.35625430941581726, mean loss: 0.41328659545929675
Epoch: 3, step: 509, loss: 0.3237248957157135, mean loss: 0.413268098619201
Epoch: 3, step: 510, loss: 0.35944223403930664, mean loss: 0.41325698446174075
Epoch: 3, step: 511, loss: 0.33755698800086975, mean loss: 0.4132413568819594
Epoch: 3, step: 512, loss: 0.3413116931915283, mean loss: 0.413226510718143
Epoch: 3, step: 513, loss: 0.42530739307403564, mean loss: 0.4132290036777707
Epoch: 3, step: 514, loss: 0.38115236163139343, mean loss: 0.41322238584363696
Epoch: 3, step: 515, loss: 0.31793320178985596, mean loss: 0.4132027304838899
Epoch: 3, step: 516, loss: 0.35411012172698975, mean loss: 0.41319054392815535
Epoch: 3, step: 517, loss: 0.3846096992492676, mean loss: 0.4131846509704896
Epoch: 3, step: 518, loss: 0.429506778717041, mean loss: 0.4131880156639026
Epoch: 3, step: 519, loss: 0.3527398705482483, mean loss: 0.4131755572663108
Epoch: 3, step: 520, loss: 0.34353160858154297, mean loss: 0.4131612065659842
Epoch: 3, step: 521, loss: 0.3315924108028412, mean loss: 0.4131444021169189
Epoch: 3, step: 522, loss: 0.38910579681396484, mean loss: 0.41313945080789666
Epoch: 3, step: 523, loss: 0.37619704008102417, mean loss: 0.41313184322743396
Epoch: 3, step: 524, loss: 0.31852853298187256, mean loss: 0.41311236550245034
Epoch: 3, step: 525, loss: 0.37705105543136597, mean loss: 0.4131049424250376
Epoch: 3, step: 526, loss: 0.32211044430732727, mean loss: 0.4130862154239843
Epoch: 3, step: 527, loss: 0.36673563718795776, mean loss: 0.4130766782679687
Epoch: 3, step: 528, loss: 0.36467185616493225, mean loss: 0.41306672047695797
Epoch: 3, step: 529, loss: 0.333980530500412, mean loss: 0.41305045429226517
Epoch: 3, step: 530, loss: 0.38026681542396545, mean loss: 0.41304371284894453
Epoch: 3, step: 531, loss: 0.3799486458301544, mean loss: 0.4130369087644423
Epoch: 3, step: 532, loss: 0.3713960349559784, mean loss: 0.41302834948925043
Epoch: 3, step: 533, loss: 0.33177313208580017, mean loss: 0.41301165092422715
Epoch: 3, step: 534, loss: 0.3406531810760498, mean loss: 0.4129967837637899
Epoch: 3, step: 535, loss: 0.35087522864341736, mean loss: 0.41298402255690403
Epoch: 3, step: 536, loss: 0.41417646408081055, mean loss: 0.41298426746171485
Epoch: 3, step: 537, loss: 0.4254145324230194, mean loss: 0.412986819877518
Epoch: 3, step: 538, loss: 0.3493700921535492, mean loss: 0.4129737595761992
Epoch: 3, step: 539, loss: 0.3272656798362732, mean loss: 0.4129561676058092
Epoch: 3, step: 540, loss: 0.36418843269348145, mean loss: 0.4129461598621375
Epoch: 3, step: 541, loss: 0.3231438100337982, mean loss: 0.41292773508786007
Epoch: 3, step: 542, loss: 0.38500261306762695, mean loss: 0.4129220068577021
Epoch: 3, step: 543, loss: 0.4067918360233307, mean loss: 0.41292074964465153
Epoch: 3, step: 544, loss: 0.3566347360610962, mean loss: 0.41290920853052737
Epoch: 3, step: 545, loss: 0.3681766986846924, mean loss: 0.41290003827430644
Epoch: 3, step: 546, loss: 0.32617196440696716, mean loss: 0.41288226248544246
Epoch: 3, step: 547, loss: 0.33045652508735657, mean loss: 0.41286537196548384
Epoch: 3, step: 548, loss: 0.37810179591178894, mean loss: 0.41285824974133845
Epoch: 3, step: 549, loss: 0.38944026827812195, mean loss: 0.41285345294054715
Epoch: 3, step: 550, loss: 0.35603418946266174, mean loss: 0.4128418168022146
Epoch: 3, step: 551, loss: 0.3616279065608978, mean loss: 0.4128313307436066
Epoch: 3, step: 552, loss: 0.3716157078742981, mean loss: 0.4128228935638995
Epoch: 3, step: 553, loss: 0.37096238136291504, mean loss: 0.4128143261238256
Epoch: 3, step: 554, loss: 0.36822202801704407, mean loss: 0.41280520144649663
Epoch: 3, step: 555, loss: 0.36916181445121765, mean loss: 0.41279627276666947
Epoch: 3, step: 556, loss: 0.3410342335700989, mean loss: 0.41278159450133983
Epoch: 3, step: 557, loss: 0.3680661618709564, mean loss: 0.4127724502410882
Epoch: 3, step: 558, loss: 0.317658007144928, mean loss: 0.41275300341158583
Epoch: 3, step: 559, loss: 0.36889952421188354, mean loss: 0.4127440390863201
Epoch: 3, step: 560, loss: 0.37030190229415894, mean loss: 0.41273536503424735
Epoch: 3, step: 561, loss: 0.35915517807006836, mean loss: 0.41272441689633066
Epoch: 3, step: 562, loss: 0.3490588963031769, mean loss: 0.41271141066127587
Epoch: 3, step: 563, loss: 0.4252088963985443, mean loss: 0.41271396325231696
Epoch: 3, step: 564, loss: 0.37305009365081787, mean loss: 0.4127058636260965
Epoch: 3, step: 565, loss: 0.3874496817588806, mean loss: 0.4127007071986022
Epoch: 3, step: 566, loss: 0.3211302161216736, mean loss: 0.41268201552865386
Epoch: 3, step: 567, loss: 0.3420652151107788, mean loss: 0.41266760393673185
Epoch: 3, step: 568, loss: 0.36400339007377625, mean loss: 0.41265767449093244
Epoch: 3, step: 569, loss: 0.3331044018268585, mean loss: 0.4126414457531389
Epoch: 3, step: 570, loss: 0.39818084239959717, mean loss: 0.41263849641531436
Epoch: 3, step: 571, loss: 0.39032408595085144, mean loss: 0.4126339461684823
Epoch: 3, step: 572, loss: 0.34259000420570374, mean loss: 0.4126196660579904
Epoch: 3, step: 573, loss: 0.3508698046207428, mean loss: 0.4126070794576159
Epoch: 3, step: 574, loss: 0.4120655059814453, mean loss: 0.41260696909008454
Epoch: 3, step: 575, loss: 0.4302784502506256, mean loss: 0.4126105696363683
Epoch: 3, step: 576, loss: 0.40395212173461914, mean loss: 0.41260880584579956
Epoch: 3, step: 577, loss: 0.3770763576030731, mean loss: 0.41260156909462997
Epoch: 3, step: 578, loss: 0.36528483033180237, mean loss: 0.41259193424658214
Epoch: 3, step: 579, loss: 0.3317042887210846, mean loss: 0.41257546689203706
Epoch: 3, step: 580, loss: 0.36375313997268677, mean loss: 0.41256552951631564
Epoch: 3, step: 581, loss: 0.3963545560836792, mean loss: 0.41256223057992314
Epoch: 3, step: 582, loss: 0.35023337602615356, mean loss: 0.4125495492259956
Epoch: 3, step: 583, loss: 0.3469350039958954, mean loss: 0.41253620208498054
Epoch: 3, step: 584, loss: 0.3772216737270355, mean loss: 0.41252901995596736
Epoch: 3, step: 585, loss: 0.39469435811042786, mean loss: 0.4125253935505494
Epoch: 3, step: 586, loss: 0.37578320503234863, mean loss: 0.4125179241078744
Epoch: 3, step: 587, loss: 0.3857143819332123, mean loss: 0.41251247623344867
Epoch: 3, step: 588, loss: 0.3755505084991455, mean loss: 0.41250496516502067
Epoch: 3, step: 589, loss: 0.36404308676719666, mean loss: 0.4124951191921645
Epoch: 3, step: 590, loss: 0.3382658362388611, mean loss: 0.41248004113347
Epoch: 3, step: 591, loss: 0.34568271040916443, mean loss: 0.41246647546922866
Epoch: 3, step: 592, loss: 0.43837103247642517, mean loss: 0.41247173527775804
Epoch: 3, step: 593, loss: 0.36824336647987366, mean loss: 0.41246275672136384
Epoch: 3, step: 594, loss: 0.41474246978759766, mean loss: 0.412463219419368
Epoch: 3, step: 595, loss: 0.34328633546829224, mean loss: 0.41244918190233243
Epoch: 3, step: 596, loss: 0.31561988592147827, mean loss: 0.41242953708675506
Epoch: 3, step: 597, loss: 0.42920055985450745, mean loss: 0.41243293891693106
Epoch: 3, step: 598, loss: 0.3360607326030731, mean loss: 0.4124174507388102
Epoch: 3, step: 599, loss: 0.3344171345233917, mean loss: 0.412401635589537
Epoch: 3, step: 600, loss: 0.39469999074935913, mean loss: 0.41239804717582523
Epoch: 3, step: 601, loss: 0.36026525497436523, mean loss: 0.41238748114578844
Epoch: 3, step: 602, loss: 0.35943880677223206, mean loss: 0.41237675193112305
Epoch: 3, step: 603, loss: 0.36073386669158936, mean loss: 0.4123662894341134
Epoch: 3, step: 604, loss: 0.3349619209766388, mean loss: 0.41235061101230713
Epoch: 3, step: 605, loss: 0.360175222158432, mean loss: 0.41234004491492887
Epoch: 3, step: 606, loss: 0.3752523362636566, mean loss: 0.4123325357615271
Epoch: 3, step: 607, loss: 0.3453918993473053, mean loss: 0.41231898502541087
Epoch: 3, step: 608, loss: 0.335334837436676, mean loss: 0.4123034043438507
Epoch: 3, step: 609, loss: 0.3508417010307312, mean loss: 0.41229096773856677
Epoch: 3, step: 610, loss: 0.3379932641983032, mean loss: 0.4122759368456798
Epoch: 3, step: 611, loss: 0.3227595388889313, mean loss: 0.41225783077813194
Epoch: 3, step: 612, loss: 0.38029295206069946, mean loss: 0.4122513666975015
Epoch: 3, step: 613, loss: 0.3454069495201111, mean loss: 0.41223785185375356
Epoch: 3, step: 614, loss: 0.37501558661460876, mean loss: 0.41223032764408324
Epoch: 3, step: 615, loss: 0.3787406384944916, mean loss: 0.4122235593156375
Epoch: 3, step: 616, loss: 0.3568766117095947, mean loss: 0.4122123758548159
Epoch: 3, step: 617, loss: 0.3310781419277191, mean loss: 0.4121959851004872
Epoch: 3, step: 618, loss: 0.42127349972724915, mean loss: 0.4121978185714278
Epoch: 3, step: 619, loss: 0.3799683451652527, mean loss: 0.41219131019634575
Epoch: 3, step: 620, loss: 0.36155346035957336, mean loss: 0.412181086523857
Epoch: 3, step: 621, loss: 0.36357688903808594, mean loss: 0.4121712754222248
Epoch: 3, step: 622, loss: 0.3615054488182068, mean loss: 0.4121610502301756
Epoch: 3, step: 623, loss: 0.39779767394065857, mean loss: 0.4121581520509404
Epoch: 3, step: 624, loss: 0.3647454082965851, mean loss: 0.41214858724485726
Epoch: 3, step: 625, loss: 0.3476910889148712, mean loss: 0.4121355865392643
Epoch: 3, step: 626, loss: 0.3616808354854584, mean loss: 0.4121254121591365
Epoch: 3, step: 627, loss: 0.4089645743370056, mean loss: 0.41212477489344657
Epoch: 3, step: 628, loss: 0.3998234272003174, mean loss: 0.412122295282946
Epoch: 3, step: 629, loss: 0.3586187958717346, mean loss: 0.41211151263493895
Epoch: 3, step: 630, loss: 0.3488244116306305, mean loss: 0.41209876085154096
Epoch: 3, step: 631, loss: 0.32725098729133606, mean loss: 0.4120816682299535
Epoch: 3, step: 632, loss: 0.429294228553772, mean loss: 0.4120851350094749
Epoch: 3, step: 633, loss: 0.34337225556373596, mean loss: 0.4120712983442623
Epoch: 3, step: 634, loss: 0.34190496802330017, mean loss: 0.4120571718432917
Epoch: 3, step: 635, loss: 0.3356846570968628, mean loss: 0.41204179895385
Epoch: 3, step: 636, loss: 0.33861666917800903, mean loss: 0.4120270223127198
Epoch: 3, step: 637, loss: 0.3684464991092682, mean loss: 0.4120182535957775
Epoch: 3, step: 638, loss: 0.3398212790489197, mean loss: 0.41200372996380263
Epoch: 3, step: 639, loss: 0.35450467467308044, mean loss: 0.4119921653911376
Epoch: 3, step: 640, loss: 0.35186582803726196, mean loss: 0.41198007483466187
Epoch: 3, step: 641, loss: 0.36487171053886414, mean loss: 0.4119706039130101
Epoch: 3, step: 642, loss: 0.3991954028606415, mean loss: 0.4119680360334016
Epoch: 3, step: 643, loss: 0.3325195014476776, mean loss: 0.41195206968802667
Epoch: 3, step: 644, loss: 0.36005929112434387, mean loss: 0.41194164317033255
Epoch: 3, step: 645, loss: 0.4150250256061554, mean loss: 0.41194226257218786
Epoch: 3, step: 646, loss: 0.33835944533348083, mean loss: 0.41192748393847856
Epoch: 3, step: 647, loss: 0.3543674051761627, mean loss: 0.4119159256897311
Epoch: 3, step: 648, loss: 0.3501451313495636, mean loss: 0.4119035244059849
Epoch: 3, step: 649, loss: 0.34301939606666565, mean loss: 0.41188969780455187
Epoch: 3, step: 650, loss: 0.34157446026802063, mean loss: 0.4118755867795596
Epoch: 3, step: 651, loss: 0.3944095969200134, mean loss: 0.411872082367469
Epoch: 3, step: 652, loss: 0.35119229555130005, mean loss: 0.4118599098926814
Epoch: 3, step: 653, loss: 0.3471202850341797, mean loss: 0.41184692561172304
Epoch: 3, step: 654, loss: 0.39915868639945984, mean loss: 0.411844381348797
Epoch: 3, step: 655, loss: 0.3663146495819092, mean loss: 0.4118352534955959
Epoch: 3, step: 656, loss: 0.3672938644886017, mean loss: 0.4118263255763722
Epoch: 3, step: 657, loss: 0.3438529372215271, mean loss: 0.4118127036548582
Epoch: 3, step: 658, loss: 0.3797420859336853, mean loss: 0.41180627796507235
Epoch: 3, step: 659, loss: 0.31454744935035706, mean loss: 0.41178679502664794
Epoch: 3, step: 660, loss: 0.34346553683280945, mean loss: 0.4117731116182374
Epoch: 3, step: 661, loss: 0.3350405991077423, mean loss: 0.41175774667780674
Epoch: 3, step: 662, loss: 0.3171981871128082, mean loss: 0.41173881583505095
Epoch: 3, step: 663, loss: 0.36558786034584045, mean loss: 0.4117295782538882
Epoch: 3, step: 664, loss: 0.36255601048469543, mean loss: 0.4117197376359636
Epoch: 3, step: 665, loss: 0.3846209943294525, mean loss: 0.41171431571853534
Epoch: 3, step: 666, loss: 0.33867600560188293, mean loss: 0.4116997051343952
Epoch: 3, step: 667, loss: 0.3368554711341858, mean loss: 0.41168473628759517
Epoch: 3, step: 668, loss: 0.37145981192588806, mean loss: 0.4116766929113981
Epoch: 3, step: 669, loss: 0.4208095073699951, mean loss: 0.4116785187439568
Epoch: 3, step: 670, loss: 0.34645479917526245, mean loss: 0.4116654818221961
Epoch: 3, step: 671, loss: 0.31631648540496826, mean loss: 0.41164642726655715
Epoch: 3, step: 672, loss: 0.3775174021720886, mean loss: 0.41163960828052426
Epoch: 3, step: 673, loss: 0.3395550549030304, mean loss: 0.4116252086494061
Epoch: 3, step: 674, loss: 0.36446860432624817, mean loss: 0.41161579051393116
Epoch: 3, step: 675, loss: 0.3252740502357483, mean loss: 0.41159854975109605
Epoch: 3, step: 676, loss: 0.34144094586372375, mean loss: 0.41158454344167555
Epoch: 3, step: 677, loss: 0.3570919930934906, mean loss: 0.411573666685119
Epoch: 3, step: 678, loss: 0.35610267519950867, mean loss: 0.41156259684048013
Epoch: 3, step: 679, loss: 0.36647018790245056, mean loss: 0.41155359995122676
Epoch: 3, step: 680, loss: 0.35796815156936646, mean loss: 0.4115429106537239
Epoch: 3, step: 681, loss: 0.3606925308704376, mean loss: 0.41153276897446917
Epoch: 3, step: 682, loss: 0.36815911531448364, mean loss: 0.4115241201900903
Epoch: 3, step: 683, loss: 0.34159788489341736, mean loss: 0.41151017955306946
Epoch: 3, step: 684, loss: 0.4168434739112854, mean loss: 0.41151124259758975
Epoch: 3, step: 685, loss: 0.3609432876110077, mean loss: 0.41150116528491804
Epoch: 3, step: 686, loss: 0.3849707245826721, mean loss: 0.41149587928358267
Epoch: 3, step: 687, loss: 0.3702494502067566, mean loss: 0.41148766286344785
Epoch: 3, step: 688, loss: 0.35970941185951233, mean loss: 0.41147735052506823
Epoch: 3, step: 689, loss: 0.3830455243587494, mean loss: 0.41147168907023624
Epoch: 3, step: 690, loss: 0.3890778124332428, mean loss: 0.4114672308029384
Epoch: 3, step: 691, loss: 0.35989344120025635, mean loss: 0.4114569653193391
Epoch: 3, step: 692, loss: 0.33731788396835327, mean loss: 0.4114422112732991
Epoch: 3, step: 693, loss: 0.3644549250602722, mean loss: 0.41143286243004146
Epoch: 3, step: 694, loss: 0.3627411425113678, mean loss: 0.41142317639067033
Epoch: 3, step: 695, loss: 0.31777679920196533, mean loss: 0.4114045514150958
Epoch: 3, step: 696, loss: 0.36182722449302673, mean loss: 0.4113946931277778
Epoch: 3, step: 697, loss: 0.3675083518028259, mean loss: 0.41138596820902534
Epoch: 3, step: 698, loss: 0.3445987403392792, mean loss: 0.41137269306931756
Epoch: 3, step: 699, loss: 0.38115906715393066, mean loss: 0.4113666887716396
Epoch: 3, step: 700, loss: 0.35347557067871094, mean loss: 0.41135518646325636
Epoch: 3, step: 701, loss: 0.36536747217178345, mean loss: 0.4113460510412676
Epoch: 3, step: 702, loss: 0.35394716262817383, mean loss: 0.4113346510634298
Epoch: 3, step: 703, loss: 0.3807922601699829, mean loss: 0.41132858625189417
Epoch: 3, step: 704, loss: 0.34950366616249084, mean loss: 0.4113163120966253
Epoch: 3, step: 705, loss: 0.3919953405857086, mean loss: 0.41131247704868745
Epoch: 3, step: 706, loss: 0.3610948920249939, mean loss: 0.41130251126479705
Epoch: 3, step: 707, loss: 0.3637396991252899, mean loss: 0.4112930741988964
Epoch: 3, step: 708, loss: 0.35680046677589417, mean loss: 0.41128226431843157
Epoch: 3, step: 709, loss: 0.3757971525192261, mean loss: 0.41127522641446507
Epoch: 3, step: 710, loss: 0.3948611319065094, mean loss: 0.411271971587079
Epoch: 3, step: 711, loss: 0.34520062804222107, mean loss: 0.4112588725895483
Epoch: 3, step: 712, loss: 0.3672589063644409, mean loss: 0.411250151089801
Epoch: 3, step: 713, loss: 0.3311975598335266, mean loss: 0.41123428652554095
Epoch: 3, step: 714, loss: 0.32673877477645874, mean loss: 0.41121754479545397
Epoch: 3, step: 715, loss: 0.3500913381576538, mean loss: 0.4112054358004782
Epoch: 3, step: 716, loss: 0.3638787269592285, mean loss: 0.4111960623188301
Epoch: 3, step: 717, loss: 0.3680524230003357, mean loss: 0.41118751902391554
Epoch: 3, step: 718, loss: 0.3697677254676819, mean loss: 0.41117931870842234
Epoch: 3, step: 719, loss: 0.39880380034446716, mean loss: 0.41117686908087603
Epoch: 3, step: 720, loss: 0.420152485370636, mean loss: 0.4111786453754119
Epoch: 3, step: 721, loss: 0.33209216594696045, mean loss: 0.4111629970811047
Epoch: 3, step: 722, loss: 0.3600275218486786, mean loss: 0.41115288126008936
Epoch: 3, step: 723, loss: 0.3438003659248352, mean loss: 0.41113955995563223
Epoch: 3, step: 724, loss: 0.34687119722366333, mean loss: 0.4111268511633182
Epoch: 3, step: 725, loss: 0.34526315331459045, mean loss: 0.41111382947532915
Epoch: 3, step: 726, loss: 0.34818920493125916, mean loss: 0.4111013913206456
Epoch: 3, step: 727, loss: 0.38669320940971375, mean loss: 0.4110965675692798
Epoch: 3, step: 728, loss: 0.3331593871116638, mean loss: 0.4110811680078379
Epoch: 3, step: 729, loss: 0.35547691583633423, mean loss: 0.4110701833669506
Epoch: 3, step: 730, loss: 0.3417091965675354, mean loss: 0.41105648378433174
Epoch: 3, step: 731, loss: 0.37832900881767273, mean loss: 0.41105002101281385
Epoch: 3, step: 732, loss: 0.344433069229126, mean loss: 0.41103686860377464
Epoch: 3, step: 733, loss: 0.3323535919189453, mean loss: 0.4110213369660556
Epoch: 3, step: 734, loss: 0.36813536286354065, mean loss: 0.4110128731858893
Epoch: 3, step: 735, loss: 0.39040178060531616, mean loss: 0.4110088062773296
Epoch: 3, step: 736, loss: 0.34604620933532715, mean loss: 0.41099599061409386
Epoch: 3, step: 737, loss: 0.3296060860157013, mean loss: 0.4109799373784729
Epoch: 3, step: 738, loss: 0.4103107154369354, mean loss: 0.4109798054080644
Epoch: 3, step: 739, loss: 0.3937532603740692, mean loss: 0.4109764090072296
Epoch: 3, step: 740, loss: 0.3330284655094147, mean loss: 0.4109610437512671
Epoch: 3, step: 741, loss: 0.36508023738861084, mean loss: 0.41095200141654836
Epoch: 3, step: 742, loss: 0.3512613773345947, mean loss: 0.4109402397172219
Epoch: 3, step: 743, loss: 0.37482985854148865, mean loss: 0.41093312577293983
Epoch: 3, step: 744, loss: 0.40170836448669434, mean loss: 0.41093130880203455
Epoch: 3, step: 745, loss: 0.3681098222732544, mean loss: 0.4109228760555736
Epoch: 3, step: 746, loss: 0.33314740657806396, mean loss: 0.41090756290938785
Epoch: 3, step: 747, loss: 0.35296356678009033, mean loss: 0.4108961566109372
Epoch: 3, step: 748, loss: 0.3570207953453064, mean loss: 0.41088555331212484
Epoch: 3, step: 749, loss: 0.32536667585372925, mean loss: 0.4108687255125463
Epoch: 3, step: 750, loss: 0.3465861976146698, mean loss: 0.4108560789400698
Epoch: 3, step: 751, loss: 0.3537827432155609, mean loss: 0.4108448528708872
Epoch: 3, step: 752, loss: 0.3180105686187744, mean loss: 0.41082659637447577
Epoch: 3, step: 753, loss: 0.3576001226902008, mean loss: 0.4108161310827565
Epoch: 3, step: 754, loss: 0.3802955150604248, mean loss: 0.41081013135481814
Epoch: 3, step: 755, loss: 0.3912649154663086, mean loss: 0.4108062899208778
Epoch: 3, step: 756, loss: 0.33126017451286316, mean loss: 0.4107906589294437
Epoch: 3, step: 757, loss: 0.37260255217552185, mean loss: 0.41078315635444296
Epoch: 3, step: 758, loss: 0.37572455406188965, mean loss: 0.41077626996624955
Epoch: 3, step: 759, loss: 0.33050602674484253, mean loss: 0.4107605059750435
Epoch: 3, step: 760, loss: 0.3533032536506653, mean loss: 0.4107492243625706
Epoch: 3, step: 761, loss: 0.3462897539138794, mean loss: 0.4107365703636604
Epoch: 3, step: 762, loss: 0.3907303214073181, mean loss: 0.4107326437200968
Epoch: 3, step: 763, loss: 0.4332951009273529, mean loss: 0.4107370712038502
Epoch: 3, step: 764, loss: 0.33892562985420227, mean loss: 0.4107229822414508
Epoch: 3, step: 765, loss: 0.32732731103897095, mean loss: 0.4107066237339572
Epoch: 3, step: 766, loss: 0.3461701571941376, mean loss: 0.41069396704312766
Epoch: 3, step: 767, loss: 0.421524316072464, mean loss: 0.41069609064097656
Epoch: 3, step: 768, loss: 0.3633420467376709, mean loss: 0.4106868073545811
Epoch: 3, step: 769, loss: 0.3436015844345093, mean loss: 0.41067365854569826
Epoch: 3, step: 770, loss: 0.32427820563316345, mean loss: 0.4106567282198287
Epoch: 3, step: 771, loss: 0.36951619386672974, mean loss: 0.4106486677703081
Epoch: 3, step: 772, loss: 0.3809407949447632, mean loss: 0.4106428484024677
Epoch: 3, step: 773, loss: 0.36405959725379944, mean loss: 0.4106337251648749
Epoch: 3, step: 774, loss: 0.37885868549346924, mean loss: 0.41062750330474734
Epoch: 3, step: 775, loss: 0.35247987508773804, mean loss: 0.4106161196657072
Epoch: 3, step: 776, loss: 0.41933122277259827, mean loss: 0.4106178254991593
Epoch: 3, step: 777, loss: 0.35868826508522034, mean loss: 0.4106076631585695
Epoch: 3, step: 778, loss: 0.34146949648857117, mean loss: 0.41059413583188786
Epoch: 3, step: 779, loss: 0.38153275847435, mean loss: 0.41058845089891494
Epoch: 3, step: 780, loss: 0.34213918447494507, mean loss: 0.4105750635986169
Epoch: 3, step: 781, loss: 0.3338828384876251, mean loss: 0.410560067074348
Epoch: 3, step: 782, loss: 0.4040704071521759, mean loss: 0.41055879832363007
Epoch: 3, step: 783, loss: 0.3872149884700775, mean loss: 0.4105542354210004
Epoch: 3, step: 784, loss: 0.32572299242019653, mean loss: 0.41053765710499474
Epoch: 3, step: 785, loss: 0.37270355224609375, mean loss: 0.4105302647437484
Epoch: 3, step: 786, loss: 0.3814413845539093, mean loss: 0.4105245822119668
Epoch: 3, step: 787, loss: 0.3992651700973511, mean loss: 0.4105223831080382
Epoch: 3, step: 788, loss: 0.3372202217578888, mean loss: 0.410508069075359
Epoch: 3, step: 789, loss: 0.3339695632457733, mean loss: 0.4104931259855836
Epoch: 3, step: 790, loss: 0.36622172594070435, mean loss: 0.41048448429125506
Epoch: 3, step: 791, loss: 0.37915903329849243, mean loss: 0.4104783708152612
Epoch: 3, step: 792, loss: 0.36677664518356323, mean loss: 0.41046984364928424
Epoch: 3, step: 793, loss: 0.41173499822616577, mean loss: 0.4104700904605556
Epoch: 3, step: 794, loss: 0.3938220143318176, mean loss: 0.4104668433226331
Epoch: 3, step: 795, loss: 0.3610050678253174, mean loss: 0.4104571978905939
Epoch: 3, step: 796, loss: 0.3950539231300354, mean loss: 0.4104541947175074
Epoch: 3, step: 797, loss: 0.3474554419517517, mean loss: 0.4104419142588786
Epoch: 3, step: 798, loss: 0.34798821806907654, mean loss: 0.4104297424217728
Epoch: 3, step: 799, loss: 0.339106023311615, mean loss: 0.41041584458094854
Epoch: 3, step: 800, loss: 0.3749818205833435, mean loss: 0.4104089414007425
Epoch: 3, step: 801, loss: 0.3799275755882263, mean loss: 0.4104030042433969
Epoch: 3, step: 802, loss: 0.36957478523254395, mean loss: 0.4103950532757219
Epoch: 3, step: 803, loss: 0.32236045598983765, mean loss: 0.4103779125831039
Epoch: 3, step: 804, loss: 0.3393023610115051, mean loss: 0.41036407657929397
Epoch: 3, step: 805, loss: 0.40542909502983093, mean loss: 0.41036311609242176
Epoch: 3, step: 806, loss: 0.35286837816238403, mean loss: 0.410351928169104
Epoch: 3, step: 807, loss: 0.34890833497047424, mean loss: 0.4103399741626451
Epoch: 3, step: 808, loss: 0.34355849027633667, mean loss: 0.4103269841832858
Epoch: 3, step: 809, loss: 0.34555408358573914, mean loss: 0.41031438735314235
Epoch: 3, step: 810, loss: 0.43642812967300415, mean loss: 0.41031946488421756
Epoch: 3, step: 811, loss: 0.40247464179992676, mean loss: 0.4103179398408497
Epoch: 3, step: 812, loss: 0.32635846734046936, mean loss: 0.41030162118730246
Epoch: 3, step: 813, loss: 0.3543097972869873, mean loss: 0.4102907405374967
Epoch: 3, step: 814, loss: 0.31689324975013733, mean loss: 0.4102725945319037
Epoch: 3, step: 815, loss: 0.3744703531265259, mean loss: 0.4102656399395561
Epoch: 3, step: 816, loss: 0.3055645227432251, mean loss: 0.41024530567713696
Epoch: 3, step: 817, loss: 0.4496237635612488, mean loss: 0.41025295197963874
Epoch: 3, step: 818, loss: 0.3932799696922302, mean loss: 0.410249656894745
Epoch: 3, step: 819, loss: 0.38054409623146057, mean loss: 0.41024389106387094
Epoch: 3, step: 820, loss: 0.35277581214904785, mean loss: 0.41023273871011295
Epoch: 3, step: 821, loss: 0.3663363456726074, mean loss: 0.4102242217537611
Epoch: 3, step: 822, loss: 0.36084020137786865, mean loss: 0.4102146419243962
Epoch: 3, step: 823, loss: 0.36694562435150146, mean loss: 0.41020624995046817
Epoch: 3, step: 824, loss: 0.35779306292533875, mean loss: 0.41019608644706984
Epoch: 3, step: 825, loss: 0.3676728308200836, mean loss: 0.41018784231065514
Epoch: 3, step: 826, loss: 0.34902769327163696, mean loss: 0.41017598727110505
Epoch: 3, step: 827, loss: 0.4407810568809509, mean loss: 0.4101819184861457
Epoch: 3, step: 828, loss: 0.342773973941803, mean loss: 0.41016885746220766
Epoch: 3, step: 829, loss: 0.4049416184425354, mean loss: 0.41016784482388535
Epoch: 3, step: 830, loss: 0.3726794421672821, mean loss: 0.4101605838510679
Epoch: 3, step: 831, loss: 0.38226374983787537, mean loss: 0.41015518167562
Epoch: 3, step: 832, loss: 0.334555059671402, mean loss: 0.4101405446723278
Epoch: 3, step: 833, loss: 0.31162726879119873, mean loss: 0.41012147512608677
Epoch: 3, step: 834, loss: 0.3374817967414856, mean loss: 0.41010741674048884
Epoch: 3, step: 835, loss: 0.372945636510849, mean loss: 0.4101002259935404
Epoch: 3, step: 836, loss: 0.3862467110157013, mean loss: 0.41009561126825933
Epoch: 3, step: 837, loss: 0.3886973559856415, mean loss: 0.4100914723407385
Epoch: 3, step: 838, loss: 0.4027014374732971, mean loss: 0.41009004321003506
Epoch: 3, step: 839, loss: 0.33353522419929504, mean loss: 0.41007524142755036
Epoch: 3, step: 840, loss: 0.40481480956077576, mean loss: 0.41007422452597164
Epoch: 3, step: 841, loss: 0.36186230182647705, mean loss: 0.41006490641180476
Epoch: 3, step: 842, loss: 0.3566492795944214, mean loss: 0.4100545845515502
Epoch: 3, step: 843, loss: 0.3672609329223633, mean loss: 0.4100463168445121
Epoch: 3, step: 844, loss: 0.38657867908477783, mean loss: 0.41004178378718936
Epoch: 3, step: 845, loss: 0.3590831756591797, mean loss: 0.4100319424182963
Epoch: 3, step: 846, loss: 0.35438287258148193, mean loss: 0.4100211972802703
Epoch: 3, step: 847, loss: 0.3693901002407074, mean loss: 0.41001335343914297
Epoch: 3, step: 848, loss: 0.35571327805519104, mean loss: 0.41000287282239256
Epoch: 3, step: 849, loss: 0.3741070628166199, mean loss: 0.4099959458038658
Epoch: 3, step: 850, loss: 0.370012104511261, mean loss: 0.40998823138339646
Epoch: 3, step: 851, loss: 0.36326172947883606, mean loss: 0.40997921778349206
Epoch: 3, step: 852, loss: 0.3547225892543793, mean loss: 0.4099685607673823
Epoch: 3, step: 853, loss: 0.3548678457736969, mean loss: 0.4099579358705459
Epoch: 3, step: 854, loss: 0.35182714462280273, mean loss: 0.4099467288546894
Epoch: 3, step: 855, loss: 0.36061909794807434, mean loss: 0.4099372208302278
Epoch: 3, step: 856, loss: 0.3485504388809204, mean loss: 0.4099253906544812
Epoch: 3, step: 857, loss: 0.3824176490306854, mean loss: 0.40992009051158645
Epoch: 3, step: 858, loss: 0.37807121872901917, mean loss: 0.40991395510958634
Epoch: 3, step: 859, loss: 0.3989401161670685, mean loss: 0.40991184150424304
Epoch: 3, step: 860, loss: 0.33239471912384033, mean loss: 0.40989691427097125
Epoch: 3, step: 861, loss: 0.4000781178474426, mean loss: 0.40989502385964594
Epoch: 3, step: 862, loss: 0.3747835159301758, mean loss: 0.40988826514782123
Epoch: 3, step: 863, loss: 0.36655378341674805, mean loss: 0.409879925178281
Epoch: 3, step: 864, loss: 0.3305094838142395, mean loss: 0.4098646528208894
Epoch: 3, step: 865, loss: 0.36043304204940796, mean loss: 0.4098551430843039
Epoch: 3, step: 866, loss: 0.42132920026779175, mean loss: 0.4098573500581803
Epoch: 3, step: 867, loss: 0.40926381945610046, mean loss: 0.4098572359176799
Epoch: 3, step: 868, loss: 0.3454742729663849, mean loss: 0.40984485695921974
Epoch: 3, step: 869, loss: 0.3463667333126068, mean loss: 0.4098326543210716
Epoch: 3, step: 870, loss: 0.36777183413505554, mean loss: 0.4098245703656255
Epoch: 3, step: 871, loss: 0.36782750487327576, mean loss: 0.40981650021468535
Epoch: 3, step: 872, loss: 0.3480182886123657, mean loss: 0.40980462735943035
Epoch: 3, step: 873, loss: 0.3690020442008972, mean loss: 0.4097967897522159
Epoch: 3, step: 874, loss: 0.34358665347099304, mean loss: 0.40978407415085594
Epoch: 3, step: 875, loss: 0.38650283217430115, mean loss: 0.40977960386629825
Epoch: 3, step: 876, loss: 0.3694764971733093, mean loss: 0.40977186666017557
Epoch: 3, step: 877, loss: 0.3781381845474243, mean loss: 0.4097657949361616
Epoch: 3, step: 878, loss: 0.38595181703567505, mean loss: 0.409761224992216
Epoch: 3, step: 879, loss: 0.39564836025238037, mean loss: 0.40975851722845164
Epoch: 3, step: 880, loss: 0.4074387550354004, mean loss: 0.4097580722328267
Epoch: 3, step: 881, loss: 0.3672148883342743, mean loss: 0.40974991281896045
Epoch: 3, step: 882, loss: 0.3548368811607361, mean loss: 0.4097393829950567
Epoch: 3, step: 883, loss: 0.3907240629196167, mean loss: 0.40973573741988883
Epoch: 3, step: 884, loss: 0.33895525336265564, mean loss: 0.40972217014289875
Epoch: 3, step: 885, loss: 0.32843950390815735, mean loss: 0.40970659278256244
Epoch: 3, step: 886, loss: 0.3777397871017456, mean loss: 0.4097004677000407
Epoch: 3, step: 887, loss: 0.3937845826148987, mean loss: 0.40969741867990944
Epoch: 3, step: 888, loss: 0.35956257581710815, mean loss: 0.40968781614344846
Epoch: 3, step: 889, loss: 0.37113866209983826, mean loss: 0.40968043407641597
Epoch: 3, step: 890, loss: 0.36238721013069153, mean loss: 0.4096713792757371
Epoch: 3, step: 891, loss: 0.4018208384513855, mean loss: 0.4096698764922715
Epoch: 3, step: 892, loss: 0.3112667202949524, mean loss: 0.40965104335232944
Epoch: 3, step: 893, loss: 0.3419455587863922, mean loss: 0.4096380878443758
Epoch: 3, step: 894, loss: 0.3732897937297821, mean loss: 0.40963113389486083
Epoch: 3, step: 895, loss: 0.3134985864162445, mean loss: 0.40961274587889324
Epoch: 3, step: 896, loss: 0.3910987675189972, mean loss: 0.40960920524428623
Epoch: 3, step: 897, loss: 0.3344118893146515, mean loss: 0.40959482717240675
Epoch: 3, step: 898, loss: 0.35285764932632446, mean loss: 0.4095839808375098
Epoch: 3, step: 899, loss: 0.34399884939193726, mean loss: 0.4095714454530592
Epoch: 3, step: 900, loss: 0.3298974335193634, mean loss: 0.40955622014980414
Epoch: 3, step: 901, loss: 0.3409889042377472, mean loss: 0.4095431197837529
Epoch: 3, step: 902, loss: 0.38897743821144104, mean loss: 0.40953919128679545
Epoch: 3, step: 903, loss: 0.3286793529987335, mean loss: 0.4095237482313546
Epoch: 3, step: 904, loss: 0.3438259959220886, mean loss: 0.4095112033101575
Epoch: 3, step: 905, loss: 0.3520076870918274, mean loss: 0.40950022516654955
Epoch: 3, step: 906, loss: 0.3558657765388489, mean loss: 0.40948998763102223
Epoch: 3, step: 907, loss: 0.4334765374660492, mean loss: 0.4094945652168686
Epoch: 3, step: 908, loss: 0.40517327189445496, mean loss: 0.409493740699921
Epoch: 3, step: 909, loss: 0.3963319659233093, mean loss: 0.40949122986917386
Epoch: 3, step: 910, loss: 0.32394975423812866, mean loss: 0.40947491450094364
Epoch: 3, step: 911, loss: 0.3491320013999939, mean loss: 0.4094634074618321
Epoch: 3, step: 912, loss: 0.3943331241607666, mean loss: 0.40946052275576894
Epoch: 3, step: 913, loss: 0.3633972406387329, mean loss: 0.40945174210725255
Epoch: 3, step: 914, loss: 0.35916033387184143, mean loss: 0.40944215731437367
Epoch: 3, step: 915, loss: 0.3801226317882538, mean loss: 0.4094365705145402
Epoch: 3, step: 916, loss: 0.367717981338501, mean loss: 0.40942862260271395
Epoch: 3, step: 917, loss: 0.3204943537712097, mean loss: 0.40941168274198414
Epoch: 3, step: 918, loss: 0.4229309856891632, mean loss: 0.40941425735690457
Epoch: 3, step: 919, loss: 0.36682572960853577, mean loss: 0.40940614834552824
Epoch: 3, step: 920, loss: 0.33830106258392334, mean loss: 0.409392612254578
Epoch: 3, step: 921, loss: 0.3561130166053772, mean loss: 0.40938247148646817
Epoch: 3, step: 922, loss: 0.3384111225605011, mean loss: 0.40936896599666306
Epoch: 3, step: 923, loss: 0.34351301193237305, mean loss: 0.40935643632503743
Epoch: 3, step: 924, loss: 0.352603018283844, mean loss: 0.4093456405445464
Epoch: 3, step: 925, loss: 0.35040953755378723, mean loss: 0.4093344317003108
Epoch: 3, step: 926, loss: 0.38111743330955505, mean loss: 0.4093290662318965
Epoch: 3, step: 927, loss: 0.3703756630420685, mean loss: 0.4093216606419365
Epoch: 3, step: 928, loss: 0.4079703986644745, mean loss: 0.4093214037968543
Epoch: 3, step: 929, loss: 0.38494575023651123, mean loss: 0.40931677140355127
Epoch: 3, step: 930, loss: 0.3310483396053314, mean loss: 0.40930189995536614
Epoch: 3, step: 931, loss: 0.42899325489997864, mean loss: 0.4093056407142842
Epoch: 3, step: 932, loss: 0.5111966133117676, mean loss: 0.40932499322569876
Epoch: 3, step: 933, loss: 0.3504454791545868, mean loss: 0.409313812155803
Epoch: 3, step: 934, loss: 0.3544873893260956, mean loss: 0.409303402734343
Epoch: 3, step: 935, loss: 0.35124722123146057, mean loss: 0.4092923821987502
Epoch: 3, step: 936, loss: 0.3731279969215393, mean loss: 0.40928551858415974
Epoch: 3, step: 937, loss: 0.36609843373298645, mean loss: 0.4092773236913986
Epoch: 3, step: 938, loss: 0.3419559895992279, mean loss: 0.40926455166823555
Epoch: 3, step: 939, loss: 0.34385886788368225, mean loss: 0.4092521454307954
Epoch: 3, step: 940, loss: 0.36834990978240967, mean loss: 0.4092443885114614
Epoch: 3, step: 941, loss: 0.3891691267490387, mean loss: 0.4092405820530309
Epoch: 3, step: 942, loss: 0.3716137707233429, mean loss: 0.40923344900822906
Epoch: 3, step: 943, loss: 0.387602299451828, mean loss: 0.40922934909360503
Epoch: 3, step: 944, loss: 0.3581961393356323, mean loss: 0.40921967821815347
Epoch: 3, step: 945, loss: 0.3458930552005768, mean loss: 0.4092076799947701
Epoch: 3, step: 946, loss: 0.42877137660980225, mean loss: 0.4092113859422251
Epoch: 3, step: 947, loss: 0.3858913779258728, mean loss: 0.4092069692740402
Epoch: 3, step: 948, loss: 0.3401593267917633, mean loss: 0.40919389454529903
Epoch: 3, step: 949, loss: 0.33763086795806885, mean loss: 0.4091803460737755
Epoch: 3, step: 950, loss: 0.3578515946865082, mean loss: 0.4091706302397064
Epoch: 3, step: 951, loss: 0.34576335549354553, mean loss: 0.4091586303769611
Epoch: 3, step: 952, loss: 0.35634708404541016, mean loss: 0.4091486376529627
Epoch: 3, step: 953, loss: 0.3387790024280548, mean loss: 0.40913532519832313
Epoch: 3, step: 954, loss: 0.3553425669670105, mean loss: 0.40912515066489563
Epoch: 3, step: 955, loss: 0.3626369833946228, mean loss: 0.4091163594078476
Epoch: 3, step: 956, loss: 0.3846771717071533, mean loss: 0.409111738650105
Epoch: 3, step: 957, loss: 0.4521898925304413, mean loss: 0.4091198819684188
Epoch: 3, step: 958, loss: 0.31640303134918213, mean loss: 0.40910235846612825
Epoch: 3, step: 959, loss: 0.3448048532009125, mean loss: 0.40909020852182265
Epoch: 3, step: 960, loss: 0.3239535093307495, mean loss: 0.40907412374963464
Epoch: 3, step: 961, loss: 0.3585289418697357, mean loss: 0.409064576114221
Epoch: 3, step: 962, loss: 0.3811623454093933, mean loss: 0.4090593065711228
Epoch: 3, step: 963, loss: 0.4117187559604645, mean loss: 0.40905980873301656
Epoch: 3, step: 964, loss: 0.3858794867992401, mean loss: 0.40905543261031807
Epoch: 3, step: 965, loss: 0.36741504073143005, mean loss: 0.4090475729667018
Epoch: 3, step: 966, loss: 0.391926109790802, mean loss: 0.409044341892315
Epoch: 3, step: 967, loss: 0.359747052192688, mean loss: 0.40903504051689993
Epoch: 3, step: 968, loss: 0.3726707696914673, mean loss: 0.40902818062804397
Epoch: 3, step: 969, loss: 0.36141204833984375, mean loss: 0.40901919984111673
Epoch: 3, step: 970, loss: 0.35814082622528076, mean loss: 0.40900960557869626
Epoch: 3, step: 971, loss: 0.40520477294921875, mean loss: 0.4090088882271447
Epoch: 3, step: 972, loss: 0.4306287169456482, mean loss: 0.4090129635954234
Epoch: 3, step: 973, loss: 0.42311012744903564, mean loss: 0.40901562042992273
Epoch: 3, step: 974, loss: 0.34459319710731506, mean loss: 0.40900348128853914
Epoch: 3, step: 975, loss: 0.378574937582016, mean loss: 0.40899774870683103
Epoch: 3, step: 976, loss: 0.32932543754577637, mean loss: 0.4089827416789235
Epoch: 3, step: 977, loss: 0.3358495533466339, mean loss: 0.408968968950424
Epoch: 3, step: 978, loss: 0.4067085385322571, mean loss: 0.40896854333746635
Epoch: 3, step: 979, loss: 0.39058032631874084, mean loss: 0.4089650817002264
Epoch: 3, step: 980, loss: 0.32978686690330505, mean loss: 0.40895017896828645
Epoch: 3, step: 981, loss: 0.37838542461395264, mean loss: 0.40894442722678204
Epoch: 3, step: 982, loss: 0.3695920705795288, mean loss: 0.40893702320859815
Epoch: 3, step: 983, loss: 0.37050071358680725, mean loss: 0.4089297929020478
Epoch: 3, step: 984, loss: 0.3709920346736908, mean loss: 0.40892265772088765
Epoch: 3, step: 985, loss: 0.3464932441711426, mean loss: 0.40891091845545896
Epoch: 3, step: 986, loss: 0.3790801465511322, mean loss: 0.4089053101133074
Epoch: 3, step: 987, loss: 0.3478313684463501, mean loss: 0.40889383004908425
Epoch: 3, step: 988, loss: 0.410684734582901, mean loss: 0.4088941666220092
Epoch: 3, step: 989, loss: 0.4129332900047302, mean loss: 0.40889492557040885
Epoch: 3, step: 990, loss: 0.3557182252407074, mean loss: 0.40888493558349737
Epoch: 3, step: 991, loss: 0.33167994022369385, mean loss: 0.40887043426956804
Epoch: 3, step: 992, loss: 0.35042890906333923, mean loss: 0.408859459335257
Epoch: 3, step: 993, loss: 0.3056487441062927, mean loss: 0.4088400806805013
Epoch: 3, step: 994, loss: 0.3571447432041168, mean loss: 0.4088303762807498
Epoch: 3, step: 995, loss: 0.3500235378742218, mean loss: 0.4088193389612291
Epoch: 3, step: 996, loss: 0.3428038954734802, mean loss: 0.4088069510003569
Epoch: 3, step: 997, loss: 0.36093589663505554, mean loss: 0.40879796956426584
Epoch: 3, step: 998, loss: 0.331773579120636, mean loss: 0.40878352116988514
Epoch: 3, step: 999, loss: 0.3830486536026001, mean loss: 0.4087786946755927
Epoch: 3, step: 1000, loss: 0.3323083519935608, mean loss: 0.40876435559014695
Epoch: 3, step: 1001, loss: 0.3799827992916107, mean loss: 0.4087589597228244
Epoch: 3, step: 1002, loss: 0.3680780231952667, mean loss: 0.40875133443012945
Epoch: 3, step: 1003, loss: 0.36598891019821167, mean loss: 0.40874332048255974
Epoch: 3, step: 1004, loss: 0.362223356962204, mean loss: 0.4087346039819938
Epoch: 3, step: 1005, loss: 0.33635494112968445, mean loss: 0.40872104465961606
Epoch: 3, step: 1006, loss: 0.3385363221168518, mean loss: 0.40870789899141174
Epoch: 3, step: 1007, loss: 0.35343170166015625, mean loss: 0.4086975476435969
Epoch: 3, step: 1008, loss: 0.3924728333950043, mean loss: 0.40869450987646555
Epoch: 3, step: 1009, loss: 0.3968867361545563, mean loss: 0.408692299510737
Epoch: 3, step: 1010, loss: 0.36344966292381287, mean loss: 0.40868383186398666
Epoch: 3, step: 1011, loss: 0.33191555738449097, mean loss: 0.4086694665431634
Epoch: 3, step: 1012, loss: 0.3480176031589508, mean loss: 0.4086581191412206
Epoch: 3, step: 1013, loss: 0.3909439444541931, mean loss: 0.40865480560311973
Epoch: 3, step: 1014, loss: 0.3577772378921509, mean loss: 0.4086452904417749
Epoch: 3, step: 1015, loss: 0.33154910802841187, mean loss: 0.4086308745512713
Epoch: 3, step: 1016, loss: 0.34193524718284607, mean loss: 0.4086184057482486
Epoch: 3, step: 1017, loss: 0.4255545139312744, mean loss: 0.40862157137594635
Epoch: 3, step: 1018, loss: 0.39048993587493896, mean loss: 0.408618182918555
Epoch: 3, step: 1019, loss: 0.3479045331478119, mean loss: 0.4086068388135904
Epoch: 3, step: 1020, loss: 0.384187787771225, mean loss: 0.40860227706297536
Epoch: 3, step: 1021, loss: 0.3428759276866913, mean loss: 0.4085900009424344
Epoch: 3, step: 1022, loss: 0.32860898971557617, mean loss: 0.40857506517936687
Epoch: 3, step: 1023, loss: 0.35123202204704285, mean loss: 0.4085643588606342
Epoch: 3, step: 1024, loss: 0.3324790894985199, mean loss: 0.40855015589827426
Epoch: 3, step: 1025, loss: 0.34071168303489685, mean loss: 0.40853749474245804
Epoch: 3, step: 1026, loss: 0.37394484877586365, mean loss: 0.40853103968629706
Epoch: 3, step: 1027, loss: 0.37589946389198303, mean loss: 0.40852495170573844
Epoch: 3, step: 1028, loss: 0.34787246584892273, mean loss: 0.4085136380542076
Epoch: 3, step: 1029, loss: 0.3412494361400604, mean loss: 0.40850109344363056
Epoch: 3, step: 1030, loss: 0.3682229518890381, mean loss: 0.40849358306855044
Epoch: 3, step: 1031, loss: 0.3437640368938446, mean loss: 0.40848151566620616
Epoch: 3, step: 1032, loss: 0.35603997111320496, mean loss: 0.4084717409141926
Epoch: 3, step: 1033, loss: 0.34096550941467285, mean loss: 0.40845916055051396
Epoch: 3, step: 1034, loss: 0.32296761870384216, mean loss: 0.4084432314389346
Epoch: 3, step: 1035, loss: 0.3564353585243225, mean loss: 0.40843354293801903
Epoch: 3, step: 1036, loss: 0.3628474771976471, mean loss: 0.40842505233162296
Epoch: 3, step: 1037, loss: 0.3344574570655823, mean loss: 0.4084112781053164
Epoch: 3, step: 1038, loss: 0.35111483931541443, mean loss: 0.4084006103639666
Epoch: 3, step: 1039, loss: 0.35211995244026184, mean loss: 0.4083901336964454
Epoch: 3, step: 1040, loss: 0.40964409708976746, mean loss: 0.4083903670788004
Epoch: 3, step: 1041, loss: 0.3665095567703247, mean loss: 0.40838257385023535
Epoch: 3, step: 1042, loss: 0.3725469410419464, mean loss: 0.4083759067557594
Epoch: 3, step: 1043, loss: 0.4001220762729645, mean loss: 0.40837437144502975
Epoch: 3, step: 1044, loss: 0.36173877120018005, mean loss: 0.40836569828151015
Epoch: 3, step: 1045, loss: 0.34980908036231995, mean loss: 0.4083548101041358
Epoch: 3, step: 1046, loss: 0.44122907519340515, mean loss: 0.4083609216983149
Epoch: 3, step: 1047, loss: 0.3915949761867523, mean loss: 0.4083578053515655
Epoch: 3, step: 1048, loss: 0.3756897449493408, mean loss: 0.4083517343498182
Epoch: 3, step: 1049, loss: 0.3689633905887604, mean loss: 0.40834441581697517
Epoch: 3, step: 1050, loss: 0.3766378164291382, mean loss: 0.40833852568147677
Epoch: 3, step: 1051, loss: 0.33869338035583496, mean loss: 0.40832559010470754
Epoch: 3, step: 1052, loss: 0.35559359192848206, mean loss: 0.40831579771878806
Epoch: 3, step: 1053, loss: 0.31608203053474426, mean loss: 0.4082986729940974
Epoch: 3, step: 1054, loss: 0.3399205207824707, mean loss: 0.40828597981566567
Epoch: 3, step: 1055, loss: 0.38561663031578064, mean loss: 0.4082817724382529
Epoch: 3, step: 1056, loss: 0.3565533459186554, mean loss: 0.40827217354671097
Epoch: 3, step: 1057, loss: 0.3195851445198059, mean loss: 0.4082557195524574
Epoch: 3, step: 1058, loss: 0.33588907122612, mean loss: 0.4082422959486128
Epoch: 3, step: 1059, loss: 0.36411532759666443, mean loss: 0.40823411216368105
Epoch: 3, step: 1060, loss: 0.34666916728019714, mean loss: 0.4082226964498143
Epoch: 3, step: 1061, loss: 0.3472454845905304, mean loss: 0.4082113918128363
Epoch: 3, step: 1062, loss: 0.4237683415412903, mean loss: 0.4082142753994403
Epoch: 3, step: 1063, loss: 0.3541436195373535, mean loss: 0.40820425489242357
Epoch: 3, step: 1064, loss: 0.3607109785079956, mean loss: 0.4081954549523857
Epoch: 3, step: 1065, loss: 0.33767858147621155, mean loss: 0.4081823914337721
Epoch: 3, step: 1066, loss: 0.37693408131599426, mean loss: 0.4081766036378622
Epoch: 3, step: 1067, loss: 0.3477238118648529, mean loss: 0.40816540867642276
Epoch: 3, step: 1068, loss: 0.3418198227882385, mean loss: 0.4081531247316184
Epoch: 3, step: 1069, loss: 0.38787150382995605, mean loss: 0.40814937026643855
Epoch: 3, step: 1070, loss: 0.3224961757659912, mean loss: 0.40813351737091746
Epoch: 3, step: 1071, loss: 0.36855068802833557, mean loss: 0.4081261926430598
Epoch: 3, step: 1072, loss: 0.4427516460418701, mean loss: 0.4081325988324028
Epoch: 3, step: 1073, loss: 0.41175758838653564, mean loss: 0.4081332693817099
Epoch: 3, step: 1074, loss: 0.41035178303718567, mean loss: 0.40813367968569647
Epoch: 3, step: 1075, loss: 0.34639665484428406, mean loss: 0.4081222638157184
Epoch: 3, step: 1076, loss: 0.3391484320163727, mean loss: 0.4081095121367021
Epoch: 3, step: 1077, loss: 0.3468819558620453, mean loss: 0.40809819465864766
Epoch: 3, step: 1078, loss: 0.4036405384540558, mean loss: 0.40809737084489706
Epoch: 3, step: 1079, loss: 0.39817601442337036, mean loss: 0.4080955376304807
Epoch: 3, step: 1080, loss: 0.36114203929901123, mean loss: 0.4080868634205543
Epoch: 3, step: 1081, loss: 0.3685210049152374, mean loss: 0.40807955535655255
Epoch: 3, step: 1082, loss: 0.390076220035553, mean loss: 0.4080762306408885
Epoch: 3, step: 1083, loss: 0.3785124719142914, mean loss: 0.40807077204437325
Epoch: 3, step: 1084, loss: 0.36746522784233093, mean loss: 0.4080632760975019
Epoch: 3, step: 1085, loss: 0.376681923866272, mean loss: 0.40805748404282655
Epoch: 3, step: 1086, loss: 0.4230179786682129, mean loss: 0.40806024479105046
Epoch: 3, step: 1087, loss: 0.3569175601005554, mean loss: 0.40805080887136586
Epoch: 3, step: 1088, loss: 0.3703138828277588, mean loss: 0.4080438476232486
Epoch: 3, step: 1089, loss: 0.3773423135280609, mean loss: 0.4080381852230097
Epoch: 3, step: 1090, loss: 0.36655089259147644, mean loss: 0.40803053497542874
Epoch: 3, step: 1091, loss: 0.3594135046005249, mean loss: 0.4080215716586192
Epoch: 3, step: 1092, loss: 0.3723032474517822, mean loss: 0.4080149876357239
Epoch: 3, step: 1093, loss: 0.3961292505264282, mean loss: 0.40801279712022276
Epoch: 3, step: 1094, loss: 0.3463832139968872, mean loss: 0.40800144101498537
Epoch: 3, step: 1095, loss: 0.37963229417800903, mean loss: 0.40799621456936325
Epoch: 3, step: 1096, loss: 0.33515673875808716, mean loss: 0.4079827978304037
Epoch: 3, step: 1097, loss: 0.36880895495414734, mean loss: 0.40797558349469903
Epoch: 3, step: 1098, loss: 0.3832301199436188, mean loss: 0.40797102715819544
Epoch: 3, step: 1099, loss: 0.38887956738471985, mean loss: 0.40796751253010755
Epoch: 3, step: 1100, loss: 0.39554789662361145, mean loss: 0.40796522657098616
Epoch: 3, step: 1101, loss: 0.4236202836036682, mean loss: 0.40796810751633633
Epoch: 3, step: 1102, loss: 0.35000738501548767, mean loss: 0.40795744316997
Epoch: 3, step: 1103, loss: 0.35534578561782837, mean loss: 0.4079477647929369
Epoch: 3, step: 1104, loss: 0.3554174304008484, mean loss: 0.40793810315335766
Epoch: 3, step: 1105, loss: 0.34510213136672974, mean loss: 0.40792654817509605
Epoch: 3, step: 1106, loss: 0.3492051959037781, mean loss: 0.4079157518242464
Epoch: 3, step: 1107, loss: 0.3642745018005371, mean loss: 0.4079077295356391
Epoch: 3, step: 1108, loss: 0.3298240303993225, mean loss: 0.40789337855252267
Epoch: 3, step: 1109, loss: 0.38623932003974915, mean loss: 0.4078893994899514
Epoch: 3, step: 1110, loss: 0.3239864408969879, mean loss: 0.40787398465280406
Epoch: 3, step: 1111, loss: 0.3840053379535675, mean loss: 0.40786960025774543
Epoch: 3, step: 1112, loss: 0.34375473856925964, mean loss: 0.40785782526019015
Epoch: 3, step: 1113, loss: 0.36221548914909363, mean loss: 0.4078494443685062
Epoch: 3, step: 1114, loss: 0.3922211527824402, mean loss: 0.40784657521271656
Epoch: 3, step: 1115, loss: 0.3815426230430603, mean loss: 0.4078417470276634
Epoch: 3, step: 1116, loss: 0.37182003259658813, mean loss: 0.40783513632580415
Epoch: 3, step: 1117, loss: 0.38949817419052124, mean loss: 0.4078317717455958
Epoch: 3, step: 1118, loss: 0.3732565641403198, mean loss: 0.40782542883464273
Epoch: 3, step: 1119, loss: 0.32837751507759094, mean loss: 0.4078108565834034
Epoch: 3, step: 1120, loss: 0.3640734553337097, mean loss: 0.40780283578728205
Epoch: 3, step: 1121, loss: 0.36381566524505615, mean loss: 0.40779477066617054
Epoch: 3, step: 1122, loss: 0.37616127729415894, mean loss: 0.4077889716756349
Epoch: 3, step: 1123, loss: 0.3465081453323364, mean loss: 0.4077777398526247
Epoch: 3, step: 1124, loss: 0.38351303339004517, mean loss: 0.40777329332404444
Epoch: 3, step: 1125, loss: 0.3465133309364319, mean loss: 0.4077620694394003
Epoch: 3, step: 1126, loss: 0.44409245252609253, mean loss: 0.4077687245746058
Epoch: 3, step: 1127, loss: 0.4110785722732544, mean loss: 0.407769330773818
Epoch: 3, step: 1128, loss: 0.36623311042785645, mean loss: 0.40776172480048967
Epoch: 3, step: 1129, loss: 0.3930020034313202, mean loss: 0.40775902254465496
Epoch: 3, step: 1130, loss: 0.390995055437088, mean loss: 0.4077559539070735
Epoch: 3, step: 1131, loss: 0.3438819646835327, mean loss: 0.4077442639383283
Epoch: 3, step: 1132, loss: 0.35827577114105225, mean loss: 0.4077352120640744
Epoch: 3, step: 1133, loss: 0.40113499760627747, mean loss: 0.4077340045605146
Epoch: 3, step: 1134, loss: 0.33497145771980286, mean loss: 0.40772069515008097
Epoch: 3, step: 1135, loss: 0.3389819860458374, mean loss: 0.40770812406209556
Epoch: 3, step: 1136, loss: 0.3798355162143707, mean loss: 0.40770302758964216
Epoch: 3, step: 1137, loss: 0.3696270287036896, mean loss: 0.4076960667123321
Epoch: 3, step: 1138, loss: 0.40757855772972107, mean loss: 0.40769604523381214
Epoch: 3, step: 1139, loss: 0.35483598709106445, mean loss: 0.40768638513546734
Epoch: 3, step: 1140, loss: 0.3977867662906647, mean loss: 0.40768457632515404
Epoch: 3, step: 1141, loss: 0.32437047362327576, mean loss: 0.40766935635754314
Epoch: 3, step: 1142, loss: 0.3499363362789154, mean loss: 0.40765881151369315
Epoch: 3, step: 1143, loss: 0.3487549424171448, mean loss: 0.4076480547808413
Epoch: 3, step: 1144, loss: 0.3590182363986969, mean loss: 0.40763917586567205
Epoch: 3, step: 1145, loss: 0.3519989550113678, mean loss: 0.4076290188337527
Epoch: 3, step: 1146, loss: 0.36948361992836, mean loss: 0.4076220567240784
Epoch: 3, step: 1147, loss: 0.3320453464984894, mean loss: 0.4076082653535993
Epoch: 3, step: 1148, loss: 0.39402827620506287, mean loss: 0.40760578770551525
Epoch: 3, step: 1149, loss: 0.3375609517097473, mean loss: 0.40759301046436314
Epoch: 3, step: 1150, loss: 0.3680431544780731, mean loss: 0.4075857972861785
Epoch: 3, step: 1151, loss: 0.3483012914657593, mean loss: 0.4075749868365395
Epoch: 3, step: 1152, loss: 0.3389517068862915, mean loss: 0.4075624757554182
Epoch: 3, step: 1153, loss: 0.3585124611854553, mean loss: 0.40755353481218637
Epoch: 3, step: 1154, loss: 0.3816979229450226, mean loss: 0.4075488226540185
Epoch: 3, step: 1155, loss: 0.36670565605163574, mean loss: 0.4075413803860516
Epoch: 3, step: 1156, loss: 0.3580745756626129, mean loss: 0.40753236839757945
Epoch: 3, step: 1157, loss: 0.3644750118255615, mean loss: 0.4075245255275299
Epoch: 3, step: 1158, loss: 0.33585864305496216, mean loss: 0.4075114740100517
Epoch: 3, step: 1159, loss: 0.36044344305992126, mean loss: 0.4075029037203667
Epoch: 3, step: 1160, loss: 0.3778151571750641, mean loss: 0.4074974990696211
Epoch: 3, step: 1161, loss: 0.3396209478378296, mean loss: 0.4074851444006674
Epoch: 3, step: 1162, loss: 0.40437060594558716, mean loss: 0.40748457760568013
Epoch: 3, step: 1163, loss: 0.3970486521720886, mean loss: 0.4074826787837308
Epoch: 3, step: 1164, loss: 0.38913601636886597, mean loss: 0.40747934120643137
Epoch: 3, step: 1165, loss: 0.3518230617046356, mean loss: 0.407469218201793
Epoch: 3, step: 1166, loss: 0.40167495608329773, mean loss: 0.40746816450800893
Epoch: 3, step: 1167, loss: 0.41889381408691406, mean loss: 0.40747024189884146
Epoch: 3, step: 1168, loss: 0.3836611807346344, mean loss: 0.4074659137655631
Epoch: 3, step: 1169, loss: 0.3479151427745819, mean loss: 0.40745509028846555
Epoch: 3, step: 1170, loss: 0.38981086015701294, mean loss: 0.4074518839955105
Epoch: 3, step: 1171, loss: 0.39708808064460754, mean loss: 0.40745000103705287
Epoch: 3, step: 1172, loss: 0.34353435039520264, mean loss: 0.4074383905646384
Epoch: 3, step: 1173, loss: 0.3558332920074463, mean loss: 0.4074290180440141
Epoch: 3, step: 1174, loss: 0.3982385993003845, mean loss: 0.40742734918279316
Epoch: 3, step: 1175, loss: 0.32807883620262146, mean loss: 0.4074129431346849
Epoch: 3, step: 1176, loss: 0.363008975982666, mean loss: 0.40740488287562665
Epoch: 3, step: 1177, loss: 0.34690120816230774, mean loss: 0.4073939021724119
Epoch: 3, step: 1178, loss: 0.43110769987106323, mean loss: 0.4073982051660063
Epoch: 3, step: 1179, loss: 0.3460726737976074, mean loss: 0.40738707934391477
Epoch: 3, step: 1180, loss: 0.36130839586257935, mean loss: 0.4073787211571777
Epoch: 3, step: 1181, loss: 0.3851020932197571, mean loss: 0.4073746811448568
Epoch: 3, step: 1182, loss: 0.3398455083370209, mean loss: 0.4073624365079016
Epoch: 3, step: 1183, loss: 0.3603971600532532, mean loss: 0.40735392213581045
Epoch: 3, step: 1184, loss: 0.3511720895767212, mean loss: 0.40734373873313523
Epoch: 3, step: 1185, loss: 0.36370763182640076, mean loss: 0.40733583077610247
Epoch: 3, step: 1186, loss: 0.30816325545310974, mean loss: 0.4073178614745401
Epoch: 3, step: 1187, loss: 0.4265492856502533, mean loss: 0.4073213454281951
Epoch: 3, step: 1188, loss: 0.3437560796737671, mean loss: 0.40730983206725424
Epoch: 3, step: 1189, loss: 0.3239564001560211, mean loss: 0.40729473727697696
Epoch: 3, step: 1190, loss: 0.39169955253601074, mean loss: 0.40729191359695865
Epoch: 3, step: 1191, loss: 0.3189485967159271, mean loss: 0.4072759209617521
Epoch: 3, step: 1192, loss: 0.3636454641819, mean loss: 0.4072680240464978
Epoch: 3, step: 1193, loss: 0.35256633162498474, mean loss: 0.40725812507935677
Epoch: 3, step: 1194, loss: 0.3308623433113098, mean loss: 0.4072443027920819
Epoch: 3, step: 1195, loss: 0.37889569997787476, mean loss: 0.4072391746077812
Epoch: 3, step: 1196, loss: 0.39670294523239136, mean loss: 0.4072372689775813
Epoch: 3, step: 1197, loss: 0.36927053332328796, mean loss: 0.4072304033834304
Epoch: 3, step: 1198, loss: 0.37637588381767273, mean loss: 0.4072248249130696
Epoch: 3, step: 1199, loss: 0.4117913544178009, mean loss: 0.40722565038839587
Epoch: 3, step: 1200, loss: 0.37784090638160706, mean loss: 0.4072203395725624
Epoch: 3, step: 1201, loss: 0.3470504879951477, mean loss: 0.4072094668129712
Epoch: 3, step: 1202, loss: 0.34285399317741394, mean loss: 0.40719783980779767
Epoch: 3, step: 1203, loss: 0.33890852332115173, mean loss: 0.4071855043098774
Epoch: 3, step: 1204, loss: 0.3529672622680664, mean loss: 0.40717571232106725
Epoch: 3, step: 1205, loss: 0.321279913187027, mean loss: 0.40716020206481335
Epoch: 3, step: 1206, loss: 0.3809513449668884, mean loss: 0.4071554703700854
Epoch: 3, step: 1207, loss: 0.3629806637763977, mean loss: 0.40714749657828153
Epoch: 3, step: 1208, loss: 0.354928582906723, mean loss: 0.4071380724826902
Epoch: 3, step: 1209, loss: 0.33763816952705383, mean loss: 0.4071255319011392
Epoch: 3, step: 1210, loss: 0.35048964619636536, mean loss: 0.4071153143500469
Epoch: 3, step: 1211, loss: 0.3562416136264801, mean loss: 0.40710613799710255
Epoch: 3, step: 1212, loss: 0.409140944480896, mean loss: 0.4071065049594982
Epoch: 3, step: 1213, loss: 0.3441717326641083, mean loss: 0.40709515718230826
Epoch: 3, step: 1214, loss: 0.3240996301174164, mean loss: 0.40708019494559206
Epoch: 3, step: 1215, loss: 0.37656089663505554, mean loss: 0.40707469399059737
Epoch: 3, step: 1216, loss: 0.4385206997394562, mean loss: 0.40708036095865446
Epoch: 3, step: 1217, loss: 0.37729498744010925, mean loss: 0.4070749942246872
Epoch: 3, step: 1218, loss: 0.34603071212768555, mean loss: 0.4070639972363793
Epoch: 3, step: 1219, loss: 0.3863380551338196, mean loss: 0.40706026417764324
Epoch: 3, step: 1220, loss: 0.36843761801719666, mean loss: 0.4070533089019075
Epoch: 3, step: 1221, loss: 0.41865748167037964, mean loss: 0.40705539823801995
Epoch: 3, step: 1222, loss: 0.36763250827789307, mean loss: 0.40704830140814413
Epoch: 3, step: 1223, loss: 0.3171720802783966, mean loss: 0.40703212498245483
Epoch: 3, step: 1224, loss: 0.37725892663002014, mean loss: 0.4070267671997749
Epoch: 3, step: 1225, loss: 0.35901594161987305, mean loss: 0.40701812905195556
Epoch: 3, step: 1226, loss: 0.3867858648300171, mean loss: 0.40701448950091723
Epoch: 3, step: 1227, loss: 0.31124377250671387, mean loss: 0.40699726455181756
Epoch: 3, step: 1228, loss: 0.37531501054763794, mean loss: 0.4069915673293748
Epoch: 3, step: 1229, loss: 0.321571409702301, mean loss: 0.4069762095160654
Epoch: 3, step: 1230, loss: 0.3716062009334564, mean loss: 0.40696985143435
Epoch: 3, step: 1231, loss: 0.36255913972854614, mean loss: 0.4069618696385725
Epoch: 3, step: 1232, loss: 0.3832659125328064, mean loss: 0.40695761160495064
Epoch: 3, step: 1233, loss: 0.31825506687164307, mean loss: 0.40694167510751383
Epoch: 3, step: 1234, loss: 0.37588343024253845, mean loss: 0.40693609611616033
Epoch: 3, step: 1235, loss: 0.3488105535507202, mean loss: 0.4069256569023375
Epoch: 3, step: 1236, loss: 0.31435272097587585, mean loss: 0.4069090340012913
Epoch: 3, step: 1237, loss: 0.35997435450553894, mean loss: 0.40690060766745006
Epoch: 3, step: 1238, loss: 0.3506481349468231, mean loss: 0.40689051029306117
Epoch: 3, step: 1239, loss: 0.382420152425766, mean loss: 0.4068861186279737
Epoch: 3, step: 1240, loss: 0.36901140213012695, mean loss: 0.40687932251878695
Epoch: 3, step: 1241, loss: 0.3763517737388611, mean loss: 0.4068738457429025
Epoch: 3, step: 1242, loss: 0.40024641156196594, mean loss: 0.4068726569654709
Epoch: 3, step: 1243, loss: 0.39226675033569336, mean loss: 0.4068700375417568
Epoch: 3, step: 1244, loss: 0.3525242209434509, mean loss: 0.40686029290905135
Epoch: 3, step: 1245, loss: 0.37723758816719055, mean loss: 0.40685498227715067
Epoch: 3, step: 1246, loss: 0.34214043617248535, mean loss: 0.4068433826094495
Epoch: 3, step: 1247, loss: 0.35992148518562317, mean loss: 0.40683497366725885
Epoch: 3, step: 1248, loss: 0.3742631673812866, mean loss: 0.4068291374719021
Epoch: 3, step: 1249, loss: 0.33469358086586, mean loss: 0.4068162145846563
Epoch: 3, step: 1250, loss: 0.3533354103565216, mean loss: 0.4068066353612588
Epoch: 3, step: 1251, loss: 0.35125571489334106, mean loss: 0.406796687130516
Epoch: 3, step: 1252, loss: 0.4078657627105713, mean loss: 0.40679687854959923
Epoch: 3, step: 1253, loss: 0.36772769689559937, mean loss: 0.4067898844247059
Epoch: 3, step: 1254, loss: 0.3819698393344879, mean loss: 0.40678544196093464
Epoch: 3, step: 1255, loss: 0.36732012033462524, mean loss: 0.40677837944811673
Epoch: 3, step: 1256, loss: 0.3437611758708954, mean loss: 0.40676710422829615
Epoch: 3, step: 1257, loss: 0.3726164698600769, mean loss: 0.40676099499137874
Epoch: 3, step: 1258, loss: 0.3706109821796417, mean loss: 0.4067545292405628
Epoch: 3, step: 1259, loss: 0.334394633769989, mean loss: 0.4067415893450924
Epoch: 3, step: 1260, loss: 0.36447852849960327, mean loss: 0.40673403292441557
Epoch: 3, step: 1261, loss: 0.31679096817970276, mean loss: 0.40671795443590203
Epoch: 3, step: 1262, loss: 0.3542541265487671, mean loss: 0.4067085775229642
Epoch: 3, step: 1263, loss: 0.36114317178726196, mean loss: 0.4067004350273002
Epoch: 3, step: 1264, loss: 0.30939432978630066, mean loss: 0.4066830496234694
Epoch: 3, step: 1265, loss: 0.3442758321762085, mean loss: 0.4066719014960226
Epoch: 3, step: 1266, loss: 0.3411775827407837, mean loss: 0.40666020399311936
Epoch: 3, step: 1267, loss: 0.3465515375137329, mean loss: 0.4066494703026766
Epoch: 3, step: 1268, loss: 0.3142591714859009, mean loss: 0.406632974980624
Epoch: 3, step: 1269, loss: 0.3966749310493469, mean loss: 0.406631197393346
Epoch: 3, step: 1270, loss: 0.3413151204586029, mean loss: 0.40661954005318274
Epoch: 3, step: 1271, loss: 0.39219930768013, mean loss: 0.40661696684969006
Epoch: 3, step: 1272, loss: 0.3471861481666565, mean loss: 0.4066063636706208
Epoch: 3, step: 1273, loss: 0.360361784696579, mean loss: 0.4065981145484349
Epoch: 3, step: 1274, loss: 0.33013033866882324, mean loss: 0.4065844766358471
Epoch: 3, step: 1275, loss: 0.3683891296386719, mean loss: 0.4065776657679803
Epoch: 3, step: 1276, loss: 0.35997164249420166, mean loss: 0.4065693566178156
Epoch: 3, step: 1277, loss: 0.35089629888534546, mean loss: 0.4065594327216066
Epoch: 3, step: 1278, loss: 0.3635929524898529, mean loss: 0.4065517751774555
Epoch: 3, step: 1279, loss: 0.40989890694618225, mean loss: 0.40655237160150554
Epoch: 3, step: 1280, loss: 0.3545199930667877, mean loss: 0.40654310162492713
Epoch: 3, step: 1281, loss: 0.3836715817451477, mean loss: 0.40653902760998595
Epoch: 3, step: 1282, loss: 0.3894806206226349, mean loss: 0.4065359896033987
Epoch: 3, step: 1283, loss: 0.34362947940826416, mean loss: 0.4065247883017258
Epoch: 3, step: 1284, loss: 0.3737507164478302, mean loss: 0.4065189535016806
Epoch: 3, step: 1285, loss: 0.3511616587638855, mean loss: 0.4065090999426315
Epoch: 3, step: 1286, loss: 0.34362319111824036, mean loss: 0.40649790828774196
Epoch: 3, step: 1287, loss: 0.40261125564575195, mean loss: 0.40649721671253874
Epoch: 3, step: 1288, loss: 0.34448209404945374, mean loss: 0.4064861839563276
Epoch: 3, step: 1289, loss: 0.37938517332077026, mean loss: 0.4064813634279328
Epoch: 3, step: 1290, loss: 0.3382248282432556, mean loss: 0.4064692246167671
Epoch: 3, step: 1291, loss: 0.3243599832057953, mean loss: 0.4064546248227751
Epoch: 3, step: 1292, loss: 0.3504520654678345, mean loss: 0.40644466881222313
Epoch: 3, step: 1293, loss: 0.3767058253288269, mean loss: 0.4064393828464422
Epoch: 3, step: 1294, loss: 0.45374247431755066, mean loss: 0.40644778929596614
Epoch: 3, step: 1295, loss: 0.36284908652305603, mean loss: 0.4064400425470726
Epoch: 3, step: 1296, loss: 0.38339248299598694, mean loss: 0.40643594811474876
Epoch: 3, step: 1297, loss: 0.331849068403244, mean loss: 0.4064227000011233
Epoch: 3, step: 1298, loss: 0.33897602558135986, mean loss: 0.4064107222574863
Epoch: 3, step: 1299, loss: 0.37007707357406616, mean loss: 0.40640427097043313
Epoch: 3, step: 1300, loss: 0.39902809262275696, mean loss: 0.40640296151217864
Epoch: 3, step: 1301, loss: 0.38026708364486694, mean loss: 0.40639832255622066
Epoch: 3, step: 1302, loss: 0.3639373779296875, mean loss: 0.40639078733978296
Epoch: 3, step: 1303, loss: 0.38379016518592834, mean loss: 0.4063867772932688
Epoch: 3, step: 1304, loss: 0.4281839430332184, mean loss: 0.4063906440957772
Epoch: 3, step: 1305, loss: 0.3186548054218292, mean loss: 0.4063750825777435
Epoch: 3, step: 1306, loss: 0.37448936700820923, mean loss: 0.40636942807950455
Epoch: 3, step: 1307, loss: 0.3276916444301605, mean loss: 0.4063554781178646
Epoch: 3, step: 1308, loss: 0.3509092628955841, mean loss: 0.40634564897139724
Epoch: 3, step: 1309, loss: 0.3992583453655243, mean loss: 0.4063443928027326
Epoch: 3, step: 1310, loss: 0.3684985339641571, mean loss: 0.40633768611146226
Epoch: 3, step: 1311, loss: 0.3786032497882843, mean loss: 0.40633277214329727
Epoch: 3, step: 1312, loss: 0.3473142385482788, mean loss: 0.4063223171329173
Epoch: 3, step: 1313, loss: 0.37382861971855164, mean loss: 0.4063165619615722
Epoch: 3, step: 1314, loss: 0.3646697998046875, mean loss: 0.40630918693728374
Epoch: 3, step: 1315, loss: 0.3456920385360718, mean loss: 0.4062984544393374
Epoch: 3, step: 1316, loss: 0.3851172626018524, mean loss: 0.40629470489218966
Epoch: 3, step: 1317, loss: 0.36295145750045776, mean loss: 0.4062870335209699
Epoch: 3, step: 1318, loss: 0.33996888995170593, mean loss: 0.4062752978735501
Epoch: 3, step: 1319, loss: 0.3601258099079132, mean loss: 0.4062671327129051
Epoch: 3, step: 1320, loss: 0.4268806576728821, mean loss: 0.40627077918822085
Epoch: 3, step: 1321, loss: 0.4338279664516449, mean loss: 0.4062756531159293
Epoch: 3, step: 1322, loss: 0.3232373297214508, mean loss: 0.4062609690622786
Epoch: 3, step: 1323, loss: 0.37239763140678406, mean loss: 0.40625498190922776
Epoch: 3, step: 1324, loss: 0.3272198736667633, mean loss: 0.40624101070395247
Epoch: 3, step: 1325, loss: 0.3056736886501312, mean loss: 0.40622323634515894
Epoch: 3, step: 1326, loss: 0.3851531147956848, mean loss: 0.40621951305101694
Epoch: 3, step: 1327, loss: 0.3733808994293213, mean loss: 0.4062137111758188
Epoch: 3, step: 1328, loss: 0.3551514148712158, mean loss: 0.40620469116233976
Epoch: 3, step: 1329, loss: 0.35409778356552124, mean loss: 0.40619548824683344
Epoch: 3, step: 1330, loss: 0.3525821268558502, mean loss: 0.40618602093950673
Epoch: 3, step: 1331, loss: 0.3466273844242096, mean loss: 0.4061755056435118
Epoch: 3, step: 1332, loss: 0.3273577094078064, mean loss: 0.40616159252855405
Epoch: 3, step: 1333, loss: 0.3879394829273224, mean loss: 0.4061583764837956
Epoch: 3, step: 1334, loss: 0.34479114413261414, mean loss: 0.40614754760919686
Epoch: 3, step: 1335, loss: 0.35492971539497375, mean loss: 0.4061385112944096
Epoch: 3, step: 1336, loss: 0.3699415624141693, mean loss: 0.4061321262266939
Epoch: 3, step: 1337, loss: 0.3428484797477722, mean loss: 0.40612096508974876
Epoch: 3, step: 1338, loss: 0.35026371479034424, mean loss: 0.406111115460001
Epoch: 3, step: 1339, loss: 0.3461378812789917, mean loss: 0.4061005418996729
Epoch: 3, step: 1340, loss: 0.36415258049964905, mean loss: 0.4060931475824862
Epoch: 3, step: 1341, loss: 0.40746957063674927, mean loss: 0.4060933901667397
Epoch: 3, step: 1342, loss: 0.35465818643569946, mean loss: 0.4060843266947166
Epoch: 3, step: 1343, loss: 0.40297141671180725, mean loss: 0.4060837782609635
Epoch: 3, step: 1344, loss: 0.3439314067363739, mean loss: 0.4060728301595852
Epoch: 3, step: 1345, loss: 0.33189183473587036, mean loss: 0.40605976552495615
Epoch: 3, step: 1346, loss: 0.3420346677303314, mean loss: 0.4060484915158358
Epoch: 3, step: 1347, loss: 0.3566814363002777, mean loss: 0.4060398001328753
Epoch: 3, step: 1348, loss: 0.3321211338043213, mean loss: 0.406026788573937
Epoch: 3, step: 1349, loss: 0.3520132005214691, mean loss: 0.40601728248663455
Epoch: 3, step: 1350, loss: 0.3660416305065155, mean loss: 0.40601024823501036
Epoch: 3, step: 1351, loss: 0.34517160058021545, mean loss: 0.40599954474316396
Epoch: 3, step: 1352, loss: 0.33136609196662903, mean loss: 0.4059864166072314
Epoch: 3, step: 1353, loss: 0.4105919301509857, mean loss: 0.40598722658147407
Epoch: 3, step: 1354, loss: 0.3527625799179077, mean loss: 0.40597786757907145
Epoch: 3, step: 1355, loss: 0.3847567141056061, mean loss: 0.40597413671523996
Epoch: 3, step: 1356, loss: 0.3706497550010681, mean loss: 0.40596792747254107
Epoch: 3, step: 1357, loss: 0.3577517867088318, mean loss: 0.405959453634094
Epoch: 3, step: 1358, loss: 0.3359082043170929, mean loss: 0.40594714450576563
Epoch: 3, step: 1359, loss: 0.4071296155452728, mean loss: 0.4059473522483938
Epoch: 3, step: 1360, loss: 0.3629515767097473, mean loss: 0.40593979985500916
Epoch: 3, step: 1361, loss: 0.3980794847011566, mean loss: 0.40593841939923925
Epoch: 3, step: 1362, loss: 0.39349472522735596, mean loss: 0.40593623437831355
Epoch: 3, step: 1363, loss: 0.3266368508338928, mean loss: 0.4059223124359778
Epoch: 3, step: 1364, loss: 0.36660727858543396, mean loss: 0.40591541142950943
Epoch: 3, step: 1365, loss: 0.3708190321922302, mean loss: 0.40590925200879385
Epoch: 3, step: 1366, loss: 0.4082931578159332, mean loss: 0.40590967031126923
Epoch: 3, step: 1367, loss: 0.34098920226097107, mean loss: 0.4058982807554709
Epoch: 3, step: 1368, loss: 0.35053470730781555, mean loss: 0.4058885695515685
Epoch: 3, step: 1369, loss: 0.326922208070755, mean loss: 0.40587472066319935
Epoch: 3, step: 1370, loss: 0.36308446526527405, mean loss: 0.4058672175498559
Epoch: 3, step: 1371, loss: 0.3682766854763031, mean loss: 0.40586062734437317
Epoch: 3, step: 1372, loss: 0.33338531851768494, mean loss: 0.4058479235216165
Epoch: 3, step: 1373, loss: 0.3441808521747589, mean loss: 0.4058371161133889
Epoch: 3, step: 1374, loss: 0.32249951362609863, mean loss: 0.4058225134145126
Epoch: 3, step: 1375, loss: 0.37287887930870056, mean loss: 0.405816741929911
Epoch: 3, step: 1376, loss: 0.39423519372940063, mean loss: 0.40581471328247704
Epoch: 3, step: 1377, loss: 0.36152535676956177, mean loss: 0.4058069568277462
Epoch: 3, step: 1378, loss: 0.34423068165779114, mean loss: 0.405796174779914
Epoch: 3, step: 1379, loss: 0.3617725968360901, mean loss: 0.4057884675708902
Epoch: 3, step: 1380, loss: 0.3310772478580475, mean loss: 0.4057753901650241
Epoch: 3, step: 1381, loss: 0.3697337806224823, mean loss: 0.40576908256797434
Epoch: 3, step: 1382, loss: 0.3544428050518036, mean loss: 0.405760101592031
Epoch: 3, step: 1383, loss: 0.38170742988586426, mean loss: 0.405755893636869
Epoch: 3, step: 1384, loss: 0.38194453716278076, mean loss: 0.4057517286278653
Epoch: 3, step: 1385, loss: 0.3934275805950165, mean loss: 0.4057495733029208
Epoch: 3, step: 1386, loss: 0.36945709586143494, mean loss: 0.40574322735477575
Epoch: 3, step: 1387, loss: 0.3385239243507385, mean loss: 0.4057314757283764
Epoch: 3, step: 1388, loss: 0.35019049048423767, mean loss: 0.4057217674631703
Epoch: 3, step: 1389, loss: 0.41090530157089233, mean loss: 0.40572267335868023
Epoch: 3, step: 1390, loss: 0.399274080991745, mean loss: 0.4057215465733636
Epoch: 3, step: 1391, loss: 0.3765201270580292, mean loss: 0.4057164449976272
Epoch: 3, step: 1392, loss: 0.34585216641426086, mean loss: 0.4057059883550799
Epoch: 3, step: 1393, loss: 0.36270830035209656, mean loss: 0.40569847915354257
Epoch: 3, step: 1394, loss: 0.4050976634025574, mean loss: 0.4056983742442094
Epoch: 3, step: 1395, loss: 0.36648762226104736, mean loss: 0.4056915287916984
Epoch: 3, step: 1396, loss: 0.33867090940475464, mean loss: 0.405679830306904
Epoch: 3, step: 1397, loss: 0.38129204511642456, mean loss: 0.40567557414893013
Epoch: 3, step: 1398, loss: 0.3256050944328308, mean loss: 0.40566160268152196
Epoch: 3, step: 1399, loss: 0.3102157413959503, mean loss: 0.4056449512751567
Epoch: 3, step: 1400, loss: 0.34742358326911926, mean loss: 0.4056347957949533
Epoch: 3, step: 1401, loss: 0.33103495836257935, mean loss: 0.40562178570820195
Epoch: 3, step: 1402, loss: 0.3753245174884796, mean loss: 0.4056165028366728
Epoch: 3, step: 1403, loss: 0.3429321348667145, mean loss: 0.40560557459957897
Epoch: 3, step: 1404, loss: 0.3487365245819092, mean loss: 0.40559566191873225
Epoch: 3, step: 1405, loss: 0.3700394332408905, mean loss: 0.40558946529470336
Epoch: 3, step: 1406, loss: 0.35954979062080383, mean loss: 0.40558144304785304
Epoch: 3, step: 1407, loss: 0.3752119839191437, mean loss: 0.40557615220131493
Epoch: 3, step: 1408, loss: 0.3513187766075134, mean loss: 0.405566701343347
Epoch: 3, step: 1409, loss: 0.3602440059185028, mean loss: 0.40555880815361783
Epoch: 3, step: 1410, loss: 0.3362620174884796, mean loss: 0.405546741848435
Epoch: 3, step: 1411, loss: 0.3295462131500244, mean loss: 0.4055335105586198
Epoch: 3, step: 1412, loss: 0.35152214765548706, mean loss: 0.40552410910293607
Epoch: 3, step: 1413, loss: 0.32756176590919495, mean loss: 0.40551054099587136
Epoch: 3, step: 1414, loss: 0.3501586318016052, mean loss: 0.4055009095517798
Epoch: 3, step: 1415, loss: 0.3774019479751587, mean loss: 0.40549602107551386
Epoch: 3, step: 1416, loss: 0.37464815378189087, mean loss: 0.40549065529584893
Epoch: 3, step: 1417, loss: 0.3641839325428009, mean loss: 0.40548347151797887
Epoch: 3, step: 1418, loss: 0.3618941605091095, mean loss: 0.4054758920864002
Epoch: 3, step: 1419, loss: 0.3671574294567108, mean loss: 0.40546923032307797
Epoch: 3, step: 1420, loss: 0.37498265504837036, mean loss: 0.4054639310748119
Epoch: 3, step: 1421, loss: 0.3646487891674042, mean loss: 0.40545683772376784
Epoch: 3, step: 1422, loss: 0.3288032114505768, mean loss: 0.4054435182404884
Epoch: 3, step: 1423, loss: 0.3420732021331787, mean loss: 0.40543250880405557
Epoch: 3, step: 1424, loss: 0.3789002299308777, mean loss: 0.40542790010527613
Epoch: 3, step: 1425, loss: 0.37584882974624634, mean loss: 0.40542276306631136
Epoch: 3, step: 1426, loss: 0.3420751094818115, mean loss: 0.40541176330010464
Epoch: 3, step: 1427, loss: 0.34346798062324524, mean loss: 0.40540100917116767
Epoch: 3, step: 1428, loss: 0.3786188066005707, mean loss: 0.4053963602903188
Epoch: 3, step: 1429, loss: 0.32739880681037903, mean loss: 0.4053828237485833
Epoch: 3, step: 1430, loss: 0.32544124126434326, mean loss: 0.40536895222637537
Epoch: 3, step: 1431, loss: 0.36699801683425903, mean loss: 0.4053622952285627
Epoch: 3, step: 1432, loss: 0.34098973870277405, mean loss: 0.40535112913029286
Epoch: 3, step: 1433, loss: 0.34847068786621094, mean loss: 0.40534126432951867
Epoch: 3, step: 1434, loss: 0.34005117416381836, mean loss: 0.40532994300297703
Epoch: 3, step: 1435, loss: 0.40154558420181274, mean loss: 0.4053292869074845
Epoch: 3, step: 1436, loss: 0.36965951323509216, mean loss: 0.4053231038993943
Epoch: 3, step: 1437, loss: 0.4208843410015106, mean loss: 0.40532580082090247
Epoch: 3, step: 1438, loss: 0.3436751961708069, mean loss: 0.4053151179921639
Epoch: 3, step: 1439, loss: 0.36541736125946045, mean loss: 0.4053082056988977
Epoch: 3, step: 1440, loss: 0.39214012026786804, mean loss: 0.4053059247209952
Epoch: 3, step: 1441, loss: 0.350843220949173, mean loss: 0.4052964923164625
Epoch: 3, step: 1442, loss: 0.34641194343566895, mean loss: 0.4052862958577818
Epoch: 3, step: 1443, loss: 0.3055371046066284, mean loss: 0.40526902626095856
Valid: 3, mean loss: 0.23315159479777017
Epoch: 4, step: 0, loss: 0.35910943150520325, mean loss: 0.405261036024719
Epoch: 4, step: 1, loss: 0.3238067030906677, mean loss: 0.4052469387016083
Epoch: 4, step: 2, loss: 0.3574736714363098, mean loss: 0.40523867200022995
Epoch: 4, step: 3, loss: 0.32588449120521545, mean loss: 0.4052249429032066
Epoch: 4, step: 4, loss: 0.42570582032203674, mean loss: 0.40522848569466463
Epoch: 4, step: 5, loss: 0.3304414451122284, mean loss: 0.4052155512358991
Epoch: 4, step: 6, loss: 0.3460922837257385, mean loss: 0.4052053276032672
Epoch: 4, step: 7, loss: 0.3728521168231964, mean loss: 0.40519973403293874
Epoch: 4, step: 8, loss: 0.397438645362854, mean loss: 0.40519839244457745
Epoch: 4, step: 9, loss: 0.3295552730560303, mean loss: 0.4051853189707806
Epoch: 4, step: 10, loss: 0.35524269938468933, mean loss: 0.4051766888308832
Epoch: 4, step: 11, loss: 0.41957443952560425, mean loss: 0.4051791763482804
Epoch: 4, step: 12, loss: 0.3976755142211914, mean loss: 0.4051778801551335
Epoch: 4, step: 13, loss: 0.41244709491729736, mean loss: 0.4051791356326399
Epoch: 4, step: 14, loss: 0.3658272922039032, mean loss: 0.4051723402875477
Epoch: 4, step: 15, loss: 0.3582893908023834, mean loss: 0.40516424585566146
Epoch: 4, step: 16, loss: 0.3255387246608734, mean loss: 0.40515050072857794
Epoch: 4, step: 17, loss: 0.3410910367965698, mean loss: 0.4051394445559973
Epoch: 4, step: 18, loss: 0.36609938740730286, mean loss: 0.4051327077040303
Epoch: 4, step: 19, loss: 0.34603795409202576, mean loss: 0.40512251192183363
Epoch: 4, step: 20, loss: 0.3784448206424713, mean loss: 0.40511790993955327
Epoch: 4, step: 21, loss: 0.3603270649909973, mean loss: 0.40511018471620924
Epoch: 4, step: 22, loss: 0.32388007640838623, mean loss: 0.40509617711001716
Epoch: 4, step: 23, loss: 0.36435118317604065, mean loss: 0.40508915211106306
Epoch: 4, step: 24, loss: 0.3768641948699951, mean loss: 0.40508428657800993
Epoch: 4, step: 25, loss: 0.3416685163974762, mean loss: 0.4050733565934907
Epoch: 4, step: 26, loss: 0.3412359952926636, mean loss: 0.405062355841931
Epoch: 4, step: 27, loss: 0.4226667881011963, mean loss: 0.40506538899704114
Epoch: 4, step: 28, loss: 0.37993675470352173, mean loss: 0.40506106020560384
Epoch: 4, step: 29, loss: 0.38365015387535095, mean loss: 0.40505737248491314
Epoch: 4, step: 30, loss: 0.3235722482204437, mean loss: 0.40504334026099986
Epoch: 4, step: 31, loss: 0.36599645018577576, mean loss: 0.40503661731160673
Epoch: 4, step: 32, loss: 0.33797749876976013, mean loss: 0.40502507330772625
Epoch: 4, step: 33, loss: 0.40574127435684204, mean loss: 0.4050251965781306
Epoch: 4, step: 34, loss: 0.37907838821411133, mean loss: 0.40502073145881134
Epoch: 4, step: 35, loss: 0.3726222515106201, mean loss: 0.405015157047258
Epoch: 4, step: 36, loss: 0.3575948178768158, mean loss: 0.4050069994110683
Epoch: 4, step: 37, loss: 0.3753833770751953, mean loss: 0.40500190418878834
Epoch: 4, step: 38, loss: 0.3436807692050934, mean loss: 0.4049913588517318
Epoch: 4, step: 39, loss: 0.36270982027053833, mean loss: 0.40498408898608856
Epoch: 4, step: 40, loss: 0.37240171432495117, mean loss: 0.40497848775269313
Epoch: 4, step: 41, loss: 0.3564033508300781, mean loss: 0.40497013864012477
Epoch: 4, step: 42, loss: 0.3762328326702118, mean loss: 0.404965200110142
Epoch: 4, step: 43, loss: 0.37357980012893677, mean loss: 0.4049598074297328
Epoch: 4, step: 44, loss: 0.370850533246994, mean loss: 0.40495394773652155
Epoch: 4, step: 45, loss: 0.3459685742855072, mean loss: 0.40494381627423176
Epoch: 4, step: 46, loss: 0.35850951075553894, mean loss: 0.40493584198168175
Epoch: 4, step: 47, loss: 0.3389631509780884, mean loss: 0.4049245142531441
Epoch: 4, step: 48, loss: 0.3930809497833252, mean loss: 0.40492248102319217
Epoch: 4, step: 49, loss: 0.3446555435657501, mean loss: 0.404912136543711
Epoch: 4, step: 50, loss: 0.3710342347621918, mean loss: 0.4049063225911142
Epoch: 4, step: 51, loss: 0.41972076892852783, mean loss: 0.4049088645345489
Epoch: 4, step: 52, loss: 0.3735549747943878, mean loss: 0.40490348558623185
Epoch: 4, step: 53, loss: 0.3960060775279999, mean loss: 0.4049019594441978
Epoch: 4, step: 54, loss: 0.38368088006973267, mean loss: 0.40489832008913446
Epoch: 4, step: 55, loss: 0.3553828001022339, mean loss: 0.404889829773636
Epoch: 4, step: 56, loss: 0.33353957533836365, mean loss: 0.4048775976024659
Epoch: 4, step: 57, loss: 0.37079617381095886, mean loss: 0.4048717557403144
Epoch: 4, step: 58, loss: 0.36457160115242004, mean loss: 0.40486484911570636
Epoch: 4, step: 59, loss: 0.386963814496994, mean loss: 0.4048617817691302
Epoch: 4, step: 60, loss: 0.32412877678871155, mean loss: 0.4048479505193477
Epoch: 4, step: 61, loss: 0.33070579171180725, mean loss: 0.4048352505949202
Epoch: 4, step: 62, loss: 0.3455459177494049, mean loss: 0.4048250965731964
Epoch: 4, step: 63, loss: 0.3757673501968384, mean loss: 0.40482012093169356
Epoch: 4, step: 64, loss: 0.3328583538532257, mean loss: 0.40480780082091145
Epoch: 4, step: 65, loss: 0.37236157059669495, mean loss: 0.40480224686161254
Epoch: 4, step: 66, loss: 0.3634536564350128, mean loss: 0.404795170258767
Epoch: 4, step: 67, loss: 0.3797115385532379, mean loss: 0.40479087805621644
Epoch: 4, step: 68, loss: 0.32498428225517273, mean loss: 0.4047772242331538
Epoch: 4, step: 69, loss: 0.35298022627830505, mean loss: 0.4047683639871814
Epoch: 4, step: 70, loss: 0.35921403765678406, mean loss: 0.40476057292743617
Epoch: 4, step: 71, loss: 0.36901432275772095, mean loss: 0.40475446036755763
Epoch: 4, step: 72, loss: 0.39817124605178833, mean loss: 0.4047533348393792
Epoch: 4, step: 73, loss: 0.36380094289779663, mean loss: 0.4047463344305003
Epoch: 4, step: 74, loss: 0.3291414678096771, mean loss: 0.40473341273051383
Epoch: 4, step: 75, loss: 0.37490254640579224, mean loss: 0.40472831517987734
Epoch: 4, step: 76, loss: 0.35895147919654846, mean loss: 0.4047204940905243
Epoch: 4, step: 77, loss: 0.4257703721523285, mean loss: 0.4047240899016042
Epoch: 4, step: 78, loss: 0.36229318380355835, mean loss: 0.40471684294923904
Epoch: 4, step: 79, loss: 0.40840938687324524, mean loss: 0.4047174735066031
Epoch: 4, step: 80, loss: 0.4034273326396942, mean loss: 0.4047172532332777
Epoch: 4, step: 81, loss: 0.37761929631233215, mean loss: 0.4047126274297746
Epoch: 4, step: 82, loss: 0.34970927238464355, mean loss: 0.4047032395896918
Epoch: 4, step: 83, loss: 0.32002678513526917, mean loss: 0.4046887896827883
Epoch: 4, step: 84, loss: 0.33981895446777344, mean loss: 0.4046777216337839
Epoch: 4, step: 85, loss: 0.3596256673336029, mean loss: 0.4046700361929275
Epoch: 4, step: 86, loss: 0.3813844621181488, mean loss: 0.40466606457872406
Epoch: 4, step: 87, loss: 0.34325090050697327, mean loss: 0.404655591324278
Epoch: 4, step: 88, loss: 0.3286466896533966, mean loss: 0.40464263157974756
Epoch: 4, step: 89, loss: 0.3794582188129425, mean loss: 0.4046383382942435
Epoch: 4, step: 90, loss: 0.3433418869972229, mean loss: 0.404627890629117
Epoch: 4, step: 91, loss: 0.38940373063087463, mean loss: 0.4046252961914895
Epoch: 4, step: 92, loss: 0.3266151547431946, mean loss: 0.4046120042948379
Epoch: 4, step: 93, loss: 0.36418935656547546, mean loss: 0.40460511798347004
Epoch: 4, step: 94, loss: 0.34450650215148926, mean loss: 0.4045948814622927
Epoch: 4, step: 95, loss: 0.3637668490409851, mean loss: 0.4045879284594962
Epoch: 4, step: 96, loss: 0.35396385192871094, mean loss: 0.4045793086610064
Epoch: 4, step: 97, loss: 0.34477686882019043, mean loss: 0.40456912778939574
Epoch: 4, step: 98, loss: 0.38315892219543457, mean loss: 0.4045654834990819
Epoch: 4, step: 99, loss: 0.33137238025665283, mean loss: 0.4045530272187479
Epoch: 4, step: 100, loss: 0.36813119053840637, mean loss: 0.4045468298669221
Epoch: 4, step: 101, loss: 0.3674970269203186, mean loss: 0.40454052673610436
Epoch: 4, step: 102, loss: 0.3581344187259674, mean loss: 0.40453263319842614
Epoch: 4, step: 103, loss: 0.4149908423423767, mean loss: 0.40453441180542343
Epoch: 4, step: 104, loss: 0.3275587260723114, mean loss: 0.4045213229284071
Epoch: 4, step: 105, loss: 0.36637744307518005, mean loss: 0.40451483807974115
Epoch: 4, step: 106, loss: 0.3766753673553467, mean loss: 0.4045101058902588
Epoch: 4, step: 107, loss: 0.3297034204006195, mean loss: 0.40449739231352705
Epoch: 4, step: 108, loss: 0.3371347486972809, mean loss: 0.4044859458150366
Epoch: 4, step: 109, loss: 0.37561899423599243, mean loss: 0.40448104147395963
Epoch: 4, step: 110, loss: 0.3750554323196411, mean loss: 0.4044760430691432
Epoch: 4, step: 111, loss: 0.35587209463119507, mean loss: 0.40446778832246555
Epoch: 4, step: 112, loss: 0.408917099237442, mean loss: 0.4044685438515732
Epoch: 4, step: 113, loss: 0.3631221652030945, mean loss: 0.40446152409288927
Epoch: 4, step: 114, loss: 0.3534702956676483, mean loss: 0.40445286830806065
Epoch: 4, step: 115, loss: 0.34337541460990906, mean loss: 0.4044425021414452
Epoch: 4, step: 116, loss: 0.3946284055709839, mean loss: 0.4044408367593698
Epoch: 4, step: 117, loss: 0.37880972027778625, mean loss: 0.4044364880799532
Epoch: 4, step: 118, loss: 0.3595215976238251, mean loss: 0.4044288689297486
Epoch: 4, step: 119, loss: 0.40418413281440735, mean loss: 0.4044288274209095
Epoch: 4, step: 120, loss: 0.32043933868408203, mean loss: 0.4044145846722684
Epoch: 4, step: 121, loss: 0.34668251872062683, mean loss: 0.40440479625823794
Epoch: 4, step: 122, loss: 0.3875296413898468, mean loss: 0.40440193557763643
Epoch: 4, step: 123, loss: 0.34743204712867737, mean loss: 0.40439227966434
Epoch: 4, step: 124, loss: 0.35574814677238464, mean loss: 0.40438403629323477
Epoch: 4, step: 125, loss: 0.4041118025779724, mean loss: 0.40438399016756293
Epoch: 4, step: 126, loss: 0.34348514676094055, mean loss: 0.4043736735754222
Epoch: 4, step: 127, loss: 0.3481532037258148, mean loss: 0.404364151138117
Epoch: 4, step: 128, loss: 0.34730276465415955, mean loss: 0.40435448790585893
Epoch: 4, step: 129, loss: 0.3731398582458496, mean loss: 0.404349202665483
Epoch: 4, step: 130, loss: 0.32695823907852173, mean loss: 0.40433610109724416
Epoch: 4, step: 131, loss: 0.3801012635231018, mean loss: 0.4043319990597401
Epoch: 4, step: 132, loss: 0.3320925235748291, mean loss: 0.40431977372965294
Epoch: 4, step: 133, loss: 0.36705145239830017, mean loss: 0.40431346775311633
Epoch: 4, step: 134, loss: 0.36221450567245483, mean loss: 0.4043063456143783
Epoch: 4, step: 135, loss: 0.34744006395339966, mean loss: 0.4042967268251934
Epoch: 4, step: 136, loss: 0.4080173671245575, mean loss: 0.40429735605575307
Epoch: 4, step: 137, loss: 0.37545931339263916, mean loss: 0.4042924798226345
Epoch: 4, step: 138, loss: 0.3572370409965515, mean loss: 0.4042845245497983
Epoch: 4, step: 139, loss: 0.3096247911453247, mean loss: 0.40426852391872925
Epoch: 4, step: 140, loss: 0.3570807874202728, mean loss: 0.40426054897593755
Epoch: 4, step: 141, loss: 0.38146936893463135, mean loss: 0.40425669781337564
Epoch: 4, step: 142, loss: 0.381084144115448, mean loss: 0.4042527828693483
Epoch: 4, step: 143, loss: 0.3639831244945526, mean loss: 0.4042459805621904
Epoch: 4, step: 144, loss: 0.3276403546333313, mean loss: 0.40423304260814064
Epoch: 4, step: 145, loss: 0.38039925694465637, mean loss: 0.40422901799050076
Epoch: 4, step: 146, loss: 0.4236220419406891, mean loss: 0.4042322921799234
Epoch: 4, step: 147, loss: 0.35331791639328003, mean loss: 0.4042236975857663
Epoch: 4, step: 148, loss: 0.34094977378845215, mean loss: 0.4042130184425094
Epoch: 4, step: 149, loss: 0.3564128577709198, mean loss: 0.40420495226622327
Epoch: 4, step: 150, loss: 0.33666661381721497, mean loss: 0.40419355723695904
Epoch: 4, step: 151, loss: 0.3827904760837555, mean loss: 0.40418994673069164
Epoch: 4, step: 152, loss: 0.33198633790016174, mean loss: 0.4041777686890606
Epoch: 4, step: 153, loss: 0.3545994162559509, mean loss: 0.40416940808999935
Epoch: 4, step: 154, loss: 0.33928483724594116, mean loss: 0.40415846818596224
Epoch: 4, step: 155, loss: 0.32737743854522705, mean loss: 0.4041455246543303
Epoch: 4, step: 156, loss: 0.35712873935699463, mean loss: 0.40413760003182947
Epoch: 4, step: 157, loss: 0.3760790526866913, mean loss: 0.4041328715944609
Epoch: 4, step: 158, loss: 0.37146425247192383, mean loss: 0.40412736719359776
Epoch: 4, step: 159, loss: 0.3866927921772003, mean loss: 0.40412443010211924
Epoch: 4, step: 160, loss: 0.338270366191864, mean loss: 0.40411333795728005
Epoch: 4, step: 161, loss: 0.37181565165519714, mean loss: 0.4041078988049894
Epoch: 4, step: 162, loss: 0.35538771748542786, mean loss: 0.40409969537321305
Epoch: 4, step: 163, loss: 0.35986194014549255, mean loss: 0.404092247939673
Epoch: 4, step: 164, loss: 0.38624632358551025, mean loss: 0.4040892440810038
Epoch: 4, step: 165, loss: 0.30664733052253723, mean loss: 0.40407284523994713
Epoch: 4, step: 166, loss: 0.361646443605423, mean loss: 0.40406570635358763
Epoch: 4, step: 167, loss: 0.32941868901252747, mean loss: 0.4040531479724737
Epoch: 4, step: 168, loss: 0.35855633020401, mean loss: 0.40404549501742437
Epoch: 4, step: 169, loss: 0.37225499749183655, mean loss: 0.4040401484823545
Epoch: 4, step: 170, loss: 0.31947317719459534, mean loss: 0.40402592837620216
Epoch: 4, step: 171, loss: 0.3875696659088135, mean loss: 0.404023161687825
Epoch: 4, step: 172, loss: 0.40025895833969116, mean loss: 0.40402252894226304
Epoch: 4, step: 173, loss: 0.3428863286972046, mean loss: 0.40401225395062523
Epoch: 4, step: 174, loss: 0.3688943386077881, mean loss: 0.40400635277177416
Epoch: 4, step: 175, loss: 0.32927221059799194, mean loss: 0.403993796632296
Epoch: 4, step: 176, loss: 0.32360830903053284, mean loss: 0.4039802932747281
Epoch: 4, step: 177, loss: 0.33510512113571167, mean loss: 0.4039687253922728
Epoch: 4, step: 178, loss: 0.3280756175518036, mean loss: 0.4039559809577068
Epoch: 4, step: 179, loss: 0.33409520983695984, mean loss: 0.40394425147968116
Epoch: 4, step: 180, loss: 0.35022592544555664, mean loss: 0.40393523379862795
Epoch: 4, step: 181, loss: 0.413024365901947, mean loss: 0.4039367593327171
Epoch: 4, step: 182, loss: 0.3485254943370819, mean loss: 0.4039274605804104
Epoch: 4, step: 183, loss: 0.3465633690357208, mean loss: 0.4039178357328358
Epoch: 4, step: 184, loss: 0.34227412939071655, mean loss: 0.4039074945641825
Epoch: 4, step: 185, loss: 0.356636106967926, mean loss: 0.4038995657839752
Epoch: 4, step: 186, loss: 0.34400466084480286, mean loss: 0.4038895213591992
Epoch: 4, step: 187, loss: 0.39118608832359314, mean loss: 0.4038873913402462
Epoch: 4, step: 188, loss: 0.36891141533851624, mean loss: 0.40388152780696845
Epoch: 4, step: 189, loss: 0.4302392601966858, mean loss: 0.40388594579764725
Epoch: 4, step: 190, loss: 0.35737863183021545, mean loss: 0.4038781517111771
Epoch: 4, step: 191, loss: 0.3983447253704071, mean loss: 0.40387722452847924
Epoch: 4, step: 192, loss: 0.35899120569229126, mean loss: 0.40386970467275196
Epoch: 4, step: 193, loss: 0.39847275614738464, mean loss: 0.4038688006612737
Epoch: 4, step: 194, loss: 0.3711019456386566, mean loss: 0.40386331299504985
Epoch: 4, step: 195, loss: 0.37967032194137573, mean loss: 0.4038592619248801
Epoch: 4, step: 196, loss: 0.37478286027908325, mean loss: 0.40385439395206146
Epoch: 4, step: 197, loss: 0.34712740778923035, mean loss: 0.40384489830657055
Epoch: 4, step: 198, loss: 0.3356890380382538, mean loss: 0.40383349146803194
Epoch: 4, step: 199, loss: 0.3488095700740814, mean loss: 0.4038242839845323
Epoch: 4, step: 200, loss: 0.3639979362487793, mean loss: 0.4038176207173856
Epoch: 4, step: 201, loss: 0.3806072473526001, mean loss: 0.4038137380855079
Epoch: 4, step: 202, loss: 0.35750651359558105, mean loss: 0.403805993107336
Epoch: 4, step: 203, loss: 0.3676561713218689, mean loss: 0.4037999479866361
Epoch: 4, step: 204, loss: 0.3366438150405884, mean loss: 0.40378871974170283
Epoch: 4, step: 205, loss: 0.4285303056240082, mean loss: 0.4037928557473669
Epoch: 4, step: 206, loss: 0.3294849991798401, mean loss: 0.40378043591508084
Epoch: 4, step: 207, loss: 0.3599000573158264, mean loss: 0.40377310296411173
Epoch: 4, step: 208, loss: 0.33906012773513794, mean loss: 0.40376229043692224
Epoch: 4, step: 209, loss: 0.35811907052993774, mean loss: 0.4037546654419495
Epoch: 4, step: 210, loss: 0.31690672039985657, mean loss: 0.4037401593545865
Epoch: 4, step: 211, loss: 0.3843216598033905, mean loss: 0.40373691645218984
Epoch: 4, step: 212, loss: 0.32075417041778564, mean loss: 0.4037230605921073
Epoch: 4, step: 213, loss: 0.3477027714252472, mean loss: 0.4037137082900761
Epoch: 4, step: 214, loss: 0.36598652601242065, mean loss: 0.40370741098039864
Epoch: 4, step: 215, loss: 0.34936076402664185, mean loss: 0.4036983411127495
Epoch: 4, step: 216, loss: 0.46822407841682434, mean loss: 0.4037091079636262
Epoch: 4, step: 217, loss: 0.33680281043052673, mean loss: 0.40369794575182555
Epoch: 4, step: 218, loss: 0.4214455783367157, mean loss: 0.4037009061575945
Epoch: 4, step: 219, loss: 0.32962724566459656, mean loss: 0.40368855231161505
Epoch: 4, step: 220, loss: 0.32919153571128845, mean loss: 0.40367612993099133
Epoch: 4, step: 221, loss: 0.379284530878067, mean loss: 0.40367206330894184
Epoch: 4, step: 222, loss: 0.34393376111984253, mean loss: 0.4036621052655698
Epoch: 4, step: 223, loss: 0.3700544536113739, mean loss: 0.40365650399029407
Epoch: 4, step: 224, loss: 0.37911978363990784, mean loss: 0.4036524152183643
Epoch: 4, step: 225, loss: 0.3139978349208832, mean loss: 0.40363747776746506
Epoch: 4, step: 226, loss: 0.35984328389167786, mean loss: 0.40363018238284476
Epoch: 4, step: 227, loss: 0.3135842978954315, mean loss: 0.4036151847338628
Epoch: 4, step: 228, loss: 0.37438639998435974, mean loss: 0.4036103173259112
Epoch: 4, step: 229, loss: 0.3713708817958832, mean loss: 0.4036049494545276
Epoch: 4, step: 230, loss: 0.3754730224609375, mean loss: 0.40360026626375123
Epoch: 4, step: 231, loss: 0.36112233996391296, mean loss: 0.4035931960363378
Epoch: 4, step: 232, loss: 0.38087424635887146, mean loss: 0.4035894152159555
Epoch: 4, step: 233, loss: 0.33263370394706726, mean loss: 0.4035776089412019
Epoch: 4, step: 234, loss: 0.37418147921562195, mean loss: 0.40357271855196125
Epoch: 4, step: 235, loss: 0.35860198736190796, mean loss: 0.4035652383904193
Epoch: 4, step: 236, loss: 0.40928611159324646, mean loss: 0.40356618980788195
Epoch: 4, step: 237, loss: 0.3608383536338806, mean loss: 0.4035590850795524
Epoch: 4, step: 238, loss: 0.3411441743373871, mean loss: 0.4035487085357881
Epoch: 4, step: 239, loss: 0.346956729888916, mean loss: 0.4035393016244439
Epoch: 4, step: 240, loss: 0.35046708583831787, mean loss: 0.4035304812462179
Epoch: 4, step: 241, loss: 0.34460291266441345, mean loss: 0.4035206893604449
Epoch: 4, step: 242, loss: 0.3714766204357147, mean loss: 0.40351536554105216
Epoch: 4, step: 243, loss: 0.3489074409008026, mean loss: 0.40350629445722486
Epoch: 4, step: 244, loss: 0.3800375461578369, mean loss: 0.40350239664152987
Epoch: 4, step: 245, loss: 0.33037522435188293, mean loss: 0.4034902533050487
Epoch: 4, step: 246, loss: 0.34775689244270325, mean loss: 0.4034809998830227
Epoch: 4, step: 247, loss: 0.34585320949554443, mean loss: 0.4034714335167565
Epoch: 4, step: 248, loss: 0.38432565331459045, mean loss: 0.4034682557939014
Epoch: 4, step: 249, loss: 0.31553885340690613, mean loss: 0.4034536641240728
Epoch: 4, step: 250, loss: 0.3318973779678345, mean loss: 0.4034417915031741
Epoch: 4, step: 251, loss: 0.3593589663505554, mean loss: 0.4034344784930293
Epoch: 4, step: 252, loss: 0.35350286960601807, mean loss: 0.40342619658742523
Epoch: 4, step: 253, loss: 0.35330140590667725, mean loss: 0.40341788401848977
Epoch: 4, step: 254, loss: 0.38626566529273987, mean loss: 0.4034150400094157
Epoch: 4, step: 255, loss: 0.34885889291763306, mean loss: 0.40340599555532225
Epoch: 4, step: 256, loss: 0.35276904702186584, mean loss: 0.40339760222720467
Epoch: 4, step: 257, loss: 0.37156790494918823, mean loss: 0.4033923271696511
Epoch: 4, step: 258, loss: 0.3633747696876526, mean loss: 0.4033856962570609
Epoch: 4, step: 259, loss: 0.3481036126613617, mean loss: 0.40337653752883096
Epoch: 4, step: 260, loss: 0.3984896242618561, mean loss: 0.4033757280351641
Epoch: 4, step: 261, loss: 0.33388155698776245, mean loss: 0.4033642185666236
Epoch: 4, step: 262, loss: 0.4275577962398529, mean loss: 0.4033682247891229
Epoch: 4, step: 263, loss: 0.3443613350391388, mean loss: 0.4033584554365153
Epoch: 4, step: 264, loss: 0.339400053024292, mean loss: 0.4033478680499216
Epoch: 4, step: 265, loss: 0.3268504738807678, mean loss: 0.4033352071108006
Epoch: 4, step: 266, loss: 0.3921586871147156, mean loss: 0.40333335761220784
Epoch: 4, step: 267, loss: 0.36860501766204834, mean loss: 0.40332761169229553
Epoch: 4, step: 268, loss: 0.34099915623664856, mean loss: 0.40331730094697615
Epoch: 4, step: 269, loss: 0.3442299962043762, mean loss: 0.4033075279888646
Epoch: 4, step: 270, loss: 0.33466637134552, mean loss: 0.4032961767144073
Epoch: 4, step: 271, loss: 0.4242159128189087, mean loss: 0.40329963566548277
Epoch: 4, step: 272, loss: 0.35112905502319336, mean loss: 0.403291011003449
Epoch: 4, step: 273, loss: 0.3475598990917206, mean loss: 0.403281799249414
Epoch: 4, step: 274, loss: 0.337284117937088, mean loss: 0.40327089234455327
Epoch: 4, step: 275, loss: 0.38739094138145447, mean loss: 0.40326826842668095
Epoch: 4, step: 276, loss: 0.36136627197265625, mean loss: 0.40326134590950696
Epoch: 4, step: 277, loss: 0.3891229033470154, mean loss: 0.40325901052091057
Epoch: 4, step: 278, loss: 0.39861375093460083, mean loss: 0.4032582433434397
Epoch: 4, step: 279, loss: 0.4023240804672241, mean loss: 0.403258089089332
Epoch: 4, step: 280, loss: 0.35771310329437256, mean loss: 0.4032505696926348
Epoch: 4, step: 281, loss: 0.37011557817459106, mean loss: 0.40324510006709535
Epoch: 4, step: 282, loss: 0.36188018321990967, mean loss: 0.40323827304665516
Epoch: 4, step: 283, loss: 0.3738565146923065, mean loss: 0.4032334245716792
Epoch: 4, step: 284, loss: 0.35703933238983154, mean loss: 0.40322580304186867
Epoch: 4, step: 285, loss: 0.35328197479248047, mean loss: 0.40321756420514
Epoch: 4, step: 286, loss: 0.3720083236694336, mean loss: 0.4032124167137107
Epoch: 4, step: 287, loss: 0.30992674827575684, mean loss: 0.40319703319318995
Epoch: 4, step: 288, loss: 0.35802921652793884, mean loss: 0.40318958590272574
Epoch: 4, step: 289, loss: 0.4029460847377777, mean loss: 0.4031895457607599
Epoch: 4, step: 290, loss: 0.34304454922676086, mean loss: 0.4031796322950381
Epoch: 4, step: 291, loss: 0.3891022205352783, mean loss: 0.40317731235242776
Epoch: 4, step: 292, loss: 0.30882591009140015, mean loss: 0.4031617659028873
Epoch: 4, step: 293, loss: 0.34171563386917114, mean loss: 0.4031516429816297
Epoch: 4, step: 294, loss: 0.38678327202796936, mean loss: 0.4031489468243321
Epoch: 4, step: 295, loss: 0.37585577368736267, mean loss: 0.40314445190121995
Epoch: 4, step: 296, loss: 0.32970479130744934, mean loss: 0.403132359087027
Epoch: 4, step: 297, loss: 0.3973768651485443, mean loss: 0.40313141152464
Epoch: 4, step: 298, loss: 0.40338969230651855, mean loss: 0.403131454039995
Epoch: 4, step: 299, loss: 0.41412654519081116, mean loss: 0.40313326363366697
Epoch: 4, step: 300, loss: 0.3651459515094757, mean loss: 0.40312701263611483
Epoch: 4, step: 301, loss: 0.3658163845539093, mean loss: 0.4031208740003659
Epoch: 4, step: 302, loss: 0.3830060362815857, mean loss: 0.40311756509467106
Epoch: 4, step: 303, loss: 0.3530370891094208, mean loss: 0.40310932817427875
Epoch: 4, step: 304, loss: 0.31561946868896484, mean loss: 0.40309494076110897
Epoch: 4, step: 305, loss: 0.42002901434898376, mean loss: 0.4030977250546946
Epoch: 4, step: 306, loss: 0.3685941994190216, mean loss: 0.40309205293146005
Epoch: 4, step: 307, loss: 0.3576921820640564, mean loss: 0.4030845907567613
Epoch: 4, step: 308, loss: 0.3624919652938843, mean loss: 0.403077919824064
Epoch: 4, step: 309, loss: 0.3286203145980835, mean loss: 0.40306568558068145
Epoch: 4, step: 310, loss: 0.3703779876232147, mean loss: 0.40306031549723187
Epoch: 4, step: 311, loss: 0.39071232080459595, mean loss: 0.40305828724580406
Epoch: 4, step: 312, loss: 0.4097353518009186, mean loss: 0.40305938382398687
Epoch: 4, step: 313, loss: 0.35658591985702515, mean loss: 0.40305175271331906
Epoch: 4, step: 314, loss: 0.38332390785217285, mean loss: 0.40304851386175755
Epoch: 4, step: 315, loss: 0.40469226241111755, mean loss: 0.4030487836825963
Epoch: 4, step: 316, loss: 0.37602370977401733, mean loss: 0.40304434825277374
Epoch: 4, step: 317, loss: 0.3931160569190979, mean loss: 0.4030427190615473
Epoch: 4, step: 318, loss: 0.37274810671806335, mean loss: 0.4030377486575533
Epoch: 4, step: 319, loss: 0.38699087500572205, mean loss: 0.40303511629638994
Epoch: 4, step: 320, loss: 0.35532984137535095, mean loss: 0.4030272919114595
Epoch: 4, step: 321, loss: 0.36489439010620117, mean loss: 0.4030210385658043
Epoch: 4, step: 322, loss: 0.3796473443508148, mean loss: 0.40301720618439507
Epoch: 4, step: 323, loss: 0.3596479594707489, mean loss: 0.40301009647181907
Epoch: 4, step: 324, loss: 0.3023304343223572, mean loss: 0.4029935943144433
Epoch: 4, step: 325, loss: 0.3722946345806122, mean loss: 0.4029885633475908
Epoch: 4, step: 326, loss: 0.3481135666370392, mean loss: 0.4029795718685296
Epoch: 4, step: 327, loss: 0.3947197496891022, mean loss: 0.40297821868665223
Epoch: 4, step: 328, loss: 0.3305968940258026, mean loss: 0.4029663626138167
Epoch: 4, step: 329, loss: 0.3814956247806549, mean loss: 0.40296284627941886
Epoch: 4, step: 330, loss: 0.3988211452960968, mean loss: 0.40296216809029434
Epoch: 4, step: 331, loss: 0.3256766200065613, mean loss: 0.40294951492263165
Epoch: 4, step: 332, loss: 0.3731461465358734, mean loss: 0.40294463632247013
Epoch: 4, step: 333, loss: 0.3204871118068695, mean loss: 0.4029311408192761
Epoch: 4, step: 334, loss: 0.37577900290489197, mean loss: 0.4029266976613782
Epoch: 4, step: 335, loss: 0.37285685539245605, mean loss: 0.402921777857342
Epoch: 4, step: 336, loss: 0.4027641713619232, mean loss: 0.40292175207515724
Epoch: 4, step: 337, loss: 0.35150086879730225, mean loss: 0.40291334172460475
Epoch: 4, step: 338, loss: 0.312187522649765, mean loss: 0.40289850512295716
Epoch: 4, step: 339, loss: 0.34165096282958984, mean loss: 0.40288849080930556
Epoch: 4, step: 340, loss: 0.357575386762619, mean loss: 0.4028810830760954
Epoch: 4, step: 341, loss: 0.3556530177593231, mean loss: 0.4028733635492375
Epoch: 4, step: 342, loss: 0.3992922604084015, mean loss: 0.40287277830603746
Epoch: 4, step: 343, loss: 0.4266803562641144, mean loss: 0.4028766684331548
Epoch: 4, step: 344, loss: 0.33192628622055054, mean loss: 0.40286507712745107
Epoch: 4, step: 345, loss: 0.3351345360279083, mean loss: 0.4028540136610839
Epoch: 4, step: 346, loss: 0.3835445046424866, mean loss: 0.4028508600584351
Epoch: 4, step: 347, loss: 0.3676110804080963, mean loss: 0.4028451056855334
Epoch: 4, step: 348, loss: 0.3738235533237457, mean loss: 0.4028403674729029
Epoch: 4, step: 349, loss: 0.3983895182609558, mean loss: 0.4028396409222643
Epoch: 4, step: 350, loss: 0.38496461510658264, mean loss: 0.40283672350332916
Epoch: 4, step: 351, loss: 0.4170054793357849, mean loss: 0.4028390356371138
Epoch: 4, step: 352, loss: 0.340270072221756, mean loss: 0.40282882696303723
Epoch: 4, step: 353, loss: 0.36242130398750305, mean loss: 0.40282223519746213
Epoch: 4, step: 354, loss: 0.3340280055999756, mean loss: 0.4028110144782324
Epoch: 4, step: 355, loss: 0.33671873807907104, mean loss: 0.4028002362205026
Epoch: 4, step: 356, loss: 0.34029391407966614, mean loss: 0.4027900444184252
Epoch: 4, step: 357, loss: 0.34767577052116394, mean loss: 0.40278105937214265
Epoch: 4, step: 358, loss: 0.37848377227783203, mean loss: 0.4027770989341485
Epoch: 4, step: 359, loss: 0.35970398783683777, mean loss: 0.40277007919635555
Epoch: 4, step: 360, loss: 0.36846110224723816, mean loss: 0.40276448868357256
Epoch: 4, step: 361, loss: 0.41743704676628113, mean loss: 0.4027668791296597
Epoch: 4, step: 362, loss: 0.35844284296035767, mean loss: 0.40275965905535294
Epoch: 4, step: 363, loss: 0.32298919558525085, mean loss: 0.4027466671231917
Epoch: 4, step: 364, loss: 0.34340301156044006, mean loss: 0.4027370036065718
Epoch: 4, step: 365, loss: 0.35994207859039307, mean loss: 0.4027300360186499
Epoch: 4, step: 366, loss: 0.3817083239555359, mean loss: 0.40272661395905957
Epoch: 4, step: 367, loss: 0.36142387986183167, mean loss: 0.4027198915088484
Epoch: 4, step: 368, loss: 0.3720410168170929, mean loss: 0.40271489901500107
Epoch: 4, step: 369, loss: 0.3832094371318817, mean loss: 0.40271172533099797
Epoch: 4, step: 370, loss: 0.3649568259716034, mean loss: 0.4027055833268725
Epoch: 4, step: 371, loss: 0.34974175691604614, mean loss: 0.40269696852101516
Epoch: 4, step: 372, loss: 0.34930479526519775, mean loss: 0.40268828545494656
Epoch: 4, step: 373, loss: 0.38039615750312805, mean loss: 0.40268466071869424
Epoch: 4, step: 374, loss: 0.3396129906177521, mean loss: 0.40267440682987926
Epoch: 4, step: 375, loss: 0.35930758714675903, mean loss: 0.40266735760691386
Epoch: 4, step: 376, loss: 0.3569183349609375, mean loss: 0.4026599223683886
Epoch: 4, step: 377, loss: 0.3669249415397644, mean loss: 0.4026541155791737
Epoch: 4, step: 378, loss: 0.32141736149787903, mean loss: 0.4026409170813538
Epoch: 4, step: 379, loss: 0.3477514684200287, mean loss: 0.40263200066669147
Epoch: 4, step: 380, loss: 0.36840009689331055, mean loss: 0.4026264408317437
Epoch: 4, step: 381, loss: 0.3234919011592865, mean loss: 0.40261359014326165
Epoch: 4, step: 382, loss: 0.3263232409954071, mean loss: 0.40260120333547667
Epoch: 4, step: 383, loss: 0.3694455921649933, mean loss: 0.4025958209310659
Epoch: 4, step: 384, loss: 0.38488247990608215, mean loss: 0.40259294585542477
Epoch: 4, step: 385, loss: 0.34328824281692505, mean loss: 0.40258332159332827
Epoch: 4, step: 386, loss: 0.33745530247688293, mean loss: 0.40257275400950276
Epoch: 4, step: 387, loss: 0.39799219369888306, mean loss: 0.4025720108945919
Epoch: 4, step: 388, loss: 0.3462781012058258, mean loss: 0.4025628796845856
Epoch: 4, step: 389, loss: 0.39715468883514404, mean loss: 0.40256200258584257
Epoch: 4, step: 390, loss: 0.334060400724411, mean loss: 0.402550894818393
Epoch: 4, step: 391, loss: 0.35250332951545715, mean loss: 0.4025427807513854
Epoch: 4, step: 392, loss: 0.3329993486404419, mean loss: 0.4025315077035477
Epoch: 4, step: 393, loss: 0.3610685169696808, mean loss: 0.40252478760780475
Epoch: 4, step: 394, loss: 0.3421552777290344, mean loss: 0.4025150048319372
Epoch: 4, step: 395, loss: 0.3853659927845001, mean loss: 0.4025122263141071
Epoch: 4, step: 396, loss: 0.3649463951587677, mean loss: 0.4025061408076831
Epoch: 4, step: 397, loss: 0.40265709161758423, mean loss: 0.4025061652571178
Epoch: 4, step: 398, loss: 0.3445105254650116, mean loss: 0.40249677325067373
Epoch: 4, step: 399, loss: 0.3529403507709503, mean loss: 0.40248874921853645
Epoch: 4, step: 400, loss: 0.360343873500824, mean loss: 0.4024819263472854
Epoch: 4, step: 401, loss: 0.3943721652030945, mean loss: 0.4024806136633838
Epoch: 4, step: 402, loss: 0.37173911929130554, mean loss: 0.4024756385065021
Epoch: 4, step: 403, loss: 0.3780050277709961, mean loss: 0.402471678860752
Epoch: 4, step: 404, loss: 0.34577614068984985, mean loss: 0.40246250630968083
Epoch: 4, step: 405, loss: 0.3464600145816803, mean loss: 0.40245344734951777
Epoch: 4, step: 406, loss: 0.3530978858470917, mean loss: 0.40244546488768657
Epoch: 4, step: 407, loss: 0.3816991150379181, mean loss: 0.40244211004456726
Epoch: 4, step: 408, loss: 0.34628722071647644, mean loss: 0.402433030838532
Epoch: 4, step: 409, loss: 0.34582704305648804, mean loss: 0.40242388017772013
Epoch: 4, step: 410, loss: 0.35233190655708313, mean loss: 0.40241578385096716
Epoch: 4, step: 411, loss: 0.38051316142082214, mean loss: 0.40241224431922346
Epoch: 4, step: 412, loss: 0.34448060393333435, mean loss: 0.4024028838990609
Epoch: 4, step: 413, loss: 0.3203752040863037, mean loss: 0.40238963225450314
Epoch: 4, step: 414, loss: 0.35891735553741455, mean loss: 0.4023826104039593
Epoch: 4, step: 415, loss: 0.40529894828796387, mean loss: 0.40238308138875967
Epoch: 4, step: 416, loss: 0.3463696837425232, mean loss: 0.4023740367581047
Epoch: 4, step: 417, loss: 0.3501167893409729, mean loss: 0.40236560000521204
Epoch: 4, step: 418, loss: 0.36052531003952026, mean loss: 0.40235884612466877
Epoch: 4, step: 419, loss: 0.33674272894859314, mean loss: 0.4023482560476552
Epoch: 4, step: 420, loss: 0.4072389006614685, mean loss: 0.40234904524317133
Epoch: 4, step: 421, loss: 0.37382590770721436, mean loss: 0.40234444325260404
Epoch: 4, step: 422, loss: 0.3424510359764099, mean loss: 0.40233478146727153
Epoch: 4, step: 423, loss: 0.38073283433914185, mean loss: 0.40233129728225087
Epoch: 4, step: 424, loss: 0.3142085075378418, mean loss: 0.4023170862211729
Epoch: 4, step: 425, loss: 0.38016027212142944, mean loss: 0.40231351369390755
Epoch: 4, step: 426, loss: 0.38285398483276367, mean loss: 0.4023103765781795
Epoch: 4, step: 427, loss: 0.4026813209056854, mean loss: 0.4023104363693348
Epoch: 4, step: 428, loss: 0.39457058906555176, mean loss: 0.4023091890127991
Epoch: 4, step: 429, loss: 0.35706716775894165, mean loss: 0.4023018989674794
Epoch: 4, step: 430, loss: 0.37427523732185364, mean loss: 0.4022973836361365
Epoch: 4, step: 431, loss: 0.3698565363883972, mean loss: 0.4022921579841958
Epoch: 4, step: 432, loss: 0.36946025490760803, mean loss: 0.40228687019178533
Epoch: 4, step: 433, loss: 0.365323543548584, mean loss: 0.4022809179652727
Epoch: 4, step: 434, loss: 0.374898761510849, mean loss: 0.40227650931023257
Epoch: 4, step: 435, loss: 0.3685538172721863, mean loss: 0.4022710806733945
Epoch: 4, step: 436, loss: 0.3820387125015259, mean loss: 0.4022678242162608
Epoch: 4, step: 437, loss: 0.3443690836429596, mean loss: 0.40225850674915853
Epoch: 4, step: 438, loss: 0.4197254180908203, mean loss: 0.4022613171934613
Epoch: 4, step: 439, loss: 0.35334905982017517, mean loss: 0.4022534484261876
Epoch: 4, step: 440, loss: 0.35798975825309753, mean loss: 0.4022463286433063
Epoch: 4, step: 441, loss: 0.3288102447986603, mean loss: 0.40223451840145286
Epoch: 4, step: 442, loss: 0.3625883460044861, mean loss: 0.40222814339383156
Epoch: 4, step: 443, loss: 0.3735899329185486, mean loss: 0.40222353917992876
Epoch: 4, step: 444, loss: 0.35671159625053406, mean loss: 0.40221622332348617
Epoch: 4, step: 445, loss: 0.3577248454093933, mean loss: 0.4022090726680837
Epoch: 4, step: 446, loss: 0.3591192960739136, mean loss: 0.4022021483909514
Epoch: 4, step: 447, loss: 0.3648931384086609, mean loss: 0.4021961540127409
Epoch: 4, step: 448, loss: 0.3590490221977234, mean loss: 0.40218922274658586
Epoch: 4, step: 449, loss: 0.352347195148468, mean loss: 0.402181217281183
Epoch: 4, step: 450, loss: 0.34404465556144714, mean loss: 0.40217188107406565
Epoch: 4, step: 451, loss: 0.36231350898742676, mean loss: 0.40216548120699974
Epoch: 4, step: 452, loss: 0.3835723102092743, mean loss: 0.40216249627025263
Epoch: 4, step: 453, loss: 0.37504005432128906, mean loss: 0.40215814274827044
Epoch: 4, step: 454, loss: 0.35078322887420654, mean loss: 0.402149897697095
Epoch: 4, step: 455, loss: 0.32894542813301086, mean loss: 0.40213815115191465
Epoch: 4, step: 456, loss: 0.34741872549057007, mean loss: 0.4021293721649643
Epoch: 4, step: 457, loss: 0.33632585406303406, mean loss: 0.4021188165797699
Epoch: 4, step: 458, loss: 0.38388511538505554, mean loss: 0.40211589216899285
Epoch: 4, step: 459, loss: 0.32755815982818604, mean loss: 0.4021039361503365
Epoch: 4, step: 460, loss: 0.31839519739151, mean loss: 0.4020905148358009
Epoch: 4, step: 461, loss: 0.31795409321784973, mean loss: 0.4020770271119121
Epoch: 4, step: 462, loss: 0.375644326210022, mean loss: 0.40207279042319566
Epoch: 4, step: 463, loss: 0.32232415676116943, mean loss: 0.4020600101934421
Epoch: 4, step: 464, loss: 0.325354665517807, mean loss: 0.40204771963989694
Epoch: 4, step: 465, loss: 0.3656766712665558, mean loss: 0.4020418928138198
Epoch: 4, step: 466, loss: 0.3388219177722931, mean loss: 0.4020317662760909
Epoch: 4, step: 467, loss: 0.3504742681980133, mean loss: 0.4020235091495569
Epoch: 4, step: 468, loss: 0.4050157070159912, mean loss: 0.4020239882845235
Epoch: 4, step: 469, loss: 0.3634312152862549, mean loss: 0.402017809486413
Epoch: 4, step: 470, loss: 0.342872679233551, mean loss: 0.4020083417210452
Epoch: 4, step: 471, loss: 0.4608113765716553, mean loss: 0.4020177532183004
Epoch: 4, step: 472, loss: 0.3141738176345825, mean loss: 0.4020036959394424
Epoch: 4, step: 473, loss: 0.33493420481681824, mean loss: 0.4019929648208628
Epoch: 4, step: 474, loss: 0.3512263298034668, mean loss: 0.40198484345867797
Epoch: 4, step: 475, loss: 0.3304360508918762, mean loss: 0.40197339931399356
Epoch: 4, step: 476, loss: 0.3802497982978821, mean loss: 0.4019699252054031
Epoch: 4, step: 477, loss: 0.3413180410861969, mean loss: 0.4019602271107246
Epoch: 4, step: 478, loss: 0.34113436937332153, mean loss: 0.40195050275297284
Epoch: 4, step: 479, loss: 0.30534806847572327, mean loss: 0.4019350611873914
Epoch: 4, step: 480, loss: 0.3722195625305176, mean loss: 0.40193031202666635
Epoch: 4, step: 481, loss: 0.36313343048095703, mean loss: 0.401924112461063
Epoch: 4, step: 482, loss: 0.3709288537502289, mean loss: 0.4019191603507082
Epoch: 4, step: 483, loss: 0.3501662015914917, mean loss: 0.4019108931049
Epoch: 4, step: 484, loss: 0.3772667646408081, mean loss: 0.4019069569719398
Epoch: 4, step: 485, loss: 0.34045180678367615, mean loss: 0.4018971429907535
Epoch: 4, step: 486, loss: 0.3462783992290497, mean loss: 0.4018882624632489
Epoch: 4, step: 487, loss: 0.35175326466560364, mean loss: 0.40188025879182526
Epoch: 4, step: 488, loss: 0.3517502248287201, mean loss: 0.401872257190235
Epoch: 4, step: 489, loss: 0.3368249237537384, mean loss: 0.40186187619224
Epoch: 4, step: 490, loss: 0.3607327938079834, mean loss: 0.40185531338988095
Epoch: 4, step: 491, loss: 0.34436702728271484, mean loss: 0.4018461416786322
Epoch: 4, step: 492, loss: 0.3344394266605377, mean loss: 0.4018353892914862
Epoch: 4, step: 493, loss: 0.3921982944011688, mean loss: 0.4018338522747573
Epoch: 4, step: 494, loss: 0.37265318632125854, mean loss: 0.4018291990031972
Epoch: 4, step: 495, loss: 0.3508917987346649, mean loss: 0.4018210776064707
Epoch: 4, step: 496, loss: 0.38728582859039307, mean loss: 0.40181876049360343
Epoch: 4, step: 497, loss: 0.33914074301719666, mean loss: 0.4018087703728708
Epoch: 4, step: 498, loss: 0.37408721446990967, mean loss: 0.40180435259503766
Epoch: 4, step: 499, loss: 0.41131076216697693, mean loss: 0.40180586731931617
Epoch: 4, step: 500, loss: 0.35756993293762207, mean loss: 0.40179882001417333
Epoch: 4, step: 501, loss: 0.33430278301239014, mean loss: 0.4017880688136315
Epoch: 4, step: 502, loss: 0.36900725960731506, mean loss: 0.40178284810823156
Epoch: 4, step: 503, loss: 0.37223953008651733, mean loss: 0.4017781437582281
Epoch: 4, step: 504, loss: 0.32116976380348206, mean loss: 0.4017653100725165
Epoch: 4, step: 505, loss: 0.3596130311489105, mean loss: 0.40175860006313674
Epoch: 4, step: 506, loss: 0.3575754761695862, mean loss: 0.4017515678931712
Epoch: 4, step: 507, loss: 0.33864155411720276, mean loss: 0.40174152492471543
Epoch: 4, step: 508, loss: 0.33953410387039185, mean loss: 0.40173162716480226
Epoch: 4, step: 509, loss: 0.3571334481239319, mean loss: 0.4017245323224477
Epoch: 4, step: 510, loss: 0.34693098068237305, mean loss: 0.40171581694919495
Epoch: 4, step: 511, loss: 0.3723761737346649, mean loss: 0.4017111509754013
Epoch: 4, step: 512, loss: 0.41709187626838684, mean loss: 0.40171359663055994
Epoch: 4, step: 513, loss: 0.33648377656936646, mean loss: 0.4017032262299143
Epoch: 4, step: 514, loss: 0.3625362515449524, mean loss: 0.40169700035569955
Epoch: 4, step: 515, loss: 0.33917543292045593, mean loss: 0.4016870636793748
Epoch: 4, step: 516, loss: 0.38263437151908875, mean loss: 0.401684036078523
Epoch: 4, step: 517, loss: 0.3397972881793976, mean loss: 0.4016742034207697
Epoch: 4, step: 518, loss: 0.39101967215538025, mean loss: 0.40167251088204603
Epoch: 4, step: 519, loss: 0.39649367332458496, mean loss: 0.4016716883220782
Epoch: 4, step: 520, loss: 0.3673141896724701, mean loss: 0.4016662321526881
Epoch: 4, step: 521, loss: 0.32431021332740784, mean loss: 0.4016539495202929
Epoch: 4, step: 522, loss: 0.3635779619216919, mean loss: 0.4016479047532507
Epoch: 4, step: 523, loss: 0.3793080151081085, mean loss: 0.4016443587390213
Epoch: 4, step: 524, loss: 0.35574373602867126, mean loss: 0.4016370740821874
Epoch: 4, step: 525, loss: 0.3847457766532898, mean loss: 0.4016343937747566
Epoch: 4, step: 526, loss: 0.3444018065929413, mean loss: 0.40162531356102005
Epoch: 4, step: 527, loss: 0.3505854904651642, mean loss: 0.40161721714238174
Epoch: 4, step: 528, loss: 0.3448932468891144, mean loss: 0.40160822047778966
Epoch: 4, step: 529, loss: 0.3458990752696991, mean loss: 0.40159938616995455
Epoch: 4, step: 530, loss: 0.3244226574897766, mean loss: 0.40158714949186985
Epoch: 4, step: 531, loss: 0.33807215094566345, mean loss: 0.4015770805320496
Epoch: 4, step: 532, loss: 0.3851204514503479, mean loss: 0.4015744720950419
Epoch: 4, step: 533, loss: 0.3498624861240387, mean loss: 0.4015662768516233
Epoch: 4, step: 534, loss: 0.33374300599098206, mean loss: 0.40155553001738775
Epoch: 4, step: 535, loss: 0.3325670659542084, mean loss: 0.4015446002860723
Epoch: 4, step: 536, loss: 0.3947327733039856, mean loss: 0.4015435212702348
Epoch: 4, step: 537, loss: 0.3677690625190735, mean loss: 0.40153817213201004
Epoch: 4, step: 538, loss: 0.3482598662376404, mean loss: 0.4015297353456451
Epoch: 4, step: 539, loss: 0.36204320192337036, mean loss: 0.4015234835195808
Epoch: 4, step: 540, loss: 0.3654063045978546, mean loss: 0.40151776606209755
Epoch: 4, step: 541, loss: 0.34445858001708984, mean loss: 0.4015087348518973
Epoch: 4, step: 542, loss: 0.3687494695186615, mean loss: 0.4015035506035458
Epoch: 4, step: 543, loss: 0.36569976806640625, mean loss: 0.40149788544808107
Epoch: 4, step: 544, loss: 0.33690953254699707, mean loss: 0.4014876673887707
Epoch: 4, step: 545, loss: 0.3522006571292877, mean loss: 0.4014798712783215
Epoch: 4, step: 546, loss: 0.41038841009140015, mean loss: 0.4014812801884612
Epoch: 4, step: 547, loss: 0.3625696897506714, mean loss: 0.4014751271855457
Epoch: 4, step: 548, loss: 0.369020938873291, mean loss: 0.4014699960885793
Epoch: 4, step: 549, loss: 0.37694114446640015, mean loss: 0.4014661186223096
Epoch: 4, step: 550, loss: 0.39726147055625916, mean loss: 0.4014654540659533
Epoch: 4, step: 551, loss: 0.3291662931442261, mean loss: 0.40145402878767866
Epoch: 4, step: 552, loss: 0.3322961628437042, mean loss: 0.401443101648171
Epoch: 4, step: 553, loss: 0.34281033277511597, mean loss: 0.4014338389674643
Epoch: 4, step: 554, loss: 0.3455864191055298, mean loss: 0.4014250177038627
Epoch: 4, step: 555, loss: 0.4037446081638336, mean loss: 0.4014253840321097
Epoch: 4, step: 556, loss: 0.35253581404685974, mean loss: 0.4014176642200167
Epoch: 4, step: 557, loss: 0.3394685685634613, mean loss: 0.4014078838133769
Epoch: 4, step: 558, loss: 0.3484683632850647, mean loss: 0.4013995271408389
Epoch: 4, step: 559, loss: 0.34580400586128235, mean loss: 0.40139075259518237
Epoch: 4, step: 560, loss: 0.404901921749115, mean loss: 0.40139130666953204
Epoch: 4, step: 561, loss: 0.3567012548446655, mean loss: 0.401384255541128
Epoch: 4, step: 562, loss: 0.37787577509880066, mean loss: 0.4013805469939688
Epoch: 4, step: 563, loss: 0.39870116114616394, mean loss: 0.4013801243779045
Epoch: 4, step: 564, loss: 0.3387891352176666, mean loss: 0.40137025353905253
Epoch: 4, step: 565, loss: 0.3403218686580658, mean loss: 0.4013606274928714
Epoch: 4, step: 566, loss: 0.36773067712783813, mean loss: 0.40135532559308185
Epoch: 4, step: 567, loss: 0.36239224672317505, mean loss: 0.4013491838719485
Epoch: 4, step: 568, loss: 0.4036486744880676, mean loss: 0.40134954628181707
Epoch: 4, step: 569, loss: 0.3743235766887665, mean loss: 0.401345287540942
Epoch: 4, step: 570, loss: 0.38521233201026917, mean loss: 0.40134274571716216
Epoch: 4, step: 571, loss: 0.32725998759269714, mean loss: 0.40133107546540975
Epoch: 4, step: 572, loss: 0.32775065302848816, mean loss: 0.4013194861722239
Epoch: 4, step: 573, loss: 0.36060836911201477, mean loss: 0.40131307497268687
Epoch: 4, step: 574, loss: 0.34955960512161255, mean loss: 0.4013049261032409
Epoch: 4, step: 575, loss: 0.3577502965927124, mean loss: 0.40129806926610134
Epoch: 4, step: 576, loss: 0.3533276915550232, mean loss: 0.4012905184432285
Epoch: 4, step: 577, loss: 0.33134523034095764, mean loss: 0.4012795103714466
Epoch: 4, step: 578, loss: 0.3508652150630951, mean loss: 0.4012715773588096
Epoch: 4, step: 579, loss: 0.4197981655597687, mean loss: 0.40127449217759514
Epoch: 4, step: 580, loss: 0.37530598044395447, mean loss: 0.4012704071513668
Epoch: 4, step: 581, loss: 0.3699151277542114, mean loss: 0.40126547552516406
Epoch: 4, step: 582, loss: 0.3594132959842682, mean loss: 0.40125889395895226
Epoch: 4, step: 583, loss: 0.34021222591400146, mean loss: 0.40124929542624077
Epoch: 4, step: 584, loss: 0.3781159520149231, mean loss: 0.4012456586799098
Epoch: 4, step: 585, loss: 0.3487611413002014, mean loss: 0.40123740899154453
Epoch: 4, step: 586, loss: 0.3347037434577942, mean loss: 0.40122695265561276
Epoch: 4, step: 587, loss: 0.3555595874786377, mean loss: 0.40121977676542153
Epoch: 4, step: 588, loss: 0.34548500180244446, mean loss: 0.4012110203200228
Epoch: 4, step: 589, loss: 0.34141212701797485, mean loss: 0.4012016268400822
Epoch: 4, step: 590, loss: 0.4630899727344513, mean loss: 0.4012113470137738
Epoch: 4, step: 591, loss: 0.32257309556007385, mean loss: 0.40119899804212594
Epoch: 4, step: 592, loss: 0.37579187750816345, mean loss: 0.4011950088569267
Epoch: 4, step: 593, loss: 0.36897075176239014, mean loss: 0.40118995010385067
Epoch: 4, step: 594, loss: 0.34549325704574585, mean loss: 0.4011812078823693
Epoch: 4, step: 595, loss: 0.3802473247051239, mean loss: 0.4011779225899686
Epoch: 4, step: 596, loss: 0.3618968427181244, mean loss: 0.4011717589182485
Epoch: 4, step: 597, loss: 0.31807684898376465, mean loss: 0.40115872237762495
Epoch: 4, step: 598, loss: 0.33870378136634827, mean loss: 0.401148925524133
Epoch: 4, step: 599, loss: 0.35125282406806946, mean loss: 0.4011410999122359
Epoch: 4, step: 600, loss: 0.4350684583187103, mean loss: 0.4011464201817053
Epoch: 4, step: 601, loss: 0.3568529188632965, mean loss: 0.4011394754496077
Epoch: 4, step: 602, loss: 0.3869325518608093, mean loss: 0.4011372483099951
Epoch: 4, step: 603, loss: 0.38792911171913147, mean loss: 0.4011351780691501
Epoch: 4, step: 604, loss: 0.42527759075164795, mean loss: 0.4011389615533505
Epoch: 4, step: 605, loss: 0.3849306106567383, mean loss: 0.40113642185562304
Epoch: 4, step: 606, loss: 0.3544398248195648, mean loss: 0.4011291060798066
Epoch: 4, step: 607, loss: 0.34234344959259033, mean loss: 0.4011198978002817
Epoch: 4, step: 608, loss: 0.32720333337783813, mean loss: 0.4011083212044442
Epoch: 4, step: 609, loss: 0.3570087254047394, mean loss: 0.40110141553645173
Epoch: 4, step: 610, loss: 0.3852020800113678, mean loss: 0.4010989262088292
Epoch: 4, step: 611, loss: 0.3410778343677521, mean loss: 0.4010895302958923
Epoch: 4, step: 612, loss: 0.34701812267303467, mean loss: 0.40108106709232005
Epoch: 4, step: 613, loss: 0.33173632621765137, mean loss: 0.4010702150201957
Epoch: 4, step: 614, loss: 0.3735748529434204, mean loss: 0.401065912819902
Epoch: 4, step: 615, loss: 0.35849234461784363, mean loss: 0.40105925237431345
Epoch: 4, step: 616, loss: 0.3472907245159149, mean loss: 0.40105084184281675
Epoch: 4, step: 617, loss: 0.3331233561038971, mean loss: 0.4010402182135176
Epoch: 4, step: 618, loss: 0.33610543608665466, mean loss: 0.4010300642210036
Epoch: 4, step: 619, loss: 0.36496683955192566, mean loss: 0.4010244258181473
Epoch: 4, step: 620, loss: 0.3573641777038574, mean loss: 0.40101760070510767
Epoch: 4, step: 621, loss: 0.3426368236541748, mean loss: 0.40100847585717847
Epoch: 4, step: 622, loss: 0.3426571488380432, mean loss: 0.40099935703751616
Epoch: 4, step: 623, loss: 0.3680529296398163, mean loss: 0.40099420915823525
Epoch: 4, step: 624, loss: 0.36274611949920654, mean loss: 0.4009882338278714
Epoch: 4, step: 625, loss: 0.33935385942459106, mean loss: 0.40097860646542166
Epoch: 4, step: 626, loss: 0.3217833638191223, mean loss: 0.4009662380064733
Epoch: 4, step: 627, loss: 0.3562104105949402, mean loss: 0.40095924927639653
Epoch: 4, step: 628, loss: 0.3299424946308136, mean loss: 0.4009481615707532
Epoch: 4, step: 629, loss: 0.3324998617172241, mean loss: 0.4009374765411164
Epoch: 4, step: 630, loss: 0.3744683861732483, mean loss: 0.4009333452643304
Epoch: 4, step: 631, loss: 0.36705681681632996, mean loss: 0.4009280586650095
Epoch: 4, step: 632, loss: 0.35486626625061035, mean loss: 0.4009208716167314
Epoch: 4, step: 633, loss: 0.35332435369491577, mean loss: 0.40091344626292147
Epoch: 4, step: 634, loss: 0.33416640758514404, mean loss: 0.40090303493260204
Epoch: 4, step: 635, loss: 0.34114742279052734, mean loss: 0.4008937155919685
Epoch: 4, step: 636, loss: 0.3921278119087219, mean loss: 0.4008923486960254
Epoch: 4, step: 637, loss: 0.3296664357185364, mean loss: 0.40088124393877916
Epoch: 4, step: 638, loss: 0.36540868878364563, mean loss: 0.40087571431209873
Epoch: 4, step: 639, loss: 0.33753708004951477, mean loss: 0.4008658423304493
Epoch: 4, step: 640, loss: 0.353665292263031, mean loss: 0.40085848678267505
Epoch: 4, step: 641, loss: 0.34060317277908325, mean loss: 0.4008490982949836
Epoch: 4, step: 642, loss: 0.32681313157081604, mean loss: 0.4008375644163851
Epoch: 4, step: 643, loss: 0.35345137119293213, mean loss: 0.40083018338940324
Epoch: 4, step: 644, loss: 0.35329964756965637, mean loss: 0.40082278103216606
Epoch: 4, step: 645, loss: 0.3189934492111206, mean loss: 0.4008100389998053
Epoch: 4, step: 646, loss: 0.33813345432281494, mean loss: 0.4008002808517939
Epoch: 4, step: 647, loss: 0.34177252650260925, mean loss: 0.40079109222253656
Epoch: 4, step: 648, loss: 0.42308416962623596, mean loss: 0.4007945619622103
Epoch: 4, step: 649, loss: 0.35608312487602234, mean loss: 0.40078760406661645
Epoch: 4, step: 650, loss: 0.3952934443950653, mean loss: 0.40078674921059165
Epoch: 4, step: 651, loss: 0.4171045124530792, mean loss: 0.40078928775496664
Epoch: 4, step: 652, loss: 0.35371509194374084, mean loss: 0.40078196559042917
Epoch: 4, step: 653, loss: 0.338652104139328, mean loss: 0.4007723030925363
Epoch: 4, step: 654, loss: 0.3896160125732422, mean loss: 0.4007705683249233
Epoch: 4, step: 655, loss: 0.3233982026576996, mean loss: 0.4007585390392163
Epoch: 4, step: 656, loss: 0.38185784220695496, mean loss: 0.40075560095483387
Epoch: 4, step: 657, loss: 0.357197105884552, mean loss: 0.4007488309058643
Epoch: 4, step: 658, loss: 0.35942012071609497, mean loss: 0.4007424084178783
Epoch: 4, step: 659, loss: 0.35340049862861633, mean loss: 0.4007350526208321
Epoch: 4, step: 660, loss: 0.34822672605514526, mean loss: 0.400726895354005
Epoch: 4, step: 661, loss: 0.3287127912044525, mean loss: 0.40071570956584884
Epoch: 4, step: 662, loss: 0.3537507653236389, mean loss: 0.4007084157400619
Epoch: 4, step: 663, loss: 0.3756045401096344, mean loss: 0.40070451762272796
Epoch: 4, step: 664, loss: 0.3610065281391144, mean loss: 0.400698354295685
Epoch: 4, step: 665, loss: 0.32381671667099, mean loss: 0.40068641985954334
Epoch: 4, step: 666, loss: 0.37494489550590515, mean loss: 0.40068242458958314
Epoch: 4, step: 667, loss: 0.375408411026001, mean loss: 0.40067850248940257
Epoch: 4, step: 668, loss: 0.32837462425231934, mean loss: 0.40066728388921063
Epoch: 4, step: 669, loss: 0.33637991547584534, mean loss: 0.4006573106704062
Epoch: 4, step: 670, loss: 0.34679651260375977, mean loss: 0.400648956273312
Epoch: 4, step: 671, loss: 0.3581715226173401, mean loss: 0.40064236858198815
Epoch: 4, step: 672, loss: 0.3295239508152008, mean loss: 0.4006313407609668
Epoch: 4, step: 673, loss: 0.33913007378578186, mean loss: 0.4006218056808156
Epoch: 4, step: 674, loss: 0.3530478775501251, mean loss: 0.40061443102136274
Epoch: 4, step: 675, loss: 0.3729226589202881, mean loss: 0.4006101390542051
Epoch: 4, step: 676, loss: 0.4093441069126129, mean loss: 0.40061149252822625
Epoch: 4, step: 677, loss: 0.4009738564491272, mean loss: 0.4006115486738601
Epoch: 4, step: 678, loss: 0.34655386209487915, mean loss: 0.40060317412907637
Epoch: 4, step: 679, loss: 0.4224224090576172, mean loss: 0.4006065538123057
Epoch: 4, step: 680, loss: 0.34829622507095337, mean loss: 0.40059845247596665
Epoch: 4, step: 681, loss: 0.3902122378349304, mean loss: 0.40059684420488567
Epoch: 4, step: 682, loss: 0.3570997416973114, mean loss: 0.40059010986481636
Epoch: 4, step: 683, loss: 0.3127775192260742, mean loss: 0.40057651658453175
Epoch: 4, step: 684, loss: 0.3212296664714813, mean loss: 0.40056423569146365
Epoch: 4, step: 685, loss: 0.3638250231742859, mean loss: 0.4005585502670568
Epoch: 4, step: 686, loss: 0.37350648641586304, mean loss: 0.40055436458488886
Epoch: 4, step: 687, loss: 0.3471791446208954, mean loss: 0.40054610727982015
Epoch: 4, step: 688, loss: 0.33835145831108093, mean loss: 0.40053648707116296
Epoch: 4, step: 689, loss: 0.3465881943702698, mean loss: 0.4005281436915309
Epoch: 4, step: 690, loss: 0.35286745429039, mean loss: 0.4005207738617178
Epoch: 4, step: 691, loss: 0.3481959402561188, mean loss: 0.40051268406060375
Epoch: 4, step: 692, loss: 0.36178430914878845, mean loss: 0.4005066972968208
Epoch: 4, step: 693, loss: 0.34933584928512573, mean loss: 0.4004987883558607
Epoch: 4, step: 694, loss: 0.3474436402320862, mean loss: 0.40049058944562677
Epoch: 4, step: 695, loss: 0.30992358922958374, mean loss: 0.4004765957805748
Epoch: 4, step: 696, loss: 0.32830098271369934, mean loss: 0.40046544552365115
Epoch: 4, step: 697, loss: 0.34308192133903503, mean loss: 0.40045658183440425
Epoch: 4, step: 698, loss: 0.34187158942222595, mean loss: 0.40044753395912824
Epoch: 4, step: 699, loss: 0.38915133476257324, mean loss: 0.4004457896417724
Epoch: 4, step: 700, loss: 0.33895543217658997, mean loss: 0.4004362959938698
Epoch: 4, step: 701, loss: 0.3516336679458618, mean loss: 0.4004287623989257
Epoch: 4, step: 702, loss: 0.35421791672706604, mean loss: 0.40042162999490166
Epoch: 4, step: 703, loss: 0.32557588815689087, mean loss: 0.4004100797260995
Epoch: 4, step: 704, loss: 0.3746834397315979, mean loss: 0.40040611017819105
Epoch: 4, step: 705, loss: 0.3710823655128479, mean loss: 0.40040158630520967
Epoch: 4, step: 706, loss: 0.3564012050628662, mean loss: 0.4003947992650674
Epoch: 4, step: 707, loss: 0.3409462571144104, mean loss: 0.4003856307668949
Epoch: 4, step: 708, loss: 0.3515687882900238, mean loss: 0.4003781031119254
Epoch: 4, step: 709, loss: 0.3500683605670929, mean loss: 0.40037034644486635
Epoch: 4, step: 710, loss: 0.3258078694343567, mean loss: 0.4003588523062799
Epoch: 4, step: 711, loss: 0.32485273480415344, mean loss: 0.40034721449532085
Epoch: 4, step: 712, loss: 0.44036000967025757, mean loss: 0.4003533807451552
Epoch: 4, step: 713, loss: 0.3819360136985779, mean loss: 0.40035054293821426
Epoch: 4, step: 714, loss: 0.34032002091407776, mean loss: 0.40034129466799023
Epoch: 4, step: 715, loss: 0.39420098066329956, mean loss: 0.4003403488402015
Epoch: 4, step: 716, loss: 0.3920342028141022, mean loss: 0.40033906959393223
Epoch: 4, step: 717, loss: 0.34143462777137756, mean loss: 0.40032999899925675
Epoch: 4, step: 718, loss: 0.3336543142795563, mean loss: 0.4003197333049196
Epoch: 4, step: 719, loss: 0.3691007196903229, mean loss: 0.40031492742228186
Epoch: 4, step: 720, loss: 0.34743815660476685, mean loss: 0.4003067887781665
Epoch: 4, step: 721, loss: 0.3151489198207855, mean loss: 0.4002936835351752
Epoch: 4, step: 722, loss: 0.34584885835647583, mean loss: 0.40028530611939145
Epoch: 4, step: 723, loss: 0.3864312469959259, mean loss: 0.40028317472568015
Epoch: 4, step: 724, loss: 0.358531653881073, mean loss: 0.40027675240283067
Epoch: 4, step: 725, loss: 0.324851393699646, mean loss: 0.40026515207082464
Epoch: 4, step: 726, loss: 0.3458554148674011, mean loss: 0.4002567852036551
Epoch: 4, step: 727, loss: 0.3380591571331024, mean loss: 0.4002472222227094
Epoch: 4, step: 728, loss: 0.34358304738998413, mean loss: 0.4002385113580157
Epoch: 4, step: 729, loss: 0.36663901805877686, mean loss: 0.40023334697232565
Epoch: 4, step: 730, loss: 0.40295326709747314, mean loss: 0.4002337649714228
Epoch: 4, step: 731, loss: 0.4034267067909241, mean loss: 0.4002342555894037
Epoch: 4, step: 732, loss: 0.34538033604621887, mean loss: 0.4002258281935605
Epoch: 4, step: 733, loss: 0.4013616442680359, mean loss: 0.4002260026660758
Epoch: 4, step: 734, loss: 0.36326614022254944, mean loss: 0.4002203261398212
Epoch: 4, step: 735, loss: 0.32446807622909546, mean loss: 0.4002086934233116
Epoch: 4, step: 736, loss: 0.34540095925331116, mean loss: 0.40020027829446625
Epoch: 4, step: 737, loss: 0.37001317739486694, mean loss: 0.40019564410642516
Epoch: 4, step: 738, loss: 0.3815648555755615, mean loss: 0.40019278443051864
Epoch: 4, step: 739, loss: 0.3532622158527374, mean loss: 0.40018558207192784
Epoch: 4, step: 740, loss: 0.4013528823852539, mean loss: 0.40018576118813365
Epoch: 4, step: 741, loss: 0.3490135669708252, mean loss: 0.4001779102838352
Epoch: 4, step: 742, loss: 0.3495851159095764, mean loss: 0.4001701494624862
Epoch: 4, step: 743, loss: 0.35742631554603577, mean loss: 0.40016359365973825
Epoch: 4, step: 744, loss: 0.3383423984050751, mean loss: 0.40015411333536244
Epoch: 4, step: 745, loss: 0.33025044202804565, mean loss: 0.400143395201154
Epoch: 4, step: 746, loss: 0.30993741750717163, mean loss: 0.40012956629149676
Epoch: 4, step: 747, loss: 0.4188675582408905, mean loss: 0.40013243845457913
Epoch: 4, step: 748, loss: 0.3151087462902069, mean loss: 0.40011940800367274
Epoch: 4, step: 749, loss: 0.3576539158821106, mean loss: 0.4001129008795352
Epoch: 4, step: 750, loss: 0.35026586055755615, mean loss: 0.4001052638272414
Epoch: 4, step: 751, loss: 0.34449610114097595, mean loss: 0.40009674526678085
Epoch: 4, step: 752, loss: 0.3422851860523224, mean loss: 0.4000878906858015
Epoch: 4, step: 753, loss: 0.3434283137321472, mean loss: 0.4000792138746294
Epoch: 4, step: 754, loss: 0.3200749158859253, mean loss: 0.40006696394383956
Epoch: 4, step: 755, loss: 0.31040507555007935, mean loss: 0.4000532373840732
Epoch: 4, step: 756, loss: 0.3545866012573242, mean loss: 0.40004627784999597
Epoch: 4, step: 757, loss: 0.38837143778800964, mean loss: 0.4000444910670051
Epoch: 4, step: 758, loss: 0.41019803285598755, mean loss: 0.4000460447841878
Epoch: 4, step: 759, loss: 0.3987431824207306, mean loss: 0.4000458454478409
Epoch: 4, step: 760, loss: 0.37249448895454407, mean loss: 0.40004163076886073
Epoch: 4, step: 761, loss: 0.32804274559020996, mean loss: 0.4000306183973131
Epoch: 4, step: 762, loss: 0.33672070503234863, mean loss: 0.40002093650201337
Epoch: 4, step: 763, loss: 0.3498018682003021, mean loss: 0.4000132577453923
Epoch: 4, step: 764, loss: 0.3521984815597534, mean loss: 0.40000594773527376
Epoch: 4, step: 765, loss: 0.3449033200740814, mean loss: 0.3999975248328492
Epoch: 4, step: 766, loss: 0.3660198450088501, mean loss: 0.3999923318510635
Epoch: 4, step: 767, loss: 0.3588395416736603, mean loss: 0.3999860432217576
Epoch: 4, step: 768, loss: 0.37310990691185, mean loss: 0.39998193686021294
Epoch: 4, step: 769, loss: 0.43753868341445923, mean loss: 0.3999876742183789
Epoch: 4, step: 770, loss: 0.32484155893325806, mean loss: 0.3999761962719477
Epoch: 4, step: 771, loss: 0.35952240228652954, mean loss: 0.3999700182337703
Epoch: 4, step: 772, loss: 0.34480634331703186, mean loss: 0.3999615950126806
Epoch: 4, step: 773, loss: 0.3384277820587158, mean loss: 0.3999522005374204
Epoch: 4, step: 774, loss: 0.34955182671546936, mean loss: 0.3999445069984459
Epoch: 4, step: 775, loss: 0.37528491020202637, mean loss: 0.3999407433237212
Epoch: 4, step: 776, loss: 0.3565073609352112, mean loss: 0.39993411530870693
Epoch: 4, step: 777, loss: 0.37188485264778137, mean loss: 0.3999298355920971
Epoch: 4, step: 778, loss: 0.35551726818084717, mean loss: 0.3999230602194943
Epoch: 4, step: 779, loss: 0.3435969352722168, mean loss: 0.39991446868121683
Epoch: 4, step: 780, loss: 0.37009817361831665, mean loss: 0.39990992143475307
Epoch: 4, step: 781, loss: 0.4037066102027893, mean loss: 0.39991050037479087
Epoch: 4, step: 782, loss: 0.33540526032447815, mean loss: 0.3999006657597504
Epoch: 4, step: 783, loss: 0.3290758728981018, mean loss: 0.3998898692974239
Epoch: 4, step: 784, loss: 0.3512929081916809, mean loss: 0.39988246235319197
Epoch: 4, step: 785, loss: 0.346261203289032, mean loss: 0.3998742908720789
Epoch: 4, step: 786, loss: 0.3419575095176697, mean loss: 0.3998654661301385
Epoch: 4, step: 787, loss: 0.38088884949684143, mean loss: 0.3998625751160262
Epoch: 4, step: 788, loss: 0.33537477254867554, mean loss: 0.3998527521453381
Epoch: 4, step: 789, loss: 0.3553665578365326, mean loss: 0.3998459769101403
Epoch: 4, step: 790, loss: 0.3412637412548065, mean loss: 0.39983705621032983
Epoch: 4, step: 791, loss: 0.35004934668540955, mean loss: 0.39982947586478707
Epoch: 4, step: 792, loss: 0.3435971438884735, mean loss: 0.3998209156072172
Epoch: 4, step: 793, loss: 0.40089255571365356, mean loss: 0.39982107871834455
Epoch: 4, step: 794, loss: 0.3693263828754425, mean loss: 0.3998164379184902
Epoch: 4, step: 795, loss: 0.28651341795921326, mean loss: 0.3997991976537368
Epoch: 4, step: 796, loss: 0.39306268095970154, mean loss: 0.3997981727767105
Epoch: 4, step: 797, loss: 0.31769824028015137, mean loss: 0.399785684195558
Epoch: 4, step: 798, loss: 0.3878710865974426, mean loss: 0.3997838720894594
Epoch: 4, step: 799, loss: 0.38005927205085754, mean loss: 0.3997808726064852
Epoch: 4, step: 800, loss: 0.3376702666282654, mean loss: 0.3997714289990687
Epoch: 4, step: 801, loss: 0.3566814363002777, mean loss: 0.3997648783768889
Epoch: 4, step: 802, loss: 0.34663963317871094, mean loss: 0.39975680340421854
Epoch: 4, step: 803, loss: 0.3439672589302063, mean loss: 0.3997483247500432
Epoch: 4, step: 804, loss: 0.3375999629497528, mean loss: 0.3997388811454542
Epoch: 4, step: 805, loss: 0.346699595451355, mean loss: 0.3997308229130485
Epoch: 4, step: 806, loss: 0.3833996653556824, mean loss: 0.39972834210527736
Epoch: 4, step: 807, loss: 0.3516368567943573, mean loss: 0.3997210378092095
Epoch: 4, step: 808, loss: 0.3173470199108124, mean loss: 0.39970852846708366
Epoch: 4, step: 809, loss: 0.3625100553035736, mean loss: 0.3997028803539401
Epoch: 4, step: 810, loss: 0.40157651901245117, mean loss: 0.3997031647988556
Epoch: 4, step: 811, loss: 0.319217711687088, mean loss: 0.39969094782054476
Epoch: 4, step: 812, loss: 0.3490150570869446, mean loss: 0.39968325683697614
Epoch: 4, step: 813, loss: 0.40697982907295227, mean loss: 0.39968436405582836
Epoch: 4, step: 814, loss: 0.3780168294906616, mean loss: 0.39968107661316943
Epoch: 4, step: 815, loss: 0.36721277236938477, mean loss: 0.39967615120293826
Epoch: 4, step: 816, loss: 0.3593598008155823, mean loss: 0.39967003617936975
Epoch: 4, step: 817, loss: 0.35993993282318115, mean loss: 0.3996640109892945
Epoch: 4, step: 818, loss: 0.3720731735229492, mean loss: 0.39965982738998196
Epoch: 4, step: 819, loss: 0.33138367533683777, mean loss: 0.39964947624503755
Epoch: 4, step: 820, loss: 0.32641148567199707, mean loss: 0.3996383745335667
Epoch: 4, step: 821, loss: 0.3242826461791992, mean loss: 0.3996269535380598
Epoch: 4, step: 822, loss: 0.37754786014556885, mean loss: 0.39962360771393607
Epoch: 4, step: 823, loss: 0.37607768177986145, mean loss: 0.3996200401494006
Epoch: 4, step: 824, loss: 0.33676886558532715, mean loss: 0.39961051868680947
Epoch: 4, step: 825, loss: 0.37370726466178894, mean loss: 0.3996065951403046
Epoch: 4, step: 826, loss: 0.38433682918548584, mean loss: 0.39960428259056135
Epoch: 4, step: 827, loss: 0.31903648376464844, mean loss: 0.3995920827421625
Epoch: 4, step: 828, loss: 0.38657665252685547, mean loss: 0.3995901122001163
Epoch: 4, step: 829, loss: 0.4057133197784424, mean loss: 0.3995910391161893
Epoch: 4, step: 830, loss: 0.35024741291999817, mean loss: 0.39958357073020534
Epoch: 4, step: 831, loss: 0.36127743124961853, mean loss: 0.3995777737962646
Epoch: 4, step: 832, loss: 0.3713587522506714, mean loss: 0.39957350400937613
Epoch: 4, step: 833, loss: 0.3431957960128784, mean loss: 0.39956497485536757
Epoch: 4, step: 834, loss: 0.3634042739868164, mean loss: 0.39955950507759286
Epoch: 4, step: 835, loss: 0.362037718296051, mean loss: 0.3995538302762042
Epoch: 4, step: 836, loss: 0.3974403738975525, mean loss: 0.3995535106850385
Epoch: 4, step: 837, loss: 0.35243040323257446, mean loss: 0.3995463859333826
Epoch: 4, step: 838, loss: 0.36886316537857056, mean loss: 0.39954174750245974
Epoch: 4, step: 839, loss: 0.36785873770713806, mean loss: 0.3995369586557555
Epoch: 4, step: 840, loss: 0.3588491976261139, mean loss: 0.3995308096817447
Epoch: 4, step: 841, loss: 0.38415563106536865, mean loss: 0.3995284864453264
Epoch: 4, step: 842, loss: 0.408338338136673, mean loss: 0.3995298174396898
Epoch: 4, step: 843, loss: 0.405156672000885, mean loss: 0.3995306674177202
Epoch: 4, step: 844, loss: 0.34826549887657166, mean loss: 0.39952292460416616
Epoch: 4, step: 845, loss: 0.3512483239173889, mean loss: 0.3995156345708399
Epoch: 4, step: 846, loss: 0.37844160199165344, mean loss: 0.39951245262420254
Epoch: 4, step: 847, loss: 0.350142240524292, mean loss: 0.39950499939169953
Epoch: 4, step: 848, loss: 0.3194500207901001, mean loss: 0.3994929156213446
Epoch: 4, step: 849, loss: 0.37037432193756104, mean loss: 0.3994885210252559
Epoch: 4, step: 850, loss: 0.41022568941116333, mean loss: 0.39949014124079624
Epoch: 4, step: 851, loss: 0.3844899535179138, mean loss: 0.39948787808634195
Epoch: 4, step: 852, loss: 0.37055808305740356, mean loss: 0.3994835139597725
Epoch: 4, step: 853, loss: 0.3307015299797058, mean loss: 0.3994731396032144
Epoch: 4, step: 854, loss: 0.3760404586791992, mean loss: 0.3994696057952029
Epoch: 4, step: 855, loss: 0.3364967703819275, mean loss: 0.39946011049432634
Epoch: 4, step: 856, loss: 0.3478333353996277, mean loss: 0.39945232717228585
Epoch: 4, step: 857, loss: 0.3396896421909332, mean loss: 0.39944331862767
Epoch: 4, step: 858, loss: 0.37323513627052307, mean loss: 0.3994393686378649
Epoch: 4, step: 859, loss: 0.34754055738449097, mean loss: 0.39943154784050905
Epoch: 4, step: 860, loss: 0.37052202224731445, mean loss: 0.3994271920283058
Epoch: 4, step: 861, loss: 0.31569692492485046, mean loss: 0.3994145782489892
Epoch: 4, step: 862, loss: 0.3275562524795532, mean loss: 0.39940375458190536
Epoch: 4, step: 863, loss: 0.3527168333530426, mean loss: 0.3993967234190697
Epoch: 4, step: 864, loss: 0.4093881845474243, mean loss: 0.39939822793060836
Epoch: 4, step: 865, loss: 0.38462284207344055, mean loss: 0.3993960033919367
Epoch: 4, step: 866, loss: 0.34424418210983276, mean loss: 0.3993877011457705
Epoch: 4, step: 867, loss: 0.3614520728588104, mean loss: 0.39938199138835223
Epoch: 4, step: 868, loss: 0.37342777848243713, mean loss: 0.3993780855624823
Epoch: 4, step: 869, loss: 0.36588847637176514, mean loss: 0.39937304650001
Epoch: 4, step: 870, loss: 0.3852805495262146, mean loss: 0.39937092637108357
Epoch: 4, step: 871, loss: 0.358213871717453, mean loss: 0.39936473547838597
Epoch: 4, step: 872, loss: 0.3442067801952362, mean loss: 0.3993564398015499
Epoch: 4, step: 873, loss: 0.4016270041465759, mean loss: 0.3993567812397973
Epoch: 4, step: 874, loss: 0.35720115900039673, mean loss: 0.3993504430016016
Epoch: 4, step: 875, loss: 0.3789204955101013, mean loss: 0.3993473717527304
Epoch: 4, step: 876, loss: 0.3211161196231842, mean loss: 0.3993356129593846
Epoch: 4, step: 877, loss: 0.341312438249588, mean loss: 0.39932689291509393
Epoch: 4, step: 878, loss: 0.33632683753967285, mean loss: 0.3993174263402817
Epoch: 4, step: 879, loss: 0.3495909571647644, mean loss: 0.3993099554164272
Epoch: 4, step: 880, loss: 0.3667512536048889, mean loss: 0.3993050645193547
Epoch: 4, step: 881, loss: 0.327206015586853, mean loss: 0.3992942355843994
Epoch: 4, step: 882, loss: 0.3484414517879486, mean loss: 0.3992865988846252
Epoch: 4, step: 883, loss: 0.35597047209739685, mean loss: 0.39928009496168415
Epoch: 4, step: 884, loss: 0.3590618669986725, mean loss: 0.3992740570953033
Epoch: 4, step: 885, loss: 0.42476335167884827, mean loss: 0.39927788316774154
Epoch: 4, step: 886, loss: 0.3565828204154968, mean loss: 0.39927147538404767
Epoch: 4, step: 887, loss: 0.39424923062324524, mean loss: 0.3992707217458783
Epoch: 4, step: 888, loss: 0.3952171504497528, mean loss: 0.39927011355813696
Epoch: 4, step: 889, loss: 0.3770448565483093, mean loss: 0.3992667794361733
Epoch: 4, step: 890, loss: 0.32944348454475403, mean loss: 0.3992563064655881
Epoch: 4, step: 891, loss: 0.3414011597633362, mean loss: 0.39924762992889007
Epoch: 4, step: 892, loss: 0.38124334812164307, mean loss: 0.3992449302315131
Epoch: 4, step: 893, loss: 0.39293718338012695, mean loss: 0.39924398454232995
Epoch: 4, step: 894, loss: 0.36465001106262207, mean loss: 0.39923879881702945
Epoch: 4, step: 895, loss: 0.3666537404060364, mean loss: 0.39923391496534916
Epoch: 4, step: 896, loss: 0.3458022177219391, mean loss: 0.39922590781755307
Epoch: 4, step: 897, loss: 0.36980730295181274, mean loss: 0.3992214998755594
Epoch: 4, step: 898, loss: 0.3573896288871765, mean loss: 0.39921523292859484
Epoch: 4, step: 899, loss: 0.3805125057697296, mean loss: 0.3992124314416028
Epoch: 4, step: 900, loss: 0.4013257324695587, mean loss: 0.3992127479461749
Epoch: 4, step: 901, loss: 0.33645474910736084, mean loss: 0.3992033502224794
Epoch: 4, step: 902, loss: 0.38384318351745605, mean loss: 0.3992010504520489
Epoch: 4, step: 903, loss: 0.3319142758846283, mean loss: 0.39919097758160466
Epoch: 4, step: 904, loss: 0.34090352058410645, mean loss: 0.39918225322043155
Epoch: 4, step: 905, loss: 0.31498169898986816, mean loss: 0.39916965211982836
Epoch: 4, step: 906, loss: 0.3076570928096771, mean loss: 0.39915595878460314
Epoch: 4, step: 907, loss: 0.33892199397087097, mean loss: 0.3991469471202085
Epoch: 4, step: 908, loss: 0.3193524479866028, mean loss: 0.39913501077030067
Epoch: 4, step: 909, loss: 0.33252817392349243, mean loss: 0.3991250486349661
Epoch: 4, step: 910, loss: 0.3665813207626343, mean loss: 0.3991201819192681
Epoch: 4, step: 911, loss: 0.3415502905845642, mean loss: 0.39911157398097047
Epoch: 4, step: 912, loss: 0.3644375801086426, mean loss: 0.3991063902473971
Epoch: 4, step: 913, loss: 0.3284529149532318, mean loss: 0.3990958291898045
Epoch: 4, step: 914, loss: 0.3812859058380127, mean loss: 0.3990931674167733
Epoch: 4, step: 915, loss: 0.33043625950813293, mean loss: 0.3990829078668766
Epoch: 4, step: 916, loss: 0.363190233707428, mean loss: 0.3990775451484903
Epoch: 4, step: 917, loss: 0.33654335141181946, mean loss: 0.39906820332092285
Epoch: 4, step: 918, loss: 0.3076503276824951, mean loss: 0.3990545486718357
Epoch: 4, step: 919, loss: 0.3621816635131836, mean loss: 0.39904904196855634
Epoch: 4, step: 920, loss: 0.35555344820022583, mean loss: 0.3990425471807755
Epoch: 4, step: 921, loss: 0.35185927152633667, mean loss: 0.39903550279802624
Epoch: 4, step: 922, loss: 0.33305320143699646, mean loss: 0.3990256532232597
Epoch: 4, step: 923, loss: 0.398873895406723, mean loss: 0.39902563057283935
Epoch: 4, step: 924, loss: 0.33161455392837524, mean loss: 0.39901557071958693
Epoch: 4, step: 925, loss: 0.4254833161830902, mean loss: 0.39901951995048274
Epoch: 4, step: 926, loss: 0.37936893105506897, mean loss: 0.39901658833942866
Epoch: 4, step: 927, loss: 0.365328848361969, mean loss: 0.399011563318549
Epoch: 4, step: 928, loss: 0.39383941888809204, mean loss: 0.399010791932355
Epoch: 4, step: 929, loss: 0.31594881415367126, mean loss: 0.3989984057143743
Epoch: 4, step: 930, loss: 0.33574435114860535, mean loss: 0.3989889746640439
Epoch: 4, step: 931, loss: 0.3740236759185791, mean loss: 0.39898525294389703
Epoch: 4, step: 932, loss: 0.32708272337913513, mean loss: 0.39897453561947244
Epoch: 4, step: 933, loss: 0.3765135109424591, mean loss: 0.3989711882238425
Epoch: 4, step: 934, loss: 0.3493104577064514, mean loss: 0.39896378832360146
Epoch: 4, step: 935, loss: 0.3519528806209564, mean loss: 0.39895678431470655
Epoch: 4, step: 936, loss: 0.37592488527297974, mean loss: 0.3989533533748821
Epoch: 4, step: 937, loss: 0.3885335922241211, mean loss: 0.3989518014295215
Epoch: 4, step: 938, loss: 0.36246809363365173, mean loss: 0.3989463682638036
Epoch: 4, step: 939, loss: 0.39098912477493286, mean loss: 0.39894518344493984
Epoch: 4, step: 940, loss: 0.3555072546005249, mean loss: 0.39893871658044017
Epoch: 4, step: 941, loss: 0.36778542399406433, mean loss: 0.3989340792936604
Epoch: 4, step: 942, loss: 0.3916693925857544, mean loss: 0.39893299807819566
Epoch: 4, step: 943, loss: 0.37013575434684753, mean loss: 0.398928712774069
Epoch: 4, step: 944, loss: 0.32006773352622986, mean loss: 0.3989169792553593
Epoch: 4, step: 945, loss: 0.33477672934532166, mean loss: 0.39890743741514656
Epoch: 4, step: 946, loss: 0.3792870342731476, mean loss: 0.39890451901515517
Epoch: 4, step: 947, loss: 0.4219002425670624, mean loss: 0.3989079389621438
Epoch: 4, step: 948, loss: 0.355963796377182, mean loss: 0.39890155321603454
Epoch: 4, step: 949, loss: 0.32676851749420166, mean loss: 0.3988908287087907
Epoch: 4, step: 950, loss: 0.35551315546035767, mean loss: 0.3988843804148635
Epoch: 4, step: 951, loss: 0.3520335555076599, mean loss: 0.3988774168558702
Epoch: 4, step: 952, loss: 0.35793909430503845, mean loss: 0.3988713329916183
Epoch: 4, step: 953, loss: 0.3998669981956482, mean loss: 0.39887148093592795
Epoch: 4, step: 954, loss: 0.3534536361694336, mean loss: 0.39886473337319334
Epoch: 4, step: 955, loss: 0.35434162616729736, mean loss: 0.3988581197209049
Epoch: 4, step: 956, loss: 0.37189650535583496, mean loss: 0.39885411532251414
Epoch: 4, step: 957, loss: 0.3980518877506256, mean loss: 0.39885399619160056
Epoch: 4, step: 958, loss: 0.312274307012558, mean loss: 0.39884114100389767
Epoch: 4, step: 959, loss: 0.37451186776161194, mean loss: 0.39883752917592225
Epoch: 4, step: 960, loss: 0.3570922017097473, mean loss: 0.39883133274910526
Epoch: 4, step: 961, loss: 0.34768232703208923, mean loss: 0.39882374162329387
Epoch: 4, step: 962, loss: 0.3789719343185425, mean loss: 0.3988207958142265
Epoch: 4, step: 963, loss: 0.35718974471092224, mean loss: 0.398814619100413
Epoch: 4, step: 964, loss: 0.3692202866077423, mean loss: 0.39881022890125967
Epoch: 4, step: 965, loss: 0.30978065729141235, mean loss: 0.39879702368446796
Epoch: 4, step: 966, loss: 0.3561100959777832, mean loss: 0.3987906931301588
Epoch: 4, step: 967, loss: 0.36204105615615845, mean loss: 0.39878524389573206
Epoch: 4, step: 968, loss: 0.35460227727890015, mean loss: 0.398778693418843
Epoch: 4, step: 969, loss: 0.37083888053894043, mean loss: 0.3987745517329728
Epoch: 4, step: 970, loss: 0.3426572382450104, mean loss: 0.39876623436029046
Epoch: 4, step: 971, loss: 0.3099905848503113, mean loss: 0.39875307851418645
Epoch: 4, step: 972, loss: 0.39230841398239136, mean loss: 0.398752123607603
Epoch: 4, step: 973, loss: 0.3216119110584259, mean loss: 0.3987406954279661
Epoch: 4, step: 974, loss: 0.3275791108608246, mean loss: 0.3987301545326073
Epoch: 4, step: 975, loss: 0.3684840798377991, mean loss: 0.3987256749599333
Epoch: 4, step: 976, loss: 0.37211599946022034, mean loss: 0.3987217345370842
Epoch: 4, step: 977, loss: 0.3245322108268738, mean loss: 0.39871075000588635
Epoch: 4, step: 978, loss: 0.35331371426582336, mean loss: 0.3987040294972646
Epoch: 4, step: 979, loss: 0.35374799370765686, mean loss: 0.398697375258693
Epoch: 4, step: 980, loss: 0.357618510723114, mean loss: 0.39869129580560203
Epoch: 4, step: 981, loss: 0.39872032403945923, mean loss: 0.3986913001009903
Epoch: 4, step: 982, loss: 0.39291122555732727, mean loss: 0.39869044493387334
Epoch: 4, step: 983, loss: 0.32916441559791565, mean loss: 0.3986801600182911
Epoch: 4, step: 984, loss: 0.3976523280143738, mean loss: 0.3986800079946254
Epoch: 4, step: 985, loss: 0.33940666913986206, mean loss: 0.39867124234262086
Epoch: 4, step: 986, loss: 0.35345810651779175, mean loss: 0.3986645569757977
Epoch: 4, step: 987, loss: 0.32537999749183655, mean loss: 0.39865372247557834
Epoch: 4, step: 988, loss: 0.370159775018692, mean loss: 0.3986495105099528
Epoch: 4, step: 989, loss: 0.38275739550590515, mean loss: 0.3986471616901177
Epoch: 4, step: 990, loss: 0.3312379717826843, mean loss: 0.39863720023158256
Epoch: 4, step: 991, loss: 0.3532795310020447, mean loss: 0.39863049844830395
Epoch: 4, step: 992, loss: 0.3497660160064697, mean loss: 0.398623279585482
Epoch: 4, step: 993, loss: 0.3545914590358734, mean loss: 0.39861677562380554
Epoch: 4, step: 994, loss: 0.33020299673080444, mean loss: 0.3986066716836353
Epoch: 4, step: 995, loss: 0.35271164774894714, mean loss: 0.39859989450939803
Epoch: 4, step: 996, loss: 0.3386082351207733, mean loss: 0.39859103703717175
Epoch: 4, step: 997, loss: 0.3250115215778351, mean loss: 0.39858017498883114
Epoch: 4, step: 998, loss: 0.38702285289764404, mean loss: 0.3985784691110317
Epoch: 4, step: 999, loss: 0.382205605506897, mean loss: 0.3985760528088469
Epoch: 4, step: 1000, loss: 0.3288835883140564, mean loss: 0.39856576913399155
Epoch: 4, step: 1001, loss: 0.34155935049057007, mean loss: 0.39855735862666736
Epoch: 4, step: 1002, loss: 0.30906805396080017, mean loss: 0.3985441576671356
Epoch: 4, step: 1003, loss: 0.3502793610095978, mean loss: 0.3985370389655637
Epoch: 4, step: 1004, loss: 0.37730610370635986, mean loss: 0.3985339080209745
Epoch: 4, step: 1005, loss: 0.3372066020965576, mean loss: 0.39852486536306764
Epoch: 4, step: 1006, loss: 0.3166074752807617, mean loss: 0.39851278849588756
Epoch: 4, step: 1007, loss: 0.4197014570236206, mean loss: 0.3985159118255644
Epoch: 4, step: 1008, loss: 0.3129327893257141, mean loss: 0.39850329824818786
Epoch: 4, step: 1009, loss: 0.38155338168144226, mean loss: 0.398500800470916
Epoch: 4, step: 1010, loss: 0.36961984634399414, mean loss: 0.3984965451365817
Epoch: 4, step: 1011, loss: 0.3294685482978821, mean loss: 0.3984863760150675
Epoch: 4, step: 1012, loss: 0.36656370759010315, mean loss: 0.3984816738986402
Epoch: 4, step: 1013, loss: 0.3492814600467682, mean loss: 0.3984744279172187
Epoch: 4, step: 1014, loss: 0.34286096692085266, mean loss: 0.39846623862830743
Epoch: 4, step: 1015, loss: 0.38945579528808594, mean loss: 0.39846491200237394
Epoch: 4, step: 1016, loss: 0.421891987323761, mean loss: 0.3984683607106503
Epoch: 4, step: 1017, loss: 0.3529060482978821, mean loss: 0.39846165445330367
Epoch: 4, step: 1018, loss: 0.377045601606369, mean loss: 0.39845850271631367
Epoch: 4, step: 1019, loss: 0.3527561128139496, mean loss: 0.39845177782080127
Epoch: 4, step: 1020, loss: 0.36789047718048096, mean loss: 0.39844728152822506
Epoch: 4, step: 1021, loss: 0.334419846534729, mean loss: 0.39843786295879385
Epoch: 4, step: 1022, loss: 0.3526808023452759, mean loss: 0.3984311329895905
Epoch: 4, step: 1023, loss: 0.35693612694740295, mean loss: 0.3984250307828196
Epoch: 4, step: 1024, loss: 0.4372030198574066, mean loss: 0.39843073258977074
Epoch: 4, step: 1025, loss: 0.3775634765625, mean loss: 0.39842766477794667
Epoch: 4, step: 1026, loss: 0.35459816455841064, mean loss: 0.39842122210556397
Epoch: 4, step: 1027, loss: 0.3399049937725067, mean loss: 0.3984126218368495
Epoch: 4, step: 1028, loss: 0.3761845529079437, mean loss: 0.39840935540497163
Epoch: 4, step: 1029, loss: 0.3411468267440796, mean loss: 0.39840094186858305
Epoch: 4, step: 1030, loss: 0.3679138123989105, mean loss: 0.3983964630777105
Epoch: 4, step: 1031, loss: 0.35222887992858887, mean loss: 0.3983896817053325
Epoch: 4, step: 1032, loss: 0.4038732945919037, mean loss: 0.3983904870530909
Epoch: 4, step: 1033, loss: 0.3455699682235718, mean loss: 0.39838273073608216
Epoch: 4, step: 1034, loss: 0.39712366461753845, mean loss: 0.3983825458783346
Epoch: 4, step: 1035, loss: 0.33905860781669617, mean loss: 0.39837383713816116
Epoch: 4, step: 1036, loss: 0.330247700214386, mean loss: 0.3983638377051766
Epoch: 4, step: 1037, loss: 0.3606259524822235, mean loss: 0.3983582994185281
Epoch: 4, step: 1038, loss: 0.3404472768306732, mean loss: 0.3983498018363435
Epoch: 4, step: 1039, loss: 0.35048577189445496, mean loss: 0.3983427795314811
Epoch: 4, step: 1040, loss: 0.43058180809020996, mean loss: 0.39834750874206626
Epoch: 4, step: 1041, loss: 0.3356861472129822, mean loss: 0.3983383181639599
Epoch: 4, step: 1042, loss: 0.3798218071460724, mean loss: 0.3983356027348621
Epoch: 4, step: 1043, loss: 0.3608885705471039, mean loss: 0.39833011196767915
Epoch: 4, step: 1044, loss: 0.3532046973705292, mean loss: 0.3983234963080109
Epoch: 4, step: 1045, loss: 0.3196384310722351, mean loss: 0.39831196229082594
Epoch: 4, step: 1046, loss: 0.3736928701400757, mean loss: 0.3983083540404741
Epoch: 4, step: 1047, loss: 0.32805970311164856, mean loss: 0.39829805968951737
Epoch: 4, step: 1048, loss: 0.37414196133613586, mean loss: 0.3982945203344473
Epoch: 4, step: 1049, loss: 0.3840840458869934, mean loss: 0.39829243851867707
Epoch: 4, step: 1050, loss: 0.36399564146995544, mean loss: 0.39828741481909474
Epoch: 4, step: 1051, loss: 0.34341734647750854, mean loss: 0.3982793787809662
Epoch: 4, step: 1052, loss: 0.39711177349090576, mean loss: 0.3982792078034746
Epoch: 4, step: 1053, loss: 0.33838385343551636, mean loss: 0.39827043835188336
Epoch: 4, step: 1054, loss: 0.35125452280044556, mean loss: 0.39826355562379795
Epoch: 4, step: 1055, loss: 0.3450287878513336, mean loss: 0.39825576364959236
Epoch: 4, step: 1056, loss: 0.3779745399951935, mean loss: 0.3982527955208562
Epoch: 4, step: 1057, loss: 0.3505457639694214, mean loss: 0.39824581468510095
Epoch: 4, step: 1058, loss: 0.35132914781570435, mean loss: 0.3982389505056029
Epoch: 4, step: 1059, loss: 0.334566593170166, mean loss: 0.39822963623448887
Epoch: 4, step: 1060, loss: 0.3461518883705139, mean loss: 0.3982220191878509
Epoch: 4, step: 1061, loss: 0.3544261157512665, mean loss: 0.3982156144052483
Epoch: 4, step: 1062, loss: 0.3329737186431885, mean loss: 0.3982060747217036
Epoch: 4, step: 1063, loss: 0.39121904969215393, mean loss: 0.39820505322681626
Epoch: 4, step: 1064, loss: 0.35132765769958496, mean loss: 0.39819820080823315
Epoch: 4, step: 1065, loss: 0.3667181432247162, mean loss: 0.39819359980595553
Epoch: 4, step: 1066, loss: 0.3614012598991394, mean loss: 0.3981882231670681
Epoch: 4, step: 1067, loss: 0.3401845693588257, mean loss: 0.39817974805692663
Epoch: 4, step: 1068, loss: 0.35631999373435974, mean loss: 0.39817363268010814
Epoch: 4, step: 1069, loss: 0.3433665335178375, mean loss: 0.3981656269688662
Epoch: 4, step: 1070, loss: 0.35628265142440796, mean loss: 0.3981595099868968
Epoch: 4, step: 1071, loss: 0.35545507073402405, mean loss: 0.3981532739414452
Epoch: 4, step: 1072, loss: 0.40925925970077515, mean loss: 0.39815489548995725
Epoch: 4, step: 1073, loss: 0.37053877115249634, mean loss: 0.3981508639389591
Epoch: 4, step: 1074, loss: 0.3310398757457733, mean loss: 0.39814106814444833
Epoch: 4, step: 1075, loss: 0.33636847138404846, mean loss: 0.39813205287930525
Epoch: 4, step: 1076, loss: 0.40286844968795776, mean loss: 0.39813274402140486
Epoch: 4, step: 1077, loss: 0.37557533383369446, mean loss: 0.3981294528906509
Epoch: 4, step: 1078, loss: 0.35592079162597656, mean loss: 0.39812329553671
Epoch: 4, step: 1079, loss: 0.38335973024368286, mean loss: 0.398121142157875
Epoch: 4, step: 1080, loss: 0.34744641184806824, mean loss: 0.3981137519390752
Epoch: 4, step: 1081, loss: 0.3485106825828552, mean loss: 0.39810651906223704
Epoch: 4, step: 1082, loss: 0.3278309106826782, mean loss: 0.398096273310906
Epoch: 4, step: 1083, loss: 0.365767240524292, mean loss: 0.3980915606239109
Epoch: 4, step: 1084, loss: 0.3455395996570587, mean loss: 0.3980839011047494
Epoch: 4, step: 1085, loss: 0.3429352939128876, mean loss: 0.3980758642922761
Epoch: 4, step: 1086, loss: 0.3728109896183014, mean loss: 0.3980721829758439
Epoch: 4, step: 1087, loss: 0.3584015965461731, mean loss: 0.3980664034615039
Epoch: 4, step: 1088, loss: 0.3502228856086731, mean loss: 0.398059434267352
Epoch: 4, step: 1089, loss: 0.3385332226753235, mean loss: 0.39805076455986704
Epoch: 4, step: 1090, loss: 0.3264107406139374, mean loss: 0.3980403320531034
Epoch: 4, step: 1091, loss: 0.3894483149051666, mean loss: 0.3980390810313871
Epoch: 4, step: 1092, loss: 0.3889603614807129, mean loss: 0.3980377593368827
Epoch: 4, step: 1093, loss: 0.3473874032497406, mean loss: 0.39803038665040713
Epoch: 4, step: 1094, loss: 0.35482195019721985, mean loss: 0.39802409812814643
Epoch: 4, step: 1095, loss: 0.3515073359012604, mean loss: 0.3980173290998829
Epoch: 4, step: 1096, loss: 0.3694666624069214, mean loss: 0.3980131750671908
Epoch: 4, step: 1097, loss: 0.30969399213790894, mean loss: 0.3980003267717399
Epoch: 4, step: 1098, loss: 0.4042564034461975, mean loss: 0.39800123674652893
Epoch: 4, step: 1099, loss: 0.36489924788475037, mean loss: 0.39799642261202317
Epoch: 4, step: 1100, loss: 0.4207451045513153, mean loss: 0.3979997305489054
Epoch: 4, step: 1101, loss: 0.31525853276252747, mean loss: 0.39798770071497314
Epoch: 4, step: 1102, loss: 0.34556844830513, mean loss: 0.39798008053000294
Epoch: 4, step: 1103, loss: 0.36837491393089294, mean loss: 0.39797577745346235
Epoch: 4, step: 1104, loss: 0.35469019412994385, mean loss: 0.397969486858589
Epoch: 4, step: 1105, loss: 0.36357834935188293, mean loss: 0.3979644895994337
Epoch: 4, step: 1106, loss: 0.3295283317565918, mean loss: 0.3979545468189829
Epoch: 4, step: 1107, loss: 0.3550790548324585, mean loss: 0.39794831853717194
Epoch: 4, step: 1108, loss: 0.38278353214263916, mean loss: 0.3979461159538176
Epoch: 4, step: 1109, loss: 0.34662672877311707, mean loss: 0.3979386632400243
Epoch: 4, step: 1110, loss: 0.32256945967674255, mean loss: 0.3979277195484949
Epoch: 4, step: 1111, loss: 0.42202532291412354, mean loss: 0.39793121803911125
Epoch: 4, step: 1112, loss: 0.3157038390636444, mean loss: 0.3979192819991961
Epoch: 4, step: 1113, loss: 0.3764743506908417, mean loss: 0.3979161695273081
Epoch: 4, step: 1114, loss: 0.33678770065307617, mean loss: 0.3979072987583523
Epoch: 4, step: 1115, loss: 0.3113701641559601, mean loss: 0.3978947425867617
Epoch: 4, step: 1116, loss: 0.38240575790405273, mean loss: 0.3978924955267468
Epoch: 4, step: 1117, loss: 0.349925696849823, mean loss: 0.39788553776656743
Epoch: 4, step: 1118, loss: 0.3498903512954712, mean loss: 0.3978785768983338
Epoch: 4, step: 1119, loss: 0.4187813103199005, mean loss: 0.39788160803717104
Epoch: 4, step: 1120, loss: 0.38833391666412354, mean loss: 0.39788022371190307
Epoch: 4, step: 1121, loss: 0.37275388836860657, mean loss: 0.39787658115821456
Epoch: 4, step: 1122, loss: 0.4091600775718689, mean loss: 0.3978782166845827
Epoch: 4, step: 1123, loss: 0.34135985374450684, mean loss: 0.3978700256174899
Epoch: 4, step: 1124, loss: 0.41287359595298767, mean loss: 0.3978721997328841
Epoch: 4, step: 1125, loss: 0.3466518223285675, mean loss: 0.3978647786408232
Epoch: 4, step: 1126, loss: 0.3517620265483856, mean loss: 0.3978580999863118
Epoch: 4, step: 1127, loss: 0.33503594994544983, mean loss: 0.39784900060189105
Epoch: 4, step: 1128, loss: 0.34877556562423706, mean loss: 0.3978418936598233
Epoch: 4, step: 1129, loss: 0.3472925126552582, mean loss: 0.39783457402747396
Epoch: 4, step: 1130, loss: 0.31776610016822815, mean loss: 0.3978229816611993
Epoch: 4, step: 1131, loss: 0.36354589462280273, mean loss: 0.39781801972040043
Epoch: 4, step: 1132, loss: 0.33569830656051636, mean loss: 0.39780902859098083
Epoch: 4, step: 1133, loss: 0.3391830325126648, mean loss: 0.3978005443657886
Epoch: 4, step: 1134, loss: 0.3403136730194092, mean loss: 0.39779222619600907
Epoch: 4, step: 1135, loss: 0.34291863441467285, mean loss: 0.3977842873083092
Epoch: 4, step: 1136, loss: 0.3299805819988251, mean loss: 0.3977744791634648
Epoch: 4, step: 1137, loss: 0.3512929081916809, mean loss: 0.39776775634440614
Epoch: 4, step: 1138, loss: 0.32530948519706726, mean loss: 0.39775727792486204
Epoch: 4, step: 1139, loss: 0.35520318150520325, mean loss: 0.3977511249323202
Epoch: 4, step: 1140, loss: 0.34304124116897583, mean loss: 0.3977432154507872
Epoch: 4, step: 1141, loss: 0.32602056860923767, mean loss: 0.3977328479100469
Epoch: 4, step: 1142, loss: 0.3580614924430847, mean loss: 0.3977271142266437
Epoch: 4, step: 1143, loss: 0.36212435364723206, mean loss: 0.3977219693190455
Epoch: 4, step: 1144, loss: 0.34339943528175354, mean loss: 0.3977141203761128
Epoch: 4, step: 1145, loss: 0.38997215032577515, mean loss: 0.39771300191756753
Epoch: 4, step: 1146, loss: 0.3719324469566345, mean loss: 0.39770927801825207
Epoch: 4, step: 1147, loss: 0.3800503611564636, mean loss: 0.3977067276258688
Epoch: 4, step: 1148, loss: 0.360628217458725, mean loss: 0.39770137332837174
Epoch: 4, step: 1149, loss: 0.32568296790122986, mean loss: 0.39769097506018997
Epoch: 4, step: 1150, loss: 0.3726867139339447, mean loss: 0.3976873653790688
Epoch: 4, step: 1151, loss: 0.3823760747909546, mean loss: 0.39768515531980375
Epoch: 4, step: 1152, loss: 0.338832825422287, mean loss: 0.3976766616944758
Epoch: 4, step: 1153, loss: 0.3750676214694977, mean loss: 0.39767339920670886
Epoch: 4, step: 1154, loss: 0.40413543581962585, mean loss: 0.39767433154498805
Epoch: 4, step: 1155, loss: 0.3428407311439514, mean loss: 0.3976664213314276
Epoch: 4, step: 1156, loss: 0.34423428773880005, mean loss: 0.3976587144031725
Epoch: 4, step: 1157, loss: 0.3692416846752167, mean loss: 0.39765461618717485
Epoch: 4, step: 1158, loss: 0.3825664818286896, mean loss: 0.39765244053694293
Epoch: 4, step: 1159, loss: 0.30329909920692444, mean loss: 0.39763883711402914
Epoch: 4, step: 1160, loss: 0.31014788150787354, mean loss: 0.39762622489612426
Epoch: 4, step: 1161, loss: 0.3606624901294708, mean loss: 0.3976208971741919
Epoch: 4, step: 1162, loss: 0.32133036851882935, mean loss: 0.39760990271841223
Epoch: 4, step: 1163, loss: 0.35707008838653564, mean loss: 0.39760406124660647
Epoch: 4, step: 1164, loss: 0.34737759828567505, mean loss: 0.397596825046785
Epoch: 4, step: 1165, loss: 0.33292585611343384, mean loss: 0.39758750914806223
Epoch: 4, step: 1166, loss: 0.38406428694725037, mean loss: 0.3975855613989335
Epoch: 4, step: 1167, loss: 0.36566612124443054, mean loss: 0.39758096470536286
Epoch: 4, step: 1168, loss: 0.39449718594551086, mean loss: 0.3975805206767437
Epoch: 4, step: 1169, loss: 0.36360594630241394, mean loss: 0.39757562943367225
Epoch: 4, step: 1170, loss: 0.3541378676891327, mean loss: 0.39756937669698816
Epoch: 4, step: 1171, loss: 0.3411746025085449, mean loss: 0.3975612600052512
Epoch: 4, step: 1172, loss: 0.346476286649704, mean loss: 0.3975539085916154
Epoch: 4, step: 1173, loss: 0.36528289318084717, mean loss: 0.39754926528004547
Epoch: 4, step: 1174, loss: 0.357132226228714, mean loss: 0.3975434507153711
Epoch: 4, step: 1175, loss: 0.3608205318450928, mean loss: 0.397538168362254
Epoch: 4, step: 1176, loss: 0.36373743414878845, mean loss: 0.39753330704566925
Epoch: 4, step: 1177, loss: 0.34852948784828186, mean loss: 0.39752626019217524
Epoch: 4, step: 1178, loss: 0.3731380105018616, mean loss: 0.39752275361421835
Epoch: 4, step: 1179, loss: 0.3779360353946686, mean loss: 0.39751993781228917
Epoch: 4, step: 1180, loss: 0.3648678660392761, mean loss: 0.3975152443996439
Epoch: 4, step: 1181, loss: 0.3226587772369385, mean loss: 0.39750448606863464
Epoch: 4, step: 1182, loss: 0.3850589692592621, mean loss: 0.3975026976627129
Epoch: 4, step: 1183, loss: 0.3310111165046692, mean loss: 0.39749314427461546
Epoch: 4, step: 1184, loss: 0.3700063228607178, mean loss: 0.3974891955860055
Epoch: 4, step: 1185, loss: 0.34025734663009644, mean loss: 0.3974809749814442
Epoch: 4, step: 1186, loss: 0.40136265754699707, mean loss: 0.3974815324541665
Epoch: 4, step: 1187, loss: 0.36623334884643555, mean loss: 0.3974770453514084
Epoch: 4, step: 1188, loss: 0.32304757833480835, mean loss: 0.3974663591393457
Epoch: 4, step: 1189, loss: 0.37101712822914124, mean loss: 0.3974625622356836
Epoch: 4, step: 1190, loss: 0.35314422845840454, mean loss: 0.3974562010567289
Epoch: 4, step: 1191, loss: 0.3327298164367676, mean loss: 0.39744691196593956
Epoch: 4, step: 1192, loss: 0.333326131105423, mean loss: 0.3974377111077303
Epoch: 4, step: 1193, loss: 0.38763153553009033, mean loss: 0.3974363041958827
Epoch: 4, step: 1194, loss: 0.34062546491622925, mean loss: 0.3974281545990846
Epoch: 4, step: 1195, loss: 0.390204519033432, mean loss: 0.3974271185067774
Epoch: 4, step: 1196, loss: 0.33648809790611267, mean loss: 0.3974183792237428
Epoch: 4, step: 1197, loss: 0.335436075925827, mean loss: 0.39740949159780387
Epoch: 4, step: 1198, loss: 0.37024280428886414, mean loss: 0.39740559673223985
Epoch: 4, step: 1199, loss: 0.338072270154953, mean loss: 0.39739709138152635
Epoch: 4, step: 1200, loss: 0.3550107777118683, mean loss: 0.3973910162326558
Epoch: 4, step: 1201, loss: 0.35847610235214233, mean loss: 0.39738543943215704
Epoch: 4, step: 1202, loss: 0.38888466358184814, mean loss: 0.3973842213814549
Epoch: 4, step: 1203, loss: 0.3573946952819824, mean loss: 0.39737849222298793
Epoch: 4, step: 1204, loss: 0.4411563277244568, mean loss: 0.3973847632207678
Epoch: 4, step: 1205, loss: 0.3825221359729767, mean loss: 0.3973826345144877
Epoch: 4, step: 1206, loss: 0.3436752259731293, mean loss: 0.39737494334900847
Epoch: 4, step: 1207, loss: 0.32687345147132874, mean loss: 0.3973648486336766
Epoch: 4, step: 1208, loss: 0.3562810719013214, mean loss: 0.3973589669190406
Epoch: 4, step: 1209, loss: 0.38139232993125916, mean loss: 0.39735668139986113
Epoch: 4, step: 1210, loss: 0.34686100482940674, mean loss: 0.39734945431004143
Epoch: 4, step: 1211, loss: 0.3546457290649414, mean loss: 0.3973433433018495
Epoch: 4, step: 1212, loss: 0.3435535728931427, mean loss: 0.3973356469546741
Epoch: 4, step: 1213, loss: 0.3263174891471863, mean loss: 0.3973254869893225
Epoch: 4, step: 1214, loss: 0.38949811458587646, mean loss: 0.3973243673537334
Epoch: 4, step: 1215, loss: 0.38565418124198914, mean loss: 0.3973226982767723
Epoch: 4, step: 1216, loss: 0.3994121551513672, mean loss: 0.39732299706940416
Epoch: 4, step: 1217, loss: 0.3498774766921997, mean loss: 0.39731621332328215
Epoch: 4, step: 1218, loss: 0.3430425226688385, mean loss: 0.3973084543968126
Epoch: 4, step: 1219, loss: 0.31756460666656494, mean loss: 0.39729705590514164
Epoch: 4, step: 1220, loss: 0.3313677906990051, mean loss: 0.39728763340046735
Epoch: 4, step: 1221, loss: 0.3579297959804535, mean loss: 0.39728200924536305
Epoch: 4, step: 1222, loss: 0.3328067362308502, mean loss: 0.39727279717606534
Epoch: 4, step: 1223, loss: 0.31008729338645935, mean loss: 0.3972603421040954
Epoch: 4, step: 1224, loss: 0.3310159742832184, mean loss: 0.39725087997471087
Epoch: 4, step: 1225, loss: 0.3452852666378021, mean loss: 0.3972434584361023
Epoch: 4, step: 1226, loss: 0.37090206146240234, mean loss: 0.3972396969914395
Epoch: 4, step: 1227, loss: 0.35021108388900757, mean loss: 0.39723298245501715
Epoch: 4, step: 1228, loss: 0.3314500153064728, mean loss: 0.39722359159603804
Epoch: 4, step: 1229, loss: 0.36395856738090515, mean loss: 0.3972188435195015
Epoch: 4, step: 1230, loss: 0.34725093841552734, mean loss: 0.3972117123784848
Epoch: 4, step: 1231, loss: 0.3552546501159668, mean loss: 0.3972057253547601
Epoch: 4, step: 1232, loss: 0.3358246684074402, mean loss: 0.39719696789193415
Epoch: 4, step: 1233, loss: 0.3465665876865387, mean loss: 0.3971897452984669
Epoch: 4, step: 1234, loss: 0.35392171144485474, mean loss: 0.3971835738487659
Epoch: 4, step: 1235, loss: 0.3649619221687317, mean loss: 0.3971789786331812
Epoch: 4, step: 1236, loss: 0.3647560775279999, mean loss: 0.3971743553762148
Epoch: 4, step: 1237, loss: 0.37728607654571533, mean loss: 0.3971715198645481
Epoch: 4, step: 1238, loss: 0.3620308041572571, mean loss: 0.3971665104966639
Epoch: 4, step: 1239, loss: 0.39974749088287354, mean loss: 0.39716687836730047
Epoch: 4, step: 1240, loss: 0.384236603975296, mean loss: 0.3971650356603898
Epoch: 4, step: 1241, loss: 0.4115898609161377, mean loss: 0.39716709106438747
Epoch: 4, step: 1242, loss: 0.35985806584358215, mean loss: 0.3971617756312459
Epoch: 4, step: 1243, loss: 0.35426148772239685, mean loss: 0.3971556644791221
Epoch: 4, step: 1244, loss: 0.3522327244281769, mean loss: 0.397149266111361
Epoch: 4, step: 1245, loss: 0.4375840723514557, mean loss: 0.39715502441472755
Epoch: 4, step: 1246, loss: 0.4058850407600403, mean loss: 0.397156267475577
Epoch: 4, step: 1247, loss: 0.3458707332611084, mean loss: 0.397148966004305
Epoch: 4, step: 1248, loss: 0.3348142206668854, mean loss: 0.39714009273094736
Epoch: 4, step: 1249, loss: 0.33016231656074524, mean loss: 0.3971305598849226
Epoch: 4, step: 1250, loss: 0.35455769300460815, mean loss: 0.39712450141518013
Epoch: 4, step: 1251, loss: 0.37478289008140564, mean loss: 0.3971213224721901
Epoch: 4, step: 1252, loss: 0.3474627137184143, mean loss: 0.3971142576537588
Epoch: 4, step: 1253, loss: 0.36150893568992615, mean loss: 0.3971091928853429
Epoch: 4, step: 1254, loss: 0.3385448753833771, mean loss: 0.39710086344180684
Epoch: 4, step: 1255, loss: 0.3738199472427368, mean loss: 0.3970975527313121
Epoch: 4, step: 1256, loss: 0.33712175488471985, mean loss: 0.3970890249625297
Epoch: 4, step: 1257, loss: 0.3864118456840515, mean loss: 0.3970875070240482
Epoch: 4, step: 1258, loss: 0.35793590545654297, mean loss: 0.3970819417644082
Epoch: 4, step: 1259, loss: 0.4089255630970001, mean loss: 0.39708362505339806
Epoch: 4, step: 1260, loss: 0.3101244866847992, mean loss: 0.3970712676371172
Epoch: 4, step: 1261, loss: 0.3201722502708435, mean loss: 0.3970603413771902
Epoch: 4, step: 1262, loss: 0.3567623198032379, mean loss: 0.39705461641319334
Epoch: 4, step: 1263, loss: 0.3478021025657654, mean loss: 0.39704762031747637
Epoch: 4, step: 1264, loss: 0.38221415877342224, mean loss: 0.3970455135909398
Epoch: 4, step: 1265, loss: 0.31589075922966003, mean loss: 0.39703398920094246
Epoch: 4, step: 1266, loss: 0.39157867431640625, mean loss: 0.3970332146283336
Epoch: 4, step: 1267, loss: 0.32417407631874084, mean loss: 0.3970228711958649
Epoch: 4, step: 1268, loss: 0.337218314409256, mean loss: 0.3970143822594864
Epoch: 4, step: 1269, loss: 0.37250304222106934, mean loss: 0.39701090349990104
Epoch: 4, step: 1270, loss: 0.3574475347995758, mean loss: 0.3970052892855261
Epoch: 4, step: 1271, loss: 0.3561112582683563, mean loss: 0.39699948706773136
Epoch: 4, step: 1272, loss: 0.3616446554660797, mean loss: 0.3969944714865707
Epoch: 4, step: 1273, loss: 0.32850754261016846, mean loss: 0.39698475702857405
Epoch: 4, step: 1274, loss: 0.33109861612319946, mean loss: 0.39697541280209475
Epoch: 4, step: 1275, loss: 0.32624945044517517, mean loss: 0.3969653835958615
Epoch: 4, step: 1276, loss: 0.35176461935043335, mean loss: 0.3969589748670588
Epoch: 4, step: 1277, loss: 0.3408212661743164, mean loss: 0.39695101658683585
Epoch: 4, step: 1278, loss: 0.34097546339035034, mean loss: 0.3969430824191255
Epoch: 4, step: 1279, loss: 0.3430529832839966, mean loss: 0.3969354449334204
Epoch: 4, step: 1280, loss: 0.3539045751094818, mean loss: 0.3969293473183115
Epoch: 4, step: 1281, loss: 0.3872746527194977, mean loss: 0.3969279794103207
Epoch: 4, step: 1282, loss: 0.34017717838287354, mean loss: 0.39691993991449587
Epoch: 4, step: 1283, loss: 0.3390682637691498, mean loss: 0.39691174562609
Epoch: 4, step: 1284, loss: 0.33502188324928284, mean loss: 0.3969029805981369
Epoch: 4, step: 1285, loss: 0.3631937503814697, mean loss: 0.39689820727185304
Epoch: 4, step: 1286, loss: 0.3724658489227295, mean loss: 0.39689474806778263
Epoch: 4, step: 1287, loss: 0.34410813450813293, mean loss: 0.39688727544411906
Epoch: 4, step: 1288, loss: 0.32163089513778687, mean loss: 0.3968766234440757
Epoch: 4, step: 1289, loss: 0.3382222354412079, mean loss: 0.3968683225117232
Epoch: 4, step: 1290, loss: 0.3478136658668518, mean loss: 0.3968613811424513
Epoch: 4, step: 1291, loss: 0.33066508173942566, mean loss: 0.3968520155086931
Epoch: 4, step: 1292, loss: 0.3804973065853119, mean loss: 0.3968497019270092
Epoch: 4, step: 1293, loss: 0.37449780106544495, mean loss: 0.39684654041345024
Epoch: 4, step: 1294, loss: 0.34335336089134216, mean loss: 0.3968389752629026
Epoch: 4, step: 1295, loss: 0.3454907238483429, mean loss: 0.3968317144807456
Epoch: 4, step: 1296, loss: 0.32206377387046814, mean loss: 0.3968211435857067
Epoch: 4, step: 1297, loss: 0.30926331877708435, mean loss: 0.39680876617196503
Epoch: 4, step: 1298, loss: 0.3396594524383545, mean loss: 0.3968006885304479
Epoch: 4, step: 1299, loss: 0.34323152899742126, mean loss: 0.39679311798783445
Epoch: 4, step: 1300, loss: 0.3926510214805603, mean loss: 0.39679253269795073
Epoch: 4, step: 1301, loss: 0.39855819940567017, mean loss: 0.39679278215637226
Epoch: 4, step: 1302, loss: 0.3477884829044342, mean loss: 0.3967858596674258
Epoch: 4, step: 1303, loss: 0.35657376050949097, mean loss: 0.3967801799924035
Epoch: 4, step: 1304, loss: 0.3579256534576416, mean loss: 0.3967746928399484
Epoch: 4, step: 1305, loss: 0.3962130546569824, mean loss: 0.39677461353492394
Epoch: 4, step: 1306, loss: 0.32622453570365906, mean loss: 0.39676465305520753
Epoch: 4, step: 1307, loss: 0.34602057933807373, mean loss: 0.39675748986015996
Epoch: 4, step: 1308, loss: 0.29913225769996643, mean loss: 0.39674371071659464
Epoch: 4, step: 1309, loss: 0.33337804675102234, mean loss: 0.3967347683423404
Epoch: 4, step: 1310, loss: 0.3137566149234772, mean loss: 0.39672305984037637
Epoch: 4, step: 1311, loss: 0.3639582693576813, mean loss: 0.39671843726835565
Epoch: 4, step: 1312, loss: 0.4102332890033722, mean loss: 0.396720343722261
Epoch: 4, step: 1313, loss: 0.35031893849372864, mean loss: 0.3967137990952894
Epoch: 4, step: 1314, loss: 0.33408018946647644, mean loss: 0.3967049662635832
Epoch: 4, step: 1315, loss: 0.34161290526390076, mean loss: 0.3966971980654727
Epoch: 4, step: 1316, loss: 0.3279472887516022, mean loss: 0.396687505423528
Epoch: 4, step: 1317, loss: 0.34729698300361633, mean loss: 0.39668054312828976
Epoch: 4, step: 1318, loss: 0.3468717038631439, mean loss: 0.3966735228549613
Epoch: 4, step: 1319, loss: 0.39025282859802246, mean loss: 0.39667261802206155
Epoch: 4, step: 1320, loss: 0.3526299297809601, mean loss: 0.39666641220435817
Epoch: 4, step: 1321, loss: 0.3496273458003998, mean loss: 0.3966597851169527
Epoch: 4, step: 1322, loss: 0.301342248916626, mean loss: 0.39664635822074196
Epoch: 4, step: 1323, loss: 0.3618755340576172, mean loss: 0.39664146092156405
Epoch: 4, step: 1324, loss: 0.3480513095855713, mean loss: 0.3966346182020406
Epoch: 4, step: 1325, loss: 0.34688764810562134, mean loss: 0.39662761355967274
Epoch: 4, step: 1326, loss: 0.37037327885627747, mean loss: 0.39662391732784064
Epoch: 4, step: 1327, loss: 0.3534110188484192, mean loss: 0.3966178344310952
Epoch: 4, step: 1328, loss: 0.35950830578804016, mean loss: 0.3966126114151004
Epoch: 4, step: 1329, loss: 0.36953017115592957, mean loss: 0.3966088002076336
Epoch: 4, step: 1330, loss: 0.3342450261116028, mean loss: 0.3966000252288668
Epoch: 4, step: 1331, loss: 0.3169211149215698, mean loss: 0.39658881547783875
Epoch: 4, step: 1332, loss: 0.3690204918384552, mean loss: 0.3965849375310615
Epoch: 4, step: 1333, loss: 0.33073490858078003, mean loss: 0.3965756759236142
Epoch: 4, step: 1334, loss: 0.33407315611839294, mean loss: 0.3965668863694298
Epoch: 4, step: 1335, loss: 0.3492375910282135, mean loss: 0.3965602315191288
Epoch: 4, step: 1336, loss: 0.3234579563140869, mean loss: 0.3965499542415799
Epoch: 4, step: 1337, loss: 0.3362603485584259, mean loss: 0.39654147945866125
Epoch: 4, step: 1338, loss: 0.3444852828979492, mean loss: 0.396534163057177
Epoch: 4, step: 1339, loss: 0.35110539197921753, mean loss: 0.3965277790252661
Epoch: 4, step: 1340, loss: 0.33028465509414673, mean loss: 0.3965184712939283
Epoch: 4, step: 1341, loss: 0.3945665955543518, mean loss: 0.39651819707705005
Epoch: 4, step: 1342, loss: 0.3542531132698059, mean loss: 0.3965122601359337
Epoch: 4, step: 1343, loss: 0.35867202281951904, mean loss: 0.3965069454958612
Epoch: 4, step: 1344, loss: 0.3392808735370636, mean loss: 0.39649890925488956
Epoch: 4, step: 1345, loss: 0.3289232552051544, mean loss: 0.39648942095749423
Epoch: 4, step: 1346, loss: 0.36888957023620605, mean loss: 0.3964855462065857
Epoch: 4, step: 1347, loss: 0.3282075822353363, mean loss: 0.3964759619892961
Epoch: 4, step: 1348, loss: 0.38249948620796204, mean loss: 0.3964740003786601
Epoch: 4, step: 1349, loss: 0.3111141622066498, mean loss: 0.3964620217317092
Epoch: 4, step: 1350, loss: 0.3384886682033539, mean loss: 0.3964538874040077
Epoch: 4, step: 1351, loss: 0.34617191553115845, mean loss: 0.39644683325531627
Epoch: 4, step: 1352, loss: 0.3126791715621948, mean loss: 0.396435082987159
Epoch: 4, step: 1353, loss: 0.4340905547142029, mean loss: 0.396440364259491
Epoch: 4, step: 1354, loss: 0.38200998306274414, mean loss: 0.39643834064692657
Epoch: 4, step: 1355, loss: 0.38836371898651123, mean loss: 0.3964372084789989
Epoch: 4, step: 1356, loss: 0.349062979221344, mean loss: 0.39643056692155354
Epoch: 4, step: 1357, loss: 0.3385254740715027, mean loss: 0.39642245014375005
Epoch: 4, step: 1358, loss: 0.3459898829460144, mean loss: 0.39641538180917435
Epoch: 4, step: 1359, loss: 0.36924096941947937, mean loss: 0.39641157373568925
Epoch: 4, step: 1360, loss: 0.33474159240722656, mean loss: 0.3964029328527793
Epoch: 4, step: 1361, loss: 0.3814340829849243, mean loss: 0.39640083578779356
Epoch: 4, step: 1362, loss: 0.3164573311805725, mean loss: 0.3963896376501542
Epoch: 4, step: 1363, loss: 0.3530486822128296, mean loss: 0.39638356748832826
Epoch: 4, step: 1364, loss: 0.34330660104751587, mean loss: 0.3963761347805225
Epoch: 4, step: 1365, loss: 0.34265899658203125, mean loss: 0.3963686134786185
Epoch: 4, step: 1366, loss: 0.4102102220058441, mean loss: 0.3963705512650566
Epoch: 4, step: 1367, loss: 0.3667505383491516, mean loss: 0.3963664051266305
Epoch: 4, step: 1368, loss: 0.3763265609741211, mean loss: 0.3963636003898702
Epoch: 4, step: 1369, loss: 0.3603513836860657, mean loss: 0.3963585608969085
Epoch: 4, step: 1370, loss: 0.33048757910728455, mean loss: 0.39634934430508123
Epoch: 4, step: 1371, loss: 0.39750927686691284, mean loss: 0.3963495065788028
Epoch: 4, step: 1372, loss: 0.3462957739830017, mean loss: 0.3963425050775305
Epoch: 4, step: 1373, loss: 0.33458372950553894, mean loss: 0.3963338674865414
Epoch: 4, step: 1374, loss: 0.37908828258514404, mean loss: 0.39633145585391644
Epoch: 4, step: 1375, loss: 0.3348367214202881, mean loss: 0.39632285759686475
Epoch: 4, step: 1376, loss: 0.3534398078918457, mean loss: 0.39631686248296777
Epoch: 4, step: 1377, loss: 0.35485368967056274, mean loss: 0.3963110666802263
Epoch: 4, step: 1378, loss: 0.3385727107524872, mean loss: 0.39630299702880384
Epoch: 4, step: 1379, loss: 0.3548722565174103, mean loss: 0.39629720737808954
Epoch: 4, step: 1380, loss: 0.3249553143978119, mean loss: 0.396287239249966
Epoch: 4, step: 1381, loss: 0.34871697425842285, mean loss: 0.3962805935018532
Epoch: 4, step: 1382, loss: 0.3418629765510559, mean loss: 0.3962729922143897
Epoch: 4, step: 1383, loss: 0.3766275942325592, mean loss: 0.3962702484437219
Epoch: 4, step: 1384, loss: 0.378695547580719, mean loss: 0.396267794219331
Epoch: 4, step: 1385, loss: 0.39829182624816895, mean loss: 0.396268076826428
Epoch: 4, step: 1386, loss: 0.29360347986221313, mean loss: 0.3962537442008571
Epoch: 4, step: 1387, loss: 0.32624760270118713, mean loss: 0.3962439722659744
Epoch: 4, step: 1388, loss: 0.31074321269989014, mean loss: 0.3962320391522876
Epoch: 4, step: 1389, loss: 0.3666509687900543, mean loss: 0.39622791117707656
Epoch: 4, step: 1390, loss: 0.38241344690322876, mean loss: 0.3962259836670621
Epoch: 4, step: 1391, loss: 0.34388813376426697, mean loss: 0.3962186820696984
Epoch: 4, step: 1392, loss: 0.340677946805954, mean loss: 0.3962109347220539
Epoch: 4, step: 1393, loss: 0.3233693838119507, mean loss: 0.39620077550993255
Epoch: 4, step: 1394, loss: 0.3758591115474701, mean loss: 0.39619793885340454
Epoch: 4, step: 1395, loss: 0.312678724527359, mean loss: 0.39618629367572383
Epoch: 4, step: 1396, loss: 0.3515855371952057, mean loss: 0.3961800758092132
Epoch: 4, step: 1397, loss: 0.36720559000968933, mean loss: 0.39617603699045106
Epoch: 4, step: 1398, loss: 0.36317917704582214, mean loss: 0.39617143812495353
Epoch: 4, step: 1399, loss: 0.35333070158958435, mean loss: 0.3961654681226493
Epoch: 4, step: 1400, loss: 0.3387340009212494, mean loss: 0.39615746596754253
Epoch: 4, step: 1401, loss: 0.3481042683124542, mean loss: 0.39615077145686334
Epoch: 4, step: 1402, loss: 0.3703860938549042, mean loss: 0.39614718256180803
Epoch: 4, step: 1403, loss: 0.3312584161758423, mean loss: 0.39613814512916373
Epoch: 4, step: 1404, loss: 0.3605726659297943, mean loss: 0.3961331924095983
Epoch: 4, step: 1405, loss: 0.3879033029079437, mean loss: 0.39613204650462736
Epoch: 4, step: 1406, loss: 0.3643421530723572, mean loss: 0.3961276207920515
Epoch: 4, step: 1407, loss: 0.3329072892665863, mean loss: 0.3961188206345452
Epoch: 4, step: 1408, loss: 0.33484724164009094, mean loss: 0.3961102929269607
Epoch: 4, step: 1409, loss: 0.32300058007240295, mean loss: 0.39610011901757375
Epoch: 4, step: 1410, loss: 0.3512331545352936, mean loss: 0.3960938762230166
Epoch: 4, step: 1411, loss: 0.3826916515827179, mean loss: 0.3960920116953816
Epoch: 4, step: 1412, loss: 0.3559989035129547, mean loss: 0.39608643468770566
Epoch: 4, step: 1413, loss: 0.33980435132980347, mean loss: 0.39607860685970037
Epoch: 4, step: 1414, loss: 0.3455599546432495, mean loss: 0.3960715815986495
Epoch: 4, step: 1415, loss: 0.35230329632759094, mean loss: 0.39606549590826146
Epoch: 4, step: 1416, loss: 0.316305011510849, mean loss: 0.396054407282598
Epoch: 4, step: 1417, loss: 0.3213178515434265, mean loss: 0.39604401854813326
Epoch: 4, step: 1418, loss: 0.39128103852272034, mean loss: 0.3960433565634181
Epoch: 4, step: 1419, loss: 0.4169679582118988, mean loss: 0.39604626437354157
Epoch: 4, step: 1420, loss: 0.3537602722644806, mean loss: 0.3960403888709559
Epoch: 4, step: 1421, loss: 0.3421725034713745, mean loss: 0.39603290514139217
Epoch: 4, step: 1422, loss: 0.35627931356430054, mean loss: 0.3960273830422705
Epoch: 4, step: 1423, loss: 0.33687472343444824, mean loss: 0.39601916739510273
Epoch: 4, step: 1424, loss: 0.3485294282436371, mean loss: 0.39601257251395405
Epoch: 4, step: 1425, loss: 0.4038445055484772, mean loss: 0.3960136599803571
Epoch: 4, step: 1426, loss: 0.34914344549179077, mean loss: 0.39600715293961175
Epoch: 4, step: 1427, loss: 0.380662739276886, mean loss: 0.3960050229543726
Epoch: 4, step: 1428, loss: 0.32901158928871155, mean loss: 0.3959957247678819
Epoch: 4, step: 1429, loss: 0.35127976536750793, mean loss: 0.3959895193891142
Epoch: 4, step: 1430, loss: 0.3547400236129761, mean loss: 0.3959837958570237
Epoch: 4, step: 1431, loss: 0.3453357219696045, mean loss: 0.39597676920970304
Epoch: 4, step: 1432, loss: 0.3629860281944275, mean loss: 0.3959721928827485
Epoch: 4, step: 1433, loss: 0.39468690752983093, mean loss: 0.3959720146184832
Epoch: 4, step: 1434, loss: 0.40045204758644104, mean loss: 0.39597263589611015
Epoch: 4, step: 1435, loss: 0.32475945353507996, mean loss: 0.39596276163344224
Epoch: 4, step: 1436, loss: 0.33107322454452515, mean loss: 0.3959537654408609
Epoch: 4, step: 1437, loss: 0.3502367436885834, mean loss: 0.395947428176964
Epoch: 4, step: 1438, loss: 0.3636523187160492, mean loss: 0.3959429520703166
Epoch: 4, step: 1439, loss: 0.34222573041915894, mean loss: 0.39593550788771525
Epoch: 4, step: 1440, loss: 0.3600027859210968, mean loss: 0.3959305289876229
Epoch: 4, step: 1441, loss: 0.39215970039367676, mean loss: 0.3959300065674796
Epoch: 4, step: 1442, loss: 0.3123023808002472, mean loss: 0.39591842218934314
Epoch: 4, step: 1443, loss: 0.3009535074234009, mean loss: 0.395905269154057
Valid: 4, mean loss: 0.2208336740732193
Epoch: 5, step: 0, loss: 0.3542100489139557, mean loss: 0.3958994949925503
Epoch: 5, step: 1, loss: 0.32937315106391907, mean loss: 0.39589028336918713
Epoch: 5, step: 2, loss: 0.3587166666984558, mean loss: 0.3958851368072779
Epoch: 5, step: 3, loss: 0.33493903279304504, mean loss: 0.39587670019265797
Epoch: 5, step: 4, loss: 0.35668516159057617, mean loss: 0.3958712757582494
Epoch: 5, step: 5, loss: 0.38787761330604553, mean loss: 0.3958701695220949
Epoch: 5, step: 6, loss: 0.3703968822956085, mean loss: 0.39586664478330613
Epoch: 5, step: 7, loss: 0.34352290630340576, mean loss: 0.39585940298218825
Epoch: 5, step: 8, loss: 0.34626734256744385, mean loss: 0.39585254282719934
Epoch: 5, step: 9, loss: 0.3277011215686798, mean loss: 0.39584311662785515
Epoch: 5, step: 10, loss: 0.3624115288257599, mean loss: 0.3958384932579475
Epoch: 5, step: 11, loss: 0.4353070855140686, mean loss: 0.39584395075134576
Epoch: 5, step: 12, loss: 0.3400671184062958, mean loss: 0.39583623931316725
Epoch: 5, step: 13, loss: 0.4347209632396698, mean loss: 0.3958416145860352
Epoch: 5, step: 14, loss: 0.35099685192108154, mean loss: 0.3958354162774429
Epoch: 5, step: 15, loss: 0.33608561754226685, mean loss: 0.3958271589807686
Epoch: 5, step: 16, loss: 0.3296639621257782, mean loss: 0.3958180166293999
Epoch: 5, step: 17, loss: 0.3127255141735077, mean loss: 0.3958065365931391
Epoch: 5, step: 18, loss: 0.3934532701969147, mean loss: 0.39580621151144324
Epoch: 5, step: 19, loss: 0.47751957178115845, mean loss: 0.3958174978871711
Epoch: 5, step: 20, loss: 0.33359089493751526, mean loss: 0.39580890423947745
Epoch: 5, step: 21, loss: 0.33352139592170715, mean loss: 0.3958003033684035
Epoch: 5, step: 22, loss: 0.372976154088974, mean loss: 0.39579715216734324
Epoch: 5, step: 23, loss: 0.3850620687007904, mean loss: 0.3957956702397526
Epoch: 5, step: 24, loss: 0.3497683107852936, mean loss: 0.39578931725708116
Epoch: 5, step: 25, loss: 0.4083651900291443, mean loss: 0.3957910528177729
Epoch: 5, step: 26, loss: 0.38791343569755554, mean loss: 0.3957899658000938
Epoch: 5, step: 27, loss: 0.40119296312332153, mean loss: 0.39579071124674436
Epoch: 5, step: 28, loss: 0.36627277731895447, mean loss: 0.3957866392459266
Epoch: 5, step: 29, loss: 0.33485379815101624, mean loss: 0.3957782347161204
Epoch: 5, step: 30, loss: 0.37197405099868774, mean loss: 0.3957749518332467
Epoch: 5, step: 31, loss: 0.339085191488266, mean loss: 0.3957671347124048
Epoch: 5, step: 32, loss: 0.40996041893959045, mean loss: 0.3957690915970356
Epoch: 5, step: 33, loss: 0.3570307493209839, mean loss: 0.395763751323769
Epoch: 5, step: 34, loss: 0.3332110643386841, mean loss: 0.3957551293131577
Epoch: 5, step: 35, loss: 0.32612839341163635, mean loss: 0.3957455335667545
Epoch: 5, step: 36, loss: 0.33947837352752686, mean loss: 0.39573778006530225
Epoch: 5, step: 37, loss: 0.36544468998908997, mean loss: 0.3957336063135695
Epoch: 5, step: 38, loss: 0.34977683424949646, mean loss: 0.395727275307637
Epoch: 5, step: 39, loss: 0.34569883346557617, mean loss: 0.3957203843376863
Epoch: 5, step: 40, loss: 0.32461029291152954, mean loss: 0.3957105909082102
Epoch: 5, step: 41, loss: 0.36715927720069885, mean loss: 0.3957066593034584
Epoch: 5, step: 42, loss: 0.3446449637413025, mean loss: 0.3956996289171769
Epoch: 5, step: 43, loss: 0.3627530634403229, mean loss: 0.39569509332170927
Epoch: 5, step: 44, loss: 0.36815980076789856, mean loss: 0.39569130319197027
Epoch: 5, step: 45, loss: 0.3420381546020508, mean loss: 0.39568391905371125
Epoch: 5, step: 46, loss: 0.3314915895462036, mean loss: 0.3956750856521002
Epoch: 5, step: 47, loss: 0.31723180413246155, mean loss: 0.39566429268546294
Epoch: 5, step: 48, loss: 0.38210350275039673, mean loss: 0.39566242712074495
Epoch: 5, step: 49, loss: 0.33179789781570435, mean loss: 0.39565364245371537
Epoch: 5, step: 50, loss: 0.32811495661735535, mean loss: 0.39564435367832873
Epoch: 5, step: 51, loss: 0.3682185113430023, mean loss: 0.3956405822478646
Epoch: 5, step: 52, loss: 0.3291648328304291, mean loss: 0.3956314421750724
Epoch: 5, step: 53, loss: 0.3316293954849243, mean loss: 0.3956226434334323
Epoch: 5, step: 54, loss: 0.32359743118286133, mean loss: 0.39561274306061434
Epoch: 5, step: 55, loss: 0.34045231342315674, mean loss: 0.3956051619130556
Epoch: 5, step: 56, loss: 0.3560234308242798, mean loss: 0.3955997226206152
Epoch: 5, step: 57, loss: 0.3383149802684784, mean loss: 0.3955918516749774
Epoch: 5, step: 58, loss: 0.3415178656578064, mean loss: 0.39558442290921053
Epoch: 5, step: 59, loss: 0.3645791709423065, mean loss: 0.39558016394602824
Epoch: 5, step: 60, loss: 0.31060105562210083, mean loss: 0.3955684925947957
Epoch: 5, step: 61, loss: 0.3559785485267639, mean loss: 0.3955630559092604
Epoch: 5, step: 62, loss: 0.3456072509288788, mean loss: 0.39555619667474434
Epoch: 5, step: 63, loss: 0.3796360194683075, mean loss: 0.3955540110381152
Epoch: 5, step: 64, loss: 0.36256393790245056, mean loss: 0.39554948254489136
Epoch: 5, step: 65, loss: 0.3505048453807831, mean loss: 0.39554330019007883
Epoch: 5, step: 66, loss: 0.32343295216560364, mean loss: 0.3955334044376396
Epoch: 5, step: 67, loss: 0.35471153259277344, mean loss: 0.39552780319287495
Epoch: 5, step: 68, loss: 0.3327397108078003, mean loss: 0.3955191891041954
Epoch: 5, step: 69, loss: 0.35612601041793823, mean loss: 0.3955137853759806
Epoch: 5, step: 70, loss: 0.3392561376094818, mean loss: 0.3955060693359632
Epoch: 5, step: 71, loss: 0.3650120496749878, mean loss: 0.39550188749015125
Epoch: 5, step: 72, loss: 0.35069194436073303, mean loss: 0.3954957432500403
Epoch: 5, step: 73, loss: 0.3411177694797516, mean loss: 0.3954882880850046
Epoch: 5, step: 74, loss: 0.3652251958847046, mean loss: 0.3954841396145179
Epoch: 5, step: 75, loss: 0.3713553249835968, mean loss: 0.39548083248531957
Epoch: 5, step: 76, loss: 0.3483154773712158, mean loss: 0.39547436882146947
Epoch: 5, step: 77, loss: 0.3501622974872589, mean loss: 0.39546815998735957
Epoch: 5, step: 78, loss: 0.3503434360027313, mean loss: 0.395461977671428
Epoch: 5, step: 79, loss: 0.3869139850139618, mean loss: 0.39546080671352973
Epoch: 5, step: 80, loss: 0.33238428831100464, mean loss: 0.3954521672780548
Epoch: 5, step: 81, loss: 0.2981427311897278, mean loss: 0.3954388408693876
Epoch: 5, step: 82, loss: 0.36227545142173767, mean loss: 0.39543429980551686
Epoch: 5, step: 83, loss: 0.3591247797012329, mean loss: 0.3954293286225891
Epoch: 5, step: 84, loss: 0.3546268939971924, mean loss: 0.3954237430737013
Epoch: 5, step: 85, loss: 0.3334863781929016, mean loss: 0.39541526547106226
Epoch: 5, step: 86, loss: 0.38901397585868835, mean loss: 0.3954143894221212
Epoch: 5, step: 87, loss: 0.3375277817249298, mean loss: 0.3954064684303728
Epoch: 5, step: 88, loss: 0.3989771604537964, mean loss: 0.3954069569639647
Epoch: 5, step: 89, loss: 0.31678006052970886, mean loss: 0.3953962008905811
Epoch: 5, step: 90, loss: 0.3406643867492676, mean loss: 0.3953887146624124
Epoch: 5, step: 91, loss: 0.39157620072364807, mean loss: 0.3953881932573332
Epoch: 5, step: 92, loss: 0.3633294403553009, mean loss: 0.3953838094541195
Epoch: 5, step: 93, loss: 0.3552241325378418, mean loss: 0.3953783186588069
Epoch: 5, step: 94, loss: 0.3637290298938751, mean loss: 0.3953739920301309
Epoch: 5, step: 95, loss: 0.3043919503688812, mean loss: 0.39536155599381856
Epoch: 5, step: 96, loss: 0.3377915918827057, mean loss: 0.3953536880200436
Epoch: 5, step: 97, loss: 0.39560937881469727, mean loss: 0.39535372296002647
Epoch: 5, step: 98, loss: 0.3393644690513611, mean loss: 0.3953460731097862
Epoch: 5, step: 99, loss: 0.39644959568977356, mean loss: 0.395346223864237
Epoch: 5, step: 100, loss: 0.3865934908390045, mean loss: 0.39534502829901025
Epoch: 5, step: 101, loss: 0.32328447699546814, mean loss: 0.39533518665037554
Epoch: 5, step: 102, loss: 0.3465685248374939, mean loss: 0.39532852726736134
Epoch: 5, step: 103, loss: 0.3063909709453583, mean loss: 0.39531638396365815
Epoch: 5, step: 104, loss: 0.31378933787345886, mean loss: 0.3953052539914957
Epoch: 5, step: 105, loss: 0.31510916352272034, mean loss: 0.39529430721419995
Epoch: 5, step: 106, loss: 0.4025759994983673, mean loss: 0.3952953010305346
Epoch: 5, step: 107, loss: 0.3824172616004944, mean loss: 0.39529354365615826
Epoch: 5, step: 108, loss: 0.36703306436538696, mean loss: 0.395289687675903
Epoch: 5, step: 109, loss: 0.3802708089351654, mean loss: 0.3952876387156382
Epoch: 5, step: 110, loss: 0.36523833870887756, mean loss: 0.39528353977961217
Epoch: 5, step: 111, loss: 0.3288690745830536, mean loss: 0.39527448161469175
Epoch: 5, step: 112, loss: 0.35198691487312317, mean loss: 0.395268578496358
Epoch: 5, step: 113, loss: 0.37408751249313354, mean loss: 0.39526569043172705
Epoch: 5, step: 114, loss: 0.3251075744628906, mean loss: 0.3952561255897408
Epoch: 5, step: 115, loss: 0.3332001864910126, mean loss: 0.3952476664922628
Epoch: 5, step: 116, loss: 0.32847270369529724, mean loss: 0.3952385653660808
Epoch: 5, step: 117, loss: 0.4109586775302887, mean loss: 0.3952407076544652
Epoch: 5, step: 118, loss: 0.3346770107746124, mean loss: 0.3952324553453114
Epoch: 5, step: 119, loss: 0.36296284198760986, mean loss: 0.3952280589402218
Epoch: 5, step: 120, loss: 0.3505140244960785, mean loss: 0.3952219679397526
Epoch: 5, step: 121, loss: 0.3368310332298279, mean loss: 0.3952140149385663
Epoch: 5, step: 122, loss: 0.3656322956085205, mean loss: 0.39520998637812366
Epoch: 5, step: 123, loss: 0.36037206649780273, mean loss: 0.3952052426526498
Epoch: 5, step: 124, loss: 0.3431043326854706, mean loss: 0.39519814926803887
Epoch: 5, step: 125, loss: 0.37577831745147705, mean loss: 0.3951955056753603
Epoch: 5, step: 126, loss: 0.3712877333164215, mean loss: 0.3951922515890177
Epoch: 5, step: 127, loss: 0.3766942024230957, mean loss: 0.3951897341626206
Epoch: 5, step: 128, loss: 0.349384605884552, mean loss: 0.39518350132437347
Epoch: 5, step: 129, loss: 0.34378209710121155, mean loss: 0.3951765079360438
Epoch: 5, step: 130, loss: 0.36542779207229614, mean loss: 0.3951724610423064
Epoch: 5, step: 131, loss: 0.3814082145690918, mean loss: 0.3951705888651474
Epoch: 5, step: 132, loss: 0.3362395763397217, mean loss: 0.3951625743115604
Epoch: 5, step: 133, loss: 0.35954275727272034, mean loss: 0.39515773071392113
Epoch: 5, step: 134, loss: 0.3987744152545929, mean loss: 0.3951582224453339
Epoch: 5, step: 135, loss: 0.3789909780025482, mean loss: 0.3951560246143873
Epoch: 5, step: 136, loss: 0.36049893498420715, mean loss: 0.39515131385053925
Epoch: 5, step: 137, loss: 0.31743937730789185, mean loss: 0.3951407522935207
Epoch: 5, step: 138, loss: 0.3350983262062073, mean loss: 0.3951325932466275
Epoch: 5, step: 139, loss: 0.34111282229423523, mean loss: 0.39512525360383505
Epoch: 5, step: 140, loss: 0.3875477612018585, mean loss: 0.39512422419310256
Epoch: 5, step: 141, loss: 0.34293898940086365, mean loss: 0.39511713573415225
Epoch: 5, step: 142, loss: 0.37221527099609375, mean loss: 0.3951140253355731
Epoch: 5, step: 143, loss: 0.32435712218284607, mean loss: 0.39510441684790976
Epoch: 5, step: 144, loss: 0.3909265697002411, mean loss: 0.39510384959099903
Epoch: 5, step: 145, loss: 0.3429775536060333, mean loss: 0.3950967729828012
Epoch: 5, step: 146, loss: 0.3898453414440155, mean loss: 0.39509606015104626
Epoch: 5, step: 147, loss: 0.3526711165904999, mean loss: 0.3950903021511059
Epoch: 5, step: 148, loss: 0.3308660686016083, mean loss: 0.39508158668991045
Epoch: 5, step: 149, loss: 0.3821744918823242, mean loss: 0.395079835388037
Epoch: 5, step: 150, loss: 0.37241077423095703, mean loss: 0.3950767599489979
Epoch: 5, step: 151, loss: 0.35861730575561523, mean loss: 0.3950718142823954
Epoch: 5, step: 152, loss: 0.41201159358024597, mean loss: 0.39507411182468455
Epoch: 5, step: 153, loss: 0.3414345383644104, mean loss: 0.3950668376758562
Epoch: 5, step: 154, loss: 0.3230104148387909, mean loss: 0.39505706731343765
Epoch: 5, step: 155, loss: 0.3282741904258728, mean loss: 0.3950480132357685
Epoch: 5, step: 156, loss: 0.3314087688922882, mean loss: 0.395039386525135
Epoch: 5, step: 157, loss: 0.36481863260269165, mean loss: 0.39503529046198477
Epoch: 5, step: 158, loss: 0.36480391025543213, mean loss: 0.39503119351386085
Epoch: 5, step: 159, loss: 0.33180296421051025, mean loss: 0.3950226260031151
Epoch: 5, step: 160, loss: 0.33676543831825256, mean loss: 0.39501473314473756
Epoch: 5, step: 161, loss: 0.33755627274513245, mean loss: 0.39500694955487037
Epoch: 5, step: 162, loss: 0.35610660910606384, mean loss: 0.3950016806478612
Epoch: 5, step: 163, loss: 0.3744205832481384, mean loss: 0.39499889339198363
Epoch: 5, step: 164, loss: 0.3799966871738434, mean loss: 0.3949968619490292
Epoch: 5, step: 165, loss: 0.3516574501991272, mean loss: 0.3949909941705632
Epoch: 5, step: 166, loss: 0.33179619908332825, mean loss: 0.3949824393045706
Epoch: 5, step: 167, loss: 0.37587738037109375, mean loss: 0.3949798533464042
Epoch: 5, step: 168, loss: 0.31991857290267944, mean loss: 0.39496969482963007
Epoch: 5, step: 169, loss: 0.4081822335720062, mean loss: 0.39497148272391186
Epoch: 5, step: 170, loss: 0.3752681612968445, mean loss: 0.3949688168706542
Epoch: 5, step: 171, loss: 0.3741186261177063, mean loss: 0.3949659962279658
Epoch: 5, step: 172, loss: 0.32189056277275085, mean loss: 0.3949561118192744
Epoch: 5, step: 173, loss: 0.35061004757881165, mean loss: 0.3949501142449925
Epoch: 5, step: 174, loss: 0.33791789412498474, mean loss: 0.3949424019772278
Epoch: 5, step: 175, loss: 0.3581973910331726, mean loss: 0.39493743374967993
Epoch: 5, step: 176, loss: 0.3578433096408844, mean loss: 0.394932418997198
Epoch: 5, step: 177, loss: 0.32934603095054626, mean loss: 0.39492355357572645
Epoch: 5, step: 178, loss: 0.36838504672050476, mean loss: 0.3949199668063177
Epoch: 5, step: 179, loss: 0.34989333152770996, mean loss: 0.39491388212587464
Epoch: 5, step: 180, loss: 0.3489573001861572, mean loss: 0.39490767261608684
Epoch: 5, step: 181, loss: 0.3876952528953552, mean loss: 0.3949066982281213
Epoch: 5, step: 182, loss: 0.33719775080680847, mean loss: 0.3948989028819885
Epoch: 5, step: 183, loss: 0.3505518138408661, mean loss: 0.3948929132697463
Epoch: 5, step: 184, loss: 0.30682677030563354, mean loss: 0.39488102047528795
Epoch: 5, step: 185, loss: 0.3466542661190033, mean loss: 0.3948745086261985
Epoch: 5, step: 186, loss: 0.35992375016212463, mean loss: 0.3948697900142822
Epoch: 5, step: 187, loss: 0.3286091983318329, mean loss: 0.3948608455499622
Epoch: 5, step: 188, loss: 0.34939754009246826, mean loss: 0.39485470932301425
Epoch: 5, step: 189, loss: 0.34528177976608276, mean loss: 0.39484801931902547
Epoch: 5, step: 190, loss: 0.36485186219215393, mean loss: 0.39484397180085967
Epoch: 5, step: 191, loss: 0.3655546009540558, mean loss: 0.39484002018579667
Epoch: 5, step: 192, loss: 0.39341169595718384, mean loss: 0.3948398275074979
Epoch: 5, step: 193, loss: 0.3682802617549896, mean loss: 0.39483624515441557
Epoch: 5, step: 194, loss: 0.42830148339271545, mean loss: 0.39484075833556703
Epoch: 5, step: 195, loss: 0.32065823674201965, mean loss: 0.3948307552986747
Epoch: 5, step: 196, loss: 0.337712824344635, mean loss: 0.39482305435072346
Epoch: 5, step: 197, loss: 0.3572005033493042, mean loss: 0.3948179825590004
Epoch: 5, step: 198, loss: 0.36579352617263794, mean loss: 0.3948140703799485
Epoch: 5, step: 199, loss: 0.3383272886276245, mean loss: 0.3948064576061274
Epoch: 5, step: 200, loss: 0.39445042610168457, mean loss: 0.3948064096299107
Epoch: 5, step: 201, loss: 0.35010525584220886, mean loss: 0.3948003868390474
Epoch: 5, step: 202, loss: 0.35004428029060364, mean loss: 0.3947943574565136
Epoch: 5, step: 203, loss: 0.33232080936431885, mean loss: 0.3947859423772986
Epoch: 5, step: 204, loss: 0.34998318552970886, mean loss: 0.3947799083359723
Epoch: 5, step: 205, loss: 0.35846269130706787, mean loss: 0.39477501778695145
Epoch: 5, step: 206, loss: 0.3571217954158783, mean loss: 0.39476994801148746
Epoch: 5, step: 207, loss: 0.28979408740997314, mean loss: 0.3947558155585255
Epoch: 5, step: 208, loss: 0.3335148096084595, mean loss: 0.3947475720525422
Epoch: 5, step: 209, loss: 0.3711971044540405, mean loss: 0.3947444024068358
Epoch: 5, step: 210, loss: 0.4290634095668793, mean loss: 0.39474902076333696
Epoch: 5, step: 211, loss: 0.3753437101840973, mean loss: 0.39474640971508895
Epoch: 5, step: 212, loss: 0.35515937209129333, mean loss: 0.39474108386581896
Epoch: 5, step: 213, loss: 0.36580124497413635, mean loss: 0.3947371909630894
Epoch: 5, step: 214, loss: 0.3776666522026062, mean loss: 0.3947348949928459
Epoch: 5, step: 215, loss: 0.3602350354194641, mean loss: 0.39473025542055257
Epoch: 5, step: 216, loss: 0.3373567759990692, mean loss: 0.3947225408206573
Epoch: 5, step: 217, loss: 0.32987213134765625, mean loss: 0.39471382202400856
Epoch: 5, step: 218, loss: 0.32660943269729614, mean loss: 0.3947046669777219
Epoch: 5, step: 219, loss: 0.39197108149528503, mean loss: 0.39470429956031833
Epoch: 5, step: 220, loss: 0.3404771685600281, mean loss: 0.3946970119469599
Epoch: 5, step: 221, loss: 0.33110982179641724, mean loss: 0.3946884675784903
Epoch: 5, step: 222, loss: 0.35696813464164734, mean loss: 0.3946833996847731
Epoch: 5, step: 223, loss: 0.3423115015029907, mean loss: 0.39467636423364716
Epoch: 5, step: 224, loss: 0.34790709614753723, mean loss: 0.39467008226345424
Epoch: 5, step: 225, loss: 0.3646308481693268, mean loss: 0.39466604798543997
Epoch: 5, step: 226, loss: 0.32684028148651123, mean loss: 0.3946569401881392
Epoch: 5, step: 227, loss: 0.30735528469085693, mean loss: 0.39464521869841074
Epoch: 5, step: 228, loss: 0.36596351861953735, mean loss: 0.3946413682889492
Epoch: 5, step: 229, loss: 0.3530052602291107, mean loss: 0.3946357795496123
Epoch: 5, step: 230, loss: 0.32718321681022644, mean loss: 0.39462672672948895
Epoch: 5, step: 231, loss: 0.3510725796222687, mean loss: 0.39462088210427326
Epoch: 5, step: 232, loss: 0.33353763818740845, mean loss: 0.3946126863114493
Epoch: 5, step: 233, loss: 0.3240087628364563, mean loss: 0.39460321436035256
Epoch: 5, step: 234, loss: 0.3598393499851227, mean loss: 0.39459855119947057
Epoch: 5, step: 235, loss: 0.35024020075798035, mean loss: 0.3945926018498942
Epoch: 5, step: 236, loss: 0.30134204030036926, mean loss: 0.3945800967457572
Epoch: 5, step: 237, loss: 0.36180058121681213, mean loss: 0.39457570153048116
Epoch: 5, step: 238, loss: 0.35830071568489075, mean loss: 0.39457083827993206
Epoch: 5, step: 239, loss: 0.3814888000488281, mean loss: 0.3945690846555043
Epoch: 5, step: 240, loss: 0.3460842967033386, mean loss: 0.39456258622527346
Epoch: 5, step: 241, loss: 0.36809852719306946, mean loss: 0.3945590397150842
Epoch: 5, step: 242, loss: 0.36409273743629456, mean loss: 0.394554957402036
Epoch: 5, step: 243, loss: 0.28658515214920044, mean loss: 0.39454049199404395
Epoch: 5, step: 244, loss: 0.3820265531539917, mean loss: 0.3945388156459073
Epoch: 5, step: 245, loss: 0.36414849758148193, mean loss: 0.3945347451505866
Epoch: 5, step: 246, loss: 0.3453701138496399, mean loss: 0.39452816089569165
Epoch: 5, step: 247, loss: 0.325957328081131, mean loss: 0.3945189789416458
Epoch: 5, step: 248, loss: 0.3891555964946747, mean loss: 0.3945182608558984
Epoch: 5, step: 249, loss: 0.35718396306037903, mean loss: 0.3945132629579338
Epoch: 5, step: 250, loss: 0.31309813261032104, mean loss: 0.3945023654702685
Epoch: 5, step: 251, loss: 0.31328484416007996, mean loss: 0.39449149588765203
Epoch: 5, step: 252, loss: 0.313154935836792, mean loss: 0.39448061183037236
Epoch: 5, step: 253, loss: 0.3494853079319, mean loss: 0.3944745915863399
Epoch: 5, step: 254, loss: 0.37522435188293457, mean loss: 0.3944720163034364
Epoch: 5, step: 255, loss: 0.38187795877456665, mean loss: 0.3944703317050511
Epoch: 5, step: 256, loss: 0.39631304144859314, mean loss: 0.3944705781554648
Epoch: 5, step: 257, loss: 0.3541755974292755, mean loss: 0.3944651896851885
Epoch: 5, step: 258, loss: 0.3561825156211853, mean loss: 0.3944600709963178
Epoch: 5, step: 259, loss: 0.33089447021484375, mean loss: 0.394451572921347
Epoch: 5, step: 260, loss: 0.3614965081214905, mean loss: 0.3944471677529471
Epoch: 5, step: 261, loss: 0.3231378495693207, mean loss: 0.3944376369699768
Epoch: 5, step: 262, loss: 0.39474374055862427, mean loss: 0.3944376778765101
Epoch: 5, step: 263, loss: 0.35201495885849, mean loss: 0.3944320094212698
Epoch: 5, step: 264, loss: 0.3072603940963745, mean loss: 0.39442036324687774
Epoch: 5, step: 265, loss: 0.3285168707370758, mean loss: 0.39441155968122055
Epoch: 5, step: 266, loss: 0.3295905590057373, mean loss: 0.3944029018742651
Epoch: 5, step: 267, loss: 0.350911408662796, mean loss: 0.39439709371544945
Epoch: 5, step: 268, loss: 0.3264910876750946, mean loss: 0.39438802628240893
Epoch: 5, step: 269, loss: 0.35436907410621643, mean loss: 0.39438268329813975
Epoch: 5, step: 270, loss: 0.3137250244617462, mean loss: 0.39437191602289795
Epoch: 5, step: 271, loss: 0.34585416316986084, mean loss: 0.3943654400815134
Epoch: 5, step: 272, loss: 0.3729521334171295, mean loss: 0.3943625823067017
Epoch: 5, step: 273, loss: 0.38891303539276123, mean loss: 0.3943618551186961
Epoch: 5, step: 274, loss: 0.33541375398635864, mean loss: 0.39435399012855166
Epoch: 5, step: 275, loss: 0.37412723898887634, mean loss: 0.3943512917892854
Epoch: 5, step: 276, loss: 0.3800298571586609, mean loss: 0.3943493815005525
Epoch: 5, step: 277, loss: 0.3652927279472351, mean loss: 0.3943455062466777
Epoch: 5, step: 278, loss: 0.35851114988327026, mean loss: 0.3943407276953557
Epoch: 5, step: 279, loss: 0.35876378417015076, mean loss: 0.3943359841028857
Epoch: 5, step: 280, loss: 0.332477331161499, mean loss: 0.3943277373820563
Epoch: 5, step: 281, loss: 0.35466673970222473, mean loss: 0.39432245065882515
Epoch: 5, step: 282, loss: 0.3502599000930786, mean loss: 0.3943165780011461
Epoch: 5, step: 283, loss: 0.3393176198005676, mean loss: 0.39430924871567163
Epoch: 5, step: 284, loss: 0.33709803223609924, mean loss: 0.3943016256355278
Epoch: 5, step: 285, loss: 0.35301637649536133, mean loss: 0.39429612533588215
Epoch: 5, step: 286, loss: 0.3608679175376892, mean loss: 0.3942916723975848
Epoch: 5, step: 287, loss: 0.32218432426452637, mean loss: 0.3942820683288404
Epoch: 5, step: 288, loss: 0.30758944153785706, mean loss: 0.39427052316613015
Epoch: 5, step: 289, loss: 0.37907394766807556, mean loss: 0.3942684996540798
Epoch: 5, step: 290, loss: 0.3607277572154999, mean loss: 0.3942640341045606
Epoch: 5, step: 291, loss: 0.3718302845954895, mean loss: 0.3942610477161808
Epoch: 5, step: 292, loss: 0.3630692660808563, mean loss: 0.39425689600825653
Epoch: 5, step: 293, loss: 0.38664987683296204, mean loss: 0.39425588362880815
Epoch: 5, step: 294, loss: 0.36997559666633606, mean loss: 0.3942526527190327
Epoch: 5, step: 295, loss: 0.3284236490726471, mean loss: 0.3942438942033799
Epoch: 5, step: 296, loss: 0.3361726999282837, mean loss: 0.39423616888819096
Epoch: 5, step: 297, loss: 0.3365476429462433, mean loss: 0.39422849550086164
Epoch: 5, step: 298, loss: 0.3728586435317993, mean loss: 0.3942256533872868
Epoch: 5, step: 299, loss: 0.36194175481796265, mean loss: 0.39422136031566857
Epoch: 5, step: 300, loss: 0.40214455127716064, mean loss: 0.39422241379139805
Epoch: 5, step: 301, loss: 0.3764779269695282, mean loss: 0.39422005477958977
Epoch: 5, step: 302, loss: 0.3273114264011383, mean loss: 0.39421116090369207
Epoch: 5, step: 303, loss: 0.368644118309021, mean loss: 0.3942077628384881
Epoch: 5, step: 304, loss: 0.3499705195426941, mean loss: 0.3942018841350601
Epoch: 5, step: 305, loss: 0.4099403917789459, mean loss: 0.39420397535318974
Epoch: 5, step: 306, loss: 0.32983070611953735, mean loss: 0.3941954230389565
Epoch: 5, step: 307, loss: 0.34765639901161194, mean loss: 0.39418924091567975
Epoch: 5, step: 308, loss: 0.357316255569458, mean loss: 0.39418434345448355
Epoch: 5, step: 309, loss: 0.3696342706680298, mean loss: 0.3941810831526527
Epoch: 5, step: 310, loss: 0.3510112166404724, mean loss: 0.3941753508639112
Epoch: 5, step: 311, loss: 0.3306908905506134, mean loss: 0.3941669222313683
Epoch: 5, step: 312, loss: 0.33395159244537354, mean loss: 0.39415892869230207
Epoch: 5, step: 313, loss: 0.33567431569099426, mean loss: 0.39415116593506805
Epoch: 5, step: 314, loss: 0.34141477942466736, mean loss: 0.3941441670781987
Epoch: 5, step: 315, loss: 0.320600688457489, mean loss: 0.3941344081240293
Epoch: 5, step: 316, loss: 0.36274248361587524, mean loss: 0.3941302430816373
Epoch: 5, step: 317, loss: 0.310164213180542, mean loss: 0.39411910404875045
Epoch: 5, step: 318, loss: 0.38249990344047546, mean loss: 0.3941175628363074
Epoch: 5, step: 319, loss: 0.35885289311408997, mean loss: 0.3941128858244079
Epoch: 5, step: 320, loss: 0.4462803900241852, mean loss: 0.39411980367405647
Epoch: 5, step: 321, loss: 0.3486309349536896, mean loss: 0.3941137722674375
Epoch: 5, step: 322, loss: 0.39378559589385986, mean loss: 0.39411372876003015
Epoch: 5, step: 323, loss: 0.35486844182014465, mean loss: 0.3941085265745927
Epoch: 5, step: 324, loss: 0.31389179825782776, mean loss: 0.39409789480145596
Epoch: 5, step: 325, loss: 0.3521157205104828, mean loss: 0.39409233130101984
Epoch: 5, step: 326, loss: 0.3200298845767975, mean loss: 0.39408251780602527
Epoch: 5, step: 327, loss: 0.33573299646377563, mean loss: 0.39407478734479817
Epoch: 5, step: 328, loss: 0.35980674624443054, mean loss: 0.39407024793016043
Epoch: 5, step: 329, loss: 0.3810584247112274, mean loss: 0.3940685245098665
Epoch: 5, step: 330, loss: 0.35469457507133484, mean loss: 0.39406331010787493
Epoch: 5, step: 331, loss: 0.3748186528682709, mean loss: 0.39406076182169386
Epoch: 5, step: 332, loss: 0.36609429121017456, mean loss: 0.39405705912467126
Epoch: 5, step: 333, loss: 0.36699602007865906, mean loss: 0.3940534767790205
Epoch: 5, step: 334, loss: 0.37570154666900635, mean loss: 0.3940510476684831
Epoch: 5, step: 335, loss: 0.3174208104610443, mean loss: 0.39404090602777275
Epoch: 5, step: 336, loss: 0.33972516655921936, mean loss: 0.3940337185539778
Epoch: 5, step: 337, loss: 0.3168755769729614, mean loss: 0.39402350974985223
Epoch: 5, step: 338, loss: 0.33698147535324097, mean loss: 0.3940159635090272
Epoch: 5, step: 339, loss: 0.32454439997673035, mean loss: 0.3940067741487716
Epoch: 5, step: 340, loss: 0.3531457185745239, mean loss: 0.39400136996208013
Epoch: 5, step: 341, loss: 0.336727499961853, mean loss: 0.3939937960570285
Epoch: 5, step: 342, loss: 0.3916720747947693, mean loss: 0.3939934890728605
Epoch: 5, step: 343, loss: 0.392047256231308, mean loss: 0.39399323177079265
Epoch: 5, step: 344, loss: 0.36434245109558105, mean loss: 0.393989312302098
Epoch: 5, step: 345, loss: 0.38973572850227356, mean loss: 0.39398875010492646
Epoch: 5, step: 346, loss: 0.33264145255088806, mean loss: 0.3939806428897085
Epoch: 5, step: 347, loss: 0.4153091311454773, mean loss: 0.39398346113604255
Epoch: 5, step: 348, loss: 0.37752091884613037, mean loss: 0.39398128614036415
Epoch: 5, step: 349, loss: 0.38778895139694214, mean loss: 0.39398046813049054
Epoch: 5, step: 350, loss: 0.4499627947807312, mean loss: 0.3939878624412355
Epoch: 5, step: 351, loss: 0.33485040068626404, mean loss: 0.39398005242251455
Epoch: 5, step: 352, loss: 0.3183433413505554, mean loss: 0.39397006474113705
Epoch: 5, step: 353, loss: 0.4091237783432007, mean loss: 0.39397206549550756
Epoch: 5, step: 354, loss: 0.3336889147758484, mean loss: 0.3939641073237954
Epoch: 5, step: 355, loss: 0.37237367033958435, mean loss: 0.39396125747730854
Epoch: 5, step: 356, loss: 0.38099730014801025, mean loss: 0.39395954651553877
Epoch: 5, step: 357, loss: 0.29993224143981934, mean loss: 0.39394713858401653
Epoch: 5, step: 358, loss: 0.3933229148387909, mean loss: 0.3939470562217332
Epoch: 5, step: 359, loss: 0.3817245066165924, mean loss: 0.39394544374817053
Epoch: 5, step: 360, loss: 0.34439268708229065, mean loss: 0.3939389073075076
Epoch: 5, step: 361, loss: 0.32478055357933044, mean loss: 0.39392978592083805
Epoch: 5, step: 362, loss: 0.3311263918876648, mean loss: 0.39392150379054225
Epoch: 5, step: 363, loss: 0.3041161596775055, mean loss: 0.39390966236858643
Epoch: 5, step: 364, loss: 0.31352752447128296, mean loss: 0.39389906485535015
Epoch: 5, step: 365, loss: 0.40210315585136414, mean loss: 0.3939001463332036
Epoch: 5, step: 366, loss: 0.3529096245765686, mean loss: 0.39389474360198484
Epoch: 5, step: 367, loss: 0.36998072266578674, mean loss: 0.39389159204413876
Epoch: 5, step: 368, loss: 0.3632635772228241, mean loss: 0.39388755620083643
Epoch: 5, step: 369, loss: 0.3269326984882355, mean loss: 0.3938787347439573
Epoch: 5, step: 370, loss: 0.4195556938648224, mean loss: 0.3938821172968648
Epoch: 5, step: 371, loss: 0.3930529057979584, mean loss: 0.39388200807511836
Epoch: 5, step: 372, loss: 0.3230162262916565, mean loss: 0.3938726750339247
Epoch: 5, step: 373, loss: 0.4072558879852295, mean loss: 0.3938744373743186
Epoch: 5, step: 374, loss: 0.3737095296382904, mean loss: 0.39387178235025855
Epoch: 5, step: 375, loss: 0.32360073924064636, mean loss: 0.39386253129139737
Epoch: 5, step: 376, loss: 0.37300780415534973, mean loss: 0.39385978616475054
Epoch: 5, step: 377, loss: 0.3979094326496124, mean loss: 0.39386031915323233
Epoch: 5, step: 378, loss: 0.3654131591320038, mean loss: 0.39385657561329007
Epoch: 5, step: 379, loss: 0.32139644026756287, mean loss: 0.39384704138495513
Epoch: 5, step: 380, loss: 0.34866172075271606, mean loss: 0.3938410967302213
Epoch: 5, step: 381, loss: 0.3266812264919281, mean loss: 0.3938322622300584
Epoch: 5, step: 382, loss: 0.377040833234787, mean loss: 0.39383005370329327
Epoch: 5, step: 383, loss: 0.3198930323123932, mean loss: 0.39382033026544594
Epoch: 5, step: 384, loss: 0.35209882259368896, mean loss: 0.39381484420263574
Epoch: 5, step: 385, loss: 0.444247841835022, mean loss: 0.39382147488862473
Epoch: 5, step: 386, loss: 0.43409204483032227, mean loss: 0.3938267687718825
Epoch: 5, step: 387, loss: 0.3606981337070465, mean loss: 0.39382241432458165
Epoch: 5, step: 388, loss: 0.43726298213005066, mean loss: 0.39382812342798623
Epoch: 5, step: 389, loss: 0.3571822941303253, mean loss: 0.39382330794450426
Epoch: 5, step: 390, loss: 0.3415765166282654, mean loss: 0.39381644330236576
Epoch: 5, step: 391, loss: 0.33841484785079956, mean loss: 0.3938091651106354
Epoch: 5, step: 392, loss: 0.36653846502304077, mean loss: 0.393805582987939
Epoch: 5, step: 393, loss: 0.3148285150527954, mean loss: 0.393795210375917
Epoch: 5, step: 394, loss: 0.3304590582847595, mean loss: 0.39378689308739556
Epoch: 5, step: 395, loss: 0.35316142439842224, mean loss: 0.3937815588609396
Epoch: 5, step: 396, loss: 0.3501032888889313, mean loss: 0.39377582454690885
Epoch: 5, step: 397, loss: 0.35914433002471924, mean loss: 0.3937712785381766
Epoch: 5, step: 398, loss: 0.3434467315673828, mean loss: 0.39376467340010457
Epoch: 5, step: 399, loss: 0.3864935338497162, mean loss: 0.3937637191823158
Epoch: 5, step: 400, loss: 0.3933051526546478, mean loss: 0.39376365901087795
Epoch: 5, step: 401, loss: 0.3680354356765747, mean loss: 0.3937602834895798
Epoch: 5, step: 402, loss: 0.40154099464416504, mean loss: 0.3937613041784365
Epoch: 5, step: 403, loss: 0.3625555634498596, mean loss: 0.39375721108547634
Epoch: 5, step: 404, loss: 0.4023289382457733, mean loss: 0.3937583352464154
Epoch: 5, step: 405, loss: 0.3379271328449249, mean loss: 0.393751014081663
Epoch: 5, step: 406, loss: 0.32487037777900696, mean loss: 0.39374198292441864
Epoch: 5, step: 407, loss: 0.3380945324897766, mean loss: 0.39373468776835746
Epoch: 5, step: 408, loss: 0.3703669309616089, mean loss: 0.39373162475134255
Epoch: 5, step: 409, loss: 0.3659316897392273, mean loss: 0.3937279812474091
Epoch: 5, step: 410, loss: 0.3486822843551636, mean loss: 0.3937220782600035
Epoch: 5, step: 411, loss: 0.3319604694843292, mean loss: 0.39371398580602346
Epoch: 5, step: 412, loss: 0.3375300467014313, mean loss: 0.39370662514322974
Epoch: 5, step: 413, loss: 0.34435486793518066, mean loss: 0.39370016041213096
Epoch: 5, step: 414, loss: 0.3666303753852844, mean loss: 0.39369661492620733
Epoch: 5, step: 415, loss: 0.3229016661643982, mean loss: 0.39368734371762143
Epoch: 5, step: 416, loss: 0.3918778896331787, mean loss: 0.3936871067850452
Epoch: 5, step: 417, loss: 0.33940640091896057, mean loss: 0.393680000120229
Epoch: 5, step: 418, loss: 0.34521567821502686, mean loss: 0.39367365579218805
Epoch: 5, step: 419, loss: 0.38515982031822205, mean loss: 0.3936725414158171
Epoch: 5, step: 420, loss: 0.37064436078071594, mean loss: 0.39366952765052
Epoch: 5, step: 421, loss: 0.3330826163291931, mean loss: 0.3936615995019566
Epoch: 5, step: 422, loss: 0.4027670621871948, mean loss: 0.3936627908486379
Epoch: 5, step: 423, loss: 0.3873338997364044, mean loss: 0.3936619628932334
Epoch: 5, step: 424, loss: 0.36324700713157654, mean loss: 0.3936579844817538
Epoch: 5, step: 425, loss: 0.3369975686073303, mean loss: 0.39365057401669046
Epoch: 5, step: 426, loss: 0.40027686953544617, mean loss: 0.39365144053892387
Epoch: 5, step: 427, loss: 0.34066060185432434, mean loss: 0.3936445118204766
Epoch: 5, step: 428, loss: 0.37819382548332214, mean loss: 0.3936424918588689
Epoch: 5, step: 429, loss: 0.3452221155166626, mean loss: 0.39363616239790916
Epoch: 5, step: 430, loss: 0.32841092348098755, mean loss: 0.39362763733727435
Epoch: 5, step: 431, loss: 0.3532753586769104, mean loss: 0.3936223639082806
Epoch: 5, step: 432, loss: 0.34499648213386536, mean loss: 0.39361601007556474
Epoch: 5, step: 433, loss: 0.3329511880874634, mean loss: 0.3936080841777351
Epoch: 5, step: 434, loss: 0.31476739048957825, mean loss: 0.3935977849362343
Epoch: 5, step: 435, loss: 0.34232568740844727, mean loss: 0.3935910879537986
Epoch: 5, step: 436, loss: 0.33141976594924927, mean loss: 0.39358296841324686
Epoch: 5, step: 437, loss: 0.3543645739555359, mean loss: 0.39357784718127276
Epoch: 5, step: 438, loss: 0.3643186092376709, mean loss: 0.3935740269386897
Epoch: 5, step: 439, loss: 0.35468900203704834, mean loss: 0.39356895056468166
Epoch: 5, step: 440, loss: 0.3925434648990631, mean loss: 0.3935688167067433
Epoch: 5, step: 441, loss: 0.32933011651039124, mean loss: 0.3935604326425047
Epoch: 5, step: 442, loss: 0.38471367955207825, mean loss: 0.39355927816604763
Epoch: 5, step: 443, loss: 0.3687632977962494, mean loss: 0.3935560427823877
Epoch: 5, step: 444, loss: 0.32330605387687683, mean loss: 0.39354687774795777
Epoch: 5, step: 445, loss: 0.3565952479839325, mean loss: 0.3935420575510149
Epoch: 5, step: 446, loss: 0.3255269229412079, mean loss: 0.3935331863974203
Epoch: 5, step: 447, loss: 0.342655211687088, mean loss: 0.39352655129378045
Epoch: 5, step: 448, loss: 0.33928295969963074, mean loss: 0.3935194781953851
Epoch: 5, step: 449, loss: 0.40652918815612793, mean loss: 0.3935211743766055
Epoch: 5, step: 450, loss: 0.3527480959892273, mean loss: 0.39351585915324644
Epoch: 5, step: 451, loss: 0.3953220844268799, mean loss: 0.3935160945840694
Epoch: 5, step: 452, loss: 0.4011176526546478, mean loss: 0.3935170852732484
Epoch: 5, step: 453, loss: 0.3600136339664459, mean loss: 0.39351271943388083
Epoch: 5, step: 454, loss: 0.360040545463562, mean loss: 0.3935083582385753
Epoch: 5, step: 455, loss: 0.41763702034950256, mean loss: 0.39351150162863663
Epoch: 5, step: 456, loss: 0.34015408158302307, mean loss: 0.39350455133294227
Epoch: 5, step: 457, loss: 0.36224544048309326, mean loss: 0.39350048007599386
Epoch: 5, step: 458, loss: 0.3482130765914917, mean loss: 0.39349458251075303
Epoch: 5, step: 459, loss: 0.4020102322101593, mean loss: 0.3934956913193076
Epoch: 5, step: 460, loss: 0.36812934279441833, mean loss: 0.39349238883935383
Epoch: 5, step: 461, loss: 0.3629164397716522, mean loss: 0.39348840863249784
Epoch: 5, step: 462, loss: 0.3160805106163025, mean loss: 0.39347833341474225
Epoch: 5, step: 463, loss: 0.34429898858070374, mean loss: 0.3934719331876686
Epoch: 5, step: 464, loss: 0.36896559596061707, mean loss: 0.3934687443344185
Epoch: 5, step: 465, loss: 0.36794987320899963, mean loss: 0.393465424158628
Epoch: 5, step: 466, loss: 0.3319554626941681, mean loss: 0.3934574223423844
Epoch: 5, step: 467, loss: 0.3614225685596466, mean loss: 0.39345325547794857
Epoch: 5, step: 468, loss: 0.39458245038986206, mean loss: 0.3934534023364363
Epoch: 5, step: 469, loss: 0.37989577651023865, mean loss: 0.3934516393161728
Epoch: 5, step: 470, loss: 0.3507925868034363, mean loss: 0.3934460926964208
Epoch: 5, step: 471, loss: 0.39408984780311584, mean loss: 0.39344617638793233
Epoch: 5, step: 472, loss: 0.29462212324142456, mean loss: 0.39343333041716066
Epoch: 5, step: 473, loss: 0.33610716462135315, mean loss: 0.39342587965477493
Epoch: 5, step: 474, loss: 0.36838001012802124, mean loss: 0.3934226248309248
Epoch: 5, step: 475, loss: 0.3441200256347656, mean loss: 0.3934162185680355
Epoch: 5, step: 476, loss: 0.3614821434020996, mean loss: 0.39341206966909226
Epoch: 5, step: 477, loss: 0.34122976660728455, mean loss: 0.39340529098591975
Epoch: 5, step: 478, loss: 0.3363410532474518, mean loss: 0.393397879083369
Epoch: 5, step: 479, loss: 0.35609304904937744, mean loss: 0.3933930343002477
Epoch: 5, step: 480, loss: 0.38583728671073914, mean loss: 0.3933920531617476
Epoch: 5, step: 481, loss: 0.3431444466114044, mean loss: 0.39338552919309655
Epoch: 5, step: 482, loss: 0.34108486771583557, mean loss: 0.39337873954471575
Epoch: 5, step: 483, loss: 0.3396677076816559, mean loss: 0.3933717677077657
Epoch: 5, step: 484, loss: 0.3237714469432831, mean loss: 0.39336273457074244
Epoch: 5, step: 485, loss: 0.35302093625068665, mean loss: 0.39335749945546605
Epoch: 5, step: 486, loss: 0.3488777279853821, mean loss: 0.39335172810844776
Epoch: 5, step: 487, loss: 0.3116907775402069, mean loss: 0.3933411337972687
Epoch: 5, step: 488, loss: 0.3418295383453369, mean loss: 0.39333445178981613
Epoch: 5, step: 489, loss: 0.3677864074707031, mean loss: 0.39333113816539084
Epoch: 5, step: 490, loss: 0.3604634404182434, mean loss: 0.39332687572242014
Epoch: 5, step: 491, loss: 0.3322974145412445, mean loss: 0.3933189621512089
Epoch: 5, step: 492, loss: 0.36432313919067383, mean loss: 0.3933152028068603
Epoch: 5, step: 493, loss: 0.37495362758636475, mean loss: 0.39331282251450606
Epoch: 5, step: 494, loss: 0.3836917579174042, mean loss: 0.39331157545493417
Epoch: 5, step: 495, loss: 0.413077175617218, mean loss: 0.3933141370931097
Epoch: 5, step: 496, loss: 0.37369775772094727, mean loss: 0.3933115951235137
Epoch: 5, step: 497, loss: 0.34914451837539673, mean loss: 0.3933058725170421
Epoch: 5, step: 498, loss: 0.4071107804775238, mean loss: 0.39330766094921726
Epoch: 5, step: 499, loss: 0.3819124400615692, mean loss: 0.39330618488433544
Epoch: 5, step: 500, loss: 0.3517846167087555, mean loss: 0.393300807139461
Epoch: 5, step: 501, loss: 0.35945358872413635, mean loss: 0.39329642392029296
Epoch: 5, step: 502, loss: 0.356289267539978, mean loss: 0.3932916321092894
Epoch: 5, step: 503, loss: 0.351654589176178, mean loss: 0.393286241503006
Epoch: 5, step: 504, loss: 0.3164927363395691, mean loss: 0.39327630059618873
Epoch: 5, step: 505, loss: 0.3639247715473175, mean loss: 0.3932725015372904
Epoch: 5, step: 506, loss: 0.38532838225364685, mean loss: 0.393271473438509
Epoch: 5, step: 507, loss: 0.39746561646461487, mean loss: 0.39327201615887986
Epoch: 5, step: 508, loss: 0.3669155538082123, mean loss: 0.3932686060848275
Epoch: 5, step: 509, loss: 0.4060060977935791, mean loss: 0.3932702538845311
Epoch: 5, step: 510, loss: 0.3539089262485504, mean loss: 0.39326516252149446
Epoch: 5, step: 511, loss: 0.35689330101013184, mean loss: 0.393260458452494
Epoch: 5, step: 512, loss: 0.34112748503685, mean loss: 0.39325371682913757
Epoch: 5, step: 513, loss: 0.3215404748916626, mean loss: 0.39324444436444433
Epoch: 5, step: 514, loss: 0.32706865668296814, mean loss: 0.39323588899434975
Epoch: 5, step: 515, loss: 0.36293017864227295, mean loss: 0.3932319715033528
Epoch: 5, step: 516, loss: 0.3626510500907898, mean loss: 0.39322801894791626
Epoch: 5, step: 517, loss: 0.32879337668418884, mean loss: 0.39321969190704475
Epoch: 5, step: 518, loss: 0.32855668663978577, mean loss: 0.3932113364340809
Epoch: 5, step: 519, loss: 0.3324154317378998, mean loss: 0.3932034816660323
Epoch: 5, step: 520, loss: 0.35932618379592896, mean loss: 0.39319910531958224
Epoch: 5, step: 521, loss: 0.3424830436706543, mean loss: 0.39319255454954233
Epoch: 5, step: 522, loss: 0.34959113597869873, mean loss: 0.3931869234739165
Epoch: 5, step: 523, loss: 0.3882182836532593, mean loss: 0.39318628186236937
Epoch: 5, step: 524, loss: 0.42092519998550415, mean loss: 0.39318986338827294
Epoch: 5, step: 525, loss: 0.34299954771995544, mean loss: 0.393183383874244
Epoch: 5, step: 526, loss: 0.3191307783126831, mean loss: 0.3931738249991231
Epoch: 5, step: 527, loss: 0.37986743450164795, mean loss: 0.39317210760231136
Epoch: 5, step: 528, loss: 0.36981165409088135, mean loss: 0.3931690929612594
Epoch: 5, step: 529, loss: 0.3760606348514557, mean loss: 0.3931668854182775
Epoch: 5, step: 530, loss: 0.3548898696899414, mean loss: 0.3931619470857103
Epoch: 5, step: 531, loss: 0.3649121820926666, mean loss: 0.3931583028951797
Epoch: 5, step: 532, loss: 0.36917370557785034, mean loss: 0.3931552093059475
Epoch: 5, step: 533, loss: 0.3479757308959961, mean loss: 0.39314938270310895
Epoch: 5, step: 534, loss: 0.3505449891090393, mean loss: 0.393143888906385
Epoch: 5, step: 535, loss: 0.40568146109580994, mean loss: 0.39314550540615156
Epoch: 5, step: 536, loss: 0.40373197197914124, mean loss: 0.39314687016914923
Epoch: 5, step: 537, loss: 0.3421894311904907, mean loss: 0.3931403017959888
Epoch: 5, step: 538, loss: 0.3860526382923126, mean loss: 0.39313938831957385
Epoch: 5, step: 539, loss: 0.3362760543823242, mean loss: 0.3931320605703551
Epoch: 5, step: 540, loss: 0.37986910343170166, mean loss: 0.3931303516466161
Epoch: 5, step: 541, loss: 0.3661399185657501, mean loss: 0.3931268743942223
Epoch: 5, step: 542, loss: 0.3307218551635742, mean loss: 0.3931188356180751
Epoch: 5, step: 543, loss: 0.3576204776763916, mean loss: 0.39311426344420314
Epoch: 5, step: 544, loss: 0.3805729150772095, mean loss: 0.3931126483317283
Epoch: 5, step: 545, loss: 0.3092513382434845, mean loss: 0.3931018498112431
Epoch: 5, step: 546, loss: 0.3466825485229492, mean loss: 0.3930958733336728
Epoch: 5, step: 547, loss: 0.3149181306362152, mean loss: 0.39308580925763037
Epoch: 5, step: 548, loss: 0.35512489080429077, mean loss: 0.39308092305368475
Epoch: 5, step: 549, loss: 0.35409989953041077, mean loss: 0.39307590619094046
Epoch: 5, step: 550, loss: 0.38215017318725586, mean loss: 0.39307450022864426
Epoch: 5, step: 551, loss: 0.34730976819992065, mean loss: 0.3930686118174208
Epoch: 5, step: 552, loss: 0.34413257241249084, mean loss: 0.3930623161736018
Epoch: 5, step: 553, loss: 0.38867032527923584, mean loss: 0.39306175121464965
Epoch: 5, step: 554, loss: 0.38743099570274353, mean loss: 0.3930610270017221
Epoch: 5, step: 555, loss: 0.3510432839393616, mean loss: 0.39305562348538176
Epoch: 5, step: 556, loss: 0.33673766255378723, mean loss: 0.39304838188053004
Epoch: 5, step: 557, loss: 0.3368343412876129, mean loss: 0.39304115456751987
Epoch: 5, step: 558, loss: 0.390956312417984, mean loss: 0.39304088655850206
Epoch: 5, step: 559, loss: 0.341894268989563, mean loss: 0.3930343124431333
Epoch: 5, step: 560, loss: 0.35278457403182983, mean loss: 0.39302913961979297
Epoch: 5, step: 561, loss: 0.3462675213813782, mean loss: 0.393023130673733
Epoch: 5, step: 562, loss: 0.3280636966228485, mean loss: 0.39301478435045784
Epoch: 5, step: 563, loss: 0.35430750250816345, mean loss: 0.39300981167807314
Epoch: 5, step: 564, loss: 0.3593868911266327, mean loss: 0.39300549274158614
Epoch: 5, step: 565, loss: 0.3314149081707001, mean loss: 0.3929975823145927
Epoch: 5, step: 566, loss: 0.3358142077922821, mean loss: 0.39299023887366263
Epoch: 5, step: 567, loss: 0.37880241870880127, mean loss: 0.392988417119661
Epoch: 5, step: 568, loss: 0.3585231602191925, mean loss: 0.3929839922567902
Epoch: 5, step: 569, loss: 0.3308674097061157, mean loss: 0.39297601836942814
Epoch: 5, step: 570, loss: 0.3413175940513611, mean loss: 0.3929693878439092
Epoch: 5, step: 571, loss: 0.3241254687309265, mean loss: 0.39296055263868424
Epoch: 5, step: 572, loss: 0.3397214710712433, mean loss: 0.3929537209844346
Epoch: 5, step: 573, loss: 0.3410821855068207, mean loss: 0.3929470656681044
Epoch: 5, step: 574, loss: 0.3535591959953308, mean loss: 0.3929420127021425
Epoch: 5, step: 575, loss: 0.33771470189094543, mean loss: 0.39293492864482965
Epoch: 5, step: 576, loss: 0.3446347713470459, mean loss: 0.39292873393439004
Epoch: 5, step: 577, loss: 0.34472498297691345, mean loss: 0.39292255238130497
Epoch: 5, step: 578, loss: 0.34673380851745605, mean loss: 0.3929166299881951
Epoch: 5, step: 579, loss: 0.3301934599876404, mean loss: 0.39290858855614375
Epoch: 5, step: 580, loss: 0.3824608623981476, mean loss: 0.3929072492757748
Epoch: 5, step: 581, loss: 0.3443281948566437, mean loss: 0.39290102278841016
Epoch: 5, step: 582, loss: 0.34339985251426697, mean loss: 0.39289467892447655
Epoch: 5, step: 583, loss: 0.40041083097457886, mean loss: 0.3928956420398084
Epoch: 5, step: 584, loss: 0.3483894467353821, mean loss: 0.392889939772633
Epoch: 5, step: 585, loss: 0.3487878441810608, mean loss: 0.3928842900037896
Epoch: 5, step: 586, loss: 0.3138175308704376, mean loss: 0.3928741623287373
Epoch: 5, step: 587, loss: 0.3204186260700226, mean loss: 0.3928648826750156
Epoch: 5, step: 588, loss: 0.3155561685562134, mean loss: 0.39285498272443053
Epoch: 5, step: 589, loss: 0.34200814366340637, mean loss: 0.39284847224567754
Epoch: 5, step: 590, loss: 0.381241112947464, mean loss: 0.3928469862183701
Epoch: 5, step: 591, loss: 0.3152962625026703, mean loss: 0.3928370590903983
Epoch: 5, step: 592, loss: 0.34221988916397095, mean loss: 0.39283058050727704
Epoch: 5, step: 593, loss: 0.3561955392360687, mean loss: 0.3928258921221643
Epoch: 5, step: 594, loss: 0.3419802486896515, mean loss: 0.39281938596177624
Epoch: 5, step: 595, loss: 0.31240391731262207, mean loss: 0.39280909739106884
Epoch: 5, step: 596, loss: 0.33970406651496887, mean loss: 0.3928023038601905
Epoch: 5, step: 597, loss: 0.339884877204895, mean loss: 0.3927955351947191
Epoch: 5, step: 598, loss: 0.39995479583740234, mean loss: 0.39279645081828257
Epoch: 5, step: 599, loss: 0.39585137367248535, mean loss: 0.392796841473379
Epoch: 5, step: 600, loss: 0.32833459973335266, mean loss: 0.39278859927394927
Epoch: 5, step: 601, loss: 0.33472317457199097, mean loss: 0.39278117592637807
Epoch: 5, step: 602, loss: 0.34649384021759033, mean loss: 0.3927752590996225
Epoch: 5, step: 603, loss: 0.31297779083251953, mean loss: 0.39276506003670497
Epoch: 5, step: 604, loss: 0.36923694610595703, mean loss: 0.39276205324898217
Epoch: 5, step: 605, loss: 0.3533917963504791, mean loss: 0.39275702254914846
Epoch: 5, step: 606, loss: 0.3565347492694855, mean loss: 0.3927523946874799
Epoch: 5, step: 607, loss: 0.34899336099624634, mean loss: 0.3927468046218576
Epoch: 5, step: 608, loss: 0.39564117789268494, mean loss: 0.39274717432083206
Epoch: 5, step: 609, loss: 0.3463767170906067, mean loss: 0.3927412521679291
Epoch: 5, step: 610, loss: 0.3803805112838745, mean loss: 0.39273967373083496
Epoch: 5, step: 611, loss: 0.377137154340744, mean loss: 0.3927376815807596
Epoch: 5, step: 612, loss: 0.35120388865470886, mean loss: 0.39273237916879405
Epoch: 5, step: 613, loss: 0.35322296619415283, mean loss: 0.39272733584316544
Epoch: 5, step: 614, loss: 0.3790823221206665, mean loss: 0.3927255942970617
Epoch: 5, step: 615, loss: 0.3367287516593933, mean loss: 0.39271844819667406
Epoch: 5, step: 616, loss: 0.3366301655769348, mean loss: 0.3927112913404
Epoch: 5, step: 617, loss: 0.3690750300884247, mean loss: 0.39270827574187334
Epoch: 5, step: 618, loss: 0.3385303318500519, mean loss: 0.39270136440829867
Epoch: 5, step: 619, loss: 0.31650370359420776, mean loss: 0.3926916453189091
Epoch: 5, step: 620, loss: 0.3356996774673462, mean loss: 0.39268437686235363
Epoch: 5, step: 621, loss: 0.31969279050827026, mean loss: 0.39267506908546584
Epoch: 5, step: 622, loss: 0.36750197410583496, mean loss: 0.39267185945968747
Epoch: 5, step: 623, loss: 0.347083181142807, mean loss: 0.39266604754251294
Epoch: 5, step: 624, loss: 0.3603930175304413, mean loss: 0.39266193370822206
Epoch: 5, step: 625, loss: 0.36334237456321716, mean loss: 0.3926581968283922
Epoch: 5, step: 626, loss: 0.33170369267463684, mean loss: 0.39265042895479035
Epoch: 5, step: 627, loss: 0.3651047646999359, mean loss: 0.3926469190587334
Epoch: 5, step: 628, loss: 0.3705487847328186, mean loss: 0.392644103651124
Epoch: 5, step: 629, loss: 0.35548827052116394, mean loss: 0.3926393704239737
Epoch: 5, step: 630, loss: 0.3722999393939972, mean loss: 0.39263677974367434
Epoch: 5, step: 631, loss: 0.3675902783870697, mean loss: 0.39263358991925296
Epoch: 5, step: 632, loss: 0.3480251729488373, mean loss: 0.39262790948923
Epoch: 5, step: 633, loss: 0.329851895570755, mean loss: 0.3926199166175826
Epoch: 5, step: 634, loss: 0.34572404623031616, mean loss: 0.392613946424026
Epoch: 5, step: 635, loss: 0.3812336325645447, mean loss: 0.39261249780973634
Epoch: 5, step: 636, loss: 0.3953569531440735, mean loss: 0.39261284711040256
Epoch: 5, step: 637, loss: 0.331454336643219, mean loss: 0.3926050641490298
Epoch: 5, step: 638, loss: 0.38581669330596924, mean loss: 0.39260420037872273
Epoch: 5, step: 639, loss: 0.34577852487564087, mean loss: 0.39259824291364603
Epoch: 5, step: 640, loss: 0.31731802225112915, mean loss: 0.3925886664958032
Epoch: 5, step: 641, loss: 0.34689974784851074, mean loss: 0.3925828551349984
Epoch: 5, step: 642, loss: 0.36098793148994446, mean loss: 0.39257883695826623
Epoch: 5, step: 643, loss: 0.3435281217098236, mean loss: 0.39257259958348895
Epoch: 5, step: 644, loss: 0.4191996157169342, mean loss: 0.39257598509094394
Epoch: 5, step: 645, loss: 0.3377383053302765, mean loss: 0.3925690136086453
Epoch: 5, step: 646, loss: 0.33256995677948, mean loss: 0.3925613869330601
Epoch: 5, step: 647, loss: 0.3821209967136383, mean loss: 0.3925600599897175
Epoch: 5, step: 648, loss: 0.36120566725730896, mean loss: 0.39255607544368465
Epoch: 5, step: 649, loss: 0.3926723599433899, mean loss: 0.3925560902193517
Epoch: 5, step: 650, loss: 0.34800875186920166, mean loss: 0.39255043053972394
Epoch: 5, step: 651, loss: 0.3442710041999817, mean loss: 0.3925442974825161
Epoch: 5, step: 652, loss: 0.3528062403202057, mean loss: 0.39253925009814394
Epoch: 5, step: 653, loss: 0.3269056975841522, mean loss: 0.3925309146203037
Epoch: 5, step: 654, loss: 0.3653184771537781, mean loss: 0.39252745907268893
Epoch: 5, step: 655, loss: 0.370842307806015, mean loss: 0.3925247057523148
Epoch: 5, step: 656, loss: 0.33474355936050415, mean loss: 0.3925173703268493
Epoch: 5, step: 657, loss: 0.35508376359939575, mean loss: 0.39251261866313675
Epoch: 5, step: 658, loss: 0.33511680364608765, mean loss: 0.39250533400581766
Epoch: 5, step: 659, loss: 0.31892281770706177, mean loss: 0.39249599612303865
Epoch: 5, step: 660, loss: 0.35699519515037537, mean loss: 0.39249149151690077
Epoch: 5, step: 661, loss: 0.3235328197479248, mean loss: 0.3924827426369504
Epoch: 5, step: 662, loss: 0.3528185486793518, mean loss: 0.39247771102538653
Epoch: 5, step: 663, loss: 0.33043840527534485, mean loss: 0.39246984201146595
Epoch: 5, step: 664, loss: 0.3347558379173279, mean loss: 0.39246252254360364
Epoch: 5, step: 665, loss: 0.3617677390575409, mean loss: 0.3924586302302019
Epoch: 5, step: 666, loss: 0.3495657444000244, mean loss: 0.3924531918016701
Epoch: 5, step: 667, loss: 0.35784122347831726, mean loss: 0.3924488038746514
Epoch: 5, step: 668, loss: 0.38543501496315, mean loss: 0.3924479148153395
Epoch: 5, step: 669, loss: 0.3420836925506592, mean loss: 0.3924415315172071
Epoch: 5, step: 670, loss: 0.3261745870113373, mean loss: 0.3924331337292834
Epoch: 5, step: 671, loss: 0.3057052493095398, mean loss: 0.39242214438761847
Epoch: 5, step: 672, loss: 0.33794769644737244, mean loss: 0.39241524277252404
Epoch: 5, step: 673, loss: 0.37722933292388916, mean loss: 0.39241331904439525
Epoch: 5, step: 674, loss: 0.3404361605644226, mean loss: 0.3924067354904396
Epoch: 5, step: 675, loss: 0.34295374155044556, mean loss: 0.3924004724466275
Epoch: 5, step: 676, loss: 0.37326687574386597, mean loss: 0.39239804955227486
Epoch: 5, step: 677, loss: 0.37814152240753174, mean loss: 0.3923962444716032
Epoch: 5, step: 678, loss: 0.33253833651542664, mean loss: 0.39238866656199994
Epoch: 5, step: 679, loss: 0.3190279006958008, mean loss: 0.39237938038910547
Epoch: 5, step: 680, loss: 0.3767032325267792, mean loss: 0.39237739631773955
Epoch: 5, step: 681, loss: 0.40978309512138367, mean loss: 0.39237959901310826
Epoch: 5, step: 682, loss: 0.3601714074611664, mean loss: 0.3923755235744708
Epoch: 5, step: 683, loss: 0.3654572069644928, mean loss: 0.392372117917005
Epoch: 5, step: 684, loss: 0.3613836467266083, mean loss: 0.3923681978067975
Epoch: 5, step: 685, loss: 0.3334086239337921, mean loss: 0.39236074023357803
Epoch: 5, step: 686, loss: 0.3177194893360138, mean loss: 0.3923513003384348
Epoch: 5, step: 687, loss: 0.35978591442108154, mean loss: 0.3923471823078433
Epoch: 5, step: 688, loss: 0.35508671402931213, mean loss: 0.3923424711600018
Epoch: 5, step: 689, loss: 0.34225142002105713, mean loss: 0.39233613853659616
Epoch: 5, step: 690, loss: 0.3269348442554474, mean loss: 0.39232787140294917
Epoch: 5, step: 691, loss: 0.3436938524246216, mean loss: 0.3923217245350298
Epoch: 5, step: 692, loss: 0.3878268599510193, mean loss: 0.39232115649957117
Epoch: 5, step: 693, loss: 0.36361682415008545, mean loss: 0.392317529467432
Epoch: 5, step: 694, loss: 0.33621153235435486, mean loss: 0.3923104409017828
Epoch: 5, step: 695, loss: 0.3598407804965973, mean loss: 0.39230633912558205
Epoch: 5, step: 696, loss: 0.34160116314888, mean loss: 0.3922999345309153
Epoch: 5, step: 697, loss: 0.34265410900115967, mean loss: 0.39229366453526865
Epoch: 5, step: 698, loss: 0.3597033619880676, mean loss: 0.39228954907845
Epoch: 5, step: 699, loss: 0.33907002210617065, mean loss: 0.392282829441206
Epoch: 5, step: 700, loss: 0.3520277738571167, mean loss: 0.3922777473738428
Epoch: 5, step: 701, loss: 0.34983766078948975, mean loss: 0.39227239012989124
Epoch: 5, step: 702, loss: 0.3318631649017334, mean loss: 0.3922647655905465
Epoch: 5, step: 703, loss: 0.3570965528488159, mean loss: 0.3922603274011546
Epoch: 5, step: 704, loss: 0.35283464193344116, mean loss: 0.39225535255125327
Epoch: 5, step: 705, loss: 0.4000993072986603, mean loss: 0.3922563421998462
Epoch: 5, step: 706, loss: 0.38076362013816833, mean loss: 0.39225489237998223
Epoch: 5, step: 707, loss: 0.3439261317253113, mean loss: 0.39224879642127203
Epoch: 5, step: 708, loss: 0.3313373625278473, mean loss: 0.39224111431332737
Epoch: 5, step: 709, loss: 0.37894248962402344, mean loss: 0.392239437311475
Epoch: 5, step: 710, loss: 0.3790285885334015, mean loss: 0.3922377715885172
Epoch: 5, step: 711, loss: 0.3695906400680542, mean loss: 0.39223491642821456
Epoch: 5, step: 712, loss: 0.42212533950805664, mean loss: 0.39223868428691616
Epoch: 5, step: 713, loss: 0.32417598366737366, mean loss: 0.39223010567579697
Epoch: 5, step: 714, loss: 0.3366384208202362, mean loss: 0.39222309979238734
Epoch: 5, step: 715, loss: 0.35817867517471313, mean loss: 0.3922188099203337
Epoch: 5, step: 716, loss: 0.33106592297554016, mean loss: 0.3922111051342754
Epoch: 5, step: 717, loss: 0.37086907029151917, mean loss: 0.39220841654334027
Epoch: 5, step: 718, loss: 0.3645823895931244, mean loss: 0.39220493675659757
Epoch: 5, step: 719, loss: 0.3281659781932831, mean loss: 0.392196871396577
Epoch: 5, step: 720, loss: 0.35072848200798035, mean loss: 0.3921916493352008
Epoch: 5, step: 721, loss: 0.35119518637657166, mean loss: 0.3921864873529597
Epoch: 5, step: 722, loss: 0.33911579847335815, mean loss: 0.3921798059115799
Epoch: 5, step: 723, loss: 0.31529369950294495, mean loss: 0.3921701273986886
Epoch: 5, step: 724, loss: 0.3541310429573059, mean loss: 0.3921653395969968
Epoch: 5, step: 725, loss: 0.3901486098766327, mean loss: 0.39216508579260206
Epoch: 5, step: 726, loss: 0.38063710927963257, mean loss: 0.3921636351852643
Epoch: 5, step: 727, loss: 0.3880446255207062, mean loss: 0.3921631169404651
Epoch: 5, step: 728, loss: 0.35876354575157166, mean loss: 0.39215891520802215
Epoch: 5, step: 729, loss: 0.4086802303791046, mean loss: 0.39216099336087384
Epoch: 5, step: 730, loss: 0.37052348256111145, mean loss: 0.39215827200371123
Epoch: 5, step: 731, loss: 0.373677134513855, mean loss: 0.39215594791700475
Epoch: 5, step: 732, loss: 0.3677804172039032, mean loss: 0.39215288296909667
Epoch: 5, step: 733, loss: 0.37061524391174316, mean loss: 0.3921501751945106
Epoch: 5, step: 734, loss: 0.3371181786060333, mean loss: 0.39214325728167737
Epoch: 5, step: 735, loss: 0.3615435063838959, mean loss: 0.3921394111591412
Epoch: 5, step: 736, loss: 0.35491088032722473, mean loss: 0.39213473244469704
Epoch: 5, step: 737, loss: 0.34362027049064636, mean loss: 0.3921286361313075
Epoch: 5, step: 738, loss: 0.3625977039337158, mean loss: 0.39212492574907387
Epoch: 5, step: 739, loss: 0.3540898561477661, mean loss: 0.3921201474739983
Epoch: 5, step: 740, loss: 0.3524407744407654, mean loss: 0.3921151632542981
Epoch: 5, step: 741, loss: 0.32901790738105774, mean loss: 0.392107238454515
Epoch: 5, step: 742, loss: 0.39043185114860535, mean loss: 0.39210702805801795
Epoch: 5, step: 743, loss: 0.3821569085121155, mean loss: 0.39210577867083235
Epoch: 5, step: 744, loss: 0.3589443266391754, mean loss: 0.3921016152744693
Epoch: 5, step: 745, loss: 0.3563310503959656, mean loss: 0.39209712486963894
Epoch: 5, step: 746, loss: 0.3254951238632202, mean loss: 0.39208876513561025
Epoch: 5, step: 747, loss: 0.3976253569126129, mean loss: 0.3920894599889959
Epoch: 5, step: 748, loss: 0.30098387598991394, mean loss: 0.39207802749006265
Epoch: 5, step: 749, loss: 0.37029850482940674, mean loss: 0.3920752948021504
Epoch: 5, step: 750, loss: 0.3595823347568512, mean loss: 0.3920712184052058
Epoch: 5, step: 751, loss: 0.3520735800266266, mean loss: 0.3920662011399802
Epoch: 5, step: 752, loss: 0.3413204848766327, mean loss: 0.39205983644460035
Epoch: 5, step: 753, loss: 0.32863765954971313, mean loss: 0.392051882823219
Epoch: 5, step: 754, loss: 0.34997397661209106, mean loss: 0.39204660659673485
Epoch: 5, step: 755, loss: 0.3564024567604065, mean loss: 0.3920421376712288
Epoch: 5, step: 756, loss: 0.3551897406578064, mean loss: 0.3920375178395862
Epoch: 5, step: 757, loss: 0.3266911804676056, mean loss: 0.3920293270226682
Epoch: 5, step: 758, loss: 0.366321861743927, mean loss: 0.39202610513204544
Epoch: 5, step: 759, loss: 0.37926149368286133, mean loss: 0.3920245055566759
Epoch: 5, step: 760, loss: 0.38042935729026794, mean loss: 0.392023052712638
Epoch: 5, step: 761, loss: 0.3467214107513428, mean loss: 0.3920173772375739
Epoch: 5, step: 762, loss: 0.3548981845378876, mean loss: 0.3920127274577042
Epoch: 5, step: 763, loss: 0.3505510985851288, mean loss: 0.3920075343679156
Epoch: 5, step: 764, loss: 0.3274557292461395, mean loss: 0.39199945023452526
Epoch: 5, step: 765, loss: 0.2965087294578552, mean loss: 0.39198749296921387
Epoch: 5, step: 766, loss: 0.3220254182815552, mean loss: 0.39197873347570095
Epoch: 5, step: 767, loss: 0.36811381578445435, mean loss: 0.3919757458795954
Epoch: 5, step: 768, loss: 0.3609176576137543, mean loss: 0.3919718582731032
Epoch: 5, step: 769, loss: 0.3521195352077484, mean loss: 0.39196687049800116
Epoch: 5, step: 770, loss: 0.33749404549598694, mean loss: 0.3919600537260074
Epoch: 5, step: 771, loss: 0.32642096281051636, mean loss: 0.391951853139056
Epoch: 5, step: 772, loss: 0.35832133889198303, mean loss: 0.39194764564321627
Epoch: 5, step: 773, loss: 0.3402099311351776, mean loss: 0.3919411735748515
Epoch: 5, step: 774, loss: 0.3734365403652191, mean loss: 0.3919388590491217
Epoch: 5, step: 775, loss: 0.3867539167404175, mean loss: 0.3919382106071121
Epoch: 5, step: 776, loss: 0.3515947759151459, mean loss: 0.39193316578596765
Epoch: 5, step: 777, loss: 0.3388899266719818, mean loss: 0.3919265337230627
Epoch: 5, step: 778, loss: 0.374199777841568, mean loss: 0.3919243176015623
Epoch: 5, step: 779, loss: 0.3905114531517029, mean loss: 0.3919241409935061
Epoch: 5, step: 780, loss: 0.30421963334083557, mean loss: 0.39191317930026115
Epoch: 5, step: 781, loss: 0.34913212060928345, mean loss: 0.3919078330044987
Epoch: 5, step: 782, loss: 0.319722980260849, mean loss: 0.39189881328030235
Epoch: 5, step: 783, loss: 0.3817364573478699, mean loss: 0.3918975436206406
Epoch: 5, step: 784, loss: 0.38130906224250793, mean loss: 0.39189622088717674
Epoch: 5, step: 785, loss: 0.3384964168071747, mean loss: 0.3918895509141465
Epoch: 5, step: 786, loss: 0.34193259477615356, mean loss: 0.39188331175389446
Epoch: 5, step: 787, loss: 0.41424787044525146, mean loss: 0.3918861045309538
Epoch: 5, step: 788, loss: 0.37546733021736145, mean loss: 0.39188405449046015
Epoch: 5, step: 789, loss: 0.36304426193237305, mean loss: 0.39188045401698224
Epoch: 5, step: 790, loss: 0.3653416335582733, mean loss: 0.3918771412195214
Epoch: 5, step: 791, loss: 0.3218415081501007, mean loss: 0.3918683998774009
Epoch: 5, step: 792, loss: 0.39560654759407043, mean loss: 0.3918688663877861
Epoch: 5, step: 793, loss: 0.3580890893936157, mean loss: 0.3918646512920793
Epoch: 5, step: 794, loss: 0.32672446966171265, mean loss: 0.3918565240080331
Epoch: 5, step: 795, loss: 0.3393860161304474, mean loss: 0.3918499782859925
Epoch: 5, step: 796, loss: 0.35257574915885925, mean loss: 0.3918450794174473
Epoch: 5, step: 797, loss: 0.35177332162857056, mean loss: 0.3918400816926046
Epoch: 5, step: 798, loss: 0.3326617181301117, mean loss: 0.39183270192410946
Epoch: 5, step: 799, loss: 0.3470488488674164, mean loss: 0.39182711790253133
Epoch: 5, step: 800, loss: 0.4080900251865387, mean loss: 0.3918291454436464
Epoch: 5, step: 801, loss: 0.35528048872947693, mean loss: 0.3918245893907027
Epoch: 5, step: 802, loss: 0.3557792007923126, mean loss: 0.39182009663380396
Epoch: 5, step: 803, loss: 0.3306671380996704, mean loss: 0.3918124753777553
Epoch: 5, step: 804, loss: 0.36516693234443665, mean loss: 0.39180915506086644
Epoch: 5, step: 805, loss: 0.3182436525821686, mean loss: 0.3917999891622272
Epoch: 5, step: 806, loss: 0.3491956293582916, mean loss: 0.3917946815305087
Epoch: 5, step: 807, loss: 0.3327622711658478, mean loss: 0.3917873282158146
Epoch: 5, step: 808, loss: 0.32741713523864746, mean loss: 0.391779311004085
Epoch: 5, step: 809, loss: 0.3430444300174713, mean loss: 0.3917732419030904
Epoch: 5, step: 810, loss: 0.37080225348472595, mean loss: 0.391770630648151
Epoch: 5, step: 811, loss: 0.32550278306007385, mean loss: 0.39176238016911863
Epoch: 5, step: 812, loss: 0.3367827534675598, mean loss: 0.39175553594819224
Epoch: 5, step: 813, loss: 0.3347797393798828, mean loss: 0.39174844411391685
Epoch: 5, step: 814, loss: 0.3040637671947479, mean loss: 0.39173753127298105
Epoch: 5, step: 815, loss: 0.3610784113407135, mean loss: 0.39173371605148627
Epoch: 5, step: 816, loss: 0.3407396674156189, mean loss: 0.39172737114061956
Epoch: 5, step: 817, loss: 0.3622812330722809, mean loss: 0.3917237077743508
Epoch: 5, step: 818, loss: 0.34812214970588684, mean loss: 0.39171828402039277
Epoch: 5, step: 819, loss: 0.34213951230049133, mean loss: 0.39171211750649726
Epoch: 5, step: 820, loss: 0.3748977780342102, mean loss: 0.39171002643082603
Epoch: 5, step: 821, loss: 0.3388572931289673, mean loss: 0.3917034543426263
Epoch: 5, step: 822, loss: 0.3119035065174103, mean loss: 0.39169353267809504
Epoch: 5, step: 823, loss: 0.37660112977027893, mean loss: 0.39169165644700255
Epoch: 5, step: 824, loss: 0.34130552411079407, mean loss: 0.39168539341004344
Epoch: 5, step: 825, loss: 0.37822598218917847, mean loss: 0.39168372060228546
Epoch: 5, step: 826, loss: 0.36455121636390686, mean loss: 0.39168034884831027
Epoch: 5, step: 827, loss: 0.33070316910743713, mean loss: 0.39167277216096674
Epoch: 5, step: 828, loss: 0.3398095965385437, mean loss: 0.39166632873002843
Epoch: 5, step: 829, loss: 0.32688793540000916, mean loss: 0.39165828172464584
Epoch: 5, step: 830, loss: 0.3205614686012268, mean loss: 0.3916494509193889
Epoch: 5, step: 831, loss: 0.3426573574542999, mean loss: 0.39164336645671316
Epoch: 5, step: 832, loss: 0.3592231273651123, mean loss: 0.39163934059813976
Epoch: 5, step: 833, loss: 0.3375609815120697, mean loss: 0.39163262612594135
Epoch: 5, step: 834, loss: 0.37118977308273315, mean loss: 0.39163008821743195
Epoch: 5, step: 835, loss: 0.3102714419364929, mean loss: 0.39161998908060464
Epoch: 5, step: 836, loss: 0.3385843336582184, mean loss: 0.39161340652438986
Epoch: 5, step: 837, loss: 0.346826434135437, mean loss: 0.39160784844888863
Epoch: 5, step: 838, loss: 0.3599441349506378, mean loss: 0.3916039194609871
Epoch: 5, step: 839, loss: 0.3316957652568817, mean loss: 0.3915964866875126
Epoch: 5, step: 840, loss: 0.33887535333633423, mean loss: 0.39158994641541844
Epoch: 5, step: 841, loss: 0.42068859934806824, mean loss: 0.3915935557745021
Epoch: 5, step: 842, loss: 0.39507409930229187, mean loss: 0.39159398744305324
Epoch: 5, step: 843, loss: 0.3306044042110443, mean loss: 0.3915864242506882
Epoch: 5, step: 844, loss: 0.38778191804885864, mean loss: 0.391585952520223
Epoch: 5, step: 845, loss: 0.35241588950157166, mean loss: 0.3915810963259484
Epoch: 5, step: 846, loss: 0.3443377912044525, mean loss: 0.3915752399598741
Epoch: 5, step: 847, loss: 0.3584206998348236, mean loss: 0.3915711305721541
Epoch: 5, step: 848, loss: 0.3556402921676636, mean loss: 0.3915666776240311
Epoch: 5, step: 849, loss: 0.33263731002807617, mean loss: 0.3915593753479969
Epoch: 5, step: 850, loss: 0.36165446043014526, mean loss: 0.3915556701175524
Epoch: 5, step: 851, loss: 0.38798704743385315, mean loss: 0.3915552280186074
Epoch: 5, step: 852, loss: 0.35387858748435974, mean loss: 0.3915505610248586
Epoch: 5, step: 853, loss: 0.3381277322769165, mean loss: 0.39154394437527373
Epoch: 5, step: 854, loss: 0.3646646738052368, mean loss: 0.39154061567303594
Epoch: 5, step: 855, loss: 0.38807615637779236, mean loss: 0.3915401866909538
Epoch: 5, step: 856, loss: 0.3250524401664734, mean loss: 0.39153195495311494
Epoch: 5, step: 857, loss: 0.3882380425930023, mean loss: 0.39153154718976263
Epoch: 5, step: 858, loss: 0.3906906545162201, mean loss: 0.3915314431060055
Epoch: 5, step: 859, loss: 0.3374718129634857, mean loss: 0.39152475255772057
Epoch: 5, step: 860, loss: 0.3589397966861725, mean loss: 0.3915207202651984
Epoch: 5, step: 861, loss: 0.3642694652080536, mean loss: 0.3915173484197323
Epoch: 5, step: 862, loss: 0.3520286977291107, mean loss: 0.3915124630243728
Epoch: 5, step: 863, loss: 0.35512086749076843, mean loss: 0.39150796134258986
Epoch: 5, step: 864, loss: 0.33177924156188965, mean loss: 0.3915005737458328
Epoch: 5, step: 865, loss: 0.3157903850078583, mean loss: 0.3914912106257811
Epoch: 5, step: 866, loss: 0.3496013879776001, mean loss: 0.3914860307293241
Epoch: 5, step: 867, loss: 0.3642429709434509, mean loss: 0.39148266239849
Epoch: 5, step: 868, loss: 0.34849831461906433, mean loss: 0.3914773484724448
Epoch: 5, step: 869, loss: 0.3397211730480194, mean loss: 0.3914709509229486
Epoch: 5, step: 870, loss: 0.4109691381454468, mean loss: 0.3914733607841799
Epoch: 5, step: 871, loss: 0.3297257721424103, mean loss: 0.39146573008859886
Epoch: 5, step: 872, loss: 0.36115777492523193, mean loss: 0.39146198512935465
Epoch: 5, step: 873, loss: 0.3478409945964813, mean loss: 0.39145659582980774
Epoch: 5, step: 874, loss: 0.3382319509983063, mean loss: 0.3914500208273579
Epoch: 5, step: 875, loss: 0.3510841727256775, mean loss: 0.3914450349271477
Epoch: 5, step: 876, loss: 0.36415159702301025, mean loss: 0.391441664118465
Epoch: 5, step: 877, loss: 0.3103502690792084, mean loss: 0.3914316503625945
Epoch: 5, step: 878, loss: 0.3266616463661194, mean loss: 0.39142365307848576
Epoch: 5, step: 879, loss: 0.30620571970939636, mean loss: 0.391413132345971
Epoch: 5, step: 880, loss: 0.4329758882522583, mean loss: 0.39141826291700005
Epoch: 5, step: 881, loss: 0.3847110867500305, mean loss: 0.3914174350749651
Epoch: 5, step: 882, loss: 0.3318054676055908, mean loss: 0.39141007829754076
Epoch: 5, step: 883, loss: 0.34332409501075745, mean loss: 0.39140414468657253
Epoch: 5, step: 884, loss: 0.3067390024662018, mean loss: 0.39139369864805057
Epoch: 5, step: 885, loss: 0.321548193693161, mean loss: 0.3913850821288111
Epoch: 5, step: 886, loss: 0.39569687843322754, mean loss: 0.39138561398970967
Epoch: 5, step: 887, loss: 0.3704468309879303, mean loss: 0.391383031505373
Epoch: 5, step: 888, loss: 0.3703695237636566, mean loss: 0.3913804401244701
Epoch: 5, step: 889, loss: 0.34320104122161865, mean loss: 0.39137449938477803
Epoch: 5, step: 890, loss: 0.34489408135414124, mean loss: 0.3913687688437805
Epoch: 5, step: 891, loss: 0.3531591594219208, mean loss: 0.3913640585862088
Epoch: 5, step: 892, loss: 0.3430918753147125, mean loss: 0.3913581086067596
Epoch: 5, step: 893, loss: 0.34392690658569336, mean loss: 0.3913522630063134
Epoch: 5, step: 894, loss: 0.38740304112434387, mean loss: 0.3913517763492731
Epoch: 5, step: 895, loss: 0.3198966383934021, mean loss: 0.3913429721183766
Epoch: 5, step: 896, loss: 0.3510151505470276, mean loss: 0.39133800380230277
Epoch: 5, step: 897, loss: 0.3475261330604553, mean loss: 0.39133260692243804
Epoch: 5, step: 898, loss: 0.3663902282714844, mean loss: 0.39132953482259186
Epoch: 5, step: 899, loss: 0.3929155766963959, mean loss: 0.39132973014794575
Epoch: 5, step: 900, loss: 0.3840811252593994, mean loss: 0.3913288375725377
Epoch: 5, step: 901, loss: 0.3450966477394104, mean loss: 0.39132314535512414
Epoch: 5, step: 902, loss: 0.37541595101356506, mean loss: 0.39132118706454905
Epoch: 5, step: 903, loss: 0.33280956745147705, mean loss: 0.3913139847480039
Epoch: 5, step: 904, loss: 0.3215814530849457, mean loss: 0.39130540228256844
Epoch: 5, step: 905, loss: 0.3413625955581665, mean loss: 0.39129925623202394
Epoch: 5, step: 906, loss: 0.3351150453090668, mean loss: 0.39129234295394805
Epoch: 5, step: 907, loss: 0.3356156647205353, mean loss: 0.39128549296892917
Epoch: 5, step: 908, loss: 0.33081182837486267, mean loss: 0.39127805371876384
Epoch: 5, step: 909, loss: 0.3411003649234772, mean loss: 0.39127188180132283
Epoch: 5, step: 910, loss: 0.35200026631355286, mean loss: 0.39126705193839234
Epoch: 5, step: 911, loss: 0.38347920775413513, mean loss: 0.3912660942595699
Epoch: 5, step: 912, loss: 0.3355656862258911, mean loss: 0.39125924556806196
Epoch: 5, step: 913, loss: 0.38311541080474854, mean loss: 0.39125824435896883
Epoch: 5, step: 914, loss: 0.34613117575645447, mean loss: 0.3912526970856311
Epoch: 5, step: 915, loss: 0.34530341625213623, mean loss: 0.3912470494355778
Epoch: 5, step: 916, loss: 0.3623339831829071, mean loss: 0.39124349615227283
Epoch: 5, step: 917, loss: 0.36861667037010193, mean loss: 0.39124071576080294
Epoch: 5, step: 918, loss: 0.36065468192100525, mean loss: 0.3912369578011224
Epoch: 5, step: 919, loss: 0.35217052698135376, mean loss: 0.39123215848529685
Epoch: 5, step: 920, loss: 0.32838550209999084, mean loss: 0.39122443871421403
Epoch: 5, step: 921, loss: 0.3540770411491394, mean loss: 0.39121987627285254
Epoch: 5, step: 922, loss: 0.35730716586112976, mean loss: 0.391215711627094
Epoch: 5, step: 923, loss: 0.31183332204818726, mean loss: 0.3912059642806329
Epoch: 5, step: 924, loss: 0.3131548762321472, mean loss: 0.3911963815810567
Epoch: 5, step: 925, loss: 0.33397889137268066, mean loss: 0.39118935758274975
Epoch: 5, step: 926, loss: 0.3603702485561371, mean loss: 0.3911855747045091
Epoch: 5, step: 927, loss: 0.34003159403800964, mean loss: 0.39117929660182543
Epoch: 5, step: 928, loss: 0.3493162989616394, mean loss: 0.3911741594073672
Epoch: 5, step: 929, loss: 0.337706059217453, mean loss: 0.39116759890427644
Epoch: 5, step: 930, loss: 0.370385080575943, mean loss: 0.3911650492148729
Epoch: 5, step: 931, loss: 0.32856011390686035, mean loss: 0.3911573695123081
Epoch: 5, step: 932, loss: 0.3498149514198303, mean loss: 0.39115229868953216
Epoch: 5, step: 933, loss: 0.3482414782047272, mean loss: 0.39114703614103025
Epoch: 5, step: 934, loss: 0.36569109559059143, mean loss: 0.39114391462778064
Epoch: 5, step: 935, loss: 0.40716877579689026, mean loss: 0.3911458794219407
Epoch: 5, step: 936, loss: 0.37117907404899597, mean loss: 0.39114343160958653
Epoch: 5, step: 937, loss: 0.3698038160800934, mean loss: 0.39114081581949955
Epoch: 5, step: 938, loss: 0.32437005639076233, mean loss: 0.39113263212548943
Epoch: 5, step: 939, loss: 0.35108456015586853, mean loss: 0.3911277242735324
Epoch: 5, step: 940, loss: 0.3866133689880371, mean loss: 0.39112717111150747
Epoch: 5, step: 941, loss: 0.3551845848560333, mean loss: 0.39112276746212554
Epoch: 5, step: 942, loss: 0.339069664478302, mean loss: 0.3911163907497669
Epoch: 5, step: 943, loss: 0.3290975093841553, mean loss: 0.39110879412049626
Epoch: 5, step: 944, loss: 0.29581138491630554, mean loss: 0.3910971226680524
Epoch: 5, step: 945, loss: 0.3473881185054779, mean loss: 0.39109177010815005
Epoch: 5, step: 946, loss: 0.3400879502296448, mean loss: 0.3910855249973531
Epoch: 5, step: 947, loss: 0.36420363187789917, mean loss: 0.39108223387429736
Epoch: 5, step: 948, loss: 0.3966026306152344, mean loss: 0.391082909648167
Epoch: 5, step: 949, loss: 0.371579110622406, mean loss: 0.3910805224022642
Epoch: 5, step: 950, loss: 0.3596998155117035, mean loss: 0.3910766819045417
Epoch: 5, step: 951, loss: 0.36311572790145874, mean loss: 0.391073260348741
Epoch: 5, step: 952, loss: 0.37729182839393616, mean loss: 0.39107157413413746
Epoch: 5, step: 953, loss: 0.34731563925743103, mean loss: 0.39106622107139255
Epoch: 5, step: 954, loss: 0.34505340456962585, mean loss: 0.39106059259230974
Epoch: 5, step: 955, loss: 0.33676066994667053, mean loss: 0.3910539512123384
Epoch: 5, step: 956, loss: 0.30706462264060974, mean loss: 0.3910436798012375
Epoch: 5, step: 957, loss: 0.352035790681839, mean loss: 0.3910389099444119
Epoch: 5, step: 958, loss: 0.33195167779922485, mean loss: 0.39103168568323754
Epoch: 5, step: 959, loss: 0.3321385979652405, mean loss: 0.3910244860392622
Epoch: 5, step: 960, loss: 0.33078595995903015, mean loss: 0.391017122816419
Epoch: 5, step: 961, loss: 0.36205512285232544, mean loss: 0.3910135830950838
Epoch: 5, step: 962, loss: 0.3601342439651489, mean loss: 0.39100980949870967
Epoch: 5, step: 963, loss: 0.3413163721561432, mean loss: 0.391003737475574
Epoch: 5, step: 964, loss: 0.34033504128456116, mean loss: 0.39099754704231915
Epoch: 5, step: 965, loss: 0.33515042066574097, mean loss: 0.3909907247693682
Epoch: 5, step: 966, loss: 0.32520419359207153, mean loss: 0.3909826892824771
Epoch: 5, step: 967, loss: 0.4059739410877228, mean loss: 0.39098452016325447
Epoch: 5, step: 968, loss: 0.3355795741081238, mean loss: 0.39097775438647403
Epoch: 5, step: 969, loss: 0.3291581869125366, mean loss: 0.39097020620973727
Epoch: 5, step: 970, loss: 0.3872129023075104, mean loss: 0.39096974749848074
Epoch: 5, step: 971, loss: 0.3209736943244934, mean loss: 0.39096120305839605
Epoch: 5, step: 972, loss: 0.3379988968372345, mean loss: 0.39095473872222847
Epoch: 5, step: 973, loss: 0.30749478936195374, mean loss: 0.39094455322682203
Epoch: 5, step: 974, loss: 0.337196409702301, mean loss: 0.3909379945759954
Epoch: 5, step: 975, loss: 0.34768617153167725, mean loss: 0.39093271738919155
Epoch: 5, step: 976, loss: 0.36459746956825256, mean loss: 0.3909295045981923
Epoch: 5, step: 977, loss: 0.35218772292137146, mean loss: 0.3909247788380463
Epoch: 5, step: 978, loss: 0.3754779100418091, mean loss: 0.3909228948438036
Epoch: 5, step: 979, loss: 0.34577077627182007, mean loss: 0.3909173884878802
Epoch: 5, step: 980, loss: 0.32066917419433594, mean loss: 0.39090882267708965
Epoch: 5, step: 981, loss: 0.3434458076953888, mean loss: 0.39090303591593606
Epoch: 5, step: 982, loss: 0.3343227207660675, mean loss: 0.39089613840098425
Epoch: 5, step: 983, loss: 0.3501812219619751, mean loss: 0.3908911755881565
Epoch: 5, step: 984, loss: 0.3313109874725342, mean loss: 0.39088391413926976
Epoch: 5, step: 985, loss: 0.38490185141563416, mean loss: 0.3908831851528301
Epoch: 5, step: 986, loss: 0.34845128655433655, mean loss: 0.39087801494464214
Epoch: 5, step: 987, loss: 0.3619244694709778, mean loss: 0.3908744874659051
Epoch: 5, step: 988, loss: 0.3593277931213379, mean loss: 0.39087064452591913
Epoch: 5, step: 989, loss: 0.36016735434532166, mean loss: 0.3908669047829008
Epoch: 5, step: 990, loss: 0.3478427231311798, mean loss: 0.3908616649605099
Epoch: 5, step: 991, loss: 0.35309654474258423, mean loss: 0.39085706618795535
Epoch: 5, step: 992, loss: 0.3743929862976074, mean loss: 0.3908550615514169
Epoch: 5, step: 993, loss: 0.3858790695667267, mean loss: 0.39085445575740857
Epoch: 5, step: 994, loss: 0.33600595593452454, mean loss: 0.39084777912931085
Epoch: 5, step: 995, loss: 0.33092549443244934, mean loss: 0.3908404857645717
Epoch: 5, step: 996, loss: 0.32804661989212036, mean loss: 0.3908328438191083
Epoch: 5, step: 997, loss: 0.338114857673645, mean loss: 0.39082642887798574
Epoch: 5, step: 998, loss: 0.33167243003845215, mean loss: 0.390819231652187
Epoch: 5, step: 999, loss: 0.3710140287876129, mean loss: 0.39081682226011105
Epoch: 5, step: 1000, loss: 0.3665662407875061, mean loss: 0.39081387242657833
Epoch: 5, step: 1001, loss: 0.38523176312446594, mean loss: 0.39081319350304367
Epoch: 5, step: 1002, loss: 0.3538089990615845, mean loss: 0.39080869341859253
Epoch: 5, step: 1003, loss: 0.338035523891449, mean loss: 0.39080227644758975
Epoch: 5, step: 1004, loss: 0.32640066742897034, mean loss: 0.3907944464647303
Epoch: 5, step: 1005, loss: 0.37191537022590637, mean loss: 0.39079215141534557
Epoch: 5, step: 1006, loss: 0.3313475549221039, mean loss: 0.3907849258657536
Epoch: 5, step: 1007, loss: 0.3300665318965912, mean loss: 0.3907775463818001
Epoch: 5, step: 1008, loss: 0.3153640627861023, mean loss: 0.3907683820260345
Epoch: 5, step: 1009, loss: 0.32561734318733215, mean loss: 0.3907604657394198
Epoch: 5, step: 1010, loss: 0.3884040415287018, mean loss: 0.39076017945291625
Epoch: 5, step: 1011, loss: 0.3562600612640381, mean loss: 0.39075598847645987
Epoch: 5, step: 1012, loss: 0.3464204967021942, mean loss: 0.3907506033808964
Epoch: 5, step: 1013, loss: 0.3304087519645691, mean loss: 0.39074327500447953
Epoch: 5, step: 1014, loss: 0.3794150650501251, mean loss: 0.3907418993869987
Epoch: 5, step: 1015, loss: 0.37670567631721497, mean loss: 0.3907401951345619
Epoch: 5, step: 1016, loss: 0.4022836685180664, mean loss: 0.3907415965517506
Epoch: 5, step: 1017, loss: 0.33345815539360046, mean loss: 0.39073464299006594
Epoch: 5, step: 1018, loss: 0.3438138961791992, mean loss: 0.39072894803354075
Epoch: 5, step: 1019, loss: 0.3460082709789276, mean loss: 0.3907235207669079
Epoch: 5, step: 1020, loss: 0.39493030309677124, mean loss: 0.39072403123679383
Epoch: 5, step: 1021, loss: 0.32685670256614685, mean loss: 0.39071628222821936
Epoch: 5, step: 1022, loss: 0.41511958837509155, mean loss: 0.3907192427166516
Epoch: 5, step: 1023, loss: 0.3255552351474762, mean loss: 0.3907113383004011
Epoch: 5, step: 1024, loss: 0.3490554988384247, mean loss: 0.39070628604576657
Epoch: 5, step: 1025, loss: 0.32576867938041687, mean loss: 0.39069841100251346
Epoch: 5, step: 1026, loss: 0.32380470633506775, mean loss: 0.39069029972511954
Epoch: 5, step: 1027, loss: 0.3327595293521881, mean loss: 0.39068327611086484
Epoch: 5, step: 1028, loss: 0.33263829350471497, mean loss: 0.3906762395024752
Epoch: 5, step: 1029, loss: 0.3369802236557007, mean loss: 0.3906697308944938
Epoch: 5, step: 1030, loss: 0.33419787883758545, mean loss: 0.3906628866511225
Epoch: 5, step: 1031, loss: 0.3531702160835266, mean loss: 0.39065834318643905
Epoch: 5, step: 1032, loss: 0.4304005205631256, mean loss: 0.3906631586689759
Epoch: 5, step: 1033, loss: 0.33449631929397583, mean loss: 0.39065635386653164
Epoch: 5, step: 1034, loss: 0.33455079793930054, mean loss: 0.39064955731220974
Epoch: 5, step: 1035, loss: 0.3580648601055145, mean loss: 0.3906456105223349
Epoch: 5, step: 1036, loss: 0.365835040807724, mean loss: 0.390642605730072
Epoch: 5, step: 1037, loss: 0.34477686882019043, mean loss: 0.39063705163260165
Epoch: 5, step: 1038, loss: 0.390077143907547, mean loss: 0.39063698383895534
Epoch: 5, step: 1039, loss: 0.37712153792381287, mean loss: 0.39063534758642326
Epoch: 5, step: 1040, loss: 0.35760417580604553, mean loss: 0.3906313491392885
Epoch: 5, step: 1041, loss: 0.3249812424182892, mean loss: 0.39062340310845806
Epoch: 5, step: 1042, loss: 0.30923905968666077, mean loss: 0.39061355385958696
Epoch: 5, step: 1043, loss: 0.33874189853668213, mean loss: 0.39060727703779086
Epoch: 5, step: 1044, loss: 0.3494585454463959, mean loss: 0.39060229836488203
Epoch: 5, step: 1045, loss: 0.3298249840736389, mean loss: 0.3905949456774527
Epoch: 5, step: 1046, loss: 0.38833123445510864, mean loss: 0.39059467185245905
Epoch: 5, step: 1047, loss: 0.3586646616458893, mean loss: 0.390590809974108
Epoch: 5, step: 1048, loss: 0.36095869541168213, mean loss: 0.3905872264555976
Epoch: 5, step: 1049, loss: 0.3971351385116577, mean loss: 0.3905880182224726
Epoch: 5, step: 1050, loss: 0.3608265519142151, mean loss: 0.3905844199312976
Epoch: 5, step: 1051, loss: 0.35452356934547424, mean loss: 0.3905800605441378
Epoch: 5, step: 1052, loss: 0.3553203344345093, mean loss: 0.3905757985199495
Epoch: 5, step: 1053, loss: 0.331147700548172, mean loss: 0.3905686160087129
Epoch: 5, step: 1054, loss: 0.3700491487979889, mean loss: 0.39056613631479015
Epoch: 5, step: 1055, loss: 0.3797665238380432, mean loss: 0.39056483138336473
Epoch: 5, step: 1056, loss: 0.2975809872150421, mean loss: 0.3905535973802032
Epoch: 5, step: 1057, loss: 0.4328315854072571, mean loss: 0.3905587046510448
Epoch: 5, step: 1058, loss: 0.3743295967578888, mean loss: 0.3905567443771116
Epoch: 5, step: 1059, loss: 0.3233158588409424, mean loss: 0.3905486234972159
Epoch: 5, step: 1060, loss: 0.33910343050956726, mean loss: 0.39054241105995136
Epoch: 5, step: 1061, loss: 0.3383847773075104, mean loss: 0.3905361133500078
Epoch: 5, step: 1062, loss: 0.35537096858024597, mean loss: 0.39053186789005734
Epoch: 5, step: 1063, loss: 0.33568546175956726, mean loss: 0.39052524712640085
Epoch: 5, step: 1064, loss: 0.3625817894935608, mean loss: 0.3905218743493782
Epoch: 5, step: 1065, loss: 0.36360490322113037, mean loss: 0.39051862586143127
Epoch: 5, step: 1066, loss: 0.3262704312801361, mean loss: 0.39051087297201637
Epoch: 5, step: 1067, loss: 0.3484807014465332, mean loss: 0.390505801764062
Epoch: 5, step: 1068, loss: 0.34295186400413513, mean loss: 0.3905000647707263
Epoch: 5, step: 1069, loss: 0.36295512318611145, mean loss: 0.3904967420998476
Epoch: 5, step: 1070, loss: 0.3742915391921997, mean loss: 0.39049478754636696
Epoch: 5, step: 1071, loss: 0.3738081455230713, mean loss: 0.39049277516792713
Epoch: 5, step: 1072, loss: 0.35562992095947266, mean loss: 0.39048857127859776
Epoch: 5, step: 1073, loss: 0.3707256615161896, mean loss: 0.3904861884826293
Epoch: 5, step: 1074, loss: 0.3486133813858032, mean loss: 0.39048114052517335
Epoch: 5, step: 1075, loss: 0.4159892797470093, mean loss: 0.39048421527676713
Epoch: 5, step: 1076, loss: 0.34144046902656555, mean loss: 0.3904783042551629
Epoch: 5, step: 1077, loss: 0.3656720221042633, mean loss: 0.3904753148261257
Epoch: 5, step: 1078, loss: 0.3497633934020996, mean loss: 0.39047040918431053
Epoch: 5, step: 1079, loss: 0.3806985914707184, mean loss: 0.39046923185687515
Epoch: 5, step: 1080, loss: 0.3646415174007416, mean loss: 0.3904661204589163
Epoch: 5, step: 1081, loss: 0.3660202622413635, mean loss: 0.39046317588432977
Epoch: 5, step: 1082, loss: 0.3601195216178894, mean loss: 0.39045952134328843
Epoch: 5, step: 1083, loss: 0.3310539126396179, mean loss: 0.39045236748867573
Epoch: 5, step: 1084, loss: 0.3321594297885895, mean loss: 0.3904453484714933
Epoch: 5, step: 1085, loss: 0.37821781635284424, mean loss: 0.39044387633904465
Epoch: 5, step: 1086, loss: 0.38415682315826416, mean loss: 0.3904431195010549
Epoch: 5, step: 1087, loss: 0.3076915144920349, mean loss: 0.39043315902861764
Epoch: 5, step: 1088, loss: 0.3424875736236572, mean loss: 0.39042738870903587
Epoch: 5, step: 1089, loss: 0.3209053575992584, mean loss: 0.39041902264031025
Epoch: 5, step: 1090, loss: 0.35189902782440186, mean loss: 0.39041438781961285
Epoch: 5, step: 1091, loss: 0.36683890223503113, mean loss: 0.39041155150036544
Epoch: 5, step: 1092, loss: 0.3026527762413025, mean loss: 0.3904009946887139
Epoch: 5, step: 1093, loss: 0.35005608201026917, mean loss: 0.39039614204104994
Epoch: 5, step: 1094, loss: 0.3331674635410309, mean loss: 0.3903892594579471
Epoch: 5, step: 1095, loss: 0.3471989929676056, mean loss: 0.390384065823208
Epoch: 5, step: 1096, loss: 0.3173161447048187, mean loss: 0.39037528045334885
Epoch: 5, step: 1097, loss: 0.3334146738052368, mean loss: 0.390368432580465
Epoch: 5, step: 1098, loss: 0.3702499568462372, mean loss: 0.390366014203769
Epoch: 5, step: 1099, loss: 0.38814836740493774, mean loss: 0.39036574765968257
Epoch: 5, step: 1100, loss: 0.37924277782440186, mean loss: 0.3903644109249349
Epoch: 5, step: 1101, loss: 0.32398101687431335, mean loss: 0.3903564340691249
Epoch: 5, step: 1102, loss: 0.3304663300514221, mean loss: 0.39034923833393115
Epoch: 5, step: 1103, loss: 0.3486897945404053, mean loss: 0.39034423359536874
Epoch: 5, step: 1104, loss: 0.3501928448677063, mean loss: 0.3903394106057318
Epoch: 5, step: 1105, loss: 0.35351523756980896, mean loss: 0.3903349878129098
Epoch: 5, step: 1106, loss: 0.3169410824775696, mean loss: 0.3903261738456545
Epoch: 5, step: 1107, loss: 0.35025474429130554, mean loss: 0.3903213621946513
Epoch: 5, step: 1108, loss: 0.34272071719169617, mean loss: 0.3903156471454253
Epoch: 5, step: 1109, loss: 0.3528018295764923, mean loss: 0.3903111436859333
Epoch: 5, step: 1110, loss: 0.36761319637298584, mean loss: 0.3903084191693911
Epoch: 5, step: 1111, loss: 0.3930087685585022, mean loss: 0.3903087432631728
Epoch: 5, step: 1112, loss: 0.3628472089767456, mean loss: 0.39030544774723774
Epoch: 5, step: 1113, loss: 0.3243955373764038, mean loss: 0.3902975391906778
Epoch: 5, step: 1114, loss: 0.3184365928173065, mean loss: 0.3902889176014308
Epoch: 5, step: 1115, loss: 0.331729531288147, mean loss: 0.3902818927230343
Epoch: 5, step: 1116, loss: 0.3676634132862091, mean loss: 0.39027917969923237
Epoch: 5, step: 1117, loss: 0.36937132477760315, mean loss: 0.39027667216086326
Epoch: 5, step: 1118, loss: 0.3465535342693329, mean loss: 0.39027142894969985
Epoch: 5, step: 1119, loss: 0.32601484656333923, mean loss: 0.3902637243235144
Epoch: 5, step: 1120, loss: 0.33811241388320923, mean loss: 0.3902574719184742
Epoch: 5, step: 1121, loss: 0.3162500262260437, mean loss: 0.39024860025152475
Epoch: 5, step: 1122, loss: 0.33893057703971863, mean loss: 0.39024244922393136
Epoch: 5, step: 1123, loss: 0.39294713735580444, mean loss: 0.3902427733715982
Epoch: 5, step: 1124, loss: 0.3123820424079895, mean loss: 0.3902334431461981
Epoch: 5, step: 1125, loss: 0.3480129539966583, mean loss: 0.3902283843768296
Epoch: 5, step: 1126, loss: 0.31572943925857544, mean loss: 0.3902194591408025
Epoch: 5, step: 1127, loss: 0.35361170768737793, mean loss: 0.3902150739286016
Epoch: 5, step: 1128, loss: 0.35005995631217957, mean loss: 0.3902102643564832
Epoch: 5, step: 1129, loss: 0.3647519052028656, mean loss: 0.39020721545119536
Epoch: 5, step: 1130, loss: 0.3460184931755066, mean loss: 0.39020192402235143
Epoch: 5, step: 1131, loss: 0.342929869890213, mean loss: 0.3901962640541843
Epoch: 5, step: 1132, loss: 0.35974159836769104, mean loss: 0.3901926180987567
Epoch: 5, step: 1133, loss: 0.36892998218536377, mean loss: 0.39019007289455354
Epoch: 5, step: 1134, loss: 0.37423089146614075, mean loss: 0.3901881627591342
Epoch: 5, step: 1135, loss: 0.33975180983543396, mean loss: 0.3901821268145526
Epoch: 5, step: 1136, loss: 0.3209275007247925, mean loss: 0.3901738397945586
Epoch: 5, step: 1137, loss: 0.33003726601600647, mean loss: 0.3901666447031757
Epoch: 5, step: 1138, loss: 0.34293806552886963, mean loss: 0.3901609946757592
Epoch: 5, step: 1139, loss: 0.3895937502384186, mean loss: 0.3901609268235538
Epoch: 5, step: 1140, loss: 0.36029037833213806, mean loss: 0.39015735421878267
Epoch: 5, step: 1141, loss: 0.32787495851516724, mean loss: 0.3901499059533314
Epoch: 5, step: 1142, loss: 0.33022943139076233, mean loss: 0.3901427410036049
Epoch: 5, step: 1143, loss: 0.3891731798648834, mean loss: 0.39014262508285663
Epoch: 5, step: 1144, loss: 0.32047149538993835, mean loss: 0.3901342961970595
Epoch: 5, step: 1145, loss: 0.34482264518737793, mean loss: 0.39012888003031204
Epoch: 5, step: 1146, loss: 0.354195773601532, mean loss: 0.39012458540781547
Epoch: 5, step: 1147, loss: 0.36817505955696106, mean loss: 0.3901219623765235
Epoch: 5, step: 1148, loss: 0.3518970012664795, mean loss: 0.390117394929862
Epoch: 5, step: 1149, loss: 0.3327028751373291, mean loss: 0.39011053536955226
Epoch: 5, step: 1150, loss: 0.3693254590034485, mean loss: 0.39010805238348534
Epoch: 5, step: 1151, loss: 0.34585174918174744, mean loss: 0.3901027661552004
Epoch: 5, step: 1152, loss: 0.3435761034488678, mean loss: 0.3900972094058028
Epoch: 5, step: 1153, loss: 0.33531442284584045, mean loss: 0.39009066739642134
Epoch: 5, step: 1154, loss: 0.3444477617740631, mean loss: 0.39008521749724256
Epoch: 5, step: 1155, loss: 0.39373642206192017, mean loss: 0.3900856534099174
Epoch: 5, step: 1156, loss: 0.3801581561565399, mean loss: 0.39008446832011756
Epoch: 5, step: 1157, loss: 0.3461187481880188, mean loss: 0.3900792205616869
Epoch: 5, step: 1158, loss: 0.3345504701137543, mean loss: 0.390072593428324
Epoch: 5, step: 1159, loss: 0.3683934807777405, mean loss: 0.39007000642204115
Epoch: 5, step: 1160, loss: 0.3580639362335205, mean loss: 0.39006618753763733
Epoch: 5, step: 1161, loss: 0.3475983738899231, mean loss: 0.3900611209886457
Epoch: 5, step: 1162, loss: 0.32631075382232666, mean loss: 0.39005351626871654
Epoch: 5, step: 1163, loss: 0.3653373122215271, mean loss: 0.3900505682481956
Epoch: 5, step: 1164, loss: 0.38675370812416077, mean loss: 0.3900501750627306
Epoch: 5, step: 1165, loss: 0.35245779156684875, mean loss: 0.39004569230772274
Epoch: 5, step: 1166, loss: 0.32944437861442566, mean loss: 0.3900384666831021
Epoch: 5, step: 1167, loss: 0.34120112657546997, mean loss: 0.3900326443964894
Epoch: 5, step: 1168, loss: 0.36523541808128357, mean loss: 0.39002968847488784
Epoch: 5, step: 1169, loss: 0.3507661521434784, mean loss: 0.3900250086731797
Epoch: 5, step: 1170, loss: 0.33918842673301697, mean loss: 0.39001895020792643
Epoch: 5, step: 1171, loss: 0.33030542731285095, mean loss: 0.39001183467850614
Epoch: 5, step: 1172, loss: 0.3397020101547241, mean loss: 0.3900058404184652
Epoch: 5, step: 1173, loss: 0.3592393696308136, mean loss: 0.3900021751253049
Epoch: 5, step: 1174, loss: 0.35267359018325806, mean loss: 0.3899977285994035
Epoch: 5, step: 1175, loss: 0.3075651228427887, mean loss: 0.38998791051867976
Epoch: 5, step: 1176, loss: 0.3394283354282379, mean loss: 0.3899818893712354
Epoch: 5, step: 1177, loss: 0.3319736421108246, mean loss: 0.38997498198289765
Epoch: 5, step: 1178, loss: 0.35426124930381775, mean loss: 0.3899707298418476
Epoch: 5, step: 1179, loss: 0.3412266671657562, mean loss: 0.38996492697724333
Epoch: 5, step: 1180, loss: 0.31351494789123535, mean loss: 0.3899558268726027
Epoch: 5, step: 1181, loss: 0.3367817997932434, mean loss: 0.3899494981381253
Epoch: 5, step: 1182, loss: 0.32136619091033936, mean loss: 0.38994133637360934
Epoch: 5, step: 1183, loss: 0.3813078999519348, mean loss: 0.38994030907275
Epoch: 5, step: 1184, loss: 0.3173445165157318, mean loss: 0.3899316718576927
Epoch: 5, step: 1185, loss: 0.3126715123653412, mean loss: 0.38992248078471
Epoch: 5, step: 1186, loss: 0.328655868768692, mean loss: 0.38991519321339846
Epoch: 5, step: 1187, loss: 0.3444465696811676, mean loss: 0.3899097854322933
Epoch: 5, step: 1188, loss: 0.35000473260879517, mean loss: 0.3899050399152493
Epoch: 5, step: 1189, loss: 0.391019344329834, mean loss: 0.38990517241280154
Epoch: 5, step: 1190, loss: 0.3470931351184845, mean loss: 0.3899000824071786
Epoch: 5, step: 1191, loss: 0.4043909013271332, mean loss: 0.38990180504375965
Epoch: 5, step: 1192, loss: 0.34781819581985474, mean loss: 0.3898968028317991
Epoch: 5, step: 1193, loss: 0.3680989742279053, mean loss: 0.3898942121699731
Epoch: 5, step: 1194, loss: 0.34608638286590576, mean loss: 0.38988900624848716
Epoch: 5, step: 1195, loss: 0.31837770342826843, mean loss: 0.38988050918303796
Epoch: 5, step: 1196, loss: 0.34751927852630615, mean loss: 0.3898754763648537
Epoch: 5, step: 1197, loss: 0.35528630018234253, mean loss: 0.3898713674106861
Epoch: 5, step: 1198, loss: 0.363568514585495, mean loss: 0.3898682431853832
Epoch: 5, step: 1199, loss: 0.34507742524147034, mean loss: 0.38986292361080555
Epoch: 5, step: 1200, loss: 0.34111571311950684, mean loss: 0.3898571348433799
Epoch: 5, step: 1201, loss: 0.37430539727211, mean loss: 0.38985528828228144
Epoch: 5, step: 1202, loss: 0.3442632853984833, mean loss: 0.3898498754836487
Epoch: 5, step: 1203, loss: 0.4005271792411804, mean loss: 0.38985114296984974
Epoch: 5, step: 1204, loss: 0.35276180505752563, mean loss: 0.38984674067454855
Epoch: 5, step: 1205, loss: 0.3701722025871277, mean loss: 0.3898444056949512
Epoch: 5, step: 1206, loss: 0.35374289751052856, mean loss: 0.38984012166644944
Epoch: 5, step: 1207, loss: 0.34333622455596924, mean loss: 0.3898346038808407
Epoch: 5, step: 1208, loss: 0.3209246098995209, mean loss: 0.38982642853453847
Epoch: 5, step: 1209, loss: 0.31556999683380127, mean loss: 0.38981761994240316
Epoch: 5, step: 1210, loss: 0.3422163724899292, mean loss: 0.38981197396358064
Epoch: 5, step: 1211, loss: 0.3624679744243622, mean loss: 0.3898087310793848
Epoch: 5, step: 1212, loss: 0.39182785153388977, mean loss: 0.3898089705102462
Epoch: 5, step: 1213, loss: 0.37017184495925903, mean loss: 0.38980664218139266
Epoch: 5, step: 1214, loss: 0.3350285291671753, mean loss: 0.38980014803639984
Epoch: 5, step: 1215, loss: 0.346713125705719, mean loss: 0.38979504051834263
Epoch: 5, step: 1216, loss: 0.33735010027885437, mean loss: 0.38978882445336227
Epoch: 5, step: 1217, loss: 0.32186129689216614, mean loss: 0.3897807742604776
Epoch: 5, step: 1218, loss: 0.3811294734477997, mean loss: 0.38977974910337215
Epoch: 5, step: 1219, loss: 0.32976171374320984, mean loss: 0.3897726379617418
Epoch: 5, step: 1220, loss: 0.32006773352622986, mean loss: 0.3897643800652324
Epoch: 5, step: 1221, loss: 0.33920419216156006, mean loss: 0.3897583909408657
Epoch: 5, step: 1222, loss: 0.34547749161720276, mean loss: 0.38975314625303864
Epoch: 5, step: 1223, loss: 0.35602882504463196, mean loss: 0.38974915237321767
Epoch: 5, step: 1224, loss: 0.31821393966674805, mean loss: 0.38974068165531284
Epoch: 5, step: 1225, loss: 0.3025503158569336, mean loss: 0.38973035838207126
Epoch: 5, step: 1226, loss: 0.33413630723953247, mean loss: 0.389723776867789
Epoch: 5, step: 1227, loss: 0.3371281325817108, mean loss: 0.3897175510576225
Epoch: 5, step: 1228, loss: 0.38884299993515015, mean loss: 0.38971744754819865
Epoch: 5, step: 1229, loss: 0.378980815410614, mean loss: 0.3897161769408451
Epoch: 5, step: 1230, loss: 0.34504950046539307, mean loss: 0.38971089156911687
Epoch: 5, step: 1231, loss: 0.3446590304374695, mean loss: 0.389705561249532
Epoch: 5, step: 1232, loss: 0.3660781979560852, mean loss: 0.3897027661042234
Epoch: 5, step: 1233, loss: 0.3729746639728546, mean loss: 0.3897007873838388
Epoch: 5, step: 1234, loss: 0.34213557839393616, mean loss: 0.38969516169383406
Epoch: 5, step: 1235, loss: 0.33691731095314026, mean loss: 0.3896889202261495
Epoch: 5, step: 1236, loss: 0.35387691855430603, mean loss: 0.3896846856273944
Epoch: 5, step: 1237, loss: 0.376016765832901, mean loss: 0.38968306965201077
Epoch: 5, step: 1238, loss: 0.36722657084465027, mean loss: 0.38968041490572786
Epoch: 5, step: 1239, loss: 0.34448882937431335, mean loss: 0.3896750731107478
Epoch: 5, step: 1240, loss: 0.34121567010879517, mean loss: 0.38966934572592304
Epoch: 5, step: 1241, loss: 0.3384862542152405, mean loss: 0.38966329714503073
Epoch: 5, step: 1242, loss: 0.3582083582878113, mean loss: 0.3896595803851516
Epoch: 5, step: 1243, loss: 0.3326302170753479, mean loss: 0.3896528425114146
Epoch: 5, step: 1244, loss: 0.33539003133773804, mean loss: 0.38964643225610757
Epoch: 5, step: 1245, loss: 0.3459305167198181, mean loss: 0.38964126855240616
Epoch: 5, step: 1246, loss: 0.3439435660839081, mean loss: 0.38963587139845923
Epoch: 5, step: 1247, loss: 0.3579171895980835, mean loss: 0.38963212568733496
Epoch: 5, step: 1248, loss: 0.3821895718574524, mean loss: 0.3896312468877329
Epoch: 5, step: 1249, loss: 0.3546602129936218, mean loss: 0.3896271180761751
Epoch: 5, step: 1250, loss: 0.3560151159763336, mean loss: 0.38962315018547744
Epoch: 5, step: 1251, loss: 0.33343520760536194, mean loss: 0.3896165179920662
Epoch: 5, step: 1252, loss: 0.35436198115348816, mean loss: 0.38961235718280873
Epoch: 5, step: 1253, loss: 0.36197102069854736, mean loss: 0.3896090952832944
Epoch: 5, step: 1254, loss: 0.3270682096481323, mean loss: 0.3896017158277622
Epoch: 5, step: 1255, loss: 0.35562363266944885, mean loss: 0.3895977070874179
Epoch: 5, step: 1256, loss: 0.3571956157684326, mean loss: 0.3895938847338354
Epoch: 5, step: 1257, loss: 0.3826102316379547, mean loss: 0.38959306099556035
Epoch: 5, step: 1258, loss: 0.3447349965572357, mean loss: 0.3895877705055924
Epoch: 5, step: 1259, loss: 0.3652907609939575, mean loss: 0.3895849052922066
Epoch: 5, step: 1260, loss: 0.3407737612724304, mean loss: 0.3895791499397694
Epoch: 5, step: 1261, loss: 0.36421388387680054, mean loss: 0.389576159458036
Epoch: 5, step: 1262, loss: 0.3744150996208191, mean loss: 0.3895743722294804
Epoch: 5, step: 1263, loss: 0.33951646089553833, mean loss: 0.3895684719570459
Epoch: 5, step: 1264, loss: 0.3587339520454407, mean loss: 0.3895648379535207
Epoch: 5, step: 1265, loss: 0.3870430290699005, mean loss: 0.38956454078066144
Epoch: 5, step: 1266, loss: 0.31289246678352356, mean loss: 0.3895555067198629
Epoch: 5, step: 1267, loss: 0.3253719210624695, mean loss: 0.389547945034465
Epoch: 5, step: 1268, loss: 0.3202355206012726, mean loss: 0.38953978006515966
Epoch: 5, step: 1269, loss: 0.3366841673851013, mean loss: 0.389533554433513
Epoch: 5, step: 1270, loss: 0.35735905170440674, mean loss: 0.3895297651857531
Epoch: 5, step: 1271, loss: 0.381605327129364, mean loss: 0.3895288320206499
Epoch: 5, step: 1272, loss: 0.3385370671749115, mean loss: 0.38952282804504107
Epoch: 5, step: 1273, loss: 0.33068645000457764, mean loss: 0.38951590122869534
Epoch: 5, step: 1274, loss: 0.3524457812309265, mean loss: 0.38951153747119116
Epoch: 5, step: 1275, loss: 0.3947249948978424, mean loss: 0.38951215110789394
Epoch: 5, step: 1276, loss: 0.3978314995765686, mean loss: 0.3895131302003346
Epoch: 5, step: 1277, loss: 0.3153628408908844, mean loss: 0.3895044045838002
Epoch: 5, step: 1278, loss: 0.3233090341091156, mean loss: 0.3894966159768494
Epoch: 5, step: 1279, loss: 0.3485064208507538, mean loss: 0.38949179360095226
Epoch: 5, step: 1280, loss: 0.3355598449707031, mean loss: 0.38948544941219443
Epoch: 5, step: 1281, loss: 0.36534225940704346, mean loss: 0.3894826097050661
Epoch: 5, step: 1282, loss: 0.38452908396720886, mean loss: 0.3894820271429424
Epoch: 5, step: 1283, loss: 0.34421953558921814, mean loss: 0.38947670464863926
Epoch: 5, step: 1284, loss: 0.31494376063346863, mean loss: 0.3894679412219473
Epoch: 5, step: 1285, loss: 0.30502721667289734, mean loss: 0.3894580140264912
Epoch: 5, step: 1286, loss: 0.3266957998275757, mean loss: 0.38945063631235005
Epoch: 5, step: 1287, loss: 0.40472182631492615, mean loss: 0.38945243123360096
Epoch: 5, step: 1288, loss: 0.3828136622905731, mean loss: 0.38945165102806056
Epoch: 5, step: 1289, loss: 0.3446594774723053, mean loss: 0.3894463875529071
Epoch: 5, step: 1290, loss: 0.3566303253173828, mean loss: 0.3894425318294627
Epoch: 5, step: 1291, loss: 0.31823956966400146, mean loss: 0.3894341668198098
Epoch: 5, step: 1292, loss: 0.34324193000793457, mean loss: 0.3894287407377222
Epoch: 5, step: 1293, loss: 0.373559832572937, mean loss: 0.38942687687723776
Epoch: 5, step: 1294, loss: 0.3588298559188843, mean loss: 0.3894232835688457
Epoch: 5, step: 1295, loss: 0.3002603054046631, mean loss: 0.3894128135150453
Epoch: 5, step: 1296, loss: 0.3605644702911377, mean loss: 0.38940942636660997
Epoch: 5, step: 1297, loss: 0.29745161533355713, mean loss: 0.389398630662098
Epoch: 5, step: 1298, loss: 0.35561510920524597, mean loss: 0.38939466499459513
Epoch: 5, step: 1299, loss: 0.33175185322761536, mean loss: 0.3893878994063596
Epoch: 5, step: 1300, loss: 0.37507790327072144, mean loss: 0.3893862200264587
Epoch: 5, step: 1301, loss: 0.38336968421936035, mean loss: 0.38938551402601196
Epoch: 5, step: 1302, loss: 0.3389835059642792, mean loss: 0.3893796003796361
Epoch: 5, step: 1303, loss: 0.34986844658851624, mean loss: 0.38937496509646025
Epoch: 5, step: 1304, loss: 0.3524547815322876, mean loss: 0.38937063428313895
Epoch: 5, step: 1305, loss: 0.3580031096935272, mean loss: 0.38936695523967313
Epoch: 5, step: 1306, loss: 0.35751351714134216, mean loss: 0.38936321964238235
Epoch: 5, step: 1307, loss: 0.3675083518028259, mean loss: 0.38936065692335803
Epoch: 5, step: 1308, loss: 0.38661760091781616, mean loss: 0.38936033530816216
Epoch: 5, step: 1309, loss: 0.37054333090782166, mean loss: 0.3893581293287483
Epoch: 5, step: 1310, loss: 0.3479631841182709, mean loss: 0.3893532770318065
Epoch: 5, step: 1311, loss: 0.36062556505203247, mean loss: 0.38934990997695657
Epoch: 5, step: 1312, loss: 0.4060429334640503, mean loss: 0.38935186626706403
Epoch: 5, step: 1313, loss: 0.3761480450630188, mean loss: 0.38935031906514184
Epoch: 5, step: 1314, loss: 0.2992308437824249, mean loss: 0.38933976025140044
Epoch: 5, step: 1315, loss: 0.3526785671710968, mean loss: 0.3893354653599899
Epoch: 5, step: 1316, loss: 0.33747440576553345, mean loss: 0.3893293905023591
Epoch: 5, step: 1317, loss: 0.33724522590637207, mean loss: 0.38932329022540946
Epoch: 5, step: 1318, loss: 0.36136630177497864, mean loss: 0.38932001618998957
Epoch: 5, step: 1319, loss: 0.33047154545783997, mean loss: 0.38931312526835815
Epoch: 5, step: 1320, loss: 0.36243435740470886, mean loss: 0.3893099782401573
Epoch: 5, step: 1321, loss: 0.3435589075088501, mean loss: 0.38930462222625756
Epoch: 5, step: 1322, loss: 0.3577544689178467, mean loss: 0.3893009291262566
Epoch: 5, step: 1323, loss: 0.3336869478225708, mean loss: 0.3892944199992313
Epoch: 5, step: 1324, loss: 0.40117600560188293, mean loss: 0.3892958104715078
Epoch: 5, step: 1325, loss: 0.3781609535217285, mean loss: 0.3892945075394987
Epoch: 5, step: 1326, loss: 0.38180381059646606, mean loss: 0.38929363112707993
Epoch: 5, step: 1327, loss: 0.4083894193172455, mean loss: 0.38929586507516023
Epoch: 5, step: 1328, loss: 0.36017557978630066, mean loss: 0.3892924587954446
Epoch: 5, step: 1329, loss: 0.3275683522224426, mean loss: 0.38928523960169337
Epoch: 5, step: 1330, loss: 0.33699464797973633, mean loss: 0.3892791244582456
Epoch: 5, step: 1331, loss: 0.38346344232559204, mean loss: 0.3892784444205781
Epoch: 5, step: 1332, loss: 0.3172875940799713, mean loss: 0.38927002739142563
Epoch: 5, step: 1333, loss: 0.32419559359550476, mean loss: 0.3892624199055949
Epoch: 5, step: 1334, loss: 0.32833462953567505, mean loss: 0.3892552980130911
Epoch: 5, step: 1335, loss: 0.33691370487213135, mean loss: 0.389249180482336
Epoch: 5, step: 1336, loss: 0.4108189046382904, mean loss: 0.38925170119335106
Epoch: 5, step: 1337, loss: 0.3126080632209778, mean loss: 0.3892427454048523
Epoch: 5, step: 1338, loss: 0.3414231538772583, mean loss: 0.38923715835127976
Epoch: 5, step: 1339, loss: 0.3519483506679535, mean loss: 0.3892328021821579
Epoch: 5, step: 1340, loss: 0.3305765688419342, mean loss: 0.38922595061886617
Epoch: 5, step: 1341, loss: 0.35412049293518066, mean loss: 0.38922185047197483
Epoch: 5, step: 1342, loss: 0.3503117859363556, mean loss: 0.38921730649620284
Epoch: 5, step: 1343, loss: 0.36594584584236145, mean loss: 0.38921458913741563
Epoch: 5, step: 1344, loss: 0.3461551070213318, mean loss: 0.38920956176063615
Epoch: 5, step: 1345, loss: 0.3311921954154968, mean loss: 0.3892027887783404
Epoch: 5, step: 1346, loss: 0.3123301565647125, mean loss: 0.3891938156684754
Epoch: 5, step: 1347, loss: 0.3901747763156891, mean loss: 0.38919393015968073
Epoch: 5, step: 1348, loss: 0.3421383202075958, mean loss: 0.3891884387826295
Epoch: 5, step: 1349, loss: 0.32706135511398315, mean loss: 0.38918118941464014
Epoch: 5, step: 1350, loss: 0.32879313826560974, mean loss: 0.3891741437897248
Epoch: 5, step: 1351, loss: 0.38555508852005005, mean loss: 0.38917372159475633
Epoch: 5, step: 1352, loss: 0.33474642038345337, mean loss: 0.3891673729068745
Epoch: 5, step: 1353, loss: 0.34506991505622864, mean loss: 0.3891622297464067
Epoch: 5, step: 1354, loss: 0.3405439853668213, mean loss: 0.3891565599802983
Epoch: 5, step: 1355, loss: 0.3621672987937927, mean loss: 0.3891534129115965
Epoch: 5, step: 1356, loss: 0.3274373412132263, mean loss: 0.389146217380327
Epoch: 5, step: 1357, loss: 0.351694792509079, mean loss: 0.38914185139468105
Epoch: 5, step: 1358, loss: 0.36237484216690063, mean loss: 0.3891387313329923
Epoch: 5, step: 1359, loss: 0.37683892250061035, mean loss: 0.3891372977888394
Epoch: 5, step: 1360, loss: 0.34885552525520325, mean loss: 0.38913260349067674
Epoch: 5, step: 1361, loss: 0.3523089289665222, mean loss: 0.3891283126873064
Epoch: 5, step: 1362, loss: 0.3768139183521271, mean loss: 0.3891268779448696
Epoch: 5, step: 1363, loss: 0.39840179681777954, mean loss: 0.3891279584340207
Epoch: 5, step: 1364, loss: 0.3543742299079895, mean loss: 0.3891239102419967
Epoch: 5, step: 1365, loss: 0.3242952227592468, mean loss: 0.38911635973099246
Epoch: 5, step: 1366, loss: 0.368976891040802, mean loss: 0.38911401438702015
Epoch: 5, step: 1367, loss: 0.36576807498931885, mean loss: 0.3891112959497358
Epoch: 5, step: 1368, loss: 0.35335269570350647, mean loss: 0.3891071326478094
Epoch: 5, step: 1369, loss: 0.33851906657218933, mean loss: 0.3891012434666597
Epoch: 5, step: 1370, loss: 0.34702634811401367, mean loss: 0.38909634591161923
Epoch: 5, step: 1371, loss: 0.3572675287723541, mean loss: 0.3890926414403507
Epoch: 5, step: 1372, loss: 0.367087185382843, mean loss: 0.3890900805819709
Epoch: 5, step: 1373, loss: 0.3470631241798401, mean loss: 0.38908519031476096
Epoch: 5, step: 1374, loss: 0.3924686014652252, mean loss: 0.38908558396352777
Epoch: 5, step: 1375, loss: 0.3859929144382477, mean loss: 0.3890852241834527
Epoch: 5, step: 1376, loss: 0.33170250058174133, mean loss: 0.38907854944533454
Epoch: 5, step: 1377, loss: 0.41061732172966003, mean loss: 0.38908105453631897
Epoch: 5, step: 1378, loss: 0.338077187538147, mean loss: 0.38907512316441545
Epoch: 5, step: 1379, loss: 0.33518362045288086, mean loss: 0.38906885671061175
Epoch: 5, step: 1380, loss: 0.37189143896102905, mean loss: 0.38906685956868065
Epoch: 5, step: 1381, loss: 0.3623594343662262, mean loss: 0.389063754776167
Epoch: 5, step: 1382, loss: 0.385388046503067, mean loss: 0.3890633275172721
Epoch: 5, step: 1383, loss: 0.3296842873096466, mean loss: 0.3890564261876338
Epoch: 5, step: 1384, loss: 0.3228507936000824, mean loss: 0.3890487323314354
Epoch: 5, step: 1385, loss: 0.33872994780540466, mean loss: 0.38904288538924087
Epoch: 5, step: 1386, loss: 0.3695189356803894, mean loss: 0.38904061700888665
Epoch: 5, step: 1387, loss: 0.36247336864471436, mean loss: 0.38903753066497815
Epoch: 5, step: 1388, loss: 0.3445667028427124, mean loss: 0.3890323650443692
Epoch: 5, step: 1389, loss: 0.3416822850704193, mean loss: 0.3890268656158008
Epoch: 5, step: 1390, loss: 0.3362348675727844, mean loss: 0.3890207348530505
Epoch: 5, step: 1391, loss: 0.40042349696159363, mean loss: 0.3890220589081026
Epoch: 5, step: 1392, loss: 0.3513438105583191, mean loss: 0.3890176843291696
Epoch: 5, step: 1393, loss: 0.3300021290779114, mean loss: 0.38901083320829066
Epoch: 5, step: 1394, loss: 0.33770307898521423, mean loss: 0.38900487757808483
Epoch: 5, step: 1395, loss: 0.3767569959163666, mean loss: 0.3890034560505011
Epoch: 5, step: 1396, loss: 0.3887644410133362, mean loss: 0.38900342831288504
Epoch: 5, step: 1397, loss: 0.3415164351463318, mean loss: 0.38899791810249207
Epoch: 5, step: 1398, loss: 0.3117832541465759, mean loss: 0.38898895944557643
Epoch: 5, step: 1399, loss: 0.366353839635849, mean loss: 0.3889863335616078
Epoch: 5, step: 1400, loss: 0.3936155438423157, mean loss: 0.38898687053066944
Epoch: 5, step: 1401, loss: 0.3092788755893707, mean loss: 0.388977625808454
Epoch: 5, step: 1402, loss: 0.34866389632225037, mean loss: 0.3889729506687711
Epoch: 5, step: 1403, loss: 0.3801301121711731, mean loss: 0.38897192529324953
Epoch: 5, step: 1404, loss: 0.4050028622150421, mean loss: 0.3889737839526028
Epoch: 5, step: 1405, loss: 0.38744163513183594, mean loss: 0.3889736063327534
Epoch: 5, step: 1406, loss: 0.3281789720058441, mean loss: 0.38896655931358953
Epoch: 5, step: 1407, loss: 0.3582715392112732, mean loss: 0.3889630017081071
Epoch: 5, step: 1408, loss: 0.37556594610214233, mean loss: 0.38896144914632635
Epoch: 5, step: 1409, loss: 0.3791198432445526, mean loss: 0.388960308751668
Epoch: 5, step: 1410, loss: 0.34927046298980713, mean loss: 0.38895571022939224
Epoch: 5, step: 1411, loss: 0.318706214427948, mean loss: 0.3889475719652818
Epoch: 5, step: 1412, loss: 0.37097135186195374, mean loss: 0.3889454896972286
Epoch: 5, step: 1413, loss: 0.3550989329814911, mean loss: 0.3889415695493579
Epoch: 5, step: 1414, loss: 0.3693144917488098, mean loss: 0.3889392965814597
Epoch: 5, step: 1415, loss: 0.38106587529182434, mean loss: 0.3889383848837652
Epoch: 5, step: 1416, loss: 0.3713625967502594, mean loss: 0.3889363499424507
Epoch: 5, step: 1417, loss: 0.3867223560810089, mean loss: 0.38893609363383047
Epoch: 5, step: 1418, loss: 0.3269129693508148, mean loss: 0.38892891420053
Epoch: 5, step: 1419, loss: 0.3159029185771942, mean loss: 0.3889204621177032
Epoch: 5, step: 1420, loss: 0.357097864151001, mean loss: 0.3889167793728859
Epoch: 5, step: 1421, loss: 0.3773086667060852, mean loss: 0.38891543615225793
Epoch: 5, step: 1422, loss: 0.3546998202800751, mean loss: 0.38891147738610354
Epoch: 5, step: 1423, loss: 0.32638922333717346, mean loss: 0.3889042443627291
Epoch: 5, step: 1424, loss: 0.3602707087993622, mean loss: 0.38890093221286637
Epoch: 5, step: 1425, loss: 0.3943513333797455, mean loss: 0.38890156260855996
Epoch: 5, step: 1426, loss: 0.34181082248687744, mean loss: 0.38889611670360774
Epoch: 5, step: 1427, loss: 0.43869149684906006, mean loss: 0.3889018747262888
Epoch: 5, step: 1428, loss: 0.3517632782459259, mean loss: 0.3888975807505135
Epoch: 5, step: 1429, loss: 0.3512454330921173, mean loss: 0.3888932279010732
Epoch: 5, step: 1430, loss: 0.35381239652633667, mean loss: 0.3888891727824309
Epoch: 5, step: 1431, loss: 0.3569903075695038, mean loss: 0.38888548590480576
Epoch: 5, step: 1432, loss: 0.379782110452652, mean loss: 0.388884433856331
Epoch: 5, step: 1433, loss: 0.36615416407585144, mean loss: 0.388881807294073
Epoch: 5, step: 1434, loss: 0.3453746438026428, mean loss: 0.38887678046986834
Epoch: 5, step: 1435, loss: 0.35148710012435913, mean loss: 0.38887246095966205
Epoch: 5, step: 1436, loss: 0.3634204566478729, mean loss: 0.3888695209106483
Epoch: 5, step: 1437, loss: 0.3400261104106903, mean loss: 0.38886387949109413
Epoch: 5, step: 1438, loss: 0.34478020668029785, mean loss: 0.3888587884098133
Epoch: 5, step: 1439, loss: 0.32019078731536865, mean loss: 0.3888508590794329
Epoch: 5, step: 1440, loss: 0.3345787823200226, mean loss: 0.38884459281955996
Epoch: 5, step: 1441, loss: 0.3206900358200073, mean loss: 0.3888367245954778
Epoch: 5, step: 1442, loss: 0.4219576418399811, mean loss: 0.3888405478573091
Epoch: 5, step: 1443, loss: 0.3502260744571686, mean loss: 0.38883609096979754
Valid: 5, mean loss: 0.2132987678050995
Epoch: 6, step: 0, loss: 0.3430194556713104, mean loss: 0.38883080341811854
Epoch: 6, step: 1, loss: 0.3552215099334717, mean loss: 0.38882692512438616
Epoch: 6, step: 2, loss: 0.3396000564098358, mean loss: 0.388821245319527
Epoch: 6, step: 3, loss: 0.35937005281448364, mean loss: 0.388817847627729
Epoch: 6, step: 4, loss: 0.32951924204826355, mean loss: 0.38881100732255197
Epoch: 6, step: 5, loss: 0.3509279191493988, mean loss: 0.3888066378775493
Epoch: 6, step: 6, loss: 0.33120352029800415, mean loss: 0.3887999946855784
Epoch: 6, step: 7, loss: 0.401441752910614, mean loss: 0.38880145245290143
Epoch: 6, step: 8, loss: 0.35084760189056396, mean loss: 0.3887970763603657
Epoch: 6, step: 9, loss: 0.35346636176109314, mean loss: 0.3887930031859826
Epoch: 6, step: 10, loss: 0.34090656042099, mean loss: 0.3887874831349434
Epoch: 6, step: 11, loss: 0.3690936863422394, mean loss: 0.3887852132183006
Epoch: 6, step: 12, loss: 0.318573534488678, mean loss: 0.38877712151855076
Epoch: 6, step: 13, loss: 0.3512548804283142, mean loss: 0.3887727976834401
Epoch: 6, step: 14, loss: 0.3068734109401703, mean loss: 0.38876336118306637
Epoch: 6, step: 15, loss: 0.33610591292381287, mean loss: 0.3887572946567692
Epoch: 6, step: 16, loss: 0.3428809940814972, mean loss: 0.3887520099775185
Epoch: 6, step: 17, loss: 0.3224813938140869, mean loss: 0.38874437687268515
Epoch: 6, step: 18, loss: 0.3623237609863281, mean loss: 0.388741334074587
Epoch: 6, step: 19, loss: 0.33070480823516846, mean loss: 0.38873465091868653
Epoch: 6, step: 20, loss: 0.3805333375930786, mean loss: 0.38873370661087703
Epoch: 6, step: 21, loss: 0.3634136915206909, mean loss: 0.3887307915734501
Epoch: 6, step: 22, loss: 0.3412107825279236, mean loss: 0.38872532132951715
Epoch: 6, step: 23, loss: 0.3595839738845825, mean loss: 0.3887219671228591
Epoch: 6, step: 24, loss: 0.37171903252601624, mean loss: 0.38872001028840214
Epoch: 6, step: 25, loss: 0.33343303203582764, mean loss: 0.38871364815051346
Epoch: 6, step: 26, loss: 0.3889525234699249, mean loss: 0.3887136756358799
Epoch: 6, step: 27, loss: 0.343418687582016, mean loss: 0.38870846452358654
Epoch: 6, step: 28, loss: 0.33488354086875916, mean loss: 0.38870227276888103
Epoch: 6, step: 29, loss: 0.39326465129852295, mean loss: 0.38870279754211884
Epoch: 6, step: 30, loss: 0.32414260506629944, mean loss: 0.3886953725631107
Epoch: 6, step: 31, loss: 0.3220183253288269, mean loss: 0.38868770500938093
Epoch: 6, step: 32, loss: 0.34492015838623047, mean loss: 0.38868267252155486
Epoch: 6, step: 33, loss: 0.33144399523735046, mean loss: 0.3886760918504484
Epoch: 6, step: 34, loss: 0.3393707871437073, mean loss: 0.38867042392255935
Epoch: 6, step: 35, loss: 0.3460882604122162, mean loss: 0.38866552942100646
Epoch: 6, step: 36, loss: 0.40396955609321594, mean loss: 0.38866728830236175
Epoch: 6, step: 37, loss: 0.3458153307437897, mean loss: 0.3886623639220401
Epoch: 6, step: 38, loss: 0.32555216550827026, mean loss: 0.3886551123767783
Epoch: 6, step: 39, loss: 0.32150188088417053, mean loss: 0.38864739716176305
Epoch: 6, step: 40, loss: 0.3301348388195038, mean loss: 0.3886406754434009
Epoch: 6, step: 41, loss: 0.37859031558036804, mean loss: 0.38863952102577365
Epoch: 6, step: 42, loss: 0.32694220542907715, mean loss: 0.38863243508163714
Epoch: 6, step: 43, loss: 0.3769415616989136, mean loss: 0.38863109253761063
Epoch: 6, step: 44, loss: 0.33054107427597046, mean loss: 0.38862442242413475
Epoch: 6, step: 45, loss: 0.35410207509994507, mean loss: 0.38862045889401714
Epoch: 6, step: 46, loss: 0.3543529212474823, mean loss: 0.3886165250703865
Epoch: 6, step: 47, loss: 0.34056422114372253, mean loss: 0.38861100942484855
Epoch: 6, step: 48, loss: 0.38891857862472534, mean loss: 0.38861104472488295
Epoch: 6, step: 49, loss: 0.41315650939941406, mean loss: 0.3886138615099041
Epoch: 6, step: 50, loss: 0.32114726305007935, mean loss: 0.38860612007577217
Epoch: 6, step: 51, loss: 0.34363657236099243, mean loss: 0.3886009606508393
Epoch: 6, step: 52, loss: 0.3476368486881256, mean loss: 0.3885962613148335
Epoch: 6, step: 53, loss: 0.3853221833705902, mean loss: 0.38859588576104315
Epoch: 6, step: 54, loss: 0.43067923188209534, mean loss: 0.38860071238635807
Epoch: 6, step: 55, loss: 0.34579986333847046, mean loss: 0.38859580403210947
Epoch: 6, step: 56, loss: 0.358889102935791, mean loss: 0.3885923976909678
Epoch: 6, step: 57, loss: 0.3352845311164856, mean loss: 0.3885862858053252
Epoch: 6, step: 58, loss: 0.39155709743499756, mean loss: 0.38858662637756297
Epoch: 6, step: 59, loss: 0.3727826774120331, mean loss: 0.38858481482907997
Epoch: 6, step: 60, loss: 0.3628784716129303, mean loss: 0.38858186854332455
Epoch: 6, step: 61, loss: 0.35316264629364014, mean loss: 0.38857780949883114
Epoch: 6, step: 62, loss: 0.3313405215740204, mean loss: 0.3885712508546321
Epoch: 6, step: 63, loss: 0.3656296133995056, mean loss: 0.3885686223443829
Epoch: 6, step: 64, loss: 0.3311610817909241, mean loss: 0.3885620456986556
Epoch: 6, step: 65, loss: 0.3419942259788513, mean loss: 0.38855671146959264
Epoch: 6, step: 66, loss: 0.352571576833725, mean loss: 0.3885525899331551
Epoch: 6, step: 67, loss: 0.36287128925323486, mean loss: 0.38854964887719085
Epoch: 6, step: 68, loss: 0.3812639117240906, mean loss: 0.38854881460063606
Epoch: 6, step: 69, loss: 0.3206075131893158, mean loss: 0.3885410356561191
Epoch: 6, step: 70, loss: 0.41017425060272217, mean loss: 0.3885435122691639
Epoch: 6, step: 71, loss: 0.3473399579524994, mean loss: 0.3885387957450892
Epoch: 6, step: 72, loss: 0.3419548273086548, mean loss: 0.38853346394144533
Epoch: 6, step: 73, loss: 0.32334285974502563, mean loss: 0.38852600335501863
Epoch: 6, step: 74, loss: 0.3374597132205963, mean loss: 0.38852015986146854
Epoch: 6, step: 75, loss: 0.3535025119781494, mean loss: 0.3885161532656009
Epoch: 6, step: 76, loss: 0.3436886668205261, mean loss: 0.38851102484935046
Epoch: 6, step: 77, loss: 0.33306121826171875, mean loss: 0.38850468192935644
Epoch: 6, step: 78, loss: 0.3310530185699463, mean loss: 0.38849811076804347
Epoch: 6, step: 79, loss: 0.3341853618621826, mean loss: 0.38849189933747325
Epoch: 6, step: 80, loss: 0.3894136846065521, mean loss: 0.3884920047445938
Epoch: 6, step: 81, loss: 0.3494407832622528, mean loss: 0.38848753970669275
Epoch: 6, step: 82, loss: 0.3261707127094269, mean loss: 0.38848041534096767
Epoch: 6, step: 83, loss: 0.40435224771499634, mean loss: 0.38848222967937346
Epoch: 6, step: 84, loss: 0.3173433244228363, mean loss: 0.3884740985895053
Epoch: 6, step: 85, loss: 0.34749898314476013, mean loss: 0.38846941571916876
Epoch: 6, step: 86, loss: 0.3540009558200836, mean loss: 0.3884654769167577
Epoch: 6, step: 87, loss: 0.3265097439289093, mean loss: 0.3884583978796247
Epoch: 6, step: 88, loss: 0.3664327561855316, mean loss: 0.3884558815261809
Epoch: 6, step: 89, loss: 0.31975120306015015, mean loss: 0.3884480331507564
Epoch: 6, step: 90, loss: 0.31478917598724365, mean loss: 0.3884396198032791
Epoch: 6, step: 91, loss: 0.3660300672054291, mean loss: 0.38843706046652743
Epoch: 6, step: 92, loss: 0.35306504368782043, mean loss: 0.388433021181752
Epoch: 6, step: 93, loss: 0.3739640414714813, mean loss: 0.38843136909455056
Epoch: 6, step: 94, loss: 0.3887767493724823, mean loss: 0.38843140852602426
Epoch: 6, step: 95, loss: 0.40278077125549316, mean loss: 0.38843304658113037
Epoch: 6, step: 96, loss: 0.34076428413391113, mean loss: 0.38842760556270245
Epoch: 6, step: 97, loss: 0.3501987159252167, mean loss: 0.3884232425303311
Epoch: 6, step: 98, loss: 0.4183247983455658, mean loss: 0.3884266547813656
Epoch: 6, step: 99, loss: 0.3606795072555542, mean loss: 0.3884234887444503
Epoch: 6, step: 100, loss: 0.32425498962402344, mean loss: 0.3884161677519665
Epoch: 6, step: 101, loss: 0.3474982678890228, mean loss: 0.38841149995595203
Epoch: 6, step: 102, loss: 0.2947004735469818, mean loss: 0.3884008108916873
Epoch: 6, step: 103, loss: 0.3308981955051422, mean loss: 0.3883942526554434
Epoch: 6, step: 104, loss: 0.3541580140590668, mean loss: 0.38839034842022885
Epoch: 6, step: 105, loss: 0.3491210341453552, mean loss: 0.3883858707333104
Epoch: 6, step: 106, loss: 0.37195050716400146, mean loss: 0.3883839969032375
Epoch: 6, step: 107, loss: 0.337864488363266, mean loss: 0.38837823772533736
Epoch: 6, step: 108, loss: 0.3121781647205353, mean loss: 0.38836955197667616
Epoch: 6, step: 109, loss: 0.37815988063812256, mean loss: 0.38836838834875975
Epoch: 6, step: 110, loss: 0.33454567193984985, mean loss: 0.38836225470586416
Epoch: 6, step: 111, loss: 0.3472110331058502, mean loss: 0.38835756564232726
Epoch: 6, step: 112, loss: 0.37638363242149353, mean loss: 0.38835620140247074
Epoch: 6, step: 113, loss: 0.35766762495040894, mean loss: 0.3883527053240415
Epoch: 6, step: 114, loss: 0.36270928382873535, mean loss: 0.3883497843283136
Epoch: 6, step: 115, loss: 0.34763526916503906, mean loss: 0.3883451471397984
Epoch: 6, step: 116, loss: 0.4102477729320526, mean loss: 0.3883476414600116
Epoch: 6, step: 117, loss: 0.3516448736190796, mean loss: 0.38834346214233445
Epoch: 6, step: 118, loss: 0.35354602336883545, mean loss: 0.3883395002342423
Epoch: 6, step: 119, loss: 0.3195295035839081, mean loss: 0.3883316666736036
Epoch: 6, step: 120, loss: 0.3432215750217438, mean loss: 0.38832653177415544
Epoch: 6, step: 121, loss: 0.3406941592693329, mean loss: 0.38832111037960676
Epoch: 6, step: 122, loss: 0.3434875011444092, mean loss: 0.38831600811384653
Epoch: 6, step: 123, loss: 0.35336118936538696, mean loss: 0.3883120305514036
Epoch: 6, step: 124, loss: 0.3175087571144104, mean loss: 0.3883039746550062
Epoch: 6, step: 125, loss: 0.35705938935279846, mean loss: 0.388300420094676
Epoch: 6, step: 126, loss: 0.3211989998817444, mean loss: 0.38829278712684384
Epoch: 6, step: 127, loss: 0.34961822628974915, mean loss: 0.3882883882914438
Epoch: 6, step: 128, loss: 0.3259827792644501, mean loss: 0.38828130247215265
Epoch: 6, step: 129, loss: 0.33044251799583435, mean loss: 0.38827472539863933
Epoch: 6, step: 130, loss: 0.3249467611312866, mean loss: 0.3882675249478983
Epoch: 6, step: 131, loss: 0.35565394163131714, mean loss: 0.38826381717353303
Epoch: 6, step: 132, loss: 0.36024534702301025, mean loss: 0.388260632170674
Epoch: 6, step: 133, loss: 0.34714818000793457, mean loss: 0.3882559592390802
Epoch: 6, step: 134, loss: 0.3303575813770294, mean loss: 0.38824937913021984
Epoch: 6, step: 135, loss: 0.37832188606262207, mean loss: 0.3882482510060076
Epoch: 6, step: 136, loss: 0.3453395962715149, mean loss: 0.38824337557654115
Epoch: 6, step: 137, loss: 0.352043479681015, mean loss: 0.3882392628867098
Epoch: 6, step: 138, loss: 0.36962762475013733, mean loss: 0.38823714864859366
Epoch: 6, step: 139, loss: 0.34537169337272644, mean loss: 0.3882322797872493
Epoch: 6, step: 140, loss: 0.3666858971118927, mean loss: 0.3882298327250488
Epoch: 6, step: 141, loss: 0.3350282609462738, mean loss: 0.3882237912111062
Epoch: 6, step: 142, loss: 0.3339155614376068, mean loss: 0.3882176247265174
Epoch: 6, step: 143, loss: 0.38964876532554626, mean loss: 0.3882177872084201
Epoch: 6, step: 144, loss: 0.3196403980255127, mean loss: 0.388210002285139
Epoch: 6, step: 145, loss: 0.343930721282959, mean loss: 0.3882049762600536
Epoch: 6, step: 146, loss: 0.34498241543769836, mean loss: 0.38820007073731816
Epoch: 6, step: 147, loss: 0.3429732024669647, mean loss: 0.3881949383192212
Epoch: 6, step: 148, loss: 0.3191978931427002, mean loss: 0.3881871093114853
Epoch: 6, step: 149, loss: 0.3974268436431885, mean loss: 0.3881881576135425
Epoch: 6, step: 150, loss: 0.3393925726413727, mean loss: 0.3881826220962456
Epoch: 6, step: 151, loss: 0.32469233870506287, mean loss: 0.38817542038533465
Epoch: 6, step: 152, loss: 0.3297634720802307, mean loss: 0.38816879546208355
Epoch: 6, step: 153, loss: 0.35189613699913025, mean loss: 0.38816468198301085
Epoch: 6, step: 154, loss: 0.3811470866203308, mean loss: 0.3881638862470586
Epoch: 6, step: 155, loss: 0.3885888457298279, mean loss: 0.38816393442840585
Epoch: 6, step: 156, loss: 0.3472718596458435, mean loss: 0.3881592986643448
Epoch: 6, step: 157, loss: 0.34724152088165283, mean loss: 0.3881546605122497
Epoch: 6, step: 158, loss: 0.35766974091529846, mean loss: 0.3881512053473855
Epoch: 6, step: 159, loss: 0.3077191412448883, mean loss: 0.3881420901995951
Epoch: 6, step: 160, loss: 0.36162325739860535, mean loss: 0.38813908523270546
Epoch: 6, step: 161, loss: 0.42422544956207275, mean loss: 0.3881431738758427
Epoch: 6, step: 162, loss: 0.3326454758644104, mean loss: 0.38813688660972606
Epoch: 6, step: 163, loss: 0.34722644090652466, mean loss: 0.3881322524405254
Epoch: 6, step: 164, loss: 0.35500314831733704, mean loss: 0.3881285001351541
Epoch: 6, step: 165, loss: 0.3198976218700409, mean loss: 0.38812077296887265
Epoch: 6, step: 166, loss: 0.3575995862483978, mean loss: 0.38811731682724426
Epoch: 6, step: 167, loss: 0.3886334002017975, mean loss: 0.38811737526059736
Epoch: 6, step: 168, loss: 0.3548344373703003, mean loss: 0.3881136072386467
Epoch: 6, step: 169, loss: 0.360597163438797, mean loss: 0.3881104924046191
Epoch: 6, step: 170, loss: 0.31683510541915894, mean loss: 0.3881024250150339
Epoch: 6, step: 171, loss: 0.30091145634651184, mean loss: 0.3880925573182629
Epoch: 6, step: 172, loss: 0.3437384068965912, mean loss: 0.38808753817710395
Epoch: 6, step: 173, loss: 0.38346680998802185, mean loss: 0.388087015352009
Epoch: 6, step: 174, loss: 0.3485289216041565, mean loss: 0.3880825399482588
Epoch: 6, step: 175, loss: 0.33634328842163086, mean loss: 0.38807668709175125
Epoch: 6, step: 176, loss: 0.32083895802497864, mean loss: 0.38806908187412126
Epoch: 6, step: 177, loss: 0.3848492205142975, mean loss: 0.388068717718799
Epoch: 6, step: 178, loss: 0.3859867751598358, mean loss: 0.38806848228483326
Epoch: 6, step: 179, loss: 0.330550879240036, mean loss: 0.3880619787114451
Epoch: 6, step: 180, loss: 0.3153148889541626, mean loss: 0.38805375405460424
Epoch: 6, step: 181, loss: 0.3266226649284363, mean loss: 0.38804680954984205
Epoch: 6, step: 182, loss: 0.3344675898551941, mean loss: 0.38804075334777416
Epoch: 6, step: 183, loss: 0.4133129119873047, mean loss: 0.3880436096044016
Epoch: 6, step: 184, loss: 0.35992708802223206, mean loss: 0.3880404322372887
Epoch: 6, step: 185, loss: 0.3355625569820404, mean loss: 0.38803450253387
Epoch: 6, step: 186, loss: 0.3904408812522888, mean loss: 0.38803477441034934
Epoch: 6, step: 187, loss: 0.35984960198402405, mean loss: 0.3880315903646618
Epoch: 6, step: 188, loss: 0.378708153963089, mean loss: 0.3880305372260193
Epoch: 6, step: 189, loss: 0.3792249858379364, mean loss: 0.3880295426979656
Epoch: 6, step: 190, loss: 0.3117120563983917, mean loss: 0.38802092412243766
Epoch: 6, step: 191, loss: 0.33363109827041626, mean loss: 0.38801478254318605
Epoch: 6, step: 192, loss: 0.3772728443145752, mean loss: 0.388013569724147
Epoch: 6, step: 193, loss: 0.3958931565284729, mean loss: 0.38801445926883027
Epoch: 6, step: 194, loss: 0.34124690294265747, mean loss: 0.38800918016776625
Epoch: 6, step: 195, loss: 0.342048704624176, mean loss: 0.38800399275517666
Epoch: 6, step: 196, loss: 0.41607749462127686, mean loss: 0.388007160964393
Epoch: 6, step: 197, loss: 0.4005850851535797, mean loss: 0.3880085802742767
Epoch: 6, step: 198, loss: 0.4103308320045471, mean loss: 0.38801109886298596
Epoch: 6, step: 199, loss: 0.336898535490036, mean loss: 0.38800533255394115
Epoch: 6, step: 200, loss: 0.33800092339515686, mean loss: 0.3879996918986497
Epoch: 6, step: 201, loss: 0.36149030923843384, mean loss: 0.387996701893838
Epoch: 6, step: 202, loss: 0.3527849018573761, mean loss: 0.38799273078748453
Epoch: 6, step: 203, loss: 0.32106804847717285, mean loss: 0.38798518402583476
Epoch: 6, step: 204, loss: 0.36341503262519836, mean loss: 0.38798241368516495
Epoch: 6, step: 205, loss: 0.3306029438972473, mean loss: 0.38797594474832303
Epoch: 6, step: 206, loss: 0.32480084896087646, mean loss: 0.3879688232179671
Epoch: 6, step: 207, loss: 0.3860457241535187, mean loss: 0.38796860645747744
Epoch: 6, step: 208, loss: 0.3422059714794159, mean loss: 0.3879634489419835
Epoch: 6, step: 209, loss: 0.33772850036621094, mean loss: 0.38795778802823816
Epoch: 6, step: 210, loss: 0.3354601562023163, mean loss: 0.3879518728021169
Epoch: 6, step: 211, loss: 0.3536333739757538, mean loss: 0.38794800636466464
Epoch: 6, step: 212, loss: 0.35298827290534973, mean loss: 0.38794406812725796
Epoch: 6, step: 213, loss: 0.3112131655216217, mean loss: 0.3879354253132677
Epoch: 6, step: 214, loss: 0.3178683817386627, mean loss: 0.3879275339917704
Epoch: 6, step: 215, loss: 0.3433923125267029, mean loss: 0.3879225187641279
Epoch: 6, step: 216, loss: 0.34321868419647217, mean loss: 0.38791748511537577
Epoch: 6, step: 217, loss: 0.3677343726158142, mean loss: 0.3879152127541396
Epoch: 6, step: 218, loss: 0.33043384552001953, mean loss: 0.38790874181332746
Epoch: 6, step: 219, loss: 0.34295013546943665, mean loss: 0.38790368118676916
Epoch: 6, step: 220, loss: 0.36023780703544617, mean loss: 0.3879005674136514
Epoch: 6, step: 221, loss: 0.35738223791122437, mean loss: 0.3878971329853932
Epoch: 6, step: 222, loss: 0.38845908641815186, mean loss: 0.3878971962185914
Epoch: 6, step: 223, loss: 0.3398447632789612, mean loss: 0.38789178977924177
Epoch: 6, step: 224, loss: 0.3446943163871765, mean loss: 0.38788693012423087
Epoch: 6, step: 225, loss: 0.3703666627407074, mean loss: 0.3878849593404982
Epoch: 6, step: 226, loss: 0.37246519327163696, mean loss: 0.38788322502871453
Epoch: 6, step: 227, loss: 0.3216513395309448, mean loss: 0.3878757765485641
Epoch: 6, step: 228, loss: 0.33175793290138245, mean loss: 0.3878694662096855
Epoch: 6, step: 229, loss: 0.3187217116355896, mean loss: 0.38786169155772077
Epoch: 6, step: 230, loss: 0.3507302403450012, mean loss: 0.38785751713937194
Epoch: 6, step: 231, loss: 0.3327970504760742, mean loss: 0.38785132778835313
Epoch: 6, step: 232, loss: 0.35441362857818604, mean loss: 0.3878475694766514
Epoch: 6, step: 233, loss: 0.3347705900669098, mean loss: 0.38784160443064
Epoch: 6, step: 234, loss: 0.31969690322875977, mean loss: 0.3878339468622388
Epoch: 6, step: 235, loss: 0.37218815088272095, mean loss: 0.3878321889076344
Epoch: 6, step: 236, loss: 0.38646200299263, mean loss: 0.38783203497145696
Epoch: 6, step: 237, loss: 0.33076944947242737, mean loss: 0.3878256248854652
Epoch: 6, step: 238, loss: 0.34555187821388245, mean loss: 0.38782087662682524
Epoch: 6, step: 239, loss: 0.32244256138801575, mean loss: 0.38781353404874364
Epoch: 6, step: 240, loss: 0.34994950890541077, mean loss: 0.3878092820526579
Epoch: 6, step: 241, loss: 0.34675174951553345, mean loss: 0.3878046719546861
Epoch: 6, step: 242, loss: 0.3381131589412689, mean loss: 0.3877990930265382
Epoch: 6, step: 243, loss: 0.33450591564178467, mean loss: 0.38779311040671505
Epoch: 6, step: 244, loss: 0.36928123235702515, mean loss: 0.3877910325216494
Epoch: 6, step: 245, loss: 0.3457752764225006, mean loss: 0.38778631694857435
Epoch: 6, step: 246, loss: 0.35566550493240356, mean loss: 0.38778271232372685
Epoch: 6, step: 247, loss: 0.32563936710357666, mean loss: 0.3877757393271806
Epoch: 6, step: 248, loss: 0.3636524975299835, mean loss: 0.3877730328039228
Epoch: 6, step: 249, loss: 0.432748019695282, mean loss: 0.38777807823660077
Epoch: 6, step: 250, loss: 0.3451418876647949, mean loss: 0.3877732957138221
Epoch: 6, step: 251, loss: 0.32961270213127136, mean loss: 0.3877667725427159
Epoch: 6, step: 252, loss: 0.31688326597213745, mean loss: 0.3877588232877456
Epoch: 6, step: 253, loss: 0.36749812960624695, mean loss: 0.3877565514001383
Epoch: 6, step: 254, loss: 0.3380831182003021, mean loss: 0.3877509820052286
Epoch: 6, step: 255, loss: 0.34067243337631226, mean loss: 0.38774570414103254
Epoch: 6, step: 256, loss: 0.34712401032447815, mean loss: 0.38774115064996467
Epoch: 6, step: 257, loss: 0.3241661787033081, mean loss: 0.38773402500863463
Epoch: 6, step: 258, loss: 0.3580194413661957, mean loss: 0.3877306948972772
Epoch: 6, step: 259, loss: 0.3377523720264435, mean loss: 0.3877250944576906
Epoch: 6, step: 260, loss: 0.3521283268928528, mean loss: 0.38772110602435
Epoch: 6, step: 261, loss: 0.3461184501647949, mean loss: 0.3877164451845719
Epoch: 6, step: 262, loss: 0.3191494643688202, mean loss: 0.38770876433089024
Epoch: 6, step: 263, loss: 0.3498537838459015, mean loss: 0.38770452430171404
Epoch: 6, step: 264, loss: 0.33623167872428894, mean loss: 0.3876987596197141
Epoch: 6, step: 265, loss: 0.3333633840084076, mean loss: 0.3876926750311798
Epoch: 6, step: 266, loss: 0.3509523570537567, mean loss: 0.38768856123451906
Epoch: 6, step: 267, loss: 0.40359869599342346, mean loss: 0.3876903424856116
Epoch: 6, step: 268, loss: 0.37547561526298523, mean loss: 0.38768897511437883
Epoch: 6, step: 269, loss: 0.35514187812805176, mean loss: 0.3876853320544968
Epoch: 6, step: 270, loss: 0.376100093126297, mean loss: 0.3876840354412983
Epoch: 6, step: 271, loss: 0.35727405548095703, mean loss: 0.3876806323549106
Epoch: 6, step: 272, loss: 0.341933012008667, mean loss: 0.3876755134536746
Epoch: 6, step: 273, loss: 0.37641456723213196, mean loss: 0.3876742535581475
Epoch: 6, step: 274, loss: 0.3963441252708435, mean loss: 0.3876752234509445
Epoch: 6, step: 275, loss: 0.32451963424682617, mean loss: 0.3876681590673646
Epoch: 6, step: 276, loss: 0.30345451831817627, mean loss: 0.38765874025059366
Epoch: 6, step: 277, loss: 0.3180197775363922, mean loss: 0.38765095239969743
Epoch: 6, step: 278, loss: 0.40767982602119446, mean loss: 0.3876531920143258
Epoch: 6, step: 279, loss: 0.322932630777359, mean loss: 0.3876459558156186
Epoch: 6, step: 280, loss: 0.39890167117118835, mean loss: 0.3876472141404208
Epoch: 6, step: 281, loss: 0.420267790555954, mean loss: 0.3876508605272323
Epoch: 6, step: 282, loss: 0.3526886999607086, mean loss: 0.3876469528307344
Epoch: 6, step: 283, loss: 0.37105870246887207, mean loss: 0.3876450989806716
Epoch: 6, step: 284, loss: 0.3522205948829651, mean loss: 0.38764114049323195
Epoch: 6, step: 285, loss: 0.329694002866745, mean loss: 0.387634665952715
Epoch: 6, step: 286, loss: 0.3640088438987732, mean loss: 0.38763202649097284
Epoch: 6, step: 287, loss: 0.3354583978652954, mean loss: 0.3876261983376411
Epoch: 6, step: 288, loss: 0.3163171708583832, mean loss: 0.38761823351830915
Epoch: 6, step: 289, loss: 0.35081544518470764, mean loss: 0.38761412331188366
Epoch: 6, step: 290, loss: 0.376347154378891, mean loss: 0.3876128651355651
Epoch: 6, step: 291, loss: 0.4128108620643616, mean loss: 0.3876156786680493
Epoch: 6, step: 292, loss: 0.44090932607650757, mean loss: 0.3876216286119377
Epoch: 6, step: 293, loss: 0.3299856185913086, mean loss: 0.387615194585367
Epoch: 6, step: 294, loss: 0.38839051127433777, mean loss: 0.387615281125906
Epoch: 6, step: 295, loss: 0.3273591697216034, mean loss: 0.38760855611347245
Epoch: 6, step: 296, loss: 0.33904579281806946, mean loss: 0.38760313676704955
Epoch: 6, step: 297, loss: 0.34701642394065857, mean loss: 0.3875986080108761
Epoch: 6, step: 298, loss: 0.39322105050086975, mean loss: 0.38759923530558654
Epoch: 6, step: 299, loss: 0.35305291414260864, mean loss: 0.3875953814098745
Epoch: 6, step: 300, loss: 0.3429846465587616, mean loss: 0.3875904053100584
Epoch: 6, step: 301, loss: 0.3582802712917328, mean loss: 0.38758713627882724
Epoch: 6, step: 302, loss: 0.3736683428287506, mean loss: 0.3875855840547333
Epoch: 6, step: 303, loss: 0.34347397089004517, mean loss: 0.3875806652753885
Epoch: 6, step: 304, loss: 0.3661862313747406, mean loss: 0.3875782798997724
Epoch: 6, step: 305, loss: 0.3171602487564087, mean loss: 0.3875704295061109
Epoch: 6, step: 306, loss: 0.3515702784061432, mean loss: 0.38756641655871377
Epoch: 6, step: 307, loss: 0.3517661988735199, mean loss: 0.3875624263427435
Epoch: 6, step: 308, loss: 0.3306643068790436, mean loss: 0.3875560853063606
Epoch: 6, step: 309, loss: 0.32146432995796204, mean loss: 0.38754872050188677
Epoch: 6, step: 310, loss: 0.35419586300849915, mean loss: 0.38754500430606575
Epoch: 6, step: 311, loss: 0.3358801305294037, mean loss: 0.3875392484154935
Epoch: 6, step: 312, loss: 0.3517517149448395, mean loss: 0.38753526183495757
Epoch: 6, step: 313, loss: 0.34432366490364075, mean loss: 0.38753044878116705
Epoch: 6, step: 314, loss: 0.375256210565567, mean loss: 0.3875290817872684
Epoch: 6, step: 315, loss: 0.338803231716156, mean loss: 0.38752365574605785
Epoch: 6, step: 316, loss: 0.4042493999004364, mean loss: 0.3875255180936978
Epoch: 6, step: 317, loss: 0.33509135246276855, mean loss: 0.38751968039990675
Epoch: 6, step: 318, loss: 0.3360004723072052, mean loss: 0.3875139452103161
Epoch: 6, step: 319, loss: 0.3243383467197418, mean loss: 0.38750691319801756
Epoch: 6, step: 320, loss: 0.33797112107276917, mean loss: 0.38750140003250555
Epoch: 6, step: 321, loss: 0.3239789605140686, mean loss: 0.38749433098737773
Epoch: 6, step: 322, loss: 0.36864426732063293, mean loss: 0.38749223350616413
Epoch: 6, step: 323, loss: 0.35144272446632385, mean loss: 0.3874882226573613
Epoch: 6, step: 324, loss: 0.37792062759399414, mean loss: 0.3874871582903502
Epoch: 6, step: 325, loss: 0.358844518661499, mean loss: 0.3874839722347741
Epoch: 6, step: 326, loss: 0.3673568367958069, mean loss: 0.387481733647805
Epoch: 6, step: 327, loss: 0.31840813159942627, mean loss: 0.38747405197497936
Epoch: 6, step: 328, loss: 0.35428866744041443, mean loss: 0.38747036183992606
Epoch: 6, step: 329, loss: 0.33744028210639954, mean loss: 0.3874647992337738
Epoch: 6, step: 330, loss: 0.38085150718688965, mean loss: 0.38746406401509154
Epoch: 6, step: 331, loss: 0.34671637415885925, mean loss: 0.38745953448087006
Epoch: 6, step: 332, loss: 0.34925463795661926, mean loss: 0.3874552880768994
Epoch: 6, step: 333, loss: 0.3404042422771454, mean loss: 0.3874500590209092
Epoch: 6, step: 334, loss: 0.356912225484848, mean loss: 0.38744666555124185
Epoch: 6, step: 335, loss: 0.3587310314178467, mean loss: 0.387443474925227
Epoch: 6, step: 336, loss: 0.34832802414894104, mean loss: 0.3874391292468828
Epoch: 6, step: 337, loss: 0.35051849484443665, mean loss: 0.3874350278655895
Epoch: 6, step: 338, loss: 0.3700467050075531, mean loss: 0.3874330964735137
Epoch: 6, step: 339, loss: 0.3336639404296875, mean loss: 0.38742712477692953
Epoch: 6, step: 340, loss: 0.37631872296333313, mean loss: 0.38742589119538445
Epoch: 6, step: 341, loss: 0.3538593649864197, mean loss: 0.38742216406611407
Epoch: 6, step: 342, loss: 0.31813809275627136, mean loss: 0.38741447181882754
Epoch: 6, step: 343, loss: 0.3479906916618347, mean loss: 0.3874100952890588
Epoch: 6, step: 344, loss: 0.3755396604537964, mean loss: 0.38740877766947446
Epoch: 6, step: 345, loss: 0.36976078152656555, mean loss: 0.38740681895736095
Epoch: 6, step: 346, loss: 0.354877233505249, mean loss: 0.3874032089711827
Epoch: 6, step: 347, loss: 0.3156571090221405, mean loss: 0.3873952477971981
Epoch: 6, step: 348, loss: 0.3466988503932953, mean loss: 0.38739073249736405
Epoch: 6, step: 349, loss: 0.3137739598751068, mean loss: 0.3873825655600862
Epoch: 6, step: 350, loss: 0.30980411171913147, mean loss: 0.38737396007435787
Epoch: 6, step: 351, loss: 0.3822406530380249, mean loss: 0.38737339071909654
Epoch: 6, step: 352, loss: 0.35643211007118225, mean loss: 0.38736995928063056
Epoch: 6, step: 353, loss: 0.33363762497901917, mean loss: 0.3873640009379491
Epoch: 6, step: 354, loss: 0.38183650374412537, mean loss: 0.3873633880654362
Epoch: 6, step: 355, loss: 0.3606743812561035, mean loss: 0.3873604291955017
Epoch: 6, step: 356, loss: 0.34708088636398315, mean loss: 0.38735596410927714
Epoch: 6, step: 357, loss: 0.3682660162448883, mean loss: 0.38735384817623963
Epoch: 6, step: 358, loss: 0.3490315079689026, mean loss: 0.3873496009923532
Epoch: 6, step: 359, loss: 0.3529432713985443, mean loss: 0.38734578823419785
Epoch: 6, step: 360, loss: 0.43070217967033386, mean loss: 0.38735059226648993
Epoch: 6, step: 361, loss: 0.3322427570819855, mean loss: 0.3873444868116722
Epoch: 6, step: 362, loss: 0.325050413608551, mean loss: 0.3873375859505663
Epoch: 6, step: 363, loss: 0.31300127506256104, mean loss: 0.3873293519772734
Epoch: 6, step: 364, loss: 0.29915502667427063, mean loss: 0.38731958629720886
Epoch: 6, step: 365, loss: 0.2934807240962982, mean loss: 0.3873091943966329
Epoch: 6, step: 366, loss: 0.3760155141353607, mean loss: 0.38730794385070655
Epoch: 6, step: 367, loss: 0.338983952999115, mean loss: 0.3873025935417106
Epoch: 6, step: 368, loss: 0.366928368806839, mean loss: 0.38730033800924796
Epoch: 6, step: 369, loss: 0.36927521228790283, mean loss: 0.3872983427551278
Epoch: 6, step: 370, loss: 0.3484954535961151, mean loss: 0.3872940480247284
Epoch: 6, step: 371, loss: 0.35809820890426636, mean loss: 0.3872908169668355
Epoch: 6, step: 372, loss: 0.402079313993454, mean loss: 0.3872924534055902
Epoch: 6, step: 373, loss: 0.32874226570129395, mean loss: 0.38728597518167956
Epoch: 6, step: 374, loss: 0.34551969170570374, mean loss: 0.3872813545064416
Epoch: 6, step: 375, loss: 0.39916542172431946, mean loss: 0.38728266911564707
Epoch: 6, step: 376, loss: 0.32595187425613403, mean loss: 0.3872758854860862
Epoch: 6, step: 377, loss: 0.32968947291374207, mean loss: 0.3872695167167241
Epoch: 6, step: 378, loss: 0.3700889050960541, mean loss: 0.3872676168370801
Epoch: 6, step: 379, loss: 0.35233405232429504, mean loss: 0.38726375421384784
Epoch: 6, step: 380, loss: 0.3307488262653351, mean loss: 0.38725750601838643
Epoch: 6, step: 381, loss: 0.33618786931037903, mean loss: 0.38725186046933624
Epoch: 6, step: 382, loss: 0.368525892496109, mean loss: 0.387249790615465
Epoch: 6, step: 383, loss: 0.3524424731731415, mean loss: 0.38724594365288295
Epoch: 6, step: 384, loss: 0.342712938785553, mean loss: 0.38724102233507246
Epoch: 6, step: 385, loss: 0.3395111858844757, mean loss: 0.387235748319995
Epoch: 6, step: 386, loss: 0.3328060209751129, mean loss: 0.3872297346499757
Epoch: 6, step: 387, loss: 0.3526979982852936, mean loss: 0.3872259198315527
Epoch: 6, step: 388, loss: 0.34888389706611633, mean loss: 0.3872216845479157
Epoch: 6, step: 389, loss: 0.3650643825531006, mean loss: 0.3872192373089059
Epoch: 6, step: 390, loss: 0.3930168151855469, mean loss: 0.3872198775715096
Epoch: 6, step: 391, loss: 0.338335245847702, mean loss: 0.38721447953355426
Epoch: 6, step: 392, loss: 0.34450563788414, mean loss: 0.38720976397192797
Epoch: 6, step: 393, loss: 0.33198556303977966, mean loss: 0.3872036672396546
Epoch: 6, step: 394, loss: 0.3533405065536499, mean loss: 0.3871999291713594
Epoch: 6, step: 395, loss: 0.34490180015563965, mean loss: 0.3871952605036976
Epoch: 6, step: 396, loss: 0.3693092465400696, mean loss: 0.3871932865478469
Epoch: 6, step: 397, loss: 0.3279639482498169, mean loss: 0.38718675053611684
Epoch: 6, step: 398, loss: 0.35734987258911133, mean loss: 0.38718345837260065
Epoch: 6, step: 399, loss: 0.33608970046043396, mean loss: 0.3871778213737136
Epoch: 6, step: 400, loss: 0.376604825258255, mean loss: 0.3871766550200329
Epoch: 6, step: 401, loss: 0.33703672885894775, mean loss: 0.38717112447446034
Epoch: 6, step: 402, loss: 0.4274725615978241, mean loss: 0.38717556932249425
Epoch: 6, step: 403, loss: 0.3479759693145752, mean loss: 0.38717124647291246
Epoch: 6, step: 404, loss: 0.31933072209358215, mean loss: 0.3871637659872603
Epoch: 6, step: 405, loss: 0.3282400369644165, mean loss: 0.3871572694349976
Epoch: 6, step: 406, loss: 0.36242714524269104, mean loss: 0.387154543150774
Epoch: 6, step: 407, loss: 0.3388345539569855, mean loss: 0.38714921687330556
Epoch: 6, step: 408, loss: 0.42335495352745056, mean loss: 0.3871532073656073
Epoch: 6, step: 409, loss: 0.3270426392555237, mean loss: 0.3871465828815749
Epoch: 6, step: 410, loss: 0.3354484438896179, mean loss: 0.3871408861169477
Epoch: 6, step: 411, loss: 0.3340131640434265, mean loss: 0.38713503246753456
Epoch: 6, step: 412, loss: 0.32819709181785583, mean loss: 0.38712853935960795
Epoch: 6, step: 413, loss: 0.34292173385620117, mean loss: 0.38712366969608036
Epoch: 6, step: 414, loss: 0.34881120920181274, mean loss: 0.3871194497973587
Epoch: 6, step: 415, loss: 0.4112963378429413, mean loss: 0.38712211245022715
Epoch: 6, step: 416, loss: 0.3261938691139221, mean loss: 0.3871154030301923
Epoch: 6, step: 417, loss: 0.3250064551830292, mean loss: 0.3871085643440167
Epoch: 6, step: 418, loss: 0.30235108733177185, mean loss: 0.3870992329031918
Epoch: 6, step: 419, loss: 0.33515211939811707, mean loss: 0.3870935143746245
Epoch: 6, step: 420, loss: 0.33681902289390564, mean loss: 0.3870879805835975
Epoch: 6, step: 421, loss: 0.35255682468414307, mean loss: 0.38708418010418966
Epoch: 6, step: 422, loss: 0.33880674839019775, mean loss: 0.38707886730219626
Epoch: 6, step: 423, loss: 0.34752127528190613, mean loss: 0.38707451457420106
Epoch: 6, step: 424, loss: 0.33524128794670105, mean loss: 0.387068811721673
Epoch: 6, step: 425, loss: 0.36136290431022644, mean loss: 0.3870659837890645
Epoch: 6, step: 426, loss: 0.3447105586528778, mean loss: 0.38706132473889
Epoch: 6, step: 427, loss: 0.3509961664676666, mean loss: 0.38705735804748315
Epoch: 6, step: 428, loss: 0.3471102714538574, mean loss: 0.38705296487838675
Epoch: 6, step: 429, loss: 0.34045305848121643, mean loss: 0.3870478406309272
Epoch: 6, step: 430, loss: 0.3832705616950989, mean loss: 0.38704742531713543
Epoch: 6, step: 431, loss: 0.3606983721256256, mean loss: 0.3870445285434776
Epoch: 6, step: 432, loss: 0.37675148248672485, mean loss: 0.3870433970665009
Epoch: 6, step: 433, loss: 0.3440956771373749, mean loss: 0.3870386764993511
Epoch: 6, step: 434, loss: 0.31127339601516724, mean loss: 0.38703034972932315
Epoch: 6, step: 435, loss: 0.35606011748313904, mean loss: 0.3870269464070983
Epoch: 6, step: 436, loss: 0.34602591395378113, mean loss: 0.3870224412942037
Epoch: 6, step: 437, loss: 0.35354673862457275, mean loss: 0.38701876345387526
Epoch: 6, step: 438, loss: 0.3755374252796173, mean loss: 0.3870175021841648
Epoch: 6, step: 439, loss: 0.3848479688167572, mean loss: 0.3870172638786543
Epoch: 6, step: 440, loss: 0.3433161675930023, mean loss: 0.3870124641975686
Epoch: 6, step: 441, loss: 0.3661203384399414, mean loss: 0.3870101698723152
Epoch: 6, step: 442, loss: 0.33740341663360596, mean loss: 0.38700472277082854
Epoch: 6, step: 443, loss: 0.35379263758659363, mean loss: 0.3870010762968294
Epoch: 6, step: 444, loss: 0.3747574985027313, mean loss: 0.3869997321780684
Epoch: 6, step: 445, loss: 0.34444326162338257, mean loss: 0.3869950607762512
Epoch: 6, step: 446, loss: 0.34291693568229675, mean loss: 0.3869902228742543
Epoch: 6, step: 447, loss: 0.3190903961658478, mean loss: 0.38698277118124413
Epoch: 6, step: 448, loss: 0.3451422154903412, mean loss: 0.38697817987698746
Epoch: 6, step: 449, loss: 0.3141144812107086, mean loss: 0.386970185176673
Epoch: 6, step: 450, loss: 0.3748219609260559, mean loss: 0.38696885240385337
Epoch: 6, step: 451, loss: 0.36727291345596313, mean loss: 0.38696669181379767
Epoch: 6, step: 452, loss: 0.34382614493370056, mean loss: 0.3869619599341355
Epoch: 6, step: 453, loss: 0.3763207793235779, mean loss: 0.38696079288208346
Epoch: 6, step: 454, loss: 0.34287339448928833, mean loss: 0.386955958207405
Epoch: 6, step: 455, loss: 0.32588452100753784, mean loss: 0.3869492617778875
Epoch: 6, step: 456, loss: 0.351952463388443, mean loss: 0.386945424830361
Epoch: 6, step: 457, loss: 0.3562917411327362, mean loss: 0.3869420644177653
Epoch: 6, step: 458, loss: 0.3225391209125519, mean loss: 0.38693500501367617
Epoch: 6, step: 459, loss: 0.39211106300354004, mean loss: 0.38693557231507797
Epoch: 6, step: 460, loss: 0.3137646019458771, mean loss: 0.38692755357859915
Epoch: 6, step: 461, loss: 0.327852725982666, mean loss: 0.3869210803342866
Epoch: 6, step: 462, loss: 0.3386446535587311, mean loss: 0.3869157909262911
Epoch: 6, step: 463, loss: 0.3449254035949707, mean loss: 0.38691119075239416
Epoch: 6, step: 464, loss: 0.3306030333042145, mean loss: 0.38690502269921767
Epoch: 6, step: 465, loss: 0.3426443040370941, mean loss: 0.3869001748658483
Epoch: 6, step: 466, loss: 0.3253501355648041, mean loss: 0.38689343408835397
Epoch: 6, step: 467, loss: 0.33230170607566833, mean loss: 0.3868874560191454
Epoch: 6, step: 468, loss: 0.3905407190322876, mean loss: 0.3868878560260449
Epoch: 6, step: 469, loss: 0.3606721758842468, mean loss: 0.3868849859056002
Epoch: 6, step: 470, loss: 0.39092910289764404, mean loss: 0.38688542861134645
Epoch: 6, step: 471, loss: 0.36628153920173645, mean loss: 0.3868831733695109
Epoch: 6, step: 472, loss: 0.36121639609336853, mean loss: 0.38688036426616446
Epoch: 6, step: 473, loss: 0.3364194631576538, mean loss: 0.3868748421714929
Epoch: 6, step: 474, loss: 0.3358083665370941, mean loss: 0.3868692544183871
Epoch: 6, step: 475, loss: 0.3547009825706482, mean loss: 0.38686573491380855
Epoch: 6, step: 476, loss: 0.3408510684967041, mean loss: 0.38686070103716297
Epoch: 6, step: 477, loss: 0.34265848994255066, mean loss: 0.3868558659670367
Epoch: 6, step: 478, loss: 0.34061118960380554, mean loss: 0.38685080803458965
Epoch: 6, step: 479, loss: 0.3345121741294861, mean loss: 0.3868450842119841
Epoch: 6, step: 480, loss: 0.34058326482772827, mean loss: 0.38684002551112195
Epoch: 6, step: 481, loss: 0.32516562938690186, mean loss: 0.3868332821920618
Epoch: 6, step: 482, loss: 0.34957975149154663, mean loss: 0.38682920943261057
Epoch: 6, step: 483, loss: 0.34627240896224976, mean loss: 0.3868247760263501
Epoch: 6, step: 484, loss: 0.3597217798233032, mean loss: 0.3868218136265028
Epoch: 6, step: 485, loss: 0.28950753808021545, mean loss: 0.3868111781865524
Epoch: 6, step: 486, loss: 0.3793531060218811, mean loss: 0.3868103631857695
Epoch: 6, step: 487, loss: 0.3516899347305298, mean loss: 0.3868065257263666
Epoch: 6, step: 488, loss: 0.35271507501602173, mean loss: 0.38680280110594595
Epoch: 6, step: 489, loss: 0.3339010775089264, mean loss: 0.38679702202318467
Epoch: 6, step: 490, loss: 0.3356635570526123, mean loss: 0.38679143671843635
Epoch: 6, step: 491, loss: 0.39657559990882874, mean loss: 0.3867925053251631
Epoch: 6, step: 492, loss: 0.37355539202690125, mean loss: 0.3867910597520171
Epoch: 6, step: 493, loss: 0.37496986985206604, mean loss: 0.3867897689472672
Epoch: 6, step: 494, loss: 0.32363778352737427, mean loss: 0.38678287387297744
Epoch: 6, step: 495, loss: 0.3256041407585144, mean loss: 0.3867761949719824
Epoch: 6, step: 496, loss: 0.31268712878227234, mean loss: 0.3867681075288878
Epoch: 6, step: 497, loss: 0.3706957995891571, mean loss: 0.38676635329313797
Epoch: 6, step: 498, loss: 0.35626021027565, mean loss: 0.3867630240185535
Epoch: 6, step: 499, loss: 0.3534144461154938, mean loss: 0.38675938493323014
Epoch: 6, step: 500, loss: 0.31940436363220215, mean loss: 0.3867520357765143
Epoch: 6, step: 501, loss: 0.38097551465034485, mean loss: 0.3867514055647397
Epoch: 6, step: 502, loss: 0.32586634159088135, mean loss: 0.38674476379927947
Epoch: 6, step: 503, loss: 0.3729284107685089, mean loss: 0.38674325677996985
Epoch: 6, step: 504, loss: 0.4175790846347809, mean loss: 0.3867466198324134
Epoch: 6, step: 505, loss: 0.3572658598423004, mean loss: 0.38674340491856496
Epoch: 6, step: 506, loss: 0.40164273977279663, mean loss: 0.38674502953254974
Epoch: 6, step: 507, loss: 0.3726947605609894, mean loss: 0.3867434976672018
Epoch: 6, step: 508, loss: 0.33653542399406433, mean loss: 0.38673802420446624
Epoch: 6, step: 509, loss: 0.34454482793807983, mean loss: 0.38673342498969987
Epoch: 6, step: 510, loss: 0.32939308881759644, mean loss: 0.3867271753617792
Epoch: 6, step: 511, loss: 0.3492186367511749, mean loss: 0.3867230876832035
Epoch: 6, step: 512, loss: 0.3862733244895935, mean loss: 0.38672303867337526
Epoch: 6, step: 513, loss: 0.3685203492641449, mean loss: 0.3867210553775146
Epoch: 6, step: 514, loss: 0.38118046522140503, mean loss: 0.38672045176163533
Epoch: 6, step: 515, loss: 0.4399276375770569, mean loss: 0.3867262477513756
Epoch: 6, step: 516, loss: 0.36735090613365173, mean loss: 0.38672413737760175
Epoch: 6, step: 517, loss: 0.4157598912715912, mean loss: 0.38672729962481306
Epoch: 6, step: 518, loss: 0.3312602639198303, mean loss: 0.38672125943797814
Epoch: 6, step: 519, loss: 0.3140636384487152, mean loss: 0.3867133481116509
Epoch: 6, step: 520, loss: 0.32279086112976074, mean loss: 0.38670638866832135
Epoch: 6, step: 521, loss: 0.31826260685920715, mean loss: 0.38669893778852504
Epoch: 6, step: 522, loss: 0.3522533178329468, mean loss: 0.38669518840135236
Epoch: 6, step: 523, loss: 0.35794612765312195, mean loss: 0.3866920594221677
Epoch: 6, step: 524, loss: 0.41022413969039917, mean loss: 0.38669462031892127
Epoch: 6, step: 525, loss: 0.35425835847854614, mean loss: 0.3866910908018549
Epoch: 6, step: 526, loss: 0.35831737518310547, mean loss: 0.38668800368232287
Epoch: 6, step: 527, loss: 0.34317269921302795, mean loss: 0.3866832696413667
Epoch: 6, step: 528, loss: 0.38257893919944763, mean loss: 0.38668282317879277
Epoch: 6, step: 529, loss: 0.36760446429252625, mean loss: 0.386680748090813
Epoch: 6, step: 530, loss: 0.3457142114639282, mean loss: 0.3866762927850352
Epoch: 6, step: 531, loss: 0.3722003698348999, mean loss: 0.3866747186307344
Epoch: 6, step: 532, loss: 0.3493626117706299, mean loss: 0.3866706616440148
Epoch: 6, step: 533, loss: 0.3114018738269806, mean loss: 0.38666247847508495
Epoch: 6, step: 534, loss: 0.34412682056427, mean loss: 0.3866578545314051
Epoch: 6, step: 535, loss: 0.37160107493400574, mean loss: 0.38665621792492716
Epoch: 6, step: 536, loss: 0.3392177224159241, mean loss: 0.38665106212713246
Epoch: 6, step: 537, loss: 0.3668159246444702, mean loss: 0.3866489066025201
Epoch: 6, step: 538, loss: 0.36407268047332764, mean loss: 0.38664645346483356
Epoch: 6, step: 539, loss: 0.35876893997192383, mean loss: 0.38664342461721374
Epoch: 6, step: 540, loss: 0.3584080934524536, mean loss: 0.3866403572265386
Epoch: 6, step: 541, loss: 0.31440019607543945, mean loss: 0.38663251015276595
Epoch: 6, step: 542, loss: 0.39968109130859375, mean loss: 0.3866339273984655
Epoch: 6, step: 543, loss: 0.3574198782444, mean loss: 0.3866307547171934
Epoch: 6, step: 544, loss: 0.32009974122047424, mean loss: 0.3866235301528002
Epoch: 6, step: 545, loss: 0.3488257825374603, mean loss: 0.3866194261628311
Epoch: 6, step: 546, loss: 0.35173580050468445, mean loss: 0.38661563899252843
Epoch: 6, step: 547, loss: 0.3471912443637848, mean loss: 0.3866113593144315
Epoch: 6, step: 548, loss: 0.3348678648471832, mean loss: 0.3866057429577109
Epoch: 6, step: 549, loss: 0.30560895800590515, mean loss: 0.38659695233637903
Epoch: 6, step: 550, loss: 0.3306548297405243, mean loss: 0.38659088156887
Epoch: 6, step: 551, loss: 0.3356699049472809, mean loss: 0.3865853562892887
Epoch: 6, step: 552, loss: 0.3422139883041382, mean loss: 0.3865805422100888
Epoch: 6, step: 553, loss: 0.33512982726097107, mean loss: 0.38657496066149377
Epoch: 6, step: 554, loss: 0.31696152687072754, mean loss: 0.3865674095785357
Epoch: 6, step: 555, loss: 0.3868500292301178, mean loss: 0.3865674402314263
Epoch: 6, step: 556, loss: 0.35365796089172363, mean loss: 0.38656387126067043
Epoch: 6, step: 557, loss: 0.34713584184646606, mean loss: 0.3865595958291573
Epoch: 6, step: 558, loss: 0.37106654047966003, mean loss: 0.38655791600097233
Epoch: 6, step: 559, loss: 0.356080025434494, mean loss: 0.3865546118064183
Epoch: 6, step: 560, loss: 0.37516435980796814, mean loss: 0.38655337709075455
Epoch: 6, step: 561, loss: 0.3471660315990448, mean loss: 0.3865491079225894
Epoch: 6, step: 562, loss: 0.3310514986515045, mean loss: 0.3865430932255838
Epoch: 6, step: 563, loss: 0.3506140410900116, mean loss: 0.3865391997435578
Epoch: 6, step: 564, loss: 0.37069880962371826, mean loss: 0.3865374833723237
Epoch: 6, step: 565, loss: 0.31759971380233765, mean loss: 0.3865300144915469
Epoch: 6, step: 566, loss: 0.4030849039554596, mean loss: 0.38653180789307046
Epoch: 6, step: 567, loss: 0.35985884070396423, mean loss: 0.3865289187068498
Epoch: 6, step: 568, loss: 0.36016151309013367, mean loss: 0.3865260629280545
Epoch: 6, step: 569, loss: 0.3628706634044647, mean loss: 0.3865235011563929
Epoch: 6, step: 570, loss: 0.38184812664985657, mean loss: 0.386522994889527
Epoch: 6, step: 571, loss: 0.37407439947128296, mean loss: 0.38652164705546266
Epoch: 6, step: 572, loss: 0.3311096131801605, mean loss: 0.38651564813439787
Epoch: 6, step: 573, loss: 0.4262765049934387, mean loss: 0.3865199521890481
Epoch: 6, step: 574, loss: 0.3410491943359375, mean loss: 0.38651503057871656
Epoch: 6, step: 575, loss: 0.36305636167526245, mean loss: 0.3865124917617357
Epoch: 6, step: 576, loss: 0.3785490393638611, mean loss: 0.38651163000950134
Epoch: 6, step: 577, loss: 0.31261146068573, mean loss: 0.386503633886441
Epoch: 6, step: 578, loss: 0.3650452494621277, mean loss: 0.3865013123042248
Epoch: 6, step: 579, loss: 0.33371853828430176, mean loss: 0.3864956023546337
Epoch: 6, step: 580, loss: 0.3355877995491028, mean loss: 0.38649009583188565
Epoch: 6, step: 581, loss: 0.34800785779953003, mean loss: 0.38648593379013435
Epoch: 6, step: 582, loss: 0.32784050703048706, mean loss: 0.3864795916870999
Epoch: 6, step: 583, loss: 0.33666399121284485, mean loss: 0.3864742050521005
Epoch: 6, step: 584, loss: 0.359089732170105, mean loss: 0.3864712442484588
Epoch: 6, step: 585, loss: 0.37582725286483765, mean loss: 0.3864700935466876
Epoch: 6, step: 586, loss: 0.3199332058429718, mean loss: 0.3864629011471952
Epoch: 6, step: 587, loss: 0.348955363035202, mean loss: 0.38645884715474904
Epoch: 6, step: 588, loss: 0.34569257497787476, mean loss: 0.38645444141907664
Epoch: 6, step: 589, loss: 0.31924834847450256, mean loss: 0.38644717903600506
Epoch: 6, step: 590, loss: 0.3838108479976654, mean loss: 0.38644689418121975
Epoch: 6, step: 591, loss: 0.35046571493148804, mean loss: 0.38644300684551863
Epoch: 6, step: 592, loss: 0.3439387083053589, mean loss: 0.38643841526092965
Epoch: 6, step: 593, loss: 0.3502498269081116, mean loss: 0.38643450636177723
Epoch: 6, step: 594, loss: 0.3141755163669586, mean loss: 0.3864267021723405
Epoch: 6, step: 595, loss: 0.3524423837661743, mean loss: 0.38642303215955365
Epoch: 6, step: 596, loss: 0.31981319189071655, mean loss: 0.3864158396489966
Epoch: 6, step: 597, loss: 0.3510158956050873, mean loss: 0.3864120175863704
Epoch: 6, step: 598, loss: 0.3419215679168701, mean loss: 0.38640721455822946
Epoch: 6, step: 599, loss: 0.34450915455818176, mean loss: 0.386402691883359
Epoch: 6, step: 600, loss: 0.3555714786052704, mean loss: 0.38639936417550386
Epoch: 6, step: 601, loss: 0.3604886531829834, mean loss: 0.3863965678544384
Epoch: 6, step: 602, loss: 0.34495750069618225, mean loss: 0.38639209617351056
Epoch: 6, step: 603, loss: 0.30789923667907715, mean loss: 0.38638362693964196
Epoch: 6, step: 604, loss: 0.32952043414115906, mean loss: 0.38637749216859885
Epoch: 6, step: 605, loss: 0.37429359555244446, mean loss: 0.3863761886198808
Epoch: 6, step: 606, loss: 0.3380489647388458, mean loss: 0.38637097588944386
Epoch: 6, step: 607, loss: 0.3327854871749878, mean loss: 0.38636519660895263
Epoch: 6, step: 608, loss: 0.3412010073661804, mean loss: 0.38636032610434323
Epoch: 6, step: 609, loss: 0.33955925703048706, mean loss: 0.38635527962288174
Epoch: 6, step: 610, loss: 0.33171552419662476, mean loss: 0.3863493885441296
Epoch: 6, step: 611, loss: 0.3546479046344757, mean loss: 0.3863459709628543
Epoch: 6, step: 612, loss: 0.3450529873371124, mean loss: 0.3863415198489569
Epoch: 6, step: 613, loss: 0.3343854248523712, mean loss: 0.3863359199249435
Epoch: 6, step: 614, loss: 0.3331720232963562, mean loss: 0.38633019043937084
Epoch: 6, step: 615, loss: 0.3132282495498657, mean loss: 0.3863223130750508
Epoch: 6, step: 616, loss: 0.34326714277267456, mean loss: 0.3863176740091848
Epoch: 6, step: 617, loss: 0.33220991492271423, mean loss: 0.38631184468801627
Epoch: 6, step: 618, loss: 0.37638768553733826, mean loss: 0.3863107756199186
Epoch: 6, step: 619, loss: 0.3728444278240204, mean loss: 0.38630932513006555
Epoch: 6, step: 620, loss: 0.33788445591926575, mean loss: 0.3863041097429669
Epoch: 6, step: 621, loss: 0.36077138781547546, mean loss: 0.38630136014982375
Epoch: 6, step: 622, loss: 0.36900198459625244, mean loss: 0.38629949739806824
Epoch: 6, step: 623, loss: 0.40763524174690247, mean loss: 0.3863017945281661
Epoch: 6, step: 624, loss: 0.362804651260376, mean loss: 0.3862992649616608
Epoch: 6, step: 625, loss: 0.37083956599235535, mean loss: 0.3862976008390591
Epoch: 6, step: 626, loss: 0.3433396518230438, mean loss: 0.3862929772302962
Epoch: 6, step: 627, loss: 0.3940056264400482, mean loss: 0.3862938072614208
Epoch: 6, step: 628, loss: 0.3790391981601715, mean loss: 0.3862930266083377
Epoch: 6, step: 629, loss: 0.3029673993587494, mean loss: 0.38628406107925983
Epoch: 6, step: 630, loss: 0.3364069163799286, mean loss: 0.38627869506046486
Epoch: 6, step: 631, loss: 0.357393354177475, mean loss: 0.38627558777336474
Epoch: 6, step: 632, loss: 0.3575541079044342, mean loss: 0.3862724984456387
Epoch: 6, step: 633, loss: 0.3299185335636139, mean loss: 0.38626643757610957
Epoch: 6, step: 634, loss: 0.37792590260505676, mean loss: 0.3862655406479484
Epoch: 6, step: 635, loss: 0.3417927622795105, mean loss: 0.38626075862876896
Epoch: 6, step: 636, loss: 0.35522183775901794, mean loss: 0.38625742146923026
Epoch: 6, step: 637, loss: 0.3449912965297699, mean loss: 0.38625298520553003
Epoch: 6, step: 638, loss: 0.36281004548072815, mean loss: 0.3862504652722048
Epoch: 6, step: 639, loss: 0.39972561597824097, mean loss: 0.38625191359020844
Epoch: 6, step: 640, loss: 0.3886184096336365, mean loss: 0.3862521679154146
Epoch: 6, step: 641, loss: 0.34094348549842834, mean loss: 0.38624729915521505
Epoch: 6, step: 642, loss: 0.3519870340824127, mean loss: 0.38624361802648693
Epoch: 6, step: 643, loss: 0.3479636609554291, mean loss: 0.3862395054397797
Epoch: 6, step: 644, loss: 0.3491578698158264, mean loss: 0.38623552202205236
Epoch: 6, step: 645, loss: 0.341447114944458, mean loss: 0.38623071123718905
Epoch: 6, step: 646, loss: 0.32352495193481445, mean loss: 0.3862239766480684
Epoch: 6, step: 647, loss: 0.4065006375312805, mean loss: 0.3862261541245378
Epoch: 6, step: 648, loss: 0.3264997601509094, mean loss: 0.38621974089636496
Epoch: 6, step: 649, loss: 0.37165966629981995, mean loss: 0.38621817765021976
Epoch: 6, step: 650, loss: 0.32418006658554077, mean loss: 0.3862115176275612
Epoch: 6, step: 651, loss: 0.34348976612091064, mean loss: 0.38620693178046944
Epoch: 6, step: 652, loss: 0.35603058338165283, mean loss: 0.38620369293229956
Epoch: 6, step: 653, loss: 0.3334682583808899, mean loss: 0.3861980334093814
Epoch: 6, step: 654, loss: 0.34157735109329224, mean loss: 0.38619324526877447
Epoch: 6, step: 655, loss: 0.32307830452919006, mean loss: 0.38618647327942474
Epoch: 6, step: 656, loss: 0.37420833110809326, mean loss: 0.38618518820892034
Epoch: 6, step: 657, loss: 0.31934353709220886, mean loss: 0.38617801789663575
Epoch: 6, step: 658, loss: 0.3841831684112549, mean loss: 0.3861778039258661
Epoch: 6, step: 659, loss: 0.3873527944087982, mean loss: 0.3861779299437214
Epoch: 6, step: 660, loss: 0.3059523105621338, mean loss: 0.3861693266601416
Epoch: 6, step: 661, loss: 0.32835328578948975, mean loss: 0.3861631272133401
Epoch: 6, step: 662, loss: 0.32435864210128784, mean loss: 0.38615650080773145
Epoch: 6, step: 663, loss: 0.3729763329029083, mean loss: 0.38615508783947405
Epoch: 6, step: 664, loss: 0.3534274995326996, mean loss: 0.3861515796833687
Epoch: 6, step: 665, loss: 0.36883682012557983, mean loss: 0.3861497238677677
Epoch: 6, step: 666, loss: 0.35491374135017395, mean loss: 0.38614637631846777
Epoch: 6, step: 667, loss: 0.361826092004776, mean loss: 0.38614377020141744
Epoch: 6, step: 668, loss: 0.33292150497436523, mean loss: 0.3861380676121935
Epoch: 6, step: 669, loss: 0.36671939492225647, mean loss: 0.3861359871887212
Epoch: 6, step: 670, loss: 0.357959508895874, mean loss: 0.38613296881932724
Epoch: 6, step: 671, loss: 0.39899370074272156, mean loss: 0.38613434636130706
Epoch: 6, step: 672, loss: 0.3511838912963867, mean loss: 0.3861306031402441
Epoch: 6, step: 673, loss: 0.34090757369995117, mean loss: 0.3861257602371128
Epoch: 6, step: 674, loss: 0.34349700808525085, mean loss: 0.38612119564217207
Epoch: 6, step: 675, loss: 0.32395297288894653, mean loss: 0.386114539515539
Epoch: 6, step: 676, loss: 0.30665722489356995, mean loss: 0.3861060332191444
Epoch: 6, step: 677, loss: 0.3391458988189697, mean loss: 0.38610100644389284
Epoch: 6, step: 678, loss: 0.3301861882209778, mean loss: 0.3860950217689252
Epoch: 6, step: 679, loss: 0.35895225405693054, mean loss: 0.3860921169350519
Epoch: 6, step: 680, loss: 0.34026819467544556, mean loss: 0.3860872133585661
Epoch: 6, step: 681, loss: 0.29641297459602356, mean loss: 0.38607761842610705
Epoch: 6, step: 682, loss: 0.35537564754486084, mean loss: 0.3860743337389474
Epoch: 6, step: 683, loss: 0.3711036443710327, mean loss: 0.38607273225313565
Epoch: 6, step: 684, loss: 0.3994588851928711, mean loss: 0.3860741640803835
Epoch: 6, step: 685, loss: 0.3322693705558777, mean loss: 0.3860684095570119
Epoch: 6, step: 686, loss: 0.33590346574783325, mean loss: 0.3860630448961404
Epoch: 6, step: 687, loss: 0.3556504249572754, mean loss: 0.386059792905129
Epoch: 6, step: 688, loss: 0.3507075309753418, mean loss: 0.3860560131273112
Epoch: 6, step: 689, loss: 0.3554781377315521, mean loss: 0.38605274416479296
Epoch: 6, step: 690, loss: 0.3388028144836426, mean loss: 0.38604769339732303
Epoch: 6, step: 691, loss: 0.32887452840805054, mean loss: 0.3860415825417235
Epoch: 6, step: 692, loss: 0.3118648827075958, mean loss: 0.38603365513979615
Epoch: 6, step: 693, loss: 0.3309206962585449, mean loss: 0.3860277657447458
Epoch: 6, step: 694, loss: 0.3440760374069214, mean loss: 0.38602328324358776
Epoch: 6, step: 695, loss: 0.31365835666656494, mean loss: 0.3860155519480133
Epoch: 6, step: 696, loss: 0.3202913701534271, mean loss: 0.3860085308838327
Epoch: 6, step: 697, loss: 0.3119739592075348, mean loss: 0.3860006228971123
Epoch: 6, step: 698, loss: 0.4144347608089447, mean loss: 0.38600365975900613
Epoch: 6, step: 699, loss: 0.3576110005378723, mean loss: 0.38600062765101584
Epoch: 6, step: 700, loss: 0.34270986914634705, mean loss: 0.38599600503932285
Epoch: 6, step: 701, loss: 0.32937246561050415, mean loss: 0.385989959391295
Epoch: 6, step: 702, loss: 0.36116573214530945, mean loss: 0.38598730921223595
Epoch: 6, step: 703, loss: 0.31693369150161743, mean loss: 0.3859799379891669
Epoch: 6, step: 704, loss: 0.37431859970092773, mean loss: 0.3859786933164923
Epoch: 6, step: 705, loss: 0.3020867109298706, mean loss: 0.3859697400633027
Epoch: 6, step: 706, loss: 0.3730763792991638, mean loss: 0.3859683641844462
Epoch: 6, step: 707, loss: 0.3513229191303253, mean loss: 0.385964667487364
Epoch: 6, step: 708, loss: 0.3260519802570343, mean loss: 0.3859582754370887
Epoch: 6, step: 709, loss: 0.33763694763183594, mean loss: 0.3859531206122748
Epoch: 6, step: 710, loss: 0.35067012906074524, mean loss: 0.385949357093176
Epoch: 6, step: 711, loss: 0.30492180585861206, mean loss: 0.3859407150761928
Epoch: 6, step: 712, loss: 0.33319181203842163, mean loss: 0.38593508972661006
Epoch: 6, step: 713, loss: 0.3325810730457306, mean loss: 0.3859294004520653
Epoch: 6, step: 714, loss: 0.35672256350517273, mean loss: 0.385926286384793
Epoch: 6, step: 715, loss: 0.3239777088165283, mean loss: 0.3859196820588262
Epoch: 6, step: 716, loss: 0.3663334846496582, mean loss: 0.3859175942006651
Epoch: 6, step: 717, loss: 0.368659645318985, mean loss: 0.38591575472625866
Epoch: 6, step: 718, loss: 0.3345874845981598, mean loss: 0.38591028437880814
Epoch: 6, step: 719, loss: 0.3118230402469635, mean loss: 0.3859023893186918
Epoch: 6, step: 720, loss: 0.38682231307029724, mean loss: 0.38590248733933663
Epoch: 6, step: 721, loss: 0.35383281111717224, mean loss: 0.3858990705828672
Epoch: 6, step: 722, loss: 0.323500394821167, mean loss: 0.3858924232327275
Epoch: 6, step: 723, loss: 0.3918617069721222, mean loss: 0.38589305907462557
Epoch: 6, step: 724, loss: 0.3343065083026886, mean loss: 0.38588756471412156
Epoch: 6, step: 725, loss: 0.33300691843032837, mean loss: 0.38588193312239805
Epoch: 6, step: 726, loss: 0.34483370184898376, mean loss: 0.3858775621042665
Epoch: 6, step: 727, loss: 0.3997478187084198, mean loss: 0.3858790389203444
Epoch: 6, step: 728, loss: 0.3399287462234497, mean loss: 0.38587414694837624
Epoch: 6, step: 729, loss: 0.348375529050827, mean loss: 0.3858701551857727
Epoch: 6, step: 730, loss: 0.4000324010848999, mean loss: 0.385871662609498
Epoch: 6, step: 731, loss: 0.3402848243713379, mean loss: 0.38586681088129043
Epoch: 6, step: 732, loss: 0.31942465901374817, mean loss: 0.38585974031069686
Epoch: 6, step: 733, loss: 0.39690056443214417, mean loss: 0.38586091511641313
Epoch: 6, step: 734, loss: 0.32591766119003296, mean loss: 0.3858545374960358
Epoch: 6, step: 735, loss: 0.3033945560455322, mean loss: 0.3858457651575836
Epoch: 6, step: 736, loss: 0.3855647146701813, mean loss: 0.385845735261776
Epoch: 6, step: 737, loss: 0.32631513476371765, mean loss: 0.38583940356633906
Epoch: 6, step: 738, loss: 0.38566020131111145, mean loss: 0.3858393845083517
Epoch: 6, step: 739, loss: 0.36252403259277344, mean loss: 0.3858369052067869
Epoch: 6, step: 740, loss: 0.35559311509132385, mean loss: 0.3858336894927927
Epoch: 6, step: 741, loss: 0.34259453415870667, mean loss: 0.3858290925168907
Epoch: 6, step: 742, loss: 0.3457610011100769, mean loss: 0.385824833125862
Epoch: 6, step: 743, loss: 0.37594074010849, mean loss: 0.3858237825207369
Epoch: 6, step: 744, loss: 0.31322357058525085, mean loss: 0.38581606648163225
Epoch: 6, step: 745, loss: 0.32159554958343506, mean loss: 0.38580924177207876
Epoch: 6, step: 746, loss: 0.3381659984588623, mean loss: 0.38580417926614813
Epoch: 6, step: 747, loss: 0.3537784814834595, mean loss: 0.38580077662082485
Epoch: 6, step: 748, loss: 0.3408760130405426, mean loss: 0.3857960039911021
Epoch: 6, step: 749, loss: 0.3320601284503937, mean loss: 0.38579029590999514
Epoch: 6, step: 750, loss: 0.4202210009098053, mean loss: 0.38579395291530577
Epoch: 6, step: 751, loss: 0.36229178309440613, mean loss: 0.38579145693295436
Epoch: 6, step: 752, loss: 0.35701242089271545, mean loss: 0.38578840086031546
Epoch: 6, step: 753, loss: 0.34562721848487854, mean loss: 0.38578413655978716
Epoch: 6, step: 754, loss: 0.3654012978076935, mean loss: 0.3857819725467548
Epoch: 6, step: 755, loss: 0.3265632688999176, mean loss: 0.38577568606016804
Epoch: 6, step: 756, loss: 0.3850618004798889, mean loss: 0.38577561028418034
Epoch: 6, step: 757, loss: 0.34248748421669006, mean loss: 0.3857710159171598
Epoch: 6, step: 758, loss: 0.3483273684978485, mean loss: 0.385767042273159
Epoch: 6, step: 759, loss: 0.33596670627593994, mean loss: 0.3857617578572
Epoch: 6, step: 760, loss: 0.32974275946617126, mean loss: 0.38575581419689325
Epoch: 6, step: 761, loss: 0.33830684423446655, mean loss: 0.3857507803575168
Epoch: 6, step: 762, loss: 0.3532329201698303, mean loss: 0.38574733091865104
Epoch: 6, step: 763, loss: 0.3814162313938141, mean loss: 0.3857468715317689
Epoch: 6, step: 764, loss: 0.35545283555984497, mean loss: 0.3857436586739927
Epoch: 6, step: 765, loss: 0.3499370515346527, mean loss: 0.385739861578856
Epoch: 6, step: 766, loss: 0.38205641508102417, mean loss: 0.38573947101088885
Epoch: 6, step: 767, loss: 0.3673160970211029, mean loss: 0.38573751772696285
Epoch: 6, step: 768, loss: 0.3815140724182129, mean loss: 0.3857370699960916
Epoch: 6, step: 769, loss: 0.3918185234069824, mean loss: 0.3857377146275746
Epoch: 6, step: 770, loss: 0.34495416283607483, mean loss: 0.38573339204656865
Epoch: 6, step: 771, loss: 0.3359278738498688, mean loss: 0.38572811380174066
Epoch: 6, step: 772, loss: 0.3369995355606079, mean loss: 0.38572295023511555
Epoch: 6, step: 773, loss: 0.30535438656806946, mean loss: 0.38571443481196793
Epoch: 6, step: 774, loss: 0.3450477421283722, mean loss: 0.3857101264432124
Epoch: 6, step: 775, loss: 0.33772438764572144, mean loss: 0.3857050432081703
Epoch: 6, step: 776, loss: 0.3320237100124359, mean loss: 0.3856993572285923
Epoch: 6, step: 777, loss: 0.31934642791748047, mean loss: 0.3856923298054498
Epoch: 6, step: 778, loss: 0.3695669174194336, mean loss: 0.385690622147673
Epoch: 6, step: 779, loss: 0.3665223717689514, mean loss: 0.38568859247270704
Epoch: 6, step: 780, loss: 0.3496270775794983, mean loss: 0.3856847744192509
Epoch: 6, step: 781, loss: 0.3854173421859741, mean loss: 0.38568474610755993
Epoch: 6, step: 782, loss: 0.3796195685863495, mean loss: 0.38568410408601644
Epoch: 6, step: 783, loss: 0.3535939157009125, mean loss: 0.3856807075800485
Epoch: 6, step: 784, loss: 0.3507208228111267, mean loss: 0.3856770077298243
Epoch: 6, step: 785, loss: 0.33449649810791016, mean loss: 0.38567159180288013
Epoch: 6, step: 786, loss: 0.3620651960372925, mean loss: 0.38566909403589617
Epoch: 6, step: 787, loss: 0.35476696491241455, mean loss: 0.3856658246612534
Epoch: 6, step: 788, loss: 0.34246426820755005, mean loss: 0.3856612545188167
Epoch: 6, step: 789, loss: 0.32258740067481995, mean loss: 0.38565458286091064
Epoch: 6, step: 790, loss: 0.32816123962402344, mean loss: 0.38564850212656515
Epoch: 6, step: 791, loss: 0.3344276547431946, mean loss: 0.3856430853702852
Epoch: 6, step: 792, loss: 0.3406543731689453, mean loss: 0.38563832818384114
Epoch: 6, step: 793, loss: 0.38083788752555847, mean loss: 0.3856378206303776
Epoch: 6, step: 794, loss: 0.390010267496109, mean loss: 0.3856382828829271
Epoch: 6, step: 795, loss: 0.3423021137714386, mean loss: 0.38563370189253476
Epoch: 6, step: 796, loss: 0.33817923069000244, mean loss: 0.3856286860938663
Epoch: 6, step: 797, loss: 0.3173300325870514, mean loss: 0.3856214678890991
Epoch: 6, step: 798, loss: 0.3171505331993103, mean loss: 0.3856142322413458
Epoch: 6, step: 799, loss: 0.2992744743824005, mean loss: 0.38560510927453906
Epoch: 6, step: 800, loss: 0.37685754895210266, mean loss: 0.3856041850737654
Epoch: 6, step: 801, loss: 0.3371797800064087, mean loss: 0.3855990694594545
Epoch: 6, step: 802, loss: 0.3416982591152191, mean loss: 0.3855944322131944
Epoch: 6, step: 803, loss: 0.3146214783191681, mean loss: 0.38558693612596434
Epoch: 6, step: 804, loss: 0.3523593246936798, mean loss: 0.3855834270319278
Epoch: 6, step: 805, loss: 0.33040016889572144, mean loss: 0.3855775998663379
Epoch: 6, step: 806, loss: 0.3409232199192047, mean loss: 0.38557288501257936
Epoch: 6, step: 807, loss: 0.3488267958164215, mean loss: 0.3855690055690409
Epoch: 6, step: 808, loss: 0.3728509843349457, mean loss: 0.3855676630142817
Epoch: 6, step: 809, loss: 0.3479403853416443, mean loss: 0.3855636913784708
Epoch: 6, step: 810, loss: 0.34136849641799927, mean loss: 0.38555902697794725
Epoch: 6, step: 811, loss: 0.3193616569042206, mean loss: 0.385552041185411
Epoch: 6, step: 812, loss: 0.35433658957481384, mean loss: 0.3855487473739083
Epoch: 6, step: 813, loss: 0.352500319480896, mean loss: 0.3855452605171988
Epoch: 6, step: 814, loss: 0.34509915113449097, mean loss: 0.38554099359986754
Epoch: 6, step: 815, loss: 0.3213946521282196, mean loss: 0.3855342271081511
Epoch: 6, step: 816, loss: 0.46190348267555237, mean loss: 0.3855422820871161
Epoch: 6, step: 817, loss: 0.34962108731269836, mean loss: 0.3855384937307805
Epoch: 6, step: 818, loss: 0.366026371717453, mean loss: 0.3855364361411977
Epoch: 6, step: 819, loss: 0.33843982219696045, mean loss: 0.3855314702392635
Epoch: 6, step: 820, loss: 0.35262608528137207, mean loss: 0.38552800103684304
Epoch: 6, step: 821, loss: 0.3365339934825897, mean loss: 0.3855228361614947
Epoch: 6, step: 822, loss: 0.40349826216697693, mean loss: 0.38552473090440664
Epoch: 6, step: 823, loss: 0.4015287160873413, mean loss: 0.38552641766507095
Epoch: 6, step: 824, loss: 0.32740122079849243, mean loss: 0.3855202921305714
Epoch: 6, step: 825, loss: 0.3281407952308655, mean loss: 0.3855142458189908
Epoch: 6, step: 826, loss: 0.3186393082141876, mean loss: 0.3855071996765817
Epoch: 6, step: 827, loss: 0.3228726089000702, mean loss: 0.38550060100498706
Epoch: 6, step: 828, loss: 0.37046346068382263, mean loss: 0.3854990169809355
Epoch: 6, step: 829, loss: 0.3548954725265503, mean loss: 0.385495793519333
Epoch: 6, step: 830, loss: 0.3681561350822449, mean loss: 0.38549396733097735
Epoch: 6, step: 831, loss: 0.3195963501930237, mean loss: 0.38548702781779937
Epoch: 6, step: 832, loss: 0.34451669454574585, mean loss: 0.3854827137888142
Epoch: 6, step: 833, loss: 0.3446506857872009, mean loss: 0.3854784147755481
Epoch: 6, step: 834, loss: 0.3358559012413025, mean loss: 0.385473190803179
Epoch: 6, step: 835, loss: 0.3456091284751892, mean loss: 0.38546899458609185
Epoch: 6, step: 836, loss: 0.35811910033226013, mean loss: 0.3854661159528686
Epoch: 6, step: 837, loss: 0.3422505557537079, mean loss: 0.3854615679040158
Epoch: 6, step: 838, loss: 0.33073553442955017, mean loss: 0.3854558090874869
Epoch: 6, step: 839, loss: 0.33833709359169006, mean loss: 0.38545085131018303
Epoch: 6, step: 840, loss: 0.38122081756591797, mean loss: 0.3854504062777007
Epoch: 6, step: 841, loss: 0.30441996455192566, mean loss: 0.38544188214118424
Epoch: 6, step: 842, loss: 0.348379522562027, mean loss: 0.38543798371270216
Epoch: 6, step: 843, loss: 0.3263015151023865, mean loss: 0.3854317640588727
Epoch: 6, step: 844, loss: 0.3543129563331604, mean loss: 0.385428491495225
Epoch: 6, step: 845, loss: 0.3433046042919159, mean loss: 0.38542406206439395
Epoch: 6, step: 846, loss: 0.3203980624675751, mean loss: 0.3854172251387713
Epoch: 6, step: 847, loss: 0.3845328092575073, mean loss: 0.3854171321598099
Epoch: 6, step: 848, loss: 0.33556467294692993, mean loss: 0.3854118917036748
Epoch: 6, step: 849, loss: 0.3978813886642456, mean loss: 0.3854132023508222
Epoch: 6, step: 850, loss: 0.35616469383239746, mean loss: 0.38541012841403627
Epoch: 6, step: 851, loss: 0.34312883019447327, mean loss: 0.38540568523431584
Epoch: 6, step: 852, loss: 0.37861838936805725, mean loss: 0.3854049720583291
Epoch: 6, step: 853, loss: 0.3318719267845154, mean loss: 0.38539934765769096
Epoch: 6, step: 854, loss: 0.33493468165397644, mean loss: 0.38539404619051965
Epoch: 6, step: 855, loss: 0.3526056408882141, mean loss: 0.3853906020302988
Epoch: 6, step: 856, loss: 0.3503102660179138, mean loss: 0.38538691750808346
Epoch: 6, step: 857, loss: 0.3490080237388611, mean loss: 0.38538309699834083
Epoch: 6, step: 858, loss: 0.31190067529678345, mean loss: 0.3853753806881758
Epoch: 6, step: 859, loss: 0.36430203914642334, mean loss: 0.385373168031567
Epoch: 6, step: 860, loss: 0.3508768081665039, mean loss: 0.3853695463664893
Epoch: 6, step: 861, loss: 0.3262740969657898, mean loss: 0.38536334277112916
Epoch: 6, step: 862, loss: 0.3287760317325592, mean loss: 0.3853574030932622
Epoch: 6, step: 863, loss: 0.3364798426628113, mean loss: 0.3853522732065672
Epoch: 6, step: 864, loss: 0.30444586277008057, mean loss: 0.38534378266081876
Epoch: 6, step: 865, loss: 0.35320863127708435, mean loss: 0.38534041066172287
Epoch: 6, step: 866, loss: 0.3481169641017914, mean loss: 0.38533650514849654
Epoch: 6, step: 867, loss: 0.42847689986228943, mean loss: 0.38534103099771116
Epoch: 6, step: 868, loss: 0.3223644495010376, mean loss: 0.3853344248316043
Epoch: 6, step: 869, loss: 0.32472294569015503, mean loss: 0.38532806742871556
Epoch: 6, step: 870, loss: 0.34978213906288147, mean loss: 0.3853243394865692
Epoch: 6, step: 871, loss: 0.3954336643218994, mean loss: 0.38532539960872053
Epoch: 6, step: 872, loss: 0.3365746736526489, mean loss: 0.38532028786226397
Epoch: 6, step: 873, loss: 0.3469802737236023, mean loss: 0.38531626815015046
Epoch: 6, step: 874, loss: 0.30965691804885864, mean loss: 0.38530833656926133
Epoch: 6, step: 875, loss: 0.3486570417881012, mean loss: 0.3853044947144625
Epoch: 6, step: 876, loss: 0.32759711146354675, mean loss: 0.38529844635650723
Epoch: 6, step: 877, loss: 0.3153437077999115, mean loss: 0.3852911151116365
Epoch: 6, step: 878, loss: 0.3474119007587433, mean loss: 0.3852871457923079
Epoch: 6, step: 879, loss: 0.33829352259635925, mean loss: 0.3852822219005229
Epoch: 6, step: 880, loss: 0.3723958730697632, mean loss: 0.38528087183778525
Epoch: 6, step: 881, loss: 0.33653223514556885, mean loss: 0.38527576512956274
Epoch: 6, step: 882, loss: 0.3792870342731476, mean loss: 0.38527513784027223
Epoch: 6, step: 883, loss: 0.3443332314491272, mean loss: 0.38527084983164306
Epoch: 6, step: 884, loss: 0.35492661595344543, mean loss: 0.38526767209220664
Epoch: 6, step: 885, loss: 0.3468555212020874, mean loss: 0.38526364987745376
Epoch: 6, step: 886, loss: 0.3489571213722229, mean loss: 0.3852598485447655
Epoch: 6, step: 887, loss: 0.3496069610118866, mean loss: 0.3852561160397893
Epoch: 6, step: 888, loss: 0.36511820554733276, mean loss: 0.38525400802026744
Epoch: 6, step: 889, loss: 0.35895100235939026, mean loss: 0.385251254931963
Epoch: 6, step: 890, loss: 0.37118226289749146, mean loss: 0.3852497825099814
Epoch: 6, step: 891, loss: 0.39094457030296326, mean loss: 0.3852503784484277
Epoch: 6, step: 892, loss: 0.3353734016418457, mean loss: 0.3852451595537111
Epoch: 6, step: 893, loss: 0.3808995187282562, mean loss: 0.38524470489365403
Epoch: 6, step: 894, loss: 0.3573705554008484, mean loss: 0.38524178888261806
Epoch: 6, step: 895, loss: 0.3655467629432678, mean loss: 0.38523972873346124
Epoch: 6, step: 896, loss: 0.3433782756328583, mean loss: 0.3852353503783623
Epoch: 6, step: 897, loss: 0.37748900055885315, mean loss: 0.3852345402602051
Epoch: 6, step: 898, loss: 0.35816553235054016, mean loss: 0.38523170966228504
Epoch: 6, step: 899, loss: 0.37697577476501465, mean loss: 0.3852308464319528
Epoch: 6, step: 900, loss: 0.35516515374183655, mean loss: 0.3852277031290056
Epoch: 6, step: 901, loss: 0.3552989065647125, mean loss: 0.38522457446534636
Epoch: 6, step: 902, loss: 0.3114398717880249, mean loss: 0.3852168620473807
Epoch: 6, step: 903, loss: 0.32170775532722473, mean loss: 0.38521022438990576
Epoch: 6, step: 904, loss: 0.3286428153514862, mean loss: 0.3852043128621559
Epoch: 6, step: 905, loss: 0.3409939706325531, mean loss: 0.38519969318167213
Epoch: 6, step: 906, loss: 0.3559553325176239, mean loss: 0.385196637663893
Epoch: 6, step: 907, loss: 0.3754918873310089, mean loss: 0.3851956237952832
Epoch: 6, step: 908, loss: 0.30702728033065796, mean loss: 0.3851874582940334
Epoch: 6, step: 909, loss: 0.35434573888778687, mean loss: 0.38518423689029346
Epoch: 6, step: 910, loss: 0.32729753851890564, mean loss: 0.38517819128210845
Epoch: 6, step: 911, loss: 0.35525181889533997, mean loss: 0.3851750661387932
Epoch: 6, step: 912, loss: 0.33499202132225037, mean loss: 0.3851698261842337
Epoch: 6, step: 913, loss: 0.3268192410469055, mean loss: 0.3851637340371114
Epoch: 6, step: 914, loss: 0.33930525183677673, mean loss: 0.38515894663944983
Epoch: 6, step: 915, loss: 0.33658871054649353, mean loss: 0.38515387667743595
Epoch: 6, step: 916, loss: 0.37004536390304565, mean loss: 0.38515229975302573
Epoch: 6, step: 917, loss: 0.3343924582004547, mean loss: 0.3851470023368754
Epoch: 6, step: 918, loss: 0.39439406991004944, mean loss: 0.38514796728183764
Epoch: 6, step: 919, loss: 0.35912925004959106, mean loss: 0.3851452524741131
Epoch: 6, step: 920, loss: 0.31304502487182617, mean loss: 0.38513773028031
Epoch: 6, step: 921, loss: 0.34439173340797424, mean loss: 0.3851334797068829
Epoch: 6, step: 922, loss: 0.3307982087135315, mean loss: 0.3851278121079475
Epoch: 6, step: 923, loss: 0.28761276602745056, mean loss: 0.38511764157748435
Epoch: 6, step: 924, loss: 0.3371908366680145, mean loss: 0.3851126434749805
Epoch: 6, step: 925, loss: 0.3343844711780548, mean loss: 0.38510735378026756
Epoch: 6, step: 926, loss: 0.3525950014591217, mean loss: 0.38510396389888696
Epoch: 6, step: 927, loss: 0.3505556583404541, mean loss: 0.38510036211557186
Epoch: 6, step: 928, loss: 0.35553061962127686, mean loss: 0.38509727968645746
Epoch: 6, step: 929, loss: 0.3355553448200226, mean loss: 0.3850921158408387
Epoch: 6, step: 930, loss: 0.37236806750297546, mean loss: 0.3850907897284533
Epoch: 6, step: 931, loss: 0.31606557965278625, mean loss: 0.3850835966052691
Epoch: 6, step: 932, loss: 0.3556332588195801, mean loss: 0.3850805279027802
Epoch: 6, step: 933, loss: 0.352303683757782, mean loss: 0.38507711293673047
Epoch: 6, step: 934, loss: 0.3618781268596649, mean loss: 0.3850746961239294
Epoch: 6, step: 935, loss: 0.3765299320220947, mean loss: 0.3850738060443355
Epoch: 6, step: 936, loss: 0.3733106255531311, mean loss: 0.3850725808406597
Epoch: 6, step: 937, loss: 0.4039849638938904, mean loss: 0.3850745504702216
Epoch: 6, step: 938, loss: 0.36809882521629333, mean loss: 0.3850727827179302
Epoch: 6, step: 939, loss: 0.34603577852249146, mean loss: 0.38506871805693527
Epoch: 6, step: 940, loss: 0.3707096576690674, mean loss: 0.38506722310010155
Epoch: 6, step: 941, loss: 0.34781843423843384, mean loss: 0.3850633454414651
Epoch: 6, step: 942, loss: 0.32579275965690613, mean loss: 0.3850571759207214
Epoch: 6, step: 943, loss: 0.3137126863002777, mean loss: 0.38504975039099404
Epoch: 6, step: 944, loss: 0.35016682744026184, mean loss: 0.3850461201565315
Epoch: 6, step: 945, loss: 0.3480948805809021, mean loss: 0.3850422750743696
Epoch: 6, step: 946, loss: 0.42933568358421326, mean loss: 0.38504688369038353
Epoch: 6, step: 947, loss: 0.3413398265838623, mean loss: 0.3850423365558531
Epoch: 6, step: 948, loss: 0.3693418502807617, mean loss: 0.3850407033002331
Epoch: 6, step: 949, loss: 0.3325495719909668, mean loss: 0.38503524343635653
Epoch: 6, step: 950, loss: 0.33813953399658203, mean loss: 0.38503036608748087
Epoch: 6, step: 951, loss: 0.341381311416626, mean loss: 0.3850258268763046
Epoch: 6, step: 952, loss: 0.3292905390262604, mean loss: 0.38502003138001156
Epoch: 6, step: 953, loss: 0.3450740873813629, mean loss: 0.3850158781315193
Epoch: 6, step: 954, loss: 0.31034377217292786, mean loss: 0.3850081151513801
Epoch: 6, step: 955, loss: 0.31635749340057373, mean loss: 0.3850009789121129
Epoch: 6, step: 956, loss: 0.34471774101257324, mean loss: 0.38499679190058606
Epoch: 6, step: 957, loss: 0.3543304204940796, mean loss: 0.3849936047906914
Epoch: 6, step: 958, loss: 0.3548829257488251, mean loss: 0.3849904757582647
Epoch: 6, step: 959, loss: 0.36345288157463074, mean loss: 0.3849882378536322
Epoch: 6, step: 960, loss: 0.3715343177318573, mean loss: 0.3849868400437494
Epoch: 6, step: 961, loss: 0.33884555101394653, mean loss: 0.38498204664160623
Epoch: 6, step: 962, loss: 0.3291475772857666, mean loss: 0.38497624686292586
Epoch: 6, step: 963, loss: 0.3284616768360138, mean loss: 0.38497037704883913
Epoch: 6, step: 964, loss: 0.3259882628917694, mean loss: 0.3849642515826269
Epoch: 6, step: 965, loss: 0.3790629506111145, mean loss: 0.3849636387787877
Epoch: 6, step: 966, loss: 0.4257288873195648, mean loss: 0.38496787149071177
Epoch: 6, step: 967, loss: 0.313681036233902, mean loss: 0.3849604704488454
Epoch: 6, step: 968, loss: 0.4167082905769348, mean loss: 0.3849637661843513
Epoch: 6, step: 969, loss: 0.3821863830089569, mean loss: 0.38496347789463
Epoch: 6, step: 970, loss: 0.3736254572868347, mean loss: 0.38496230114106406
Epoch: 6, step: 971, loss: 0.361386239528656, mean loss: 0.3849598544763056
Epoch: 6, step: 972, loss: 0.3821389973163605, mean loss: 0.3849595617651756
Epoch: 6, step: 973, loss: 0.3431174159049988, mean loss: 0.3849552203929137
Epoch: 6, step: 974, loss: 0.3175310492515564, mean loss: 0.38494822545867347
Epoch: 6, step: 975, loss: 0.3394581973552704, mean loss: 0.3849435065760901
Epoch: 6, step: 976, loss: 0.35432568192481995, mean loss: 0.3849403307826401
Epoch: 6, step: 977, loss: 0.33369407057762146, mean loss: 0.3849350158832204
Epoch: 6, step: 978, loss: 0.37867870926856995, mean loss: 0.3849343670906647
Epoch: 6, step: 979, loss: 0.3296632170677185, mean loss: 0.38492863594694604
Epoch: 6, step: 980, loss: 0.3448840081691742, mean loss: 0.38492448409336616
Epoch: 6, step: 981, loss: 0.307940810918808, mean loss: 0.38491650320251247
Epoch: 6, step: 982, loss: 0.3286423981189728, mean loss: 0.38491066987556277
Epoch: 6, step: 983, loss: 0.355695903301239, mean loss: 0.38490764181103393
Epoch: 6, step: 984, loss: 0.3620153069496155, mean loss: 0.3849052693024982
Epoch: 6, step: 985, loss: 0.3231393098831177, mean loss: 0.3848988686849418
Epoch: 6, step: 986, loss: 0.3651946783065796, mean loss: 0.38489682701150085
Epoch: 6, step: 987, loss: 0.3301236629486084, mean loss: 0.38489115221207454
Epoch: 6, step: 988, loss: 0.3113015294075012, mean loss: 0.38488352871442566
Epoch: 6, step: 989, loss: 0.34410524368286133, mean loss: 0.3848793047362786
Epoch: 6, step: 990, loss: 0.37918680906295776, mean loss: 0.3848787151458412
Epoch: 6, step: 991, loss: 0.3120152950286865, mean loss: 0.38487116922412234
Epoch: 6, step: 992, loss: 0.3665715157985687, mean loss: 0.38486927426156403
Epoch: 6, step: 993, loss: 0.29918479919433594, mean loss: 0.38486040239626407
Epoch: 6, step: 994, loss: 0.35973888635635376, mean loss: 0.3848578015560073
Epoch: 6, step: 995, loss: 0.3677418529987335, mean loss: 0.38485602971868255
Epoch: 6, step: 996, loss: 0.3458351492881775, mean loss: 0.3848519907081836
Epoch: 6, step: 997, loss: 0.3196059465408325, mean loss: 0.38484523785741076
Epoch: 6, step: 998, loss: 0.38844701647758484, mean loss: 0.3848456105965829
Epoch: 6, step: 999, loss: 0.35701340436935425, mean loss: 0.3848427306083557
Epoch: 6, step: 1000, loss: 0.3505238890647888, mean loss: 0.38483917977115517
Epoch: 6, step: 1001, loss: 0.3216528594493866, mean loss: 0.3848326428044345
Epoch: 6, step: 1002, loss: 0.3321238160133362, mean loss: 0.38482719035519575
Epoch: 6, step: 1003, loss: 0.31794872879981995, mean loss: 0.38482027284779446
Epoch: 6, step: 1004, loss: 0.37010878324508667, mean loss: 0.384818751336821
Epoch: 6, step: 1005, loss: 0.3828895390033722, mean loss: 0.3848185518319261
Epoch: 6, step: 1006, loss: 0.36993199586868286, mean loss: 0.38481701253340855
Epoch: 6, step: 1007, loss: 0.32806238532066345, mean loss: 0.3848111446025553
Epoch: 6, step: 1008, loss: 0.2994682192802429, mean loss: 0.38480232180452756
Epoch: 6, step: 1009, loss: 0.3097994327545166, mean loss: 0.38479456876658563
Epoch: 6, step: 1010, loss: 0.3152334988117218, mean loss: 0.3847873789919133
Epoch: 6, step: 1011, loss: 0.34663650393486023, mean loss: 0.38478343615654154
Epoch: 6, step: 1012, loss: 0.3443986773490906, mean loss: 0.3847792628839563
Epoch: 6, step: 1013, loss: 0.33786019682884216, mean loss: 0.3847744148713447
Epoch: 6, step: 1014, loss: 0.3206333518028259, mean loss: 0.3847677880438761
Epoch: 6, step: 1015, loss: 0.36186593770980835, mean loss: 0.38476542215024656
Epoch: 6, step: 1016, loss: 0.34113505482673645, mean loss: 0.3847609153464739
Epoch: 6, step: 1017, loss: 0.404132217168808, mean loss: 0.38476291610063856
Epoch: 6, step: 1018, loss: 0.3111189901828766, mean loss: 0.38475531061412427
Epoch: 6, step: 1019, loss: 0.43271589279174805, mean loss: 0.3847602631732091
Epoch: 6, step: 1020, loss: 0.35324689745903015, mean loss: 0.3847570093409206
Epoch: 6, step: 1021, loss: 0.3729715645313263, mean loss: 0.38475579259047565
Epoch: 6, step: 1022, loss: 0.3386618196964264, mean loss: 0.38475103425735974
Epoch: 6, step: 1023, loss: 0.3336687982082367, mean loss: 0.38474576152448925
Epoch: 6, step: 1024, loss: 0.3383896052837372, mean loss: 0.3847409771136893
Epoch: 6, step: 1025, loss: 0.35290175676345825, mean loss: 0.3847376913324354
Epoch: 6, step: 1026, loss: 0.3148168623447418, mean loss: 0.3847304763051949
Epoch: 6, step: 1027, loss: 0.3932495713233948, mean loss: 0.38473135528734703
Epoch: 6, step: 1028, loss: 0.351409375667572, mean loss: 0.3847279175508754
Epoch: 6, step: 1029, loss: 0.32069453597068787, mean loss: 0.38472131208547616
Epoch: 6, step: 1030, loss: 0.35847097635269165, mean loss: 0.38471860446961925
Epoch: 6, step: 1031, loss: 0.3345947265625, mean loss: 0.3847134349277559
Epoch: 6, step: 1032, loss: 0.3687247037887573, mean loss: 0.3847117860950098
Epoch: 6, step: 1033, loss: 0.3450864851474762, mean loss: 0.38470770016997907
Epoch: 6, step: 1034, loss: 0.3122021555900574, mean loss: 0.38470022460089154
Epoch: 6, step: 1035, loss: 0.36170443892478943, mean loss: 0.3846978539013373
Epoch: 6, step: 1036, loss: 0.3654360771179199, mean loss: 0.38469586835584885
Epoch: 6, step: 1037, loss: 0.314523845911026, mean loss: 0.38468863561801697
Epoch: 6, step: 1038, loss: 0.35300999879837036, mean loss: 0.3846853707889105
Epoch: 6, step: 1039, loss: 0.38211044669151306, mean loss: 0.38468510544223933
Epoch: 6, step: 1040, loss: 0.31057098507881165, mean loss: 0.3846774687477145
Epoch: 6, step: 1041, loss: 0.33839312195777893, mean loss: 0.3846727001152408
Epoch: 6, step: 1042, loss: 0.33857861161231995, mean loss: 0.38466795157413614
Epoch: 6, step: 1043, loss: 0.3442714512348175, mean loss: 0.38466379041835336
Epoch: 6, step: 1044, loss: 0.34367549419403076, mean loss: 0.38465956873782764
Epoch: 6, step: 1045, loss: 0.3214462697505951, mean loss: 0.384653058614348
Epoch: 6, step: 1046, loss: 0.37878933548927307, mean loss: 0.38465245479155685
Epoch: 6, step: 1047, loss: 0.34033966064453125, mean loss: 0.38464789210682176
Epoch: 6, step: 1048, loss: 0.3613109886646271, mean loss: 0.38464548946052896
Epoch: 6, step: 1049, loss: 0.33164528012275696, mean loss: 0.38464003339615405
Epoch: 6, step: 1050, loss: 0.3179958760738373, mean loss: 0.38463317347260056
Epoch: 6, step: 1051, loss: 0.3199014365673065, mean loss: 0.3846265110871636
Epoch: 6, step: 1052, loss: 0.40527793765068054, mean loss: 0.3846286363754793
Epoch: 6, step: 1053, loss: 0.3927788734436035, mean loss: 0.384629475049802
Epoch: 6, step: 1054, loss: 0.37696439027786255, mean loss: 0.3846286863796948
Epoch: 6, step: 1055, loss: 0.3422859311103821, mean loss: 0.38462433012915265
Epoch: 6, step: 1056, loss: 0.31413498520851135, mean loss: 0.3846170788849472
Epoch: 6, step: 1057, loss: 0.32671600580215454, mean loss: 0.38461112320987184
Epoch: 6, step: 1058, loss: 0.3357067406177521, mean loss: 0.3846060934471862
Epoch: 6, step: 1059, loss: 0.35342198610305786, mean loss: 0.3846028865254108
Epoch: 6, step: 1060, loss: 0.33730313181877136, mean loss: 0.3845980227974204
Epoch: 6, step: 1061, loss: 0.3266386389732361, mean loss: 0.3845920635763815
Epoch: 6, step: 1062, loss: 0.3144386112689972, mean loss: 0.3845848513370161
Epoch: 6, step: 1063, loss: 0.3019925057888031, mean loss: 0.38457636116991617
Epoch: 6, step: 1064, loss: 0.3318883776664734, mean loss: 0.3845709456098891
Epoch: 6, step: 1065, loss: 0.34832459688186646, mean loss: 0.38456722039419244
Epoch: 6, step: 1066, loss: 0.4032873511314392, mean loss: 0.3845691441564715
Epoch: 6, step: 1067, loss: 0.3336273431777954, mean loss: 0.3845639096927458
Epoch: 6, step: 1068, loss: 0.34652209281921387, mean loss: 0.3845600011530485
Epoch: 6, step: 1069, loss: 0.3216792941093445, mean loss: 0.3845535412488936
Epoch: 6, step: 1070, loss: 0.3368827998638153, mean loss: 0.3845486444084843
Epoch: 6, step: 1071, loss: 0.34922945499420166, mean loss: 0.38454501671852803
Epoch: 6, step: 1072, loss: 0.3637077510356903, mean loss: 0.3845428767097283
Epoch: 6, step: 1073, loss: 0.4220447242259979, mean loss: 0.3845467277928579
Epoch: 6, step: 1074, loss: 0.34041744470596313, mean loss: 0.38454219660042677
Epoch: 6, step: 1075, loss: 0.34760773181915283, mean loss: 0.3845384045609215
Epoch: 6, step: 1076, loss: 0.42359235882759094, mean loss: 0.38454241379552434
Epoch: 6, step: 1077, loss: 0.37228843569755554, mean loss: 0.3845411559451756
Epoch: 6, step: 1078, loss: 0.3476502299308777, mean loss: 0.38453736954201284
Epoch: 6, step: 1079, loss: 0.32970860600471497, mean loss: 0.38453174261636247
Epoch: 6, step: 1080, loss: 0.3530658781528473, mean loss: 0.3845285136923539
Epoch: 6, step: 1081, loss: 0.32904142141342163, mean loss: 0.3845228203728096
Epoch: 6, step: 1082, loss: 0.31865084171295166, mean loss: 0.3845160621929943
Epoch: 6, step: 1083, loss: 0.33038005232810974, mean loss: 0.3845105086425363
Epoch: 6, step: 1084, loss: 0.3611602187156677, mean loss: 0.3845081134953492
Epoch: 6, step: 1085, loss: 0.3828050494194031, mean loss: 0.38450793882211065
Epoch: 6, step: 1086, loss: 0.4242855906486511, mean loss: 0.38451201816287844
Epoch: 6, step: 1087, loss: 0.36274954676628113, mean loss: 0.38450978657229223
Epoch: 6, step: 1088, loss: 0.37811461091041565, mean loss: 0.3845091308585978
Epoch: 6, step: 1089, loss: 0.3418428599834442, mean loss: 0.3845047566253729
Epoch: 6, step: 1090, loss: 0.3163386583328247, mean loss: 0.3844977688141692
Epoch: 6, step: 1091, loss: 0.3451646566390991, mean loss: 0.3844937371298544
Epoch: 6, step: 1092, loss: 0.2914179563522339, mean loss: 0.3844841977447178
Epoch: 6, step: 1093, loss: 0.3366309404373169, mean loss: 0.3844792937421243
Epoch: 6, step: 1094, loss: 0.3730609714984894, mean loss: 0.38447812371217827
Epoch: 6, step: 1095, loss: 0.338636577129364, mean loss: 0.38447342683240543
Epoch: 6, step: 1096, loss: 0.3364548981189728, mean loss: 0.3844685074052245
Epoch: 6, step: 1097, loss: 0.304561585187912, mean loss: 0.3844603218979291
Epoch: 6, step: 1098, loss: 0.3204614222049713, mean loss: 0.3844537666485495
Epoch: 6, step: 1099, loss: 0.3612948954105377, mean loss: 0.38445139478545676
Epoch: 6, step: 1100, loss: 0.3616374135017395, mean loss: 0.38444905848425004
Epoch: 6, step: 1101, loss: 0.33399608731269836, mean loss: 0.3844438922983836
Epoch: 6, step: 1102, loss: 0.2951483130455017, mean loss: 0.3844347497183434
Epoch: 6, step: 1103, loss: 0.39247485995292664, mean loss: 0.38443557282545177
Epoch: 6, step: 1104, loss: 0.4062023162841797, mean loss: 0.3844378009699352
Epoch: 6, step: 1105, loss: 0.34034833312034607, mean loss: 0.38443328823013484
Epoch: 6, step: 1106, loss: 0.3394757807254791, mean loss: 0.3844286871138208
Epoch: 6, step: 1107, loss: 0.31480497121810913, mean loss: 0.38442156229639385
Epoch: 6, step: 1108, loss: 0.37336334586143494, mean loss: 0.38442043078954485
Epoch: 6, step: 1109, loss: 0.3642313778400421, mean loss: 0.3844183652019707
Epoch: 6, step: 1110, loss: 0.3266694247722626, mean loss: 0.3844124573819779
Epoch: 6, step: 1111, loss: 0.35938236117362976, mean loss: 0.38440989702025447
Epoch: 6, step: 1112, loss: 0.34506142139434814, mean loss: 0.3844058724241999
Epoch: 6, step: 1113, loss: 0.3724288046360016, mean loss: 0.3844046475246511
Epoch: 6, step: 1114, loss: 0.3158622980117798, mean loss: 0.38439763838777485
Epoch: 6, step: 1115, loss: 0.3727779984474182, mean loss: 0.3843964502855315
Epoch: 6, step: 1116, loss: 0.32261306047439575, mean loss: 0.3843901336113866
Epoch: 6, step: 1117, loss: 0.3022697865962982, mean loss: 0.38438173856466656
Epoch: 6, step: 1118, loss: 0.32889583706855774, mean loss: 0.38437606689938025
Epoch: 6, step: 1119, loss: 0.34622204303741455, mean loss: 0.38437216726488904
Epoch: 6, step: 1120, loss: 0.3250720798969269, mean loss: 0.3843661069595883
Epoch: 6, step: 1121, loss: 0.31438493728637695, mean loss: 0.38435895580797647
Epoch: 6, step: 1122, loss: 0.30420389771461487, mean loss: 0.38435076585619415
Epoch: 6, step: 1123, loss: 0.3809342682361603, mean loss: 0.38435041680658033
Epoch: 6, step: 1124, loss: 0.3528200387954712, mean loss: 0.3843471958056598
Epoch: 6, step: 1125, loss: 0.35794177651405334, mean loss: 0.3843444986228925
Epoch: 6, step: 1126, loss: 0.3423158824443817, mean loss: 0.3843402060464265
Epoch: 6, step: 1127, loss: 0.34416764974594116, mean loss: 0.38433610345693503
Epoch: 6, step: 1128, loss: 0.3483593463897705, mean loss: 0.38433242973518816
Epoch: 6, step: 1129, loss: 0.3293633759021759, mean loss: 0.38432681721182355
Epoch: 6, step: 1130, loss: 0.3352019786834717, mean loss: 0.384321801914373
Epoch: 6, step: 1131, loss: 0.373033344745636, mean loss: 0.38432064956063994
Epoch: 6, step: 1132, loss: 0.3449424207210541, mean loss: 0.38431663014358985
Epoch: 6, step: 1133, loss: 0.37570565938949585, mean loss: 0.3843157512937476
Epoch: 6, step: 1134, loss: 0.3449542820453644, mean loss: 0.38431173440740735
Epoch: 6, step: 1135, loss: 0.33654817938804626, mean loss: 0.38430686057526253
Epoch: 6, step: 1136, loss: 0.33166855573654175, mean loss: 0.38430148986769813
Epoch: 6, step: 1137, loss: 0.3839111626148224, mean loss: 0.3843014500465134
Epoch: 6, step: 1138, loss: 0.3602151870727539, mean loss: 0.38429899301672926
Epoch: 6, step: 1139, loss: 0.36723655462265015, mean loss: 0.38429725266193593
Epoch: 6, step: 1140, loss: 0.32499560713768005, mean loss: 0.38429120455938376
Epoch: 6, step: 1141, loss: 0.33531519770622253, mean loss: 0.38428621006551744
Epoch: 6, step: 1142, loss: 0.3247072696685791, mean loss: 0.3842801349211923
Epoch: 6, step: 1143, loss: 0.3930247128009796, mean loss: 0.3842810264972404
Epoch: 6, step: 1144, loss: 0.31925079226493835, mean loss: 0.38427439684750725
Epoch: 6, step: 1145, loss: 0.30016547441482544, mean loss: 0.3842658230531716
Epoch: 6, step: 1146, loss: 0.42302632331848145, mean loss: 0.3842697737717798
Epoch: 6, step: 1147, loss: 0.369723916053772, mean loss: 0.38426829131583623
Epoch: 6, step: 1148, loss: 0.3376566171646118, mean loss: 0.38426354132356566
Epoch: 6, step: 1149, loss: 0.3809882700443268, mean loss: 0.38426320758897436
Epoch: 6, step: 1150, loss: 0.3864571452140808, mean loss: 0.3842634311180243
Epoch: 6, step: 1151, loss: 0.3255593478679657, mean loss: 0.38425745066944544
Epoch: 6, step: 1152, loss: 0.3791349530220032, mean loss: 0.38425692887076485
Epoch: 6, step: 1153, loss: 0.4338594079017639, mean loss: 0.3842619810686698
Epoch: 6, step: 1154, loss: 0.33922672271728516, mean loss: 0.38425739452641994
Epoch: 6, step: 1155, loss: 0.3144727945327759, mean loss: 0.38425028815167517
Epoch: 6, step: 1156, loss: 0.34181708097457886, mean loss: 0.38424596749113377
Epoch: 6, step: 1157, loss: 0.38793060183525085, mean loss: 0.38424634263207696
Epoch: 6, step: 1158, loss: 0.3399840295314789, mean loss: 0.38424183664479195
Epoch: 6, step: 1159, loss: 0.35928353667259216, mean loss: 0.384239296101228
Epoch: 6, step: 1160, loss: 0.3307075500488281, mean loss: 0.38423384757745677
Epoch: 6, step: 1161, loss: 0.3184039294719696, mean loss: 0.38422714801322866
Epoch: 6, step: 1162, loss: 0.3343409597873688, mean loss: 0.38422207157197236
Epoch: 6, step: 1163, loss: 0.322518527507782, mean loss: 0.3842157932300855
Epoch: 6, step: 1164, loss: 0.33696800470352173, mean loss: 0.384210986251906
Epoch: 6, step: 1165, loss: 0.3440977931022644, mean loss: 0.3842069055608429
Epoch: 6, step: 1166, loss: 0.31236350536346436, mean loss: 0.38419959771828394
Epoch: 6, step: 1167, loss: 0.3469594419002533, mean loss: 0.3841958100702146
Epoch: 6, step: 1168, loss: 0.3880016803741455, mean loss: 0.38419619712099295
Epoch: 6, step: 1169, loss: 0.3384239077568054, mean loss: 0.38419154262746397
Epoch: 6, step: 1170, loss: 0.42539042234420776, mean loss: 0.3841957316340442
Epoch: 6, step: 1171, loss: 0.2993338704109192, mean loss: 0.38418710395396866
Epoch: 6, step: 1172, loss: 0.36399316787719727, mean loss: 0.3841850510988221
Epoch: 6, step: 1173, loss: 0.29468631744384766, mean loss: 0.3841759538500261
Epoch: 6, step: 1174, loss: 0.35444462299346924, mean loss: 0.3841729320662212
Epoch: 6, step: 1175, loss: 0.39045295119285583, mean loss: 0.38417357027954707
Epoch: 6, step: 1176, loss: 0.3192738890647888, mean loss: 0.38416697545369455
Epoch: 6, step: 1177, loss: 0.3182273805141449, mean loss: 0.38416027563709837
Epoch: 6, step: 1178, loss: 0.3799564838409424, mean loss: 0.3841598485526936
Epoch: 6, step: 1179, loss: 0.30788183212280273, mean loss: 0.38415209987162596
Epoch: 6, step: 1180, loss: 0.31962165236473083, mean loss: 0.384145545229929
Epoch: 6, step: 1181, loss: 0.3372511565685272, mean loss: 0.38414078244416205
Epoch: 6, step: 1182, loss: 0.39631474018096924, mean loss: 0.3841420187554992
Epoch: 6, step: 1183, loss: 0.34878823161125183, mean loss: 0.3841384288096072
Epoch: 6, step: 1184, loss: 0.3314987123012543, mean loss: 0.3841330841333448
Epoch: 6, step: 1185, loss: 0.3252980709075928, mean loss: 0.38412711103555536
Epoch: 6, step: 1186, loss: 0.37868231534957886, mean loss: 0.38412655832053294
Epoch: 6, step: 1187, loss: 0.35164135694503784, mean loss: 0.3841232610000523
Epoch: 6, step: 1188, loss: 0.361833781003952, mean loss: 0.38412099879767775
Epoch: 6, step: 1189, loss: 0.3542134463787079, mean loss: 0.38411796373045437
Epoch: 6, step: 1190, loss: 0.3600805997848511, mean loss: 0.3841155246270606
Epoch: 6, step: 1191, loss: 0.3172853887081146, mean loss: 0.38410874397203637
Epoch: 6, step: 1192, loss: 0.33778315782546997, mean loss: 0.3841040442067785
Epoch: 6, step: 1193, loss: 0.3146335780620575, mean loss: 0.3840969970911217
Epoch: 6, step: 1194, loss: 0.33907052874565125, mean loss: 0.3840924300489932
Epoch: 6, step: 1195, loss: 0.36741939187049866, mean loss: 0.3840907390714903
Epoch: 6, step: 1196, loss: 0.3958306908607483, mean loss: 0.38409192961522715
Epoch: 6, step: 1197, loss: 0.35159096121788025, mean loss: 0.38408863403944155
Epoch: 6, step: 1198, loss: 0.303844690322876, mean loss: 0.38408049818384826
Epoch: 6, step: 1199, loss: 0.42629846930503845, mean loss: 0.38408477818903086
Epoch: 6, step: 1200, loss: 0.39338499307632446, mean loss: 0.3840857209376256
Epoch: 6, step: 1201, loss: 0.3058813810348511, mean loss: 0.3840777942865104
Epoch: 6, step: 1202, loss: 0.339364618062973, mean loss: 0.3840732626987711
Epoch: 6, step: 1203, loss: 0.33140015602111816, mean loss: 0.3840679249295496
Epoch: 6, step: 1204, loss: 0.3853484094142914, mean loss: 0.38406805467769883
Epoch: 6, step: 1205, loss: 0.35039645433425903, mean loss: 0.3840646431680389
Epoch: 6, step: 1206, loss: 0.32441237568855286, mean loss: 0.3840585999842197
Epoch: 6, step: 1207, loss: 0.3375260531902313, mean loss: 0.38405388639560606
Epoch: 6, step: 1208, loss: 0.37013429403305054, mean loss: 0.3840524765310905
Epoch: 6, step: 1209, loss: 0.3565782904624939, mean loss: 0.384049694053263
Epoch: 6, step: 1210, loss: 0.3474511504173279, mean loss: 0.38404598787162897
Epoch: 6, step: 1211, loss: 0.34095504879951477, mean loss: 0.38404162467407205
Epoch: 6, step: 1212, loss: 0.3352758586406708, mean loss: 0.3840366873686115
Epoch: 6, step: 1213, loss: 0.35119226574897766, mean loss: 0.3840333623613611
Epoch: 6, step: 1214, loss: 0.3713965117931366, mean loss: 0.38403208319843285
Epoch: 6, step: 1215, loss: 0.3081042170524597, mean loss: 0.3840243981917379
Epoch: 6, step: 1216, loss: 0.3813002407550812, mean loss: 0.3840241224952055
Epoch: 6, step: 1217, loss: 0.37321779131889343, mean loss: 0.384023028958353
Epoch: 6, step: 1218, loss: 0.35364410281181335, mean loss: 0.3840199551016145
Epoch: 6, step: 1219, loss: 0.31331345438957214, mean loss: 0.38401280146940975
Epoch: 6, step: 1220, loss: 0.33901193737983704, mean loss: 0.38400824902994696
Epoch: 6, step: 1221, loss: 0.3612750470638275, mean loss: 0.38400594949505257
Epoch: 6, step: 1222, loss: 0.30023324489593506, mean loss: 0.3839974764795171
Epoch: 6, step: 1223, loss: 0.30455246567726135, mean loss: 0.38398944199217866
Epoch: 6, step: 1224, loss: 0.330051451921463, mean loss: 0.3839839876499731
Epoch: 6, step: 1225, loss: 0.32624414563179016, mean loss: 0.38397814944552233
Epoch: 6, step: 1226, loss: 0.3344516158103943, mean loss: 0.3839731422133279
Epoch: 6, step: 1227, loss: 0.4080298840999603, mean loss: 0.3839755741524592
Epoch: 6, step: 1228, loss: 0.30927401781082153, mean loss: 0.3839680232016514
Epoch: 6, step: 1229, loss: 0.35779082775115967, mean loss: 0.38396537743700104
Epoch: 6, step: 1230, loss: 0.35353055596351624, mean loss: 0.38396230165918666
Epoch: 6, step: 1231, loss: 0.3308994472026825, mean loss: 0.383956939608413
Epoch: 6, step: 1232, loss: 0.3252064287662506, mean loss: 0.3839510034145318
Epoch: 6, step: 1233, loss: 0.35568732023239136, mean loss: 0.3839481479201711
Epoch: 6, step: 1234, loss: 0.37096261978149414, mean loss: 0.3839468361181569
Epoch: 6, step: 1235, loss: 0.3288824260234833, mean loss: 0.38394127405653117
Epoch: 6, step: 1236, loss: 0.3441053628921509, mean loss: 0.38393725063352696
Epoch: 6, step: 1237, loss: 0.3456191122531891, mean loss: 0.3839333808962637
Epoch: 6, step: 1238, loss: 0.32929494976997375, mean loss: 0.38392786353474434
Epoch: 6, step: 1239, loss: 0.32984164357185364, mean loss: 0.3839224024866867
Epoch: 6, step: 1240, loss: 0.33470219373703003, mean loss: 0.38391743325814054
Epoch: 6, step: 1241, loss: 0.3655652701854706, mean loss: 0.3839155806271015
Epoch: 6, step: 1242, loss: 0.40320470929145813, mean loss: 0.3839175276472554
Epoch: 6, step: 1243, loss: 0.34606578946113586, mean loss: 0.3839137073264857
Epoch: 6, step: 1244, loss: 0.31703129410743713, mean loss: 0.3839069576632282
Epoch: 6, step: 1245, loss: 0.30240121483802795, mean loss: 0.3838987330675849
Epoch: 6, step: 1246, loss: 0.3699752390384674, mean loss: 0.3838973282149939
Epoch: 6, step: 1247, loss: 0.3301948308944702, mean loss: 0.3838919102874999
Epoch: 6, step: 1248, loss: 0.3064844310283661, mean loss: 0.3838841016040278
Epoch: 6, step: 1249, loss: 0.30274033546447754, mean loss: 0.3838759168384297
Epoch: 6, step: 1250, loss: 0.3866652548313141, mean loss: 0.383876198163492
Epoch: 6, step: 1251, loss: 0.36410462856292725, mean loss: 0.3838742042577235
Epoch: 6, step: 1252, loss: 0.3274843692779541, mean loss: 0.3838685180789416
Epoch: 6, step: 1253, loss: 0.346242755651474, mean loss: 0.3838647243944863
Epoch: 6, step: 1254, loss: 0.33306825160980225, mean loss: 0.38385960326606766
Epoch: 6, step: 1255, loss: 0.3256860077381134, mean loss: 0.38385373899232494
Epoch: 6, step: 1256, loss: 0.427238792181015, mean loss: 0.38385811204475806
Epoch: 6, step: 1257, loss: 0.36037254333496094, mean loss: 0.38385574502513403
Epoch: 6, step: 1258, loss: 0.34476161003112793, mean loss: 0.38385180527556295
Epoch: 6, step: 1259, loss: 0.32243111729621887, mean loss: 0.38384561616955937
Epoch: 6, step: 1260, loss: 0.42822378873825073, mean loss: 0.38385008752195926
Epoch: 6, step: 1261, loss: 0.33257830142974854, mean loss: 0.3838449221193709
Epoch: 6, step: 1262, loss: 0.3315873444080353, mean loss: 0.38383965793303954
Epoch: 6, step: 1263, loss: 0.3446856141090393, mean loss: 0.383835714133299
Epoch: 6, step: 1264, loss: 0.3500728905200958, mean loss: 0.3838323137079174
Epoch: 6, step: 1265, loss: 0.32891252636909485, mean loss: 0.38382678301432843
Epoch: 6, step: 1266, loss: 0.3375668525695801, mean loss: 0.38382212488015816
Epoch: 6, step: 1267, loss: 0.29853373765945435, mean loss: 0.38381353764825915
Epoch: 6, step: 1268, loss: 0.33996352553367615, mean loss: 0.38380912306936915
Epoch: 6, step: 1269, loss: 0.32486405968666077, mean loss: 0.3838031894008184
Epoch: 6, step: 1270, loss: 0.3168995678424835, mean loss: 0.3837964552667914
Epoch: 6, step: 1271, loss: 0.3788224458694458, mean loss: 0.38379595466198085
Epoch: 6, step: 1272, loss: 0.34418267011642456, mean loss: 0.38379196821893513
Epoch: 6, step: 1273, loss: 0.3927733302116394, mean loss: 0.38379287195831857
Epoch: 6, step: 1274, loss: 0.34028053283691406, mean loss: 0.38378849401897647
Epoch: 6, step: 1275, loss: 0.3348177373409271, mean loss: 0.3837835673834958
Epoch: 6, step: 1276, loss: 0.34102657437324524, mean loss: 0.3837792663078484
Epoch: 6, step: 1277, loss: 0.3598610758781433, mean loss: 0.38377686053532484
Epoch: 6, step: 1278, loss: 0.341556191444397, mean loss: 0.383772614264673
Epoch: 6, step: 1279, loss: 0.3590034246444702, mean loss: 0.3837701233968512
Epoch: 6, step: 1280, loss: 0.3208412230014801, mean loss: 0.38376379570450375
Epoch: 6, step: 1281, loss: 0.3491952419281006, mean loss: 0.3837603200807579
Epoch: 6, step: 1282, loss: 0.3183308243751526, mean loss: 0.3837537422687839
Epoch: 6, step: 1283, loss: 0.34661850333213806, mean loss: 0.3837500093336274
Epoch: 6, step: 1284, loss: 0.3853124976158142, mean loss: 0.38375016638340953
Epoch: 6, step: 1285, loss: 0.3518123924732208, mean loss: 0.3837469565568859
Epoch: 6, step: 1286, loss: 0.31816229224205017, mean loss: 0.38374036579572474
Epoch: 6, step: 1287, loss: 0.3552425503730774, mean loss: 0.3837375022692554
Epoch: 6, step: 1288, loss: 0.33118492364883423, mean loss: 0.38373222219504455
Epoch: 6, step: 1289, loss: 0.34921616315841675, mean loss: 0.38372875463838024
Epoch: 6, step: 1290, loss: 0.3469054698944092, mean loss: 0.3837250556645235
Epoch: 6, step: 1291, loss: 0.3152933120727539, mean loss: 0.3837181822471278
Epoch: 6, step: 1292, loss: 0.3543510437011719, mean loss: 0.3837152328508693
Epoch: 6, step: 1293, loss: 0.352247953414917, mean loss: 0.3837120728509259
Epoch: 6, step: 1294, loss: 0.3624044358730316, mean loss: 0.38370993331513137
Epoch: 6, step: 1295, loss: 0.31363171339035034, mean loss: 0.3837028973492755
Epoch: 6, step: 1296, loss: 0.3208391070365906, mean loss: 0.3836965863573758
Epoch: 6, step: 1297, loss: 0.3607446849346161, mean loss: 0.383694282412242
Epoch: 6, step: 1298, loss: 0.3245232403278351, mean loss: 0.38368834333344204
Epoch: 6, step: 1299, loss: 0.39835798740386963, mean loss: 0.38368981559800147
Epoch: 6, step: 1300, loss: 0.3586348593235016, mean loss: 0.3836873013023392
Epoch: 6, step: 1301, loss: 0.39952024817466736, mean loss: 0.3836888899985937
Epoch: 6, step: 1302, loss: 0.35467007756233215, mean loss: 0.38368597850943587
Epoch: 6, step: 1303, loss: 0.32482677698135376, mean loss: 0.38368007369387325
Epoch: 6, step: 1304, loss: 0.31164711713790894, mean loss: 0.38367284799856216
Epoch: 6, step: 1305, loss: 0.3312748670578003, mean loss: 0.38366759243377374
Epoch: 6, step: 1306, loss: 0.3074440658092499, mean loss: 0.38365994791199814
Epoch: 6, step: 1307, loss: 0.3630719482898712, mean loss: 0.3836578833312097
Epoch: 6, step: 1308, loss: 0.3350856602191925, mean loss: 0.38365301295889326
Epoch: 6, step: 1309, loss: 0.3338472545146942, mean loss: 0.3836480193997952
Epoch: 6, step: 1310, loss: 0.33868223428726196, mean loss: 0.3836435115516636
Epoch: 6, step: 1311, loss: 0.41996458172798157, mean loss: 0.3836471523967093
Epoch: 6, step: 1312, loss: 0.3379204571247101, mean loss: 0.38364256918579703
Epoch: 6, step: 1313, loss: 0.3480459451675415, mean loss: 0.3836390016748712
Epoch: 6, step: 1314, loss: 0.3432419002056122, mean loss: 0.38363495346348037
Epoch: 6, step: 1315, loss: 0.3778518736362457, mean loss: 0.3836343739965638
Epoch: 6, step: 1316, loss: 0.3403201997280121, mean loss: 0.3836300343337777
Epoch: 6, step: 1317, loss: 0.3906269371509552, mean loss: 0.383630735285773
Epoch: 6, step: 1318, loss: 0.34792861342430115, mean loss: 0.38362715899389066
Epoch: 6, step: 1319, loss: 0.3307625949382782, mean loss: 0.38362186406559984
Epoch: 6, step: 1320, loss: 0.32171717286109924, mean loss: 0.38361566429682625
Epoch: 6, step: 1321, loss: 0.3445594608783722, mean loss: 0.3836117532009502
Epoch: 6, step: 1322, loss: 0.369440495967865, mean loss: 0.3836103342305654
Epoch: 6, step: 1323, loss: 0.3686501681804657, mean loss: 0.3836088364165836
Epoch: 6, step: 1324, loss: 0.3499336540699005, mean loss: 0.3836054651899997
Epoch: 6, step: 1325, loss: 0.3375883400440216, mean loss: 0.3836008588711663
Epoch: 6, step: 1326, loss: 0.3341909348964691, mean loss: 0.38359591342786986
Epoch: 6, step: 1327, loss: 0.3303253650665283, mean loss: 0.3835905821079778
Epoch: 6, step: 1328, loss: 0.3637321889400482, mean loss: 0.3835885948775998
Epoch: 6, step: 1329, loss: 0.36751362681388855, mean loss: 0.38358698641571626
Epoch: 6, step: 1330, loss: 0.3059341013431549, mean loss: 0.38357921724262245
Epoch: 6, step: 1331, loss: 0.3743530809879303, mean loss: 0.38357829425980383
Epoch: 6, step: 1332, loss: 0.32006409764289856, mean loss: 0.38357194093414443
Epoch: 6, step: 1333, loss: 0.3706512451171875, mean loss: 0.38357064860609713
Epoch: 6, step: 1334, loss: 0.3422774076461792, mean loss: 0.38356651886902743
Epoch: 6, step: 1335, loss: 0.3497256934642792, mean loss: 0.38356313478648696
Epoch: 6, step: 1336, loss: 0.3400677740573883, mean loss: 0.38355878568532414
Epoch: 6, step: 1337, loss: 0.33426061272621155, mean loss: 0.38355385685379456
Epoch: 6, step: 1338, loss: 0.33630257844924927, mean loss: 0.3835491331430673
Epoch: 6, step: 1339, loss: 0.29493263363838196, mean loss: 0.3835402750363595
Epoch: 6, step: 1340, loss: 0.3466797173023224, mean loss: 0.3835365908226929
Epoch: 6, step: 1341, loss: 0.3775484561920166, mean loss: 0.3835359923683025
Epoch: 6, step: 1342, loss: 0.3610047399997711, mean loss: 0.38353374081915004
Epoch: 6, step: 1343, loss: 0.35695573687553406, mean loss: 0.38353108514329637
Epoch: 6, step: 1344, loss: 0.3512226939201355, mean loss: 0.38352785720931465
Epoch: 6, step: 1345, loss: 0.3285469114780426, mean loss: 0.3835223646073435
Epoch: 6, step: 1346, loss: 0.3804962933063507, mean loss: 0.3835220623327155
Epoch: 6, step: 1347, loss: 0.3780462145805359, mean loss: 0.38352151540425444
Epoch: 6, step: 1348, loss: 0.3599717915058136, mean loss: 0.38351916348935394
Epoch: 6, step: 1349, loss: 0.32572728395462036, mean loss: 0.3835133923809522
Epoch: 6, step: 1350, loss: 0.4167887568473816, mean loss: 0.3835167149335699
Epoch: 6, step: 1351, loss: 0.3566518723964691, mean loss: 0.38351403274082463
Epoch: 6, step: 1352, loss: 0.37036073207855225, mean loss: 0.38351271964302464
Epoch: 6, step: 1353, loss: 0.387885719537735, mean loss: 0.3835131561572884
Epoch: 6, step: 1354, loss: 0.34639519453048706, mean loss: 0.3835094514001643
Epoch: 6, step: 1355, loss: 0.3445940315723419, mean loss: 0.3835055676257304
Epoch: 6, step: 1356, loss: 0.39401793479919434, mean loss: 0.3835066166594769
Epoch: 6, step: 1357, loss: 0.356149822473526, mean loss: 0.3835038869853414
Epoch: 6, step: 1358, loss: 0.36620140075683594, mean loss: 0.38350216070715837
Epoch: 6, step: 1359, loss: 0.33485299348831177, mean loss: 0.3834973074382818
Epoch: 6, step: 1360, loss: 0.3303500711917877, mean loss: 0.38349200596833205
Epoch: 6, step: 1361, loss: 0.34437990188598633, mean loss: 0.3834881049006997
Epoch: 6, step: 1362, loss: 0.3154149651527405, mean loss: 0.3834813159169809
Epoch: 6, step: 1363, loss: 0.3955058753490448, mean loss: 0.38348251501544844
Epoch: 6, step: 1364, loss: 0.34328287839889526, mean loss: 0.3834785066759713
Epoch: 6, step: 1365, loss: 0.3223433196544647, mean loss: 0.3834724114429681
Epoch: 6, step: 1366, loss: 0.35355231165885925, mean loss: 0.3834694286795563
Epoch: 6, step: 1367, loss: 0.35147324204444885, mean loss: 0.38346623926701295
Epoch: 6, step: 1368, loss: 0.3856050968170166, mean loss: 0.3834664524492665
Epoch: 6, step: 1369, loss: 0.3173971176147461, mean loss: 0.38345986790323955
Epoch: 6, step: 1370, loss: 0.38110020756721497, mean loss: 0.38345963276020656
Epoch: 6, step: 1371, loss: 0.33693480491638184, mean loss: 0.3834549969662803
Epoch: 6, step: 1372, loss: 0.33737999200820923, mean loss: 0.38345040645069217
Epoch: 6, step: 1373, loss: 0.3678325414657593, mean loss: 0.38344885057651557
Epoch: 6, step: 1374, loss: 0.3703587055206299, mean loss: 0.38344754664733377
Epoch: 6, step: 1375, loss: 0.38534948229789734, mean loss: 0.3834477360831555
Epoch: 6, step: 1376, loss: 0.34681421518325806, mean loss: 0.38344408768947963
Epoch: 6, step: 1377, loss: 0.3434903025627136, mean loss: 0.383440109021373
Epoch: 6, step: 1378, loss: 0.3602355718612671, mean loss: 0.38343779850288645
Epoch: 6, step: 1379, loss: 0.367413192987442, mean loss: 0.3834362030622736
Epoch: 6, step: 1380, loss: 0.38306793570518494, mean loss: 0.3834361664005158
Epoch: 6, step: 1381, loss: 0.31428346037864685, mean loss: 0.3834292827945013
Epoch: 6, step: 1382, loss: 0.3028546869754791, mean loss: 0.38342126302782276
Epoch: 6, step: 1383, loss: 0.3466189503669739, mean loss: 0.3834176003772793
Epoch: 6, step: 1384, loss: 0.32203570008277893, mean loss: 0.3834114921177217
Epoch: 6, step: 1385, loss: 0.33771273493766785, mean loss: 0.3834069449777038
Epoch: 6, step: 1386, loss: 0.35348641872406006, mean loss: 0.3834039681071184
Epoch: 6, step: 1387, loss: 0.3285558223724365, mean loss: 0.38339851166603856
Epoch: 6, step: 1388, loss: 0.3545439839363098, mean loss: 0.3833956414255402
Epoch: 6, step: 1389, loss: 0.3772170841693878, mean loss: 0.3833950268883156
Epoch: 6, step: 1390, loss: 0.4315411150455475, mean loss: 0.38339981516162813
Epoch: 6, step: 1391, loss: 0.35169437527656555, mean loss: 0.3833966622738114
Epoch: 6, step: 1392, loss: 0.3538046181201935, mean loss: 0.3833937198412616
Epoch: 6, step: 1393, loss: 0.3608558773994446, mean loss: 0.3833914790535859
Epoch: 6, step: 1394, loss: 0.3506869375705719, mean loss: 0.3833882277819403
Epoch: 6, step: 1395, loss: 0.3310079872608185, mean loss: 0.38338302099858834
Epoch: 6, step: 1396, loss: 0.3409889042377472, mean loss: 0.3833788072905314
Epoch: 6, step: 1397, loss: 0.38537487387657166, mean loss: 0.38337900566725436
Epoch: 6, step: 1398, loss: 0.32683610916137695, mean loss: 0.3833733867766148
Epoch: 6, step: 1399, loss: 0.3063720762729645, mean loss: 0.3833657356130115
Epoch: 6, step: 1400, loss: 0.34017297625541687, mean loss: 0.38336144423105845
Epoch: 6, step: 1401, loss: 0.35841014981269836, mean loss: 0.3833589654614957
Epoch: 6, step: 1402, loss: 0.32947611808776855, mean loss: 0.3833536130379958
Epoch: 6, step: 1403, loss: 0.3489837646484375, mean loss: 0.383350199266801
Epoch: 6, step: 1404, loss: 0.3612361550331116, mean loss: 0.3833480030165046
Epoch: 6, step: 1405, loss: 0.3251919746398926, mean loss: 0.3833422278399032
Epoch: 6, step: 1406, loss: 0.36873748898506165, mean loss: 0.3833407776622788
Epoch: 6, step: 1407, loss: 0.32936570048332214, mean loss: 0.3833354187388099
Epoch: 6, step: 1408, loss: 0.380043089389801, mean loss: 0.3833350918918577
Epoch: 6, step: 1409, loss: 0.3575754761695862, mean loss: 0.3833325348523776
Epoch: 6, step: 1410, loss: 0.3499753773212433, mean loss: 0.3833292239682554
Epoch: 6, step: 1411, loss: 0.32520562410354614, mean loss: 0.3833234554490152
Epoch: 6, step: 1412, loss: 0.32490259408950806, mean loss: 0.38331765800321194
Epoch: 6, step: 1413, loss: 0.3202306926250458, mean loss: 0.38331139813365667
Epoch: 6, step: 1414, loss: 0.35663339495658875, mean loss: 0.38330875124376906
Epoch: 6, step: 1415, loss: 0.34295615553855896, mean loss: 0.38330474801006814
Epoch: 6, step: 1416, loss: 0.3261054754257202, mean loss: 0.38329907404195146
Epoch: 6, step: 1417, loss: 0.34792467951774597, mean loss: 0.38329556537357967
Epoch: 6, step: 1418, loss: 0.3949477970600128, mean loss: 0.38329672100500745
Epoch: 6, step: 1419, loss: 0.3205496668815613, mean loss: 0.3832904985680654
Epoch: 6, step: 1420, loss: 0.3597683608531952, mean loss: 0.38328816617959593
Epoch: 6, step: 1421, loss: 0.3362392783164978, mean loss: 0.38328350140784667
Epoch: 6, step: 1422, loss: 0.3381272852420807, mean loss: 0.38327902473329867
Epoch: 6, step: 1423, loss: 0.33438193798065186, mean loss: 0.38327417767870386
Epoch: 6, step: 1424, loss: 0.3291330933570862, mean loss: 0.38326881133076834
Epoch: 6, step: 1425, loss: 0.3241509199142456, mean loss: 0.3832629522731453
Epoch: 6, step: 1426, loss: 0.3649207651615143, mean loss: 0.3832611345953025
Epoch: 6, step: 1427, loss: 0.3458421230316162, mean loss: 0.38325742680580943
Epoch: 6, step: 1428, loss: 0.3512365520000458, mean loss: 0.38325425422334575
Epoch: 6, step: 1429, loss: 0.3286855220794678, mean loss: 0.38324884816706045
Epoch: 6, step: 1430, loss: 0.32337626814842224, mean loss: 0.38324291725274456
Epoch: 6, step: 1431, loss: 0.35462433099746704, mean loss: 0.3832400826067209
Epoch: 6, step: 1432, loss: 0.3604878783226013, mean loss: 0.3832378292439117
Epoch: 6, step: 1433, loss: 0.33314672112464905, mean loss: 0.3832328687459795
Epoch: 6, step: 1434, loss: 0.3404090404510498, mean loss: 0.38322862834313814
Epoch: 6, step: 1435, loss: 0.3426974415779114, mean loss: 0.3832246153543495
Epoch: 6, step: 1436, loss: 0.3365691006183624, mean loss: 0.3832199964537717
Epoch: 6, step: 1437, loss: 0.35448622703552246, mean loss: 0.383217152089347
Epoch: 6, step: 1438, loss: 0.32965919375419617, mean loss: 0.38321185089580695
Epoch: 6, step: 1439, loss: 0.340148001909256, mean loss: 0.3832075888363269
Epoch: 6, step: 1440, loss: 0.3034433126449585, mean loss: 0.3831996952909344
Epoch: 6, step: 1441, loss: 0.3227427005767822, mean loss: 0.3831937130037076
Epoch: 6, step: 1442, loss: 0.3350658416748047, mean loss: 0.38318895116821444
Epoch: 6, step: 1443, loss: 0.3161145746707916, mean loss: 0.38318231539689496
Valid: 6, mean loss: 0.21004673341910046
Epoch: 7, step: 0, loss: 0.35964149236679077, mean loss: 0.38317998669741626
Epoch: 7, step: 1, loss: 0.3518894910812378, mean loss: 0.38317689169290425
Epoch: 7, step: 2, loss: 0.3285192847251892, mean loss: 0.38317148593610795
Epoch: 7, step: 3, loss: 0.32958468794822693, mean loss: 0.38316618660877527
Epoch: 7, step: 4, loss: 0.36232131719589233, mean loss: 0.3831641254133424
Epoch: 7, step: 5, loss: 0.3262050151824951, mean loss: 0.383158493703808
Epoch: 7, step: 6, loss: 0.3016863465309143, mean loss: 0.3831504391168408
Epoch: 7, step: 7, loss: 0.3569580018520355, mean loss: 0.3831478499079376
Epoch: 7, step: 8, loss: 0.40356457233428955, mean loss: 0.38314986796886735
Epoch: 7, step: 9, loss: 0.41498658061027527, mean loss: 0.3831530145109351
Epoch: 7, step: 10, loss: 0.35703709721565247, mean loss: 0.38315043363166884
Epoch: 7, step: 11, loss: 0.3884350061416626, mean loss: 0.3831509558226283
Epoch: 7, step: 12, loss: 0.38458555936813354, mean loss: 0.3831510975678655
Epoch: 7, step: 13, loss: 0.3394952714443207, mean loss: 0.3831467846034194
Epoch: 7, step: 14, loss: 0.3405149281024933, mean loss: 0.38314257321781225
Epoch: 7, step: 15, loss: 0.35268741846084595, mean loss: 0.38313956500418556
Epoch: 7, step: 16, loss: 0.35970425605773926, mean loss: 0.38313725040577107
Epoch: 7, step: 17, loss: 0.3548433184623718, mean loss: 0.38313445621932596
Epoch: 7, step: 18, loss: 0.3674928545951843, mean loss: 0.383132911674878
Epoch: 7, step: 19, loss: 0.35568156838417053, mean loss: 0.3831302012341897
Epoch: 7, step: 20, loss: 0.32458481192588806, mean loss: 0.3831244212569651
Epoch: 7, step: 21, loss: 0.3577091097831726, mean loss: 0.38312191234171594
Epoch: 7, step: 22, loss: 0.35552191734313965, mean loss: 0.3831191880306905
Epoch: 7, step: 23, loss: 0.35461440682411194, mean loss: 0.3831163746886843
Epoch: 7, step: 24, loss: 0.3414742648601532, mean loss: 0.38311226513476854
Epoch: 7, step: 25, loss: 0.39772623777389526, mean loss: 0.38311370720824783
Epoch: 7, step: 26, loss: 0.32045915722846985, mean loss: 0.3831075252102232
Epoch: 7, step: 27, loss: 0.3567970395088196, mean loss: 0.3831049294638043
Epoch: 7, step: 28, loss: 0.3623789846897125, mean loss: 0.38310288488012334
Epoch: 7, step: 29, loss: 0.37445980310440063, mean loss: 0.3831020323370403
Epoch: 7, step: 30, loss: 0.3523562252521515, mean loss: 0.3830989999071079
Epoch: 7, step: 31, loss: 0.32910820841789246, mean loss: 0.38309367537145805
Epoch: 7, step: 32, loss: 0.3466458320617676, mean loss: 0.38309008126404165
Epoch: 7, step: 33, loss: 0.3592366874217987, mean loss: 0.3830877293222311
Epoch: 7, step: 34, loss: 0.32737624645233154, mean loss: 0.38308223671818203
Epoch: 7, step: 35, loss: 0.3554386794567108, mean loss: 0.3830795116040987
Epoch: 7, step: 36, loss: 0.3547566533088684, mean loss: 0.38307671979943675
Epoch: 7, step: 37, loss: 0.3362041115760803, mean loss: 0.3830720999878634
Epoch: 7, step: 38, loss: 0.31443551182746887, mean loss: 0.38306533576315066
Epoch: 7, step: 39, loss: 0.3610062301158905, mean loss: 0.38306316202392643
Epoch: 7, step: 40, loss: 0.3353026509284973, mean loss: 0.3830584560912143
Epoch: 7, step: 41, loss: 0.3401228189468384, mean loss: 0.3830542259791804
Epoch: 7, step: 42, loss: 0.3010239601135254, mean loss: 0.3830461449757457
Epoch: 7, step: 43, loss: 0.35775789618492126, mean loss: 0.38304365401349283
Epoch: 7, step: 44, loss: 0.35939568281173706, mean loss: 0.3830413248525353
Epoch: 7, step: 45, loss: 0.329317569732666, mean loss: 0.38303603395681735
Epoch: 7, step: 46, loss: 0.37802234292030334, mean loss: 0.38303554024031944
Epoch: 7, step: 47, loss: 0.3178166151046753, mean loss: 0.3830291185265408
Epoch: 7, step: 48, loss: 0.3332645893096924, mean loss: 0.3830242189962448
Epoch: 7, step: 49, loss: 0.34922003746032715, mean loss: 0.38302089115793647
Epoch: 7, step: 50, loss: 0.36854448914527893, mean loss: 0.38301946617496446
Epoch: 7, step: 51, loss: 0.36890506744384766, mean loss: 0.3830180769624909
Epoch: 7, step: 52, loss: 0.3570556640625, mean loss: 0.3830155218583771
Epoch: 7, step: 53, loss: 0.34903690218925476, mean loss: 0.383012178164255
Epoch: 7, step: 54, loss: 0.3808727264404297, mean loss: 0.3830119676504575
Epoch: 7, step: 55, loss: 0.3455837368965149, mean loss: 0.38300828521925384
Epoch: 7, step: 56, loss: 0.35068464279174805, mean loss: 0.3830051053232944
Epoch: 7, step: 57, loss: 0.33250415325164795, mean loss: 0.3830001376907869
Epoch: 7, step: 58, loss: 0.3844098448753357, mean loss: 0.3830002763459639
Epoch: 7, step: 59, loss: 0.353208988904953, mean loss: 0.38299734643964595
Epoch: 7, step: 60, loss: 0.32414916157722473, mean loss: 0.38299155942176194
Epoch: 7, step: 61, loss: 0.34698089957237244, mean loss: 0.38298801855058695
Epoch: 7, step: 62, loss: 0.32459932565689087, mean loss: 0.38298227784732336
Epoch: 7, step: 63, loss: 0.37021487951278687, mean loss: 0.3829810226960911
Epoch: 7, step: 64, loss: 0.36053571105003357, mean loss: 0.3829788163349738
Epoch: 7, step: 65, loss: 0.3627545237541199, mean loss: 0.38297682849414616
Epoch: 7, step: 66, loss: 0.36876240372657776, mean loss: 0.38297543149908303
Epoch: 7, step: 67, loss: 0.3550630211830139, mean loss: 0.3829726885342328
Epoch: 7, step: 68, loss: 0.34788137674331665, mean loss: 0.3829692404344204
Epoch: 7, step: 69, loss: 0.3434160649776459, mean loss: 0.3829653542902411
Epoch: 7, step: 70, loss: 0.38527920842170715, mean loss: 0.3829655816066898
Epoch: 7, step: 71, loss: 0.37718719244003296, mean loss: 0.3829650139849642
Epoch: 7, step: 72, loss: 0.3315243721008301, mean loss: 0.3829599613730514
Epoch: 7, step: 73, loss: 0.38548681139945984, mean loss: 0.38296020954139026
Epoch: 7, step: 74, loss: 0.3149113655090332, mean loss: 0.38295352694843804
Epoch: 7, step: 75, loss: 0.3469271659851074, mean loss: 0.38294998940317454
Epoch: 7, step: 76, loss: 0.34886273741722107, mean loss: 0.3829466425939467
Epoch: 7, step: 77, loss: 0.31349390745162964, mean loss: 0.3829398241436087
Epoch: 7, step: 78, loss: 0.35837695002555847, mean loss: 0.3829374129455997
Epoch: 7, step: 79, loss: 0.33186274766921997, mean loss: 0.382932399727571
Epoch: 7, step: 80, loss: 0.33297136425971985, mean loss: 0.38292749629882744
Epoch: 7, step: 81, loss: 0.31995657086372375, mean loss: 0.38292131662017825
Epoch: 7, step: 82, loss: 0.35717207193374634, mean loss: 0.3829187899550142
Epoch: 7, step: 83, loss: 0.31570306420326233, mean loss: 0.3829121950054703
Epoch: 7, step: 84, loss: 0.37875720858573914, mean loss: 0.3829117873741135
Epoch: 7, step: 85, loss: 0.3960798382759094, mean loss: 0.3829130791193462
Epoch: 7, step: 86, loss: 0.3388438820838928, mean loss: 0.3829087564908974
Epoch: 7, step: 87, loss: 0.33143022656440735, mean loss: 0.38290370759624004
Epoch: 7, step: 88, loss: 0.32293230295181274, mean loss: 0.38289782631697705
Epoch: 7, step: 89, loss: 0.37422439455986023, mean loss: 0.3828969758137649
Epoch: 7, step: 90, loss: 0.35781610012054443, mean loss: 0.38289451666329005
Epoch: 7, step: 91, loss: 0.3292475938796997, mean loss: 0.3828892571610564
Epoch: 7, step: 92, loss: 0.38272061944007874, mean loss: 0.3828892406295672
Epoch: 7, step: 93, loss: 0.33053284883499146, mean loss: 0.3828841086562488
Epoch: 7, step: 94, loss: 0.33925554156303406, mean loss: 0.382879832603412
Epoch: 7, step: 95, loss: 0.3505365550518036, mean loss: 0.38287666293685463
Epoch: 7, step: 96, loss: 0.3332691490650177, mean loss: 0.3828718018379941
Epoch: 7, step: 97, loss: 0.3448454737663269, mean loss: 0.3828680759583084
Epoch: 7, step: 98, loss: 0.3885814845561981, mean loss: 0.3828686357122614
Epoch: 7, step: 99, loss: 0.3068733811378479, mean loss: 0.38286119103606875
Epoch: 7, step: 100, loss: 0.3284487724304199, mean loss: 0.38285586118803216
Epoch: 7, step: 101, loss: 0.33451730012893677, mean loss: 0.38285112675501953
Epoch: 7, step: 102, loss: 0.32053881883621216, mean loss: 0.3828450242863173
Epoch: 7, step: 103, loss: 0.3228030204772949, mean loss: 0.38283914473247777
Epoch: 7, step: 104, loss: 0.3420711159706116, mean loss: 0.38283515295447307
Epoch: 7, step: 105, loss: 0.33156412839889526, mean loss: 0.3828301332731968
Epoch: 7, step: 106, loss: 0.35569727420806885, mean loss: 0.382827477095119
Epoch: 7, step: 107, loss: 0.3372879922389984, mean loss: 0.38282301943215347
Epoch: 7, step: 108, loss: 0.3590119183063507, mean loss: 0.38282068889470355
Epoch: 7, step: 109, loss: 0.3489204943180084, mean loss: 0.3828173712009693
Epoch: 7, step: 110, loss: 0.39441537857055664, mean loss: 0.38281850614640134
Epoch: 7, step: 111, loss: 0.32544034719467163, mean loss: 0.38281289184513406
Epoch: 7, step: 112, loss: 0.32518336176872253, mean loss: 0.3828072534995635
Epoch: 7, step: 113, loss: 0.311788946390152, mean loss: 0.38280030590544206
Epoch: 7, step: 114, loss: 0.31468141078948975, mean loss: 0.3827936426074751
Epoch: 7, step: 115, loss: 0.33947035670280457, mean loss: 0.3827894051968819
Epoch: 7, step: 116, loss: 0.320227712392807, mean loss: 0.3827832866939182
Epoch: 7, step: 117, loss: 0.3482963442802429, mean loss: 0.3827799142176407
Epoch: 7, step: 118, loss: 0.3164588212966919, mean loss: 0.38277342931562436
Epoch: 7, step: 119, loss: 0.33462023735046387, mean loss: 0.3827687213383106
Epoch: 7, step: 120, loss: 0.38720235228538513, mean loss: 0.3827691547756893
Epoch: 7, step: 121, loss: 0.3134691119194031, mean loss: 0.38276238057795164
Epoch: 7, step: 122, loss: 0.3299078345298767, mean loss: 0.38275721446065636
Epoch: 7, step: 123, loss: 0.3657270669937134, mean loss: 0.3827555500600048
Epoch: 7, step: 124, loss: 0.31916797161102295, mean loss: 0.3827493360877143
Epoch: 7, step: 125, loss: 0.35739463567733765, mean loss: 0.38274685859109414
Epoch: 7, step: 126, loss: 0.3321903645992279, mean loss: 0.38274191902157856
Epoch: 7, step: 127, loss: 0.39042723178863525, mean loss: 0.38274266983368943
Epoch: 7, step: 128, loss: 0.3231534957885742, mean loss: 0.38273684887305204
Epoch: 7, step: 129, loss: 0.34322553873062134, mean loss: 0.3827329895929053
Epoch: 7, step: 130, loss: 0.35376453399658203, mean loss: 0.38273016036587176
Epoch: 7, step: 131, loss: 0.320497065782547, mean loss: 0.38272408291522886
Epoch: 7, step: 132, loss: 0.3696015477180481, mean loss: 0.38272280154278504
Epoch: 7, step: 133, loss: 0.38710886240005493, mean loss: 0.3827232297853995
Epoch: 7, step: 134, loss: 0.3543891906738281, mean loss: 0.38272046359979844
Epoch: 7, step: 135, loss: 0.38311484456062317, mean loss: 0.3827205020985256
Epoch: 7, step: 136, loss: 0.37419942021369934, mean loss: 0.38271967036774135
Epoch: 7, step: 137, loss: 0.3749835193157196, mean loss: 0.3827189153266471
Epoch: 7, step: 138, loss: 0.3520025610923767, mean loss: 0.382715917731816
Epoch: 7, step: 139, loss: 0.33389517664909363, mean loss: 0.3827111538031389
Epoch: 7, step: 140, loss: 0.3814862370491028, mean loss: 0.38271103428740527
Epoch: 7, step: 141, loss: 0.3280251920223236, mean loss: 0.38270569908328184
Epoch: 7, step: 142, loss: 0.33305370807647705, mean loss: 0.38270085545914695
Epoch: 7, step: 143, loss: 0.36250466108322144, mean loss: 0.3826988854831056
Epoch: 7, step: 144, loss: 0.32046613097190857, mean loss: 0.3826928157713616
Epoch: 7, step: 145, loss: 0.42762574553489685, mean loss: 0.3826971977617813
Epoch: 7, step: 146, loss: 0.3465667963027954, mean loss: 0.38269367456319925
Epoch: 7, step: 147, loss: 0.35843729972839355, mean loss: 0.3826913094720492
Epoch: 7, step: 148, loss: 0.35051706433296204, mean loss: 0.3826881726635146
Epoch: 7, step: 149, loss: 0.296225368976593, mean loss: 0.3826797438466218
Epoch: 7, step: 150, loss: 0.3598135709762573, mean loss: 0.3826775149575614
Epoch: 7, step: 151, loss: 0.33314043283462524, mean loss: 0.3826726867819159
Epoch: 7, step: 152, loss: 0.3369598090648651, mean loss: 0.38266823176995635
Epoch: 7, step: 153, loss: 0.35560062527656555, mean loss: 0.3826655941158447
Epoch: 7, step: 154, loss: 0.36209526658058167, mean loss: 0.3826635897966851
Epoch: 7, step: 155, loss: 0.397494912147522, mean loss: 0.38266503478132563
Epoch: 7, step: 156, loss: 0.36868688464164734, mean loss: 0.3826636730521352
Epoch: 7, step: 157, loss: 0.32561102509498596, mean loss: 0.382658115615163
Epoch: 7, step: 158, loss: 0.34190604090690613, mean loss: 0.38265414638610795
Epoch: 7, step: 159, loss: 0.3833045959472656, mean loss: 0.3826542097333578
Epoch: 7, step: 160, loss: 0.3527412712574005, mean loss: 0.38265129679748516
Epoch: 7, step: 161, loss: 0.32074064016342163, mean loss: 0.38264526849596286
Epoch: 7, step: 162, loss: 0.30062180757522583, mean loss: 0.3826372825685049
Epoch: 7, step: 163, loss: 0.3568148910999298, mean loss: 0.38263476870640706
Epoch: 7, step: 164, loss: 0.3478461503982544, mean loss: 0.3826313822936447
Epoch: 7, step: 165, loss: 0.378041535615921, mean loss: 0.38263093554975935
Epoch: 7, step: 166, loss: 0.33494824171066284, mean loss: 0.3826262948982908
Epoch: 7, step: 167, loss: 0.32905787229537964, mean loss: 0.3826210819338491
Epoch: 7, step: 168, loss: 0.3393554985523224, mean loss: 0.3826168719909298
Epoch: 7, step: 169, loss: 0.33860814571380615, mean loss: 0.38261259015338583
Epoch: 7, step: 170, loss: 0.3524789810180664, mean loss: 0.3826096585832783
Epoch: 7, step: 171, loss: 0.32066065073013306, mean loss: 0.3826036324151992
Epoch: 7, step: 172, loss: 0.2891017198562622, mean loss: 0.38259453778310515
Epoch: 7, step: 173, loss: 0.31330883502960205, mean loss: 0.38258779923975234
Epoch: 7, step: 174, loss: 0.3214409649372101, mean loss: 0.3825818528394506
Epoch: 7, step: 175, loss: 0.36640802025794983, mean loss: 0.3825802801213855
Epoch: 7, step: 176, loss: 0.33539173007011414, mean loss: 0.3825756920270684
Epoch: 7, step: 177, loss: 0.38135045766830444, mean loss: 0.38257557291037014
Epoch: 7, step: 178, loss: 0.3544212877750397, mean loss: 0.3825728360303142
Epoch: 7, step: 179, loss: 0.3672923147678375, mean loss: 0.3825713507541417
Epoch: 7, step: 180, loss: 0.3813932240009308, mean loss: 0.38257123625061823
Epoch: 7, step: 181, loss: 0.34112077951431274, mean loss: 0.38256720802353017
Epoch: 7, step: 182, loss: 0.30536842346191406, mean loss: 0.3825597064411221
Epoch: 7, step: 183, loss: 0.37042102217674255, mean loss: 0.38255852701202525
Epoch: 7, step: 184, loss: 0.3515073359012604, mean loss: 0.3825555102830725
Epoch: 7, step: 185, loss: 0.37498462200164795, mean loss: 0.3825547748169484
Epoch: 7, step: 186, loss: 0.34643304347991943, mean loss: 0.3825512661495043
Epoch: 7, step: 187, loss: 0.3450550436973572, mean loss: 0.3825476243252568
Epoch: 7, step: 188, loss: 0.3611370325088501, mean loss: 0.3825455450213997
Epoch: 7, step: 189, loss: 0.36372366547584534, mean loss: 0.3825437172995561
Epoch: 7, step: 190, loss: 0.3234789967536926, mean loss: 0.3825379823038725
Epoch: 7, step: 191, loss: 0.35377442836761475, mean loss: 0.3825351897258204
Epoch: 7, step: 192, loss: 0.35995012521743774, mean loss: 0.3825329972139761
Epoch: 7, step: 193, loss: 0.33279651403427124, mean loss: 0.38252816936664746
Epoch: 7, step: 194, loss: 0.34910568594932556, mean loss: 0.3825249254101865
Epoch: 7, step: 195, loss: 0.34597477316856384, mean loss: 0.38252137822926247
Epoch: 7, step: 196, loss: 0.39171102643013, mean loss: 0.3825222699952208
Epoch: 7, step: 197, loss: 0.36464834213256836, mean loss: 0.3825205356727036
Epoch: 7, step: 198, loss: 0.3595966696739197, mean loss: 0.38251831156617416
Epoch: 7, step: 199, loss: 0.32313576340675354, mean loss: 0.38251255074466084
Epoch: 7, step: 200, loss: 0.31858184933662415, mean loss: 0.38250634929918526
Epoch: 7, step: 201, loss: 0.38944876194000244, mean loss: 0.3825070226660757
Epoch: 7, step: 202, loss: 0.35120585560798645, mean loss: 0.382503986959834
Epoch: 7, step: 203, loss: 0.3494855761528015, mean loss: 0.382500785019298
Epoch: 7, step: 204, loss: 0.3498770296573639, mean loss: 0.3824976216570017
Epoch: 7, step: 205, loss: 0.32917290925979614, mean loss: 0.3824924515278183
Epoch: 7, step: 206, loss: 0.336396723985672, mean loss: 0.38248798272243373
Epoch: 7, step: 207, loss: 0.3514254689216614, mean loss: 0.38248497162183265
Epoch: 7, step: 208, loss: 0.34945783019065857, mean loss: 0.38248177038683884
Epoch: 7, step: 209, loss: 0.3470015525817871, mean loss: 0.38247833171482826
Epoch: 7, step: 210, loss: 0.33895421028137207, mean loss: 0.3824741138524934
Epoch: 7, step: 211, loss: 0.3470029830932617, mean loss: 0.38247067672741986
Epoch: 7, step: 212, loss: 0.32773077487945557, mean loss: 0.3824653729872931
Epoch: 7, step: 213, loss: 0.32808342576026917, mean loss: 0.38246010443979966
Epoch: 7, step: 214, loss: 0.37781018018722534, mean loss: 0.38245965399668697
Epoch: 7, step: 215, loss: 0.37111786007881165, mean loss: 0.3824585554114566
Epoch: 7, step: 216, loss: 0.32919469475746155, mean loss: 0.3824533966840325
Epoch: 7, step: 217, loss: 0.34177249670028687, mean loss: 0.382449457026858
Epoch: 7, step: 218, loss: 0.2981134355068207, mean loss: 0.38244129047107994
Epoch: 7, step: 219, loss: 0.34877514839172363, mean loss: 0.3824380307749065
Epoch: 7, step: 220, loss: 0.3410646319389343, mean loss: 0.3824340252178501
Epoch: 7, step: 221, loss: 0.34603992104530334, mean loss: 0.38243050207127
Epoch: 7, step: 222, loss: 0.4283999502658844, mean loss: 0.38243495173230907
Epoch: 7, step: 223, loss: 0.343548059463501, mean loss: 0.38243118799902714
Epoch: 7, step: 224, loss: 0.3389357924461365, mean loss: 0.3824269786314134
Epoch: 7, step: 225, loss: 0.3187095820903778, mean loss: 0.3824208128295418
Epoch: 7, step: 226, loss: 0.3693470060825348, mean loss: 0.38241954782647003
Epoch: 7, step: 227, loss: 0.3524908423423767, mean loss: 0.3824166522473791
Epoch: 7, step: 228, loss: 0.3518345355987549, mean loss: 0.38241369373749723
Epoch: 7, step: 229, loss: 0.38454148173332214, mean loss: 0.3824138995595127
Epoch: 7, step: 230, loss: 0.35694095492362976, mean loss: 0.38241143578693937
Epoch: 7, step: 231, loss: 0.3048763573169708, mean loss: 0.38240393723002736
Epoch: 7, step: 232, loss: 0.3410211503505707, mean loss: 0.38239993541329015
Epoch: 7, step: 233, loss: 0.31478777527809143, mean loss: 0.3823933977841918
Epoch: 7, step: 234, loss: 0.4112916588783264, mean loss: 0.3823961917763695
Epoch: 7, step: 235, loss: 0.37879258394241333, mean loss: 0.3823958433997421
Epoch: 7, step: 236, loss: 0.32467591762542725, mean loss: 0.3823902638999089
Epoch: 7, step: 237, loss: 0.33879032731056213, mean loss: 0.3823860497169793
Epoch: 7, step: 238, loss: 0.3662988841533661, mean loss: 0.38238449495080906
Epoch: 7, step: 239, loss: 0.30821892619132996, mean loss: 0.3823773278104187
Epoch: 7, step: 240, loss: 0.3454059660434723, mean loss: 0.3823737553530057
Epoch: 7, step: 241, loss: 0.3034525513648987, mean loss: 0.3823661301159054
Epoch: 7, step: 242, loss: 0.33869469165802, mean loss: 0.3823619110608907
Epoch: 7, step: 243, loss: 0.3168061375617981, mean loss: 0.3823555783934352
Epoch: 7, step: 244, loss: 0.3920239806175232, mean loss: 0.38235651226788936
Epoch: 7, step: 245, loss: 0.3616158962249756, mean loss: 0.3823545091177983
Epoch: 7, step: 246, loss: 0.3359283208847046, mean loss: 0.3823500256616676
Epoch: 7, step: 247, loss: 0.3854711353778839, mean loss: 0.38235032704344785
Epoch: 7, step: 248, loss: 0.3469095826148987, mean loss: 0.38234690513126973
Epoch: 7, step: 249, loss: 0.3602795898914337, mean loss: 0.38234477467025024
Epoch: 7, step: 250, loss: 0.35193705558776855, mean loss: 0.38234183927889176
Epoch: 7, step: 251, loss: 0.3460446298122406, mean loss: 0.3823383356872444
Epoch: 7, step: 252, loss: 0.35052865743637085, mean loss: 0.38233526555132596
Epoch: 7, step: 253, loss: 0.3005276322364807, mean loss: 0.3823273705857484
Epoch: 7, step: 254, loss: 0.3904294967651367, mean loss: 0.38232815241786067
Epoch: 7, step: 255, loss: 0.306624174118042, mean loss: 0.3823208479043234
Epoch: 7, step: 256, loss: 0.34714648127555847, mean loss: 0.38231745433301334
Epoch: 7, step: 257, loss: 0.33038029074668884, mean loss: 0.38231244399502506
Epoch: 7, step: 258, loss: 0.33346739411354065, mean loss: 0.382307732405377
Epoch: 7, step: 259, loss: 0.32858479022979736, mean loss: 0.38230255079444186
Epoch: 7, step: 260, loss: 0.3837212324142456, mean loss: 0.3823026876139635
Epoch: 7, step: 261, loss: 0.31888994574546814, mean loss: 0.38229657259546124
Epoch: 7, step: 262, loss: 0.3223438560962677, mean loss: 0.38229079179163333
Epoch: 7, step: 263, loss: 0.36202865839004517, mean loss: 0.38228883825004045
Epoch: 7, step: 264, loss: 0.3569406569004059, mean loss: 0.3822863945807693
Epoch: 7, step: 265, loss: 0.3002217710018158, mean loss: 0.38227848397506475
Epoch: 7, step: 266, loss: 0.3930935859680176, mean loss: 0.38227952639453394
Epoch: 7, step: 267, loss: 0.4071159064769745, mean loss: 0.3822819200317817
Epoch: 7, step: 268, loss: 0.3440750241279602, mean loss: 0.3822782381491659
Epoch: 7, step: 269, loss: 0.29991912841796875, mean loss: 0.3822703022164495
Epoch: 7, step: 270, loss: 0.34501421451568604, mean loss: 0.3822667126521658
Epoch: 7, step: 271, loss: 0.31665509939193726, mean loss: 0.38226039168749715
Epoch: 7, step: 272, loss: 0.31851595640182495, mean loss: 0.3822542511966691
Epoch: 7, step: 273, loss: 0.3340369462966919, mean loss: 0.38224960687910986
Epoch: 7, step: 274, loss: 0.35921207070350647, mean loss: 0.38224738810455766
Epoch: 7, step: 275, loss: 0.3434204161167145, mean loss: 0.3822436489893816
Epoch: 7, step: 276, loss: 0.378314733505249, mean loss: 0.3822432706633841
Epoch: 7, step: 277, loss: 0.33910343050956726, mean loss: 0.3822391170103749
Epoch: 7, step: 278, loss: 0.3451959490776062, mean loss: 0.3822355507094282
Epoch: 7, step: 279, loss: 0.3252294957637787, mean loss: 0.3822300630260488
Epoch: 7, step: 280, loss: 0.4179353415966034, mean loss: 0.3822334998610252
Epoch: 7, step: 281, loss: 0.3266076147556305, mean loss: 0.382228146070351
Epoch: 7, step: 282, loss: 0.3805025815963745, mean loss: 0.3822279800069813
Epoch: 7, step: 283, loss: 0.3323448896408081, mean loss: 0.3822231798635666
Epoch: 7, step: 284, loss: 0.34881120920181274, mean loss: 0.3822199650102363
Epoch: 7, step: 285, loss: 0.3613644242286682, mean loss: 0.3822179585121815
Epoch: 7, step: 286, loss: 0.3632906377315521, mean loss: 0.38221613770210155
Epoch: 7, step: 287, loss: 0.3262425363063812, mean loss: 0.3822107535542182
Epoch: 7, step: 288, loss: 0.33660367131233215, mean loss: 0.38220636699249444
Epoch: 7, step: 289, loss: 0.3255186080932617, mean loss: 0.3822009151980244
Epoch: 7, step: 290, loss: 0.38255420327186584, mean loss: 0.38220094917129815
Epoch: 7, step: 291, loss: 0.342082679271698, mean loss: 0.38219709164534627
Epoch: 7, step: 292, loss: 0.31900060176849365, mean loss: 0.3821910156440121
Epoch: 7, step: 293, loss: 0.36323338747024536, mean loss: 0.38218919314562966
Epoch: 7, step: 294, loss: 0.3567953109741211, mean loss: 0.3821867521303291
Epoch: 7, step: 295, loss: 0.337289959192276, mean loss: 0.38218243679075414
Epoch: 7, step: 296, loss: 0.3631022870540619, mean loss: 0.38218060304258145
Epoch: 7, step: 297, loss: 0.3104611337184906, mean loss: 0.38217371091598873
Epoch: 7, step: 298, loss: 0.34004315733909607, mean loss: 0.38216966262603225
Epoch: 7, step: 299, loss: 0.33156660199165344, mean loss: 0.38216480068707814
Epoch: 7, step: 300, loss: 0.37914279103279114, mean loss: 0.38216451036047094
Epoch: 7, step: 301, loss: 0.34984561800956726, mean loss: 0.38216140575986085
Epoch: 7, step: 302, loss: 0.35214170813560486, mean loss: 0.3821585223002869
Epoch: 7, step: 303, loss: 0.3770069181919098, mean loss: 0.382158027524633
Epoch: 7, step: 304, loss: 0.3487345278263092, mean loss: 0.3821548177388174
Epoch: 7, step: 305, loss: 0.39191171526908875, mean loss: 0.3821557546408272
Epoch: 7, step: 306, loss: 0.32327207922935486, mean loss: 0.3821501009033897
Epoch: 7, step: 307, loss: 0.32392871379852295, mean loss: 0.38214451129249255
Epoch: 7, step: 308, loss: 0.33570849895477295, mean loss: 0.382140053577955
Epoch: 7, step: 309, loss: 0.3370217978954315, mean loss: 0.38213572277975166
Epoch: 7, step: 310, loss: 0.3266168236732483, mean loss: 0.3821303941590485
Epoch: 7, step: 311, loss: 0.348716676235199, mean loss: 0.38212718746826885
Epoch: 7, step: 312, loss: 0.3546900451183319, mean loss: 0.38212455459787736
Epoch: 7, step: 313, loss: 0.3441999852657318, mean loss: 0.382120915702336
Epoch: 7, step: 314, loss: 0.3243483304977417, mean loss: 0.38211537290417763
Epoch: 7, step: 315, loss: 0.3485633432865143, mean loss: 0.38211215417531946
Epoch: 7, step: 316, loss: 0.3367551565170288, mean loss: 0.38210780338417716
Epoch: 7, step: 317, loss: 0.3777959644794464, mean loss: 0.3821073898181974
Epoch: 7, step: 318, loss: 0.33170458674430847, mean loss: 0.3821025559443052
Epoch: 7, step: 319, loss: 0.36260315775871277, mean loss: 0.382100686036539
Epoch: 7, step: 320, loss: 0.3092444837093353, mean loss: 0.38209370011244975
Epoch: 7, step: 321, loss: 0.3135852515697479, mean loss: 0.38208713170894615
Epoch: 7, step: 322, loss: 0.3773343861103058, mean loss: 0.38208667607232466
Epoch: 7, step: 323, loss: 0.376014769077301, mean loss: 0.3820860940260253
Epoch: 7, step: 324, loss: 0.3477512300014496, mean loss: 0.38208280303934605
Epoch: 7, step: 325, loss: 0.32634732127189636, mean loss: 0.3820774613217145
Epoch: 7, step: 326, loss: 0.3682674467563629, mean loss: 0.3820761378895568
Epoch: 7, step: 327, loss: 0.3525579571723938, mean loss: 0.3820733093938959
Epoch: 7, step: 328, loss: 0.3559896647930145, mean loss: 0.382070810242358
Epoch: 7, step: 329, loss: 0.3845866620540619, mean loss: 0.3820710512705063
Epoch: 7, step: 330, loss: 0.3389602601528168, mean loss: 0.38206692148881094
Epoch: 7, step: 331, loss: 0.3263433277606964, mean loss: 0.38206158397983314
Epoch: 7, step: 332, loss: 0.3353346884250641, mean loss: 0.3820571086522252
Epoch: 7, step: 333, loss: 0.3289669156074524, mean loss: 0.3820520243586948
Epoch: 7, step: 334, loss: 0.35714784264564514, mean loss: 0.38204963958595584
Epoch: 7, step: 335, loss: 0.3447927236557007, mean loss: 0.38204607228263043
Epoch: 7, step: 336, loss: 0.35266631841659546, mean loss: 0.38204325947709034
Epoch: 7, step: 337, loss: 0.3460952937602997, mean loss: 0.38203981816312166
Epoch: 7, step: 338, loss: 0.35516226291656494, mean loss: 0.38203724540967604
Epoch: 7, step: 339, loss: 0.34460845589637756, mean loss: 0.38203366302170577
Epoch: 7, step: 340, loss: 0.3212885856628418, mean loss: 0.3820278495393286
Epoch: 7, step: 341, loss: 0.3636902868747711, mean loss: 0.382026094748643
Epoch: 7, step: 342, loss: 0.37114784121513367, mean loss: 0.38202505386704955
Epoch: 7, step: 343, loss: 0.32169121503829956, mean loss: 0.38201928139873453
Epoch: 7, step: 344, loss: 0.3615581691265106, mean loss: 0.38201732395950444
Epoch: 7, step: 345, loss: 0.3529154360294342, mean loss: 0.382014540155417
Epoch: 7, step: 346, loss: 0.3668018579483032, mean loss: 0.3820130850925565
Epoch: 7, step: 347, loss: 0.35819002985954285, mean loss: 0.3820108066825304
Epoch: 7, step: 348, loss: 0.32013586163520813, mean loss: 0.3820048895987542
Epoch: 7, step: 349, loss: 0.3627423048019409, mean loss: 0.3820030476992709
Epoch: 7, step: 350, loss: 0.3798227906227112, mean loss: 0.38200283924176287
Epoch: 7, step: 351, loss: 0.3567926287651062, mean loss: 0.38200042908779763
Epoch: 7, step: 352, loss: 0.3424544334411621, mean loss: 0.3819966487612852
Epoch: 7, step: 353, loss: 0.3704301416873932, mean loss: 0.3819955431880608
Epoch: 7, step: 354, loss: 0.3367546796798706, mean loss: 0.38199121929782776
Epoch: 7, step: 355, loss: 0.3825116753578186, mean loss: 0.3819912690356011
Epoch: 7, step: 356, loss: 0.3567952811717987, mean loss: 0.3819888613922314
Epoch: 7, step: 357, loss: 0.35213297605514526, mean loss: 0.3819860087374123
Epoch: 7, step: 358, loss: 0.3323167562484741, mean loss: 0.3819812634185541
Epoch: 7, step: 359, loss: 0.33897215127944946, mean loss: 0.38197715479110483
Epoch: 7, step: 360, loss: 0.33982834219932556, mean loss: 0.3819731287320169
Epoch: 7, step: 361, loss: 0.3605329394340515, mean loss: 0.38197108095844495
Epoch: 7, step: 362, loss: 0.34544479846954346, mean loss: 0.3819675926304449
Epoch: 7, step: 363, loss: 0.3294106721878052, mean loss: 0.38196257382597176
Epoch: 7, step: 364, loss: 0.33700862526893616, mean loss: 0.3819582814600253
Epoch: 7, step: 365, loss: 0.3655398488044739, mean loss: 0.3819567139182404
Epoch: 7, step: 366, loss: 0.41368159651756287, mean loss: 0.3819597425466508
Epoch: 7, step: 367, loss: 0.2995462417602539, mean loss: 0.38195187566035965
Epoch: 7, step: 368, loss: 0.33771681785583496, mean loss: 0.3819476535492778
Epoch: 7, step: 369, loss: 0.3353985846042633, mean loss: 0.3819432109964104
Epoch: 7, step: 370, loss: 0.3700920045375824, mean loss: 0.38194208004818453
Epoch: 7, step: 371, loss: 0.3507501184940338, mean loss: 0.38193910371597517
Epoch: 7, step: 372, loss: 0.3499210476875305, mean loss: 0.3819360488494521
Epoch: 7, step: 373, loss: 0.33928796648979187, mean loss: 0.38193198015241336
Epoch: 7, step: 374, loss: 0.306504487991333, mean loss: 0.3819247849323274
Epoch: 7, step: 375, loss: 0.3427260220050812, mean loss: 0.3819210460194194
Epoch: 7, step: 376, loss: 0.30799126625061035, mean loss: 0.3819139950151496
Epoch: 7, step: 377, loss: 0.33506864309310913, mean loss: 0.3819095275965036
Epoch: 7, step: 378, loss: 0.34969577193260193, mean loss: 0.38190645581661764
Epoch: 7, step: 379, loss: 0.44109371304512024, mean loss: 0.3819120991477798
Epoch: 7, step: 380, loss: 0.3914868235588074, mean loss: 0.38191301198259825
Epoch: 7, step: 381, loss: 0.3947538733482361, mean loss: 0.38191423608759023
Epoch: 7, step: 382, loss: 0.36977213621139526, mean loss: 0.3819130787050837
Epoch: 7, step: 383, loss: 0.3705345392227173, mean loss: 0.3819119942083736
Epoch: 7, step: 384, loss: 0.3059597313404083, mean loss: 0.38190475583394606
Epoch: 7, step: 385, loss: 0.3045572340488434, mean loss: 0.3818973851915042
Epoch: 7, step: 386, loss: 0.395973801612854, mean loss: 0.3818987264412823
Epoch: 7, step: 387, loss: 0.3698778748512268, mean loss: 0.38189758116197686
Epoch: 7, step: 388, loss: 0.36466649174690247, mean loss: 0.38189593963683494
Epoch: 7, step: 389, loss: 0.32518720626831055, mean loss: 0.3818905377761597
Epoch: 7, step: 390, loss: 0.33116021752357483, mean loss: 0.3818857058569053
Epoch: 7, step: 391, loss: 0.36027565598487854, mean loss: 0.38188364775691747
Epoch: 7, step: 392, loss: 0.37310922145843506, mean loss: 0.38188281217684905
Epoch: 7, step: 393, loss: 0.31461700797080994, mean loss: 0.38187640712979076
Epoch: 7, step: 394, loss: 0.362687885761261, mean loss: 0.3818745801735527
Epoch: 7, step: 395, loss: 0.33909595012664795, mean loss: 0.38187050756977825
Epoch: 7, step: 396, loss: 0.33664631843566895, mean loss: 0.3818662025541539
Epoch: 7, step: 397, loss: 0.3299892544746399, mean loss: 0.38186126471405496
Epoch: 7, step: 398, loss: 0.3282323479652405, mean loss: 0.3818561606009162
Epoch: 7, step: 399, loss: 0.3905826210975647, mean loss: 0.3818569910596616
Epoch: 7, step: 400, loss: 0.35535290837287903, mean loss: 0.38185446902305614
Epoch: 7, step: 401, loss: 0.34793418645858765, mean loss: 0.381851241593697
Epoch: 7, step: 402, loss: 0.372787743806839, mean loss: 0.3818503793067798
Epoch: 7, step: 403, loss: 0.3421166241168976, mean loss: 0.3818465994594444
Epoch: 7, step: 404, loss: 0.32308125495910645, mean loss: 0.38184100968064666
Epoch: 7, step: 405, loss: 0.333800733089447, mean loss: 0.381836440508439
Epoch: 7, step: 406, loss: 0.3348763883113861, mean loss: 0.38183197450252393
Epoch: 7, step: 407, loss: 0.35140275955200195, mean loss: 0.3818290808913647
Epoch: 7, step: 408, loss: 0.3197220265865326, mean loss: 0.3818231754949299
Epoch: 7, step: 409, loss: 0.3484320342540741, mean loss: 0.3818200008285256
Epoch: 7, step: 410, loss: 0.3187463879585266, mean loss: 0.38181400466797133
Epoch: 7, step: 411, loss: 0.33794423937797546, mean loss: 0.3818098345381909
Epoch: 7, step: 412, loss: 0.35277503728866577, mean loss: 0.381807074838804
Epoch: 7, step: 413, loss: 0.37158697843551636, mean loss: 0.38180610353140965
Epoch: 7, step: 414, loss: 0.3628941774368286, mean loss: 0.38180430633231294
Epoch: 7, step: 415, loss: 0.3552951514720917, mean loss: 0.38180178740843795
Epoch: 7, step: 416, loss: 0.32444092631340027, mean loss: 0.38179633744538855
Epoch: 7, step: 417, loss: 0.34283584356307983, mean loss: 0.38179263608742897
Epoch: 7, step: 418, loss: 0.35346707701683044, mean loss: 0.38178994533421623
Epoch: 7, step: 419, loss: 0.33834725618362427, mean loss: 0.3817858189389702
Epoch: 7, step: 420, loss: 0.313569575548172, mean loss: 0.38177934004796527
Epoch: 7, step: 421, loss: 0.3499835729598999, mean loss: 0.3817763205069313
Epoch: 7, step: 422, loss: 0.3671565353870392, mean loss: 0.3817749322451214
Epoch: 7, step: 423, loss: 0.3175707459449768, mean loss: 0.38176883613932
Epoch: 7, step: 424, loss: 0.3827853798866272, mean loss: 0.3817689326496919
Epoch: 7, step: 425, loss: 0.347652405500412, mean loss: 0.381765693943868
Epoch: 7, step: 426, loss: 0.34026116132736206, mean loss: 0.3817617542635057
Epoch: 7, step: 427, loss: 0.357952356338501, mean loss: 0.3817594944497315
Epoch: 7, step: 428, loss: 0.3294912576675415, mean loss: 0.38175453400209153
Epoch: 7, step: 429, loss: 0.35190922021865845, mean loss: 0.38175170184098095
Epoch: 7, step: 430, loss: 0.3650903105735779, mean loss: 0.38175012091382776
Epoch: 7, step: 431, loss: 0.3147284686565399, mean loss: 0.38174376212329103
Epoch: 7, step: 432, loss: 0.3014027178287506, mean loss: 0.3817361403564478
Epoch: 7, step: 433, loss: 0.38553014397621155, mean loss: 0.3817365002505495
Epoch: 7, step: 434, loss: 0.3179072439670563, mean loss: 0.38173044606708334
Epoch: 7, step: 435, loss: 0.37350574135780334, mean loss: 0.38172966603059727
Epoch: 7, step: 436, loss: 0.3591805398464203, mean loss: 0.38172752765921897
Epoch: 7, step: 437, loss: 0.3880525827407837, mean loss: 0.38172812741790296
Epoch: 7, step: 438, loss: 0.3300955891609192, mean loss: 0.3817232319463701
Epoch: 7, step: 439, loss: 0.3296479284763336, mean loss: 0.38171829496272675
Epoch: 7, step: 440, loss: 0.3216134309768677, mean loss: 0.3817125972791562
Epoch: 7, step: 441, loss: 0.36300256848335266, mean loss: 0.38171082381671106
Epoch: 7, step: 442, loss: 0.35343554615974426, mean loss: 0.381708143949622
Epoch: 7, step: 443, loss: 0.31110814213752747, mean loss: 0.3817014532746967
Epoch: 7, step: 444, loss: 0.34640809893608093, mean loss: 0.38169810888406475
Epoch: 7, step: 445, loss: 0.3622224032878876, mean loss: 0.38169626354527414
Epoch: 7, step: 446, loss: 0.2972950041294098, mean loss: 0.38168826721562793
Epoch: 7, step: 447, loss: 0.36475709080696106, mean loss: 0.3816866632769761
Epoch: 7, step: 448, loss: 0.3501669466495514, mean loss: 0.3816836776071241
Epoch: 7, step: 449, loss: 0.3574778437614441, mean loss: 0.38168138495379533
Epoch: 7, step: 450, loss: 0.3576168417930603, mean loss: 0.3816791058986613
Epoch: 7, step: 451, loss: 0.3420383334159851, mean loss: 0.3816753520376307
Epoch: 7, step: 452, loss: 0.3539865016937256, mean loss: 0.38167273023568543
Epoch: 7, step: 453, loss: 0.35959792137145996, mean loss: 0.3816706402140168
Epoch: 7, step: 454, loss: 0.3242940604686737, mean loss: 0.38166520836892115
Epoch: 7, step: 455, loss: 0.3635448217391968, mean loss: 0.3816634930729509
Epoch: 7, step: 456, loss: 0.3475429117679596, mean loss: 0.38166026348645726
Epoch: 7, step: 457, loss: 0.35487890243530273, mean loss: 0.3816577288128768
Epoch: 7, step: 458, loss: 0.3142596185207367, mean loss: 0.38165135064402167
Epoch: 7, step: 459, loss: 0.3421548902988434, mean loss: 0.38164761328024943
Epoch: 7, step: 460, loss: 0.3166400194168091, mean loss: 0.38164146250024533
Epoch: 7, step: 461, loss: 0.33514443039894104, mean loss: 0.3816370635378895
Epoch: 7, step: 462, loss: 0.3178693652153015, mean loss: 0.3816310312137648
Epoch: 7, step: 463, loss: 0.32585668563842773, mean loss: 0.38162575554732747
Epoch: 7, step: 464, loss: 0.32485252618789673, mean loss: 0.3816203859049025
Epoch: 7, step: 465, loss: 0.3418034315109253, mean loss: 0.38161662035218885
Epoch: 7, step: 466, loss: 0.3495909571647644, mean loss: 0.3816135919206818
Epoch: 7, step: 467, loss: 0.3373120129108429, mean loss: 0.3816094030421824
Epoch: 7, step: 468, loss: 0.3620486855506897, mean loss: 0.38160755367870586
Epoch: 7, step: 469, loss: 0.3324255645275116, mean loss: 0.38160290421858567
Epoch: 7, step: 470, loss: 0.30491340160369873, mean loss: 0.3815956549981854
Epoch: 7, step: 471, loss: 0.3692886233329773, mean loss: 0.3815944917626783
Epoch: 7, step: 472, loss: 0.34163782000541687, mean loss: 0.3815907154965638
Epoch: 7, step: 473, loss: 0.3708859980106354, mean loss: 0.3815897038997498
Epoch: 7, step: 474, loss: 0.42084741592407227, mean loss: 0.38159341340669717
Epoch: 7, step: 475, loss: 0.32294729351997375, mean loss: 0.381587872390079
Epoch: 7, step: 476, loss: 0.3397207260131836, mean loss: 0.3815839170621266
Epoch: 7, step: 477, loss: 0.36422768235206604, mean loss: 0.38158227751605533
Epoch: 7, step: 478, loss: 0.36625948548316956, mean loss: 0.3815808301946203
Epoch: 7, step: 479, loss: 0.3336140811443329, mean loss: 0.38157629990098124
Epoch: 7, step: 480, loss: 0.3756673038005829, mean loss: 0.3815757418694296
Epoch: 7, step: 481, loss: 0.3637847900390625, mean loss: 0.38157406189286397
Epoch: 7, step: 482, loss: 0.34408092498779297, mean loss: 0.3815705217987364
Epoch: 7, step: 483, loss: 0.33796021342277527, mean loss: 0.3815664045113142
Epoch: 7, step: 484, loss: 0.35722851753234863, mean loss: 0.38156410696699444
Epoch: 7, step: 485, loss: 0.33347469568252563, mean loss: 0.3815595676606621
Epoch: 7, step: 486, loss: 0.3227716088294983, mean loss: 0.38155401900952185
Epoch: 7, step: 487, loss: 0.3372249901294708, mean loss: 0.3815498354469624
Epoch: 7, step: 488, loss: 0.34407949447631836, mean loss: 0.3815462995083977
Epoch: 7, step: 489, loss: 0.35172128677368164, mean loss: 0.38154348529696774
Epoch: 7, step: 490, loss: 0.34733524918556213, mean loss: 0.38154025780040096
Epoch: 7, step: 491, loss: 0.3403858244419098, mean loss: 0.3815363753066879
Epoch: 7, step: 492, loss: 0.37370458245277405, mean loss: 0.38153563652800154
Epoch: 7, step: 493, loss: 0.323997437953949, mean loss: 0.38153020942004323
Epoch: 7, step: 494, loss: 0.3505594730377197, mean loss: 0.38152728847914136
Epoch: 7, step: 495, loss: 0.39146721363067627, mean loss: 0.3815282258542028
Epoch: 7, step: 496, loss: 0.3421516716480255, mean loss: 0.3815245128363616
Epoch: 7, step: 497, loss: 0.3391830623149872, mean loss: 0.3815205206196426
Epoch: 7, step: 498, loss: 0.32579129934310913, mean loss: 0.38151526661556256
Epoch: 7, step: 499, loss: 0.3378400504589081, mean loss: 0.38151114941946934
Epoch: 7, step: 500, loss: 0.32938021421432495, mean loss: 0.381506235578843
Epoch: 7, step: 501, loss: 0.357982337474823, mean loss: 0.3815040184348181
Epoch: 7, step: 502, loss: 0.35654908418655396, mean loss: 0.38150166663628376
Epoch: 7, step: 503, loss: 0.34625235199928284, mean loss: 0.3814983449895973
Epoch: 7, step: 504, loss: 0.3562309443950653, mean loss: 0.38149596419240567
Epoch: 7, step: 505, loss: 0.31522175669670105, mean loss: 0.38148972015552085
Epoch: 7, step: 506, loss: 0.32695141434669495, mean loss: 0.3814845823028775
Epoch: 7, step: 507, loss: 0.3395971655845642, mean loss: 0.3814806366155453
Epoch: 7, step: 508, loss: 0.32942143082618713, mean loss: 0.38147573323363054
Epoch: 7, step: 509, loss: 0.3517197370529175, mean loss: 0.38147293082299005
Epoch: 7, step: 510, loss: 0.3482021391391754, mean loss: 0.38146979768505956
Epoch: 7, step: 511, loss: 0.36150509119033813, mean loss: 0.38146791776919375
Epoch: 7, step: 512, loss: 0.3077574372291565, mean loss: 0.3814609776994696
Epoch: 7, step: 513, loss: 0.33894872665405273, mean loss: 0.38145697541637363
Epoch: 7, step: 514, loss: 0.4802303910255432, mean loss: 0.381466273488068
Epoch: 7, step: 515, loss: 0.3473680317401886, mean loss: 0.3814630639397107
Epoch: 7, step: 516, loss: 0.3998758792877197, mean loss: 0.38146479691056695
Epoch: 7, step: 517, loss: 0.3246694803237915, mean loss: 0.3814594519720589
Epoch: 7, step: 518, loss: 0.32988691329956055, mean loss: 0.3814545989995669
Epoch: 7, step: 519, loss: 0.3352026045322418, mean loss: 0.38145024709944764
Epoch: 7, step: 520, loss: 0.32796818017959595, mean loss: 0.38144521538744086
Epoch: 7, step: 521, loss: 0.38507646322250366, mean loss: 0.38144555699118826
Epoch: 7, step: 522, loss: 0.38417598605155945, mean loss: 0.3814458138277098
Epoch: 7, step: 523, loss: 0.3379265367984772, mean loss: 0.38144172059247383
Epoch: 7, step: 524, loss: 0.3942340910434723, mean loss: 0.38144292367443106
Epoch: 7, step: 525, loss: 0.3136797547340393, mean loss: 0.3814365513621365
Epoch: 7, step: 526, loss: 0.37052005529403687, mean loss: 0.38143552489330074
Epoch: 7, step: 527, loss: 0.3221975266933441, mean loss: 0.38142995531844176
Epoch: 7, step: 528, loss: 0.37085437774658203, mean loss: 0.38142896109285446
Epoch: 7, step: 529, loss: 0.3400701880455017, mean loss: 0.3814250732593287
Epoch: 7, step: 530, loss: 0.3480542004108429, mean loss: 0.3814219366043001
Epoch: 7, step: 531, loss: 0.32996705174446106, mean loss: 0.38141710061888096
Epoch: 7, step: 532, loss: 0.4254990220069885, mean loss: 0.38142124326725874
Epoch: 7, step: 533, loss: 0.3287944197654724, mean loss: 0.38141629806677935
Epoch: 7, step: 534, loss: 0.3296060860157013, mean loss: 0.3814114300585062
Epoch: 7, step: 535, loss: 0.3654811680316925, mean loss: 0.38140993341607604
Epoch: 7, step: 536, loss: 0.3515487313270569, mean loss: 0.38140712823034667
Epoch: 7, step: 537, loss: 0.35848796367645264, mean loss: 0.3814049753875368
Epoch: 7, step: 538, loss: 0.3887527585029602, mean loss: 0.3814056655146257
Epoch: 7, step: 539, loss: 0.34042105078697205, mean loss: 0.3814018164711689
Epoch: 7, step: 540, loss: 0.33158284425735474, mean loss: 0.3813971381941275
Epoch: 7, step: 541, loss: 0.3564528226852417, mean loss: 0.38139479600487786
Epoch: 7, step: 542, loss: 0.36031728982925415, mean loss: 0.38139281708213113
Epoch: 7, step: 543, loss: 0.3152053952217102, mean loss: 0.3813866034676118
Epoch: 7, step: 544, loss: 0.32525011897087097, mean loss: 0.3813813339205831
Epoch: 7, step: 545, loss: 0.34798967838287354, mean loss: 0.3813781997310263
Epoch: 7, step: 546, loss: 0.3068312108516693, mean loss: 0.3813712032984708
Epoch: 7, step: 547, loss: 0.37349218130111694, mean loss: 0.38137046390076085
Epoch: 7, step: 548, loss: 0.33170032501220703, mean loss: 0.3813658031013906
Epoch: 7, step: 549, loss: 0.37274643778800964, mean loss: 0.3813649943788054
Epoch: 7, step: 550, loss: 0.33523064851760864, mean loss: 0.381360666172983
Epoch: 7, step: 551, loss: 0.37266165018081665, mean loss: 0.38135985013020696
Epoch: 7, step: 552, loss: 0.33242565393447876, mean loss: 0.38135526011086585
Epoch: 7, step: 553, loss: 0.3826344907283783, mean loss: 0.38135538009122766
Epoch: 7, step: 554, loss: 0.3340587317943573, mean loss: 0.3813509445057173
Epoch: 7, step: 555, loss: 0.3417218029499054, mean loss: 0.38134722834465623
Epoch: 7, step: 556, loss: 0.3397950530052185, mean loss: 0.3813433322194486
Epoch: 7, step: 557, loss: 0.35176780819892883, mean loss: 0.38134055934076677
Epoch: 7, step: 558, loss: 0.3885256350040436, mean loss: 0.3813412329205608
Epoch: 7, step: 559, loss: 0.36069217324256897, mean loss: 0.38133929731316696
Epoch: 7, step: 560, loss: 0.35296332836151123, mean loss: 0.3813366376478795
Epoch: 7, step: 561, loss: 0.3465900421142578, mean loss: 0.3813333811721969
Epoch: 7, step: 562, loss: 0.3387277126312256, mean loss: 0.3813293885127891
Epoch: 7, step: 563, loss: 0.32984644174575806, mean loss: 0.38132456439858675
Epoch: 7, step: 564, loss: 0.4446481466293335, mean loss: 0.3813304974616647
Epoch: 7, step: 565, loss: 0.35735008120536804, mean loss: 0.3813282508421916
Epoch: 7, step: 566, loss: 0.34088534116744995, mean loss: 0.3813244622792244
Epoch: 7, step: 567, loss: 0.3498935103416443, mean loss: 0.3813215182035465
Epoch: 7, step: 568, loss: 0.3634876012802124, mean loss: 0.3813198478919493
Epoch: 7, step: 569, loss: 0.35356634855270386, mean loss: 0.3813172487629608
Epoch: 7, step: 570, loss: 0.33363378047943115, mean loss: 0.3813127836006531
Epoch: 7, step: 571, loss: 0.38418978452682495, mean loss: 0.3813130529827623
Epoch: 7, step: 572, loss: 0.3326570987701416, mean loss: 0.38130849760833924
Epoch: 7, step: 573, loss: 0.3634430170059204, mean loss: 0.3813068251237294
Epoch: 7, step: 574, loss: 0.37748825550079346, mean loss: 0.3813064676801627
Epoch: 7, step: 575, loss: 0.3289215564727783, mean loss: 0.3813015645623035
Epoch: 7, step: 576, loss: 0.33718788623809814, mean loss: 0.38129743600092547
Epoch: 7, step: 577, loss: 0.30662351846694946, mean loss: 0.381290447986932
Epoch: 7, step: 578, loss: 0.35994449257850647, mean loss: 0.3812884506111101
Epoch: 7, step: 579, loss: 0.3566329777240753, mean loss: 0.3812861437742008
Epoch: 7, step: 580, loss: 0.31120505928993225, mean loss: 0.381279587399939
Epoch: 7, step: 581, loss: 0.3898550868034363, mean loss: 0.3812803895981994
Epoch: 7, step: 582, loss: 0.32651570439338684, mean loss: 0.3812752670946726
Epoch: 7, step: 583, loss: 0.33285608887672424, mean loss: 0.3812707385520035
Epoch: 7, step: 584, loss: 0.39422866702079773, mean loss: 0.3812719503661313
Epoch: 7, step: 585, loss: 0.3264579176902771, mean loss: 0.3812668246851255
Epoch: 7, step: 586, loss: 0.3878174424171448, mean loss: 0.3812674371786021
Epoch: 7, step: 587, loss: 0.3613356947898865, mean loss: 0.38126557370231295
Epoch: 7, step: 588, loss: 0.3292190432548523, mean loss: 0.38126070817642277
Epoch: 7, step: 589, loss: 0.3143937587738037, mean loss: 0.38125445776051303
Epoch: 7, step: 590, loss: 0.33265700936317444, mean loss: 0.3812499155183972
Epoch: 7, step: 591, loss: 0.37237748503685, mean loss: 0.3812490863192868
Epoch: 7, step: 592, loss: 0.3437994122505188, mean loss: 0.381245586676817
Epoch: 7, step: 593, loss: 0.33575960993766785, mean loss: 0.3812413364453893
Epoch: 7, step: 594, loss: 0.31811559200286865, mean loss: 0.3812354384967354
Epoch: 7, step: 595, loss: 0.33007147908210754, mean loss: 0.3812306586051608
Epoch: 7, step: 596, loss: 0.3519432842731476, mean loss: 0.38122792274581174
Epoch: 7, step: 597, loss: 0.33802691102027893, mean loss: 0.38122388753081776
Epoch: 7, step: 598, loss: 0.33538365364074707, mean loss: 0.38121960619768147
Epoch: 7, step: 599, loss: 0.34455668926239014, mean loss: 0.38121618231675736
Epoch: 7, step: 600, loss: 0.3473326563835144, mean loss: 0.38121301829341875
Epoch: 7, step: 601, loss: 0.3685407340526581, mean loss: 0.3812118350736017
Epoch: 7, step: 602, loss: 0.3269674479961395, mean loss: 0.38120677071106995
Epoch: 7, step: 603, loss: 0.4040713608264923, mean loss: 0.38120890519483724
Epoch: 7, step: 604, loss: 0.33513176441192627, mean loss: 0.3812046041455716
Epoch: 7, step: 605, loss: 0.3550054132938385, mean loss: 0.38120215882255015
Epoch: 7, step: 606, loss: 0.3485802412033081, mean loss: 0.3811991143132063
Epoch: 7, step: 607, loss: 0.35963931679725647, mean loss: 0.3811971023873463
Epoch: 7, step: 608, loss: 0.32914623618125916, mean loss: 0.3811922455369025
Epoch: 7, step: 609, loss: 0.33278095722198486, mean loss: 0.3811877287158244
Epoch: 7, step: 610, loss: 0.3146720230579376, mean loss: 0.3811815233136733
Epoch: 7, step: 611, loss: 0.3451332747936249, mean loss: 0.3811781606039233
Epoch: 7, step: 612, loss: 0.34767410159111023, mean loss: 0.3811750355168034
Epoch: 7, step: 613, loss: 0.3280864357948303, mean loss: 0.38117008414581643
Epoch: 7, step: 614, loss: 0.3310685455799103, mean loss: 0.3811654118023896
Epoch: 7, step: 615, loss: 0.43895500898361206, mean loss: 0.3811708006122722
Epoch: 7, step: 616, loss: 0.3860325813293457, mean loss: 0.3811712539251596
Epoch: 7, step: 617, loss: 0.3387172818183899, mean loss: 0.3811672958818903
Epoch: 7, step: 618, loss: 0.3647662103176117, mean loss: 0.3811657669282626
Epoch: 7, step: 619, loss: 0.34012189507484436, mean loss: 0.38116194106399587
Epoch: 7, step: 620, loss: 0.34613555669784546, mean loss: 0.3811586764182352
Epoch: 7, step: 621, loss: 0.3813709318637848, mean loss: 0.3811586961997306
Epoch: 7, step: 622, loss: 0.35403844714164734, mean loss: 0.381156168919043
Epoch: 7, step: 623, loss: 0.3373126983642578, mean loss: 0.38115208361615865
Epoch: 7, step: 624, loss: 0.3411754071712494, mean loss: 0.38114835896541377
Epoch: 7, step: 625, loss: 0.3464297652244568, mean loss: 0.38114512451472055
Epoch: 7, step: 626, loss: 0.3263397514820099, mean loss: 0.38114001921681345
Epoch: 7, step: 627, loss: 0.32066887617111206, mean loss: 0.38113438665878013
Epoch: 7, step: 628, loss: 0.35324013233184814, mean loss: 0.3811317887027098
Epoch: 7, step: 629, loss: 0.33356574177742004, mean loss: 0.38112735900938466
Epoch: 7, step: 630, loss: 0.3478270173072815, mean loss: 0.38112425813018713
Epoch: 7, step: 631, loss: 0.35553866624832153, mean loss: 0.3811218758590622
Epoch: 7, step: 632, loss: 0.34680747985839844, mean loss: 0.3811186811475828
Epoch: 7, step: 633, loss: 0.3509107232093811, mean loss: 0.381115869012232
Epoch: 7, step: 634, loss: 0.32979533076286316, mean loss: 0.38111109189799486
Epoch: 7, step: 635, loss: 0.3075936734676361, mean loss: 0.38110424924922065
Epoch: 7, step: 636, loss: 0.3311317265033722, mean loss: 0.3810995984793048
Epoch: 7, step: 637, loss: 0.35349351167678833, mean loss: 0.3810970295153366
Epoch: 7, step: 638, loss: 0.3398852050304413, mean loss: 0.38109319478708825
Epoch: 7, step: 639, loss: 0.3790670335292816, mean loss: 0.3810930062718986
Epoch: 7, step: 640, loss: 0.33383408188819885, mean loss: 0.38108860968390124
Epoch: 7, step: 641, loss: 0.31846073269844055, mean loss: 0.3810827838348793
Epoch: 7, step: 642, loss: 0.33273833990097046, mean loss: 0.3810782870956054
Epoch: 7, step: 643, loss: 0.35058915615081787, mean loss: 0.3810754514249446
Epoch: 7, step: 644, loss: 0.3540714383125305, mean loss: 0.38107294012455284
Epoch: 7, step: 645, loss: 0.39703068137168884, mean loss: 0.38107442401345437
Epoch: 7, step: 646, loss: 0.35099026560783386, mean loss: 0.3810716267881261
Epoch: 7, step: 647, loss: 0.3353097140789032, mean loss: 0.3810673722406448
Epoch: 7, step: 648, loss: 0.362356960773468, mean loss: 0.38106563286986606
Epoch: 7, step: 649, loss: 0.37504130601882935, mean loss: 0.38106507288410185
Epoch: 7, step: 650, loss: 0.39008185267448425, mean loss: 0.3810659109526761
Epoch: 7, step: 651, loss: 0.3431001305580139, mean loss: 0.3810623825344238
Epoch: 7, step: 652, loss: 0.3317854404449463, mean loss: 0.3810578033185434
Epoch: 7, step: 653, loss: 0.3441852033138275, mean loss: 0.3810543771338189
Epoch: 7, step: 654, loss: 0.3436557352542877, mean loss: 0.38105090239240114
Epoch: 7, step: 655, loss: 0.3291652500629425, mean loss: 0.38104608209768454
Epoch: 7, step: 656, loss: 0.35120585560798645, mean loss: 0.3810433101305234
Epoch: 7, step: 657, loss: 0.3689512014389038, mean loss: 0.3810421869549065
Epoch: 7, step: 658, loss: 0.3836308419704437, mean loss: 0.38104242737981736
Epoch: 7, step: 659, loss: 0.3467022776603699, mean loss: 0.3810392382871614
Epoch: 7, step: 660, loss: 0.35534244775772095, mean loss: 0.3810368521054798
Epoch: 7, step: 661, loss: 0.3566870093345642, mean loss: 0.38103459121014355
Epoch: 7, step: 662, loss: 0.3498305678367615, mean loss: 0.38103169416962984
Epoch: 7, step: 663, loss: 0.3406153619289398, mean loss: 0.38102794218928815
Epoch: 7, step: 664, loss: 0.3636551797389984, mean loss: 0.3810263295686207
Epoch: 7, step: 665, loss: 0.3387274146080017, mean loss: 0.3810224035508965
Epoch: 7, step: 666, loss: 0.361724853515625, mean loss: 0.38102061259497677
Epoch: 7, step: 667, loss: 0.3653341233730316, mean loss: 0.3810191569074098
Epoch: 7, step: 668, loss: 0.33846980333328247, mean loss: 0.38101520874432415
Epoch: 7, step: 669, loss: 0.30311471223831177, mean loss: 0.38100798101223043
Epoch: 7, step: 670, loss: 0.3223419785499573, mean loss: 0.3810025383920929
Epoch: 7, step: 671, loss: 0.3525903522968292, mean loss: 0.3809999027533086
Epoch: 7, step: 672, loss: 0.3270309567451477, mean loss: 0.3809948968219471
Epoch: 7, step: 673, loss: 0.39350971579551697, mean loss: 0.38099605753600513
Epoch: 7, step: 674, loss: 0.3607524633407593, mean loss: 0.38099418017402836
Epoch: 7, step: 675, loss: 0.3486177623271942, mean loss: 0.38099117790976217
Epoch: 7, step: 676, loss: 0.3704361319541931, mean loss: 0.38099019923141675
Epoch: 7, step: 677, loss: 0.3411323130130768, mean loss: 0.38098650389614713
Epoch: 7, step: 678, loss: 0.3247809112071991, mean loss: 0.38098129340271164
Epoch: 7, step: 679, loss: 0.3298488259315491, mean loss: 0.38097655364858934
Epoch: 7, step: 680, loss: 0.34150823950767517, mean loss: 0.3809728954491139
Epoch: 7, step: 681, loss: 0.3378368616104126, mean loss: 0.38096889767025954
Epoch: 7, step: 682, loss: 0.3275415897369385, mean loss: 0.38096394657138705
Epoch: 7, step: 683, loss: 0.31174471974372864, mean loss: 0.3809575326326521
Epoch: 7, step: 684, loss: 0.3747372627258301, mean loss: 0.38095695630819115
Epoch: 7, step: 685, loss: 0.3227638900279999, mean loss: 0.3809515650661789
Epoch: 7, step: 686, loss: 0.31728416681289673, mean loss: 0.38094566720622025
Epoch: 7, step: 687, loss: 0.32638758420944214, mean loss: 0.380940613660185
Epoch: 7, step: 688, loss: 0.33603858947753906, mean loss: 0.38093645491014494
Epoch: 7, step: 689, loss: 0.36292582750320435, mean loss: 0.3809347869505777
Epoch: 7, step: 690, loss: 0.3456476628780365, mean loss: 0.3809315193217165
Epoch: 7, step: 691, loss: 0.3378109931945801, mean loss: 0.3809275266804084
Epoch: 7, step: 692, loss: 0.3074251115322113, mean loss: 0.38092072153133444
Epoch: 7, step: 693, loss: 0.33685025572776794, mean loss: 0.38091664168817546
Epoch: 7, step: 694, loss: 0.3570442199707031, mean loss: 0.3809144318925893
Epoch: 7, step: 695, loss: 0.3780827522277832, mean loss: 0.38091416979710013
Epoch: 7, step: 696, loss: 0.3869415521621704, mean loss: 0.380914727629804
Epoch: 7, step: 697, loss: 0.352998822927475, mean loss: 0.38091214425901904
Epoch: 7, step: 698, loss: 0.3757643401622772, mean loss: 0.3809116679192303
Epoch: 7, step: 699, loss: 0.3674415946006775, mean loss: 0.3809104216134088
Epoch: 7, step: 700, loss: 0.3700689673423767, mean loss: 0.38090941861088584
Epoch: 7, step: 701, loss: 0.3768156170845032, mean loss: 0.3809090399058418
Epoch: 7, step: 702, loss: 0.36485010385513306, mean loss: 0.38090755448025204
Epoch: 7, step: 703, loss: 0.3529125154018402, mean loss: 0.3809049652239555
Epoch: 7, step: 704, loss: 0.3406354784965515, mean loss: 0.3809012410505783
Epoch: 7, step: 705, loss: 0.3234233558177948, mean loss: 0.38089592591415955
Epoch: 7, step: 706, loss: 0.32188349962234497, mean loss: 0.3808904693791349
Epoch: 7, step: 707, loss: 0.3435024917125702, mean loss: 0.3808870126504305
Epoch: 7, step: 708, loss: 0.3370347321033478, mean loss: 0.3808829586354035
Epoch: 7, step: 709, loss: 0.3571447432041168, mean loss: 0.3808807643097027
Epoch: 7, step: 710, loss: 0.3105562627315521, mean loss: 0.38087426421712683
Epoch: 7, step: 711, loss: 0.34603360295295715, mean loss: 0.3808710441929804
Epoch: 7, step: 712, loss: 0.3693433701992035, mean loss: 0.3808699788871867
Epoch: 7, step: 713, loss: 0.32763537764549255, mean loss: 0.38086505977785
Epoch: 7, step: 714, loss: 0.3521823287010193, mean loss: 0.38086240961328593
Epoch: 7, step: 715, loss: 0.360603004693985, mean loss: 0.3808605379018189
Epoch: 7, step: 716, loss: 0.32093387842178345, mean loss: 0.3808550019517515
Epoch: 7, step: 717, loss: 0.3883168697357178, mean loss: 0.3808556912061191
Epoch: 7, step: 718, loss: 0.32544010877609253, mean loss: 0.3808505729293638
Epoch: 7, step: 719, loss: 0.3287137746810913, mean loss: 0.38084575793137265
Epoch: 7, step: 720, loss: 0.31991520524024963, mean loss: 0.38084013132201894
Epoch: 7, step: 721, loss: 0.34007900953292847, mean loss: 0.380836367598862
Epoch: 7, step: 722, loss: 0.3340354859828949, mean loss: 0.3808320465868026
Epoch: 7, step: 723, loss: 0.3389841616153717, mean loss: 0.3808281832296228
Epoch: 7, step: 724, loss: 0.3680773079395294, mean loss: 0.38082700618953325
Epoch: 7, step: 725, loss: 0.343152791261673, mean loss: 0.38082352878368797
Epoch: 7, step: 726, loss: 0.3488628566265106, mean loss: 0.3808205790216061
Epoch: 7, step: 727, loss: 0.3259904682636261, mean loss: 0.3808155190261504
Epoch: 7, step: 728, loss: 0.3419550061225891, mean loss: 0.3808119331155752
Epoch: 7, step: 729, loss: 0.31884700059890747, mean loss: 0.3808062157385207
Epoch: 7, step: 730, loss: 0.3496091365814209, mean loss: 0.38080333751366996
Epoch: 7, step: 731, loss: 0.3203140199184418, mean loss: 0.38079775731831983
Epoch: 7, step: 732, loss: 0.3404552936553955, mean loss: 0.3807940360321227
Epoch: 7, step: 733, loss: 0.31007224321365356, mean loss: 0.3807875130849895
Epoch: 7, step: 734, loss: 0.35487279295921326, mean loss: 0.3807851230895892
Epoch: 7, step: 735, loss: 0.3878796100616455, mean loss: 0.3807857773211432
Epoch: 7, step: 736, loss: 0.37665116786956787, mean loss: 0.3807853960754584
Epoch: 7, step: 737, loss: 0.3317873775959015, mean loss: 0.3807808784635757
Epoch: 7, step: 738, loss: 0.3630700409412384, mean loss: 0.38077924567685845
Epoch: 7, step: 739, loss: 0.33326056599617004, mean loss: 0.38077486526759585
Epoch: 7, step: 740, loss: 0.33183592557907104, mean loss: 0.38077035435048934
Epoch: 7, step: 741, loss: 0.36846888065338135, mean loss: 0.3807692205741117
Epoch: 7, step: 742, loss: 0.3289054334163666, mean loss: 0.3807644409420817
Epoch: 7, step: 743, loss: 0.3698233366012573, mean loss: 0.3807634327312136
Epoch: 7, step: 744, loss: 0.335448294878006, mean loss: 0.38075925737528865
Epoch: 7, step: 745, loss: 0.3411867916584015, mean loss: 0.38075561148753145
Epoch: 7, step: 746, loss: 0.29828688502311707, mean loss: 0.3807480141843104
Epoch: 7, step: 747, loss: 0.3281762897968292, mean loss: 0.38074317154204923
Epoch: 7, step: 748, loss: 0.3232036828994751, mean loss: 0.3807378717825722
Epoch: 7, step: 749, loss: 0.33575519919395447, mean loss: 0.3807337289687401
Epoch: 7, step: 750, loss: 0.32003870606422424, mean loss: 0.3807281395937604
Epoch: 7, step: 751, loss: 0.339566707611084, mean loss: 0.38072434940665334
Epoch: 7, step: 752, loss: 0.35443997383117676, mean loss: 0.3807219293370856
Epoch: 7, step: 753, loss: 0.34082287549972534, mean loss: 0.38071825606753695
Epoch: 7, step: 754, loss: 0.35411930084228516, mean loss: 0.3807158074847122
Epoch: 7, step: 755, loss: 0.320770263671875, mean loss: 0.38071028966956005
Epoch: 7, step: 756, loss: 0.34436503052711487, mean loss: 0.38070694450074805
Epoch: 7, step: 757, loss: 0.3623611032962799, mean loss: 0.3807052561295715
Epoch: 7, step: 758, loss: 0.3483412563800812, mean loss: 0.3807022779387415
Epoch: 7, step: 759, loss: 0.34827715158462524, mean loss: 0.380699294397487
Epoch: 7, step: 760, loss: 0.33696451783180237, mean loss: 0.3806952705888049
Epoch: 7, step: 761, loss: 0.36941051483154297, mean loss: 0.3806942324328015
Epoch: 7, step: 762, loss: 0.3371714651584625, mean loss: 0.38069022886668297
Epoch: 7, step: 763, loss: 0.3848484754562378, mean loss: 0.38069061133969523
Epoch: 7, step: 764, loss: 0.34829866886138916, mean loss: 0.3806876322223883
Epoch: 7, step: 765, loss: 0.34421318769454956, mean loss: 0.3806842779420381
Epoch: 7, step: 766, loss: 0.364018052816391, mean loss: 0.3806827454155897
Epoch: 7, step: 767, loss: 0.33076736330986023, mean loss: 0.3806781559174189
Epoch: 7, step: 768, loss: 0.40269532799720764, mean loss: 0.38068018011270066
Epoch: 7, step: 769, loss: 0.3599870502948761, mean loss: 0.38067827782093583
Epoch: 7, step: 770, loss: 0.347135066986084, mean loss: 0.3806751945218426
Epoch: 7, step: 771, loss: 0.3915417492389679, mean loss: 0.38067619328606295
Epoch: 7, step: 772, loss: 0.32029861211776733, mean loss: 0.3806706443860383
Epoch: 7, step: 773, loss: 0.3654631972312927, mean loss: 0.38066924689962456
Epoch: 7, step: 774, loss: 0.35294532775878906, mean loss: 0.38066669944771414
Epoch: 7, step: 775, loss: 0.3453187048435211, mean loss: 0.38066345174515953
Epoch: 7, step: 776, loss: 0.3539455235004425, mean loss: 0.3806609971812418
Epoch: 7, step: 777, loss: 0.29334932565689087, mean loss: 0.3806529766345282
Epoch: 7, step: 778, loss: 0.3198219835758209, mean loss: 0.38064738914549917
Epoch: 7, step: 779, loss: 0.3379225432872772, mean loss: 0.3806434651148362
Epoch: 7, step: 780, loss: 0.322391539812088, mean loss: 0.3806381155028147
Epoch: 7, step: 781, loss: 0.353076696395874, mean loss: 0.3806355846103347
Epoch: 7, step: 782, loss: 0.3019273281097412, mean loss: 0.3806283577021995
Epoch: 7, step: 783, loss: 0.30358707904815674, mean loss: 0.38062128450364513
Epoch: 7, step: 784, loss: 0.35760971903800964, mean loss: 0.38061917199419265
Epoch: 7, step: 785, loss: 0.32672539353370667, mean loss: 0.38061422488766977
Epoch: 7, step: 786, loss: 0.3498695492744446, mean loss: 0.3806114029807755
Epoch: 7, step: 787, loss: 0.3483318090438843, mean loss: 0.3806084404629766
Epoch: 7, step: 788, loss: 0.33916276693344116, mean loss: 0.380604637060799
Epoch: 7, step: 789, loss: 0.36281925439834595, mean loss: 0.38060300507486927
Epoch: 7, step: 790, loss: 0.31643158197402954, mean loss: 0.3805971172481787
Epoch: 7, step: 791, loss: 0.3579305410385132, mean loss: 0.38059503774577413
Epoch: 7, step: 792, loss: 0.3727213144302368, mean loss: 0.3805943154521024
Epoch: 7, step: 793, loss: 0.33346691727638245, mean loss: 0.38058999263076915
Epoch: 7, step: 794, loss: 0.377375066280365, mean loss: 0.38058969776455337
Epoch: 7, step: 795, loss: 0.33133652806282043, mean loss: 0.3805851807827392
Epoch: 7, step: 796, loss: 0.35372471809387207, mean loss: 0.3805827176499846
Epoch: 7, step: 797, loss: 0.398728609085083, mean loss: 0.38058438149478885
Epoch: 7, step: 798, loss: 0.39398184418678284, mean loss: 0.38058560983096673
Epoch: 7, step: 799, loss: 0.36537691950798035, mean loss: 0.3805842155615935
Epoch: 7, step: 800, loss: 0.3562390208244324, mean loss: 0.3805819839001454
Epoch: 7, step: 801, loss: 0.3373670279979706, mean loss: 0.38057802285927445
Epoch: 7, step: 802, loss: 0.3748185336589813, mean loss: 0.3805774949984734
Epoch: 7, step: 803, loss: 0.35181155800819397, mean loss: 0.3805748588238958
Epoch: 7, step: 804, loss: 0.35333576798439026, mean loss: 0.38057236280164347
Epoch: 7, step: 805, loss: 0.3334749937057495, mean loss: 0.3805680474847023
Epoch: 7, step: 806, loss: 0.3434971868991852, mean loss: 0.38056465116215665
Epoch: 7, step: 807, loss: 0.34761467576026917, mean loss: 0.3805616326594632
Epoch: 7, step: 808, loss: 0.39648738503456116, mean loss: 0.3805630914624654
Epoch: 7, step: 809, loss: 0.34285232424736023, mean loss: 0.38055963746290367
Epoch: 7, step: 810, loss: 0.3066577613353729, mean loss: 0.380552869272032
Epoch: 7, step: 811, loss: 0.36881211400032043, mean loss: 0.38055179411129286
Epoch: 7, step: 812, loss: 0.31484559178352356, mean loss: 0.38054577761075925
Epoch: 7, step: 813, loss: 0.29990917444229126, mean loss: 0.3805383946586288
Epoch: 7, step: 814, loss: 0.31537124514579773, mean loss: 0.38053242860996883
Epoch: 7, step: 815, loss: 0.3241838216781616, mean loss: 0.3805272703705939
Epoch: 7, step: 816, loss: 0.34126442670822144, mean loss: 0.3805236765176271
Epoch: 7, step: 817, loss: 0.3368644416332245, mean loss: 0.3805196806147455
Epoch: 7, step: 818, loss: 0.3870612680912018, mean loss: 0.38052027927745957
Epoch: 7, step: 819, loss: 0.36978891491889954, mean loss: 0.3805192972712042
Epoch: 7, step: 820, loss: 0.3569612205028534, mean loss: 0.38051714171472434
Epoch: 7, step: 821, loss: 0.33177968859672546, mean loss: 0.3805126826613741
Epoch: 7, step: 822, loss: 0.3162066638469696, mean loss: 0.3805067997578141
Epoch: 7, step: 823, loss: 0.3352068066596985, mean loss: 0.3805026559604213
Epoch: 7, step: 824, loss: 0.36717846989631653, mean loss: 0.3805014372477108
Epoch: 7, step: 825, loss: 0.34350576996803284, mean loss: 0.3804980537039684
Epoch: 7, step: 826, loss: 0.39443111419677734, mean loss: 0.380499327875024
Epoch: 7, step: 827, loss: 0.32769396901130676, mean loss: 0.38049449929429396
Epoch: 7, step: 828, loss: 0.3420727550983429, mean loss: 0.3804909862885158
Epoch: 7, step: 829, loss: 0.31592658162117004, mean loss: 0.38048508352707244
Epoch: 7, step: 830, loss: 0.33735737204551697, mean loss: 0.38048114096271723
Epoch: 7, step: 831, loss: 0.3417474627494812, mean loss: 0.38047760040712186
Epoch: 7, step: 832, loss: 0.33508187532424927, mean loss: 0.3804734512685529
Epoch: 7, step: 833, loss: 0.3147061765193939, mean loss: 0.3804674407334817
Epoch: 7, step: 834, loss: 0.34437891840934753, mean loss: 0.38046414286979496
Epoch: 7, step: 835, loss: 0.33600905537605286, mean loss: 0.3804600808186716
Epoch: 7, step: 836, loss: 0.35907644033432007, mean loss: 0.38045812708267485
Epoch: 7, step: 837, loss: 0.3475840389728546, mean loss: 0.3804551237857527
Epoch: 7, step: 838, loss: 0.3102347254753113, mean loss: 0.3804487092065702
Epoch: 7, step: 839, loss: 0.3304496109485626, mean loss: 0.3804441422447271
Epoch: 7, step: 840, loss: 0.3177623450756073, mean loss: 0.380438417356868
Epoch: 7, step: 841, loss: 0.3461620807647705, mean loss: 0.3804352870978185
Epoch: 7, step: 842, loss: 0.38098663091659546, mean loss: 0.38043533744425434
Epoch: 7, step: 843, loss: 0.3691859245300293, mean loss: 0.3804343102882176
Epoch: 7, step: 844, loss: 0.3418084681034088, mean loss: 0.38043078378021206
Epoch: 7, step: 845, loss: 0.34474197030067444, mean loss: 0.3804275257179992
Epoch: 7, step: 846, loss: 0.3210679292678833, mean loss: 0.38042210722448483
Epoch: 7, step: 847, loss: 0.3645458221435547, mean loss: 0.380420658129461
Epoch: 7, step: 848, loss: 0.3583301901817322, mean loss: 0.38041864202396247
Epoch: 7, step: 849, loss: 0.3214697539806366, mean loss: 0.38041326249411733
Epoch: 7, step: 850, loss: 0.37525251507759094, mean loss: 0.38041279158003605
Epoch: 7, step: 851, loss: 0.33125701546669006, mean loss: 0.3804083065639673
Epoch: 7, step: 852, loss: 0.32890403270721436, mean loss: 0.38040360769763604
Epoch: 7, step: 853, loss: 0.35419803857803345, mean loss: 0.3804012171147935
Epoch: 7, step: 854, loss: 0.33435583114624023, mean loss: 0.3803970170431007
Epoch: 7, step: 855, loss: 0.33549872040748596, mean loss: 0.3803929219777381
Epoch: 7, step: 856, loss: 0.35385391116142273, mean loss: 0.38039050163931437
Epoch: 7, step: 857, loss: 0.3065037429332733, mean loss: 0.38038376383531053
Epoch: 7, step: 858, loss: 0.30625030398368835, mean loss: 0.380377004150816
Epoch: 7, step: 859, loss: 0.3443566560745239, mean loss: 0.3803737200198827
Epoch: 7, step: 860, loss: 0.3280982971191406, mean loss: 0.38036895427798273
Epoch: 7, step: 861, loss: 0.33912524580955505, mean loss: 0.3803651945962627
Epoch: 7, step: 862, loss: 0.36811333894729614, mean loss: 0.3803640778470467
Epoch: 7, step: 863, loss: 0.3137094974517822, mean loss: 0.3803580028761758
Epoch: 7, step: 864, loss: 0.3852643370628357, mean loss: 0.3803584500040521
Epoch: 7, step: 865, loss: 0.3167295455932617, mean loss: 0.38035265185347705
Epoch: 7, step: 866, loss: 0.3438833951950073, mean loss: 0.3803493289143738
Epoch: 7, step: 867, loss: 0.30983319878578186, mean loss: 0.3803429043398358
Epoch: 7, step: 868, loss: 0.28738269209861755, mean loss: 0.3803344357043032
Epoch: 7, step: 869, loss: 0.36497393250465393, mean loss: 0.3803330364965058
Epoch: 7, step: 870, loss: 0.35646533966064453, mean loss: 0.3803308625556336
Epoch: 7, step: 871, loss: 0.3602138161659241, mean loss: 0.3803290304020462
Epoch: 7, step: 872, loss: 0.3868468403816223, mean loss: 0.3803296239554548
Epoch: 7, step: 873, loss: 0.4417610764503479, mean loss: 0.38033521778649604
Epoch: 7, step: 874, loss: 0.33883917331695557, mean loss: 0.3803314395797702
Epoch: 7, step: 875, loss: 0.33268865942955017, mean loss: 0.3803271021088898
Epoch: 7, step: 876, loss: 0.3843303620815277, mean loss: 0.38032746653856414
Epoch: 7, step: 877, loss: 0.32543668150901794, mean loss: 0.3803224701081045
Epoch: 7, step: 878, loss: 0.3357894718647003, mean loss: 0.3803184168635206
Epoch: 7, step: 879, loss: 0.37246468663215637, mean loss: 0.38031770210831206
Epoch: 7, step: 880, loss: 0.367836058139801, mean loss: 0.3803165662775751
Epoch: 7, step: 881, loss: 0.3734618127346039, mean loss: 0.38031594255113804
Epoch: 7, step: 882, loss: 0.4150466322898865, mean loss: 0.3803191024719586
Epoch: 7, step: 883, loss: 0.3385504186153412, mean loss: 0.380315302555305
Epoch: 7, step: 884, loss: 0.33209115266799927, mean loss: 0.38031091575007553
Epoch: 7, step: 885, loss: 0.3528573215007782, mean loss: 0.38030841860670195
Epoch: 7, step: 886, loss: 0.34142687916755676, mean loss: 0.3803048823138926
Epoch: 7, step: 887, loss: 0.3340305984020233, mean loss: 0.3803006740305248
Epoch: 7, step: 888, loss: 0.3969504237174988, mean loss: 0.380302188057049
Epoch: 7, step: 889, loss: 0.31048882007598877, mean loss: 0.38029584023308277
Epoch: 7, step: 890, loss: 0.3536303639411926, mean loss: 0.38029341587847854
Epoch: 7, step: 891, loss: 0.39189478754997253, mean loss: 0.38029447054863047
Epoch: 7, step: 892, loss: 0.3804384469985962, mean loss: 0.3802944836362089
Epoch: 7, step: 893, loss: 0.36918511986732483, mean loss: 0.38029347387764056
Epoch: 7, step: 894, loss: 0.35812899470329285, mean loss: 0.38029145947437104
Epoch: 7, step: 895, loss: 0.33118104934692383, mean loss: 0.3802869965145267
Epoch: 7, step: 896, loss: 0.32261279225349426, mean loss: 0.3802817557871972
Epoch: 7, step: 897, loss: 0.3617303967475891, mean loss: 0.3802800702194124
Epoch: 7, step: 898, loss: 0.41438204050064087, mean loss: 0.38028316842694226
Epoch: 7, step: 899, loss: 0.35222214460372925, mean loss: 0.3802806192787025
Epoch: 7, step: 900, loss: 0.36550065875053406, mean loss: 0.3802792767443644
Epoch: 7, step: 901, loss: 0.32040345668792725, mean loss: 0.38027383843191603
Epoch: 7, step: 902, loss: 0.35897383093833923, mean loss: 0.3802719040020283
Epoch: 7, step: 903, loss: 0.3197241425514221, mean loss: 0.38026640565827147
Epoch: 7, step: 904, loss: 0.3675960898399353, mean loss: 0.3802652551710456
Epoch: 7, step: 905, loss: 0.3716280460357666, mean loss: 0.38026447096829136
Epoch: 7, step: 906, loss: 0.31674227118492126, mean loss: 0.3802587040867858
Epoch: 7, step: 907, loss: 0.38529330492019653, mean loss: 0.38025916111300523
Epoch: 7, step: 908, loss: 0.3612573444843292, mean loss: 0.3802574363406871
Epoch: 7, step: 909, loss: 0.3483642041683197, mean loss: 0.38025454169264095
Epoch: 7, step: 910, loss: 0.31103116273880005, mean loss: 0.3802482595092347
Epoch: 7, step: 911, loss: 0.36974310874938965, mean loss: 0.38024730622876646
Epoch: 7, step: 912, loss: 0.3282647728919983, mean loss: 0.3802425895484891
Epoch: 7, step: 913, loss: 0.3353065848350525, mean loss: 0.3802385126110264
Epoch: 7, step: 914, loss: 0.32904595136642456, mean loss: 0.380233868452336
Epoch: 7, step: 915, loss: 0.3619235157966614, mean loss: 0.3802322074987206
Epoch: 7, step: 916, loss: 0.3642723262310028, mean loss: 0.38023075989044236
Epoch: 7, step: 917, loss: 0.3607000410556793, mean loss: 0.3802289885573356
Epoch: 7, step: 918, loss: 0.35025733709335327, mean loss: 0.38022627053326163
Epoch: 7, step: 919, loss: 0.37707674503326416, mean loss: 0.380225984939727
Epoch: 7, step: 920, loss: 0.4260938763618469, mean loss: 0.38023014378381276
Epoch: 7, step: 921, loss: 0.3441670536994934, mean loss: 0.3802268742380209
Epoch: 7, step: 922, loss: 0.3311239182949066, mean loss: 0.38022242287767793
Epoch: 7, step: 923, loss: 0.3528464436531067, mean loss: 0.3802199413712218
Epoch: 7, step: 924, loss: 0.33728083968162537, mean loss: 0.3802160494921599
Epoch: 7, step: 925, loss: 0.3520718216896057, mean loss: 0.38021349880992295
Epoch: 7, step: 926, loss: 0.37350401282310486, mean loss: 0.38021289079125625
Epoch: 7, step: 927, loss: 0.3403751254081726, mean loss: 0.3802092809901161
Epoch: 7, step: 928, loss: 0.37775933742523193, mean loss: 0.38020905901461866
Epoch: 7, step: 929, loss: 0.38695406913757324, mean loss: 0.3802096700863819
Epoch: 7, step: 930, loss: 0.359419047832489, mean loss: 0.3802077867072485
Epoch: 7, step: 931, loss: 0.315165638923645, mean loss: 0.380201895208355
Epoch: 7, step: 932, loss: 0.3490080237388611, mean loss: 0.3801990699324317
Epoch: 7, step: 933, loss: 0.3499252200126648, mean loss: 0.3801963282325657
Epoch: 7, step: 934, loss: 0.3982606828212738, mean loss: 0.38019796405205214
Epoch: 7, step: 935, loss: 0.3442932665348053, mean loss: 0.38019471299287816
Epoch: 7, step: 936, loss: 0.34650322794914246, mean loss: 0.38019166260944276
Epoch: 7, step: 937, loss: 0.38522636890411377, mean loss: 0.38019211840396516
Epoch: 7, step: 938, loss: 0.3508182466030121, mean loss: 0.38018945941312593
Epoch: 7, step: 939, loss: 0.34893476963043213, mean loss: 0.38018663042237805
Epoch: 7, step: 940, loss: 0.32887712121009827, mean loss: 0.3801819866076245
Epoch: 7, step: 941, loss: 0.33020034432411194, mean loss: 0.3801774633820785
Epoch: 7, step: 942, loss: 0.3325256407260895, mean loss: 0.38017315139016317
Epoch: 7, step: 943, loss: 0.3510834574699402, mean loss: 0.38017051931507084
Epoch: 7, step: 944, loss: 0.4031246304512024, mean loss: 0.3801725960463778
Epoch: 7, step: 945, loss: 0.34756356477737427, mean loss: 0.3801696460706886
Epoch: 7, step: 946, loss: 0.3474510908126831, mean loss: 0.3801666864546544
Epoch: 7, step: 947, loss: 0.36189934611320496, mean loss: 0.3801650341988348
Epoch: 7, step: 948, loss: 0.38317516446113586, mean loss: 0.3801653064363551
Epoch: 7, step: 949, loss: 0.34167584776878357, mean loss: 0.3801618257473817
Epoch: 7, step: 950, loss: 0.35882097482681274, mean loss: 0.38015989602037925
Epoch: 7, step: 951, loss: 0.33208808302879333, mean loss: 0.3801555495635084
Epoch: 7, step: 952, loss: 0.3147260546684265, mean loss: 0.3801496342308174
Epoch: 7, step: 953, loss: 0.3506939709186554, mean loss: 0.3801469714516353
Epoch: 7, step: 954, loss: 0.37153029441833496, mean loss: 0.3801461925781802
Epoch: 7, step: 955, loss: 0.35470232367515564, mean loss: 0.3801438928792555
Epoch: 7, step: 956, loss: 0.36309877038002014, mean loss: 0.38014235242534683
Epoch: 7, step: 957, loss: 0.35502880811691284, mean loss: 0.38014008299246155
Epoch: 7, step: 958, loss: 0.346278578042984, mean loss: 0.38013702331007704
Epoch: 7, step: 959, loss: 0.33938127756118774, mean loss: 0.38013334100561835
Epoch: 7, step: 960, loss: 0.3585318326950073, mean loss: 0.3801313894735639
Epoch: 7, step: 961, loss: 0.3286878168582916, mean loss: 0.38012674235769983
Epoch: 7, step: 962, loss: 0.3809894919395447, mean loss: 0.3801268202864851
Epoch: 7, step: 963, loss: 0.3481130599975586, mean loss: 0.380123928870274
Epoch: 7, step: 964, loss: 0.363668829202652, mean loss: 0.3801224428141314
Epoch: 7, step: 965, loss: 0.33065053820610046, mean loss: 0.3801179754216257
Epoch: 7, step: 966, loss: 0.31208768486976624, mean loss: 0.3801118327317339
Epoch: 7, step: 967, loss: 0.3680191934108734, mean loss: 0.3801107409441462
Epoch: 7, step: 968, loss: 0.3142286241054535, mean loss: 0.3801047932943458
Epoch: 7, step: 969, loss: 0.32453495264053345, mean loss: 0.38009977706030956
Epoch: 7, step: 970, loss: 0.33474865555763245, mean loss: 0.38009568362935886
Epoch: 7, step: 971, loss: 0.32389628887176514, mean loss: 0.38009061148181755
Epoch: 7, step: 972, loss: 0.32385218143463135, mean loss: 0.38008553626928737
Epoch: 7, step: 973, loss: 0.32046234607696533, mean loss: 0.3800801560860901
Epoch: 7, step: 974, loss: 0.3280274271965027, mean loss: 0.380075459458021
Epoch: 7, step: 975, loss: 0.3904247283935547, mean loss: 0.38007639317048364
Epoch: 7, step: 976, loss: 0.3464246094226837, mean loss: 0.3800733573758289
Epoch: 7, step: 977, loss: 0.3205632269382477, mean loss: 0.3800679893323112
Epoch: 7, step: 978, loss: 0.3733330965042114, mean loss: 0.3800673818737716
Epoch: 7, step: 979, loss: 0.33653679490089417, mean loss: 0.38006345595503305
Epoch: 7, step: 980, loss: 0.3216971158981323, mean loss: 0.38005819251017264
Epoch: 7, step: 981, loss: 0.3837811350822449, mean loss: 0.3800585282128392
Epoch: 7, step: 982, loss: 0.31730467081069946, mean loss: 0.38005287012453315
Epoch: 7, step: 983, loss: 0.3266281485557556, mean loss: 0.3800480536151959
Epoch: 7, step: 984, loss: 0.3602571487426758, mean loss: 0.3800462695256915
Epoch: 7, step: 985, loss: 0.3447002172470093, mean loss: 0.3800430834744675
Epoch: 7, step: 986, loss: 0.3377843499183655, mean loss: 0.3800392746656747
Epoch: 7, step: 987, loss: 0.340279221534729, mean loss: 0.3800356913876348
Epoch: 7, step: 988, loss: 0.3287146985530853, mean loss: 0.38003106662483094
Epoch: 7, step: 989, loss: 0.3065652847290039, mean loss: 0.38002444689317694
Epoch: 7, step: 990, loss: 0.4085991084575653, mean loss: 0.38002702141895084
Epoch: 7, step: 991, loss: 0.3733842968940735, mean loss: 0.3800264229752999
Epoch: 7, step: 992, loss: 0.3363245129585266, mean loss: 0.38002248622095197
Epoch: 7, step: 993, loss: 0.3117014169692993, mean loss: 0.3800163322784865
Epoch: 7, step: 994, loss: 0.32253241539001465, mean loss: 0.3800111549465142
Epoch: 7, step: 995, loss: 0.38291773200035095, mean loss: 0.3800114167059751
Epoch: 7, step: 996, loss: 0.32216817140579224, mean loss: 0.3800062079490818
Epoch: 7, step: 997, loss: 0.35712727904319763, mean loss: 0.3800041478978567
Epoch: 7, step: 998, loss: 0.3615138828754425, mean loss: 0.38000248315805096
Epoch: 7, step: 999, loss: 0.34396299719810486, mean loss: 0.37999923869586516
Epoch: 7, step: 1000, loss: 0.30505824089050293, mean loss: 0.3799924927243281
Epoch: 7, step: 1001, loss: 0.41063207387924194, mean loss: 0.37999525056241584
Epoch: 7, step: 1002, loss: 0.361329585313797, mean loss: 0.3799935706357442
Epoch: 7, step: 1003, loss: 0.3325527310371399, mean loss: 0.37998930130172703
Epoch: 7, step: 1004, loss: 0.3423038125038147, mean loss: 0.3799859101842252
Epoch: 7, step: 1005, loss: 0.304876446723938, mean loss: 0.37997915208961835
Epoch: 7, step: 1006, loss: 0.37415385246276855, mean loss: 0.3799786279960847
Epoch: 7, step: 1007, loss: 0.36928823590278625, mean loss: 0.37997766628394963
Epoch: 7, step: 1008, loss: 0.3706405460834503, mean loss: 0.3799768263882763
Epoch: 7, step: 1009, loss: 0.3211808502674103, mean loss: 0.379971538029208
Epoch: 7, step: 1010, loss: 0.34316766262054443, mean loss: 0.3799682280305203
Epoch: 7, step: 1011, loss: 0.34263303875923157, mean loss: 0.37996487054947076
Epoch: 7, step: 1012, loss: 0.3323661983013153, mean loss: 0.37996059047823183
Epoch: 7, step: 1013, loss: 0.3258020579814911, mean loss: 0.37995572098241304
Epoch: 7, step: 1014, loss: 0.30748307704925537, mean loss: 0.379949205416115
Epoch: 7, step: 1015, loss: 0.34400734305381775, mean loss: 0.37994597439648514
Epoch: 7, step: 1016, loss: 0.3132892847061157, mean loss: 0.3799399827839287
Epoch: 7, step: 1017, loss: 0.3063618242740631, mean loss: 0.37993336961131413
Epoch: 7, step: 1018, loss: 0.32794296741485596, mean loss: 0.3799286971567265
Epoch: 7, step: 1019, loss: 0.33004266023635864, mean loss: 0.37992421422745615
Epoch: 7, step: 1020, loss: 0.3787476420402527, mean loss: 0.3799241085061706
Epoch: 7, step: 1021, loss: 0.3411566913127899, mean loss: 0.37992062535997173
Epoch: 7, step: 1022, loss: 0.3504483997821808, mean loss: 0.37991797759916157
Epoch: 7, step: 1023, loss: 0.3175663948059082, mean loss: 0.37991237648680143
Epoch: 7, step: 1024, loss: 0.31712856888771057, mean loss: 0.3799067370538005
Epoch: 7, step: 1025, loss: 0.3289336562156677, mean loss: 0.37990215890750645
Epoch: 7, step: 1026, loss: 0.38071122765541077, mean loss: 0.3799022315674748
Epoch: 7, step: 1027, loss: 0.31940001249313354, mean loss: 0.3798967985377447
Epoch: 7, step: 1028, loss: 0.34956011176109314, mean loss: 0.37989407458274993
Epoch: 7, step: 1029, loss: 0.3516739010810852, mean loss: 0.3798915408986503
Epoch: 7, step: 1030, loss: 0.4198201596736908, mean loss: 0.3798951254770483
Epoch: 7, step: 1031, loss: 0.37964558601379395, mean loss: 0.3798951030767374
Epoch: 7, step: 1032, loss: 0.35335931181907654, mean loss: 0.37989272126260426
Epoch: 7, step: 1033, loss: 0.3474341630935669, mean loss: 0.37988980809098616
Epoch: 7, step: 1034, loss: 0.33914342522621155, mean loss: 0.3798861514111993
Epoch: 7, step: 1035, loss: 0.37483304738998413, mean loss: 0.37988569797401145
Epoch: 7, step: 1036, loss: 0.376679390668869, mean loss: 0.3798854102838091
Epoch: 7, step: 1037, loss: 0.35207539796829224, mean loss: 0.37988291521720985
Epoch: 7, step: 1038, loss: 0.39012181758880615, mean loss: 0.3798838337515574
Epoch: 7, step: 1039, loss: 0.360870361328125, mean loss: 0.37988212820146555
Epoch: 7, step: 1040, loss: 0.3150016665458679, mean loss: 0.3798763088040617
Epoch: 7, step: 1041, loss: 0.34758949279785156, mean loss: 0.3798734131254961
Epoch: 7, step: 1042, loss: 0.32898691296577454, mean loss: 0.37986884972309637
Epoch: 7, step: 1043, loss: 0.3491261601448059, mean loss: 0.3798660930256808
Epoch: 7, step: 1044, loss: 0.3432047665119171, mean loss: 0.37986280589876303
Epoch: 7, step: 1045, loss: 0.3569049537181854, mean loss: 0.3798607476369574
Epoch: 7, step: 1046, loss: 0.3301006555557251, mean loss: 0.37985628684878336
Epoch: 7, step: 1047, loss: 0.32033783197402954, mean loss: 0.3798509517416773
Epoch: 7, step: 1048, loss: 0.35333967208862305, mean loss: 0.37984857554022056
Epoch: 7, step: 1049, loss: 0.3398890793323517, mean loss: 0.3798449942984023
Epoch: 7, step: 1050, loss: 0.3515772819519043, mean loss: 0.3798424611222802
Epoch: 7, step: 1051, loss: 0.319734662771225, mean loss: 0.37983707511884374
Epoch: 7, step: 1052, loss: 0.31462568044662476, mean loss: 0.3798312323274566
Epoch: 7, step: 1053, loss: 0.33292266726493835, mean loss: 0.37982702980415767
Epoch: 7, step: 1054, loss: 0.32791024446487427, mean loss: 0.37982237901267335
Epoch: 7, step: 1055, loss: 0.3349829316139221, mean loss: 0.379818362580624
Epoch: 7, step: 1056, loss: 0.29560378193855286, mean loss: 0.37981081985060683
Epoch: 7, step: 1057, loss: 0.3650153577327728, mean loss: 0.3798094948047428
Epoch: 7, step: 1058, loss: 0.3930053412914276, mean loss: 0.3798106764870645
Epoch: 7, step: 1059, loss: 0.3340328633785248, mean loss: 0.3798065774708478
Epoch: 7, step: 1060, loss: 0.3365439176559448, mean loss: 0.3798027040121841
Epoch: 7, step: 1061, loss: 0.33141028881073, mean loss: 0.37979837165630215
Epoch: 7, step: 1062, loss: 0.37797266244888306, mean loss: 0.37979820822337695
Epoch: 7, step: 1063, loss: 0.31860238313674927, mean loss: 0.37979273061640534
Epoch: 7, step: 1064, loss: 0.3474684953689575, mean loss: 0.3797898375496151
Epoch: 7, step: 1065, loss: 0.3133193552494049, mean loss: 0.3797838888757024
Epoch: 7, step: 1066, loss: 0.3503139615058899, mean loss: 0.37978125174573646
Epoch: 7, step: 1067, loss: 0.3292990028858185, mean loss: 0.3797767347227533
Epoch: 7, step: 1068, loss: 0.35792824625968933, mean loss: 0.37977477995059056
Epoch: 7, step: 1069, loss: 0.36102133989334106, mean loss: 0.37977310224079835
Epoch: 7, step: 1070, loss: 0.432267427444458, mean loss: 0.37977779803874123
Epoch: 7, step: 1071, loss: 0.3504531979560852, mean loss: 0.3797751750870344
Epoch: 7, step: 1072, loss: 0.31477615237236023, mean loss: 0.379769361740937
Epoch: 7, step: 1073, loss: 0.35828322172164917, mean loss: 0.3797674402474636
Epoch: 7, step: 1074, loss: 0.3173168897628784, mean loss: 0.37976185582910676
Epoch: 7, step: 1075, loss: 0.3325297236442566, mean loss: 0.379757632641322
Epoch: 7, step: 1076, loss: 0.40411239862442017, mean loss: 0.3797598100902253
Epoch: 7, step: 1077, loss: 0.3892938792705536, mean loss: 0.3797606624118041
Epoch: 7, step: 1078, loss: 0.3232859671115875, mean loss: 0.37975561416872733
Epoch: 7, step: 1079, loss: 0.3590788245201111, mean loss: 0.3797537660466636
Epoch: 7, step: 1080, loss: 0.3677719533443451, mean loss: 0.37975269519022403
Epoch: 7, step: 1081, loss: 0.335586279630661, mean loss: 0.37974874823619725
Epoch: 7, step: 1082, loss: 0.33964359760284424, mean loss: 0.3797451645394201
Epoch: 7, step: 1083, loss: 0.355063259601593, mean loss: 0.37974295922268153
Epoch: 7, step: 1084, loss: 0.3467823266983032, mean loss: 0.37974001446859196
Epoch: 7, step: 1085, loss: 0.31655198335647583, mean loss: 0.3797343696560931
Epoch: 7, step: 1086, loss: 0.33621180057525635, mean loss: 0.37973048197685405
Epoch: 7, step: 1087, loss: 0.30885472893714905, mean loss: 0.3797241515237422
Epoch: 7, step: 1088, loss: 0.3706274926662445, mean loss: 0.3797233391044462
Epoch: 7, step: 1089, loss: 0.33696943521499634, mean loss: 0.3797195211098142
Epoch: 7, step: 1090, loss: 0.33799082040786743, mean loss: 0.37971579500027747
Epoch: 7, step: 1091, loss: 0.34735769033432007, mean loss: 0.3797129058837894
Epoch: 7, step: 1092, loss: 0.34088918566703796, mean loss: 0.3797094397896713
Epoch: 7, step: 1093, loss: 0.35935887694358826, mean loss: 0.3797076230995404
Epoch: 7, step: 1094, loss: 0.3150281012058258, mean loss: 0.3797018496886778
Epoch: 7, step: 1095, loss: 0.33837890625, mean loss: 0.37969816145738194
Epoch: 7, step: 1096, loss: 0.34591570496559143, mean loss: 0.37969514651258124
Epoch: 7, step: 1097, loss: 0.3272618055343628, mean loss: 0.37969046747090907
Epoch: 7, step: 1098, loss: 0.32811644673347473, mean loss: 0.37968586552384587
Epoch: 7, step: 1099, loss: 0.36205118894577026, mean loss: 0.37968429212300914
Epoch: 7, step: 1100, loss: 0.31648680567741394, mean loss: 0.37967865402090856
Epoch: 7, step: 1101, loss: 0.34446150064468384, mean loss: 0.3796755124371997
Epoch: 7, step: 1102, loss: 0.31956493854522705, mean loss: 0.3796701506876776
Epoch: 7, step: 1103, loss: 0.3766677975654602, mean loss: 0.37966988290734205
Epoch: 7, step: 1104, loss: 0.32413673400878906, mean loss: 0.37966493033899296
Epoch: 7, step: 1105, loss: 0.36562106013298035, mean loss: 0.3796636779874497
Epoch: 7, step: 1106, loss: 0.3327116370201111, mean loss: 0.3796594914479074
Epoch: 7, step: 1107, loss: 0.3458542227745056, mean loss: 0.3796564774260927
Epoch: 7, step: 1108, loss: 0.3705442547798157, mean loss: 0.3796556650678288
Epoch: 7, step: 1109, loss: 0.31780123710632324, mean loss: 0.37965015121259954
Epoch: 7, step: 1110, loss: 0.3576950430870056, mean loss: 0.37964819425492724
Epoch: 7, step: 1111, loss: 0.3632664680480957, mean loss: 0.37964673420802825
Epoch: 7, step: 1112, loss: 0.31087011098861694, mean loss: 0.37964060493049334
Epoch: 7, step: 1113, loss: 0.3172212839126587, mean loss: 0.37963504270263576
Epoch: 7, step: 1114, loss: 0.335053950548172, mean loss: 0.37963107040537525
Epoch: 7, step: 1115, loss: 0.3730442523956299, mean loss: 0.3796304835541627
Epoch: 7, step: 1116, loss: 0.34511834383010864, mean loss: 0.37962740897601355
Epoch: 7, step: 1117, loss: 0.3635624349117279, mean loss: 0.379625977925411
Epoch: 7, step: 1118, loss: 0.35177361965179443, mean loss: 0.37962349708829746
Epoch: 7, step: 1119, loss: 0.3381524384021759, mean loss: 0.3796198035490486
Epoch: 7, step: 1120, loss: 0.31354013085365295, mean loss: 0.3796139188155287
Epoch: 7, step: 1121, loss: 0.353679358959198, mean loss: 0.3796116094157196
Epoch: 7, step: 1122, loss: 0.33681389689445496, mean loss: 0.3796077987387967
Epoch: 7, step: 1123, loss: 0.3675605356693268, mean loss: 0.37960672615483393
Epoch: 7, step: 1124, loss: 0.3336161971092224, mean loss: 0.3796026319209654
Epoch: 7, step: 1125, loss: 0.3731531798839569, mean loss: 0.37960205781984047
Epoch: 7, step: 1126, loss: 0.36172938346862793, mean loss: 0.37960046701660494
Epoch: 7, step: 1127, loss: 0.36422091722488403, mean loss: 0.37959909824214855
Epoch: 7, step: 1128, loss: 0.381343275308609, mean loss: 0.37959925345947226
Epoch: 7, step: 1129, loss: 0.3351113200187683, mean loss: 0.3795952947538805
Epoch: 7, step: 1130, loss: 0.34515097737312317, mean loss: 0.379592230040171
Epoch: 7, step: 1131, loss: 0.3424566686153412, mean loss: 0.3795889261645994
Epoch: 7, step: 1132, loss: 0.34605729579925537, mean loss: 0.37958594318885297
Epoch: 7, step: 1133, loss: 0.365684449672699, mean loss: 0.3795847066212034
Epoch: 7, step: 1134, loss: 0.34531956911087036, mean loss: 0.37958165893486434
Epoch: 7, step: 1135, loss: 0.3492685556411743, mean loss: 0.3795789629989613
Epoch: 7, step: 1136, loss: 0.3463113009929657, mean loss: 0.3795760045585873
Epoch: 7, step: 1137, loss: 0.3681377172470093, mean loss: 0.37957498746030244
Epoch: 7, step: 1138, loss: 0.34377843141555786, mean loss: 0.3795718046954723
Epoch: 7, step: 1139, loss: 0.33428651094436646, mean loss: 0.37956777862028107
Epoch: 7, step: 1140, loss: 0.36664000153541565, mean loss: 0.3795666293823857
Epoch: 7, step: 1141, loss: 0.3378583490848541, mean loss: 0.3795629219796926
Epoch: 7, step: 1142, loss: 0.3637358844280243, mean loss: 0.37956151525695225
Epoch: 7, step: 1143, loss: 0.3335527777671814, mean loss: 0.37955742631832
Epoch: 7, step: 1144, loss: 0.34382423758506775, mean loss: 0.37955425088166017
Epoch: 7, step: 1145, loss: 0.4115528166294098, mean loss: 0.37955709418766226
Epoch: 7, step: 1146, loss: 0.3298811614513397, mean loss: 0.37955268051083096
Epoch: 7, step: 1147, loss: 0.32134899497032166, mean loss: 0.37954750960770905
Epoch: 7, step: 1148, loss: 0.31752416491508484, mean loss: 0.37954199984980797
Epoch: 7, step: 1149, loss: 0.34249937534332275, mean loss: 0.3795387095118699
Epoch: 7, step: 1150, loss: 0.33943554759025574, mean loss: 0.37953514763586654
Epoch: 7, step: 1151, loss: 0.3427670896053314, mean loss: 0.37953188226659207
Epoch: 7, step: 1152, loss: 0.3411024212837219, mean loss: 0.3795284696512841
Epoch: 7, step: 1153, loss: 0.42487281560897827, mean loss: 0.379532495965079
Epoch: 7, step: 1154, loss: 0.3130548596382141, mean loss: 0.3795265936622887
Epoch: 7, step: 1155, loss: 0.3675505816936493, mean loss: 0.37952553045099885
Epoch: 7, step: 1156, loss: 0.3705301582813263, mean loss: 0.37952473192706015
Epoch: 7, step: 1157, loss: 0.3572889566421509, mean loss: 0.3795227582207505
Epoch: 7, step: 1158, loss: 0.3469850420951843, mean loss: 0.37951987034322093
Epoch: 7, step: 1159, loss: 0.35460779070854187, mean loss: 0.3795176594735338
Epoch: 7, step: 1160, loss: 0.34722959995269775, mean loss: 0.37951479426282114
Epoch: 7, step: 1161, loss: 0.40913984179496765, mean loss: 0.3795174229271984
Epoch: 7, step: 1162, loss: 0.3155785799026489, mean loss: 0.3795117500638301
Epoch: 7, step: 1163, loss: 0.3284265100955963, mean loss: 0.37950721801628146
Epoch: 7, step: 1164, loss: 0.2830227315425873, mean loss: 0.3794986591156806
Epoch: 7, step: 1165, loss: 0.35125458240509033, mean loss: 0.37949615387559626
Epoch: 7, step: 1166, loss: 0.3821059465408325, mean loss: 0.37949638534279495
Epoch: 7, step: 1167, loss: 0.3521350920200348, mean loss: 0.3794939588357603
Epoch: 7, step: 1168, loss: 0.33706793189048767, mean loss: 0.3794901966625808
Epoch: 7, step: 1169, loss: 0.3281172215938568, mean loss: 0.3794856415131688
Epoch: 7, step: 1170, loss: 0.356950968503952, mean loss: 0.3794836435813478
Epoch: 7, step: 1171, loss: 0.3171727657318115, mean loss: 0.37947811956735406
Epoch: 7, step: 1172, loss: 0.38385680317878723, mean loss: 0.3794785077141151
Epoch: 7, step: 1173, loss: 0.32079797983169556, mean loss: 0.3794733064618653
Epoch: 7, step: 1174, loss: 0.33000123500823975, mean loss: 0.3794689218060598
Epoch: 7, step: 1175, loss: 0.37839752435684204, mean loss: 0.37946882685768607
Epoch: 7, step: 1176, loss: 0.29514220356941223, mean loss: 0.37946135440546735
Epoch: 7, step: 1177, loss: 0.3483172357082367, mean loss: 0.3794585948698748
Epoch: 7, step: 1178, loss: 0.3176589012145996, mean loss: 0.37945311957142036
Epoch: 7, step: 1179, loss: 0.3498615026473999, mean loss: 0.37945049806035336
Epoch: 7, step: 1180, loss: 0.33933573961257935, mean loss: 0.379446944622631
Epoch: 7, step: 1181, loss: 0.3564457595348358, mean loss: 0.3794449073166002
Epoch: 7, step: 1182, loss: 0.3728288412094116, mean loss: 0.3794443213573311
Epoch: 7, step: 1183, loss: 0.31522756814956665, mean loss: 0.3794386344326758
Epoch: 7, step: 1184, loss: 0.33886897563934326, mean loss: 0.3794350419719662
Epoch: 7, step: 1185, loss: 0.35353684425354004, mean loss: 0.37943274887849016
Epoch: 7, step: 1186, loss: 0.333324134349823, mean loss: 0.3794286666638351
Epoch: 7, step: 1187, loss: 0.38189083337783813, mean loss: 0.3794288846318516
Epoch: 7, step: 1188, loss: 0.36219629645347595, mean loss: 0.37942735921907134
Epoch: 7, step: 1189, loss: 0.3907544016838074, mean loss: 0.37942836178965594
Epoch: 7, step: 1190, loss: 0.3400384485721588, mean loss: 0.3794248756481197
Epoch: 7, step: 1191, loss: 0.36765748262405396, mean loss: 0.3794238342859052
Epoch: 7, step: 1192, loss: 0.3082160949707031, mean loss: 0.379417533273666
Epoch: 7, step: 1193, loss: 0.3439798951148987, mean loss: 0.3794143977544518
Epoch: 7, step: 1194, loss: 0.314769446849823, mean loss: 0.37940867848072757
Epoch: 7, step: 1195, loss: 0.31710341572761536, mean loss: 0.3794031666917367
Epoch: 7, step: 1196, loss: 0.3589974045753479, mean loss: 0.3794013616707622
Epoch: 7, step: 1197, loss: 0.3243807852268219, mean loss: 0.3793964951771797
Epoch: 7, step: 1198, loss: 0.32347387075424194, mean loss: 0.3793915493361589
Epoch: 7, step: 1199, loss: 0.3894694447517395, mean loss: 0.3793924405543598
Epoch: 7, step: 1200, loss: 0.35133999586105347, mean loss: 0.37938996001278286
Epoch: 7, step: 1201, loss: 0.30290257930755615, mean loss: 0.37938319720281777
Epoch: 7, step: 1202, loss: 0.35685044527053833, mean loss: 0.37938120509319595
Epoch: 7, step: 1203, loss: 0.33901357650756836, mean loss: 0.3793776365263125
Epoch: 7, step: 1204, loss: 0.373637855052948, mean loss: 0.3793771291647397
Epoch: 7, step: 1205, loss: 0.4013201594352722, mean loss: 0.379379068622957
Epoch: 7, step: 1206, loss: 0.3366273045539856, mean loss: 0.37937529029648165
Epoch: 7, step: 1207, loss: 0.3950243592262268, mean loss: 0.3793766732117282
Epoch: 7, step: 1208, loss: 0.3616107106208801, mean loss: 0.37937510336436664
Epoch: 7, step: 1209, loss: 0.31667280197143555, mean loss: 0.37936956331299776
Epoch: 7, step: 1210, loss: 0.3591107130050659, mean loss: 0.37936777350380013
Epoch: 7, step: 1211, loss: 0.3168569803237915, mean loss: 0.3793622513489256
Epoch: 7, step: 1212, loss: 0.36272886395454407, mean loss: 0.3793607820982062
Epoch: 7, step: 1213, loss: 0.35110583901405334, mean loss: 0.37935828651941406
Epoch: 7, step: 1214, loss: 0.3386962115764618, mean loss: 0.3793546954150298
Epoch: 7, step: 1215, loss: 0.35598158836364746, mean loss: 0.379352631382263
Epoch: 7, step: 1216, loss: 0.3712482750415802, mean loss: 0.37935191576580907
Epoch: 7, step: 1217, loss: 0.37242257595062256, mean loss: 0.37935130395759653
Epoch: 7, step: 1218, loss: 0.3408050835132599, mean loss: 0.37934790091880033
Epoch: 7, step: 1219, loss: 0.3264206051826477, mean loss: 0.3793432286645863
Epoch: 7, step: 1220, loss: 0.3214699625968933, mean loss: 0.3793381202467147
Epoch: 7, step: 1221, loss: 0.35754096508026123, mean loss: 0.3793361964024811
Epoch: 7, step: 1222, loss: 0.35648879408836365, mean loss: 0.3793341800400847
Epoch: 7, step: 1223, loss: 0.3672100603580475, mean loss: 0.3793331101389479
Epoch: 7, step: 1224, loss: 0.44912463426589966, mean loss: 0.37933926839573134
Epoch: 7, step: 1225, loss: 0.37469884753227234, mean loss: 0.37933885897091546
Epoch: 7, step: 1226, loss: 0.34836938977241516, mean loss: 0.37933612677248596
Epoch: 7, step: 1227, loss: 0.37270647287368774, mean loss: 0.3793355419406318
Epoch: 7, step: 1228, loss: 0.3259468674659729, mean loss: 0.3793308326988152
Epoch: 7, step: 1229, loss: 0.329529345035553, mean loss: 0.3793264402585556
Epoch: 7, step: 1230, loss: 0.33308660984039307, mean loss: 0.3793223623124917
Epoch: 7, step: 1231, loss: 0.34562069177627563, mean loss: 0.379319390383873
Epoch: 7, step: 1232, loss: 0.35032522678375244, mean loss: 0.37931683380477066
Epoch: 7, step: 1233, loss: 0.31379374861717224, mean loss: 0.3793110567738072
Epoch: 7, step: 1234, loss: 0.31896471977233887, mean loss: 0.3793057366347786
Epoch: 7, step: 1235, loss: 0.435062974691391, mean loss: 0.3793106517650727
Epoch: 7, step: 1236, loss: 0.34129953384399414, mean loss: 0.3793073012919197
Epoch: 7, step: 1237, loss: 0.31427791714668274, mean loss: 0.37930156981085633
Epoch: 7, step: 1238, loss: 0.32152265310287476, mean loss: 0.37929647781149894
Epoch: 7, step: 1239, loss: 0.36538076400756836, mean loss: 0.3792952515413365
Epoch: 7, step: 1240, loss: 0.3340339660644531, mean loss: 0.37929126341150327
Epoch: 7, step: 1241, loss: 0.35903599858283997, mean loss: 0.3792894788066725
Epoch: 7, step: 1242, loss: 0.3507591187953949, mean loss: 0.3792869653400166
Epoch: 7, step: 1243, loss: 0.3308708071708679, mean loss: 0.3792827003507487
Epoch: 7, step: 1244, loss: 0.33836787939071655, mean loss: 0.3792790964732749
Epoch: 7, step: 1245, loss: 0.32333624362945557, mean loss: 0.37927416932400204
Epoch: 7, step: 1246, loss: 0.32863515615463257, mean loss: 0.37926970970153007
Epoch: 7, step: 1247, loss: 0.3348439931869507, mean loss: 0.379265797609551
Epoch: 7, step: 1248, loss: 0.31845518946647644, mean loss: 0.37926044314902946
Epoch: 7, step: 1249, loss: 0.39169371128082275, mean loss: 0.37926153781958166
Epoch: 7, step: 1250, loss: 0.33338817954063416, mean loss: 0.3792574993163438
Epoch: 7, step: 1251, loss: 0.3642471134662628, mean loss: 0.3792561779795612
Epoch: 7, step: 1252, loss: 0.3563539385795593, mean loss: 0.3792541621148134
Epoch: 7, step: 1253, loss: 0.3532841205596924, mean loss: 0.3792518764220168
Epoch: 7, step: 1254, loss: 0.3698588013648987, mean loss: 0.3792510497851201
Epoch: 7, step: 1255, loss: 0.32342249155044556, mean loss: 0.3792461370292036
Epoch: 7, step: 1256, loss: 0.35307642817497253, mean loss: 0.3792438343711434
Epoch: 7, step: 1257, loss: 0.3661585748195648, mean loss: 0.37924268310776565
Epoch: 7, step: 1258, loss: 0.36793869733810425, mean loss: 0.37924168865137703
Epoch: 7, step: 1259, loss: 0.33089685440063477, mean loss: 0.3792374359390045
Epoch: 7, step: 1260, loss: 0.3443513810634613, mean loss: 0.379234367414519
Epoch: 7, step: 1261, loss: 0.36227887868881226, mean loss: 0.37923287616660994
Epoch: 7, step: 1262, loss: 0.3863961398601532, mean loss: 0.3792335061256015
Epoch: 7, step: 1263, loss: 0.3359615206718445, mean loss: 0.3792297009914603
Epoch: 7, step: 1264, loss: 0.37370190024375916, mean loss: 0.3792292149454964
Epoch: 7, step: 1265, loss: 0.36814841628074646, mean loss: 0.37922824072370415
Epoch: 7, step: 1266, loss: 0.3501296043395996, mean loss: 0.3792256826018242
Epoch: 7, step: 1267, loss: 0.366863489151001, mean loss: 0.37922459591112
Epoch: 7, step: 1268, loss: 0.3780890703201294, mean loss: 0.37922449610224324
Epoch: 7, step: 1269, loss: 0.357573539018631, mean loss: 0.3792225932232589
Epoch: 7, step: 1270, loss: 0.330463171005249, mean loss: 0.3792183081874721
Epoch: 7, step: 1271, loss: 0.3192831575870514, mean loss: 0.3792130414782805
Epoch: 7, step: 1272, loss: 0.32166799902915955, mean loss: 0.37920798524047633
Epoch: 7, step: 1273, loss: 0.3328837454319, mean loss: 0.37920391528442216
Epoch: 7, step: 1274, loss: 0.3166596591472626, mean loss: 0.3791984207525644
Epoch: 7, step: 1275, loss: 0.3623310327529907, mean loss: 0.379196939077582
Epoch: 7, step: 1276, loss: 0.36394360661506653, mean loss: 0.3791955993031013
Epoch: 7, step: 1277, loss: 0.35967135429382324, mean loss: 0.37919388454418607
Epoch: 7, step: 1278, loss: 0.35509032011032104, mean loss: 0.37919176778257774
Epoch: 7, step: 1279, loss: 0.34900742769241333, mean loss: 0.3791891172434058
Epoch: 7, step: 1280, loss: 0.3291010856628418, mean loss: 0.37918471931280784
Epoch: 7, step: 1281, loss: 0.357191264629364, mean loss: 0.37918278836858627
Epoch: 7, step: 1282, loss: 0.37548166513442993, mean loss: 0.37918246345214046
Epoch: 7, step: 1283, loss: 0.36667293310165405, mean loss: 0.3791813653543218
Epoch: 7, step: 1284, loss: 0.318451464176178, mean loss: 0.37917603489692003
Epoch: 7, step: 1285, loss: 0.34220999479293823, mean loss: 0.37917279055427444
Epoch: 7, step: 1286, loss: 0.3245382606983185, mean loss: 0.37916799594875833
Epoch: 7, step: 1287, loss: 0.351810485124588, mean loss: 0.3791655953247829
Epoch: 7, step: 1288, loss: 0.40529346466064453, mean loss: 0.37916788784644084
Epoch: 7, step: 1289, loss: 0.3744944930076599, mean loss: 0.379167477827592
Epoch: 7, step: 1290, loss: 0.3091389238834381, mean loss: 0.37916133443308864
Epoch: 7, step: 1291, loss: 0.3108970522880554, mean loss: 0.3791553463381636
Epoch: 7, step: 1292, loss: 0.3067508041858673, mean loss: 0.3791489956196168
Epoch: 7, step: 1293, loss: 0.3621031939983368, mean loss: 0.37914750063613833
Epoch: 7, step: 1294, loss: 0.32591524720191956, mean loss: 0.3791428323687145
Epoch: 7, step: 1295, loss: 0.36459189653396606, mean loss: 0.3791415564185361
Epoch: 7, step: 1296, loss: 0.370911568403244, mean loss: 0.37914083480625943
Epoch: 7, step: 1297, loss: 0.34530121088027954, mean loss: 0.3791378679796834
Epoch: 7, step: 1298, loss: 0.34560921788215637, mean loss: 0.37913492867486204
Epoch: 7, step: 1299, loss: 0.3402341306209564, mean loss: 0.3791315187171084
Epoch: 7, step: 1300, loss: 0.36409711837768555, mean loss: 0.3791302009504032
Epoch: 7, step: 1301, loss: 0.3446064889431, mean loss: 0.37912717520877237
Epoch: 7, step: 1302, loss: 0.33624160289764404, mean loss: 0.37912341694286134
Epoch: 7, step: 1303, loss: 0.40089747309684753, mean loss: 0.37912532493936973
Epoch: 7, step: 1304, loss: 0.39071282744407654, mean loss: 0.37912634022917124
Epoch: 7, step: 1305, loss: 0.371881902217865, mean loss: 0.37912570553160585
Epoch: 7, step: 1306, loss: 0.3229605555534363, mean loss: 0.37912078523813425
Epoch: 7, step: 1307, loss: 0.3516920208930969, mean loss: 0.37911838257832825
Epoch: 7, step: 1308, loss: 0.36182549595832825, mean loss: 0.37911686791715454
Epoch: 7, step: 1309, loss: 0.3518753945827484, mean loss: 0.37911448208133963
Epoch: 7, step: 1310, loss: 0.33738207817077637, mean loss: 0.37911082743523133
Epoch: 7, step: 1311, loss: 0.39281922578811646, mean loss: 0.37911202782037606
Epoch: 7, step: 1312, loss: 0.3566715717315674, mean loss: 0.3791100629787607
Epoch: 7, step: 1313, loss: 0.3561573028564453, mean loss: 0.37910805345677484
Epoch: 7, step: 1314, loss: 0.35738280415534973, mean loss: 0.3791061515702913
Epoch: 7, step: 1315, loss: 0.35156139731407166, mean loss: 0.37910374043984174
Epoch: 7, step: 1316, loss: 0.3554878532886505, mean loss: 0.3791016734037672
Epoch: 7, step: 1317, loss: 0.33182692527770996, mean loss: 0.3790975359323751
Epoch: 7, step: 1318, loss: 0.365869402885437, mean loss: 0.3790963783115606
Epoch: 7, step: 1319, loss: 0.31762731075286865, mean loss: 0.3790909994992086
Epoch: 7, step: 1320, loss: 0.41085752844810486, mean loss: 0.3790937789662616
Epoch: 7, step: 1321, loss: 0.29831361770629883, mean loss: 0.37908671158557394
Epoch: 7, step: 1322, loss: 0.29858067631721497, mean loss: 0.379079668804079
Epoch: 7, step: 1323, loss: 0.37869036197662354, mean loss: 0.3790796347499478
Epoch: 7, step: 1324, loss: 0.38006794452667236, mean loss: 0.3790797211935564
Epoch: 7, step: 1325, loss: 0.4105173945426941, mean loss: 0.3790824706839665
Epoch: 7, step: 1326, loss: 0.32089337706565857, mean loss: 0.37907738200065927
Epoch: 7, step: 1327, loss: 0.3425130248069763, mean loss: 0.37907418469765175
Epoch: 7, step: 1328, loss: 0.3348098397254944, mean loss: 0.3790703144217951
Epoch: 7, step: 1329, loss: 0.3217772841453552, mean loss: 0.3790653054140773
Epoch: 7, step: 1330, loss: 0.35959914326667786, mean loss: 0.3790636036777238
Epoch: 7, step: 1331, loss: 0.33518341183662415, mean loss: 0.3790597679966188
Epoch: 7, step: 1332, loss: 0.37777867913246155, mean loss: 0.37905965602311437
Epoch: 7, step: 1333, loss: 0.35999369621276855, mean loss: 0.3790579897095494
Epoch: 7, step: 1334, loss: 0.3408796191215515, mean loss: 0.3790546533143219
Epoch: 7, step: 1335, loss: 0.32824382185935974, mean loss: 0.37905021336050726
Epoch: 7, step: 1336, loss: 0.3513700067996979, mean loss: 0.37904779481908646
Epoch: 7, step: 1337, loss: 0.3674243986606598, mean loss: 0.37904677932055786
Epoch: 7, step: 1338, loss: 0.34448447823524475, mean loss: 0.3790437599878868
Epoch: 7, step: 1339, loss: 0.3243795335292816, mean loss: 0.3790389849855756
Epoch: 7, step: 1340, loss: 0.33299440145492554, mean loss: 0.3790349632733273
Epoch: 7, step: 1341, loss: 0.3190590441226959, mean loss: 0.3790297252017858
Epoch: 7, step: 1342, loss: 0.36831966042518616, mean loss: 0.3790287899066346
Epoch: 7, step: 1343, loss: 0.34334230422973633, mean loss: 0.3790256737273055
Epoch: 7, step: 1344, loss: 0.31389203667640686, mean loss: 0.37901998669010556
Epoch: 7, step: 1345, loss: 0.32066020369529724, mean loss: 0.3790148915457896
Epoch: 7, step: 1346, loss: 0.380825012922287, mean loss: 0.37901504956598836
Epoch: 7, step: 1347, loss: 0.35417526960372925, mean loss: 0.3790128812891062
Epoch: 7, step: 1348, loss: 0.3413645029067993, mean loss: 0.3790095952300696
Epoch: 7, step: 1349, loss: 0.3365322947502136, mean loss: 0.37900588801236323
Epoch: 7, step: 1350, loss: 0.3676701784133911, mean loss: 0.3790048987716268
Epoch: 7, step: 1351, loss: 0.3553306758403778, mean loss: 0.3790028329581075
Epoch: 7, step: 1352, loss: 0.32994839549064636, mean loss: 0.37899855283966516
Epoch: 7, step: 1353, loss: 0.3312080204486847, mean loss: 0.37899438336379787
Epoch: 7, step: 1354, loss: 0.3241370618343353, mean loss: 0.3789895977647811
Epoch: 7, step: 1355, loss: 0.353453129529953, mean loss: 0.37898737022917095
Epoch: 7, step: 1356, loss: 0.3477570116519928, mean loss: 0.37898464625546163
Epoch: 7, step: 1357, loss: 0.32701966166496277, mean loss: 0.37898011416191635
Epoch: 7, step: 1358, loss: 0.32403165102005005, mean loss: 0.37897532228408065
Epoch: 7, step: 1359, loss: 0.36656469106674194, mean loss: 0.3789742400874276
Epoch: 7, step: 1360, loss: 0.3498779535293579, mean loss: 0.37897170313681655
Epoch: 7, step: 1361, loss: 0.3249755799770355, mean loss: 0.37896699554107466
Epoch: 7, step: 1362, loss: 0.34260836243629456, mean loss: 0.37896382592786704
Epoch: 7, step: 1363, loss: 0.37148985266685486, mean loss: 0.37896317443089517
Epoch: 7, step: 1364, loss: 0.34621763229370117, mean loss: 0.37896032029142535
Epoch: 7, step: 1365, loss: 0.3232097923755646, mean loss: 0.37895546143419023
Epoch: 7, step: 1366, loss: 0.33074280619621277, mean loss: 0.3789512598956074
Epoch: 7, step: 1367, loss: 0.31664466857910156, mean loss: 0.3789458306004421
Epoch: 7, step: 1368, loss: 0.3465539813041687, mean loss: 0.37894300827324023
Epoch: 7, step: 1369, loss: 0.3686000406742096, mean loss: 0.3789421071608863
Epoch: 7, step: 1370, loss: 0.3344563841819763, mean loss: 0.3789382317603306
Epoch: 7, step: 1371, loss: 0.37362003326416016, mean loss: 0.37893776850262184
Epoch: 7, step: 1372, loss: 0.34764474630355835, mean loss: 0.37893504286703267
Epoch: 7, step: 1373, loss: 0.2893598973751068, mean loss: 0.3789272415131316
Epoch: 7, step: 1374, loss: 0.3221965432167053, mean loss: 0.37892230110572095
Epoch: 7, step: 1375, loss: 0.38641640543937683, mean loss: 0.37892295367488965
Epoch: 7, step: 1376, loss: 0.33571988344192505, mean loss: 0.3789191919796147
Epoch: 7, step: 1377, loss: 0.3472239077091217, mean loss: 0.378916432508583
Epoch: 7, step: 1378, loss: 0.32600417733192444, mean loss: 0.3789118262358245
Epoch: 7, step: 1379, loss: 0.3321283757686615, mean loss: 0.37890775386026154
Epoch: 7, step: 1380, loss: 0.30695295333862305, mean loss: 0.3789014909304572
Epoch: 7, step: 1381, loss: 0.3694390654563904, mean loss: 0.37890066739473277
Epoch: 7, step: 1382, loss: 0.3504660725593567, mean loss: 0.37889819288469573
Epoch: 7, step: 1383, loss: 0.40926963090896606, mean loss: 0.37890083571779914
Epoch: 7, step: 1384, loss: 0.3164854645729065, mean loss: 0.37889540498856006
Epoch: 7, step: 1385, loss: 0.34078672528266907, mean loss: 0.378892089460484
Epoch: 7, step: 1386, loss: 0.35369569063186646, mean loss: 0.3788898975162623
Epoch: 7, step: 1387, loss: 0.34949228167533875, mean loss: 0.37888734031237914
Epoch: 7, step: 1388, loss: 0.3705103397369385, mean loss: 0.37888661168747045
Epoch: 7, step: 1389, loss: 0.3188181221485138, mean loss: 0.37888138743198785
Epoch: 7, step: 1390, loss: 0.3436163663864136, mean loss: 0.37887832064174126
Epoch: 7, step: 1391, loss: 0.3146253526210785, mean loss: 0.3788727334271308
Epoch: 7, step: 1392, loss: 0.33768078684806824, mean loss: 0.37886915183017583
Epoch: 7, step: 1393, loss: 0.4531807601451874, mean loss: 0.37887561258555014
Epoch: 7, step: 1394, loss: 0.32404622435569763, mean loss: 0.37887084605610305
Epoch: 7, step: 1395, loss: 0.3333054780960083, mean loss: 0.3788668852278729
Epoch: 7, step: 1396, loss: 0.3397958278656006, mean loss: 0.37886348922114865
Epoch: 7, step: 1397, loss: 0.4007273018360138, mean loss: 0.37886538943083187
Epoch: 7, step: 1398, loss: 0.3563121557235718, mean loss: 0.3788634294730925
Epoch: 7, step: 1399, loss: 0.3331676125526428, mean loss: 0.3788594586860817
Epoch: 7, step: 1400, loss: 0.34795883297920227, mean loss: 0.3788567737763843
Epoch: 7, step: 1401, loss: 0.3380947411060333, mean loss: 0.37885323233132173
Epoch: 7, step: 1402, loss: 0.3469226360321045, mean loss: 0.37885045841104553
Epoch: 7, step: 1403, loss: 0.32098960876464844, mean loss: 0.3788454322774765
Epoch: 7, step: 1404, loss: 0.3286866843700409, mean loss: 0.3788410755721949
Epoch: 7, step: 1405, loss: 0.33272671699523926, mean loss: 0.37883707050370635
Epoch: 7, step: 1406, loss: 0.31565016508102417, mean loss: 0.37883158314761234
Epoch: 7, step: 1407, loss: 0.3203641474246979, mean loss: 0.3788265060865041
Epoch: 7, step: 1408, loss: 0.36448049545288086, mean loss: 0.3788252604486962
Epoch: 7, step: 1409, loss: 0.3437959551811218, mean loss: 0.3788222191823941
Epoch: 7, step: 1410, loss: 0.3785560727119446, mean loss: 0.37882219607739626
Epoch: 7, step: 1411, loss: 0.3432547152042389, mean loss: 0.3788191086224594
Epoch: 7, step: 1412, loss: 0.35808444023132324, mean loss: 0.37881730889427684
Epoch: 7, step: 1413, loss: 0.3491162359714508, mean loss: 0.3788147311236708
Epoch: 7, step: 1414, loss: 0.29576462507247925, mean loss: 0.3788075237899859
Epoch: 7, step: 1415, loss: 0.3308251202106476, mean loss: 0.3788033600965132
Epoch: 7, step: 1416, loss: 0.3673994839191437, mean loss: 0.37880237060617244
Epoch: 7, step: 1417, loss: 0.35976406931877136, mean loss: 0.37880071883614924
Epoch: 7, step: 1418, loss: 0.37455621361732483, mean loss: 0.3788003506132622
Epoch: 7, step: 1419, loss: 0.35416463017463684, mean loss: 0.378798213579914
Epoch: 7, step: 1420, loss: 0.35897186398506165, mean loss: 0.37879649388613357
Epoch: 7, step: 1421, loss: 0.3685634434223175, mean loss: 0.3787956063709155
Epoch: 7, step: 1422, loss: 0.35493096709251404, mean loss: 0.37879353676383215
Epoch: 7, step: 1423, loss: 0.3597663640975952, mean loss: 0.37879188681823156
Epoch: 7, step: 1424, loss: 0.3086317181587219, mean loss: 0.3787858033907921
Epoch: 7, step: 1425, loss: 0.34153205156326294, mean loss: 0.37878257348340283
Epoch: 7, step: 1426, loss: 0.3268274664878845, mean loss: 0.37877806935622504
Epoch: 7, step: 1427, loss: 0.34181272983551025, mean loss: 0.3787748650098727
Epoch: 7, step: 1428, loss: 0.34960201382637024, mean loss: 0.3787723363758098
Epoch: 7, step: 1429, loss: 0.3430802822113037, mean loss: 0.3787692429407115
Epoch: 7, step: 1430, loss: 0.3451732099056244, mean loss: 0.37876633142038607
Epoch: 7, step: 1431, loss: 0.34182971715927124, mean loss: 0.3787631306739163
Epoch: 7, step: 1432, loss: 0.3560437858104706, mean loss: 0.378761162097115
Epoch: 7, step: 1433, loss: 0.3447124660015106, mean loss: 0.37875821211478133
Epoch: 7, step: 1434, loss: 0.3199266195297241, mean loss: 0.3787531153814724
Epoch: 7, step: 1435, loss: 0.3549043536186218, mean loss: 0.37875104948041877
Epoch: 7, step: 1436, loss: 0.3477241098880768, mean loss: 0.37874836200189194
Epoch: 7, step: 1437, loss: 0.37592843174934387, mean loss: 0.37874811776750317
Epoch: 7, step: 1438, loss: 0.36935722827911377, mean loss: 0.37874730449223787
Epoch: 7, step: 1439, loss: 0.3271319568157196, mean loss: 0.3787428348570044
Epoch: 7, step: 1440, loss: 0.35855430364608765, mean loss: 0.37874108678087565
Epoch: 7, step: 1441, loss: 0.3486432731151581, mean loss: 0.3787384809095626
Epoch: 7, step: 1442, loss: 0.3466009795665741, mean loss: 0.37873569868279927
Epoch: 7, step: 1443, loss: 0.36734119057655334, mean loss: 0.37873471231610034
Valid: 7, mean loss: 0.20461599032084146
Epoch: 8, step: 0, loss: 0.3615741431713104, mean loss: 0.37873322693835043
Epoch: 8, step: 1, loss: 0.28814786672592163, mean loss: 0.3787253867652318
Epoch: 8, step: 2, loss: 0.3214154541492462, mean loss: 0.37872042701338277
Epoch: 8, step: 3, loss: 0.3299822509288788, mean loss: 0.37871620944882023
Epoch: 8, step: 4, loss: 0.3363087773323059, mean loss: 0.37871254003356397
Epoch: 8, step: 5, loss: 0.3329002857208252, mean loss: 0.37870857635002764
Epoch: 8, step: 6, loss: 0.2866237759590149, mean loss: 0.3787006098477012
Epoch: 8, step: 7, loss: 0.33465278148651123, mean loss: 0.378696799481926
Epoch: 8, step: 8, loss: 0.31964462995529175, mean loss: 0.37869169160462074
Epoch: 8, step: 9, loss: 0.3362807333469391, mean loss: 0.37868802347123054
Epoch: 8, step: 10, loss: 0.3224179148674011, mean loss: 0.3786831570776818
Epoch: 8, step: 11, loss: 0.359842985868454, mean loss: 0.3786815278688259
Epoch: 8, step: 12, loss: 0.31935447454452515, mean loss: 0.3786763979895934
Epoch: 8, step: 13, loss: 0.33702632784843445, mean loss: 0.3786727969114211
Epoch: 8, step: 14, loss: 0.31176987290382385, mean loss: 0.3786670129636379
Epoch: 8, step: 15, loss: 0.3071727156639099, mean loss: 0.3786608326129032
Epoch: 8, step: 16, loss: 0.3410092890262604, mean loss: 0.37865757809275563
Epoch: 8, step: 17, loss: 0.3243151307106018, mean loss: 0.37865288125201385
Epoch: 8, step: 18, loss: 0.3430847227573395, mean loss: 0.3786498073466907
Epoch: 8, step: 19, loss: 0.36575037240982056, mean loss: 0.37864869263575596
Epoch: 8, step: 20, loss: 0.3597641885280609, mean loss: 0.37864706086317257
Epoch: 8, step: 21, loss: 0.3563989996910095, mean loss: 0.37864513861838495
Epoch: 8, step: 22, loss: 0.3438064157962799, mean loss: 0.3786421287935191
Epoch: 8, step: 23, loss: 0.29562827944755554, mean loss: 0.37863495759022386
Epoch: 8, step: 24, loss: 0.34085699915885925, mean loss: 0.37863169439955
Epoch: 8, step: 25, loss: 0.3123951852321625, mean loss: 0.37862597350568516
Epoch: 8, step: 26, loss: 0.38337841629981995, mean loss: 0.37862638394206083
Epoch: 8, step: 27, loss: 0.37003669142723083, mean loss: 0.3786256421724136
Epoch: 8, step: 28, loss: 0.34214866161346436, mean loss: 0.3786224924460896
Epoch: 8, step: 29, loss: 0.35362333059310913, mean loss: 0.3786203339966117
Epoch: 8, step: 30, loss: 0.31266844272613525, mean loss: 0.37861464014430485
Epoch: 8, step: 31, loss: 0.3774242103099823, mean loss: 0.37861453737929845
Epoch: 8, step: 32, loss: 0.34128639101982117, mean loss: 0.378611315269125
Epoch: 8, step: 33, loss: 0.3211982548236847, mean loss: 0.3786063598867285
Epoch: 8, step: 34, loss: 0.30571338534355164, mean loss: 0.3786000689594356
Epoch: 8, step: 35, loss: 0.36910349130630493, mean loss: 0.37859924944117074
Epoch: 8, step: 36, loss: 0.3470670282840729, mean loss: 0.37859652856610326
Epoch: 8, step: 37, loss: 0.3241083025932312, mean loss: 0.3785918272523869
Epoch: 8, step: 38, loss: 0.3136037290096283, mean loss: 0.3785862204800426
Epoch: 8, step: 39, loss: 0.35296157002449036, mean loss: 0.37858400993393704
Epoch: 8, step: 40, loss: 0.4022219181060791, mean loss: 0.3785860489150612
Epoch: 8, step: 41, loss: 0.3428303897380829, mean loss: 0.37858296493548754
Epoch: 8, step: 42, loss: 0.31897661089897156, mean loss: 0.37857782424087466
Epoch: 8, step: 43, loss: 0.32415771484375, mean loss: 0.3785731312338552
Epoch: 8, step: 44, loss: 0.3839332163333893, mean loss: 0.3785735934296903
Epoch: 8, step: 45, loss: 0.30522823333740234, mean loss: 0.3785672694634813
Epoch: 8, step: 46, loss: 0.29468485713005066, mean loss: 0.37856003759760204
Epoch: 8, step: 47, loss: 0.3327600955963135, mean loss: 0.37855608932673984
Epoch: 8, step: 48, loss: 0.3710419237613678, mean loss: 0.37855544160968396
Epoch: 8, step: 49, loss: 0.35630694031715393, mean loss: 0.37855352396606284
Epoch: 8, step: 50, loss: 0.3454954922199249, mean loss: 0.37855067487257443
Epoch: 8, step: 51, loss: 0.2931407690048218, mean loss: 0.37854331448771855
Epoch: 8, step: 52, loss: 0.33774974942207336, mean loss: 0.3785397993162351
Epoch: 8, step: 53, loss: 0.39667439460754395, mean loss: 0.3785413618352159
Epoch: 8, step: 54, loss: 0.31236761808395386, mean loss: 0.3785356606425088
Epoch: 8, step: 55, loss: 0.3668639063835144, mean loss: 0.37853465515023976
Epoch: 8, step: 56, loss: 0.34444475173950195, mean loss: 0.37853171864378693
Epoch: 8, step: 57, loss: 0.3572244942188263, mean loss: 0.3785298833962051
Epoch: 8, step: 58, loss: 0.3457198143005371, mean loss: 0.37852705762158656
Epoch: 8, step: 59, loss: 0.29348284006118774, mean loss: 0.3785197337998883
Epoch: 8, step: 60, loss: 0.36142563819885254, mean loss: 0.3785182618205891
Epoch: 8, step: 61, loss: 0.30423039197921753, mean loss: 0.3785118654136801
Epoch: 8, step: 62, loss: 0.3264857828617096, mean loss: 0.37850738619865193
Epoch: 8, step: 63, loss: 0.3518860936164856, mean loss: 0.37850509442070923
Epoch: 8, step: 64, loss: 0.35788726806640625, mean loss: 0.3785033196228824
Epoch: 8, step: 65, loss: 0.3353632688522339, mean loss: 0.3784996064148629
Epoch: 8, step: 66, loss: 0.3318397104740143, mean loss: 0.3784955905876884
Epoch: 8, step: 67, loss: 0.33003056049346924, mean loss: 0.37849141975893674
Epoch: 8, step: 68, loss: 0.3234918713569641, mean loss: 0.37848668698650734
Epoch: 8, step: 69, loss: 0.3468010425567627, mean loss: 0.37848396063610035
Epoch: 8, step: 70, loss: 0.35820886492729187, mean loss: 0.37848221624173495
Epoch: 8, step: 71, loss: 0.3886736333370209, mean loss: 0.3784830929981953
Epoch: 8, step: 72, loss: 0.3443603217601776, mean loss: 0.3784801577060458
Epoch: 8, step: 73, loss: 0.33753615617752075, mean loss: 0.37847663594434544
Epoch: 8, step: 74, loss: 0.3551836609840393, mean loss: 0.3784746325922374
Epoch: 8, step: 75, loss: 0.31669601798057556, mean loss: 0.37846931967388414
Epoch: 8, step: 76, loss: 0.3302086889743805, mean loss: 0.37846516964974625
Epoch: 8, step: 77, loss: 0.34481966495513916, mean loss: 0.3784622766570812
Epoch: 8, step: 78, loss: 0.3724820017814636, mean loss: 0.3784617624902103
Epoch: 8, step: 79, loss: 0.30413684248924255, mean loss: 0.37845537279626246
Epoch: 8, step: 80, loss: 0.3055974841117859, mean loss: 0.378449109761045
Epoch: 8, step: 81, loss: 0.3834843933582306, mean loss: 0.37844954256864316
Epoch: 8, step: 82, loss: 0.3587226867675781, mean loss: 0.3784478470932842
Epoch: 8, step: 83, loss: 0.36200860142707825, mean loss: 0.37844643430146
Epoch: 8, step: 84, loss: 0.28297027945518494, mean loss: 0.37843822976808833
Epoch: 8, step: 85, loss: 0.36004167795181274, mean loss: 0.378436649036707
Epoch: 8, step: 86, loss: 0.310952752828598, mean loss: 0.37843085095300494
Epoch: 8, step: 87, loss: 0.3032204210758209, mean loss: 0.3784243895758677
Epoch: 8, step: 88, loss: 0.32696181535720825, mean loss: 0.3784199687723097
Epoch: 8, step: 89, loss: 0.34809747338294983, mean loss: 0.3784173641944546
Epoch: 8, step: 90, loss: 0.3351201117038727, mean loss: 0.37841364545766076
Epoch: 8, step: 91, loss: 0.36313188076019287, mean loss: 0.37841233304227967
Epoch: 8, step: 92, loss: 0.3673165738582611, mean loss: 0.37841138020765674
Epoch: 8, step: 93, loss: 0.3485754728317261, mean loss: 0.3784088183059415
Epoch: 8, step: 94, loss: 0.32123395800590515, mean loss: 0.37840390932849666
Epoch: 8, step: 95, loss: 0.3390115201473236, mean loss: 0.37840052742695296
Epoch: 8, step: 96, loss: 0.3156863749027252, mean loss: 0.3783951437757791
Epoch: 8, step: 97, loss: 0.34214064478874207, mean loss: 0.3783920318016171
Epoch: 8, step: 98, loss: 0.3600231111049652, mean loss: 0.378390455205557
Epoch: 8, step: 99, loss: 0.3259483277797699, mean loss: 0.37838595450804363
Epoch: 8, step: 100, loss: 0.33217915892601013, mean loss: 0.3783819892805844
Epoch: 8, step: 101, loss: 0.31630387902259827, mean loss: 0.37837666251636115
Epoch: 8, step: 102, loss: 0.33346986770629883, mean loss: 0.37837280950951346
Epoch: 8, step: 103, loss: 0.3276480734348297, mean loss: 0.37836845769619204
Epoch: 8, step: 104, loss: 0.3464679718017578, mean loss: 0.37836572110136535
Epoch: 8, step: 105, loss: 0.3170870542526245, mean loss: 0.37836046473948093
Epoch: 8, step: 106, loss: 0.40003374218940735, mean loss: 0.37836232367055994
Epoch: 8, step: 107, loss: 0.30794647336006165, mean loss: 0.37835628457533604
Epoch: 8, step: 108, loss: 0.3376102149486542, mean loss: 0.378352790357891
Epoch: 8, step: 109, loss: 0.34181612730026245, mean loss: 0.37834965739072773
Epoch: 8, step: 110, loss: 0.3461780250072479, mean loss: 0.3783468989553009
Epoch: 8, step: 111, loss: 0.36584410071372986, mean loss: 0.3783458270418714
Epoch: 8, step: 112, loss: 0.351294606924057, mean loss: 0.37834350803457456
Epoch: 8, step: 113, loss: 0.3375888466835022, mean loss: 0.3783400145782613
Epoch: 8, step: 114, loss: 0.32094940543174744, mean loss: 0.378335095523736
Epoch: 8, step: 115, loss: 0.3562789559364319, mean loss: 0.3783332052135211
Epoch: 8, step: 116, loss: 0.38781777024269104, mean loss: 0.37833401801367783
Epoch: 8, step: 117, loss: 0.3262677490711212, mean loss: 0.3783295564653537
Epoch: 8, step: 118, loss: 0.3785070776939392, mean loss: 0.37832957167580944
Epoch: 8, step: 119, loss: 0.35140085220336914, mean loss: 0.3783272645545387
Epoch: 8, step: 120, loss: 0.37730586528778076, mean loss: 0.37832717705353064
Epoch: 8, step: 121, loss: 0.3762461841106415, mean loss: 0.37832699879475534
Epoch: 8, step: 122, loss: 0.30766561627388, mean loss: 0.3783209464279441
Epoch: 8, step: 123, loss: 0.35497575998306274, mean loss: 0.37831894701149626
Epoch: 8, step: 124, loss: 0.31042125821113586, mean loss: 0.37831313235971925
Epoch: 8, step: 125, loss: 0.40401190519332886, mean loss: 0.3783153329739369
Epoch: 8, step: 126, loss: 0.37475988268852234, mean loss: 0.3783150285428824
Epoch: 8, step: 127, loss: 0.3051382303237915, mean loss: 0.3783087634060486
Epoch: 8, step: 128, loss: 0.34048211574554443, mean loss: 0.3783055251004531
Epoch: 8, step: 129, loss: 0.339605450630188, mean loss: 0.3783022123051723
Epoch: 8, step: 130, loss: 0.36109092831611633, mean loss: 0.37830073911472556
Epoch: 8, step: 131, loss: 0.36414623260498047, mean loss: 0.3782995276711694
Epoch: 8, step: 132, loss: 0.3915029466152191, mean loss: 0.3783006576171638
Epoch: 8, step: 133, loss: 0.35343971848487854, mean loss: 0.37829853020494986
Epoch: 8, step: 134, loss: 0.3458615839481354, mean loss: 0.37829575473252264
Epoch: 8, step: 135, loss: 0.3349301517009735, mean loss: 0.37829204446532283
Epoch: 8, step: 136, loss: 0.34552326798439026, mean loss: 0.3782892410795344
Epoch: 8, step: 137, loss: 0.3414668142795563, mean loss: 0.3782860911713393
Epoch: 8, step: 138, loss: 0.3288429081439972, mean loss: 0.3782818620050552
Epoch: 8, step: 139, loss: 0.3702753186225891, mean loss: 0.37828117721687676
Epoch: 8, step: 140, loss: 0.3003569543361664, mean loss: 0.37827451303977244
Epoch: 8, step: 141, loss: 0.3701413571834564, mean loss: 0.3782738175415805
Epoch: 8, step: 142, loss: 0.37081795930862427, mean loss: 0.3782731800162934
Epoch: 8, step: 143, loss: 0.3150666058063507, mean loss: 0.3782677758974314
Epoch: 8, step: 144, loss: 0.31799042224884033, mean loss: 0.37826262266552163
Epoch: 8, step: 145, loss: 0.32578325271606445, mean loss: 0.37825813648241774
Epoch: 8, step: 146, loss: 0.3343364894390106, mean loss: 0.37825438217460994
Epoch: 8, step: 147, loss: 0.3558051288127899, mean loss: 0.37825246343500635
Epoch: 8, step: 148, loss: 0.4574461877346039, mean loss: 0.3782592315509195
Epoch: 8, step: 149, loss: 0.3133949935436249, mean loss: 0.3782536885464752
Epoch: 8, step: 150, loss: 0.3026217222213745, mean loss: 0.3782472259329295
Epoch: 8, step: 151, loss: 0.3406399190425873, mean loss: 0.3782440127317256
Epoch: 8, step: 152, loss: 0.3461201786994934, mean loss: 0.3782412682777288
Epoch: 8, step: 153, loss: 0.3689219355583191, mean loss: 0.3782404721618293
Epoch: 8, step: 154, loss: 0.3662693202495575, mean loss: 0.3782394495982424
Epoch: 8, step: 155, loss: 0.33620795607566833, mean loss: 0.3782358596175862
Epoch: 8, step: 156, loss: 0.3644191026687622, mean loss: 0.3782346796058902
Epoch: 8, step: 157, loss: 0.35802868008613586, mean loss: 0.37823295407219937
Epoch: 8, step: 158, loss: 0.345248818397522, mean loss: 0.3782301375633039
Epoch: 8, step: 159, loss: 0.32412031292915344, mean loss: 0.3782255175304629
Epoch: 8, step: 160, loss: 0.3381578028202057, mean loss: 0.37822209674033996
Epoch: 8, step: 161, loss: 0.35243192315101624, mean loss: 0.37821989508645665
Epoch: 8, step: 162, loss: 0.34081417322158813, mean loss: 0.37821670210977165
Epoch: 8, step: 163, loss: 0.3173886239528656, mean loss: 0.37821151022874083
Epoch: 8, step: 164, loss: 0.36311912536621094, mean loss: 0.3782102221528799
Epoch: 8, step: 165, loss: 0.3778558671474457, mean loss: 0.37821019191265076
Epoch: 8, step: 166, loss: 0.3239648938179016, mean loss: 0.37820556307929515
Epoch: 8, step: 167, loss: 0.35172027349472046, mean loss: 0.3782033032422999
Epoch: 8, step: 168, loss: 0.3398169279098511, mean loss: 0.3782000282337398
Epoch: 8, step: 169, loss: 0.35675758123397827, mean loss: 0.378198198985574
Epoch: 8, step: 170, loss: 0.30919349193573, mean loss: 0.37819231271865855
Epoch: 8, step: 171, loss: 0.319313108921051, mean loss: 0.37818729060983924
Epoch: 8, step: 172, loss: 0.3546423017978668, mean loss: 0.378185282508448
Epoch: 8, step: 173, loss: 0.3149493336677551, mean loss: 0.37817988971049127
Epoch: 8, step: 174, loss: 0.33019235730171204, mean loss: 0.3781757976551993
Epoch: 8, step: 175, loss: 0.40128180384635925, mean loss: 0.3781777678126167
Epoch: 8, step: 176, loss: 0.3828130066394806, mean loss: 0.3781781630073329
Epoch: 8, step: 177, loss: 0.3786357343196869, mean loss: 0.37817820201596997
Epoch: 8, step: 178, loss: 0.40306520462036133, mean loss: 0.37818032348921216
Epoch: 8, step: 179, loss: 0.3079366683959961, mean loss: 0.37817433613368084
Epoch: 8, step: 180, loss: 0.37893739342689514, mean loss: 0.37817440116882045
Epoch: 8, step: 181, loss: 0.3200283348560333, mean loss: 0.3781694458197227
Epoch: 8, step: 182, loss: 0.3134133219718933, mean loss: 0.3781639276157306
Epoch: 8, step: 183, loss: 0.3238959312438965, mean loss: 0.3781593035533267
Epoch: 8, step: 184, loss: 0.36096328496932983, mean loss: 0.3781578384414085
Epoch: 8, step: 185, loss: 0.3310232162475586, mean loss: 0.37815382288320487
Epoch: 8, step: 186, loss: 0.33173128962516785, mean loss: 0.378149868327173
Epoch: 8, step: 187, loss: 0.41157424449920654, mean loss: 0.37815271537795425
Epoch: 8, step: 188, loss: 0.3719439208507538, mean loss: 0.37815218656486105
Epoch: 8, step: 189, loss: 0.330701619386673, mean loss: 0.37814814546733266
Epoch: 8, step: 190, loss: 0.33591601252555847, mean loss: 0.37814454910073625
Epoch: 8, step: 191, loss: 0.34243080019950867, mean loss: 0.37814150807988295
Epoch: 8, step: 192, loss: 0.34622523188591003, mean loss: 0.3781387906447025
Epoch: 8, step: 193, loss: 0.34476348757743835, mean loss: 0.3781359492260862
Epoch: 8, step: 194, loss: 0.3601425290107727, mean loss: 0.37813441748009013
Epoch: 8, step: 195, loss: 0.3676396310329437, mean loss: 0.3781335241547201
Epoch: 8, step: 196, loss: 0.34094947576522827, mean loss: 0.3781303592855066
Epoch: 8, step: 197, loss: 0.32126012444496155, mean loss: 0.3781255192655202
Epoch: 8, step: 198, loss: 0.33894768357276917, mean loss: 0.3781221852653761
Epoch: 8, step: 199, loss: 0.3057272732257843, mean loss: 0.37811602504481456
Epoch: 8, step: 200, loss: 0.3352017104625702, mean loss: 0.37811237369498196
Epoch: 8, step: 201, loss: 0.3929322063922882, mean loss: 0.3781136345281194
Epoch: 8, step: 202, loss: 0.39415422081947327, mean loss: 0.37811499910372903
Epoch: 8, step: 203, loss: 0.3460296094417572, mean loss: 0.3781122698259422
Epoch: 8, step: 204, loss: 0.34669730067253113, mean loss: 0.3781095978033894
Epoch: 8, step: 205, loss: 0.32063522934913635, mean loss: 0.3781047096958495
Epoch: 8, step: 206, loss: 0.3197999894618988, mean loss: 0.3780997513898512
Epoch: 8, step: 207, loss: 0.35386019945144653, mean loss: 0.37809769020346184
Epoch: 8, step: 208, loss: 0.3510095179080963, mean loss: 0.37809538698330236
Epoch: 8, step: 209, loss: 0.36304712295532227, mean loss: 0.3780941075865987
Epoch: 8, step: 210, loss: 0.33312442898750305, mean loss: 0.37809028460958616
Epoch: 8, step: 211, loss: 0.3085351884365082, mean loss: 0.3780843720716592
Epoch: 8, step: 212, loss: 0.3083731532096863, mean loss: 0.37807844676618857
Epoch: 8, step: 213, loss: 0.3565336763858795, mean loss: 0.3780766156621277
Epoch: 8, step: 214, loss: 0.343350887298584, mean loss: 0.37807366455068353
Epoch: 8, step: 215, loss: 0.3325532376766205, mean loss: 0.3780697963974821
Epoch: 8, step: 216, loss: 0.32630544900894165, mean loss: 0.378065398033357
Epoch: 8, step: 217, loss: 0.32835403084754944, mean loss: 0.3780611744677507
Epoch: 8, step: 218, loss: 0.33217450976371765, mean loss: 0.37805727618683116
Epoch: 8, step: 219, loss: 0.3274739980697632, mean loss: 0.3780529792722782
Epoch: 8, step: 220, loss: 0.3351127803325653, mean loss: 0.37804933192674695
Epoch: 8, step: 221, loss: 0.32241860032081604, mean loss: 0.37804460704721526
Epoch: 8, step: 222, loss: 0.3400145173072815, mean loss: 0.37804137731560256
Epoch: 8, step: 223, loss: 0.3325861096382141, mean loss: 0.37803751732344243
Epoch: 8, step: 224, loss: 0.3787619471549988, mean loss: 0.37803757883569783
Epoch: 8, step: 225, loss: 0.32796311378479004, mean loss: 0.3780333273103921
Epoch: 8, step: 226, loss: 0.32560446858406067, mean loss: 0.37802887626542
Epoch: 8, step: 227, loss: 0.3663221001625061, mean loss: 0.3780278824813705
Epoch: 8, step: 228, loss: 0.36901286244392395, mean loss: 0.3780271172644927
Epoch: 8, step: 229, loss: 0.33913734555244446, mean loss: 0.3780238164860415
Epoch: 8, step: 230, loss: 0.34867560863494873, mean loss: 0.37802132576145087
Epoch: 8, step: 231, loss: 0.34442463517189026, mean loss: 0.3780184747184613
Epoch: 8, step: 232, loss: 0.35897496342658997, mean loss: 0.37801685880744795
Epoch: 8, step: 233, loss: 0.3564973771572113, mean loss: 0.3780150329562983
Epoch: 8, step: 234, loss: 0.34669187664985657, mean loss: 0.37801237552384676
Epoch: 8, step: 235, loss: 0.3159920275211334, mean loss: 0.37800711421166466
Epoch: 8, step: 236, loss: 0.3512398898601532, mean loss: 0.37800484368622983
Epoch: 8, step: 237, loss: 0.35937368869781494, mean loss: 0.3780032634355947
Epoch: 8, step: 238, loss: 0.34423357248306274, mean loss: 0.3780003994129543
Epoch: 8, step: 239, loss: 0.3686946630477905, mean loss: 0.37799961025620693
Epoch: 8, step: 240, loss: 0.31728100776672363, mean loss: 0.37799446155761546
Epoch: 8, step: 241, loss: 0.3664235472679138, mean loss: 0.377993480472802
Epoch: 8, step: 242, loss: 0.3577028214931488, mean loss: 0.3779917601965002
Epoch: 8, step: 243, loss: 0.33100810647010803, mean loss: 0.3779877771807554
Epoch: 8, step: 244, loss: 0.3648177981376648, mean loss: 0.3779866607970101
Epoch: 8, step: 245, loss: 0.34147271513938904, mean loss: 0.3779835658702719
Epoch: 8, step: 246, loss: 0.35951370000839233, mean loss: 0.3779820004947433
Epoch: 8, step: 247, loss: 0.34306755661964417, mean loss: 0.37797904164356744
Epoch: 8, step: 248, loss: 0.3014257848262787, mean loss: 0.37797255462917734
Epoch: 8, step: 249, loss: 0.3305833339691162, mean loss: 0.37796853927409685
Epoch: 8, step: 250, loss: 0.3603644073009491, mean loss: 0.3779670477776999
Epoch: 8, step: 251, loss: 0.36271771788597107, mean loss: 0.3779657558995322
Epoch: 8, step: 252, loss: 0.3276817798614502, mean loss: 0.3779614963505243
Epoch: 8, step: 253, loss: 0.3174716830253601, mean loss: 0.37795637270040355
Epoch: 8, step: 254, loss: 0.3847806453704834, mean loss: 0.37795695068572327
Epoch: 8, step: 255, loss: 0.32185402512550354, mean loss: 0.3779521994217023
Epoch: 8, step: 256, loss: 0.3721249997615814, mean loss: 0.3779517059675859
Epoch: 8, step: 257, loss: 0.36432501673698425, mean loss: 0.3779505521412328
Epoch: 8, step: 258, loss: 0.3382929861545563, mean loss: 0.3779471944605972
Epoch: 8, step: 259, loss: 0.36442452669143677, mean loss: 0.37794604963603157
Epoch: 8, step: 260, loss: 0.3660796284675598, mean loss: 0.377945045113796
Epoch: 8, step: 261, loss: 0.30718204379081726, mean loss: 0.37793905535576966
Epoch: 8, step: 262, loss: 0.36351242661476135, mean loss: 0.37793783431228756
Epoch: 8, step: 263, loss: 0.3622654974460602, mean loss: 0.37793650794660827
Epoch: 8, step: 264, loss: 0.36045196652412415, mean loss: 0.3779350283374501
Epoch: 8, step: 265, loss: 0.33671119809150696, mean loss: 0.3779315401135335
Epoch: 8, step: 266, loss: 0.3190787434577942, mean loss: 0.3779265606062439
Epoch: 8, step: 267, loss: 0.33047017455101013, mean loss: 0.3779225456835658
Epoch: 8, step: 268, loss: 0.36714640259742737, mean loss: 0.37792163407345786
Epoch: 8, step: 269, loss: 0.34668824076652527, mean loss: 0.37791899210143054
Epoch: 8, step: 270, loss: 0.3258374333381653, mean loss: 0.3779145869962319
Epoch: 8, step: 271, loss: 0.3346806764602661, mean loss: 0.37791093054236385
Epoch: 8, step: 272, loss: 0.32948270440101624, mean loss: 0.37790683513211937
Epoch: 8, step: 273, loss: 0.3863191306591034, mean loss: 0.37790754647116276
Epoch: 8, step: 274, loss: 0.3530564606189728, mean loss: 0.3779054452548059
Epoch: 8, step: 275, loss: 0.36606091260910034, mean loss: 0.37790444385705096
Epoch: 8, step: 276, loss: 0.3851972222328186, mean loss: 0.37790506037394805
Epoch: 8, step: 277, loss: 0.33475247025489807, mean loss: 0.3779014126486633
Epoch: 8, step: 278, loss: 0.31133368611335754, mean loss: 0.37789578609752345
Epoch: 8, step: 279, loss: 0.3450027108192444, mean loss: 0.37789300608778054
Epoch: 8, step: 280, loss: 0.33646881580352783, mean loss: 0.3778895053533696
Epoch: 8, step: 281, loss: 0.3495803773403168, mean loss: 0.3778871131674635
Epoch: 8, step: 282, loss: 0.292958527803421, mean loss: 0.37787993711462325
Epoch: 8, step: 283, loss: 0.3546513319015503, mean loss: 0.37787797457616323
Epoch: 8, step: 284, loss: 0.32247915863990784, mean loss: 0.3778732944362683
Epoch: 8, step: 285, loss: 0.3551229238510132, mean loss: 0.37787137262763637
Epoch: 8, step: 286, loss: 0.3134530186653137, mean loss: 0.3778659314287207
Epoch: 8, step: 287, loss: 0.33650460839271545, mean loss: 0.37786243807373454
Epoch: 8, step: 288, loss: 0.33679723739624023, mean loss: 0.3778589700219925
Epoch: 8, step: 289, loss: 0.36234769225120544, mean loss: 0.3778576601691154
Epoch: 8, step: 290, loss: 0.32750245928764343, mean loss: 0.3778534082734064
Epoch: 8, step: 291, loss: 0.34294450283050537, mean loss: 0.37785046088186275
Epoch: 8, step: 292, loss: 0.3437225818634033, mean loss: 0.37784757967637367
Epoch: 8, step: 293, loss: 0.3410325050354004, mean loss: 0.37784447186997144
Epoch: 8, step: 294, loss: 0.3764549195766449, mean loss: 0.3778443545784805
Epoch: 8, step: 295, loss: 0.3331323266029358, mean loss: 0.3778405807746338
Epoch: 8, step: 296, loss: 0.3175516724586487, mean loss: 0.37783549267367034
Epoch: 8, step: 297, loss: 0.3349818289279938, mean loss: 0.3778318763307382
Epoch: 8, step: 298, loss: 0.34115472435951233, mean loss: 0.3778287814735978
Epoch: 8, step: 299, loss: 0.38438084721565247, mean loss: 0.3778293342972345
Epoch: 8, step: 300, loss: 0.3364328145980835, mean loss: 0.37782584180422013
Epoch: 8, step: 301, loss: 0.346529096364975, mean loss: 0.3778232016198571
Epoch: 8, step: 302, loss: 0.35640832781791687, mean loss: 0.3778213952197051
Epoch: 8, step: 303, loss: 0.3267076015472412, mean loss: 0.3778170840022901
Epoch: 8, step: 304, loss: 0.33521154522895813, mean loss: 0.37781349072078774
Epoch: 8, step: 305, loss: 0.3765060603618622, mean loss: 0.3778133804635471
Epoch: 8, step: 306, loss: 0.3089165985584259, mean loss: 0.37780757080152627
Epoch: 8, step: 307, loss: 0.33663761615753174, mean loss: 0.3778040994731415
Epoch: 8, step: 308, loss: 0.3656638562679291, mean loss: 0.37780307593016826
Epoch: 8, step: 309, loss: 0.3476783037185669, mean loss: 0.3778005363270481
Epoch: 8, step: 310, loss: 0.3365892171859741, mean loss: 0.37779706238966787
Epoch: 8, step: 311, loss: 0.35555046796798706, mean loss: 0.3777951872552763
Epoch: 8, step: 312, loss: 0.3654685914516449, mean loss: 0.37779414835128944
Epoch: 8, step: 313, loss: 0.3888190984725952, mean loss: 0.3777950774723177
Epoch: 8, step: 314, loss: 0.33147624135017395, mean loss: 0.3777911743092502
Epoch: 8, step: 315, loss: 0.3499844968318939, mean loss: 0.3777888313131702
Epoch: 8, step: 316, loss: 0.35973191261291504, mean loss: 0.37778730996186005
Epoch: 8, step: 317, loss: 0.3794405162334442, mean loss: 0.37778744923787283
Epoch: 8, step: 318, loss: 0.34296292066574097, mean loss: 0.37778451565783977
Epoch: 8, step: 319, loss: 0.33122357726097107, mean loss: 0.37778059374591283
Epoch: 8, step: 320, loss: 0.33616092801094055, mean loss: 0.3777770883415723
Epoch: 8, step: 321, loss: 0.31602931022644043, mean loss: 0.37777188809076256
Epoch: 8, step: 322, loss: 0.3505168855190277, mean loss: 0.3777695929326513
Epoch: 8, step: 323, loss: 0.35069623589515686, mean loss: 0.3777673132629782
Epoch: 8, step: 324, loss: 0.3250424861907959, mean loss: 0.37776287402520164
Epoch: 8, step: 325, loss: 0.36770132184028625, mean loss: 0.3777620269505944
Epoch: 8, step: 326, loss: 0.3077428936958313, mean loss: 0.37775613258800034
Epoch: 8, step: 327, loss: 0.3734358251094818, mean loss: 0.3777557689257547
Epoch: 8, step: 328, loss: 0.32361501455307007, mean loss: 0.3777512120067771
Epoch: 8, step: 329, loss: 0.33971917629241943, mean loss: 0.3777480111958265
Epoch: 8, step: 330, loss: 0.3286767303943634, mean loss: 0.37774388165944667
Epoch: 8, step: 331, loss: 0.42671114206314087, mean loss: 0.3777480020953608
Epoch: 8, step: 332, loss: 0.3448752462863922, mean loss: 0.3777452361924741
Epoch: 8, step: 333, loss: 0.4027283191680908, mean loss: 0.3777473380840251
Epoch: 8, step: 334, loss: 0.33906272053718567, mean loss: 0.377744083720641
Epoch: 8, step: 335, loss: 0.3381374776363373, mean loss: 0.37774075207477253
Epoch: 8, step: 336, loss: 0.35820719599723816, mean loss: 0.37773910908073793
Epoch: 8, step: 337, loss: 0.31153589487075806, mean loss: 0.3777335411064562
Epoch: 8, step: 338, loss: 0.31224530935287476, mean loss: 0.3777280337284599
Epoch: 8, step: 339, loss: 0.36921435594558716, mean loss: 0.37772731781206376
Epoch: 8, step: 340, loss: 0.3222087025642395, mean loss: 0.3777226496362252
Epoch: 8, step: 341, loss: 0.3066880404949188, mean loss: 0.37771667733009257
Epoch: 8, step: 342, loss: 0.3638022840023041, mean loss: 0.3777155075618431
Epoch: 8, step: 343, loss: 0.35124489665031433, mean loss: 0.3777132823928021
Epoch: 8, step: 344, loss: 0.409127801656723, mean loss: 0.37771592293405315
Epoch: 8, step: 345, loss: 0.32066091895103455, mean loss: 0.3777111275899631
Epoch: 8, step: 346, loss: 0.3688352704048157, mean loss: 0.377710381656928
Epoch: 8, step: 347, loss: 0.32816195487976074, mean loss: 0.3777062179235854
Epoch: 8, step: 348, loss: 0.3125440776348114, mean loss: 0.37770074257359054
Epoch: 8, step: 349, loss: 0.33323004841804504, mean loss: 0.3776970061684355
Epoch: 8, step: 350, loss: 0.3224647641181946, mean loss: 0.37769236597335437
Epoch: 8, step: 351, loss: 0.3189888596534729, mean loss: 0.37768743456321324
Epoch: 8, step: 352, loss: 0.32594311237335205, mean loss: 0.377683088127078
Epoch: 8, step: 353, loss: 0.33166196942329407, mean loss: 0.37767922275510557
Epoch: 8, step: 354, loss: 0.338484525680542, mean loss: 0.3776759310193976
Epoch: 8, step: 355, loss: 0.32762643694877625, mean loss: 0.37767172800511556
Epoch: 8, step: 356, loss: 0.3520072400569916, mean loss: 0.37766957295532566
Epoch: 8, step: 357, loss: 0.328909695148468, mean loss: 0.37766547892696234
Epoch: 8, step: 358, loss: 0.3529847264289856, mean loss: 0.3776634068295316
Epoch: 8, step: 359, loss: 0.3438663184642792, mean loss: 0.37766056959914496
Epoch: 8, step: 360, loss: 0.3141520619392395, mean loss: 0.3776552385735712
Epoch: 8, step: 361, loss: 0.32934024930000305, mean loss: 0.37765118326139446
Epoch: 8, step: 362, loss: 0.3888259828090668, mean loss: 0.3776521211379826
Epoch: 8, step: 363, loss: 0.34195441007614136, mean loss: 0.37764912535826944
Epoch: 8, step: 364, loss: 0.3435139060020447, mean loss: 0.3776462609444609
Epoch: 8, step: 365, loss: 0.3328927159309387, mean loss: 0.3776425058223755
Epoch: 8, step: 366, loss: 0.3552028238773346, mean loss: 0.37764062314077934
Epoch: 8, step: 367, loss: 0.37710362672805786, mean loss: 0.3776405780907447
Epoch: 8, step: 368, loss: 0.34037861227989197, mean loss: 0.37763745234912816
Epoch: 8, step: 369, loss: 0.32504457235336304, mean loss: 0.37763304093493627
Epoch: 8, step: 370, loss: 0.327164888381958, mean loss: 0.37762880809483285
Epoch: 8, step: 371, loss: 0.3698682487010956, mean loss: 0.37762815725959353
Epoch: 8, step: 372, loss: 0.34207484126091003, mean loss: 0.3776251758494469
Epoch: 8, step: 373, loss: 0.3723686933517456, mean loss: 0.37762473509122974
Epoch: 8, step: 374, loss: 0.325732946395874, mean loss: 0.37762038430824196
Epoch: 8, step: 375, loss: 0.33342161774635315, mean loss: 0.3776166788449152
Epoch: 8, step: 376, loss: 0.33716556429862976, mean loss: 0.37761328785534803
Epoch: 8, step: 377, loss: 0.3544076979160309, mean loss: 0.3776113427095023
Epoch: 8, step: 378, loss: 0.3224664330482483, mean loss: 0.3776067207239469
Epoch: 8, step: 379, loss: 0.32135632634162903, mean loss: 0.37760200647701575
Epoch: 8, step: 380, loss: 0.3652920722961426, mean loss: 0.3776009748894702
Epoch: 8, step: 381, loss: 0.33547449111938477, mean loss: 0.37759744493440317
Epoch: 8, step: 382, loss: 0.31986719369888306, mean loss: 0.37759260787941906
Epoch: 8, step: 383, loss: 0.35273993015289307, mean loss: 0.3775905257180814
Epoch: 8, step: 384, loss: 0.33302029967308044, mean loss: 0.37758679193019123
Epoch: 8, step: 385, loss: 0.31546998023986816, mean loss: 0.3775815886455799
Epoch: 8, step: 386, loss: 0.3420264422893524, mean loss: 0.37757861057820774
Epoch: 8, step: 387, loss: 0.38112005591392517, mean loss: 0.3775789071816697
Epoch: 8, step: 388, loss: 0.3241051137447357, mean loss: 0.3775744290145617
Epoch: 8, step: 389, loss: 0.32052814960479736, mean loss: 0.3775696520693758
Epoch: 8, step: 390, loss: 0.3325369656085968, mean loss: 0.37756588143499076
Epoch: 8, step: 391, loss: 0.33417895436286926, mean loss: 0.3775622489059325
Epoch: 8, step: 392, loss: 0.36935827136039734, mean loss: 0.37756156209324554
Epoch: 8, step: 393, loss: 0.32469481229782104, mean loss: 0.3775571366161155
Epoch: 8, step: 394, loss: 0.31425541639328003, mean loss: 0.37755183807085535
Epoch: 8, step: 395, loss: 0.32853904366493225, mean loss: 0.3775477358952271
Epoch: 8, step: 396, loss: 0.3391191363334656, mean loss: 0.37754451984371135
Epoch: 8, step: 397, loss: 0.3222913444042206, mean loss: 0.3775398961470218
Epoch: 8, step: 398, loss: 0.3669869005680084, mean loss: 0.3775390131250505
Epoch: 8, step: 399, loss: 0.41996845602989197, mean loss: 0.37754256311190665
Epoch: 8, step: 400, loss: 0.3340611755847931, mean loss: 0.37753892541530104
Epoch: 8, step: 401, loss: 0.38858646154403687, mean loss: 0.377539849585966
Epoch: 8, step: 402, loss: 0.32068559527397156, mean loss: 0.37753509389760864
Epoch: 8, step: 403, loss: 0.32698482275009155, mean loss: 0.3775308658722534
Epoch: 8, step: 404, loss: 0.32279837131500244, mean loss: 0.3775262884285336
Epoch: 8, step: 405, loss: 0.342043399810791, mean loss: 0.3775233211356236
Epoch: 8, step: 406, loss: 0.36363959312438965, mean loss: 0.377522160191731
Epoch: 8, step: 407, loss: 0.3382608890533447, mean loss: 0.3775188774767529
Epoch: 8, step: 408, loss: 0.3387403190135956, mean loss: 0.3775156353934435
Epoch: 8, step: 409, loss: 0.30073463916778564, mean loss: 0.3775092166510739
Epoch: 8, step: 410, loss: 0.34875553846359253, mean loss: 0.3775068131002767
Epoch: 8, step: 411, loss: 0.3546796441078186, mean loss: 0.37750490511222984
Epoch: 8, step: 412, loss: 0.31023693084716797, mean loss: 0.37749928305002634
Epoch: 8, step: 413, loss: 0.32710638642311096, mean loss: 0.3774950717098436
Epoch: 8, step: 414, loss: 0.32746776938438416, mean loss: 0.37749089127177843
Epoch: 8, step: 415, loss: 0.3358839452266693, mean loss: 0.37748741475556474
Epoch: 8, step: 416, loss: 0.33300045132637024, mean loss: 0.3774836979067529
Epoch: 8, step: 417, loss: 0.38953420519828796, mean loss: 0.37748470463250827
Epoch: 8, step: 418, loss: 0.29979634284973145, mean loss: 0.3774782149188851
Epoch: 8, step: 419, loss: 0.35724499821662903, mean loss: 0.3774765248740553
Epoch: 8, step: 420, loss: 0.33180707693099976, mean loss: 0.37747271050439496
Epoch: 8, step: 421, loss: 0.3522097170352936, mean loss: 0.37747060068366095
Epoch: 8, step: 422, loss: 0.3164302706718445, mean loss: 0.37746550337009005
Epoch: 8, step: 423, loss: 0.39635607600212097, mean loss: 0.3774670807392143
Epoch: 8, step: 424, loss: 0.30125224590301514, mean loss: 0.3774607173063984
Epoch: 8, step: 425, loss: 0.31980204582214355, mean loss: 0.3774559035919649
Epoch: 8, step: 426, loss: 0.32975155115127563, mean loss: 0.3774519212601809
Epoch: 8, step: 427, loss: 0.3328193426132202, mean loss: 0.3774481956693089
Epoch: 8, step: 428, loss: 0.36377277970314026, mean loss: 0.37744705424405506
Epoch: 8, step: 429, loss: 0.29398632049560547, mean loss: 0.37744008873464524
Epoch: 8, step: 430, loss: 0.3542684018611908, mean loss: 0.3774381550213119
Epoch: 8, step: 431, loss: 0.36261725425720215, mean loss: 0.3774369182972828
Epoch: 8, step: 432, loss: 0.3785862624645233, mean loss: 0.37743701419583664
Epoch: 8, step: 433, loss: 0.3086094856262207, mean loss: 0.3774312718690746
Epoch: 8, step: 434, loss: 0.35544756054878235, mean loss: 0.37742943790633826
Epoch: 8, step: 435, loss: 0.36460065841674805, mean loss: 0.3774283677712457
Epoch: 8, step: 436, loss: 0.3513337969779968, mean loss: 0.37742619122851545
Epoch: 8, step: 437, loss: 0.3535264730453491, mean loss: 0.37742419792424664
Epoch: 8, step: 438, loss: 0.399001806974411, mean loss: 0.3774259974079469
Epoch: 8, step: 439, loss: 0.37449806928634644, mean loss: 0.37742575325116556
Epoch: 8, step: 440, loss: 0.3206407129764557, mean loss: 0.37742101840248093
Epoch: 8, step: 441, loss: 0.324068546295166, mean loss: 0.3774165701390069
Epoch: 8, step: 442, loss: 0.352593332529068, mean loss: 0.3774145006735955
Epoch: 8, step: 443, loss: 0.39362266659736633, mean loss: 0.37741585180446613
Epoch: 8, step: 444, loss: 0.36090150475502014, mean loss: 0.37741447526474375
Epoch: 8, step: 445, loss: 0.34625038504600525, mean loss: 0.3774118778243188
Epoch: 8, step: 446, loss: 0.35848701000213623, mean loss: 0.37741030062056663
Epoch: 8, step: 447, loss: 0.3431686758995056, mean loss: 0.3774074471518399
Epoch: 8, step: 448, loss: 0.38815104961395264, mean loss: 0.3774083423774429
Epoch: 8, step: 449, loss: 0.32855224609375, mean loss: 0.3774042717145298
Epoch: 8, step: 450, loss: 0.35298916697502136, mean loss: 0.37740223763098907
Epoch: 8, step: 451, loss: 0.3554050326347351, mean loss: 0.37740040514140255
Epoch: 8, step: 452, loss: 0.32630306482315063, mean loss: 0.3773961488031836
Epoch: 8, step: 453, loss: 0.34731608629226685, mean loss: 0.37739364338401726
Epoch: 8, step: 454, loss: 0.337057501077652, mean loss: 0.37739028399846664
Epoch: 8, step: 455, loss: 0.35608890652656555, mean loss: 0.37738851006629875
Epoch: 8, step: 456, loss: 0.33619725704193115, mean loss: 0.37738508003440396
Epoch: 8, step: 457, loss: 0.33883994817733765, mean loss: 0.37738187061459905
Epoch: 8, step: 458, loss: 0.3245031535625458, mean loss: 0.37737746809049183
Epoch: 8, step: 459, loss: 0.34225979447364807, mean loss: 0.3773745445412397
Epoch: 8, step: 460, loss: 0.32066109776496887, mean loss: 0.37736982353509835
Epoch: 8, step: 461, loss: 0.3638642430305481, mean loss: 0.37736869938156875
Epoch: 8, step: 462, loss: 0.32183241844177246, mean loss: 0.3773640771359641
Epoch: 8, step: 463, loss: 0.3316614627838135, mean loss: 0.3773602736560746
Epoch: 8, step: 464, loss: 0.33970460295677185, mean loss: 0.3773571401226886
Epoch: 8, step: 465, loss: 0.3045381009578705, mean loss: 0.37735108095817166
Epoch: 8, step: 466, loss: 0.32798609137535095, mean loss: 0.37734697371217923
Epoch: 8, step: 467, loss: 0.3877744674682617, mean loss: 0.377347841224139
Epoch: 8, step: 468, loss: 0.35397008061408997, mean loss: 0.3773458964807225
Epoch: 8, step: 469, loss: 0.3773333728313446, mean loss: 0.3773458954389949
Epoch: 8, step: 470, loss: 0.3557870388031006, mean loss: 0.37734410230444976
Epoch: 8, step: 471, loss: 0.3924623429775238, mean loss: 0.37734535964316174
Epoch: 8, step: 472, loss: 0.3714028596878052, mean loss: 0.3773448654643713
Epoch: 8, step: 473, loss: 0.3391130566596985, mean loss: 0.37734168636834564
Epoch: 8, step: 474, loss: 0.3628447949886322, mean loss: 0.377340481006129
Epoch: 8, step: 475, loss: 0.31363698840141296, mean loss: 0.3773351847397003
Epoch: 8, step: 476, loss: 0.328007310628891, mean loss: 0.37733108399366067
Epoch: 8, step: 477, loss: 0.33067604899406433, mean loss: 0.3773272057696374
Epoch: 8, step: 478, loss: 0.3722246289253235, mean loss: 0.3773267816505414
Epoch: 8, step: 479, loss: 0.3201698362827301, mean loss: 0.37732203123952346
Epoch: 8, step: 480, loss: 0.3828652501106262, mean loss: 0.3773224919075922
Epoch: 8, step: 481, loss: 0.3620646297931671, mean loss: 0.37732122401145507
Epoch: 8, step: 482, loss: 0.3590546250343323, mean loss: 0.37731970622176025
Epoch: 8, step: 483, loss: 0.3558061718940735, mean loss: 0.37731791878952964
Epoch: 8, step: 484, loss: 0.3098376393318176, mean loss: 0.37731231271829446
Epoch: 8, step: 485, loss: 0.3496941328048706, mean loss: 0.37731001846842627
Epoch: 8, step: 486, loss: 0.3211158812046051, mean loss: 0.37730535079359745
Epoch: 8, step: 487, loss: 0.34505265951156616, mean loss: 0.3773026719986405
Epoch: 8, step: 488, loss: 0.3202565908432007, mean loss: 0.37729793434552567
Epoch: 8, step: 489, loss: 0.391204833984375, mean loss: 0.37729908921179695
Epoch: 8, step: 490, loss: 0.3313961923122406, mean loss: 0.3772952776285619
Epoch: 8, step: 491, loss: 0.31897032260894775, mean loss: 0.37729043497205084
Epoch: 8, step: 492, loss: 0.3925012946128845, mean loss: 0.37729169780805255
Epoch: 8, step: 493, loss: 0.3753986656665802, mean loss: 0.3772915406577835
Epoch: 8, step: 494, loss: 0.3165452182292938, mean loss: 0.37728649821381993
Epoch: 8, step: 495, loss: 0.32771456241607666, mean loss: 0.37728238367731615
Epoch: 8, step: 496, loss: 0.34018799662590027, mean loss: 0.37727930504945895
Epoch: 8, step: 497, loss: 0.35198238492012024, mean loss: 0.37727720571998763
Epoch: 8, step: 498, loss: 0.3234272003173828, mean loss: 0.37727273721070187
Epoch: 8, step: 499, loss: 0.3754040598869324, mean loss: 0.3772725821594802
Epoch: 8, step: 500, loss: 0.42267024517059326, mean loss: 0.37727634866267534
Epoch: 8, step: 501, loss: 0.3555792570114136, mean loss: 0.37727454867166393
Epoch: 8, step: 502, loss: 0.31004849076271057, mean loss: 0.37726897205964327
Epoch: 8, step: 503, loss: 0.33276981115341187, mean loss: 0.37726528102108103
Epoch: 8, step: 504, loss: 0.3085620105266571, mean loss: 0.37725958281501865
Epoch: 8, step: 505, loss: 0.38616740703582764, mean loss: 0.37726032156308803
Epoch: 8, step: 506, loss: 0.3460562527179718, mean loss: 0.377257733946466
Epoch: 8, step: 507, loss: 0.3669836223125458, mean loss: 0.37725688203007846
Epoch: 8, step: 508, loss: 0.33389654755592346, mean loss: 0.3772532869438937
Epoch: 8, step: 509, loss: 0.35110247135162354, mean loss: 0.3772511189107655
Epoch: 8, step: 510, loss: 0.36886435747146606, mean loss: 0.3772504236640243
Epoch: 8, step: 511, loss: 0.3543393611907959, mean loss: 0.377248524537493
Epoch: 8, step: 512, loss: 0.33025887608528137, mean loss: 0.37724462982978874
Epoch: 8, step: 513, loss: 0.32517457008361816, mean loss: 0.3772403143930453
Epoch: 8, step: 514, loss: 0.32829704880714417, mean loss: 0.37723625843335473
Epoch: 8, step: 515, loss: 0.3379272222518921, mean loss: 0.3772330011383447
Epoch: 8, step: 516, loss: 0.32557564973831177, mean loss: 0.3772287209700292
Epoch: 8, step: 517, loss: 0.32223212718963623, mean loss: 0.37722416449995627
Epoch: 8, step: 518, loss: 0.35473865270614624, mean loss: 0.37722230172870336
Epoch: 8, step: 519, loss: 0.3798352777957916, mean loss: 0.3772225181780131
Epoch: 8, step: 520, loss: 0.3126092553138733, mean loss: 0.377217166296719
Epoch: 8, step: 521, loss: 0.36685365438461304, mean loss: 0.3772163079637794
Epoch: 8, step: 522, loss: 0.31918296217918396, mean loss: 0.37721150188959435
Epoch: 8, step: 523, loss: 0.37560972571372986, mean loss: 0.37721136924830784
Epoch: 8, step: 524, loss: 0.3681665062904358, mean loss: 0.37721062031538094
Epoch: 8, step: 525, loss: 0.3528735339641571, mean loss: 0.37720860532230666
Epoch: 8, step: 526, loss: 0.353892058134079, mean loss: 0.3772066749847631
Epoch: 8, step: 527, loss: 0.38631266355514526, mean loss: 0.377207428791764
Epoch: 8, step: 528, loss: 0.34126412868499756, mean loss: 0.3772044535993042
Epoch: 8, step: 529, loss: 0.42468011379241943, mean loss: 0.37720838305305304
Epoch: 8, step: 530, loss: 0.3234410285949707, mean loss: 0.3772039332182059
Epoch: 8, step: 531, loss: 0.38779449462890625, mean loss: 0.37720480963010683
Epoch: 8, step: 532, loss: 0.31499409675598145, mean loss: 0.3771996618673535
Epoch: 8, step: 533, loss: 0.32686683535575867, mean loss: 0.37719549731113045
Epoch: 8, step: 534, loss: 0.3464365601539612, mean loss: 0.3771929525161311
Epoch: 8, step: 535, loss: 0.3507070541381836, mean loss: 0.3771907614259278
Epoch: 8, step: 536, loss: 0.3168845772743225, mean loss: 0.3771857729087509
Epoch: 8, step: 537, loss: 0.3244771361351013, mean loss: 0.3771814132200186
Epoch: 8, step: 538, loss: 0.39694944024086, mean loss: 0.37718304815732906
Epoch: 8, step: 539, loss: 0.32200267910957336, mean loss: 0.3771784847791412
Epoch: 8, step: 540, loss: 0.3740405738353729, mean loss: 0.3771782252975449
Epoch: 8, step: 541, loss: 0.31350111961364746, mean loss: 0.3771729601159934
Epoch: 8, step: 542, loss: 0.3353813588619232, mean loss: 0.37716950483684875
Epoch: 8, step: 543, loss: 0.3531230688095093, mean loss: 0.3771675168709073
Epoch: 8, step: 544, loss: 0.3479914665222168, mean loss: 0.37716510502909956
Epoch: 8, step: 545, loss: 0.37377095222473145, mean loss: 0.3771648244742306
Epoch: 8, step: 546, loss: 0.31534767150878906, mean loss: 0.37715971519635927
Epoch: 8, step: 547, loss: 0.3527998924255371, mean loss: 0.3771577019878658
Epoch: 8, step: 548, loss: 0.3514268696308136, mean loss: 0.3771555756485255
Epoch: 8, step: 549, loss: 0.4053999185562134, mean loss: 0.37715790950597944
Epoch: 8, step: 550, loss: 0.3904268741607666, mean loss: 0.37715900584280954
Epoch: 8, step: 551, loss: 0.3235441744327545, mean loss: 0.37715457632930904
Epoch: 8, step: 552, loss: 0.34275180101394653, mean loss: 0.3771517342991302
Epoch: 8, step: 553, loss: 0.35228899121284485, mean loss: 0.3771496805453646
Epoch: 8, step: 554, loss: 0.39738044142723083, mean loss: 0.37715135154238133
Epoch: 8, step: 555, loss: 0.3709244430065155, mean loss: 0.3771508372618613
Epoch: 8, step: 556, loss: 0.34850627183914185, mean loss: 0.3771484717019123
Epoch: 8, step: 557, loss: 0.39596933126449585, mean loss: 0.37715002586042284
Epoch: 8, step: 558, loss: 0.33127743005752563, mean loss: 0.3771462381801485
Epoch: 8, step: 559, loss: 0.3183400332927704, mean loss: 0.37714138297829186
Epoch: 8, step: 560, loss: 0.3320511281490326, mean loss: 0.3771376605102964
Epoch: 8, step: 561, loss: 0.3341965079307556, mean loss: 0.37713411575607986
Epoch: 8, step: 562, loss: 0.3326837718486786, mean loss: 0.3771304467223277
Epoch: 8, step: 563, loss: 0.3316025733947754, mean loss: 0.3771266890569821
Epoch: 8, step: 564, loss: 0.34105047583580017, mean loss: 0.3771237117347719
Epoch: 8, step: 565, loss: 0.36475223302841187, mean loss: 0.3771226908172355
Epoch: 8, step: 566, loss: 0.3181362748146057, mean loss: 0.3771178235496389
Epoch: 8, step: 567, loss: 0.3560970723628998, mean loss: 0.37711608916422745
Epoch: 8, step: 568, loss: 0.320108026266098, mean loss: 0.37711138591673155
Epoch: 8, step: 569, loss: 0.3445419371128082, mean loss: 0.3771086991118475
Epoch: 8, step: 570, loss: 0.3145601749420166, mean loss: 0.3771035396196286
Epoch: 8, step: 571, loss: 0.3649407923221588, mean loss: 0.3771025364237116
Epoch: 8, step: 572, loss: 0.329664409160614, mean loss: 0.37709862400084454
Epoch: 8, step: 573, loss: 0.3800903558731079, mean loss: 0.3770988707212694
Epoch: 8, step: 574, loss: 0.3242853283882141, mean loss: 0.37709451568355745
Epoch: 8, step: 575, loss: 0.3068446218967438, mean loss: 0.37708872331104865
Epoch: 8, step: 576, loss: 0.32321444153785706, mean loss: 0.3770842815366424
Epoch: 8, step: 577, loss: 0.3352605700492859, mean loss: 0.3770808335802131
Epoch: 8, step: 578, loss: 0.3575977385044098, mean loss: 0.37707922752176154
Epoch: 8, step: 579, loss: 0.34189918637275696, mean loss: 0.37707632774916433
Epoch: 8, step: 580, loss: 0.33869925141334534, mean loss: 0.377073164716416
Epoch: 8, step: 581, loss: 0.3331837058067322, mean loss: 0.37706954765205886
Epoch: 8, step: 582, loss: 0.32666724920272827, mean loss: 0.3770653941870033
Epoch: 8, step: 583, loss: 0.33777913451194763, mean loss: 0.37706215701992396
Epoch: 8, step: 584, loss: 0.3741077184677124, mean loss: 0.3770619135958033
Epoch: 8, step: 585, loss: 0.295922189950943, mean loss: 0.3770552288270074
Epoch: 8, step: 586, loss: 0.35274848341941833, mean loss: 0.37705322645898637
Epoch: 8, step: 587, loss: 0.36400070786476135, mean loss: 0.3770521512927101
Epoch: 8, step: 588, loss: 0.3664010465145111, mean loss: 0.37705127400873195
Epoch: 8, step: 589, loss: 0.3585045337677002, mean loss: 0.3770497465223013
Epoch: 8, step: 590, loss: 0.3587861955165863, mean loss: 0.37704824248285423
Epoch: 8, step: 591, loss: 0.323522686958313, mean loss: 0.377043834910759
Epoch: 8, step: 592, loss: 0.344684362411499, mean loss: 0.37704117048321684
Epoch: 8, step: 593, loss: 0.3557935655117035, mean loss: 0.3770394211332274
Epoch: 8, step: 594, loss: 0.3230384886264801, mean loss: 0.3770349755143498
Epoch: 8, step: 595, loss: 0.36257681250572205, mean loss: 0.3770337853461732
Epoch: 8, step: 596, loss: 0.3299776315689087, mean loss: 0.3770299120929197
Epoch: 8, step: 597, loss: 0.34937307238578796, mean loss: 0.37702763580981624
Epoch: 8, step: 598, loss: 0.3515174686908722, mean loss: 0.3770255363803768
Epoch: 8, step: 599, loss: 0.36319684982299805, mean loss: 0.37702439840419527
Epoch: 8, step: 600, loss: 0.31564509868621826, mean loss: 0.3770193478570285
Epoch: 8, step: 601, loss: 0.32663750648498535, mean loss: 0.3770152025681218
Epoch: 8, step: 602, loss: 0.3597276508808136, mean loss: 0.3770137803096531
Epoch: 8, step: 603, loss: 0.36029407382011414, mean loss: 0.37701240488134696
Epoch: 8, step: 604, loss: 0.35093897581100464, mean loss: 0.377010260155751
Epoch: 8, step: 605, loss: 0.3287256956100464, mean loss: 0.37700628873244574
Epoch: 8, step: 606, loss: 0.36693471670150757, mean loss: 0.37700546041004823
Epoch: 8, step: 607, loss: 0.38156023621559143, mean loss: 0.377005834980427
Epoch: 8, step: 608, loss: 0.3573765456676483, mean loss: 0.3770042208624011
Epoch: 8, step: 609, loss: 0.35755881667137146, mean loss: 0.3770026219967383
Epoch: 8, step: 610, loss: 0.3475257158279419, mean loss: 0.37700019850696037
Epoch: 8, step: 611, loss: 0.34380680322647095, mean loss: 0.3769974696845927
Epoch: 8, step: 612, loss: 0.33191072940826416, mean loss: 0.3769937634174101
Epoch: 8, step: 613, loss: 0.31838592886924744, mean loss: 0.3769889460711543
Epoch: 8, step: 614, loss: 0.398494690656662, mean loss: 0.3769907136181737
Epoch: 8, step: 615, loss: 0.4036363661289215, mean loss: 0.3769929034318252
Epoch: 8, step: 616, loss: 0.40871837735176086, mean loss: 0.37699551050503743
Epoch: 8, step: 617, loss: 0.37039393186569214, mean loss: 0.3769949680581484
Epoch: 8, step: 618, loss: 0.3454238176345825, mean loss: 0.3769923740929505
Epoch: 8, step: 619, loss: 0.32638126611709595, mean loss: 0.37698821609853905
Epoch: 8, step: 620, loss: 0.3178490400314331, mean loss: 0.3769833578732809
Epoch: 8, step: 621, loss: 0.3752882778644562, mean loss: 0.37698321863556045
Epoch: 8, step: 622, loss: 0.36552172899246216, mean loss: 0.3769822772401072
Epoch: 8, step: 623, loss: 0.3475128710269928, mean loss: 0.3769798569537888
Epoch: 8, step: 624, loss: 0.3172692060470581, mean loss: 0.37697495339372417
Epoch: 8, step: 625, loss: 0.31205645203590393, mean loss: 0.37696962259216743
Epoch: 8, step: 626, loss: 0.32304269075393677, mean loss: 0.3769651947301231
Epoch: 8, step: 627, loss: 0.33792033791542053, mean loss: 0.37696198907685424
Epoch: 8, step: 628, loss: 0.3472227454185486, mean loss: 0.37695954763168077
Epoch: 8, step: 629, loss: 0.33835989236831665, mean loss: 0.3769563790505559
Epoch: 8, step: 630, loss: 0.34468626976013184, mean loss: 0.37695373026870493
Epoch: 8, step: 631, loss: 0.33507096767425537, mean loss: 0.3769502927471525
Epoch: 8, step: 632, loss: 0.35003820061683655, mean loss: 0.37694808412243935
Epoch: 8, step: 633, loss: 0.34730908274650574, mean loss: 0.3769456519050279
Epoch: 8, step: 634, loss: 0.3737768530845642, mean loss: 0.3769453918903548
Epoch: 8, step: 635, loss: 0.359467476606369, mean loss: 0.37694395786383
Epoch: 8, step: 636, loss: 0.3160029947757721, mean loss: 0.37693895819502304
Epoch: 8, step: 637, loss: 0.35418903827667236, mean loss: 0.37693709191775326
Epoch: 8, step: 638, loss: 0.3701062500476837, mean loss: 0.37693653159933227
Epoch: 8, step: 639, loss: 0.34173858165740967, mean loss: 0.3769336446283725
Epoch: 8, step: 640, loss: 0.32041671872138977, mean loss: 0.37692900943392427
Epoch: 8, step: 641, loss: 0.33382245898246765, mean loss: 0.3769254743715615
Epoch: 8, step: 642, loss: 0.3161229193210602, mean loss: 0.37692048851218873
Epoch: 8, step: 643, loss: 0.3218288719654083, mean loss: 0.37691597132486937
Epoch: 8, step: 644, loss: 0.34238171577453613, mean loss: 0.3769131399519457
Epoch: 8, step: 645, loss: 0.3327001929283142, mean loss: 0.37690951534569683
Epoch: 8, step: 646, loss: 0.33423423767089844, mean loss: 0.3769060170853743
Epoch: 8, step: 647, loss: 0.3652012050151825, mean loss: 0.37690505767454885
Epoch: 8, step: 648, loss: 0.328199565410614, mean loss: 0.3769010657482917
Epoch: 8, step: 649, loss: 0.3213249146938324, mean loss: 0.37689651107274225
Epoch: 8, step: 650, loss: 0.31710827350616455, mean loss: 0.37689161160231965
Epoch: 8, step: 651, loss: 0.3185480833053589, mean loss: 0.37688683091334085
Epoch: 8, step: 652, loss: 0.3526916205883026, mean loss: 0.3768848485118394
Epoch: 8, step: 653, loss: 0.32341232895851135, mean loss: 0.3768804676729443
Epoch: 8, step: 654, loss: 0.3403184711933136, mean loss: 0.3768774725065251
Epoch: 8, step: 655, loss: 0.3705868422985077, mean loss: 0.37687695721899167
Epoch: 8, step: 656, loss: 0.2746741771697998, mean loss: 0.3768685861173413
Epoch: 8, step: 657, loss: 0.3213537931442261, mean loss: 0.37686403945125013
Epoch: 8, step: 658, loss: 0.3385341763496399, mean loss: 0.3768609004894041
Epoch: 8, step: 659, loss: 0.33545181155204773, mean loss: 0.37685750963705095
Epoch: 8, step: 660, loss: 0.3604908287525177, mean loss: 0.3768561695338098
Epoch: 8, step: 661, loss: 0.34535878896713257, mean loss: 0.37685359074057523
Epoch: 8, step: 662, loss: 0.3731856644153595, mean loss: 0.37685329046007376
Epoch: 8, step: 663, loss: 0.3646527826786041, mean loss: 0.37685229172826457
Epoch: 8, step: 664, loss: 0.3385002017021179, mean loss: 0.37684915248867823
Epoch: 8, step: 665, loss: 0.3125647008419037, mean loss: 0.3768438910341319
Epoch: 8, step: 666, loss: 0.3639187514781952, mean loss: 0.3768428332438417
Epoch: 8, step: 667, loss: 0.37730348110198975, mean loss: 0.3768428709400658
Epoch: 8, step: 668, loss: 0.35428687930107117, mean loss: 0.3768410252652733
Epoch: 8, step: 669, loss: 0.3189573884010315, mean loss: 0.3768362892452386
Epoch: 8, step: 670, loss: 0.32109442353248596, mean loss: 0.3768317288373426
Epoch: 8, step: 671, loss: 0.3555387556552887, mean loss: 0.3768299869383585
Epoch: 8, step: 672, loss: 0.36469322443008423, mean loss: 0.37682899415614923
Epoch: 8, step: 673, loss: 0.39062586426734924, mean loss: 0.37683012264217175
Epoch: 8, step: 674, loss: 0.32373589277267456, mean loss: 0.376825780266293
Epoch: 8, step: 675, loss: 0.30758607387542725, mean loss: 0.3768201178761727
Epoch: 8, step: 676, loss: 0.36244142055511475, mean loss: 0.3768189420893282
Epoch: 8, step: 677, loss: 0.35791903734207153, mean loss: 0.37681739671690406
Epoch: 8, step: 678, loss: 0.3228035569190979, mean loss: 0.3768129805743321
Epoch: 8, step: 679, loss: 0.318133145570755, mean loss: 0.3768081833347144
Epoch: 8, step: 680, loss: 0.3574765622615814, mean loss: 0.37680660305015024
Epoch: 8, step: 681, loss: 0.34001901745796204, mean loss: 0.37680359605443403
Epoch: 8, step: 682, loss: 0.33926525712013245, mean loss: 0.3768005279433646
Epoch: 8, step: 683, loss: 0.3416881561279297, mean loss: 0.3767976583477602
Epoch: 8, step: 684, loss: 0.34474554657936096, mean loss: 0.37679503906919776
Epoch: 8, step: 685, loss: 0.31851711869239807, mean loss: 0.376790277023081
Epoch: 8, step: 686, loss: 0.3296211361885071, mean loss: 0.3767864230202348
Epoch: 8, step: 687, loss: 0.3287067115306854, mean loss: 0.37678249493923077
Epoch: 8, step: 688, loss: 0.3139776289463043, mean loss: 0.3767773642419027
Epoch: 8, step: 689, loss: 0.3053690195083618, mean loss: 0.3767715311799248
Epoch: 8, step: 690, loss: 0.31289389729499817, mean loss: 0.37676631369778113
Epoch: 8, step: 691, loss: 0.35336989164352417, mean loss: 0.3767644028498512
Epoch: 8, step: 692, loss: 0.33929404616355896, mean loss: 0.37676134279622225
Epoch: 8, step: 693, loss: 0.329628050327301, mean loss: 0.3767574939237358
Epoch: 8, step: 694, loss: 0.3343912363052368, mean loss: 0.37675403460654644
Epoch: 8, step: 695, loss: 0.3768317699432373, mean loss: 0.37675404095332443
Epoch: 8, step: 696, loss: 0.3646540343761444, mean loss: 0.37675305311704577
Epoch: 8, step: 697, loss: 0.3419662117958069, mean loss: 0.3767502133748971
Epoch: 8, step: 698, loss: 0.3442768156528473, mean loss: 0.37674756270166865
Epoch: 8, step: 699, loss: 0.3416126072406769, mean loss: 0.3767446950102337
Epoch: 8, step: 700, loss: 0.3241671323776245, mean loss: 0.37674040401516046
Epoch: 8, step: 701, loss: 0.33422842621803284, mean loss: 0.3767369347824367
Epoch: 8, step: 702, loss: 0.3386443853378296, mean loss: 0.37673382645526865
Epoch: 8, step: 703, loss: 0.3259052336215973, mean loss: 0.3767296792136863
Epoch: 8, step: 704, loss: 0.3677448630332947, mean loss: 0.37672894617818165
Epoch: 8, step: 705, loss: 0.3181368410587311, mean loss: 0.3767241662707645
Epoch: 8, step: 706, loss: 0.30754154920578003, mean loss: 0.37671852285636975
Epoch: 8, step: 707, loss: 0.3288315534591675, mean loss: 0.3767146169045429
Epoch: 8, step: 708, loss: 0.3612167239189148, mean loss: 0.3767133529054412
Epoch: 8, step: 709, loss: 0.3265730142593384, mean loss: 0.3767092638222047
Epoch: 8, step: 710, loss: 0.38420984148979187, mean loss: 0.3767098754651687
Epoch: 8, step: 711, loss: 0.38573187589645386, mean loss: 0.376710611114258
Epoch: 8, step: 712, loss: 0.34819915890693665, mean loss: 0.37670828649524396
Epoch: 8, step: 713, loss: 0.36995524168014526, mean loss: 0.376707735945365
Epoch: 8, step: 714, loss: 0.4029406011104584, mean loss: 0.3767098744360445
Epoch: 8, step: 715, loss: 0.34652143716812134, mean loss: 0.3767074136896092
Epoch: 8, step: 716, loss: 0.38815298676490784, mean loss: 0.3767083465751806
Epoch: 8, step: 717, loss: 0.36328187584877014, mean loss: 0.37670725232328767
Epoch: 8, step: 718, loss: 0.3262816369533539, mean loss: 0.37670314299109225
Epoch: 8, step: 719, loss: 0.4009038209915161, mean loss: 0.3767051150150493
Epoch: 8, step: 720, loss: 0.34113776683807373, mean loss: 0.3767022169992278
Epoch: 8, step: 721, loss: 0.311044842004776, mean loss: 0.37669686769378585
Epoch: 8, step: 722, loss: 0.37076839804649353, mean loss: 0.37669638472273514
Epoch: 8, step: 723, loss: 0.3327599763870239, mean loss: 0.3766928056735061
Epoch: 8, step: 724, loss: 0.3415308892726898, mean loss: 0.376689941625579
Epoch: 8, step: 725, loss: 0.307146281003952, mean loss: 0.3766842775385435
Epoch: 8, step: 726, loss: 0.3732973337173462, mean loss: 0.37668400170632416
Epoch: 8, step: 727, loss: 0.3378185033798218, mean loss: 0.3766808367634637
Epoch: 8, step: 728, loss: 0.33936235308647156, mean loss: 0.3766777980464474
Epoch: 8, step: 729, loss: 0.3278777003288269, mean loss: 0.3766738247442395
Epoch: 8, step: 730, loss: 0.3645312786102295, mean loss: 0.3766728361790572
Epoch: 8, step: 731, loss: 0.3300197720527649, mean loss: 0.3766690383066927
Epoch: 8, step: 732, loss: 0.34461379051208496, mean loss: 0.3766664290069129
Epoch: 8, step: 733, loss: 0.32763054966926575, mean loss: 0.37666243780722725
Epoch: 8, step: 734, loss: 0.32996824383735657, mean loss: 0.37665863751472545
Epoch: 8, step: 735, loss: 0.3830421566963196, mean loss: 0.3766591570068463
Epoch: 8, step: 736, loss: 0.33033427596092224, mean loss: 0.37665538738514837
Epoch: 8, step: 737, loss: 0.3154623210430145, mean loss: 0.37665040829106033
Epoch: 8, step: 738, loss: 0.3615655303001404, mean loss: 0.3766491809801832
Epoch: 8, step: 739, loss: 0.36468014121055603, mean loss: 0.3766482072542013
Epoch: 8, step: 740, loss: 0.34207844734191895, mean loss: 0.37664539510420436
Epoch: 8, step: 741, loss: 0.3219028115272522, mean loss: 0.3766409423155614
Epoch: 8, step: 742, loss: 0.3614467978477478, mean loss: 0.37663970651690604
Epoch: 8, step: 743, loss: 0.32679471373558044, mean loss: 0.37663565276017363
Epoch: 8, step: 744, loss: 0.3593263030052185, mean loss: 0.376634245152647
Epoch: 8, step: 745, loss: 0.32560810446739197, mean loss: 0.37663009601126746
Epoch: 8, step: 746, loss: 0.36729180812835693, mean loss: 0.376629336739141
Epoch: 8, step: 747, loss: 0.37154608964920044, mean loss: 0.37662892346701987
Epoch: 8, step: 748, loss: 0.32519546151161194, mean loss: 0.37662474222468545
Epoch: 8, step: 749, loss: 0.3115069568157196, mean loss: 0.3766194489564844
Epoch: 8, step: 750, loss: 0.3442234694957733, mean loss: 0.37661681577925443
Epoch: 8, step: 751, loss: 0.34912535548210144, mean loss: 0.37661458142779985
Epoch: 8, step: 752, loss: 0.32011404633522034, mean loss: 0.3766099897548951
Epoch: 8, step: 753, loss: 0.3370489180088043, mean loss: 0.37660677497578365
Epoch: 8, step: 754, loss: 0.3988805413246155, mean loss: 0.3766085848211033
Epoch: 8, step: 755, loss: 0.3546014428138733, mean loss: 0.3766067967855161
Epoch: 8, step: 756, loss: 0.3472696542739868, mean loss: 0.3766044133959222
Epoch: 8, step: 757, loss: 0.3189328908920288, mean loss: 0.37659972846314366
Epoch: 8, step: 758, loss: 0.3562779724597931, mean loss: 0.37659807776409376
Epoch: 8, step: 759, loss: 0.3524496555328369, mean loss: 0.37659611639126794
Epoch: 8, step: 760, loss: 0.3502044081687927, mean loss: 0.37659397298931696
Epoch: 8, step: 761, loss: 0.34212642908096313, mean loss: 0.3765911739358893
Epoch: 8, step: 762, loss: 0.32673054933547974, mean loss: 0.37658712516409876
Epoch: 8, step: 763, loss: 0.35535722970962524, mean loss: 0.3765854013986348
Epoch: 8, step: 764, loss: 0.3375016748905182, mean loss: 0.376582228245553
Epoch: 8, step: 765, loss: 0.34446486830711365, mean loss: 0.37657962089371516
Epoch: 8, step: 766, loss: 0.32897451519966125, mean loss: 0.37657575652926234
Epoch: 8, step: 767, loss: 0.3276398777961731, mean loss: 0.37657178446118333
Epoch: 8, step: 768, loss: 0.38954025506973267, mean loss: 0.3765728370113504
Epoch: 8, step: 769, loss: 0.31390252709388733, mean loss: 0.37656775096120293
Epoch: 8, step: 770, loss: 0.34568339586257935, mean loss: 0.3765652447244831
Epoch: 8, step: 771, loss: 0.3587706685066223, mean loss: 0.3765638008283278
Epoch: 8, step: 772, loss: 0.3233875334262848, mean loss: 0.37655948632387326
Epoch: 8, step: 773, loss: 0.306479811668396, mean loss: 0.3765538008075131
Epoch: 8, step: 774, loss: 0.32880517840385437, mean loss: 0.3765499273084944
Epoch: 8, step: 775, loss: 0.32794293761253357, mean loss: 0.37654598449622184
Epoch: 8, step: 776, loss: 0.28966689109802246, mean loss: 0.37653893776952885
Epoch: 8, step: 777, loss: 0.3937284052371979, mean loss: 0.3765403318869228
Epoch: 8, step: 778, loss: 0.4024983048439026, mean loss: 0.3765424369856948
Epoch: 8, step: 779, loss: 0.36074844002723694, mean loss: 0.3765411562528892
Epoch: 8, step: 780, loss: 0.3302673399448395, mean loss: 0.3765374042204309
Epoch: 8, step: 781, loss: 0.3317364454269409, mean loss: 0.37653377190659976
Epoch: 8, step: 782, loss: 0.30174729228019714, mean loss: 0.37652770895729887
Epoch: 8, step: 783, loss: 0.3281290531158447, mean loss: 0.37652378559025595
Epoch: 8, step: 784, loss: 0.3253503143787384, mean loss: 0.3765196376230669
Epoch: 8, step: 785, loss: 0.34621506929397583, mean loss: 0.37651718142527724
Epoch: 8, step: 786, loss: 0.3393673002719879, mean loss: 0.3765141706560777
Epoch: 8, step: 787, loss: 0.3308682441711426, mean loss: 0.3765104716344825
Epoch: 8, step: 788, loss: 0.3384549021720886, mean loss: 0.37650738796464517
Epoch: 8, step: 789, loss: 0.32192403078079224, mean loss: 0.37650296539478745
Epoch: 8, step: 790, loss: 0.32060766220092773, mean loss: 0.37649843689254375
Epoch: 8, step: 791, loss: 0.3491990864276886, mean loss: 0.37649622534438554
Epoch: 8, step: 792, loss: 0.3655441105365753, mean loss: 0.37649533817429176
Epoch: 8, step: 793, loss: 0.41280558705329895, mean loss: 0.37649827922798357
Epoch: 8, step: 794, loss: 0.32605913281440735, mean loss: 0.3764941940942334
Epoch: 8, step: 795, loss: 0.33220475912094116, mean loss: 0.37649060732431333
Epoch: 8, step: 796, loss: 0.33962106704711914, mean loss: 0.37648762169468525
Epoch: 8, step: 797, loss: 0.3196558654308319, mean loss: 0.37648301993304445
Epoch: 8, step: 798, loss: 0.3526289165019989, mean loss: 0.3764810885830784
Epoch: 8, step: 799, loss: 0.3803957402706146, mean loss: 0.37648140550759973
Epoch: 8, step: 800, loss: 0.32473108172416687, mean loss: 0.3764772162156234
Epoch: 8, step: 801, loss: 0.33476361632347107, mean loss: 0.3764738396898105
Epoch: 8, step: 802, loss: 0.33561018109321594, mean loss: 0.3764705322305959
Epoch: 8, step: 803, loss: 0.35561904311180115, mean loss: 0.3764688446707773
Epoch: 8, step: 804, loss: 0.3961320221424103, mean loss: 0.3764704359289687
Epoch: 8, step: 805, loss: 0.40931031107902527, mean loss: 0.3764730933067928
Epoch: 8, step: 806, loss: 0.3773326873779297, mean loss: 0.3764731628588659
Epoch: 8, step: 807, loss: 0.34591829776763916, mean loss: 0.3764706907824022
Epoch: 8, step: 808, loss: 0.34547659754753113, mean loss: 0.3764681833725458
Epoch: 8, step: 809, loss: 0.33697840571403503, mean loss: 0.3764649889236169
Epoch: 8, step: 810, loss: 0.3351984918117523, mean loss: 0.376461651020429
Epoch: 8, step: 811, loss: 0.35886266827583313, mean loss: 0.3764602276151601
Epoch: 8, step: 812, loss: 0.34855520725250244, mean loss: 0.3764579708403633
Epoch: 8, step: 813, loss: 0.327938050031662, mean loss: 0.3764540471851143
Epoch: 8, step: 814, loss: 0.3182661533355713, mean loss: 0.37644934209140934
Epoch: 8, step: 815, loss: 0.3115082085132599, mean loss: 0.37644409135292467
Epoch: 8, step: 816, loss: 0.3195509612560272, mean loss: 0.37643949169813473
Epoch: 8, step: 817, loss: 0.33541741967201233, mean loss: 0.3764361754433226
Epoch: 8, step: 818, loss: 0.3923748731613159, mean loss: 0.3764374638353457
Epoch: 8, step: 819, loss: 0.33078455924987793, mean loss: 0.376433773817193
Epoch: 8, step: 820, loss: 0.35371819138526917, mean loss: 0.3764319379178612
Epoch: 8, step: 821, loss: 0.38050931692123413, mean loss: 0.3764322674296604
Epoch: 8, step: 822, loss: 0.35723888874053955, mean loss: 0.37643071644956433
Epoch: 8, step: 823, loss: 0.3512728214263916, mean loss: 0.3764286836526168
Epoch: 8, step: 824, loss: 0.32402706146240234, mean loss: 0.3764244498623453
Epoch: 8, step: 825, loss: 0.3441700041294098, mean loss: 0.3764218440741943
Epoch: 8, step: 826, loss: 0.31778016686439514, mean loss: 0.37641710688401664
Epoch: 8, step: 827, loss: 0.34319475293159485, mean loss: 0.37641442333361663
Epoch: 8, step: 828, loss: 0.32259222865104675, mean loss: 0.37641007617307365
Epoch: 8, step: 829, loss: 0.3763851821422577, mean loss: 0.37641007416257205
Epoch: 8, step: 830, loss: 0.3116379678249359, mean loss: 0.3764048434344498
Epoch: 8, step: 831, loss: 0.3462325632572174, mean loss: 0.37640240704231664
Epoch: 8, step: 832, loss: 0.3536619246006012, mean loss: 0.3764005709113161
Epoch: 8, step: 833, loss: 0.4382154941558838, mean loss: 0.3764055616204429
Epoch: 8, step: 834, loss: 0.32648295164108276, mean loss: 0.3764015313782552
Epoch: 8, step: 835, loss: 0.376895934343338, mean loss: 0.3764015712880845
Epoch: 8, step: 836, loss: 0.33848634362220764, mean loss: 0.3763985108935679
Epoch: 8, step: 837, loss: 0.3279530107975006, mean loss: 0.376394600845134
Epoch: 8, step: 838, loss: 0.31426918506622314, mean loss: 0.37638958709194387
Epoch: 8, step: 839, loss: 0.34613391757011414, mean loss: 0.37638714554340275
Epoch: 8, step: 840, loss: 0.3456681966781616, mean loss: 0.3763846668095316
Epoch: 8, step: 841, loss: 0.32755717635154724, mean loss: 0.3763807272024267
Epoch: 8, step: 842, loss: 0.330988347530365, mean loss: 0.3763770650499723
Epoch: 8, step: 843, loss: 0.360658198595047, mean loss: 0.3763757969904003
Epoch: 8, step: 844, loss: 0.36503565311431885, mean loss: 0.3763748822413581
Epoch: 8, step: 845, loss: 0.35946032404899597, mean loss: 0.37637351794403656
Epoch: 8, step: 846, loss: 0.34201666712760925, mean loss: 0.37637074700679835
Epoch: 8, step: 847, loss: 0.33992770314216614, mean loss: 0.376367808051648
Epoch: 8, step: 848, loss: 0.34674015641212463, mean loss: 0.37636541891757497
Epoch: 8, step: 849, loss: 0.32460495829582214, mean loss: 0.3763612453600341
Epoch: 8, step: 850, loss: 0.36034053564071655, mean loss: 0.3763599536798181
Epoch: 8, step: 851, loss: 0.33703991770744324, mean loss: 0.3763567837317391
Epoch: 8, step: 852, loss: 0.34662753343582153, mean loss: 0.37635438717790626
Epoch: 8, step: 853, loss: 0.34744659066200256, mean loss: 0.3763520570314839
Epoch: 8, step: 854, loss: 0.35636067390441895, mean loss: 0.3763504457327713
Epoch: 8, step: 855, loss: 0.34179556369781494, mean loss: 0.37634766084543775
Epoch: 8, step: 856, loss: 0.31514617800712585, mean loss: 0.3763427288216777
Epoch: 8, step: 857, loss: 0.3617345690727234, mean loss: 0.3763415516935754
Epoch: 8, step: 858, loss: 0.33482617139816284, mean loss: 0.376338206646416
Epoch: 8, step: 859, loss: 0.333305299282074, mean loss: 0.37633473960586133
Epoch: 8, step: 860, loss: 0.3625219464302063, mean loss: 0.3763336268375398
Epoch: 8, step: 861, loss: 0.35339686274528503, mean loss: 0.3763317791845599
Epoch: 8, step: 862, loss: 0.3248222768306732, mean loss: 0.3763276302113538
Epoch: 8, step: 863, loss: 0.319053053855896, mean loss: 0.376323017246119
Epoch: 8, step: 864, loss: 0.37024402618408203, mean loss: 0.37632252767608904
Epoch: 8, step: 865, loss: 0.3415600061416626, mean loss: 0.3763197283105282
Epoch: 8, step: 866, loss: 0.2933027446269989, mean loss: 0.37631304363513696
Epoch: 8, step: 867, loss: 0.33556848764419556, mean loss: 0.3763097630750733
Epoch: 8, step: 868, loss: 0.35461533069610596, mean loss: 0.37630801648201484
Epoch: 8, step: 869, loss: 0.34887152910232544, mean loss: 0.3763058077807284
Epoch: 8, step: 870, loss: 0.39629891514778137, mean loss: 0.3763074171429893
Epoch: 8, step: 871, loss: 0.31533104181289673, mean loss: 0.3763025091926247
Epoch: 8, step: 872, loss: 0.35966765880584717, mean loss: 0.376301170371668
Epoch: 8, step: 873, loss: 0.35991767048835754, mean loss: 0.3762998518862436
Epoch: 8, step: 874, loss: 0.36787092685699463, mean loss: 0.3762991736111145
Epoch: 8, step: 875, loss: 0.41693758964538574, mean loss: 0.37630244351906705
Epoch: 8, step: 876, loss: 0.3713465929031372, mean loss: 0.3763020447862152
Epoch: 8, step: 877, loss: 0.3705359697341919, mean loss: 0.376301580902462
Epoch: 8, step: 878, loss: 0.365266889333725, mean loss: 0.3763006932271689
Epoch: 8, step: 879, loss: 0.3516201376914978, mean loss: 0.37629870798299775
Epoch: 8, step: 880, loss: 0.3605341911315918, mean loss: 0.3762974400253969
Epoch: 8, step: 881, loss: 0.379142701625824, mean loss: 0.3762976688545428
Epoch: 8, step: 882, loss: 0.3117367923259735, mean loss: 0.37629247698670776
Epoch: 8, step: 883, loss: 0.37294602394104004, mean loss: 0.3762922078927028
Epoch: 8, step: 884, loss: 0.3296871781349182, mean loss: 0.376288460603987
Epoch: 8, step: 885, loss: 0.3773185610771179, mean loss: 0.3762885434228062
Epoch: 8, step: 886, loss: 0.3479610085487366, mean loss: 0.37628626610671373
Epoch: 8, step: 887, loss: 0.3607324957847595, mean loss: 0.37628501580363316
Epoch: 8, step: 888, loss: 0.37233591079711914, mean loss: 0.3762846983769788
Epoch: 8, step: 889, loss: 0.3758114278316498, mean loss: 0.37628466033883823
Epoch: 8, step: 890, loss: 0.3193446397781372, mean loss: 0.37628008427032095
Epoch: 8, step: 891, loss: 0.32328173518180847, mean loss: 0.37627582532230675
Epoch: 8, step: 892, loss: 0.32106733322143555, mean loss: 0.37627138912366465
Epoch: 8, step: 893, loss: 0.3370983600616455, mean loss: 0.3762682416844021
Epoch: 8, step: 894, loss: 0.34423375129699707, mean loss: 0.37626566801280353
Epoch: 8, step: 895, loss: 0.35823526978492737, mean loss: 0.3762642195553623
Epoch: 8, step: 896, loss: 0.34854811429977417, mean loss: 0.376261993183344
Epoch: 8, step: 897, loss: 0.29637378454208374, mean loss: 0.3762555764597584
Epoch: 8, step: 898, loss: 0.31630179286003113, mean loss: 0.3762507612815719
Epoch: 8, step: 899, loss: 0.31625622510910034, mean loss: 0.37624594321731136
Epoch: 8, step: 900, loss: 0.3222414553165436, mean loss: 0.3762416065524193
Epoch: 8, step: 901, loss: 0.36650148034095764, mean loss: 0.37624082446423784
Epoch: 8, step: 902, loss: 0.38329437375068665, mean loss: 0.3762413907869425
Epoch: 8, step: 903, loss: 0.3321378827095032, mean loss: 0.37623785004287724
Epoch: 8, step: 904, loss: 0.38330528140068054, mean loss: 0.3762384173890567
Epoch: 8, step: 905, loss: 0.33025607466697693, mean loss: 0.37623472639991545
Epoch: 8, step: 906, loss: 0.32849782705307007, mean loss: 0.3762308948805843
Epoch: 8, step: 907, loss: 0.350204199552536, mean loss: 0.37622880606073456
Epoch: 8, step: 908, loss: 0.3404063582420349, mean loss: 0.37622593129564197
Epoch: 8, step: 909, loss: 0.3849494457244873, mean loss: 0.3762266313048242
Epoch: 8, step: 910, loss: 0.32528579235076904, mean loss: 0.37622254393910537
Epoch: 8, step: 911, loss: 0.37837257981300354, mean loss: 0.3762227164387743
Epoch: 8, step: 912, loss: 0.3218504786491394, mean loss: 0.37621835444617185
Epoch: 8, step: 913, loss: 0.32453423738479614, mean loss: 0.37621420843966924
Epoch: 8, step: 914, loss: 0.3142243027687073, mean loss: 0.3762092361202924
Epoch: 8, step: 915, loss: 0.37953898310661316, mean loss: 0.3762095031837337
Epoch: 8, step: 916, loss: 0.35271188616752625, mean loss: 0.37620761870085484
Epoch: 8, step: 917, loss: 0.32062894105911255, mean loss: 0.3762031617098651
Epoch: 8, step: 918, loss: 0.36792805790901184, mean loss: 0.3762024981621303
Epoch: 8, step: 919, loss: 0.3295539915561676, mean loss: 0.37619875790342233
Epoch: 8, step: 920, loss: 0.34421437978744507, mean loss: 0.37619619361430856
Epoch: 8, step: 921, loss: 0.3210410177707672, mean loss: 0.3761917720032902
Epoch: 8, step: 922, loss: 0.3891264796257019, mean loss: 0.37619280885360057
Epoch: 8, step: 923, loss: 0.3413909077644348, mean loss: 0.3761900193456582
Epoch: 8, step: 924, loss: 0.3329443335533142, mean loss: 0.37618655331329526
Epoch: 8, step: 925, loss: 0.3468672037124634, mean loss: 0.37618420362988436
Epoch: 8, step: 926, loss: 0.39121299982070923, mean loss: 0.3761854079568489
Epoch: 8, step: 927, loss: 0.3663245439529419, mean loss: 0.37618461782351525
Epoch: 8, step: 928, loss: 0.37072432041168213, mean loss: 0.3761841803347394
Epoch: 8, step: 929, loss: 0.3134746849536896, mean loss: 0.37617915634055726
Epoch: 8, step: 930, loss: 0.3160017132759094, mean loss: 0.3761743355888898
Epoch: 8, step: 931, loss: 0.3703887462615967, mean loss: 0.37617387214854
Epoch: 8, step: 932, loss: 0.3581473231315613, mean loss: 0.37617242829199077
Epoch: 8, step: 933, loss: 0.3373054265975952, mean loss: 0.3761693154454671
Epoch: 8, step: 934, loss: 0.3133692741394043, mean loss: 0.37616428621175957
Epoch: 8, step: 935, loss: 0.31302520632743835, mean loss: 0.3761592302316279
Epoch: 8, step: 936, loss: 0.3684273958206177, mean loss: 0.37615861114007443
Epoch: 8, step: 937, loss: 0.2958559989929199, mean loss: 0.37615218178762067
Epoch: 8, step: 938, loss: 0.3611750304698944, mean loss: 0.37615098275220976
Epoch: 8, step: 939, loss: 0.32903993129730225, mean loss: 0.37614721145446284
Epoch: 8, step: 940, loss: 0.3878098428249359, mean loss: 0.3761481449877511
Epoch: 8, step: 941, loss: 0.3428193926811218, mean loss: 0.3761454774071279
Epoch: 8, step: 942, loss: 0.3325740396976471, mean loss: 0.3761419902972672
Epoch: 8, step: 943, loss: 0.31499311327934265, mean loss: 0.3761370968211934
Epoch: 8, step: 944, loss: 0.36670514941215515, mean loss: 0.37613634208426383
Epoch: 8, step: 945, loss: 0.3255406618118286, mean loss: 0.3761322937821137
Epoch: 8, step: 946, loss: 0.31199395656585693, mean loss: 0.37612716230461823
Epoch: 8, step: 947, loss: 0.36784467101097107, mean loss: 0.37612649970531475
Epoch: 8, step: 948, loss: 0.31839847564697266, mean loss: 0.37612188183281986
Epoch: 8, step: 949, loss: 0.3473803997039795, mean loss: 0.3761195828820817
Epoch: 8, step: 950, loss: 0.3573269844055176, mean loss: 0.3761180798349349
Epoch: 8, step: 951, loss: 0.38490524888038635, mean loss: 0.37611878258357895
Epoch: 8, step: 952, loss: 0.32340309023857117, mean loss: 0.37611456701441903
Epoch: 8, step: 953, loss: 0.3110594153404236, mean loss: 0.3761093650992044
Epoch: 8, step: 954, loss: 0.40919843316078186, mean loss: 0.37611201074308875
Epoch: 8, step: 955, loss: 0.2925941050052643, mean loss: 0.37610533358401155
Epoch: 8, step: 956, loss: 0.3331499695777893, mean loss: 0.37610189962733986
Epoch: 8, step: 957, loss: 0.3288092017173767, mean loss: 0.37609811923582026
Epoch: 8, step: 958, loss: 0.35406729578971863, mean loss: 0.3760963583195509
Epoch: 8, step: 959, loss: 0.4028800129890442, mean loss: 0.3760984989569126
Epoch: 8, step: 960, loss: 0.350408136844635, mean loss: 0.3760964458631611
Epoch: 8, step: 961, loss: 0.3434106111526489, mean loss: 0.3760938339217586
Epoch: 8, step: 962, loss: 0.33167168498039246, mean loss: 0.3760902844092583
Epoch: 8, step: 963, loss: 0.3461795151233673, mean loss: 0.37608789460666275
Epoch: 8, step: 964, loss: 0.38393598794937134, mean loss: 0.3760885216014173
Epoch: 8, step: 965, loss: 0.35183775424957275, mean loss: 0.37608658432970044
Epoch: 8, step: 966, loss: 0.3521787226200104, mean loss: 0.3760846746035474
Epoch: 8, step: 967, loss: 0.3459872603416443, mean loss: 0.37608227065672134
Epoch: 8, step: 968, loss: 0.3357491195201874, mean loss: 0.3760790494163143
Epoch: 8, step: 969, loss: 0.3355613648891449, mean loss: 0.3760758136964192
Epoch: 8, step: 970, loss: 0.3666287958621979, mean loss: 0.3760750593230395
Epoch: 8, step: 971, loss: 0.3233187794685364, mean loss: 0.3760708469084871
Epoch: 8, step: 972, loss: 0.33163782954216003, mean loss: 0.37606729936219035
Epoch: 8, step: 973, loss: 0.3731887638568878, mean loss: 0.37606706955734404
Epoch: 8, step: 974, loss: 0.351701021194458, mean loss: 0.3760651244748532
Epoch: 8, step: 975, loss: 0.40757280588150024, mean loss: 0.3760676394558084
Epoch: 8, step: 976, loss: 0.30675122141838074, mean loss: 0.3760621069777146
Epoch: 8, step: 977, loss: 0.33127376437187195, mean loss: 0.37605853248907883
Epoch: 8, step: 978, loss: 0.34070253372192383, mean loss: 0.37605571100645435
Epoch: 8, step: 979, loss: 0.29864659905433655, mean loss: 0.37604953409040326
Epoch: 8, step: 980, loss: 0.3538017272949219, mean loss: 0.3760477589522244
Epoch: 8, step: 981, loss: 0.35251501202583313, mean loss: 0.37604588143930545
Epoch: 8, step: 982, loss: 0.36342868208885193, mean loss: 0.37604487488171867
Epoch: 8, step: 983, loss: 0.33084502816200256, mean loss: 0.3760412692781195
Epoch: 8, step: 984, loss: 0.3652641475200653, mean loss: 0.37604040965286956
Epoch: 8, step: 985, loss: 0.3271181881427765, mean loss: 0.37603650773697306
Epoch: 8, step: 986, loss: 0.3515773117542267, mean loss: 0.37603455708732136
Epoch: 8, step: 987, loss: 0.31584131717681885, mean loss: 0.37602975698844493
Epoch: 8, step: 988, loss: 0.3650074899196625, mean loss: 0.37602887808986674
Epoch: 8, step: 989, loss: 0.38263174891471863, mean loss: 0.37602940455062456
Epoch: 8, step: 990, loss: 0.32616686820983887, mean loss: 0.3760254292228449
Epoch: 8, step: 991, loss: 0.3160798251628876, mean loss: 0.3760206503959906
Epoch: 8, step: 992, loss: 0.3193528354167938, mean loss: 0.37601613323258054
Epoch: 8, step: 993, loss: 0.3164370059967041, mean loss: 0.3760113843781858
Epoch: 8, step: 994, loss: 0.34144482016563416, mean loss: 0.3760086294117227
Epoch: 8, step: 995, loss: 0.37303683161735535, mean loss: 0.37600839257734314
Epoch: 8, step: 996, loss: 0.31889912486076355, mean loss: 0.3760038416754612
Epoch: 8, step: 997, loss: 0.40440866351127625, mean loss: 0.3760061050078784
Epoch: 8, step: 998, loss: 0.4018784761428833, mean loss: 0.3760081663871418
Epoch: 8, step: 999, loss: 0.3593995273113251, mean loss: 0.3760068432004723
Epoch: 8, step: 1000, loss: 0.39103415608406067, mean loss: 0.3760080403097596
Epoch: 8, step: 1001, loss: 0.3184923231601715, mean loss: 0.37600345884431835
Epoch: 8, step: 1002, loss: 0.35221678018569946, mean loss: 0.37600156424625714
Epoch: 8, step: 1003, loss: 0.3226287364959717, mean loss: 0.37599731346354365
Epoch: 8, step: 1004, loss: 0.344341516494751, mean loss: 0.37599479249540085
Epoch: 8, step: 1005, loss: 0.32450684905052185, mean loss: 0.37599069248397826
Epoch: 8, step: 1006, loss: 0.38001495599746704, mean loss: 0.3759910129126361
Epoch: 8, step: 1007, loss: 0.3239397704601288, mean loss: 0.37598686870543446
Epoch: 8, step: 1008, loss: 0.33288878202438354, mean loss: 0.37598343760228337
Epoch: 8, step: 1009, loss: 0.36676159501075745, mean loss: 0.375982703496043
Epoch: 8, step: 1010, loss: 0.3518289029598236, mean loss: 0.375980780881975
Epoch: 8, step: 1011, loss: 0.34360459446907043, mean loss: 0.375978203980796
Epoch: 8, step: 1012, loss: 0.32859092950820923, mean loss: 0.3759744326099665
Epoch: 8, step: 1013, loss: 0.3189360499382019, mean loss: 0.3759698935058226
Epoch: 8, step: 1014, loss: 0.33623674511909485, mean loss: 0.3759667318006912
Epoch: 8, step: 1015, loss: 0.32129183411598206, mean loss: 0.37596238147465005
Epoch: 8, step: 1016, loss: 0.33525922894477844, mean loss: 0.3759591430982852
Epoch: 8, step: 1017, loss: 0.3501565158367157, mean loss: 0.37595709038330816
Epoch: 8, step: 1018, loss: 0.3327587842941284, mean loss: 0.37595365403726655
Epoch: 8, step: 1019, loss: 0.3367883265018463, mean loss: 0.37595053875508905
Epoch: 8, step: 1020, loss: 0.316394567489624, mean loss: 0.3759458019403857
Epoch: 8, step: 1021, loss: 0.3473713994026184, mean loss: 0.37594352944137677
Epoch: 8, step: 1022, loss: 0.3844856023788452, mean loss: 0.3759442087314712
Epoch: 8, step: 1023, loss: 0.35906147956848145, mean loss: 0.37594286627527185
Epoch: 8, step: 1024, loss: 0.366035521030426, mean loss: 0.3759420785401009
Epoch: 8, step: 1025, loss: 0.3322809934616089, mean loss: 0.37593860731374706
Epoch: 8, step: 1026, loss: 0.3558851480484009, mean loss: 0.3759370131123586
Epoch: 8, step: 1027, loss: 0.34115397930145264, mean loss: 0.37593424816531484
Epoch: 8, step: 1028, loss: 0.31978321075439453, mean loss: 0.3759297850036098
Epoch: 8, step: 1029, loss: 0.3486834764480591, mean loss: 0.37592761950459885
Epoch: 8, step: 1030, loss: 0.31009700894355774, mean loss: 0.3759223877943103
Epoch: 8, step: 1031, loss: 0.33802324533462524, mean loss: 0.3759193761014893
Epoch: 8, step: 1032, loss: 0.321145236492157, mean loss: 0.3759150237662005
Epoch: 8, step: 1033, loss: 0.33324047923088074, mean loss: 0.37591163313021325
Epoch: 8, step: 1034, loss: 0.3862479031085968, mean loss: 0.37591245431635595
Epoch: 8, step: 1035, loss: 0.35810840129852295, mean loss: 0.3759110399492589
Epoch: 8, step: 1036, loss: 0.3640574812889099, mean loss: 0.3759100983686202
Epoch: 8, step: 1037, loss: 0.33108142018318176, mean loss: 0.37590653771109955
Epoch: 8, step: 1038, loss: 0.3475733697414398, mean loss: 0.3759042874396382
Epoch: 8, step: 1039, loss: 0.3944513201713562, mean loss: 0.3759057603615515
Epoch: 8, step: 1040, loss: 0.37286263704299927, mean loss: 0.37590551870957667
Epoch: 8, step: 1041, loss: 0.3619738519191742, mean loss: 0.3759044124949673
Epoch: 8, step: 1042, loss: 0.31052902340888977, mean loss: 0.37589922191226893
Epoch: 8, step: 1043, loss: 0.34605950117111206, mean loss: 0.3758968529284057
Epoch: 8, step: 1044, loss: 0.327968955039978, mean loss: 0.37589304822110325
Epoch: 8, step: 1045, loss: 0.32499098777770996, mean loss: 0.3758890077336891
Epoch: 8, step: 1046, loss: 0.3395804762840271, mean loss: 0.3758861258754901
Epoch: 8, step: 1047, loss: 0.32051366567611694, mean loss: 0.3758817312357917
Epoch: 8, step: 1048, loss: 0.3597216308116913, mean loss: 0.37588044878992044
Epoch: 8, step: 1049, loss: 0.3127788305282593, mean loss: 0.3758754415197838
Epoch: 8, step: 1050, loss: 0.3450930714607239, mean loss: 0.37587299905608
Epoch: 8, step: 1051, loss: 0.3590497374534607, mean loss: 0.3758716643003197
Epoch: 8, step: 1052, loss: 0.3302248418331146, mean loss: 0.3758680429736662
Epoch: 8, step: 1053, loss: 0.3349488079547882, mean loss: 0.3758647969610517
Epoch: 8, step: 1054, loss: 0.32287800312042236, mean loss: 0.3758605939949344
Epoch: 8, step: 1055, loss: 0.34780290722846985, mean loss: 0.37585836860734184
Epoch: 8, step: 1056, loss: 0.32351934909820557, mean loss: 0.3758542176818514
Epoch: 8, step: 1057, loss: 0.31477877497673035, mean loss: 0.3758493742684727
Epoch: 8, step: 1058, loss: 0.32605883479118347, mean loss: 0.3758454260851821
Epoch: 8, step: 1059, loss: 0.3205154240131378, mean loss: 0.3758410389933591
Epoch: 8, step: 1060, loss: 0.3438107371330261, mean loss: 0.37583849952599524
Epoch: 8, step: 1061, loss: 0.34335529804229736, mean loss: 0.37583592435543206
Epoch: 8, step: 1062, loss: 0.33949968218803406, mean loss: 0.37583304395573586
Epoch: 8, step: 1063, loss: 0.3439403176307678, mean loss: 0.3758305159970861
Epoch: 8, step: 1064, loss: 0.36267268657684326, mean loss: 0.37582947313195014
Epoch: 8, step: 1065, loss: 0.3797209858894348, mean loss: 0.3758297815415838
Epoch: 8, step: 1066, loss: 0.31943321228027344, mean loss: 0.37582531236262656
Epoch: 8, step: 1067, loss: 0.331149160861969, mean loss: 0.3758217722555346
Epoch: 8, step: 1068, loss: 0.32966452836990356, mean loss: 0.37581811507750706
Epoch: 8, step: 1069, loss: 0.3243403732776642, mean loss: 0.37581403666348395
Epoch: 8, step: 1070, loss: 0.3465770483016968, mean loss: 0.3758117204955079
Epoch: 8, step: 1071, loss: 0.33158382773399353, mean loss: 0.3758082170185781
Epoch: 8, step: 1072, loss: 0.33434566855430603, mean loss: 0.3758049328563235
Epoch: 8, step: 1073, loss: 0.3117431700229645, mean loss: 0.3757998590591721
Epoch: 8, step: 1074, loss: 0.3250036835670471, mean loss: 0.37579583623700596
Epoch: 8, step: 1075, loss: 0.3731769323348999, mean loss: 0.3757956288483536
Epoch: 8, step: 1076, loss: 0.3317359983921051, mean loss: 0.375792140081986
Epoch: 8, step: 1077, loss: 0.31955236196517944, mean loss: 0.3757876872096094
Epoch: 8, step: 1078, loss: 0.3412257432937622, mean loss: 0.3757849509303033
Epoch: 8, step: 1079, loss: 0.33558931946754456, mean loss: 0.3757817688822141
Epoch: 8, step: 1080, loss: 0.3231494426727295, mean loss: 0.3757776026250931
Epoch: 8, step: 1081, loss: 0.3071341812610626, mean loss: 0.3757721693956041
Epoch: 8, step: 1082, loss: 0.31732502579689026, mean loss: 0.3757675435828935
Epoch: 8, step: 1083, loss: 0.3232797086238861, mean loss: 0.37576338974980084
Epoch: 8, step: 1084, loss: 0.34643152356147766, mean loss: 0.37576106863987063
Epoch: 8, step: 1085, loss: 0.29812705516815186, mean loss: 0.3757549257364467
Epoch: 8, step: 1086, loss: 0.3390437662601471, mean loss: 0.3757520211427703
Epoch: 8, step: 1087, loss: 0.3656383156776428, mean loss: 0.37575122100784425
Epoch: 8, step: 1088, loss: 0.34281548857688904, mean loss: 0.375748615538939
Epoch: 8, step: 1089, loss: 0.3736679255962372, mean loss: 0.3757484509534349
Epoch: 8, step: 1090, loss: 0.3786020278930664, mean loss: 0.37574867665753514
Epoch: 8, step: 1091, loss: 0.3084399998188019, mean loss: 0.3757433532885982
Epoch: 8, step: 1092, loss: 0.33047544956207275, mean loss: 0.3757397733832027
Epoch: 8, step: 1093, loss: 0.3345458507537842, mean loss: 0.37573651591660223
Epoch: 8, step: 1094, loss: 0.34700170159339905, mean loss: 0.37573424385094845
Epoch: 8, step: 1095, loss: 0.31089991331100464, mean loss: 0.3757291177969842
Epoch: 8, step: 1096, loss: 0.3543424606323242, mean loss: 0.37572742701849066
Epoch: 8, step: 1097, loss: 0.31789639592170715, mean loss: 0.37572285539547906
Epoch: 8, step: 1098, loss: 0.3522012531757355, mean loss: 0.37572099612726156
Epoch: 8, step: 1099, loss: 0.2956981360912323, mean loss: 0.3757146712094592
Epoch: 8, step: 1100, loss: 0.34015199542045593, mean loss: 0.375711860597289
Epoch: 8, step: 1101, loss: 0.386309415102005, mean loss: 0.37571269808381536
Epoch: 8, step: 1102, loss: 0.34542691707611084, mean loss: 0.3757103048968531
Epoch: 8, step: 1103, loss: 0.32863593101501465, mean loss: 0.3757065853666791
Epoch: 8, step: 1104, loss: 0.2969758212566376, mean loss: 0.3757003650329421
Epoch: 8, step: 1105, loss: 0.33890968561172485, mean loss: 0.3756974585169505
Epoch: 8, step: 1106, loss: 0.3347865045070648, mean loss: 0.3756942267487216
Epoch: 8, step: 1107, loss: 0.33990544080734253, mean loss: 0.3756913998304008
Epoch: 8, step: 1108, loss: 0.3382008373737335, mean loss: 0.3756884387244489
Epoch: 8, step: 1109, loss: 0.3317252993583679, mean loss: 0.3756849666711109
Epoch: 8, step: 1110, loss: 0.3826369345188141, mean loss: 0.37568551566959846
Epoch: 8, step: 1111, loss: 0.3475606441497803, mean loss: 0.375683294817457
Epoch: 8, step: 1112, loss: 0.33107906579971313, mean loss: 0.3756797729675543
Epoch: 8, step: 1113, loss: 0.3379070460796356, mean loss: 0.37567679075320976
Epoch: 8, step: 1114, loss: 0.3809056282043457, mean loss: 0.3756772035453035
Epoch: 8, step: 1115, loss: 0.41651061177253723, mean loss: 0.3756804268961266
Epoch: 8, step: 1116, loss: 0.3337131440639496, mean loss: 0.37567711429980233
Epoch: 8, step: 1117, loss: 0.36051782965660095, mean loss: 0.3756759178290333
Epoch: 8, step: 1118, loss: 0.34883415699005127, mean loss: 0.37567379946735396
Epoch: 8, step: 1119, loss: 0.3611304461956024, mean loss: 0.37567265179111725
Epoch: 8, step: 1120, loss: 0.3968539834022522, mean loss: 0.3756743231658203
Epoch: 8, step: 1121, loss: 0.3562298119068146, mean loss: 0.37567278896104994
Epoch: 8, step: 1122, loss: 0.3863847255706787, mean loss: 0.37567363408425386
Epoch: 8, step: 1123, loss: 0.33246365189552307, mean loss: 0.37567022528161986
Epoch: 8, step: 1124, loss: 0.3441200852394104, mean loss: 0.3756677365114028
Epoch: 8, step: 1125, loss: 0.33417749404907227, mean loss: 0.37566446389407654
Epoch: 8, step: 1126, loss: 0.3490683436393738, mean loss: 0.3756623662428221
Epoch: 8, step: 1127, loss: 0.31593620777130127, mean loss: 0.3756576559779584
Epoch: 8, step: 1128, loss: 0.3222617208957672, mean loss: 0.37565344527414307
Epoch: 8, step: 1129, loss: 0.3347642719745636, mean loss: 0.3756502210844806
Epoch: 8, step: 1130, loss: 0.31460344791412354, mean loss: 0.3756454078089803
Epoch: 8, step: 1131, loss: 0.35399356484413147, mean loss: 0.37564370078887904
Epoch: 8, step: 1132, loss: 0.3635689318180084, mean loss: 0.37564274889538507
Epoch: 8, step: 1133, loss: 0.3794002830982208, mean loss: 0.3756430450907345
Epoch: 8, step: 1134, loss: 0.36096957325935364, mean loss: 0.3756418885153556
Epoch: 8, step: 1135, loss: 0.36266854405403137, mean loss: 0.3756408660260381
Epoch: 8, step: 1136, loss: 0.333712637424469, mean loss: 0.3756375617287253
Epoch: 8, step: 1137, loss: 0.3422156870365143, mean loss: 0.3756349280112555
Epoch: 8, step: 1138, loss: 0.3277328312397003, mean loss: 0.37563115351777415
Epoch: 8, step: 1139, loss: 0.3361966609954834, mean loss: 0.3756280464824352
Epoch: 8, step: 1140, loss: 0.30561506748199463, mean loss: 0.3756225306091979
Epoch: 8, step: 1141, loss: 0.35688769817352295, mean loss: 0.375621054728275
Epoch: 8, step: 1142, loss: 0.38840290904045105, mean loss: 0.37562206156989075
Epoch: 8, step: 1143, loss: 0.30190157890319824, mean loss: 0.3756162549786284
Epoch: 8, step: 1144, loss: 0.401172012090683, mean loss: 0.3756182677184183
Epoch: 8, step: 1145, loss: 0.3427087664604187, mean loss: 0.37561567601096374
Epoch: 8, step: 1146, loss: 0.3501586616039276, mean loss: 0.37561367136379414
Epoch: 8, step: 1147, loss: 0.33006706833839417, mean loss: 0.37561008501709925
Epoch: 8, step: 1148, loss: 0.3459862768650055, mean loss: 0.3756077526174337
Epoch: 8, step: 1149, loss: 0.42121464014053345, mean loss: 0.37561134314550193
Epoch: 8, step: 1150, loss: 0.33469969034194946, mean loss: 0.37560812251629594
Epoch: 8, step: 1151, loss: 0.32737475633621216, mean loss: 0.37560432580926034
Epoch: 8, step: 1152, loss: 0.34265750646591187, mean loss: 0.37560173259246826
Epoch: 8, step: 1153, loss: 0.3367038071155548, mean loss: 0.37559867121001295
Epoch: 8, step: 1154, loss: 0.3572084605693817, mean loss: 0.3755972239596281
Epoch: 8, step: 1155, loss: 0.32813867926597595, mean loss: 0.37559348941881177
Epoch: 8, step: 1156, loss: 0.3872254490852356, mean loss: 0.3755944046725427
Epoch: 8, step: 1157, loss: 0.3477712571620941, mean loss: 0.37559221559720746
Epoch: 8, step: 1158, loss: 0.35152122378349304, mean loss: 0.3755903218837456
Epoch: 8, step: 1159, loss: 0.36443716287612915, mean loss: 0.3755894445112623
Epoch: 8, step: 1160, loss: 0.3770667314529419, mean loss: 0.3755895607141209
Epoch: 8, step: 1161, loss: 0.407027930021286, mean loss: 0.37559203345042
Epoch: 8, step: 1162, loss: 0.36722326278686523, mean loss: 0.3755913752694791
Epoch: 8, step: 1163, loss: 0.3806018829345703, mean loss: 0.3755917693012238
Epoch: 8, step: 1164, loss: 0.3278505504131317, mean loss: 0.37558801517533813
Epoch: 8, step: 1165, loss: 0.3402009606361389, mean loss: 0.37558523273670474
Epoch: 8, step: 1166, loss: 0.34050142765045166, mean loss: 0.37558247435907394
Epoch: 8, step: 1167, loss: 0.3253151476383209, mean loss: 0.37557852252521223
Epoch: 8, step: 1168, loss: 0.3688011169433594, mean loss: 0.3755779897521927
Epoch: 8, step: 1169, loss: 0.3488977551460266, mean loss: 0.37557589257921625
Epoch: 8, step: 1170, loss: 0.3470503091812134, mean loss: 0.37557365053069014
Epoch: 8, step: 1171, loss: 0.29714205861091614, mean loss: 0.37556748646342203
Epoch: 8, step: 1172, loss: 0.33513933420181274, mean loss: 0.3755643093984113
Epoch: 8, step: 1173, loss: 0.34867867827415466, mean loss: 0.3755621967447004
Epoch: 8, step: 1174, loss: 0.3574211597442627, mean loss: 0.3755607713469633
Epoch: 8, step: 1175, loss: 0.2999953031539917, mean loss: 0.3755548343994309
Epoch: 8, step: 1176, loss: 0.3505743145942688, mean loss: 0.3755528719106411
Epoch: 8, step: 1177, loss: 0.4150956869125366, mean loss: 0.37555597818047626
Epoch: 8, step: 1178, loss: 0.3175475299358368, mean loss: 0.3755514217082239
Epoch: 8, step: 1179, loss: 0.34313929080963135, mean loss: 0.37554887598635
Epoch: 8, step: 1180, loss: 0.36602896451950073, mean loss: 0.37554812832975165
Epoch: 8, step: 1181, loss: 0.33249908685684204, mean loss: 0.37554474769197305
Epoch: 8, step: 1182, loss: 0.32091569900512695, mean loss: 0.3755404580140235
Epoch: 8, step: 1183, loss: 0.3213045299053192, mean loss: 0.37553619953976874
Epoch: 8, step: 1184, loss: 0.3095429539680481, mean loss: 0.37553101831612334
Epoch: 8, step: 1185, loss: 0.33817046880722046, mean loss: 0.3755280853164759
Epoch: 8, step: 1186, loss: 0.31671351194381714, mean loss: 0.3755234684255604
Epoch: 8, step: 1187, loss: 0.34092843532562256, mean loss: 0.375520752959854
Epoch: 8, step: 1188, loss: 0.3491009473800659, mean loss: 0.3755186793545185
Epoch: 8, step: 1189, loss: 0.3389182388782501, mean loss: 0.3755158069294301
Epoch: 8, step: 1190, loss: 0.3654649257659912, mean loss: 0.3755150181919928
Epoch: 8, step: 1191, loss: 0.3429555296897888, mean loss: 0.37551246330432
Epoch: 8, step: 1192, loss: 0.3562978208065033, mean loss: 0.3755109556823115
Epoch: 8, step: 1193, loss: 0.3974417448043823, mean loss: 0.37551267628400004
Epoch: 8, step: 1194, loss: 0.32732558250427246, mean loss: 0.3755088960146206
Epoch: 8, step: 1195, loss: 0.33364138007164, mean loss: 0.3755056117727048
Epoch: 8, step: 1196, loss: 0.3302256166934967, mean loss: 0.3755020601219809
Epoch: 8, step: 1197, loss: 0.31121787428855896, mean loss: 0.37549701822505277
Epoch: 8, step: 1198, loss: 0.33281973004341125, mean loss: 0.3754936712492719
Epoch: 8, step: 1199, loss: 0.33871012926101685, mean loss: 0.375490786718062
Epoch: 8, step: 1200, loss: 0.320700079202652, mean loss: 0.37548649041856264
Epoch: 8, step: 1201, loss: 0.34672337770462036, mean loss: 0.3754842351956746
Epoch: 8, step: 1202, loss: 0.3219037652015686, mean loss: 0.3754800344532211
Epoch: 8, step: 1203, loss: 0.3225127160549164, mean loss: 0.37547588210778376
Epoch: 8, step: 1204, loss: 0.31302621960639954, mean loss: 0.37547098678266805
Epoch: 8, step: 1205, loss: 0.32008299231529236, mean loss: 0.37546664535027524
Epoch: 8, step: 1206, loss: 0.3294931650161743, mean loss: 0.375463042130561
Epoch: 8, step: 1207, loss: 0.30976858735084534, mean loss: 0.3754578936623181
Epoch: 8, step: 1208, loss: 0.3253089189529419, mean loss: 0.3754539637998693
Epoch: 8, step: 1209, loss: 0.3364725112915039, mean loss: 0.375450909305863
Epoch: 8, step: 1210, loss: 0.3561725616455078, mean loss: 0.3754493988187001
Epoch: 8, step: 1211, loss: 0.3320139944553375, mean loss: 0.37544599585690414
Epoch: 8, step: 1212, loss: 0.40976521372795105, mean loss: 0.3754486843972779
Epoch: 8, step: 1213, loss: 0.34841078519821167, mean loss: 0.3754465664355672
Epoch: 8, step: 1214, loss: 0.3242626488208771, mean loss: 0.3754425573560955
Epoch: 8, step: 1215, loss: 0.3752160966396332, mean loss: 0.3754425396195106
Epoch: 8, step: 1216, loss: 0.32834476232528687, mean loss: 0.37543885117270237
Epoch: 8, step: 1217, loss: 0.32534947991371155, mean loss: 0.37543492874738843
Epoch: 8, step: 1218, loss: 0.32554659247398376, mean loss: 0.37543102237073245
Epoch: 8, step: 1219, loss: 0.31879526376724243, mean loss: 0.37542658800190976
Epoch: 8, step: 1220, loss: 0.356997013092041, mean loss: 0.37542514514784964
Epoch: 8, step: 1221, loss: 0.3479990065097809, mean loss: 0.37542299811961743
Epoch: 8, step: 1222, loss: 0.3247838318347931, mean loss: 0.37541903419270667
Epoch: 8, step: 1223, loss: 0.3332313597202301, mean loss: 0.37541573208919443
Epoch: 8, step: 1224, loss: 0.3404366672039032, mean loss: 0.37541299443051984
Epoch: 8, step: 1225, loss: 0.346857488155365, mean loss: 0.3754107596906329
Epoch: 8, step: 1226, loss: 0.3152984380722046, mean loss: 0.3754060556980186
Epoch: 8, step: 1227, loss: 0.30340176820755005, mean loss: 0.3754004215597173
Epoch: 8, step: 1228, loss: 0.34229835867881775, mean loss: 0.37539783161660795
Epoch: 8, step: 1229, loss: 0.36230605840682983, mean loss: 0.3753968073814953
Epoch: 8, step: 1230, loss: 0.34415149688720703, mean loss: 0.3753943630952953
Epoch: 8, step: 1231, loss: 0.3384374976158142, mean loss: 0.3753914722265938
Epoch: 8, step: 1232, loss: 0.3576374351978302, mean loss: 0.3753900835651133
Epoch: 8, step: 1233, loss: 0.3332558870315552, mean loss: 0.3753867882267327
Epoch: 8, step: 1234, loss: 0.3144789934158325, mean loss: 0.37538202496757805
Epoch: 8, step: 1235, loss: 0.3476621210575104, mean loss: 0.3753798573179135
Epoch: 8, step: 1236, loss: 0.37405380606651306, mean loss: 0.3753797536310536
Epoch: 8, step: 1237, loss: 0.3821920156478882, mean loss: 0.3753802862551362
Epoch: 8, step: 1238, loss: 0.325752854347229, mean loss: 0.375376406383984
Epoch: 8, step: 1239, loss: 0.33522850275039673, mean loss: 0.3753732678674398
Epoch: 8, step: 1240, loss: 0.3750895857810974, mean loss: 0.37537324569264996
Epoch: 8, step: 1241, loss: 0.352409303188324, mean loss: 0.3753714507932827
Epoch: 8, step: 1242, loss: 0.3064632713794708, mean loss: 0.3753660652380335
Epoch: 8, step: 1243, loss: 0.31086716055870056, mean loss: 0.3753610246859329
Epoch: 8, step: 1244, loss: 0.33517220616340637, mean loss: 0.3753578841984341
Epoch: 8, step: 1245, loss: 0.31804007291793823, mean loss: 0.37535340554463814
Epoch: 8, step: 1246, loss: 0.3243534564971924, mean loss: 0.3753494208623155
Epoch: 8, step: 1247, loss: 0.31190425157546997, mean loss: 0.37534446420846496
Epoch: 8, step: 1248, loss: 0.3657981753349304, mean loss: 0.3753437184629081
Epoch: 8, step: 1249, loss: 0.33873817324638367, mean loss: 0.37534085910146325
Epoch: 8, step: 1250, loss: 0.31474390625953674, mean loss: 0.3753361260738258
Epoch: 8, step: 1251, loss: 0.34336304664611816, mean loss: 0.37533362895734446
Epoch: 8, step: 1252, loss: 0.3926706910133362, mean loss: 0.375334982886439
Epoch: 8, step: 1253, loss: 0.34727081656455994, mean loss: 0.3753327914007041
Epoch: 8, step: 1254, loss: 0.3183576464653015, mean loss: 0.3753283426504163
Epoch: 8, step: 1255, loss: 0.3145100474357605, mean loss: 0.3753235941888911
Epoch: 8, step: 1256, loss: 0.33743590116500854, mean loss: 0.3753206362926444
Epoch: 8, step: 1257, loss: 0.31776270270347595, mean loss: 0.37531614308939776
Epoch: 8, step: 1258, loss: 0.33038270473480225, mean loss: 0.3753126356787074
Epoch: 8, step: 1259, loss: 0.30140843987464905, mean loss: 0.3753068673212453
Epoch: 8, step: 1260, loss: 0.36122873425483704, mean loss: 0.3753057685830055
Epoch: 8, step: 1261, loss: 0.3680563271045685, mean loss: 0.37530520283917235
Epoch: 8, step: 1262, loss: 0.31225746870040894, mean loss: 0.3753002830003788
Epoch: 8, step: 1263, loss: 0.38209354877471924, mean loss: 0.3753008130616908
Epoch: 8, step: 1264, loss: 0.3172770142555237, mean loss: 0.3752962859649594
Epoch: 8, step: 1265, loss: 0.3393241763114929, mean loss: 0.375293479590357
Epoch: 8, step: 1266, loss: 0.33885377645492554, mean loss: 0.37529063695808185
Epoch: 8, step: 1267, loss: 0.3210292160511017, mean loss: 0.3752864043979487
Epoch: 8, step: 1268, loss: 0.3149198293685913, mean loss: 0.3752816959840161
Epoch: 8, step: 1269, loss: 0.3749617338180542, mean loss: 0.3752816710298619
Epoch: 8, step: 1270, loss: 0.3615208566188812, mean loss: 0.37528059789452606
Epoch: 8, step: 1271, loss: 0.3180023431777954, mean loss: 0.37527613140554317
Epoch: 8, step: 1272, loss: 0.3605014681816101, mean loss: 0.37527497938501886
Epoch: 8, step: 1273, loss: 0.3265918493270874, mean loss: 0.3752711837254166
Epoch: 8, step: 1274, loss: 0.3294723629951477, mean loss: 0.3752676132240733
Epoch: 8, step: 1275, loss: 0.33967262506484985, mean loss: 0.3752648384354734
Epoch: 8, step: 1276, loss: 0.37170177698135376, mean loss: 0.37526456070054054
Epoch: 8, step: 1277, loss: 0.33498045802116394, mean loss: 0.3752614208640106
Epoch: 8, step: 1278, loss: 0.34387803077697754, mean loss: 0.375258974960333
Epoch: 8, step: 1279, loss: 0.3916248679161072, mean loss: 0.37526025035722793
Epoch: 8, step: 1280, loss: 0.3646897077560425, mean loss: 0.37525942665718887
Epoch: 8, step: 1281, loss: 0.3452087938785553, mean loss: 0.37525708517107553
Epoch: 8, step: 1282, loss: 0.3245082199573517, mean loss: 0.37525313122754506
Epoch: 8, step: 1283, loss: 0.3708290159702301, mean loss: 0.3752527865629099
Epoch: 8, step: 1284, loss: 0.33522477746009827, mean loss: 0.3752496683881726
Epoch: 8, step: 1285, loss: 0.3664616346359253, mean loss: 0.3752489838552428
Epoch: 8, step: 1286, loss: 0.3654673099517822, mean loss: 0.37524822198329766
Epoch: 8, step: 1287, loss: 0.35644420981407166, mean loss: 0.3752467574963686
Epoch: 8, step: 1288, loss: 0.3289773166179657, mean loss: 0.375243154237987
Epoch: 8, step: 1289, loss: 0.332090824842453, mean loss: 0.375239793988073
Epoch: 8, step: 1290, loss: 0.3014957904815674, mean loss: 0.37523405202719884
Epoch: 8, step: 1291, loss: 0.3731362521648407, mean loss: 0.3752338886980286
Epoch: 8, step: 1292, loss: 0.36947497725486755, mean loss: 0.3752334403592631
Epoch: 8, step: 1293, loss: 0.3142750859260559, mean loss: 0.3752286950413094
Epoch: 8, step: 1294, loss: 0.3807345926761627, mean loss: 0.37522912361588984
Epoch: 8, step: 1295, loss: 0.40164506435394287, mean loss: 0.37523117965112784
Epoch: 8, step: 1296, loss: 0.3827070891857147, mean loss: 0.37523176147924947
Epoch: 8, step: 1297, loss: 0.33646705746650696, mean loss: 0.375228744770766
Epoch: 8, step: 1298, loss: 0.3813890814781189, mean loss: 0.37522922413709603
Epoch: 8, step: 1299, loss: 0.3300458490848541, mean loss: 0.3752257084683245
Epoch: 8, step: 1300, loss: 0.44983556866645813, mean loss: 0.3752315133279058
Epoch: 8, step: 1301, loss: 0.31864577531814575, mean loss: 0.3752271111388588
Epoch: 8, step: 1302, loss: 0.3541446328163147, mean loss: 0.3752254711172079
Epoch: 8, step: 1303, loss: 0.41891855001449585, mean loss: 0.3752288697698912
Epoch: 8, step: 1304, loss: 0.33954310417175293, mean loss: 0.3752260941795048
Epoch: 8, step: 1305, loss: 0.3949211537837982, mean loss: 0.3752276259153583
Epoch: 8, step: 1306, loss: 0.3185984492301941, mean loss: 0.3752232220599508
Epoch: 8, step: 1307, loss: 0.35877877473831177, mean loss: 0.3752219433315432
Epoch: 8, step: 1308, loss: 0.4040348529815674, mean loss: 0.3752241836635275
Epoch: 8, step: 1309, loss: 0.31329748034477234, mean loss: 0.37521936896104585
Epoch: 8, step: 1310, loss: 0.3519493043422699, mean loss: 0.3752175598912629
Epoch: 8, step: 1311, loss: 0.42128580808639526, mean loss: 0.37522114106727306
Epoch: 8, step: 1312, loss: 0.3852877914905548, mean loss: 0.37522192355078826
Epoch: 8, step: 1313, loss: 0.33388805389404297, mean loss: 0.3752187109074137
Epoch: 8, step: 1314, loss: 0.31861168146133423, mean loss: 0.3752143115113271
Epoch: 8, step: 1315, loss: 0.3536044955253601, mean loss: 0.3752126321659754
Epoch: 8, step: 1316, loss: 0.33272606134414673, mean loss: 0.3752093306995971
Epoch: 8, step: 1317, loss: 0.38428059220314026, mean loss: 0.3752100355373208
Epoch: 8, step: 1318, loss: 0.3183698058128357, mean loss: 0.3752056193901897
Epoch: 8, step: 1319, loss: 0.3196451961994171, mean loss: 0.37520130301175664
Epoch: 8, step: 1320, loss: 0.3748224079608917, mean loss: 0.3752012735784427
Epoch: 8, step: 1321, loss: 0.3046393394470215, mean loss: 0.3751957926141634
Epoch: 8, step: 1322, loss: 0.32563677430152893, mean loss: 0.37519194337002265
Epoch: 8, step: 1323, loss: 0.3599298596382141, mean loss: 0.37519075805752405
Epoch: 8, step: 1324, loss: 0.36723220348358154, mean loss: 0.3751901400133698
Epoch: 8, step: 1325, loss: 0.3371701240539551, mean loss: 0.37518718769034143
Epoch: 8, step: 1326, loss: 0.32565024495124817, mean loss: 0.375183341355786
Epoch: 8, step: 1327, loss: 0.3198762536048889, mean loss: 0.37517904732723395
Epoch: 8, step: 1328, loss: 0.2958585321903229, mean loss: 0.3751728893802472
Epoch: 8, step: 1329, loss: 0.3572610020637512, mean loss: 0.3751714989216758
Epoch: 8, step: 1330, loss: 0.3084486126899719, mean loss: 0.3751663197796878
Epoch: 8, step: 1331, loss: 0.33518004417419434, mean loss: 0.375163216219023
Epoch: 8, step: 1332, loss: 0.36806297302246094, mean loss: 0.37516266517182106
Epoch: 8, step: 1333, loss: 0.3341868817806244, mean loss: 0.37515948530348403
Epoch: 8, step: 1334, loss: 0.35004013776779175, mean loss: 0.37515753610293034
Epoch: 8, step: 1335, loss: 0.32810401916503906, mean loss: 0.37515388514723996
Epoch: 8, step: 1336, loss: 0.34491950273513794, mean loss: 0.3751515393964127
Epoch: 8, step: 1337, loss: 0.32970356941223145, mean loss: 0.3751480135647615
Epoch: 8, step: 1338, loss: 0.36841508746147156, mean loss: 0.3751474912681124
Epoch: 8, step: 1339, loss: 0.35194897651672363, mean loss: 0.3751456918176973
Epoch: 8, step: 1340, loss: 0.34344762563705444, mean loss: 0.3751432332691686
Epoch: 8, step: 1341, loss: 0.31645530462265015, mean loss: 0.37513868170032677
Epoch: 8, step: 1342, loss: 0.33797967433929443, mean loss: 0.375135800040198
Epoch: 8, step: 1343, loss: 0.32151228189468384, mean loss: 0.375131641888977
Epoch: 8, step: 1344, loss: 0.3543340563774109, mean loss: 0.37513002929802475
Epoch: 8, step: 1345, loss: 0.3130001723766327, mean loss: 0.3751252122832223
Epoch: 8, step: 1346, loss: 0.3437490463256836, mean loss: 0.3751227798337334
Epoch: 8, step: 1347, loss: 0.3683187961578369, mean loss: 0.37512225239313834
Epoch: 8, step: 1348, loss: 0.3634743094444275, mean loss: 0.37512134952181453
Epoch: 8, step: 1349, loss: 0.29751166701316833, mean loss: 0.3751153341999645
Epoch: 8, step: 1350, loss: 0.3386780619621277, mean loss: 0.37511251026194714
Epoch: 8, step: 1351, loss: 0.3525782525539398, mean loss: 0.3751107639617528
Epoch: 8, step: 1352, loss: 0.3666647970676422, mean loss: 0.37511010948930845
Epoch: 8, step: 1353, loss: 0.3535606265068054, mean loss: 0.3751084397633684
Epoch: 8, step: 1354, loss: 0.3071393072605133, mean loss: 0.37510317369592416
Epoch: 8, step: 1355, loss: 0.36397868394851685, mean loss: 0.3751023118668455
Epoch: 8, step: 1356, loss: 0.33358103036880493, mean loss: 0.37509909540689523
Epoch: 8, step: 1357, loss: 0.3662099242210388, mean loss: 0.3750984068576167
Epoch: 8, step: 1358, loss: 0.3416805863380432, mean loss: 0.3750958185359902
Epoch: 8, step: 1359, loss: 0.38456636667251587, mean loss: 0.3750965520047121
Epoch: 8, step: 1360, loss: 0.34481629729270935, mean loss: 0.37509420706126656
Epoch: 8, step: 1361, loss: 0.3357115387916565, mean loss: 0.3750911574509003
Epoch: 8, step: 1362, loss: 0.337710440158844, mean loss: 0.3750882630864178
Epoch: 8, step: 1363, loss: 0.32756805419921875, mean loss: 0.3750845839126111
Epoch: 8, step: 1364, loss: 0.3636489808559418, mean loss: 0.3750836985984471
Epoch: 8, step: 1365, loss: 0.32109683752059937, mean loss: 0.3750795194018936
Epoch: 8, step: 1366, loss: 0.3043558597564697, mean loss: 0.3750740450107143
Epoch: 8, step: 1367, loss: 0.3329795002937317, mean loss: 0.3750707869190179
Epoch: 8, step: 1368, loss: 0.37707850337028503, mean loss: 0.3750709423030014
Epoch: 8, step: 1369, loss: 0.30955445766448975, mean loss: 0.3750658721525109
Epoch: 8, step: 1370, loss: 0.31308797001838684, mean loss: 0.37506107621486995
Epoch: 8, step: 1371, loss: 0.39921921491622925, mean loss: 0.37506294546113284
Epoch: 8, step: 1372, loss: 0.3453807234764099, mean loss: 0.3750606489642675
Epoch: 8, step: 1373, loss: 0.3193513751029968, mean loss: 0.37505633910244934
Epoch: 8, step: 1374, loss: 0.3194591701030731, mean loss: 0.37505203824617955
Epoch: 8, step: 1375, loss: 0.36377614736557007, mean loss: 0.3750511660392736
Epoch: 8, step: 1376, loss: 0.3460348844528198, mean loss: 0.37504892176039767
Epoch: 8, step: 1377, loss: 0.3145309388637543, mean loss: 0.37504424132861913
Epoch: 8, step: 1378, loss: 0.347102552652359, mean loss: 0.3750420804989326
Epoch: 8, step: 1379, loss: 0.3171136677265167, mean loss: 0.37503760103614475
Epoch: 8, step: 1380, loss: 0.3350823223590851, mean loss: 0.37503451163085
Epoch: 8, step: 1381, loss: 0.33552828431129456, mean loss: 0.37503145718309067
Epoch: 8, step: 1382, loss: 0.3297921121120453, mean loss: 0.3750279597462858
Epoch: 8, step: 1383, loss: 0.35407742857933044, mean loss: 0.37502634019378367
Epoch: 8, step: 1384, loss: 0.3495931625366211, mean loss: 0.37502437426832513
Epoch: 8, step: 1385, loss: 0.3219843804836273, mean loss: 0.37502027471709737
Epoch: 8, step: 1386, loss: 0.3714334964752197, mean loss: 0.3750199975103394
Epoch: 8, step: 1387, loss: 0.31818798184394836, mean loss: 0.375015605546223
Epoch: 8, step: 1388, loss: 0.3004366457462311, mean loss: 0.3750098425480157
Epoch: 8, step: 1389, loss: 0.33686766028404236, mean loss: 0.3750068953851148
Epoch: 8, step: 1390, loss: 0.3317887783050537, mean loss: 0.37500355627385157
Epoch: 8, step: 1391, loss: 0.31942275166511536, mean loss: 0.37499926233035585
Epoch: 8, step: 1392, loss: 0.3317895829677582, mean loss: 0.3749959243867975
Epoch: 8, step: 1393, loss: 0.3455996811389923, mean loss: 0.3749936537052551
Epoch: 8, step: 1394, loss: 0.3416111171245575, mean loss: 0.37499107530588993
Epoch: 8, step: 1395, loss: 0.32490602135658264, mean loss: 0.37498720713675576
Epoch: 8, step: 1396, loss: 0.3565060496330261, mean loss: 0.37498577991013565
Epoch: 8, step: 1397, loss: 0.367593914270401, mean loss: 0.3749852091097002
Epoch: 8, step: 1398, loss: 0.4002436101436615, mean loss: 0.3749871594147758
Epoch: 8, step: 1399, loss: 0.3645137548446655, mean loss: 0.3749863507825514
Epoch: 8, step: 1400, loss: 0.37273353338241577, mean loss: 0.3749861768601087
Epoch: 8, step: 1401, loss: 0.36262962222099304, mean loss: 0.3749852229806399
Epoch: 8, step: 1402, loss: 0.3528376519680023, mean loss: 0.37498351340356445
Epoch: 8, step: 1403, loss: 0.3262026906013489, mean loss: 0.3749797482891154
Epoch: 8, step: 1404, loss: 0.37583500146865845, mean loss: 0.3749798142961525
Epoch: 8, step: 1405, loss: 0.3294041156768799, mean loss: 0.3749762971099649
Epoch: 8, step: 1406, loss: 0.31712475419044495, mean loss: 0.37497183291188485
Epoch: 8, step: 1407, loss: 0.3398834466934204, mean loss: 0.37496912547467665
Epoch: 8, step: 1408, loss: 0.34340736269950867, mean loss: 0.3749666903413709
Epoch: 8, step: 1409, loss: 0.32793158292770386, mean loss: 0.37496306164923904
Epoch: 8, step: 1410, loss: 0.33541083335876465, mean loss: 0.37496001048606
Epoch: 8, step: 1411, loss: 0.3501604199409485, mean loss: 0.374958097527826
Epoch: 8, step: 1412, loss: 0.37022408843040466, mean loss: 0.37495773239021724
Epoch: 8, step: 1413, loss: 0.33859187364578247, mean loss: 0.3749549276810745
Epoch: 8, step: 1414, loss: 0.34738031029701233, mean loss: 0.3749528011585648
Epoch: 8, step: 1415, loss: 0.3621298372745514, mean loss: 0.3749518123427193
Epoch: 8, step: 1416, loss: 0.3037496507167816, mean loss: 0.3749463221613926
Epoch: 8, step: 1417, loss: 0.4464881718158722, mean loss: 0.37495183810970834
Epoch: 8, step: 1418, loss: 0.32536935806274414, mean loss: 0.3749480155455231
Epoch: 8, step: 1419, loss: 0.3459964096546173, mean loss: 0.37494578369184667
Epoch: 8, step: 1420, loss: 0.3449166715145111, mean loss: 0.3749434689526054
Epoch: 8, step: 1421, loss: 0.34774988889694214, mean loss: 0.37494137294674323
Epoch: 8, step: 1422, loss: 0.3529819846153259, mean loss: 0.3749396805083362
Epoch: 8, step: 1423, loss: 0.38223597407341003, mean loss: 0.37494024279976385
Epoch: 8, step: 1424, loss: 0.30865105986595154, mean loss: 0.3749351345942515
Epoch: 8, step: 1425, loss: 0.3305148184299469, mean loss: 0.37493171185452545
Epoch: 8, step: 1426, loss: 0.35882776975631714, mean loss: 0.3749304710854294
Epoch: 8, step: 1427, loss: 0.30991342663764954, mean loss: 0.37492546206813754
Epoch: 8, step: 1428, loss: 0.37399962544441223, mean loss: 0.3749253907456952
Epoch: 8, step: 1429, loss: 0.35973453521728516, mean loss: 0.37492422059814257
Epoch: 8, step: 1430, loss: 0.3827153444290161, mean loss: 0.3749248207001091
Epoch: 8, step: 1431, loss: 0.37850573658943176, mean loss: 0.37492509649461686
Epoch: 8, step: 1432, loss: 0.34963321685791016, mean loss: 0.37492314871797944
Epoch: 8, step: 1433, loss: 0.31618422269821167, mean loss: 0.3749186254678624
Epoch: 8, step: 1434, loss: 0.36988240480422974, mean loss: 0.37491823767848353
Epoch: 8, step: 1435, loss: 0.32851356267929077, mean loss: 0.3749146647900481
Epoch: 8, step: 1436, loss: 0.30354994535446167, mean loss: 0.3749091705472707
Epoch: 8, step: 1437, loss: 0.3171009123325348, mean loss: 0.374904720334937
Epoch: 8, step: 1438, loss: 0.3487146198749542, mean loss: 0.37490270431611933
Epoch: 8, step: 1439, loss: 0.3345652222633362, mean loss: 0.3748995995222421
Epoch: 8, step: 1440, loss: 0.3398052453994751, mean loss: 0.3748968985021449
Epoch: 8, step: 1441, loss: 0.3503134250640869, mean loss: 0.37489500659253755
Epoch: 8, step: 1442, loss: 0.36354678869247437, mean loss: 0.3748941333168238
Epoch: 8, step: 1443, loss: 0.3104858100414276, mean loss: 0.37488917730549143
Valid: 8, mean loss: 0.20104682693878811
Epoch: 9, step: 0, loss: 0.3355470895767212, mean loss: 0.37488615029250927
Epoch: 9, step: 1, loss: 0.32416418194770813, mean loss: 0.37488224800228426
Epoch: 9, step: 2, loss: 0.3547595143318176, mean loss: 0.37488069998061563
Epoch: 9, step: 3, loss: 0.3357643485069275, mean loss: 0.3748776910305023
Epoch: 9, step: 4, loss: 0.36323803663253784, mean loss: 0.3748767957413401
Epoch: 9, step: 5, loss: 0.37939462065696716, mean loss: 0.37487714321287646
Epoch: 9, step: 6, loss: 0.3712237775325775, mean loss: 0.3748768622495849
Epoch: 9, step: 7, loss: 0.31824564933776855, mean loss: 0.3748725073424093
Epoch: 9, step: 8, loss: 0.39518406987190247, mean loss: 0.3748740691695934
Epoch: 9, step: 9, loss: 0.32506081461906433, mean loss: 0.3748702391484839
Epoch: 9, step: 10, loss: 0.3185398578643799, mean loss: 0.37486590837418665
Epoch: 9, step: 11, loss: 0.2961527407169342, mean loss: 0.37485985723891163
Epoch: 9, step: 12, loss: 0.3729223310947418, mean loss: 0.37485970830154947
Epoch: 9, step: 13, loss: 0.3254257142543793, mean loss: 0.37485590860946283
Epoch: 9, step: 14, loss: 0.3427915573120117, mean loss: 0.37485344420616584
Epoch: 9, step: 15, loss: 0.34057971835136414, mean loss: 0.3748508101971085
Epoch: 9, step: 16, loss: 0.35965603590011597, mean loss: 0.3748496425359775
Epoch: 9, step: 17, loss: 0.2972438633441925, mean loss: 0.37484367928262025
Epoch: 9, step: 18, loss: 0.3115267753601074, mean loss: 0.37483881436491584
Epoch: 9, step: 19, loss: 0.32804837822914124, mean loss: 0.37483521952501603
Epoch: 9, step: 20, loss: 0.310153603553772, mean loss: 0.3748302505140326
Epoch: 9, step: 21, loss: 0.3406819701194763, mean loss: 0.374827627355299
Epoch: 9, step: 22, loss: 0.3614223301410675, mean loss: 0.3748265976834952
Epoch: 9, step: 23, loss: 0.3295765519142151, mean loss: 0.3748231222575528
Epoch: 9, step: 24, loss: 0.31516018509864807, mean loss: 0.37481854020262934
Epoch: 9, step: 25, loss: 0.31784841418266296, mean loss: 0.3748141652889433
Epoch: 9, step: 26, loss: 0.34227725863456726, mean loss: 0.3748116668702491
Epoch: 9, step: 27, loss: 0.3723120391368866, mean loss: 0.37481147494551526
Epoch: 9, step: 28, loss: 0.31479957699775696, mean loss: 0.37480686750613346
Epoch: 9, step: 29, loss: 0.36813119053840637, mean loss: 0.3748063550174978
Epoch: 9, step: 30, loss: 0.3444170653820038, mean loss: 0.3748040222248644
Epoch: 9, step: 31, loss: 0.33169296383857727, mean loss: 0.3748007131169134
Epoch: 9, step: 32, loss: 0.2965557277202606, mean loss: 0.3747947076686521
Epoch: 9, step: 33, loss: 0.37304118275642395, mean loss: 0.3747945730926803
Epoch: 9, step: 34, loss: 0.36470702290534973, mean loss: 0.3747937989732584
Epoch: 9, step: 35, loss: 0.329291969537735, mean loss: 0.3747903074271077
Epoch: 9, step: 36, loss: 0.32464599609375, mean loss: 0.37478645993909016
Epoch: 9, step: 37, loss: 0.33276861906051636, mean loss: 0.3747832362287266
Epoch: 9, step: 38, loss: 0.34682783484458923, mean loss: 0.37478109158727024
Epoch: 9, step: 39, loss: 0.35506752133369446, mean loss: 0.3747795793465328
Epoch: 9, step: 40, loss: 0.3328515291213989, mean loss: 0.37477636326536184
Epoch: 9, step: 41, loss: 0.30538085103034973, mean loss: 0.3747710407072828
Epoch: 9, step: 42, loss: 0.3524130880832672, mean loss: 0.3747693260088685
Epoch: 9, step: 43, loss: 0.3284054696559906, mean loss: 0.374765770498412
Epoch: 9, step: 44, loss: 0.32376471161842346, mean loss: 0.3747618596741746
Epoch: 9, step: 45, loss: 0.36026573181152344, mean loss: 0.37476074817840227
Epoch: 9, step: 46, loss: 0.34117498993873596, mean loss: 0.3747581731758538
Epoch: 9, step: 47, loss: 0.36472880840301514, mean loss: 0.37475740428864335
Epoch: 9, step: 48, loss: 0.414964497089386, mean loss: 0.3747604864728366
Epoch: 9, step: 49, loss: 0.34715989232063293, mean loss: 0.374758370836308
Epoch: 9, step: 50, loss: 0.3370814919471741, mean loss: 0.374755483055294
Epoch: 9, step: 51, loss: 0.3326502740383148, mean loss: 0.37475225610794444
Epoch: 9, step: 52, loss: 0.34863051772117615, mean loss: 0.37475025428877157
Epoch: 9, step: 53, loss: 0.34288859367370605, mean loss: 0.37474781278221103
Epoch: 9, step: 54, loss: 0.333639919757843, mean loss: 0.3747446629934573
Epoch: 9, step: 55, loss: 0.3611776828765869, mean loss: 0.3747436235374263
Epoch: 9, step: 56, loss: 0.3803557753562927, mean loss: 0.3747440534885348
Epoch: 9, step: 57, loss: 0.3072633743286133, mean loss: 0.37473888413974055
Epoch: 9, step: 58, loss: 0.2960679829120636, mean loss: 0.374732858027046
Epoch: 9, step: 59, loss: 0.33202993869781494, mean loss: 0.3747295872764846
Epoch: 9, step: 60, loss: 0.3219952881336212, mean loss: 0.37472554850041484
Epoch: 9, step: 61, loss: 0.311871200799942, mean loss: 0.37472073502609254
Epoch: 9, step: 62, loss: 0.32231882214546204, mean loss: 0.3747167223212238
Epoch: 9, step: 63, loss: 0.3060902953147888, mean loss: 0.3747114676177777
Epoch: 9, step: 64, loss: 0.363113135099411, mean loss: 0.3747105796051815
Epoch: 9, step: 65, loss: 0.33243250846862793, mean loss: 0.37470734288254054
Epoch: 9, step: 66, loss: 0.3251974582672119, mean loss: 0.3747035527972144
Epoch: 9, step: 67, loss: 0.330745130777359, mean loss: 0.3747001879455595
Epoch: 9, step: 68, loss: 0.3353465497493744, mean loss: 0.37469717580333245
Epoch: 9, step: 69, loss: 0.3500082790851593, mean loss: 0.3746952862505452
Epoch: 9, step: 70, loss: 0.3783039152622223, mean loss: 0.37469556241408786
Epoch: 9, step: 71, loss: 0.3435156047344208, mean loss: 0.374693176436304
Epoch: 9, step: 72, loss: 0.3591914772987366, mean loss: 0.37469199029358935
Epoch: 9, step: 73, loss: 0.3162696659564972, mean loss: 0.374687520337634
Epoch: 9, step: 74, loss: 0.3835809528827667, mean loss: 0.3746882007318307
Epoch: 9, step: 75, loss: 0.3611268997192383, mean loss: 0.37468716330060264
Epoch: 9, step: 76, loss: 0.36527779698371887, mean loss: 0.3746864435448988
Epoch: 9, step: 77, loss: 0.3267238736152649, mean loss: 0.37468277499893504
Epoch: 9, step: 78, loss: 0.34075796604156494, mean loss: 0.3746801803672748
Epoch: 9, step: 79, loss: 0.32520347833633423, mean loss: 0.3746763965876762
Epoch: 9, step: 80, loss: 0.3883512318134308, mean loss: 0.3746774423042187
Epoch: 9, step: 81, loss: 0.3513040244579315, mean loss: 0.3746756550723907
Epoch: 9, step: 82, loss: 0.3539486229419708, mean loss: 0.37467407031574795
Epoch: 9, step: 83, loss: 0.34740516543388367, mean loss: 0.37467198553708725
Epoch: 9, step: 84, loss: 0.3350721001625061, mean loss: 0.37466895825435853
Epoch: 9, step: 85, loss: 0.36130058765411377, mean loss: 0.3746679363639289
Epoch: 9, step: 86, loss: 0.3556765615940094, mean loss: 0.3746664847568992
Epoch: 9, step: 87, loss: 0.32747742533683777, mean loss: 0.37466287813358673
Epoch: 9, step: 88, loss: 0.3242033123970032, mean loss: 0.37465902184273947
Epoch: 9, step: 89, loss: 0.34819909930229187, mean loss: 0.3746569998404056
Epoch: 9, step: 90, loss: 0.33250218629837036, mean loss: 0.37465377871917527
Epoch: 9, step: 91, loss: 0.39471426606178284, mean loss: 0.3746553114581226
Epoch: 9, step: 92, loss: 0.3342762291431427, mean loss: 0.37465222649499974
Epoch: 9, step: 93, loss: 0.350949227809906, mean loss: 0.3746504157235188
Epoch: 9, step: 94, loss: 0.3260790705680847, mean loss: 0.37464670543819645
Epoch: 9, step: 95, loss: 0.33156171441078186, mean loss: 0.3746434144978491
Epoch: 9, step: 96, loss: 0.32150083780288696, mean loss: 0.3746393556437519
Epoch: 9, step: 97, loss: 0.31619977951049805, mean loss: 0.37463489256324684
Epoch: 9, step: 98, loss: 0.3511491119861603, mean loss: 0.3746330990710302
Epoch: 9, step: 99, loss: 0.33084461092948914, mean loss: 0.3746297554173847
Epoch: 9, step: 100, loss: 0.32244011759757996, mean loss: 0.37462577056300433
Epoch: 9, step: 101, loss: 0.3072859048843384, mean loss: 0.3746206293303216
Epoch: 9, step: 102, loss: 0.3203229308128357, mean loss: 0.37461648415141346
Epoch: 9, step: 103, loss: 0.32562777400016785, mean loss: 0.3746127445552187
Epoch: 9, step: 104, loss: 0.35627269744873047, mean loss: 0.3746113446584851
Epoch: 9, step: 105, loss: 0.33033862709999084, mean loss: 0.3746079655776151
Epoch: 9, step: 106, loss: 0.3467605412006378, mean loss: 0.37460584030673233
Epoch: 9, step: 107, loss: 0.3623430132865906, mean loss: 0.37460490449880957
Epoch: 9, step: 108, loss: 0.34341734647750854, mean loss: 0.37460252467751837
Epoch: 9, step: 109, loss: 0.33383452892303467, mean loss: 0.37459941404149255
Epoch: 9, step: 110, loss: 0.37740710377693176, mean loss: 0.37459962825448834
Epoch: 9, step: 111, loss: 0.3682405948638916, mean loss: 0.37459914312835235
Epoch: 9, step: 112, loss: 0.3189021348953247, mean loss: 0.3745948943673307
Epoch: 9, step: 113, loss: 0.37576013803482056, mean loss: 0.37459498324938006
Epoch: 9, step: 114, loss: 0.3462081253528595, mean loss: 0.37459281813170053
Epoch: 9, step: 115, loss: 0.3271847069263458, mean loss: 0.3745892025039393
Epoch: 9, step: 116, loss: 0.37376561760902405, mean loss: 0.37458913969719065
Epoch: 9, step: 117, loss: 0.34356337785720825, mean loss: 0.37458677384681394
Epoch: 9, step: 118, loss: 0.3536294996738434, mean loss: 0.37458517588462004
Epoch: 9, step: 119, loss: 0.32106131315231323, mean loss: 0.3745810950777633
Epoch: 9, step: 120, loss: 0.30914637446403503, mean loss: 0.37457610653460455
Epoch: 9, step: 121, loss: 0.3441695272922516, mean loss: 0.3745737886066245
Epoch: 9, step: 122, loss: 0.3300730586051941, mean loss: 0.3745703965241486
Epoch: 9, step: 123, loss: 0.29999858140945435, mean loss: 0.37456471269677705
Epoch: 9, step: 124, loss: 0.37048542499542236, mean loss: 0.3745644017991548
Epoch: 9, step: 125, loss: 0.38246211409568787, mean loss: 0.3745650036671853
Epoch: 9, step: 126, loss: 0.3602619171142578, mean loss: 0.37456391374212605
Epoch: 9, step: 127, loss: 0.325999915599823, mean loss: 0.37456021334604694
Epoch: 9, step: 128, loss: 0.3311862051486969, mean loss: 0.3745569086597081
Epoch: 9, step: 129, loss: 0.31226444244384766, mean loss: 0.37455216292862353
Epoch: 9, step: 130, loss: 0.30956894159317017, mean loss: 0.37454721258038437
Epoch: 9, step: 131, loss: 0.35183826088905334, mean loss: 0.37454548276992644
Epoch: 9, step: 132, loss: 0.3242000639438629, mean loss: 0.37454164809715423
Epoch: 9, step: 133, loss: 0.3576996326446533, mean loss: 0.3745403653846293
Epoch: 9, step: 134, loss: 0.3376096785068512, mean loss: 0.3745375529037156
Epoch: 9, step: 135, loss: 0.38350608944892883, mean loss: 0.3745382358565442
Epoch: 9, step: 136, loss: 0.3182235658168793, mean loss: 0.3745339478286725
Epoch: 9, step: 137, loss: 0.3059973418712616, mean loss: 0.37452872957026245
Epoch: 9, step: 138, loss: 0.36327579617500305, mean loss: 0.37452787285664274
Epoch: 9, step: 139, loss: 0.3386983573436737, mean loss: 0.3745251452747675
Epoch: 9, step: 140, loss: 0.3435317575931549, mean loss: 0.3745227860308243
Epoch: 9, step: 141, loss: 0.31351199746131897, mean loss: 0.37451814218940477
Epoch: 9, step: 142, loss: 0.32080817222595215, mean loss: 0.37451405436156676
Epoch: 9, step: 143, loss: 0.33193454146385193, mean loss: 0.37451081391157454
Epoch: 9, step: 144, loss: 0.369890421628952, mean loss: 0.37451046231030505
Epoch: 9, step: 145, loss: 0.35605448484420776, mean loss: 0.3745090579595619
Epoch: 9, step: 146, loss: 0.322051078081131, mean loss: 0.3745050666349116
Epoch: 9, step: 147, loss: 0.32694777846336365, mean loss: 0.3745014484602181
Epoch: 9, step: 148, loss: 0.3563605546951294, mean loss: 0.3745000683998328
Epoch: 9, step: 149, loss: 0.37186726927757263, mean loss: 0.374499868126052
Epoch: 9, step: 150, loss: 0.3226308226585388, mean loss: 0.3744959228118763
Epoch: 9, step: 151, loss: 0.3963344991207123, mean loss: 0.3744975837927334
Epoch: 9, step: 152, loss: 0.33985817432403564, mean loss: 0.37449494941677564
Epoch: 9, step: 153, loss: 0.34157803654670715, mean loss: 0.37449244622948513
Epoch: 9, step: 154, loss: 0.35130026936531067, mean loss: 0.374490682699954
Epoch: 9, step: 155, loss: 0.3613148629665375, mean loss: 0.3744896808888429
Epoch: 9, step: 156, loss: 0.3771280348300934, mean loss: 0.3744898814783617
Epoch: 9, step: 157, loss: 0.3247392773628235, mean loss: 0.374486099312928
Epoch: 9, step: 158, loss: 0.35884466767311096, mean loss: 0.37448491030254105
Epoch: 9, step: 159, loss: 0.3656107187271118, mean loss: 0.3744842357668482
Epoch: 9, step: 160, loss: 0.34637171030044556, mean loss: 0.3744820990696173
Epoch: 9, step: 161, loss: 0.34219658374786377, mean loss: 0.3744796453900823
Epoch: 9, step: 162, loss: 0.32515081763267517, mean loss: 0.37447589671406156
Epoch: 9, step: 163, loss: 0.3261346220970154, mean loss: 0.3744722233649265
Epoch: 9, step: 164, loss: 0.3303321599960327, mean loss: 0.3744688695116199
Epoch: 9, step: 165, loss: 0.3465346097946167, mean loss: 0.37446674717005196
Epoch: 9, step: 166, loss: 0.3717292845249176, mean loss: 0.3744665392035819
Epoch: 9, step: 167, loss: 0.3635214567184448, mean loss: 0.37446570776310145
Epoch: 9, step: 168, loss: 0.33188241720199585, mean loss: 0.37446247317969383
Epoch: 9, step: 169, loss: 0.36304840445518494, mean loss: 0.37446160624450286
Epoch: 9, step: 170, loss: 0.3334992527961731, mean loss: 0.37445849525844316
Epoch: 9, step: 171, loss: 0.31849873065948486, mean loss: 0.3744542455800866
Epoch: 9, step: 172, loss: 0.34315717220306396, mean loss: 0.3744518690083365
Epoch: 9, step: 173, loss: 0.31330811977386475, mean loss: 0.37444722635463606
Epoch: 9, step: 174, loss: 0.30942100286483765, mean loss: 0.3744422892789782
Epoch: 9, step: 175, loss: 0.3511427938938141, mean loss: 0.3744405204135527
Epoch: 9, step: 176, loss: 0.34567341208457947, mean loss: 0.37443833662031434
Epoch: 9, step: 177, loss: 0.35109201073646545, mean loss: 0.3744365644686608
Epoch: 9, step: 178, loss: 0.38362908363342285, mean loss: 0.3744372621930756
Epoch: 9, step: 179, loss: 0.40494194626808167, mean loss: 0.37443957736339095
Epoch: 9, step: 180, loss: 0.367916077375412, mean loss: 0.3744390822962294
Epoch: 9, step: 181, loss: 0.3156073987483978, mean loss: 0.37443461790986216
Epoch: 9, step: 182, loss: 0.35297709703445435, mean loss: 0.3744329897498443
Epoch: 9, step: 183, loss: 0.3274560570716858, mean loss: 0.37442942549091573
Epoch: 9, step: 184, loss: 0.34744396805763245, mean loss: 0.3744273781912091
Epoch: 9, step: 185, loss: 0.33145207166671753, mean loss: 0.3744241180405093
Epoch: 9, step: 186, loss: 0.31765317916870117, mean loss: 0.37441981166571814
Epoch: 9, step: 187, loss: 0.32480043172836304, mean loss: 0.37441604805983697
Epoch: 9, step: 188, loss: 0.3328385055065155, mean loss: 0.37441289466260125
Epoch: 9, step: 189, loss: 0.33006030321121216, mean loss: 0.37440953105032676
Epoch: 9, step: 190, loss: 0.35565412044525146, mean loss: 0.3744081087851713
Epoch: 9, step: 191, loss: 0.34217503666877747, mean loss: 0.37440566466384007
Epoch: 9, step: 192, loss: 0.30944082140922546, mean loss: 0.37440073898006915
Epoch: 9, step: 193, loss: 0.3493497967720032, mean loss: 0.37439883974260074
Epoch: 9, step: 194, loss: 0.3322531580924988, mean loss: 0.3743956447094986
Epoch: 9, step: 195, loss: 0.3547188937664032, mean loss: 0.3743941531425684
Epoch: 9, step: 196, loss: 0.36045601963996887, mean loss: 0.3743930966631094
Epoch: 9, step: 197, loss: 0.33462244272232056, mean loss: 0.3743900823646449
Epoch: 9, step: 198, loss: 0.3523450493812561, mean loss: 0.3743884116535435
Epoch: 9, step: 199, loss: 0.3635205328464508, mean loss: 0.37438758807982364
Epoch: 9, step: 200, loss: 0.3459702134132385, mean loss: 0.3743854347590184
Epoch: 9, step: 201, loss: 0.33096885681152344, mean loss: 0.3743821451258962
Epoch: 9, step: 202, loss: 0.3343060612678528, mean loss: 0.37437910882891473
Epoch: 9, step: 203, loss: 0.3427758514881134, mean loss: 0.3743767146427526
Epoch: 9, step: 204, loss: 0.386902779340744, mean loss: 0.3743776635151636
Epoch: 9, step: 205, loss: 0.31826889514923096, mean loss: 0.37437341349483594
Epoch: 9, step: 206, loss: 0.3418653905391693, mean loss: 0.3743709513254081
Epoch: 9, step: 207, loss: 0.3133423328399658, mean loss: 0.3743663293458197
Epoch: 9, step: 208, loss: 0.3416139483451843, mean loss: 0.37436384904434294
Epoch: 9, step: 209, loss: 0.3248961269855499, mean loss: 0.37436010319230156
Epoch: 9, step: 210, loss: 0.3541029095649719, mean loss: 0.37435856936981143
Epoch: 9, step: 211, loss: 0.38902080059051514, mean loss: 0.3743596794721146
Epoch: 9, step: 212, loss: 0.34064391255378723, mean loss: 0.37435712698767837
Epoch: 9, step: 213, loss: 0.34164974093437195, mean loss: 0.37435465103112625
Epoch: 9, step: 214, loss: 0.3479950428009033, mean loss: 0.37435265575383986
Epoch: 9, step: 215, loss: 0.3463957607746124, mean loss: 0.37435053973090776
Epoch: 9, step: 216, loss: 0.32442450523376465, mean loss: 0.37434676117687027
Epoch: 9, step: 217, loss: 0.34354427456855774, mean loss: 0.37434443012748264
Epoch: 9, step: 218, loss: 0.36358845233917236, mean loss: 0.37434361620559176
Epoch: 9, step: 219, loss: 0.37424907088279724, mean loss: 0.37434360905173863
Epoch: 9, step: 220, loss: 0.3571023643016815, mean loss: 0.37434230457683887
Epoch: 9, step: 221, loss: 0.322691410779953, mean loss: 0.374338396958909
Epoch: 9, step: 222, loss: 0.3535250723361969, mean loss: 0.3743368224582189
Epoch: 9, step: 223, loss: 0.3488937020301819, mean loss: 0.3743348978651457
Epoch: 9, step: 224, loss: 0.37321391701698303, mean loss: 0.374334813077244
Epoch: 9, step: 225, loss: 0.32491356134414673, mean loss: 0.37433107527269605
Epoch: 9, step: 226, loss: 0.39890217781066895, mean loss: 0.374332933482069
Epoch: 9, step: 227, loss: 0.30506905913352966, mean loss: 0.37432769574202446
Epoch: 9, step: 228, loss: 0.33773887157440186, mean loss: 0.37432492910125564
Epoch: 9, step: 229, loss: 0.32942304015159607, mean loss: 0.37432153413006636
Epoch: 9, step: 230, loss: 0.37943875789642334, mean loss: 0.3743219210071939
Epoch: 9, step: 231, loss: 0.33427971601486206, mean loss: 0.374318893927893
Epoch: 9, step: 232, loss: 0.39915046095848083, mean loss: 0.3743207709833795
Epoch: 9, step: 233, loss: 0.32895898818969727, mean loss: 0.3743173422771971
Epoch: 9, step: 234, loss: 0.3370342254638672, mean loss: 0.3743145244163541
Epoch: 9, step: 235, loss: 0.3714641034603119, mean loss: 0.3743143089975999
Epoch: 9, step: 236, loss: 0.3378307521343231, mean loss: 0.3743115519843101
Epoch: 9, step: 237, loss: 0.3197980523109436, mean loss: 0.37430743278379075
Epoch: 9, step: 238, loss: 0.36391714215278625, mean loss: 0.37430664772216393
Epoch: 9, step: 239, loss: 0.36616888642311096, mean loss: 0.3743060329018784
Epoch: 9, step: 240, loss: 0.33616235852241516, mean loss: 0.37430315130677533
Epoch: 9, step: 241, loss: 0.3112918734550476, mean loss: 0.3742983914278018
Epoch: 9, step: 242, loss: 0.32215896248817444, mean loss: 0.37429445310701176
Epoch: 9, step: 243, loss: 0.3539220690727234, mean loss: 0.3742929144073113
Epoch: 9, step: 244, loss: 0.34834370017051697, mean loss: 0.37429095464488876
Epoch: 9, step: 245, loss: 0.32815027236938477, mean loss: 0.3742874702254449
Epoch: 9, step: 246, loss: 0.307759165763855, mean loss: 0.3742824465673265
Epoch: 9, step: 247, loss: 0.35793161392211914, mean loss: 0.3742812119831642
Epoch: 9, step: 248, loss: 0.4144528806209564, mean loss: 0.3742842449517288
Epoch: 9, step: 249, loss: 0.3619142472743988, mean loss: 0.3742833110850764
Epoch: 9, step: 250, loss: 0.3478495478630066, mean loss: 0.37428131563227784
Epoch: 9, step: 251, loss: 0.3450171649456024, mean loss: 0.37427910668370545
Epoch: 9, step: 252, loss: 0.328084796667099, mean loss: 0.3742756200575437
Epoch: 9, step: 253, loss: 0.3315194249153137, mean loss: 0.37427239317489147
Epoch: 9, step: 254, loss: 0.3478242754936218, mean loss: 0.37427039724117467
Epoch: 9, step: 255, loss: 0.3669207990169525, mean loss: 0.3742698426382299
Epoch: 9, step: 256, loss: 0.39135023951530457, mean loss: 0.37427113143298407
Epoch: 9, step: 257, loss: 0.36667752265930176, mean loss: 0.37427055850339497
Epoch: 9, step: 258, loss: 0.32455509901046753, mean loss: 0.3742668078086011
Epoch: 9, step: 259, loss: 0.29825857281684875, mean loss: 0.37426107393450697
Epoch: 9, step: 260, loss: 0.3719121813774109, mean loss: 0.37426089675320223
Epoch: 9, step: 261, loss: 0.32697975635528564, mean loss: 0.374257330518446
Epoch: 9, step: 262, loss: 0.36340758204460144, mean loss: 0.37425651222532635
Epoch: 9, step: 263, loss: 0.3297101557254791, mean loss: 0.3742531527715933
Epoch: 9, step: 264, loss: 0.3003219664096832, mean loss: 0.37424757768778655
Epoch: 9, step: 265, loss: 0.33733221888542175, mean loss: 0.37424479414391665
Epoch: 9, step: 266, loss: 0.33943507075309753, mean loss: 0.3742421695700351
Epoch: 9, step: 267, loss: 0.3296782970428467, mean loss: 0.37423880980883734
Epoch: 9, step: 268, loss: 0.3579927980899811, mean loss: 0.37423758508122945
Epoch: 9, step: 269, loss: 0.3296699523925781, mean loss: 0.3742342255431103
Epoch: 9, step: 270, loss: 0.3477582037448883, mean loss: 0.3742322299132167
Epoch: 9, step: 271, loss: 0.3444800078868866, mean loss: 0.374229987508783
Epoch: 9, step: 272, loss: 0.3670656681060791, mean loss: 0.3742294475796698
Epoch: 9, step: 273, loss: 0.3813698887825012, mean loss: 0.3742299856686828
Epoch: 9, step: 274, loss: 0.3802018165588379, mean loss: 0.3742304356597076
Epoch: 9, step: 275, loss: 0.3373357355594635, mean loss: 0.37422765576970607
Epoch: 9, step: 276, loss: 0.3376905620098114, mean loss: 0.37422490303153383
Epoch: 9, step: 277, loss: 0.3547925651073456, mean loss: 0.37422343909165706
Epoch: 9, step: 278, loss: 0.3273286819458008, mean loss: 0.3742199065299135
Epoch: 9, step: 279, loss: 0.30884119868278503, mean loss: 0.3742149819511362
Epoch: 9, step: 280, loss: 0.3532117009162903, mean loss: 0.3742134000214055
Epoch: 9, step: 281, loss: 0.32122567296028137, mean loss: 0.37420940938071706
Epoch: 9, step: 282, loss: 0.3429669439792633, mean loss: 0.3742070566082642
Epoch: 9, step: 283, loss: 0.3209547698497772, mean loss: 0.3742030466469119
Epoch: 9, step: 284, loss: 0.32936644554138184, mean loss: 0.3741996706510452
Epoch: 9, step: 285, loss: 0.3232889175415039, mean loss: 0.37419583758726643
Epoch: 9, step: 286, loss: 0.33013036847114563, mean loss: 0.3741925201537713
Epoch: 9, step: 287, loss: 0.33583134412765503, mean loss: 0.3741896323808094
Epoch: 9, step: 288, loss: 0.356030136346817, mean loss: 0.3741882654635317
Epoch: 9, step: 289, loss: 0.35537102818489075, mean loss: 0.37418684914279715
Epoch: 9, step: 290, loss: 0.32075029611587524, mean loss: 0.37418282742585374
Epoch: 9, step: 291, loss: 0.39149734377861023, mean loss: 0.3741841304448448
Epoch: 9, step: 292, loss: 0.3524908423423767, mean loss: 0.3741824980204259
Epoch: 9, step: 293, loss: 0.3297796845436096, mean loss: 0.37417915695093934
Epoch: 9, step: 294, loss: 0.37909597158432007, mean loss: 0.3741795268865825
Epoch: 9, step: 295, loss: 0.36103349924087524, mean loss: 0.3741785378685532
Epoch: 9, step: 296, loss: 0.33627909421920776, mean loss: 0.374175686785754
Epoch: 9, step: 297, loss: 0.35172396898269653, mean loss: 0.3741739979247789
Epoch: 9, step: 298, loss: 0.34458407759666443, mean loss: 0.3741717722820314
Epoch: 9, step: 299, loss: 0.3181302547454834, mean loss: 0.3741675573664526
Epoch: 9, step: 300, loss: 0.32114121317863464, mean loss: 0.37416356952376717
Epoch: 9, step: 301, loss: 0.33515968918800354, mean loss: 0.3741606364601233
Epoch: 9, step: 302, loss: 0.3843122124671936, mean loss: 0.37416139979390833
Epoch: 9, step: 303, loss: 0.3521411418914795, mean loss: 0.3741597441354194
Epoch: 9, step: 304, loss: 0.34074074029922485, mean loss: 0.3741572316172752
Epoch: 9, step: 305, loss: 0.3304915726184845, mean loss: 0.3741539489786495
Epoch: 9, step: 306, loss: 0.3378768563270569, mean loss: 0.37415122199280787
Epoch: 9, step: 307, loss: 0.3558703064918518, mean loss: 0.37414984790114364
Epoch: 9, step: 308, loss: 0.33892887830734253, mean loss: 0.37414720070312835
Epoch: 9, step: 309, loss: 0.3326173722743988, mean loss: 0.3741440795676685
Epoch: 9, step: 310, loss: 0.34524914622306824, mean loss: 0.3741419081591358
Epoch: 9, step: 311, loss: 0.3056553900241852, mean loss: 0.37413676189236883
Epoch: 9, step: 312, loss: 0.32836779952049255, mean loss: 0.3741333229441104
Epoch: 9, step: 313, loss: 0.3176402151584625, mean loss: 0.37412907853330757
Epoch: 9, step: 314, loss: 0.3413441479206085, mean loss: 0.3741266155379945
Epoch: 9, step: 315, loss: 0.3542931377887726, mean loss: 0.37412512564333184
Epoch: 9, step: 316, loss: 0.36836251616477966, mean loss: 0.3741246927875158
Epoch: 9, step: 317, loss: 0.3360358774662018, mean loss: 0.3741218319781932
Epoch: 9, step: 318, loss: 0.32334426045417786, mean loss: 0.37411801841668185
Epoch: 9, step: 319, loss: 0.31743893027305603, mean loss: 0.37411376195166657
Epoch: 9, step: 320, loss: 0.3158268630504608, mean loss: 0.3741093850725721
Epoch: 9, step: 321, loss: 0.3537534177303314, mean loss: 0.37410785661729784
Epoch: 9, step: 322, loss: 0.3282831609249115, mean loss: 0.37410441606652883
Epoch: 9, step: 323, loss: 0.29771488904953003, mean loss: 0.3740986811170531
Epoch: 9, step: 324, loss: 0.3708975911140442, mean loss: 0.3740984408130216
Epoch: 9, step: 325, loss: 0.321602463722229, mean loss: 0.37409450026527424
Epoch: 9, step: 326, loss: 0.34577980637550354, mean loss: 0.37409237501616444
Epoch: 9, step: 327, loss: 0.3258158564567566, mean loss: 0.37408875174097983
Epoch: 9, step: 328, loss: 0.3262695074081421, mean loss: 0.37408516305472594
Epoch: 9, step: 329, loss: 0.34893345832824707, mean loss: 0.3740832756387927
Epoch: 9, step: 330, loss: 0.3123202323913574, mean loss: 0.37407864120919504
Epoch: 9, step: 331, loss: 0.3983322083950043, mean loss: 0.37408046095463215
Epoch: 9, step: 332, loss: 0.34063720703125, mean loss: 0.3740779518951436
Epoch: 9, step: 333, loss: 0.31557697057724, mean loss: 0.37407356322437707
Epoch: 9, step: 334, loss: 0.3298110365867615, mean loss: 0.3740702429538319
Epoch: 9, step: 335, loss: 0.3518217206001282, mean loss: 0.3740685741477748
Epoch: 9, step: 336, loss: 0.3885175287723541, mean loss: 0.37406965784646407
Epoch: 9, step: 337, loss: 0.3302997052669525, mean loss: 0.3740663752641497
Epoch: 9, step: 338, loss: 0.33796122670173645, mean loss: 0.374063667716451
Epoch: 9, step: 339, loss: 0.3440822660923004, mean loss: 0.3740614195609603
Epoch: 9, step: 340, loss: 0.32917141914367676, mean loss: 0.3740580537365307
Epoch: 9, step: 341, loss: 0.36530056595802307, mean loss: 0.37405739715475095
Epoch: 9, step: 342, loss: 0.3391377031803131, mean loss: 0.37405477929029524
Epoch: 9, step: 343, loss: 0.32679483294487, mean loss: 0.3740512365656816
Epoch: 9, step: 344, loss: 0.3221336305141449, mean loss: 0.3740473449828879
Epoch: 9, step: 345, loss: 0.37063583731651306, mean loss: 0.3740470892860159
Epoch: 9, step: 346, loss: 0.31847864389419556, mean loss: 0.37404292467195666
Epoch: 9, step: 347, loss: 0.3396924138069153, mean loss: 0.3740403504430249
Epoch: 9, step: 348, loss: 0.3474828898906708, mean loss: 0.3740383603747932
Epoch: 9, step: 349, loss: 0.3255299925804138, mean loss: 0.37403472570014956
Epoch: 9, step: 350, loss: 0.36115390062332153, mean loss: 0.3740337606274683
Epoch: 9, step: 351, loss: 0.3206441104412079, mean loss: 0.3740297608035107
Epoch: 9, step: 352, loss: 0.30986976623535156, mean loss: 0.37402495445138184
Epoch: 9, step: 353, loss: 0.3525916635990143, mean loss: 0.37402334896143036
Epoch: 9, step: 354, loss: 0.36143991351127625, mean loss: 0.3740224064525958
Epoch: 9, step: 355, loss: 0.328645795583725, mean loss: 0.37401900796466375
Epoch: 9, step: 356, loss: 0.40540820360183716, mean loss: 0.3740213586870211
Epoch: 9, step: 357, loss: 0.37019503116607666, mean loss: 0.3740210721565792
Epoch: 9, step: 358, loss: 0.33577290177345276, mean loss: 0.37401820819773357
Epoch: 9, step: 359, loss: 0.3092648684978485, mean loss: 0.3740133599392954
Epoch: 9, step: 360, loss: 0.3435285985469818, mean loss: 0.3740110776332842
Epoch: 9, step: 361, loss: 0.3388441503047943, mean loss: 0.37400844498413544
Epoch: 9, step: 362, loss: 0.3210473954677582, mean loss: 0.3740044805369825
Epoch: 9, step: 363, loss: 0.3400358259677887, mean loss: 0.37400193797301773
Epoch: 9, step: 364, loss: 0.3289821743965149, mean loss: 0.37399856848244245
Epoch: 9, step: 365, loss: 0.37978431582450867, mean loss: 0.3739990014825429
Epoch: 9, step: 366, loss: 0.33648645877838135, mean loss: 0.37399619428784825
Epoch: 9, step: 367, loss: 0.30242621898651123, mean loss: 0.37399083885719114
Epoch: 9, step: 368, loss: 0.3521420657634735, mean loss: 0.37398920408180064
Epoch: 9, step: 369, loss: 0.33086225390434265, mean loss: 0.3739859774657467
Epoch: 9, step: 370, loss: 0.33806535601615906, mean loss: 0.3739832902044727
Epoch: 9, step: 371, loss: 0.33741524815559387, mean loss: 0.3739805547135953
Epoch: 9, step: 372, loss: 0.3081154525279999, mean loss: 0.3739756280098639
Epoch: 9, step: 373, loss: 0.3225992023944855, mean loss: 0.37397178534527037
Epoch: 9, step: 374, loss: 0.3445158898830414, mean loss: 0.37396958237649747
Epoch: 9, step: 375, loss: 0.4167390763759613, mean loss: 0.37397278081308133
Epoch: 9, step: 376, loss: 0.35276827216148376, mean loss: 0.3739711951921547
Epoch: 9, step: 377, loss: 0.38846108317375183, mean loss: 0.3739722786292701
Epoch: 9, step: 378, loss: 0.3469385802745819, mean loss: 0.3739702574181782
Epoch: 9, step: 379, loss: 0.3565892279148102, mean loss: 0.37396895799910645
Epoch: 9, step: 380, loss: 0.3118140995502472, mean loss: 0.37396431160167437
Epoch: 9, step: 381, loss: 0.3639872372150421, mean loss: 0.37396356581946577
Epoch: 9, step: 382, loss: 0.34753644466400146, mean loss: 0.37396159055067474
Epoch: 9, step: 383, loss: 0.34604528546333313, mean loss: 0.37395950413026463
Epoch: 9, step: 384, loss: 0.33953359723091125, mean loss: 0.3739569313848122
Epoch: 9, step: 385, loss: 0.34024083614349365, mean loss: 0.37395441187388395
Epoch: 9, step: 386, loss: 0.31952381134033203, mean loss: 0.3739503447289588
Epoch: 9, step: 387, loss: 0.37566182017326355, mean loss: 0.37395047260369313
Epoch: 9, step: 388, loss: 0.3087867796421051, mean loss: 0.37394560419181705
Epoch: 9, step: 389, loss: 0.3789396584033966, mean loss: 0.37394597727221535
Epoch: 9, step: 390, loss: 0.3562834560871124, mean loss: 0.3739446578936253
Epoch: 9, step: 391, loss: 0.3411646783351898, mean loss: 0.37394220943384354
Epoch: 9, step: 392, loss: 0.312602698802948, mean loss: 0.37393762809762493
Epoch: 9, step: 393, loss: 0.36416932940483093, mean loss: 0.3739368985756912
Epoch: 9, step: 394, loss: 0.37998613715171814, mean loss: 0.3739373503148127
Epoch: 9, step: 395, loss: 0.36610570549964905, mean loss: 0.3739367655145726
Epoch: 9, step: 396, loss: 0.35287362337112427, mean loss: 0.37393519281673465
Epoch: 9, step: 397, loss: 0.31377139687538147, mean loss: 0.37393070096994196
Epoch: 9, step: 398, loss: 0.3480750322341919, mean loss: 0.37392877072218267
Epoch: 9, step: 399, loss: 0.36741867661476135, mean loss: 0.37392828474919765
Epoch: 9, step: 400, loss: 0.3419297933578491, mean loss: 0.3739258962673441
Epoch: 9, step: 401, loss: 0.339876651763916, mean loss: 0.37392335489963974
Epoch: 9, step: 402, loss: 0.34094998240470886, mean loss: 0.3739208940165518
Epoch: 9, step: 403, loss: 0.34279265999794006, mean loss: 0.3739185710140131
Epoch: 9, step: 404, loss: 0.37152427434921265, mean loss: 0.3739183923484908
Epoch: 9, step: 405, loss: 0.3649093806743622, mean loss: 0.3739177201345172
Epoch: 9, step: 406, loss: 0.3453141152858734, mean loss: 0.3739155860149284
Epoch: 9, step: 407, loss: 0.3769041895866394, mean loss: 0.3739158089784894
Epoch: 9, step: 408, loss: 0.3289662301540375, mean loss: 0.37391245578350063
Epoch: 9, step: 409, loss: 0.31295710802078247, mean loss: 0.3739079089128634
Epoch: 9, step: 410, loss: 0.3300672173500061, mean loss: 0.3739046389276644
Epoch: 9, step: 411, loss: 0.34720274806022644, mean loss: 0.3739026474381904
Epoch: 9, step: 412, loss: 0.3123585283756256, mean loss: 0.37389805767616024
Epoch: 9, step: 413, loss: 0.33630096912384033, mean loss: 0.3738952540155672
Epoch: 9, step: 414, loss: 0.33646130561828613, mean loss: 0.37389246272868354
Epoch: 9, step: 415, loss: 0.36742016673088074, mean loss: 0.37389198015367625
Epoch: 9, step: 416, loss: 0.33040735125541687, mean loss: 0.3738887381773176
Epoch: 9, step: 417, loss: 0.31180503964424133, mean loss: 0.37388410990099935
Epoch: 9, step: 418, loss: 0.3207413852214813, mean loss: 0.37388014846047163
Epoch: 9, step: 419, loss: 0.33754193782806396, mean loss: 0.3738774398878246
Epoch: 9, step: 420, loss: 0.36154818534851074, mean loss: 0.37387652096000623
Epoch: 9, step: 421, loss: 0.3998837172985077, mean loss: 0.3738784591919587
Epoch: 9, step: 422, loss: 0.3129315674304962, mean loss: 0.37387391735637027
Epoch: 9, step: 423, loss: 0.3232448995113373, mean loss: 0.37387014470228347
Epoch: 9, step: 424, loss: 0.3084878623485565, mean loss: 0.3738652730621409
Epoch: 9, step: 425, loss: 0.32800859212875366, mean loss: 0.37386185653100296
Epoch: 9, step: 426, loss: 0.3427652418613434, mean loss: 0.37385953986448506
Epoch: 9, step: 427, loss: 0.3409065306186676, mean loss: 0.37385708508131715
Epoch: 9, step: 428, loss: 0.3535020649433136, mean loss: 0.3738555688786998
Epoch: 9, step: 429, loss: 0.3252905011177063, mean loss: 0.37385195163843754
Epoch: 9, step: 430, loss: 0.29527682065963745, mean loss: 0.3738460996140852
Epoch: 9, step: 431, loss: 0.3765871226787567, mean loss: 0.37384630374151034
Epoch: 9, step: 432, loss: 0.3354388177394867, mean loss: 0.37384344370085193
Epoch: 9, step: 433, loss: 0.29209113121032715, mean loss: 0.3738373564102718
Epoch: 9, step: 434, loss: 0.2909424602985382, mean loss: 0.3738311845022894
Epoch: 9, step: 435, loss: 0.3694247603416443, mean loss: 0.3738308564480785
Epoch: 9, step: 436, loss: 0.3611472249031067, mean loss: 0.373829912233715
Epoch: 9, step: 437, loss: 0.3432333767414093, mean loss: 0.37382763468901553
Epoch: 9, step: 438, loss: 0.3259507119655609, mean loss: 0.3738240710922367
Epoch: 9, step: 439, loss: 0.3324436545372009, mean loss: 0.3738209912755833
Epoch: 9, step: 440, loss: 0.3438422977924347, mean loss: 0.373818760220029
Epoch: 9, step: 441, loss: 0.31117144227027893, mean loss: 0.37381409826751005
Epoch: 9, step: 442, loss: 0.3733118772506714, mean loss: 0.37381406089709435
Epoch: 9, step: 443, loss: 0.3373810648918152, mean loss: 0.3738113501087011
Epoch: 9, step: 444, loss: 0.3708522915840149, mean loss: 0.3738111299570364
Epoch: 9, step: 445, loss: 0.40818315744400024, mean loss: 0.3738136870190426
Epoch: 9, step: 446, loss: 0.34391021728515625, mean loss: 0.37381146255502906
Epoch: 9, step: 447, loss: 0.330890029668808, mean loss: 0.37380826994621574
Epoch: 9, step: 448, loss: 0.35777607560157776, mean loss: 0.37380707751822434
Epoch: 9, step: 449, loss: 0.31737130880355835, mean loss: 0.37380288030204745
Epoch: 9, step: 450, loss: 0.33904317021369934, mean loss: 0.3738002953604182
Epoch: 9, step: 451, loss: 0.34010934829711914, mean loss: 0.3737977900847591
Epoch: 9, step: 452, loss: 0.3405921161174774, mean loss: 0.3737953210778465
Epoch: 9, step: 453, loss: 0.3347943127155304, mean loss: 0.37379242137462254
Epoch: 9, step: 454, loss: 0.3324693441390991, mean loss: 0.37378934925528307
Epoch: 9, step: 455, loss: 0.35709843039512634, mean loss: 0.373788108479275
Epoch: 9, step: 456, loss: 0.3208073675632477, mean loss: 0.37378417026914224
Epoch: 9, step: 457, loss: 0.3454066216945648, mean loss: 0.37378206104150924
Epoch: 9, step: 458, loss: 0.34087273478507996, mean loss: 0.37377961516070235
Epoch: 9, step: 459, loss: 0.3190426230430603, mean loss: 0.37377554731051527
Epoch: 9, step: 460, loss: 0.32317519187927246, mean loss: 0.3737717871592608
Epoch: 9, step: 461, loss: 0.3205139935016632, mean loss: 0.3737678298258043
Epoch: 9, step: 462, loss: 0.354910284280777, mean loss: 0.3737664287153544
Epoch: 9, step: 463, loss: 0.30332833528518677, mean loss: 0.37376119557319765
Epoch: 9, step: 464, loss: 0.36525341868400574, mean loss: 0.3737605635416332
Epoch: 9, step: 465, loss: 0.34610849618911743, mean loss: 0.3737585094584841
Epoch: 9, step: 466, loss: 0.34935057163238525, mean loss: 0.37375669649422455
Epoch: 9, step: 467, loss: 0.3965356945991516, mean loss: 0.3737583883390036
Epoch: 9, step: 468, loss: 0.3161148130893707, mean loss: 0.37375410734566905
Epoch: 9, step: 469, loss: 0.34568551182746887, mean loss: 0.3737520229408333
Epoch: 9, step: 470, loss: 0.341203510761261, mean loss: 0.3737496060319316
Epoch: 9, step: 471, loss: 0.3509413003921509, mean loss: 0.37374791251354433
Epoch: 9, step: 472, loss: 0.3121020197868347, mean loss: 0.3737433356412653
Epoch: 9, step: 473, loss: 0.3189348578453064, mean loss: 0.373739266711956
Epoch: 9, step: 474, loss: 0.29113948345184326, mean loss: 0.3737331350377477
Epoch: 9, step: 475, loss: 0.3505871593952179, mean loss: 0.373731416957608
Epoch: 9, step: 476, loss: 0.3184666931629181, mean loss: 0.37372731507058987
Epoch: 9, step: 477, loss: 0.36401692032814026, mean loss: 0.3737265943941209
Epoch: 9, step: 478, loss: 0.3356688320636749, mean loss: 0.3737237700703858
Epoch: 9, step: 479, loss: 0.3252023160457611, mean loss: 0.3737201694875701
Epoch: 9, step: 480, loss: 0.3373136818408966, mean loss: 0.3737174681083576
Epoch: 9, step: 481, loss: 0.34398189187049866, mean loss: 0.37371526187774196
Epoch: 9, step: 482, loss: 0.3530452847480774, mean loss: 0.3737137283828885
Epoch: 9, step: 483, loss: 0.39100393652915955, mean loss: 0.3737150110392792
Epoch: 9, step: 484, loss: 0.350947767496109, mean loss: 0.37371332219990944
Epoch: 9, step: 485, loss: 0.3743641972541809, mean loss: 0.3737133704772462
Epoch: 9, step: 486, loss: 0.3633539378643036, mean loss: 0.3737126021443371
Epoch: 9, step: 487, loss: 0.3023642301559448, mean loss: 0.3737073108085326
Epoch: 9, step: 488, loss: 0.33110302686691284, mean loss: 0.3737041514252221
Epoch: 9, step: 489, loss: 0.3435479402542114, mean loss: 0.3737019153128707
Epoch: 9, step: 490, loss: 0.31444329023361206, mean loss: 0.37369752155406005
Epoch: 9, step: 491, loss: 0.3520165979862213, mean loss: 0.3736959141309011
Epoch: 9, step: 492, loss: 0.33995184302330017, mean loss: 0.37369341253173827
Epoch: 9, step: 493, loss: 0.31396177411079407, mean loss: 0.3736889846860436
Epoch: 9, step: 494, loss: 0.349745512008667, mean loss: 0.37368720991229243
Epoch: 9, step: 495, loss: 0.35675060749053955, mean loss: 0.37368595460526444
Epoch: 9, step: 496, loss: 0.30677342414855957, mean loss: 0.373680995550165
Epoch: 9, step: 497, loss: 0.365928590297699, mean loss: 0.37368042104258736
Epoch: 9, step: 498, loss: 0.330909788608551, mean loss: 0.37367725167375193
Epoch: 9, step: 499, loss: 0.3329610228538513, mean loss: 0.3736742347629028
Epoch: 9, step: 500, loss: 0.35443854331970215, mean loss: 0.3736728095801627
Epoch: 9, step: 501, loss: 0.3619113266468048, mean loss: 0.37367193823011574
Epoch: 9, step: 502, loss: 0.3582785129547119, mean loss: 0.37367079789192215
Epoch: 9, step: 503, loss: 0.35432329773902893, mean loss: 0.37366936474376267
Epoch: 9, step: 504, loss: 0.3297552466392517, mean loss: 0.37366611208706285
Epoch: 9, step: 505, loss: 0.3277330696582794, mean loss: 0.3736627101434672
Epoch: 9, step: 506, loss: 0.3591878414154053, mean loss: 0.37366163816918535
Epoch: 9, step: 507, loss: 0.34510377049446106, mean loss: 0.37365952339817865
Epoch: 9, step: 508, loss: 0.3711033761501312, mean loss: 0.37365933412403957
Epoch: 9, step: 509, loss: 0.28397035598754883, mean loss: 0.3736526934474413
Epoch: 9, step: 510, loss: 0.356697142124176, mean loss: 0.37365143813158114
Epoch: 9, step: 511, loss: 0.41852301359176636, mean loss: 0.37365475998348074
Epoch: 9, step: 512, loss: 0.3069116771221161, mean loss: 0.3736498193451758
Epoch: 9, step: 513, loss: 0.38383615016937256, mean loss: 0.3736505733296928
Epoch: 9, step: 514, loss: 0.33699506521224976, mean loss: 0.3736478603174718
Epoch: 9, step: 515, loss: 0.32222649455070496, mean loss: 0.3736440547101771
Epoch: 9, step: 516, loss: 0.3410639762878418, mean loss: 0.37364164369275515
Epoch: 9, step: 517, loss: 0.29214656352996826, mean loss: 0.3736356132739182
Epoch: 9, step: 518, loss: 0.365315705537796, mean loss: 0.3736349976684623
Epoch: 9, step: 519, loss: 0.3901293873786926, mean loss: 0.3736362180287546
Epoch: 9, step: 520, loss: 0.3328235149383545, mean loss: 0.37363319866772104
Epoch: 9, step: 521, loss: 0.37348437309265137, mean loss: 0.3736331876582836
Epoch: 9, step: 522, loss: 0.3299793601036072, mean loss: 0.3736299585860479
Epoch: 9, step: 523, loss: 0.3222576379776001, mean loss: 0.3736261588581923
Epoch: 9, step: 524, loss: 0.33414414525032043, mean loss: 0.37362323880689374
Epoch: 9, step: 525, loss: 0.31714925169944763, mean loss: 0.3736190623546598
Epoch: 9, step: 526, loss: 0.3096924126148224, mean loss: 0.37361433510111103
Epoch: 9, step: 527, loss: 0.3197847008705139, mean loss: 0.37361035479689403
Epoch: 9, step: 528, loss: 0.3417200744152069, mean loss: 0.37360799692034086
Epoch: 9, step: 529, loss: 0.31286466121673584, mean loss: 0.3736035060630509
Epoch: 9, step: 530, loss: 0.3472336530685425, mean loss: 0.3736015566394541
Epoch: 9, step: 531, loss: 0.3269388675689697, mean loss: 0.37359810729815673
Epoch: 9, step: 532, loss: 0.3912714421749115, mean loss: 0.37359941362788374
Epoch: 9, step: 533, loss: 0.29941120743751526, mean loss: 0.37359393039017563
Epoch: 9, step: 534, loss: 0.305539071559906, mean loss: 0.3735889008388616
Epoch: 9, step: 535, loss: 0.33611810207366943, mean loss: 0.3735861317878148
Epoch: 9, step: 536, loss: 0.3449224531650543, mean loss: 0.3735840137298363
Epoch: 9, step: 537, loss: 0.3403048515319824, mean loss: 0.37358155479957195
Epoch: 9, step: 538, loss: 0.3114122748374939, mean loss: 0.3735769615760801
Epoch: 9, step: 539, loss: 0.38209834694862366, mean loss: 0.3735775911110515
Epoch: 9, step: 540, loss: 0.34394124150276184, mean loss: 0.3735754018261576
Epoch: 9, step: 541, loss: 0.3905574381351471, mean loss: 0.3735766562238758
Epoch: 9, step: 542, loss: 0.3082108795642853, mean loss: 0.37357182826193924
Epoch: 9, step: 543, loss: 0.3197483420372009, mean loss: 0.37356785311524615
Epoch: 9, step: 544, loss: 0.3321308195590973, mean loss: 0.3735647929990394
Epoch: 9, step: 545, loss: 0.330001562833786, mean loss: 0.37356157610122775
Epoch: 9, step: 546, loss: 0.3326365351676941, mean loss: 0.3735585542418957
Epoch: 9, step: 547, loss: 0.34199702739715576, mean loss: 0.37355622394605664
Epoch: 9, step: 548, loss: 0.38206616044044495, mean loss: 0.3735568522174848
Epoch: 9, step: 549, loss: 0.3188430070877075, mean loss: 0.3735528131029765
Epoch: 9, step: 550, loss: 0.35496455430984497, mean loss: 0.37355144097196646
Epoch: 9, step: 551, loss: 0.3429329991340637, mean loss: 0.3735491809747833
Epoch: 9, step: 552, loss: 0.3343868553638458, mean loss: 0.37354629055293587
Epoch: 9, step: 553, loss: 0.36402490735054016, mean loss: 0.37354558786782865
Epoch: 9, step: 554, loss: 0.3566068410873413, mean loss: 0.37354433786806623
Epoch: 9, step: 555, loss: 0.32640305161476135, mean loss: 0.373540859319789
Epoch: 9, step: 556, loss: 0.3110129237174988, mean loss: 0.3735362457334537
Epoch: 9, step: 557, loss: 0.34837061166763306, mean loss: 0.37353438903918884
Epoch: 9, step: 558, loss: 0.4014360010623932, mean loss: 0.37353644743919057
Epoch: 9, step: 559, loss: 0.36464381217956543, mean loss: 0.37353579144662197
Epoch: 9, step: 560, loss: 0.37940213084220886, mean loss: 0.3735362241632551
Epoch: 9, step: 561, loss: 0.32706886529922485, mean loss: 0.37353279686137697
Epoch: 9, step: 562, loss: 0.38708630204200745, mean loss: 0.3735337964561244
Epoch: 9, step: 563, loss: 0.3319850265979767, mean loss: 0.3735307323875508
Epoch: 9, step: 564, loss: 0.3610844314098358, mean loss: 0.3735298145864316
Epoch: 9, step: 565, loss: 0.3576453924179077, mean loss: 0.3735286433416175
Epoch: 9, step: 566, loss: 0.3254425525665283, mean loss: 0.3735250979541092
Epoch: 9, step: 567, loss: 0.3831990361213684, mean loss: 0.37352581116099265
Epoch: 9, step: 568, loss: 0.35403957962989807, mean loss: 0.37352437465295496
Epoch: 9, step: 569, loss: 0.3644843101501465, mean loss: 0.3735237082763883
Epoch: 9, step: 570, loss: 0.33565881848335266, mean loss: 0.3735209173211445
Epoch: 9, step: 571, loss: 0.4183717668056488, mean loss: 0.3735242229556879
Epoch: 9, step: 572, loss: 0.3303568363189697, mean loss: 0.3735210416315935
Epoch: 9, step: 573, loss: 0.3095966577529907, mean loss: 0.37351633091796943
Epoch: 9, step: 574, loss: 0.34068161249160767, mean loss: 0.3735139114412598
Epoch: 9, step: 575, loss: 0.336076557636261, mean loss: 0.3735111530155447
Epoch: 9, step: 576, loss: 0.3727480173110962, mean loss: 0.373511096791003
Epoch: 9, step: 577, loss: 0.30716878175735474, mean loss: 0.3735062093359394
Epoch: 9, step: 578, loss: 0.35917744040489197, mean loss: 0.37350515380968297
Epoch: 9, step: 579, loss: 0.31275397539138794, mean loss: 0.3735006789143958
Epoch: 9, step: 580, loss: 0.3225344717502594, mean loss: 0.37349692505071724
Epoch: 9, step: 581, loss: 0.339495450258255, mean loss: 0.3734944208914307
Epoch: 9, step: 582, loss: 0.32675647735595703, mean loss: 0.37349097896319333
Epoch: 9, step: 583, loss: 0.36052364110946655, mean loss: 0.3734900240782262
Epoch: 9, step: 584, loss: 0.35537970066070557, mean loss: 0.37348869057381434
Epoch: 9, step: 585, loss: 0.32185059785842896, mean loss: 0.3734848886232389
Epoch: 9, step: 586, loss: 0.3005608320236206, mean loss: 0.37347951984928623
Epoch: 9, step: 587, loss: 0.3020177185535431, mean loss: 0.3734742591159753
Epoch: 9, step: 588, loss: 0.3547980487346649, mean loss: 0.3734728843489248
Epoch: 9, step: 589, loss: 0.32938772439956665, mean loss: 0.37346963945271183
Epoch: 9, step: 590, loss: 0.4037055969238281, mean loss: 0.37347186481206057
Epoch: 9, step: 591, loss: 0.3402448296546936, mean loss: 0.37346941949007373
Epoch: 9, step: 592, loss: 0.36346372961997986, mean loss: 0.37346868318204
Epoch: 9, step: 593, loss: 0.322481632232666, mean loss: 0.3734649313754948
Epoch: 9, step: 594, loss: 0.360372930765152, mean loss: 0.37346396809092336
Epoch: 9, step: 595, loss: 0.34039902687072754, mean loss: 0.37346153541425914
Epoch: 9, step: 596, loss: 0.3127237558364868, mean loss: 0.37345706710118787
Epoch: 9, step: 597, loss: 0.3415449261665344, mean loss: 0.3734547195845677
Epoch: 9, step: 598, loss: 0.3147522211074829, mean loss: 0.3734504016369048
Epoch: 9, step: 599, loss: 0.3316360116004944, mean loss: 0.3734473261448456
Epoch: 9, step: 600, loss: 0.3524971306324005, mean loss: 0.37344578534941186
Epoch: 9, step: 601, loss: 0.33845698833465576, mean loss: 0.3734432122653543
Epoch: 9, step: 602, loss: 0.33743926882743835, mean loss: 0.3734405647218998
Epoch: 9, step: 603, loss: 0.3844541907310486, mean loss: 0.37344137454734166
Epoch: 9, step: 604, loss: 0.31304219365119934, mean loss: 0.37343693375762793
Epoch: 9, step: 605, loss: 0.3191715180873871, mean loss: 0.37343294424022827
Epoch: 9, step: 606, loss: 0.3131430745124817, mean loss: 0.37342851213924116
Epoch: 9, step: 607, loss: 0.3350861370563507, mean loss: 0.37342569367591544
Epoch: 9, step: 608, loss: 0.34218737483024597, mean loss: 0.3734233975848573
Epoch: 9, step: 609, loss: 0.34672030806541443, mean loss: 0.3734214349882441
Epoch: 9, step: 610, loss: 0.32812419533729553, mean loss: 0.37341810602229636
Epoch: 9, step: 611, loss: 0.3372752070426941, mean loss: 0.3734154500185501
Epoch: 9, step: 612, loss: 0.3405706584453583, mean loss: 0.37341303655748953
Epoch: 9, step: 613, loss: 0.32052135467529297, mean loss: 0.3734091503207605
Epoch: 9, step: 614, loss: 0.3210979700088501, mean loss: 0.3734053070189963
Epoch: 9, step: 615, loss: 0.373073548078537, mean loss: 0.3734052826464618
Epoch: 9, step: 616, loss: 0.33718812465667725, mean loss: 0.37340262216324793
Epoch: 9, step: 617, loss: 0.3540230393409729, mean loss: 0.3734011986592945
Epoch: 9, step: 618, loss: 0.42610350251197815, mean loss: 0.3734050695593204
Epoch: 9, step: 619, loss: 0.3035880923271179, mean loss: 0.37339994199048726
Epoch: 9, step: 620, loss: 0.4018164277076721, mean loss: 0.3734020288294178
Epoch: 9, step: 621, loss: 0.34343022108078003, mean loss: 0.3733998279329757
Epoch: 9, step: 622, loss: 0.3123219609260559, mean loss: 0.37339534317880824
Epoch: 9, step: 623, loss: 0.3542860448360443, mean loss: 0.37339394014662447
Epoch: 9, step: 624, loss: 0.3171491026878357, mean loss: 0.37338981087289574
Epoch: 9, step: 625, loss: 0.3484216630458832, mean loss: 0.3733879779447041
Epoch: 9, step: 626, loss: 0.36468270421028137, mean loss: 0.3733873389317308
Epoch: 9, step: 627, loss: 0.34984758496284485, mean loss: 0.373385611116554
Epoch: 9, step: 628, loss: 0.3543735146522522, mean loss: 0.37338421573332725
Epoch: 9, step: 629, loss: 0.3376465141773224, mean loss: 0.37338159297525036
Epoch: 9, step: 630, loss: 0.36740970611572266, mean loss: 0.37338115473595634
Epoch: 9, step: 631, loss: 0.3764180839061737, mean loss: 0.37338137758077367
Epoch: 9, step: 632, loss: 0.336533784866333, mean loss: 0.3733786739640216
Epoch: 9, step: 633, loss: 0.33247092366218567, mean loss: 0.37337567266172506
Epoch: 9, step: 634, loss: 0.3330935537815094, mean loss: 0.3733727174773013
Epoch: 9, step: 635, loss: 0.3069702982902527, mean loss: 0.37336784640781867
Epoch: 9, step: 636, loss: 0.3257351219654083, mean loss: 0.37336435247952393
Epoch: 9, step: 637, loss: 0.3558257520198822, mean loss: 0.37336306609251646
Epoch: 9, step: 638, loss: 0.3394339382648468, mean loss: 0.37336057770763725
Epoch: 9, step: 639, loss: 0.4089474081993103, mean loss: 0.37336318747813385
Epoch: 9, step: 640, loss: 0.34216544032096863, mean loss: 0.37336089975010295
Epoch: 9, step: 641, loss: 0.31585487723350525, mean loss: 0.37335668314777737
Epoch: 9, step: 642, loss: 0.3409021496772766, mean loss: 0.3733543036087004
Epoch: 9, step: 643, loss: 0.3733951449394226, mean loss: 0.3733543066029329
Epoch: 9, step: 644, loss: 0.38461118936538696, mean loss: 0.37335513182709257
Epoch: 9, step: 645, loss: 0.36450085043907166, mean loss: 0.3733544827813963
Epoch: 9, step: 646, loss: 0.32791244983673096, mean loss: 0.3733511519866338
Epoch: 9, step: 647, loss: 0.32817891240119934, mean loss: 0.37334784120976594
Epoch: 9, step: 648, loss: 0.3597058057785034, mean loss: 0.37334684142703006
Epoch: 9, step: 649, loss: 0.3474762737751007, mean loss: 0.3733449455917925
Epoch: 9, step: 650, loss: 0.3384442627429962, mean loss: 0.37334238820314675
Epoch: 9, step: 651, loss: 0.32571735978126526, mean loss: 0.37333889867878994
Epoch: 9, step: 652, loss: 0.34306418895721436, mean loss: 0.3733366805888404
Epoch: 9, step: 653, loss: 0.3307444751262665, mean loss: 0.3733335602807479
Epoch: 9, step: 654, loss: 0.30463674664497375, mean loss: 0.3733285279158196
Epoch: 9, step: 655, loss: 0.34908899664878845, mean loss: 0.37332675238613405
Epoch: 9, step: 656, loss: 0.3662491738796234, mean loss: 0.373326233996146
Epoch: 9, step: 657, loss: 0.29839637875556946, mean loss: 0.3733207462375961
Epoch: 9, step: 658, loss: 0.3733423054218292, mean loss: 0.3733207478164452
Epoch: 9, step: 659, loss: 0.34415024518966675, mean loss: 0.37331861172222824
Epoch: 9, step: 660, loss: 0.3460981249809265, mean loss: 0.373316618569505
Epoch: 9, step: 661, loss: 0.3284948468208313, mean loss: 0.37331333684657714
Epoch: 9, step: 662, loss: 0.34290722012519836, mean loss: 0.37331111075998796
Epoch: 9, step: 663, loss: 0.33622807264328003, mean loss: 0.3733083960427027
Epoch: 9, step: 664, loss: 0.3380904495716095, mean loss: 0.37330581805086677
Epoch: 9, step: 665, loss: 0.34924671053886414, mean loss: 0.37330405702704067
Epoch: 9, step: 666, loss: 0.34096094965934753, mean loss: 0.3733016898231054
Epoch: 9, step: 667, loss: 0.3347790241241455, mean loss: 0.3732988705413651
Epoch: 9, step: 668, loss: 0.4202139675617218, mean loss: 0.3733023037720289
Epoch: 9, step: 669, loss: 0.3421533405780792, mean loss: 0.37330002446841454
Epoch: 9, step: 670, loss: 0.3457074761390686, mean loss: 0.3732980055507055
Epoch: 9, step: 671, loss: 0.32996171712875366, mean loss: 0.3732948349121028
Epoch: 9, step: 672, loss: 0.31270354986190796, mean loss: 0.3732904021602519
Epoch: 9, step: 673, loss: 0.3866710364818573, mean loss: 0.3732913809923164
Epoch: 9, step: 674, loss: 0.34436938166618347, mean loss: 0.3732892654192547
Epoch: 9, step: 675, loss: 0.3361910581588745, mean loss: 0.37328655197518945
Epoch: 9, step: 676, loss: 0.3495538532733917, mean loss: 0.3732848162406249
Epoch: 9, step: 677, loss: 0.28901612758636475, mean loss: 0.37327865354582784
Epoch: 9, step: 678, loss: 0.36979541182518005, mean loss: 0.3732783988297971
Epoch: 9, step: 679, loss: 0.41792190074920654, mean loss: 0.37328166319817374
Epoch: 9, step: 680, loss: 0.3477294147014618, mean loss: 0.3732797949340444
Epoch: 9, step: 681, loss: 0.31712087988853455, mean loss: 0.3732756891499352
Epoch: 9, step: 682, loss: 0.36100858449935913, mean loss: 0.37327479236620464
Epoch: 9, step: 683, loss: 0.32775866985321045, mean loss: 0.37327146516426657
Epoch: 9, step: 684, loss: 0.3471499979496002, mean loss: 0.3732695558398594
Epoch: 9, step: 685, loss: 0.3563857078552246, mean loss: 0.37326832182085745
Epoch: 9, step: 686, loss: 0.3331737816333771, mean loss: 0.3732653915760144
Epoch: 9, step: 687, loss: 0.32874342799186707, mean loss: 0.3732621379978513
Epoch: 9, step: 688, loss: 0.3444330096244812, mean loss: 0.3732600313753907
Epoch: 9, step: 689, loss: 0.3146181106567383, mean loss: 0.37325574656458266
Epoch: 9, step: 690, loss: 0.35025539994239807, mean loss: 0.3732540661125755
Epoch: 9, step: 691, loss: 0.3782041072845459, mean loss: 0.37325442774620876
Epoch: 9, step: 692, loss: 0.36320963501930237, mean loss: 0.37325369396048835
Epoch: 9, step: 693, loss: 0.32894086837768555, mean loss: 0.3732504570849892
Epoch: 9, step: 694, loss: 0.32021477818489075, mean loss: 0.37324658332274396
Epoch: 9, step: 695, loss: 0.3949893116950989, mean loss: 0.3732481713105012
Epoch: 9, step: 696, loss: 0.3188613951206207, mean loss: 0.373244199443402
Epoch: 9, step: 697, loss: 0.2978695034980774, mean loss: 0.3732386952301739
Epoch: 9, step: 698, loss: 0.3238949775695801, mean loss: 0.37323509218397743
Epoch: 9, step: 699, loss: 0.3096660077571869, mean loss: 0.3732304507496589
Epoch: 9, step: 700, loss: 0.3768266439437866, mean loss: 0.3732307133030059
Epoch: 9, step: 701, loss: 0.32797524333000183, mean loss: 0.373227409501723
Epoch: 9, step: 702, loss: 0.338365763425827, mean loss: 0.37322486467026994
Epoch: 9, step: 703, loss: 0.36088070273399353, mean loss: 0.37322396363655197
Epoch: 9, step: 704, loss: 0.3296204209327698, mean loss: 0.3732207811285085
Epoch: 9, step: 705, loss: 0.3403708040714264, mean loss: 0.37321838366995813
Epoch: 9, step: 706, loss: 0.30769383907318115, mean loss: 0.37321360190358605
Epoch: 9, step: 707, loss: 0.30786722898483276, mean loss: 0.37320883348758205
Epoch: 9, step: 708, loss: 0.34985068440437317, mean loss: 0.3732071291352228
Epoch: 9, step: 709, loss: 0.3507883548736572, mean loss: 0.3732054934447032
Epoch: 9, step: 710, loss: 0.3256533443927765, mean loss: 0.3732020242574958
Epoch: 9, step: 711, loss: 0.34620407223701477, mean loss: 0.37320005475413864
Epoch: 9, step: 712, loss: 0.389539897441864, mean loss: 0.37320124666038185
Epoch: 9, step: 713, loss: 0.34317976236343384, mean loss: 0.3731990569095214
Epoch: 9, step: 714, loss: 0.36607930064201355, mean loss: 0.37319853763621763
Epoch: 9, step: 715, loss: 0.36578476428985596, mean loss: 0.37319799695846484
Epoch: 9, step: 716, loss: 0.352929025888443, mean loss: 0.3731965188740872
Epoch: 9, step: 717, loss: 0.3174585700035095, mean loss: 0.3731924545639756
Epoch: 9, step: 718, loss: 0.3287593424320221, mean loss: 0.37318921481828604
Epoch: 9, step: 719, loss: 0.32692939043045044, mean loss: 0.3731858421276774
Epoch: 9, step: 720, loss: 0.31548964977264404, mean loss: 0.37318163594612497
Epoch: 9, step: 721, loss: 0.3647734224796295, mean loss: 0.37318102301322903
Epoch: 9, step: 722, loss: 0.3219040632247925, mean loss: 0.37317728535306516
Epoch: 9, step: 723, loss: 0.3420881927013397, mean loss: 0.373175019384213
Epoch: 9, step: 724, loss: 0.42693382501602173, mean loss: 0.3731789373789387
Epoch: 9, step: 725, loss: 0.3492153286933899, mean loss: 0.3731771910148019
Epoch: 9, step: 726, loss: 0.37242230772972107, mean loss: 0.3731771360061824
Epoch: 9, step: 727, loss: 0.3124987483024597, mean loss: 0.3731727146721906
Epoch: 9, step: 728, loss: 0.3302614092826843, mean loss: 0.37316958816542267
Epoch: 9, step: 729, loss: 0.3754422068595886, mean loss: 0.37316975373577776
Epoch: 9, step: 730, loss: 0.3493972718715668, mean loss: 0.37316802193116905
Epoch: 9, step: 731, loss: 0.3600163459777832, mean loss: 0.3731670639128158
Epoch: 9, step: 732, loss: 0.3586154878139496, mean loss: 0.37316600399759264
Epoch: 9, step: 733, loss: 0.34918123483657837, mean loss: 0.3731642571098169
Epoch: 9, step: 734, loss: 0.31658855080604553, mean loss: 0.3731601368195027
Epoch: 9, step: 735, loss: 0.34389665722846985, mean loss: 0.3731580057767128
Epoch: 9, step: 736, loss: 0.37434905767440796, mean loss: 0.3731580925058978
Epoch: 9, step: 737, loss: 0.3274702727794647, mean loss: 0.3731547658843945
Epoch: 9, step: 738, loss: 0.30332693457603455, mean loss: 0.3731496819505533
Epoch: 9, step: 739, loss: 0.3580947816371918, mean loss: 0.37314858593276695
Epoch: 9, step: 740, loss: 0.30720722675323486, mean loss: 0.3731437856591133
Epoch: 9, step: 741, loss: 0.2920416593551636, mean loss: 0.37313788217051935
Epoch: 9, step: 742, loss: 0.3410046696662903, mean loss: 0.3731355433385444
Epoch: 9, step: 743, loss: 0.3422303795814514, mean loss: 0.37313329405442813
Epoch: 9, step: 744, loss: 0.33740657567977905, mean loss: 0.37313069404581345
Epoch: 9, step: 745, loss: 0.34190842509269714, mean loss: 0.3731284220134344
Epoch: 9, step: 746, loss: 0.3203979432582855, mean loss: 0.3731245851161954
Epoch: 9, step: 747, loss: 0.361233651638031, mean loss: 0.37312371994350346
Epoch: 9, step: 748, loss: 0.36795729398727417, mean loss: 0.37312334406675146
Epoch: 9, step: 749, loss: 0.32343345880508423, mean loss: 0.3731197292053182
Epoch: 9, step: 750, loss: 0.3995369076728821, mean loss: 0.37312165087393445
Epoch: 9, step: 751, loss: 0.31449732184410095, mean loss: 0.3731173866661202
Epoch: 9, step: 752, loss: 0.3459411561489105, mean loss: 0.3731154100692392
Epoch: 9, step: 753, loss: 0.3368244767189026, mean loss: 0.3731127707286319
Epoch: 9, step: 754, loss: 0.3590626120567322, mean loss: 0.3731117489732198
Epoch: 9, step: 755, loss: 0.34774067997932434, mean loss: 0.37310990407291483
Epoch: 9, step: 756, loss: 0.33974429965019226, mean loss: 0.37310747801282446
Epoch: 9, step: 757, loss: 0.3561113476753235, mean loss: 0.3731062422901011
Epoch: 9, step: 758, loss: 0.2990821599960327, mean loss: 0.37310086067742976
Epoch: 9, step: 759, loss: 0.3449179530143738, mean loss: 0.3730988119054275
Epoch: 9, step: 760, loss: 0.35943108797073364, mean loss: 0.3730978183949285
Epoch: 9, step: 761, loss: 0.30425477027893066, mean loss: 0.37309281453912707
Epoch: 9, step: 762, loss: 0.3529145121574402, mean loss: 0.3730913479861522
Epoch: 9, step: 763, loss: 0.36566871404647827, mean loss: 0.3730908085505461
Epoch: 9, step: 764, loss: 0.327095091342926, mean loss: 0.3730874660814517
Epoch: 9, step: 765, loss: 0.3329002559185028, mean loss: 0.3730845459237593
Epoch: 9, step: 766, loss: 0.32521167397499084, mean loss: 0.37308106754899006
Epoch: 9, step: 767, loss: 0.302780419588089, mean loss: 0.37307595997503185
Epoch: 9, step: 768, loss: 0.3608261048793793, mean loss: 0.37307507004730966
Epoch: 9, step: 769, loss: 0.35386234521865845, mean loss: 0.3730736743822778
Epoch: 9, step: 770, loss: 0.335904985666275, mean loss: 0.37307097454289984
Epoch: 9, step: 771, loss: 0.37315186858177185, mean loss: 0.3730709804184111
Epoch: 9, step: 772, loss: 0.42197185754776, mean loss: 0.37307453193828394
Epoch: 9, step: 773, loss: 0.33654138445854187, mean loss: 0.37307187884115395
Epoch: 9, step: 774, loss: 0.3227144479751587, mean loss: 0.3730682220674363
Epoch: 9, step: 775, loss: 0.32450392842292786, mean loss: 0.37306469576089807
Epoch: 9, step: 776, loss: 0.33945655822753906, mean loss: 0.3730622556144134
Epoch: 9, step: 777, loss: 0.36791446805000305, mean loss: 0.37306188188219586
Epoch: 9, step: 778, loss: 0.32383882999420166, mean loss: 0.3730583085208973
Epoch: 9, step: 779, loss: 0.3787183165550232, mean loss: 0.3730587193809462
Epoch: 9, step: 780, loss: 0.3363931477069855, mean loss: 0.37305605801986075
Epoch: 9, step: 781, loss: 0.3648933470249176, mean loss: 0.373055465574586
Epoch: 9, step: 782, loss: 0.31533995270729065, mean loss: 0.37305127691700074
Epoch: 9, step: 783, loss: 0.3110466003417969, mean loss: 0.37304677730331604
Epoch: 9, step: 784, loss: 0.37349358201026917, mean loss: 0.3730468097251074
Epoch: 9, step: 785, loss: 0.3978497087955475, mean loss: 0.3730486093840154
Epoch: 9, step: 786, loss: 0.3194209635257721, mean loss: 0.37304471852963983
Epoch: 9, step: 787, loss: 0.3787536919116974, mean loss: 0.3730451327035648
Epoch: 9, step: 788, loss: 0.3191939890384674, mean loss: 0.3730412262005786
Epoch: 9, step: 789, loss: 0.32219061255455017, mean loss: 0.3730375376314762
Epoch: 9, step: 790, loss: 0.3782457709312439, mean loss: 0.37303791539555103
Epoch: 9, step: 791, loss: 0.3139636218547821, mean loss: 0.37303363092401487
Epoch: 9, step: 792, loss: 0.3102988004684448, mean loss: 0.3730290812952923
Epoch: 9, step: 793, loss: 0.3341403603553772, mean loss: 0.3730262612285091
Epoch: 9, step: 794, loss: 0.34766918420791626, mean loss: 0.3730244225600282
Epoch: 9, step: 795, loss: 0.32793545722961426, mean loss: 0.37302115334850483
Epoch: 9, step: 796, loss: 0.3554449677467346, mean loss: 0.37301987906549156
Epoch: 9, step: 797, loss: 0.34412944316864014, mean loss: 0.3730177846450264
Epoch: 9, step: 798, loss: 0.33052554726600647, mean loss: 0.37301470438135265
Epoch: 9, step: 799, loss: 0.32719242572784424, mean loss: 0.373011382963648
Epoch: 9, step: 800, loss: 0.3592943847179413, mean loss: 0.3730103887621371
Epoch: 9, step: 801, loss: 0.44870635867118835, mean loss: 0.3730158747724219
Epoch: 9, step: 802, loss: 0.3174179494380951, mean loss: 0.373011845645287
Epoch: 9, step: 803, loss: 0.36466675996780396, mean loss: 0.37301124092893356
Epoch: 9, step: 804, loss: 0.34811803698539734, mean loss: 0.37300943720428004
Epoch: 9, step: 805, loss: 0.3213176131248474, mean loss: 0.3730056919627151
Epoch: 9, step: 806, loss: 0.3550199866294861, mean loss: 0.37300438893400156
Epoch: 9, step: 807, loss: 0.2882661819458008, mean loss: 0.3729982502635446
Epoch: 9, step: 808, loss: 0.3576834797859192, mean loss: 0.37299714089951147
Epoch: 9, step: 809, loss: 0.3134301006793976, mean loss: 0.37299282632322434
Epoch: 9, step: 810, loss: 0.30695104598999023, mean loss: 0.37298804311323425
Epoch: 9, step: 811, loss: 0.34860506653785706, mean loss: 0.3729862772545599
Epoch: 9, step: 812, loss: 0.35402145981788635, mean loss: 0.37298490388810057
Epoch: 9, step: 813, loss: 0.36746200919151306, mean loss: 0.37298450396813704
Epoch: 9, step: 814, loss: 0.3927176594734192, mean loss: 0.3729859327680433
Epoch: 9, step: 815, loss: 0.32778292894363403, mean loss: 0.3729826600339118
Epoch: 9, step: 816, loss: 0.36609309911727905, mean loss: 0.3729821612602264
Epoch: 9, step: 817, loss: 0.34950539469718933, mean loss: 0.3729804617693792
Epoch: 9, step: 818, loss: 0.34463173151016235, mean loss: 0.3729784097440257
Epoch: 9, step: 819, loss: 0.324186235666275, mean loss: 0.3729748781738116
Epoch: 9, step: 820, loss: 0.40355509519577026, mean loss: 0.3729770914051224
Epoch: 9, step: 821, loss: 0.3468148708343506, mean loss: 0.37297519806161605
Epoch: 9, step: 822, loss: 0.3449461758136749, mean loss: 0.3729731697656288
Epoch: 9, step: 823, loss: 0.3343002200126648, mean loss: 0.3729703714335193
Epoch: 9, step: 824, loss: 0.3522692322731018, mean loss: 0.3729688736302373
Epoch: 9, step: 825, loss: 0.3797721564769745, mean loss: 0.37296936583707035
Epoch: 9, step: 826, loss: 0.3536190688610077, mean loss: 0.3729679659747412
Epoch: 9, step: 827, loss: 0.33479878306388855, mean loss: 0.37296520489380147
Epoch: 9, step: 828, loss: 0.34368112683296204, mean loss: 0.3729630866964734
Epoch: 9, step: 829, loss: 0.3117588460445404, mean loss: 0.37295865994682403
Epoch: 9, step: 830, loss: 0.3614426255226135, mean loss: 0.3729578270810958
Epoch: 9, step: 831, loss: 0.31371772289276123, mean loss: 0.3729535430122364
Epoch: 9, step: 832, loss: 0.3729667067527771, mean loss: 0.3729535439641303
Epoch: 9, step: 833, loss: 0.3737636208534241, mean loss: 0.37295360253801957
Epoch: 9, step: 834, loss: 0.2975948452949524, mean loss: 0.3729481539979832
Epoch: 9, step: 835, loss: 0.3452308773994446, mean loss: 0.37294615014629157
Epoch: 9, step: 836, loss: 0.3334427773952484, mean loss: 0.3729432944119786
Epoch: 9, step: 837, loss: 0.33895471692085266, mean loss: 0.372940837524781
Epoch: 9, step: 838, loss: 0.34857800602912903, mean loss: 0.3729390765684026
Epoch: 9, step: 839, loss: 0.32853129506111145, mean loss: 0.3729358669860444
Epoch: 9, step: 840, loss: 0.31449562311172485, mean loss: 0.37293164350957736
Epoch: 9, step: 841, loss: 0.3656010627746582, mean loss: 0.37293111376678684
Epoch: 9, step: 842, loss: 0.3545019328594208, mean loss: 0.372929782082351
Epoch: 9, step: 843, loss: 0.33877328038215637, mean loss: 0.37292731412702584
Epoch: 9, step: 844, loss: 0.3910831809043884, mean loss: 0.3729286258723316
Epoch: 9, step: 845, loss: 0.32980820536613464, mean loss: 0.37292551068518337
Epoch: 9, step: 846, loss: 0.356939435005188, mean loss: 0.37292435587223244
Epoch: 9, step: 847, loss: 0.37571048736572266, mean loss: 0.3729245571241461
Epoch: 9, step: 848, loss: 0.3000360131263733, mean loss: 0.3729192925128065
Epoch: 9, step: 849, loss: 0.3246730864048004, mean loss: 0.37291580802587104
Epoch: 9, step: 850, loss: 0.32445159554481506, mean loss: 0.37291230804663505
Epoch: 9, step: 851, loss: 0.344805508852005, mean loss: 0.37291027838175966
Epoch: 9, step: 852, loss: 0.30166691541671753, mean loss: 0.3729051340852065
Epoch: 9, step: 853, loss: 0.3090275228023529, mean loss: 0.3729005219833088
Epoch: 9, step: 854, loss: 0.3201085925102234, mean loss: 0.37289671056684265
Epoch: 9, step: 855, loss: 0.3186124861240387, mean loss: 0.3728927916941569
Epoch: 9, step: 856, loss: 0.37003612518310547, mean loss: 0.3728925854813141
Epoch: 9, step: 857, loss: 0.3318539261817932, mean loss: 0.3728896232567364
Epoch: 9, step: 858, loss: 0.3337949514389038, mean loss: 0.3728868015554143
Epoch: 9, step: 859, loss: 0.3463023900985718, mean loss: 0.37288488293449507
Epoch: 9, step: 860, loss: 0.3580274283885956, mean loss: 0.372883810736
Epoch: 9, step: 861, loss: 0.3753916621208191, mean loss: 0.37288399170377207
Epoch: 9, step: 862, loss: 0.35076621174812317, mean loss: 0.3728823957892071
Epoch: 9, step: 863, loss: 0.34286749362945557, mean loss: 0.37288023021185074
Epoch: 9, step: 864, loss: 0.354319304227829, mean loss: 0.3728788911363162
Epoch: 9, step: 865, loss: 0.3412801921367645, mean loss: 0.37287661161683855
Epoch: 9, step: 866, loss: 0.3717325031757355, mean loss: 0.37287652908719554
Epoch: 9, step: 867, loss: 0.34785205125808716, mean loss: 0.3728747240902373
Epoch: 9, step: 868, loss: 0.3430006802082062, mean loss: 0.37287256945310193
Epoch: 9, step: 869, loss: 0.34074705839157104, mean loss: 0.3728702525981285
Epoch: 9, step: 870, loss: 0.35338297486305237, mean loss: 0.37286884729938075
Epoch: 9, step: 871, loss: 0.32813122868537903, mean loss: 0.37286562133899614
Epoch: 9, step: 872, loss: 0.32394272089004517, mean loss: 0.3728620938387835
Epoch: 9, step: 873, loss: 0.4739718437194824, mean loss: 0.37286938365492484
Epoch: 9, step: 874, loss: 0.3811408579349518, mean loss: 0.3728699799691257
Epoch: 9, step: 875, loss: 0.33228346705436707, mean loss: 0.3728670541824392
Epoch: 9, step: 876, loss: 0.31541088223457336, mean loss: 0.37286291260008875
Epoch: 9, step: 877, loss: 0.3243534564971924, mean loss: 0.37285941617107743
Epoch: 9, step: 878, loss: 0.4095422923564911, mean loss: 0.3728620599819737
Epoch: 9, step: 879, loss: 0.3610953986644745, mean loss: 0.3728612119954273
Epoch: 9, step: 880, loss: 0.3435159921646118, mean loss: 0.37285909732944544
Epoch: 9, step: 881, loss: 0.32732242345809937, mean loss: 0.37285581611645574
Epoch: 9, step: 882, loss: 0.3408915400505066, mean loss: 0.3728535130487948
Epoch: 9, step: 883, loss: 0.33043545484542847, mean loss: 0.3728504569927283
Epoch: 9, step: 884, loss: 0.44381940364837646, mean loss: 0.372855569660883
Epoch: 9, step: 885, loss: 0.3301120400428772, mean loss: 0.37285249059953607
Epoch: 9, step: 886, loss: 0.3464292585849762, mean loss: 0.37285058731984044
Epoch: 9, step: 887, loss: 0.3499629497528076, mean loss: 0.3728489388296671
Epoch: 9, step: 888, loss: 0.3239501416683197, mean loss: 0.3728454171301956
Epoch: 9, step: 889, loss: 0.3904467821121216, mean loss: 0.3728466846921272
Epoch: 9, step: 890, loss: 0.29763710498809814, mean loss: 0.37284126886583613
Epoch: 9, step: 891, loss: 0.34979957342147827, mean loss: 0.3728396097575812
Epoch: 9, step: 892, loss: 0.3688989579677582, mean loss: 0.37283932603292214
Epoch: 9, step: 893, loss: 0.3284871280193329, mean loss: 0.37283613293011336
Epoch: 9, step: 894, loss: 0.33491095900535583, mean loss: 0.3728334027325808
Epoch: 9, step: 895, loss: 0.3530702292919159, mean loss: 0.37283198010276214
Epoch: 9, step: 896, loss: 0.3216358721256256, mean loss: 0.37282829507375637
Epoch: 9, step: 897, loss: 0.31081628799438477, mean loss: 0.37282383185171236
Epoch: 9, step: 898, loss: 0.3471146821975708, mean loss: 0.37282198160704494
Epoch: 9, step: 899, loss: 0.34538546204566956, mean loss: 0.3728200071885388
Epoch: 9, step: 900, loss: 0.31000205874443054, mean loss: 0.37281548693607824
Epoch: 9, step: 901, loss: 0.37108761072158813, mean loss: 0.3728153626105484
Epoch: 9, step: 902, loss: 0.34295982122421265, mean loss: 0.37281321457533817
Epoch: 9, step: 903, loss: 0.315846711397171, mean loss: 0.372809116265757
Epoch: 9, step: 904, loss: 0.33004871010780334, mean loss: 0.372806040198844
Epoch: 9, step: 905, loss: 0.3367706537246704, mean loss: 0.3728034480979611
Epoch: 9, step: 906, loss: 0.3176106810569763, mean loss: 0.3727994782520976
Epoch: 9, step: 907, loss: 0.3451058566570282, mean loss: 0.3727974864783925
Epoch: 9, step: 908, loss: 0.33906370401382446, mean loss: 0.37279506046023614
Epoch: 9, step: 909, loss: 0.3543310761451721, mean loss: 0.37279373268917937
Epoch: 9, step: 910, loss: 0.3403802812099457, mean loss: 0.3727914019599438
Epoch: 9, step: 911, loss: 0.3110803961753845, mean loss: 0.37278696487295904
Epoch: 9, step: 912, loss: 0.3177228569984436, mean loss: 0.3727830059896551
Epoch: 9, step: 913, loss: 0.3851223289966583, mean loss: 0.3727838930725456
Epoch: 9, step: 914, loss: 0.35078251361846924, mean loss: 0.3727823114911026
Epoch: 9, step: 915, loss: 0.3613636791706085, mean loss: 0.3727814907153464
Epoch: 9, step: 916, loss: 0.364406019449234, mean loss: 0.3727808887264679
Epoch: 9, step: 917, loss: 0.30848169326782227, mean loss: 0.37277626753950094
Epoch: 9, step: 918, loss: 0.3177988827228546, mean loss: 0.37277231659556875
Epoch: 9, step: 919, loss: 0.3798081874847412, mean loss: 0.37277282219134983
Epoch: 9, step: 920, loss: 0.3455987870693207, mean loss: 0.37277086961283995
Epoch: 9, step: 921, loss: 0.39470574259757996, mean loss: 0.37277244562038303
Epoch: 9, step: 922, loss: 0.35216906666755676, mean loss: 0.37277096538624604
Epoch: 9, step: 923, loss: 0.3754943311214447, mean loss: 0.3727711610303362
Epoch: 9, step: 924, loss: 0.34286630153656006, mean loss: 0.3727690128470524
Epoch: 9, step: 925, loss: 0.3528966009616852, mean loss: 0.37276758543634375
Epoch: 9, step: 926, loss: 0.3342576026916504, mean loss: 0.3727648195106995
Epoch: 9, step: 927, loss: 0.35366499423980713, mean loss: 0.3727634477909874
Epoch: 9, step: 928, loss: 0.3385251760482788, mean loss: 0.37276098902820515
Epoch: 9, step: 929, loss: 0.34836095571517944, mean loss: 0.3727592369074732
Epoch: 9, step: 930, loss: 0.40124577283859253, mean loss: 0.3727612823254334
Epoch: 9, step: 931, loss: 0.3175309896469116, mean loss: 0.37275731691096764
Epoch: 9, step: 932, loss: 0.29464152455329895, mean loss: 0.37275170877022834
Epoch: 9, step: 933, loss: 0.32003259658813477, mean loss: 0.3727479241964895
Epoch: 9, step: 934, loss: 0.3178856372833252, mean loss: 0.372743986052285
Epoch: 9, step: 935, loss: 0.3716702163219452, mean loss: 0.37274390898009646
Epoch: 9, step: 936, loss: 0.33681896328926086, mean loss: 0.37274133057302755
Epoch: 9, step: 937, loss: 0.35149192810058594, mean loss: 0.3727398055692618
Epoch: 9, step: 938, loss: 0.33317628502845764, mean loss: 0.3727369664217526
Epoch: 9, step: 939, loss: 0.34068751335144043, mean loss: 0.3727346666619169
Epoch: 9, step: 940, loss: 0.3173297643661499, mean loss: 0.3727306912796757
Epoch: 9, step: 941, loss: 0.3547408878803253, mean loss: 0.37272940057775295
Epoch: 9, step: 942, loss: 0.3763498067855835, mean loss: 0.37272966030988636
Epoch: 9, step: 943, loss: 0.34165486693382263, mean loss: 0.37272743112815204
Epoch: 9, step: 944, loss: 0.36620622873306274, mean loss: 0.3727269633566582
Epoch: 9, step: 945, loss: 0.3085182011127472, mean loss: 0.37272235793690184
Epoch: 9, step: 946, loss: 0.34076109528541565, mean loss: 0.37272006565671456
Epoch: 9, step: 947, loss: 0.32352855801582336, mean loss: 0.3727165378664362
Epoch: 9, step: 948, loss: 0.36484596133232117, mean loss: 0.37271597346510715
Epoch: 9, step: 949, loss: 0.34749284386634827, mean loss: 0.37271416483685543
Epoch: 9, step: 950, loss: 0.33055856823921204, mean loss: 0.37271114228027713
Epoch: 9, step: 951, loss: 0.3338329493999481, mean loss: 0.3727083549134231
Epoch: 9, step: 952, loss: 0.29234546422958374, mean loss: 0.3727025937197401
Epoch: 9, step: 953, loss: 0.36362746357917786, mean loss: 0.37270194317277666
Epoch: 9, step: 954, loss: 0.3064744174480438, mean loss: 0.37269719602019086
Epoch: 9, step: 955, loss: 0.34629079699516296, mean loss: 0.3726953033597103
Epoch: 9, step: 956, loss: 0.3118462562561035, mean loss: 0.3726909423586995
Epoch: 9, step: 957, loss: 0.35786399245262146, mean loss: 0.3726898797995834
Epoch: 9, step: 958, loss: 0.326022207736969, mean loss: 0.37268653564536897
Epoch: 9, step: 959, loss: 0.3692415654659271, mean loss: 0.37268628880027155
Epoch: 9, step: 960, loss: 0.32958459854125977, mean loss: 0.37268320062299426
Epoch: 9, step: 961, loss: 0.31835582852363586, mean loss: 0.3726793084198062
Epoch: 9, step: 962, loss: 0.3249047100543976, mean loss: 0.37267588592547524
Epoch: 9, step: 963, loss: 0.3118922710418701, mean loss: 0.37267153179833457
Epoch: 9, step: 964, loss: 0.34541070461273193, mean loss: 0.3726695791568916
Epoch: 9, step: 965, loss: 0.3422742784023285, mean loss: 0.37266740215497535
Epoch: 9, step: 966, loss: 0.40283316373825073, mean loss: 0.3726695625618781
Epoch: 9, step: 967, loss: 0.34838777780532837, mean loss: 0.37266782367726364
Epoch: 9, step: 968, loss: 0.34355494379997253, mean loss: 0.3726657389740859
Epoch: 9, step: 969, loss: 0.3159652352333069, mean loss: 0.3726616790783576
Epoch: 9, step: 970, loss: 0.35532146692276, mean loss: 0.37266043756535155
Epoch: 9, step: 971, loss: 0.36758193373680115, mean loss: 0.37266007398403506
Epoch: 9, step: 972, loss: 0.3210204243659973, mean loss: 0.37265637725201284
Epoch: 9, step: 973, loss: 0.3405323922634125, mean loss: 0.3726540777541611
Epoch: 9, step: 974, loss: 0.35485562682151794, mean loss: 0.37265280379732674
Epoch: 9, step: 975, loss: 0.34641698002815247, mean loss: 0.37265092605442884
Epoch: 9, step: 976, loss: 0.32556241750717163, mean loss: 0.37264755609031613
Epoch: 9, step: 977, loss: 0.34484726190567017, mean loss: 0.3726455666603616
Epoch: 9, step: 978, loss: 0.3488174378871918, mean loss: 0.3726438616064243
Epoch: 9, step: 979, loss: 0.3584434688091278, mean loss: 0.37264284555084354
Epoch: 9, step: 980, loss: 0.3526422679424286, mean loss: 0.3726414145872885
Epoch: 9, step: 981, loss: 0.3531891405582428, mean loss: 0.37264002295228854
Epoch: 9, step: 982, loss: 0.3540439009666443, mean loss: 0.3726386926624262
Epoch: 9, step: 983, loss: 0.34870633482933044, mean loss: 0.3726369807627243
Epoch: 9, step: 984, loss: 0.37490180134773254, mean loss: 0.3726371427554705
Epoch: 9, step: 985, loss: 0.3414177894592285, mean loss: 0.37263490993088916
Epoch: 9, step: 986, loss: 0.36712974309921265, mean loss: 0.3726345162266174
Epoch: 9, step: 987, loss: 0.35128912329673767, mean loss: 0.3726329898112191
Epoch: 9, step: 988, loss: 0.3229880928993225, mean loss: 0.37262943994372455
Epoch: 9, step: 989, loss: 0.3288087546825409, mean loss: 0.3726263067615952
Epoch: 9, step: 990, loss: 0.32480019330978394, mean loss: 0.3726228874355459
Epoch: 9, step: 991, loss: 0.3860244154930115, mean loss: 0.3726238455087556
Epoch: 9, step: 992, loss: 0.3477897644042969, mean loss: 0.37262207025097416
Epoch: 9, step: 993, loss: 0.31467142701148987, mean loss: 0.37261792796053533
Epoch: 9, step: 994, loss: 0.3199394941329956, mean loss: 0.37261416279479825
Epoch: 9, step: 995, loss: 0.33070066571235657, mean loss: 0.37261116726184496
Epoch: 9, step: 996, loss: 0.3068997859954834, mean loss: 0.37260647124374546
Epoch: 9, step: 997, loss: 0.3839550316333771, mean loss: 0.37260728220275574
Epoch: 9, step: 998, loss: 0.34774354100227356, mean loss: 0.3726055055867357
Epoch: 9, step: 999, loss: 0.3453711271286011, mean loss: 0.3726035597180262
Epoch: 9, step: 1000, loss: 0.37632012367248535, mean loss: 0.3726038252437785
Epoch: 9, step: 1001, loss: 0.360991507768631, mean loss: 0.37260299567402033
Epoch: 9, step: 1002, loss: 0.38289523124694824, mean loss: 0.3726037308862193
Epoch: 9, step: 1003, loss: 0.3164318799972534, mean loss: 0.37259971861115576
Epoch: 9, step: 1004, loss: 0.32407036423683167, mean loss: 0.37259625247628153
Epoch: 9, step: 1005, loss: 0.33958330750465393, mean loss: 0.3725938947456022
Epoch: 9, step: 1006, loss: 0.3303545415401459, mean loss: 0.3725908782953269
Epoch: 9, step: 1007, loss: 0.34491634368896484, mean loss: 0.3725889021074801
Epoch: 9, step: 1008, loss: 0.32994580268859863, mean loss: 0.3725858572592531
Epoch: 9, step: 1009, loss: 0.3683561384677887, mean loss: 0.372585555265908
Epoch: 9, step: 1010, loss: 0.3551516830921173, mean loss: 0.37258431061165126
Epoch: 9, step: 1011, loss: 0.3343147933483124, mean loss: 0.3725815786358329
Epoch: 9, step: 1012, loss: 0.358926385641098, mean loss: 0.37258060389152603
Epoch: 9, step: 1013, loss: 0.34552329778671265, mean loss: 0.3725786726062937
Epoch: 9, step: 1014, loss: 0.35288214683532715, mean loss: 0.37257726681614517
Epoch: 9, step: 1015, loss: 0.3226628303527832, mean loss: 0.3725737045526237
Epoch: 9, step: 1016, loss: 0.3245318531990051, mean loss: 0.3725702761753059
Epoch: 9, step: 1017, loss: 0.40002694725990295, mean loss: 0.3725722354068661
Epoch: 9, step: 1018, loss: 0.3446623980998993, mean loss: 0.37257024398072935
Epoch: 9, step: 1019, loss: 0.3542255759239197, mean loss: 0.3725689351431111
Epoch: 9, step: 1020, loss: 0.3906913101673126, mean loss: 0.3725702280285377
Epoch: 9, step: 1021, loss: 0.3819262981414795, mean loss: 0.3725708954611324
Epoch: 9, step: 1022, loss: 0.36397698521614075, mean loss: 0.3725702824423547
Epoch: 9, step: 1023, loss: 0.31658676266670227, mean loss: 0.3725662893239684
Epoch: 9, step: 1024, loss: 0.31663089990615845, mean loss: 0.3725622999231113
Epoch: 9, step: 1025, loss: 0.34744471311569214, mean loss: 0.37256050862466544
Epoch: 9, step: 1026, loss: 0.3459932506084442, mean loss: 0.3725586140758516
Epoch: 9, step: 1027, loss: 0.34530192613601685, mean loss: 0.3725566705014121
Epoch: 9, step: 1028, loss: 0.38773101568222046, mean loss: 0.37255775245115763
Epoch: 9, step: 1029, loss: 0.348203182220459, mean loss: 0.37255601606371785
Epoch: 9, step: 1030, loss: 0.3176598846912384, mean loss: 0.37255210245914294
Epoch: 9, step: 1031, loss: 0.356164813041687, mean loss: 0.3725509342748389
Epoch: 9, step: 1032, loss: 0.3772115111351013, mean loss: 0.37255126648503634
Epoch: 9, step: 1033, loss: 0.35252049565315247, mean loss: 0.3725498387750697
Epoch: 9, step: 1034, loss: 0.3604709804058075, mean loss: 0.3725489779056827
Epoch: 9, step: 1035, loss: 0.30451318621635437, mean loss: 0.37254412928882913
Epoch: 9, step: 1036, loss: 0.3393162190914154, mean loss: 0.37254176144801127
Epoch: 9, step: 1037, loss: 0.31034407019615173, mean loss: 0.37253732951903507
Epoch: 9, step: 1038, loss: 0.3675975501537323, mean loss: 0.37253697755755555
Epoch: 9, step: 1039, loss: 0.34823089838027954, mean loss: 0.3725352458619744
Epoch: 9, step: 1040, loss: 0.35424694418907166, mean loss: 0.3725339429979954
Epoch: 9, step: 1041, loss: 0.3253960907459259, mean loss: 0.3725305851227816
Epoch: 9, step: 1042, loss: 0.32704558968544006, mean loss: 0.3725273452199796
Epoch: 9, step: 1043, loss: 0.34056326746940613, mean loss: 0.37252506857626516
Epoch: 9, step: 1044, loss: 0.33729735016822815, mean loss: 0.3725225596582103
Epoch: 9, step: 1045, loss: 0.35347339510917664, mean loss: 0.37252120307335423
Epoch: 9, step: 1046, loss: 0.353369802236557, mean loss: 0.3725198393048691
Epoch: 9, step: 1047, loss: 0.3560587763786316, mean loss: 0.3725186671984232
Epoch: 9, step: 1048, loss: 0.3248926103115082, mean loss: 0.3725152762367367
Epoch: 9, step: 1049, loss: 0.3756716549396515, mean loss: 0.3725155009540016
Epoch: 9, step: 1050, loss: 0.353761225938797, mean loss: 0.37251416584508046
Epoch: 9, step: 1051, loss: 0.33989980816841125, mean loss: 0.3725118442080021
Epoch: 9, step: 1052, loss: 0.3341212272644043, mean loss: 0.3725091115852572
Epoch: 9, step: 1053, loss: 0.3336428999900818, mean loss: 0.37250634530685184
Epoch: 9, step: 1054, loss: 0.3084667921066284, mean loss: 0.37250178765592307
Epoch: 9, step: 1055, loss: 0.3205990493297577, mean loss: 0.3724980940366286
Epoch: 9, step: 1056, loss: 0.31487685441970825, mean loss: 0.37249399375628867
Epoch: 9, step: 1057, loss: 0.3296320140361786, mean loss: 0.3724909439498478
Epoch: 9, step: 1058, loss: 0.3251679539680481, mean loss: 0.37248757696372314
Epoch: 9, step: 1059, loss: 0.3442326486110687, mean loss: 0.3724855667952291
Epoch: 9, step: 1060, loss: 0.37059545516967773, mean loss: 0.37248543233470227
Epoch: 9, step: 1061, loss: 0.33321598172187805, mean loss: 0.37248263894655226
Epoch: 9, step: 1062, loss: 0.34774619340896606, mean loss: 0.37248087947251163
Epoch: 9, step: 1063, loss: 0.3707636892795563, mean loss: 0.3724807573394965
Epoch: 9, step: 1064, loss: 0.3220635950565338, mean loss: 0.37247717173660316
Epoch: 9, step: 1065, loss: 0.3509424030780792, mean loss: 0.372475640320826
Epoch: 9, step: 1066, loss: 0.3512442708015442, mean loss: 0.3724741305882284
Epoch: 9, step: 1067, loss: 0.3452097177505493, mean loss: 0.3724721919923213
Epoch: 9, step: 1068, loss: 0.40343302488327026, mean loss: 0.3724743932602126
Epoch: 9, step: 1069, loss: 0.3640340268611908, mean loss: 0.37247379320572666
Epoch: 9, step: 1070, loss: 0.36448678374290466, mean loss: 0.3724732254223
Epoch: 9, step: 1071, loss: 0.34396257996559143, mean loss: 0.372471198791261
Epoch: 9, step: 1072, loss: 0.354947566986084, mean loss: 0.3724699532420532
Epoch: 9, step: 1073, loss: 0.4012331962585449, mean loss: 0.3724719975379321
Epoch: 9, step: 1074, loss: 0.31465673446655273, mean loss: 0.37246788871389175
Epoch: 9, step: 1075, loss: 0.3770449161529541, mean loss: 0.37246821397166885
Epoch: 9, step: 1076, loss: 0.3745034635066986, mean loss: 0.37246835859254107
Epoch: 9, step: 1077, loss: 0.30961325764656067, mean loss: 0.3724638925487052
Epoch: 9, step: 1078, loss: 0.33536216616630554, mean loss: 0.3724612565468308
Epoch: 9, step: 1079, loss: 0.3449137508869171, mean loss: 0.3724592994918678
Epoch: 9, step: 1080, loss: 0.36315399408340454, mean loss: 0.3724586384628553
Epoch: 9, step: 1081, loss: 0.3267638385295868, mean loss: 0.37245539263248645
Epoch: 9, step: 1082, loss: 0.3175111413002014, mean loss: 0.3724514900647379
Epoch: 9, step: 1083, loss: 0.3525129556655884, mean loss: 0.37245007397564706
Epoch: 9, step: 1084, loss: 0.3318161070346832, mean loss: 0.3724471882454474
Epoch: 9, step: 1085, loss: 0.31244146823883057, mean loss: 0.37244292708083965
Epoch: 9, step: 1086, loss: 0.3258230984210968, mean loss: 0.37243961671879605
Epoch: 9, step: 1087, loss: 0.3426893651485443, mean loss: 0.3724375043748902
Epoch: 9, step: 1088, loss: 0.33388379216194153, mean loss: 0.3724347671571257
Epoch: 9, step: 1089, loss: 0.357639342546463, mean loss: 0.3724337167933169
Epoch: 9, step: 1090, loss: 0.3862304985523224, mean loss: 0.3724346961914683
Epoch: 9, step: 1091, loss: 0.31309399008750916, mean loss: 0.37243048404594703
Epoch: 9, step: 1092, loss: 0.3259996771812439, mean loss: 0.3724271885099356
Epoch: 9, step: 1093, loss: 0.35661759972572327, mean loss: 0.37242606646672877
Epoch: 9, step: 1094, loss: 0.34220898151397705, mean loss: 0.3724239220422768
Epoch: 9, step: 1095, loss: 0.35725149512290955, mean loss: 0.3724228453727537
Epoch: 9, step: 1096, loss: 0.28999239206314087, mean loss: 0.372416996337537
Epoch: 9, step: 1097, loss: 0.3294124901294708, mean loss: 0.37241394507414777
Epoch: 9, step: 1098, loss: 0.3429328203201294, mean loss: 0.3724118534725334
Epoch: 9, step: 1099, loss: 0.3533526062965393, mean loss: 0.37241050136930015
Epoch: 9, step: 1100, loss: 0.3364349603652954, mean loss: 0.37240794936951266
Epoch: 9, step: 1101, loss: 0.33862462639808655, mean loss: 0.3724055530492565
Epoch: 9, step: 1102, loss: 0.3255615830421448, mean loss: 0.3724022305462416
Epoch: 9, step: 1103, loss: 0.3372704088687897, mean loss: 0.3723997389276829
Epoch: 9, step: 1104, loss: 0.32893267273902893, mean loss: 0.37239665637565195
Epoch: 9, step: 1105, loss: 0.30471086502075195, mean loss: 0.3723918566457303
Epoch: 9, step: 1106, loss: 0.32011452317237854, mean loss: 0.3723881498221131
Epoch: 9, step: 1107, loss: 0.3364449143409729, mean loss: 0.3723856013794386
Epoch: 9, step: 1108, loss: 0.40930524468421936, mean loss: 0.37238821886567075
Epoch: 9, step: 1109, loss: 0.36118683218955994, mean loss: 0.372387424778993
Epoch: 9, step: 1110, loss: 0.3311810791492462, mean loss: 0.3723845037932675
Epoch: 9, step: 1111, loss: 0.3113519549369812, mean loss: 0.37238017769822523
Epoch: 9, step: 1112, loss: 0.32838040590286255, mean loss: 0.37237705913760466
Epoch: 9, step: 1113, loss: 0.32975339889526367, mean loss: 0.37237403832539756
Epoch: 9, step: 1114, loss: 0.34755054116249084, mean loss: 0.3723722791660777
Epoch: 9, step: 1115, loss: 0.30875200033187866, mean loss: 0.37236777092636436
Epoch: 9, step: 1116, loss: 0.3292631208896637, mean loss: 0.37236471667496235
Epoch: 9, step: 1117, loss: 0.4025830924510956, mean loss: 0.3723668576963437
Epoch: 9, step: 1118, loss: 0.311278373003006, mean loss: 0.372362529783861
Epoch: 9, step: 1119, loss: 0.33249780535697937, mean loss: 0.3723597057030713
Epoch: 9, step: 1120, loss: 0.3550831079483032, mean loss: 0.37235848188797216
Epoch: 9, step: 1121, loss: 0.3220856189727783, mean loss: 0.3723549209825383
Epoch: 9, step: 1122, loss: 0.4064527750015259, mean loss: 0.3723573360157573
Epoch: 9, step: 1123, loss: 0.3567529320716858, mean loss: 0.37235623088799924
Epoch: 9, step: 1124, loss: 0.3302706480026245, mean loss: 0.3723532505337123
Epoch: 9, step: 1125, loss: 0.3705594837665558, mean loss: 0.37235312351439726
Epoch: 9, step: 1126, loss: 0.3165868818759918, mean loss: 0.37234917490279645
Epoch: 9, step: 1127, loss: 0.37321168184280396, mean loss: 0.372349235969558
Epoch: 9, step: 1128, loss: 0.3349496126174927, mean loss: 0.3723465882086127
Epoch: 9, step: 1129, loss: 0.358512282371521, mean loss: 0.372345608858065
Epoch: 9, step: 1130, loss: 0.3344838321208954, mean loss: 0.37234292875777925
Epoch: 9, step: 1131, loss: 0.334277868270874, mean loss: 0.3723402344584809
Epoch: 9, step: 1132, loss: 0.38138696551322937, mean loss: 0.3723408747536932
Epoch: 9, step: 1133, loss: 0.3781723082065582, mean loss: 0.3723412874524514
Epoch: 9, step: 1134, loss: 0.3512353301048279, mean loss: 0.37233979385982896
Epoch: 9, step: 1135, loss: 0.3724229335784912, mean loss: 0.37233979974291126
Epoch: 9, step: 1136, loss: 0.3435828387737274, mean loss: 0.3723377650042875
Epoch: 9, step: 1137, loss: 0.3926798403263092, mean loss: 0.37233920423418154
Epoch: 9, step: 1138, loss: 0.3242970407009125, mean loss: 0.37233580542530054
Epoch: 9, step: 1139, loss: 0.3066064417362213, mean loss: 0.37233115564009334
Epoch: 9, step: 1140, loss: 0.3426978886127472, mean loss: 0.372329059490484
Epoch: 9, step: 1141, loss: 0.3095428943634033, mean loss: 0.37232461853949184
Epoch: 9, step: 1142, loss: 0.37387195229530334, mean loss: 0.3723247279767756
Epoch: 9, step: 1143, loss: 0.3181602358818054, mean loss: 0.3723208973903474
Epoch: 9, step: 1144, loss: 0.35130128264427185, mean loss: 0.37231941095977344
Epoch: 9, step: 1145, loss: 0.2937376797199249, mean loss: 0.3723138543389815
Epoch: 9, step: 1146, loss: 0.3656686246395111, mean loss: 0.37231338447900136
Epoch: 9, step: 1147, loss: 0.3245217204093933, mean loss: 0.3723100055434761
Epoch: 9, step: 1148, loss: 0.3728255331516266, mean loss: 0.37231004198940104
Epoch: 9, step: 1149, loss: 0.3023403286933899, mean loss: 0.3723050957351033
Epoch: 9, step: 1150, loss: 0.34549492597579956, mean loss: 0.37230320062166866
Epoch: 9, step: 1151, loss: 0.3518756330013275, mean loss: 0.37230175677323635
Epoch: 9, step: 1152, loss: 0.3176657259464264, mean loss: 0.3722978952967485
Epoch: 9, step: 1153, loss: 0.3072658181190491, mean loss: 0.3722932993902342
Epoch: 9, step: 1154, loss: 0.31831666827201843, mean loss: 0.3722894850568925
Epoch: 9, step: 1155, loss: 0.3354729115962982, mean loss: 0.3722868835466141
Epoch: 9, step: 1156, loss: 0.3246384561061859, mean loss: 0.3722835168803638
Epoch: 9, step: 1157, loss: 0.3397565186023712, mean loss: 0.3722812188022037
Epoch: 9, step: 1158, loss: 0.341447114944458, mean loss: 0.37227904048331584
Epoch: 9, step: 1159, loss: 0.39214760065078735, mean loss: 0.3722804440267015
Epoch: 9, step: 1160, loss: 0.3203311562538147, mean loss: 0.37227677451425023
Epoch: 9, step: 1161, loss: 0.3803957402706146, mean loss: 0.37227734796853446
Epoch: 9, step: 1162, loss: 0.32692694664001465, mean loss: 0.37227414503038003
Epoch: 9, step: 1163, loss: 0.38378188014030457, mean loss: 0.3722749577235375
Epoch: 9, step: 1164, loss: 0.34241095185279846, mean loss: 0.3722728488325079
Epoch: 9, step: 1165, loss: 0.3228549063205719, mean loss: 0.37226935935768
Epoch: 9, step: 1166, loss: 0.32740095257759094, mean loss: 0.3722661913560716
Epoch: 9, step: 1167, loss: 0.33429548144340515, mean loss: 0.3722635105660467
Epoch: 9, step: 1168, loss: 0.3222242295742035, mean loss: 0.37225997796590604
Epoch: 9, step: 1169, loss: 0.3296920359134674, mean loss: 0.3722569730285876
Epoch: 9, step: 1170, loss: 0.3679828941822052, mean loss: 0.372256671336003
Epoch: 9, step: 1171, loss: 0.395967960357666, mean loss: 0.3722583449165381
Epoch: 9, step: 1172, loss: 0.33600616455078125, mean loss: 0.3722557863605097
Epoch: 9, step: 1173, loss: 0.3617928624153137, mean loss: 0.3722550479749102
Epoch: 9, step: 1174, loss: 0.3625507354736328, mean loss: 0.3722543631740845
Epoch: 9, step: 1175, loss: 0.32599979639053345, mean loss: 0.37225109937456546
Epoch: 9, step: 1176, loss: 0.30654698610305786, mean loss: 0.3722464635096624
Epoch: 9, step: 1177, loss: 0.347706139087677, mean loss: 0.3722447321477023
Epoch: 9, step: 1178, loss: 0.3429015278816223, mean loss: 0.372242662080382
Epoch: 9, step: 1179, loss: 0.33976125717163086, mean loss: 0.372240370784889
Epoch: 9, step: 1180, loss: 0.3359137773513794, mean loss: 0.37223780842378057
Epoch: 9, step: 1181, loss: 0.33246946334838867, mean loss: 0.3722350034904278
Epoch: 9, step: 1182, loss: 0.3447175920009613, mean loss: 0.3722330627744754
Epoch: 9, step: 1183, loss: 0.32486167550086975, mean loss: 0.37222972205604987
Epoch: 9, step: 1184, loss: 0.3607967495918274, mean loss: 0.372228915838402
Epoch: 9, step: 1185, loss: 0.3393504321575165, mean loss: 0.3722265975135056
Epoch: 9, step: 1186, loss: 0.3460335433483124, mean loss: 0.3722247507212779
Epoch: 9, step: 1187, loss: 0.3527074158191681, mean loss: 0.37222337471063904
Epoch: 9, step: 1188, loss: 0.343037873506546, mean loss: 0.3722213172202475
Epoch: 9, step: 1189, loss: 0.3300371766090393, mean loss: 0.3722183435743564
Epoch: 9, step: 1190, loss: 0.323567658662796, mean loss: 0.37221491433033643
Epoch: 9, step: 1191, loss: 0.40746009349823, mean loss: 0.3722173984844926
Epoch: 9, step: 1192, loss: 0.34425684809684753, mean loss: 0.3722154279051433
Epoch: 9, step: 1193, loss: 0.35193201899528503, mean loss: 0.3722139984894343
Epoch: 9, step: 1194, loss: 0.3710169792175293, mean loss: 0.37221391413884086
Epoch: 9, step: 1195, loss: 0.3022820055484772, mean loss: 0.37220898658045654
Epoch: 9, step: 1196, loss: 0.3454388976097107, mean loss: 0.37220710043313243
Epoch: 9, step: 1197, loss: 0.3743034899234772, mean loss: 0.3722072481286017
Epoch: 9, step: 1198, loss: 0.3125636875629425, mean loss: 0.37220304639837515
Epoch: 9, step: 1199, loss: 0.3567691445350647, mean loss: 0.372201959197624
Epoch: 9, step: 1200, loss: 0.3346225321292877, mean loss: 0.3721993121998732
Epoch: 9, step: 1201, loss: 0.3660808205604553, mean loss: 0.3721988812594844
Epoch: 9, step: 1202, loss: 0.3285902440547943, mean loss: 0.37219581001241037
Epoch: 9, step: 1203, loss: 0.3252961337566376, mean loss: 0.3721925072183078
Epoch: 9, step: 1204, loss: 0.36846065521240234, mean loss: 0.3721922444303347
Epoch: 9, step: 1205, loss: 0.3054681718349457, mean loss: 0.3721875462137036
Epoch: 9, step: 1206, loss: 0.3201007843017578, mean loss: 0.372183878906662
Epoch: 9, step: 1207, loss: 0.34030675888061523, mean loss: 0.3721816346712335
Epoch: 9, step: 1208, loss: 0.3233044147491455, mean loss: 0.37217819382505807
Epoch: 9, step: 1209, loss: 0.3658537268638611, mean loss: 0.37217774862817216
Epoch: 9, step: 1210, loss: 0.3784825801849365, mean loss: 0.372178192411628
Epoch: 9, step: 1211, loss: 0.36459988355636597, mean loss: 0.3721776590284034
Epoch: 9, step: 1212, loss: 0.3513980507850647, mean loss: 0.37217619660259976
Epoch: 9, step: 1213, loss: 0.368236243724823, mean loss: 0.3721759193363874
Epoch: 9, step: 1214, loss: 0.33028870820999146, mean loss: 0.37217297181607734
Epoch: 9, step: 1215, loss: 0.3237038850784302, mean loss: 0.3721695613821667
Epoch: 9, step: 1216, loss: 0.35667967796325684, mean loss: 0.3721684715430463
Epoch: 9, step: 1217, loss: 0.29727229475975037, mean loss: 0.3721632023593694
Epoch: 9, step: 1218, loss: 0.3610004484653473, mean loss: 0.3721624170794613
Epoch: 9, step: 1219, loss: 0.3547836244106293, mean loss: 0.37216119459826624
Epoch: 9, step: 1220, loss: 0.30654364824295044, mean loss: 0.3721565791698105
Epoch: 9, step: 1221, loss: 0.3583657145500183, mean loss: 0.3721556092116856
Epoch: 9, step: 1222, loss: 0.3096745014190674, mean loss: 0.37215121501323334
Epoch: 9, step: 1223, loss: 0.388567179441452, mean loss: 0.3721523694411116
Epoch: 9, step: 1224, loss: 0.36489352583885193, mean loss: 0.3721518590098056
Epoch: 9, step: 1225, loss: 0.3629630208015442, mean loss: 0.37215121290952374
Epoch: 9, step: 1226, loss: 0.33713582158088684, mean loss: 0.37214875102445527
Epoch: 9, step: 1227, loss: 0.33368322253227234, mean loss: 0.37214604675501683
Epoch: 9, step: 1228, loss: 0.31846171617507935, mean loss: 0.3721422728126211
Epoch: 9, step: 1229, loss: 0.33658677339553833, mean loss: 0.3721397734804534
Epoch: 9, step: 1230, loss: 0.3143090009689331, mean loss: 0.37213570861980033
Epoch: 9, step: 1231, loss: 0.33181053400039673, mean loss: 0.3721328744073587
Epoch: 9, step: 1232, loss: 0.3548371493816376, mean loss: 0.3721316588809671
Epoch: 9, step: 1233, loss: 0.34941354393959045, mean loss: 0.37213006238659313
Epoch: 9, step: 1234, loss: 0.3770928978919983, mean loss: 0.37213041112073025
Epoch: 9, step: 1235, loss: 0.33838242292404175, mean loss: 0.37212803984556186
Epoch: 9, step: 1236, loss: 0.32999271154403687, mean loss: 0.3721250794487164
Epoch: 9, step: 1237, loss: 0.3779391646385193, mean loss: 0.37212548791332156
Epoch: 9, step: 1238, loss: 0.31559494137763977, mean loss: 0.37212151667717575
Epoch: 9, step: 1239, loss: 0.32937607169151306, mean loss: 0.3721185140468733
Epoch: 9, step: 1240, loss: 0.3255290389060974, mean loss: 0.37211524162465365
Epoch: 9, step: 1241, loss: 0.336527556180954, mean loss: 0.37211274213838846
Epoch: 9, step: 1242, loss: 0.2935744822025299, mean loss: 0.3721072264238063
Epoch: 9, step: 1243, loss: 0.3031455874443054, mean loss: 0.3721023836120802
Epoch: 9, step: 1244, loss: 0.2966986298561096, mean loss: 0.37209708877648184
Epoch: 9, step: 1245, loss: 0.35368412733078003, mean loss: 0.37209579591301845
Epoch: 9, step: 1246, loss: 0.3456110656261444, mean loss: 0.37209393642202027
Epoch: 9, step: 1247, loss: 0.3313472867012024, mean loss: 0.37209107580353384
Epoch: 9, step: 1248, loss: 0.348251074552536, mean loss: 0.37208940223377246
Epoch: 9, step: 1249, loss: 0.3402296006679535, mean loss: 0.37208716583046164
Epoch: 9, step: 1250, loss: 0.33199289441108704, mean loss: 0.37208435160491105
Epoch: 9, step: 1251, loss: 0.34516260027885437, mean loss: 0.3720824620940094
Epoch: 9, step: 1252, loss: 0.32261866331100464, mean loss: 0.37207899070662903
Epoch: 9, step: 1253, loss: 0.3214573860168457, mean loss: 0.37207543831331746
Epoch: 9, step: 1254, loss: 0.33993929624557495, mean loss: 0.3720731833036994
Epoch: 9, step: 1255, loss: 0.36566653847694397, mean loss: 0.3720727337776801
Epoch: 9, step: 1256, loss: 0.3162733316421509, mean loss: 0.37206881885435616
Epoch: 9, step: 1257, loss: 0.3463378846645355, mean loss: 0.3720670136814791
Epoch: 9, step: 1258, loss: 0.3250761032104492, mean loss: 0.37206371723037623
Epoch: 9, step: 1259, loss: 0.33241406083106995, mean loss: 0.3720609359694055
Epoch: 9, step: 1260, loss: 0.381625771522522, mean loss: 0.372061606856377
Epoch: 9, step: 1261, loss: 0.3468720614910126, mean loss: 0.37205984016081206
Epoch: 9, step: 1262, loss: 0.4469894468784332, mean loss: 0.3720650950599437
Epoch: 9, step: 1263, loss: 0.3419376313686371, mean loss: 0.37206298233457963
Epoch: 9, step: 1264, loss: 0.3408845365047455, mean loss: 0.37206079606111847
Epoch: 9, step: 1265, loss: 0.3622668981552124, mean loss: 0.3720601093483218
Epoch: 9, step: 1266, loss: 0.3074921667575836, mean loss: 0.37205558239448383
Epoch: 9, step: 1267, loss: 0.3404597342014313, mean loss: 0.3720533673181944
Epoch: 9, step: 1268, loss: 0.31641414761543274, mean loss: 0.3720494669172338
Epoch: 9, step: 1269, loss: 0.3312588632106781, mean loss: 0.37204660762915676
Epoch: 9, step: 1270, loss: 0.3294403851032257, mean loss: 0.37204362128146445
Epoch: 9, step: 1271, loss: 0.3338291645050049, mean loss: 0.37204094294835705
Epoch: 9, step: 1272, loss: 0.3207721412181854, mean loss: 0.3720373499284026
Epoch: 9, step: 1273, loss: 0.35307276248931885, mean loss: 0.37203602094540056
Epoch: 9, step: 1274, loss: 0.3582345247268677, mean loss: 0.3720350538445514
Epoch: 9, step: 1275, loss: 0.33629435300827026, mean loss: 0.3720325495914098
Epoch: 9, step: 1276, loss: 0.37837767601013184, mean loss: 0.3720329941459126
Epoch: 9, step: 1277, loss: 0.3111850619316101, mean loss: 0.37202873129512
Epoch: 9, step: 1278, loss: 0.3242500126361847, mean loss: 0.37202538427454845
Epoch: 9, step: 1279, loss: 0.3541834354400635, mean loss: 0.37202413448827537
Epoch: 9, step: 1280, loss: 0.32780808210372925, mean loss: 0.37202103747543064
Epoch: 9, step: 1281, loss: 0.3340896964073181, mean loss: 0.3720183808469765
Epoch: 9, step: 1282, loss: 0.3193923234939575, mean loss: 0.3720146952907504
Epoch: 9, step: 1283, loss: 0.3231319785118103, mean loss: 0.3720112721313121
Epoch: 9, step: 1284, loss: 0.33226335048675537, mean loss: 0.3720084888583169
Epoch: 9, step: 1285, loss: 0.31362634897232056, mean loss: 0.3720044010456936
Epoch: 9, step: 1286, loss: 0.2947615087032318, mean loss: 0.37199899301570394
Epoch: 9, step: 1287, loss: 0.32815176248550415, mean loss: 0.3719959233412059
Epoch: 9, step: 1288, loss: 0.31342625617980957, mean loss: 0.37199182325950053
Epoch: 9, step: 1289, loss: 0.3339049518108368, mean loss: 0.3719891572318197
Epoch: 9, step: 1290, loss: 0.3400481343269348, mean loss: 0.3719869215614267
Epoch: 9, step: 1291, loss: 0.34890612959861755, mean loss: 0.3719853061644528
Epoch: 9, step: 1292, loss: 0.3152577877044678, mean loss: 0.3719813361512636
Epoch: 9, step: 1293, loss: 0.3584754467010498, mean loss: 0.3719803910225407
Epoch: 9, step: 1294, loss: 0.36994922161102295, mean loss: 0.37198024889326975
Epoch: 9, step: 1295, loss: 0.3142872452735901, mean loss: 0.37197621215917936
Epoch: 9, step: 1296, loss: 0.29473352432250977, mean loss: 0.3719708079271891
Epoch: 9, step: 1297, loss: 0.3480614423751831, mean loss: 0.371969135241758
Epoch: 9, step: 1298, loss: 0.3318919837474823, mean loss: 0.3719663316634793
Epoch: 9, step: 1299, loss: 0.3509768545627594, mean loss: 0.37196486345719076
Epoch: 9, step: 1300, loss: 0.4062959551811218, mean loss: 0.3719672647366007
Epoch: 9, step: 1301, loss: 0.3786464333534241, mean loss: 0.37196773187666343
Epoch: 9, step: 1302, loss: 0.3318057656288147, mean loss: 0.3719649231511408
Epoch: 9, step: 1303, loss: 0.3356766998767853, mean loss: 0.3719623855131496
Epoch: 9, step: 1304, loss: 0.3335663080215454, mean loss: 0.3719597006605175
Epoch: 9, step: 1305, loss: 0.3336851894855499, mean loss: 0.3719570244955633
Epoch: 9, step: 1306, loss: 0.3640773892402649, mean loss: 0.37195647358769396
Epoch: 9, step: 1307, loss: 0.35602903366088867, mean loss: 0.37195536009217334
Epoch: 9, step: 1308, loss: 0.3283012807369232, mean loss: 0.3719523084263673
Epoch: 9, step: 1309, loss: 0.33886921405792236, mean loss: 0.3719499958935581
Epoch: 9, step: 1310, loss: 0.3298797011375427, mean loss: 0.37194705535432865
Epoch: 9, step: 1311, loss: 0.36323466897010803, mean loss: 0.3719464464371925
Epoch: 9, step: 1312, loss: 0.32053741812705994, mean loss: 0.37194285366143526
Epoch: 9, step: 1313, loss: 0.3517417013645172, mean loss: 0.37194144198063184
Epoch: 9, step: 1314, loss: 0.37564459443092346, mean loss: 0.37194170074329347
Epoch: 9, step: 1315, loss: 0.3680647015571594, mean loss: 0.3719414298517908
Epoch: 9, step: 1316, loss: 0.34593841433525085, mean loss: 0.37193961311068013
Epoch: 9, step: 1317, loss: 0.31594792008399963, mean loss: 0.3719357014372816
Epoch: 9, step: 1318, loss: 0.38072094321250916, mean loss: 0.3719363151461028
Epoch: 9, step: 1319, loss: 0.3622511625289917, mean loss: 0.3719356386196557
Epoch: 9, step: 1320, loss: 0.3663195073604584, mean loss: 0.37193524634953906
Epoch: 9, step: 1321, loss: 0.34234893321990967, mean loss: 0.37193317997762054
Epoch: 9, step: 1322, loss: 0.3139001131057739, mean loss: 0.3719291271061301
Epoch: 9, step: 1323, loss: 0.4391404092311859, mean loss: 0.3719338206314181
Epoch: 9, step: 1324, loss: 0.33692309260368347, mean loss: 0.3719313759188961
Epoch: 9, step: 1325, loss: 0.3279823064804077, mean loss: 0.3719283072783823
Epoch: 9, step: 1326, loss: 0.3435437083244324, mean loss: 0.3719263255288219
Epoch: 9, step: 1327, loss: 0.31367969512939453, mean loss: 0.3719222591625555
Epoch: 9, step: 1328, loss: 0.3478738069534302, mean loss: 0.3719205803875322
Epoch: 9, step: 1329, loss: 0.31489303708076477, mean loss: 0.3719165996850816
Epoch: 9, step: 1330, loss: 0.3526589870452881, mean loss: 0.3719152555367854
Epoch: 9, step: 1331, loss: 0.3219393789768219, mean loss: 0.3719117675498675
Epoch: 9, step: 1332, loss: 0.3403986990451813, mean loss: 0.3719095682988029
Epoch: 9, step: 1333, loss: 0.33593884110450745, mean loss: 0.3719070581294244
Epoch: 9, step: 1334, loss: 0.37024056911468506, mean loss: 0.37190694184381873
Epoch: 9, step: 1335, loss: 0.31633245944976807, mean loss: 0.3719030641936377
Epoch: 9, step: 1336, loss: 0.3278711140155792, mean loss: 0.3718999921256702
Epoch: 9, step: 1337, loss: 0.3184535801410675, mean loss: 0.3718962634796548
Epoch: 9, step: 1338, loss: 0.3649355173110962, mean loss: 0.37189577790266365
Epoch: 9, step: 1339, loss: 0.36465784907341003, mean loss: 0.3718952730248156
Epoch: 9, step: 1340, loss: 0.36594998836517334, mean loss: 0.37189485834359504
Epoch: 9, step: 1341, loss: 0.34590867161750793, mean loss: 0.37189304594390704
Epoch: 9, step: 1342, loss: 0.3977397382259369, mean loss: 0.37189484848887405
Epoch: 9, step: 1343, loss: 0.313789039850235, mean loss: 0.3718907964799034
Epoch: 9, step: 1344, loss: 0.3335639238357544, mean loss: 0.3718881239415418
Epoch: 9, step: 1345, loss: 0.3242398798465729, mean loss: 0.371884801654267
Epoch: 9, step: 1346, loss: 0.3281112611293793, mean loss: 0.3718817497445881
Epoch: 9, step: 1347, loss: 0.3415597081184387, mean loss: 0.3718796358264602
Epoch: 9, step: 1348, loss: 0.37555167078971863, mean loss: 0.3718798918065901
Epoch: 9, step: 1349, loss: 0.3790462017059326, mean loss: 0.37188039134025097
Epoch: 9, step: 1350, loss: 0.375892698764801, mean loss: 0.3718806710020217
Epoch: 9, step: 1351, loss: 0.31093698740005493, mean loss: 0.3718764234634378
Epoch: 9, step: 1352, loss: 0.3845190107822418, mean loss: 0.37187730454137485
Epoch: 9, step: 1353, loss: 0.32300087809562683, mean loss: 0.371873898518626
Epoch: 9, step: 1354, loss: 0.3213287591934204, mean loss: 0.3718703764547054
Epoch: 9, step: 1355, loss: 0.32175835967063904, mean loss: 0.37186688481473995
Epoch: 9, step: 1356, loss: 0.39545944333076477, mean loss: 0.37186852855183433
Epoch: 9, step: 1357, loss: 0.3706752061843872, mean loss: 0.37186844541665476
Epoch: 9, step: 1358, loss: 0.3524216115474701, mean loss: 0.3718670907086179
Epoch: 9, step: 1359, loss: 0.3585032522678375, mean loss: 0.3718661598198995
Epoch: 9, step: 1360, loss: 0.3433852791786194, mean loss: 0.3718641760572303
Epoch: 9, step: 1361, loss: 0.35247117280960083, mean loss: 0.37186282538142257
Epoch: 9, step: 1362, loss: 0.3278190791606903, mean loss: 0.37185975805457383
Epoch: 9, step: 1363, loss: 0.34688621759414673, mean loss: 0.37185801895008497
Epoch: 9, step: 1364, loss: 0.3387967646121979, mean loss: 0.3718557167946405
Epoch: 9, step: 1365, loss: 0.3220825493335724, mean loss: 0.37185225117930415
Epoch: 9, step: 1366, loss: 0.3067992329597473, mean loss: 0.3718477219710455
Epoch: 9, step: 1367, loss: 0.31557679176330566, mean loss: 0.37184380447381576
Epoch: 9, step: 1368, loss: 0.3669629395008087, mean loss: 0.3718434646990178
Epoch: 9, step: 1369, loss: 0.3147469758987427, mean loss: 0.37183949028103086
Epoch: 9, step: 1370, loss: 0.3139127492904663, mean loss: 0.3718354583508443
Epoch: 9, step: 1371, loss: 0.32154950499534607, mean loss: 0.3718319584932889
Epoch: 9, step: 1372, loss: 0.30150696635246277, mean loss: 0.3718270642771193
Epoch: 9, step: 1373, loss: 0.3353786766529083, mean loss: 0.37182452785487685
Epoch: 9, step: 1374, loss: 0.3465970456600189, mean loss: 0.37182277241112244
Epoch: 9, step: 1375, loss: 0.33357998728752136, mean loss: 0.3718201114881386
Epoch: 9, step: 1376, loss: 0.35084784030914307, mean loss: 0.37181865234452355
Epoch: 9, step: 1377, loss: 0.31606268882751465, mean loss: 0.3718147733989609
Epoch: 9, step: 1378, loss: 0.3171212375164032, mean loss: 0.37181096863124735
Epoch: 9, step: 1379, loss: 0.3605588376522064, mean loss: 0.37181018592875853
Epoch: 9, step: 1380, loss: 0.314073383808136, mean loss: 0.37180617001430344
Epoch: 9, step: 1381, loss: 0.3604218661785126, mean loss: 0.3718053782279746
Epoch: 9, step: 1382, loss: 0.37351176142692566, mean loss: 0.371805496899871
Epoch: 9, step: 1383, loss: 0.3350208103656769, mean loss: 0.3718029388549104
Epoch: 9, step: 1384, loss: 0.3215287923812866, mean loss: 0.3717994429821287
Epoch: 9, step: 1385, loss: 0.3438856303691864, mean loss: 0.37179750209681284
Epoch: 9, step: 1386, loss: 0.3081928789615631, mean loss: 0.37179307988843247
Epoch: 9, step: 1387, loss: 0.3486495018005371, mean loss: 0.3717914709077534
Epoch: 9, step: 1388, loss: 0.33412832021713257, mean loss: 0.3717888526838611
Epoch: 9, step: 1389, loss: 0.2976773679256439, mean loss: 0.37178370104443675
Epoch: 9, step: 1390, loss: 0.30057811737060547, mean loss: 0.37177875174411884
Epoch: 9, step: 1391, loss: 0.36692917346954346, mean loss: 0.3717784146869688
Epoch: 9, step: 1392, loss: 0.33692190051078796, mean loss: 0.3717759922452303
Epoch: 9, step: 1393, loss: 0.33888673782348633, mean loss: 0.3717737066820321
Epoch: 9, step: 1394, loss: 0.3685202896595001, mean loss: 0.37177348060899873
Epoch: 9, step: 1395, loss: 0.40702131390571594, mean loss: 0.3717759297358259
Epoch: 9, step: 1396, loss: 0.3530345857143402, mean loss: 0.3717746276206295
Epoch: 9, step: 1397, loss: 0.32164278626441956, mean loss: 0.3717711447915788
Epoch: 9, step: 1398, loss: 0.3381202518939972, mean loss: 0.3717688071123223
Epoch: 9, step: 1399, loss: 0.34347233176231384, mean loss: 0.37176684153331774
Epoch: 9, step: 1400, loss: 0.32636672258377075, mean loss: 0.3717636880903123
Epoch: 9, step: 1401, loss: 0.31824612617492676, mean loss: 0.37175997107670516
Epoch: 9, step: 1402, loss: 0.3146633505821228, mean loss: 0.3717560057582459
Epoch: 9, step: 1403, loss: 0.3864744305610657, mean loss: 0.37175702787107945
Epoch: 9, step: 1404, loss: 0.3194577395915985, mean loss: 0.3717533962282575
Epoch: 9, step: 1405, loss: 0.3701806366443634, mean loss: 0.37175328702400917
Epoch: 9, step: 1406, loss: 0.2981901168823242, mean loss: 0.3717481795345874
Epoch: 9, step: 1407, loss: 0.35491684079170227, mean loss: 0.37174701101620755
Epoch: 9, step: 1408, loss: 0.33859553933143616, mean loss: 0.3717447096297664
Epoch: 9, step: 1409, loss: 0.34541189670562744, mean loss: 0.3717428817238297
Epoch: 9, step: 1410, loss: 0.3235062062740326, mean loss: 0.37173953358227
Epoch: 9, step: 1411, loss: 0.3109486997127533, mean loss: 0.3717353143406078
Epoch: 9, step: 1412, loss: 0.32381471991539, mean loss: 0.3717319886001383
Epoch: 9, step: 1413, loss: 0.3052413761615753, mean loss: 0.37172737440080184
Epoch: 9, step: 1414, loss: 0.29547685384750366, mean loss: 0.37172208326760126
Epoch: 9, step: 1415, loss: 0.3314899802207947, mean loss: 0.37171929169786444
Epoch: 9, step: 1416, loss: 0.3036314845085144, mean loss: 0.3717145676426928
Epoch: 9, step: 1417, loss: 0.33484458923339844, mean loss: 0.3717120097144002
Epoch: 9, step: 1418, loss: 0.32949358224868774, mean loss: 0.3717090809299767
Epoch: 9, step: 1419, loss: 0.322617769241333, mean loss: 0.37170567559481515
Epoch: 9, step: 1420, loss: 0.363518625497818, mean loss: 0.3717051077200772
Epoch: 9, step: 1421, loss: 0.3288857042789459, mean loss: 0.3717021378627155
Epoch: 9, step: 1422, loss: 0.4256137013435364, mean loss: 0.3717058767879864
Epoch: 9, step: 1423, loss: 0.3615949749946594, mean loss: 0.3717051756158787
Epoch: 9, step: 1424, loss: 0.33834171295166016, mean loss: 0.37170286208265185
Epoch: 9, step: 1425, loss: 0.3763556182384491, mean loss: 0.3717031846978339
Epoch: 9, step: 1426, loss: 0.3493478000164032, mean loss: 0.37170163471622947
Epoch: 9, step: 1427, loss: 0.33309802412986755, mean loss: 0.3716989583705149
Epoch: 9, step: 1428, loss: 0.35765141248703003, mean loss: 0.3716979845371781
Epoch: 9, step: 1429, loss: 0.3416944742202759, mean loss: 0.3716959047153067
Epoch: 9, step: 1430, loss: 0.32091712951660156, mean loss: 0.3716923850109192
Epoch: 9, step: 1431, loss: 0.3193408250808716, mean loss: 0.3716887565412817
Epoch: 9, step: 1432, loss: 0.32061174511909485, mean loss: 0.37168521665553617
Epoch: 9, step: 1433, loss: 0.3525194525718689, mean loss: 0.371683888466757
Epoch: 9, step: 1434, loss: 0.33885300159454346, mean loss: 0.37168161344168094
Epoch: 9, step: 1435, loss: 0.30473020672798157, mean loss: 0.37167697434753505
Epoch: 9, step: 1436, loss: 0.366562157869339, mean loss: 0.37167661996407503
Epoch: 9, step: 1437, loss: 0.32833629846572876, mean loss: 0.3716736173091285
Epoch: 9, step: 1438, loss: 0.3319156765937805, mean loss: 0.3716708630354385
Epoch: 9, step: 1439, loss: 0.31815990805625916, mean loss: 0.3716671562638273
Epoch: 9, step: 1440, loss: 0.33917149901390076, mean loss: 0.37166490540442093
Epoch: 9, step: 1441, loss: 0.3624466359615326, mean loss: 0.37166426693167937
Epoch: 9, step: 1442, loss: 0.3739016652107239, mean loss: 0.3716644218868895
Epoch: 9, step: 1443, loss: 0.3379571735858917, mean loss: 0.3716620875899157
Valid: 9, mean loss: 0.19768135994672775
Epoch: 10, step: 0, loss: 0.310139536857605, mean loss: 0.3716578273204931
Epoch: 10, step: 1, loss: 0.32257547974586487, mean loss: 0.3716544287366699
Epoch: 10, step: 2, loss: 0.37633249163627625, mean loss: 0.37165475263495273
Epoch: 10, step: 3, loss: 0.35281720757484436, mean loss: 0.37165344845708925
Epoch: 10, step: 4, loss: 0.370681494474411, mean loss: 0.3716533811705553
Epoch: 10, step: 5, loss: 0.29914963245391846, mean loss: 0.3716483622207618
Epoch: 10, step: 6, loss: 0.33068299293518066, mean loss: 0.3716455266584108
Epoch: 10, step: 7, loss: 0.319349467754364, mean loss: 0.3716419070530049
Epoch: 10, step: 8, loss: 0.44445812702178955, mean loss: 0.3716469465865345
Epoch: 10, step: 9, loss: 0.3210945725440979, mean loss: 0.37164344815234474
Epoch: 10, step: 10, loss: 0.3371257781982422, mean loss: 0.371641059551559
Epoch: 10, step: 11, loss: 0.33824488520622253, mean loss: 0.3716387487174637
Epoch: 10, step: 12, loss: 0.33646664023399353, mean loss: 0.3716363151667487
Epoch: 10, step: 13, loss: 0.3167838156223297, mean loss: 0.3716325201965298
Epoch: 10, step: 14, loss: 0.31573474407196045, mean loss: 0.37162865317638977
Epoch: 10, step: 15, loss: 0.3813493847846985, mean loss: 0.3716293256121679
Epoch: 10, step: 16, loss: 0.28911513090133667, mean loss: 0.37162361805218236
Epoch: 10, step: 17, loss: 0.38581857085227966, mean loss: 0.3716245998582966
Epoch: 10, step: 18, loss: 0.3366738557815552, mean loss: 0.37162218262722413
Epoch: 10, step: 19, loss: 0.39805054664611816, mean loss: 0.3716240103149156
Epoch: 10, step: 20, loss: 0.3063697814941406, mean loss: 0.3716194978863961
Epoch: 10, step: 21, loss: 0.332561731338501, mean loss: 0.3716167971695832
Epoch: 10, step: 22, loss: 0.3343413472175598, mean loss: 0.3716142198723453
Epoch: 10, step: 23, loss: 0.3576417863368988, mean loss: 0.3716132538578586
Epoch: 10, step: 24, loss: 0.38197943568229675, mean loss: 0.371613970496768
Epoch: 10, step: 25, loss: 0.34274372458457947, mean loss: 0.3716119747656804
Epoch: 10, step: 26, loss: 0.3577764928340912, mean loss: 0.3716110184179973
Epoch: 10, step: 27, loss: 0.33458343148231506, mean loss: 0.3716084591432575
Epoch: 10, step: 28, loss: 0.3313969671726227, mean loss: 0.37160567999528804
Epoch: 10, step: 29, loss: 0.33071595430374146, mean loss: 0.371602854167666
Epoch: 10, step: 30, loss: 0.32745063304901123, mean loss: 0.3715998030847333
Epoch: 10, step: 31, loss: 0.3702431619167328, mean loss: 0.37159970934225345
Epoch: 10, step: 32, loss: 0.324553906917572, mean loss: 0.37159645875133074
Epoch: 10, step: 33, loss: 0.3508412539958954, mean loss: 0.3715950247866523
Epoch: 10, step: 34, loss: 0.31655648350715637, mean loss: 0.37159122246946547
Epoch: 10, step: 35, loss: 0.32037365436553955, mean loss: 0.3715876843672201
Epoch: 10, step: 36, loss: 0.32833975553512573, mean loss: 0.37158469701287655
Epoch: 10, step: 37, loss: 0.29747965931892395, mean loss: 0.3715795785546852
Epoch: 10, step: 38, loss: 0.3167562782764435, mean loss: 0.3715757921536714
Epoch: 10, step: 39, loss: 0.3191714286804199, mean loss: 0.3715721730677962
Epoch: 10, step: 40, loss: 0.39023399353027344, mean loss: 0.37157346177855255
Epoch: 10, step: 41, loss: 0.369790643453598, mean loss: 0.3715733386727436
Epoch: 10, step: 42, loss: 0.3641650676727295, mean loss: 0.37157282715779505
Epoch: 10, step: 43, loss: 0.34206336736679077, mean loss: 0.37157078977448993
Epoch: 10, step: 44, loss: 0.324738472700119, mean loss: 0.3715675566148714
Epoch: 10, step: 45, loss: 0.3335256278514862, mean loss: 0.37156493049801625
Epoch: 10, step: 46, loss: 0.3342377841472626, mean loss: 0.3715623539020094
Epoch: 10, step: 47, loss: 0.3632556200027466, mean loss: 0.3715617805493107
Epoch: 10, step: 48, loss: 0.3292742371559143, mean loss: 0.3715588619529001
Epoch: 10, step: 49, loss: 0.3419531583786011, mean loss: 0.37155681877114893
Epoch: 10, step: 50, loss: 0.3117212951183319, mean loss: 0.3715526896203896
Epoch: 10, step: 51, loss: 0.32633838057518005, mean loss: 0.37154956967082814
Epoch: 10, step: 52, loss: 0.3194847106933594, mean loss: 0.37154597725662974
Epoch: 10, step: 53, loss: 0.3153301477432251, mean loss: 0.37154209869794935
Epoch: 10, step: 54, loss: 0.3300819993019104, mean loss: 0.3715392383944381
Epoch: 10, step: 55, loss: 0.3238779306411743, mean loss: 0.3715359505006913
Epoch: 10, step: 56, loss: 0.29153281450271606, mean loss: 0.3715304319012571
Epoch: 10, step: 57, loss: 0.3345770835876465, mean loss: 0.3715278830429102
Epoch: 10, step: 58, loss: 0.3823949694633484, mean loss: 0.3715286325488361
Epoch: 10, step: 59, loss: 0.3410678803920746, mean loss: 0.37152653180730805
Epoch: 10, step: 60, loss: 0.32028722763061523, mean loss: 0.37152299830588215
Epoch: 10, step: 61, loss: 0.34466198086738586, mean loss: 0.37152114607740067
Epoch: 10, step: 62, loss: 0.3100896179676056, mean loss: 0.37151691029665806
Epoch: 10, step: 63, loss: 0.3350980579853058, mean loss: 0.3715143993443476
Epoch: 10, step: 64, loss: 0.30235496163368225, mean loss: 0.37150963137208215
Epoch: 10, step: 65, loss: 0.31870168447494507, mean loss: 0.37150599095109105
Epoch: 10, step: 66, loss: 0.3552100360393524, mean loss: 0.3715048676344224
Epoch: 10, step: 67, loss: 0.33272460103034973, mean loss: 0.3715021946080505
Epoch: 10, step: 68, loss: 0.37051519751548767, mean loss: 0.3715021265815089
Epoch: 10, step: 69, loss: 0.33902886509895325, mean loss: 0.37149988858967686
Epoch: 10, step: 70, loss: 0.3212629556655884, mean loss: 0.3714964265999502
Epoch: 10, step: 71, loss: 0.33340826630592346, mean loss: 0.3714938020023555
Epoch: 10, step: 72, loss: 0.31084755063056946, mean loss: 0.37148962324872964
Epoch: 10, step: 73, loss: 0.39361661672592163, mean loss: 0.37149114777632214
Epoch: 10, step: 74, loss: 0.34166765213012695, mean loss: 0.3714890931090368
Epoch: 10, step: 75, loss: 0.3596358895301819, mean loss: 0.3714882765477542
Epoch: 10, step: 76, loss: 0.3141727149486542, mean loss: 0.3714843283792897
Epoch: 10, step: 77, loss: 0.3495485484600067, mean loss: 0.3714828174425271
Epoch: 10, step: 78, loss: 0.36850953102111816, mean loss: 0.3714826126566313
Epoch: 10, step: 79, loss: 0.3313419818878174, mean loss: 0.37147984815038
Epoch: 10, step: 80, loss: 0.3499126732349396, mean loss: 0.3714783629100442
Epoch: 10, step: 81, loss: 0.3393377363681793, mean loss: 0.3714761496731249
Epoch: 10, step: 82, loss: 0.3404434025287628, mean loss: 0.3714740128730737
Epoch: 10, step: 83, loss: 0.3485649824142456, mean loss: 0.3714724355506791
Epoch: 10, step: 84, loss: 0.34576913714408875, mean loss: 0.3714706659604274
Epoch: 10, step: 85, loss: 0.30717095732688904, mean loss: 0.371466239434981
Epoch: 10, step: 86, loss: 0.3440168499946594, mean loss: 0.3714643498920995
Epoch: 10, step: 87, loss: 0.2960372865200043, mean loss: 0.37145915805128366
Epoch: 10, step: 88, loss: 0.335812509059906, mean loss: 0.3714567045686633
Epoch: 10, step: 89, loss: 0.3387836813926697, mean loss: 0.3714544559091192
Epoch: 10, step: 90, loss: 0.3460600972175598, mean loss: 0.3714527083102828
Epoch: 10, step: 91, loss: 0.3381483256816864, mean loss: 0.37145041651406563
Epoch: 10, step: 92, loss: 0.3422309160232544, mean loss: 0.371448405951863
Epoch: 10, step: 93, loss: 0.3230542838573456, mean loss: 0.37144507623381606
Epoch: 10, step: 94, loss: 0.3126632571220398, mean loss: 0.37144103207701445
Epoch: 10, step: 95, loss: 0.3286490738391876, mean loss: 0.3714380882163762
Epoch: 10, step: 96, loss: 0.35618144273757935, mean loss: 0.3714370387119751
Epoch: 10, step: 97, loss: 0.3468870222568512, mean loss: 0.3714353500328958
Epoch: 10, step: 98, loss: 0.35997340083122253, mean loss: 0.3714345616740539
Epoch: 10, step: 99, loss: 0.34075137972831726, mean loss: 0.3714324514139476
Epoch: 10, step: 100, loss: 0.34206002950668335, mean loss: 0.37143043144132487
Epoch: 10, step: 101, loss: 0.32542869448661804, mean loss: 0.37142726807060866
Epoch: 10, step: 102, loss: 0.30134016275405884, mean loss: 0.371422448768861
Epoch: 10, step: 103, loss: 0.3325933516025543, mean loss: 0.37141977900145406
Epoch: 10, step: 104, loss: 0.35829946398735046, mean loss: 0.3714188769516078
Epoch: 10, step: 105, loss: 0.33108699321746826, mean loss: 0.3714161042385778
Epoch: 10, step: 106, loss: 0.35643312335014343, mean loss: 0.3714150742680761
Epoch: 10, step: 107, loss: 0.3450315594673157, mean loss: 0.37141326071880465
Epoch: 10, step: 108, loss: 0.3506299555301666, mean loss: 0.3714118322147708
Epoch: 10, step: 109, loss: 0.3394111692905426, mean loss: 0.37140963285649425
Epoch: 10, step: 110, loss: 0.3299661874771118, mean loss: 0.371406784705482
Epoch: 10, step: 111, loss: 0.35498958826065063, mean loss: 0.37140565653090496
Epoch: 10, step: 112, loss: 0.3749714493751526, mean loss: 0.37140590155205827
Epoch: 10, step: 113, loss: 0.31882932782173157, mean loss: 0.3714022890349681
Epoch: 10, step: 114, loss: 0.3577723205089569, mean loss: 0.37140135258917445
Epoch: 10, step: 115, loss: 0.3374727964401245, mean loss: 0.3713990216908405
Epoch: 10, step: 116, loss: 0.3644048571586609, mean loss: 0.37139854122339994
Epoch: 10, step: 117, loss: 0.35539868474006653, mean loss: 0.37139744218119064
Epoch: 10, step: 118, loss: 0.39005306363105774, mean loss: 0.37139872356187953
Epoch: 10, step: 119, loss: 0.37177085876464844, mean loss: 0.371398749120616
Epoch: 10, step: 120, loss: 0.30710500478744507, mean loss: 0.37139433364473295
Epoch: 10, step: 121, loss: 0.359760046005249, mean loss: 0.37139353469626163
Epoch: 10, step: 122, loss: 0.3422873318195343, mean loss: 0.37139153605567404
Epoch: 10, step: 123, loss: 0.3343862295150757, mean loss: 0.37138899518046525
Epoch: 10, step: 124, loss: 0.32862237095832825, mean loss: 0.37138605892064913
Epoch: 10, step: 125, loss: 0.3710445165634155, mean loss: 0.37138603547273225
Epoch: 10, step: 126, loss: 0.3578910231590271, mean loss: 0.37138510906288025
Epoch: 10, step: 127, loss: 0.3422985374927521, mean loss: 0.3713831124558257
Epoch: 10, step: 128, loss: 0.3269377052783966, mean loss: 0.3713800617723761
Epoch: 10, step: 129, loss: 0.3666118085384369, mean loss: 0.3713797345072262
Epoch: 10, step: 130, loss: 0.3575437366962433, mean loss: 0.3713787849500365
Epoch: 10, step: 131, loss: 0.324161559343338, mean loss: 0.3713755446792702
Epoch: 10, step: 132, loss: 0.33976975083351135, mean loss: 0.3713733758880916
Epoch: 10, step: 133, loss: 0.33833086490631104, mean loss: 0.37137110866488715
Epoch: 10, step: 134, loss: 0.3180542290210724, mean loss: 0.3713674505599373
Epoch: 10, step: 135, loss: 0.3859662711620331, mean loss: 0.3713684521255659
Epoch: 10, step: 136, loss: 0.3412892520427704, mean loss: 0.3713663886557105
Epoch: 10, step: 137, loss: 0.33950212597846985, mean loss: 0.37136420287832833
Epoch: 10, step: 138, loss: 0.3631947934627533, mean loss: 0.37136364252374876
Epoch: 10, step: 139, loss: 0.3438502550125122, mean loss: 0.37136175546013345
Epoch: 10, step: 140, loss: 0.345965176820755, mean loss: 0.37136001370177396
Epoch: 10, step: 141, loss: 0.3312259912490845, mean loss: 0.37135726140288133
Epoch: 10, step: 142, loss: 0.34232258796691895, mean loss: 0.37135527040833727
Epoch: 10, step: 143, loss: 0.35009390115737915, mean loss: 0.3713538125525192
Epoch: 10, step: 144, loss: 0.34259089827537537, mean loss: 0.3713518404637789
Epoch: 10, step: 145, loss: 0.3546842336654663, mean loss: 0.37135069775112306
Epoch: 10, step: 146, loss: 0.34534674882888794, mean loss: 0.3713489150714136
Epoch: 10, step: 147, loss: 0.3373377025127411, mean loss: 0.37134658362004547
Epoch: 10, step: 148, loss: 0.30956268310546875, mean loss: 0.37134234865531074
Epoch: 10, step: 149, loss: 0.3175744116306305, mean loss: 0.3713386633957477
Epoch: 10, step: 150, loss: 0.3753376305103302, mean loss: 0.37133893746655267
Epoch: 10, step: 151, loss: 0.31992077827453613, mean loss: 0.3713354137440203
Epoch: 10, step: 152, loss: 0.3127438426017761, mean loss: 0.37133139869768694
Epoch: 10, step: 153, loss: 0.39921021461486816, mean loss: 0.3713333089906784
Epoch: 10, step: 154, loss: 0.39196252822875977, mean loss: 0.37133472243495647
Epoch: 10, step: 155, loss: 0.37794631719589233, mean loss: 0.3713351754080149
Epoch: 10, step: 156, loss: 0.3834148347377777, mean loss: 0.3713360029519849
Epoch: 10, step: 157, loss: 0.3488726317882538, mean loss: 0.37133446415412463
Epoch: 10, step: 158, loss: 0.3530035614967346, mean loss: 0.37133320852684487
Epoch: 10, step: 159, loss: 0.34920063614845276, mean loss: 0.3713316925972299
Epoch: 10, step: 160, loss: 0.36945468187332153, mean loss: 0.37133156404365664
Epoch: 10, step: 161, loss: 0.3614101707935333, mean loss: 0.3713308845892497
Epoch: 10, step: 162, loss: 0.30979833006858826, mean loss: 0.37132667089654814
Epoch: 10, step: 163, loss: 0.3299977779388428, mean loss: 0.37132384092578957
Epoch: 10, step: 164, loss: 0.33573803305625916, mean loss: 0.3713214043761237
Epoch: 10, step: 165, loss: 0.35679057240486145, mean loss: 0.3713204095225039
Epoch: 10, step: 166, loss: 0.3429155945777893, mean loss: 0.3713184649195776
Epoch: 10, step: 167, loss: 0.33766016364097595, mean loss: 0.3713161608189972
Epoch: 10, step: 168, loss: 0.3182120621204376, mean loss: 0.37131252579273266
Epoch: 10, step: 169, loss: 0.37489521503448486, mean loss: 0.37131277101444665
Epoch: 10, step: 170, loss: 0.3560318946838379, mean loss: 0.37131172516704875
Epoch: 10, step: 171, loss: 0.3705589473247528, mean loss: 0.3713116736492659
Epoch: 10, step: 172, loss: 0.3277173936367035, mean loss: 0.37130869039599745
Epoch: 10, step: 173, loss: 0.3889571726322174, mean loss: 0.37130989803813763
Epoch: 10, step: 174, loss: 0.3704068660736084, mean loss: 0.37130983625011404
Epoch: 10, step: 175, loss: 0.3425792157649994, mean loss: 0.3713078705535839
Epoch: 10, step: 176, loss: 0.31135469675064087, mean loss: 0.3713037689476591
Epoch: 10, step: 177, loss: 0.3298725187778473, mean loss: 0.37130093468509445
Epoch: 10, step: 178, loss: 0.35726454854011536, mean loss: 0.3712999745382893
Epoch: 10, step: 179, loss: 0.3461654484272003, mean loss: 0.3712982553504568
Epoch: 10, step: 180, loss: 0.32462722063064575, mean loss: 0.37129506329555495
Epoch: 10, step: 181, loss: 0.38636717200279236, mean loss: 0.37129609407853315
Epoch: 10, step: 182, loss: 0.35016608238220215, mean loss: 0.3712946490938039
Epoch: 10, step: 183, loss: 0.3239874243736267, mean loss: 0.37129141419058176
Epoch: 10, step: 184, loss: 0.33311164379119873, mean loss: 0.3712888036079903
Epoch: 10, step: 185, loss: 0.3293277621269226, mean loss: 0.3712859346731154
Epoch: 10, step: 186, loss: 0.326386421918869, mean loss: 0.37128286504074004
Epoch: 10, step: 187, loss: 0.32712259888648987, mean loss: 0.3712798461546207
Epoch: 10, step: 188, loss: 0.32957011461257935, mean loss: 0.37127699498697136
Epoch: 10, step: 189, loss: 0.33853599429130554, mean loss: 0.37127475705117535
Epoch: 10, step: 190, loss: 0.3557232916355133, mean loss: 0.3712736941391792
Epoch: 10, step: 191, loss: 0.342547744512558, mean loss: 0.37127173091134796
Epoch: 10, step: 192, loss: 0.33965441584587097, mean loss: 0.3712695702255648
Epoch: 10, step: 193, loss: 0.3343413770198822, mean loss: 0.3712670467737945
Epoch: 10, step: 194, loss: 0.3363703191280365, mean loss: 0.3712646623031662
Epoch: 10, step: 195, loss: 0.3644770681858063, mean loss: 0.37126419854297776
Epoch: 10, step: 196, loss: 0.3159344494342804, mean loss: 0.37126041841391383
Epoch: 10, step: 197, loss: 0.3679260015487671, mean loss: 0.3712601906220799
Epoch: 10, step: 198, loss: 0.30609726905822754, mean loss: 0.37125573929879524
Epoch: 10, step: 199, loss: 0.3532249331474304, mean loss: 0.3712545076863532
Epoch: 10, step: 200, loss: 0.3771745264530182, mean loss: 0.37125491203160055
Epoch: 10, step: 201, loss: 0.38507211208343506, mean loss: 0.3712558557005018
Epoch: 10, step: 202, loss: 0.33819350600242615, mean loss: 0.3712535978059653
Epoch: 10, step: 203, loss: 0.3661328852176666, mean loss: 0.3712532481260562
Epoch: 10, step: 204, loss: 0.39607465267181396, mean loss: 0.37125494299833656
Epoch: 10, step: 205, loss: 0.3479151725769043, mean loss: 0.3712533494048352
Epoch: 10, step: 206, loss: 0.31439557671546936, mean loss: 0.3712494675332786
Epoch: 10, step: 207, loss: 0.39696642756462097, mean loss: 0.37125122319685255
Epoch: 10, step: 208, loss: 0.328229159116745, mean loss: 0.37124828633672013
Epoch: 10, step: 209, loss: 0.3466326892375946, mean loss: 0.3712466060911844
Epoch: 10, step: 210, loss: 0.34659096598625183, mean loss: 0.37124492322720887
Epoch: 10, step: 211, loss: 0.32228705286979675, mean loss: 0.3712415818492156
Epoch: 10, step: 212, loss: 0.32487064599990845, mean loss: 0.3712384172456634
Epoch: 10, step: 213, loss: 0.32496094703674316, mean loss: 0.37123525923623196
Epoch: 10, step: 214, loss: 0.33419087529182434, mean loss: 0.3712327314720597
Epoch: 10, step: 215, loss: 0.3236406743526459, mean loss: 0.37122948419742
Epoch: 10, step: 216, loss: 0.35789087414741516, mean loss: 0.3712285741469288
Epoch: 10, step: 217, loss: 0.31046396493911743, mean loss: 0.3712244286557835
Epoch: 10, step: 218, loss: 0.30305784940719604, mean loss: 0.37121977850370974
Epoch: 10, step: 219, loss: 0.3311450481414795, mean loss: 0.37121704489318025
Epoch: 10, step: 220, loss: 0.3349824845790863, mean loss: 0.37121457340008196
Epoch: 10, step: 221, loss: 0.35982757806777954, mean loss: 0.371213796766926
Epoch: 10, step: 222, loss: 0.3494703769683838, mean loss: 0.3712123138903115
Epoch: 10, step: 223, loss: 0.3228473365306854, mean loss: 0.3712090156785439
Epoch: 10, step: 224, loss: 0.33037322759628296, mean loss: 0.37120623110383666
Epoch: 10, step: 225, loss: 0.30572786927223206, mean loss: 0.3712017664671374
Epoch: 10, step: 226, loss: 0.32568907737731934, mean loss: 0.37119866339976915
Epoch: 10, step: 227, loss: 0.3554706871509552, mean loss: 0.37119759113523076
Epoch: 10, step: 228, loss: 0.3287704288959503, mean loss: 0.3711946988343078
Epoch: 10, step: 229, loss: 0.3404003977775574, mean loss: 0.37119259969994806
Epoch: 10, step: 230, loss: 0.3147089183330536, mean loss: 0.37118874967736154
Epoch: 10, step: 231, loss: 0.34755945205688477, mean loss: 0.37118713917452484
Epoch: 10, step: 232, loss: 0.317848265171051, mean loss: 0.3711835040028487
Epoch: 10, step: 233, loss: 0.29941338300704956, mean loss: 0.37117861303099403
Epoch: 10, step: 234, loss: 0.3326743245124817, mean loss: 0.37117598922939143
Epoch: 10, step: 235, loss: 0.34649473428726196, mean loss: 0.37117430748675434
Epoch: 10, step: 236, loss: 0.34198787808418274, mean loss: 0.3711723189039784
Epoch: 10, step: 237, loss: 0.3372777998447418, mean loss: 0.3711700096984286
Epoch: 10, step: 238, loss: 0.30517956614494324, mean loss: 0.3711655141303686
Epoch: 10, step: 239, loss: 0.3222457766532898, mean loss: 0.3711621817231835
Epoch: 10, step: 240, loss: 0.33767709136009216, mean loss: 0.3711599008778485
Epoch: 10, step: 241, loss: 0.3172275125980377, mean loss: 0.3711562275098959
Epoch: 10, step: 242, loss: 0.3619716167449951, mean loss: 0.3711556019830441
Epoch: 10, step: 243, loss: 0.31918856501579285, mean loss: 0.37115206295846176
Epoch: 10, step: 244, loss: 0.34023362398147583, mean loss: 0.37114995751488145
Epoch: 10, step: 245, loss: 0.35174545645713806, mean loss: 0.3711486362224221
Epoch: 10, step: 246, loss: 0.3727854788303375, mean loss: 0.3711487476708192
Epoch: 10, step: 247, loss: 0.29305499792099, mean loss: 0.37114343083055845
Epoch: 10, step: 248, loss: 0.3610975742340088, mean loss: 0.3711427469271888
Epoch: 10, step: 249, loss: 0.3329361379146576, mean loss: 0.37114014606884893
Epoch: 10, step: 250, loss: 0.3180761933326721, mean loss: 0.3711365340647147
Epoch: 10, step: 251, loss: 0.31507304310798645, mean loss: 0.3711327181451015
Epoch: 10, step: 252, loss: 0.31283751130104065, mean loss: 0.37112875059546263
Epoch: 10, step: 253, loss: 0.4109998345375061, mean loss: 0.371131464021619
Epoch: 10, step: 254, loss: 0.31839126348495483, mean loss: 0.3711278750321303
Epoch: 10, step: 255, loss: 0.33383679389953613, mean loss: 0.37112533753341415
Epoch: 10, step: 256, loss: 0.3155137002468109, mean loss: 0.3711215536566171
Epoch: 10, step: 257, loss: 0.33055317401885986, mean loss: 0.3711187935273724
Epoch: 10, step: 258, loss: 0.3221079409122467, mean loss: 0.37111545922894296
Epoch: 10, step: 259, loss: 0.32541751861572266, mean loss: 0.3711123505254999
Epoch: 10, step: 260, loss: 0.3383306562900543, mean loss: 0.37111012062996657
Epoch: 10, step: 261, loss: 0.33544063568115234, mean loss: 0.3711076944644824
Epoch: 10, step: 262, loss: 0.3334355354309082, mean loss: 0.37110513225547515
Epoch: 10, step: 263, loss: 0.3211383521556854, mean loss: 0.37110173407946184
Epoch: 10, step: 264, loss: 0.351717472076416, mean loss: 0.3711004158705531
Epoch: 10, step: 265, loss: 0.3604210317134857, mean loss: 0.37109968967824
Epoch: 10, step: 266, loss: 0.3487151265144348, mean loss: 0.37109816764361947
Epoch: 10, step: 267, loss: 0.3711613714694977, mean loss: 0.3710981719408608
Epoch: 10, step: 268, loss: 0.30381321907043457, mean loss: 0.3710935975338399
Epoch: 10, step: 269, loss: 0.29859012365341187, mean loss: 0.37108866867769574
Epoch: 10, step: 270, loss: 0.35594072937965393, mean loss: 0.3710876389761596
Epoch: 10, step: 271, loss: 0.40206995606422424, mean loss: 0.3710897448976582
Epoch: 10, step: 272, loss: 0.34623607993125916, mean loss: 0.3710880556660286
Epoch: 10, step: 273, loss: 0.3310633599758148, mean loss: 0.3710853354882598
Epoch: 10, step: 274, loss: 0.3452712893486023, mean loss: 0.3710835812207681
Epoch: 10, step: 275, loss: 0.3206871449947357, mean loss: 0.3710801566192306
Epoch: 10, step: 276, loss: 0.32692083716392517, mean loss: 0.371077156053935
Epoch: 10, step: 277, loss: 0.3109202980995178, mean loss: 0.371073068755528
Epoch: 10, step: 278, loss: 0.3734699785709381, mean loss: 0.37107323160013805
Epoch: 10, step: 279, loss: 0.3549487292766571, mean loss: 0.37107213618557805
Epoch: 10, step: 280, loss: 0.33920127153396606, mean loss: 0.3710699711923947
Epoch: 10, step: 281, loss: 0.34005796909332275, mean loss: 0.3710678646849841
Epoch: 10, step: 282, loss: 0.2930767238140106, mean loss: 0.37106256745338245
Epoch: 10, step: 283, loss: 0.3591599762439728, mean loss: 0.37106175907310474
Epoch: 10, step: 284, loss: 0.33640405535697937, mean loss: 0.37105940540901533
Epoch: 10, step: 285, loss: 0.33541250228881836, mean loss: 0.37105698473109056
Epoch: 10, step: 286, loss: 0.30108949542045593, mean loss: 0.3710522337642059
Epoch: 10, step: 287, loss: 0.3347243070602417, mean loss: 0.37104976717494026
Epoch: 10, step: 288, loss: 0.3245584964752197, mean loss: 0.3710466107304634
Epoch: 10, step: 289, loss: 0.32763031125068665, mean loss: 0.371043663255957
Epoch: 10, step: 290, loss: 0.3129359185695648, mean loss: 0.37103971866667684
Epoch: 10, step: 291, loss: 0.3540298342704773, mean loss: 0.37103856404514574
Epoch: 10, step: 292, loss: 0.3764917552471161, mean loss: 0.3710389341796195
Epoch: 10, step: 293, loss: 0.33944082260131836, mean loss: 0.3710367896084522
Epoch: 10, step: 294, loss: 0.36678218841552734, mean loss: 0.37103650086727863
Epoch: 10, step: 295, loss: 0.3431008756160736, mean loss: 0.3710346051272371
Epoch: 10, step: 296, loss: 0.3407624661922455, mean loss: 0.37103255096838966
Epoch: 10, step: 297, loss: 0.3251034915447235, mean loss: 0.3710294345985007
Epoch: 10, step: 298, loss: 0.3393241763114929, mean loss: 0.3710272834852442
Epoch: 10, step: 299, loss: 0.34958672523498535, mean loss: 0.37102582890191654
Epoch: 10, step: 300, loss: 0.341465562582016, mean loss: 0.3710238235924857
Epoch: 10, step: 301, loss: 0.350624144077301, mean loss: 0.3710224398128415
Epoch: 10, step: 302, loss: 0.3153553903102875, mean loss: 0.3710186639836682
Epoch: 10, step: 303, loss: 0.29935142397880554, mean loss: 0.37101380321047195
Epoch: 10, step: 304, loss: 0.3309404253959656, mean loss: 0.37101108545002337
Epoch: 10, step: 305, loss: 0.3468899130821228, mean loss: 0.3710094496727029
Epoch: 10, step: 306, loss: 0.31450578570365906, mean loss: 0.37100561813652816
Epoch: 10, step: 307, loss: 0.313114732503891, mean loss: 0.37100169279847334
Epoch: 10, step: 308, loss: 0.3652596175670624, mean loss: 0.37100130347884275
Epoch: 10, step: 309, loss: 0.30528613924980164, mean loss: 0.3709968482134713
Epoch: 10, step: 310, loss: 0.397024005651474, mean loss: 0.3709986126468953
Epoch: 10, step: 311, loss: 0.33073389530181885, mean loss: 0.37099588320564364
Epoch: 10, step: 312, loss: 0.32068973779678345, mean loss: 0.3709924733130517
Epoch: 10, step: 313, loss: 0.310525506734848, mean loss: 0.37098837496910575
Epoch: 10, step: 314, loss: 0.34753429889678955, mean loss: 0.37098678540109
Epoch: 10, step: 315, loss: 0.3498779833316803, mean loss: 0.37098535487777273
Epoch: 10, step: 316, loss: 0.36550092697143555, mean loss: 0.37098498322852785
Epoch: 10, step: 317, loss: 0.39396190643310547, mean loss: 0.3709865401416058
Epoch: 10, step: 318, loss: 0.33963829278945923, mean loss: 0.370984416132706
Epoch: 10, step: 319, loss: 0.3182401955127716, mean loss: 0.37098084267602444
Epoch: 10, step: 320, loss: 0.3664209544658661, mean loss: 0.370980533761438
Epoch: 10, step: 321, loss: 0.3335532248020172, mean loss: 0.37097799837944645
Epoch: 10, step: 322, loss: 0.3113802373409271, mean loss: 0.3709739614112802
Epoch: 10, step: 323, loss: 0.32970988750457764, mean loss: 0.37097116649974493
Epoch: 10, step: 324, loss: 0.3306627571582794, mean loss: 0.37096843650249867
Epoch: 10, step: 325, loss: 0.335244745016098, mean loss: 0.37096601718166117
Epoch: 10, step: 326, loss: 0.30713924765586853, mean loss: 0.3709616949246336
Epoch: 10, step: 327, loss: 0.34198564291000366, mean loss: 0.37095973284093814
Epoch: 10, step: 328, loss: 0.35124820470809937, mean loss: 0.3709583981853668
Epoch: 10, step: 329, loss: 0.39482182264328003, mean loss: 0.3709600138539151
Epoch: 10, step: 330, loss: 0.31801727414131165, mean loss: 0.3709564296186086
Epoch: 10, step: 331, loss: 0.38149338960647583, mean loss: 0.3709571429248628
Epoch: 10, step: 332, loss: 0.32662686705589294, mean loss: 0.37095414216158734
Epoch: 10, step: 333, loss: 0.350475937128067, mean loss: 0.37095275606404887
Epoch: 10, step: 334, loss: 0.3586047887802124, mean loss: 0.37095192033022256
Epoch: 10, step: 335, loss: 0.3107234239578247, mean loss: 0.37094784422732785
Epoch: 10, step: 336, loss: 0.33418241143226624, mean loss: 0.37094535620994984
Epoch: 10, step: 337, loss: 0.299909770488739, mean loss: 0.3709405493628987
Epoch: 10, step: 338, loss: 0.31521499156951904, mean loss: 0.370936778772345
Epoch: 10, step: 339, loss: 0.30630114674568176, mean loss: 0.3709324055902052
Epoch: 10, step: 340, loss: 0.327259361743927, mean loss: 0.370929450915701
Epoch: 10, step: 341, loss: 0.37614235281944275, mean loss: 0.3709298035677037
Epoch: 10, step: 342, loss: 0.3483431339263916, mean loss: 0.37092827568637776
Epoch: 10, step: 343, loss: 0.35320231318473816, mean loss: 0.3709270766899964
Epoch: 10, step: 344, loss: 0.3161333203315735, mean loss: 0.37092337065304287
Epoch: 10, step: 345, loss: 0.33219635486602783, mean loss: 0.37092075148519577
Epoch: 10, step: 346, loss: 0.32625412940979004, mean loss: 0.37091773081690094
Epoch: 10, step: 347, loss: 0.3449711203575134, mean loss: 0.3709159762449196
Epoch: 10, step: 348, loss: 0.3257303833961487, mean loss: 0.3709129208934524
Epoch: 10, step: 349, loss: 0.3774733245372772, mean loss: 0.3709133644636785
Epoch: 10, step: 350, loss: 0.35301733016967773, mean loss: 0.3709121545364056
Epoch: 10, step: 351, loss: 0.37014999985694885, mean loss: 0.37091210301161653
Epoch: 10, step: 352, loss: 0.32612359523773193, mean loss: 0.37090907532907924
Epoch: 10, step: 353, loss: 0.3288935124874115, mean loss: 0.37090623528833017
Epoch: 10, step: 354, loss: 0.3476971387863159, mean loss: 0.3709046665761638
Epoch: 10, step: 355, loss: 0.3304991126060486, mean loss: 0.3709019357331001
Epoch: 10, step: 356, loss: 0.3726274371147156, mean loss: 0.3709020523446688
Epoch: 10, step: 357, loss: 0.35346707701683044, mean loss: 0.3709008741465793
Epoch: 10, step: 358, loss: 0.3300047516822815, mean loss: 0.37089811070834267
Epoch: 10, step: 359, loss: 0.3184821605682373, mean loss: 0.37089456909008994
Epoch: 10, step: 360, loss: 0.3369978368282318, mean loss: 0.3708922789250834
Epoch: 10, step: 361, loss: 0.3077838122844696, mean loss: 0.37088801541564953
Epoch: 10, step: 362, loss: 0.3103393614292145, mean loss: 0.37088392511949425
Epoch: 10, step: 363, loss: 0.32223573327064514, mean loss: 0.3708806389676536
Epoch: 10, step: 364, loss: 0.3012310266494751, mean loss: 0.3708759345021137
Epoch: 10, step: 365, loss: 0.3278109133243561, mean loss: 0.37087302588255555
Epoch: 10, step: 366, loss: 0.3541380763053894, mean loss: 0.3708718956772758
Epoch: 10, step: 367, loss: 0.3388696014881134, mean loss: 0.3708697345282895
Epoch: 10, step: 368, loss: 0.37223196029663086, mean loss: 0.37086982651463346
Epoch: 10, step: 369, loss: 0.3527309000492096, mean loss: 0.37086860173904496
Epoch: 10, step: 370, loss: 0.3327622413635254, mean loss: 0.3708660288972128
Epoch: 10, step: 371, loss: 0.34714052081108093, mean loss: 0.37086442712107953
Epoch: 10, step: 372, loss: 0.3290954828262329, mean loss: 0.37086160737192037
Epoch: 10, step: 373, loss: 0.32079368829727173, mean loss: 0.37085822760149545
Epoch: 10, step: 374, loss: 0.30990129709243774, mean loss: 0.37085411306011784
Epoch: 10, step: 375, loss: 0.32234469056129456, mean loss: 0.3708508389360291
Epoch: 10, step: 376, loss: 0.3165678381919861, mean loss: 0.3708471753738543
Epoch: 10, step: 377, loss: 0.3018089234828949, mean loss: 0.3708425162935539
Epoch: 10, step: 378, loss: 0.37582695484161377, mean loss: 0.3708428526481357
Epoch: 10, step: 379, loss: 0.36882007122039795, mean loss: 0.37084271615816083
Epoch: 10, step: 380, loss: 0.34539175033569336, mean loss: 0.3708409989349085
Epoch: 10, step: 381, loss: 0.3181401789188385, mean loss: 0.37083744335401414
Epoch: 10, step: 382, loss: 0.308384507894516, mean loss: 0.3708332301086887
Epoch: 10, step: 383, loss: 0.3486558496952057, mean loss: 0.3708317340630591
Epoch: 10, step: 384, loss: 0.3201674818992615, mean loss: 0.3708283165755607
Epoch: 10, step: 385, loss: 0.3711606562137604, mean loss: 0.3708283389915622
Epoch: 10, step: 386, loss: 0.36014804244041443, mean loss: 0.3708276186640144
Epoch: 10, step: 387, loss: 0.3510274589061737, mean loss: 0.3708262833416677
Epoch: 10, step: 388, loss: 0.3928261697292328, mean loss: 0.37082776691347885
Epoch: 10, step: 389, loss: 0.30107754468917847, mean loss: 0.3708230635943808
Epoch: 10, step: 390, loss: 0.29666054248809814, mean loss: 0.3708180630872601
Epoch: 10, step: 391, loss: 0.34306299686431885, mean loss: 0.37081619179099373
Epoch: 10, step: 392, loss: 0.32590174674987793, mean loss: 0.37081316378283347
Epoch: 10, step: 393, loss: 0.3147774040699005, mean loss: 0.3708093862609437
Epoch: 10, step: 394, loss: 0.3394915759563446, mean loss: 0.370807275185089
Epoch: 10, step: 395, loss: 0.35085979104042053, mean loss: 0.3708059306525907
Epoch: 10, step: 396, loss: 0.33004230260849, mean loss: 0.3708031832219751
Epoch: 10, step: 397, loss: 0.36551550030708313, mean loss: 0.3708028268610831
Epoch: 10, step: 398, loss: 0.3858911991119385, mean loss: 0.37080384366627556
Epoch: 10, step: 399, loss: 0.30601465702056885, mean loss: 0.37079947781811884
Epoch: 10, step: 400, loss: 0.30402350425720215, mean loss: 0.37079497839263803
Epoch: 10, step: 401, loss: 0.33321359753608704, mean loss: 0.37079244629582786
Epoch: 10, step: 402, loss: 0.31255847215652466, mean loss: 0.3707885229667071
Epoch: 10, step: 403, loss: 0.34376874566078186, mean loss: 0.37078670271762965
Epoch: 10, step: 404, loss: 0.3512580692768097, mean loss: 0.3707853872152086
Epoch: 10, step: 405, loss: 0.3652847409248352, mean loss: 0.3707850167015153
Epoch: 10, step: 406, loss: 0.31161677837371826, mean loss: 0.37078103150327135
Epoch: 10, step: 407, loss: 0.34421515464782715, mean loss: 0.37077924231436676
Epoch: 10, step: 408, loss: 0.3676094710826874, mean loss: 0.3707790288473837
Epoch: 10, step: 409, loss: 0.33280789852142334, mean loss: 0.37077647186891055
Epoch: 10, step: 410, loss: 0.3150079846382141, mean loss: 0.37077271666810047
Epoch: 10, step: 411, loss: 0.33872658014297485, mean loss: 0.370770558969708
Epoch: 10, step: 412, loss: 0.3365918695926666, mean loss: 0.3707682578393386
Epoch: 10, step: 413, loss: 0.3643032908439636, mean loss: 0.37076782260526053
Epoch: 10, step: 414, loss: 0.31893500685691833, mean loss: 0.3707643333547894
Epoch: 10, step: 415, loss: 0.29989907145500183, mean loss: 0.370759563210612
Epoch: 10, step: 416, loss: 0.3282424807548523, mean loss: 0.3707567014563914
Epoch: 10, step: 417, loss: 0.3875574469566345, mean loss: 0.37075783221056424
Epoch: 10, step: 418, loss: 0.3364850580692291, mean loss: 0.37075552567754444
Epoch: 10, step: 419, loss: 0.3710561692714691, mean loss: 0.3707555459092802
Epoch: 10, step: 420, loss: 0.34264904260635376, mean loss: 0.3707536546164128
Epoch: 10, step: 421, loss: 0.3225705325603485, mean loss: 0.37075041258155506
Epoch: 10, step: 422, loss: 0.37631508708000183, mean loss: 0.3707507869793549
Epoch: 10, step: 423, loss: 0.32679954171180725, mean loss: 0.3707478300871813
Epoch: 10, step: 424, loss: 0.3455650508403778, mean loss: 0.370746135988342
Epoch: 10, step: 425, loss: 0.36867189407348633, mean loss: 0.37074599645908635
Epoch: 10, step: 426, loss: 0.345865398645401, mean loss: 0.3707443229137972
Epoch: 10, step: 427, loss: 0.312876433134079, mean loss: 0.37074043080391156
Epoch: 10, step: 428, loss: 0.3018621504306793, mean loss: 0.3707357984627741
Epoch: 10, step: 429, loss: 0.3518083989620209, mean loss: 0.3707345256047041
Epoch: 10, step: 430, loss: 0.39644932746887207, mean loss: 0.3707362547958724
Epoch: 10, step: 431, loss: 0.28987741470336914, mean loss: 0.37073081781092804
Epoch: 10, step: 432, loss: 0.3496525287628174, mean loss: 0.3707294005925425
Epoch: 10, step: 433, loss: 0.3182131052017212, mean loss: 0.3707258698479284
Epoch: 10, step: 434, loss: 0.35686010122299194, mean loss: 0.37072493769541576
Epoch: 10, step: 435, loss: 0.35683390498161316, mean loss: 0.3707240039072527
Epoch: 10, step: 436, loss: 0.32508572936058044, mean loss: 0.37072093620042024
Epoch: 10, step: 437, loss: 0.37808749079704285, mean loss: 0.37072143133112306
Epoch: 10, step: 438, loss: 0.3489198088645935, mean loss: 0.370719966069851
Epoch: 10, step: 439, loss: 0.3476845622062683, mean loss: 0.3707184179916344
Epoch: 10, step: 440, loss: 0.3378671109676361, mean loss: 0.3707162103908667
Epoch: 10, step: 441, loss: 0.32647404074668884, mean loss: 0.37071323752635627
Epoch: 10, step: 442, loss: 0.3329399824142456, mean loss: 0.3707106995128434
Epoch: 10, step: 443, loss: 0.3669528067111969, mean loss: 0.3707104470341548
Epoch: 10, step: 444, loss: 0.39470237493515015, mean loss: 0.37071205885329495
Epoch: 10, step: 445, loss: 0.33672574162483215, mean loss: 0.37070977574720676
Epoch: 10, step: 446, loss: 0.40308645367622375, mean loss: 0.3707119505761131
Epoch: 10, step: 447, loss: 0.38134193420410156, mean loss: 0.37071266457286406
Epoch: 10, step: 448, loss: 0.34288129210472107, mean loss: 0.3707107953155286
Epoch: 10, step: 449, loss: 0.3174622356891632, mean loss: 0.3707072191866081
Epoch: 10, step: 450, loss: 0.40316540002822876, mean loss: 0.3707093989046151
Epoch: 10, step: 451, loss: 0.37694671750068665, mean loss: 0.37070981774148026
Epoch: 10, step: 452, loss: 0.3230554461479187, mean loss: 0.37070661795825366
Epoch: 10, step: 453, loss: 0.3262391984462738, mean loss: 0.37070363236543025
Epoch: 10, step: 454, loss: 0.3404764235019684, mean loss: 0.3707016030127036
Epoch: 10, step: 455, loss: 0.296245276927948, mean loss: 0.3706966046019836
Epoch: 10, step: 456, loss: 0.3516519069671631, mean loss: 0.3706953261769561
Epoch: 10, step: 457, loss: 0.35679638385772705, mean loss: 0.3706943932368085
Epoch: 10, step: 458, loss: 0.31752532720565796, mean loss: 0.3706908246036095
Epoch: 10, step: 459, loss: 0.3965896666049957, mean loss: 0.37069256278092505
Epoch: 10, step: 460, loss: 0.3364643454551697, mean loss: 0.37069026573929525
Epoch: 10, step: 461, loss: 0.2970217168331146, mean loss: 0.37068532220494377
Epoch: 10, step: 462, loss: 0.3637674152851105, mean loss: 0.37068485800935097
Epoch: 10, step: 463, loss: 0.33640918135643005, mean loss: 0.37068255824575375
Epoch: 10, step: 464, loss: 0.326555460691452, mean loss: 0.3706795976890577
Epoch: 10, step: 465, loss: 0.36131736636161804, mean loss: 0.3706789696043048
Epoch: 10, step: 466, loss: 0.3362014591693878, mean loss: 0.37067665676399925
Epoch: 10, step: 467, loss: 0.3142109811306, mean loss: 0.3706728691549549
Epoch: 10, step: 468, loss: 0.36574238538742065, mean loss: 0.3706725384497589
Epoch: 10, step: 469, loss: 0.3604928255081177, mean loss: 0.3706718557057655
Epoch: 10, step: 470, loss: 0.33507540822029114, mean loss: 0.3706694684448517
Epoch: 10, step: 471, loss: 0.32083621621131897, mean loss: 0.3706661266226794
Epoch: 10, step: 472, loss: 0.30807146430015564, mean loss: 0.3706619293007239
Epoch: 10, step: 473, loss: 0.3575451970100403, mean loss: 0.3706610498094881
Epoch: 10, step: 474, loss: 0.37202000617980957, mean loss: 0.3706611409228887
Epoch: 10, step: 475, loss: 0.3116898536682129, mean loss: 0.37065718736380754
Epoch: 10, step: 476, loss: 0.33338892459869385, mean loss: 0.3706546889886138
Epoch: 10, step: 477, loss: 0.37798258662223816, mean loss: 0.3706551802004139
Epoch: 10, step: 478, loss: 0.334902822971344, mean loss: 0.3706527837692034
Epoch: 10, step: 479, loss: 0.3787562847137451, mean loss: 0.37065332689929353
Epoch: 10, step: 480, loss: 0.3286074697971344, mean loss: 0.37065050900122354
Epoch: 10, step: 481, loss: 0.3516978919506073, mean loss: 0.3706492388888358
Epoch: 10, step: 482, loss: 0.3607398271560669, mean loss: 0.37064857485266794
Epoch: 10, step: 483, loss: 0.3429449200630188, mean loss: 0.370646718537016
Epoch: 10, step: 484, loss: 0.32960236072540283, mean loss: 0.37064396849629155
Epoch: 10, step: 485, loss: 0.34055018424987793, mean loss: 0.3706419522974274
Epoch: 10, step: 486, loss: 0.29137012362480164, mean loss: 0.3706366416637654
Epoch: 10, step: 487, loss: 0.3070454001426697, mean loss: 0.3706323818003195
Epoch: 10, step: 488, loss: 0.3668425381183624, mean loss: 0.37063212794248024
Epoch: 10, step: 489, loss: 0.35248276591300964, mean loss: 0.3706309123120697
Epoch: 10, step: 490, loss: 0.32092759013175964, mean loss: 0.37062758344446667
Epoch: 10, step: 491, loss: 0.33077019453048706, mean loss: 0.37062491418456084
Epoch: 10, step: 492, loss: 0.3646526336669922, mean loss: 0.3706245142461347
Epoch: 10, step: 493, loss: 0.3648873567581177, mean loss: 0.3706241300786318
Epoch: 10, step: 494, loss: 0.3835255205631256, mean loss: 0.37062499391462006
Epoch: 10, step: 495, loss: 0.31430330872535706, mean loss: 0.3706212230465704
Epoch: 10, step: 496, loss: 0.3254387378692627, mean loss: 0.3706181981764374
Epoch: 10, step: 497, loss: 0.323930948972702, mean loss: 0.37061507277483047
Epoch: 10, step: 498, loss: 0.3891841471195221, mean loss: 0.37061631576795884
Epoch: 10, step: 499, loss: 0.3412868082523346, mean loss: 0.3706143526148453
Epoch: 10, step: 500, loss: 0.33019882440567017, mean loss: 0.3706116476065989
Epoch: 10, step: 501, loss: 0.3263452351093292, mean loss: 0.3706086850572416
Epoch: 10, step: 502, loss: 0.3000200092792511, mean loss: 0.37060396119484595
Epoch: 10, step: 503, loss: 0.31917494535446167, mean loss: 0.3706005197457132
Epoch: 10, step: 504, loss: 0.3327610492706299, mean loss: 0.3705979878306596
Epoch: 10, step: 505, loss: 0.37576746940612793, mean loss: 0.3705983337079228
Epoch: 10, step: 506, loss: 0.3283659517765045, mean loss: 0.37059550823244736
Epoch: 10, step: 507, loss: 0.3483169674873352, mean loss: 0.37059401782966805
Epoch: 10, step: 508, loss: 0.32708361744880676, mean loss: 0.3705911072403055
Epoch: 10, step: 509, loss: 0.34931379556655884, mean loss: 0.3705896840087554
Epoch: 10, step: 510, loss: 0.353498637676239, mean loss: 0.37058854087141796
Epoch: 10, step: 511, loss: 0.33611956238746643, mean loss: 0.37058623556253056
Epoch: 10, step: 512, loss: 0.328285813331604, mean loss: 0.3705834066705202
Epoch: 10, step: 513, loss: 0.3310275673866272, mean loss: 0.37058076150272
Epoch: 10, step: 514, loss: 0.4034276008605957, mean loss: 0.3705829578811458
Epoch: 10, step: 515, loss: 0.3313996493816376, mean loss: 0.3705803379755227
Epoch: 10, step: 516, loss: 0.3596092164516449, mean loss: 0.37057960446469007
Epoch: 10, step: 517, loss: 0.3663035035133362, mean loss: 0.37057931859084653
Epoch: 10, step: 518, loss: 0.34214136004447937, mean loss: 0.3705774175307124
Epoch: 10, step: 519, loss: 0.30204904079437256, mean loss: 0.37057283675686636
Epoch: 10, step: 520, loss: 0.3122406601905823, mean loss: 0.3705689378078278
Epoch: 10, step: 521, loss: 0.3188179135322571, mean loss: 0.37056547897717174
Epoch: 10, step: 522, loss: 0.32701802253723145, mean loss: 0.370562568634564
Epoch: 10, step: 523, loss: 0.3328830301761627, mean loss: 0.3705600506221035
Epoch: 10, step: 524, loss: 0.3542953133583069, mean loss: 0.3705589637702984
Epoch: 10, step: 525, loss: 0.3431365489959717, mean loss: 0.37055713145606783
Epoch: 10, step: 526, loss: 0.32365062832832336, mean loss: 0.3705539974610703
Epoch: 10, step: 527, loss: 0.3458250164985657, mean loss: 0.37055234533780984
Epoch: 10, step: 528, loss: 0.35922059416770935, mean loss: 0.37055158832323504
Epoch: 10, step: 529, loss: 0.3528161644935608, mean loss: 0.3705504035921843
Epoch: 10, step: 530, loss: 0.2914665639400482, mean loss: 0.3705451211234346
Epoch: 10, step: 531, loss: 0.3595091700553894, mean loss: 0.37054438401743217
Epoch: 10, step: 532, loss: 0.37240055203437805, mean loss: 0.37054450798510846
Epoch: 10, step: 533, loss: 0.35985976457595825, mean loss: 0.3705437944320559
Epoch: 10, step: 534, loss: 0.33003371953964233, mean loss: 0.37054108925176255
Epoch: 10, step: 535, loss: 0.30415260791778564, mean loss: 0.3705366562602205
Epoch: 10, step: 536, loss: 0.37233030796051025, mean loss: 0.3705367760206331
Epoch: 10, step: 537, loss: 0.3378494083881378, mean loss: 0.3705345936619983
Epoch: 10, step: 538, loss: 0.3082887530326843, mean loss: 0.370530438121533
Epoch: 10, step: 539, loss: 0.34894290566444397, mean loss: 0.37052899703124886
Epoch: 10, step: 540, loss: 0.302204966545105, mean loss: 0.3705244363189809
Epoch: 10, step: 541, loss: 0.3581269681453705, mean loss: 0.37052360882811364
Epoch: 10, step: 542, loss: 0.3516835570335388, mean loss: 0.370522351399575
Epoch: 10, step: 543, loss: 0.3570961058139801, mean loss: 0.37052145536076125
Epoch: 10, step: 544, loss: 0.3455379009246826, mean loss: 0.370519788123228
Epoch: 10, step: 545, loss: 0.3833729326725006, mean loss: 0.37052064580002964
Epoch: 10, step: 546, loss: 0.34777194261550903, mean loss: 0.3705191279043077
Epoch: 10, step: 547, loss: 0.31806355714797974, mean loss: 0.37051562806638694
Epoch: 10, step: 548, loss: 0.3428969979286194, mean loss: 0.37051378547314273
Epoch: 10, step: 549, loss: 0.32924404740333557, mean loss: 0.3705110323218372
Epoch: 10, step: 550, loss: 0.31997600197792053, mean loss: 0.3705076612971995
Epoch: 10, step: 551, loss: 0.3369634747505188, mean loss: 0.37050542382477775
Epoch: 10, step: 552, loss: 0.30502963066101074, mean loss: 0.3705010567339244
Epoch: 10, step: 553, loss: 0.3415833115577698, mean loss: 0.37049912811279756
Epoch: 10, step: 554, loss: 0.33718860149383545, mean loss: 0.3704969066705422
Epoch: 10, step: 555, loss: 0.3583126664161682, mean loss: 0.37049609417119206
Epoch: 10, step: 556, loss: 0.33412817120552063, mean loss: 0.3704936691579917
Epoch: 10, step: 557, loss: 0.36155012249946594, mean loss: 0.37049307284203903
Epoch: 10, step: 558, loss: 0.3434353470802307, mean loss: 0.37049126887339034
Epoch: 10, step: 559, loss: 0.3628699779510498, mean loss: 0.37049076078732884
Epoch: 10, step: 560, loss: 0.3394743800163269, mean loss: 0.37048869316645217
Epoch: 10, step: 561, loss: 0.32630470395088196, mean loss: 0.37048574795986533
Epoch: 10, step: 562, loss: 0.3064943552017212, mean loss: 0.37048148272006276
Epoch: 10, step: 563, loss: 0.32042258977890015, mean loss: 0.37047814635023196
Epoch: 10, step: 564, loss: 0.30932584404945374, mean loss: 0.3704740708885658
Epoch: 10, step: 565, loss: 0.3309912383556366, mean loss: 0.37047143975218483
Epoch: 10, step: 566, loss: 0.32471856474876404, mean loss: 0.3704683909832768
Epoch: 10, step: 567, loss: 0.33655846118927, mean loss: 0.37046613152633423
Epoch: 10, step: 568, loss: 0.3637012541294098, mean loss: 0.3704656808049406
Epoch: 10, step: 569, loss: 0.34213533997535706, mean loss: 0.37046379337383933
Epoch: 10, step: 570, loss: 0.34705790877342224, mean loss: 0.3704622341249818
Epoch: 10, step: 571, loss: 0.35244035720825195, mean loss: 0.3704610336269191
Epoch: 10, step: 572, loss: 0.36429181694984436, mean loss: 0.3704606227019423
Epoch: 10, step: 573, loss: 0.32947009801864624, mean loss: 0.37045789254844
Epoch: 10, step: 574, loss: 0.35014060139656067, mean loss: 0.37045653941549617
Epoch: 10, step: 575, loss: 0.3450039327144623, mean loss: 0.370454844383084
Epoch: 10, step: 576, loss: 0.3448212444782257, mean loss: 0.37045313741099206
Epoch: 10, step: 577, loss: 0.34540244936943054, mean loss: 0.3704514693667757
Epoch: 10, step: 578, loss: 0.3196966052055359, mean loss: 0.37044808998970924
Epoch: 10, step: 579, loss: 0.3136562705039978, mean loss: 0.37044430890985003
Epoch: 10, step: 580, loss: 0.3713289499282837, mean loss: 0.37044436780346685
Epoch: 10, step: 581, loss: 0.3164605498313904, mean loss: 0.3704407741529561
Epoch: 10, step: 582, loss: 0.2926906645298004, mean loss: 0.37043559874793563
Epoch: 10, step: 583, loss: 0.3769649863243103, mean loss: 0.3704360333450853
Epoch: 10, step: 584, loss: 0.3341861665248871, mean loss: 0.3704336207083585
Epoch: 10, step: 585, loss: 0.31359022855758667, mean loss: 0.37042983770608573
Epoch: 10, step: 586, loss: 0.3412684500217438, mean loss: 0.3704278971066524
Epoch: 10, step: 587, loss: 0.30741843581199646, mean loss: 0.37042370430246724
Epoch: 10, step: 588, loss: 0.36703255772590637, mean loss: 0.37042347866226655
Epoch: 10, step: 589, loss: 0.3502485752105713, mean loss: 0.370422136353321
Epoch: 10, step: 590, loss: 0.34518688917160034, mean loss: 0.37042045747319446
Epoch: 10, step: 591, loss: 0.3304232358932495, mean loss: 0.3704177966681399
Epoch: 10, step: 592, loss: 0.356801837682724, mean loss: 0.37041689093016444
Epoch: 10, step: 593, loss: 0.36909520626068115, mean loss: 0.3704168030171227
Epoch: 10, step: 594, loss: 0.3614535331726074, mean loss: 0.3704162068568404
Epoch: 10, step: 595, loss: 0.33470091223716736, mean loss: 0.37041383153796437
Epoch: 10, step: 596, loss: 0.3463694155216217, mean loss: 0.37041223252113814
Epoch: 10, step: 597, loss: 0.3677290380001068, mean loss: 0.37041205409352
Epoch: 10, step: 598, loss: 0.33699676394462585, mean loss: 0.3704098321844736
Epoch: 10, step: 599, loss: 0.36101728677749634, mean loss: 0.37040920768012475
Epoch: 10, step: 600, loss: 0.3229154646396637, mean loss: 0.3704060500614132
Epoch: 10, step: 601, loss: 0.37484392523765564, mean loss: 0.370406345093668
Epoch: 10, step: 602, loss: 0.3392009735107422, mean loss: 0.37040427068220866
Epoch: 10, step: 603, loss: 0.3182997703552246, mean loss: 0.37040080720837676
Epoch: 10, step: 604, loss: 0.36180853843688965, mean loss: 0.3704002361037725
Epoch: 10, step: 605, loss: 0.34575900435447693, mean loss: 0.37039859837735023
Epoch: 10, step: 606, loss: 0.31571346521377563, mean loss: 0.37039496408924205
Epoch: 10, step: 607, loss: 0.3213164508342743, mean loss: 0.37039170262504384
Epoch: 10, step: 608, loss: 0.3388928771018982, mean loss: 0.370389609540751
Epoch: 10, step: 609, loss: 0.3062880337238312, mean loss: 0.37038535029983294
Epoch: 10, step: 610, loss: 0.3435652256011963, mean loss: 0.37038356835014863
Epoch: 10, step: 611, loss: 0.3243114650249481, mean loss: 0.37038050748758383
Epoch: 10, step: 612, loss: 0.34425482153892517, mean loss: 0.37037877190756996
Epoch: 10, step: 613, loss: 0.32963794469833374, mean loss: 0.3703760655951474
Epoch: 10, step: 614, loss: 0.306365042924881, mean loss: 0.37037181378361167
Epoch: 10, step: 615, loss: 0.3633182644844055, mean loss: 0.37037134529601207
Epoch: 10, step: 616, loss: 0.35603606700897217, mean loss: 0.3703703932286489
Epoch: 10, step: 617, loss: 0.34922757744789124, mean loss: 0.3703689891367522
Epoch: 10, step: 618, loss: 0.32591918110847473, mean loss: 0.37036603742627816
Epoch: 10, step: 619, loss: 0.31946349143981934, mean loss: 0.37036265744314495
Epoch: 10, step: 620, loss: 0.3720610737800598, mean loss: 0.3703627702123062
Epoch: 10, step: 621, loss: 0.34425464272499084, mean loss: 0.37036103683509947
Epoch: 10, step: 622, loss: 0.3175507187843323, mean loss: 0.3703575308722733
Epoch: 10, step: 623, loss: 0.3543202877044678, mean loss: 0.3703564662650529
Epoch: 10, step: 624, loss: 0.3332427144050598, mean loss: 0.370354002690419
Epoch: 10, step: 625, loss: 0.37552204728126526, mean loss: 0.37035434571740633
Epoch: 10, step: 626, loss: 0.385035902261734, mean loss: 0.37035532013544203
Epoch: 10, step: 627, loss: 0.31971967220306396, mean loss: 0.3703519596597364
Epoch: 10, step: 628, loss: 0.40533730387687683, mean loss: 0.3703542813363053
Epoch: 10, step: 629, loss: 0.36165761947631836, mean loss: 0.3703537042519085
Epoch: 10, step: 630, loss: 0.33708199858665466, mean loss: 0.3703514965878076
Epoch: 10, step: 631, loss: 0.30986183881759644, mean loss: 0.37034748320817845
Epoch: 10, step: 632, loss: 0.34905141592025757, mean loss: 0.37034607034628714
Epoch: 10, step: 633, loss: 0.3443916440010071, mean loss: 0.3703443485454151
Epoch: 10, step: 634, loss: 0.310884565114975, mean loss: 0.37034040428117426
Epoch: 10, step: 635, loss: 0.354684978723526, mean loss: 0.3703393658475342
Epoch: 10, step: 636, loss: 0.3238013982772827, mean loss: 0.3703362791613519
Epoch: 10, step: 637, loss: 0.323316365480423, mean loss: 0.37033316071635386
Epoch: 10, step: 638, loss: 0.34393709897994995, mean loss: 0.37033141019829985
Epoch: 10, step: 639, loss: 0.35605189204216003, mean loss: 0.3703304632806502
Epoch: 10, step: 640, loss: 0.30256348848342896, mean loss: 0.3703259697474099
Epoch: 10, step: 641, loss: 0.3720547556877136, mean loss: 0.370326084373185
Epoch: 10, step: 642, loss: 0.4453717768192291, mean loss: 0.37033105988816517
Epoch: 10, step: 643, loss: 0.3137401342391968, mean loss: 0.37032730816941356
Epoch: 10, step: 644, loss: 0.35158461332321167, mean loss: 0.37032606569710025
Epoch: 10, step: 645, loss: 0.3521352708339691, mean loss: 0.37032485989073255
Epoch: 10, step: 646, loss: 0.3096074163913727, mean loss: 0.37032083540319366
Epoch: 10, step: 647, loss: 0.42767614126205444, mean loss: 0.37032463678878874
Epoch: 10, step: 648, loss: 0.33676090836524963, mean loss: 0.3703224124049049
Epoch: 10, step: 649, loss: 0.3171386420726776, mean loss: 0.3703188879668444
Epoch: 10, step: 650, loss: 0.380182147026062, mean loss: 0.3703195415523629
Epoch: 10, step: 651, loss: 0.34275826811790466, mean loss: 0.3703177153349342
Epoch: 10, step: 652, loss: 0.31343314051628113, mean loss: 0.37031394639735926
Epoch: 10, step: 653, loss: 0.36730194091796875, mean loss: 0.3703137468475064
Epoch: 10, step: 654, loss: 0.3724488914012909, mean loss: 0.3703138882946448
Epoch: 10, step: 655, loss: 0.3639708161354065, mean loss: 0.3703134681123343
Epoch: 10, step: 656, loss: 0.29455703496932983, mean loss: 0.3703084501330574
Epoch: 10, step: 657, loss: 0.3649337589740753, mean loss: 0.37030809414609495
Epoch: 10, step: 658, loss: 0.3086863160133362, mean loss: 0.3703040129633588
Epoch: 10, step: 659, loss: 0.3370276987552643, mean loss: 0.370301809233941
Epoch: 10, step: 660, loss: 0.37560412287712097, mean loss: 0.3703021603572867
Epoch: 10, step: 661, loss: 0.38860857486724854, mean loss: 0.3703033725420642
Epoch: 10, step: 662, loss: 0.3906160891056061, mean loss: 0.37030471748787386
Epoch: 10, step: 663, loss: 0.3260498344898224, mean loss: 0.37030178747708214
Epoch: 10, step: 664, loss: 0.31263166666030884, mean loss: 0.3702979695280046
Epoch: 10, step: 665, loss: 0.3166709840297699, mean loss: 0.37029441948262537
Epoch: 10, step: 666, loss: 0.37624141573905945, mean loss: 0.3702948131409464
Epoch: 10, step: 667, loss: 0.38185855746269226, mean loss: 0.3702955785463159
Epoch: 10, step: 668, loss: 0.31391534209251404, mean loss: 0.37029184697993467
Epoch: 10, step: 669, loss: 0.3167388141155243, mean loss: 0.3702883027686266
Epoch: 10, step: 670, loss: 0.3346332907676697, mean loss: 0.37028594322842406
Epoch: 10, step: 671, loss: 0.33813104033470154, mean loss: 0.3702838154556016
Epoch: 10, step: 672, loss: 0.35311853885650635, mean loss: 0.370282679660154
Epoch: 10, step: 673, loss: 0.3233862519264221, mean loss: 0.37027957681327467
Epoch: 10, step: 674, loss: 0.3497524559497833, mean loss: 0.3702782187503661
Epoch: 10, step: 675, loss: 0.3833674490451813, mean loss: 0.3702790846692795
Epoch: 10, step: 676, loss: 0.34611380100250244, mean loss: 0.3702774861190601
Epoch: 10, step: 677, loss: 0.34941887855529785, mean loss: 0.37027610639902014
Epoch: 10, step: 678, loss: 0.3011123538017273, mean loss: 0.37027153177420385
Epoch: 10, step: 679, loss: 0.3193143904209137, mean loss: 0.37026816159289744
Epoch: 10, step: 680, loss: 0.36373671889305115, mean loss: 0.3702677296477417
Epoch: 10, step: 681, loss: 0.318562775850296, mean loss: 0.37026431046021374
Epoch: 10, step: 682, loss: 0.3363906741142273, mean loss: 0.37026207058476934
Epoch: 10, step: 683, loss: 0.3340681493282318, mean loss: 0.37025967744001553
Epoch: 10, step: 684, loss: 0.32893484830856323, mean loss: 0.37025694521990765
Epoch: 10, step: 685, loss: 0.3595883846282959, mean loss: 0.37025623990716194
Epoch: 10, step: 686, loss: 0.33140069246292114, mean loss: 0.370253671285
Epoch: 10, step: 687, loss: 0.3359050154685974, mean loss: 0.3702514007498455
Epoch: 10, step: 688, loss: 0.3342125713825226, mean loss: 0.3702490186473029
Epoch: 10, step: 689, loss: 0.34540611505508423, mean loss: 0.37024737668407803
Epoch: 10, step: 690, loss: 0.33981022238731384, mean loss: 0.37024536510822076
Epoch: 10, step: 691, loss: 0.349637508392334, mean loss: 0.37024400323558554
Epoch: 10, step: 692, loss: 0.37580543756484985, mean loss: 0.37024437073934086
Epoch: 10, step: 693, loss: 0.3506670594215393, mean loss: 0.37024307714139465
Epoch: 10, step: 694, loss: 0.30532944202423096, mean loss: 0.37023878816649425
Epoch: 10, step: 695, loss: 0.342598021030426, mean loss: 0.3702369620058748
Epoch: 10, step: 696, loss: 0.32961544394493103, mean loss: 0.37023427841480255
Epoch: 10, step: 697, loss: 0.3503674268722534, mean loss: 0.37023296603195527
Epoch: 10, step: 698, loss: 0.3354494571685791, mean loss: 0.37023066842254493
Epoch: 10, step: 699, loss: 0.3938072621822357, mean loss: 0.3702322256612345
Epoch: 10, step: 700, loss: 0.3584219515323639, mean loss: 0.3702314456418085
Epoch: 10, step: 701, loss: 0.33760225772857666, mean loss: 0.3702292907621418
Epoch: 10, step: 702, loss: 0.3246573507785797, mean loss: 0.37022628132279795
Epoch: 10, step: 703, loss: 0.3241419494152069, mean loss: 0.37022323824752673
Epoch: 10, step: 704, loss: 0.34829458594322205, mean loss: 0.37022179033387176
Epoch: 10, step: 705, loss: 0.3445093035697937, mean loss: 0.3702200926918036
Epoch: 10, step: 706, loss: 0.3307885527610779, mean loss: 0.3702174894343975
Epoch: 10, step: 707, loss: 0.312857985496521, mean loss: 0.370213702828645
Epoch: 10, step: 708, loss: 0.32601630687713623, mean loss: 0.37021078531620516
Epoch: 10, step: 709, loss: 0.4184260964393616, mean loss: 0.37021396784499216
Epoch: 10, step: 710, loss: 0.3536854684352875, mean loss: 0.37021287692693994
Epoch: 10, step: 711, loss: 0.33469831943511963, mean loss: 0.3702105330411498
Epoch: 10, step: 712, loss: 0.3477849066257477, mean loss: 0.37020905309484115
Epoch: 10, step: 713, loss: 0.32691100239753723, mean loss: 0.3702061958920764
Epoch: 10, step: 714, loss: 0.39053356647491455, mean loss: 0.3702075371900363
Epoch: 10, step: 715, loss: 0.3269043266773224, mean loss: 0.37020468002386364
Epoch: 10, step: 716, loss: 0.3462156653404236, mean loss: 0.37020309732183265
Epoch: 10, step: 717, loss: 0.34783658385276794, mean loss: 0.37020162176348265
Epoch: 10, step: 718, loss: 0.33574244379997253, mean loss: 0.37019934858068937
Epoch: 10, step: 719, loss: 0.3616134226322174, mean loss: 0.37019878222673497
Epoch: 10, step: 720, loss: 0.32265686988830566, mean loss: 0.3701956464235334
Epoch: 10, step: 721, loss: 0.30407965183258057, mean loss: 0.37019128578545196
Epoch: 10, step: 722, loss: 0.34134969115257263, mean loss: 0.3701893836820006
Epoch: 10, step: 723, loss: 0.3396986126899719, mean loss: 0.37018737294796
Epoch: 10, step: 724, loss: 0.3448609709739685, mean loss: 0.3701857028917797
Epoch: 10, step: 725, loss: 0.3814283311367035, mean loss: 0.3701864441965565
Epoch: 10, step: 726, loss: 0.360784113407135, mean loss: 0.37018582427628294
Epoch: 10, step: 727, loss: 0.29655721783638, mean loss: 0.37018097006963474
Epoch: 10, step: 728, loss: 0.3224885165691376, mean loss: 0.3701778259959647
Epoch: 10, step: 729, loss: 0.38570407032966614, mean loss: 0.3701788494794409
Epoch: 10, step: 730, loss: 0.3434717655181885, mean loss: 0.37017708907577856
Epoch: 10, step: 731, loss: 0.3348795473575592, mean loss: 0.3701747625834428
Epoch: 10, step: 732, loss: 0.36961090564727783, mean loss: 0.37017472542158053
Epoch: 10, step: 733, loss: 0.30994030833244324, mean loss: 0.37017075584091036
Epoch: 10, step: 734, loss: 0.314654141664505, mean loss: 0.370167097414935
Epoch: 10, step: 735, loss: 0.34479427337646484, mean loss: 0.37016542551034626
Epoch: 10, step: 736, loss: 0.31704628467559814, mean loss: 0.37016192553401134
Epoch: 10, step: 737, loss: 0.3393542766571045, mean loss: 0.3701598957772004
Epoch: 10, step: 738, loss: 0.3635280430316925, mean loss: 0.3701594588674734
Epoch: 10, step: 739, loss: 0.3227749466896057, mean loss: 0.37015633735810727
Epoch: 10, step: 740, loss: 0.35393044352531433, mean loss: 0.3701552685290556
Epoch: 10, step: 741, loss: 0.3575569689273834, mean loss: 0.37015443871087605
Epoch: 10, step: 742, loss: 0.29043909907341003, mean loss: 0.3701491884085881
Epoch: 10, step: 743, loss: 0.3369388282299042, mean loss: 0.37014700121416116
Epoch: 10, step: 744, loss: 0.34297099709510803, mean loss: 0.37014521155304037
Epoch: 10, step: 745, loss: 0.3486636281013489, mean loss: 0.3701437969880824
Epoch: 10, step: 746, loss: 0.35416966676712036, mean loss: 0.37014274515887186
Epoch: 10, step: 747, loss: 0.3438217341899872, mean loss: 0.3701410121452447
Epoch: 10, step: 748, loss: 0.36256644129753113, mean loss: 0.3701405134573227
Epoch: 10, step: 749, loss: 0.3168753385543823, mean loss: 0.37013700686252987
Epoch: 10, step: 750, loss: 0.3405493497848511, mean loss: 0.3701350591528941
Epoch: 10, step: 751, loss: 0.34728190302848816, mean loss: 0.37013355486404964
Epoch: 10, step: 752, loss: 0.33510923385620117, mean loss: 0.37013124957075616
Epoch: 10, step: 753, loss: 0.3188018798828125, mean loss: 0.3701278713050139
Epoch: 10, step: 754, loss: 0.3191218674182892, mean loss: 0.3701245145426653
Epoch: 10, step: 755, loss: 0.3618530333042145, mean loss: 0.37012397022302607
Epoch: 10, step: 756, loss: 0.3432804048061371, mean loss: 0.3701222038503593
Epoch: 10, step: 757, loss: 0.32665860652923584, mean loss: 0.3701193440268746
Epoch: 10, step: 758, loss: 0.33689334988594055, mean loss: 0.37011715796238737
Epoch: 10, step: 759, loss: 0.33353450894355774, mean loss: 0.37011475120916243
Epoch: 10, step: 760, loss: 0.3262040317058563, mean loss: 0.37011186253608147
Epoch: 10, step: 761, loss: 0.3866001069545746, mean loss: 0.3701129471462919
Epoch: 10, step: 762, loss: 0.35602807998657227, mean loss: 0.37011202069314714
Epoch: 10, step: 763, loss: 0.3289758563041687, mean loss: 0.37010931507854644
Epoch: 10, step: 764, loss: 0.36805179715156555, mean loss: 0.3701091797600376
Epoch: 10, step: 765, loss: 0.3395686745643616, mean loss: 0.3701071713090843
Epoch: 10, step: 766, loss: 0.38044095039367676, mean loss: 0.370107850850025
Epoch: 10, step: 767, loss: 0.33844441175460815, mean loss: 0.37010576882483465
Epoch: 10, step: 768, loss: 0.38015151023864746, mean loss: 0.3701064293377818
Epoch: 10, step: 769, loss: 0.41212698817253113, mean loss: 0.3701091920306704
Epoch: 10, step: 770, loss: 0.3041819632053375, mean loss: 0.37010485784956293
Epoch: 10, step: 771, loss: 0.32284605503082275, mean loss: 0.37010175117044
Epoch: 10, step: 772, loss: 0.3274989426136017, mean loss: 0.3700989507491847
Epoch: 10, step: 773, loss: 0.3361721634864807, mean loss: 0.37009672077762806
Epoch: 10, step: 774, loss: 0.320203959941864, mean loss: 0.3700934415951873
Epoch: 10, step: 775, loss: 0.35339075326919556, mean loss: 0.3700923438895928
Epoch: 10, step: 776, loss: 0.36101284623146057, mean loss: 0.37009174722154664
Epoch: 10, step: 777, loss: 0.31878507137298584, mean loss: 0.37008837577484877
Epoch: 10, step: 778, loss: 0.3377951979637146, mean loss: 0.3700862538760505
Epoch: 10, step: 779, loss: 0.35702261328697205, mean loss: 0.37008539555538106
Epoch: 10, step: 780, loss: 0.32172533869743347, mean loss: 0.3700822183622362
Epoch: 10, step: 781, loss: 0.30266085267066956, mean loss: 0.3700777891567644
Epoch: 10, step: 782, loss: 0.3117586374282837, mean loss: 0.3700739581673584
Epoch: 10, step: 783, loss: 0.3611414432525635, mean loss: 0.3700733714283335
Epoch: 10, step: 784, loss: 0.33268001675605774, mean loss: 0.3700709153787656
Epoch: 10, step: 785, loss: 0.33763474225997925, mean loss: 0.3700687850639673
Epoch: 10, step: 786, loss: 0.33544909954071045, mean loss: 0.37006651149166
Epoch: 10, step: 787, loss: 0.36325764656066895, mean loss: 0.3700660643636766
Epoch: 10, step: 788, loss: 0.35209640860557556, mean loss: 0.3700648844007271
Epoch: 10, step: 789, loss: 0.3025208115577698, mean loss: 0.37006044946488714
Epoch: 10, step: 790, loss: 0.3254691958427429, mean loss: 0.3700575218006745
Epoch: 10, step: 791, loss: 0.360359787940979, mean loss: 0.3700568851322226
Epoch: 10, step: 792, loss: 0.3340268135070801, mean loss: 0.37005451986788696
Epoch: 10, step: 793, loss: 0.3638535141944885, mean loss: 0.37005411281749484
Epoch: 10, step: 794, loss: 0.31665658950805664, mean loss: 0.3700506078930899
Epoch: 10, step: 795, loss: 0.3512340486049652, mean loss: 0.37004937288657325
Epoch: 10, step: 796, loss: 0.35021647810935974, mean loss: 0.370048071259299
Epoch: 10, step: 797, loss: 0.3154805600643158, mean loss: 0.3700444902439955
Epoch: 10, step: 798, loss: 0.33181485533714294, mean loss: 0.37004198157315704
Epoch: 10, step: 799, loss: 0.326233446598053, mean loss: 0.37003910699737125
Epoch: 10, step: 800, loss: 0.33838698267936707, mean loss: 0.3700370302225981
Epoch: 10, step: 801, loss: 0.3418921232223511, mean loss: 0.37003518368625116
Epoch: 10, step: 802, loss: 0.3104543387889862, mean loss: 0.3700312749514288
Epoch: 10, step: 803, loss: 0.32249096035957336, mean loss: 0.3700281563267508
Epoch: 10, step: 804, loss: 0.3411557972431183, mean loss: 0.370026262436355
Epoch: 10, step: 805, loss: 0.3153575360774994, mean loss: 0.3700226766613085
Epoch: 10, step: 806, loss: 0.33087384700775146, mean loss: 0.37002010901982796
Epoch: 10, step: 807, loss: 0.34301429986953735, mean loss: 0.37001833791482075
Epoch: 10, step: 808, loss: 0.3219245970249176, mean loss: 0.37001518402008077
Epoch: 10, step: 809, loss: 0.33166858553886414, mean loss: 0.37001266948903283
Epoch: 10, step: 810, loss: 0.33946967124938965, mean loss: 0.37001066680079997
Epoch: 10, step: 811, loss: 0.3237399756908417, mean loss: 0.3700076330549889
Epoch: 10, step: 812, loss: 0.3459259271621704, mean loss: 0.37000605423732075
Epoch: 10, step: 813, loss: 0.33998632431030273, mean loss: 0.37000408624663456
Epoch: 10, step: 814, loss: 0.33471935987472534, mean loss: 0.3700017732524443
Epoch: 10, step: 815, loss: 0.3340340554714203, mean loss: 0.3699994156411582
Epoch: 10, step: 816, loss: 0.42690524458885193, mean loss: 0.37000314545887775
Epoch: 10, step: 817, loss: 0.3384583294391632, mean loss: 0.37000107803090426
Epoch: 10, step: 818, loss: 0.4028712213039398, mean loss: 0.37000323217883485
Epoch: 10, step: 819, loss: 0.3060223162174225, mean loss: 0.3699990394582607
Epoch: 10, step: 820, loss: 0.38063669204711914, mean loss: 0.36999973650646123
Epoch: 10, step: 821, loss: 0.34860411286354065, mean loss: 0.3699983346178724
Epoch: 10, step: 822, loss: 0.38475820422172546, mean loss: 0.3699993016538158
Epoch: 10, step: 823, loss: 0.30913737416267395, mean loss: 0.3699953143682097
Epoch: 10, step: 824, loss: 0.3656314015388489, mean loss: 0.36999502849118193
Epoch: 10, step: 825, loss: 0.30322346091270447, mean loss: 0.3699906546167172
Epoch: 10, step: 826, loss: 0.31918296217918396, mean loss: 0.3699873266745912
Epoch: 10, step: 827, loss: 0.34078025817871094, mean loss: 0.36998541371490457
Epoch: 10, step: 828, loss: 0.33310994505882263, mean loss: 0.3699829986603066
Epoch: 10, step: 829, loss: 0.345292329788208, mean loss: 0.36998138172062933
Epoch: 10, step: 830, loss: 0.34200921654701233, mean loss: 0.3699795500026558
Epoch: 10, step: 831, loss: 0.3403787314891815, mean loss: 0.3699776117615274
Epoch: 10, step: 832, loss: 0.3526691198348999, mean loss: 0.3699764784876502
Epoch: 10, step: 833, loss: 0.3291122019290924, mean loss: 0.36997380307344574
Epoch: 10, step: 834, loss: 0.3175708055496216, mean loss: 0.36997037243530995
Epoch: 10, step: 835, loss: 0.33259904384613037, mean loss: 0.36996792602731116
Epoch: 10, step: 836, loss: 0.3610735535621643, mean loss: 0.36996734382056473
Epoch: 10, step: 837, loss: 0.32282963395118713, mean loss: 0.369964258488069
Epoch: 10, step: 838, loss: 0.32916712760925293, mean loss: 0.36996158834402304
Epoch: 10, step: 839, loss: 0.334908664226532, mean loss: 0.36995929430448654
Epoch: 10, step: 840, loss: 0.3250110149383545, mean loss: 0.36995635285566997
Epoch: 10, step: 841, loss: 0.3604890704154968, mean loss: 0.3699557333502099
Epoch: 10, step: 842, loss: 0.3296542167663574, mean loss: 0.36995309633414086
Epoch: 10, step: 843, loss: 0.3036985993385315, mean loss: 0.3699487614416392
Epoch: 10, step: 844, loss: 0.32503122091293335, mean loss: 0.3699458227736295
Epoch: 10, step: 845, loss: 0.3474329113960266, mean loss: 0.36994434999387166
Epoch: 10, step: 846, loss: 0.3417716324329376, mean loss: 0.36994250707390297
Epoch: 10, step: 847, loss: 0.3567304313182831, mean loss: 0.36994164286172637
Epoch: 10, step: 848, loss: 0.3134218156337738, mean loss: 0.3699379460975673
Epoch: 10, step: 849, loss: 0.42765572667121887, mean loss: 0.36994172096876243
Epoch: 10, step: 850, loss: 0.34273433685302734, mean loss: 0.3699399416617115
Epoch: 10, step: 851, loss: 0.33199647068977356, mean loss: 0.3699374603988962
Epoch: 10, step: 852, loss: 0.3438582420349121, mean loss: 0.3699357550946155
Epoch: 10, step: 853, loss: 0.31125888228416443, mean loss: 0.36993191850034257
Epoch: 10, step: 854, loss: 0.34489697217941284, mean loss: 0.3699302816944373
Epoch: 10, step: 855, loss: 0.3399384617805481, mean loss: 0.36992832093215217
Epoch: 10, step: 856, loss: 0.3775961101055145, mean loss: 0.3699288221931297
Epoch: 10, step: 857, loss: 0.36306360363960266, mean loss: 0.36992837342737256
Epoch: 10, step: 858, loss: 0.31854236125946045, mean loss: 0.36992501464495753
Epoch: 10, step: 859, loss: 0.3488217890262604, mean loss: 0.36992363534916545
Epoch: 10, step: 860, loss: 0.37647417187690735, mean loss: 0.3699240634608266
Epoch: 10, step: 861, loss: 0.3577550947666168, mean loss: 0.36992326820735033
Epoch: 10, step: 862, loss: 0.3710269331932068, mean loss: 0.36992334032817537
Epoch: 10, step: 863, loss: 0.33565574884414673, mean loss: 0.3699211012017062
Epoch: 10, step: 864, loss: 0.3319531977176666, mean loss: 0.3699186204500901
Epoch: 10, step: 865, loss: 0.34386882185935974, mean loss: 0.36991691851630004
Epoch: 10, step: 866, loss: 0.41628941893577576, mean loss: 0.36991994801263633
Epoch: 10, step: 867, loss: 0.3931295871734619, mean loss: 0.3699214641897438
Epoch: 10, step: 868, loss: 0.34387558698654175, mean loss: 0.3699197628456192
Epoch: 10, step: 869, loss: 0.3354404866695404, mean loss: 0.36991751077010154
Epoch: 10, step: 870, loss: 0.33165502548217773, mean loss: 0.36991501175075026
Epoch: 10, step: 871, loss: 0.35052385926246643, mean loss: 0.36991374534841953
Epoch: 10, step: 872, loss: 0.37479257583618164, mean loss: 0.3699140639555173
Epoch: 10, step: 873, loss: 0.344085693359375, mean loss: 0.36991237737000104
Epoch: 10, step: 874, loss: 0.37270301580429077, mean loss: 0.3699125595860268
Epoch: 10, step: 875, loss: 0.33755436539649963, mean loss: 0.36991044688073893
Epoch: 10, step: 876, loss: 0.3664798438549042, mean loss: 0.36991022290717845
Epoch: 10, step: 877, loss: 0.32214510440826416, mean loss: 0.36990710467251997
Epoch: 10, step: 878, loss: 0.3524623513221741, mean loss: 0.36990596590671604
Epoch: 10, step: 879, loss: 0.3755263090133667, mean loss: 0.3699063327698431
Epoch: 10, step: 880, loss: 0.33001217246055603, mean loss: 0.3699037288823482
Epoch: 10, step: 881, loss: 0.3200170397758484, mean loss: 0.36990047299609924
Epoch: 10, step: 882, loss: 0.3491460680961609, mean loss: 0.3698991185351647
Epoch: 10, step: 883, loss: 0.33562058210372925, mean loss: 0.3698968816168385
Epoch: 10, step: 884, loss: 0.3173637092113495, mean loss: 0.36989345367736665
Epoch: 10, step: 885, loss: 0.29956984519958496, mean loss: 0.36988886516056657
Epoch: 10, step: 886, loss: 0.32341745495796204, mean loss: 0.3698858331640765
Epoch: 10, step: 887, loss: 0.29365822672843933, mean loss: 0.3698808600686671
Epoch: 10, step: 888, loss: 0.36120161414146423, mean loss: 0.36988029387087684
Epoch: 10, step: 889, loss: 0.37639009952545166, mean loss: 0.3698807185157336
Epoch: 10, step: 890, loss: 0.340290367603302, mean loss: 0.3698787884165286
Epoch: 10, step: 891, loss: 0.34715667366981506, mean loss: 0.36987730641060984
Epoch: 10, step: 892, loss: 0.34328824281692505, mean loss: 0.36987557230354706
Epoch: 10, step: 893, loss: 0.4154096245765686, mean loss: 0.3698785417865439
Epoch: 10, step: 894, loss: 0.35532236099243164, mean loss: 0.3698775925735805
Epoch: 10, step: 895, loss: 0.33442166447639465, mean loss: 0.36987528063252045
Epoch: 10, step: 896, loss: 0.33120259642601013, mean loss: 0.369872759103916
Epoch: 10, step: 897, loss: 0.3799792528152466, mean loss: 0.3698734180225306
Epoch: 10, step: 898, loss: 0.355995774269104, mean loss: 0.36987251329316406
Epoch: 10, step: 899, loss: 0.32649698853492737, mean loss: 0.36986968568398815
Epoch: 10, step: 900, loss: 0.3653006851673126, mean loss: 0.36986938785460827
Epoch: 10, step: 901, loss: 0.3272368013858795, mean loss: 0.369866609039169
Epoch: 10, step: 902, loss: 0.3511155843734741, mean loss: 0.36986538691672455
Epoch: 10, step: 903, loss: 0.32615968585014343, mean loss: 0.36986253852640477
Epoch: 10, step: 904, loss: 0.33276721835136414, mean loss: 0.3698601211057352
Epoch: 10, step: 905, loss: 0.3532164692878723, mean loss: 0.3698590365461224
Epoch: 10, step: 906, loss: 0.32190391421318054, mean loss: 0.36985591182322325
Epoch: 10, step: 907, loss: 0.3270021975040436, mean loss: 0.36985311968650714
Epoch: 10, step: 908, loss: 0.34292691946029663, mean loss: 0.36985136542237096
Epoch: 10, step: 909, loss: 0.34243738651275635, mean loss: 0.36984957949540614
Epoch: 10, step: 910, loss: 0.32017773389816284, mean loss: 0.3698463437553503
Epoch: 10, step: 911, loss: 0.3264545202255249, mean loss: 0.3698435172947243
Epoch: 10, step: 912, loss: 0.35651808977127075, mean loss: 0.369842649358326
Epoch: 10, step: 913, loss: 0.31684595346450806, mean loss: 0.3698391977043014
Epoch: 10, step: 914, loss: 0.36678075790405273, mean loss: 0.369838998522289
Epoch: 10, step: 915, loss: 0.33689531683921814, mean loss: 0.3698368531926665
Epoch: 10, step: 916, loss: 0.3327386677265167, mean loss: 0.3698344374743969
Epoch: 10, step: 917, loss: 0.35129407048225403, mean loss: 0.3698332302620651
Epoch: 10, step: 918, loss: 0.34257248044013977, mean loss: 0.36983145535811157
Epoch: 10, step: 919, loss: 0.3402019739151001, mean loss: 0.36982952635541344
Epoch: 10, step: 920, loss: 0.3627942204475403, mean loss: 0.3698290683575026
Epoch: 10, step: 921, loss: 0.38831382989883423, mean loss: 0.36983027163582194
Epoch: 10, step: 922, loss: 0.3613683581352234, mean loss: 0.3698297208375729
Epoch: 10, step: 923, loss: 0.337931364774704, mean loss: 0.369827644662354
Epoch: 10, step: 924, loss: 0.3251824676990509, mean loss: 0.36982473902115887
Epoch: 10, step: 925, loss: 0.3163374066352844, mean loss: 0.36982125813267874
Epoch: 10, step: 926, loss: 0.3418906629085541, mean loss: 0.36981944056287175
Epoch: 10, step: 927, loss: 0.3455449342727661, mean loss: 0.3698178610140502
Epoch: 10, step: 928, loss: 0.3069092333316803, mean loss: 0.36981376779863717
Epoch: 10, step: 929, loss: 0.3020974397659302, mean loss: 0.3698093620518556
Epoch: 10, step: 930, loss: 0.33768221735954285, mean loss: 0.3698072719376996
Epoch: 10, step: 931, loss: 0.3079698085784912, mean loss: 0.36980324920393953
Epoch: 10, step: 932, loss: 0.34063294529914856, mean loss: 0.3698013517015714
Epoch: 10, step: 933, loss: 0.3744233250617981, mean loss: 0.36980165233727846
Epoch: 10, step: 934, loss: 0.3332599103450775, mean loss: 0.3697992756386123
Epoch: 10, step: 935, loss: 0.3222554326057434, mean loss: 0.36979618355724964
Epoch: 10, step: 936, loss: 0.35003361105918884, mean loss: 0.3697948983538616
Epoch: 10, step: 937, loss: 0.33985912799835205, mean loss: 0.36979295169172377
Epoch: 10, step: 938, loss: 0.34781381487846375, mean loss: 0.36979152252618547
Epoch: 10, step: 939, loss: 0.34991663694381714, mean loss: 0.36979023027094604
Epoch: 10, step: 940, loss: 0.3145557940006256, mean loss: 0.36978663918868415
Epoch: 10, step: 941, loss: 0.30691277980804443, mean loss: 0.36978255169295016
Epoch: 10, step: 942, loss: 0.30868539214134216, mean loss: 0.3697785799605474
Epoch: 10, step: 943, loss: 0.32596251368522644, mean loss: 0.3697757318023132
Epoch: 10, step: 944, loss: 0.3349165916442871, mean loss: 0.3697734660148476
Epoch: 10, step: 945, loss: 0.3277137875556946, mean loss: 0.36977073238177477
Epoch: 10, step: 946, loss: 0.39067062735557556, mean loss: 0.36977209066441424
Epoch: 10, step: 947, loss: 0.346939355134964, mean loss: 0.36977060686304114
Epoch: 10, step: 948, loss: 0.32245099544525146, mean loss: 0.369767531964645
Epoch: 10, step: 949, loss: 0.3272339701652527, mean loss: 0.36976476825042803
Epoch: 10, step: 950, loss: 0.3801412880420685, mean loss: 0.369765442444424
Epoch: 10, step: 951, loss: 0.34487950801849365, mean loss: 0.36976382563475496
Epoch: 10, step: 952, loss: 0.37579649686813354, mean loss: 0.36976421754479416
Epoch: 10, step: 953, loss: 0.35469236969947815, mean loss: 0.36976323847191866
Epoch: 10, step: 954, loss: 0.34006211161613464, mean loss: 0.369761309200931
Epoch: 10, step: 955, loss: 0.3882405459880829, mean loss: 0.3697625094631281
Epoch: 10, step: 956, loss: 0.37310871481895447, mean loss: 0.3697627267915269
Epoch: 10, step: 957, loss: 0.3695279061794281, mean loss: 0.3697627115414547
Epoch: 10, step: 958, loss: 0.3680969476699829, mean loss: 0.36976260336794525
Epoch: 10, step: 959, loss: 0.3253308832645416, mean loss: 0.36975971819131515
Epoch: 10, step: 960, loss: 0.3112330734729767, mean loss: 0.3697559180066052
Epoch: 10, step: 961, loss: 0.32941168546676636, mean loss: 0.36975329859142925
Epoch: 10, step: 962, loss: 0.3675481975078583, mean loss: 0.3697531554309356
Epoch: 10, step: 963, loss: 0.3025699853897095, mean loss: 0.3697487940202604
Epoch: 10, step: 964, loss: 0.33781901001930237, mean loss: 0.3697467213306141
Epoch: 10, step: 965, loss: 0.3771815001964569, mean loss: 0.3697472039204405
Epoch: 10, step: 966, loss: 0.3474249541759491, mean loss: 0.3697457550822667
Epoch: 10, step: 967, loss: 0.3345527946949005, mean loss: 0.3697434710116289
Epoch: 10, step: 968, loss: 0.32263562083244324, mean loss: 0.36974041384697326
Epoch: 10, step: 969, loss: 0.3582403361797333, mean loss: 0.3697396675732765
Epoch: 10, step: 970, loss: 0.3140806555747986, mean loss: 0.3697360559314623
Epoch: 10, step: 971, loss: 0.3122579753398895, mean loss: 0.36973232649462145
Epoch: 10, step: 972, loss: 0.3608144223690033, mean loss: 0.3697317478983634
Epoch: 10, step: 973, loss: 0.3425086736679077, mean loss: 0.3697299817718401
Epoch: 10, step: 974, loss: 0.3339475691318512, mean loss: 0.36972766049953126
Epoch: 10, step: 975, loss: 0.36446741223335266, mean loss: 0.3697273192794829
Epoch: 10, step: 976, loss: 0.3093266785144806, mean loss: 0.369723401484791
Epoch: 10, step: 977, loss: 0.35403141379356384, mean loss: 0.36972238371415334
Epoch: 10, step: 978, loss: 0.28306862711906433, mean loss: 0.3697167637805263
Epoch: 10, step: 979, loss: 0.3363274037837982, mean loss: 0.36971459845238125
Epoch: 10, step: 980, loss: 0.3544163107872009, mean loss: 0.36971360640986356
Epoch: 10, step: 981, loss: 0.30889442563056946, mean loss: 0.3697096627462156
Epoch: 10, step: 982, loss: 0.3602111041545868, mean loss: 0.3697090468765021
Epoch: 10, step: 983, loss: 0.34115782380104065, mean loss: 0.36970719578579436
Epoch: 10, step: 984, loss: 0.34168100357055664, mean loss: 0.3697053788527496
Epoch: 10, step: 985, loss: 0.3405665457248688, mean loss: 0.3697034899098527
Epoch: 10, step: 986, loss: 0.3533075153827667, mean loss: 0.3697024270995508
Epoch: 10, step: 987, loss: 0.3470020294189453, mean loss: 0.3697009557229835
Epoch: 10, step: 988, loss: 0.34193456172943115, mean loss: 0.3696991560992883
Epoch: 10, step: 989, loss: 0.33333849906921387, mean loss: 0.36969679960822993
Epoch: 10, step: 990, loss: 0.3334695100784302, mean loss: 0.3696944519127125
Epoch: 10, step: 991, loss: 0.3134792149066925, mean loss: 0.3696908091420408
Epoch: 10, step: 992, loss: 0.3179750442504883, mean loss: 0.3696874581561734
Epoch: 10, step: 993, loss: 0.34240928292274475, mean loss: 0.36968569074816293
Epoch: 10, step: 994, loss: 0.32405179738998413, mean loss: 0.36968273422769915
Epoch: 10, step: 995, loss: 0.33905425667762756, mean loss: 0.36968075000396566
Epoch: 10, step: 996, loss: 0.3666461110115051, mean loss: 0.36968055342179346
Epoch: 10, step: 997, loss: 0.3787948191165924, mean loss: 0.3696811438004497
Epoch: 10, step: 998, loss: 0.37569668889045715, mean loss: 0.3696815334335276
Epoch: 10, step: 999, loss: 0.3264184892177582, mean loss: 0.36967873142289187
Epoch: 10, step: 1000, loss: 0.309831440448761, mean loss: 0.3696748555540379
Epoch: 10, step: 1001, loss: 0.360984206199646, mean loss: 0.36967429276104774
Epoch: 10, step: 1002, loss: 0.29585006833076477, mean loss: 0.36966951232820244
Epoch: 10, step: 1003, loss: 0.35699766874313354, mean loss: 0.3696686918255098
Epoch: 10, step: 1004, loss: 0.3033237159252167, mean loss: 0.36966439626216246
Epoch: 10, step: 1005, loss: 0.35888904333114624, mean loss: 0.36966369864770365
Epoch: 10, step: 1006, loss: 0.29464274644851685, mean loss: 0.36965884197959986
Epoch: 10, step: 1007, loss: 0.2987469732761383, mean loss: 0.369654251620414
Epoch: 10, step: 1008, loss: 0.3231341242790222, mean loss: 0.36965124041403546
Epoch: 10, step: 1009, loss: 0.3336271047592163, mean loss: 0.3696489087547698
Epoch: 10, step: 1010, loss: 0.3426113426685333, mean loss: 0.36964715886375393
Epoch: 10, step: 1011, loss: 0.32418978214263916, mean loss: 0.3696442170195447
Epoch: 10, step: 1012, loss: 0.3669695556163788, mean loss: 0.36964404393591027
Epoch: 10, step: 1013, loss: 0.3549444079399109, mean loss: 0.3696430927494216
Epoch: 10, step: 1014, loss: 0.36014893651008606, mean loss: 0.36964247843973286
Epoch: 10, step: 1015, loss: 0.31921833753585815, mean loss: 0.36963921600825617
Epoch: 10, step: 1016, loss: 0.33363357186317444, mean loss: 0.3696368866012467
Epoch: 10, step: 1017, loss: 0.32084596157073975, mean loss: 0.3696337302469298
Epoch: 10, step: 1018, loss: 0.3682481348514557, mean loss: 0.36963364061659176
Epoch: 10, step: 1019, loss: 0.3439548909664154, mean loss: 0.36963197963666616
Epoch: 10, step: 1020, loss: 0.35662683844566345, mean loss: 0.3696311384788374
Epoch: 10, step: 1021, loss: 0.3223489224910736, mean loss: 0.3696280805163495
Epoch: 10, step: 1022, loss: 0.3647345006465912, mean loss: 0.369627764046074
Epoch: 10, step: 1023, loss: 0.3436565697193146, mean loss: 0.36962608458446466
Epoch: 10, step: 1024, loss: 0.33072131872177124, mean loss: 0.3696235689190355
Epoch: 10, step: 1025, loss: 0.3440592288970947, mean loss: 0.3696219159809764
Epoch: 10, step: 1026, loss: 0.35468506813049316, mean loss: 0.3696209502573163
Epoch: 10, step: 1027, loss: 0.3061331510543823, mean loss: 0.36961684579654547
Epoch: 10, step: 1028, loss: 0.3142373263835907, mean loss: 0.36961326576426073
Epoch: 10, step: 1029, loss: 0.3517443537712097, mean loss: 0.3696121106956122
Epoch: 10, step: 1030, loss: 0.3547356426715851, mean loss: 0.3696111491244129
Epoch: 10, step: 1031, loss: 0.4043254554271698, mean loss: 0.3696133928101874
Epoch: 10, step: 1032, loss: 0.35142892599105835, mean loss: 0.3696122175715899
Epoch: 10, step: 1033, loss: 0.33505702018737793, mean loss: 0.369609984458149
Epoch: 10, step: 1034, loss: 0.33998146653175354, mean loss: 0.36960806985279027
Epoch: 10, step: 1035, loss: 0.38975492119789124, mean loss: 0.369609371665361
Epoch: 10, step: 1036, loss: 0.31018343567848206, mean loss: 0.3696055320364932
Epoch: 10, step: 1037, loss: 0.3299114406108856, mean loss: 0.36960296748736376
Epoch: 10, step: 1038, loss: 0.34440985321998596, mean loss: 0.3696013399200618
Epoch: 10, step: 1039, loss: 0.35954520106315613, mean loss: 0.3696006902986886
Epoch: 10, step: 1040, loss: 0.3147406280040741, mean loss: 0.3695971465959372
Epoch: 10, step: 1041, loss: 0.33994337916374207, mean loss: 0.3695952312253499
Epoch: 10, step: 1042, loss: 0.3385879695415497, mean loss: 0.3695932285603829
Epoch: 10, step: 1043, loss: 0.3589951694011688, mean loss: 0.36959254410809933
Epoch: 10, step: 1044, loss: 0.36662331223487854, mean loss: 0.3695923523591892
Epoch: 10, step: 1045, loss: 0.33145177364349365, mean loss: 0.36958988945213017
Epoch: 10, step: 1046, loss: 0.3269667625427246, mean loss: 0.3695871372646885
Epoch: 10, step: 1047, loss: 0.3204488158226013, mean loss: 0.36958396459414083
Epoch: 10, step: 1048, loss: 0.3117896616458893, mean loss: 0.3695802332814061
Epoch: 10, step: 1049, loss: 0.3103703260421753, mean loss: 0.36957641082128734
Epoch: 10, step: 1050, loss: 0.3435388505458832, mean loss: 0.3695747300027298
Epoch: 10, step: 1051, loss: 0.3667442202568054, mean loss: 0.36957454729489697
Epoch: 10, step: 1052, loss: 0.2943347096443176, mean loss: 0.3695696909186206
Epoch: 10, step: 1053, loss: 0.35473892092704773, mean loss: 0.3695687337242233
Epoch: 10, step: 1054, loss: 0.3234228491783142, mean loss: 0.3695657556096995
Epoch: 10, step: 1055, loss: 0.3313449025154114, mean loss: 0.36956328911169395
Epoch: 10, step: 1056, loss: 0.3618152141571045, mean loss: 0.36956278913912155
Epoch: 10, step: 1057, loss: 0.3733294904232025, mean loss: 0.3695630321834682
Epoch: 10, step: 1058, loss: 0.3302631080150604, mean loss: 0.36956049654089973
Epoch: 10, step: 1059, loss: 0.34954744577407837, mean loss: 0.36955920537633413
Epoch: 10, step: 1060, loss: 0.2986789345741272, mean loss: 0.3695546327506453
Epoch: 10, step: 1061, loss: 0.35736557841300964, mean loss: 0.3695538464614996
Epoch: 10, step: 1062, loss: 0.33759984374046326, mean loss: 0.3695517853118691
Epoch: 10, step: 1063, loss: 0.3239111006259918, mean loss: 0.3695488415112573
Epoch: 10, step: 1064, loss: 0.3064122498035431, mean loss: 0.3695447694963132
Epoch: 10, step: 1065, loss: 0.3200124204158783, mean loss: 0.3695415750974302
Epoch: 10, step: 1066, loss: 0.3573567867279053, mean loss: 0.3695407893369111
Epoch: 10, step: 1067, loss: 0.3370939791202545, mean loss: 0.369538697074194
Epoch: 10, step: 1068, loss: 0.351246178150177, mean loss: 0.3695375175965408
Epoch: 10, step: 1069, loss: 0.34806495904922485, mean loss: 0.3695361331633656
Epoch: 10, step: 1070, loss: 0.328792005777359, mean loss: 0.3695335063741588
Epoch: 10, step: 1071, loss: 0.3305405378341675, mean loss: 0.36953099264488215
Epoch: 10, step: 1072, loss: 0.3136138916015625, mean loss: 0.3695273881131318
Epoch: 10, step: 1073, loss: 0.34447845816612244, mean loss: 0.3695257735114851
Epoch: 10, step: 1074, loss: 0.3425982892513275, mean loss: 0.3695240379340271
Epoch: 10, step: 1075, loss: 0.3244403600692749, mean loss: 0.3695211323090036
Epoch: 10, step: 1076, loss: 0.3201289176940918, mean loss: 0.3695179492056579
Epoch: 10, step: 1077, loss: 0.3165326714515686, mean loss: 0.3695145347657975
Epoch: 10, step: 1078, loss: 0.3440876305103302, mean loss: 0.3695128963287683
Epoch: 10, step: 1079, loss: 0.3144175112247467, mean loss: 0.3695093463683879
Epoch: 10, step: 1080, loss: 0.32694968581199646, mean loss: 0.36950660429889776
Epoch: 10, step: 1081, loss: 0.36069610714912415, mean loss: 0.3695060366853718
Epoch: 10, step: 1082, loss: 0.38837936520576477, mean loss: 0.3695072525153351
Epoch: 10, step: 1083, loss: 0.339856892824173, mean loss: 0.3695053425462749
Epoch: 10, step: 1084, loss: 0.3584692180156708, mean loss: 0.3695046316847914
Epoch: 10, step: 1085, loss: 0.3357114791870117, mean loss: 0.3695024551323956
Epoch: 10, step: 1086, loss: 0.3179761469364166, mean loss: 0.36949913663505574
Epoch: 10, step: 1087, loss: 0.2882988750934601, mean loss: 0.36949390735494614
Epoch: 10, step: 1088, loss: 0.3248327672481537, mean loss: 0.3694910313719397
Epoch: 10, step: 1089, loss: 0.31361350417137146, mean loss: 0.369487433334129
Epoch: 10, step: 1090, loss: 0.33699819445610046, mean loss: 0.3694853414379936
Epoch: 10, step: 1091, loss: 0.3183034062385559, mean loss: 0.36948204618076985
Epoch: 10, step: 1092, loss: 0.33517131209373474, mean loss: 0.36947983728782663
Epoch: 10, step: 1093, loss: 0.32726535201072693, mean loss: 0.36947711973373387
Epoch: 10, step: 1094, loss: 0.320136696100235, mean loss: 0.3694739436523928
Epoch: 10, step: 1095, loss: 0.346347451210022, mean loss: 0.36947245507795645
Epoch: 10, step: 1096, loss: 0.3631037473678589, mean loss: 0.36947204517207305
Epoch: 10, step: 1097, loss: 0.38874369859695435, mean loss: 0.3694732854638368
Epoch: 10, step: 1098, loss: 0.32425060868263245, mean loss: 0.3694703751943998
Epoch: 10, step: 1099, loss: 0.3271210491657257, mean loss: 0.36946765001254467
Epoch: 10, step: 1100, loss: 0.3658103346824646, mean loss: 0.36946741467921157
Epoch: 10, step: 1101, loss: 0.3680858910083771, mean loss: 0.3694673257895146
Epoch: 10, step: 1102, loss: 0.3717558979988098, mean loss: 0.36946747303085853
Epoch: 10, step: 1103, loss: 0.3383430242538452, mean loss: 0.36946547068598096
Epoch: 10, step: 1104, loss: 0.3381176292896271, mean loss: 0.36946345409920733
Epoch: 10, step: 1105, loss: 0.3083890676498413, mean loss: 0.3694595254753524
Epoch: 10, step: 1106, loss: 0.38218170404434204, mean loss: 0.3694603437797564
Epoch: 10, step: 1107, loss: 0.36039161682128906, mean loss: 0.36945976050686224
Epoch: 10, step: 1108, loss: 0.3424268662929535, mean loss: 0.36945802194526894
Epoch: 10, step: 1109, loss: 0.39786699414253235, mean loss: 0.3694598488888186
Epoch: 10, step: 1110, loss: 0.3196670413017273, mean loss: 0.36945664698491615
Epoch: 10, step: 1111, loss: 0.2929699718952179, mean loss: 0.36945172886023186
Epoch: 10, step: 1112, loss: 0.321647584438324, mean loss: 0.3694486552317086
Epoch: 10, step: 1113, loss: 0.34579169750213623, mean loss: 0.3694471342751875
Epoch: 10, step: 1114, loss: 0.36383581161499023, mean loss: 0.36944677353441857
Epoch: 10, step: 1115, loss: 0.33840030431747437, mean loss: 0.3694447777469914
Epoch: 10, step: 1116, loss: 0.3695225417613983, mean loss: 0.36944478274564246
Epoch: 10, step: 1117, loss: 0.33199435472488403, mean loss: 0.36944237559639315
Epoch: 10, step: 1118, loss: 0.3428746461868286, mean loss: 0.36944066804903086
Epoch: 10, step: 1119, loss: 0.3391149044036865, mean loss: 0.36943871909249837
Epoch: 10, step: 1120, loss: 0.31734538078308105, mean loss: 0.36943537140672567
Epoch: 10, step: 1121, loss: 0.3268028795719147, mean loss: 0.36943263188148245
Epoch: 10, step: 1122, loss: 0.31099942326545715, mean loss: 0.36942887725778417
Epoch: 10, step: 1123, loss: 0.31889718770980835, mean loss: 0.3694256305545236
Epoch: 10, step: 1124, loss: 0.32671719789505005, mean loss: 0.3694228866783489
Epoch: 10, step: 1125, loss: 0.36914166808128357, mean loss: 0.3694228686121407
Epoch: 10, step: 1126, loss: 0.32225608825683594, mean loss: 0.36941983869113115
Epoch: 10, step: 1127, loss: 0.37194374203681946, mean loss: 0.36942000081236354
Epoch: 10, step: 1128, loss: 0.3041410744190216, mean loss: 0.3694158079337976
Epoch: 10, step: 1129, loss: 0.33146828413009644, mean loss: 0.36941337071325786
Epoch: 10, step: 1130, loss: 0.3002045452594757, mean loss: 0.36940892598745645
Epoch: 10, step: 1131, loss: 0.3682190477848053, mean loss: 0.369408849576064
Epoch: 10, step: 1132, loss: 0.3599283993244171, mean loss: 0.3694082408012453
Epoch: 10, step: 1133, loss: 0.34794309735298157, mean loss: 0.36940686253339833
Epoch: 10, step: 1134, loss: 0.36133289337158203, mean loss: 0.36940634414051476
Epoch: 10, step: 1135, loss: 0.38729241490364075, mean loss: 0.3694074924501426
Epoch: 10, step: 1136, loss: 0.3356305658817291, mean loss: 0.3694053240655648
Epoch: 10, step: 1137, loss: 0.3593485951423645, mean loss: 0.36940467849303155
Epoch: 10, step: 1138, loss: 0.3576596677303314, mean loss: 0.36940392459286064
Epoch: 10, step: 1139, loss: 0.32454100251197815, mean loss: 0.3694010450728298
Epoch: 10, step: 1140, loss: 0.33224746584892273, mean loss: 0.3693986605288837
Epoch: 10, step: 1141, loss: 0.32698678970336914, mean loss: 0.3693959386786189
Epoch: 10, step: 1142, loss: 0.3206970691680908, mean loss: 0.3693928135506262
Epoch: 10, step: 1143, loss: 0.2955353856086731, mean loss: 0.36938807423928494
Epoch: 10, step: 1144, loss: 0.3504406809806824, mean loss: 0.369386858493808
Epoch: 10, step: 1145, loss: 0.34324946999549866, mean loss: 0.3693851815152055
Epoch: 10, step: 1146, loss: 0.3391050100326538, mean loss: 0.36938323885969243
Epoch: 10, step: 1147, loss: 0.29161888360977173, mean loss: 0.3693782501276389
Epoch: 10, step: 1148, loss: 0.35543420910835266, mean loss: 0.3693773556481329
Epoch: 10, step: 1149, loss: 0.3274795114994049, mean loss: 0.3693746681661477
Epoch: 10, step: 1150, loss: 0.3534655272960663, mean loss: 0.36937364776072984
Epoch: 10, step: 1151, loss: 0.3166615068912506, mean loss: 0.3693702670436397
Epoch: 10, step: 1152, loss: 0.3975784182548523, mean loss: 0.3693720760702036
Epoch: 10, step: 1153, loss: 0.3546349108219147, mean loss: 0.36937113101664143
Epoch: 10, step: 1154, loss: 0.3071930408477783, mean loss: 0.36936714396372905
Epoch: 10, step: 1155, loss: 0.3483957052230835, mean loss: 0.36936579929594626
Epoch: 10, step: 1156, loss: 0.34130558371543884, mean loss: 0.3693640002182018
Epoch: 10, step: 1157, loss: 0.30578377842903137, mean loss: 0.36935992404037205
Epoch: 10, step: 1158, loss: 0.34321045875549316, mean loss: 0.3693582476851387
Epoch: 10, step: 1159, loss: 0.35891231894493103, mean loss: 0.369357578074322
Epoch: 10, step: 1160, loss: 0.3321356475353241, mean loss: 0.3693551922060739
Epoch: 10, step: 1161, loss: 0.3614196479320526, mean loss: 0.36935468358254653
Epoch: 10, step: 1162, loss: 0.3761026859283447, mean loss: 0.36935511606363003
Epoch: 10, step: 1163, loss: 0.3321229815483093, mean loss: 0.36935273000015173
Epoch: 10, step: 1164, loss: 0.3245798945426941, mean loss: 0.369349860866191
Epoch: 10, step: 1165, loss: 0.3195434808731079, mean loss: 0.3693466693770206
Epoch: 10, step: 1166, loss: 0.36629238724708557, mean loss: 0.36934647367751844
Epoch: 10, step: 1167, loss: 0.3660259544849396, mean loss: 0.3693462609328239
Epoch: 10, step: 1168, loss: 0.37838488817214966, mean loss: 0.3693468399979299
Epoch: 10, step: 1169, loss: 0.33506911993026733, mean loss: 0.3693446441157987
Epoch: 10, step: 1170, loss: 0.3345756530761719, mean loss: 0.3693424169047911
Epoch: 10, step: 1171, loss: 0.34990569949150085, mean loss: 0.36934117191904847
Epoch: 10, step: 1172, loss: 0.365242063999176, mean loss: 0.3693409093745074
Epoch: 10, step: 1173, loss: 0.33268359303474426, mean loss: 0.36933856165346607
Epoch: 10, step: 1174, loss: 0.38376593589782715, mean loss: 0.3693394855967414
Epoch: 10, step: 1175, loss: 0.32267504930496216, mean loss: 0.3693364973515895
Epoch: 10, step: 1176, loss: 0.31703293323516846, mean loss: 0.3693331482087249
Epoch: 10, step: 1177, loss: 0.34102293848991394, mean loss: 0.3693313355432288
Epoch: 10, step: 1178, loss: 0.33568406105041504, mean loss: 0.3693291812904282
Epoch: 10, step: 1179, loss: 0.32798832654953003, mean loss: 0.36932653462879306
Epoch: 10, step: 1180, loss: 0.3371363580226898, mean loss: 0.3693244739299514
Epoch: 10, step: 1181, loss: 0.34679338335990906, mean loss: 0.3693230316632397
Epoch: 10, step: 1182, loss: 0.40088045597076416, mean loss: 0.3693250515969469
Epoch: 10, step: 1183, loss: 0.33194035291671753, mean loss: 0.36932265882309384
Epoch: 10, step: 1184, loss: 0.32276690006256104, mean loss: 0.3693196792545332
Epoch: 10, step: 1185, loss: 0.3714715540409088, mean loss: 0.369319816965706
Epoch: 10, step: 1186, loss: 0.3471444845199585, mean loss: 0.3693183979260665
Epoch: 10, step: 1187, loss: 0.3565168082714081, mean loss: 0.36931757878160437
Epoch: 10, step: 1188, loss: 0.35049712657928467, mean loss: 0.3693163745809388
Epoch: 10, step: 1189, loss: 0.3527604639530182, mean loss: 0.3693153153416152
Epoch: 10, step: 1190, loss: 0.3434131145477295, mean loss: 0.36931365823709256
Epoch: 10, step: 1191, loss: 0.33311209082603455, mean loss: 0.3693113423742848
Epoch: 10, step: 1192, loss: 0.3583616614341736, mean loss: 0.3693106419533202
Epoch: 10, step: 1193, loss: 0.3545331358909607, mean loss: 0.36930969673737657
Epoch: 10, step: 1194, loss: 0.3485189378261566, mean loss: 0.3693083669798511
Epoch: 10, step: 1195, loss: 0.3528321385383606, mean loss: 0.36930731324306154
Epoch: 10, step: 1196, loss: 0.33702513575553894, mean loss: 0.3693052487692183
Epoch: 10, step: 1197, loss: 0.3621421158313751, mean loss: 0.3693047907098157
Epoch: 10, step: 1198, loss: 0.33710190653800964, mean loss: 0.36930273157021776
Epoch: 10, step: 1199, loss: 0.34374967217445374, mean loss: 0.36930109774289066
Epoch: 10, step: 1200, loss: 0.349040687084198, mean loss: 0.3692998024030365
Epoch: 10, step: 1201, loss: 0.3182816207408905, mean loss: 0.36929654078804725
Epoch: 10, step: 1202, loss: 0.36599910259246826, mean loss: 0.3692963299948365
Epoch: 10, step: 1203, loss: 0.3054541051387787, mean loss: 0.36929224905486874
Epoch: 10, step: 1204, loss: 0.3393971025943756, mean loss: 0.3692903382113749
Epoch: 10, step: 1205, loss: 0.3317596912384033, mean loss: 0.36928793947387184
Epoch: 10, step: 1206, loss: 0.3396151661872864, mean loss: 0.36928604308649493
Epoch: 10, step: 1207, loss: 0.31819233298301697, mean loss: 0.3692827778954096
Epoch: 10, step: 1208, loss: 0.3435930907726288, mean loss: 0.3692811362769597
Epoch: 10, step: 1209, loss: 0.31277650594711304, mean loss: 0.3692775257574498
Epoch: 10, step: 1210, loss: 0.3522418439388275, mean loss: 0.3692764372850315
Epoch: 10, step: 1211, loss: 0.35027816891670227, mean loss: 0.36927522349328806
Epoch: 10, step: 1212, loss: 0.3580520451068878, mean loss: 0.36927450649473276
Epoch: 10, step: 1213, loss: 0.3387426733970642, mean loss: 0.36927255607738907
Epoch: 10, step: 1214, loss: 0.3559482991695404, mean loss: 0.3692717049590941
Epoch: 10, step: 1215, loss: 0.3224482238292694, mean loss: 0.3692687141899877
Epoch: 10, step: 1216, loss: 0.36278408765792847, mean loss: 0.3692683000221055
Epoch: 10, step: 1217, loss: 0.3471890687942505, mean loss: 0.36926688992942264
Epoch: 10, step: 1218, loss: 0.3486191928386688, mean loss: 0.36926557134604626
Epoch: 10, step: 1219, loss: 0.3591161072254181, mean loss: 0.36926492323211774
Epoch: 10, step: 1220, loss: 0.3292437791824341, mean loss: 0.3692623677666909
Epoch: 10, step: 1221, loss: 0.3600541949272156, mean loss: 0.3692617798358494
Epoch: 10, step: 1222, loss: 0.36332210898399353, mean loss: 0.36926140061916984
Epoch: 10, step: 1223, loss: 0.34313130378723145, mean loss: 0.3692597324567061
Epoch: 10, step: 1224, loss: 0.3340221047401428, mean loss: 0.3692574830071232
Epoch: 10, step: 1225, loss: 0.3404496908187866, mean loss: 0.3692556441336272
Epoch: 10, step: 1226, loss: 0.3356724977493286, mean loss: 0.3692535005741465
Epoch: 10, step: 1227, loss: 0.33179762959480286, mean loss: 0.3692511099773263
Epoch: 10, step: 1228, loss: 0.34056341648101807, mean loss: 0.369249279120635
Epoch: 10, step: 1229, loss: 0.36832568049430847, mean loss: 0.3692492201800717
Epoch: 10, step: 1230, loss: 0.3858358561992645, mean loss: 0.36925027860876286
Epoch: 10, step: 1231, loss: 0.372528076171875, mean loss: 0.36925048775868397
Epoch: 10, step: 1232, loss: 0.33584219217300415, mean loss: 0.3692483561759885
Epoch: 10, step: 1233, loss: 0.3422994315624237, mean loss: 0.36924663683666137
Epoch: 10, step: 1234, loss: 0.31143918633461, mean loss: 0.36924294896103127
Epoch: 10, step: 1235, loss: 0.32246822118759155, mean loss: 0.36923996511771834
Epoch: 10, step: 1236, loss: 0.3319392800331116, mean loss: 0.369237585792268
Epoch: 10, step: 1237, loss: 0.3417920470237732, mean loss: 0.3692358352157424
Epoch: 10, step: 1238, loss: 0.3304833769798279, mean loss: 0.36923336360031817
Epoch: 10, step: 1239, loss: 0.3502729535102844, mean loss: 0.369232154390491
Epoch: 10, step: 1240, loss: 0.3049676716327667, mean loss: 0.3692280561516824
Epoch: 10, step: 1241, loss: 0.3495989143848419, mean loss: 0.3692268044528068
Epoch: 10, step: 1242, loss: 0.36802124977111816, mean loss: 0.3692267275826492
Epoch: 10, step: 1243, loss: 0.3127276599407196, mean loss: 0.36922312524474804
Epoch: 10, step: 1244, loss: 0.3351253867149353, mean loss: 0.3692209513372868
Epoch: 10, step: 1245, loss: 0.29741472005844116, mean loss: 0.36921637360993254
Epoch: 10, step: 1246, loss: 0.3553980886936188, mean loss: 0.3692154927350096
Epoch: 10, step: 1247, loss: 0.35309159755706787, mean loss: 0.36921446494974836
Epoch: 10, step: 1248, loss: 0.3064141571521759, mean loss: 0.369210462125617
Epoch: 10, step: 1249, loss: 0.3105696141719818, mean loss: 0.36920672465920823
Epoch: 10, step: 1250, loss: 0.32592642307281494, mean loss: 0.36920396637091646
Epoch: 10, step: 1251, loss: 0.3275020718574524, mean loss: 0.36920130884513813
Epoch: 10, step: 1252, loss: 0.33006802201271057, mean loss: 0.36919881516726694
Epoch: 10, step: 1253, loss: 0.3506508469581604, mean loss: 0.3691976333163552
Epoch: 10, step: 1254, loss: 0.37579572200775146, mean loss: 0.36919805371066494
Epoch: 10, step: 1255, loss: 0.3264240324497223, mean loss: 0.3691953285564052
Epoch: 10, step: 1256, loss: 0.32391175627708435, mean loss: 0.36919244370119214
Epoch: 10, step: 1257, loss: 0.33349165320396423, mean loss: 0.3691901694757814
Epoch: 10, step: 1258, loss: 0.36460110545158386, mean loss: 0.369189877160091
Epoch: 10, step: 1259, loss: 0.3414192497730255, mean loss: 0.3691881083303211
Epoch: 10, step: 1260, loss: 0.33718299865722656, mean loss: 0.3691860699181389
Epoch: 10, step: 1261, loss: 0.3453423082828522, mean loss: 0.36918455140064843
Epoch: 10, step: 1262, loss: 0.330434113740921, mean loss: 0.36918208369144256
Epoch: 10, step: 1263, loss: 0.33589664101600647, mean loss: 0.3691799641395656
Epoch: 10, step: 1264, loss: 0.33865490555763245, mean loss: 0.3691780204873159
Epoch: 10, step: 1265, loss: 0.3564601540565491, mean loss: 0.3691772107415862
Epoch: 10, step: 1266, loss: 0.3528573215007782, mean loss: 0.36917617172145245
Epoch: 10, step: 1267, loss: 0.34592461585998535, mean loss: 0.3691746914848939
Epoch: 10, step: 1268, loss: 0.3596763014793396, mean loss: 0.3691740868385125
Epoch: 10, step: 1269, loss: 0.31418395042419434, mean loss: 0.3691705865115606
Epoch: 10, step: 1270, loss: 0.31944793462753296, mean loss: 0.36916742168106703
Epoch: 10, step: 1271, loss: 0.3468479514122009, mean loss: 0.3691660011445173
Epoch: 10, step: 1272, loss: 0.3363298177719116, mean loss: 0.3691639113982325
Epoch: 10, step: 1273, loss: 0.3358398675918579, mean loss: 0.3691617907387056
Epoch: 10, step: 1274, loss: 0.35904139280319214, mean loss: 0.369161146742655
Epoch: 10, step: 1275, loss: 0.33132362365722656, mean loss: 0.3691587391629219
Epoch: 10, step: 1276, loss: 0.3139042556285858, mean loss: 0.369155223575753
Epoch: 10, step: 1277, loss: 0.3220512866973877, mean loss: 0.36915222676083514
Epoch: 10, step: 1278, loss: 0.33028391003608704, mean loss: 0.36914975406430706
Epoch: 10, step: 1279, loss: 0.31043487787246704, mean loss: 0.3691460190212923
Epoch: 10, step: 1280, loss: 0.33339831233024597, mean loss: 0.3691437451387981
Epoch: 10, step: 1281, loss: 0.34285274147987366, mean loss: 0.36914207289584816
Epoch: 10, step: 1282, loss: 0.3869417905807495, mean loss: 0.36914320497736475
Epoch: 10, step: 1283, loss: 0.31780219078063965, mean loss: 0.3691399398403642
Epoch: 10, step: 1284, loss: 0.33527517318725586, mean loss: 0.3691377862780969
Epoch: 10, step: 1285, loss: 0.32740461826324463, mean loss: 0.3691351325093054
Epoch: 10, step: 1286, loss: 0.3036864995956421, mean loss: 0.3691309709633708
Epoch: 10, step: 1287, loss: 0.3136264681816101, mean loss: 0.36912744193852454
Epoch: 10, step: 1288, loss: 0.33945468068122864, mean loss: 0.36912555543834924
Epoch: 10, step: 1289, loss: 0.3049462139606476, mean loss: 0.3691214753784969
Epoch: 10, step: 1290, loss: 0.33899855613708496, mean loss: 0.3691195605021863
Epoch: 10, step: 1291, loss: 0.3331124186515808, mean loss: 0.3691172717186972
Epoch: 10, step: 1292, loss: 0.3364144563674927, mean loss: 0.3691151931058865
Epoch: 10, step: 1293, loss: 0.3180287480354309, mean loss: 0.36911194622365245
Epoch: 10, step: 1294, loss: 0.3675782084465027, mean loss: 0.3691118487506447
Epoch: 10, step: 1295, loss: 0.3400246798992157, mean loss: 0.3691100003032088
Epoch: 10, step: 1296, loss: 0.29919907450675964, mean loss: 0.36910555784748045
Epoch: 10, step: 1297, loss: 0.36616623401641846, mean loss: 0.3691053710814472
Epoch: 10, step: 1298, loss: 0.3560320734977722, mean loss: 0.3691045404506839
Epoch: 10, step: 1299, loss: 0.37823134660720825, mean loss: 0.36910512029859727
Epoch: 10, step: 1300, loss: 0.3491039276123047, mean loss: 0.36910384965551957
Epoch: 10, step: 1301, loss: 0.3316565454006195, mean loss: 0.3691014708406133
Epoch: 10, step: 1302, loss: 0.38427501916885376, mean loss: 0.36910243466887527
Epoch: 10, step: 1303, loss: 0.3629554808139801, mean loss: 0.369102044237355
Epoch: 10, step: 1304, loss: 0.30113548040390015, mean loss: 0.3690977275295853
Epoch: 10, step: 1305, loss: 0.35304445028305054, mean loss: 0.36909670801496275
Epoch: 10, step: 1306, loss: 0.32625362277030945, mean loss: 0.3690939873008429
Epoch: 10, step: 1307, loss: 0.3394899368286133, mean loss: 0.3690921074398782
Epoch: 10, step: 1308, loss: 0.3004046380519867, mean loss: 0.3690877460537973
Epoch: 10, step: 1309, loss: 0.3005235493183136, mean loss: 0.3690833927714649
Epoch: 10, step: 1310, loss: 0.31657111644744873, mean loss: 0.36908005887035866
Epoch: 10, step: 1311, loss: 0.3401086926460266, mean loss: 0.3690782196520864
Epoch: 10, step: 1312, loss: 0.33875572681427, mean loss: 0.369076294781088
Epoch: 10, step: 1313, loss: 0.34455668926239014, mean loss: 0.36907473837601507
Epoch: 10, step: 1314, loss: 0.34872010350227356, mean loss: 0.3690734464283874
Epoch: 10, step: 1315, loss: 0.40165191888809204, mean loss: 0.3690755141151391
Epoch: 10, step: 1316, loss: 0.32902607321739197, mean loss: 0.3690729724231357
Epoch: 10, step: 1317, loss: 0.373087614774704, mean loss: 0.3690732271916565
Epoch: 10, step: 1318, loss: 0.32329094409942627, mean loss: 0.3690703220401182
Epoch: 10, step: 1319, loss: 0.34269049763679504, mean loss: 0.3690686481933921
Epoch: 10, step: 1320, loss: 0.33161020278930664, mean loss: 0.36906627153928356
Epoch: 10, step: 1321, loss: 0.32221829891204834, mean loss: 0.36906329932937193
Epoch: 10, step: 1322, loss: 0.3459545969963074, mean loss: 0.36906183332021547
Epoch: 10, step: 1323, loss: 0.3087247312068939, mean loss: 0.3690580057953415
Epoch: 10, step: 1324, loss: 0.33750036358833313, mean loss: 0.3690560040419506
Epoch: 10, step: 1325, loss: 0.3299328684806824, mean loss: 0.36905352255421997
Epoch: 10, step: 1326, loss: 0.32015177607536316, mean loss: 0.36905042102910557
Epoch: 10, step: 1327, loss: 0.3809136748313904, mean loss: 0.3690511733917262
Epoch: 10, step: 1328, loss: 0.3409186601638794, mean loss: 0.36904938935258436
Epoch: 10, step: 1329, loss: 0.327908992767334, mean loss: 0.36904678057664364
Epoch: 10, step: 1330, loss: 0.3390873670578003, mean loss: 0.3690448809245278
Epoch: 10, step: 1331, loss: 0.333224356174469, mean loss: 0.3690426097778914
Epoch: 10, step: 1332, loss: 0.33420225977897644, mean loss: 0.3690404009178141
Epoch: 10, step: 1333, loss: 0.3479125499725342, mean loss: 0.3690390615079659
Epoch: 10, step: 1334, loss: 0.3196577727794647, mean loss: 0.3690359311568579
Epoch: 10, step: 1335, loss: 0.35080447793006897, mean loss: 0.36903477551200325
Epoch: 10, step: 1336, loss: 0.3524726927280426, mean loss: 0.36903372575078225
Epoch: 10, step: 1337, loss: 0.3609507381916046, mean loss: 0.3690332134559693
Epoch: 10, step: 1338, loss: 0.37477368116378784, mean loss: 0.3690335772602476
Epoch: 10, step: 1339, loss: 0.38170138001441956, mean loss: 0.3690343800360875
Epoch: 10, step: 1340, loss: 0.37881430983543396, mean loss: 0.36903499976422893
Epoch: 10, step: 1341, loss: 0.30189356207847595, mean loss: 0.36903074545947123
Epoch: 10, step: 1342, loss: 0.32962915301322937, mean loss: 0.3690282490017353
Epoch: 10, step: 1343, loss: 0.33735284209251404, mean loss: 0.36902624219693875
Epoch: 10, step: 1344, loss: 0.37079375982284546, mean loss: 0.36902635417144786
Epoch: 10, step: 1345, loss: 0.3283616602420807, mean loss: 0.3690237781741129
Epoch: 10, step: 1346, loss: 0.37547481060028076, mean loss: 0.3690241868035185
Epoch: 10, step: 1347, loss: 0.3358292281627655, mean loss: 0.3690220842599005
Epoch: 10, step: 1348, loss: 0.3367910087108612, mean loss: 0.3690200428972082
Epoch: 10, step: 1349, loss: 0.31847941875457764, mean loss: 0.3690168420977058
Epoch: 10, step: 1350, loss: 0.34728407859802246, mean loss: 0.36901546582239075
Epoch: 10, step: 1351, loss: 0.33501148223876953, mean loss: 0.3690133125812824
Epoch: 10, step: 1352, loss: 0.3409135043621063, mean loss: 0.3690115333241293
Epoch: 10, step: 1353, loss: 0.37194758653640747, mean loss: 0.36901171922087567
Epoch: 10, step: 1354, loss: 0.32429036498069763, mean loss: 0.369008887859417
Epoch: 10, step: 1355, loss: 0.31921276450157166, mean loss: 0.36900573540795095
Epoch: 10, step: 1356, loss: 0.337180495262146, mean loss: 0.36900372076971927
Epoch: 10, step: 1357, loss: 0.3620344400405884, mean loss: 0.3690032796201605
Epoch: 10, step: 1358, loss: 0.3007601797580719, mean loss: 0.3689989601632416
Epoch: 10, step: 1359, loss: 0.35612624883651733, mean loss: 0.36899814543467657
Epoch: 10, step: 1360, loss: 0.3467238247394562, mean loss: 0.36899673575676406
Epoch: 10, step: 1361, loss: 0.3469410240650177, mean loss: 0.3689953400023221
Epoch: 10, step: 1362, loss: 0.3236367404460907, mean loss: 0.3689924697498665
Epoch: 10, step: 1363, loss: 0.2855825424194336, mean loss: 0.3689871919766869
Epoch: 10, step: 1364, loss: 0.32624995708465576, mean loss: 0.3689844879441091
Epoch: 10, step: 1365, loss: 0.31469807028770447, mean loss: 0.36898105339914794
Epoch: 10, step: 1366, loss: 0.3389892876148224, mean loss: 0.36897915602673165
Epoch: 10, step: 1367, loss: 0.3414270579814911, mean loss: 0.36897741310554966
Epoch: 10, step: 1368, loss: 0.3373369574546814, mean loss: 0.36897541168511505
Epoch: 10, step: 1369, loss: 0.29662758111953735, mean loss: 0.36897083560475036
Epoch: 10, step: 1370, loss: 0.3084825277328491, mean loss: 0.3689670098943037
Epoch: 10, step: 1371, loss: 0.3251306712627411, mean loss: 0.368964237548071
Epoch: 10, step: 1372, loss: 0.39081907272338867, mean loss: 0.3689656196283325
Epoch: 10, step: 1373, loss: 0.32933253049850464, mean loss: 0.3689631134256558
Epoch: 10, step: 1374, loss: 0.3250204622745514, mean loss: 0.36896033488306007
Epoch: 10, step: 1375, loss: 0.31396621465682983, mean loss: 0.368956857763673
Epoch: 10, step: 1376, loss: 0.3448960781097412, mean loss: 0.36895533656624907
Epoch: 10, step: 1377, loss: 0.3210099935531616, mean loss: 0.3689523055039774
Epoch: 10, step: 1378, loss: 0.3324248492717743, mean loss: 0.3689499964164098
Epoch: 10, step: 1379, loss: 0.3628523349761963, mean loss: 0.3689496109763693
Epoch: 10, step: 1380, loss: 0.3625512421131134, mean loss: 0.3689492065538383
Epoch: 10, step: 1381, loss: 0.3820498287677765, mean loss: 0.36895003455423103
Epoch: 10, step: 1382, loss: 0.3254248797893524, mean loss: 0.36894728380186015
Epoch: 10, step: 1383, loss: 0.2921695113182068, mean loss: 0.36894243181927144
Epoch: 10, step: 1384, loss: 0.3319661021232605, mean loss: 0.36894009524235544
Epoch: 10, step: 1385, loss: 0.33472248911857605, mean loss: 0.36893793312898987
Epoch: 10, step: 1386, loss: 0.39255571365356445, mean loss: 0.36893942537518465
Epoch: 10, step: 1387, loss: 0.3984362483024597, mean loss: 0.36894128896015604
Epoch: 10, step: 1388, loss: 0.34479188919067383, mean loss: 0.3689397633173631
Epoch: 10, step: 1389, loss: 0.3180762827396393, mean loss: 0.3689365502105673
Epoch: 10, step: 1390, loss: 0.35783764719963074, mean loss: 0.3689358491239012
Epoch: 10, step: 1391, loss: 0.39324790239334106, mean loss: 0.36893738475131843
Epoch: 10, step: 1392, loss: 0.30535203218460083, mean loss: 0.36893336874976684
Epoch: 10, step: 1393, loss: 0.3124217092990875, mean loss: 0.3689297997426018
Epoch: 10, step: 1394, loss: 0.34708619117736816, mean loss: 0.36892842029147677
Epoch: 10, step: 1395, loss: 0.334460973739624, mean loss: 0.3689262437666882
Epoch: 10, step: 1396, loss: 0.37018269300460815, mean loss: 0.36892632310300427
Epoch: 10, step: 1397, loss: 0.3436688184738159, mean loss: 0.36892472836221446
Epoch: 10, step: 1398, loss: 0.34499016404151917, mean loss: 0.3689232172463409
Epoch: 10, step: 1399, loss: 0.36135461926460266, mean loss: 0.3689227394308118
Epoch: 10, step: 1400, loss: 0.3586375415325165, mean loss: 0.3689220901537524
Epoch: 10, step: 1401, loss: 0.34215614199638367, mean loss: 0.3689204005976258
Epoch: 10, step: 1402, loss: 0.3517718017101288, mean loss: 0.3689193181890613
Epoch: 10, step: 1403, loss: 0.3455124795436859, mean loss: 0.3689178408576649
Epoch: 10, step: 1404, loss: 0.32647621631622314, mean loss: 0.36891516230767807
Epoch: 10, step: 1405, loss: 0.31721076369285583, mean loss: 0.36891189937705743
Epoch: 10, step: 1406, loss: 0.31822094321250916, mean loss: 0.3689087006040301
Epoch: 10, step: 1407, loss: 0.3342646360397339, mean loss: 0.36890651458279305
Epoch: 10, step: 1408, loss: 0.38978132605552673, mean loss: 0.36890783168869706
Epoch: 10, step: 1409, loss: 0.3401772677898407, mean loss: 0.36890601903482334
Epoch: 10, step: 1410, loss: 0.3486786186695099, mean loss: 0.36890474293865494
Epoch: 10, step: 1411, loss: 0.3191451132297516, mean loss: 0.3689016039259304
Epoch: 10, step: 1412, loss: 0.36432766914367676, mean loss: 0.3689013154042132
Epoch: 10, step: 1413, loss: 0.4205329418182373, mean loss: 0.3689045720981967
Epoch: 10, step: 1414, loss: 0.3684006631374359, mean loss: 0.36890454031585923
Epoch: 10, step: 1415, loss: 0.3722258508205414, mean loss: 0.3689047497829698
Epoch: 10, step: 1416, loss: 0.38003045320510864, mean loss: 0.3689054514102273
Epoch: 10, step: 1417, loss: 0.3309642970561981, mean loss: 0.3689030588541449
Epoch: 10, step: 1418, loss: 0.3041190505027771, mean loss: 0.36889897385456416
Epoch: 10, step: 1419, loss: 0.4259706735610962, mean loss: 0.36890257232238927
Epoch: 10, step: 1420, loss: 0.34172073006629944, mean loss: 0.36890085856901583
Epoch: 10, step: 1421, loss: 0.3328830301761627, mean loss: 0.36889858786996194
Epoch: 10, step: 1422, loss: 0.3229730427265167, mean loss: 0.368895692733787
Epoch: 10, step: 1423, loss: 0.34793052077293396, mean loss: 0.36889437117730933
Epoch: 10, step: 1424, loss: 0.38503512740135193, mean loss: 0.36889538855872905
Epoch: 10, step: 1425, loss: 0.3321865499019623, mean loss: 0.36889307487924733
Epoch: 10, step: 1426, loss: 0.3116423189640045, mean loss: 0.3688894667141301
Epoch: 10, step: 1427, loss: 0.3569731116294861, mean loss: 0.368888715746454
Epoch: 10, step: 1428, loss: 0.32039275765419006, mean loss: 0.3688856597279215
Epoch: 10, step: 1429, loss: 0.33001360297203064, mean loss: 0.3688832103229589
Epoch: 10, step: 1430, loss: 0.3676525950431824, mean loss: 0.36888313278434887
Epoch: 10, step: 1431, loss: 0.31525561213493347, mean loss: 0.36887975403430795
Epoch: 10, step: 1432, loss: 0.36009302735328674, mean loss: 0.36887920046997347
Epoch: 10, step: 1433, loss: 0.3100441098213196, mean loss: 0.36887549408905823
Epoch: 10, step: 1434, loss: 0.3662334084510803, mean loss: 0.36887532765846687
Epoch: 10, step: 1435, loss: 0.3021204471588135, mean loss: 0.3688711228914916
Epoch: 10, step: 1436, loss: 0.305610716342926, mean loss: 0.3688671384859648
Epoch: 10, step: 1437, loss: 0.32240918278694153, mean loss: 0.36886421255349855
Epoch: 10, step: 1438, loss: 0.33681514859199524, mean loss: 0.3688621942233794
Epoch: 10, step: 1439, loss: 0.3311900496482849, mean loss: 0.3688598219220837
Epoch: 10, step: 1440, loss: 0.30884262919425964, mean loss: 0.3688560427398705
Epoch: 10, step: 1441, loss: 0.34024176001548767, mean loss: 0.3688542410598098
Epoch: 10, step: 1442, loss: 0.34956374764442444, mean loss: 0.3688530265226685
Epoch: 10, step: 1443, loss: 0.38812175393104553, mean loss: 0.3688542396130367
Valid: 10, mean loss: 0.19616134713093442
Epoch: 11, step: 0, loss: 0.3585706949234009, mean loss: 0.368853592238489
Epoch: 11, step: 1, loss: 0.31462669372558594, mean loss: 0.36885017873612763
Epoch: 11, step: 2, loss: 0.35371941328048706, mean loss: 0.3688492263369676
Epoch: 11, step: 3, loss: 0.32422423362731934, mean loss: 0.3688464176138615
Epoch: 11, step: 4, loss: 0.34357529878616333, mean loss: 0.36884482713498756
Epoch: 11, step: 5, loss: 0.34830278158187866, mean loss: 0.36884353436937695
Epoch: 11, step: 6, loss: 0.3024773895740509, mean loss: 0.3688393580340428
Epoch: 11, step: 7, loss: 0.3351130485534668, mean loss: 0.36883723581471983
Epoch: 11, step: 8, loss: 0.41537895798683167, mean loss: 0.3688401642563087
Epoch: 11, step: 9, loss: 0.3281409442424774, mean loss: 0.3688376035906479
Epoch: 11, step: 10, loss: 0.32828328013420105, mean loss: 0.36883505220194346
Epoch: 11, step: 11, loss: 0.33524173498153687, mean loss: 0.36883293888304436
Epoch: 11, step: 12, loss: 0.35026493668556213, mean loss: 0.36883177086378305
Epoch: 11, step: 13, loss: 0.38380786776542664, mean loss: 0.36883271287516195
Epoch: 11, step: 14, loss: 0.4117419123649597, mean loss: 0.3688354117366935
Epoch: 11, step: 15, loss: 0.3085538148880005, mean loss: 0.3688316204412942
Epoch: 11, step: 16, loss: 0.3198906183242798, mean loss: 0.3688285425844225
Epoch: 11, step: 17, loss: 0.36377280950546265, mean loss: 0.36882822465377985
Epoch: 11, step: 18, loss: 0.3528560698032379, mean loss: 0.3688272203052387
Epoch: 11, step: 19, loss: 0.39071014523506165, mean loss: 0.3688285962436774
Epoch: 11, step: 20, loss: 0.35836106538772583, mean loss: 0.3688279381153621
Epoch: 11, step: 21, loss: 0.34831276535987854, mean loss: 0.36882664833963247
Epoch: 11, step: 22, loss: 0.3465501368045807, mean loss: 0.3688252479177091
Epoch: 11, step: 23, loss: 0.30597683787345886, mean loss: 0.36882129717531253
Epoch: 11, step: 24, loss: 0.34945887327194214, mean loss: 0.36882008010171247
Epoch: 11, step: 25, loss: 0.32175618410110474, mean loss: 0.3688171219687143
Epoch: 11, step: 26, loss: 0.3844878673553467, mean loss: 0.3688181068688077
Epoch: 11, step: 27, loss: 0.39755573868751526, mean loss: 0.3688199129039899
Epoch: 11, step: 28, loss: 0.34494292736053467, mean loss: 0.3688184124335856
Epoch: 11, step: 29, loss: 0.33581826090812683, mean loss: 0.3688163387782177
Epoch: 11, step: 30, loss: 0.31686943769454956, mean loss: 0.3688130747567861
Epoch: 11, step: 31, loss: 0.4057387709617615, mean loss: 0.36881539479298897
Epoch: 11, step: 32, loss: 0.3299838602542877, mean loss: 0.36881295516651796
Epoch: 11, step: 33, loss: 0.3422132432460785, mean loss: 0.36881128412041164
Epoch: 11, step: 34, loss: 0.3298845589160919, mean loss: 0.3688088388207569
Epoch: 11, step: 35, loss: 0.3232061564922333, mean loss: 0.36880597433066087
Epoch: 11, step: 36, loss: 0.34861546754837036, mean loss: 0.36880470616240624
Epoch: 11, step: 37, loss: 0.3245350122451782, mean loss: 0.36880192575203585
Epoch: 11, step: 38, loss: 0.329260915517807, mean loss: 0.36879944248818897
Epoch: 11, step: 39, loss: 0.3115386664867401, mean loss: 0.36879584660926396
Epoch: 11, step: 40, loss: 0.3395162522792816, mean loss: 0.3687940080162134
Epoch: 11, step: 41, loss: 0.3228311538696289, mean loss: 0.36879112198995784
Epoch: 11, step: 42, loss: 0.35690179467201233, mean loss: 0.36879037550114524
Epoch: 11, step: 43, loss: 0.32376599311828613, mean loss: 0.3687875487568972
Epoch: 11, step: 44, loss: 0.34158822894096375, mean loss: 0.3687858412222236
Epoch: 11, step: 45, loss: 0.3371916711330414, mean loss: 0.3687838579096003
Epoch: 11, step: 46, loss: 0.36070239543914795, mean loss: 0.368783350630555
Epoch: 11, step: 47, loss: 0.3045351505279541, mean loss: 0.36877931797928065
Epoch: 11, step: 48, loss: 0.2908251881599426, mean loss: 0.36877442535831667
Epoch: 11, step: 49, loss: 0.34998127818107605, mean loss: 0.368773245921441
Epoch: 11, step: 50, loss: 0.3343196213245392, mean loss: 0.3687710837862294
Epoch: 11, step: 51, loss: 0.38061225414276123, mean loss: 0.368771826831558
Epoch: 11, step: 52, loss: 0.3556331396102905, mean loss: 0.36877100241747623
Epoch: 11, step: 53, loss: 0.37734583020210266, mean loss: 0.36877154042900745
Epoch: 11, step: 54, loss: 0.3271838426589966, mean loss: 0.3687689312504034
Epoch: 11, step: 55, loss: 0.3216247260570526, mean loss: 0.3687659736465644
Epoch: 11, step: 56, loss: 0.311628520488739, mean loss: 0.36876238933860644
Epoch: 11, step: 57, loss: 0.32482078671455383, mean loss: 0.36875963299670306
Epoch: 11, step: 58, loss: 0.3303474187850952, mean loss: 0.3687572236500173
Epoch: 11, step: 59, loss: 0.36731305718421936, mean loss: 0.36875713307259217
Epoch: 11, step: 60, loss: 0.3214483857154846, mean loss: 0.3687541660768344
Epoch: 11, step: 61, loss: 0.30697062611579895, mean loss: 0.36875029152898786
Epoch: 11, step: 62, loss: 0.3123953938484192, mean loss: 0.3687467576418818
Epoch: 11, step: 63, loss: 0.413387656211853, mean loss: 0.36874955679529103
Epoch: 11, step: 64, loss: 0.32794150710105896, mean loss: 0.3687469981364601
Epoch: 11, step: 65, loss: 0.3847678303718567, mean loss: 0.36874800257735263
Epoch: 11, step: 66, loss: 0.3645322024822235, mean loss: 0.3687477382804374
Epoch: 11, step: 67, loss: 0.4195670485496521, mean loss: 0.3687509240446218
Epoch: 11, step: 68, loss: 0.3384636342525482, mean loss: 0.3687490255120704
Epoch: 11, step: 69, loss: 0.36323678493499756, mean loss: 0.36874868000369776
Epoch: 11, step: 70, loss: 0.340711385011673, mean loss: 0.3687469227304297
Epoch: 11, step: 71, loss: 0.350315660238266, mean loss: 0.368745767599915
Epoch: 11, step: 72, loss: 0.3084125518798828, mean loss: 0.3687419866125289
Epoch: 11, step: 73, loss: 0.32150858640670776, mean loss: 0.36873902675539105
Epoch: 11, step: 74, loss: 0.31165313720703125, mean loss: 0.368735449721144
Epoch: 11, step: 75, loss: 0.3593578636646271, mean loss: 0.36873486215309537
Epoch: 11, step: 76, loss: 0.3751903176307678, mean loss: 0.368735266604914
Epoch: 11, step: 77, loss: 0.32476940751075745, mean loss: 0.3687325121970018
Epoch: 11, step: 78, loss: 0.3241114616394043, mean loss: 0.36872971691725753
Epoch: 11, step: 79, loss: 0.31396546959877014, mean loss: 0.36872628643321104
Epoch: 11, step: 80, loss: 0.38128387928009033, mean loss: 0.36872707300338625
Epoch: 11, step: 81, loss: 0.3529140055179596, mean loss: 0.368726082582023
Epoch: 11, step: 82, loss: 0.3492625951766968, mean loss: 0.3687248635999096
Epoch: 11, step: 83, loss: 0.3310544788837433, mean loss: 0.3687225044826303
Epoch: 11, step: 84, loss: 0.3253058195114136, mean loss: 0.3687197856721242
Epoch: 11, step: 85, loss: 0.30930203199386597, mean loss: 0.36871606508642113
Epoch: 11, step: 86, loss: 0.3734893202781677, mean loss: 0.36871636395657276
Epoch: 11, step: 87, loss: 0.3498479425907135, mean loss: 0.36871518261288594
Epoch: 11, step: 88, loss: 0.34892797470092773, mean loss: 0.36871394382193173
Epoch: 11, step: 89, loss: 0.3421233594417572, mean loss: 0.3687122792054061
Epoch: 11, step: 90, loss: 0.32935208082199097, mean loss: 0.3687098153432225
Epoch: 11, step: 91, loss: 0.36606302857398987, mean loss: 0.36870964967054043
Epoch: 11, step: 92, loss: 0.37666597962379456, mean loss: 0.3687101476570181
Epoch: 11, step: 93, loss: 0.3139178156852722, mean loss: 0.36870671842107045
Epoch: 11, step: 94, loss: 0.380982905626297, mean loss: 0.36870748669112524
Epoch: 11, step: 95, loss: 0.3349659740924835, mean loss: 0.36870537520723295
Epoch: 11, step: 96, loss: 0.30004724860191345, mean loss: 0.36870107897254145
Epoch: 11, step: 97, loss: 0.3197233974933624, mean loss: 0.3686980144198272
Epoch: 11, step: 98, loss: 0.3249073326587677, mean loss: 0.36869527459114915
Epoch: 11, step: 99, loss: 0.33144766092300415, mean loss: 0.3686929442849887
Epoch: 11, step: 100, loss: 0.30632975697517395, mean loss: 0.36868904292825994
Epoch: 11, step: 101, loss: 0.3292846977710724, mean loss: 0.36868657799987525
Epoch: 11, step: 102, loss: 0.33617064356803894, mean loss: 0.36868454410143076
Epoch: 11, step: 103, loss: 0.32407358288764954, mean loss: 0.36868175382364654
Epoch: 11, step: 104, loss: 0.37555965781211853, mean loss: 0.3686821839883841
Epoch: 11, step: 105, loss: 0.29679450392723083, mean loss: 0.3686776881985116
Epoch: 11, step: 106, loss: 0.35632196068763733, mean loss: 0.36867691553091664
Epoch: 11, step: 107, loss: 0.30253562331199646, mean loss: 0.3686727796322036
Epoch: 11, step: 108, loss: 0.3455428183078766, mean loss: 0.3686713333768841
Epoch: 11, step: 109, loss: 0.33866173028945923, mean loss: 0.36866945707307724
Epoch: 11, step: 110, loss: 0.3543260395526886, mean loss: 0.3686685603292498
Epoch: 11, step: 111, loss: 0.3525027930736542, mean loss: 0.368667549716143
Epoch: 11, step: 112, loss: 0.32512956857681274, mean loss: 0.3686648280820154
Epoch: 11, step: 113, loss: 0.3407911956310272, mean loss: 0.36866308576219725
Epoch: 11, step: 114, loss: 0.3682677745819092, mean loss: 0.3686630610537042
Epoch: 11, step: 115, loss: 0.40145039558410645, mean loss: 0.36866511026211235
Epoch: 11, step: 116, loss: 0.34081029891967773, mean loss: 0.3686633694452045
Epoch: 11, step: 117, loss: 0.3474069833755493, mean loss: 0.3686620410871199
Epoch: 11, step: 118, loss: 0.3389677107334137, mean loss: 0.368660185539388
Epoch: 11, step: 119, loss: 0.31298205256462097, mean loss: 0.3686567065258305
Epoch: 11, step: 120, loss: 0.39948081970214844, mean loss: 0.3686586324310586
Epoch: 11, step: 121, loss: 0.30094602704048157, mean loss: 0.368654401979641
Epoch: 11, step: 122, loss: 0.33947691321372986, mean loss: 0.3686525791840662
Epoch: 11, step: 123, loss: 0.35897403955459595, mean loss: 0.36865197457764254
Epoch: 11, step: 124, loss: 0.34064459800720215, mean loss: 0.3686502251006877
Epoch: 11, step: 125, loss: 0.33019596338272095, mean loss: 0.36864782321051165
Epoch: 11, step: 126, loss: 0.34724321961402893, mean loss: 0.36864648634188407
Epoch: 11, step: 127, loss: 0.3547045886516571, mean loss: 0.3686456156263151
Epoch: 11, step: 128, loss: 0.3401433527469635, mean loss: 0.3686438356810906
Epoch: 11, step: 129, loss: 0.32343560457229614, mean loss: 0.36864101263681004
Epoch: 11, step: 130, loss: 0.34777936339378357, mean loss: 0.3686397100049497
Epoch: 11, step: 131, loss: 0.36793819069862366, mean loss: 0.36863966620379424
Epoch: 11, step: 132, loss: 0.31869763135910034, mean loss: 0.3686365481395597
Epoch: 11, step: 133, loss: 0.32317814230918884, mean loss: 0.36863371018189767
Epoch: 11, step: 134, loss: 0.33706822991371155, mean loss: 0.3686317396793527
Epoch: 11, step: 135, loss: 0.37806689739227295, mean loss: 0.3686323286405083
Epoch: 11, step: 136, loss: 0.33755579590797424, mean loss: 0.3686303889031179
Epoch: 11, step: 137, loss: 0.36904895305633545, mean loss: 0.3686304150274565
Epoch: 11, step: 138, loss: 0.3174917697906494, mean loss: 0.3686272234500218
Epoch: 11, step: 139, loss: 0.28574222326278687, mean loss: 0.36862205089634065
Epoch: 11, step: 140, loss: 0.3133690059185028, mean loss: 0.3686186029684169
Epoch: 11, step: 141, loss: 0.3238150179386139, mean loss: 0.36861580728733434
Epoch: 11, step: 142, loss: 0.32025855779647827, mean loss: 0.36861279005082775
Epoch: 11, step: 143, loss: 0.3473823070526123, mean loss: 0.3686114654636679
Epoch: 11, step: 144, loss: 0.38893741369247437, mean loss: 0.3686127335370492
Epoch: 11, step: 145, loss: 0.3340741991996765, mean loss: 0.3686105789185628
Epoch: 11, step: 146, loss: 0.30044084787368774, mean loss: 0.3686063265493379
Epoch: 11, step: 147, loss: 0.3454228341579437, mean loss: 0.36860488047321566
Epoch: 11, step: 148, loss: 0.35033118724823, mean loss: 0.36860374071813395
Epoch: 11, step: 149, loss: 0.3343197703361511, mean loss: 0.3686016025136696
Epoch: 11, step: 150, loss: 0.34121963381767273, mean loss: 0.3685998948760833
Epoch: 11, step: 151, loss: 0.3440351188182831, mean loss: 0.3685983630242463
Epoch: 11, step: 152, loss: 0.3439164459705353, mean loss: 0.3685968239635084
Epoch: 11, step: 153, loss: 0.33026885986328125, mean loss: 0.3685944341415792
Epoch: 11, step: 154, loss: 0.3292728066444397, mean loss: 0.36859198251569875
Epoch: 11, step: 155, loss: 0.3473217487335205, mean loss: 0.3685906564412734
Epoch: 11, step: 156, loss: 0.3285503387451172, mean loss: 0.368588160317734
Epoch: 11, step: 157, loss: 0.3103941082954407, mean loss: 0.3685845327119478
Epoch: 11, step: 158, loss: 0.33017006516456604, mean loss: 0.36858213824286173
Epoch: 11, step: 159, loss: 0.34879887104034424, mean loss: 0.3685809051795856
Epoch: 11, step: 160, loss: 0.3434218764305115, mean loss: 0.36857933715037094
Epoch: 11, step: 161, loss: 0.30062103271484375, mean loss: 0.36857510193259485
Epoch: 11, step: 162, loss: 0.33160069584846497, mean loss: 0.3685727978006023
Epoch: 11, step: 163, loss: 0.3404443562030792, mean loss: 0.36857104503131033
Epoch: 11, step: 164, loss: 0.3532217741012573, mean loss: 0.3685700886308536
Epoch: 11, step: 165, loss: 0.32581642270088196, mean loss: 0.3685674248510449
Epoch: 11, step: 166, loss: 0.3537490665912628, mean loss: 0.36856650164636856
Epoch: 11, step: 167, loss: 0.3378061056137085, mean loss: 0.3685645853495811
Epoch: 11, step: 168, loss: 0.38636457920074463, mean loss: 0.3685656941762086
Epoch: 11, step: 169, loss: 0.32992297410964966, mean loss: 0.36856328712998543
Epoch: 11, step: 170, loss: 0.33570337295532227, mean loss: 0.36856124042091193
Epoch: 11, step: 171, loss: 0.34463274478912354, mean loss: 0.36855975010603703
Epoch: 11, step: 172, loss: 0.31815260648727417, mean loss: 0.36855661084318475
Epoch: 11, step: 173, loss: 0.31257861852645874, mean loss: 0.3685531248553708
Epoch: 11, step: 174, loss: 0.334262877702713, mean loss: 0.3685509895887195
Epoch: 11, step: 175, loss: 0.31716781854629517, mean loss: 0.3685477901384678
Epoch: 11, step: 176, loss: 0.3136161267757416, mean loss: 0.36854436994898004
Epoch: 11, step: 177, loss: 0.3560248911380768, mean loss: 0.36854359050191177
Epoch: 11, step: 178, loss: 0.3401358425617218, mean loss: 0.36854182198121577
Epoch: 11, step: 179, loss: 0.3152993321418762, mean loss: 0.3685385075831929
Epoch: 11, step: 180, loss: 0.33147087693214417, mean loss: 0.36853620022989997
Epoch: 11, step: 181, loss: 0.3111845850944519, mean loss: 0.3685326304791757
Epoch: 11, step: 182, loss: 0.2809305489063263, mean loss: 0.3685271781805778
Epoch: 11, step: 183, loss: 0.34065452218055725, mean loss: 0.36852544351191957
Epoch: 11, step: 184, loss: 0.31747278571128845, mean loss: 0.3685222664220073
Epoch: 11, step: 185, loss: 0.3495542109012604, mean loss: 0.3685210860825225
Epoch: 11, step: 186, loss: 0.3123757839202881, mean loss: 0.36851759250389254
Epoch: 11, step: 187, loss: 0.3356454074382782, mean loss: 0.3685155471962105
Epoch: 11, step: 188, loss: 0.38631460070610046, mean loss: 0.36851665458459537
Epoch: 11, step: 189, loss: 0.35536500811576843, mean loss: 0.3685158363908372
Epoch: 11, step: 190, loss: 0.38715773820877075, mean loss: 0.36851699607368743
Epoch: 11, step: 191, loss: 0.3100673258304596, mean loss: 0.3685133602395096
Epoch: 11, step: 192, loss: 0.3598855137825012, mean loss: 0.3685128235817714
Epoch: 11, step: 193, loss: 0.36463063955307007, mean loss: 0.36851258212238414
Epoch: 11, step: 194, loss: 0.35199207067489624, mean loss: 0.36851155466349694
Epoch: 11, step: 195, loss: 0.327113538980484, mean loss: 0.3685089801600341
Epoch: 11, step: 196, loss: 0.3324737846851349, mean loss: 0.3685067393046473
Epoch: 11, step: 197, loss: 0.36071276664733887, mean loss: 0.3685062546651337
Epoch: 11, step: 198, loss: 0.31855154037475586, mean loss: 0.3685031486081611
Epoch: 11, step: 199, loss: 0.31645944714546204, mean loss: 0.36849991286447403
Epoch: 11, step: 200, loss: 0.3190128207206726, mean loss: 0.36849683626564633
Epoch: 11, step: 201, loss: 0.36956557631492615, mean loss: 0.368496902704789
Epoch: 11, step: 202, loss: 0.36960074305534363, mean loss: 0.36849697132170645
Epoch: 11, step: 203, loss: 0.2857822775840759, mean loss: 0.3684918299309968
Epoch: 11, step: 204, loss: 0.33017268776893616, mean loss: 0.3684894482328078
Epoch: 11, step: 205, loss: 0.3199140131473541, mean loss: 0.3684864292498939
Epoch: 11, step: 206, loss: 0.3483980596065521, mean loss: 0.3684851808271953
Epoch: 11, step: 207, loss: 0.35586175322532654, mean loss: 0.36848439637357844
Epoch: 11, step: 208, loss: 0.3093787729740143, mean loss: 0.3684807236199962
Epoch: 11, step: 209, loss: 0.31399255990982056, mean loss: 0.3684773380002801
Epoch: 11, step: 210, loss: 0.3254280984401703, mean loss: 0.36847466330381784
Epoch: 11, step: 211, loss: 0.3819635510444641, mean loss: 0.3684755013311377
Epoch: 11, step: 212, loss: 0.3351908326148987, mean loss: 0.36847343357511386
Epoch: 11, step: 213, loss: 0.35060951113700867, mean loss: 0.36847232387686324
Epoch: 11, step: 214, loss: 0.3489045202732086, mean loss: 0.3684711084098402
Epoch: 11, step: 215, loss: 0.31724098324775696, mean loss: 0.3684679264144885
Epoch: 11, step: 216, loss: 0.32140830159187317, mean loss: 0.3684650036379639
Epoch: 11, step: 217, loss: 0.3301468789577484, mean loss: 0.36846262392583623
Epoch: 11, step: 218, loss: 0.35630926489830017, mean loss: 0.3684618691994481
Epoch: 11, step: 219, loss: 0.35897722840309143, mean loss: 0.36846128023765
Epoch: 11, step: 220, loss: 0.3215808570384979, mean loss: 0.3684583693141356
Epoch: 11, step: 221, loss: 0.354153037071228, mean loss: 0.36845748111518845
Epoch: 11, step: 222, loss: 0.30577415227890015, mean loss: 0.3684535894327624
Epoch: 11, step: 223, loss: 0.3101784288883209, mean loss: 0.36844997165522675
Epoch: 11, step: 224, loss: 0.31432875990867615, mean loss: 0.36844661196736617
Epoch: 11, step: 225, loss: 0.34042540192604065, mean loss: 0.36844487259989
Epoch: 11, step: 226, loss: 0.31665387749671936, mean loss: 0.36844165796423095
Epoch: 11, step: 227, loss: 0.3896183669567108, mean loss: 0.36844297230813566
Epoch: 11, step: 228, loss: 0.38046982884407043, mean loss: 0.3684437187151695
Epoch: 11, step: 229, loss: 0.33478665351867676, mean loss: 0.3684416300304732
Epoch: 11, step: 230, loss: 0.34833061695098877, mean loss: 0.36844038206192964
Epoch: 11, step: 231, loss: 0.3508645296096802, mean loss: 0.3684392914778857
Epoch: 11, step: 232, loss: 0.33675119280815125, mean loss: 0.368437325349036
Epoch: 11, step: 233, loss: 0.34602880477905273, mean loss: 0.36843593506980965
Epoch: 11, step: 234, loss: 0.32015207409858704, mean loss: 0.3684329396072517
Epoch: 11, step: 235, loss: 0.32472294569015503, mean loss: 0.36843022806916753
Epoch: 11, step: 236, loss: 0.3052050769329071, mean loss: 0.36842630615668465
Epoch: 11, step: 237, loss: 0.3293897211551666, mean loss: 0.3684238848327173
Epoch: 11, step: 238, loss: 0.33081191778182983, mean loss: 0.3684215520182876
Epoch: 11, step: 239, loss: 0.3314652442932129, mean loss: 0.3684192600121027
Epoch: 11, step: 240, loss: 0.29995501041412354, mean loss: 0.3684150141671664
Epoch: 11, step: 241, loss: 0.31722497940063477, mean loss: 0.3684118397882276
Epoch: 11, step: 242, loss: 0.3174152076244354, mean loss: 0.3684086775985976
Epoch: 11, step: 243, loss: 0.34310197830200195, mean loss: 0.36840710848281777
Epoch: 11, step: 244, loss: 0.31614911556243896, mean loss: 0.3684038684807767
Epoch: 11, step: 245, loss: 0.3404824435710907, mean loss: 0.3684021374562938
Epoch: 11, step: 246, loss: 0.3292244076728821, mean loss: 0.3683997087333514
Epoch: 11, step: 247, loss: 0.3239270746707916, mean loss: 0.36839695193729005
Epoch: 11, step: 248, loss: 0.3473377227783203, mean loss: 0.36839564658619856
Epoch: 11, step: 249, loss: 0.3484821021556854, mean loss: 0.3683944123265958
Epoch: 11, step: 250, loss: 0.3560613691806793, mean loss: 0.36839364796073615
Epoch: 11, step: 251, loss: 0.33818554878234863, mean loss: 0.36839177586733146
Epoch: 11, step: 252, loss: 0.3362494111061096, mean loss: 0.36838978402468653
Epoch: 11, step: 253, loss: 0.2888563275337219, mean loss: 0.36838485569053786
Epoch: 11, step: 254, loss: 0.33540070056915283, mean loss: 0.3683828119359607
Epoch: 11, step: 255, loss: 0.29953819513320923, mean loss: 0.3683785464702356
Epoch: 11, step: 256, loss: 0.31382742524147034, mean loss: 0.36837516680842847
Epoch: 11, step: 257, loss: 0.3439120650291443, mean loss: 0.3683736513145752
Epoch: 11, step: 258, loss: 0.34649795293807983, mean loss: 0.3683722961948096
Epoch: 11, step: 259, loss: 0.3557857275009155, mean loss: 0.36837151655106
Epoch: 11, step: 260, loss: 0.3954432010650635, mean loss: 0.3683731933354833
Epoch: 11, step: 261, loss: 0.3369840383529663, mean loss: 0.3683712492530491
Epoch: 11, step: 262, loss: 0.35009557008743286, mean loss: 0.3683701174218008
Epoch: 11, step: 263, loss: 0.36625754833221436, mean loss: 0.368369986596368
Epoch: 11, step: 264, loss: 0.3833540380001068, mean loss: 0.3683709144588613
Epoch: 11, step: 265, loss: 0.30775508284568787, mean loss: 0.3683671611565942
Epoch: 11, step: 266, loss: 0.3589334189891815, mean loss: 0.3683665770601192
Epoch: 11, step: 267, loss: 0.3313145637512207, mean loss: 0.36836428310189057
Epoch: 11, step: 268, loss: 0.3395426273345947, mean loss: 0.3683624988106897
Epoch: 11, step: 269, loss: 0.3478425145149231, mean loss: 0.3683612285380454
Epoch: 11, step: 270, loss: 0.30930522084236145, mean loss: 0.36835757295106336
Epoch: 11, step: 271, loss: 0.3269525468349457, mean loss: 0.3683550101244902
Epoch: 11, step: 272, loss: 0.3400465250015259, mean loss: 0.36835325803653307
Epoch: 11, step: 273, loss: 0.3516150712966919, mean loss: 0.36835222212944435
Epoch: 11, step: 274, loss: 0.3346174657344818, mean loss: 0.3683501344534499
Epoch: 11, step: 275, loss: 0.3215843737125397, mean loss: 0.368347240532612
Epoch: 11, step: 276, loss: 0.351671427488327, mean loss: 0.36834620867734036
Epoch: 11, step: 277, loss: 0.32049280405044556, mean loss: 0.36834324781824945
Epoch: 11, step: 278, loss: 0.34217920899391174, mean loss: 0.3683416290569536
Epoch: 11, step: 279, loss: 0.3735480308532715, mean loss: 0.36834195115555524
Epoch: 11, step: 280, loss: 0.3547622561454773, mean loss: 0.3683411110878157
Epoch: 11, step: 281, loss: 0.3144242763519287, mean loss: 0.36833777588833927
Epoch: 11, step: 282, loss: 0.35086846351623535, mean loss: 0.36833669533459573
Epoch: 11, step: 283, loss: 0.3498995006084442, mean loss: 0.3683355549836107
Epoch: 11, step: 284, loss: 0.35149073600769043, mean loss: 0.36833451318640764
Epoch: 11, step: 285, loss: 0.34565258026123047, mean loss: 0.3683331104694673
Epoch: 11, step: 286, loss: 0.3388102650642395, mean loss: 0.3683312848034352
Epoch: 11, step: 287, loss: 0.3786832094192505, mean loss: 0.3683319249174975
Epoch: 11, step: 288, loss: 0.3296111822128296, mean loss: 0.3683295307579288
Epoch: 11, step: 289, loss: 0.3007226884365082, mean loss: 0.36832535078746254
Epoch: 11, step: 290, loss: 0.3607270419597626, mean loss: 0.36832488103112077
Epoch: 11, step: 291, loss: 0.347623348236084, mean loss: 0.3683236012627729
Epoch: 11, step: 292, loss: 0.32961058616638184, mean loss: 0.36832120817288627
Epoch: 11, step: 293, loss: 0.3110041320323944, mean loss: 0.3683176652704175
Epoch: 11, step: 294, loss: 0.3327476978302002, mean loss: 0.36831546674347265
Epoch: 11, step: 295, loss: 0.35828107595443726, mean loss: 0.3683148465709888
Epoch: 11, step: 296, loss: 0.342107355594635, mean loss: 0.3683132269250475
Epoch: 11, step: 297, loss: 0.3683013916015625, mean loss: 0.3683132261936593
Epoch: 11, step: 298, loss: 0.33156996965408325, mean loss: 0.3683109557087962
Epoch: 11, step: 299, loss: 0.3580067455768585, mean loss: 0.3683103190176116
Epoch: 11, step: 300, loss: 0.3227769136428833, mean loss: 0.3683075057086604
Epoch: 11, step: 301, loss: 0.3255826234817505, mean loss: 0.3683048660890986
Epoch: 11, step: 302, loss: 0.30421051383018494, mean loss: 0.36830090647012914
Epoch: 11, step: 303, loss: 0.2981686294078827, mean loss: 0.368296574108067
Epoch: 11, step: 304, loss: 0.3464055061340332, mean loss: 0.3682952218894016
Epoch: 11, step: 305, loss: 0.33115747570991516, mean loss: 0.36829292801996494
Epoch: 11, step: 306, loss: 0.3208678960800171, mean loss: 0.36828999892158065
Epoch: 11, step: 307, loss: 0.3455219864845276, mean loss: 0.36828859279433035
Epoch: 11, step: 308, loss: 0.3309023678302765, mean loss: 0.3682862840050409
Epoch: 11, step: 309, loss: 0.35323217511177063, mean loss: 0.3682853543947597
Epoch: 11, step: 310, loss: 0.33612000942230225, mean loss: 0.36828336826663544
Epoch: 11, step: 311, loss: 0.3621436655521393, mean loss: 0.36828298917903884
Epoch: 11, step: 312, loss: 0.34078314900398254, mean loss: 0.3682812913436264
Epoch: 11, step: 313, loss: 0.32786741852760315, mean loss: 0.3682787963520956
Epoch: 11, step: 314, loss: 0.36269843578338623, mean loss: 0.3682784518641291
Epoch: 11, step: 315, loss: 0.3531600534915924, mean loss: 0.3682775186296617
Epoch: 11, step: 316, loss: 0.29920047521591187, mean loss: 0.3682732548778307
Epoch: 11, step: 317, loss: 0.310348778963089, mean loss: 0.36826967973427344
Epoch: 11, step: 318, loss: 0.33220380544662476, mean loss: 0.36826745385793647
Epoch: 11, step: 319, loss: 0.3406696617603302, mean loss: 0.3682657507110531
Epoch: 11, step: 320, loss: 0.3240680992603302, mean loss: 0.36826302330275623
Epoch: 11, step: 321, loss: 0.3258644938468933, mean loss: 0.3682604070785519
Epoch: 11, step: 322, loss: 0.33431899547576904, mean loss: 0.36825831283460775
Epoch: 11, step: 323, loss: 0.3051553964614868, mean loss: 0.36825441951548304
Epoch: 11, step: 324, loss: 0.3054407835006714, mean loss: 0.36825054428345055
Epoch: 11, step: 325, loss: 0.337930828332901, mean loss: 0.36824867385063437
Epoch: 11, step: 326, loss: 0.33359116315841675, mean loss: 0.36824653594978357
Epoch: 11, step: 327, loss: 0.3374258875846863, mean loss: 0.3682446348488482
Epoch: 11, step: 328, loss: 0.3470248579978943, mean loss: 0.36824332603636123
Epoch: 11, step: 329, loss: 0.35694655776023865, mean loss: 0.3682426293070979
Epoch: 11, step: 330, loss: 0.4007178544998169, mean loss: 0.36824463209619396
Epoch: 11, step: 331, loss: 0.32995349168777466, mean loss: 0.3682422707777179
Epoch: 11, step: 332, loss: 0.3149684965610504, mean loss: 0.36823898572041897
Epoch: 11, step: 333, loss: 0.34303873777389526, mean loss: 0.3682374318760518
Epoch: 11, step: 334, loss: 0.30608779191970825, mean loss: 0.3682335999727312
Epoch: 11, step: 335, loss: 0.3220536708831787, mean loss: 0.3682307528747602
Epoch: 11, step: 336, loss: 0.3200240135192871, mean loss: 0.3682277810025356
Epoch: 11, step: 337, loss: 0.3271813988685608, mean loss: 0.3682252507114412
Epoch: 11, step: 338, loss: 0.3674510717391968, mean loss: 0.3682252029903679
Epoch: 11, step: 339, loss: 0.3003440797328949, mean loss: 0.3682210189960842
Epoch: 11, step: 340, loss: 0.36980828642845154, mean loss: 0.36822111682458547
Epoch: 11, step: 341, loss: 0.33098700642585754, mean loss: 0.3682188221055913
Epoch: 11, step: 342, loss: 0.4258608818054199, mean loss: 0.3682223743370389
Epoch: 11, step: 343, loss: 0.34037521481513977, mean loss: 0.3682206583424911
Epoch: 11, step: 344, loss: 0.29850274324417114, mean loss: 0.36821636245764927
Epoch: 11, step: 345, loss: 0.3064298927783966, mean loss: 0.3682125555279093
Epoch: 11, step: 346, loss: 0.3129225969314575, mean loss: 0.3682091490860021
Epoch: 11, step: 347, loss: 0.3182045519351959, mean loss: 0.36820606846764636
Epoch: 11, step: 348, loss: 0.3694905638694763, mean loss: 0.368206147596298
Epoch: 11, step: 349, loss: 0.3233805298805237, mean loss: 0.36820338637800826
Epoch: 11, step: 350, loss: 0.3181447982788086, mean loss: 0.3682003030033178
Epoch: 11, step: 351, loss: 0.37340036034584045, mean loss: 0.36820062328277964
Epoch: 11, step: 352, loss: 0.33808818459510803, mean loss: 0.36819876872598417
Epoch: 11, step: 353, loss: 0.3360806703567505, mean loss: 0.3681967907669763
Epoch: 11, step: 354, loss: 0.3321288824081421, mean loss: 0.36819456969989345
Epoch: 11, step: 355, loss: 0.3681791424751282, mean loss: 0.36819456874994116
Epoch: 11, step: 356, loss: 0.3411526083946228, mean loss: 0.3681929037071264
Epoch: 11, step: 357, loss: 0.3236953318119049, mean loss: 0.3681901640462536
Epoch: 11, step: 358, loss: 0.3319738209247589, mean loss: 0.36818793438774705
Epoch: 11, step: 359, loss: 0.31129372119903564, mean loss: 0.3681844319121752
Epoch: 11, step: 360, loss: 0.35943713784217834, mean loss: 0.3681838934514753
Epoch: 11, step: 361, loss: 0.2975594699382782, mean loss: 0.36817954626302807
Epoch: 11, step: 362, loss: 0.3323712646961212, mean loss: 0.368177342269579
Epoch: 11, step: 363, loss: 0.33844250440597534, mean loss: 0.3681755122081644
Epoch: 11, step: 364, loss: 0.35035452246665955, mean loss: 0.3681744154643807
Epoch: 11, step: 365, loss: 0.3037768602371216, mean loss: 0.36817045253790515
Epoch: 11, step: 366, loss: 0.29662737250328064, mean loss: 0.3681660501577418
Epoch: 11, step: 367, loss: 0.3702973425388336, mean loss: 0.3681661812980557
Epoch: 11, step: 368, loss: 0.32334545254707336, mean loss: 0.3681634236084752
Epoch: 11, step: 369, loss: 0.3444936275482178, mean loss: 0.3681619673641009
Epoch: 11, step: 370, loss: 0.36297330260276794, mean loss: 0.36816164815987074
Epoch: 11, step: 371, loss: 0.3761439919471741, mean loss: 0.36816213919971985
Epoch: 11, step: 372, loss: 0.3023656904697418, mean loss: 0.3681580919309292
Epoch: 11, step: 373, loss: 0.31947416067123413, mean loss: 0.36815509747089353
Epoch: 11, step: 374, loss: 0.40553322434425354, mean loss: 0.36815739639006895
Epoch: 11, step: 375, loss: 0.3722814619541168, mean loss: 0.36815765002263745
Epoch: 11, step: 376, loss: 0.3515692949295044, mean loss: 0.36815662989133596
Epoch: 11, step: 377, loss: 0.3466799259185791, mean loss: 0.3681553092232771
Epoch: 11, step: 378, loss: 0.3244580328464508, mean loss: 0.36815262230964635
Epoch: 11, step: 379, loss: 0.3148719370365143, mean loss: 0.36814934632063545
Epoch: 11, step: 380, loss: 0.35003143548965454, mean loss: 0.3681482324005106
Epoch: 11, step: 381, loss: 0.3927050530910492, mean loss: 0.3681497421029999
Epoch: 11, step: 382, loss: 0.3276527523994446, mean loss: 0.36814725258497544
Epoch: 11, step: 383, loss: 0.34283071756362915, mean loss: 0.36814569636816813
Epoch: 11, step: 384, loss: 0.38886725902557373, mean loss: 0.3681469700520244
Epoch: 11, step: 385, loss: 0.3165183663368225, mean loss: 0.3681437968127057
Epoch: 11, step: 386, loss: 0.3592265546321869, mean loss: 0.3681432487675837
Epoch: 11, step: 387, loss: 0.32452431321144104, mean loss: 0.3681405681545333
Epoch: 11, step: 388, loss: 0.3512999415397644, mean loss: 0.3681395332730354
Epoch: 11, step: 389, loss: 0.30729544162750244, mean loss: 0.3681357945430584
Epoch: 11, step: 390, loss: 0.3349364995956421, mean loss: 0.36813375464782355
Epoch: 11, step: 391, loss: 0.35554051399230957, mean loss: 0.3681329809171369
Epoch: 11, step: 392, loss: 0.3509276211261749, mean loss: 0.3681319238820696
Epoch: 11, step: 393, loss: 0.32357415556907654, mean loss: 0.3681291865821364
Epoch: 11, step: 394, loss: 0.3522121012210846, mean loss: 0.36812820881413094
Epoch: 11, step: 395, loss: 0.356891006231308, mean loss: 0.368127518568272
Epoch: 11, step: 396, loss: 0.3458443582057953, mean loss: 0.3681261499078481
Epoch: 11, step: 397, loss: 0.3410820960998535, mean loss: 0.36812448892923316
Epoch: 11, step: 398, loss: 0.3642295002937317, mean loss: 0.3681242497233967
Epoch: 11, step: 399, loss: 0.3120485544204712, mean loss: 0.3681208061164633
Epoch: 11, step: 400, loss: 0.3388673663139343, mean loss: 0.36811900977382883
Epoch: 11, step: 401, loss: 0.3315274119377136, mean loss: 0.3681167629607479
Epoch: 11, step: 402, loss: 0.3412896692752838, mean loss: 0.36811511581310347
Epoch: 11, step: 403, loss: 0.37824469804763794, mean loss: 0.3681157377177102
Epoch: 11, step: 404, loss: 0.3383961319923401, mean loss: 0.3681139131977443
Epoch: 11, step: 405, loss: 0.3523564040660858, mean loss: 0.36811294588594984
Epoch: 11, step: 406, loss: 0.3537904918193817, mean loss: 0.3681120667223585
Epoch: 11, step: 407, loss: 0.39227616786956787, mean loss: 0.3681135499104967
Epoch: 11, step: 408, loss: 0.3262748122215271, mean loss: 0.36811098201399584
Epoch: 11, step: 409, loss: 0.3327265977859497, mean loss: 0.36810881039350807
Epoch: 11, step: 410, loss: 0.3281813859939575, mean loss: 0.3681063601066471
Epoch: 11, step: 411, loss: 0.31142887473106384, mean loss: 0.36810288210680814
Epoch: 11, step: 412, loss: 0.32928410172462463, mean loss: 0.368100500148142
Epoch: 11, step: 413, loss: 0.3468887209892273, mean loss: 0.36809919865230456
Epoch: 11, step: 414, loss: 0.31062522530555725, mean loss: 0.36809567242533686
Epoch: 11, step: 415, loss: 0.3183371424674988, mean loss: 0.3680926197547873
Epoch: 11, step: 416, loss: 0.3640229105949402, mean loss: 0.3680923700946953
Epoch: 11, step: 417, loss: 0.3104250133037567, mean loss: 0.3680888326540874
Epoch: 11, step: 418, loss: 0.3559398353099823, mean loss: 0.3680880874539804
Epoch: 11, step: 419, loss: 0.4171386957168579, mean loss: 0.3680910959554686
Epoch: 11, step: 420, loss: 0.3426536023616791, mean loss: 0.368089535851599
Epoch: 11, step: 421, loss: 0.33848825097084045, mean loss: 0.3680877204900829
Epoch: 11, step: 422, loss: 0.35855966806411743, mean loss: 0.36808713619791233
Epoch: 11, step: 423, loss: 0.3023432791233063, mean loss: 0.3680831048110424
Epoch: 11, step: 424, loss: 0.36191797256469727, mean loss: 0.36808272679079307
Epoch: 11, step: 425, loss: 0.31269070506095886, mean loss: 0.3680793305908096
Epoch: 11, step: 426, loss: 0.392032265663147, mean loss: 0.3680807991050069
Epoch: 11, step: 427, loss: 0.30921101570129395, mean loss: 0.3680771901187757
Epoch: 11, step: 428, loss: 0.3182034194469452, mean loss: 0.36807413281658286
Epoch: 11, step: 429, loss: 0.3309907913208008, mean loss: 0.36807185971731254
Epoch: 11, step: 430, loss: 0.33257290720939636, mean loss: 0.3680696838697791
Epoch: 11, step: 431, loss: 0.3808481991291046, mean loss: 0.3680704670589958
Epoch: 11, step: 432, loss: 0.30925896763801575, mean loss: 0.36806686275064127
Epoch: 11, step: 433, loss: 0.357117235660553, mean loss: 0.3680661917353765
Epoch: 11, step: 434, loss: 0.3620850145816803, mean loss: 0.36806582521922027
Epoch: 11, step: 435, loss: 0.3513352572917938, mean loss: 0.36806480006187176
Epoch: 11, step: 436, loss: 0.34589865803718567, mean loss: 0.3680634419256041
Epoch: 11, step: 437, loss: 0.3678430914878845, mean loss: 0.36806342842539347
Epoch: 11, step: 438, loss: 0.34176820516586304, mean loss: 0.36806181749460504
Epoch: 11, step: 439, loss: 0.35236266255378723, mean loss: 0.36806085577229797
Epoch: 11, step: 440, loss: 0.3409408628940582, mean loss: 0.3680591945169915
Epoch: 11, step: 441, loss: 0.2931065261363983, mean loss: 0.36805460351684566
Epoch: 11, step: 442, loss: 0.36269181966781616, mean loss: 0.36805427505577815
Epoch: 11, step: 443, loss: 0.3579198718070984, mean loss: 0.36805365437944004
Epoch: 11, step: 444, loss: 0.3791385889053345, mean loss: 0.36805433322900377
Epoch: 11, step: 445, loss: 0.34263190627098083, mean loss: 0.36805277643617107
Epoch: 11, step: 446, loss: 0.34857186675071716, mean loss: 0.3680515835570035
Epoch: 11, step: 447, loss: 0.3548286259174347, mean loss: 0.3680507739220758
Epoch: 11, step: 448, loss: 0.35880398750305176, mean loss: 0.36805020778074116
Epoch: 11, step: 449, loss: 0.3510344624519348, mean loss: 0.3680491660429348
Epoch: 11, step: 450, loss: 0.3604162335395813, mean loss: 0.3680486987682177
Epoch: 11, step: 451, loss: 0.31570616364479065, mean loss: 0.3680454946463321
Epoch: 11, step: 452, loss: 0.33637070655822754, mean loss: 0.3680435558088413
Epoch: 11, step: 453, loss: 0.3417237401008606, mean loss: 0.3680419448518265
Epoch: 11, step: 454, loss: 0.37451115250587463, mean loss: 0.36804234078839876
Epoch: 11, step: 455, loss: 0.3647868037223816, mean loss: 0.3680421415511242
Epoch: 11, step: 456, loss: 0.35048598051071167, mean loss: 0.3680410671884144
Epoch: 11, step: 457, loss: 0.3556062579154968, mean loss: 0.3680403062773097
Epoch: 11, step: 458, loss: 0.31992197036743164, mean loss: 0.3680373619992757
Epoch: 11, step: 459, loss: 0.3179382383823395, mean loss: 0.36803429670781607
Epoch: 11, step: 460, loss: 0.3407963514328003, mean loss: 0.3680326302688271
Epoch: 11, step: 461, loss: 0.30151084065437317, mean loss: 0.3680285606622191
Epoch: 11, step: 462, loss: 0.3392053246498108, mean loss: 0.3680267974496411
Epoch: 11, step: 463, loss: 0.36152732372283936, mean loss: 0.36802639987967983
Epoch: 11, step: 464, loss: 0.3621019721031189, mean loss: 0.36802603750719365
Epoch: 11, step: 465, loss: 0.32297611236572266, mean loss: 0.36802328216009017
Epoch: 11, step: 466, loss: 0.31836992502212524, mean loss: 0.36802024544324485
Epoch: 11, step: 467, loss: 0.35024794936180115, mean loss: 0.3680191585856078
Epoch: 11, step: 468, loss: 0.33509281277656555, mean loss: 0.36801714511127226
Epoch: 11, step: 469, loss: 0.29335442185401917, mean loss: 0.3680125797007759
Epoch: 11, step: 470, loss: 0.3462733030319214, mean loss: 0.3680112504878949
Epoch: 11, step: 471, loss: 0.36079928278923035, mean loss: 0.3680108095507649
Epoch: 11, step: 472, loss: 0.3127054274082184, mean loss: 0.36800742840616973
Epoch: 11, step: 473, loss: 0.34129709005355835, mean loss: 0.368005795545285
Epoch: 11, step: 474, loss: 0.32909995317459106, mean loss: 0.36800341729219066
Epoch: 11, step: 475, loss: 0.2879503667354584, mean loss: 0.36799852407394146
Epoch: 11, step: 476, loss: 0.3864991366863251, mean loss: 0.3679996548491149
Epoch: 11, step: 477, loss: 0.3572908937931061, mean loss: 0.36799900035937916
Epoch: 11, step: 478, loss: 0.34018853306770325, mean loss: 0.3679973007647271
Epoch: 11, step: 479, loss: 0.2928384840488434, mean loss: 0.36799270782799304
Epoch: 11, step: 480, loss: 0.31754958629608154, mean loss: 0.3679896254496532
Epoch: 11, step: 481, loss: 0.31555745005607605, mean loss: 0.3679864217239173
Epoch: 11, step: 482, loss: 0.35363203287124634, mean loss: 0.3679855446915441
Epoch: 11, step: 483, loss: 0.3232713043689728, mean loss: 0.36798281288311774
Epoch: 11, step: 484, loss: 0.3288516700267792, mean loss: 0.3679804223190725
Epoch: 11, step: 485, loss: 0.32486072182655334, mean loss: 0.3679777882506246
Epoch: 11, step: 486, loss: 0.36131083965301514, mean loss: 0.3679773810092467
Epoch: 11, step: 487, loss: 0.3567989468574524, mean loss: 0.3679766982316904
Epoch: 11, step: 488, loss: 0.3073401153087616, mean loss: 0.36797299478193024
Epoch: 11, step: 489, loss: 0.309928297996521, mean loss: 0.3679694498511384
Epoch: 11, step: 490, loss: 0.31977811455726624, mean loss: 0.36796650686883037
Epoch: 11, step: 491, loss: 0.3307051658630371, mean loss: 0.367964231506043
Epoch: 11, step: 492, loss: 0.33329451084136963, mean loss: 0.36796211452975525
Epoch: 11, step: 493, loss: 0.32343730330467224, mean loss: 0.36795939595537347
Epoch: 11, step: 494, loss: 0.3407881259918213, mean loss: 0.3679577370464069
Epoch: 11, step: 495, loss: 0.35571298003196716, mean loss: 0.3679569895032436
Epoch: 11, step: 496, loss: 0.31672364473342896, mean loss: 0.3679538618953583
Epoch: 11, step: 497, loss: 0.33843284845352173, mean loss: 0.36795205985571466
Epoch: 11, step: 498, loss: 0.37376734614372253, mean loss: 0.36795241481428687
Epoch: 11, step: 499, loss: 0.38202738761901855, mean loss: 0.3679532738824512
Epoch: 11, step: 500, loss: 0.3868670165538788, mean loss: 0.36795442821523555
Epoch: 11, step: 501, loss: 0.35554924607276917, mean loss: 0.3679536711554197
Epoch: 11, step: 502, loss: 0.3149539530277252, mean loss: 0.36795043690155216
Epoch: 11, step: 503, loss: 0.41965457797050476, mean loss: 0.36795359190161736
Epoch: 11, step: 504, loss: 0.32239866256713867, mean loss: 0.3679508122976553
Epoch: 11, step: 505, loss: 0.32634490728378296, mean loss: 0.36794827380436584
Epoch: 11, step: 506, loss: 0.3487822413444519, mean loss: 0.3679471045021598
Epoch: 11, step: 507, loss: 0.33885034918785095, mean loss: 0.3679453294438805
Epoch: 11, step: 508, loss: 0.2934235632419586, mean loss: 0.3679407834934015
Epoch: 11, step: 509, loss: 0.3402520418167114, mean loss: 0.3679390945375837
Epoch: 11, step: 510, loss: 0.3421429693698883, mean loss: 0.3679375211234228
Epoch: 11, step: 511, loss: 0.3338460922241211, mean loss: 0.3679354418706234
Epoch: 11, step: 512, loss: 0.3580089211463928, mean loss: 0.36793483648422803
Epoch: 11, step: 513, loss: 0.3488524556159973, mean loss: 0.36793367278250416
Epoch: 11, step: 514, loss: 0.29299333691596985, mean loss: 0.36792910297118236
Epoch: 11, step: 515, loss: 0.341528058052063, mean loss: 0.36792749315137024
Epoch: 11, step: 516, loss: 0.3205384910106659, mean loss: 0.36792460375425173
Epoch: 11, step: 517, loss: 0.3135812282562256, mean loss: 0.36792129053784534
Epoch: 11, step: 518, loss: 0.34921795129776, mean loss: 0.367920150298911
Epoch: 11, step: 519, loss: 0.36442887783050537, mean loss: 0.36791993746835333
Epoch: 11, step: 520, loss: 0.3287748694419861, mean loss: 0.3679175513014514
Epoch: 11, step: 521, loss: 0.3766976296901703, mean loss: 0.36791808647628915
Epoch: 11, step: 522, loss: 0.338540643453598, mean loss: 0.36791629593304404
Epoch: 11, step: 523, loss: 0.3095836341381073, mean loss: 0.3679127407976348
Epoch: 11, step: 524, loss: 0.30379199981689453, mean loss: 0.3679088331408013
Epoch: 11, step: 525, loss: 0.35298630595207214, mean loss: 0.3679079237850921
Epoch: 11, step: 526, loss: 0.3542861044406891, mean loss: 0.36790709374308705
Epoch: 11, step: 527, loss: 0.32542872428894043, mean loss: 0.3679045054924501
Epoch: 11, step: 528, loss: 0.3979337513446808, mean loss: 0.3679063350937327
Epoch: 11, step: 529, loss: 0.34152162075042725, mean loss: 0.36790472764190235
Epoch: 11, step: 530, loss: 0.3526443839073181, mean loss: 0.3679037979834354
Epoch: 11, step: 531, loss: 0.3750489056110382, mean loss: 0.36790423323609306
Epoch: 11, step: 532, loss: 0.3255027234554291, mean loss: 0.3679016504554522
Epoch: 11, step: 533, loss: 0.34535107016563416, mean loss: 0.36790027692759925
Epoch: 11, step: 534, loss: 0.3186052441596985, mean loss: 0.36789727461121163
Epoch: 11, step: 535, loss: 0.42766183614730835, mean loss: 0.36790091435308353
Epoch: 11, step: 536, loss: 0.32634544372558594, mean loss: 0.3678983837233638
Epoch: 11, step: 537, loss: 0.3677532374858856, mean loss: 0.36789837488484
Epoch: 11, step: 538, loss: 0.33355972170829773, mean loss: 0.36789628399686725
Epoch: 11, step: 539, loss: 0.3644280433654785, mean loss: 0.36789607282780784
Epoch: 11, step: 540, loss: 0.3248762786388397, mean loss: 0.367893453662256
Epoch: 11, step: 541, loss: 0.3560454547405243, mean loss: 0.3678927323668145
Epoch: 11, step: 542, loss: 0.3146115243434906, mean loss: 0.3678894888525987
Epoch: 11, step: 543, loss: 0.30470535159111023, mean loss: 0.36788564272785673
Epoch: 11, step: 544, loss: 0.37413114309310913, mean loss: 0.36788602287883154
Epoch: 11, step: 545, loss: 0.3120538890361786, mean loss: 0.3678826246966135
Epoch: 11, step: 546, loss: 0.33039939403533936, mean loss: 0.36788034344588855
Epoch: 11, step: 547, loss: 0.30317938327789307, mean loss: 0.3678764059483126
Epoch: 11, step: 548, loss: 0.3835500478744507, mean loss: 0.36787735973897323
Epoch: 11, step: 549, loss: 0.32155635952949524, mean loss: 0.3678745411311961
Epoch: 11, step: 550, loss: 0.3851604461669922, mean loss: 0.3678755929051563
Epoch: 11, step: 551, loss: 0.30908986926078796, mean loss: 0.36787201626098226
Epoch: 11, step: 552, loss: 0.32132643461227417, mean loss: 0.3678691845044787
Epoch: 11, step: 553, loss: 0.3854036331176758, mean loss: 0.36787025120654787
Epoch: 11, step: 554, loss: 0.31053757667541504, mean loss: 0.36786676360544496
Epoch: 11, step: 555, loss: 0.3215939998626709, mean loss: 0.36786394896044844
Epoch: 11, step: 556, loss: 0.3241961896419525, mean loss: 0.36786129293226777
Epoch: 11, step: 557, loss: 0.3293011486530304, mean loss: 0.36785894771001504
Epoch: 11, step: 558, loss: 0.34536445140838623, mean loss: 0.36785757968129146
Epoch: 11, step: 559, loss: 0.30326423048973083, mean loss: 0.3678536516011898
Epoch: 11, step: 560, loss: 0.35567355155944824, mean loss: 0.3678529109444527
Epoch: 11, step: 561, loss: 0.3256257176399231, mean loss: 0.36785034331747324
Epoch: 11, step: 562, loss: 0.37288737297058105, mean loss: 0.3678506495757363
Epoch: 11, step: 563, loss: 0.359073668718338, mean loss: 0.3678501159557912
Epoch: 11, step: 564, loss: 0.34207883477211, mean loss: 0.3678485492173157
Epoch: 11, step: 565, loss: 0.3477177917957306, mean loss: 0.36784732546306514
Epoch: 11, step: 566, loss: 0.3534161448478699, mean loss: 0.3678464482409744
Epoch: 11, step: 567, loss: 0.3267819583415985, mean loss: 0.3678439522228672
Epoch: 11, step: 568, loss: 0.326008141040802, mean loss: 0.36784140947618377
Epoch: 11, step: 569, loss: 0.3386293947696686, mean loss: 0.36783963410152065
Epoch: 11, step: 570, loss: 0.32984447479248047, mean loss: 0.36783732506722655
Epoch: 11, step: 571, loss: 0.31534504890441895, mean loss: 0.3678341352108725
Epoch: 11, step: 572, loss: 0.2932513654232025, mean loss: 0.367829603232396
Epoch: 11, step: 573, loss: 0.31929656863212585, mean loss: 0.3678266543300628
Epoch: 11, step: 574, loss: 0.3726532459259033, mean loss: 0.36782694757944584
Epoch: 11, step: 575, loss: 0.3422934412956238, mean loss: 0.3678253963336206
Epoch: 11, step: 576, loss: 0.3449194133281708, mean loss: 0.3678240048031543
Epoch: 11, step: 577, loss: 0.3201746344566345, mean loss: 0.3678211102963905
Epoch: 11, step: 578, loss: 0.3375011384487152, mean loss: 0.36781926859245756
Epoch: 11, step: 579, loss: 0.35520339012145996, mean loss: 0.36781850232189933
Epoch: 11, step: 580, loss: 0.3336576819419861, mean loss: 0.36781642756815625
Epoch: 11, step: 581, loss: 0.34130170941352844, mean loss: 0.36781481729740717
Epoch: 11, step: 582, loss: 0.35686275362968445, mean loss: 0.3678141522057895
Epoch: 11, step: 583, loss: 0.34992459416389465, mean loss: 0.36781306588334345
Epoch: 11, step: 584, loss: 0.3459704518318176, mean loss: 0.36781173959674124
Epoch: 11, step: 585, loss: 0.3566552698612213, mean loss: 0.36781106221545795
Epoch: 11, step: 586, loss: 0.35294845700263977, mean loss: 0.3678101598655574
Epoch: 11, step: 587, loss: 0.2963699996471405, mean loss: 0.367805822799007
Epoch: 11, step: 588, loss: 0.32534947991371155, mean loss: 0.36780324546986926
Epoch: 11, step: 589, loss: 0.3699256479740143, mean loss: 0.3678033743033344
Epoch: 11, step: 590, loss: 0.3607413172721863, mean loss: 0.3678029456504038
Epoch: 11, step: 591, loss: 0.31888386607170105, mean loss: 0.36779997653899454
Epoch: 11, step: 592, loss: 0.366213858127594, mean loss: 0.3677998802764218
Epoch: 11, step: 593, loss: 0.3366411626338959, mean loss: 0.36779798934805413
Epoch: 11, step: 594, loss: 0.3638940155506134, mean loss: 0.36779775244206486
Epoch: 11, step: 595, loss: 0.3638722002506256, mean loss: 0.36779751424108237
Epoch: 11, step: 596, loss: 0.3433937132358551, mean loss: 0.3677960335177643
Epoch: 11, step: 597, loss: 0.38331183791160583, mean loss: 0.36779697489650437
Epoch: 11, step: 598, loss: 0.3354121148586273, mean loss: 0.36779501015343347
Epoch: 11, step: 599, loss: 0.37368088960647583, mean loss: 0.36779536721964634
Epoch: 11, step: 600, loss: 0.3551912009716034, mean loss: 0.3677946026357065
Epoch: 11, step: 601, loss: 0.3686142861843109, mean loss: 0.367794652355684
Epoch: 11, step: 602, loss: 0.3129594027996063, mean loss: 0.3677913263867657
Epoch: 11, step: 603, loss: 0.3514648675918579, mean loss: 0.3677903361842672
Epoch: 11, step: 604, loss: 0.3150874376296997, mean loss: 0.3677871399383727
Epoch: 11, step: 605, loss: 0.3047621548175812, mean loss: 0.3677833179259336
Epoch: 11, step: 606, loss: 0.3443944752216339, mean loss: 0.3677818996467083
Epoch: 11, step: 607, loss: 0.3097603917121887, mean loss: 0.3677783814859071
Epoch: 11, step: 608, loss: 0.3460013270378113, mean loss: 0.36777706110426345
Epoch: 11, step: 609, loss: 0.3381476104259491, mean loss: 0.3677752647267517
Epoch: 11, step: 610, loss: 0.3288600444793701, mean loss: 0.36777290551364183
Epoch: 11, step: 611, loss: 0.3251304626464844, mean loss: 0.3677703204964942
Epoch: 11, step: 612, loss: 0.3455665409564972, mean loss: 0.3677689745681715
Epoch: 11, step: 613, loss: 0.31859737634658813, mean loss: 0.3677659941100419
Epoch: 11, step: 614, loss: 0.33078983426094055, mean loss: 0.36776375299483194
Epoch: 11, step: 615, loss: 0.3410624563694, mean loss: 0.3677621347344304
Epoch: 11, step: 616, loss: 0.3285757899284363, mean loss: 0.3677597599483686
Epoch: 11, step: 617, loss: 0.3583267331123352, mean loss: 0.3677591883190609
Epoch: 11, step: 618, loss: 0.328830361366272, mean loss: 0.36775682942510507
Epoch: 11, step: 619, loss: 0.349669873714447, mean loss: 0.3677557335116471
Epoch: 11, step: 620, loss: 0.33943605422973633, mean loss: 0.3677540176873949
Epoch: 11, step: 621, loss: 0.3736756145954132, mean loss: 0.3677543764415999
Epoch: 11, step: 622, loss: 0.38237595558166504, mean loss: 0.36775526222212573
Epoch: 11, step: 623, loss: 0.3371927738189697, mean loss: 0.3677534108477374
Epoch: 11, step: 624, loss: 0.3425862193107605, mean loss: 0.3677518863949215
Epoch: 11, step: 625, loss: 0.34988072514533997, mean loss: 0.36775080395026677
Epoch: 11, step: 626, loss: 0.36948519945144653, mean loss: 0.36775090899511576
Epoch: 11, step: 627, loss: 0.350884348154068, mean loss: 0.3677498875221966
Epoch: 11, step: 628, loss: 0.34095776081085205, mean loss: 0.3677482650352644
Epoch: 11, step: 629, loss: 0.33328181505203247, mean loss: 0.3677461779303847
Epoch: 11, step: 630, loss: 0.3394972085952759, mean loss: 0.3677444674266405
Epoch: 11, step: 631, loss: 0.39181995391845703, mean loss: 0.3677459251335
Epoch: 11, step: 632, loss: 0.36196795105934143, mean loss: 0.3677455753136735
Epoch: 11, step: 633, loss: 0.3318890929222107, mean loss: 0.36774340456162175
Epoch: 11, step: 634, loss: 0.324720174074173, mean loss: 0.36774080009219334
Epoch: 11, step: 635, loss: 0.3365963101387024, mean loss: 0.3677389148325109
Epoch: 11, step: 636, loss: 0.3428210914134979, mean loss: 0.36773740658098747
Epoch: 11, step: 637, loss: 0.34902065992355347, mean loss: 0.36773627374315565
Epoch: 11, step: 638, loss: 0.32970812916755676, mean loss: 0.36773397221531107
Epoch: 11, step: 639, loss: 0.33394530415534973, mean loss: 0.36773192739153593
Epoch: 11, step: 640, loss: 0.33568841218948364, mean loss: 0.3677299882983316
Epoch: 11, step: 641, loss: 0.35446834564208984, mean loss: 0.36772918582691344
Epoch: 11, step: 642, loss: 0.3544270396232605, mean loss: 0.36772838095330035
Epoch: 11, step: 643, loss: 0.38722512125968933, mean loss: 0.36772956057214756
Epoch: 11, step: 644, loss: 0.35884711146354675, mean loss: 0.3677290231863947
Epoch: 11, step: 645, loss: 0.33030346035957336, mean loss: 0.36772675908701014
Epoch: 11, step: 646, loss: 0.3373253047466278, mean loss: 0.3677249200298242
Epoch: 11, step: 647, loss: 0.3654490113258362, mean loss: 0.36772478236295364
Epoch: 11, step: 648, loss: 0.28194186091423035, mean loss: 0.36771959377519287
Epoch: 11, step: 649, loss: 0.3154928684234619, mean loss: 0.36771643502804446
Epoch: 11, step: 650, loss: 0.3641078472137451, mean loss: 0.36771621678868466
Epoch: 11, step: 651, loss: 0.337630033493042, mean loss: 0.3677143973533136
Epoch: 11, step: 652, loss: 0.3038298487663269, mean loss: 0.3677105342252622
Epoch: 11, step: 653, loss: 0.33728301525115967, mean loss: 0.3677086943704445
Epoch: 11, step: 654, loss: 0.34951460361480713, mean loss: 0.3677075942984477
Epoch: 11, step: 655, loss: 0.34445899724960327, mean loss: 0.36770618870007715
Epoch: 11, step: 656, loss: 0.32781165838241577, mean loss: 0.36770377684285466
Epoch: 11, step: 657, loss: 0.2865290641784668, mean loss: 0.3676988696543246
Epoch: 11, step: 658, loss: 0.40446117520332336, mean loss: 0.3677010918815838
Epoch: 11, step: 659, loss: 0.32797861099243164, mean loss: 0.3676986908612206
Epoch: 11, step: 660, loss: 0.34220120310783386, mean loss: 0.3676971497619306
Epoch: 11, step: 661, loss: 0.3113837242126465, mean loss: 0.36769374631544505
Epoch: 11, step: 662, loss: 0.33842939138412476, mean loss: 0.3676919777558916
Epoch: 11, step: 663, loss: 0.3217914402484894, mean loss: 0.3676892039743163
Epoch: 11, step: 664, loss: 0.36539626121520996, mean loss: 0.36768906541955415
Epoch: 11, step: 665, loss: 0.34615910053253174, mean loss: 0.36768776451533136
Epoch: 11, step: 666, loss: 0.33483293652534485, mean loss: 0.36768577944929365
Epoch: 11, step: 667, loss: 0.36683887243270874, mean loss: 0.3676857282828475
Epoch: 11, step: 668, loss: 0.3493759334087372, mean loss: 0.3676846221513382
Epoch: 11, step: 669, loss: 0.39821749925613403, mean loss: 0.36768646659238596
Epoch: 11, step: 670, loss: 0.33900153636932373, mean loss: 0.3676847338874495
Epoch: 11, step: 671, loss: 0.3519458770751953, mean loss: 0.3676837832437667
Epoch: 11, step: 672, loss: 0.3121581971645355, mean loss: 0.3676804296419017
Epoch: 11, step: 673, loss: 0.33307668566703796, mean loss: 0.36767833979143816
Epoch: 11, step: 674, loss: 0.3466202914714813, mean loss: 0.3676770680933694
Epoch: 11, step: 675, loss: 0.3474418520927429, mean loss: 0.36767584616003607
Epoch: 11, step: 676, loss: 0.36197394132614136, mean loss: 0.3676755018629022
Epoch: 11, step: 677, loss: 0.30495476722717285, mean loss: 0.36767171483629696
Epoch: 11, step: 678, loss: 0.35875949263572693, mean loss: 0.3676711767561061
Epoch: 11, step: 679, loss: 0.3279321491718292, mean loss: 0.3676687776358704
Epoch: 11, step: 680, loss: 0.3232778012752533, mean loss: 0.3676660978304759
Epoch: 11, step: 681, loss: 0.3366944193840027, mean loss: 0.36766422823742706
Epoch: 11, step: 682, loss: 0.34322527050971985, mean loss: 0.3676627530785131
Epoch: 11, step: 683, loss: 0.3861779570579529, mean loss: 0.3676638706065177
Epoch: 11, step: 684, loss: 0.37663719058036804, mean loss: 0.3676644121793328
Epoch: 11, step: 685, loss: 0.33063215017318726, mean loss: 0.3676621772812033
Epoch: 11, step: 686, loss: 0.33052632212638855, mean loss: 0.3676599362664695
Epoch: 11, step: 687, loss: 0.33505427837371826, mean loss: 0.36765796875151097
Epoch: 11, step: 688, loss: 0.3260682225227356, mean loss: 0.36765545926341414
Epoch: 11, step: 689, loss: 0.35205066204071045, mean loss: 0.36765451774071456
Epoch: 11, step: 690, loss: 0.30226796865463257, mean loss: 0.36765057285087527
Epoch: 11, step: 691, loss: 0.36193040013313293, mean loss: 0.3676502277632354
Epoch: 11, step: 692, loss: 0.35084736347198486, mean loss: 0.36764921413807455
Epoch: 11, step: 693, loss: 0.3461371064186096, mean loss: 0.36764791650822054
Epoch: 11, step: 694, loss: 0.3319028913974762, mean loss: 0.36764576046593145
Epoch: 11, step: 695, loss: 0.3541508913040161, mean loss: 0.36764494654137403
Epoch: 11, step: 696, loss: 0.348663866519928, mean loss: 0.36764380179256384
Epoch: 11, step: 697, loss: 0.3119206726551056, mean loss: 0.3676404413336845
Epoch: 11, step: 698, loss: 0.3648083209991455, mean loss: 0.36764027054912596
Epoch: 11, step: 699, loss: 0.3265162706375122, mean loss: 0.36763779080962333
Epoch: 11, step: 700, loss: 0.3367646634578705, mean loss: 0.36763592930058797
Epoch: 11, step: 701, loss: 0.3346957862377167, mean loss: 0.3676339432796629
Epoch: 11, step: 702, loss: 0.3145039975643158, mean loss: 0.3676307401720657
Epoch: 11, step: 703, loss: 0.29857751727104187, mean loss: 0.3676265773300775
Epoch: 11, step: 704, loss: 0.2996308207511902, mean loss: 0.3676224784840603
Epoch: 11, step: 705, loss: 0.3175256550312042, mean loss: 0.367619458784033
Epoch: 11, step: 706, loss: 0.34557682275772095, mean loss: 0.367618130194073
Epoch: 11, step: 707, loss: 0.3696403503417969, mean loss: 0.36761825207330084
Epoch: 11, step: 708, loss: 0.3785732686519623, mean loss: 0.36761891229246424
Epoch: 11, step: 709, loss: 0.31202781200408936, mean loss: 0.3676155622201316
Epoch: 11, step: 710, loss: 0.2900927662849426, mean loss: 0.36761089076511894
Epoch: 11, step: 711, loss: 0.3617812991142273, mean loss: 0.36761053950025685
Epoch: 11, step: 712, loss: 0.33277755975723267, mean loss: 0.3676084407486907
Epoch: 11, step: 713, loss: 0.3434070348739624, mean loss: 0.3676069826570005
Epoch: 11, step: 714, loss: 0.3457657992839813, mean loss: 0.3676056668437965
Epoch: 11, step: 715, loss: 0.32677939534187317, mean loss: 0.3676032074298506
Epoch: 11, step: 716, loss: 0.3605138063430786, mean loss: 0.36760278038322164
Epoch: 11, step: 717, loss: 0.32364487648010254, mean loss: 0.36760013263572716
Epoch: 11, step: 718, loss: 0.3210419714450836, mean loss: 0.36759732843400517
Epoch: 11, step: 719, loss: 0.3511432111263275, mean loss: 0.36759633746090786
Epoch: 11, step: 720, loss: 0.3613676428794861, mean loss: 0.3675959623513275
Epoch: 11, step: 721, loss: 0.3214770555496216, mean loss: 0.3675931851077528
Epoch: 11, step: 722, loss: 0.3635573089122772, mean loss: 0.3675929420851602
Epoch: 11, step: 723, loss: 0.33710020780563354, mean loss: 0.3675911060582888
Epoch: 11, step: 724, loss: 0.3384687006473541, mean loss: 0.36758935264716164
Epoch: 11, step: 725, loss: 0.3460707366466522, mean loss: 0.3675880571254277
Epoch: 11, step: 726, loss: 0.3256499767303467, mean loss: 0.3675855324080479
Epoch: 11, step: 727, loss: 0.32192087173461914, mean loss: 0.36758278351202855
Epoch: 11, step: 728, loss: 0.3774857223033905, mean loss: 0.36758337960778437
Epoch: 11, step: 729, loss: 0.35314932465553284, mean loss: 0.367582510819115
Epoch: 11, step: 730, loss: 0.36208853125572205, mean loss: 0.3675821801552833
Epoch: 11, step: 731, loss: 0.33239802718162537, mean loss: 0.36758006266894644
Epoch: 11, step: 732, loss: 0.337973952293396, mean loss: 0.3675782809929294
Epoch: 11, step: 733, loss: 0.3282424807548523, mean loss: 0.3675759139331004
Epoch: 11, step: 734, loss: 0.33451077342033386, mean loss: 0.36757392433441743
Epoch: 11, step: 735, loss: 0.31474778056144714, mean loss: 0.3675707458660797
Epoch: 11, step: 736, loss: 0.3491916358470917, mean loss: 0.36756964008965115
Epoch: 11, step: 737, loss: 0.3704415261745453, mean loss: 0.3675698128658565
Epoch: 11, step: 738, loss: 0.3576413691043854, mean loss: 0.36756921559437955
Epoch: 11, step: 739, loss: 0.36084938049316406, mean loss: 0.3675688113694577
Epoch: 11, step: 740, loss: 0.30775120854377747, mean loss: 0.3675652133181599
Epoch: 11, step: 741, loss: 0.3624173104763031, mean loss: 0.367564903688493
Epoch: 11, step: 742, loss: 0.3752295672893524, mean loss: 0.36756536466543416
Epoch: 11, step: 743, loss: 0.3500370681285858, mean loss: 0.36756431052202926
Epoch: 11, step: 744, loss: 0.3874485492706299, mean loss: 0.3675655062787644
Epoch: 11, step: 745, loss: 0.3642783463001251, mean loss: 0.36756530861430387
Epoch: 11, step: 746, loss: 0.31791532039642334, mean loss: 0.3675623232262804
Epoch: 11, step: 747, loss: 0.3431861996650696, mean loss: 0.36756085761038565
Epoch: 11, step: 748, loss: 0.3202880918979645, mean loss: 0.3675580155033868
Epoch: 11, step: 749, loss: 0.3115565776824951, mean loss: 0.367554648818415
Epoch: 11, step: 750, loss: 0.31491005420684814, mean loss: 0.36755148412982996
Epoch: 11, step: 751, loss: 0.30785998702049255, mean loss: 0.36754789603791427
Epoch: 11, step: 752, loss: 0.3364162743091583, mean loss: 0.36754602480982457
Epoch: 11, step: 753, loss: 0.35385024547576904, mean loss: 0.3675452016472249
Epoch: 11, step: 754, loss: 0.3355657160282135, mean loss: 0.36754327968763484
Epoch: 11, step: 755, loss: 0.34172287583351135, mean loss: 0.3675417279806725
Epoch: 11, step: 756, loss: 0.350264310836792, mean loss: 0.3675406897367482
Epoch: 11, step: 757, loss: 0.32378533482551575, mean loss: 0.367538060524219
Epoch: 11, step: 758, loss: 0.2978920042514801, mean loss: 0.3675338758185606
Epoch: 11, step: 759, loss: 0.32049256563186646, mean loss: 0.36753104949615095
Epoch: 11, step: 760, loss: 0.3563990294933319, mean loss: 0.36753038070552296
Epoch: 11, step: 761, loss: 0.33042025566101074, mean loss: 0.3675281513335991
Epoch: 11, step: 762, loss: 0.36854496598243713, mean loss: 0.3675282124145536
Epoch: 11, step: 763, loss: 0.34561800956726074, mean loss: 0.3675268963283662
Epoch: 11, step: 764, loss: 0.36761006712913513, mean loss: 0.3675269013239095
Epoch: 11, step: 765, loss: 0.36388280987739563, mean loss: 0.3675266824595584
Epoch: 11, step: 766, loss: 0.4002712666988373, mean loss: 0.3675286489831449
Epoch: 11, step: 767, loss: 0.35934022068977356, mean loss: 0.3675281572447175
Epoch: 11, step: 768, loss: 0.33630579710006714, mean loss: 0.367526282365708
Epoch: 11, step: 769, loss: 0.31825506687164307, mean loss: 0.3675233238443021
Epoch: 11, step: 770, loss: 0.3103651702404022, mean loss: 0.36751989195276175
Epoch: 11, step: 771, loss: 0.4003154933452606, mean loss: 0.3675218609490029
Epoch: 11, step: 772, loss: 0.3570657968521118, mean loss: 0.3675212332210749
Epoch: 11, step: 773, loss: 0.3518062233924866, mean loss: 0.36752028982992174
Epoch: 11, step: 774, loss: 0.33986860513687134, mean loss: 0.36751862996530243
Epoch: 11, step: 775, loss: 0.31113579869270325, mean loss: 0.36751524564169663
Epoch: 11, step: 776, loss: 0.3551436960697174, mean loss: 0.3675145030962569
Epoch: 11, step: 777, loss: 0.3029754161834717, mean loss: 0.3675106296664818
Epoch: 11, step: 778, loss: 0.3416534662246704, mean loss: 0.36750907789528564
Epoch: 11, step: 779, loss: 0.34401753544807434, mean loss: 0.3675076681771839
Epoch: 11, step: 780, loss: 0.32162150740623474, mean loss: 0.36750491473219316
Epoch: 11, step: 781, loss: 0.32952409982681274, mean loss: 0.3675026357921412
Epoch: 11, step: 782, loss: 0.3090847432613373, mean loss: 0.36749913078868945
Epoch: 11, step: 783, loss: 0.33712682127952576, mean loss: 0.3674973085958943
Epoch: 11, step: 784, loss: 0.3121711015701294, mean loss: 0.3674939894881478
Epoch: 11, step: 785, loss: 0.32177621126174927, mean loss: 0.3674912469699579
Epoch: 11, step: 786, loss: 0.3646860122680664, mean loss: 0.36749107869962605
Epoch: 11, step: 787, loss: 0.3387438654899597, mean loss: 0.3674893544186034
Epoch: 11, step: 788, loss: 0.32825830578804016, mean loss: 0.3674870014498137
Epoch: 11, step: 789, loss: 0.3248271048069, mean loss: 0.3674844429817411
Epoch: 11, step: 790, loss: 0.32833462953567505, mean loss: 0.36748209516684177
Epoch: 11, step: 791, loss: 0.3560372591018677, mean loss: 0.36748140886100916
Epoch: 11, step: 792, loss: 0.3400183618068695, mean loss: 0.36747976209917826
Epoch: 11, step: 793, loss: 0.300912082195282, mean loss: 0.36747577075249976
Epoch: 11, step: 794, loss: 0.3164432942867279, mean loss: 0.3674727110680783
Epoch: 11, step: 795, loss: 0.3626229166984558, mean loss: 0.36747242031302013
Epoch: 11, step: 796, loss: 0.33026015758514404, mean loss: 0.3674701894957593
Epoch: 11, step: 797, loss: 0.3698461055755615, mean loss: 0.3674703319196941
Epoch: 11, step: 798, loss: 0.3293502926826477, mean loss: 0.3674680469566037
Epoch: 11, step: 799, loss: 0.34391841292381287, mean loss: 0.3674666354465322
Epoch: 11, step: 800, loss: 0.39532437920570374, mean loss: 0.3674683050745669
Epoch: 11, step: 801, loss: 0.33557212352752686, mean loss: 0.36746639352107613
Epoch: 11, step: 802, loss: 0.37172287702560425, mean loss: 0.36746664859889144
Epoch: 11, step: 803, loss: 0.3212009072303772, mean loss: 0.36746387620307597
Epoch: 11, step: 804, loss: 0.34439054131507874, mean loss: 0.3674624936555963
Epoch: 11, step: 805, loss: 0.33823511004447937, mean loss: 0.36746074246424754
Epoch: 11, step: 806, loss: 0.3317541480064392, mean loss: 0.36745860319191764
Epoch: 11, step: 807, loss: 0.37410813570022583, mean loss: 0.36745900155835115
Epoch: 11, step: 808, loss: 0.3163265287876129, mean loss: 0.3674559384496966
Epoch: 11, step: 809, loss: 0.3661833703517914, mean loss: 0.3674558622206264
Epoch: 11, step: 810, loss: 0.37749412655830383, mean loss: 0.3674564634943214
Epoch: 11, step: 811, loss: 0.3851558268070221, mean loss: 0.3674575235903511
Epoch: 11, step: 812, loss: 0.3368842303752899, mean loss: 0.3674556925252966
Epoch: 11, step: 813, loss: 0.3258066475391388, mean loss: 0.367453198271794
Epoch: 11, step: 814, loss: 0.33284008502960205, mean loss: 0.3674511255061648
Epoch: 11, step: 815, loss: 0.32417333126068115, mean loss: 0.3674485340214795
Epoch: 11, step: 816, loss: 0.34693485498428345, mean loss: 0.3674473057310156
Epoch: 11, step: 817, loss: 0.32342174649238586, mean loss: 0.3674446697856654
Epoch: 11, step: 818, loss: 0.36930033564567566, mean loss: 0.3674447808834239
Epoch: 11, step: 819, loss: 0.32362258434295654, mean loss: 0.36744215742817127
Epoch: 11, step: 820, loss: 0.3364160656929016, mean loss: 0.36744030013444273
Epoch: 11, step: 821, loss: 0.33046311140060425, mean loss: 0.3674380867267608
Epoch: 11, step: 822, loss: 0.32883626222610474, mean loss: 0.3674357762087444
Epoch: 11, step: 823, loss: 0.3308800458908081, mean loss: 0.36743358829096145
Epoch: 11, step: 824, loss: 0.31697091460227966, mean loss: 0.3674305682015672
Epoch: 11, step: 825, loss: 0.31447169184684753, mean loss: 0.3674273989091462
Epoch: 11, step: 826, loss: 0.3220718204975128, mean loss: 0.3674246847939878
Epoch: 11, step: 827, loss: 0.3570544421672821, mean loss: 0.36742406426726293
Epoch: 11, step: 828, loss: 0.42152804136276245, mean loss: 0.36742730150636393
Epoch: 11, step: 829, loss: 0.3287694752216339, mean loss: 0.3674249886054255
Epoch: 11, step: 830, loss: 0.3259039521217346, mean loss: 0.36742250454700587
Epoch: 11, step: 831, loss: 0.3018610179424286, mean loss: 0.3674185824671659
Epoch: 11, step: 832, loss: 0.36536604166030884, mean loss: 0.36741845968551806
Epoch: 11, step: 833, loss: 0.3357360064983368, mean loss: 0.3674165645752664
Epoch: 11, step: 834, loss: 0.3220688998699188, mean loss: 0.36741385223214146
Epoch: 11, step: 835, loss: 0.3466837406158447, mean loss: 0.36741261239292994
Epoch: 11, step: 836, loss: 0.378756582736969, mean loss: 0.36741329081948004
Epoch: 11, step: 837, loss: 0.3304547667503357, mean loss: 0.36741108064581246
Epoch: 11, step: 838, loss: 0.3401857912540436, mean loss: 0.36740945263113856
Epoch: 11, step: 839, loss: 0.3311993479728699, mean loss: 0.36740728747300305
Epoch: 11, step: 840, loss: 0.35677897930145264, mean loss: 0.3674066519986729
Epoch: 11, step: 841, loss: 0.33237195014953613, mean loss: 0.3674045573734278
Epoch: 11, step: 842, loss: 0.3519017994403839, mean loss: 0.36740363056300557
Epoch: 11, step: 843, loss: 0.31757834553718567, mean loss: 0.3674006520069902
Epoch: 11, step: 844, loss: 0.34359556436538696, mean loss: 0.3673992290236892
Epoch: 11, step: 845, loss: 0.320183128118515, mean loss: 0.36739640678215274
Epoch: 11, step: 846, loss: 0.38001134991645813, mean loss: 0.36739716076835405
Epoch: 11, step: 847, loss: 0.29938533902168274, mean loss: 0.36739309599296877
Epoch: 11, step: 848, loss: 0.4035849869251251, mean loss: 0.3673952588980624
Epoch: 11, step: 849, loss: 0.33229967951774597, mean loss: 0.36739316163623736
Epoch: 11, step: 850, loss: 0.3502841293811798, mean loss: 0.3673921392859383
Epoch: 11, step: 851, loss: 0.3474544882774353, mean loss: 0.3673909479826992
Epoch: 11, step: 852, loss: 0.35944879055023193, mean loss: 0.367390473455757
Epoch: 11, step: 853, loss: 0.3461228609085083, mean loss: 0.36738920283725135
Epoch: 11, step: 854, loss: 0.31236541271209717, mean loss: 0.3673859156761231
Epoch: 11, step: 855, loss: 0.3222038745880127, mean loss: 0.3673832166294631
Epoch: 11, step: 856, loss: 0.3361562192440033, mean loss: 0.3673813513288607
Epoch: 11, step: 857, loss: 0.32787463068962097, mean loss: 0.3673789915916346
Epoch: 11, step: 858, loss: 0.28590065240859985, mean loss: 0.36737412517945145
Epoch: 11, step: 859, loss: 0.3542790114879608, mean loss: 0.3673733431014718
Epoch: 11, step: 860, loss: 0.3313556909561157, mean loss: 0.3673711921518065
Epoch: 11, step: 861, loss: 0.3886629045009613, mean loss: 0.36737246360244247
Epoch: 11, step: 862, loss: 0.3535394072532654, mean loss: 0.3673716376003914
Epoch: 11, step: 863, loss: 0.3869154155254364, mean loss: 0.3673728045324385
Epoch: 11, step: 864, loss: 0.33759117126464844, mean loss: 0.36737102641832614
Epoch: 11, step: 865, loss: 0.3396477997303009, mean loss: 0.36736937130031494
Epoch: 11, step: 866, loss: 0.34132441878318787, mean loss: 0.36736781647060224
Epoch: 11, step: 867, loss: 0.3903205692768097, mean loss: 0.3673691866206026
Epoch: 11, step: 868, loss: 0.33623841404914856, mean loss: 0.3673673283998319
Epoch: 11, step: 869, loss: 0.31870391964912415, mean loss: 0.36736442381532963
Epoch: 11, step: 870, loss: 0.33747828006744385, mean loss: 0.36736264010039393
Epoch: 11, step: 871, loss: 0.30824679136276245, mean loss: 0.36735911205976746
Epoch: 11, step: 872, loss: 0.31524816155433655, mean loss: 0.36735600225786347
Epoch: 11, step: 873, loss: 0.3267444670200348, mean loss: 0.36735357884604597
Epoch: 11, step: 874, loss: 0.3176652491092682, mean loss: 0.36735061397166585
Epoch: 11, step: 875, loss: 0.321586549282074, mean loss: 0.3673478834188801
Epoch: 11, step: 876, loss: 0.3884333074092865, mean loss: 0.3673491414240105
Epoch: 11, step: 877, loss: 0.3251170217990875, mean loss: 0.3673466219084619
Epoch: 11, step: 878, loss: 0.2944699227809906, mean loss: 0.36734227443491135
Epoch: 11, step: 879, loss: 0.3695586323738098, mean loss: 0.36734240664428497
Epoch: 11, step: 880, loss: 0.3175685405731201, mean loss: 0.36733943772892136
Epoch: 11, step: 881, loss: 0.31404924392700195, mean loss: 0.3673362592609623
Epoch: 11, step: 882, loss: 0.3469102382659912, mean loss: 0.36733504103343234
Epoch: 11, step: 883, loss: 0.378572016954422, mean loss: 0.3673357111775116
Epoch: 11, step: 884, loss: 0.36895760893821716, mean loss: 0.36733580789751646
Epoch: 11, step: 885, loss: 0.31769466400146484, mean loss: 0.36733284778160136
Epoch: 11, step: 886, loss: 0.3574570417404175, mean loss: 0.36733225891951554
Epoch: 11, step: 887, loss: 0.3795987367630005, mean loss: 0.3673329902859503
Epoch: 11, step: 888, loss: 0.32550105452537537, mean loss: 0.36733049628155273
Epoch: 11, step: 889, loss: 0.3515187203884125, mean loss: 0.36732955364557485
Epoch: 11, step: 890, loss: 0.32347026467323303, mean loss: 0.36732693908289393
Epoch: 11, step: 891, loss: 0.3967280685901642, mean loss: 0.3673286916537992
Epoch: 11, step: 892, loss: 0.3401198983192444, mean loss: 0.36732706986245783
Epoch: 11, step: 893, loss: 0.3745321035385132, mean loss: 0.3673274992958632
Epoch: 11, step: 894, loss: 0.30221956968307495, mean loss: 0.36732361897345944
Epoch: 11, step: 895, loss: 0.37799322605133057, mean loss: 0.36732425482608627
Epoch: 11, step: 896, loss: 0.33517569303512573, mean loss: 0.3673223390545714
Epoch: 11, step: 897, loss: 0.36347874999046326, mean loss: 0.3673221100241183
Epoch: 11, step: 898, loss: 0.341731995344162, mean loss: 0.3673205852600904
Epoch: 11, step: 899, loss: 0.2954898476600647, mean loss: 0.3673163055450285
Epoch: 11, step: 900, loss: 0.3286627233028412, mean loss: 0.36731400268043257
Epoch: 11, step: 901, loss: 0.39364534616470337, mean loss: 0.3673155713295142
Epoch: 11, step: 902, loss: 0.3307899236679077, mean loss: 0.3673133955001426
Epoch: 11, step: 903, loss: 0.3133816421031952, mean loss: 0.36731018298207035
Epoch: 11, step: 904, loss: 0.3340011537075043, mean loss: 0.36730819900272227
Epoch: 11, step: 905, loss: 0.33728092908859253, mean loss: 0.36730641060070235
Epoch: 11, step: 906, loss: 0.3384567201137543, mean loss: 0.36730469243677605
Epoch: 11, step: 907, loss: 0.32535549998283386, mean loss: 0.3673021942714322
Epoch: 11, step: 908, loss: 0.3284907937049866, mean loss: 0.36729988310603195
Epoch: 11, step: 909, loss: 0.3255551755428314, mean loss: 0.36729739741426326
Epoch: 11, step: 910, loss: 0.33884602785110474, mean loss: 0.36729570337618267
Epoch: 11, step: 911, loss: 0.3842746913433075, mean loss: 0.36729671427091753
Epoch: 11, step: 912, loss: 0.31039929389953613, mean loss: 0.3672933269148199
Epoch: 11, step: 913, loss: 0.3232000768184662, mean loss: 0.3672907020041105
Epoch: 11, step: 914, loss: 0.31769999861717224, mean loss: 0.3672877500008135
Epoch: 11, step: 915, loss: 0.35400035977363586, mean loss: 0.3672869590847285
Epoch: 11, step: 916, loss: 0.34058651328086853, mean loss: 0.3672853698670746
Epoch: 11, step: 917, loss: 0.30859139561653137, mean loss: 0.36728187659399697
Epoch: 11, step: 918, loss: 0.365995317697525, mean loss: 0.367281800026783
Epoch: 11, step: 919, loss: 0.3781385123729706, mean loss: 0.36728244610583244
Epoch: 11, step: 920, loss: 0.31577229499816895, mean loss: 0.36727938093766177
Epoch: 11, step: 921, loss: 0.29936182498931885, mean loss: 0.3672753396693083
Epoch: 11, step: 922, loss: 0.3652910888195038, mean loss: 0.36727522160833076
Epoch: 11, step: 923, loss: 0.34717997908592224, mean loss: 0.36727402603226444
Epoch: 11, step: 924, loss: 0.31613433361053467, mean loss: 0.36727098363281047
Epoch: 11, step: 925, loss: 0.3460996150970459, mean loss: 0.3672697241819755
Epoch: 11, step: 926, loss: 0.3754453957080841, mean loss: 0.36727021051066067
Epoch: 11, step: 927, loss: 0.30744561553001404, mean loss: 0.3672666520646114
Epoch: 11, step: 928, loss: 0.30635353922843933, mean loss: 0.3672630290875796
Epoch: 11, step: 929, loss: 0.33420926332473755, mean loss: 0.3672610632397288
Epoch: 11, step: 930, loss: 0.32234987616539, mean loss: 0.36725839233951624
Epoch: 11, step: 931, loss: 0.3558746576309204, mean loss: 0.3672577153809822
Epoch: 11, step: 932, loss: 0.3473239541053772, mean loss: 0.36725653004701797
Epoch: 11, step: 933, loss: 0.32767254114151, mean loss: 0.3672541763789893
Epoch: 11, step: 934, loss: 0.3153400719165802, mean loss: 0.3672510897445603
Epoch: 11, step: 935, loss: 0.3476267457008362, mean loss: 0.3672499230178038
Epoch: 11, step: 936, loss: 0.298888236284256, mean loss: 0.36724585894986883
Epoch: 11, step: 937, loss: 0.2957629859447479, mean loss: 0.3672416095816008
Epoch: 11, step: 938, loss: 0.29133090376853943, mean loss: 0.36723709726478376
Epoch: 11, step: 939, loss: 0.3247216045856476, mean loss: 0.3672345701908014
Epoch: 11, step: 940, loss: 0.34752827882766724, mean loss: 0.36723339894020035
Epoch: 11, step: 941, loss: 0.3642960488796234, mean loss: 0.36723322436810596
Epoch: 11, step: 942, loss: 0.3825873136520386, mean loss: 0.3672341368355264
Epoch: 11, step: 943, loss: 0.34633293747901917, mean loss: 0.36723289478659865
Epoch: 11, step: 944, loss: 0.3059764802455902, mean loss: 0.36722925485466323
Epoch: 11, step: 945, loss: 0.31626346707344055, mean loss: 0.3672262265844445
Epoch: 11, step: 946, loss: 0.33848750591278076, mean loss: 0.3672245190970301
Epoch: 11, step: 947, loss: 0.3485267460346222, mean loss: 0.3672234082502464
Epoch: 11, step: 948, loss: 0.38076427578926086, mean loss: 0.36722421267414823
Epoch: 11, step: 949, loss: 0.3490438163280487, mean loss: 0.3672231326933744
Epoch: 11, step: 950, loss: 0.33013638854026794, mean loss: 0.3672209297385688
Epoch: 11, step: 951, loss: 0.32617664337158203, mean loss: 0.3672184918503313
Epoch: 11, step: 952, loss: 0.35448890924453735, mean loss: 0.367217735802187
Epoch: 11, step: 953, loss: 0.36770761013031006, mean loss: 0.36721776489556673
Epoch: 11, step: 954, loss: 0.33416640758514404, mean loss: 0.36721580210933774
Epoch: 11, step: 955, loss: 0.34093180298805237, mean loss: 0.367214241301789
Epoch: 11, step: 956, loss: 0.33195677399635315, mean loss: 0.3672121477522785
Epoch: 11, step: 957, loss: 0.362072229385376, mean loss: 0.36721184256771805
Epoch: 11, step: 958, loss: 0.30147403478622437, mean loss: 0.3672079395927266
Epoch: 11, step: 959, loss: 0.3132793605327606, mean loss: 0.3672047379435304
Epoch: 11, step: 960, loss: 0.3521094024181366, mean loss: 0.3672038418120062
Epoch: 11, step: 961, loss: 0.3424755036830902, mean loss: 0.367202373906383
Epoch: 11, step: 962, loss: 0.34556958079338074, mean loss: 0.3672010898324759
Epoch: 11, step: 963, loss: 0.33270877599716187, mean loss: 0.36719904256788455
Epoch: 11, step: 964, loss: 0.33573609590530396, mean loss: 0.36719717521987205
Epoch: 11, step: 965, loss: 0.361358106136322, mean loss: 0.36719682868758224
Epoch: 11, step: 966, loss: 0.3109603822231293, mean loss: 0.36719349141107255
Epoch: 11, step: 967, loss: 0.32346847653388977, mean loss: 0.36719089676267014
Epoch: 11, step: 968, loss: 0.33022716641426086, mean loss: 0.3671887034599734
Epoch: 11, step: 969, loss: 0.3523849546909332, mean loss: 0.3671878251077265
Epoch: 11, step: 970, loss: 0.32424846291542053, mean loss: 0.3671852775335828
Epoch: 11, step: 971, loss: 0.32897326350212097, mean loss: 0.36718301056549835
Epoch: 11, step: 972, loss: 0.31232407689094543, mean loss: 0.36717975619439586
Epoch: 11, step: 973, loss: 0.3251509666442871, mean loss: 0.36717726308788556
Epoch: 11, step: 974, loss: 0.3135140538215637, mean loss: 0.36717408002784246
Epoch: 11, step: 975, loss: 0.32387489080429077, mean loss: 0.367171511867153
Epoch: 11, step: 976, loss: 0.3555639386177063, mean loss: 0.36717082343982077
Epoch: 11, step: 977, loss: 0.3101799488067627, mean loss: 0.3671674435990763
Epoch: 11, step: 978, loss: 0.331194669008255, mean loss: 0.36716531036213207
Epoch: 11, step: 979, loss: 0.3233352601528168, mean loss: 0.3671627113316405
Epoch: 11, step: 980, loss: 0.3466578423976898, mean loss: 0.3671614955078081
Epoch: 11, step: 981, loss: 0.33255451917648315, mean loss: 0.3671594436296905
Epoch: 11, step: 982, loss: 0.32446542382240295, mean loss: 0.36715691241371806
Epoch: 11, step: 983, loss: 0.3782489597797394, mean loss: 0.36715756999300225
Epoch: 11, step: 984, loss: 0.3575529456138611, mean loss: 0.36715700062763507
Epoch: 11, step: 985, loss: 0.39908042550086975, mean loss: 0.36715889294683324
Epoch: 11, step: 986, loss: 0.34051305055618286, mean loss: 0.36715731355957754
Epoch: 11, step: 987, loss: 0.3242626488208771, mean loss: 0.36715477120154416
Epoch: 11, step: 988, loss: 0.33826959133148193, mean loss: 0.3671530592842876
Epoch: 11, step: 989, loss: 0.3354281485080719, mean loss: 0.36715117917816126
Epoch: 11, step: 990, loss: 0.3480110466480255, mean loss: 0.3671500449480854
Epoch: 11, step: 991, loss: 0.35113251209259033, mean loss: 0.367149095817198
Epoch: 11, step: 992, loss: 0.3526618182659149, mean loss: 0.36714823741359837
Epoch: 11, step: 993, loss: 0.31093305349349976, mean loss: 0.36714490673556066
Epoch: 11, step: 994, loss: 0.3329343795776367, mean loss: 0.3671428799254915
Epoch: 11, step: 995, loss: 0.3223164975643158, mean loss: 0.3671402243341194
Epoch: 11, step: 996, loss: 0.348160982131958, mean loss: 0.3671391000380349
Epoch: 11, step: 997, loss: 0.3330884575843811, mean loss: 0.3671370830588586
Epoch: 11, step: 998, loss: 0.3423895835876465, mean loss: 0.3671356172352804
Epoch: 11, step: 999, loss: 0.3497872054576874, mean loss: 0.36713458972925234
Epoch: 11, step: 1000, loss: 0.3729500472545624, mean loss: 0.3671349341448594
Epoch: 11, step: 1001, loss: 0.3069401681423187, mean loss: 0.36713136937131907
Epoch: 11, step: 1002, loss: 0.33729976415634155, mean loss: 0.3671296028286996
Epoch: 11, step: 1003, loss: 0.33576714992523193, mean loss: 0.36712774574361534
Epoch: 11, step: 1004, loss: 0.31892886757850647, mean loss: 0.36712489188144676
Epoch: 11, step: 1005, loss: 0.35746562480926514, mean loss: 0.3671243199887841
Epoch: 11, step: 1006, loss: 0.3777724802494049, mean loss: 0.36712495039315685
Epoch: 11, step: 1007, loss: 0.3182842433452606, mean loss: 0.3671220590418043
Epoch: 11, step: 1008, loss: 0.337619423866272, mean loss: 0.3671203126003684
Epoch: 11, step: 1009, loss: 0.33098340034484863, mean loss: 0.36711817356211485
Epoch: 11, step: 1010, loss: 0.3344820737838745, mean loss: 0.36711624186044106
Epoch: 11, step: 1011, loss: 0.31383681297302246, mean loss: 0.3671130884851518
Epoch: 11, step: 1012, loss: 0.3559170067310333, mean loss: 0.3671124258774845
Epoch: 11, step: 1013, loss: 0.32953521609306335, mean loss: 0.36711020211077927
Epoch: 11, step: 1014, loss: 0.3706551790237427, mean loss: 0.3671104118851395
Epoch: 11, step: 1015, loss: 0.32053178548812866, mean loss: 0.36710765575340004
Epoch: 11, step: 1016, loss: 0.319375604391098, mean loss: 0.36710483153877593
Epoch: 11, step: 1017, loss: 0.35368630290031433, mean loss: 0.3671040376369514
Epoch: 11, step: 1018, loss: 0.33045557141304016, mean loss: 0.3671018694735352
Epoch: 11, step: 1019, loss: 0.3309497535228729, mean loss: 0.3670997308012712
Epoch: 11, step: 1020, loss: 0.3539890646934509, mean loss: 0.3670989552516641
Epoch: 11, step: 1021, loss: 0.3310958743095398, mean loss: 0.36709682564791735
Epoch: 11, step: 1022, loss: 0.350925087928772, mean loss: 0.3670958691365481
Epoch: 11, step: 1023, loss: 0.3268616497516632, mean loss: 0.36709348953994386
Epoch: 11, step: 1024, loss: 0.3141025900840759, mean loss: 0.3670903556526971
Epoch: 11, step: 1025, loss: 0.35280340909957886, mean loss: 0.36708951077117413
Epoch: 11, step: 1026, loss: 0.36469680070877075, mean loss: 0.3670893692827901
Epoch: 11, step: 1027, loss: 0.33106428384780884, mean loss: 0.36708723913346214
Epoch: 11, step: 1028, loss: 0.3266865015029907, mean loss: 0.3670848503947623
Epoch: 11, step: 1029, loss: 0.37012964487075806, mean loss: 0.36708503041099005
Epoch: 11, step: 1030, loss: 0.3446899652481079, mean loss: 0.36708370643433247
Epoch: 11, step: 1031, loss: 0.35315898060798645, mean loss: 0.36708288326539024
Epoch: 11, step: 1032, loss: 0.3164784610271454, mean loss: 0.3670798919299148
Epoch: 11, step: 1033, loss: 0.36127814650535583, mean loss: 0.3670795489966234
Epoch: 11, step: 1034, loss: 0.40775373578071594, mean loss: 0.3670819530504554
Epoch: 11, step: 1035, loss: 0.3652941882610321, mean loss: 0.36708184739059785
Epoch: 11, step: 1036, loss: 0.33642587065696716, mean loss: 0.3670800356787171
Epoch: 11, step: 1037, loss: 0.34468376636505127, mean loss: 0.3670787121785804
Epoch: 11, step: 1038, loss: 0.34106016159057617, mean loss: 0.36707717471178447
Epoch: 11, step: 1039, loss: 0.3104076087474823, mean loss: 0.36707382623825785
Epoch: 11, step: 1040, loss: 0.3221837878227234, mean loss: 0.36707117394647554
Epoch: 11, step: 1041, loss: 0.30326589941978455, mean loss: 0.36706740428592216
Epoch: 11, step: 1042, loss: 0.3040091097354889, mean loss: 0.36706367897756564
Epoch: 11, step: 1043, loss: 0.356152206659317, mean loss: 0.3670630343962614
Epoch: 11, step: 1044, loss: 0.3400060832500458, mean loss: 0.3670614361358121
Epoch: 11, step: 1045, loss: 0.3059004545211792, mean loss: 0.3670578235556813
Epoch: 11, step: 1046, loss: 0.34554484486579895, mean loss: 0.3670565529290975
Epoch: 11, step: 1047, loss: 0.4116256833076477, mean loss: 0.3670591851716193
Epoch: 11, step: 1048, loss: 0.3136919140815735, mean loss: 0.36705603349908106
Epoch: 11, step: 1049, loss: 0.32158544659614563, mean loss: 0.3670533483339161
Epoch: 11, step: 1050, loss: 0.3261917531490326, mean loss: 0.36705093548507145
Epoch: 11, step: 1051, loss: 0.31213077902793884, mean loss: 0.3670476926794233
Epoch: 11, step: 1052, loss: 0.35486900806427, mean loss: 0.36704697362146643
Epoch: 11, step: 1053, loss: 0.3359067142009735, mean loss: 0.3670451351364375
Epoch: 11, step: 1054, loss: 0.3487997055053711, mean loss: 0.36704405801089107
Epoch: 11, step: 1055, loss: 0.3292520344257355, mean loss: 0.3670418270767951
Epoch: 11, step: 1056, loss: 0.3206038773059845, mean loss: 0.3670390859192619
Epoch: 11, step: 1057, loss: 0.33115845918655396, mean loss: 0.36703696806855163
Epoch: 11, step: 1058, loss: 0.3309345841407776, mean loss: 0.3670348372544144
Epoch: 11, step: 1059, loss: 0.35518932342529297, mean loss: 0.3670341381565727
Epoch: 11, step: 1060, loss: 0.3459772765636444, mean loss: 0.3670328954972872
Epoch: 11, step: 1061, loss: 0.34429553151130676, mean loss: 0.36703155374324575
Epoch: 11, step: 1062, loss: 0.3445983827114105, mean loss: 0.36703023001804175
Epoch: 11, step: 1063, loss: 0.34921202063560486, mean loss: 0.36702917867219664
Epoch: 11, step: 1064, loss: 0.3670407235622406, mean loss: 0.3670291793533513
Epoch: 11, step: 1065, loss: 0.322630912065506, mean loss: 0.36702655998654965
Epoch: 11, step: 1066, loss: 0.34549182653427124, mean loss: 0.36702528957575076
Epoch: 11, step: 1067, loss: 0.3170832693576813, mean loss: 0.36702234349150004
Epoch: 11, step: 1068, loss: 0.3202047348022461, mean loss: 0.3670195818794733
Epoch: 11, step: 1069, loss: 0.2987358868122101, mean loss: 0.367015554293354
Epoch: 11, step: 1070, loss: 0.3151737451553345, mean loss: 0.36701249668149094
Epoch: 11, step: 1071, loss: 0.2875940203666687, mean loss: 0.3670078128836427
Epoch: 11, step: 1072, loss: 0.388176292181015, mean loss: 0.3670090612459295
Epoch: 11, step: 1073, loss: 0.31551286578178406, mean loss: 0.36700602455554954
Epoch: 11, step: 1074, loss: 0.33737462759017944, mean loss: 0.36700427731827345
Epoch: 11, step: 1075, loss: 0.33122146129608154, mean loss: 0.3670021674824231
Epoch: 11, step: 1076, loss: 0.3858814537525177, mean loss: 0.36700328058225623
Epoch: 11, step: 1077, loss: 0.3244595527648926, mean loss: 0.3670007724035145
Epoch: 11, step: 1078, loss: 0.3113691806793213, mean loss: 0.3669974928190233
Epoch: 11, step: 1079, loss: 0.34042683243751526, mean loss: 0.36699592652213686
Epoch: 11, step: 1080, loss: 0.3332669734954834, mean loss: 0.3669939383728279
Epoch: 11, step: 1081, loss: 0.3467685282230377, mean loss: 0.36699274625859063
Epoch: 11, step: 1082, loss: 0.3044686019420624, mean loss: 0.3669890612144275
Epoch: 11, step: 1083, loss: 0.3245787024497986, mean loss: 0.3669865617826285
Epoch: 11, step: 1084, loss: 0.34219542145729065, mean loss: 0.36698510081614105
Epoch: 11, step: 1085, loss: 0.3285026252269745, mean loss: 0.3669828331393238
Epoch: 11, step: 1086, loss: 0.34505370259284973, mean loss: 0.3669815409862069
Epoch: 11, step: 1087, loss: 0.31415557861328125, mean loss: 0.3669784284501255
Epoch: 11, step: 1088, loss: 0.3091578185558319, mean loss: 0.3669750218272601
Epoch: 11, step: 1089, loss: 0.31234875321388245, mean loss: 0.36697180359533993
Epoch: 11, step: 1090, loss: 0.34248101711273193, mean loss: 0.36697036083914064
Epoch: 11, step: 1091, loss: 0.35461142659187317, mean loss: 0.36696963281520995
Epoch: 11, step: 1092, loss: 0.324512243270874, mean loss: 0.3669671319381678
Epoch: 11, step: 1093, loss: 0.3551279306411743, mean loss: 0.3669664346121402
Epoch: 11, step: 1094, loss: 0.3035144507884979, mean loss: 0.3669626975261031
Epoch: 11, step: 1095, loss: 0.33490681648254395, mean loss: 0.3669608096650287
Epoch: 11, step: 1096, loss: 0.33525553345680237, mean loss: 0.36695894256201894
Epoch: 11, step: 1097, loss: 0.35967811942100525, mean loss: 0.36695851382434724
Epoch: 11, step: 1098, loss: 0.318478524684906, mean loss: 0.36695565920566153
Epoch: 11, step: 1099, loss: 0.33174729347229004, mean loss: 0.3669535861742359
Epoch: 11, step: 1100, loss: 0.31352120637893677, mean loss: 0.3669504403173154
Epoch: 11, step: 1101, loss: 0.3341358006000519, mean loss: 0.3669485084534441
Epoch: 11, step: 1102, loss: 0.34160536527633667, mean loss: 0.3669470165394406
Epoch: 11, step: 1103, loss: 0.32235148549079895, mean loss: 0.3669443914198828
Epoch: 11, step: 1104, loss: 0.35568150877952576, mean loss: 0.3669437284684059
Epoch: 11, step: 1105, loss: 0.3439771831035614, mean loss: 0.36694237669999125
Epoch: 11, step: 1106, loss: 0.35548800230026245, mean loss: 0.36694170255636227
Epoch: 11, step: 1107, loss: 0.3049110174179077, mean loss: 0.36693805197460977
Epoch: 11, step: 1108, loss: 0.3243272304534912, mean loss: 0.3669355444231756
Epoch: 11, step: 1109, loss: 0.30480828881263733, mean loss: 0.36693188858843334
Epoch: 11, step: 1110, loss: 0.33602359890937805, mean loss: 0.3669300699188435
Epoch: 11, step: 1111, loss: 0.34451666474342346, mean loss: 0.3669287511729518
Epoch: 11, step: 1112, loss: 0.3820059597492218, mean loss: 0.3669296382241124
Epoch: 11, step: 1113, loss: 0.30187684297561646, mean loss: 0.3669258111388525
Epoch: 11, step: 1114, loss: 0.3576894998550415, mean loss: 0.3669252677944626
Epoch: 11, step: 1115, loss: 0.3305515646934509, mean loss: 0.36692312816486844
Epoch: 11, step: 1116, loss: 0.3434711992740631, mean loss: 0.3669217487207833
Epoch: 11, step: 1117, loss: 0.3331219553947449, mean loss: 0.3669197607315276
Epoch: 11, step: 1118, loss: 0.3538667857646942, mean loss: 0.36691899304494485
Epoch: 11, step: 1119, loss: 0.344387024641037, mean loss: 0.3669176679468265
Epoch: 11, step: 1120, loss: 0.34146472811698914, mean loss: 0.3669161711553046
Epoch: 11, step: 1121, loss: 0.3641340136528015, mean loss: 0.3669160075567216
Epoch: 11, step: 1122, loss: 0.3781226575374603, mean loss: 0.36691666650009674
Epoch: 11, step: 1123, loss: 0.3153245151042938, mean loss: 0.36691363309514635
Epoch: 11, step: 1124, loss: 0.35013777017593384, mean loss: 0.3669126468018358
Epoch: 11, step: 1125, loss: 0.3827797770500183, mean loss: 0.3669135796137257
Epoch: 11, step: 1126, loss: 0.3431735932826996, mean loss: 0.36691218404695536
Epoch: 11, step: 1127, loss: 0.34140151739120483, mean loss: 0.3669106844780243
Epoch: 11, step: 1128, loss: 0.40290772914886475, mean loss: 0.36691280033323326
Epoch: 11, step: 1129, loss: 0.34407028555870056, mean loss: 0.3669114577615409
Epoch: 11, step: 1130, loss: 0.3256451189517975, mean loss: 0.3669090324698095
Epoch: 11, step: 1131, loss: 0.31456246972084045, mean loss: 0.3669059561555906
Epoch: 11, step: 1132, loss: 0.32360005378723145, mean loss: 0.36690341129443005
Epoch: 11, step: 1133, loss: 0.31103959679603577, mean loss: 0.3669001286634218
Epoch: 11, step: 1134, loss: 0.38098815083503723, mean loss: 0.36690095644544024
Epoch: 11, step: 1135, loss: 0.31591564416885376, mean loss: 0.3668979608336731
Epoch: 11, step: 1136, loss: 0.40440642833709717, mean loss: 0.36690016449194834
Epoch: 11, step: 1137, loss: 0.34910982847213745, mean loss: 0.36689911935412556
Epoch: 11, step: 1138, loss: 0.3812888562679291, mean loss: 0.36689996466558145
Epoch: 11, step: 1139, loss: 0.3173815906047821, mean loss: 0.3668970559265036
Epoch: 11, step: 1140, loss: 0.33231449127197266, mean loss: 0.366895024645173
Epoch: 11, step: 1141, loss: 0.316194623708725, mean loss: 0.3668920468229636
Epoch: 11, step: 1142, loss: 0.3436947762966156, mean loss: 0.366890684441421
Epoch: 11, step: 1143, loss: 0.3289448618888855, mean loss: 0.3668884560045786
Epoch: 11, step: 1144, loss: 0.3135818839073181, mean loss: 0.36688532566385995
Epoch: 11, step: 1145, loss: 0.3653748333454132, mean loss: 0.36688523696789294
Epoch: 11, step: 1146, loss: 0.3259733319282532, mean loss: 0.36688283476572986
Epoch: 11, step: 1147, loss: 0.34206244349479675, mean loss: 0.36688137748582905
Epoch: 11, step: 1148, loss: 0.3717535138130188, mean loss: 0.36688166352682755
Epoch: 11, step: 1149, loss: 0.33210447430610657, mean loss: 0.36687962189308204
Epoch: 11, step: 1150, loss: 0.34017878770828247, mean loss: 0.3668780544827982
Epoch: 11, step: 1151, loss: 0.37446674704551697, mean loss: 0.3668784999331717
Epoch: 11, step: 1152, loss: 0.3075210154056549, mean loss: 0.36687501589933197
Epoch: 11, step: 1153, loss: 0.3551139235496521, mean loss: 0.3668743256133624
Epoch: 11, step: 1154, loss: 0.3319002091884613, mean loss: 0.36687227302128395
Epoch: 11, step: 1155, loss: 0.2941904067993164, mean loss: 0.36686800765354793
Epoch: 11, step: 1156, loss: 0.32201340794563293, mean loss: 0.3668653754958279
Epoch: 11, step: 1157, loss: 0.351372092962265, mean loss: 0.3668644663723369
Epoch: 11, step: 1158, loss: 0.34507760405540466, mean loss: 0.3668631880256657
Epoch: 11, step: 1159, loss: 0.3284834623336792, mean loss: 0.3668609362229379
Epoch: 11, step: 1160, loss: 0.37617552280426025, mean loss: 0.3668614826932566
Epoch: 11, step: 1161, loss: 0.3407283127307892, mean loss: 0.36685994959634455
Epoch: 11, step: 1162, loss: 0.2770146131515503, mean loss: 0.3668546791477938
Epoch: 11, step: 1163, loss: 0.3291783332824707, mean loss: 0.3668524691321987
Epoch: 11, step: 1164, loss: 0.37067922949790955, mean loss: 0.3668526935887865
Epoch: 11, step: 1165, loss: 0.3181118071079254, mean loss: 0.3668498348857671
Epoch: 11, step: 1166, loss: 0.35141852498054504, mean loss: 0.3668489298766823
Epoch: 11, step: 1167, loss: 0.3769245445728302, mean loss: 0.3668495207525148
Epoch: 11, step: 1168, loss: 0.3147929608821869, mean loss: 0.3668464681189682
Epoch: 11, step: 1169, loss: 0.3349776566028595, mean loss: 0.3668445994188676
Epoch: 11, step: 1170, loss: 0.3340443968772888, mean loss: 0.36684267621731137
Epoch: 11, step: 1171, loss: 0.3532049059867859, mean loss: 0.36684187662946954
Epoch: 11, step: 1172, loss: 0.33995509147644043, mean loss: 0.36684030033908127
Epoch: 11, step: 1173, loss: 0.30808311700820923, mean loss: 0.36683685578618347
Epoch: 11, step: 1174, loss: 0.3445178270339966, mean loss: 0.3668355474428602
Epoch: 11, step: 1175, loss: 0.3627994954586029, mean loss: 0.36683531086302523
Epoch: 11, step: 1176, loss: 0.3180847465991974, mean loss: 0.3668324534358953
Epoch: 11, step: 1177, loss: 0.3180249333381653, mean loss: 0.3668295928380699
Epoch: 11, step: 1178, loss: 0.36161333322525024, mean loss: 0.36682928713217916
Epoch: 11, step: 1179, loss: 0.3469732105731964, mean loss: 0.36682812350837707
Epoch: 11, step: 1180, loss: 0.3790505826473236, mean loss: 0.36682883973803654
Epoch: 11, step: 1181, loss: 0.33038559556007385, mean loss: 0.36682670430828274
Epoch: 11, step: 1182, loss: 0.36183595657348633, mean loss: 0.366826411887369
Epoch: 11, step: 1183, loss: 0.40640103816986084, mean loss: 0.3668287305319836
Epoch: 11, step: 1184, loss: 0.3304710388183594, mean loss: 0.3668266004897015
Epoch: 11, step: 1185, loss: 0.341435968875885, mean loss: 0.36682511304789633
Epoch: 11, step: 1186, loss: 0.3517468273639679, mean loss: 0.3668242297788621
Epoch: 11, step: 1187, loss: 0.36728963255882263, mean loss: 0.3668242570400371
Epoch: 11, step: 1188, loss: 0.3162045478820801, mean loss: 0.3668212921417089
Epoch: 11, step: 1189, loss: 0.3500911295413971, mean loss: 0.36682031227977846
Epoch: 11, step: 1190, loss: 0.31986865401268005, mean loss: 0.366817562548694
Epoch: 11, step: 1191, loss: 0.3817130923271179, mean loss: 0.3668184348565986
Epoch: 11, step: 1192, loss: 0.35736748576164246, mean loss: 0.3668178814251355
Epoch: 11, step: 1193, loss: 0.32154449820518494, mean loss: 0.36681523044825176
Epoch: 11, step: 1194, loss: 0.2907177209854126, mean loss: 0.36681077482968727
Epoch: 11, step: 1195, loss: 0.33702540397644043, mean loss: 0.36680903095551554
Epoch: 11, step: 1196, loss: 0.31057095527648926, mean loss: 0.36680573852089937
Epoch: 11, step: 1197, loss: 0.34018242359161377, mean loss: 0.3668041799613086
Epoch: 11, step: 1198, loss: 0.34241196513175964, mean loss: 0.36680275209648217
Epoch: 11, step: 1199, loss: 0.34262770414352417, mean loss: 0.3668013370269462
Epoch: 11, step: 1200, loss: 0.3052574694156647, mean loss: 0.36679773481052175
Epoch: 11, step: 1201, loss: 0.362888365983963, mean loss: 0.36679750600513567
Epoch: 11, step: 1202, loss: 0.32395070791244507, mean loss: 0.366794998438091
Epoch: 11, step: 1203, loss: 0.34792378544807434, mean loss: 0.36679389408339824
Epoch: 11, step: 1204, loss: 0.3199569582939148, mean loss: 0.36679115331823997
Epoch: 11, step: 1205, loss: 0.36034026741981506, mean loss: 0.3667907758527105
Epoch: 11, step: 1206, loss: 0.3409741222858429, mean loss: 0.3667892653118664
Epoch: 11, step: 1207, loss: 0.3140677213668823, mean loss: 0.36678618073756586
Epoch: 11, step: 1208, loss: 0.3381801247596741, mean loss: 0.3667845071837147
Epoch: 11, step: 1209, loss: 0.30806589126586914, mean loss: 0.36678107214124844
Epoch: 11, step: 1210, loss: 0.3514799475669861, mean loss: 0.36678017707692706
Epoch: 11, step: 1211, loss: 0.31709691882133484, mean loss: 0.3667772709434306
Epoch: 11, step: 1212, loss: 0.3694981634616852, mean loss: 0.3667774300878722
Epoch: 11, step: 1213, loss: 0.3462468981742859, mean loss: 0.36677622933153153
Epoch: 11, step: 1214, loss: 0.32049819827079773, mean loss: 0.3667735228556522
Epoch: 11, step: 1215, loss: 0.33142319321632385, mean loss: 0.36677145558491303
Epoch: 11, step: 1216, loss: 0.38451695442199707, mean loss: 0.36677249327269956
Epoch: 11, step: 1217, loss: 0.345913290977478, mean loss: 0.3667712735789623
Epoch: 11, step: 1218, loss: 0.33198291063308716, mean loss: 0.3667692395286234
Epoch: 11, step: 1219, loss: 0.3467405438423157, mean loss: 0.36676806853378674
Epoch: 11, step: 1220, loss: 0.3213641047477722, mean loss: 0.36676541410737423
Epoch: 11, step: 1221, loss: 0.365311861038208, mean loss: 0.36676532913408594
Epoch: 11, step: 1222, loss: 0.3160310983657837, mean loss: 0.3667623634340352
Epoch: 11, step: 1223, loss: 0.33721691370010376, mean loss: 0.36676063643790857
Epoch: 11, step: 1224, loss: 0.3180710971355438, mean loss: 0.36675779059424135
Epoch: 11, step: 1225, loss: 0.30580374598503113, mean loss: 0.3667542281135512
Epoch: 11, step: 1226, loss: 0.3226177394390106, mean loss: 0.3667516486916194
Epoch: 11, step: 1227, loss: 0.33739233016967773, mean loss: 0.3667499329764183
Epoch: 11, step: 1228, loss: 0.31136783957481384, mean loss: 0.36674669671781945
Epoch: 11, step: 1229, loss: 0.31327688694000244, mean loss: 0.366743572386291
Epoch: 11, step: 1230, loss: 0.3330654799938202, mean loss: 0.36674160463330285
Epoch: 11, step: 1231, loss: 0.42513182759284973, mean loss: 0.36674501607423293
Epoch: 11, step: 1232, loss: 0.37331533432006836, mean loss: 0.3667453999217673
Epoch: 11, step: 1233, loss: 0.35560405254364014, mean loss: 0.36674474906609617
Epoch: 11, step: 1234, loss: 0.28567492961883545, mean loss: 0.36674001340283036
Epoch: 11, step: 1235, loss: 0.3227788805961609, mean loss: 0.3667374455796524
Epoch: 11, step: 1236, loss: 0.3421594798564911, mean loss: 0.3667360100346653
Epoch: 11, step: 1237, loss: 0.3012986481189728, mean loss: 0.3667321882053279
Epoch: 11, step: 1238, loss: 0.3242293894290924, mean loss: 0.3667297060001783
Epoch: 11, step: 1239, loss: 0.37208205461502075, mean loss: 0.36673001856433474
Epoch: 11, step: 1240, loss: 0.319134920835495, mean loss: 0.36672723928855494
Epoch: 11, step: 1241, loss: 0.29496508836746216, mean loss: 0.3667230490426761
Epoch: 11, step: 1242, loss: 0.32488083839416504, mean loss: 0.36672060598722866
Epoch: 11, step: 1243, loss: 0.3304499089717865, mean loss: 0.3667184883612936
Epoch: 11, step: 1244, loss: 0.3180437982082367, mean loss: 0.36671564670736445
Epoch: 11, step: 1245, loss: 0.30285125970840454, mean loss: 0.36671191848862544
Epoch: 11, step: 1246, loss: 0.3428020477294922, mean loss: 0.3667105227807999
Epoch: 11, step: 1247, loss: 0.28745466470718384, mean loss: 0.36670589659249303
Epoch: 11, step: 1248, loss: 0.32744938135147095, mean loss: 0.36670360531161744
Epoch: 11, step: 1249, loss: 0.35185548663139343, mean loss: 0.36670273872362397
Epoch: 11, step: 1250, loss: 0.31358882784843445, mean loss: 0.36669963899144564
Epoch: 11, step: 1251, loss: 0.38811731338500977, mean loss: 0.366700888855731
Epoch: 11, step: 1252, loss: 0.33376458287239075, mean loss: 0.36669896691455206
Epoch: 11, step: 1253, loss: 0.31638628244400024, mean loss: 0.3666960311761654
Epoch: 11, step: 1254, loss: 0.32049480080604553, mean loss: 0.3666933354978662
Epoch: 11, step: 1255, loss: 0.3546488881111145, mean loss: 0.36669263278798364
Epoch: 11, step: 1256, loss: 0.3284000754356384, mean loss: 0.3666903988134575
Epoch: 11, step: 1257, loss: 0.33068645000457764, mean loss: 0.36668829847809353
Epoch: 11, step: 1258, loss: 0.36219480633735657, mean loss: 0.366688036359903
Epoch: 11, step: 1259, loss: 0.36594459414482117, mean loss: 0.3666879929953314
Epoch: 11, step: 1260, loss: 0.3300338387489319, mean loss: 0.36668585510357016
Epoch: 11, step: 1261, loss: 0.32534894347190857, mean loss: 0.36668344422571925
Epoch: 11, step: 1262, loss: 0.31243130564689636, mean loss: 0.36668028028225513
Epoch: 11, step: 1263, loss: 0.34145134687423706, mean loss: 0.36667880903584693
Epoch: 11, step: 1264, loss: 0.3226807415485382, mean loss: 0.3666762434012626
Epoch: 11, step: 1265, loss: 0.33616986870765686, mean loss: 0.36667446460390435
Epoch: 11, step: 1266, loss: 0.3285042345523834, mean loss: 0.36667223906428265
Epoch: 11, step: 1267, loss: 0.3666592240333557, mean loss: 0.3666722383054772
Epoch: 11, step: 1268, loss: 0.2991558015346527, mean loss: 0.3666683021755424
Epoch: 11, step: 1269, loss: 0.3419633209705353, mean loss: 0.36666686198776083
Epoch: 11, step: 1270, loss: 0.34315750002861023, mean loss: 0.3666654915790194
Epoch: 11, step: 1271, loss: 0.34382012486457825, mean loss: 0.36666415995354057
Epoch: 11, step: 1272, loss: 0.3513060510158539, mean loss: 0.3666632648023523
Epoch: 11, step: 1273, loss: 0.3484921455383301, mean loss: 0.36666220575588626
Epoch: 11, step: 1274, loss: 0.3278297483921051, mean loss: 0.3666599426602884
Epoch: 11, step: 1275, loss: 0.3761078119277954, mean loss: 0.36666049323542055
Epoch: 11, step: 1276, loss: 0.3402152359485626, mean loss: 0.36665895222631345
Epoch: 11, step: 1277, loss: 0.33414629101753235, mean loss: 0.36665705776988594
Epoch: 11, step: 1278, loss: 0.39099225401878357, mean loss: 0.3666584756569831
Epoch: 11, step: 1279, loss: 0.3306788206100464, mean loss: 0.36665637942911977
Epoch: 11, step: 1280, loss: 0.34027963876724243, mean loss: 0.3666548427707649
Epoch: 11, step: 1281, loss: 0.34566596150398254, mean loss: 0.3666536200700037
Epoch: 11, step: 1282, loss: 0.3128560781478882, mean loss: 0.3666504862934602
Epoch: 11, step: 1283, loss: 0.323682963848114, mean loss: 0.3666479835253774
Epoch: 11, step: 1284, loss: 0.3063346743583679, mean loss: 0.3666444706062111
Epoch: 11, step: 1285, loss: 0.4172718822956085, mean loss: 0.3666474192032809
Epoch: 11, step: 1286, loss: 0.30834996700286865, mean loss: 0.3666440240922099
Epoch: 11, step: 1287, loss: 0.3331380784511566, mean loss: 0.3666420728957482
Epoch: 11, step: 1288, loss: 0.33194077014923096, mean loss: 0.3666400522061339
Epoch: 11, step: 1289, loss: 0.35273441672325134, mean loss: 0.36663924251500296
Epoch: 11, step: 1290, loss: 0.3705601990222931, mean loss: 0.3666394708094139
Epoch: 11, step: 1291, loss: 0.3301441967487335, mean loss: 0.36663734602634096
Epoch: 11, step: 1292, loss: 0.3337319791316986, mean loss: 0.3666354303619703
Epoch: 11, step: 1293, loss: 0.31975868344306946, mean loss: 0.36663270147927624
Epoch: 11, step: 1294, loss: 0.34382864832878113, mean loss: 0.36663137404152374
Epoch: 11, step: 1295, loss: 0.3347858786582947, mean loss: 0.36662952040384134
Epoch: 11, step: 1296, loss: 0.33841681480407715, mean loss: 0.3666278783163261
Epoch: 11, step: 1297, loss: 0.33095675706863403, mean loss: 0.3666258022412913
Epoch: 11, step: 1298, loss: 0.3314102590084076, mean loss: 0.3666237528003769
Epoch: 11, step: 1299, loss: 0.322873592376709, mean loss: 0.3666212068180431
Epoch: 11, step: 1300, loss: 0.34871768951416016, mean loss: 0.3666201650073184
Epoch: 11, step: 1301, loss: 0.3379156291484833, mean loss: 0.36661849477946673
Epoch: 11, step: 1302, loss: 0.3379702866077423, mean loss: 0.36661682792613737
Epoch: 11, step: 1303, loss: 0.3465671241283417, mean loss: 0.36661566143185076
Epoch: 11, step: 1304, loss: 0.30627745389938354, mean loss: 0.3666121511515824
Epoch: 11, step: 1305, loss: 0.34376779198646545, mean loss: 0.36661082221853036
Epoch: 11, step: 1306, loss: 0.3473762273788452, mean loss: 0.3666097033426744
Epoch: 11, step: 1307, loss: 0.34086060523986816, mean loss: 0.3666082056054651
Epoch: 11, step: 1308, loss: 0.3143291771411896, mean loss: 0.36660516488956535
Epoch: 11, step: 1309, loss: 0.34908947348594666, mean loss: 0.3666041461800502
Epoch: 11, step: 1310, loss: 0.3538917303085327, mean loss: 0.3666034068711888
Epoch: 11, step: 1311, loss: 0.3279883861541748, mean loss: 0.3666011612896165
Epoch: 11, step: 1312, loss: 0.3761938214302063, mean loss: 0.36660171909970785
Epoch: 11, step: 1313, loss: 0.39419227838516235, mean loss: 0.3666033233885371
Epoch: 11, step: 1314, loss: 0.3817202150821686, mean loss: 0.3666042023286902
Epoch: 11, step: 1315, loss: 0.32539913058280945, mean loss: 0.36660180668498404
Epoch: 11, step: 1316, loss: 0.3051585555076599, mean loss: 0.3665982346106176
Epoch: 11, step: 1317, loss: 0.38324394822120667, mean loss: 0.36659920227214593
Epoch: 11, step: 1318, loss: 0.33775824308395386, mean loss: 0.36659752576460725
Epoch: 11, step: 1319, loss: 0.30118417739868164, mean loss: 0.36659372354719466
Epoch: 11, step: 1320, loss: 0.3250965476036072, mean loss: 0.3665913116218274
Epoch: 11, step: 1321, loss: 0.32900241017341614, mean loss: 0.3665891269826638
Epoch: 11, step: 1322, loss: 0.34337911009788513, mean loss: 0.36658777811203647
Epoch: 11, step: 1323, loss: 0.3244818150997162, mean loss: 0.3665853312290162
Epoch: 11, step: 1324, loss: 0.3075318932533264, mean loss: 0.3665818996851743
Epoch: 11, step: 1325, loss: 0.3326595723628998, mean loss: 0.36657992860281974
Epoch: 11, step: 1326, loss: 0.3305397927761078, mean loss: 0.36657783458528287
Epoch: 11, step: 1327, loss: 0.3472723364830017, mean loss: 0.36657671295513516
Epoch: 11, step: 1328, loss: 0.3219067454338074, mean loss: 0.3665741178254354
Epoch: 11, step: 1329, loss: 0.3151821792125702, mean loss: 0.3665711323520642
Epoch: 11, step: 1330, loss: 0.3230472505092621, mean loss: 0.36656860409868963
Epoch: 11, step: 1331, loss: 0.32409635186195374, mean loss: 0.3665661370766034
Epoch: 11, step: 1332, loss: 0.37706896662712097, mean loss: 0.36656674710329507
Epoch: 11, step: 1333, loss: 0.34269091486930847, mean loss: 0.3665653604246893
Epoch: 11, step: 1334, loss: 0.30668357014656067, mean loss: 0.3665618827668533
Epoch: 11, step: 1335, loss: 0.3469819128513336, mean loss: 0.36656074571865843
Epoch: 11, step: 1336, loss: 0.37122294306755066, mean loss: 0.3665610164461045
Epoch: 11, step: 1337, loss: 0.3465632498264313, mean loss: 0.3665598552704792
Epoch: 11, step: 1338, loss: 0.32886141538619995, mean loss: 0.36655766642765947
Epoch: 11, step: 1339, loss: 0.30723515152931213, mean loss: 0.36655422225006434
Epoch: 11, step: 1340, loss: 0.36891913414001465, mean loss: 0.3665543595453845
Epoch: 11, step: 1341, loss: 0.3507412374019623, mean loss: 0.3665534415654621
Epoch: 11, step: 1342, loss: 0.31275302171707153, mean loss: 0.36655031853650477
Epoch: 11, step: 1343, loss: 0.3608405888080597, mean loss: 0.3665499871149974
Epoch: 11, step: 1344, loss: 0.3729555010795593, mean loss: 0.36655035890175025
Epoch: 11, step: 1345, loss: 0.3325637876987457, mean loss: 0.3665483863787553
Epoch: 11, step: 1346, loss: 0.3408753275871277, mean loss: 0.3665468964444049
Epoch: 11, step: 1347, loss: 0.3631593585014343, mean loss: 0.36654669986026245
Epoch: 11, step: 1348, loss: 0.35909220576286316, mean loss: 0.36654626728937534
Epoch: 11, step: 1349, loss: 0.3363170325756073, mean loss: 0.3665445132430301
Epoch: 11, step: 1350, loss: 0.3494342565536499, mean loss: 0.3665435204808201
Epoch: 11, step: 1351, loss: 0.34794381260871887, mean loss: 0.36654244136107816
Epoch: 11, step: 1352, loss: 0.37430939078330994, mean loss: 0.3665428919585964
Epoch: 11, step: 1353, loss: 0.3216557800769806, mean loss: 0.3665402879957306
Epoch: 11, step: 1354, loss: 0.3478216826915741, mean loss: 0.36653920216677854
Epoch: 11, step: 1355, loss: 0.36200186610221863, mean loss: 0.3665389389802319
Epoch: 11, step: 1356, loss: 0.3344377875328064, mean loss: 0.36653707707248595
Epoch: 11, step: 1357, loss: 0.33300215005874634, mean loss: 0.36653513211673755
Epoch: 11, step: 1358, loss: 0.31190595030784607, mean loss: 0.36653196392200293
Epoch: 11, step: 1359, loss: 0.32031863927841187, mean loss: 0.36652928395652834
Epoch: 11, step: 1360, loss: 0.32783204317092896, mean loss: 0.36652703998779623
Epoch: 11, step: 1361, loss: 0.3631736934185028, mean loss: 0.36652684554580567
Epoch: 11, step: 1362, loss: 0.33939129114151, mean loss: 0.36652527219656206
Epoch: 11, step: 1363, loss: 0.3283061981201172, mean loss: 0.3665230563411541
Epoch: 11, step: 1364, loss: 0.3805367350578308, mean loss: 0.36652386877542376
Epoch: 11, step: 1365, loss: 0.33047449588775635, mean loss: 0.3665217789567056
Epoch: 11, step: 1366, loss: 0.33782389760017395, mean loss: 0.36652011540784724
Epoch: 11, step: 1367, loss: 0.3155752122402191, mean loss: 0.3665171624225025
Epoch: 11, step: 1368, loss: 0.30936598777770996, mean loss: 0.366513849887022
Epoch: 11, step: 1369, loss: 0.30504196882247925, mean loss: 0.3665102871258614
Epoch: 11, step: 1370, loss: 0.33890631794929504, mean loss: 0.3665086873594646
Epoch: 11, step: 1371, loss: 0.2917817234992981, mean loss: 0.3665043568678176
Epoch: 11, step: 1372, loss: 0.37784844636917114, mean loss: 0.3665050142294391
Epoch: 11, step: 1373, loss: 0.3555667996406555, mean loss: 0.3665043804239814
Epoch: 11, step: 1374, loss: 0.3373713791370392, mean loss: 0.3665026924350315
Epoch: 11, step: 1375, loss: 0.3011007010936737, mean loss: 0.36649890321189466
Epoch: 11, step: 1376, loss: 0.33212172985076904, mean loss: 0.3664969116022914
Epoch: 11, step: 1377, loss: 0.35698989033699036, mean loss: 0.3664963608537533
Epoch: 11, step: 1378, loss: 0.31279256939888, mean loss: 0.36649324993494115
Epoch: 11, step: 1379, loss: 0.36388543248176575, mean loss: 0.3664930988797133
Epoch: 11, step: 1380, loss: 0.347210168838501, mean loss: 0.3664919819998963
Epoch: 11, step: 1381, loss: 0.33406180143356323, mean loss: 0.3664901037315906
Epoch: 11, step: 1382, loss: 0.3250507116317749, mean loss: 0.3664877038131276
Epoch: 11, step: 1383, loss: 0.3483232855796814, mean loss: 0.36648665190102236
Epoch: 11, step: 1384, loss: 0.33980634808540344, mean loss: 0.36648510691846314
Epoch: 11, step: 1385, loss: 0.3276672661304474, mean loss: 0.3664828592148854
Epoch: 11, step: 1386, loss: 0.33478841185569763, mean loss: 0.36648102408968364
Epoch: 11, step: 1387, loss: 0.303101509809494, mean loss: 0.3664773545948782
Epoch: 11, step: 1388, loss: 0.3367597460746765, mean loss: 0.3664756341289186
Epoch: 11, step: 1389, loss: 0.36721864342689514, mean loss: 0.36647567714207696
Epoch: 11, step: 1390, loss: 0.33576861023902893, mean loss: 0.36647389959840676
Epoch: 11, step: 1391, loss: 0.3410523533821106, mean loss: 0.366472428103488
Epoch: 11, step: 1392, loss: 0.31375542283058167, mean loss: 0.3664693768211315
Epoch: 11, step: 1393, loss: 0.35748204588890076, mean loss: 0.36646885666075807
Epoch: 11, step: 1394, loss: 0.34108683466911316, mean loss: 0.3664673877087359
Epoch: 11, step: 1395, loss: 0.3192249834537506, mean loss: 0.36646465377330445
Epoch: 11, step: 1396, loss: 0.29547956585884094, mean loss: 0.3664605460776899
Epoch: 11, step: 1397, loss: 0.3324505686759949, mean loss: 0.3664585781354725
Epoch: 11, step: 1398, loss: 0.322626531124115, mean loss: 0.36645604199897935
Epoch: 11, step: 1399, loss: 0.3215785622596741, mean loss: 0.3664534455236415
Epoch: 11, step: 1400, loss: 0.35626330971717834, mean loss: 0.3664528559872917
Epoch: 11, step: 1401, loss: 0.33575424551963806, mean loss: 0.36645108006397414
Epoch: 11, step: 1402, loss: 0.34121665358543396, mean loss: 0.3664496203296953
Epoch: 11, step: 1403, loss: 0.3376498222351074, mean loss: 0.36644795444595546
Epoch: 11, step: 1404, loss: 0.3142203390598297, mean loss: 0.3664449335878731
Epoch: 11, step: 1405, loss: 0.335525780916214, mean loss: 0.36644314531993377
Epoch: 11, step: 1406, loss: 0.3404020369052887, mean loss: 0.36644163927005724
Epoch: 11, step: 1407, loss: 0.30997946858406067, mean loss: 0.36643837405084106
Epoch: 11, step: 1408, loss: 0.3810995817184448, mean loss: 0.3664392218625376
Epoch: 11, step: 1409, loss: 0.33870992064476013, mean loss: 0.3664376184566617
Epoch: 11, step: 1410, loss: 0.3282252550125122, mean loss: 0.36643540901095806
Epoch: 11, step: 1411, loss: 0.3123651444911957, mean loss: 0.36643228283932766
Epoch: 11, step: 1412, loss: 0.39102163910865784, mean loss: 0.36643370443592066
Epoch: 11, step: 1413, loss: 0.37853312492370605, mean loss: 0.36643440390525167
Epoch: 11, step: 1414, loss: 0.327153742313385, mean loss: 0.3664321332155244
Epoch: 11, step: 1415, loss: 0.31288933753967285, mean loss: 0.3664290382562368
Epoch: 11, step: 1416, loss: 0.3241109848022461, mean loss: 0.36642659226736596
Epoch: 11, step: 1417, loss: 0.3469337821006775, mean loss: 0.3664254656455785
Epoch: 11, step: 1418, loss: 0.3464081287384033, mean loss: 0.3664243087746944
Epoch: 11, step: 1419, loss: 0.4101352393627167, mean loss: 0.36642683483402105
Epoch: 11, step: 1420, loss: 0.32009145617485046, mean loss: 0.3664241572622985
Epoch: 11, step: 1421, loss: 0.33788982033729553, mean loss: 0.36642250845050345
Epoch: 11, step: 1422, loss: 0.32642409205436707, mean loss: 0.36642019733844494
Epoch: 11, step: 1423, loss: 0.37433922290802, mean loss: 0.36642065487401054
Epoch: 11, step: 1424, loss: 0.3204652965068817, mean loss: 0.36641799987612694
Epoch: 11, step: 1425, loss: 0.3276950716972351, mean loss: 0.36641576284965793
Epoch: 11, step: 1426, loss: 0.3390049338340759, mean loss: 0.3664141794154822
Epoch: 11, step: 1427, loss: 0.32969364523887634, mean loss: 0.36641205831253765
Epoch: 11, step: 1428, loss: 0.29621753096580505, mean loss: 0.36640800387209715
Epoch: 11, step: 1429, loss: 0.3443658947944641, mean loss: 0.3664067307919841
Epoch: 11, step: 1430, loss: 0.3079169988632202, mean loss: 0.3664033528115089
Epoch: 11, step: 1431, loss: 0.32818782329559326, mean loss: 0.36640114586247235
Epoch: 11, step: 1432, loss: 0.3455897867679596, mean loss: 0.3663999440746861
Epoch: 11, step: 1433, loss: 0.33096742630004883, mean loss: 0.3663978980810509
Epoch: 11, step: 1434, loss: 0.31366321444511414, mean loss: 0.36639485317755555
Epoch: 11, step: 1435, loss: 0.3593143820762634, mean loss: 0.3663944443743742
Epoch: 11, step: 1436, loss: 0.3111882507801056, mean loss: 0.3663912571338226
Epoch: 11, step: 1437, loss: 0.35906487703323364, mean loss: 0.3663908341815018
Epoch: 11, step: 1438, loss: 0.36518293619155884, mean loss: 0.3663907644535107
Epoch: 11, step: 1439, loss: 0.32771235704421997, mean loss: 0.3663885318047339
Epoch: 11, step: 1440, loss: 0.32644620537757874, mean loss: 0.36638622633134704
Epoch: 11, step: 1441, loss: 0.3371513783931732, mean loss: 0.36638453899163
Epoch: 11, step: 1442, loss: 0.34426525235176086, mean loss: 0.36638326241249686
Epoch: 11, step: 1443, loss: 0.3576336205005646, mean loss: 0.3663827574700966
Valid: 11, mean loss: 0.1946713998913765
Epoch: 12, step: 0, loss: 0.3511502742767334, mean loss: 0.36638187845323505
Epoch: 12, step: 1, loss: 0.34522148966789246, mean loss: 0.36638065742676157
Epoch: 12, step: 2, loss: 0.33655184507369995, mean loss: 0.3663789363020513
Epoch: 12, step: 3, loss: 0.3248246908187866, mean loss: 0.36637653875730847
Epoch: 12, step: 4, loss: 0.35523587465286255, mean loss: 0.36637589601432663
Epoch: 12, step: 5, loss: 0.3541606068611145, mean loss: 0.3663751913132101
Epoch: 12, step: 6, loss: 0.3284730613231659, mean loss: 0.3663730048621002
Epoch: 12, step: 7, loss: 0.3484674394130707, mean loss: 0.3663719720076096
Epoch: 12, step: 8, loss: 0.331146776676178, mean loss: 0.3663699402146044
Epoch: 12, step: 9, loss: 0.3212032914161682, mean loss: 0.36636733514776865
Epoch: 12, step: 10, loss: 0.33784472942352295, mean loss: 0.36636569015061055
Epoch: 12, step: 11, loss: 0.32161372900009155, mean loss: 0.36636310929933313
Epoch: 12, step: 12, loss: 0.3438447415828705, mean loss: 0.36636181073709817
Epoch: 12, step: 13, loss: 0.3592451810836792, mean loss: 0.36636140036749526
Epoch: 12, step: 14, loss: 0.30121785402297974, mean loss: 0.3663576441807718
Epoch: 12, step: 15, loss: 0.34567901492118835, mean loss: 0.3663564519166309
Epoch: 12, step: 16, loss: 0.31166908144950867, mean loss: 0.3663532989981837
Epoch: 12, step: 17, loss: 0.3414442241191864, mean loss: 0.36635186298556527
Epoch: 12, step: 18, loss: 0.3690730035305023, mean loss: 0.3663520198507607
Epoch: 12, step: 19, loss: 0.3106074929237366, mean loss: 0.3663488065393169
Epoch: 12, step: 20, loss: 0.3640908896923065, mean loss: 0.3663486763925161
Epoch: 12, step: 21, loss: 0.32316261529922485, mean loss: 0.3663461872823666
Epoch: 12, step: 22, loss: 0.36310291290283203, mean loss: 0.3663460003608993
Epoch: 12, step: 23, loss: 0.3249732553958893, mean loss: 0.36634361603949744
Epoch: 12, step: 24, loss: 0.3314938545227051, mean loss: 0.36634160775496355
Epoch: 12, step: 25, loss: 0.34250423312187195, mean loss: 0.36634023415956
Epoch: 12, step: 26, loss: 0.4035343825817108, mean loss: 0.36634237729689345
Epoch: 12, step: 27, loss: 0.3340112864971161, mean loss: 0.3663405144776494
Epoch: 12, step: 28, loss: 0.3156546950340271, mean loss: 0.3663375942829474
Epoch: 12, step: 29, loss: 0.3414752185344696, mean loss: 0.36633616195343083
Epoch: 12, step: 30, loss: 0.34686797857284546, mean loss: 0.36633504044969323
Epoch: 12, step: 31, loss: 0.3331533372402191, mean loss: 0.3663331290612595
Epoch: 12, step: 32, loss: 0.35509344935417175, mean loss: 0.3663324816515649
Epoch: 12, step: 33, loss: 0.3609468340873718, mean loss: 0.3663321714541473
Epoch: 12, step: 34, loss: 0.35551851987838745, mean loss: 0.36633154865557704
Epoch: 12, step: 35, loss: 0.3132421672344208, mean loss: 0.3663284912159651
Epoch: 12, step: 36, loss: 0.3363594710826874, mean loss: 0.3663267653869911
Epoch: 12, step: 37, loss: 0.33898720145225525, mean loss: 0.36632519107143574
Epoch: 12, step: 38, loss: 0.34755608439445496, mean loss: 0.3663241103374761
Epoch: 12, step: 39, loss: 0.3234144449234009, mean loss: 0.36632163972108883
Epoch: 12, step: 40, loss: 0.32313865423202515, mean loss: 0.3663191535108586
Epoch: 12, step: 41, loss: 0.3238467574119568, mean loss: 0.36631670835276425
Epoch: 12, step: 42, loss: 0.32345637679100037, mean loss: 0.3663142410030687
Epoch: 12, step: 43, loss: 0.33295518159866333, mean loss: 0.366312320725645
Epoch: 12, step: 44, loss: 0.32400450110435486, mean loss: 0.3663098854629028
Epoch: 12, step: 45, loss: 0.38096052408218384, mean loss: 0.3663107287136579
Epoch: 12, step: 46, loss: 0.3694567382335663, mean loss: 0.366310909778954
Epoch: 12, step: 47, loss: 0.3116970360279083, mean loss: 0.3663077667153173
Epoch: 12, step: 48, loss: 0.36076343059539795, mean loss: 0.3663074476535621
Epoch: 12, step: 49, loss: 0.33984968066215515, mean loss: 0.3663059251672581
Epoch: 12, step: 50, loss: 0.3373827338218689, mean loss: 0.3663042609062911
Epoch: 12, step: 51, loss: 0.38475462794303894, mean loss: 0.3663053224924267
Epoch: 12, step: 52, loss: 0.3429301381111145, mean loss: 0.36630397762248934
Epoch: 12, step: 53, loss: 0.3582872152328491, mean loss: 0.3663035164119043
Epoch: 12, step: 54, loss: 0.3627580404281616, mean loss: 0.36630331244964326
Epoch: 12, step: 55, loss: 0.3524996340274811, mean loss: 0.36630251840463507
Epoch: 12, step: 56, loss: 0.2970004081726074, mean loss: 0.366298532088257
Epoch: 12, step: 57, loss: 0.3628913462162018, mean loss: 0.3662983361152976
Epoch: 12, step: 58, loss: 0.34632256627082825, mean loss: 0.366297187224181
Epoch: 12, step: 59, loss: 0.3376559019088745, mean loss: 0.36629554003730985
Epoch: 12, step: 60, loss: 0.3406441807746887, mean loss: 0.36629406488869504
Epoch: 12, step: 61, loss: 0.3245374262332916, mean loss: 0.3662916637018833
Epoch: 12, step: 62, loss: 0.3452973961830139, mean loss: 0.3662904565103751
Epoch: 12, step: 63, loss: 0.3313404321670532, mean loss: 0.3662884469643572
Epoch: 12, step: 64, loss: 0.30023640394210815, mean loss: 0.3662846493421516
Epoch: 12, step: 65, loss: 0.3394710421562195, mean loss: 0.3662831077986777
Epoch: 12, step: 66, loss: 0.3468439280986786, mean loss: 0.3662819902833169
Epoch: 12, step: 67, loss: 0.3393404185771942, mean loss: 0.36628044156109885
Epoch: 12, step: 68, loss: 0.37772971391677856, mean loss: 0.3662810996787258
Epoch: 12, step: 69, loss: 0.36124879121780396, mean loss: 0.36628081043234917
Epoch: 12, step: 70, loss: 0.3334624469280243, mean loss: 0.3662789242111006
Epoch: 12, step: 71, loss: 0.33370307087898254, mean loss: 0.3662770520356217
Epoch: 12, step: 72, loss: 0.3302076458930969, mean loss: 0.36627497920037416
Epoch: 12, step: 73, loss: 0.3524404466152191, mean loss: 0.36627418420367347
Epoch: 12, step: 74, loss: 0.3310433626174927, mean loss: 0.36627215979284855
Epoch: 12, step: 75, loss: 0.3403422236442566, mean loss: 0.3662706699091351
Epoch: 12, step: 76, loss: 0.3495458662509918, mean loss: 0.36626970898964883
Epoch: 12, step: 77, loss: 0.31223443150520325, mean loss: 0.3662666045844159
Epoch: 12, step: 78, loss: 0.3247453570365906, mean loss: 0.3662642192654323
Epoch: 12, step: 79, loss: 0.39336615800857544, mean loss: 0.3662657761323178
Epoch: 12, step: 80, loss: 0.3214486241340637, mean loss: 0.36626320176549615
Epoch: 12, step: 81, loss: 0.31403523683547974, mean loss: 0.366260201882387
Epoch: 12, step: 82, loss: 0.3212057054042816, mean loss: 0.3662576141794131
Epoch: 12, step: 83, loss: 0.3434111475944519, mean loss: 0.36625630206899584
Epoch: 12, step: 84, loss: 0.3153766095638275, mean loss: 0.3662533801317935
Epoch: 12, step: 85, loss: 0.3403741121292114, mean loss: 0.366251894013268
Epoch: 12, step: 86, loss: 0.37188631296157837, mean loss: 0.36625221755153664
Epoch: 12, step: 87, loss: 0.3349544405937195, mean loss: 0.36625042048120143
Epoch: 12, step: 88, loss: 0.4158506393432617, mean loss: 0.3662532682861542
Epoch: 12, step: 89, loss: 0.3437528610229492, mean loss: 0.366251976495635
Epoch: 12, step: 90, loss: 0.3888275921344757, mean loss: 0.36625327252960016
Epoch: 12, step: 91, loss: 0.31650015711784363, mean loss: 0.3662504164380151
Epoch: 12, step: 92, loss: 0.35288816690444946, mean loss: 0.366249649418353
Epoch: 12, step: 93, loss: 0.36638787388801575, mean loss: 0.3662496573522566
Epoch: 12, step: 94, loss: 0.3365810215473175, mean loss: 0.36624795450912945
Epoch: 12, step: 95, loss: 0.3987659513950348, mean loss: 0.36624982078535107
Epoch: 12, step: 96, loss: 0.33143100142478943, mean loss: 0.36624782257477084
Epoch: 12, step: 97, loss: 0.30615660548210144, mean loss: 0.3662443742092772
Epoch: 12, step: 98, loss: 0.35285791754722595, mean loss: 0.366243606064636
Epoch: 12, step: 99, loss: 0.32195693254470825, mean loss: 0.36624106494267594
Epoch: 12, step: 100, loss: 0.3333362936973572, mean loss: 0.3662391770104225
Epoch: 12, step: 101, loss: 0.34419819712638855, mean loss: 0.3662379124676868
Epoch: 12, step: 102, loss: 0.3155365586280823, mean loss: 0.3662350037789231
Epoch: 12, step: 103, loss: 0.3281669616699219, mean loss: 0.3662328199765993
Epoch: 12, step: 104, loss: 0.3439931273460388, mean loss: 0.3662315442528208
Epoch: 12, step: 105, loss: 0.3310968577861786, mean loss: 0.3662295289559029
Epoch: 12, step: 106, loss: 0.32861223816871643, mean loss: 0.3662273713825856
Epoch: 12, step: 107, loss: 0.2895870506763458, mean loss: 0.3662229758606364
Epoch: 12, step: 108, loss: 0.3246559798717499, mean loss: 0.3662205920219033
Epoch: 12, step: 109, loss: 0.3414987325668335, mean loss: 0.3662191743215102
Epoch: 12, step: 110, loss: 0.31774795055389404, mean loss: 0.3662163948488473
Epoch: 12, step: 111, loss: 0.3321031630039215, mean loss: 0.3662144388149113
Epoch: 12, step: 112, loss: 0.3635411262512207, mean loss: 0.3662142855374293
Epoch: 12, step: 113, loss: 0.33074262738227844, mean loss: 0.36621225184529793
Epoch: 12, step: 114, loss: 0.33717861771583557, mean loss: 0.36621058735902096
Epoch: 12, step: 115, loss: 0.3153737485408783, mean loss: 0.3662076730710814
Epoch: 12, step: 116, loss: 0.34305858612060547, mean loss: 0.3662063460956185
Epoch: 12, step: 117, loss: 0.3449171185493469, mean loss: 0.3662051258028553
Epoch: 12, step: 118, loss: 0.31479495763778687, mean loss: 0.3662021791548261
Epoch: 12, step: 119, loss: 0.33640292286872864, mean loss: 0.36620047126530947
Epoch: 12, step: 120, loss: 0.3701678216457367, mean loss: 0.36620069863366184
Epoch: 12, step: 121, loss: 0.3397825062274933, mean loss: 0.36619918469713425
Epoch: 12, step: 122, loss: 0.3032330274581909, mean loss: 0.3661955765281331
Epoch: 12, step: 123, loss: 0.3447713255882263, mean loss: 0.36619434891806324
Epoch: 12, step: 124, loss: 0.32225945591926575, mean loss: 0.36619183159193025
Epoch: 12, step: 125, loss: 0.32608386874198914, mean loss: 0.3661895336680819
Epoch: 12, step: 126, loss: 0.33476704359054565, mean loss: 0.3661877334681347
Epoch: 12, step: 127, loss: 0.3559757173061371, mean loss: 0.36618714845346
Epoch: 12, step: 128, loss: 0.3377799391746521, mean loss: 0.36618552118592956
Epoch: 12, step: 129, loss: 0.3569110333919525, mean loss: 0.36618498994020876
Epoch: 12, step: 130, loss: 0.31313568353652954, mean loss: 0.3661819514324819
Epoch: 12, step: 131, loss: 0.32731005549430847, mean loss: 0.36617972509250835
Epoch: 12, step: 132, loss: 0.342045396566391, mean loss: 0.3661783429077236
Epoch: 12, step: 133, loss: 0.3355587124824524, mean loss: 0.3661765894069548
Epoch: 12, step: 134, loss: 0.3366384506225586, mean loss: 0.3661748979370593
Epoch: 12, step: 135, loss: 0.3489808142185211, mean loss: 0.36617391339264116
Epoch: 12, step: 136, loss: 0.33771899342536926, mean loss: 0.3661722841387066
Epoch: 12, step: 137, loss: 0.3120459020137787, mean loss: 0.36616918518175456
Epoch: 12, step: 138, loss: 0.33583682775497437, mean loss: 0.36616744862954603
Epoch: 12, step: 139, loss: 0.35186684131622314, mean loss: 0.36616662995498034
Epoch: 12, step: 140, loss: 0.3888047933578491, mean loss: 0.3661679258599207
Epoch: 12, step: 141, loss: 0.3326044976711273, mean loss: 0.3661660046562465
Epoch: 12, step: 142, loss: 0.2979620099067688, mean loss: 0.3661621008158968
Epoch: 12, step: 143, loss: 0.3948427140712738, mean loss: 0.3661637423345126
Epoch: 12, step: 144, loss: 0.3468513786792755, mean loss: 0.36616263706560315
Epoch: 12, step: 145, loss: 0.3269422650337219, mean loss: 0.3661603925668031
Epoch: 12, step: 146, loss: 0.32731860876083374, mean loss: 0.3661581698610059
Epoch: 12, step: 147, loss: 0.36490771174430847, mean loss: 0.36615809830812673
Epoch: 12, step: 148, loss: 0.3770810067653656, mean loss: 0.36615872329573657
Epoch: 12, step: 149, loss: 0.3199250102043152, mean loss: 0.3661560780438146
Epoch: 12, step: 150, loss: 0.3459828197956085, mean loss: 0.36615492390122933
Epoch: 12, step: 151, loss: 0.3568669855594635, mean loss: 0.36615439255464227
Epoch: 12, step: 152, loss: 0.34496137499809265, mean loss: 0.36615318020880644
Epoch: 12, step: 153, loss: 0.36211544275283813, mean loss: 0.36615294924338737
Epoch: 12, step: 154, loss: 0.41499269008636475, mean loss: 0.36615574279946145
Epoch: 12, step: 155, loss: 0.38204094767570496, mean loss: 0.3661566513561348
Epoch: 12, step: 156, loss: 0.33385413885116577, mean loss: 0.3661548039147562
Epoch: 12, step: 157, loss: 0.38708949089050293, mean loss: 0.36615600114036384
Epoch: 12, step: 158, loss: 0.31321975588798523, mean loss: 0.3661529739633036
Epoch: 12, step: 159, loss: 0.2704506516456604, mean loss: 0.36614750150662945
Epoch: 12, step: 160, loss: 0.30274051427841187, mean loss: 0.3661438759713085
Epoch: 12, step: 161, loss: 0.31908121705055237, mean loss: 0.3661411851388945
Epoch: 12, step: 162, loss: 0.3347947299480438, mean loss: 0.3661393929912076
Epoch: 12, step: 163, loss: 0.3133505880832672, mean loss: 0.36613637510846647
Epoch: 12, step: 164, loss: 0.36452850699424744, mean loss: 0.36613628319352254
Epoch: 12, step: 165, loss: 0.32667872309684753, mean loss: 0.36613402770249154
Epoch: 12, step: 166, loss: 0.38353270292282104, mean loss: 0.3661350221966453
Epoch: 12, step: 167, loss: 0.32206788659095764, mean loss: 0.36613250349890836
Epoch: 12, step: 168, loss: 0.30162563920021057, mean loss: 0.3661288167603647
Epoch: 12, step: 169, loss: 0.3483298718929291, mean loss: 0.36612779956154956
Epoch: 12, step: 170, loss: 0.33191874623298645, mean loss: 0.3661258446467928
Epoch: 12, step: 171, loss: 0.31644243001937866, mean loss: 0.3661230055945284
Epoch: 12, step: 172, loss: 0.3431968092918396, mean loss: 0.366121695601025
Epoch: 12, step: 173, loss: 0.32888928055763245, mean loss: 0.36611956827757375
Epoch: 12, step: 174, loss: 0.3495262861251831, mean loss: 0.36611862025254077
Epoch: 12, step: 175, loss: 0.33502891659736633, mean loss: 0.366116844104023
Epoch: 12, step: 176, loss: 0.3245770037174225, mean loss: 0.36611447107686584
Epoch: 12, step: 177, loss: 0.3460303246974945, mean loss: 0.3661133238047089
Epoch: 12, step: 178, loss: 0.33656248450279236, mean loss: 0.3661116358604979
Epoch: 12, step: 179, loss: 0.3889583349227905, mean loss: 0.36611294078961953
Epoch: 12, step: 180, loss: 0.32936543226242065, mean loss: 0.36611084201136107
Epoch: 12, step: 181, loss: 0.3968770205974579, mean loss: 0.3661125990746727
Epoch: 12, step: 182, loss: 0.3167344033718109, mean loss: 0.3661097792359597
Epoch: 12, step: 183, loss: 0.3521003723144531, mean loss: 0.3661089792469852
Epoch: 12, step: 184, loss: 0.34321898221969604, mean loss: 0.3661076722180908
Epoch: 12, step: 185, loss: 0.34655749797821045, mean loss: 0.36610655595828495
Epoch: 12, step: 186, loss: 0.3330106735229492, mean loss: 0.3661046663846375
Epoch: 12, step: 187, loss: 0.31624749302864075, mean loss: 0.36610182000570646
Epoch: 12, step: 188, loss: 0.37464138865470886, mean loss: 0.3661023075074847
Epoch: 12, step: 189, loss: 0.367946982383728, mean loss: 0.36610241280916733
Epoch: 12, step: 190, loss: 0.2899801731109619, mean loss: 0.36609806768446285
Epoch: 12, step: 191, loss: 0.31469419598579407, mean loss: 0.36609513367352114
Epoch: 12, step: 192, loss: 0.34192878007888794, mean loss: 0.36609375439416525
Epoch: 12, step: 193, loss: 0.3393504023551941, mean loss: 0.3660922281213631
Epoch: 12, step: 194, loss: 0.3494357466697693, mean loss: 0.36609127757171683
Epoch: 12, step: 195, loss: 0.3479032516479492, mean loss: 0.366090239679345
Epoch: 12, step: 196, loss: 0.3596225678920746, mean loss: 0.36608987062532006
Epoch: 12, step: 197, loss: 0.3771727383136749, mean loss: 0.3660905029925281
Epoch: 12, step: 198, loss: 0.32055002450942993, mean loss: 0.36608790468828417
Epoch: 12, step: 199, loss: 0.33148375153541565, mean loss: 0.3660859304668583
Epoch: 12, step: 200, loss: 0.3444705605506897, mean loss: 0.36608469734632
Epoch: 12, step: 201, loss: 0.3507392108440399, mean loss: 0.36608382196203576
Epoch: 12, step: 202, loss: 0.3118799924850464, mean loss: 0.36608073007740416
Epoch: 12, step: 203, loss: 0.32626184821128845, mean loss: 0.36607845886579876
Epoch: 12, step: 204, loss: 0.32257896661758423, mean loss: 0.3660759778589974
Epoch: 12, step: 205, loss: 0.3361508846282959, mean loss: 0.3660742711695238
Epoch: 12, step: 206, loss: 0.3034569323062897, mean loss: 0.3660707001778578
Epoch: 12, step: 207, loss: 0.35058876872062683, mean loss: 0.366069817312241
Epoch: 12, step: 208, loss: 0.315457284450531, mean loss: 0.36606693126942513
Epoch: 12, step: 209, loss: 0.3530983626842499, mean loss: 0.36606619181403766
Epoch: 12, step: 210, loss: 0.33540138602256775, mean loss: 0.3660644434358068
Epoch: 12, step: 211, loss: 0.36728280782699585, mean loss: 0.36606451289785874
Epoch: 12, step: 212, loss: 0.31663835048675537, mean loss: 0.36606169514730796
Epoch: 12, step: 213, loss: 0.33492812514305115, mean loss: 0.36605992034568874
Epoch: 12, step: 214, loss: 0.37158632278442383, mean loss: 0.36606023536606375
Epoch: 12, step: 215, loss: 0.3315613865852356, mean loss: 0.3660582689474146
Epoch: 12, step: 216, loss: 0.3334601819515228, mean loss: 0.3660564109772239
Epoch: 12, step: 217, loss: 0.3703656792640686, mean loss: 0.36605665657555325
Epoch: 12, step: 218, loss: 0.3420828580856323, mean loss: 0.36605529031360023
Epoch: 12, step: 219, loss: 0.35521945357322693, mean loss: 0.36605467281663534
Epoch: 12, step: 220, loss: 0.36813807487487793, mean loss: 0.366054791535768
Epoch: 12, step: 221, loss: 0.37298229336738586, mean loss: 0.36605518626521705
Epoch: 12, step: 222, loss: 0.35442104935646057, mean loss: 0.3660545233892038
Epoch: 12, step: 223, loss: 0.30485692620277405, mean loss: 0.36605103674396755
Epoch: 12, step: 224, loss: 0.3453192710876465, mean loss: 0.3660498556486758
Epoch: 12, step: 225, loss: 0.3339240252971649, mean loss: 0.366048025534152
Epoch: 12, step: 226, loss: 0.36771878600120544, mean loss: 0.36604812070706383
Epoch: 12, step: 227, loss: 0.3754202127456665, mean loss: 0.3660486545468929
Epoch: 12, step: 228, loss: 0.34434404969215393, mean loss: 0.36604741831035736
Epoch: 12, step: 229, loss: 0.34965425729751587, mean loss: 0.36604648465270767
Epoch: 12, step: 230, loss: 0.34144821763038635, mean loss: 0.3660450837604574
Epoch: 12, step: 231, loss: 0.3208904564380646, mean loss: 0.36604251231243223
Epoch: 12, step: 232, loss: 0.3186764121055603, mean loss: 0.3660398150799166
Epoch: 12, step: 233, loss: 0.3969363570213318, mean loss: 0.3660415743637078
Epoch: 12, step: 234, loss: 0.3516373634338379, mean loss: 0.36604075421846327
Epoch: 12, step: 235, loss: 0.361103355884552, mean loss: 0.36604047310947135
Epoch: 12, step: 236, loss: 0.31915971636772156, mean loss: 0.3660378041224664
Epoch: 12, step: 237, loss: 0.3378564119338989, mean loss: 0.3660361998077568
Epoch: 12, step: 238, loss: 0.3388576805591583, mean loss: 0.3660346526728306
Epoch: 12, step: 239, loss: 0.34403470158576965, mean loss: 0.36603340039874777
Epoch: 12, step: 240, loss: 0.3388555347919464, mean loss: 0.36603185347714684
Epoch: 12, step: 241, loss: 0.3450353145599365, mean loss: 0.36603065845501154
Epoch: 12, step: 242, loss: 0.3969844579696655, mean loss: 0.36603242009632475
Epoch: 12, step: 243, loss: 0.3416730761528015, mean loss: 0.3660310338372795
Epoch: 12, step: 244, loss: 0.3622191846370697, mean loss: 0.36603081692217104
Epoch: 12, step: 245, loss: 0.3716658055782318, mean loss: 0.3660311375656589
Epoch: 12, step: 246, loss: 0.3305407464504242, mean loss: 0.3660291181977434
Epoch: 12, step: 247, loss: 0.3065960705280304, mean loss: 0.3660257367089138
Epoch: 12, step: 248, loss: 0.32380184531211853, mean loss: 0.3660233344849053
Epoch: 12, step: 249, loss: 0.3194328248500824, mean loss: 0.36602068398373144
Epoch: 12, step: 250, loss: 0.3502272963523865, mean loss: 0.36601978556017883
Epoch: 12, step: 251, loss: 0.37393492460250854, mean loss: 0.36602023579561926
Epoch: 12, step: 252, loss: 0.3319254219532013, mean loss: 0.366018296496726
Epoch: 12, step: 253, loss: 0.31328198313713074, mean loss: 0.3660152970476668
Epoch: 12, step: 254, loss: 0.3180091977119446, mean loss: 0.3660125667912068
Epoch: 12, step: 255, loss: 0.35172441601753235, mean loss: 0.36601175422576243
Epoch: 12, step: 256, loss: 0.300932914018631, mean loss: 0.3660080534102829
Epoch: 12, step: 257, loss: 0.34875214099884033, mean loss: 0.36600707218019013
Epoch: 12, step: 258, loss: 0.3725164234638214, mean loss: 0.36600744230308113
Epoch: 12, step: 259, loss: 0.323819637298584, mean loss: 0.36600504363324915
Epoch: 12, step: 260, loss: 0.32328757643699646, mean loss: 0.366002614986527
Epoch: 12, step: 261, loss: 0.3654353618621826, mean loss: 0.36600258273791275
Epoch: 12, step: 262, loss: 0.31732451915740967, mean loss: 0.365999815523793
Epoch: 12, step: 263, loss: 0.34118789434432983, mean loss: 0.36599840511444903
Epoch: 12, step: 264, loss: 0.34507203102111816, mean loss: 0.3659972156428357
Epoch: 12, step: 265, loss: 0.3260684609413147, mean loss: 0.3659949461899142
Epoch: 12, step: 266, loss: 0.3225042521953583, mean loss: 0.3659924744255496
Epoch: 12, step: 267, loss: 0.36481255292892456, mean loss: 0.36599240736931543
Epoch: 12, step: 268, loss: 0.33117276430130005, mean loss: 0.3659904286432219
Epoch: 12, step: 269, loss: 0.30520570278167725, mean loss: 0.36598697457310814
Epoch: 12, step: 270, loss: 0.3843398690223694, mean loss: 0.36598801741045395
Epoch: 12, step: 271, loss: 0.35712528228759766, mean loss: 0.36598751384595835
Epoch: 12, step: 272, loss: 0.3325832486152649, mean loss: 0.365985615984176
Epoch: 12, step: 273, loss: 0.3559320569038391, mean loss: 0.3659850448241328
Epoch: 12, step: 274, loss: 0.3309020400047302, mean loss: 0.36598305181130436
Epoch: 12, step: 275, loss: 0.36049768328666687, mean loss: 0.3659827402134559
Epoch: 12, step: 276, loss: 0.3421862721443176, mean loss: 0.3659813885254088
Epoch: 12, step: 277, loss: 0.3158285319805145, mean loss: 0.3659785399024084
Epoch: 12, step: 278, loss: 0.3986404240131378, mean loss: 0.36598039495347395
Epoch: 12, step: 279, loss: 0.4313400089740753, mean loss: 0.3659841068806673
Epoch: 12, step: 280, loss: 0.3123265504837036, mean loss: 0.3659810597140822
Epoch: 12, step: 281, loss: 0.34823551774024963, mean loss: 0.3659800520172069
Epoch: 12, step: 282, loss: 0.3195328116416931, mean loss: 0.3659774146178329
Epoch: 12, step: 283, loss: 0.3318970799446106, mean loss: 0.36597547955454235
Epoch: 12, step: 284, loss: 0.31718435883522034, mean loss: 0.36597270937792736
Epoch: 12, step: 285, loss: 0.3344123661518097, mean loss: 0.3659709176018841
Epoch: 12, step: 286, loss: 0.36310040950775146, mean loss: 0.3659707546437181
Epoch: 12, step: 287, loss: 0.35448428988456726, mean loss: 0.3659701025964452
Epoch: 12, step: 288, loss: 0.46786201000213623, mean loss: 0.3659758863228121
Epoch: 12, step: 289, loss: 0.35315173864364624, mean loss: 0.3659751584225011
Epoch: 12, step: 290, loss: 0.3165576159954071, mean loss: 0.3659723536354856
Epoch: 12, step: 291, loss: 0.33183181285858154, mean loss: 0.3659704160338524
Epoch: 12, step: 292, loss: 0.35744979977607727, mean loss: 0.36596993248489046
Epoch: 12, step: 293, loss: 0.3728444576263428, mean loss: 0.3659703225952719
Epoch: 12, step: 294, loss: 0.314306378364563, mean loss: 0.36596739097498987
Epoch: 12, step: 295, loss: 0.3293003439903259, mean loss: 0.3659653104571174
Epoch: 12, step: 296, loss: 0.36502140760421753, mean loss: 0.3659652569023456
Epoch: 12, step: 297, loss: 0.34520813822746277, mean loss: 0.36596407926030117
Epoch: 12, step: 298, loss: 0.3208951950073242, mean loss: 0.3659615224506198
Epoch: 12, step: 299, loss: 0.3566262722015381, mean loss: 0.3659609928811707
Epoch: 12, step: 300, loss: 0.3094901144504547, mean loss: 0.36595778958668823
Epoch: 12, step: 301, loss: 0.33302444219589233, mean loss: 0.3659559215579083
Epoch: 12, step: 302, loss: 0.31499090790748596, mean loss: 0.3659530309099785
Epoch: 12, step: 303, loss: 0.37168359756469727, mean loss: 0.36595335591943035
Epoch: 12, step: 304, loss: 0.3301268517971039, mean loss: 0.36595132413220627
Epoch: 12, step: 305, loss: 0.3545973300933838, mean loss: 0.36595068026274735
Epoch: 12, step: 306, loss: 0.33264076709747314, mean loss: 0.36594879141028547
Epoch: 12, step: 307, loss: 0.3188570737838745, mean loss: 0.3659461212062921
Epoch: 12, step: 308, loss: 0.3197782039642334, mean loss: 0.36594350353224087
Epoch: 12, step: 309, loss: 0.3445984125137329, mean loss: 0.36594229335585926
Epoch: 12, step: 310, loss: 0.3311406373977661, mean loss: 0.36594032036102064
Epoch: 12, step: 311, loss: 0.3507970869541168, mean loss: 0.36593946190107696
Epoch: 12, step: 312, loss: 0.33031395077705383, mean loss: 0.3659374424287611
Epoch: 12, step: 313, loss: 0.32388046383857727, mean loss: 0.36593505851658614
Epoch: 12, step: 314, loss: 0.3447476923465729, mean loss: 0.3659338576229643
Epoch: 12, step: 315, loss: 0.34399643540382385, mean loss: 0.3659326142868603
Epoch: 12, step: 316, loss: 0.3151605427265167, mean loss: 0.3659297368671062
Epoch: 12, step: 317, loss: 0.3577004373073578, mean loss: 0.36592927051214985
Epoch: 12, step: 318, loss: 0.3556935489177704, mean loss: 0.36592869048599275
Epoch: 12, step: 319, loss: 0.352183073759079, mean loss: 0.36592791160925164
Epoch: 12, step: 320, loss: 0.3445875644683838, mean loss: 0.3659267024559205
Epoch: 12, step: 321, loss: 0.33107632398605347, mean loss: 0.3659247279302282
Epoch: 12, step: 322, loss: 0.34874966740608215, mean loss: 0.3659237548941099
Epoch: 12, step: 323, loss: 0.3243340849876404, mean loss: 0.3659213988058532
Epoch: 12, step: 324, loss: 0.36872681975364685, mean loss: 0.36592155772620377
Epoch: 12, step: 325, loss: 0.3206423819065094, mean loss: 0.36591899291506635
Epoch: 12, step: 326, loss: 0.3190212547779083, mean loss: 0.36591633657192635
Epoch: 12, step: 327, loss: 0.35254210233688354, mean loss: 0.3659155790824477
Epoch: 12, step: 328, loss: 0.3137612044811249, mean loss: 0.36591262533183316
Epoch: 12, step: 329, loss: 0.38485202193260193, mean loss: 0.3659136978993154
Epoch: 12, step: 330, loss: 0.38206008076667786, mean loss: 0.36591461224230576
Epoch: 12, step: 331, loss: 0.33623233437538147, mean loss: 0.36591293147911963
Epoch: 12, step: 332, loss: 0.33846163749694824, mean loss: 0.36591137713372685
Epoch: 12, step: 333, loss: 0.3073699176311493, mean loss: 0.36590806259066816
Epoch: 12, step: 334, loss: 0.36204326152801514, mean loss: 0.36590784378293095
Epoch: 12, step: 335, loss: 0.30627235770225525, mean loss: 0.36590446767977874
Epoch: 12, step: 336, loss: 0.3610689640045166, mean loss: 0.3659041939461996
Epoch: 12, step: 337, loss: 0.331241637468338, mean loss: 0.3659022318406591
Epoch: 12, step: 338, loss: 0.2984003722667694, mean loss: 0.3658984110527736
Epoch: 12, step: 339, loss: 0.3267901539802551, mean loss: 0.36589619754490216
Epoch: 12, step: 340, loss: 0.34197136759757996, mean loss: 0.36589484348808243
Epoch: 12, step: 341, loss: 0.30762964487075806, mean loss: 0.3658915460801245
Epoch: 12, step: 342, loss: 0.32896092534065247, mean loss: 0.36588945618024676
Epoch: 12, step: 343, loss: 0.3576599955558777, mean loss: 0.3658889905023029
Epoch: 12, step: 344, loss: 0.3547801971435547, mean loss: 0.36588836192801677
Epoch: 12, step: 345, loss: 0.33311936259269714, mean loss: 0.36588650784861565
Epoch: 12, step: 346, loss: 0.343735933303833, mean loss: 0.36588525463364846
Epoch: 12, step: 347, loss: 0.29666435718536377, mean loss: 0.3658813385385224
Epoch: 12, step: 348, loss: 0.3155932128429413, mean loss: 0.36587849370480086
Epoch: 12, step: 349, loss: 0.2929869592189789, mean loss: 0.3658743704140165
Epoch: 12, step: 350, loss: 0.35309189558029175, mean loss: 0.36587364738246303
Epoch: 12, step: 351, loss: 0.3314599394798279, mean loss: 0.3658717009057717
Epoch: 12, step: 352, loss: 0.3579442501068115, mean loss: 0.36587125254590525
Epoch: 12, step: 353, loss: 0.34184959530830383, mean loss: 0.36586989400856573
Epoch: 12, step: 354, loss: 0.3338192403316498, mean loss: 0.3658680814963406
Epoch: 12, step: 355, loss: 0.3198489844799042, mean loss: 0.3658654791949938
Epoch: 12, step: 356, loss: 0.3456607460975647, mean loss: 0.36586433671644714
Epoch: 12, step: 357, loss: 0.333008736371994, mean loss: 0.36586247899845864
Epoch: 12, step: 358, loss: 0.3330734074115753, mean loss: 0.3658606251469526
Epoch: 12, step: 359, loss: 0.35130709409713745, mean loss: 0.3658598023557354
Epoch: 12, step: 360, loss: 0.3564528822898865, mean loss: 0.3658592705608309
Epoch: 12, step: 361, loss: 0.32485640048980713, mean loss: 0.3658569527049761
Epoch: 12, step: 362, loss: 0.30822762846946716, mean loss: 0.36585369515456995
Epoch: 12, step: 363, loss: 0.2989228367805481, mean loss: 0.36584991204025985
Epoch: 12, step: 364, loss: 0.35205915570259094, mean loss: 0.3658491325932278
Epoch: 12, step: 365, loss: 0.30796802043914795, mean loss: 0.3658458613650062
Epoch: 12, step: 366, loss: 0.33226677775382996, mean loss: 0.3658439637055763
Epoch: 12, step: 367, loss: 0.3552219569683075, mean loss: 0.36584336345655183
Epoch: 12, step: 368, loss: 0.4090602397918701, mean loss: 0.36584580550188917
Epoch: 12, step: 369, loss: 0.3622751832008362, mean loss: 0.3658456037490187
Epoch: 12, step: 370, loss: 0.3320330083370209, mean loss: 0.36584369332496014
Epoch: 12, step: 371, loss: 0.3614216148853302, mean loss: 0.36584344349002007
Epoch: 12, step: 372, loss: 0.31880906224250793, mean loss: 0.36584078633046707
Epoch: 12, step: 373, loss: 0.3600187599658966, mean loss: 0.3658404574395867
Epoch: 12, step: 374, loss: 0.3470604419708252, mean loss: 0.36583939660156667
Epoch: 12, step: 375, loss: 0.34110358357429504, mean loss: 0.36583799941375444
Epoch: 12, step: 376, loss: 0.38199108839035034, mean loss: 0.3658389117599265
Epoch: 12, step: 377, loss: 0.30891069769859314, mean loss: 0.36583569656654225
Epoch: 12, step: 378, loss: 0.3284410536289215, mean loss: 0.36583358471004834
Epoch: 12, step: 379, loss: 0.33883994817733765, mean loss: 0.36583206033482063
Epoch: 12, step: 380, loss: 0.3542366325855255, mean loss: 0.3658314055588452
Epoch: 12, step: 381, loss: 0.3203023374080658, mean loss: 0.36582883474754363
Epoch: 12, step: 382, loss: 0.30176952481269836, mean loss: 0.3658252178252956
Epoch: 12, step: 383, loss: 0.3122032880783081, mean loss: 0.3658221903902376
Epoch: 12, step: 384, loss: 0.34720131754875183, mean loss: 0.3658211391356313
Epoch: 12, step: 385, loss: 0.3424900472164154, mean loss: 0.3658198220366181
Epoch: 12, step: 386, loss: 0.34740233421325684, mean loss: 0.36581878238164645
Epoch: 12, step: 387, loss: 0.3187236189842224, mean loss: 0.36581612404097147
Epoch: 12, step: 388, loss: 0.41424933075904846, mean loss: 0.3658188577547333
Epoch: 12, step: 389, loss: 0.31929802894592285, mean loss: 0.36581623212944775
Epoch: 12, step: 390, loss: 0.32400503754615784, mean loss: 0.36581387244805585
Epoch: 12, step: 391, loss: 0.3278747498989105, mean loss: 0.36581173141405193
Epoch: 12, step: 392, loss: 0.3677899241447449, mean loss: 0.3658118430439109
Epoch: 12, step: 393, loss: 0.30296942591667175, mean loss: 0.3658082970323362
Epoch: 12, step: 394, loss: 0.35745349526405334, mean loss: 0.36580782562220426
Epoch: 12, step: 395, loss: 0.33342814445495605, mean loss: 0.36580599873881636
Epoch: 12, step: 396, loss: 0.31954658031463623, mean loss: 0.3658033888985668
Epoch: 12, step: 397, loss: 0.32009628415107727, mean loss: 0.36580081036394263
Epoch: 12, step: 398, loss: 0.3492625951766968, mean loss: 0.36579987742463044
Epoch: 12, step: 399, loss: 0.33550819754600525, mean loss: 0.36579816873330157
Epoch: 12, step: 400, loss: 0.33918213844299316, mean loss: 0.36579666746248596
Epoch: 12, step: 401, loss: 0.34918445348739624, mean loss: 0.365795730507383
Epoch: 12, step: 402, loss: 0.3709382712841034, mean loss: 0.36579602053844595
Epoch: 12, step: 403, loss: 0.3556995689868927, mean loss: 0.36579545114686285
Epoch: 12, step: 404, loss: 0.3363950550556183, mean loss: 0.3657937931986256
Epoch: 12, step: 405, loss: 0.33740484714508057, mean loss: 0.3657921923783903
Epoch: 12, step: 406, loss: 0.3083236813545227, mean loss: 0.3657889519774304
Epoch: 12, step: 407, loss: 0.34027788043022156, mean loss: 0.36578751359946765
Epoch: 12, step: 408, loss: 0.3749002516269684, mean loss: 0.36578802736944155
Epoch: 12, step: 409, loss: 0.3063529431819916, mean loss: 0.3657846766487184
Epoch: 12, step: 410, loss: 0.32192060351371765, mean loss: 0.3657822039009234
Epoch: 12, step: 411, loss: 0.3079341650009155, mean loss: 0.365778943019362
Epoch: 12, step: 412, loss: 0.3663650155067444, mean loss: 0.3657789760542804
Epoch: 12, step: 413, loss: 0.3322124183177948, mean loss: 0.3657770841279059
Epoch: 12, step: 414, loss: 0.36903107166290283, mean loss: 0.3657772675234723
Epoch: 12, step: 415, loss: 0.3496038615703583, mean loss: 0.3657763560375642
Epoch: 12, step: 416, loss: 0.3611711859703064, mean loss: 0.3657760965182592
Epoch: 12, step: 417, loss: 0.3606884181499481, mean loss: 0.3657758098238848
Epoch: 12, step: 418, loss: 0.31326085329055786, mean loss: 0.3657728507346566
Epoch: 12, step: 419, loss: 0.3552612066268921, mean loss: 0.36577225846261985
Epoch: 12, step: 420, loss: 0.32484737038612366, mean loss: 0.3657699527052208
Epoch: 12, step: 421, loss: 0.3415588140487671, mean loss: 0.36576858869740914
Epoch: 12, step: 422, loss: 0.3300855755805969, mean loss: 0.36576657850006156
Epoch: 12, step: 423, loss: 0.3478338420391083, mean loss: 0.3657655683188729
Epoch: 12, step: 424, loss: 0.3607980012893677, mean loss: 0.3657652885032345
Epoch: 12, step: 425, loss: 0.3311289846897125, mean loss: 0.36576333760181434
Epoch: 12, step: 426, loss: 0.3255203366279602, mean loss: 0.3657610710289631
Epoch: 12, step: 427, loss: 0.3377257287502289, mean loss: 0.36575949210678027
Epoch: 12, step: 428, loss: 0.32067036628723145, mean loss: 0.3657569528757266
Epoch: 12, step: 429, loss: 0.32245495915412903, mean loss: 0.36575451442580426
Epoch: 12, step: 430, loss: 0.35148629546165466, mean loss: 0.3657537109898583
Epoch: 12, step: 431, loss: 0.34022921323776245, mean loss: 0.36575227379966957
Epoch: 12, step: 432, loss: 0.3257147967815399, mean loss: 0.36575001956415254
Epoch: 12, step: 433, loss: 0.35827597975730896, mean loss: 0.3657495987759639
Epoch: 12, step: 434, loss: 0.3480435311794281, mean loss: 0.36574860198107584
Epoch: 12, step: 435, loss: 0.32258087396621704, mean loss: 0.3657461719130723
Epoch: 12, step: 436, loss: 0.3284997344017029, mean loss: 0.3657440752940173
Epoch: 12, step: 437, loss: 0.3590637445449829, mean loss: 0.36574369927630096
Epoch: 12, step: 438, loss: 0.31242695450782776, mean loss: 0.36574069839012047
Epoch: 12, step: 439, loss: 0.31008315086364746, mean loss: 0.36573756593021917
Epoch: 12, step: 440, loss: 0.3378891050815582, mean loss: 0.36573599868046686
Epoch: 12, step: 441, loss: 0.3298592269420624, mean loss: 0.3657339797287652
Epoch: 12, step: 442, loss: 0.3732852041721344, mean loss: 0.3657344046471403
Epoch: 12, step: 443, loss: 0.35890358686447144, mean loss: 0.36573402028872354
Epoch: 12, step: 444, loss: 0.3559776246547699, mean loss: 0.36573347134394024
Epoch: 12, step: 445, loss: 0.3145256042480469, mean loss: 0.36573059028919197
Epoch: 12, step: 446, loss: 0.3250645101070404, mean loss: 0.36572830246470917
Epoch: 12, step: 447, loss: 0.3791906237602234, mean loss: 0.36572905979601517
Epoch: 12, step: 448, loss: 0.31899771094322205, mean loss: 0.36572643104263425
Epoch: 12, step: 449, loss: 0.3352527320384979, mean loss: 0.36572471691849184
Epoch: 12, step: 450, loss: 0.3580847382545471, mean loss: 0.3657242871992352
Epoch: 12, step: 451, loss: 0.3427717387676239, mean loss: 0.36572299627975086
Epoch: 12, step: 452, loss: 0.352105975151062, mean loss: 0.365722230461117
Epoch: 12, step: 453, loss: 0.3263072371482849, mean loss: 0.3657200138941778
Epoch: 12, step: 454, loss: 0.34886687994003296, mean loss: 0.3657190661837828
Epoch: 12, step: 455, loss: 0.34383538365364075, mean loss: 0.36571783565732474
Epoch: 12, step: 456, loss: 0.3737078607082367, mean loss: 0.36571828491372343
Epoch: 12, step: 457, loss: 0.3426770269870758, mean loss: 0.36571698944212067
Epoch: 12, step: 458, loss: 0.35722416639328003, mean loss: 0.3657165119685136
Epoch: 12, step: 459, loss: 0.3439061939716339, mean loss: 0.3657152858431484
Epoch: 12, step: 460, loss: 0.33793729543685913, mean loss: 0.36571372431690147
Epoch: 12, step: 461, loss: 0.3460841476917267, mean loss: 0.3657126209118073
Epoch: 12, step: 462, loss: 0.32333552837371826, mean loss: 0.3657102389719198
Epoch: 12, step: 463, loss: 0.39708268642425537, mean loss: 0.36571200226145734
Epoch: 12, step: 464, loss: 0.3381730020046234, mean loss: 0.36571045451794826
Epoch: 12, step: 465, loss: 0.3631106913089752, mean loss: 0.36571030841458707
Epoch: 12, step: 466, loss: 0.3488004207611084, mean loss: 0.36570935815397154
Epoch: 12, step: 467, loss: 0.3409661054611206, mean loss: 0.36570796777114994
Epoch: 12, step: 468, loss: 0.34438368678092957, mean loss: 0.3657067695758929
Epoch: 12, step: 469, loss: 0.3234997093677521, mean loss: 0.3657043981262801
Epoch: 12, step: 470, loss: 0.31716781854629517, mean loss: 0.3657016711989482
Epoch: 12, step: 471, loss: 0.3337635397911072, mean loss: 0.3656998769219028
Epoch: 12, step: 472, loss: 0.2976957857608795, mean loss: 0.3656960566819634
Epoch: 12, step: 473, loss: 0.3387855887413025, mean loss: 0.3656945450277706
Epoch: 12, step: 474, loss: 0.29283273220062256, mean loss: 0.3656904523572753
Epoch: 12, step: 475, loss: 0.3364722430706024, mean loss: 0.36568881125363084
Epoch: 12, step: 476, loss: 0.353575199842453, mean loss: 0.36568813090477315
Epoch: 12, step: 477, loss: 0.3482130169868469, mean loss: 0.365687149487615
Epoch: 12, step: 478, loss: 0.3244935870170593, mean loss: 0.365684836152271
Epoch: 12, step: 479, loss: 0.2999410033226013, mean loss: 0.365681144337759
Epoch: 12, step: 480, loss: 0.3901223838329315, mean loss: 0.36568251674718655
Epoch: 12, step: 481, loss: 0.360106885433197, mean loss: 0.3656822036853497
Epoch: 12, step: 482, loss: 0.32824793457984924, mean loss: 0.3656801019353578
Epoch: 12, step: 483, loss: 0.35284364223480225, mean loss: 0.36567938127177707
Epoch: 12, step: 484, loss: 0.38096705079078674, mean loss: 0.36568023950281725
Epoch: 12, step: 485, loss: 0.3499937951564789, mean loss: 0.3656793589344808
Epoch: 12, step: 486, loss: 0.35546210408210754, mean loss: 0.3656787854147024
Epoch: 12, step: 487, loss: 0.3251335918903351, mean loss: 0.3656765096404812
Epoch: 12, step: 488, loss: 0.3407926559448242, mean loss: 0.3656751130050378
Epoch: 12, step: 489, loss: 0.37475061416625977, mean loss: 0.36567562234958606
Epoch: 12, step: 490, loss: 0.36913958191871643, mean loss: 0.36567581674655386
Epoch: 12, step: 491, loss: 0.3147539794445038, mean loss: 0.36567295917992637
Epoch: 12, step: 492, loss: 0.3375042676925659, mean loss: 0.3656713785339757
Epoch: 12, step: 493, loss: 0.31262677907943726, mean loss: 0.36566840217893953
Epoch: 12, step: 494, loss: 0.37142735719680786, mean loss: 0.3656687252982246
Epoch: 12, step: 495, loss: 0.35805556178092957, mean loss: 0.3656682981683145
Epoch: 12, step: 496, loss: 0.32535362243652344, mean loss: 0.3656660364754263
Epoch: 12, step: 497, loss: 0.32850682735443115, mean loss: 0.36566395192425827
Epoch: 12, step: 498, loss: 0.3452804386615753, mean loss: 0.36566280851744487
Epoch: 12, step: 499, loss: 0.3299793303012848, mean loss: 0.3656608069761494
Epoch: 12, step: 500, loss: 0.30875304341316223, mean loss: 0.3656576151110104
Epoch: 12, step: 501, loss: 0.34995073080062866, mean loss: 0.36565673418648376
Epoch: 12, step: 502, loss: 0.329603910446167, mean loss: 0.365654712268266
Epoch: 12, step: 503, loss: 0.3155597746372223, mean loss: 0.36565190299630373
Epoch: 12, step: 504, loss: 0.34249812364578247, mean loss: 0.36565060462926785
Epoch: 12, step: 505, loss: 0.34591054916381836, mean loss: 0.3656494977516484
Epoch: 12, step: 506, loss: 0.32235997915267944, mean loss: 0.3656470705288506
Epoch: 12, step: 507, loss: 0.3776766359806061, mean loss: 0.3656477449830697
Epoch: 12, step: 508, loss: 0.3310173749923706, mean loss: 0.36564580349234865
Epoch: 12, step: 509, loss: 0.3591799736022949, mean loss: 0.36564544101730156
Epoch: 12, step: 510, loss: 0.36797696352005005, mean loss: 0.36564557171535095
Epoch: 12, step: 511, loss: 0.3307573199272156, mean loss: 0.3656436160958561
Epoch: 12, step: 512, loss: 0.3267272710800171, mean loss: 0.3656414348086516
Epoch: 12, step: 513, loss: 0.3439772427082062, mean loss: 0.3656402205842316
Epoch: 12, step: 514, loss: 0.31680867075920105, mean loss: 0.3656374838499479
Epoch: 12, step: 515, loss: 0.3690335750579834, mean loss: 0.3656376741711319
Epoch: 12, step: 516, loss: 0.3439588248729706, mean loss: 0.3656364593294789
Epoch: 12, step: 517, loss: 0.30500251054763794, mean loss: 0.36563306170823145
Epoch: 12, step: 518, loss: 0.3487720191478729, mean loss: 0.3656321169532272
Epoch: 12, step: 519, loss: 0.3676230013370514, mean loss: 0.3656322284998646
Epoch: 12, step: 520, loss: 0.3368290662765503, mean loss: 0.365630614786927
Epoch: 12, step: 521, loss: 0.3457704782485962, mean loss: 0.3656295021742358
Epoch: 12, step: 522, loss: 0.34152743220329285, mean loss: 0.36562815199385534
Epoch: 12, step: 523, loss: 0.33377605676651, mean loss: 0.36562636776266405
Epoch: 12, step: 524, loss: 0.35823214054107666, mean loss: 0.36562595358985156
Epoch: 12, step: 525, loss: 0.3526524007320404, mean loss: 0.3656252269430017
Epoch: 12, step: 526, loss: 0.350231796503067, mean loss: 0.3656243648074408
Epoch: 12, step: 527, loss: 0.33116936683654785, mean loss: 0.36562243520405985
Epoch: 12, step: 528, loss: 0.32791680097579956, mean loss: 0.3656203236716508
Epoch: 12, step: 529, loss: 0.38435298204421997, mean loss: 0.3656213726501687
Epoch: 12, step: 530, loss: 0.3356468379497528, mean loss: 0.365619694250779
Epoch: 12, step: 531, loss: 0.3654255270957947, mean loss: 0.3656196833791578
Epoch: 12, step: 532, loss: 0.3691835403442383, mean loss: 0.3656198829120487
Epoch: 12, step: 533, loss: 0.31290972232818604, mean loss: 0.36561693194571887
Epoch: 12, step: 534, loss: 0.3334621787071228, mean loss: 0.36561513186996236
Epoch: 12, step: 535, loss: 0.3133715093135834, mean loss: 0.36561220735011485
Epoch: 12, step: 536, loss: 0.35609158873558044, mean loss: 0.3656116744299573
Epoch: 12, step: 537, loss: 0.324081689119339, mean loss: 0.3656093499037449
Epoch: 12, step: 538, loss: 0.3617820143699646, mean loss: 0.3656091356912003
Epoch: 12, step: 539, loss: 0.30498242378234863, mean loss: 0.36560574265829743
Epoch: 12, step: 540, loss: 0.34596920013427734, mean loss: 0.3656046437415968
Epoch: 12, step: 541, loss: 0.32095393538475037, mean loss: 0.36560214510095007
Epoch: 12, step: 542, loss: 0.4069392681121826, mean loss: 0.3656044581848856
Epoch: 12, step: 543, loss: 0.3896414637565613, mean loss: 0.3656058031381964
Epoch: 12, step: 544, loss: 0.3190588355064392, mean loss: 0.365603198820643
Epoch: 12, step: 545, loss: 0.34257394075393677, mean loss: 0.3656019103984618
Epoch: 12, step: 546, loss: 0.31009456515312195, mean loss: 0.3655988050924341
Epoch: 12, step: 547, loss: 0.3444669842720032, mean loss: 0.36559762295880127
Epoch: 12, step: 548, loss: 0.3573385775089264, mean loss: 0.3655971609659921
Epoch: 12, step: 549, loss: 0.3330400288105011, mean loss: 0.36559533989360393
Epoch: 12, step: 550, loss: 0.4215753376483917, mean loss: 0.3655984709410761
Epoch: 12, step: 551, loss: 0.35325688123703003, mean loss: 0.3655977806955669
Epoch: 12, step: 552, loss: 0.32421791553497314, mean loss: 0.36559546651486335
Epoch: 12, step: 553, loss: 0.36532509326934814, mean loss: 0.36559545139500843
Epoch: 12, step: 554, loss: 0.30341485142707825, mean loss: 0.3655919743162203
Epoch: 12, step: 555, loss: 0.3183351457118988, mean loss: 0.3655893319080004
Epoch: 12, step: 556, loss: 0.3270335793495178, mean loss: 0.36558717614884145
Epoch: 12, step: 557, loss: 0.3421151638031006, mean loss: 0.36558586383684627
Epoch: 12, step: 558, loss: 0.3093496263027191, mean loss: 0.3655827198642665
Epoch: 12, step: 559, loss: 0.34255555272102356, mean loss: 0.36558143256735554
Epoch: 12, step: 560, loss: 0.3211938738822937, mean loss: 0.3655789512906668
Epoch: 12, step: 561, loss: 0.33298587799072266, mean loss: 0.3655771294307842
Epoch: 12, step: 562, loss: 0.35902899503707886, mean loss: 0.36557676342919715
Epoch: 12, step: 563, loss: 0.3591229021549225, mean loss: 0.36557640271707587
Epoch: 12, step: 564, loss: 0.34518998861312866, mean loss: 0.3655752633657036
Epoch: 12, step: 565, loss: 0.31378495693206787, mean loss: 0.3655723690823442
Epoch: 12, step: 566, loss: 0.34302303194999695, mean loss: 0.3655711089908587
Epoch: 12, step: 567, loss: 0.347070574760437, mean loss: 0.365570075210448
Epoch: 12, step: 568, loss: 0.35739076137542725, mean loss: 0.36556961818894523
Epoch: 12, step: 569, loss: 0.38115328550338745, mean loss: 0.36557048888216875
Epoch: 12, step: 570, loss: 0.3176330626010895, mean loss: 0.3655678106640403
Epoch: 12, step: 571, loss: 0.33983421325683594, mean loss: 0.36556637303290024
Epoch: 12, step: 572, loss: 0.4010150134563446, mean loss: 0.36556835329324455
Epoch: 12, step: 573, loss: 0.354768842458725, mean loss: 0.36556775003602
Epoch: 12, step: 574, loss: 0.32464122772216797, mean loss: 0.36556546402125634
Epoch: 12, step: 575, loss: 0.3411654531955719, mean loss: 0.36556410119670174
Epoch: 12, step: 576, loss: 0.3205888867378235, mean loss: 0.3655615893165309
Epoch: 12, step: 577, loss: 0.3644053637981415, mean loss: 0.3655615247445707
Epoch: 12, step: 578, loss: 0.3380706012248993, mean loss: 0.36555998953914715
Epoch: 12, step: 579, loss: 0.32997170090675354, mean loss: 0.36555800225476964
Epoch: 12, step: 580, loss: 0.327718585729599, mean loss: 0.3655558893832232
Epoch: 12, step: 581, loss: 0.3516075313091278, mean loss: 0.36555511058042733
Epoch: 12, step: 582, loss: 0.31179192662239075, mean loss: 0.3655521088952083
Epoch: 12, step: 583, loss: 0.3182244300842285, mean loss: 0.3655494666621349
Epoch: 12, step: 584, loss: 0.3207884430885315, mean loss: 0.3655469678610645
Epoch: 12, step: 585, loss: 0.34938234090805054, mean loss: 0.36554606551502494
Epoch: 12, step: 586, loss: 0.3594183623790741, mean loss: 0.36554572347186914
Epoch: 12, step: 587, loss: 0.378945529460907, mean loss: 0.3655464713958471
Epoch: 12, step: 588, loss: 0.3706425428390503, mean loss: 0.36554675582244994
Epoch: 12, step: 589, loss: 0.35364532470703125, mean loss: 0.3655460916059573
Epoch: 12, step: 590, loss: 0.34533417224884033, mean loss: 0.3655449636457275
Epoch: 12, step: 591, loss: 0.3915638327598572, mean loss: 0.3655464155915486
Epoch: 12, step: 592, loss: 0.3405238687992096, mean loss: 0.3655450193219882
Epoch: 12, step: 593, loss: 0.3435609042644501, mean loss: 0.36554379266675674
Epoch: 12, step: 594, loss: 0.37980353832244873, mean loss: 0.3655445882782981
Epoch: 12, step: 595, loss: 0.3165835440158844, mean loss: 0.3655418566868976
Epoch: 12, step: 596, loss: 0.30235326290130615, mean loss: 0.36553833152127496
Epoch: 12, step: 597, loss: 0.3596445620059967, mean loss: 0.36553800273797055
Epoch: 12, step: 598, loss: 0.29679805040359497, mean loss: 0.3655341683009574
Epoch: 12, step: 599, loss: 0.32367557287216187, mean loss: 0.36553183348416646
Epoch: 12, step: 600, loss: 0.3536805212497711, mean loss: 0.3655311724705999
Epoch: 12, step: 601, loss: 0.338129460811615, mean loss: 0.3655296442100501
Epoch: 12, step: 602, loss: 0.35675695538520813, mean loss: 0.3655291549630017
Epoch: 12, step: 603, loss: 0.2996804714202881, mean loss: 0.36552548283030356
Epoch: 12, step: 604, loss: 0.3104777932167053, mean loss: 0.3655224131994769
Epoch: 12, step: 605, loss: 0.3811420202255249, mean loss: 0.36552328414890406
Epoch: 12, step: 606, loss: 0.32183071970939636, mean loss: 0.3655208479869615
Epoch: 12, step: 607, loss: 0.3552398383617401, mean loss: 0.3655202747816969
Epoch: 12, step: 608, loss: 0.3458506464958191, mean loss: 0.36551917818648666
Epoch: 12, step: 609, loss: 0.29041334986686707, mean loss: 0.36551499121869097
Epoch: 12, step: 610, loss: 0.3477988839149475, mean loss: 0.3655140036437256
Epoch: 12, step: 611, loss: 0.3535064458847046, mean loss: 0.36551333432612476
Epoch: 12, step: 612, loss: 0.339551717042923, mean loss: 0.3655118872709281
Epoch: 12, step: 613, loss: 0.2971966564655304, mean loss: 0.36550807971152527
Epoch: 12, step: 614, loss: 0.31596577167510986, mean loss: 0.36550531861761476
Epoch: 12, step: 615, loss: 0.33685195446014404, mean loss: 0.3655037217961615
Epoch: 12, step: 616, loss: 0.31180301308631897, mean loss: 0.36550072927965493
Epoch: 12, step: 617, loss: 0.3251464366912842, mean loss: 0.36549848062855783
Epoch: 12, step: 618, loss: 0.38582736253738403, mean loss: 0.36549961334611003
Epoch: 12, step: 619, loss: 0.33972373604774475, mean loss: 0.365498177204072
Epoch: 12, step: 620, loss: 0.37359148263931274, mean loss: 0.3654986281097177
Epoch: 12, step: 621, loss: 0.34893590211868286, mean loss: 0.36549770539517784
Epoch: 12, step: 622, loss: 0.32498788833618164, mean loss: 0.3654954487065778
Epoch: 12, step: 623, loss: 0.34521645307540894, mean loss: 0.36549431908338087
Epoch: 12, step: 624, loss: 0.3408736288547516, mean loss: 0.3654929476863871
Epoch: 12, step: 625, loss: 0.3548930585384369, mean loss: 0.3654923572948784
Epoch: 12, step: 626, loss: 0.3273249864578247, mean loss: 0.36549023157107796
Epoch: 12, step: 627, loss: 0.33942416310310364, mean loss: 0.3654887799076525
Epoch: 12, step: 628, loss: 0.32027626037597656, mean loss: 0.3654862620862162
Epoch: 12, step: 629, loss: 0.33002084493637085, mean loss: 0.36548428717714226
Epoch: 12, step: 630, loss: 0.35634109377861023, mean loss: 0.365483778062303
Epoch: 12, step: 631, loss: 0.3278037905693054, mean loss: 0.3654816800674537
Epoch: 12, step: 632, loss: 0.3158053755760193, mean loss: 0.3654789142802207
Epoch: 12, step: 633, loss: 0.3246590793132782, mean loss: 0.3654766417139716
Epoch: 12, step: 634, loss: 0.3772110342979431, mean loss: 0.36547729496746956
Epoch: 12, step: 635, loss: 0.35851261019706726, mean loss: 0.3654769072651332
Epoch: 12, step: 636, loss: 0.3671979606151581, mean loss: 0.3654770030654867
Epoch: 12, step: 637, loss: 0.3411022126674652, mean loss: 0.3654756463477756
Epoch: 12, step: 638, loss: 0.3013624846935272, mean loss: 0.36547207796342346
Epoch: 12, step: 639, loss: 0.32343247532844543, mean loss: 0.3654697382704896
Epoch: 12, step: 640, loss: 0.356360524892807, mean loss: 0.3654692313300156
Epoch: 12, step: 641, loss: 0.3409406840801239, mean loss: 0.3654678663579928
Epoch: 12, step: 642, loss: 0.32472535967826843, mean loss: 0.36546559923280886
Epoch: 12, step: 643, loss: 0.3381669223308563, mean loss: 0.3654640802768272
Epoch: 12, step: 644, loss: 0.3544817566871643, mean loss: 0.3654634692311704
Epoch: 12, step: 645, loss: 0.32102760672569275, mean loss: 0.3654609970011434
Epoch: 12, step: 646, loss: 0.3282862603664398, mean loss: 0.3654589288655865
Epoch: 12, step: 647, loss: 0.36049723625183105, mean loss: 0.36545865284797335
Epoch: 12, step: 648, loss: 0.41542765498161316, mean loss: 0.365461432455368
Epoch: 12, step: 649, loss: 0.35157740116119385, mean loss: 0.36546066017639955
Epoch: 12, step: 650, loss: 0.3308798670768738, mean loss: 0.3654587367772617
Epoch: 12, step: 651, loss: 0.3586277365684509, mean loss: 0.3654583568551144
Epoch: 12, step: 652, loss: 0.36059898138046265, mean loss: 0.36545808660454576
Epoch: 12, step: 653, loss: 0.34196871519088745, mean loss: 0.3654567803331959
Epoch: 12, step: 654, loss: 0.3262285888195038, mean loss: 0.36545459892900783
Epoch: 12, step: 655, loss: 0.343720018863678, mean loss: 0.36545339037807006
Epoch: 12, step: 656, loss: 0.36016374826431274, mean loss: 0.36545309626396866
Epoch: 12, step: 657, loss: 0.3414081037044525, mean loss: 0.3654517593912588
Epoch: 12, step: 658, loss: 0.3199911117553711, mean loss: 0.3654492319743668
Epoch: 12, step: 659, loss: 0.343110591173172, mean loss: 0.3654479901108577
Epoch: 12, step: 660, loss: 0.33535370230674744, mean loss: 0.3654463171836353
Epoch: 12, step: 661, loss: 0.36672115325927734, mean loss: 0.3654463880472304
Epoch: 12, step: 662, loss: 0.3176693320274353, mean loss: 0.36544373243853606
Epoch: 12, step: 663, loss: 0.3715460002422333, mean loss: 0.3654440716041543
Epoch: 12, step: 664, loss: 0.3805803656578064, mean loss: 0.36544491283652547
Epoch: 12, step: 665, loss: 0.3508896231651306, mean loss: 0.36544410393968924
Epoch: 12, step: 666, loss: 0.31092333793640137, mean loss: 0.365441074166641
Epoch: 12, step: 667, loss: 0.3228777348995209, mean loss: 0.3654387090110916
Epoch: 12, step: 668, loss: 0.35180795192718506, mean loss: 0.3654379516205774
Epoch: 12, step: 669, loss: 0.32894614338874817, mean loss: 0.36543592407261477
Epoch: 12, step: 670, loss: 0.34668368101119995, mean loss: 0.36543488222345305
Epoch: 12, step: 671, loss: 0.3225652873516083, mean loss: 0.3654325005792935
Epoch: 12, step: 672, loss: 0.30944469571113586, mean loss: 0.365429390318482
Epoch: 12, step: 673, loss: 0.4847099781036377, mean loss: 0.3654360162815853
Epoch: 12, step: 674, loss: 0.335694819688797, mean loss: 0.36543436426822123
Epoch: 12, step: 675, loss: 0.32684221863746643, mean loss: 0.365432220736471
Epoch: 12, step: 676, loss: 0.3799475431442261, mean loss: 0.36543302691933177
Epoch: 12, step: 677, loss: 0.39972126483917236, mean loss: 0.36543493118668263
Epoch: 12, step: 678, loss: 0.34088191390037537, mean loss: 0.36543356766042695
Epoch: 12, step: 679, loss: 0.3206976354122162, mean loss: 0.36543108343495784
Epoch: 12, step: 680, loss: 0.2888111174106598, mean loss: 0.3654268288974475
Epoch: 12, step: 681, loss: 0.3517385721206665, mean loss: 0.36542606886098017
Epoch: 12, step: 682, loss: 0.33033445477485657, mean loss: 0.3654241205175186
Epoch: 12, step: 683, loss: 0.34289929270744324, mean loss: 0.3654228699718929
Epoch: 12, step: 684, loss: 0.3599260747432709, mean loss: 0.3654225648147714
Epoch: 12, step: 685, loss: 0.3215302526950836, mean loss: 0.3654201282480944
Epoch: 12, step: 686, loss: 0.3427131772041321, mean loss: 0.3654188678011866
Epoch: 12, step: 687, loss: 0.3584830164909363, mean loss: 0.3654184828183208
Epoch: 12, step: 688, loss: 0.405450701713562, mean loss: 0.3654207047320076
Epoch: 12, step: 689, loss: 0.3302296996116638, mean loss: 0.36541875162927034
Epoch: 12, step: 690, loss: 0.3313811123371124, mean loss: 0.36541686264323936
Epoch: 12, step: 691, loss: 0.3500942587852478, mean loss: 0.36541601233225945
Epoch: 12, step: 692, loss: 0.3295750617980957, mean loss: 0.3654140234886584
Epoch: 12, step: 693, loss: 0.3485238254070282, mean loss: 0.36541308628978586
Epoch: 12, step: 694, loss: 0.31454992294311523, mean loss: 0.36541026416453776
Epoch: 12, step: 695, loss: 0.34912624955177307, mean loss: 0.3654093607016764
Epoch: 12, step: 696, loss: 0.31884586811065674, mean loss: 0.3654067774288558
Epoch: 12, step: 697, loss: 0.37503865361213684, mean loss: 0.3654073117612747
Epoch: 12, step: 698, loss: 0.3824380040168762, mean loss: 0.36540825649374575
Epoch: 12, step: 699, loss: 0.336266428232193, mean loss: 0.36540664001780493
Epoch: 12, step: 700, loss: 0.3254126012325287, mean loss: 0.36540442170071663
Epoch: 12, step: 701, loss: 0.3893289268016815, mean loss: 0.36540574862834285
Epoch: 12, step: 702, loss: 0.3371792137622833, mean loss: 0.36540418318356077
Epoch: 12, step: 703, loss: 0.32642287015914917, mean loss: 0.36540202139823336
Epoch: 12, step: 704, loss: 0.30257177352905273, mean loss: 0.36539853721657367
Epoch: 12, step: 705, loss: 0.35277071595191956, mean loss: 0.36539783699359124
Epoch: 12, step: 706, loss: 0.36166366934776306, mean loss: 0.36539762994243263
Epoch: 12, step: 707, loss: 0.3337971568107605, mean loss: 0.36539587786474736
Epoch: 12, step: 708, loss: 0.2973400056362152, mean loss: 0.36539210473882683
Epoch: 12, step: 709, loss: 0.3350071907043457, mean loss: 0.36539042024420243
Epoch: 12, step: 710, loss: 0.3381134867668152, mean loss: 0.3653889081352453
Epoch: 12, step: 711, loss: 0.3196449875831604, mean loss: 0.3653863724412014
Epoch: 12, step: 712, loss: 0.3327861726284027, mean loss: 0.3653845654349483
Epoch: 12, step: 713, loss: 0.295630544424057, mean loss: 0.3653806992326974
Epoch: 12, step: 714, loss: 0.34608030319213867, mean loss: 0.36537962954384073
Epoch: 12, step: 715, loss: 0.330245703458786, mean loss: 0.36537768241869745
Epoch: 12, step: 716, loss: 0.3266730308532715, mean loss: 0.3653755375225176
Epoch: 12, step: 717, loss: 0.31496837735176086, mean loss: 0.3653727442630601
Epoch: 12, step: 718, loss: 0.32617393136024475, mean loss: 0.36537057222267094
Epoch: 12, step: 719, loss: 0.3166232407093048, mean loss: 0.36536787124020675
Epoch: 12, step: 720, loss: 0.3192664682865143, mean loss: 0.3653653170043514
Epoch: 12, step: 721, loss: 0.351333349943161, mean loss: 0.3653645396100544
Epoch: 12, step: 722, loss: 0.33665362000465393, mean loss: 0.3653629490655081
Epoch: 12, step: 723, loss: 0.3243767321109772, mean loss: 0.3653606786125414
Epoch: 12, step: 724, loss: 0.33559003472328186, mean loss: 0.36535902954347316
Epoch: 12, step: 725, loss: 0.32113367319107056, mean loss: 0.3653565799280775
Epoch: 12, step: 726, loss: 0.3253415524959564, mean loss: 0.3653543636429802
Epoch: 12, step: 727, loss: 0.38548779487609863, mean loss: 0.3653554786978779
Epoch: 12, step: 728, loss: 0.33997592329978943, mean loss: 0.36535407317340546
Epoch: 12, step: 729, loss: 0.32623329758644104, mean loss: 0.3653519067775927
Epoch: 12, step: 730, loss: 0.3392058312892914, mean loss: 0.36535045896345636
Epoch: 12, step: 731, loss: 0.3379007577896118, mean loss: 0.36534893904644783
Epoch: 12, step: 732, loss: 0.39100226759910583, mean loss: 0.36535035941788646
Epoch: 12, step: 733, loss: 0.3491387963294983, mean loss: 0.36534946186705664
Epoch: 12, step: 734, loss: 0.34878668189048767, mean loss: 0.3653485449219215
Epoch: 12, step: 735, loss: 0.399090051651001, mean loss: 0.3653504128086979
Epoch: 12, step: 736, loss: 0.32333940267562866, mean loss: 0.3653480872614998
Epoch: 12, step: 737, loss: 0.32766780257225037, mean loss: 0.36534600155992286
Epoch: 12, step: 738, loss: 0.32916831970214844, mean loss: 0.3653439991421525
Epoch: 12, step: 739, loss: 0.3144182562828064, mean loss: 0.36534118058210935
Epoch: 12, step: 740, loss: 0.3672487139701843, mean loss: 0.3653412861515038
Epoch: 12, step: 741, loss: 0.3537438213825226, mean loss: 0.3653406443438243
Epoch: 12, step: 742, loss: 0.33617085218429565, mean loss: 0.3653390301668468
Epoch: 12, step: 743, loss: 0.30907320976257324, mean loss: 0.3653359167416363
Epoch: 12, step: 744, loss: 0.30893948674201965, mean loss: 0.36533279626191517
Epoch: 12, step: 745, loss: 0.3804725110530853, mean loss: 0.3653336339135026
Epoch: 12, step: 746, loss: 0.34283247590065, mean loss: 0.3653323890361575
Epoch: 12, step: 747, loss: 0.35503914952278137, mean loss: 0.36533181959382993
Epoch: 12, step: 748, loss: 0.3094697892665863, mean loss: 0.3653287293670043
Epoch: 12, step: 749, loss: 0.3451002538204193, mean loss: 0.36532761041161393
Epoch: 12, step: 750, loss: 0.3178877532482147, mean loss: 0.3653249863805744
Epoch: 12, step: 751, loss: 0.3425701856613159, mean loss: 0.36532372781858774
Epoch: 12, step: 752, loss: 0.34638649225234985, mean loss: 0.3653226804630451
Epoch: 12, step: 753, loss: 0.3459835648536682, mean loss: 0.3653216109400051
Epoch: 12, step: 754, loss: 0.369319349527359, mean loss: 0.3653218320171819
Epoch: 12, step: 755, loss: 0.3546355962753296, mean loss: 0.36532124109505504
Epoch: 12, step: 756, loss: 0.3240993916988373, mean loss: 0.36531896175585704
Epoch: 12, step: 757, loss: 0.33481982350349426, mean loss: 0.36531727541624337
Epoch: 12, step: 758, loss: 0.31420865654945374, mean loss: 0.3653144497061274
Epoch: 12, step: 759, loss: 0.3589237928390503, mean loss: 0.36531409639692425
Epoch: 12, step: 760, loss: 0.32187819480895996, mean loss: 0.36531169516404305
Epoch: 12, step: 761, loss: 0.31777384877204895, mean loss: 0.3653090673118379
Epoch: 12, step: 762, loss: 0.31216803193092346, mean loss: 0.36530612988243205
Epoch: 12, step: 763, loss: 0.301266610622406, mean loss: 0.3653025902229549
Epoch: 12, step: 764, loss: 0.35988929867744446, mean loss: 0.3653022910303641
Epoch: 12, step: 765, loss: 0.34865832328796387, mean loss: 0.3653013711692089
Epoch: 12, step: 766, loss: 0.33606991171836853, mean loss: 0.36529975572519396
Epoch: 12, step: 767, loss: 0.3952348828315735, mean loss: 0.3653014099651976
Epoch: 12, step: 768, loss: 0.342709481716156, mean loss: 0.3653001615854524
Epoch: 12, step: 769, loss: 0.29772382974624634, mean loss: 0.3652964276738689
Epoch: 12, step: 770, loss: 0.31133565306663513, mean loss: 0.3652934462508838
Epoch: 12, step: 771, loss: 0.3586174547672272, mean loss: 0.3652930774115753
Epoch: 12, step: 772, loss: 0.33274686336517334, mean loss: 0.36529127937754147
Epoch: 12, step: 773, loss: 0.41837766766548157, mean loss: 0.3652942120031236
Epoch: 12, step: 774, loss: 0.35259735584259033, mean loss: 0.3652935106356066
Epoch: 12, step: 775, loss: 0.4205252528190613, mean loss: 0.36529656143886463
Epoch: 12, step: 776, loss: 0.3372642397880554, mean loss: 0.3652950131195246
Epoch: 12, step: 777, loss: 0.3844384551048279, mean loss: 0.36529607041776746
Epoch: 12, step: 778, loss: 0.3433820903301239, mean loss: 0.3652948601686877
Epoch: 12, step: 779, loss: 0.34279462695121765, mean loss: 0.3652936176110768
Epoch: 12, step: 780, loss: 0.4089910387992859, mean loss: 0.36529603063339655
Epoch: 12, step: 781, loss: 0.39156290888786316, mean loss: 0.36529748104080983
Epoch: 12, step: 782, loss: 0.32593342661857605, mean loss: 0.365295307552078
Epoch: 12, step: 783, loss: 0.31362947821617126, mean loss: 0.36529245497757845
Epoch: 12, step: 784, loss: 0.30138829350471497, mean loss: 0.3652889268949045
Epoch: 12, step: 785, loss: 0.3399784564971924, mean loss: 0.3652875296071493
Epoch: 12, step: 786, loss: 0.3199998140335083, mean loss: 0.365285029595249
Epoch: 12, step: 787, loss: 0.36711975932121277, mean loss: 0.3652851308720058
Epoch: 12, step: 788, loss: 0.3345111310482025, mean loss: 0.3652834322464153
Epoch: 12, step: 789, loss: 0.3321048319339752, mean loss: 0.3652816009957081
Epoch: 12, step: 790, loss: 0.3645099699497223, mean loss: 0.365281558408863
Epoch: 12, step: 791, loss: 0.3647674024105072, mean loss: 0.3652815300338079
Epoch: 12, step: 792, loss: 0.3069734275341034, mean loss: 0.36527831232493424
Epoch: 12, step: 793, loss: 0.35114821791648865, mean loss: 0.36527753260446144
Epoch: 12, step: 794, loss: 0.3161584436893463, mean loss: 0.3652748222866931
Epoch: 12, step: 795, loss: 0.3656180500984192, mean loss: 0.3652748412244448
Epoch: 12, step: 796, loss: 0.3332637548446655, mean loss: 0.3652730750955411
Epoch: 12, step: 797, loss: 0.35298195481300354, mean loss: 0.3652723970021789
Epoch: 12, step: 798, loss: 0.3599046468734741, mean loss: 0.36527210088312284
Epoch: 12, step: 799, loss: 0.33244824409484863, mean loss: 0.3652702902114112
Epoch: 12, step: 800, loss: 0.315434992313385, mean loss: 0.3652675412843938
Epoch: 12, step: 801, loss: 0.3113359212875366, mean loss: 0.3652645665673504
Epoch: 12, step: 802, loss: 0.3612011671066284, mean loss: 0.3652643424539832
Epoch: 12, step: 803, loss: 0.3219001591205597, mean loss: 0.3652619508709624
Epoch: 12, step: 804, loss: 0.3044436573982239, mean loss: 0.3652585968593001
Epoch: 12, step: 805, loss: 0.3674629032611847, mean loss: 0.36525871841584595
Epoch: 12, step: 806, loss: 0.33259308338165283, mean loss: 0.3652569171677051
Epoch: 12, step: 807, loss: 0.32987502217292786, mean loss: 0.3652549662471606
Epoch: 12, step: 808, loss: 0.3525087833404541, mean loss: 0.36525426347476675
Epoch: 12, step: 809, loss: 0.30469730496406555, mean loss: 0.36525092479583243
Epoch: 12, step: 810, loss: 0.34789812564849854, mean loss: 0.3652499681389524
Epoch: 12, step: 811, loss: 0.35313424468040466, mean loss: 0.36524930023798996
Epoch: 12, step: 812, loss: 0.32752862572669983, mean loss: 0.3652472209328518
Epoch: 12, step: 813, loss: 0.32694604992866516, mean loss: 0.365245109744945
Epoch: 12, step: 814, loss: 0.3616311848163605, mean loss: 0.3652449105538008
Epoch: 12, step: 815, loss: 0.3350088894367218, mean loss: 0.36524324410642883
Epoch: 12, step: 816, loss: 0.3128420114517212, mean loss: 0.3652403561906033
Epoch: 12, step: 817, loss: 0.3379290997982025, mean loss: 0.365238851106486
Epoch: 12, step: 818, loss: 0.2887742221355438, mean loss: 0.36523463748280327
Epoch: 12, step: 819, loss: 0.3157699406147003, mean loss: 0.36523191185480747
Epoch: 12, step: 820, loss: 0.347464382648468, mean loss: 0.3652309328736401
Epoch: 12, step: 821, loss: 0.32848066091537476, mean loss: 0.36522890806526775
Epoch: 12, step: 822, loss: 0.33800843358039856, mean loss: 0.3652274083972338
Epoch: 12, step: 823, loss: 0.35445746779441833, mean loss: 0.3652268150774562
Epoch: 12, step: 824, loss: 0.3197062015533447, mean loss: 0.3652243074691532
Epoch: 12, step: 825, loss: 0.35583606362342834, mean loss: 0.36522379032451036
Epoch: 12, step: 826, loss: 0.3435143232345581, mean loss: 0.3652225945400383
Epoch: 12, step: 827, loss: 0.3775002658367157, mean loss: 0.3652232707722093
Epoch: 12, step: 828, loss: 0.3356686234474182, mean loss: 0.36522164304475846
Epoch: 12, step: 829, loss: 0.3460927903652191, mean loss: 0.3652205895778194
Epoch: 12, step: 830, loss: 0.32722124457359314, mean loss: 0.36521849698764347
Epoch: 12, step: 831, loss: 0.3267977833747864, mean loss: 0.36521638130958106
Epoch: 12, step: 832, loss: 0.34620991349220276, mean loss: 0.36521533475554674
Epoch: 12, step: 833, loss: 0.3259267807006836, mean loss: 0.36521317152715477
Epoch: 12, step: 834, loss: 0.3453751802444458, mean loss: 0.3652120793071866
Epoch: 12, step: 835, loss: 0.36784258484840393, mean loss: 0.3652122241269147
Epoch: 12, step: 836, loss: 0.3375820815563202, mean loss: 0.3652107030620883
Epoch: 12, step: 837, loss: 0.3761395514011383, mean loss: 0.3652113046721477
Epoch: 12, step: 838, loss: 0.3035111725330353, mean loss: 0.3652079083969157
Epoch: 12, step: 839, loss: 0.33925285935401917, mean loss: 0.3652064797834721
Epoch: 12, step: 840, loss: 0.34300026297569275, mean loss: 0.36520525757989414
Epoch: 12, step: 841, loss: 0.3566192388534546, mean loss: 0.3652047850417144
Epoch: 12, step: 842, loss: 0.3951219916343689, mean loss: 0.36520643146770043
Epoch: 12, step: 843, loss: 0.34881454706192017, mean loss: 0.3652055294269561
Epoch: 12, step: 844, loss: 0.35660260915756226, mean loss: 0.365205056036747
Epoch: 12, step: 845, loss: 0.36152714490890503, mean loss: 0.36520485366461497
Epoch: 12, step: 846, loss: 0.330168753862381, mean loss: 0.3652029259562352
Epoch: 12, step: 847, loss: 0.3265238106250763, mean loss: 0.3652007979239217
Epoch: 12, step: 848, loss: 0.3276957869529724, mean loss: 0.36519873460153784
Epoch: 12, step: 849, loss: 0.3372719883918762, mean loss: 0.36519719830787467
Epoch: 12, step: 850, loss: 0.35423392057418823, mean loss: 0.3651965952341229
Epoch: 12, step: 851, loss: 0.35701024532318115, mean loss: 0.36519614493984837
Epoch: 12, step: 852, loss: 0.3240323066711426, mean loss: 0.3651938808268585
Epoch: 12, step: 853, loss: 0.36374688148498535, mean loss: 0.3651938012426905
Epoch: 12, step: 854, loss: 0.3182200491428375, mean loss: 0.3651912178542453
Epoch: 12, step: 855, loss: 0.3680492043495178, mean loss: 0.3651913750246421
Epoch: 12, step: 856, loss: 0.3295690417289734, mean loss: 0.3651894161391158
Epoch: 12, step: 857, loss: 0.32390648126602173, mean loss: 0.36518714609980685
Epoch: 12, step: 858, loss: 0.3340413570404053, mean loss: 0.36518543356947974
Epoch: 12, step: 859, loss: 0.32793107628822327, mean loss: 0.365183385276249
Epoch: 12, step: 860, loss: 0.3592893183231354, mean loss: 0.3651830612305646
Epoch: 12, step: 861, loss: 0.34245747327804565, mean loss: 0.36518181188543253
Epoch: 12, step: 862, loss: 0.31961366534233093, mean loss: 0.3651793069023891
Epoch: 12, step: 863, loss: 0.3148093819618225, mean loss: 0.36517653810704276
Epoch: 12, step: 864, loss: 0.3623597025871277, mean loss: 0.3651763832763101
Epoch: 12, step: 865, loss: 0.43490326404571533, mean loss: 0.36518021568703724
Epoch: 12, step: 866, loss: 0.3208300471305847, mean loss: 0.3651777781949484
Epoch: 12, step: 867, loss: 0.32660651206970215, mean loss: 0.3651756584287292
Epoch: 12, step: 868, loss: 0.3379095792770386, mean loss: 0.36517416004552583
Epoch: 12, step: 869, loss: 0.3047032058238983, mean loss: 0.3651708371004647
Epoch: 12, step: 870, loss: 0.30577126145362854, mean loss: 0.36516757320818233
Epoch: 12, step: 871, loss: 0.33670157194137573, mean loss: 0.36516600914217867
Epoch: 12, step: 872, loss: 0.3570970892906189, mean loss: 0.3651655658192925
Epoch: 12, step: 873, loss: 0.3577802777290344, mean loss: 0.36516516007881944
Epoch: 12, step: 874, loss: 0.40224701166152954, mean loss: 0.3651671972074017
Epoch: 12, step: 875, loss: 0.37093478441238403, mean loss: 0.36516751403816444
Epoch: 12, step: 876, loss: 0.29794350266456604, mean loss: 0.36516382142561987
Epoch: 12, step: 877, loss: 0.34296125173568726, mean loss: 0.36516260190624766
Epoch: 12, step: 878, loss: 0.38411039113998413, mean loss: 0.36516364259330397
Epoch: 12, step: 879, loss: 0.3468804359436035, mean loss: 0.36516263846288605
Epoch: 12, step: 880, loss: 0.4007084369659424, mean loss: 0.36516459056341344
Epoch: 12, step: 881, loss: 0.3466266691684723, mean loss: 0.36516357255564874
Epoch: 12, step: 882, loss: 0.3103053569793701, mean loss: 0.36516056018864107
Epoch: 12, step: 883, loss: 0.3340992033481598, mean loss: 0.3651588546452169
Epoch: 12, step: 884, loss: 0.3727151155471802, mean loss: 0.36515926952804245
Epoch: 12, step: 885, loss: 0.3351934850215912, mean loss: 0.36515762432190946
Epoch: 12, step: 886, loss: 0.32796981930732727, mean loss: 0.36515558271855975
Epoch: 12, step: 887, loss: 0.33210569620132446, mean loss: 0.365153768385747
Epoch: 12, step: 888, loss: 0.3876641094684601, mean loss: 0.3651550040634701
Epoch: 12, step: 889, loss: 0.348480761051178, mean loss: 0.3651540888014758
Epoch: 12, step: 890, loss: 0.3346118628978729, mean loss: 0.36515241240727725
Epoch: 12, step: 891, loss: 0.32838499546051025, mean loss: 0.3651503944370826
Epoch: 12, step: 892, loss: 0.3045370280742645, mean loss: 0.36514706787068324
Epoch: 12, step: 893, loss: 0.3637363016605377, mean loss: 0.36514699044964216
Epoch: 12, step: 894, loss: 0.30359381437301636, mean loss: 0.3651436126756161
Epoch: 12, step: 895, loss: 0.3241136372089386, mean loss: 0.36514136125027224
Epoch: 12, step: 896, loss: 0.33876004815101624, mean loss: 0.3651399137159458
Epoch: 12, step: 897, loss: 0.3314666450023651, mean loss: 0.36513806617568934
Epoch: 12, step: 898, loss: 0.3549441993236542, mean loss: 0.3651375069028056
Epoch: 12, step: 899, loss: 0.3184053301811218, mean loss: 0.36513494314503064
Epoch: 12, step: 900, loss: 0.3093222379684448, mean loss: 0.3651318813914963
Epoch: 12, step: 901, loss: 0.3138299882411957, mean loss: 0.36512906724486166
Epoch: 12, step: 902, loss: 0.3827494978904724, mean loss: 0.36513003375413955
Epoch: 12, step: 903, loss: 0.343690425157547, mean loss: 0.36512885782124155
Epoch: 12, step: 904, loss: 0.3318983316421509, mean loss: 0.3651270352727756
Epoch: 12, step: 905, loss: 0.3058529198169708, mean loss: 0.3651237845260686
Epoch: 12, step: 906, loss: 0.30568280816078186, mean loss: 0.36512052480704665
Epoch: 12, step: 907, loss: 0.34296348690986633, mean loss: 0.365119309790711
Epoch: 12, step: 908, loss: 0.33834508061408997, mean loss: 0.36511784166387123
Epoch: 12, step: 909, loss: 0.34801310300827026, mean loss: 0.3651169038012407
Epoch: 12, step: 910, loss: 0.32731398940086365, mean loss: 0.36511483115940724
Epoch: 12, step: 911, loss: 0.3747529089450836, mean loss: 0.3651153595627946
Epoch: 12, step: 912, loss: 0.3023532032966614, mean loss: 0.3651119188437405
Epoch: 12, step: 913, loss: 0.3037821352481842, mean loss: 0.3651085568338953
Epoch: 12, step: 914, loss: 0.38341838121414185, mean loss: 0.3651095604969102
Epoch: 12, step: 915, loss: 0.314382404088974, mean loss: 0.3651067800125642
Epoch: 12, step: 916, loss: 0.2909949719905853, mean loss: 0.3651027179786907
Epoch: 12, step: 917, loss: 0.3499046564102173, mean loss: 0.36510188502562874
Epoch: 12, step: 918, loss: 0.3575303852558136, mean loss: 0.3651014700807189
Epoch: 12, step: 919, loss: 0.3277953267097473, mean loss: 0.365099425684436
Epoch: 12, step: 920, loss: 0.3063218295574188, mean loss: 0.3650962048177514
Epoch: 12, step: 921, loss: 0.3674985468387604, mean loss: 0.36509633645293066
Epoch: 12, step: 922, loss: 0.34908992052078247, mean loss: 0.36509545943709965
Epoch: 12, step: 923, loss: 0.2994005084037781, mean loss: 0.3650918601082024
Epoch: 12, step: 924, loss: 0.3690433204174042, mean loss: 0.3650920765909893
Epoch: 12, step: 925, loss: 0.3099927604198456, mean loss: 0.36508905811196163
Epoch: 12, step: 926, loss: 0.3176499903202057, mean loss: 0.3650864594229563
Epoch: 12, step: 927, loss: 0.36566033959388733, mean loss: 0.3650864908581103
Epoch: 12, step: 928, loss: 0.36699000000953674, mean loss: 0.36508659511999075
Epoch: 12, step: 929, loss: 0.32124465703964233, mean loss: 0.36508419387461444
Epoch: 12, step: 930, loss: 0.3323831260204315, mean loss: 0.3650824029184912
Epoch: 12, step: 931, loss: 0.3229690194129944, mean loss: 0.36508009659956975
Epoch: 12, step: 932, loss: 0.3219326138496399, mean loss: 0.365077733778106
Epoch: 12, step: 933, loss: 0.33082231879234314, mean loss: 0.3650758580024524
Epoch: 12, step: 934, loss: 0.3374340534210205, mean loss: 0.36507434446116227
Epoch: 12, step: 935, loss: 0.341496080160141, mean loss: 0.3650730534918072
Epoch: 12, step: 936, loss: 0.3302861154079437, mean loss: 0.3650711489236121
Epoch: 12, step: 937, loss: 0.36182308197021484, mean loss: 0.365070971103238
Epoch: 12, step: 938, loss: 0.38054749369621277, mean loss: 0.3650718183426639
Epoch: 12, step: 939, loss: 0.33758896589279175, mean loss: 0.3650703139167579
Epoch: 12, step: 940, loss: 0.3666382133960724, mean loss: 0.36507039973970823
Epoch: 12, step: 941, loss: 0.316815048456192, mean loss: 0.36506775850537415
Epoch: 12, step: 942, loss: 0.3731756806373596, mean loss: 0.36506820226445313
Epoch: 12, step: 943, loss: 0.34763407707214355, mean loss: 0.3650672481201234
Epoch: 12, step: 944, loss: 0.3314597010612488, mean loss: 0.36506540892858075
Epoch: 12, step: 945, loss: 0.4255082607269287, mean loss: 0.3650687165159616
Epoch: 12, step: 946, loss: 0.33886611461639404, mean loss: 0.36506728272105604
Epoch: 12, step: 947, loss: 0.35642096400260925, mean loss: 0.36506680962416843
Epoch: 12, step: 948, loss: 0.31643056869506836, mean loss: 0.36506414856158
Epoch: 12, step: 949, loss: 0.3254926800727844, mean loss: 0.3650619835835469
Epoch: 12, step: 950, loss: 0.3383234739303589, mean loss: 0.3650605207841786
Epoch: 12, step: 951, loss: 0.3152715861797333, mean loss: 0.3650577971006663
Epoch: 12, step: 952, loss: 0.29332053661346436, mean loss: 0.36505387295754027
Epoch: 12, step: 953, loss: 0.3447200059890747, mean loss: 0.36505276072326787
Epoch: 12, step: 954, loss: 0.3385251760482788, mean loss: 0.3650513097806066
Epoch: 12, step: 955, loss: 0.3373104929924011, mean loss: 0.3650497925624493
Epoch: 12, step: 956, loss: 0.35526663064956665, mean loss: 0.36504925752488226
Epoch: 12, step: 957, loss: 0.32272064685821533, mean loss: 0.3650469427151553
Epoch: 12, step: 958, loss: 0.3416088819503784, mean loss: 0.3650456610363253
Epoch: 12, step: 959, loss: 0.31443357467651367, mean loss: 0.3650428935337903
Epoch: 12, step: 960, loss: 0.318556010723114, mean loss: 0.36504035173911537
Epoch: 12, step: 961, loss: 0.3266335725784302, mean loss: 0.36503825186053906
Epoch: 12, step: 962, loss: 0.3480430245399475, mean loss: 0.3650373227026297
Epoch: 12, step: 963, loss: 0.3268849849700928, mean loss: 0.3650352369636327
Epoch: 12, step: 964, loss: 0.36450859904289246, mean loss: 0.36503520817459206
Epoch: 12, step: 965, loss: 0.32865598797798157, mean loss: 0.3650332195870663
Epoch: 12, step: 966, loss: 0.32994940876960754, mean loss: 0.36503130191498007
Epoch: 12, step: 967, loss: 0.3401181995868683, mean loss: 0.3650299402456355
Epoch: 12, step: 968, loss: 0.3553183674812317, mean loss: 0.3650294094715871
Epoch: 12, step: 969, loss: 0.4146347641944885, mean loss: 0.36503212044298955
Epoch: 12, step: 970, loss: 0.3029050827026367, mean loss: 0.3650287253373696
Epoch: 12, step: 971, loss: 0.34392520785331726, mean loss: 0.36502757213969284
Epoch: 12, step: 972, loss: 0.3517690896987915, mean loss: 0.365026847672044
Epoch: 12, step: 973, loss: 0.384566068649292, mean loss: 0.36502791527235967
Epoch: 12, step: 974, loss: 0.37685060501098633, mean loss: 0.36502856121508703
Epoch: 12, step: 975, loss: 0.31540730595588684, mean loss: 0.3650258502636415
Epoch: 12, step: 976, loss: 0.35354602336883545, mean loss: 0.36502522312204655
Epoch: 12, step: 977, loss: 0.33311954140663147, mean loss: 0.3650234802136168
Epoch: 12, step: 978, loss: 0.33895596861839294, mean loss: 0.3650220563040961
Epoch: 12, step: 979, loss: 0.3160044550895691, mean loss: 0.3650193789170951
Epoch: 12, step: 980, loss: 0.3306858241558075, mean loss: 0.36501750368880514
Epoch: 12, step: 981, loss: 0.39115482568740845, mean loss: 0.3650189311777182
Epoch: 12, step: 982, loss: 0.34828701615333557, mean loss: 0.36501801741467826
Epoch: 12, step: 983, loss: 0.3407015800476074, mean loss: 0.3650166895183607
Epoch: 12, step: 984, loss: 0.33382540941238403, mean loss: 0.36501498628677076
Epoch: 12, step: 985, loss: 0.3784087896347046, mean loss: 0.3650157176290962
Epoch: 12, step: 986, loss: 0.3398573696613312, mean loss: 0.3650143439819235
Epoch: 12, step: 987, loss: 0.31862685084342957, mean loss: 0.36501181136054667
Epoch: 12, step: 988, loss: 0.320068359375, mean loss: 0.36500935771355286
Epoch: 12, step: 989, loss: 0.3337046205997467, mean loss: 0.3650076487531252
Epoch: 12, step: 990, loss: 0.35242199897766113, mean loss: 0.36500696172600716
Epoch: 12, step: 991, loss: 0.31138142943382263, mean loss: 0.36500403456813096
Epoch: 12, step: 992, loss: 0.36754581332206726, mean loss: 0.3650041733039398
Epoch: 12, step: 993, loss: 0.34471645951271057, mean loss: 0.36500306601686466
Epoch: 12, step: 994, loss: 0.32204344868659973, mean loss: 0.36500072144352347
Epoch: 12, step: 995, loss: 0.3830954134464264, mean loss: 0.3650017089294437
Epoch: 12, step: 996, loss: 0.34328773617744446, mean loss: 0.3650005239923222
Epoch: 12, step: 997, loss: 0.34579673409461975, mean loss: 0.3649994760937138
Epoch: 12, step: 998, loss: 0.3085295259952545, mean loss: 0.3649963948501879
Epoch: 12, step: 999, loss: 0.3664572536945343, mean loss: 0.3649964745565849
Epoch: 12, step: 1000, loss: 0.34038299322128296, mean loss: 0.3649951316856517
Epoch: 12, step: 1001, loss: 0.33451342582702637, mean loss: 0.36499346874479743
Epoch: 12, step: 1002, loss: 0.32371631264686584, mean loss: 0.36499121697696707
Epoch: 12, step: 1003, loss: 0.3157568573951721, mean loss: 0.36498853127112035
Epoch: 12, step: 1004, loss: 0.35999956727027893, mean loss: 0.3649882591408634
Epoch: 12, step: 1005, loss: 0.36263149976730347, mean loss: 0.36498813059502655
Epoch: 12, step: 1006, loss: 0.3611582815647125, mean loss: 0.36498792171315964
Epoch: 12, step: 1007, loss: 0.3063511550426483, mean loss: 0.3649847238092182
Epoch: 12, step: 1008, loss: 0.33975744247436523, mean loss: 0.36498334805084254
Epoch: 12, step: 1009, loss: 0.2995961904525757, mean loss: 0.36497978238623363
Epoch: 12, step: 1010, loss: 0.36203834414482117, mean loss: 0.3649796219937236
Epoch: 12, step: 1011, loss: 0.3233589828014374, mean loss: 0.3649773526022736
Epoch: 12, step: 1012, loss: 0.3365404009819031, mean loss: 0.36497580214419495
Epoch: 12, step: 1013, loss: 0.339659720659256, mean loss: 0.3649744219194929
Epoch: 12, step: 1014, loss: 0.3738921284675598, mean loss: 0.3649749080835091
Epoch: 12, step: 1015, loss: 0.33497047424316406, mean loss: 0.36497327242968003
Epoch: 12, step: 1016, loss: 0.32036951184272766, mean loss: 0.3649708410445295
Epoch: 12, step: 1017, loss: 0.3443087935447693, mean loss: 0.36496971480188806
Epoch: 12, step: 1018, loss: 0.39970695972442627, mean loss: 0.3649716081492976
Epoch: 12, step: 1019, loss: 0.3253975808620453, mean loss: 0.36496945129147723
Epoch: 12, step: 1020, loss: 0.4073762893676758, mean loss: 0.3649717624167743
Epoch: 12, step: 1021, loss: 0.34315812587738037, mean loss: 0.3649705736627395
Epoch: 12, step: 1022, loss: 0.33004945516586304, mean loss: 0.36496867070821404
Epoch: 12, step: 1023, loss: 0.3342849612236023, mean loss: 0.36496699875368677
Epoch: 12, step: 1024, loss: 0.326099693775177, mean loss: 0.36496488099065194
Epoch: 12, step: 1025, loss: 0.33776864409446716, mean loss: 0.364963399229897
Epoch: 12, step: 1026, loss: 0.3789287805557251, mean loss: 0.3649641600787843
Epoch: 12, step: 1027, loss: 0.33271291851997375, mean loss: 0.36496240309242783
Epoch: 12, step: 1028, loss: 0.33468303084373474, mean loss: 0.3649607536196246
Epoch: 12, step: 1029, loss: 0.32027655839920044, mean loss: 0.364958319574782
Epoch: 12, step: 1030, loss: 0.3199641704559326, mean loss: 0.3649558687795797
Epoch: 12, step: 1031, loss: 0.3213791251182556, mean loss: 0.36495349531859594
Epoch: 12, step: 1032, loss: 0.3150881826877594, mean loss: 0.36495077949088334
Epoch: 12, step: 1033, loss: 0.37612980604171753, mean loss: 0.3649513883040056
Epoch: 12, step: 1034, loss: 0.3394722044467926, mean loss: 0.36495000077561385
Epoch: 12, step: 1035, loss: 0.3356001377105713, mean loss: 0.364948402547392
Epoch: 12, step: 1036, loss: 0.33868342638015747, mean loss: 0.364946972382613
Epoch: 12, step: 1037, loss: 0.3422743082046509, mean loss: 0.3649457378914784
Epoch: 12, step: 1038, loss: 0.3431475758552551, mean loss: 0.3649445510802389
Epoch: 12, step: 1039, loss: 0.36457598209381104, mean loss: 0.36494453101441865
Epoch: 12, step: 1040, loss: 0.3616597354412079, mean loss: 0.3649443521916426
Epoch: 12, step: 1041, loss: 0.332322359085083, mean loss: 0.36494257636186
Epoch: 12, step: 1042, loss: 0.3265855312347412, mean loss: 0.3649404884491102
Epoch: 12, step: 1043, loss: 0.3501865863800049, mean loss: 0.3649396853845517
Epoch: 12, step: 1044, loss: 0.3248928189277649, mean loss: 0.36493750572600614
Epoch: 12, step: 1045, loss: 0.39716386795043945, mean loss: 0.36493925963708834
Epoch: 12, step: 1046, loss: 0.3056620657444, mean loss: 0.36493603366735267
Epoch: 12, step: 1047, loss: 0.3095076084136963, mean loss: 0.36493301731856875
Epoch: 12, step: 1048, loss: 0.3245691657066345, mean loss: 0.3649308208854397
Epoch: 12, step: 1049, loss: 0.3158898651599884, mean loss: 0.36492815242555693
Epoch: 12, step: 1050, loss: 0.3645506203174591, mean loss: 0.3649281318840635
Epoch: 12, step: 1051, loss: 0.2924797832965851, mean loss: 0.3649241901893634
Epoch: 12, step: 1052, loss: 0.3843299150466919, mean loss: 0.3649252459384988
Epoch: 12, step: 1053, loss: 0.3567759394645691, mean loss: 0.36492480260771465
Epoch: 12, step: 1054, loss: 0.31229227781295776, mean loss: 0.36492193949914725
Epoch: 12, step: 1055, loss: 0.36548060178756714, mean loss: 0.3649219698876529
Epoch: 12, step: 1056, loss: 0.31581053137779236, mean loss: 0.36491929861006195
Epoch: 12, step: 1057, loss: 0.3297470211982727, mean loss: 0.3649173856177084
Epoch: 12, step: 1058, loss: 0.3082570731639862, mean loss: 0.3649143040757247
Epoch: 12, step: 1059, loss: 0.34570443630218506, mean loss: 0.3649132593798484
Epoch: 12, step: 1060, loss: 0.31866857409477234, mean loss: 0.3649107445783211
Epoch: 12, step: 1061, loss: 0.3148859441280365, mean loss: 0.3649080243607871
Epoch: 12, step: 1062, loss: 0.34315207600593567, mean loss: 0.36490684139366436
Epoch: 12, step: 1063, loss: 0.28036099672317505, mean loss: 0.3649022445121577
Epoch: 12, step: 1064, loss: 0.33747294545173645, mean loss: 0.364900753222044
Epoch: 12, step: 1065, loss: 0.3844773471355438, mean loss: 0.36490181751441725
Epoch: 12, step: 1066, loss: 0.3839879333972931, mean loss: 0.36490285508527254
Epoch: 12, step: 1067, loss: 0.33231043815612793, mean loss: 0.3649010833731107
Epoch: 12, step: 1068, loss: 0.35551396012306213, mean loss: 0.3649005731201755
Epoch: 12, step: 1069, loss: 0.3737857937812805, mean loss: 0.3649010560650967
Epoch: 12, step: 1070, loss: 0.30857130885124207, mean loss: 0.3648979944994022
Epoch: 12, step: 1071, loss: 0.32389700412750244, mean loss: 0.36489576618470804
Epoch: 12, step: 1072, loss: 0.3464330732822418, mean loss: 0.3648947628320151
Epoch: 12, step: 1073, loss: 0.3438148498535156, mean loss: 0.364893617309084
Epoch: 12, step: 1074, loss: 0.33005672693252563, mean loss: 0.3648917243084658
Epoch: 12, step: 1075, loss: 0.3532498776912689, mean loss: 0.3648910917369261
Epoch: 12, step: 1076, loss: 0.37964925169944763, mean loss: 0.36489189359294144
Epoch: 12, step: 1077, loss: 0.34381622076034546, mean loss: 0.36489074854932346
Epoch: 12, step: 1078, loss: 0.3870885670185089, mean loss: 0.3648919544937179
Epoch: 12, step: 1079, loss: 0.34455999732017517, mean loss: 0.3648908499762704
Epoch: 12, step: 1080, loss: 0.3090611398220062, mean loss: 0.3648878172362979
Epoch: 12, step: 1081, loss: 0.32914605736732483, mean loss: 0.36488587580447446
Epoch: 12, step: 1082, loss: 0.3202441930770874, mean loss: 0.3648834510756315
Epoch: 12, step: 1083, loss: 0.3365842401981354, mean loss: 0.3648819140774305
Epoch: 12, step: 1084, loss: 0.3341347575187683, mean loss: 0.3648802442161065
Epoch: 12, step: 1085, loss: 0.3762097656726837, mean loss: 0.36488085948283056
Epoch: 12, step: 1086, loss: 0.34175586700439453, mean loss: 0.3648796037134861
Epoch: 12, step: 1087, loss: 0.3273833990097046, mean loss: 0.36487756764676677
Epoch: 12, step: 1088, loss: 0.38121306896209717, mean loss: 0.3648784546262594
Epoch: 12, step: 1089, loss: 0.32001233100891113, mean loss: 0.3648760186330127
Epoch: 12, step: 1090, loss: 0.3116181194782257, mean loss: 0.3648731271677239
Epoch: 12, step: 1091, loss: 0.43199366331100464, mean loss: 0.36487677106219424
Epoch: 12, step: 1092, loss: 0.355024129152298, mean loss: 0.3648762362029624
Epoch: 12, step: 1093, loss: 0.33427029848098755, mean loss: 0.36487457482321417
Epoch: 12, step: 1094, loss: 0.30520015954971313, mean loss: 0.36487133569737834
Epoch: 12, step: 1095, loss: 0.34274935722351074, mean loss: 0.3648701349820899
Epoch: 12, step: 1096, loss: 0.33011823892593384, mean loss: 0.3648682488547599
Epoch: 12, step: 1097, loss: 0.36499080061912537, mean loss: 0.36486825550578367
Epoch: 12, step: 1098, loss: 0.3174782693386078, mean loss: 0.3648656837368486
Epoch: 12, step: 1099, loss: 0.3249191343784332, mean loss: 0.3648635160274195
Epoch: 12, step: 1100, loss: 0.3361571431159973, mean loss: 0.3648619583534865
Epoch: 12, step: 1101, loss: 0.3338499367237091, mean loss: 0.3648602756610486
Epoch: 12, step: 1102, loss: 0.35819488763809204, mean loss: 0.36485991402098444
Epoch: 12, step: 1103, loss: 0.3007398545742035, mean loss: 0.36485643528512035
Epoch: 12, step: 1104, loss: 0.3314164876937866, mean loss: 0.3648546211502757
Epoch: 12, step: 1105, loss: 0.33508262038230896, mean loss: 0.3648530060911042
Epoch: 12, step: 1106, loss: 0.3299610912799835, mean loss: 0.3648511133916298
Epoch: 12, step: 1107, loss: 0.33450570702552795, mean loss: 0.3648494674051704
Epoch: 12, step: 1108, loss: 0.33226969838142395, mean loss: 0.3648477003189295
Epoch: 12, step: 1109, loss: 0.35939425230026245, mean loss: 0.36484740454671893
Epoch: 12, step: 1110, loss: 0.3048359751701355, mean loss: 0.3648441499543128
Epoch: 12, step: 1111, loss: 0.36744940280914307, mean loss: 0.36484429123700557
Epoch: 12, step: 1112, loss: 0.34865477681159973, mean loss: 0.3648434133283008
Epoch: 12, step: 1113, loss: 0.37106311321258545, mean loss: 0.3648437505856419
Epoch: 12, step: 1114, loss: 0.3248920440673828, mean loss: 0.36484158435962016
Epoch: 12, step: 1115, loss: 0.3326214551925659, mean loss: 0.3648398374430529
Epoch: 12, step: 1116, loss: 0.3011235296726227, mean loss: 0.36483638304848687
Epoch: 12, step: 1117, loss: 0.3724372982978821, mean loss: 0.36483679511154926
Epoch: 12, step: 1118, loss: 0.3755947947502136, mean loss: 0.3648373782957873
Epoch: 12, step: 1119, loss: 0.3154969811439514, mean loss: 0.364834703729593
Epoch: 12, step: 1120, loss: 0.34019145369529724, mean loss: 0.36483336797968596
Epoch: 12, step: 1121, loss: 0.3706890940666199, mean loss: 0.3648336853632137
Epoch: 12, step: 1122, loss: 0.3113166391849518, mean loss: 0.36483078486751275
Epoch: 12, step: 1123, loss: 0.3001156449317932, mean loss: 0.3648272776520382
Epoch: 12, step: 1124, loss: 0.3409816324710846, mean loss: 0.36482598541526473
Epoch: 12, step: 1125, loss: 0.37662115693092346, mean loss: 0.3648266245813813
Epoch: 12, step: 1126, loss: 0.30260413885116577, mean loss: 0.3648232530026368
Epoch: 12, step: 1127, loss: 0.34901902079582214, mean loss: 0.3648223966831631
Epoch: 12, step: 1128, loss: 0.31406673789024353, mean loss: 0.3648196467422847
Epoch: 12, step: 1129, loss: 0.36731183528900146, mean loss: 0.3648197817617097
Epoch: 12, step: 1130, loss: 0.35340866446495056, mean loss: 0.36481916357452204
Epoch: 12, step: 1131, loss: 0.38734760880470276, mean loss: 0.3648203839670047
Epoch: 12, step: 1132, loss: 0.3519189953804016, mean loss: 0.3648196851214066
Epoch: 12, step: 1133, loss: 0.3638693392276764, mean loss: 0.36481963364562425
Epoch: 12, step: 1134, loss: 0.3340243399143219, mean loss: 0.36481796569925956
Epoch: 12, step: 1135, loss: 0.3614792823791504, mean loss: 0.3648177848780226
Epoch: 12, step: 1136, loss: 0.3588108420372009, mean loss: 0.3648174595629486
Epoch: 12, step: 1137, loss: 0.33118292689323425, mean loss: 0.364815638132608
Epoch: 12, step: 1138, loss: 0.3628242015838623, mean loss: 0.3648155302950302
Epoch: 12, step: 1139, loss: 0.34954237937927246, mean loss: 0.3648147032888078
Epoch: 12, step: 1140, loss: 0.38140496611595154, mean loss: 0.36481560156499093
Epoch: 12, step: 1141, loss: 0.3050212264060974, mean loss: 0.3648123641868015
Epoch: 12, step: 1142, loss: 0.3705493211746216, mean loss: 0.3648126747794596
Epoch: 12, step: 1143, loss: 0.3521288335323334, mean loss: 0.3648119881271617
Epoch: 12, step: 1144, loss: 0.3540697395801544, mean loss: 0.36481140661638667
Epoch: 12, step: 1145, loss: 0.33083197474479675, mean loss: 0.3648095673053619
Epoch: 12, step: 1146, loss: 0.34848690032958984, mean loss: 0.36480868380511966
Epoch: 12, step: 1147, loss: 0.35627487301826477, mean loss: 0.36480822191884626
Epoch: 12, step: 1148, loss: 0.3393942713737488, mean loss: 0.36480684648178696
Epoch: 12, step: 1149, loss: 0.3658216595649719, mean loss: 0.36480690140185856
Epoch: 12, step: 1150, loss: 0.3034856617450714, mean loss: 0.36480358297339077
Epoch: 12, step: 1151, loss: 0.3140973746776581, mean loss: 0.3648008391309505
Epoch: 12, step: 1152, loss: 0.34318807721138, mean loss: 0.364799669672484
Epoch: 12, step: 1153, loss: 0.34811651706695557, mean loss: 0.36479876700217745
Epoch: 12, step: 1154, loss: 0.3648931384086609, mean loss: 0.3647987721080264
Epoch: 12, step: 1155, loss: 0.37498393654823303, mean loss: 0.36479932313401864
Epoch: 12, step: 1156, loss: 0.316936194896698, mean loss: 0.3647967338384689
Epoch: 12, step: 1157, loss: 0.3045113682746887, mean loss: 0.3647934727021731
Epoch: 12, step: 1158, loss: 0.33511096239089966, mean loss: 0.36479186711390504
Epoch: 12, step: 1159, loss: 0.29878413677215576, mean loss: 0.36478829681261005
Epoch: 12, step: 1160, loss: 0.3561367988586426, mean loss: 0.36478782888584527
Epoch: 12, step: 1161, loss: 0.35321494936943054, mean loss: 0.36478720298646633
Epoch: 12, step: 1162, loss: 0.30265557765960693, mean loss: 0.3647838428855888
Epoch: 12, step: 1163, loss: 0.33333855867385864, mean loss: 0.3647821424051534
Epoch: 12, step: 1164, loss: 0.3181791603565216, mean loss: 0.3647796223715164
Epoch: 12, step: 1165, loss: 0.3835751712322235, mean loss: 0.364780638676743
Epoch: 12, step: 1166, loss: 0.323695570230484, mean loss: 0.36477841726184995
Epoch: 12, step: 1167, loss: 0.35921576619148254, mean loss: 0.36477811651298153
Epoch: 12, step: 1168, loss: 0.3082409203052521, mean loss: 0.36477505995266324
Epoch: 12, step: 1169, loss: 0.3123432695865631, mean loss: 0.36477222549540483
Epoch: 12, step: 1170, loss: 0.32232874631881714, mean loss: 0.36476993112926737
Epoch: 12, step: 1171, loss: 0.3341785669326782, mean loss: 0.3647682775420135
Epoch: 12, step: 1172, loss: 0.3434376120567322, mean loss: 0.3647671245953898
Epoch: 12, step: 1173, loss: 0.3404783010482788, mean loss: 0.36476581182792966
Epoch: 12, step: 1174, loss: 0.3437345623970032, mean loss: 0.3647646751879561
Epoch: 12, step: 1175, loss: 0.30528751015663147, mean loss: 0.36476146090104344
Epoch: 12, step: 1176, loss: 0.3115018904209137, mean loss: 0.3647585827832115
Epoch: 12, step: 1177, loss: 0.3441890478134155, mean loss: 0.3647574712769449
Epoch: 12, step: 1178, loss: 0.39055517315864563, mean loss: 0.36475886521987905
Epoch: 12, step: 1179, loss: 0.3491847515106201, mean loss: 0.36475802373977806
Epoch: 12, step: 1180, loss: 0.4000673294067383, mean loss: 0.36475993142283314
Epoch: 12, step: 1181, loss: 0.3240712881088257, mean loss: 0.36475773322492316
Epoch: 12, step: 1182, loss: 0.380788654088974, mean loss: 0.3647585992462545
Epoch: 12, step: 1183, loss: 0.30623510479927063, mean loss: 0.36475543786474807
Epoch: 12, step: 1184, loss: 0.36904376745224, mean loss: 0.3647556695035742
Epoch: 12, step: 1185, loss: 0.4057391881942749, mean loss: 0.3647578831537141
Epoch: 12, step: 1186, loss: 0.3309016227722168, mean loss: 0.36475605456822224
Epoch: 12, step: 1187, loss: 0.37099939584732056, mean loss: 0.36475639175450864
Epoch: 12, step: 1188, loss: 0.32009270787239075, mean loss: 0.364753979717792
Epoch: 12, step: 1189, loss: 0.31993618607521057, mean loss: 0.3647515594891689
Epoch: 12, step: 1190, loss: 0.3048248887062073, mean loss: 0.36474832353308145
Epoch: 12, step: 1191, loss: 0.34776848554611206, mean loss: 0.3647474066951772
Epoch: 12, step: 1192, loss: 0.3058905303478241, mean loss: 0.3647442288496857
Epoch: 12, step: 1193, loss: 0.3798806667327881, mean loss: 0.3647450460636952
Epoch: 12, step: 1194, loss: 0.3384582996368408, mean loss: 0.3647436269228202
Epoch: 12, step: 1195, loss: 0.3412289619445801, mean loss: 0.36474235750665857
Epoch: 12, step: 1196, loss: 0.38759905099868774, mean loss: 0.36474359133626677
Epoch: 12, step: 1197, loss: 0.33024856448173523, mean loss: 0.36474172935705623
Epoch: 12, step: 1198, loss: 0.34085574746131897, mean loss: 0.3647404401045115
Epoch: 12, step: 1199, loss: 0.3346758484840393, mean loss: 0.36473881744736447
Epoch: 12, step: 1200, loss: 0.3043319582939148, mean loss: 0.36473555732220103
Epoch: 12, step: 1201, loss: 0.3372979164123535, mean loss: 0.3647340766076349
Epoch: 12, step: 1202, loss: 0.34944772720336914, mean loss: 0.3647332517007543
Epoch: 12, step: 1203, loss: 0.3140428960323334, mean loss: 0.3647305164128378
Epoch: 12, step: 1204, loss: 0.36634957790374756, mean loss: 0.36473060377384203
Epoch: 12, step: 1205, loss: 0.3079921007156372, mean loss: 0.36472754245394035
Epoch: 12, step: 1206, loss: 0.3463032841682434, mean loss: 0.3647265484286754
Epoch: 12, step: 1207, loss: 0.32321232557296753, mean loss: 0.3647243087748744
Epoch: 12, step: 1208, loss: 0.3225906193256378, mean loss: 0.36472203582404905
Epoch: 12, step: 1209, loss: 0.32286763191223145, mean loss: 0.3647197780614041
Epoch: 12, step: 1210, loss: 0.32144972681999207, mean loss: 0.3647174440600426
Epoch: 12, step: 1211, loss: 0.31876039505004883, mean loss: 0.3647149652548101
Epoch: 12, step: 1212, loss: 0.3755805194377899, mean loss: 0.3647155512832974
Epoch: 12, step: 1213, loss: 0.32068997621536255, mean loss: 0.36471317691294536
Epoch: 12, step: 1214, loss: 0.40259525179862976, mean loss: 0.364715219844234
Epoch: 12, step: 1215, loss: 0.36836281418800354, mean loss: 0.3647154165436701
Epoch: 12, step: 1216, loss: 0.31918662786483765, mean loss: 0.3647129614997942
Epoch: 12, step: 1217, loss: 0.32695409655570984, mean loss: 0.36471092554244794
Epoch: 12, step: 1218, loss: 0.3487405776977539, mean loss: 0.3647100644679968
Epoch: 12, step: 1219, loss: 0.39452630281448364, mean loss: 0.3647116719856993
Epoch: 12, step: 1220, loss: 0.3722158968448639, mean loss: 0.36471207654793225
Epoch: 12, step: 1221, loss: 0.339966356754303, mean loss: 0.3647107425468652
Epoch: 12, step: 1222, loss: 0.32149776816368103, mean loss: 0.3647084131320421
Epoch: 12, step: 1223, loss: 0.3399076461791992, mean loss: 0.36470707630760524
Epoch: 12, step: 1224, loss: 0.34492582082748413, mean loss: 0.3647060101050784
Epoch: 12, step: 1225, loss: 0.3274599611759186, mean loss: 0.364704002664692
Epoch: 12, step: 1226, loss: 0.33013850450515747, mean loss: 0.3647021397976395
Epoch: 12, step: 1227, loss: 0.3209590017795563, mean loss: 0.3646997824394794
Epoch: 12, step: 1228, loss: 0.29978325963020325, mean loss: 0.364696284216555
Epoch: 12, step: 1229, loss: 0.3430211842060089, mean loss: 0.36469511625125645
Epoch: 12, step: 1230, loss: 0.3462139070034027, mean loss: 0.36469412044279437
Epoch: 12, step: 1231, loss: 0.31007474660873413, mean loss: 0.3646911775886007
Epoch: 12, step: 1232, loss: 0.3181232810020447, mean loss: 0.3646886686776268
Epoch: 12, step: 1233, loss: 0.4062572717666626, mean loss: 0.3646909081239736
Epoch: 12, step: 1234, loss: 0.33210980892181396, mean loss: 0.3646891529605193
Epoch: 12, step: 1235, loss: 0.33065226674079895, mean loss: 0.36468731947171196
Epoch: 12, step: 1236, loss: 0.3854443430900574, mean loss: 0.3646884375446243
Epoch: 12, step: 1237, loss: 0.3209128975868225, mean loss: 0.3646860797109521
Epoch: 12, step: 1238, loss: 0.33210912346839905, mean loss: 0.36468432514875887
Epoch: 12, step: 1239, loss: 0.35874634981155396, mean loss: 0.36468400535258605
Epoch: 12, step: 1240, loss: 0.3331958055496216, mean loss: 0.36468230961238446
Epoch: 12, step: 1241, loss: 0.31625810265541077, mean loss: 0.3646797019544977
Epoch: 12, step: 1242, loss: 0.30196091532707214, mean loss: 0.36467632471112754
Epoch: 12, step: 1243, loss: 0.32021281123161316, mean loss: 0.36467393059560527
Epoch: 12, step: 1244, loss: 0.37199702858924866, mean loss: 0.3646743248829037
Epoch: 12, step: 1245, loss: 0.35123977065086365, mean loss: 0.3646736015839787
Epoch: 12, step: 1246, loss: 0.3197706341743469, mean loss: 0.3646711841967696
Epoch: 12, step: 1247, loss: 0.33244675397872925, mean loss: 0.36466944946215407
Epoch: 12, step: 1248, loss: 0.36893945932388306, mean loss: 0.3646696793168056
Epoch: 12, step: 1249, loss: 0.34557101130485535, mean loss: 0.36466865129075265
Epoch: 12, step: 1250, loss: 0.3607909679412842, mean loss: 0.36466844257750924
Epoch: 12, step: 1251, loss: 0.3624369502067566, mean loss: 0.3646683224756594
Epoch: 12, step: 1252, loss: 0.36846640706062317, mean loss: 0.3646685268825581
Epoch: 12, step: 1253, loss: 0.36891499161720276, mean loss: 0.3646687554082676
Epoch: 12, step: 1254, loss: 0.3432258665561676, mean loss: 0.3646676015101429
Epoch: 12, step: 1255, loss: 0.31129008531570435, mean loss: 0.3646647292804725
Epoch: 12, step: 1256, loss: 0.34339994192123413, mean loss: 0.36466358508960034
Epoch: 12, step: 1257, loss: 0.3133927583694458, mean loss: 0.3646608265171953
Epoch: 12, step: 1258, loss: 0.3855026364326477, mean loss: 0.3646619478283222
Epoch: 12, step: 1259, loss: 0.3166884481906891, mean loss: 0.36465936694282414
Epoch: 12, step: 1260, loss: 0.4256405532360077, mean loss: 0.3646626474413067
Epoch: 12, step: 1261, loss: 0.3329905569553375, mean loss: 0.3646609437247663
Epoch: 12, step: 1262, loss: 0.35440945625305176, mean loss: 0.3646603923027088
Epoch: 12, step: 1263, loss: 0.3220210671424866, mean loss: 0.3646580988794536
Epoch: 12, step: 1264, loss: 0.3583541214466095, mean loss: 0.3646577598283358
Epoch: 12, step: 1265, loss: 0.3284262418746948, mean loss: 0.3646558112686954
Epoch: 12, step: 1266, loss: 0.3695198595523834, mean loss: 0.36465607284698437
Epoch: 12, step: 1267, loss: 0.35128548741340637, mean loss: 0.36465535384368075
Epoch: 12, step: 1268, loss: 0.33630481362342834, mean loss: 0.36465382937520624
Epoch: 12, step: 1269, loss: 0.31181466579437256, mean loss: 0.3646509882544631
Epoch: 12, step: 1270, loss: 0.34555160999298096, mean loss: 0.3646499613509596
Epoch: 12, step: 1271, loss: 0.3603844940662384, mean loss: 0.36464973202476153
Epoch: 12, step: 1272, loss: 0.3129788637161255, mean loss: 0.364646954170436
Epoch: 12, step: 1273, loss: 0.3197876513004303, mean loss: 0.36464454263926355
Epoch: 12, step: 1274, loss: 0.35541948676109314, mean loss: 0.3646440467484998
Epoch: 12, step: 1275, loss: 0.3701084554195404, mean loss: 0.3646443404707462
Epoch: 12, step: 1276, loss: 0.3148925304412842, mean loss: 0.36464166636109663
Epoch: 12, step: 1277, loss: 0.30016598105430603, mean loss: 0.3646382010442469
Epoch: 12, step: 1278, loss: 0.31502634286880493, mean loss: 0.3646355347434904
Epoch: 12, step: 1279, loss: 0.35544681549072266, mean loss: 0.36463504093871546
Epoch: 12, step: 1280, loss: 0.31652358174324036, mean loss: 0.3646324555521178
Epoch: 12, step: 1281, loss: 0.36735185980796814, mean loss: 0.36463260167808537
Epoch: 12, step: 1282, loss: 0.34229016304016113, mean loss: 0.36463140118167797
Epoch: 12, step: 1283, loss: 0.32712915539741516, mean loss: 0.36462938623187224
Epoch: 12, step: 1284, loss: 0.4059737026691437, mean loss: 0.3646316074920902
Epoch: 12, step: 1285, loss: 0.3024253845214844, mean loss: 0.3646282655869129
Epoch: 12, step: 1286, loss: 0.3367399275302887, mean loss: 0.36462676742209654
Epoch: 12, step: 1287, loss: 0.3548918664455414, mean loss: 0.3646262444901575
Epoch: 12, step: 1288, loss: 0.37722593545913696, mean loss: 0.3646269212743316
Epoch: 12, step: 1289, loss: 0.3220970332622528, mean loss: 0.3646246369318667
Epoch: 12, step: 1290, loss: 0.3084326684474945, mean loss: 0.364621618941186
Epoch: 12, step: 1291, loss: 0.34926801919937134, mean loss: 0.36462079436547484
Epoch: 12, step: 1292, loss: 0.4078840911388397, mean loss: 0.36462311772602335
Epoch: 12, step: 1293, loss: 0.3520459234714508, mean loss: 0.36462244233163743
Epoch: 12, step: 1294, loss: 0.3305225968360901, mean loss: 0.3646206112708258
Epoch: 12, step: 1295, loss: 0.32112330198287964, mean loss: 0.364618275719425
Epoch: 12, step: 1296, loss: 0.32454127073287964, mean loss: 0.3646161239339224
Epoch: 12, step: 1297, loss: 0.3336831033229828, mean loss: 0.3646144631897685
Epoch: 12, step: 1298, loss: 0.3390097916126251, mean loss: 0.36461308858990926
Epoch: 12, step: 1299, loss: 0.3606155812740326, mean loss: 0.3646128739932099
Epoch: 12, step: 1300, loss: 0.35043901205062866, mean loss: 0.364612113143892
Epoch: 12, step: 1301, loss: 0.3165411651134491, mean loss: 0.36460953284609116
Epoch: 12, step: 1302, loss: 0.3823387026786804, mean loss: 0.364610484441273
Epoch: 12, step: 1303, loss: 0.37996605038642883, mean loss: 0.36461130859144175
Epoch: 12, step: 1304, loss: 0.3297047019004822, mean loss: 0.3646094352158881
Epoch: 12, step: 1305, loss: 0.3597440719604492, mean loss: 0.36460917411450056
Epoch: 12, step: 1306, loss: 0.33234766125679016, mean loss: 0.36460744288225705
Epoch: 12, step: 1307, loss: 0.3185626268386841, mean loss: 0.36460497213660115
Epoch: 12, step: 1308, loss: 0.3245692849159241, mean loss: 0.3646028239535663
Epoch: 12, step: 1309, loss: 0.3663112223148346, mean loss: 0.3646029156156739
Epoch: 12, step: 1310, loss: 0.3299639821052551, mean loss: 0.3646010572040901
Epoch: 12, step: 1311, loss: 0.31512725353240967, mean loss: 0.36459840303007335
Epoch: 12, step: 1312, loss: 0.2986757159233093, mean loss: 0.3645948665949515
Epoch: 12, step: 1313, loss: 0.3318197429180145, mean loss: 0.3645931084615068
Epoch: 12, step: 1314, loss: 0.3561369776725769, mean loss: 0.36459265487942294
Epoch: 12, step: 1315, loss: 0.31768500804901123, mean loss: 0.36459013891467124
Epoch: 12, step: 1316, loss: 0.31292229890823364, mean loss: 0.3645873677781732
Epoch: 12, step: 1317, loss: 0.3110833764076233, mean loss: 0.36458449831601664
Epoch: 12, step: 1318, loss: 0.31726545095443726, mean loss: 0.36458196069348425
Epoch: 12, step: 1319, loss: 0.329527884721756, mean loss: 0.3645800809167805
Epoch: 12, step: 1320, loss: 0.3109937608242035, mean loss: 0.364577207501579
Epoch: 12, step: 1321, loss: 0.34410008788108826, mean loss: 0.36457610953269853
Epoch: 12, step: 1322, loss: 0.2953438460826874, mean loss: 0.3645723975460249
Epoch: 12, step: 1323, loss: 0.2925097942352295, mean loss: 0.36456853401378647
Epoch: 12, step: 1324, loss: 0.36031562089920044, mean loss: 0.3645683060122256
Epoch: 12, step: 1325, loss: 0.30973824858665466, mean loss: 0.36456536669318274
Epoch: 12, step: 1326, loss: 0.34247061610221863, mean loss: 0.3645641823055874
Epoch: 12, step: 1327, loss: 0.31337714195251465, mean loss: 0.3645614385748652
Epoch: 12, step: 1328, loss: 0.35727807879447937, mean loss: 0.3645610481927148
Epoch: 12, step: 1329, loss: 0.33314549922943115, mean loss: 0.36455936443513287
Epoch: 12, step: 1330, loss: 0.3579913079738617, mean loss: 0.3645590124303919
Epoch: 12, step: 1331, loss: 0.3249262869358063, mean loss: 0.36455688849011886
Epoch: 12, step: 1332, loss: 0.3261723816394806, mean loss: 0.3645548315528245
Epoch: 12, step: 1333, loss: 0.313150018453598, mean loss: 0.3645520770349218
Epoch: 12, step: 1334, loss: 0.3105272948741913, mean loss: 0.3645491822815509
Epoch: 12, step: 1335, loss: 0.3060626983642578, mean loss: 0.3645460486293908
Epoch: 12, step: 1336, loss: 0.30652275681495667, mean loss: 0.3645429399611982
Epoch: 12, step: 1337, loss: 0.2996528744697571, mean loss: 0.3645394635835334
Epoch: 12, step: 1338, loss: 0.3336344063282013, mean loss: 0.3645378079850304
Epoch: 12, step: 1339, loss: 0.35014811158180237, mean loss: 0.36453703716349606
Epoch: 12, step: 1340, loss: 0.30453404784202576, mean loss: 0.3645338231193951
Epoch: 12, step: 1341, loss: 0.3761832118034363, mean loss: 0.36453444708236693
Epoch: 12, step: 1342, loss: 0.3267422616481781, mean loss: 0.3645324229708874
Epoch: 12, step: 1343, loss: 0.34832218289375305, mean loss: 0.36453155481321403
Epoch: 12, step: 1344, loss: 0.351044625043869, mean loss: 0.3645308325441748
Epoch: 12, step: 1345, loss: 0.3077540099620819, mean loss: 0.36452779212313047
Epoch: 12, step: 1346, loss: 0.3472593128681183, mean loss: 0.364526867438833
Epoch: 12, step: 1347, loss: 0.3121579885482788, mean loss: 0.364524063365215
Epoch: 12, step: 1348, loss: 0.3010243773460388, mean loss: 0.3645206634784013
Epoch: 12, step: 1349, loss: 0.31389564275741577, mean loss: 0.36451795306932533
Epoch: 12, step: 1350, loss: 0.3172151446342468, mean loss: 0.36451542066349873
Epoch: 12, step: 1351, loss: 0.36349961161613464, mean loss: 0.3645153662839994
Epoch: 12, step: 1352, loss: 0.3795047998428345, mean loss: 0.3645161686732483
Epoch: 12, step: 1353, loss: 0.30502378940582275, mean loss: 0.36451298419732137
Epoch: 12, step: 1354, loss: 0.32704606652259827, mean loss: 0.36451097879574373
Epoch: 12, step: 1355, loss: 0.3147278428077698, mean loss: 0.3645083143161897
Epoch: 12, step: 1356, loss: 0.31848931312561035, mean loss: 0.36450585143145914
Epoch: 12, step: 1357, loss: 0.31162235140800476, mean loss: 0.36450302131800394
Epoch: 12, step: 1358, loss: 0.36893898248672485, mean loss: 0.3645032587002038
Epoch: 12, step: 1359, loss: 0.3357180058956146, mean loss: 0.3645017183934398
Epoch: 12, step: 1360, loss: 0.34379130601882935, mean loss: 0.36450061023289754
Epoch: 12, step: 1361, loss: 0.32569828629493713, mean loss: 0.36449853413209826
Epoch: 12, step: 1362, loss: 0.31869372725486755, mean loss: 0.3644960834977353
Epoch: 12, step: 1363, loss: 0.3407285809516907, mean loss: 0.3644948119643228
Epoch: 12, step: 1364, loss: 0.3557322323322296, mean loss: 0.3644943432017041
Epoch: 12, step: 1365, loss: 0.32907068729400635, mean loss: 0.3644924482805579
Epoch: 12, step: 1366, loss: 0.3452313244342804, mean loss: 0.3644914179984586
Epoch: 12, step: 1367, loss: 0.364406943321228, mean loss: 0.36449141348012964
Epoch: 12, step: 1368, loss: 0.2935805916786194, mean loss: 0.36448762084912995
Epoch: 12, step: 1369, loss: 0.31637656688690186, mean loss: 0.36448504779030216
Epoch: 12, step: 1370, loss: 0.33331695199012756, mean loss: 0.3644833809580758
Epoch: 12, step: 1371, loss: 0.35817888379096985, mean loss: 0.3644830438191899
Epoch: 12, step: 1372, loss: 0.30511677265167236, mean loss: 0.36447986932204174
Epoch: 12, step: 1373, loss: 0.3264431953430176, mean loss: 0.36447783549282675
Epoch: 12, step: 1374, loss: 0.3661576807498932, mean loss: 0.3644779253097148
Epoch: 12, step: 1375, loss: 0.3116852045059204, mean loss: 0.36447510277331596
Epoch: 12, step: 1376, loss: 0.30321624875068665, mean loss: 0.36447182777443743
Epoch: 12, step: 1377, loss: 0.37045884132385254, mean loss: 0.3644721478328973
Epoch: 12, step: 1378, loss: 0.34867164492607117, mean loss: 0.36447130320238963
Epoch: 12, step: 1379, loss: 0.3413480520248413, mean loss: 0.3644700671936673
Epoch: 12, step: 1380, loss: 0.32537832856178284, mean loss: 0.3644679777319841
Epoch: 12, step: 1381, loss: 0.3105233907699585, mean loss: 0.36446509453652914
Epoch: 12, step: 1382, loss: 0.32385018467903137, mean loss: 0.364462923893065
Epoch: 12, step: 1383, loss: 0.3219108283519745, mean loss: 0.36446064983922033
Epoch: 12, step: 1384, loss: 0.3612673878669739, mean loss: 0.36446047919517754
Epoch: 12, step: 1385, loss: 0.3088810443878174, mean loss: 0.364457509256372
Epoch: 12, step: 1386, loss: 0.32809218764305115, mean loss: 0.36445556614541214
Epoch: 12, step: 1387, loss: 0.3283129930496216, mean loss: 0.36445363503977546
Epoch: 12, step: 1388, loss: 0.3851678967475891, mean loss: 0.3644547417482067
Epoch: 12, step: 1389, loss: 0.3184051811695099, mean loss: 0.3644522815729434
Epoch: 12, step: 1390, loss: 0.3192793130874634, mean loss: 0.364449868358109
Epoch: 12, step: 1391, loss: 0.329003244638443, mean loss: 0.3644479748418847
Epoch: 12, step: 1392, loss: 0.3656780421733856, mean loss: 0.3644480405470998
Epoch: 12, step: 1393, loss: 0.37489551305770874, mean loss: 0.3644485985789613
Epoch: 12, step: 1394, loss: 0.3560622036457062, mean loss: 0.3644481506595609
Epoch: 12, step: 1395, loss: 0.29026588797569275, mean loss: 0.36444418877840923
Epoch: 12, step: 1396, loss: 0.31061089038848877, mean loss: 0.3644413138359051
Epoch: 12, step: 1397, loss: 0.34917426109313965, mean loss: 0.3644404985495256
Epoch: 12, step: 1398, loss: 0.3040568232536316, mean loss: 0.36443727413155713
Epoch: 12, step: 1399, loss: 0.3183411955833435, mean loss: 0.36443481278605583
Epoch: 12, step: 1400, loss: 0.3858179450035095, mean loss: 0.36443595449849203
Epoch: 12, step: 1401, loss: 0.3468721807003021, mean loss: 0.36443501676363893
Epoch: 12, step: 1402, loss: 0.3318544924259186, mean loss: 0.36443327737309184
Epoch: 12, step: 1403, loss: 0.37456178665161133, mean loss: 0.36443381807933134
Epoch: 12, step: 1404, loss: 0.3164379894733429, mean loss: 0.3644312559788346
Epoch: 12, step: 1405, loss: 0.3408823013305664, mean loss: 0.36442999896193223
Epoch: 12, step: 1406, loss: 0.313710480928421, mean loss: 0.36442729175520505
Epoch: 12, step: 1407, loss: 0.37523603439331055, mean loss: 0.36442786865222887
Epoch: 12, step: 1408, loss: 0.33720332384109497, mean loss: 0.364426415669104
Epoch: 12, step: 1409, loss: 0.3252900242805481, mean loss: 0.3644243270581856
Epoch: 12, step: 1410, loss: 0.30126529932022095, mean loss: 0.3644209565993704
Epoch: 12, step: 1411, loss: 0.3565390110015869, mean loss: 0.3644205360046213
Epoch: 12, step: 1412, loss: 0.37353479862213135, mean loss: 0.36442102233206475
Epoch: 12, step: 1413, loss: 0.31543949246406555, mean loss: 0.36441840886872745
Epoch: 12, step: 1414, loss: 0.32589730620384216, mean loss: 0.36441635364263425
Epoch: 12, step: 1415, loss: 0.32546931505203247, mean loss: 0.3644142758023339
Epoch: 12, step: 1416, loss: 0.30910173058509827, mean loss: 0.36441132501304513
Epoch: 12, step: 1417, loss: 0.3207769989967346, mean loss: 0.3644089973524233
Epoch: 12, step: 1418, loss: 0.3255419135093689, mean loss: 0.36440692410956615
Epoch: 12, step: 1419, loss: 0.3088042438030243, mean loss: 0.3644039583169319
Epoch: 12, step: 1420, loss: 0.3268197774887085, mean loss: 0.3644019537203759
Epoch: 12, step: 1421, loss: 0.35739070177078247, mean loss: 0.3644015797869386
Epoch: 12, step: 1422, loss: 0.36330386996269226, mean loss: 0.3644015212455369
Epoch: 12, step: 1423, loss: 0.32801222801208496, mean loss: 0.36439958069022366
Epoch: 12, step: 1424, loss: 0.3203355371952057, mean loss: 0.36439723098385696
Epoch: 12, step: 1425, loss: 0.30402350425720215, mean loss: 0.3643940117385372
Epoch: 12, step: 1426, loss: 0.3070681095123291, mean loss: 0.3643909551721695
Epoch: 12, step: 1427, loss: 0.3295955955982208, mean loss: 0.36438910001330976
Epoch: 12, step: 1428, loss: 0.3633674383163452, mean loss: 0.3643890455450208
Epoch: 12, step: 1429, loss: 0.31372418999671936, mean loss: 0.36438634457180674
Epoch: 12, step: 1430, loss: 0.33173617720603943, mean loss: 0.3643846040649905
Epoch: 12, step: 1431, loss: 0.3986581563949585, mean loss: 0.36438643101340895
Epoch: 12, step: 1432, loss: 0.38625097274780273, mean loss: 0.36438759643858537
Epoch: 12, step: 1433, loss: 0.3187077045440674, mean loss: 0.364385161735894
Epoch: 12, step: 1434, loss: 0.32110410928726196, mean loss: 0.364382855012425
Epoch: 12, step: 1435, loss: 0.3261864185333252, mean loss: 0.36438081938907824
Epoch: 12, step: 1436, loss: 0.34832340478897095, mean loss: 0.3643799636782016
Epoch: 12, step: 1437, loss: 0.31106096506118774, mean loss: 0.3643771224228133
Epoch: 12, step: 1438, loss: 0.3442167341709137, mean loss: 0.3643760481760902
Epoch: 12, step: 1439, loss: 0.3168121874332428, mean loss: 0.3643735138697846
Epoch: 12, step: 1440, loss: 0.3421049118041992, mean loss: 0.3643723274132837
Epoch: 12, step: 1441, loss: 0.32505232095718384, mean loss: 0.36437023258076073
Epoch: 12, step: 1442, loss: 0.29785123467445374, mean loss: 0.36436668886982865
Epoch: 12, step: 1443, loss: 0.32317227125167847, mean loss: 0.3643644944090563
Valid: 12, mean loss: 0.1946614185969035
Epoch: 13, step: 0, loss: 0.3031511604785919, mean loss: 0.3643612336977193
Epoch: 13, step: 1, loss: 0.33171576261520386, mean loss: 0.36435949483167673
Epoch: 13, step: 2, loss: 0.32106050848960876, mean loss: 0.3643571886273443
Epoch: 13, step: 3, loss: 0.29151204228401184, mean loss: 0.36435330893271584
Epoch: 13, step: 4, loss: 0.3586638569831848, mean loss: 0.36435300593160014
Epoch: 13, step: 5, loss: 0.330883264541626, mean loss: 0.36435122354043015
Epoch: 13, step: 6, loss: 0.3253985345363617, mean loss: 0.3643491492718853
Epoch: 13, step: 7, loss: 0.3635880947113037, mean loss: 0.36434910874714826
Epoch: 13, step: 8, loss: 0.331139475107193, mean loss: 0.3643473404902056
Epoch: 13, step: 9, loss: 0.34371137619018555, mean loss: 0.36434624178057406
Epoch: 13, step: 10, loss: 0.3248741924762726, mean loss: 0.36434414030321133
Epoch: 13, step: 11, loss: 0.32523420453071594, mean loss: 0.3643420582154892
Epoch: 13, step: 12, loss: 0.38367873430252075, mean loss: 0.36434308758339373
Epoch: 13, step: 13, loss: 0.3255297839641571, mean loss: 0.36434102150739994
Epoch: 13, step: 14, loss: 0.2911015450954437, mean loss: 0.3643371230948587
Epoch: 13, step: 15, loss: 0.3384036719799042, mean loss: 0.3643357427749143
Epoch: 13, step: 16, loss: 0.3261145353317261, mean loss: 0.36433370854172237
Epoch: 13, step: 17, loss: 0.30025067925453186, mean loss: 0.36433029805586353
Epoch: 13, step: 18, loss: 0.37922272086143494, mean loss: 0.3643310905854152
Epoch: 13, step: 19, loss: 0.32993239164352417, mean loss: 0.36432926008845146
Epoch: 13, step: 20, loss: 0.3742256164550781, mean loss: 0.3643297866864596
Epoch: 13, step: 21, loss: 0.3312761187553406, mean loss: 0.364328027951335
Epoch: 13, step: 22, loss: 0.3401729166507721, mean loss: 0.3643267427631839
Epoch: 13, step: 23, loss: 0.35001859068870544, mean loss: 0.3643259815293004
Epoch: 13, step: 24, loss: 0.34133636951446533, mean loss: 0.36432475848243046
Epoch: 13, step: 25, loss: 0.3111732602119446, mean loss: 0.3643219309742769
Epoch: 13, step: 26, loss: 0.3575451672077179, mean loss: 0.36432157048894437
Epoch: 13, step: 27, loss: 0.31906944513320923, mean loss: 0.3643191634609999
Epoch: 13, step: 28, loss: 0.37879061698913574, mean loss: 0.36431993317822386
Epoch: 13, step: 29, loss: 0.34943312406539917, mean loss: 0.3643191414109059
Epoch: 13, step: 30, loss: 0.33812886476516724, mean loss: 0.36431774853335197
Epoch: 13, step: 31, loss: 0.3580327033996582, mean loss: 0.36431741429355546
Epoch: 13, step: 32, loss: 0.3678373098373413, mean loss: 0.3643176014722603
Epoch: 13, step: 33, loss: 0.3107856810092926, mean loss: 0.3643147549381508
Epoch: 13, step: 34, loss: 0.3211897909641266, mean loss: 0.3643124619108751
Epoch: 13, step: 35, loss: 0.3123018741607666, mean loss: 0.36430969656699214
Epoch: 13, step: 36, loss: 0.33192941546440125, mean loss: 0.36430797503575163
Epoch: 13, step: 37, loss: 0.32406020164489746, mean loss: 0.36430583533488026
Epoch: 13, step: 38, loss: 0.34248459339141846, mean loss: 0.36430467530926
Epoch: 13, step: 39, loss: 0.3238913416862488, mean loss: 0.3643025270350933
Epoch: 13, step: 40, loss: 0.34581461548805237, mean loss: 0.3643015443150834
Epoch: 13, step: 41, loss: 0.30221429467201233, mean loss: 0.36429824425929286
Epoch: 13, step: 42, loss: 0.313603013753891, mean loss: 0.36429554985427
Epoch: 13, step: 43, loss: 0.34656524658203125, mean loss: 0.36429460755498894
Epoch: 13, step: 44, loss: 0.34772005677223206, mean loss: 0.3642937267264412
Epoch: 13, step: 45, loss: 0.33347997069358826, mean loss: 0.36429208926464757
Epoch: 13, step: 46, loss: 0.330485999584198, mean loss: 0.36429029288387915
Epoch: 13, step: 47, loss: 0.2985670566558838, mean loss: 0.36428680068216673
Epoch: 13, step: 48, loss: 0.36449721455574036, mean loss: 0.36428681186190603
Epoch: 13, step: 49, loss: 0.3342719078063965, mean loss: 0.36428521719056106
Epoch: 13, step: 50, loss: 0.332474023103714, mean loss: 0.36428352717334345
Epoch: 13, step: 51, loss: 0.3026241362094879, mean loss: 0.3642802516000878
Epoch: 13, step: 52, loss: 0.36482521891593933, mean loss: 0.3642802805492148
Epoch: 13, step: 53, loss: 0.33062195777893066, mean loss: 0.36427849268547474
Epoch: 13, step: 54, loss: 0.33589333295822144, mean loss: 0.3642769850018434
Epoch: 13, step: 55, loss: 0.3113168776035309, mean loss: 0.36427417216418684
Epoch: 13, step: 56, loss: 0.35054874420166016, mean loss: 0.36427344321267785
Epoch: 13, step: 57, loss: 0.3353050649166107, mean loss: 0.36427190479641147
Epoch: 13, step: 58, loss: 0.33930671215057373, mean loss: 0.36427057904670906
Epoch: 13, step: 59, loss: 0.3417227268218994, mean loss: 0.36426938173085177
Epoch: 13, step: 60, loss: 0.3734785318374634, mean loss: 0.36426987072092804
Epoch: 13, step: 61, loss: 0.3223336935043335, mean loss: 0.36426764410007123
Epoch: 13, step: 62, loss: 0.3326619267463684, mean loss: 0.36426596606888706
Epoch: 13, step: 63, loss: 0.3753083646297455, mean loss: 0.36426655230792726
Epoch: 13, step: 64, loss: 0.3079088628292084, mean loss: 0.36426356044672437
Epoch: 13, step: 65, loss: 0.33839449286460876, mean loss: 0.3642621872081862
Epoch: 13, step: 66, loss: 0.3849349319934845, mean loss: 0.36426328454587853
Epoch: 13, step: 67, loss: 0.3930629789829254, mean loss: 0.3642648131920801
Epoch: 13, step: 68, loss: 0.326186865568161, mean loss: 0.3642627921768673
Epoch: 13, step: 69, loss: 0.33030611276626587, mean loss: 0.36426098999666295
Epoch: 13, step: 70, loss: 0.31831470131874084, mean loss: 0.36425855162227044
Epoch: 13, step: 71, loss: 0.3214398920536041, mean loss: 0.3642562793520747
Epoch: 13, step: 72, loss: 0.38352710008621216, mean loss: 0.3642573019480277
Epoch: 13, step: 73, loss: 0.32129064202308655, mean loss: 0.36425502206582855
Epoch: 13, step: 74, loss: 0.30826419591903687, mean loss: 0.3642520512574162
Epoch: 13, step: 75, loss: 0.380939781665802, mean loss: 0.36425293664209407
Epoch: 13, step: 76, loss: 0.34207314252853394, mean loss: 0.3642517599327666
Epoch: 13, step: 77, loss: 0.291517436504364, mean loss: 0.3642479013479693
Epoch: 13, step: 78, loss: 0.3366972804069519, mean loss: 0.36424643985409944
Epoch: 13, step: 79, loss: 0.3031065762042999, mean loss: 0.36424319670410743
Epoch: 13, step: 80, loss: 0.2959069311618805, mean loss: 0.36423957201490453
Epoch: 13, step: 81, loss: 0.32659199833869934, mean loss: 0.36423757521986494
Epoch: 13, step: 82, loss: 0.3053564727306366, mean loss: 0.3642344523822893
Epoch: 13, step: 83, loss: 0.32979199290275574, mean loss: 0.3642326257775227
Epoch: 13, step: 84, loss: 0.3225633203983307, mean loss: 0.3642304160248908
Epoch: 13, step: 85, loss: 0.40556788444519043, mean loss: 0.36423260806372953
Epoch: 13, step: 86, loss: 0.3747093379497528, mean loss: 0.3642331635931789
Epoch: 13, step: 87, loss: 0.3494517505168915, mean loss: 0.3642323798491134
Epoch: 13, step: 88, loss: 0.3467763662338257, mean loss: 0.3642314543407302
Epoch: 13, step: 89, loss: 0.3671991527080536, mean loss: 0.3642316116781476
Epoch: 13, step: 90, loss: 0.3731226921081543, mean loss: 0.3642320830284328
Epoch: 13, step: 91, loss: 0.34347987174987793, mean loss: 0.36423098293241507
Epoch: 13, step: 92, loss: 0.35470157861709595, mean loss: 0.3642304777956902
Epoch: 13, step: 93, loss: 0.3404923379421234, mean loss: 0.36422921954593646
Epoch: 13, step: 94, loss: 0.3844405710697174, mean loss: 0.36423029080005864
Epoch: 13, step: 95, loss: 0.34199634194374084, mean loss: 0.36422911240548284
Epoch: 13, step: 96, loss: 0.3543175160884857, mean loss: 0.36422858712081924
Epoch: 13, step: 97, loss: 0.30798450112342834, mean loss: 0.3642256065121283
Epoch: 13, step: 98, loss: 0.31258752942085266, mean loss: 0.36422287014007115
Epoch: 13, step: 99, loss: 0.3484342396259308, mean loss: 0.36422203352336313
Epoch: 13, step: 100, loss: 0.3149525821208954, mean loss: 0.36421942294468446
Epoch: 13, step: 101, loss: 0.3486844003200531, mean loss: 0.36421859985352073
Epoch: 13, step: 102, loss: 0.3679504990577698, mean loss: 0.36421879757003484
Epoch: 13, step: 103, loss: 0.32664865255355835, mean loss: 0.3642168072042255
Epoch: 13, step: 104, loss: 0.38222718238830566, mean loss: 0.3642177612951925
Epoch: 13, step: 105, loss: 0.32840830087661743, mean loss: 0.36421586440672876
Epoch: 13, step: 106, loss: 0.3073103129863739, mean loss: 0.3642128501818535
Epoch: 13, step: 107, loss: 0.3315531015396118, mean loss: 0.3642111203222856
Epoch: 13, step: 108, loss: 0.3635347783565521, mean loss: 0.36421108450098555
Epoch: 13, step: 109, loss: 0.3259848654270172, mean loss: 0.3642090600216362
Epoch: 13, step: 110, loss: 0.2859061062335968, mean loss: 0.3642049132783334
Epoch: 13, step: 111, loss: 0.290762722492218, mean loss: 0.36420102415575417
Epoch: 13, step: 112, loss: 0.36568549275398254, mean loss: 0.36420110276145173
Epoch: 13, step: 113, loss: 0.3469594717025757, mean loss: 0.36420018982959435
Epoch: 13, step: 114, loss: 0.372875452041626, mean loss: 0.3642006491541145
Epoch: 13, step: 115, loss: 0.31507813930511475, mean loss: 0.3641980484282648
Epoch: 13, step: 116, loss: 0.3375513553619385, mean loss: 0.36419663772928307
Epoch: 13, step: 117, loss: 0.3105258047580719, mean loss: 0.3641937964993746
Epoch: 13, step: 118, loss: 0.38674840331077576, mean loss: 0.36419499043335435
Epoch: 13, step: 119, loss: 0.342180460691452, mean loss: 0.36419382515017934
Epoch: 13, step: 120, loss: 0.341839998960495, mean loss: 0.36419264196983797
Epoch: 13, step: 121, loss: 0.37966814637184143, mean loss: 0.36419346103961686
Epoch: 13, step: 122, loss: 0.4046671986579895, mean loss: 0.3641956030738914
Epoch: 13, step: 123, loss: 0.4386822581291199, mean loss: 0.3641995450010218
Epoch: 13, step: 124, loss: 0.35130929946899414, mean loss: 0.3641988628691738
Epoch: 13, step: 125, loss: 0.39081433415412903, mean loss: 0.3642002712442021
Epoch: 13, step: 126, loss: 0.3581952154636383, mean loss: 0.3641999534995712
Epoch: 13, step: 127, loss: 0.3330419063568115, mean loss: 0.3641983049256483
Epoch: 13, step: 128, loss: 0.32811641693115234, mean loss: 0.3641963959320504
Epoch: 13, step: 129, loss: 0.35583874583244324, mean loss: 0.36419595377513053
Epoch: 13, step: 130, loss: 0.3050820529460907, mean loss: 0.3641928265518946
Epoch: 13, step: 131, loss: 0.3076981008052826, mean loss: 0.36418983804545435
Epoch: 13, step: 132, loss: 0.3490805923938751, mean loss: 0.36418903882590126
Epoch: 13, step: 133, loss: 0.3177606761455536, mean loss: 0.3641865830783777
Epoch: 13, step: 134, loss: 0.3594079315662384, mean loss: 0.3641863303332826
Epoch: 13, step: 135, loss: 0.35253873467445374, mean loss: 0.3641857143191268
Epoch: 13, step: 136, loss: 0.32893767952919006, mean loss: 0.3641838502314019
Epoch: 13, step: 137, loss: 0.3634324073791504, mean loss: 0.36418381049354615
Epoch: 13, step: 138, loss: 0.32617422938346863, mean loss: 0.36418180057439276
Epoch: 13, step: 139, loss: 0.34099435806274414, mean loss: 0.36418057450403996
Epoch: 13, step: 140, loss: 0.3230087459087372, mean loss: 0.3641783975977535
Epoch: 13, step: 141, loss: 0.3349161148071289, mean loss: 0.3641768504748398
Epoch: 13, step: 142, loss: 0.35728615522384644, mean loss: 0.3641764861769148
Epoch: 13, step: 143, loss: 0.3312990665435791, mean loss: 0.36417474810228834
Epoch: 13, step: 144, loss: 0.32310277223587036, mean loss: 0.3641725769347741
Epoch: 13, step: 145, loss: 0.3554210364818573, mean loss: 0.36417211433088087
Epoch: 13, step: 146, loss: 0.32801294326782227, mean loss: 0.36417020306860154
Epoch: 13, step: 147, loss: 0.36615097522735596, mean loss: 0.36417030776057613
Epoch: 13, step: 148, loss: 0.3547329604625702, mean loss: 0.3641698089842272
Epoch: 13, step: 149, loss: 0.3195362687110901, mean loss: 0.364167450166963
Epoch: 13, step: 150, loss: 0.353649377822876, mean loss: 0.36416689433161215
Epoch: 13, step: 151, loss: 0.2902039885520935, mean loss: 0.36416298591342466
Epoch: 13, step: 152, loss: 0.34576597809791565, mean loss: 0.36416201381261537
Epoch: 13, step: 153, loss: 0.36039888858795166, mean loss: 0.36416181497898836
Epoch: 13, step: 154, loss: 0.3216061592102051, mean loss: 0.3641595665690043
Epoch: 13, step: 155, loss: 0.3465907871723175, mean loss: 0.36415863837905305
Epoch: 13, step: 156, loss: 0.33398085832595825, mean loss: 0.3641570441173354
Epoch: 13, step: 157, loss: 0.3617950677871704, mean loss: 0.36415691934309713
Epoch: 13, step: 158, loss: 0.3245612382888794, mean loss: 0.3641548277641497
Epoch: 13, step: 159, loss: 0.32287096977233887, mean loss: 0.36415264712512624
Epoch: 13, step: 160, loss: 0.340166300535202, mean loss: 0.36415138021831855
Epoch: 13, step: 161, loss: 0.36550095677375793, mean loss: 0.36415145149626066
Epoch: 13, step: 162, loss: 0.31378716230392456, mean loss: 0.36414879164470576
Epoch: 13, step: 163, loss: 0.31491315364837646, mean loss: 0.3641461915370803
Epoch: 13, step: 164, loss: 0.30731526017189026, mean loss: 0.36414319048457117
Epoch: 13, step: 165, loss: 0.3706692159175873, mean loss: 0.36414353508407654
Epoch: 13, step: 166, loss: 0.3303281366825104, mean loss: 0.3641417495939027
Epoch: 13, step: 167, loss: 0.39829984307289124, mean loss: 0.36414355308352675
Epoch: 13, step: 168, loss: 0.30816277861595154, mean loss: 0.36414059754926414
Epoch: 13, step: 169, loss: 0.36404290795326233, mean loss: 0.3641405923919631
Epoch: 13, step: 170, loss: 0.32310473918914795, mean loss: 0.3641384261113738
Epoch: 13, step: 171, loss: 0.33583366870880127, mean loss: 0.36413693198355485
Epoch: 13, step: 172, loss: 0.33293941617012024, mean loss: 0.3641352852421553
Epoch: 13, step: 173, loss: 0.36021727323532104, mean loss: 0.3641350784432528
Epoch: 13, step: 174, loss: 0.35941267013549805, mean loss: 0.3641348292001902
Epoch: 13, step: 175, loss: 0.3113571107387543, mean loss: 0.3641320438023402
Epoch: 13, step: 176, loss: 0.3636277914047241, mean loss: 0.3641320171913107
Epoch: 13, step: 177, loss: 0.3414723873138428, mean loss: 0.36413082143247816
Epoch: 13, step: 178, loss: 0.3391455113887787, mean loss: 0.3641295030160335
Epoch: 13, step: 179, loss: 0.34500715136528015, mean loss: 0.3641284940274491
Epoch: 13, step: 180, loss: 0.32974886894226074, mean loss: 0.3641266800863799
Epoch: 13, step: 181, loss: 0.33748459815979004, mean loss: 0.3641252744684667
Epoch: 13, step: 182, loss: 0.3020539879798889, mean loss: 0.3641219998028646
Epoch: 13, step: 183, loss: 0.3510169982910156, mean loss: 0.36412130846494983
Epoch: 13, step: 184, loss: 0.3490537405014038, mean loss: 0.36412051363623416
Epoch: 13, step: 185, loss: 0.3870384097099304, mean loss: 0.3641217225135458
Epoch: 13, step: 186, loss: 0.35073143243789673, mean loss: 0.3641210162373669
Epoch: 13, step: 187, loss: 0.35004720091819763, mean loss: 0.36412027394752944
Epoch: 13, step: 188, loss: 0.33656787872314453, mean loss: 0.36411882083876806
Epoch: 13, step: 189, loss: 0.35234275460243225, mean loss: 0.3641181998037382
Epoch: 13, step: 190, loss: 0.327908992767334, mean loss: 0.3641162903375653
Epoch: 13, step: 191, loss: 0.35773766040802, mean loss: 0.36411595398289703
Epoch: 13, step: 192, loss: 0.35079097747802734, mean loss: 0.3641152513740647
Epoch: 13, step: 193, loss: 0.33748117089271545, mean loss: 0.3641138470673853
Epoch: 13, step: 194, loss: 0.3284498453140259, mean loss: 0.36411196674884505
Epoch: 13, step: 195, loss: 0.34855225682258606, mean loss: 0.36411114643516274
Epoch: 13, step: 196, loss: 0.31905823945999146, mean loss: 0.3641087713544007
Epoch: 13, step: 197, loss: 0.3402227461338043, mean loss: 0.3641075122070511
Epoch: 13, step: 198, loss: 0.3335922062397003, mean loss: 0.36410590368320067
Epoch: 13, step: 199, loss: 0.3661498427391052, mean loss: 0.3641060114177071
Epoch: 13, step: 200, loss: 0.2936088442802429, mean loss: 0.36410229576034464
Epoch: 13, step: 201, loss: 0.33067968487739563, mean loss: 0.36410053426509414
Epoch: 13, step: 202, loss: 0.3382111191749573, mean loss: 0.36409916986904195
Epoch: 13, step: 203, loss: 0.3589153289794922, mean loss: 0.364098896690243
Epoch: 13, step: 204, loss: 0.3369670510292053, mean loss: 0.3640974669676493
Epoch: 13, step: 205, loss: 0.3485346734523773, mean loss: 0.3640966469237292
Epoch: 13, step: 206, loss: 0.35190916061401367, mean loss: 0.3640960047673295
Epoch: 13, step: 207, loss: 0.33553212881088257, mean loss: 0.36409449982128334
Epoch: 13, step: 208, loss: 0.32454705238342285, mean loss: 0.3640924162931532
Epoch: 13, step: 209, loss: 0.34981614351272583, mean loss: 0.36409166419786393
Epoch: 13, step: 210, loss: 0.3763016164302826, mean loss: 0.3640923074024276
Epoch: 13, step: 211, loss: 0.3875713348388672, mean loss: 0.3640935441822125
Epoch: 13, step: 212, loss: 0.31666892766952515, mean loss: 0.36409104617765564
Epoch: 13, step: 213, loss: 0.3247673213481903, mean loss: 0.36408897498178344
Epoch: 13, step: 214, loss: 0.3063683807849884, mean loss: 0.36408593497576897
Epoch: 13, step: 215, loss: 0.31049424409866333, mean loss: 0.36408311257789255
Epoch: 13, step: 216, loss: 0.37486737966537476, mean loss: 0.364083680499694
Epoch: 13, step: 217, loss: 0.32574477791786194, mean loss: 0.3640816616001373
Epoch: 13, step: 218, loss: 0.33737608790397644, mean loss: 0.3640802553775215
Epoch: 13, step: 219, loss: 0.3453509509563446, mean loss: 0.3640792692094285
Epoch: 13, step: 220, loss: 0.37062880396842957, mean loss: 0.3640796140488303
Epoch: 13, step: 221, loss: 0.333077609539032, mean loss: 0.3640779818489509
Epoch: 13, step: 222, loss: 0.3585633635520935, mean loss: 0.36407769152948277
Epoch: 13, step: 223, loss: 0.32086601853370667, mean loss: 0.3640754167520035
Epoch: 13, step: 224, loss: 0.3354514241218567, mean loss: 0.3640739099881655
Epoch: 13, step: 225, loss: 0.33901187777519226, mean loss: 0.36407259079497606
Epoch: 13, step: 226, loss: 0.3085770606994629, mean loss: 0.3640696698238673
Epoch: 13, step: 227, loss: 0.33511418104171753, mean loss: 0.3640681458507735
Epoch: 13, step: 228, loss: 0.3258303105831146, mean loss: 0.36406613343904426
Epoch: 13, step: 229, loss: 0.3334011733531952, mean loss: 0.36406451966364767
Epoch: 13, step: 230, loss: 0.31268951296806335, mean loss: 0.36406181614279853
Epoch: 13, step: 231, loss: 0.34531161189079285, mean loss: 0.36406082949765795
Epoch: 13, step: 232, loss: 0.29775357246398926, mean loss: 0.36405734056016603
Epoch: 13, step: 233, loss: 0.3309069573879242, mean loss: 0.3640555963539589
Epoch: 13, step: 234, loss: 0.3465651571750641, mean loss: 0.3640546761435533
Epoch: 13, step: 235, loss: 0.28725141286849976, mean loss: 0.36405063556783385
Epoch: 13, step: 236, loss: 0.34299182891845703, mean loss: 0.3640495277343524
Epoch: 13, step: 237, loss: 0.31825125217437744, mean loss: 0.3640471185667795
Epoch: 13, step: 238, loss: 0.35216617584228516, mean loss: 0.36404649361581826
Epoch: 13, step: 239, loss: 0.33946654200553894, mean loss: 0.36404520075070096
Epoch: 13, step: 240, loss: 0.33405619859695435, mean loss: 0.36404362346136454
Epoch: 13, step: 241, loss: 0.3247169256210327, mean loss: 0.3640415551591746
Epoch: 13, step: 242, loss: 0.3017696738243103, mean loss: 0.36403828027716906
Epoch: 13, step: 243, loss: 0.3481147885322571, mean loss: 0.3640374429038127
Epoch: 13, step: 244, loss: 0.3043815493583679, mean loss: 0.3640343059267109
Epoch: 13, step: 245, loss: 0.38099581003189087, mean loss: 0.36403519779252774
Epoch: 13, step: 246, loss: 0.375698447227478, mean loss: 0.36403581103451915
Epoch: 13, step: 247, loss: 0.3557186424732208, mean loss: 0.36403537374910583
Epoch: 13, step: 248, loss: 0.32424837350845337, mean loss: 0.36403328200838553
Epoch: 13, step: 249, loss: 0.30563005805015564, mean loss: 0.36403021170957583
Epoch: 13, step: 250, loss: 0.3344872295856476, mean loss: 0.36402865869574397
Epoch: 13, step: 251, loss: 0.3543268144130707, mean loss: 0.36402814871654493
Epoch: 13, step: 252, loss: 0.33674684166908264, mean loss: 0.3640267147450838
Epoch: 13, step: 253, loss: 0.3554891347885132, mean loss: 0.36402626601282495
Epoch: 13, step: 254, loss: 0.3409605026245117, mean loss: 0.36402505374797034
Epoch: 13, step: 255, loss: 0.3230244815349579, mean loss: 0.36402289899853724
Epoch: 13, step: 256, loss: 0.33755603432655334, mean loss: 0.36402150812856654
Epoch: 13, step: 257, loss: 0.3345426917076111, mean loss: 0.364019959057814
Epoch: 13, step: 258, loss: 0.31496524810791016, mean loss: 0.3640173814365145
Epoch: 13, step: 259, loss: 0.3790983557701111, mean loss: 0.3640181738374358
Epoch: 13, step: 260, loss: 0.29806452989578247, mean loss: 0.364014708611568
Epoch: 13, step: 261, loss: 0.31177663803100586, mean loss: 0.3640119641505729
Epoch: 13, step: 262, loss: 0.3362440764904022, mean loss: 0.36401050537002866
Epoch: 13, step: 263, loss: 0.33092421293258667, mean loss: 0.3640087672794404
Epoch: 13, step: 264, loss: 0.3154165744781494, mean loss: 0.3640062147662923
Epoch: 13, step: 265, loss: 0.31639525294303894, mean loss: 0.3640037139278732
Epoch: 13, step: 266, loss: 0.3575170338153839, mean loss: 0.3640033732229983
Epoch: 13, step: 267, loss: 0.3497614860534668, mean loss: 0.3640026252247226
Epoch: 13, step: 268, loss: 0.3527359366416931, mean loss: 0.3640020335179539
Epoch: 13, step: 269, loss: 0.36865195631980896, mean loss: 0.3640022777109379
Epoch: 13, step: 270, loss: 0.3406597971916199, mean loss: 0.3640010519334596
Epoch: 13, step: 271, loss: 0.3391040563583374, mean loss: 0.3639997445927972
Epoch: 13, step: 272, loss: 0.32720932364463806, mean loss: 0.36399781283008004
Epoch: 13, step: 273, loss: 0.3188304901123047, mean loss: 0.36399544134406103
Epoch: 13, step: 274, loss: 0.3490521013736725, mean loss: 0.3639946567932147
Epoch: 13, step: 275, loss: 0.3646160960197449, mean loss: 0.3639946894181216
Epoch: 13, step: 276, loss: 0.3210827708244324, mean loss: 0.36399243670571707
Epoch: 13, step: 277, loss: 0.3708287477493286, mean loss: 0.36399279556718916
Epoch: 13, step: 278, loss: 0.3259789049625397, mean loss: 0.3639908001921115
Epoch: 13, step: 279, loss: 0.33121639490127563, mean loss: 0.36398907993149365
Epoch: 13, step: 280, loss: 0.31715160608291626, mean loss: 0.3639866216585787
Epoch: 13, step: 281, loss: 0.32684004306793213, mean loss: 0.36398467211629937
Epoch: 13, step: 282, loss: 0.3510386347770691, mean loss: 0.363983992712608
Epoch: 13, step: 283, loss: 0.3142847418785095, mean loss: 0.363981384649487
Epoch: 13, step: 284, loss: 0.3308502435684204, mean loss: 0.3639796461208056
Epoch: 13, step: 285, loss: 0.3530585765838623, mean loss: 0.36397907307696376
Epoch: 13, step: 286, loss: 0.38052132725715637, mean loss: 0.3639799410267082
Epoch: 13, step: 287, loss: 0.33866772055625916, mean loss: 0.36397861299835194
Epoch: 13, step: 288, loss: 0.3386196792125702, mean loss: 0.3639772825889408
Epoch: 13, step: 289, loss: 0.35263535380363464, mean loss: 0.3639766875869061
Epoch: 13, step: 290, loss: 0.32738515734672546, mean loss: 0.36397476808156903
Epoch: 13, step: 291, loss: 0.32037827372550964, mean loss: 0.3639724812323057
Epoch: 13, step: 292, loss: 0.3418459892272949, mean loss: 0.3639713206505063
Epoch: 13, step: 293, loss: 0.31618115305900574, mean loss: 0.36396881408554294
Epoch: 13, step: 294, loss: 0.3543711304664612, mean loss: 0.36396831071932806
Epoch: 13, step: 295, loss: 0.3742190897464752, mean loss: 0.363968848310005
Epoch: 13, step: 296, loss: 0.31039124727249146, mean loss: 0.3639660386398053
Epoch: 13, step: 297, loss: 0.342011034488678, mean loss: 0.3639648873548472
Epoch: 13, step: 298, loss: 0.3237062990665436, mean loss: 0.36396277637019575
Epoch: 13, step: 299, loss: 0.3365020751953125, mean loss: 0.3639613365263841
Epoch: 13, step: 300, loss: 0.2985885441303253, mean loss: 0.36395790902193303
Epoch: 13, step: 301, loss: 0.34892821311950684, mean loss: 0.36395712105423345
Epoch: 13, step: 302, loss: 0.3539501130580902, mean loss: 0.363956596440446
Epoch: 13, step: 303, loss: 0.3460451662540436, mean loss: 0.36395565748939823
Epoch: 13, step: 304, loss: 0.30277231335639954, mean loss: 0.36395245031090406
Epoch: 13, step: 305, loss: 0.31430405378341675, mean loss: 0.3639498479208984
Epoch: 13, step: 306, loss: 0.425733357667923, mean loss: 0.3639530862200622
Epoch: 13, step: 307, loss: 0.3349281847476959, mean loss: 0.36395156499881104
Epoch: 13, step: 308, loss: 0.33727577328681946, mean loss: 0.363950166969792
Epoch: 13, step: 309, loss: 0.29088354110717773, mean loss: 0.36394633788343506
Epoch: 13, step: 310, loss: 0.3392954468727112, mean loss: 0.36394504611112405
Epoch: 13, step: 311, loss: 0.366099089384079, mean loss: 0.36394515898281093
Epoch: 13, step: 312, loss: 0.34272268414497375, mean loss: 0.3639440469851773
Epoch: 13, step: 313, loss: 0.319574236869812, mean loss: 0.3639417222544786
Epoch: 13, step: 314, loss: 0.3835790157318115, mean loss: 0.36394275108527846
Epoch: 13, step: 315, loss: 0.34517526626586914, mean loss: 0.36394176787672755
Epoch: 13, step: 316, loss: 0.3098861575126648, mean loss: 0.3639389361091984
Epoch: 13, step: 317, loss: 0.3202163279056549, mean loss: 0.3639366457682763
Epoch: 13, step: 318, loss: 0.3691444396972656, mean loss: 0.3639369185561831
Epoch: 13, step: 319, loss: 0.3365285098552704, mean loss: 0.36393548295966616
Epoch: 13, step: 320, loss: 0.31581804156303406, mean loss: 0.36393296279827736
Epoch: 13, step: 321, loss: 0.3316112458705902, mean loss: 0.36393127003002934
Epoch: 13, step: 322, loss: 0.34040698409080505, mean loss: 0.3639300380695193
Epoch: 13, step: 323, loss: 0.30270150303840637, mean loss: 0.36392683171556917
Epoch: 13, step: 324, loss: 0.349667489528656, mean loss: 0.3639260850358715
Epoch: 13, step: 325, loss: 0.3535076379776001, mean loss: 0.36392553951031603
Epoch: 13, step: 326, loss: 0.3477749526500702, mean loss: 0.3639246938855786
Epoch: 13, step: 327, loss: 0.31012141704559326, mean loss: 0.3639218769600896
Epoch: 13, step: 328, loss: 0.3555343449115753, mean loss: 0.3639214378452763
Epoch: 13, step: 329, loss: 0.38667312264442444, mean loss: 0.3639226289082435
Epoch: 13, step: 330, loss: 0.3242816925048828, mean loss: 0.3639205537924814
Epoch: 13, step: 331, loss: 0.3134118616580963, mean loss: 0.3639179099120305
Epoch: 13, step: 332, loss: 0.3282308280467987, mean loss: 0.3639160419674157
Epoch: 13, step: 333, loss: 0.3264314830303192, mean loss: 0.3639140800413748
Epoch: 13, step: 334, loss: 0.3747618496417999, mean loss: 0.36391464777935567
Epoch: 13, step: 335, loss: 0.34447231888771057, mean loss: 0.36391363028255375
Epoch: 13, step: 336, loss: 0.2989623248577118, mean loss: 0.36391023129226513
Epoch: 13, step: 337, loss: 0.3203294277191162, mean loss: 0.3639079507687919
Epoch: 13, step: 338, loss: 0.3410157561302185, mean loss: 0.36390675291443375
Epoch: 13, step: 339, loss: 0.36031532287597656, mean loss: 0.3639065649995092
Epoch: 13, step: 340, loss: 0.34550660848617554, mean loss: 0.3639056023062369
Epoch: 13, step: 341, loss: 0.33217963576316833, mean loss: 0.3639039424774966
Epoch: 13, step: 342, loss: 0.3021421432495117, mean loss: 0.363900711412928
Epoch: 13, step: 343, loss: 0.34331855177879333, mean loss: 0.36389963471489317
Epoch: 13, step: 344, loss: 0.363662987947464, mean loss: 0.3638996223360279
Epoch: 13, step: 345, loss: 0.32007622718811035, mean loss: 0.3638973300776773
Epoch: 13, step: 346, loss: 0.32481658458709717, mean loss: 0.3638952859987249
Epoch: 13, step: 347, loss: 0.33227166533470154, mean loss: 0.36389363204366926
Epoch: 13, step: 348, loss: 0.36679548025131226, mean loss: 0.36389378380603565
Epoch: 13, step: 349, loss: 0.39740458130836487, mean loss: 0.36389553627949567
Epoch: 13, step: 350, loss: 0.33902719616889954, mean loss: 0.3638942358381365
Epoch: 13, step: 351, loss: 0.301988422870636, mean loss: 0.3638909987636245
Epoch: 13, step: 352, loss: 0.321135938167572, mean loss: 0.36388876320490054
Epoch: 13, step: 353, loss: 0.3536141812801361, mean loss: 0.36388822599994786
Epoch: 13, step: 354, loss: 0.32128608226776123, mean loss: 0.3638859986698003
Epoch: 13, step: 355, loss: 0.3259429335594177, mean loss: 0.36388401502984263
Epoch: 13, step: 356, loss: 0.3120300769805908, mean loss: 0.3638813042797747
Epoch: 13, step: 357, loss: 0.34772247076034546, mean loss: 0.3638804595942797
Epoch: 13, step: 358, loss: 0.34871262311935425, mean loss: 0.3638796667535252
Epoch: 13, step: 359, loss: 0.3469861149787903, mean loss: 0.36387878375374605
Epoch: 13, step: 360, loss: 0.3095512390136719, mean loss: 0.3638759442855633
Epoch: 13, step: 361, loss: 0.3527137339115143, mean loss: 0.3638753609151037
Epoch: 13, step: 362, loss: 0.32839518785476685, mean loss: 0.36387350671217394
Epoch: 13, step: 363, loss: 0.34136396646499634, mean loss: 0.36387233041930983
Epoch: 13, step: 364, loss: 0.3160612881183624, mean loss: 0.36386983206312545
Epoch: 13, step: 365, loss: 0.38710999488830566, mean loss: 0.3638710464095998
Epoch: 13, step: 366, loss: 0.28764766454696655, mean loss: 0.3638670637886759
Epoch: 13, step: 367, loss: 0.3423652648925781, mean loss: 0.3638659403927043
Epoch: 13, step: 368, loss: 0.32163578271865845, mean loss: 0.36386373412565065
Epoch: 13, step: 369, loss: 0.3111765682697296, mean loss: 0.3638609816877729
Epoch: 13, step: 370, loss: 0.3104568123817444, mean loss: 0.36385819193855357
Epoch: 13, step: 371, loss: 0.30566084384918213, mean loss: 0.36385515196007
Epoch: 13, step: 372, loss: 0.3104006052017212, mean loss: 0.36385235987092096
Epoch: 13, step: 373, loss: 0.33789923787117004, mean loss: 0.3638510043333674
Epoch: 13, step: 374, loss: 0.31285473704338074, mean loss: 0.36384834092566437
Epoch: 13, step: 375, loss: 0.3566739857196808, mean loss: 0.36384796624657484
Epoch: 13, step: 376, loss: 0.3380139470100403, mean loss: 0.3638466171411784
Epoch: 13, step: 377, loss: 0.41746339201927185, mean loss: 0.3638494169727647
Epoch: 13, step: 378, loss: 0.3668883442878723, mean loss: 0.3638495756551998
Epoch: 13, step: 379, loss: 0.3339398205280304, mean loss: 0.3638480139511936
Epoch: 13, step: 380, loss: 0.27429625391960144, mean loss: 0.363843338351547
Epoch: 13, step: 381, loss: 0.3163316547870636, mean loss: 0.36384085784180675
Epoch: 13, step: 382, loss: 0.3290327787399292, mean loss: 0.363839040662005
Epoch: 13, step: 383, loss: 0.3593518137931824, mean loss: 0.36383880641545724
Epoch: 13, step: 384, loss: 0.3494219481945038, mean loss: 0.3638380538519963
Epoch: 13, step: 385, loss: 0.37879082560539246, mean loss: 0.3638388343495301
Epoch: 13, step: 386, loss: 0.30907052755355835, mean loss: 0.3638359757292057
Epoch: 13, step: 387, loss: 0.3449004292488098, mean loss: 0.36383498744389875
Epoch: 13, step: 388, loss: 0.34764787554740906, mean loss: 0.36383414264916486
Epoch: 13, step: 389, loss: 0.3375283479690552, mean loss: 0.3638327698386712
Epoch: 13, step: 390, loss: 0.3435128927230835, mean loss: 0.36383170946831606
Epoch: 13, step: 391, loss: 0.3174223303794861, mean loss: 0.3638292877724755
Epoch: 13, step: 392, loss: 0.3360297679901123, mean loss: 0.36382783723661416
Epoch: 13, step: 393, loss: 0.29837316274642944, mean loss: 0.36382442209133137
Epoch: 13, step: 394, loss: 0.3661770522594452, mean loss: 0.3638245448351185
Epoch: 13, step: 395, loss: 0.32479625940322876, mean loss: 0.36382250871839106
Epoch: 13, step: 396, loss: 0.3459613025188446, mean loss: 0.3638215769428055
Epoch: 13, step: 397, loss: 0.370655357837677, mean loss: 0.3638219334258986
Epoch: 13, step: 398, loss: 0.32496681809425354, mean loss: 0.3638199066607151
Epoch: 13, step: 399, loss: 0.34357479214668274, mean loss: 0.36381885068770686
Epoch: 13, step: 400, loss: 0.3094066381454468, mean loss: 0.363816012727422
Epoch: 13, step: 401, loss: 0.3066444396972656, mean loss: 0.3638130310035756
Epoch: 13, step: 402, loss: 0.3352110981941223, mean loss: 0.36381153937735344
Epoch: 13, step: 403, loss: 0.3646750748157501, mean loss: 0.36381158440944766
Epoch: 13, step: 404, loss: 0.3189624845981598, mean loss: 0.36380924571727413
Epoch: 13, step: 405, loss: 0.3546728789806366, mean loss: 0.3638087693189669
Epoch: 13, step: 406, loss: 0.3631993532180786, mean loss: 0.36380873754379084
Epoch: 13, step: 407, loss: 0.31742948293685913, mean loss: 0.36380631943875397
Epoch: 13, step: 408, loss: 0.3604357838630676, mean loss: 0.3638061437161339
Epoch: 13, step: 409, loss: 0.3582945168018341, mean loss: 0.3638058563828572
Epoch: 13, step: 410, loss: 0.3463270664215088, mean loss: 0.36380494522245677
Epoch: 13, step: 411, loss: 0.3337099552154541, mean loss: 0.363803376467765
Epoch: 13, step: 412, loss: 0.3617294728755951, mean loss: 0.3638032683674996
Epoch: 13, step: 413, loss: 0.31401723623275757, mean loss: 0.3638006734528673
Epoch: 13, step: 414, loss: 0.35702112317085266, mean loss: 0.36380032011204894
Epoch: 13, step: 415, loss: 0.3418344557285309, mean loss: 0.3637991753411305
Epoch: 13, step: 416, loss: 0.30377689003944397, mean loss: 0.36379604738838145
Epoch: 13, step: 417, loss: 0.32554522156715393, mean loss: 0.36379405411970916
Epoch: 13, step: 418, loss: 0.33389273285865784, mean loss: 0.36379249602887176
Epoch: 13, step: 419, loss: 0.3359629809856415, mean loss: 0.3637910459707724
Epoch: 13, step: 420, loss: 0.31367412209510803, mean loss: 0.3637884347623174
Epoch: 13, step: 421, loss: 0.34895971417427063, mean loss: 0.3637876621916918
Epoch: 13, step: 422, loss: 0.3653986155986786, mean loss: 0.3637877461173707
Epoch: 13, step: 423, loss: 0.30638155341148376, mean loss: 0.36378475558847373
Epoch: 13, step: 424, loss: 0.3299574553966522, mean loss: 0.36378299347459175
Epoch: 13, step: 425, loss: 0.33699822425842285, mean loss: 0.3637815982891966
Epoch: 13, step: 426, loss: 0.3361853361129761, mean loss: 0.3637801609090114
Epoch: 13, step: 427, loss: 0.3137977719306946, mean loss: 0.3637775576595854
Epoch: 13, step: 428, loss: 0.3811887204647064, mean loss: 0.36377846444375317
Epoch: 13, step: 429, loss: 0.2912994623184204, mean loss: 0.3637746898889086
Epoch: 13, step: 430, loss: 0.33038464188575745, mean loss: 0.3637729510955949
Epoch: 13, step: 431, loss: 0.30649080872535706, mean loss: 0.36376996827210134
Epoch: 13, step: 432, loss: 0.31477317214012146, mean loss: 0.3637674170200247
Epoch: 13, step: 433, loss: 0.321136474609375, mean loss: 0.363765197352087
Epoch: 13, step: 434, loss: 0.3270161747932434, mean loss: 0.3637632840380578
Epoch: 13, step: 435, loss: 0.3447795510292053, mean loss: 0.3637622957137654
Epoch: 13, step: 436, loss: 0.3231333792209625, mean loss: 0.3637601806158169
Epoch: 13, step: 437, loss: 0.33343181014060974, mean loss: 0.3637586018354694
Epoch: 13, step: 438, loss: 0.34243446588516235, mean loss: 0.36375749183932393
Epoch: 13, step: 439, loss: 0.33095479011535645, mean loss: 0.36375578443240514
Epoch: 13, step: 440, loss: 0.36701640486717224, mean loss: 0.36375595414147893
Epoch: 13, step: 441, loss: 0.31741246581077576, mean loss: 0.3637535421768526
Epoch: 13, step: 442, loss: 0.3660072088241577, mean loss: 0.3637536594636934
Epoch: 13, step: 443, loss: 0.3422497808933258, mean loss: 0.3637525404025688
Epoch: 13, step: 444, loss: 0.3196417987346649, mean loss: 0.3637502450004942
Epoch: 13, step: 445, loss: 0.28786835074424744, mean loss: 0.36374629652020196
Epoch: 13, step: 446, loss: 0.34502458572387695, mean loss: 0.36374532239507595
Epoch: 13, step: 447, loss: 0.3192669749259949, mean loss: 0.3637430082250724
Epoch: 13, step: 448, loss: 0.3381540775299072, mean loss: 0.3637416769243755
Epoch: 13, step: 449, loss: 0.3152470290660858, mean loss: 0.36373915405225715
Epoch: 13, step: 450, loss: 0.3283976912498474, mean loss: 0.3637373155534379
Epoch: 13, step: 451, loss: 0.35512471199035645, mean loss: 0.363736867540352
Epoch: 13, step: 452, loss: 0.31918802857398987, mean loss: 0.3637345503055553
Epoch: 13, step: 453, loss: 0.32791799306869507, mean loss: 0.3637326873825741
Epoch: 13, step: 454, loss: 0.3227497339248657, mean loss: 0.3637305558512141
Epoch: 13, step: 455, loss: 0.30793648958206177, mean loss: 0.363727654141922
Epoch: 13, step: 456, loss: 0.2968335449695587, mean loss: 0.3637241753281942
Epoch: 13, step: 457, loss: 0.3242572546005249, mean loss: 0.36372212296622186
Epoch: 13, step: 458, loss: 0.33159658312797546, mean loss: 0.36372045245819634
Epoch: 13, step: 459, loss: 0.28907138109207153, mean loss: 0.3637165709549015
Epoch: 13, step: 460, loss: 0.32114002108573914, mean loss: 0.3637143572311003
Epoch: 13, step: 461, loss: 0.3551364541053772, mean loss: 0.36371391125506175
Epoch: 13, step: 462, loss: 0.3359687030315399, mean loss: 0.3637124688215695
Epoch: 13, step: 463, loss: 0.34715017676353455, mean loss: 0.36371160781657585
Epoch: 13, step: 464, loss: 0.30814066529273987, mean loss: 0.3637087190635206
Epoch: 13, step: 465, loss: 0.40736833214759827, mean loss: 0.36371098851008904
Epoch: 13, step: 466, loss: 0.33157745003700256, mean loss: 0.3637093182809465
Epoch: 13, step: 467, loss: 0.3369113504886627, mean loss: 0.36370792545517766
Epoch: 13, step: 468, loss: 0.3343813121318817, mean loss: 0.3637064012821449
Epoch: 13, step: 469, loss: 0.3624122440814972, mean loss: 0.3637063340252485
Epoch: 13, step: 470, loss: 0.3513571321964264, mean loss: 0.3637056922749066
Epoch: 13, step: 471, loss: 0.3582444489002228, mean loss: 0.36370540848549826
Epoch: 13, step: 472, loss: 0.35831791162490845, mean loss: 0.3637051285428191
Epoch: 13, step: 473, loss: 0.38616758584976196, mean loss: 0.3637062956662373
Epoch: 13, step: 474, loss: 0.3419318199157715, mean loss: 0.3637051643483306
Epoch: 13, step: 475, loss: 0.3108353614807129, mean loss: 0.3637024175796862
Epoch: 13, step: 476, loss: 0.35249921679496765, mean loss: 0.3637018355649953
Epoch: 13, step: 477, loss: 0.37354329228401184, mean loss: 0.3637023468095002
Epoch: 13, step: 478, loss: 0.32919612526893616, mean loss: 0.36370055437162474
Epoch: 13, step: 479, loss: 0.2963305413722992, mean loss: 0.36369705499426136
Epoch: 13, step: 480, loss: 0.3091511130332947, mean loss: 0.36369422188035905
Epoch: 13, step: 481, loss: 0.46009522676467896, mean loss: 0.36369922868439375
Epoch: 13, step: 482, loss: 0.34242093563079834, mean loss: 0.3636981236055543
Epoch: 13, step: 483, loss: 0.36089831590652466, mean loss: 0.3636979782063178
Epoch: 13, step: 484, loss: 0.33326417207717896, mean loss: 0.3636963978040677
Epoch: 13, step: 485, loss: 0.36402252316474915, mean loss: 0.36369641473860714
Epoch: 13, step: 486, loss: 0.4022960364818573, mean loss: 0.36369841897671623
Epoch: 13, step: 487, loss: 0.37108245491981506, mean loss: 0.36369880236383684
Epoch: 13, step: 488, loss: 0.35328859090805054, mean loss: 0.36369826188247784
Epoch: 13, step: 489, loss: 0.32005199790000916, mean loss: 0.36369599595661434
Epoch: 13, step: 490, loss: 0.30849042534828186, mean loss: 0.3636931300701684
Epoch: 13, step: 491, loss: 0.33649539947509766, mean loss: 0.363691718227841
Epoch: 13, step: 492, loss: 0.3159026801586151, mean loss: 0.3636892376133552
Epoch: 13, step: 493, loss: 0.3342932462692261, mean loss: 0.3636877118170641
Epoch: 13, step: 494, loss: 0.3835834860801697, mean loss: 0.36368874445184185
Epoch: 13, step: 495, loss: 0.3534553050994873, mean loss: 0.3636882133412257
Epoch: 13, step: 496, loss: 0.3382571041584015, mean loss: 0.3636868935472985
Epoch: 13, step: 497, loss: 0.3277037441730499, mean loss: 0.3636850262328525
Epoch: 13, step: 498, loss: 0.35735204815864563, mean loss: 0.3636846976054811
Epoch: 13, step: 499, loss: 0.36361488699913025, mean loss: 0.363684693983096
Epoch: 13, step: 500, loss: 0.3838241696357727, mean loss: 0.3636857389411022
Epoch: 13, step: 501, loss: 0.3292265832424164, mean loss: 0.3636839510841084
Epoch: 13, step: 502, loss: 0.3333413600921631, mean loss: 0.3636823768900232
Epoch: 13, step: 503, loss: 0.3164327144622803, mean loss: 0.36367992567283974
Epoch: 13, step: 504, loss: 0.37092092633247375, mean loss: 0.36368030130186185
Epoch: 13, step: 505, loss: 0.33291319012641907, mean loss: 0.36367870533178326
Epoch: 13, step: 506, loss: 0.3271910846233368, mean loss: 0.36367681272217134
Epoch: 13, step: 507, loss: 0.3417026400566101, mean loss: 0.3636756729829252
Epoch: 13, step: 508, loss: 0.35267338156700134, mean loss: 0.36367510235425365
Epoch: 13, step: 509, loss: 0.35205891728401184, mean loss: 0.36367449991752143
Epoch: 13, step: 510, loss: 0.3294336795806885, mean loss: 0.3636727242176647
Epoch: 13, step: 511, loss: 0.3209063708782196, mean loss: 0.3636705065059172
Epoch: 13, step: 512, loss: 0.3634610176086426, mean loss: 0.3636704956431276
Epoch: 13, step: 513, loss: 0.30727440118789673, mean loss: 0.36366757144451434
Epoch: 13, step: 514, loss: 0.32849282026290894, mean loss: 0.3636657476901108
Epoch: 13, step: 515, loss: 0.3183745741844177, mean loss: 0.36366339953719157
Epoch: 13, step: 516, loss: 0.3127996623516083, mean loss: 0.3636607626074811
Epoch: 13, step: 517, loss: 0.29473310708999634, mean loss: 0.3636571893749504
Epoch: 13, step: 518, loss: 0.3110986649990082, mean loss: 0.3636544648648485
Epoch: 13, step: 519, loss: 0.358148992061615, mean loss: 0.3636541794888997
Epoch: 13, step: 520, loss: 0.28923627734184265, mean loss: 0.36365032224004534
Epoch: 13, step: 521, loss: 0.3326728343963623, mean loss: 0.3636487166897269
Epoch: 13, step: 522, loss: 0.3376237452030182, mean loss: 0.3636473678961801
Epoch: 13, step: 523, loss: 0.29219764471054077, mean loss: 0.36364366507055895
Epoch: 13, step: 524, loss: 0.3032185435295105, mean loss: 0.36364053374851196
Epoch: 13, step: 525, loss: 0.3757866621017456, mean loss: 0.3636411631468099
Epoch: 13, step: 526, loss: 0.32575464248657227, mean loss: 0.36363920001293454
Epoch: 13, step: 527, loss: 0.32093214988708496, mean loss: 0.3636369872124099
Epoch: 13, step: 528, loss: 0.3404735326766968, mean loss: 0.3636357870956006
Epoch: 13, step: 529, loss: 0.3085034191608429, mean loss: 0.36363293079221576
Epoch: 13, step: 530, loss: 0.3775593042373657, mean loss: 0.3636336522538251
Epoch: 13, step: 531, loss: 0.3391202688217163, mean loss: 0.3636323823935147
Epoch: 13, step: 532, loss: 0.3236924707889557, mean loss: 0.3636303135040247
Epoch: 13, step: 533, loss: 0.33730992674827576, mean loss: 0.3636289501772477
Epoch: 13, step: 534, loss: 0.3327956199645996, mean loss: 0.36362735317459516
Epoch: 13, step: 535, loss: 0.3398192226886749, mean loss: 0.3636261201038221
Epoch: 13, step: 536, loss: 0.3101128935813904, mean loss: 0.3636233486901537
Epoch: 13, step: 537, loss: 0.3442133069038391, mean loss: 0.3636223435093259
Epoch: 13, step: 538, loss: 0.35628825426101685, mean loss: 0.3636219637211612
Epoch: 13, step: 539, loss: 0.3033442199230194, mean loss: 0.3636188424626795
Epoch: 13, step: 540, loss: 0.3087122142314911, mean loss: 0.3636159994746284
Epoch: 13, step: 541, loss: 0.34987127780914307, mean loss: 0.36361528782910363
Epoch: 13, step: 542, loss: 0.309591144323349, mean loss: 0.3636124908245214
Epoch: 13, step: 543, loss: 0.33590933680534363, mean loss: 0.3636110566169205
Epoch: 13, step: 544, loss: 0.3383384644985199, mean loss: 0.36360974830858495
Epoch: 13, step: 545, loss: 0.32797771692276, mean loss: 0.3636079038096003
Epoch: 13, step: 546, loss: 0.35687655210494995, mean loss: 0.3636075553779162
Epoch: 13, step: 547, loss: 0.3434315323829651, mean loss: 0.3636065110703078
Epoch: 13, step: 548, loss: 0.3480406701564789, mean loss: 0.36360570542666026
Epoch: 13, step: 549, loss: 0.3372408151626587, mean loss: 0.36360434092555977
Epoch: 13, step: 550, loss: 0.33169129490852356, mean loss: 0.36360268936803675
Epoch: 13, step: 551, loss: 0.3249901235103607, mean loss: 0.36360069120172245
Epoch: 13, step: 552, loss: 0.38468196988105774, mean loss: 0.363601782082896
Epoch: 13, step: 553, loss: 0.3268844783306122, mean loss: 0.36359988219136374
Epoch: 13, step: 554, loss: 0.32244330644607544, mean loss: 0.36359775270537287
Epoch: 13, step: 555, loss: 0.31337884068489075, mean loss: 0.36359515445868307
Epoch: 13, step: 556, loss: 0.36391764879226685, mean loss: 0.3635951711431641
Epoch: 13, step: 557, loss: 0.3361072540283203, mean loss: 0.36359374910916953
Epoch: 13, step: 558, loss: 0.348693311214447, mean loss: 0.3635929783038364
Epoch: 13, step: 559, loss: 0.38710707426071167, mean loss: 0.36359419463406384
Epoch: 13, step: 560, loss: 0.34970390796661377, mean loss: 0.36359347615857285
Epoch: 13, step: 561, loss: 0.33677351474761963, mean loss: 0.3635920889670237
Epoch: 13, step: 562, loss: 0.33865970373153687, mean loss: 0.3635907994720542
Epoch: 13, step: 563, loss: 0.330138236284256, mean loss: 0.3635890694056916
Epoch: 13, step: 564, loss: 0.3378100097179413, mean loss: 0.36358773625889074
Epoch: 13, step: 565, loss: 0.34368786215782166, mean loss: 0.3635867072034506
Epoch: 13, step: 566, loss: 0.38622814416885376, mean loss: 0.3635878779691037
Epoch: 13, step: 567, loss: 0.324984610080719, mean loss: 0.3635858819366379
Epoch: 13, step: 568, loss: 0.3227589428424835, mean loss: 0.36358377103549033
Epoch: 13, step: 569, loss: 0.3080735206604004, mean loss: 0.3635809011021652
Epoch: 13, step: 570, loss: 0.3859047293663025, mean loss: 0.3635820552058856
Epoch: 13, step: 571, loss: 0.3400762677192688, mean loss: 0.3635808400597169
Epoch: 13, step: 572, loss: 0.2859902083873749, mean loss: 0.3635768291715457
Epoch: 13, step: 573, loss: 0.3360954523086548, mean loss: 0.36357540865170374
Epoch: 13, step: 574, loss: 0.4392063021659851, mean loss: 0.36357931783108627
Epoch: 13, step: 575, loss: 0.31698107719421387, mean loss: 0.36357690940434256
Epoch: 13, step: 576, loss: 0.33663585782051086, mean loss: 0.3635755170299778
Epoch: 13, step: 577, loss: 0.3517366647720337, mean loss: 0.36357490520298774
Epoch: 13, step: 578, loss: 0.3369104862213135, mean loss: 0.3635735272680499
Epoch: 13, step: 579, loss: 0.3137437403202057, mean loss: 0.3635709523514032
Epoch: 13, step: 580, loss: 0.3414459228515625, mean loss: 0.3635698091162717
Epoch: 13, step: 581, loss: 0.3187880218029022, mean loss: 0.36356749529032806
Epoch: 13, step: 582, loss: 0.3167319595813751, mean loss: 0.3635650754744816
Epoch: 13, step: 583, loss: 0.33061838150024414, mean loss: 0.3635633733307549
Epoch: 13, step: 584, loss: 0.3292437195777893, mean loss: 0.36356160034662754
Epoch: 13, step: 585, loss: 0.32354187965393066, mean loss: 0.36355953299872523
Epoch: 13, step: 586, loss: 0.32098305225372314, mean loss: 0.3635573336867388
Epoch: 13, step: 587, loss: 0.37111130356788635, mean loss: 0.3635577238711335
Epoch: 13, step: 588, loss: 0.32778793573379517, mean loss: 0.3635558763535395
Epoch: 13, step: 589, loss: 0.3513537347316742, mean loss: 0.36355524614273366
Epoch: 13, step: 590, loss: 0.3331984877586365, mean loss: 0.3635536783712941
Epoch: 13, step: 591, loss: 0.3080657422542572, mean loss: 0.36355081285094104
Epoch: 13, step: 592, loss: 0.4021807312965393, mean loss: 0.36355280768277404
Epoch: 13, step: 593, loss: 0.3431603014469147, mean loss: 0.3635517546771851
Epoch: 13, step: 594, loss: 0.3108987808227539, mean loss: 0.3635490359817829
Epoch: 13, step: 595, loss: 0.37541335821151733, mean loss: 0.3635496485552148
Epoch: 13, step: 596, loss: 0.334701269865036, mean loss: 0.3635481591454007
Epoch: 13, step: 597, loss: 0.3046506941318512, mean loss: 0.3635451184915538
Epoch: 13, step: 598, loss: 0.3247673809528351, mean loss: 0.3635431166466548
Epoch: 13, step: 599, loss: 0.3271566927433014, mean loss: 0.3635412383468456
Epoch: 13, step: 600, loss: 0.32649195194244385, mean loss: 0.3635393259282009
Epoch: 13, step: 601, loss: 0.3505496680736542, mean loss: 0.36353865545964226
Epoch: 13, step: 602, loss: 0.34252259135246277, mean loss: 0.3635375707595593
Epoch: 13, step: 603, loss: 0.3168500065803528, mean loss: 0.3635351612031916
Epoch: 13, step: 604, loss: 0.30545130372047424, mean loss: 0.3635321636361027
Epoch: 13, step: 605, loss: 0.2945401966571808, mean loss: 0.3635286033116637
Epoch: 13, step: 606, loss: 0.33270928263664246, mean loss: 0.36352701296537776
Epoch: 13, step: 607, loss: 0.3159041106700897, mean loss: 0.3635245556432779
Epoch: 13, step: 608, loss: 0.3331174850463867, mean loss: 0.3635229867319422
Epoch: 13, step: 609, loss: 0.3945070505142212, mean loss: 0.3635245853318691
Epoch: 13, step: 610, loss: 0.31750917434692383, mean loss: 0.3635222113231509
Epoch: 13, step: 611, loss: 0.35938403010368347, mean loss: 0.363521997838771
Epoch: 13, step: 612, loss: 0.3516522943973541, mean loss: 0.3635213855249489
Epoch: 13, step: 613, loss: 0.35655730962753296, mean loss: 0.36352102629272476
Epoch: 13, step: 614, loss: 0.3633594810962677, mean loss: 0.363521017960069
Epoch: 13, step: 615, loss: 0.302509069442749, mean loss: 0.3635178710677378
Epoch: 13, step: 616, loss: 0.3087460398674011, mean loss: 0.36351504617572683
Epoch: 13, step: 617, loss: 0.3216326832771301, mean loss: 0.36351288617764027
Epoch: 13, step: 618, loss: 0.3547174036502838, mean loss: 0.36351243259182586
Epoch: 13, step: 619, loss: 0.3840598464012146, mean loss: 0.36351349217380863
Epoch: 13, step: 620, loss: 0.3128732442855835, mean loss: 0.36351088090954375
Epoch: 13, step: 621, loss: 0.30649489164352417, mean loss: 0.36350794103178435
Epoch: 13, step: 622, loss: 0.32045233249664307, mean loss: 0.36350572109837187
Epoch: 13, step: 623, loss: 0.3595806360244751, mean loss: 0.3635055187326741
Epoch: 13, step: 624, loss: 0.3157546818256378, mean loss: 0.3635030569686432
Epoch: 13, step: 625, loss: 0.3441847860813141, mean loss: 0.363502061078815
Epoch: 13, step: 626, loss: 0.36615583300590515, mean loss: 0.3635021978782339
Epoch: 13, step: 627, loss: 0.31612688302993774, mean loss: 0.3634997558516953
Epoch: 13, step: 628, loss: 0.35152822732925415, mean loss: 0.36349913879440326
Epoch: 13, step: 629, loss: 0.3361818790435791, mean loss: 0.36349773083338116
Epoch: 13, step: 630, loss: 0.31028497219085693, mean loss: 0.3634949883317761
Epoch: 13, step: 631, loss: 0.3065628111362457, mean loss: 0.36349205428842446
Epoch: 13, step: 632, loss: 0.33186548948287964, mean loss: 0.3634904244731807
Epoch: 13, step: 633, loss: 0.2971692681312561, mean loss: 0.3634870069138515
Epoch: 13, step: 634, loss: 0.3186782896518707, mean loss: 0.36348469801926386
Epoch: 13, step: 635, loss: 0.31705963611602783, mean loss: 0.36348230596125153
Epoch: 13, step: 636, loss: 0.3498572111129761, mean loss: 0.3634816039624444
Epoch: 13, step: 637, loss: 0.3459309935569763, mean loss: 0.36348069975788977
Epoch: 13, step: 638, loss: 0.3494476079940796, mean loss: 0.36347997681256167
Epoch: 13, step: 639, loss: 0.34364083409309387, mean loss: 0.36347895480850645
Epoch: 13, step: 640, loss: 0.3123396039009094, mean loss: 0.3634763205247323
Epoch: 13, step: 641, loss: 0.34673652052879333, mean loss: 0.363475458270689
Epoch: 13, step: 642, loss: 0.29951211810112, mean loss: 0.3634721637386174
Epoch: 13, step: 643, loss: 0.34126418828964233, mean loss: 0.36347101994095316
Epoch: 13, step: 644, loss: 0.34640005230903625, mean loss: 0.3634701407645803
Epoch: 13, step: 645, loss: 0.3556782305240631, mean loss: 0.36346973949203726
Epoch: 13, step: 646, loss: 0.3531602919101715, mean loss: 0.36346920859716203
Epoch: 13, step: 647, loss: 0.3596836030483246, mean loss: 0.3634690136638176
Epoch: 13, step: 648, loss: 0.3525896668434143, mean loss: 0.36346845347912987
Epoch: 13, step: 649, loss: 0.3105553686618805, mean loss: 0.36346572909004443
Epoch: 13, step: 650, loss: 0.30414336919784546, mean loss: 0.36346267485743916
Epoch: 13, step: 651, loss: 0.33034059405326843, mean loss: 0.3634609696432297
Epoch: 13, step: 652, loss: 0.31500503420829773, mean loss: 0.363458475129179
Epoch: 13, step: 653, loss: 0.3426216244697571, mean loss: 0.3634574025022533
Epoch: 13, step: 654, loss: 0.3352392613887787, mean loss: 0.3634559499804479
Epoch: 13, step: 655, loss: 0.319790244102478, mean loss: 0.36345370241477576
Epoch: 13, step: 656, loss: 0.33915701508522034, mean loss: 0.36345245187757214
Epoch: 13, step: 657, loss: 0.3034502863883972, mean loss: 0.36344936375788667
Epoch: 13, step: 658, loss: 0.39038804173469543, mean loss: 0.36345075013419137
Epoch: 13, step: 659, loss: 0.3402946889400482, mean loss: 0.36344955848839094
Epoch: 13, step: 660, loss: 0.3339928388595581, mean loss: 0.3634480426792195
Epoch: 13, step: 661, loss: 0.32513368129730225, mean loss: 0.3634460711673649
Epoch: 13, step: 662, loss: 0.3257046341896057, mean loss: 0.36344412923595365
Epoch: 13, step: 663, loss: 0.3733014166355133, mean loss: 0.3634446364024179
Epoch: 13, step: 664, loss: 0.37757986783981323, mean loss: 0.363445363635604
Epoch: 13, step: 665, loss: 0.3120554983615875, mean loss: 0.3634427198520216
Epoch: 13, step: 666, loss: 0.34492018818855286, mean loss: 0.3634417669978797
Epoch: 13, step: 667, loss: 0.30514585971832275, mean loss: 0.3634387682372172
Epoch: 13, step: 668, loss: 0.323157399892807, mean loss: 0.3634366962569516
Epoch: 13, step: 669, loss: 0.2867889404296875, mean loss: 0.36343275387675267
Epoch: 13, step: 670, loss: 0.3413976728916168, mean loss: 0.36343162055982703
Epoch: 13, step: 671, loss: 0.30346882343292236, mean loss: 0.36342853668834346
Epoch: 13, step: 672, loss: 0.3167306184768677, mean loss: 0.36342613514973654
Epoch: 13, step: 673, loss: 0.3449196219444275, mean loss: 0.36342518346233527
Epoch: 13, step: 674, loss: 0.31262147426605225, mean loss: 0.3634225710434945
Epoch: 13, step: 675, loss: 0.33508574962615967, mean loss: 0.36342111398768323
Epoch: 13, step: 676, loss: 0.336551308631897, mean loss: 0.3634197324356571
Epoch: 13, step: 677, loss: 0.32547715306282043, mean loss: 0.36341778166036803
Epoch: 13, step: 678, loss: 0.3015592694282532, mean loss: 0.3634146014376426
Epoch: 13, step: 679, loss: 0.3576643764972687, mean loss: 0.3634143058266545
Epoch: 13, step: 680, loss: 0.35665082931518555, mean loss: 0.36341395814370014
Epoch: 13, step: 681, loss: 0.30375704169273376, mean loss: 0.3634108915807079
Epoch: 13, step: 682, loss: 0.37784668803215027, mean loss: 0.3634116335902916
Epoch: 13, step: 683, loss: 0.31335535645484924, mean loss: 0.36340906079644214
Epoch: 13, step: 684, loss: 0.3551996648311615, mean loss: 0.3634086388713784
Epoch: 13, step: 685, loss: 0.34433209896087646, mean loss: 0.3634076584756589
Epoch: 13, step: 686, loss: 0.35055413842201233, mean loss: 0.36340699793194886
Epoch: 13, step: 687, loss: 0.3436117470264435, mean loss: 0.3634059807042559
Epoch: 13, step: 688, loss: 0.3135611116886139, mean loss: 0.36340341943458754
Epoch: 13, step: 689, loss: 0.2932899594306946, mean loss: 0.3633998168521189
Epoch: 13, step: 690, loss: 0.3578417897224426, mean loss: 0.363399531283238
Epoch: 13, step: 691, loss: 0.31631457805633545, mean loss: 0.36339711220426
Epoch: 13, step: 692, loss: 0.3680332899093628, mean loss: 0.3633973503844658
Epoch: 13, step: 693, loss: 0.3246377408504486, mean loss: 0.3633953592404437
Epoch: 13, step: 694, loss: 0.3467366397380829, mean loss: 0.36339450349895797
Epoch: 13, step: 695, loss: 0.358630508184433, mean loss: 0.36339425878993215
Epoch: 13, step: 696, loss: 0.32634609937667847, mean loss: 0.3633923558591492
Epoch: 13, step: 697, loss: 0.2834051549434662, mean loss: 0.36338824763105904
Epoch: 13, step: 698, loss: 0.33568355441093445, mean loss: 0.36338682476149814
Epoch: 13, step: 699, loss: 0.33754992485046387, mean loss: 0.36338549788701624
Epoch: 13, step: 700, loss: 0.384437620639801, mean loss: 0.36338657897995275
Epoch: 13, step: 701, loss: 0.33885636925697327, mean loss: 0.36338531934096113
Epoch: 13, step: 702, loss: 0.3293784558773041, mean loss: 0.3633835731605522
Epoch: 13, step: 703, loss: 0.37232398986816406, mean loss: 0.3633840322084423
Epoch: 13, step: 704, loss: 0.33806708455085754, mean loss: 0.3633827323702918
Epoch: 13, step: 705, loss: 0.3351638615131378, mean loss: 0.36338128361421534
Epoch: 13, step: 706, loss: 0.34689027070999146, mean loss: 0.3633804370095178
Epoch: 13, step: 707, loss: 0.35266172885894775, mean loss: 0.3633798867678263
Epoch: 13, step: 708, loss: 0.3443066477775574, mean loss: 0.3633789076990418
Epoch: 13, step: 709, loss: 0.35911619663238525, mean loss: 0.3633786888965027
Epoch: 13, step: 710, loss: 0.36874887347221375, mean loss: 0.36337896453088014
Epoch: 13, step: 711, loss: 0.32797104120254517, mean loss: 0.363377147248837
Epoch: 13, step: 712, loss: 0.32280710339546204, mean loss: 0.3633750651321394
Epoch: 13, step: 713, loss: 0.3261075019836426, mean loss: 0.3633731526019563
Epoch: 13, step: 714, loss: 0.3537086546421051, mean loss: 0.3633726566560457
Epoch: 13, step: 715, loss: 0.38325297832489014, mean loss: 0.3633736767874942
Epoch: 13, step: 716, loss: 0.30995887517929077, mean loss: 0.36337093602082543
Epoch: 13, step: 717, loss: 0.2998417019844055, mean loss: 0.36336767643980766
Epoch: 13, step: 718, loss: 0.3852293789386749, mean loss: 0.363368798070432
Epoch: 13, step: 719, loss: 0.3313955068588257, mean loss: 0.36336715774151696
Epoch: 13, step: 720, loss: 0.3388054072856903, mean loss: 0.3633658977122523
Epoch: 13, step: 721, loss: 0.3726608157157898, mean loss: 0.36336637452142456
Epoch: 13, step: 722, loss: 0.3232152760028839, mean loss: 0.3633643149626393
Epoch: 13, step: 723, loss: 0.3204599916934967, mean loss: 0.3633621142895131
Epoch: 13, step: 724, loss: 0.3889552056789398, mean loss: 0.36336342695768714
Epoch: 13, step: 725, loss: 0.3182504177093506, mean loss: 0.36336111323272824
Epoch: 13, step: 726, loss: 0.38079020380973816, mean loss: 0.36336200707808325
Epoch: 13, step: 727, loss: 0.33454516530036926, mean loss: 0.3633605292913254
Epoch: 13, step: 728, loss: 0.3524772822856903, mean loss: 0.36335997120471414
Epoch: 13, step: 729, loss: 0.29684802889823914, mean loss: 0.36335656068567473
Epoch: 13, step: 730, loss: 0.32042306661605835, mean loss: 0.36335435930670384
Epoch: 13, step: 731, loss: 0.34621673822402954, mean loss: 0.36335348063458106
Epoch: 13, step: 732, loss: 0.3078898787498474, mean loss: 0.3633506370764224
Epoch: 13, step: 733, loss: 0.3687746226787567, mean loss: 0.36335091514397094
Epoch: 13, step: 734, loss: 0.3840903341770172, mean loss: 0.3633519783222676
Epoch: 13, step: 735, loss: 0.35531410574913025, mean loss: 0.36335156629271187
Epoch: 13, step: 736, loss: 0.3549532890319824, mean loss: 0.3633511358105108
Epoch: 13, step: 737, loss: 0.334224134683609, mean loss: 0.3633496428837488
Epoch: 13, step: 738, loss: 0.32108086347579956, mean loss: 0.3633474764761117
Epoch: 13, step: 739, loss: 0.31714770197868347, mean loss: 0.3633451087139911
Epoch: 13, step: 740, loss: 0.3584630489349365, mean loss: 0.363344858518748
Epoch: 13, step: 741, loss: 0.3164486587047577, mean loss: 0.3633424553108042
Epoch: 13, step: 742, loss: 0.3080872595310211, mean loss: 0.3633396238890374
Epoch: 13, step: 743, loss: 0.3325636684894562, mean loss: 0.3633380469288304
Epoch: 13, step: 744, loss: 0.3109454810619354, mean loss: 0.3633353624708775
Epoch: 13, step: 745, loss: 0.3080953359603882, mean loss: 0.36333253226150614
Epoch: 13, step: 746, loss: 0.39401859045028687, mean loss: 0.36333410437371416
Epoch: 13, step: 747, loss: 0.3799777030944824, mean loss: 0.36333495701709123
Epoch: 13, step: 748, loss: 0.2969610393047333, mean loss: 0.3633315568881167
Epoch: 13, step: 749, loss: 0.32601648569107056, mean loss: 0.3633296454512149
Epoch: 13, step: 750, loss: 0.39483508467674255, mean loss: 0.3633312592113555
Epoch: 13, step: 751, loss: 0.30965980887413025, mean loss: 0.36332851021266993
Epoch: 13, step: 752, loss: 0.344154417514801, mean loss: 0.3633275281848749
Epoch: 13, step: 753, loss: 0.35816192626953125, mean loss: 0.36332726363494583
Epoch: 13, step: 754, loss: 0.3493923842906952, mean loss: 0.36332655001383946
Epoch: 13, step: 755, loss: 0.3337797224521637, mean loss: 0.36332503696449686
Epoch: 13, step: 756, loss: 0.34470289945602417, mean loss: 0.3633240834012059
Epoch: 13, step: 757, loss: 0.3376542329788208, mean loss: 0.36332276902074395
Epoch: 13, step: 758, loss: 0.37407684326171875, mean loss: 0.36332331963639297
Epoch: 13, step: 759, loss: 0.3227522671222687, mean loss: 0.36332124247826714
Epoch: 13, step: 760, loss: 0.3930724859237671, mean loss: 0.36332276560545934
Epoch: 13, step: 761, loss: 0.3753555119037628, mean loss: 0.36332338159533845
Epoch: 13, step: 762, loss: 0.3652704060077667, mean loss: 0.363323481263852
Epoch: 13, step: 763, loss: 0.3407934010028839, mean loss: 0.3633223280042154
Epoch: 13, step: 764, loss: 0.3441120982170105, mean loss: 0.3633213447299262
Epoch: 13, step: 765, loss: 0.3314584195613861, mean loss: 0.36331971391176837
Epoch: 13, step: 766, loss: 0.35799360275268555, mean loss: 0.3633194413230402
Epoch: 13, step: 767, loss: 0.32906973361968994, mean loss: 0.36331768852326013
Epoch: 13, step: 768, loss: 0.3264175355434418, mean loss: 0.36331580017808945
Epoch: 13, step: 769, loss: 0.38806700706481934, mean loss: 0.36331706674276487
Epoch: 13, step: 770, loss: 0.34087157249450684, mean loss: 0.363315918224408
Epoch: 13, step: 771, loss: 0.32507044076919556, mean loss: 0.36331396133342075
Epoch: 13, step: 772, loss: 0.3085057735443115, mean loss: 0.3633111571283663
Epoch: 13, step: 773, loss: 0.31599855422973633, mean loss: 0.36330873655111784
Epoch: 13, step: 774, loss: 0.354062020778656, mean loss: 0.36330826350073814
Epoch: 13, step: 775, loss: 0.34670332074165344, mean loss: 0.3633074140561525
Epoch: 13, step: 776, loss: 0.33122462034225464, mean loss: 0.3633057729085893
Epoch: 13, step: 777, loss: 0.339633584022522, mean loss: 0.36330456205493783
Epoch: 13, step: 778, loss: 0.32246509194374084, mean loss: 0.3633024731863321
Epoch: 13, step: 779, loss: 0.3103596866130829, mean loss: 0.36329976539241976
Epoch: 13, step: 780, loss: 0.32445505261421204, mean loss: 0.36329777875544444
Epoch: 13, step: 781, loss: 0.3886682391166687, mean loss: 0.36329907621173785
Epoch: 13, step: 782, loss: 0.3036428987979889, mean loss: 0.3632960255250892
Epoch: 13, step: 783, loss: 0.3070342242717743, mean loss: 0.36329314856654693
Epoch: 13, step: 784, loss: 0.35992687940597534, mean loss: 0.3632929764404969
Epoch: 13, step: 785, loss: 0.3092651665210724, mean loss: 0.36329021400006745
Epoch: 13, step: 786, loss: 0.3378027081489563, mean loss: 0.3632889108912249
Epoch: 13, step: 787, loss: 0.3282412886619568, mean loss: 0.36328711909049743
Epoch: 13, step: 788, loss: 0.3287961483001709, mean loss: 0.3632853558385783
Epoch: 13, step: 789, loss: 0.35030868649482727, mean loss: 0.36328469247750356
Epoch: 13, step: 790, loss: 0.3425315320491791, mean loss: 0.3632836316401868
Epoch: 13, step: 791, loss: 0.3320990800857544, mean loss: 0.3632820376639266
Epoch: 13, step: 792, loss: 0.3304853141307831, mean loss: 0.3632803613683205
Epoch: 13, step: 793, loss: 0.3808639943599701, mean loss: 0.3632812600513927
Epoch: 13, step: 794, loss: 0.36368849873542786, mean loss: 0.3632812808639181
Epoch: 13, step: 795, loss: 0.3104517161846161, mean loss: 0.3632785810701385
Epoch: 13, step: 796, loss: 0.3174274265766144, mean loss: 0.36327623801967635
Epoch: 13, step: 797, loss: 0.3223952353000641, mean loss: 0.36327414905683936
Epoch: 13, step: 798, loss: 0.3671730160713196, mean loss: 0.363274348273385
Epoch: 13, step: 799, loss: 0.3387301564216614, mean loss: 0.36327309422720416
Epoch: 13, step: 800, loss: 0.34385544061660767, mean loss: 0.36327210216397365
Epoch: 13, step: 801, loss: 0.33410993218421936, mean loss: 0.36327061232183716
Epoch: 13, step: 802, loss: 0.2937898635864258, mean loss: 0.36326706285830024
Epoch: 13, step: 803, loss: 0.32068395614624023, mean loss: 0.3632648875872177
Epoch: 13, step: 804, loss: 0.3037077486515045, mean loss: 0.3632618453877522
Epoch: 13, step: 805, loss: 0.36735427379608154, mean loss: 0.36326205441974774
Epoch: 13, step: 806, loss: 0.3434317111968994, mean loss: 0.36326104158235956
Epoch: 13, step: 807, loss: 0.3323115110397339, mean loss: 0.3632594609117496
Epoch: 13, step: 808, loss: 0.30485954880714417, mean loss: 0.3632564784332192
Epoch: 13, step: 809, loss: 0.3248908221721649, mean loss: 0.36325451920248375
Epoch: 13, step: 810, loss: 0.3588707149028778, mean loss: 0.36325429534483683
Epoch: 13, step: 811, loss: 0.37952131032943726, mean loss: 0.3632551259726445
Epoch: 13, step: 812, loss: 0.3638743758201599, mean loss: 0.36325515759122234
Epoch: 13, step: 813, loss: 0.3562639057636261, mean loss: 0.3632548006397352
Epoch: 13, step: 814, loss: 0.32584837079048157, mean loss: 0.3632528908817401
Epoch: 13, step: 815, loss: 0.32526612281799316, mean loss: 0.36325095159400966
Epoch: 13, step: 816, loss: 0.3165673315525055, mean loss: 0.36324856843917575
Epoch: 13, step: 817, loss: 0.3898237347602844, mean loss: 0.363249925007135
Epoch: 13, step: 818, loss: 0.3127622604370117, mean loss: 0.3632473479225262
Epoch: 13, step: 819, loss: 0.36006391048431396, mean loss: 0.3632471854359277
Epoch: 13, step: 820, loss: 0.3104900121688843, mean loss: 0.36324449278175186
Epoch: 13, step: 821, loss: 0.33295926451683044, mean loss: 0.36324294714389
Epoch: 13, step: 822, loss: 0.32725051045417786, mean loss: 0.3632411103265034
Epoch: 13, step: 823, loss: 0.3287786841392517, mean loss: 0.3632393516805457
Epoch: 13, step: 824, loss: 0.3327593505382538, mean loss: 0.36323779634038433
Epoch: 13, step: 825, loss: 0.3521794378757477, mean loss: 0.36323723208084435
Epoch: 13, step: 826, loss: 0.3292068839073181, mean loss: 0.3632354957500023
Epoch: 13, step: 827, loss: 0.3295736610889435, mean loss: 0.36323377830945835
Epoch: 13, step: 828, loss: 0.32872313261032104, mean loss: 0.36323201765205826
Epoch: 13, step: 829, loss: 0.3346543610095978, mean loss: 0.3632305597571168
Epoch: 13, step: 830, loss: 0.32805898785591125, mean loss: 0.3632287655637841
Epoch: 13, step: 831, loss: 0.3408099114894867, mean loss: 0.3632276219780835
Epoch: 13, step: 832, loss: 0.3486875891685486, mean loss: 0.36322688032887107
Epoch: 13, step: 833, loss: 0.3054494857788086, mean loss: 0.36322393340473813
Epoch: 13, step: 834, loss: 0.3661477863788605, mean loss: 0.3632240825276521
Epoch: 13, step: 835, loss: 0.3217758536338806, mean loss: 0.36322196868488926
Epoch: 13, step: 836, loss: 0.3346668779850006, mean loss: 0.36322051246118076
Epoch: 13, step: 837, loss: 0.3419908285140991, mean loss: 0.3632194298663849
Epoch: 13, step: 838, loss: 0.3530277907848358, mean loss: 0.3632189101764618
Epoch: 13, step: 839, loss: 0.3010577857494354, mean loss: 0.36321574063105966
Epoch: 13, step: 840, loss: 0.38561004400253296, mean loss: 0.3632168824402358
Epoch: 13, step: 841, loss: 0.3198975622653961, mean loss: 0.3632146738484047
Epoch: 13, step: 842, loss: 0.32714712619781494, mean loss: 0.363212835074627
Epoch: 13, step: 843, loss: 0.40013960003852844, mean loss: 0.3632147175565277
Epoch: 13, step: 844, loss: 0.3712787926197052, mean loss: 0.3632151286323835
Epoch: 13, step: 845, loss: 0.32158058881759644, mean loss: 0.3632130063701847
Epoch: 13, step: 846, loss: 0.3207469582557678, mean loss: 0.36321084183335234
Epoch: 13, step: 847, loss: 0.3195958733558655, mean loss: 0.36320861884821076
Epoch: 13, step: 848, loss: 0.43620675802230835, mean loss: 0.3632123392569144
Epoch: 13, step: 849, loss: 0.35520291328430176, mean loss: 0.36321193107090005
Epoch: 13, step: 850, loss: 0.30460071563720703, mean loss: 0.3632089442077581
Epoch: 13, step: 851, loss: 0.32040104269981384, mean loss: 0.36320676280225933
Epoch: 13, step: 852, loss: 0.33769798278808594, mean loss: 0.3632054629918127
Epoch: 13, step: 853, loss: 0.32867008447647095, mean loss: 0.36320370331696733
Epoch: 13, step: 854, loss: 0.3371056616306305, mean loss: 0.3632023736159592
Epoch: 13, step: 855, loss: 0.334780216217041, mean loss: 0.36320092557451844
Epoch: 13, step: 856, loss: 0.3738954961299896, mean loss: 0.36320147040973955
Epoch: 13, step: 857, loss: 0.32822689414024353, mean loss: 0.3631996887196596
Epoch: 13, step: 858, loss: 0.3287258744239807, mean loss: 0.36319793262907346
Epoch: 13, step: 859, loss: 0.3094859719276428, mean loss: 0.3631951966897549
Epoch: 13, step: 860, loss: 0.35451269149780273, mean loss: 0.36319475444938454
Epoch: 13, step: 861, loss: 0.3730136752128601, mean loss: 0.36319525454721296
Epoch: 13, step: 862, loss: 0.3864251673221588, mean loss: 0.363196437634189
Epoch: 13, step: 863, loss: 0.3334525525569916, mean loss: 0.36319492287124966
Epoch: 13, step: 864, loss: 0.3075377643108368, mean loss: 0.3631920885707679
Epoch: 13, step: 865, loss: 0.3545053005218506, mean loss: 0.36319164622490535
Epoch: 13, step: 866, loss: 0.377043753862381, mean loss: 0.36319235156161483
Epoch: 13, step: 867, loss: 0.34109926223754883, mean loss: 0.36319122665889975
Epoch: 13, step: 868, loss: 0.32390156388282776, mean loss: 0.3631892262687579
Epoch: 13, step: 869, loss: 0.3099856972694397, mean loss: 0.3631865176072672
Epoch: 13, step: 870, loss: 0.32485896348953247, mean loss: 0.36318456640052094
Epoch: 13, step: 871, loss: 0.32461780309677124, mean loss: 0.3631826031158893
Epoch: 13, step: 872, loss: 0.34349924325942993, mean loss: 0.3631816011632369
Epoch: 13, step: 873, loss: 0.3434084355831146, mean loss: 0.3631805946903885
Epoch: 13, step: 874, loss: 0.3350260257720947, mean loss: 0.3631791616691171
Epoch: 13, step: 875, loss: 0.32342463731765747, mean loss: 0.36317713833216925
Epoch: 13, step: 876, loss: 0.3326316773891449, mean loss: 0.36317558377667314
Epoch: 13, step: 877, loss: 0.31819120049476624, mean loss: 0.3631732944950812
Epoch: 13, step: 878, loss: 0.3137461543083191, mean loss: 0.3631707792469927
Epoch: 13, step: 879, loss: 0.3570304214954376, mean loss: 0.3631704667923951
Epoch: 13, step: 880, loss: 0.3603214919567108, mean loss: 0.36317032182853026
Epoch: 13, step: 881, loss: 0.32198187708854675, mean loss: 0.36316822615107325
Epoch: 13, step: 882, loss: 0.3091215491294861, mean loss: 0.3631654763837356
Epoch: 13, step: 883, loss: 0.3230457901954651, mean loss: 0.36316343529265965
Epoch: 13, step: 884, loss: 0.30494755506515503, mean loss: 0.36316047370746213
Epoch: 13, step: 885, loss: 0.3216627240180969, mean loss: 0.3631583627221285
Epoch: 13, step: 886, loss: 0.3598346710205078, mean loss: 0.36315819365494795
Epoch: 13, step: 887, loss: 0.3160356879234314, mean loss: 0.36315579678283544
Epoch: 13, step: 888, loss: 0.35196852684020996, mean loss: 0.36315522777464954
Epoch: 13, step: 889, loss: 0.327846497297287, mean loss: 0.3631534319893542
Epoch: 13, step: 890, loss: 0.38520482182502747, mean loss: 0.36315455345555137
Epoch: 13, step: 891, loss: 0.3376932740211487, mean loss: 0.3631532586386558
Epoch: 13, step: 892, loss: 0.3765548765659332, mean loss: 0.3631539401346094
Epoch: 13, step: 893, loss: 0.3605146110057831, mean loss: 0.36315380592688395
Epoch: 13, step: 894, loss: 0.3774240016937256, mean loss: 0.3631545315177604
Epoch: 13, step: 895, loss: 0.32669174671173096, mean loss: 0.3631526776035441
Epoch: 13, step: 896, loss: 0.327650785446167, mean loss: 0.3631508726367355
Epoch: 13, step: 897, loss: 0.34129536151885986, mean loss: 0.3631497615278836
Epoch: 13, step: 898, loss: 0.36274126172065735, mean loss: 0.36314974076128265
Epoch: 13, step: 899, loss: 0.3038930594921112, mean loss: 0.3631467285265699
Epoch: 13, step: 900, loss: 0.3173050880432129, mean loss: 0.36314439834609497
Epoch: 13, step: 901, loss: 0.2858325242996216, mean loss: 0.3631404686991474
Epoch: 13, step: 902, loss: 0.3269328773021698, mean loss: 0.3631386284149595
Epoch: 13, step: 903, loss: 0.33180660009384155, mean loss: 0.36313703601669145
Epoch: 13, step: 904, loss: 0.33959975838661194, mean loss: 0.363135839834467
Epoch: 13, step: 905, loss: 0.331925630569458, mean loss: 0.3631342537886664
Epoch: 13, step: 906, loss: 0.3359537422657013, mean loss: 0.36313287259493077
Epoch: 13, step: 907, loss: 0.3177550733089447, mean loss: 0.3631305668124467
Epoch: 13, step: 908, loss: 0.3489537835121155, mean loss: 0.3631298464840437
Epoch: 13, step: 909, loss: 0.35774609446525574, mean loss: 0.36312957294720705
Epoch: 13, step: 910, loss: 0.3197217881679535, mean loss: 0.36312736760326664
Epoch: 13, step: 911, loss: 0.30266523361206055, mean loss: 0.3631242959646774
Epoch: 13, step: 912, loss: 0.358045756816864, mean loss: 0.3631240379743727
Epoch: 13, step: 913, loss: 0.3322729468345642, mean loss: 0.36312247081542015
Epoch: 13, step: 914, loss: 0.41898787021636963, mean loss: 0.36312530849507685
Epoch: 13, step: 915, loss: 0.33969148993492126, mean loss: 0.36312411823610896
Epoch: 13, step: 916, loss: 0.3885466754436493, mean loss: 0.36312540944222443
Epoch: 13, step: 917, loss: 0.3582841157913208, mean loss: 0.3631251635664677
Epoch: 13, step: 918, loss: 0.31174349784851074, mean loss: 0.36312255416797506
Epoch: 13, step: 919, loss: 0.32186809182167053, mean loss: 0.36312045918207486
Epoch: 13, step: 920, loss: 0.30001434683799744, mean loss: 0.3631172546874654
Epoch: 13, step: 921, loss: 0.35778653621673584, mean loss: 0.3631169840101794
Epoch: 13, step: 922, loss: 0.3557068705558777, mean loss: 0.36311660776679505
Epoch: 13, step: 923, loss: 0.3397437334060669, mean loss: 0.36311542108552164
Epoch: 13, step: 924, loss: 0.361840158700943, mean loss: 0.36311535634153097
Epoch: 13, step: 925, loss: 0.35234537720680237, mean loss: 0.3631148095865744
Epoch: 13, step: 926, loss: 0.31242409348487854, mean loss: 0.3631122363231548
Epoch: 13, step: 927, loss: 0.31443390250205994, mean loss: 0.36310976534174255
Epoch: 13, step: 928, loss: 0.31213268637657166, mean loss: 0.3631071778041066
Epoch: 13, step: 929, loss: 0.32434016466140747, mean loss: 0.3631052101351825
Epoch: 13, step: 930, loss: 0.3509209454059601, mean loss: 0.36310459173875914
Epoch: 13, step: 931, loss: 0.3039257824420929, mean loss: 0.36310158834811274
Epoch: 13, step: 932, loss: 0.3132686913013458, mean loss: 0.36309905940129483
Epoch: 13, step: 933, loss: 0.3757433295249939, mean loss: 0.3630997010469928
Epoch: 13, step: 934, loss: 0.3001061975955963, mean loss: 0.36309650454303727
Epoch: 13, step: 935, loss: 0.3853193521499634, mean loss: 0.36309763214845675
Epoch: 13, step: 936, loss: 0.31714361906051636, mean loss: 0.3630953005226468
Epoch: 13, step: 937, loss: 0.3202161490917206, mean loss: 0.3630931250202911
Epoch: 13, step: 938, loss: 0.3260135352611542, mean loss: 0.3630912438580082
Epoch: 13, step: 939, loss: 0.31575411558151245, mean loss: 0.3630888424209
Epoch: 13, step: 940, loss: 0.3009439706802368, mean loss: 0.3630856899392006
Epoch: 13, step: 941, loss: 0.29938840866088867, mean loss: 0.3630824588708594
Epoch: 13, step: 942, loss: 0.30625247955322266, mean loss: 0.3630795762951902
Epoch: 13, step: 943, loss: 0.34758907556533813, mean loss: 0.36307879061347337
Epoch: 13, step: 944, loss: 0.3546432852745056, mean loss: 0.3630783627844254
Epoch: 13, step: 945, loss: 0.34372109174728394, mean loss: 0.3630773810788246
Epoch: 13, step: 946, loss: 0.32580918073654175, mean loss: 0.36307549111481313
Epoch: 13, step: 947, loss: 0.3347063958644867, mean loss: 0.3630740525197193
Epoch: 13, step: 948, loss: 0.31343743205070496, mean loss: 0.3630715355773498
Epoch: 13, step: 949, loss: 0.325435072183609, mean loss: 0.36306962722812586
Epoch: 13, step: 950, loss: 0.3222269117832184, mean loss: 0.363067556411544
Epoch: 13, step: 951, loss: 0.3325023651123047, mean loss: 0.36306600676688267
Epoch: 13, step: 952, loss: 0.3680727481842041, mean loss: 0.3630662605940775
Epoch: 13, step: 953, loss: 0.3119104206562042, mean loss: 0.3630636672735899
Epoch: 13, step: 954, loss: 0.3624444901943207, mean loss: 0.3630636358862994
Epoch: 13, step: 955, loss: 0.33950385451316833, mean loss: 0.3630624416556945
Epoch: 13, step: 956, loss: 0.33563661575317383, mean loss: 0.3630610515281715
Epoch: 13, step: 957, loss: 0.34878769516944885, mean loss: 0.36306032809399214
Epoch: 13, step: 958, loss: 0.30414295196533203, mean loss: 0.3630573420630698
Epoch: 13, step: 959, loss: 0.32555150985717773, mean loss: 0.3630554413012511
Epoch: 13, step: 960, loss: 0.31060028076171875, mean loss: 0.3630527830556453
Epoch: 13, step: 961, loss: 0.3288032114505768, mean loss: 0.36305104749409645
Epoch: 13, step: 962, loss: 0.36109498143196106, mean loss: 0.3630509483774984
Epoch: 13, step: 963, loss: 0.33635780215263367, mean loss: 0.3630495958670492
Epoch: 13, step: 964, loss: 0.3747035264968872, mean loss: 0.3630501863281441
Epoch: 13, step: 965, loss: 0.29975464940071106, mean loss: 0.36304697954240456
Epoch: 13, step: 966, loss: 0.3060027062892914, mean loss: 0.3630440896151918
Epoch: 13, step: 967, loss: 0.3637388050556183, mean loss: 0.36304412480847653
Epoch: 13, step: 968, loss: 0.3446563184261322, mean loss: 0.36304319335584584
Epoch: 13, step: 969, loss: 0.3288660943508148, mean loss: 0.36304146216857985
Epoch: 13, step: 970, loss: 0.3511675298213959, mean loss: 0.36304086074365216
Epoch: 13, step: 971, loss: 0.33689382672309875, mean loss: 0.3630395364408756
Epoch: 13, step: 972, loss: 0.31928205490112305, mean loss: 0.36303732031114455
Epoch: 13, step: 973, loss: 0.3597548305988312, mean loss: 0.36303715407546583
Epoch: 13, step: 974, loss: 0.3084414005279541, mean loss: 0.3630343893135502
Epoch: 13, step: 975, loss: 0.30832991003990173, mean loss: 0.3630316191859791
Epoch: 13, step: 976, loss: 0.3724820911884308, mean loss: 0.3630320977151199
Epoch: 13, step: 977, loss: 0.32609984278678894, mean loss: 0.3630302277275286
Epoch: 13, step: 978, loss: 0.35713738203048706, mean loss: 0.3630299293707012
Epoch: 13, step: 979, loss: 0.3107841908931732, mean loss: 0.3630272842847111
Epoch: 13, step: 980, loss: 0.32035794854164124, mean loss: 0.3630251241401385
Epoch: 13, step: 981, loss: 0.31905537843704224, mean loss: 0.36302289827470857
Epoch: 13, step: 982, loss: 0.3524794578552246, mean loss: 0.36302236456474046
Epoch: 13, step: 983, loss: 0.33578401803970337, mean loss: 0.36302098582681147
Epoch: 13, step: 984, loss: 0.39692121744155884, mean loss: 0.36302270168608236
Epoch: 13, step: 985, loss: 0.3826170861721039, mean loss: 0.3630236934051069
Epoch: 13, step: 986, loss: 0.30964699387550354, mean loss: 0.3630209920184208
Epoch: 13, step: 987, loss: 0.3177492022514343, mean loss: 0.36301870093594274
Epoch: 13, step: 988, loss: 0.3751053214073181, mean loss: 0.3630193125760658
Epoch: 13, step: 989, loss: 0.3241250216960907, mean loss: 0.36301734444071104
Epoch: 13, step: 990, loss: 0.33380210399627686, mean loss: 0.3630158661610751
Epoch: 13, step: 991, loss: 0.3693571090698242, mean loss: 0.3630161870092288
Epoch: 13, step: 992, loss: 0.32761552929878235, mean loss: 0.3630143959311761
Epoch: 13, step: 993, loss: 0.34378674626350403, mean loss: 0.363013423167356
Epoch: 13, step: 994, loss: 0.32128164172172546, mean loss: 0.3630113119829858
Epoch: 13, step: 995, loss: 0.32748445868492126, mean loss: 0.3630095147929161
Epoch: 13, step: 996, loss: 0.4126044511795044, mean loss: 0.36301202351548106
Epoch: 13, step: 997, loss: 0.35404959321022034, mean loss: 0.36301157018061486
Epoch: 13, step: 998, loss: 0.33703047037124634, mean loss: 0.36301025607916276
Epoch: 13, step: 999, loss: 0.338506281375885, mean loss: 0.36300901675209907
Epoch: 13, step: 1000, loss: 0.3581177592277527, mean loss: 0.36300876938156734
Epoch: 13, step: 1001, loss: 0.34353142976760864, mean loss: 0.36300778438411546
Epoch: 13, step: 1002, loss: 0.3234640657901764, mean loss: 0.36300578470175926
Epoch: 13, step: 1003, loss: 0.34547099471092224, mean loss: 0.3630048980315534
Epoch: 13, step: 1004, loss: 0.33381110429763794, mean loss: 0.3630034218828082
Epoch: 13, step: 1005, loss: 0.383707195520401, mean loss: 0.3630044686910617
Epoch: 13, step: 1006, loss: 0.28737157583236694, mean loss: 0.36300064479233785
Epoch: 13, step: 1007, loss: 0.2977123558521271, mean loss: 0.3629973440699445
Epoch: 13, step: 1008, loss: 0.3226068913936615, mean loss: 0.3629953021887112
Epoch: 13, step: 1009, loss: 0.33931639790534973, mean loss: 0.3629941051962795
Epoch: 13, step: 1010, loss: 0.3131537139415741, mean loss: 0.3629915858417198
Epoch: 13, step: 1011, loss: 0.3271912932395935, mean loss: 0.36298977628386486
Epoch: 13, step: 1012, loss: 0.36958274245262146, mean loss: 0.3629901095144016
Epoch: 13, step: 1013, loss: 0.3569411635398865, mean loss: 0.36298980379591506
Epoch: 13, step: 1014, loss: 0.3466332256793976, mean loss: 0.36298897716337264
Epoch: 13, step: 1015, loss: 0.3265208601951599, mean loss: 0.3629871342223494
Epoch: 13, step: 1016, loss: 0.3727565407752991, mean loss: 0.36298762790098665
Epoch: 13, step: 1017, loss: 0.3319149911403656, mean loss: 0.3629860577829088
Epoch: 13, step: 1018, loss: 0.356540322303772, mean loss: 0.3629857320926719
Epoch: 13, step: 1019, loss: 0.3035849928855896, mean loss: 0.36298273084271193
Epoch: 13, step: 1020, loss: 0.3260704576969147, mean loss: 0.3629808659271789
Epoch: 13, step: 1021, loss: 0.2928870618343353, mean loss: 0.362977324762983
Epoch: 13, step: 1022, loss: 0.3551887571811676, mean loss: 0.362976931301625
Epoch: 13, step: 1023, loss: 0.38249272108078003, mean loss: 0.36297791714673405
Epoch: 13, step: 1024, loss: 0.3223381042480469, mean loss: 0.3629758643198967
Epoch: 13, step: 1025, loss: 0.33658289909362793, mean loss: 0.36297453120719714
Epoch: 13, step: 1026, loss: 0.34187930822372437, mean loss: 0.36297346573808337
Epoch: 13, step: 1027, loss: 0.34866148233413696, mean loss: 0.36297274291063875
Epoch: 13, step: 1028, loss: 0.32000479102134705, mean loss: 0.36297057292165386
Epoch: 13, step: 1029, loss: 0.33781880140304565, mean loss: 0.36296930275846234
Epoch: 13, step: 1030, loss: 0.31442248821258545, mean loss: 0.3629668512705794
Epoch: 13, step: 1031, loss: 0.35938066244125366, mean loss: 0.36296667018651413
Epoch: 13, step: 1032, loss: 0.3401641547679901, mean loss: 0.3629655188350666
Epoch: 13, step: 1033, loss: 0.30557358264923096, mean loss: 0.36296262113052324
Epoch: 13, step: 1034, loss: 0.3204134404659271, mean loss: 0.3629604729414656
Epoch: 13, step: 1035, loss: 0.34450623393058777, mean loss: 0.3629595412856189
Epoch: 13, step: 1036, loss: 0.3446105718612671, mean loss: 0.36295861499103443
Epoch: 13, step: 1037, loss: 0.3109198212623596, mean loss: 0.3629559880958437
Epoch: 13, step: 1038, loss: 0.3767242729663849, mean loss: 0.36295668307766543
Epoch: 13, step: 1039, loss: 0.3165389597415924, mean loss: 0.36295434016814915
Epoch: 13, step: 1040, loss: 0.36484354734420776, mean loss: 0.3629544355200482
Epoch: 13, step: 1041, loss: 0.3548756241798401, mean loss: 0.36295402778756913
Epoch: 13, step: 1042, loss: 0.34799692034721375, mean loss: 0.3629532729499491
Epoch: 13, step: 1043, loss: 0.3278021514415741, mean loss: 0.362951499074217
Epoch: 13, step: 1044, loss: 0.3365086019039154, mean loss: 0.3629501647200175
Epoch: 13, step: 1045, loss: 0.3630061149597168, mean loss: 0.3629501675432206
Epoch: 13, step: 1046, loss: 0.32835695147514343, mean loss: 0.3629484220860296
Epoch: 13, step: 1047, loss: 0.31537121534347534, mean loss: 0.36294602162151185
Epoch: 13, step: 1048, loss: 0.3483608365058899, mean loss: 0.3629452857764427
Epoch: 13, step: 1049, loss: 0.3633507490158081, mean loss: 0.36294530623165605
Epoch: 13, step: 1050, loss: 0.3387896418571472, mean loss: 0.36294408766411457
Epoch: 13, step: 1051, loss: 0.33727970719337463, mean loss: 0.3629427930525089
Epoch: 13, step: 1052, loss: 0.36210888624191284, mean loss: 0.3629427509891137
Epoch: 13, step: 1053, loss: 0.3368781507015228, mean loss: 0.362941436321491
Epoch: 13, step: 1054, loss: 0.39675208926200867, mean loss: 0.362943141604839
Epoch: 13, step: 1055, loss: 0.3190149962902069, mean loss: 0.3629409261446153
Epoch: 13, step: 1056, loss: 0.3266356289386749, mean loss: 0.3629390952253957
Epoch: 13, step: 1057, loss: 0.3248162269592285, mean loss: 0.36293717274086384
Epoch: 13, step: 1058, loss: 0.30826863646507263, mean loss: 0.3629344160197567
Epoch: 13, step: 1059, loss: 0.35582801699638367, mean loss: 0.36293405768983417
Epoch: 13, step: 1060, loss: 0.31224653124809265, mean loss: 0.36293150197327884
Epoch: 13, step: 1061, loss: 0.346157431602478, mean loss: 0.3629306562502592
Epoch: 13, step: 1062, loss: 0.3647785186767578, mean loss: 0.3629307494119646
Epoch: 13, step: 1063, loss: 0.3153024911880493, mean loss: 0.36292834831001747
Epoch: 13, step: 1064, loss: 0.34498846530914307, mean loss: 0.3629274439452949
Epoch: 13, step: 1065, loss: 0.3373773396015167, mean loss: 0.3629261560077839
Epoch: 13, step: 1066, loss: 0.3063557744026184, mean loss: 0.3629233045343424
Epoch: 13, step: 1067, loss: 0.3077748119831085, mean loss: 0.36292052487241944
Epoch: 13, step: 1068, loss: 0.34549176692962646, mean loss: 0.3629196464510726
Epoch: 13, step: 1069, loss: 0.3289550542831421, mean loss: 0.3629179346986198
Epoch: 13, step: 1070, loss: 0.3063928484916687, mean loss: 0.3629150860826743
Epoch: 13, step: 1071, loss: 0.33585038781166077, mean loss: 0.36291372220955037
Epoch: 13, step: 1072, loss: 0.3168897330760956, mean loss: 0.3629114030365026
Epoch: 13, step: 1073, loss: 0.3064444661140442, mean loss: 0.3629085577811906
Epoch: 13, step: 1074, loss: 0.371848464012146, mean loss: 0.3629090082223772
Epoch: 13, step: 1075, loss: 0.3339298963546753, mean loss: 0.3629075481703887
Epoch: 13, step: 1076, loss: 0.37325313687324524, mean loss: 0.36290806938499415
Epoch: 13, step: 1077, loss: 0.3421452045440674, mean loss: 0.36290702339684094
Epoch: 13, step: 1078, loss: 0.3443073630332947, mean loss: 0.36290608643344546
Epoch: 13, step: 1079, loss: 0.31854939460754395, mean loss: 0.36290385206452414
Epoch: 13, step: 1080, loss: 0.34121084213256836, mean loss: 0.36290275938281696
Epoch: 13, step: 1081, loss: 0.35062000155448914, mean loss: 0.3629021407287509
Epoch: 13, step: 1082, loss: 0.31335458159446716, mean loss: 0.36289964525863583
Epoch: 13, step: 1083, loss: 0.3227762281894684, mean loss: 0.3628976245385981
Epoch: 13, step: 1084, loss: 0.35462135076522827, mean loss: 0.362897207744834
Epoch: 13, step: 1085, loss: 0.3492587208747864, mean loss: 0.36289652094420605
Epoch: 13, step: 1086, loss: 0.35296347737312317, mean loss: 0.3628960207657695
Epoch: 13, step: 1087, loss: 0.3816260099411011, mean loss: 0.36289696386693643
Epoch: 13, step: 1088, loss: 0.31571587920188904, mean loss: 0.3628945883025306
Epoch: 13, step: 1089, loss: 0.35963526368141174, mean loss: 0.3628944242040198
Epoch: 13, step: 1090, loss: 0.3119456171989441, mean loss: 0.36289185919334643
Epoch: 13, step: 1091, loss: 0.3700201213359833, mean loss: 0.36289221804665606
Epoch: 13, step: 1092, loss: 0.34754496812820435, mean loss: 0.3628914454692627
Epoch: 13, step: 1093, loss: 0.35512372851371765, mean loss: 0.36289105446367753
Epoch: 13, step: 1094, loss: 0.340399831533432, mean loss: 0.3628899223741356
Epoch: 13, step: 1095, loss: 0.3281054198741913, mean loss: 0.3628881715938608
Epoch: 13, step: 1096, loss: 0.36438217759132385, mean loss: 0.3628882467866736
Epoch: 13, step: 1097, loss: 0.31470349431037903, mean loss: 0.36288582178654893
Epoch: 13, step: 1098, loss: 0.342608779668808, mean loss: 0.36288480135264434
Epoch: 13, step: 1099, loss: 0.37954381108283997, mean loss: 0.36288563966835136
Epoch: 13, step: 1100, loss: 0.34614479541778564, mean loss: 0.36288479727695344
Epoch: 13, step: 1101, loss: 0.3295263648033142, mean loss: 0.36288311878080404
Epoch: 13, step: 1102, loss: 0.34337127208709717, mean loss: 0.36288213705266853
Epoch: 13, step: 1103, loss: 0.33991381525993347, mean loss: 0.3628809814719786
Epoch: 13, step: 1104, loss: 0.3469371795654297, mean loss: 0.3628801793488259
Epoch: 13, step: 1105, loss: 0.3297780156135559, mean loss: 0.36287851408251465
Epoch: 13, step: 1106, loss: 0.3581400513648987, mean loss: 0.36287827571726905
Epoch: 13, step: 1107, loss: 0.37512585520744324, mean loss: 0.3628788917926961
Epoch: 13, step: 1108, loss: 0.3795629143714905, mean loss: 0.36287973098703136
Epoch: 13, step: 1109, loss: 0.31779879331588745, mean loss: 0.36287746356234213
Epoch: 13, step: 1110, loss: 0.3422568738460541, mean loss: 0.3628764264658418
Epoch: 13, step: 1111, loss: 0.3434008061885834, mean loss: 0.36287544700394897
Epoch: 13, step: 1112, loss: 0.30258047580718994, mean loss: 0.36287241482033333
Epoch: 13, step: 1113, loss: 0.34380489587783813, mean loss: 0.36287145597899056
Epoch: 13, step: 1114, loss: 0.32347598671913147, mean loss: 0.3628694750130701
Epoch: 13, step: 1115, loss: 0.332272469997406, mean loss: 0.3628679365474116
Epoch: 13, step: 1116, loss: 0.37480229139328003, mean loss: 0.36286853659542034
Epoch: 13, step: 1117, loss: 0.3315272033214569, mean loss: 0.3628669608622241
Epoch: 13, step: 1118, loss: 0.3566950857639313, mean loss: 0.36286665057741696
Epoch: 13, step: 1119, loss: 0.3174915015697479, mean loss: 0.36286436950216017
Epoch: 13, step: 1120, loss: 0.30336976051330566, mean loss: 0.36286137877130065
Epoch: 13, step: 1121, loss: 0.3714558780193329, mean loss: 0.36286181078594065
Epoch: 13, step: 1122, loss: 0.4127653241157532, mean loss: 0.3628643191304156
Epoch: 13, step: 1123, loss: 0.3992088735103607, mean loss: 0.36286614585711346
Epoch: 13, step: 1124, loss: 0.35014110803604126, mean loss: 0.36286550631156284
Epoch: 13, step: 1125, loss: 0.3277924060821533, mean loss: 0.3628637436670644
Epoch: 13, step: 1126, loss: 0.30488747358322144, mean loss: 0.36286083014024983
Epoch: 13, step: 1127, loss: 0.3551277220249176, mean loss: 0.3628604415418521
Epoch: 13, step: 1128, loss: 0.3379347026348114, mean loss: 0.3628591890550973
Epoch: 13, step: 1129, loss: 0.35183462500572205, mean loss: 0.3628586351125765
Epoch: 13, step: 1130, loss: 0.33438241481781006, mean loss: 0.3628572043624235
Epoch: 13, step: 1131, loss: 0.3554052710533142, mean loss: 0.362856829968668
Epoch: 13, step: 1132, loss: 0.3550645709037781, mean loss: 0.3628564384962207
Epoch: 13, step: 1133, loss: 0.32274025678634644, mean loss: 0.3628544232153149
Epoch: 13, step: 1134, loss: 0.3374731242656708, mean loss: 0.3628531482216469
Epoch: 13, step: 1135, loss: 0.3597487509250641, mean loss: 0.36285299228447104
Epoch: 13, step: 1136, loss: 0.3768143355846405, mean loss: 0.36285369354235947
Epoch: 13, step: 1137, loss: 0.39157938957214355, mean loss: 0.3628551363196588
Epoch: 13, step: 1138, loss: 0.39459457993507385, mean loss: 0.36285673038543226
Epoch: 13, step: 1139, loss: 0.35092175006866455, mean loss: 0.3628561309991166
Epoch: 13, step: 1140, loss: 0.40757283568382263, mean loss: 0.3628583766027266
Epoch: 13, step: 1141, loss: 0.3156028091907501, mean loss: 0.36285600362053255
Epoch: 13, step: 1142, loss: 0.35646089911460876, mean loss: 0.36285568250054734
Epoch: 13, step: 1143, loss: 0.42034968733787537, mean loss: 0.3628585693254538
Epoch: 13, step: 1144, loss: 0.3336847424507141, mean loss: 0.362857104555314
Epoch: 13, step: 1145, loss: 0.3673437237739563, mean loss: 0.3628573298098184
Epoch: 13, step: 1146, loss: 0.3242809474468231, mean loss: 0.3628553931472167
Epoch: 13, step: 1147, loss: 0.3184840679168701, mean loss: 0.3628531656710505
Epoch: 13, step: 1148, loss: 0.3300449550151825, mean loss: 0.3628515187552001
Epoch: 13, step: 1149, loss: 0.344383180141449, mean loss: 0.36285059172284323
Epoch: 13, step: 1150, loss: 0.32536348700523376, mean loss: 0.36284871012344966
Epoch: 13, step: 1151, loss: 0.3362760841846466, mean loss: 0.36284737642409515
Epoch: 13, step: 1152, loss: 0.36398619413375854, mean loss: 0.3628474335793127
Epoch: 13, step: 1153, loss: 0.3358064591884613, mean loss: 0.3628460765094346
Epoch: 13, step: 1154, loss: 0.3118847608566284, mean loss: 0.3628435191091409
Epoch: 13, step: 1155, loss: 0.31458336114883423, mean loss: 0.3628410973830289
Epoch: 13, step: 1156, loss: 0.33612900972366333, mean loss: 0.3628397570203584
Epoch: 13, step: 1157, loss: 0.3114757835865021, mean loss: 0.36283717980142044
Epoch: 13, step: 1158, loss: 0.3468383252620697, mean loss: 0.3628363770893368
Epoch: 13, step: 1159, loss: 0.3061160147190094, mean loss: 0.36283353139586044
Epoch: 13, step: 1160, loss: 0.32332584261894226, mean loss: 0.36283154937164047
Epoch: 13, step: 1161, loss: 0.33242183923721313, mean loss: 0.36283002385191865
Epoch: 13, step: 1162, loss: 0.3429301977157593, mean loss: 0.3628290256163462
Epoch: 13, step: 1163, loss: 0.34286871552467346, mean loss: 0.36282802439693956
Epoch: 13, step: 1164, loss: 0.3254043459892273, mean loss: 0.3628261473001643
Epoch: 13, step: 1165, loss: 0.3193124532699585, mean loss: 0.3628239648498669
Epoch: 13, step: 1166, loss: 0.32934069633483887, mean loss: 0.36282228556462115
Epoch: 13, step: 1167, loss: 0.313410222530365, mean loss: 0.36281980752735765
Epoch: 13, step: 1168, loss: 0.3244807720184326, mean loss: 0.3628178849038428
Epoch: 13, step: 1169, loss: 0.32677486538887024, mean loss: 0.3628160775114291
Epoch: 13, step: 1170, loss: 0.2909183204174042, mean loss: 0.36281247234886105
Epoch: 13, step: 1171, loss: 0.3411201238632202, mean loss: 0.3628113846859807
Epoch: 13, step: 1172, loss: 0.3822437822818756, mean loss: 0.36281235898518327
Epoch: 13, step: 1173, loss: 0.3074756860733032, mean loss: 0.362809584660862
Epoch: 13, step: 1174, loss: 0.35344985127449036, mean loss: 0.36280911543073285
Epoch: 13, step: 1175, loss: 0.32920485734939575, mean loss: 0.3628074308378874
Epoch: 13, step: 1176, loss: 0.34082576632499695, mean loss: 0.3628063289448345
Epoch: 13, step: 1177, loss: 0.35005030035972595, mean loss: 0.36280568954490544
Epoch: 13, step: 1178, loss: 0.31640881299972534, mean loss: 0.3628033640035017
Epoch: 13, step: 1179, loss: 0.3448205590248108, mean loss: 0.3628024627001247
Epoch: 13, step: 1180, loss: 0.35791322588920593, mean loss: 0.3628022176624456
Epoch: 13, step: 1181, loss: 0.3382156491279602, mean loss: 0.36280098550004536
Epoch: 13, step: 1182, loss: 0.34103700518608093, mean loss: 0.36279989484706043
Epoch: 13, step: 1183, loss: 0.3437967896461487, mean loss: 0.3627989425968499
Epoch: 13, step: 1184, loss: 0.32885053753852844, mean loss: 0.3627972415192802
Epoch: 13, step: 1185, loss: 0.31695908308029175, mean loss: 0.36279494478822305
Epoch: 13, step: 1186, loss: 0.30561673641204834, mean loss: 0.36279208000499863
Epoch: 13, step: 1187, loss: 0.30670663714408875, mean loss: 0.3627892701130717
Epoch: 13, step: 1188, loss: 0.31473860144615173, mean loss: 0.3627868628855447
Epoch: 13, step: 1189, loss: 0.42745324969291687, mean loss: 0.3627901023598863
Epoch: 13, step: 1190, loss: 0.2931656241416931, mean loss: 0.3627866146837746
Epoch: 13, step: 1191, loss: 0.338024377822876, mean loss: 0.3627853743393115
Epoch: 13, step: 1192, loss: 0.3361179530620575, mean loss: 0.3627840386307577
Epoch: 13, step: 1193, loss: 0.3271400034427643, mean loss: 0.362782253394096
Epoch: 13, step: 1194, loss: 0.36244967579841614, mean loss: 0.3627822367377332
Epoch: 13, step: 1195, loss: 0.3563578426837921, mean loss: 0.36278191500325535
Epoch: 13, step: 1196, loss: 0.32260990142822266, mean loss: 0.3627799032844124
Epoch: 13, step: 1197, loss: 0.32366618514060974, mean loss: 0.36277794466056945
Epoch: 13, step: 1198, loss: 0.35744866728782654, mean loss: 0.36277767780976716
Epoch: 13, step: 1199, loss: 0.29937809705734253, mean loss: 0.362774503386537
Epoch: 13, step: 1200, loss: 0.3170289099216461, mean loss: 0.362772213014862
Epoch: 13, step: 1201, loss: 0.33424991369247437, mean loss: 0.36277078504353316
Epoch: 13, step: 1202, loss: 0.33582428097724915, mean loss: 0.3627694360320655
Epoch: 13, step: 1203, loss: 0.3230009973049164, mean loss: 0.36276744522115606
Epoch: 13, step: 1204, loss: 0.37651461362838745, mean loss: 0.3627681333709487
Epoch: 13, step: 1205, loss: 0.3048727512359619, mean loss: 0.3627652354140894
Epoch: 13, step: 1206, loss: 0.32796308398246765, mean loss: 0.3627634934774844
Epoch: 13, step: 1207, loss: 0.37671053409576416, mean loss: 0.3627641915275654
Epoch: 13, step: 1208, loss: 0.33430588245391846, mean loss: 0.36276276725905665
Epoch: 13, step: 1209, loss: 0.31732264161109924, mean loss: 0.36276049320612663
Epoch: 13, step: 1210, loss: 0.3284040689468384, mean loss: 0.36275877392352346
Epoch: 13, step: 1211, loss: 0.352798730134964, mean loss: 0.3627582755226133
Epoch: 13, step: 1212, loss: 0.33664172887802124, mean loss: 0.3627569687151755
Epoch: 13, step: 1213, loss: 0.344780832529068, mean loss: 0.3627560692787607
Epoch: 13, step: 1214, loss: 0.3332243859767914, mean loss: 0.3627545917341916
Epoch: 13, step: 1215, loss: 0.30692145228385925, mean loss: 0.3627517984012193
Epoch: 13, step: 1216, loss: 0.3049907982349396, mean loss: 0.36274890876190935
Epoch: 13, step: 1217, loss: 0.3287038803100586, mean loss: 0.36274720565893526
Epoch: 13, step: 1218, loss: 0.336500346660614, mean loss: 0.36274589272516516
Epoch: 13, step: 1219, loss: 0.3397725224494934, mean loss: 0.3627447435970001
Epoch: 13, step: 1220, loss: 0.3300948143005371, mean loss: 0.36274311052896147
Epoch: 13, step: 1221, loss: 0.3358634412288666, mean loss: 0.3627417661421804
Epoch: 13, step: 1222, loss: 0.3679877519607544, mean loss: 0.36274202850706255
Epoch: 13, step: 1223, loss: 0.39292269945144653, mean loss: 0.36274353784247687
Epoch: 13, step: 1224, loss: 0.32113873958587646, mean loss: 0.36274145729048124
Epoch: 13, step: 1225, loss: 0.32636600732803345, mean loss: 0.3627396383360877
Epoch: 13, step: 1226, loss: 0.3295023441314697, mean loss: 0.3627379763882801
Epoch: 13, step: 1227, loss: 0.30848440527915955, mean loss: 0.36273526370972464
Epoch: 13, step: 1228, loss: 0.3742879033088684, mean loss: 0.36273584131282444
Epoch: 13, step: 1229, loss: 0.32546475529670715, mean loss: 0.36273397794486045
Epoch: 13, step: 1230, loss: 0.3368707001209259, mean loss: 0.36273268497491473
Epoch: 13, step: 1231, loss: 0.31057727336883545, mean loss: 0.36273007772578425
Epoch: 13, step: 1232, loss: 0.4258098900318146, mean loss: 0.36273323092809895
Epoch: 13, step: 1233, loss: 0.30800870060920715, mean loss: 0.36273049552220477
Epoch: 13, step: 1234, loss: 0.33442816138267517, mean loss: 0.36272908090061534
Epoch: 13, step: 1235, loss: 0.3329271674156189, mean loss: 0.36272759140074107
Epoch: 13, step: 1236, loss: 0.3673635721206665, mean loss: 0.36272782309551443
Epoch: 13, step: 1237, loss: 0.37084195017814636, mean loss: 0.36272822859911674
Epoch: 13, step: 1238, loss: 0.3496478199958801, mean loss: 0.36272757493820007
Epoch: 13, step: 1239, loss: 0.36774009466171265, mean loss: 0.3627278254139008
Epoch: 13, step: 1240, loss: 0.3297291398048401, mean loss: 0.362726176551381
Epoch: 13, step: 1241, loss: 0.3194810152053833, mean loss: 0.3627240158058356
Epoch: 13, step: 1242, loss: 0.33514344692230225, mean loss: 0.3627226378108876
Epoch: 13, step: 1243, loss: 0.3581121265888214, mean loss: 0.3627224074695995
Epoch: 13, step: 1244, loss: 0.34013277292251587, mean loss: 0.36272127894711625
Epoch: 13, step: 1245, loss: 0.3454514145851135, mean loss: 0.36272041623034323
Epoch: 13, step: 1246, loss: 0.31770336627960205, mean loss: 0.3627181675141261
Epoch: 13, step: 1247, loss: 0.3166040778160095, mean loss: 0.3627158641130423
Epoch: 13, step: 1248, loss: 0.3547965884208679, mean loss: 0.3627154685645836
Epoch: 13, step: 1249, loss: 0.35369154810905457, mean loss: 0.3627150178643311
Epoch: 13, step: 1250, loss: 0.33360034227371216, mean loss: 0.3627135638027224
Epoch: 13, step: 1251, loss: 0.3190736770629883, mean loss: 0.3627113844236403
Epoch: 13, step: 1252, loss: 0.3205379843711853, mean loss: 0.3627092783861845
Epoch: 13, step: 1253, loss: 0.3534272611141205, mean loss: 0.3627088148878687
Epoch: 13, step: 1254, loss: 0.3412884771823883, mean loss: 0.36270774531490696
Epoch: 13, step: 1255, loss: 0.31823858618736267, mean loss: 0.36270552496543984
Epoch: 13, step: 1256, loss: 0.33073365688323975, mean loss: 0.36270392868664
Epoch: 13, step: 1257, loss: 0.3237455487251282, mean loss: 0.36270198368514417
Epoch: 13, step: 1258, loss: 0.37168028950691223, mean loss: 0.3627024319056934
Epoch: 13, step: 1259, loss: 0.36514416337013245, mean loss: 0.36270255379724015
Epoch: 13, step: 1260, loss: 0.3559749722480774, mean loss: 0.36270221797227387
Epoch: 13, step: 1261, loss: 0.3786095976829529, mean loss: 0.36270301199142685
Epoch: 13, step: 1262, loss: 0.35906872153282166, mean loss: 0.3627028305943488
Epoch: 13, step: 1263, loss: 0.32076939940452576, mean loss: 0.36270073769001715
Epoch: 13, step: 1264, loss: 0.347078800201416, mean loss: 0.3626999580355036
Epoch: 13, step: 1265, loss: 0.3519062101840973, mean loss: 0.36269941937157246
Epoch: 13, step: 1266, loss: 0.3173515200614929, mean loss: 0.3626971563894221
Epoch: 13, step: 1267, loss: 0.33102673292160034, mean loss: 0.3626955760289696
Epoch: 13, step: 1268, loss: 0.31071901321411133, mean loss: 0.36269298251752735
Epoch: 13, step: 1269, loss: 0.394562691450119, mean loss: 0.3626945726636671
Epoch: 13, step: 1270, loss: 0.33715036511421204, mean loss: 0.36269329819340074
Epoch: 13, step: 1271, loss: 0.33156293630599976, mean loss: 0.36269174509212915
Epoch: 13, step: 1272, loss: 0.3387584388256073, mean loss: 0.36269055111326826
Epoch: 13, step: 1273, loss: 0.30240824818611145, mean loss: 0.36268754391467867
Epoch: 13, step: 1274, loss: 0.35706889629364014, mean loss: 0.3626872636409409
Epoch: 13, step: 1275, loss: 0.325589120388031, mean loss: 0.3626854131748968
Epoch: 13, step: 1276, loss: 0.33948513865470886, mean loss: 0.3626842559962584
Epoch: 13, step: 1277, loss: 0.3143153190612793, mean loss: 0.3626818435804512
Epoch: 13, step: 1278, loss: 0.3624631464481354, mean loss: 0.36268183267340753
Epoch: 13, step: 1279, loss: 0.3528378903865814, mean loss: 0.36268134175268707
Epoch: 13, step: 1280, loss: 0.3638186454772949, mean loss: 0.36268139846757885
Epoch: 13, step: 1281, loss: 0.30252471566200256, mean loss: 0.3626783987327227
Epoch: 13, step: 1282, loss: 0.3244306147098541, mean loss: 0.36267649158816906
Epoch: 13, step: 1283, loss: 0.33738642930984497, mean loss: 0.36267523061577783
Epoch: 13, step: 1284, loss: 0.3379824757575989, mean loss: 0.36267399948675266
Epoch: 13, step: 1285, loss: 0.2914851903915405, mean loss: 0.3626704503388269
Epoch: 13, step: 1286, loss: 0.3399892747402191, mean loss: 0.3626693196156802
Epoch: 13, step: 1287, loss: 0.33313342928886414, mean loss: 0.36266784723829604
Epoch: 13, step: 1288, loss: 0.32592514157295227, mean loss: 0.3626660156892374
Epoch: 13, step: 1289, loss: 0.32405537366867065, mean loss: 0.3626640911232908
Epoch: 13, step: 1290, loss: 0.3846478760242462, mean loss: 0.36266518686096216
Epoch: 13, step: 1291, loss: 0.341537207365036, mean loss: 0.36266413383168106
Epoch: 13, step: 1292, loss: 0.3257552981376648, mean loss: 0.36266229436815284
Epoch: 13, step: 1293, loss: 0.34372860193252563, mean loss: 0.3626613507973148
Epoch: 13, step: 1294, loss: 0.34066087007522583, mean loss: 0.36266025444605543
Epoch: 13, step: 1295, loss: 0.34389039874076843, mean loss: 0.36265931913333344
Epoch: 13, step: 1296, loss: 0.3666800260543823, mean loss: 0.36265951947749214
Epoch: 13, step: 1297, loss: 0.3231358528137207, mean loss: 0.3626575501866768
Epoch: 13, step: 1298, loss: 0.3819062411785126, mean loss: 0.3626585092166699
Epoch: 13, step: 1299, loss: 0.3515596389770508, mean loss: 0.36265795626378833
Epoch: 13, step: 1300, loss: 0.34851527214050293, mean loss: 0.3626572517012355
Epoch: 13, step: 1301, loss: 0.33946022391319275, mean loss: 0.3626560961254764
Epoch: 13, step: 1302, loss: 0.3430868089199066, mean loss: 0.36265512131664923
Epoch: 13, step: 1303, loss: 0.3260045051574707, mean loss: 0.3626532957230968
Epoch: 13, step: 1304, loss: 0.3114995062351227, mean loss: 0.3626507478429609
Epoch: 13, step: 1305, loss: 0.3569883704185486, mean loss: 0.36265046582396376
Epoch: 13, step: 1306, loss: 0.3390953242778778, mean loss: 0.36264929270072327
Epoch: 13, step: 1307, loss: 0.32731905579566956, mean loss: 0.3626475332267738
Epoch: 13, step: 1308, loss: 0.3520612120628357, mean loss: 0.3626470060457985
Epoch: 13, step: 1309, loss: 0.30655622482299805, mean loss: 0.3626442129583957
Epoch: 13, step: 1310, loss: 0.3753473460674286, mean loss: 0.36264484549004483
Epoch: 13, step: 1311, loss: 0.4077616035938263, mean loss: 0.3626470918930574
Epoch: 13, step: 1312, loss: 0.3601216673851013, mean loss: 0.36264696615621356
Epoch: 13, step: 1313, loss: 0.3275323212146759, mean loss: 0.3626452179412907
Epoch: 13, step: 1314, loss: 0.35688239336013794, mean loss: 0.36264493104804724
Epoch: 13, step: 1315, loss: 0.3392831087112427, mean loss: 0.36264376807401616
Epoch: 13, step: 1316, loss: 0.36480507254600525, mean loss: 0.36264387566048
Epoch: 13, step: 1317, loss: 0.34137409925460815, mean loss: 0.3626428169359202
Epoch: 13, step: 1318, loss: 0.29392209649086, mean loss: 0.3626393964630495
Epoch: 13, step: 1319, loss: 0.33584699034690857, mean loss: 0.36263806297678053
Epoch: 13, step: 1320, loss: 0.37601351737976074, mean loss: 0.36263872865410113
Epoch: 13, step: 1321, loss: 0.3633129894733429, mean loss: 0.36263876220943203
Epoch: 13, step: 1322, loss: 0.34257346391677856, mean loss: 0.3626377636874966
Epoch: 13, step: 1323, loss: 0.3589378595352173, mean loss: 0.36263757957602405
Epoch: 13, step: 1324, loss: 0.33762621879577637, mean loss: 0.36263633504396553
Epoch: 13, step: 1325, loss: 0.3662756383419037, mean loss: 0.3626365161218488
Epoch: 13, step: 1326, loss: 0.3306950330734253, mean loss: 0.36263492691427385
Epoch: 13, step: 1327, loss: 0.3162047564983368, mean loss: 0.36263261695554666
Epoch: 13, step: 1328, loss: 0.33240482211112976, mean loss: 0.3626311131599721
Epoch: 13, step: 1329, loss: 0.3255743086338043, mean loss: 0.3626292697212831
Epoch: 13, step: 1330, loss: 0.37172093987464905, mean loss: 0.36262972197568066
Epoch: 13, step: 1331, loss: 0.39222127199172974, mean loss: 0.36263119389917925
Epoch: 13, step: 1332, loss: 0.3076101243495941, mean loss: 0.3626284572133026
Epoch: 13, step: 1333, loss: 0.3106703460216522, mean loss: 0.3626258730040521
Epoch: 13, step: 1334, loss: 0.3307805359363556, mean loss: 0.3626242892104942
Epoch: 13, step: 1335, loss: 0.294622004032135, mean loss: 0.3626209073582375
Epoch: 13, step: 1336, loss: 0.3236972689628601, mean loss: 0.36261897172551605
Epoch: 13, step: 1337, loss: 0.3283793330192566, mean loss: 0.3626172691079772
Epoch: 13, step: 1338, loss: 0.32364019751548767, mean loss: 0.3626153310108367
Epoch: 13, step: 1339, loss: 0.3312036991119385, mean loss: 0.3626137691755195
Epoch: 13, step: 1340, loss: 0.3775186538696289, mean loss: 0.3626145102327807
Epoch: 13, step: 1341, loss: 0.3373427987098694, mean loss: 0.3626132538088211
Epoch: 13, step: 1342, loss: 0.3405134081840515, mean loss: 0.36261215513392053
Epoch: 13, step: 1343, loss: 0.36435699462890625, mean loss: 0.3626122418728097
Epoch: 13, step: 1344, loss: 0.3041495978832245, mean loss: 0.3626093357414785
Epoch: 13, step: 1345, loss: 0.36329156160354614, mean loss: 0.36260936965269547
Epoch: 13, step: 1346, loss: 0.35372740030288696, mean loss: 0.36260892818098467
Epoch: 13, step: 1347, loss: 0.2983320355415344, mean loss: 0.3626057335044121
Epoch: 13, step: 1348, loss: 0.3264528214931488, mean loss: 0.36260393672930097
Epoch: 13, step: 1349, loss: 0.31417354941368103, mean loss: 0.3626015298916449
Epoch: 13, step: 1350, loss: 0.3450925052165985, mean loss: 0.3626006597915269
Epoch: 13, step: 1351, loss: 0.3365730345249176, mean loss: 0.36259936642911056
Epoch: 13, step: 1352, loss: 0.3162393569946289, mean loss: 0.3625970628261573
Epoch: 13, step: 1353, loss: 0.31872132420539856, mean loss: 0.3625948827735576
Epoch: 13, step: 1354, loss: 0.33517831563949585, mean loss: 0.3625935205950345
Epoch: 13, step: 1355, loss: 0.33185654878616333, mean loss: 0.36259199351972604
Epoch: 13, step: 1356, loss: 0.36858242750167847, mean loss: 0.3625922911218912
Epoch: 13, step: 1357, loss: 0.3521174490451813, mean loss: 0.3625917707621258
Epoch: 13, step: 1358, loss: 0.346981406211853, mean loss: 0.3625909953230244
Epoch: 13, step: 1359, loss: 0.32924336194992065, mean loss: 0.36258933887391986
Epoch: 13, step: 1360, loss: 0.3787692189216614, mean loss: 0.3625901425236515
Epoch: 13, step: 1361, loss: 0.3253655731678009, mean loss: 0.36258829368241996
Epoch: 13, step: 1362, loss: 0.37631943821907043, mean loss: 0.36258897563645703
Epoch: 13, step: 1363, loss: 0.3524778485298157, mean loss: 0.3625884734946659
Epoch: 13, step: 1364, loss: 0.3596319556236267, mean loss: 0.36258832667449054
Epoch: 13, step: 1365, loss: 0.32423362135887146, mean loss: 0.3625864220809204
Epoch: 13, step: 1366, loss: 0.3184942901134491, mean loss: 0.3625842326905849
Epoch: 13, step: 1367, loss: 0.3232419490814209, mean loss: 0.36258227925048514
Epoch: 13, step: 1368, loss: 0.32103973627090454, mean loss: 0.3625802166645669
Epoch: 13, step: 1369, loss: 0.33791643381118774, mean loss: 0.36257899216934036
Epoch: 13, step: 1370, loss: 0.37188467383384705, mean loss: 0.36257945415026
Epoch: 13, step: 1371, loss: 0.3450078070163727, mean loss: 0.36257858184847613
Epoch: 13, step: 1372, loss: 0.36591753363609314, mean loss: 0.3625787475944075
Epoch: 13, step: 1373, loss: 0.3164699375629425, mean loss: 0.362576458861655
Epoch: 13, step: 1374, loss: 0.39349496364593506, mean loss: 0.3625779935072491
Epoch: 13, step: 1375, loss: 0.36599674820899963, mean loss: 0.3625781631893368
Epoch: 13, step: 1376, loss: 0.331283837556839, mean loss: 0.362576610043988
Epoch: 13, step: 1377, loss: 0.3368397355079651, mean loss: 0.362575332779743
Epoch: 13, step: 1378, loss: 0.3310728669166565, mean loss: 0.3625737694595176
Epoch: 13, step: 1379, loss: 0.30188578367233276, mean loss: 0.3625707579477179
Epoch: 13, step: 1380, loss: 0.3585936725139618, mean loss: 0.3625705606031323
Epoch: 13, step: 1381, loss: 0.31985512375831604, mean loss: 0.36256844115107095
Epoch: 13, step: 1382, loss: 0.3618602156639099, mean loss: 0.3625684060121234
Epoch: 13, step: 1383, loss: 0.3284425437450409, mean loss: 0.36256671292508896
Epoch: 13, step: 1384, loss: 0.30095794796943665, mean loss: 0.36256365647993566
Epoch: 13, step: 1385, loss: 0.33298352360725403, mean loss: 0.3625621890658632
Epoch: 13, step: 1386, loss: 0.36875489354133606, mean loss: 0.3625624962589023
Epoch: 13, step: 1387, loss: 0.3743915557861328, mean loss: 0.36256308301780743
Epoch: 13, step: 1388, loss: 0.3085433542728424, mean loss: 0.3625604036006781
Epoch: 13, step: 1389, loss: 0.3872816562652588, mean loss: 0.36256162973165046
Epoch: 13, step: 1390, loss: 0.340839684009552, mean loss: 0.36256055241449914
Epoch: 13, step: 1391, loss: 0.3021443486213684, mean loss: 0.3625575561734858
Epoch: 13, step: 1392, loss: 0.37908047437667847, mean loss: 0.36255837555946163
Epoch: 13, step: 1393, loss: 0.3298381268978119, mean loss: 0.3625567530141546
Epoch: 13, step: 1394, loss: 0.30405378341674805, mean loss: 0.36255385208840474
Epoch: 13, step: 1395, loss: 0.33577191829681396, mean loss: 0.36255252414642775
Epoch: 13, step: 1396, loss: 0.32535549998283386, mean loss: 0.36255067987927697
Epoch: 13, step: 1397, loss: 0.3234827220439911, mean loss: 0.3625487429453238
Epoch: 13, step: 1398, loss: 0.34633588790893555, mean loss: 0.3625479391748099
Epoch: 13, step: 1399, loss: 0.3919045329093933, mean loss: 0.3625493944887963
Epoch: 13, step: 1400, loss: 0.35411733388900757, mean loss: 0.36254897650135764
Epoch: 13, step: 1401, loss: 0.3383646309375763, mean loss: 0.3625477777135335
Epoch: 13, step: 1402, loss: 0.33490410447120667, mean loss: 0.36254640751907297
Epoch: 13, step: 1403, loss: 0.30808958411216736, mean loss: 0.3625437084298875
Epoch: 13, step: 1404, loss: 0.31432974338531494, mean loss: 0.3625413188791592
Epoch: 13, step: 1405, loss: 0.3282725214958191, mean loss: 0.36253962055438055
Epoch: 13, step: 1406, loss: 0.30622008442878723, mean loss: 0.36253682955700084
Epoch: 13, step: 1407, loss: 0.31650304794311523, mean loss: 0.36253454839834803
Epoch: 13, step: 1408, loss: 0.3192892372608185, mean loss: 0.3625324055257878
Epoch: 13, step: 1409, loss: 0.380944162607193, mean loss: 0.3625333178118388
Epoch: 13, step: 1410, loss: 0.3250638544559479, mean loss: 0.3625314613255208
Epoch: 13, step: 1411, loss: 0.29768702387809753, mean loss: 0.36252824866016964
Epoch: 13, step: 1412, loss: 0.3373027443885803, mean loss: 0.36252699894482304
Epoch: 13, step: 1413, loss: 0.3492795526981354, mean loss: 0.3625263426758125
Epoch: 13, step: 1414, loss: 0.33402934670448303, mean loss: 0.36252493102494954
Epoch: 13, step: 1415, loss: 0.34100356698036194, mean loss: 0.3625238649775925
Epoch: 13, step: 1416, loss: 0.3405226767063141, mean loss: 0.36252277521642196
Epoch: 13, step: 1417, loss: 0.3526270389556885, mean loss: 0.3625222850858494
Epoch: 13, step: 1418, loss: 0.3065754473209381, mean loss: 0.362519514205865
Epoch: 13, step: 1419, loss: 0.30760014057159424, mean loss: 0.36251679434782047
Epoch: 13, step: 1420, loss: 0.3239876329898834, mean loss: 0.362514886302391
Epoch: 13, step: 1421, loss: 0.31507354974746704, mean loss: 0.36251253702356784
Epoch: 13, step: 1422, loss: 0.30865779519081116, mean loss: 0.3625098702871562
Epoch: 13, step: 1423, loss: 0.29582828283309937, mean loss: 0.3625065685646639
Epoch: 13, step: 1424, loss: 0.30569523572921753, mean loss: 0.36250375570469284
Epoch: 13, step: 1425, loss: 0.3252629041671753, mean loss: 0.3625019119156277
Epoch: 13, step: 1426, loss: 0.33625364303588867, mean loss: 0.36250061243204534
Epoch: 13, step: 1427, loss: 0.32388392090797424, mean loss: 0.3624987007146432
Epoch: 13, step: 1428, loss: 0.3591345250606537, mean loss: 0.3624985341795383
Epoch: 13, step: 1429, loss: 0.36225274205207825, mean loss: 0.36249852201281585
Epoch: 13, step: 1430, loss: 0.32899048924446106, mean loss: 0.3624968634456343
Epoch: 13, step: 1431, loss: 0.3359469473361969, mean loss: 0.3624955493535679
Epoch: 13, step: 1432, loss: 0.33052873611450195, mean loss: 0.36249396722967586
Epoch: 13, step: 1433, loss: 0.31887906789779663, mean loss: 0.36249180871738584
Epoch: 13, step: 1434, loss: 0.37625178694725037, mean loss: 0.36249248966845377
Epoch: 13, step: 1435, loss: 0.34015482664108276, mean loss: 0.3624913842813285
Epoch: 13, step: 1436, loss: 0.3216971158981323, mean loss: 0.36248936566247636
Epoch: 13, step: 1437, loss: 0.33840930461883545, mean loss: 0.3624881741700942
Epoch: 13, step: 1438, loss: 0.3425742983818054, mean loss: 0.36248718887120807
Epoch: 13, step: 1439, loss: 0.3123418986797333, mean loss: 0.3624847079049409
Epoch: 13, step: 1440, loss: 0.355199933052063, mean loss: 0.36248434750446334
Epoch: 13, step: 1441, loss: 0.4235227406024933, mean loss: 0.3624873671142931
Epoch: 13, step: 1442, loss: 0.3840895891189575, mean loss: 0.3624884357376918
Epoch: 13, step: 1443, loss: 0.33324193954467773, mean loss: 0.36248698903724696
Valid: 13, mean loss: 0.1919595425327619
Epoch: 14, step: 0, loss: 0.32120153307914734, mean loss: 0.3624849469214059
Epoch: 14, step: 1, loss: 0.3701596260070801, mean loss: 0.36248532651775994
Epoch: 14, step: 2, loss: 0.3821339011192322, mean loss: 0.3624862983054152
Epoch: 14, step: 3, loss: 0.3402545154094696, mean loss: 0.3624851988107121
Epoch: 14, step: 4, loss: 0.3373081386089325, mean loss: 0.3624839537159986
Epoch: 14, step: 5, loss: 0.31940677762031555, mean loss: 0.36248182350256297
Epoch: 14, step: 6, loss: 0.3377067744731903, mean loss: 0.36248059840989477
Epoch: 14, step: 7, loss: 0.3410998582839966, mean loss: 0.36247954121348824
Epoch: 14, step: 8, loss: 0.33948472142219543, mean loss: 0.36247840426318956
Epoch: 14, step: 9, loss: 0.30099204182624817, mean loss: 0.36247536429668914
Epoch: 14, step: 10, loss: 0.3383549451828003, mean loss: 0.3624741718104522
Epoch: 14, step: 11, loss: 0.38868170976638794, mean loss: 0.3624754674174305
Epoch: 14, step: 12, loss: 0.3744819760322571, mean loss: 0.36247606094694823
Epoch: 14, step: 13, loss: 0.38651764392852783, mean loss: 0.36247724935935466
Epoch: 14, step: 14, loss: 0.3100120723247528, mean loss: 0.3624746560531891
Epoch: 14, step: 15, loss: 0.33382120728492737, mean loss: 0.3624732398091812
Epoch: 14, step: 16, loss: 0.287441223859787, mean loss: 0.36246953141122
Epoch: 14, step: 17, loss: 0.3910139799118042, mean loss: 0.3624709421282557
Epoch: 14, step: 18, loss: 0.36007362604141235, mean loss: 0.36247082365451777
Epoch: 14, step: 19, loss: 0.3204152286052704, mean loss: 0.36246874539818996
Epoch: 14, step: 20, loss: 0.3311656415462494, mean loss: 0.36246719857287735
Epoch: 14, step: 21, loss: 0.34699082374572754, mean loss: 0.36246643385428723
Epoch: 14, step: 22, loss: 0.37398573756217957, mean loss: 0.36246700301796664
Epoch: 14, step: 23, loss: 0.38587114214897156, mean loss: 0.3624681593489514
Epoch: 14, step: 24, loss: 0.40108412504196167, mean loss: 0.36247006715813535
Epoch: 14, step: 25, loss: 0.3565576374530792, mean loss: 0.36246977507090555
Epoch: 14, step: 26, loss: 0.3558712303638458, mean loss: 0.36246944910416606
Epoch: 14, step: 27, loss: 0.3155005872249603, mean loss: 0.3624671289667486
Epoch: 14, step: 28, loss: 0.3617528975009918, mean loss: 0.362467093687348
Epoch: 14, step: 29, loss: 0.3687405288219452, mean loss: 0.36246740354782087
Epoch: 14, step: 30, loss: 0.3339534401893616, mean loss: 0.362465995242227
Epoch: 14, step: 31, loss: 0.368679404258728, mean loss: 0.3624663021075478
Epoch: 14, step: 32, loss: 0.35399743914604187, mean loss: 0.3624658838714393
Epoch: 14, step: 33, loss: 0.34989431500434875, mean loss: 0.36246526305322363
Epoch: 14, step: 34, loss: 0.35601431131362915, mean loss: 0.36246494450343647
Epoch: 14, step: 35, loss: 0.32758161425590515, mean loss: 0.36246322203996384
Epoch: 14, step: 36, loss: 0.34912264347076416, mean loss: 0.3624625633435451
Epoch: 14, step: 37, loss: 0.3748297393321991, mean loss: 0.36246317394767213
Epoch: 14, step: 38, loss: 0.3708336651325226, mean loss: 0.3624635872032231
Epoch: 14, step: 39, loss: 0.3073749244213104, mean loss: 0.3624608675812453
Epoch: 14, step: 40, loss: 0.35134419798851013, mean loss: 0.36246031879960966
Epoch: 14, step: 41, loss: 0.30066221952438354, mean loss: 0.36245726824677743
Epoch: 14, step: 42, loss: 0.3459291160106659, mean loss: 0.3624564524043254
Epoch: 14, step: 43, loss: 0.3362656533718109, mean loss: 0.36245515966992103
Epoch: 14, step: 44, loss: 0.30403226613998413, mean loss: 0.3624522761551128
Epoch: 14, step: 45, loss: 0.322750449180603, mean loss: 0.3624503167322041
Epoch: 14, step: 46, loss: 0.31809359788894653, mean loss: 0.36244812768226864
Epoch: 14, step: 47, loss: 0.34951552748680115, mean loss: 0.362447489476574
Epoch: 14, step: 48, loss: 0.3758195638656616, mean loss: 0.362448149337141
Epoch: 14, step: 49, loss: 0.31746476888656616, mean loss: 0.36244592968943296
Epoch: 14, step: 50, loss: 0.324240118265152, mean loss: 0.36244404456526935
Epoch: 14, step: 51, loss: 0.31641268730163574, mean loss: 0.3624417734306106
Epoch: 14, step: 52, loss: 0.354610800743103, mean loss: 0.3624413870784133
Epoch: 14, step: 53, loss: 0.36926183104515076, mean loss: 0.36244172355813536
Epoch: 14, step: 54, loss: 0.33043476939201355, mean loss: 0.3624401446052388
Epoch: 14, step: 55, loss: 0.3576017916202545, mean loss: 0.3624399059335249
Epoch: 14, step: 56, loss: 0.3122401833534241, mean loss: 0.36243742974733734
Epoch: 14, step: 57, loss: 0.2840422987937927, mean loss: 0.3624335629656981
Epoch: 14, step: 58, loss: 0.3613949716091156, mean loss: 0.36243351174047705
Epoch: 14, step: 59, loss: 0.3530094623565674, mean loss: 0.3624330469520876
Epoch: 14, step: 60, loss: 0.3264448940753937, mean loss: 0.362431272125788
Epoch: 14, step: 61, loss: 0.32349205017089844, mean loss: 0.36242935185643427
Epoch: 14, step: 62, loss: 0.3059278726577759, mean loss: 0.3624265656500533
Epoch: 14, step: 63, loss: 0.3663586974143982, mean loss: 0.36242675954215214
Epoch: 14, step: 64, loss: 0.36819300055503845, mean loss: 0.36242704385954344
Epoch: 14, step: 65, loss: 0.33746156096458435, mean loss: 0.3624258129413453
Epoch: 14, step: 66, loss: 0.36762675642967224, mean loss: 0.362426069360193
Epoch: 14, step: 67, loss: 0.4363701045513153, mean loss: 0.3624297147967534
Epoch: 14, step: 68, loss: 0.38100701570510864, mean loss: 0.36243063061143954
Epoch: 14, step: 69, loss: 0.29825687408447266, mean loss: 0.36242746716095514
Epoch: 14, step: 70, loss: 0.33586040139198303, mean loss: 0.3624261575998683
Epoch: 14, step: 71, loss: 0.33248791098594666, mean loss: 0.3624246819370817
Epoch: 14, step: 72, loss: 0.3338077664375305, mean loss: 0.3624232714725197
Epoch: 14, step: 73, loss: 0.34977880120277405, mean loss: 0.362422648285222
Epoch: 14, step: 74, loss: 0.35083553194999695, mean loss: 0.3624220772381403
Epoch: 14, step: 75, loss: 0.3205440640449524, mean loss: 0.36242001346851715
Epoch: 14, step: 76, loss: 0.33513516187667847, mean loss: 0.36241866892352176
Epoch: 14, step: 77, loss: 0.32359370589256287, mean loss: 0.3624167557983108
Epoch: 14, step: 78, loss: 0.32482194900512695, mean loss: 0.36241490338112464
Epoch: 14, step: 79, loss: 0.34702548384666443, mean loss: 0.3624141451322315
Epoch: 14, step: 80, loss: 0.40451979637145996, mean loss: 0.3624162196088162
Epoch: 14, step: 81, loss: 0.30729347467422485, mean loss: 0.36241350393510774
Epoch: 14, step: 82, loss: 0.33973929286003113, mean loss: 0.36241238692387195
Epoch: 14, step: 83, loss: 0.3310978412628174, mean loss: 0.36241084433541576
Epoch: 14, step: 84, loss: 0.34535157680511475, mean loss: 0.36241000401880424
Epoch: 14, step: 85, loss: 0.34132012724876404, mean loss: 0.3624089652109641
Epoch: 14, step: 86, loss: 0.3309559226036072, mean loss: 0.3624074160289414
Epoch: 14, step: 87, loss: 0.3384498357772827, mean loss: 0.36240623608507555
Epoch: 14, step: 88, loss: 0.3392398953437805, mean loss: 0.36240509516703856
Epoch: 14, step: 89, loss: 0.3626547157764435, mean loss: 0.36240510745998694
Epoch: 14, step: 90, loss: 0.33937785029411316, mean loss: 0.36240397350336284
Epoch: 14, step: 91, loss: 0.35530975461006165, mean loss: 0.36240362417211935
Epoch: 14, step: 92, loss: 0.31205499172210693, mean loss: 0.3624011450430411
Epoch: 14, step: 93, loss: 0.34514763951301575, mean loss: 0.36240029553513714
Epoch: 14, step: 94, loss: 0.34676194190979004, mean loss: 0.3623995255901012
Epoch: 14, step: 95, loss: 0.32240888476371765, mean loss: 0.36239755677162805
Epoch: 14, step: 96, loss: 0.38567212224006653, mean loss: 0.36239870256818535
Epoch: 14, step: 97, loss: 0.3409475088119507, mean loss: 0.3623976465873959
Epoch: 14, step: 98, loss: 0.3522098660469055, mean loss: 0.36239714509684506
Epoch: 14, step: 99, loss: 0.3860333561897278, mean loss: 0.3623983085252312
Epoch: 14, step: 100, loss: 0.3016842007637024, mean loss: 0.36239532018503523
Epoch: 14, step: 101, loss: 0.32232797145843506, mean loss: 0.36239334817259666
Epoch: 14, step: 102, loss: 0.31081271171569824, mean loss: 0.36239080963051995
Epoch: 14, step: 103, loss: 0.33253341913223267, mean loss: 0.3623893402707513
Epoch: 14, step: 104, loss: 0.3349069654941559, mean loss: 0.3623879878582334
Epoch: 14, step: 105, loss: 0.3330788314342499, mean loss: 0.36238654562044065
Epoch: 14, step: 106, loss: 0.32111525535583496, mean loss: 0.3623845148528244
Epoch: 14, step: 107, loss: 0.35419419407844543, mean loss: 0.36238411186518543
Epoch: 14, step: 108, loss: 0.346849262714386, mean loss: 0.362383347542964
Epoch: 14, step: 109, loss: 0.3777382969856262, mean loss: 0.3623841029768635
Epoch: 14, step: 110, loss: 0.2998661696910858, mean loss: 0.3623810273664298
Epoch: 14, step: 111, loss: 0.31248489022254944, mean loss: 0.3623785728142287
Epoch: 14, step: 112, loss: 0.3402828872203827, mean loss: 0.3623774859095313
Epoch: 14, step: 113, loss: 0.32841166853904724, mean loss: 0.3623758151856075
Epoch: 14, step: 114, loss: 0.3259345591068268, mean loss: 0.36237402278700054
Epoch: 14, step: 115, loss: 0.34402135014533997, mean loss: 0.3623731201373526
Epoch: 14, step: 116, loss: 0.3410308361053467, mean loss: 0.3623720704996193
Epoch: 14, step: 117, loss: 0.32358744740486145, mean loss: 0.3623701631216762
Epoch: 14, step: 118, loss: 0.34581896662712097, mean loss: 0.36236934919512126
Epoch: 14, step: 119, loss: 0.3123425245285034, mean loss: 0.3623668891821066
Epoch: 14, step: 120, loss: 0.37505945563316345, mean loss: 0.36236751329414135
Epoch: 14, step: 121, loss: 0.3566136360168457, mean loss: 0.3623672303815011
Epoch: 14, step: 122, loss: 0.29971423745155334, mean loss: 0.36236414994524907
Epoch: 14, step: 123, loss: 0.2936672270298004, mean loss: 0.36236077251541055
Epoch: 14, step: 124, loss: 0.3182302415370941, mean loss: 0.3623586029794498
Epoch: 14, step: 125, loss: 0.35676109790802, mean loss: 0.36235832780960064
Epoch: 14, step: 126, loss: 0.29547372460365295, mean loss: 0.3623550399659588
Epoch: 14, step: 127, loss: 0.3829779326915741, mean loss: 0.36235605367480295
Epoch: 14, step: 128, loss: 0.3175889551639557, mean loss: 0.3623538532767439
Epoch: 14, step: 129, loss: 0.3770405054092407, mean loss: 0.3623545751214373
Epoch: 14, step: 130, loss: 0.3473794460296631, mean loss: 0.36235383913435854
Epoch: 14, step: 131, loss: 0.3161756992340088, mean loss: 0.3623515697152559
Epoch: 14, step: 132, loss: 0.331589013338089, mean loss: 0.36235005796743647
Epoch: 14, step: 133, loss: 0.3191714882850647, mean loss: 0.36234793617040045
Epoch: 14, step: 134, loss: 0.31283411383628845, mean loss: 0.36234550317829517
Epoch: 14, step: 135, loss: 0.3009338080883026, mean loss: 0.36234248570113864
Epoch: 14, step: 136, loss: 0.3408488929271698, mean loss: 0.36234142966061517
Epoch: 14, step: 137, loss: 0.3447248041629791, mean loss: 0.3623405641488977
Epoch: 14, step: 138, loss: 0.3139544725418091, mean loss: 0.36233818703803516
Epoch: 14, step: 139, loss: 0.3132350444793701, mean loss: 0.36233577481841645
Epoch: 14, step: 140, loss: 0.3936575949192047, mean loss: 0.3623373134449381
Epoch: 14, step: 141, loss: 0.3211040794849396, mean loss: 0.36233528803802384
Epoch: 14, step: 142, loss: 0.31646284461021423, mean loss: 0.362333034860391
Epoch: 14, step: 143, loss: 0.30499792098999023, mean loss: 0.3623302187938944
Epoch: 14, step: 144, loss: 0.3612663745880127, mean loss: 0.36233016654478056
Epoch: 14, step: 145, loss: 0.3258735239505768, mean loss: 0.36232837611935115
Epoch: 14, step: 146, loss: 0.3063735067844391, mean loss: 0.36232562824971826
Epoch: 14, step: 147, loss: 0.2909873127937317, mean loss: 0.36232212509142636
Epoch: 14, step: 148, loss: 0.3061041533946991, mean loss: 0.3623193645723153
Epoch: 14, step: 149, loss: 0.3195746839046478, mean loss: 0.362317265746789
Epoch: 14, step: 150, loss: 0.2917330861091614, mean loss: 0.36231380013184145
Epoch: 14, step: 151, loss: 0.3228012025356293, mean loss: 0.36231186019676703
Epoch: 14, step: 152, loss: 0.29927492141723633, mean loss: 0.3623087654479438
Epoch: 14, step: 153, loss: 0.3385516107082367, mean loss: 0.36230759916641514
Epoch: 14, step: 154, loss: 0.398286908864975, mean loss: 0.362309365368845
Epoch: 14, step: 155, loss: 0.3430560231208801, mean loss: 0.3623084202803781
Epoch: 14, step: 156, loss: 0.32823410630226135, mean loss: 0.36230674775723576
Epoch: 14, step: 157, loss: 0.37805718183517456, mean loss: 0.362307520822617
Epoch: 14, step: 158, loss: 0.31835484504699707, mean loss: 0.3623053636360759
Epoch: 14, step: 159, loss: 0.34782668948173523, mean loss: 0.3623046530611763
Epoch: 14, step: 160, loss: 0.3422965407371521, mean loss: 0.36230367116431594
Epoch: 14, step: 161, loss: 0.3444784879684448, mean loss: 0.3623027964374931
Epoch: 14, step: 162, loss: 0.28982236981391907, mean loss: 0.3622992398141738
Epoch: 14, step: 163, loss: 0.3613908886909485, mean loss: 0.36229919524346116
Epoch: 14, step: 164, loss: 0.3668650984764099, mean loss: 0.3622994192709001
Epoch: 14, step: 165, loss: 0.34231990575790405, mean loss: 0.3622984390180538
Epoch: 14, step: 166, loss: 0.35076192021369934, mean loss: 0.3622978730307701
Epoch: 14, step: 167, loss: 0.3206249177455902, mean loss: 0.362295828635397
Epoch: 14, step: 168, loss: 0.33583149313926697, mean loss: 0.36229453040947124
Epoch: 14, step: 169, loss: 0.3300705552101135, mean loss: 0.3622929497180556
Epoch: 14, step: 170, loss: 0.3454952836036682, mean loss: 0.36229212577799014
Epoch: 14, step: 171, loss: 0.31716275215148926, mean loss: 0.36228991225171847
Epoch: 14, step: 172, loss: 0.3677074909210205, mean loss: 0.3622901779625758
Epoch: 14, step: 173, loss: 0.3227427005767822, mean loss: 0.3622882384099821
Epoch: 14, step: 174, loss: 0.3283783495426178, mean loss: 0.36228657542685877
Epoch: 14, step: 175, loss: 0.366869181394577, mean loss: 0.36228680015253395
Epoch: 14, step: 176, loss: 0.3593407869338989, mean loss: 0.36228665569055096
Epoch: 14, step: 177, loss: 0.36330562829971313, mean loss: 0.3622867056548841
Epoch: 14, step: 178, loss: 0.3511018455028534, mean loss: 0.362286157243011
Epoch: 14, step: 179, loss: 0.322419673204422, mean loss: 0.362284202620338
Epoch: 14, step: 180, loss: 0.3939208984375, mean loss: 0.3622857536668555
Epoch: 14, step: 181, loss: 0.31593188643455505, mean loss: 0.3622834811956705
Epoch: 14, step: 182, loss: 0.33430713415145874, mean loss: 0.36228210973888125
Epoch: 14, step: 183, loss: 0.3339571952819824, mean loss: 0.3622807212626824
Epoch: 14, step: 184, loss: 0.33277633786201477, mean loss: 0.3622792750402717
Epoch: 14, step: 185, loss: 0.3338855803012848, mean loss: 0.3622778833289326
Epoch: 14, step: 186, loss: 0.3120805621147156, mean loss: 0.36227542303773946
Epoch: 14, step: 187, loss: 0.37265998125076294, mean loss: 0.36227593198491714
Epoch: 14, step: 188, loss: 0.30870306491851807, mean loss: 0.3622733065074819
Epoch: 14, step: 189, loss: 0.3064621686935425, mean loss: 0.36227057147181524
Epoch: 14, step: 190, loss: 0.3411608040332794, mean loss: 0.3622695370342478
Epoch: 14, step: 191, loss: 0.3374755084514618, mean loss: 0.3622683221171279
Epoch: 14, step: 192, loss: 0.3198011815547943, mean loss: 0.3622662413125533
Epoch: 14, step: 193, loss: 0.34588733315467834, mean loss: 0.36226543881827805
Epoch: 14, step: 194, loss: 0.3452654182910919, mean loss: 0.36226460593304327
Epoch: 14, step: 195, loss: 0.33338022232055664, mean loss: 0.36226319086427916
Epoch: 14, step: 196, loss: 0.3462364077568054, mean loss: 0.36226240573798185
Epoch: 14, step: 197, loss: 0.3490269184112549, mean loss: 0.3622617573845319
Epoch: 14, step: 198, loss: 0.3261216878890991, mean loss: 0.36225998711416724
Epoch: 14, step: 199, loss: 0.3263149857521057, mean loss: 0.362258226485182
Epoch: 14, step: 200, loss: 0.3222224712371826, mean loss: 0.36225626558224583
Epoch: 14, step: 201, loss: 0.3880481421947479, mean loss: 0.3622575287753408
Epoch: 14, step: 202, loss: 0.34307894110679626, mean loss: 0.3622565895232879
Epoch: 14, step: 203, loss: 0.4533992111682892, mean loss: 0.36226105292297667
Epoch: 14, step: 204, loss: 0.3578890264034271, mean loss: 0.36226083882834276
Epoch: 14, step: 205, loss: 0.2936040163040161, mean loss: 0.3622574769234106
Epoch: 14, step: 206, loss: 0.36496973037719727, mean loss: 0.36225760972728144
Epoch: 14, step: 207, loss: 0.34960320591926575, mean loss: 0.3622569901422928
Epoch: 14, step: 208, loss: 0.3213132917881012, mean loss: 0.3622549855548581
Epoch: 14, step: 209, loss: 0.3338993787765503, mean loss: 0.3622535973434227
Epoch: 14, step: 210, loss: 0.32635927200317383, mean loss: 0.3622518401433767
Epoch: 14, step: 211, loss: 0.3530375063419342, mean loss: 0.36225138907945453
Epoch: 14, step: 212, loss: 0.35316377878189087, mean loss: 0.3622509442407303
Epoch: 14, step: 213, loss: 0.3475901782512665, mean loss: 0.3622502266310392
Epoch: 14, step: 214, loss: 0.3032873570919037, mean loss: 0.3622473406798112
Epoch: 14, step: 215, loss: 0.32866376638412476, mean loss: 0.3622456970044835
Epoch: 14, step: 216, loss: 0.34892332553863525, mean loss: 0.36224504500176896
Epoch: 14, step: 217, loss: 0.3040625751018524, mean loss: 0.3622421976654716
Epoch: 14, step: 218, loss: 0.3186953067779541, mean loss: 0.3622400666700771
Epoch: 14, step: 219, loss: 0.3083508610725403, mean loss: 0.36223742969583567
Epoch: 14, step: 220, loss: 0.32096898555755615, mean loss: 0.36223541039534446
Epoch: 14, step: 221, loss: 0.3161579668521881, mean loss: 0.36223315589668786
Epoch: 14, step: 222, loss: 0.360556036233902, mean loss: 0.3622330738418093
Epoch: 14, step: 223, loss: 0.34453263878822327, mean loss: 0.36223220787140553
Epoch: 14, step: 224, loss: 0.3263415992259979, mean loss: 0.3622304520566878
Epoch: 14, step: 225, loss: 0.2962963581085205, mean loss: 0.36222722663383544
Epoch: 14, step: 226, loss: 0.3022429049015045, mean loss: 0.3622242924107893
Epoch: 14, step: 227, loss: 0.3294393718242645, mean loss: 0.36222268876568137
Epoch: 14, step: 228, loss: 0.40474727749824524, mean loss: 0.36222476871621856
Epoch: 14, step: 229, loss: 0.31462258100509644, mean loss: 0.36222244052548636
Epoch: 14, step: 230, loss: 0.33463254570961, mean loss: 0.3622210911884288
Epoch: 14, step: 231, loss: 0.4192168116569519, mean loss: 0.3622238785378258
Epoch: 14, step: 232, loss: 0.3528764247894287, mean loss: 0.3622234214272703
Epoch: 14, step: 233, loss: 0.38992512226104736, mean loss: 0.36222477603366804
Epoch: 14, step: 234, loss: 0.3499642014503479, mean loss: 0.3622241765238845
Epoch: 14, step: 235, loss: 0.3112172782421112, mean loss: 0.36222168254293974
Epoch: 14, step: 236, loss: 0.32251137495040894, mean loss: 0.36221974100343
Epoch: 14, step: 237, loss: 0.3369494676589966, mean loss: 0.3622185055348985
Epoch: 14, step: 238, loss: 0.38606879115104675, mean loss: 0.3622196715229511
Epoch: 14, step: 239, loss: 0.32587558031082153, mean loss: 0.36221789482705685
Epoch: 14, step: 240, loss: 0.3516381084918976, mean loss: 0.36221737765511886
Epoch: 14, step: 241, loss: 0.38886594772338867, mean loss: 0.3622186802541055
Epoch: 14, step: 242, loss: 0.3376481235027313, mean loss: 0.3622174792884302
Epoch: 14, step: 243, loss: 0.334246426820755, mean loss: 0.36221611217931643
Epoch: 14, step: 244, loss: 0.33252206444740295, mean loss: 0.36221466092826654
Epoch: 14, step: 245, loss: 0.3471631407737732, mean loss: 0.3622139253442496
Epoch: 14, step: 246, loss: 0.3427755832672119, mean loss: 0.36221297541793984
Epoch: 14, step: 247, loss: 0.3536146283149719, mean loss: 0.36221255524851537
Epoch: 14, step: 248, loss: 0.3167118728160858, mean loss: 0.3622103319070821
Epoch: 14, step: 249, loss: 0.32299351692199707, mean loss: 0.36220841571364004
Epoch: 14, step: 250, loss: 0.3545195460319519, mean loss: 0.36220804004208673
Epoch: 14, step: 251, loss: 0.3094687759876251, mean loss: 0.362205463372942
Epoch: 14, step: 252, loss: 0.3130566477775574, mean loss: 0.36220306223875887
Epoch: 14, step: 253, loss: 0.3414682447910309, mean loss: 0.3622020493019026
Epoch: 14, step: 254, loss: 0.3580155074596405, mean loss: 0.3622018447910413
Epoch: 14, step: 255, loss: 0.3090214133262634, mean loss: 0.36219924707555357
Epoch: 14, step: 256, loss: 0.3034678101539612, mean loss: 0.3621963783490884
Epoch: 14, step: 257, loss: 0.30955538153648376, mean loss: 0.3621938072346597
Epoch: 14, step: 258, loss: 0.3717685043811798, mean loss: 0.362194274863336
Epoch: 14, step: 259, loss: 0.29705092310905457, mean loss: 0.36219109341423683
Epoch: 14, step: 260, loss: 0.31291770935058594, mean loss: 0.36218868713479824
Epoch: 14, step: 261, loss: 0.3537219762802124, mean loss: 0.3621882736808059
Epoch: 14, step: 262, loss: 0.33282119035720825, mean loss: 0.3621868396711705
Epoch: 14, step: 263, loss: 0.3488381803035736, mean loss: 0.3621861878811623
Epoch: 14, step: 264, loss: 0.30953988432884216, mean loss: 0.3621836173863841
Epoch: 14, step: 265, loss: 0.3120526671409607, mean loss: 0.3621811698250988
Epoch: 14, step: 266, loss: 0.3627196252346039, mean loss: 0.3621811961130161
Epoch: 14, step: 267, loss: 0.33972516655921936, mean loss: 0.3621800998413136
Epoch: 14, step: 268, loss: 0.3563303053379059, mean loss: 0.36217981427653434
Epoch: 14, step: 269, loss: 0.32133927941322327, mean loss: 0.3621778206938504
Epoch: 14, step: 270, loss: 0.35311636328697205, mean loss: 0.3621773783910532
Epoch: 14, step: 271, loss: 0.3543192744255066, mean loss: 0.3621769948443934
Epoch: 14, step: 272, loss: 0.3894091248512268, mean loss: 0.36217832395415994
Epoch: 14, step: 273, loss: 0.3355039358139038, mean loss: 0.3621770221294581
Epoch: 14, step: 274, loss: 0.3442102372646332, mean loss: 0.36217614531598563
Epoch: 14, step: 275, loss: 0.37363380193710327, mean loss: 0.3621767044442611
Epoch: 14, step: 276, loss: 0.3063744306564331, mean loss: 0.362173981452323
Epoch: 14, step: 277, loss: 0.36209216713905334, mean loss: 0.36217397746021246
Epoch: 14, step: 278, loss: 0.3239234387874603, mean loss: 0.3621721111250735
Epoch: 14, step: 279, loss: 0.33945897221565247, mean loss: 0.3621710029508488
Epoch: 14, step: 280, loss: 0.32039597630500793, mean loss: 0.36216896484641176
Epoch: 14, step: 281, loss: 0.303534597158432, mean loss: 0.3621661043542814
Epoch: 14, step: 282, loss: 0.38462650775909424, mean loss: 0.36216720003716374
Epoch: 14, step: 283, loss: 0.3506489396095276, mean loss: 0.3621666381708014
Epoch: 14, step: 284, loss: 0.33260130882263184, mean loss: 0.36216519602996206
Epoch: 14, step: 285, loss: 0.3167785704135895, mean loss: 0.3621629822642018
Epoch: 14, step: 286, loss: 0.30341458320617676, mean loss: 0.3621601169079584
Epoch: 14, step: 287, loss: 0.312366783618927, mean loss: 0.3621576884387188
Epoch: 14, step: 288, loss: 0.34359973669052124, mean loss: 0.3621567833935226
Epoch: 14, step: 289, loss: 0.3317033052444458, mean loss: 0.3621552982926668
Epoch: 14, step: 290, loss: 0.33709654211997986, mean loss: 0.36215407633157193
Epoch: 14, step: 291, loss: 0.34127694368362427, mean loss: 0.36215305833212547
Epoch: 14, step: 292, loss: 0.3586619794368744, mean loss: 0.36215288811032553
Epoch: 14, step: 293, loss: 0.34177327156066895, mean loss: 0.3621518944673928
Epoch: 14, step: 294, loss: 0.33842015266418457, mean loss: 0.3621507374422939
Epoch: 14, step: 295, loss: 0.3211383819580078, mean loss: 0.36214873800998676
Epoch: 14, step: 296, loss: 0.37312376499176025, mean loss: 0.36214927303787064
Epoch: 14, step: 297, loss: 0.31033119559288025, mean loss: 0.3621467470518394
Epoch: 14, step: 298, loss: 0.32396945357322693, mean loss: 0.36214488610650775
Epoch: 14, step: 299, loss: 0.3359232544898987, mean loss: 0.36214360800007295
Epoch: 14, step: 300, loss: 0.37482890486717224, mean loss: 0.36214422628232024
Epoch: 14, step: 301, loss: 0.3176754117012024, mean loss: 0.3621420589748545
Epoch: 14, step: 302, loss: 0.31168705224990845, mean loss: 0.3621396000340326
Epoch: 14, step: 303, loss: 0.33166539669036865, mean loss: 0.3621381149364038
Epoch: 14, step: 304, loss: 0.37554141879081726, mean loss: 0.3621387680870229
Epoch: 14, step: 305, loss: 0.3399280309677124, mean loss: 0.3621376857979127
Epoch: 14, step: 306, loss: 0.33825793862342834, mean loss: 0.36213652223765475
Epoch: 14, step: 307, loss: 0.327877014875412, mean loss: 0.3621348529964073
Epoch: 14, step: 308, loss: 0.3403026759624481, mean loss: 0.3621337893093411
Epoch: 14, step: 309, loss: 0.3460463881492615, mean loss: 0.36213300555209854
Epoch: 14, step: 310, loss: 0.3659075200557709, mean loss: 0.3621331894325732
Epoch: 14, step: 311, loss: 0.35489681363105774, mean loss: 0.3621328369201121
Epoch: 14, step: 312, loss: 0.3168984353542328, mean loss: 0.3621306334809984
Epoch: 14, step: 313, loss: 0.3420204222202301, mean loss: 0.3621296539285746
Epoch: 14, step: 314, loss: 0.3292280435562134, mean loss: 0.36212805139531407
Epoch: 14, step: 315, loss: 0.34765592217445374, mean loss: 0.36212734653805606
Epoch: 14, step: 316, loss: 0.33159753680229187, mean loss: 0.3621258596725354
Epoch: 14, step: 317, loss: 0.33333566784858704, mean loss: 0.3621244575983256
Epoch: 14, step: 318, loss: 0.34777653217315674, mean loss: 0.36212375889243686
Epoch: 14, step: 319, loss: 0.3333711624145508, mean loss: 0.36212235878547944
Epoch: 14, step: 320, loss: 0.3058130741119385, mean loss: 0.3621196169398022
Epoch: 14, step: 321, loss: 0.39050695300102234, mean loss: 0.36212099912580187
Epoch: 14, step: 322, loss: 0.3624386191368103, mean loss: 0.36212101459004115
Epoch: 14, step: 323, loss: 0.335134357213974, mean loss: 0.3621197007313568
Epoch: 14, step: 324, loss: 0.3317643404006958, mean loss: 0.3621182229376598
Epoch: 14, step: 325, loss: 0.4018080234527588, mean loss: 0.3621201550669809
Epoch: 14, step: 326, loss: 0.3229755759239197, mean loss: 0.3621182495722069
Epoch: 14, step: 327, loss: 0.3338547945022583, mean loss: 0.3621168738199157
Epoch: 14, step: 328, loss: 0.36840516328811646, mean loss: 0.36211717989387376
Epoch: 14, step: 329, loss: 0.37877362966537476, mean loss: 0.362117990584508
Epoch: 14, step: 330, loss: 0.33251771330833435, mean loss: 0.36211654997141235
Epoch: 14, step: 331, loss: 0.31042855978012085, mean loss: 0.362114034495931
Epoch: 14, step: 332, loss: 0.3344881236553192, mean loss: 0.36211269010394886
Epoch: 14, step: 333, loss: 0.3253662884235382, mean loss: 0.3621109019578817
Epoch: 14, step: 334, loss: 0.32854828238487244, mean loss: 0.36210926881985567
Epoch: 14, step: 335, loss: 0.3197118043899536, mean loss: 0.36210720588367284
Epoch: 14, step: 336, loss: 0.3580440878868103, mean loss: 0.36210700819389535
Epoch: 14, step: 337, loss: 0.35257798433303833, mean loss: 0.3621065445846776
Epoch: 14, step: 338, loss: 0.32567691802978516, mean loss: 0.36210477228467497
Epoch: 14, step: 339, loss: 0.36447852849960327, mean loss: 0.3621048877622102
Epoch: 14, step: 340, loss: 0.34473180770874023, mean loss: 0.3621040426447294
Epoch: 14, step: 341, loss: 0.30867183208465576, mean loss: 0.362101443548973
Epoch: 14, step: 342, loss: 0.34095966815948486, mean loss: 0.3621004152024878
Epoch: 14, step: 343, loss: 0.35681942105293274, mean loss: 0.3621001583447957
Epoch: 14, step: 344, loss: 0.3358575701713562, mean loss: 0.36209888201639856
Epoch: 14, step: 345, loss: 0.3324888050556183, mean loss: 0.36209744197763966
Epoch: 14, step: 346, loss: 0.3673185408115387, mean loss: 0.3620976958850867
Epoch: 14, step: 347, loss: 0.3487545847892761, mean loss: 0.36209704702732093
Epoch: 14, step: 348, loss: 0.39396217465400696, mean loss: 0.3620985965107941
Epoch: 14, step: 349, loss: 0.37708425521850586, mean loss: 0.3620993251726004
Epoch: 14, step: 350, loss: 0.33696693181991577, mean loss: 0.36209810319597024
Epoch: 14, step: 351, loss: 0.3260338604450226, mean loss: 0.3620963497808229
Epoch: 14, step: 352, loss: 0.3562990725040436, mean loss: 0.3620960679354596
Epoch: 14, step: 353, loss: 0.3748862147331238, mean loss: 0.36209668972188636
Epoch: 14, step: 354, loss: 0.3416704535484314, mean loss: 0.3620956967591634
Epoch: 14, step: 355, loss: 0.3377131223678589, mean loss: 0.3620945115280536
Epoch: 14, step: 356, loss: 0.4183856248855591, mean loss: 0.36209724769260704
Epoch: 14, step: 357, loss: 0.3095056116580963, mean loss: 0.36209469147427154
Epoch: 14, step: 358, loss: 0.3191031217575073, mean loss: 0.3620926019690605
Epoch: 14, step: 359, loss: 0.3340960144996643, mean loss: 0.3620912413262014
Epoch: 14, step: 360, loss: 0.35600408911705017, mean loss: 0.3620909455030878
Epoch: 14, step: 361, loss: 0.3613864779472351, mean loss: 0.362090911269073
Epoch: 14, step: 362, loss: 0.31955134868621826, mean loss: 0.36208884413449005
Epoch: 14, step: 363, loss: 0.34041839838027954, mean loss: 0.3620877911487877
Epoch: 14, step: 364, loss: 0.3227888345718384, mean loss: 0.3620858816712804
Epoch: 14, step: 365, loss: 0.3402671813964844, mean loss: 0.3620848215847837
Epoch: 14, step: 366, loss: 0.3232364356517792, mean loss: 0.362082934183242
Epoch: 14, step: 367, loss: 0.3259654939174652, mean loss: 0.3620811795466181
Epoch: 14, step: 368, loss: 0.31813332438468933, mean loss: 0.3620790446010188
Epoch: 14, step: 369, loss: 0.3247658610343933, mean loss: 0.36207723204959713
Epoch: 14, step: 370, loss: 0.40325748920440674, mean loss: 0.36207923235353434
Epoch: 14, step: 371, loss: 0.35532405972480774, mean loss: 0.36207890424139966
Epoch: 14, step: 372, loss: 0.3504765033721924, mean loss: 0.3620783407171455
Epoch: 14, step: 373, loss: 0.2928774952888489, mean loss: 0.3620749798213015
Epoch: 14, step: 374, loss: 0.3416425287723541, mean loss: 0.36207398752121656
Epoch: 14, step: 375, loss: 0.31668978929519653, mean loss: 0.36207178354888625
Epoch: 14, step: 376, loss: 0.32916271686553955, mean loss: 0.3620701854783437
Epoch: 14, step: 377, loss: 0.3493160307407379, mean loss: 0.3620695661642358
Epoch: 14, step: 378, loss: 0.3055119216442108, mean loss: 0.3620668199809622
Epoch: 14, step: 379, loss: 0.34991317987442017, mean loss: 0.3620662298838508
Epoch: 14, step: 380, loss: 0.2997610569000244, mean loss: 0.36206320492036176
Epoch: 14, step: 381, loss: 0.33506181836128235, mean loss: 0.36206189404617206
Epoch: 14, step: 382, loss: 0.37664714455604553, mean loss: 0.36206260210241314
Epoch: 14, step: 383, loss: 0.31707891821861267, mean loss: 0.3620604184284382
Epoch: 14, step: 384, loss: 0.33728283643722534, mean loss: 0.3620592156915812
Epoch: 14, step: 385, loss: 0.29674971103668213, mean loss: 0.36205604563505006
Epoch: 14, step: 386, loss: 0.36093875765800476, mean loss: 0.36205599140566713
Epoch: 14, step: 387, loss: 0.348609060049057, mean loss: 0.36205533876873464
Epoch: 14, step: 388, loss: 0.32174357771873474, mean loss: 0.36205338236198625
Epoch: 14, step: 389, loss: 0.3127475380897522, mean loss: 0.36205098957132953
Epoch: 14, step: 390, loss: 0.32916060090065, mean loss: 0.362049393492877
Epoch: 14, step: 391, loss: 0.3085924983024597, mean loss: 0.36204679950533863
Epoch: 14, step: 392, loss: 0.31850624084472656, mean loss: 0.36204468680900886
Epoch: 14, step: 393, loss: 0.3048907518386841, mean loss: 0.36204191369231936
Epoch: 14, step: 394, loss: 0.3287612497806549, mean loss: 0.3620402989883306
Epoch: 14, step: 395, loss: 0.36005401611328125, mean loss: 0.362040202622967
Epoch: 14, step: 396, loss: 0.30479133129119873, mean loss: 0.36203742530422
Epoch: 14, step: 397, loss: 0.33763590455055237, mean loss: 0.36203624156885794
Epoch: 14, step: 398, loss: 0.3423723578453064, mean loss: 0.362035287705956
Epoch: 14, step: 399, loss: 0.35358741879463196, mean loss: 0.36203487793350203
Epoch: 14, step: 400, loss: 0.30371665954589844, mean loss: 0.36203204928634736
Epoch: 14, step: 401, loss: 0.351697713136673, mean loss: 0.3620315480575109
Epoch: 14, step: 402, loss: 0.341071218252182, mean loss: 0.3620305315033713
Epoch: 14, step: 403, loss: 0.32269829511642456, mean loss: 0.3620286240234301
Epoch: 14, step: 404, loss: 0.30275434255599976, mean loss: 0.3620257495614027
Epoch: 14, step: 405, loss: 0.3506627082824707, mean loss: 0.36202519854592025
Epoch: 14, step: 406, loss: 0.3515702784061432, mean loss: 0.36202469159154216
Epoch: 14, step: 407, loss: 0.3713113069534302, mean loss: 0.36202514187351276
Epoch: 14, step: 408, loss: 0.31657344102859497, mean loss: 0.3620229381546839
Epoch: 14, step: 409, loss: 0.31097301840782166, mean loss: 0.36202046312706115
Epoch: 14, step: 410, loss: 0.3548658788204193, mean loss: 0.3620201162717595
Epoch: 14, step: 411, loss: 0.3987296521663666, mean loss: 0.36202189586919475
Epoch: 14, step: 412, loss: 0.3055761754512787, mean loss: 0.36201915963765574
Epoch: 14, step: 413, loss: 0.4264846444129944, mean loss: 0.3620222844793802
Epoch: 14, step: 414, loss: 0.3233069181442261, mean loss: 0.36202040791661855
Epoch: 14, step: 415, loss: 0.38857805728912354, mean loss: 0.3620216951233543
Epoch: 14, step: 416, loss: 0.31750020384788513, mean loss: 0.3620195373425529
Epoch: 14, step: 417, loss: 0.3361816108226776, mean loss: 0.36201828514101564
Epoch: 14, step: 418, loss: 0.3542982041835785, mean loss: 0.36201791101545433
Epoch: 14, step: 419, loss: 0.3499889373779297, mean loss: 0.3620173281033765
Epoch: 14, step: 420, loss: 0.35266199707984924, mean loss: 0.3620168747753238
Epoch: 14, step: 421, loss: 0.3370179235935211, mean loss: 0.3620156634684539
Epoch: 14, step: 422, loss: 0.3325316309928894, mean loss: 0.36201423490929524
Epoch: 14, step: 423, loss: 0.31624385714530945, mean loss: 0.36201201735223304
Epoch: 14, step: 424, loss: 0.3251171410083771, mean loss: 0.36201022989637605
Epoch: 14, step: 425, loss: 0.3097783625125885, mean loss: 0.36200769952783696
Epoch: 14, step: 426, loss: 0.37864452600479126, mean loss: 0.3620085054584903
Epoch: 14, step: 427, loss: 0.3329663872718811, mean loss: 0.36200709865175773
Epoch: 14, step: 428, loss: 0.33312010765075684, mean loss: 0.3620056994271997
Epoch: 14, step: 429, loss: 0.3547654449939728, mean loss: 0.36200534874162216
Epoch: 14, step: 430, loss: 0.30845460295677185, mean loss: 0.36200275510836866
Epoch: 14, step: 431, loss: 0.33212974667549133, mean loss: 0.36200130833345423
Epoch: 14, step: 432, loss: 0.3019962012767792, mean loss: 0.36199840237640757
Epoch: 14, step: 433, loss: 0.3758171796798706, mean loss: 0.3619990715665918
Epoch: 14, step: 434, loss: 0.33379819989204407, mean loss: 0.36199770597307696
Epoch: 14, step: 435, loss: 0.29209765791893005, mean loss: 0.3619943213106688
Epoch: 14, step: 436, loss: 0.36148548126220703, mean loss: 0.3619942966730835
Epoch: 14, step: 437, loss: 0.33484429121017456, mean loss: 0.3619929821574709
Epoch: 14, step: 438, loss: 0.3227618932723999, mean loss: 0.36199108280676234
Epoch: 14, step: 439, loss: 0.3312920331954956, mean loss: 0.3619895966018044
Epoch: 14, step: 440, loss: 0.3317515552043915, mean loss: 0.36198813278608105
Epoch: 14, step: 441, loss: 0.3243435323238373, mean loss: 0.36198631050897473
Epoch: 14, step: 442, loss: 0.2988983988761902, mean loss: 0.36198325673523774
Epoch: 14, step: 443, loss: 0.32275834679603577, mean loss: 0.36198135814327553
Epoch: 14, step: 444, loss: 0.37067997455596924, mean loss: 0.36198177915950963
Epoch: 14, step: 445, loss: 0.3806961178779602, mean loss: 0.36198268489654956
Epoch: 14, step: 446, loss: 0.3631768822669983, mean loss: 0.3619827426905471
Epoch: 14, step: 447, loss: 0.3835011422634125, mean loss: 0.361983784037797
Epoch: 14, step: 448, loss: 0.3439955413341522, mean loss: 0.3619829135687574
Epoch: 14, step: 449, loss: 0.31555068492889404, mean loss: 0.36198066677553953
Epoch: 14, step: 450, loss: 0.35808175802230835, mean loss: 0.3619804781217072
Epoch: 14, step: 451, loss: 0.34944140911102295, mean loss: 0.3619798714317028
Epoch: 14, step: 452, loss: 0.3500378727912903, mean loss: 0.3619792936582914
Epoch: 14, step: 453, loss: 0.3774939477443695, mean loss: 0.3619800442462975
Epoch: 14, step: 454, loss: 0.35086360573768616, mean loss: 0.36197950646687177
Epoch: 14, step: 455, loss: 0.3418540954589844, mean loss: 0.3619785329079027
Epoch: 14, step: 456, loss: 0.34847491979599, mean loss: 0.3619778797074426
Epoch: 14, step: 457, loss: 0.3429994285106659, mean loss: 0.36197696172102506
Epoch: 14, step: 458, loss: 0.2990105152130127, mean loss: 0.3619739161855229
Epoch: 14, step: 459, loss: 0.30189764499664307, mean loss: 0.36197101058138337
Epoch: 14, step: 460, loss: 0.2928362488746643, mean loss: 0.3619676670227575
Epoch: 14, step: 461, loss: 0.2962813675403595, mean loss: 0.36196449039544915
Epoch: 14, step: 462, loss: 0.3637023866176605, mean loss: 0.361964574437048
Epoch: 14, step: 463, loss: 0.31347426772117615, mean loss: 0.36196222964465363
Epoch: 14, step: 464, loss: 0.34014707803726196, mean loss: 0.36196117480438444
Epoch: 14, step: 465, loss: 0.3056320250034332, mean loss: 0.3619584512210849
Epoch: 14, step: 466, loss: 0.33403539657592773, mean loss: 0.3619571011725114
Epoch: 14, step: 467, loss: 0.3045353293418884, mean loss: 0.3619543250280601
Epoch: 14, step: 468, loss: 0.33868885040283203, mean loss: 0.36195320027705086
Epoch: 14, step: 469, loss: 0.3327155113220215, mean loss: 0.3619517868723832
Epoch: 14, step: 470, loss: 0.3175904452800751, mean loss: 0.36194964246567407
Epoch: 14, step: 471, loss: 0.3159357011318207, mean loss: 0.3619474182805748
Epoch: 14, step: 472, loss: 0.35199159383773804, mean loss: 0.361946937067155
Epoch: 14, step: 473, loss: 0.32538869976997375, mean loss: 0.36194517011513483
Epoch: 14, step: 474, loss: 0.3897392451763153, mean loss: 0.3619465134081154
Epoch: 14, step: 475, loss: 0.3095380663871765, mean loss: 0.36194398062022537
Epoch: 14, step: 476, loss: 0.3310191333293915, mean loss: 0.36194248616087726
Epoch: 14, step: 477, loss: 0.318601131439209, mean loss: 0.36194039176855475
Epoch: 14, step: 478, loss: 0.3256390690803528, mean loss: 0.3619386376577701
Epoch: 14, step: 479, loss: 0.3602871596813202, mean loss: 0.36193855786080564
Epoch: 14, step: 480, loss: 0.36948445439338684, mean loss: 0.361938922449709
Epoch: 14, step: 481, loss: 0.3397430181503296, mean loss: 0.36193785008019025
Epoch: 14, step: 482, loss: 0.3165297210216522, mean loss: 0.3619356563447896
Epoch: 14, step: 483, loss: 0.3545774817466736, mean loss: 0.3619353008774177
Epoch: 14, step: 484, loss: 0.433989942073822, mean loss: 0.3619387816098073
Epoch: 14, step: 485, loss: 0.3205357789993286, mean loss: 0.3619367816579857
Epoch: 14, step: 486, loss: 0.29496219754219055, mean loss: 0.3619335466396736
Epoch: 14, step: 487, loss: 0.33464133739471436, mean loss: 0.3619322284301853
Epoch: 14, step: 488, loss: 0.3266341984272003, mean loss: 0.3619305236231337
Epoch: 14, step: 489, loss: 0.3183078467845917, mean loss: 0.36192841685809757
Epoch: 14, step: 490, loss: 0.3257330656051636, mean loss: 0.3619266688815074
Epoch: 14, step: 491, loss: 0.29113054275512695, mean loss: 0.36192325010006415
Epoch: 14, step: 492, loss: 0.35583946108818054, mean loss: 0.36192295632494165
Epoch: 14, step: 493, loss: 0.3434152901172638, mean loss: 0.36192206266650573
Epoch: 14, step: 494, loss: 0.32526856660842896, mean loss: 0.36192029290666516
Epoch: 14, step: 495, loss: 0.33191946148872375, mean loss: 0.3619188444308339
Epoch: 14, step: 496, loss: 0.29485923051834106, mean loss: 0.36191560686921015
Epoch: 14, step: 497, loss: 0.36371108889579773, mean loss: 0.3619156935488484
Epoch: 14, step: 498, loss: 0.3332335650920868, mean loss: 0.36191430894211624
Epoch: 14, step: 499, loss: 0.31296995282173157, mean loss: 0.36191194630665957
Epoch: 14, step: 500, loss: 0.34111320972442627, mean loss: 0.3619109423612726
Epoch: 14, step: 501, loss: 0.31486764550209045, mean loss: 0.3619086717127129
Epoch: 14, step: 502, loss: 0.3184944987297058, mean loss: 0.3619065763329657
Epoch: 14, step: 503, loss: 0.30243369936943054, mean loss: 0.3619037060203709
Epoch: 14, step: 504, loss: 0.38732844591140747, mean loss: 0.36190493302388865
Epoch: 14, step: 505, loss: 0.3585103452205658, mean loss: 0.36190476920824327
Epoch: 14, step: 506, loss: 0.35848867893218994, mean loss: 0.361904604362889
Epoch: 14, step: 507, loss: 0.318482369184494, mean loss: 0.36190250909965904
Epoch: 14, step: 508, loss: 0.3527258634567261, mean loss: 0.3619020663182046
Epoch: 14, step: 509, loss: 0.3011987805366516, mean loss: 0.3618991374710666
Epoch: 14, step: 510, loss: 0.35423827171325684, mean loss: 0.3618987678630308
Epoch: 14, step: 511, loss: 0.3335671126842499, mean loss: 0.36189740103288903
Epoch: 14, step: 512, loss: 0.2835977375507355, mean loss: 0.36189362373232065
Epoch: 14, step: 513, loss: 0.3317144811153412, mean loss: 0.36189216791260925
Epoch: 14, step: 514, loss: 0.36090579628944397, mean loss: 0.3618921203330606
Epoch: 14, step: 515, loss: 0.33370742201805115, mean loss: 0.3618907608550404
Epoch: 14, step: 516, loss: 0.2988240718841553, mean loss: 0.3618877190044172
Epoch: 14, step: 517, loss: 0.37618589401245117, mean loss: 0.36188840860483235
Epoch: 14, step: 518, loss: 0.28922492265701294, mean loss: 0.3618849042167953
Epoch: 14, step: 519, loss: 0.35165902972221375, mean loss: 0.3618844110708417
Epoch: 14, step: 520, loss: 0.3163161277770996, mean loss: 0.36188221363228773
Epoch: 14, step: 521, loss: 0.32829394936561584, mean loss: 0.3618805939840928
Epoch: 14, step: 522, loss: 0.3522810935974121, mean loss: 0.36188013111219025
Epoch: 14, step: 523, loss: 0.30877992510795593, mean loss: 0.3618775708322479
Epoch: 14, step: 524, loss: 0.35325223207473755, mean loss: 0.3618771549728989
Epoch: 14, step: 525, loss: 0.37764421105384827, mean loss: 0.3618779151240936
Epoch: 14, step: 526, loss: 0.3142003118991852, mean loss: 0.3618756166328809
Epoch: 14, step: 527, loss: 0.30812734365463257, mean loss: 0.36187302560545237
Epoch: 14, step: 528, loss: 0.3609102964401245, mean loss: 0.3618729791976835
Epoch: 14, step: 529, loss: 0.35058435797691345, mean loss: 0.3618724350628517
Epoch: 14, step: 530, loss: 0.35862138867378235, mean loss: 0.36187227836326197
Epoch: 14, step: 531, loss: 0.32186588644981384, mean loss: 0.36187035015852353
Epoch: 14, step: 532, loss: 0.3073783218860626, mean loss: 0.3618677239101129
Epoch: 14, step: 533, loss: 0.31821587681770325, mean loss: 0.3618656202066386
Epoch: 14, step: 534, loss: 0.4252908527851105, mean loss: 0.36186867669705247
Epoch: 14, step: 535, loss: 0.3065773844718933, mean loss: 0.36186601231327137
Epoch: 14, step: 536, loss: 0.33410799503326416, mean loss: 0.36186467477087847
Epoch: 14, step: 537, loss: 0.32211190462112427, mean loss: 0.3618627593439656
Epoch: 14, step: 538, loss: 0.318636417388916, mean loss: 0.36186067664861726
Epoch: 14, step: 539, loss: 0.3566652834415436, mean loss: 0.36186042634059995
Epoch: 14, step: 540, loss: 0.3582008183002472, mean loss: 0.36186025003342454
Epoch: 14, step: 541, loss: 0.2973230481147766, mean loss: 0.36185714100548744
Epoch: 14, step: 542, loss: 0.3453182876110077, mean loss: 0.3618563442978717
Epoch: 14, step: 543, loss: 0.3027660548686981, mean loss: 0.36185349794481636
Epoch: 14, step: 544, loss: 0.34617966413497925, mean loss: 0.3618527429795541
Epoch: 14, step: 545, loss: 0.3808230757713318, mean loss: 0.36185365668405234
Epoch: 14, step: 546, loss: 0.3240780830383301, mean loss: 0.36185183731432513
Epoch: 14, step: 547, loss: 0.3821488320827484, mean loss: 0.3618528148232236
Epoch: 14, step: 548, loss: 0.3561581075191498, mean loss: 0.36185254057774785
Epoch: 14, step: 549, loss: 0.32554367184638977, mean loss: 0.3618507921009718
Epoch: 14, step: 550, loss: 0.3248768150806427, mean loss: 0.36184901168121836
Epoch: 14, step: 551, loss: 0.3402719795703888, mean loss: 0.36184797272551195
Epoch: 14, step: 552, loss: 0.3247423768043518, mean loss: 0.36184618613993147
Epoch: 14, step: 553, loss: 0.31026121973991394, mean loss: 0.36184370251131326
Epoch: 14, step: 554, loss: 0.35461655259132385, mean loss: 0.3618433545670679
Epoch: 14, step: 555, loss: 0.39238807559013367, mean loss: 0.36184482504275745
Epoch: 14, step: 556, loss: 0.3133889138698578, mean loss: 0.3618424924036984
Epoch: 14, step: 557, loss: 0.3472016453742981, mean loss: 0.3618417876358622
Epoch: 14, step: 558, loss: 0.3552815020084381, mean loss: 0.361841471857974
Epoch: 14, step: 559, loss: 0.3214826285839081, mean loss: 0.36183952928754304
Epoch: 14, step: 560, loss: 0.32524970173835754, mean loss: 0.3618377682138775
Epoch: 14, step: 561, loss: 0.3520664572715759, mean loss: 0.3618372979419099
Epoch: 14, step: 562, loss: 0.30257171392440796, mean loss: 0.36183444575537455
Epoch: 14, step: 563, loss: 0.2939135432243347, mean loss: 0.36183117718451163
Epoch: 14, step: 564, loss: 0.29515573382377625, mean loss: 0.36182796870352607
Epoch: 14, step: 565, loss: 0.35311248898506165, mean loss: 0.3618275493271562
Epoch: 14, step: 566, loss: 0.3775700628757477, mean loss: 0.36182830679785577
Epoch: 14, step: 567, loss: 0.3420499265193939, mean loss: 0.36182735518217646
Epoch: 14, step: 568, loss: 0.3593910038471222, mean loss: 0.36182723796536936
Epoch: 14, step: 569, loss: 0.3022761344909668, mean loss: 0.3618243730032086
Epoch: 14, step: 570, loss: 0.33774349093437195, mean loss: 0.361823214544457
Epoch: 14, step: 571, loss: 0.32977238297462463, mean loss: 0.36182167274959603
Epoch: 14, step: 572, loss: 0.3631014823913574, mean loss: 0.3618217343114625
Epoch: 14, step: 573, loss: 0.36672332882881165, mean loss: 0.3618219700783945
Epoch: 14, step: 574, loss: 0.3755505084991455, mean loss: 0.36182263038999185
Epoch: 14, step: 575, loss: 0.35670584440231323, mean loss: 0.361822384296014
Epoch: 14, step: 576, loss: 0.33461320400238037, mean loss: 0.36182107572196054
Epoch: 14, step: 577, loss: 0.31543809175491333, mean loss: 0.3618188451273675
Epoch: 14, step: 578, loss: 0.33780092000961304, mean loss: 0.3618176901417884
Epoch: 14, step: 579, loss: 0.35987526178359985, mean loss: 0.3618175967378473
Epoch: 14, step: 580, loss: 0.2998679280281067, mean loss: 0.3618146179587585
Epoch: 14, step: 581, loss: 0.33093637228012085, mean loss: 0.3618131332849592
Epoch: 14, step: 582, loss: 0.30117928981781006, mean loss: 0.3618102180561757
Epoch: 14, step: 583, loss: 0.36772456765174866, mean loss: 0.36181050239990625
Epoch: 14, step: 584, loss: 0.3428933620452881, mean loss: 0.3618095929657274
Epoch: 14, step: 585, loss: 0.31943878531455994, mean loss: 0.3618075561035194
Epoch: 14, step: 586, loss: 0.33068037033081055, mean loss: 0.3618060598200135
Epoch: 14, step: 587, loss: 0.29974740743637085, mean loss: 0.36180307680461343
Epoch: 14, step: 588, loss: 0.3674715757369995, mean loss: 0.36180334926310576
Epoch: 14, step: 589, loss: 0.3419783413410187, mean loss: 0.3618023964125856
Epoch: 14, step: 590, loss: 0.33911898732185364, mean loss: 0.3618013062309597
Epoch: 14, step: 591, loss: 0.38561564683914185, mean loss: 0.3618024507109966
Epoch: 14, step: 592, loss: 0.2925507724285126, mean loss: 0.36179912274337284
Epoch: 14, step: 593, loss: 0.3474915623664856, mean loss: 0.36179843521043786
Epoch: 14, step: 594, loss: 0.3818354904651642, mean loss: 0.36179939802122324
Epoch: 14, step: 595, loss: 0.32131561636924744, mean loss: 0.3617974528078054
Epoch: 14, step: 596, loss: 0.31030192971229553, mean loss: 0.3617949786078777
Epoch: 14, step: 597, loss: 0.35808125138282776, mean loss: 0.36179480018339294
Epoch: 14, step: 598, loss: 0.3169897198677063, mean loss: 0.3617926476453043
Epoch: 14, step: 599, loss: 0.29774942994117737, mean loss: 0.3617895710110948
Epoch: 14, step: 600, loss: 0.3881480395793915, mean loss: 0.36179083721028626
Epoch: 14, step: 601, loss: 0.3490700125694275, mean loss: 0.36179022616097123
Epoch: 14, step: 602, loss: 0.3453739881515503, mean loss: 0.3617894376390437
Epoch: 14, step: 603, loss: 0.33143728971481323, mean loss: 0.3617879798029282
Epoch: 14, step: 604, loss: 0.32444441318511963, mean loss: 0.3617861862499472
Epoch: 14, step: 605, loss: 0.3891774117946625, mean loss: 0.36178750174440233
Epoch: 14, step: 606, loss: 0.3543258309364319, mean loss: 0.36178714340646795
Epoch: 14, step: 607, loss: 0.3959342837333679, mean loss: 0.36178878320383284
Epoch: 14, step: 608, loss: 0.3256376087665558, mean loss: 0.36178704725307953
Epoch: 14, step: 609, loss: 0.3521115779876709, mean loss: 0.3617865826670205
Epoch: 14, step: 610, loss: 0.36051318049430847, mean loss: 0.3617865215251291
Epoch: 14, step: 611, loss: 0.34547388553619385, mean loss: 0.3617857383181006
Epoch: 14, step: 612, loss: 0.3413905203342438, mean loss: 0.3617847591439692
Epoch: 14, step: 613, loss: 0.3152277171611786, mean loss: 0.3617825240483387
Epoch: 14, step: 614, loss: 0.31945937871932983, mean loss: 0.3617804923098082
Epoch: 14, step: 615, loss: 0.3360404968261719, mean loss: 0.36177925671094663
Epoch: 14, step: 616, loss: 0.3628760874271393, mean loss: 0.3617793093596634
Epoch: 14, step: 617, loss: 0.33179810643196106, mean loss: 0.36177787030797254
Epoch: 14, step: 618, loss: 0.3194756805896759, mean loss: 0.3617758399652935
Epoch: 14, step: 619, loss: 0.34575703740119934, mean loss: 0.36177507116117735
Epoch: 14, step: 620, loss: 0.3101794123649597, mean loss: 0.3617725950053586
Epoch: 14, step: 621, loss: 0.33458411693573, mean loss: 0.3617712902506763
Epoch: 14, step: 622, loss: 0.34852421283721924, mean loss: 0.36177065456386726
Epoch: 14, step: 623, loss: 0.3362138867378235, mean loss: 0.361769428231438
Epoch: 14, step: 624, loss: 0.31354695558547974, mean loss: 0.36176711440423936
Epoch: 14, step: 625, loss: 0.3376248776912689, mean loss: 0.36176595605874884
Epoch: 14, step: 626, loss: 0.35116690397262573, mean loss: 0.3617654475402013
Epoch: 14, step: 627, loss: 0.33730652928352356, mean loss: 0.3617642741129197
Epoch: 14, step: 628, loss: 0.3461362421512604, mean loss: 0.36176352438723197
Epoch: 14, step: 629, loss: 0.3060532510280609, mean loss: 0.36176085191897145
Epoch: 14, step: 630, loss: 0.28599995374679565, mean loss: 0.3617572177798544
Epoch: 14, step: 631, loss: 0.3331523835659027, mean loss: 0.3617558457137467
Epoch: 14, step: 632, loss: 0.3572540581226349, mean loss: 0.3617556297903167
Epoch: 14, step: 633, loss: 0.3101827800273895, mean loss: 0.3617531562723425
Epoch: 14, step: 634, loss: 0.32269200682640076, mean loss: 0.36175128292576697
Epoch: 14, step: 635, loss: 0.3128136396408081, mean loss: 0.3617489360217153
Epoch: 14, step: 636, loss: 0.3285631537437439, mean loss: 0.36174734460646196
Epoch: 14, step: 637, loss: 0.33702850341796875, mean loss: 0.3617461592779308
Epoch: 14, step: 638, loss: 0.3218058943748474, mean loss: 0.36174424413696205
Epoch: 14, step: 639, loss: 0.27874991297721863, mean loss: 0.36174026473865173
Epoch: 14, step: 640, loss: 0.31750577688217163, mean loss: 0.36173814389251585
Epoch: 14, step: 641, loss: 0.34514120221138, mean loss: 0.36173734818143705
Epoch: 14, step: 642, loss: 0.3336373567581177, mean loss: 0.3617360010415251
Epoch: 14, step: 643, loss: 0.345720112323761, mean loss: 0.36173523326162493
Epoch: 14, step: 644, loss: 0.3229312598705292, mean loss: 0.3617333731411422
Epoch: 14, step: 645, loss: 0.340356707572937, mean loss: 0.36173234847114083
Epoch: 14, step: 646, loss: 0.34353137016296387, mean loss: 0.36173147606648626
Epoch: 14, step: 647, loss: 0.3667118549346924, mean loss: 0.3617317147732955
Epoch: 14, step: 648, loss: 0.33973056077957153, mean loss: 0.3617306603206718
Epoch: 14, step: 649, loss: 0.34023424983024597, mean loss: 0.3617296301083412
Epoch: 14, step: 650, loss: 0.3246190547943115, mean loss: 0.3617278516746749
Epoch: 14, step: 651, loss: 0.34405282139778137, mean loss: 0.3617270046826164
Epoch: 14, step: 652, loss: 0.32355016469955444, mean loss: 0.3617251753261555
Epoch: 14, step: 653, loss: 0.38137927651405334, mean loss: 0.3617261170655512
Epoch: 14, step: 654, loss: 0.35169747471809387, mean loss: 0.3617256365594735
Epoch: 14, step: 655, loss: 0.33844301104545593, mean loss: 0.36172452106380876
Epoch: 14, step: 656, loss: 0.30516135692596436, mean loss: 0.36172181119152697
Epoch: 14, step: 657, loss: 0.3107198476791382, mean loss: 0.36171936786664854
Epoch: 14, step: 658, loss: 0.32717108726501465, mean loss: 0.3617177128591946
Epoch: 14, step: 659, loss: 0.3594519793987274, mean loss: 0.36171760432626393
Epoch: 14, step: 660, loss: 0.32903677225112915, mean loss: 0.36171603892740034
Epoch: 14, step: 661, loss: 0.3736319839954376, mean loss: 0.3617166096690934
Epoch: 14, step: 662, loss: 0.31579652428627014, mean loss: 0.3617144103259552
Epoch: 14, step: 663, loss: 0.33498138189315796, mean loss: 0.3617131300085015
Epoch: 14, step: 664, loss: 0.338418573141098, mean loss: 0.3617120144222333
Epoch: 14, step: 665, loss: 0.33809950947761536, mean loss: 0.36171088366344845
Epoch: 14, step: 666, loss: 0.33415648341178894, mean loss: 0.3617095641978424
Epoch: 14, step: 667, loss: 0.32170000672340393, mean loss: 0.3617076483983081
Epoch: 14, step: 668, loss: 0.36953598260879517, mean loss: 0.36170802322877066
Epoch: 14, step: 669, loss: 0.3030397891998291, mean loss: 0.36170521425462393
Epoch: 14, step: 670, loss: 0.3579413890838623, mean loss: 0.36170503405520943
Epoch: 14, step: 671, loss: 0.34226125478744507, mean loss: 0.36170410319637814
Epoch: 14, step: 672, loss: 0.32418376207351685, mean loss: 0.36170230701938916
Epoch: 14, step: 673, loss: 0.3555185794830322, mean loss: 0.3617020110056248
Epoch: 14, step: 674, loss: 0.3471500277519226, mean loss: 0.3617013144385264
Epoch: 14, step: 675, loss: 0.32195305824279785, mean loss: 0.3616994118798343
Epoch: 14, step: 676, loss: 0.3592086434364319, mean loss: 0.36169929266438205
Epoch: 14, step: 677, loss: 0.30606627464294434, mean loss: 0.3616966300330993
Epoch: 14, step: 678, loss: 0.32047152519226074, mean loss: 0.36169465706804355
Epoch: 14, step: 679, loss: 0.3251541256904602, mean loss: 0.3616929083825833
Epoch: 14, step: 680, loss: 0.32235944271087646, mean loss: 0.3616910261283998
Epoch: 14, step: 681, loss: 0.3173482120037079, mean loss: 0.3616889042596026
Epoch: 14, step: 682, loss: 0.345110684633255, mean loss: 0.36168811100539777
Epoch: 14, step: 683, loss: 0.33996328711509705, mean loss: 0.36168707154013985
Epoch: 14, step: 684, loss: 0.33560675382614136, mean loss: 0.3616858237377517
Epoch: 14, step: 685, loss: 0.36756280064582825, mean loss: 0.361686104905913
Epoch: 14, step: 686, loss: 0.3265537619590759, mean loss: 0.3616844241738197
Epoch: 14, step: 687, loss: 0.32225245237350464, mean loss: 0.36168253783762566
Epoch: 14, step: 688, loss: 0.36214005947113037, mean loss: 0.3616825597233771
Epoch: 14, step: 689, loss: 0.31336450576782227, mean loss: 0.36168024851827063
Epoch: 14, step: 690, loss: 0.30842164158821106, mean loss: 0.36167770111276387
Epoch: 14, step: 691, loss: 0.32311272621154785, mean loss: 0.36167585660468554
Epoch: 14, step: 692, loss: 0.3615226149559021, mean loss: 0.36167584927570523
Epoch: 14, step: 693, loss: 0.31731075048446655, mean loss: 0.36167372755888116
Epoch: 14, step: 694, loss: 0.379634827375412, mean loss: 0.36167458648957873
Epoch: 14, step: 695, loss: 0.36075305938720703, mean loss: 0.36167454242267444
Epoch: 14, step: 696, loss: 0.33691248297691345, mean loss: 0.3616733583716322
Epoch: 14, step: 697, loss: 0.3398537039756775, mean loss: 0.3616723150678933
Epoch: 14, step: 698, loss: 0.3111647665500641, mean loss: 0.36166990017195655
Epoch: 14, step: 699, loss: 0.36532407999038696, mean loss: 0.3616700748793489
Epoch: 14, step: 700, loss: 0.3325750231742859, mean loss: 0.3616686839030279
Epoch: 14, step: 701, loss: 0.3247447907924652, mean loss: 0.36166691872982254
Epoch: 14, step: 702, loss: 0.3101175129413605, mean loss: 0.36166445449129353
Epoch: 14, step: 703, loss: 0.3311121463775635, mean loss: 0.36166299405591523
Epoch: 14, step: 704, loss: 0.31178662180900574, mean loss: 0.36166061002206185
Epoch: 14, step: 705, loss: 0.32243821024894714, mean loss: 0.36165873532558096
Epoch: 14, step: 706, loss: 0.33675509691238403, mean loss: 0.3616575450737809
Epoch: 14, step: 707, loss: 0.34061530232429504, mean loss: 0.3616565394227223
Epoch: 14, step: 708, loss: 0.3315926790237427, mean loss: 0.3616551026790951
Epoch: 14, step: 709, loss: 0.31133219599723816, mean loss: 0.36165269787613796
Epoch: 14, step: 710, loss: 0.34907981753349304, mean loss: 0.36165209707906515
Epoch: 14, step: 711, loss: 0.3396032154560089, mean loss: 0.3616510435201191
Epoch: 14, step: 712, loss: 0.36211225390434265, mean loss: 0.3616510655570241
Epoch: 14, step: 713, loss: 0.31841790676116943, mean loss: 0.3616489999498193
Epoch: 14, step: 714, loss: 0.32662421464920044, mean loss: 0.3616473266047665
Epoch: 14, step: 715, loss: 0.34941303730010986, mean loss: 0.36164674212696674
Epoch: 14, step: 716, loss: 0.33725059032440186, mean loss: 0.3616455766871443
Epoch: 14, step: 717, loss: 0.3767838776111603, mean loss: 0.3616462998313558
Epoch: 14, step: 718, loss: 0.3122233748435974, mean loss: 0.3616439390515618
Epoch: 14, step: 719, loss: 0.3152666985988617, mean loss: 0.3616417238604817
Epoch: 14, step: 720, loss: 0.3087964355945587, mean loss: 0.3616391998461403
Epoch: 14, step: 721, loss: 0.3970720171928406, mean loss: 0.3616408921193921
Epoch: 14, step: 722, loss: 0.32156994938850403, mean loss: 0.3616389784204222
Epoch: 14, step: 723, loss: 0.3572346568107605, mean loss: 0.3616387680898773
Epoch: 14, step: 724, loss: 0.3128473460674286, mean loss: 0.3616364381427868
Epoch: 14, step: 725, loss: 0.3670295774936676, mean loss: 0.36163669567021256
Epoch: 14, step: 726, loss: 0.40557339787483215, mean loss: 0.3616387935884766
Epoch: 14, step: 727, loss: 0.31176695227622986, mean loss: 0.3616364123890251
Epoch: 14, step: 728, loss: 0.32319188117980957, mean loss: 0.3616345768898029
Epoch: 14, step: 729, loss: 0.3511037528514862, mean loss: 0.3616340741291785
Epoch: 14, step: 730, loss: 0.3271031081676483, mean loss: 0.3616324256369857
Epoch: 14, step: 731, loss: 0.3329685628414154, mean loss: 0.3616310573028824
Epoch: 14, step: 732, loss: 0.33768051862716675, mean loss: 0.3616299140245075
Epoch: 14, step: 733, loss: 0.3872344493865967, mean loss: 0.36163113619803317
Epoch: 14, step: 734, loss: 0.3256371319293976, mean loss: 0.36162941818914246
Epoch: 14, step: 735, loss: 0.31811895966529846, mean loss: 0.3616273415158643
Epoch: 14, step: 736, loss: 0.3524966239929199, mean loss: 0.3616269057444939
Epoch: 14, step: 737, loss: 0.29879826307296753, mean loss: 0.3616239073364252
Epoch: 14, step: 738, loss: 0.3518734872341156, mean loss: 0.3616234420336286
Epoch: 14, step: 739, loss: 0.32233697175979614, mean loss: 0.3616215673213613
Epoch: 14, step: 740, loss: 0.3372959494590759, mean loss: 0.3616204065818536
Epoch: 14, step: 741, loss: 0.3229619264602661, mean loss: 0.36161856201270953
Epoch: 14, step: 742, loss: 0.32617929577827454, mean loss: 0.36161687112735075
Epoch: 14, step: 743, loss: 0.28748220205307007, mean loss: 0.36161333416794833
Epoch: 14, step: 744, loss: 0.3118177056312561, mean loss: 0.3616109585356533
Epoch: 14, step: 745, loss: 0.29715877771377563, mean loss: 0.36160788382041514
Epoch: 14, step: 746, loss: 0.323474258184433, mean loss: 0.3616060647284132
Epoch: 14, step: 747, loss: 0.31009557843208313, mean loss: 0.3616036076359549
Epoch: 14, step: 748, loss: 0.35103341937065125, mean loss: 0.3616031034533522
Epoch: 14, step: 749, loss: 0.3296626806259155, mean loss: 0.3616015800143163
Epoch: 14, step: 750, loss: 0.3549075424671173, mean loss: 0.3616012607489208
Epoch: 14, step: 751, loss: 0.2963064908981323, mean loss: 0.36159814672899276
Epoch: 14, step: 752, loss: 0.33087921142578125, mean loss: 0.36159668175997645
Epoch: 14, step: 753, loss: 0.3248805105686188, mean loss: 0.36159493086960015
Epoch: 14, step: 754, loss: 0.40809381008148193, mean loss: 0.36159714816392147
Epoch: 14, step: 755, loss: 0.33206629753112793, mean loss: 0.361595740055461
Epoch: 14, step: 756, loss: 0.3537824749946594, mean loss: 0.36159536751624105
Epoch: 14, step: 757, loss: 0.3230865001678467, mean loss: 0.3615935314874746
Epoch: 14, step: 758, loss: 0.33633407950401306, mean loss: 0.3615923272227793
Epoch: 14, step: 759, loss: 0.36269140243530273, mean loss: 0.36159237961957624
Epoch: 14, step: 760, loss: 0.3052102327346802, mean loss: 0.36158969181164924
Epoch: 14, step: 761, loss: 0.3307887017726898, mean loss: 0.36158822355966913
Epoch: 14, step: 762, loss: 0.3103325068950653, mean loss: 0.36158578036806494
Epoch: 14, step: 763, loss: 0.43950390815734863, mean loss: 0.3615894942921731
Epoch: 14, step: 764, loss: 0.3386301100254059, mean loss: 0.3615883999980848
Epoch: 14, step: 765, loss: 0.350966215133667, mean loss: 0.3615878937458274
Epoch: 14, step: 766, loss: 0.3497011661529541, mean loss: 0.36158732725259035
Epoch: 14, step: 767, loss: 0.3218109607696533, mean loss: 0.3615854316956668
Epoch: 14, step: 768, loss: 0.3442050814628601, mean loss: 0.36158460346835053
Epoch: 14, step: 769, loss: 0.36491256952285767, mean loss: 0.36158476204864476
Epoch: 14, step: 770, loss: 0.36392754316329956, mean loss: 0.3615848736787546
Epoch: 14, step: 771, loss: 0.315970242023468, mean loss: 0.3615827003115135
Epoch: 14, step: 772, loss: 0.3254896402359009, mean loss: 0.36158098069361483
Epoch: 14, step: 773, loss: 0.3226247727870941, mean loss: 0.3615791247523139
Epoch: 14, step: 774, loss: 0.40055978298187256, mean loss: 0.3615809817699991
Epoch: 14, step: 775, loss: 0.31830841302871704, mean loss: 0.36157892038619854
Epoch: 14, step: 776, loss: 0.34086352586746216, mean loss: 0.3615779336099151
Epoch: 14, step: 777, loss: 0.3468092083930969, mean loss: 0.3615772301362932
Epoch: 14, step: 778, loss: 0.30621105432510376, mean loss: 0.36157459302384687
Epoch: 14, step: 779, loss: 0.3229789435863495, mean loss: 0.36157275478563783
Epoch: 14, step: 780, loss: 0.37115341424942017, mean loss: 0.3615732110727009
Epoch: 14, step: 781, loss: 0.33555546402931213, mean loss: 0.36157197201436
Epoch: 14, step: 782, loss: 0.31341323256492615, mean loss: 0.3615696786318442
Epoch: 14, step: 783, loss: 0.30340760946273804, mean loss: 0.36156690900950283
Epoch: 14, step: 784, loss: 0.3499376177787781, mean loss: 0.36156635526009895
Epoch: 14, step: 785, loss: 0.34818291664123535, mean loss: 0.36156571801418813
Epoch: 14, step: 786, loss: 0.3345322608947754, mean loss: 0.36156443089058105
Epoch: 14, step: 787, loss: 0.30970677733421326, mean loss: 0.36156196194878154
Epoch: 14, step: 788, loss: 0.34048399329185486, mean loss: 0.3615609584749107
Epoch: 14, step: 789, loss: 0.3151203691959381, mean loss: 0.36155874764994267
Epoch: 14, step: 790, loss: 0.32185208797454834, mean loss: 0.3615568574866792
Epoch: 14, step: 791, loss: 0.32335221767425537, mean loss: 0.36155503891090746
Epoch: 14, step: 792, loss: 0.305020272731781, mean loss: 0.3615523479324611
Epoch: 14, step: 793, loss: 0.32979729771614075, mean loss: 0.36155083650693914
Epoch: 14, step: 794, loss: 0.3572219908237457, mean loss: 0.36155063047934966
Epoch: 14, step: 795, loss: 0.30285775661468506, mean loss: 0.3615478371767671
Epoch: 14, step: 796, loss: 0.3183734118938446, mean loss: 0.3615457825236817
Epoch: 14, step: 797, loss: 0.32431700825691223, mean loss: 0.36154401090598554
Epoch: 14, step: 798, loss: 0.38029125332832336, mean loss: 0.361544902994609
Epoch: 14, step: 799, loss: 0.37026122212409973, mean loss: 0.3615453177414271
Epoch: 14, step: 800, loss: 0.3418467044830322, mean loss: 0.3615443804709671
Epoch: 14, step: 801, loss: 0.30197376012802124, mean loss: 0.36154154620413187
Epoch: 14, step: 802, loss: 0.324766606092453, mean loss: 0.36153979659948315
Epoch: 14, step: 803, loss: 0.3247479796409607, mean loss: 0.36153804627517494
Epoch: 14, step: 804, loss: 0.375178724527359, mean loss: 0.36153869518237497
Epoch: 14, step: 805, loss: 0.3080158233642578, mean loss: 0.3615361491414741
Epoch: 14, step: 806, loss: 0.3331829607486725, mean loss: 0.3615348004667658
Epoch: 14, step: 807, loss: 0.32726991176605225, mean loss: 0.3615331706680262
Epoch: 14, step: 808, loss: 0.41091054677963257, mean loss: 0.36153551917580795
Epoch: 14, step: 809, loss: 0.3158969283103943, mean loss: 0.3615333485969596
Epoch: 14, step: 810, loss: 0.355117529630661, mean loss: 0.3615330434740716
Epoch: 14, step: 811, loss: 0.3384840190410614, mean loss: 0.36153194736296107
Epoch: 14, step: 812, loss: 0.3961702883243561, mean loss: 0.36153359453310524
Epoch: 14, step: 813, loss: 0.35337895154953003, mean loss: 0.36153320677071893
Epoch: 14, step: 814, loss: 0.3817092776298523, mean loss: 0.3615341661198159
Epoch: 14, step: 815, loss: 0.3999989926815033, mean loss: 0.36153599499137173
Epoch: 14, step: 816, loss: 0.37498706579208374, mean loss: 0.36153663451358925
Epoch: 14, step: 817, loss: 0.3260323405265808, mean loss: 0.36153494656579105
Epoch: 14, step: 818, loss: 0.3563217520713806, mean loss: 0.36153469873149136
Epoch: 14, step: 819, loss: 0.31398099660873413, mean loss: 0.36153243814477704
Epoch: 14, step: 820, loss: 0.2991929352283478, mean loss: 0.3615294748181185
Epoch: 14, step: 821, loss: 0.31055495142936707, mean loss: 0.3615270518442907
Epoch: 14, step: 822, loss: 0.3566950857639313, mean loss: 0.3615268221771924
Epoch: 14, step: 823, loss: 0.30948060750961304, mean loss: 0.36152434849778803
Epoch: 14, step: 824, loss: 0.3077389597892761, mean loss: 0.36152179227951375
Epoch: 14, step: 825, loss: 0.365503191947937, mean loss: 0.36152198149155007
Epoch: 14, step: 826, loss: 0.3215504288673401, mean loss: 0.36152008197377106
Epoch: 14, step: 827, loss: 0.3349073827266693, mean loss: 0.3615188173520619
Epoch: 14, step: 828, loss: 0.3476316034793854, mean loss: 0.3615181574701958
Epoch: 14, step: 829, loss: 0.3216497004032135, mean loss: 0.3615162631217653
Epoch: 14, step: 830, loss: 0.33983924984931946, mean loss: 0.3615152331881276
Epoch: 14, step: 831, loss: 0.3118631839752197, mean loss: 0.36151287419681194
Epoch: 14, step: 832, loss: 0.3526670038700104, mean loss: 0.36151245394547804
Epoch: 14, step: 833, loss: 0.31650882959365845, mean loss: 0.3615103160060789
Epoch: 14, step: 834, loss: 0.31973591446876526, mean loss: 0.36150833156821194
Epoch: 14, step: 835, loss: 0.3611695468425751, mean loss: 0.3615083154754547
Epoch: 14, step: 836, loss: 0.334656685590744, mean loss: 0.3615070400453552
Epoch: 14, step: 837, loss: 0.32840123772621155, mean loss: 0.36150546762195257
Epoch: 14, step: 838, loss: 0.3277476727962494, mean loss: 0.36150386430707127
Epoch: 14, step: 839, loss: 0.36058342456817627, mean loss: 0.36150382059317787
Epoch: 14, step: 840, loss: 0.30332091450691223, mean loss: 0.3615010574784851
Epoch: 14, step: 841, loss: 0.34267178177833557, mean loss: 0.3615001633159008
Epoch: 14, step: 842, loss: 0.3440268337726593, mean loss: 0.3614993335837415
Epoch: 14, step: 843, loss: 0.3317803740501404, mean loss: 0.36149792242706846
Epoch: 14, step: 844, loss: 0.35649874806404114, mean loss: 0.3614976850606394
Epoch: 14, step: 845, loss: 0.3358226716518402, mean loss: 0.36149646603996666
Epoch: 14, step: 846, loss: 0.3960200846195221, mean loss: 0.36149810510460983
Epoch: 14, step: 847, loss: 0.3515825867652893, mean loss: 0.3614976343716845
Epoch: 14, step: 848, loss: 0.3231320381164551, mean loss: 0.36149581307587364
Epoch: 14, step: 849, loss: 0.3427325487136841, mean loss: 0.36149492238640424
Epoch: 14, step: 850, loss: 0.3372296392917633, mean loss: 0.3614937705715709
Epoch: 14, step: 851, loss: 0.3678779900074005, mean loss: 0.3614940736007828
Epoch: 14, step: 852, loss: 0.3084275424480438, mean loss: 0.36149155489884377
Epoch: 14, step: 853, loss: 0.3271534740924835, mean loss: 0.3614899251845198
Epoch: 14, step: 854, loss: 0.37423834204673767, mean loss: 0.3614905302064391
Epoch: 14, step: 855, loss: 0.32812485098838806, mean loss: 0.36148894679341625
Epoch: 14, step: 856, loss: 0.33540838956832886, mean loss: 0.3614877091643542
Epoch: 14, step: 857, loss: 0.3800097107887268, mean loss: 0.3614885880673448
Epoch: 14, step: 858, loss: 0.3096601665019989, mean loss: 0.3614861288302598
Epoch: 14, step: 859, loss: 0.35961437225341797, mean loss: 0.36148604002040136
Epoch: 14, step: 860, loss: 0.3150995671749115, mean loss: 0.3614838392103788
Epoch: 14, step: 861, loss: 0.33885329961776733, mean loss: 0.36148276555350467
Epoch: 14, step: 862, loss: 0.33590584993362427, mean loss: 0.36148155216977584
Epoch: 14, step: 863, loss: 0.35922476649284363, mean loss: 0.36148144511163177
Epoch: 14, step: 864, loss: 0.3066498935222626, mean loss: 0.3614788441177705
Epoch: 14, step: 865, loss: 0.31991642713546753, mean loss: 0.361476872653157
Epoch: 14, step: 866, loss: 0.359075665473938, mean loss: 0.3614767587601067
Epoch: 14, step: 867, loss: 0.3925652801990509, mean loss: 0.3614782332678585
Epoch: 14, step: 868, loss: 0.2959080934524536, mean loss: 0.36147512346753524
Epoch: 14, step: 869, loss: 0.3192186653614044, mean loss: 0.3614731194621238
Epoch: 14, step: 870, loss: 0.3584214746952057, mean loss: 0.36147297474524764
Epoch: 14, step: 871, loss: 0.3665986955165863, mean loss: 0.3614732178086378
Epoch: 14, step: 872, loss: 0.30663400888442993, mean loss: 0.36147061743835357
Epoch: 14, step: 873, loss: 0.3443165123462677, mean loss: 0.36146980406210455
Epoch: 14, step: 874, loss: 0.35467904806137085, mean loss: 0.36146948208799234
Epoch: 14, step: 875, loss: 0.35579922795295715, mean loss: 0.3614692132536412
Epoch: 14, step: 876, loss: 0.38768821954727173, mean loss: 0.3614704562729506
Epoch: 14, step: 877, loss: 0.319803386926651, mean loss: 0.36146848096862966
Epoch: 14, step: 878, loss: 0.3581353425979614, mean loss: 0.3614683229625443
Epoch: 14, step: 879, loss: 0.33474838733673096, mean loss: 0.36146705637477283
Epoch: 14, step: 880, loss: 0.37300774455070496, mean loss: 0.3614676034045958
Epoch: 14, step: 881, loss: 0.3511224687099457, mean loss: 0.36146711306737456
Epoch: 14, step: 882, loss: 0.3156532645225525, mean loss: 0.36146494169202287
Epoch: 14, step: 883, loss: 0.3055976331233978, mean loss: 0.3614622939522803
Epoch: 14, step: 884, loss: 0.31674686074256897, mean loss: 0.3614601748378682
Epoch: 14, step: 885, loss: 0.3638944923877716, mean loss: 0.36146029019743364
Epoch: 14, step: 886, loss: 0.3444845378398895, mean loss: 0.36145948577378023
Epoch: 14, step: 887, loss: 0.3190740942955017, mean loss: 0.36145747736819467
Epoch: 14, step: 888, loss: 0.36479687690734863, mean loss: 0.3614576355960809
Epoch: 14, step: 889, loss: 0.299969345331192, mean loss: 0.3614547222875305
Epoch: 14, step: 890, loss: 0.33942002058029175, mean loss: 0.3614536783352063
Epoch: 14, step: 891, loss: 0.34327590465545654, mean loss: 0.3614528171558582
Epoch: 14, step: 892, loss: 0.3380376994609833, mean loss: 0.3614517079077794
Epoch: 14, step: 893, loss: 0.3279464840888977, mean loss: 0.3614501207346947
Epoch: 14, step: 894, loss: 0.35761240124702454, mean loss: 0.3614499389470253
Epoch: 14, step: 895, loss: 0.3004058301448822, mean loss: 0.3614470475057217
Epoch: 14, step: 896, loss: 0.3286193311214447, mean loss: 0.36144549264774867
Epoch: 14, step: 897, loss: 0.32455962896347046, mean loss: 0.361443745661688
Epoch: 14, step: 898, loss: 0.35085251927375793, mean loss: 0.3614432440644165
Epoch: 14, step: 899, loss: 0.3192756474018097, mean loss: 0.3614412471143946
Epoch: 14, step: 900, loss: 0.3728266656398773, mean loss: 0.36144178627329626
Epoch: 14, step: 901, loss: 0.38185861706733704, mean loss: 0.36144275307085255
Epoch: 14, step: 902, loss: 0.42054903507232666, mean loss: 0.36144555179626575
Epoch: 14, step: 903, loss: 0.33228182792663574, mean loss: 0.361444170938128
Epoch: 14, step: 904, loss: 0.31456100940704346, mean loss: 0.36144195119656597
Epoch: 14, step: 905, loss: 0.36837640404701233, mean loss: 0.36144227950131225
Epoch: 14, step: 906, loss: 0.34962958097457886, mean loss: 0.36144172026737165
Epoch: 14, step: 907, loss: 0.33935946226119995, mean loss: 0.36144067490389853
Epoch: 14, step: 908, loss: 0.31840547919273376, mean loss: 0.3614386377348708
Epoch: 14, step: 909, loss: 0.3084985613822937, mean loss: 0.36143613181437695
Epoch: 14, step: 910, loss: 0.3042536675930023, mean loss: 0.361433425208412
Epoch: 14, step: 911, loss: 0.3539898991584778, mean loss: 0.3614330729021809
Epoch: 14, step: 912, loss: 0.32098087668418884, mean loss: 0.3614311583678339
Epoch: 14, step: 913, loss: 0.3189885914325714, mean loss: 0.3614291497276571
Epoch: 14, step: 914, loss: 0.3317490518093109, mean loss: 0.3614277451515406
Epoch: 14, step: 915, loss: 0.3280204236507416, mean loss: 0.3614261642637164
Epoch: 14, step: 916, loss: 0.35293325781822205, mean loss: 0.36142576238483287
Epoch: 14, step: 917, loss: 0.31241142749786377, mean loss: 0.3614234431677
Epoch: 14, step: 918, loss: 0.31943634152412415, mean loss: 0.3614214565530019
Epoch: 14, step: 919, loss: 0.3201603293418884, mean loss: 0.3614195043800642
Epoch: 14, step: 920, loss: 0.35809457302093506, mean loss: 0.3614193470762198
Epoch: 14, step: 921, loss: 0.3682011663913727, mean loss: 0.3614196679116496
Epoch: 14, step: 922, loss: 0.36776092648506165, mean loss: 0.36141996789076747
Epoch: 14, step: 923, loss: 0.33832693099975586, mean loss: 0.3614188755049164
Epoch: 14, step: 924, loss: 0.3441509008407593, mean loss: 0.36141805870463906
Epoch: 14, step: 925, loss: 0.3133105933666229, mean loss: 0.36141578325930096
Epoch: 14, step: 926, loss: 0.3178597688674927, mean loss: 0.36141372319145854
Epoch: 14, step: 927, loss: 0.37351083755493164, mean loss: 0.3614142953213471
Epoch: 14, step: 928, loss: 0.3440893590450287, mean loss: 0.3614134759817266
Epoch: 14, step: 929, loss: 0.3747052848339081, mean loss: 0.3614141045549249
Epoch: 14, step: 930, loss: 0.3421323299407959, mean loss: 0.3614131927577615
Epoch: 14, step: 931, loss: 0.3418070077896118, mean loss: 0.3614122656637116
Epoch: 14, step: 932, loss: 0.3396953344345093, mean loss: 0.3614112388099015
Epoch: 14, step: 933, loss: 0.30575552582740784, mean loss: 0.36140860733411034
Epoch: 14, step: 934, loss: 0.3610237240791321, mean loss: 0.3614085891371809
Epoch: 14, step: 935, loss: 0.3288951516151428, mean loss: 0.3614070520041664
Epoch: 14, step: 936, loss: 0.32870814204216003, mean loss: 0.3614055061756805
Epoch: 14, step: 937, loss: 0.3113873600959778, mean loss: 0.3614031416986984
Epoch: 14, step: 938, loss: 0.36759617924690247, mean loss: 0.36140343444450546
Epoch: 14, step: 939, loss: 0.32966527342796326, mean loss: 0.3614019342478229
Epoch: 14, step: 940, loss: 0.3576365113258362, mean loss: 0.36140175627254656
Epoch: 14, step: 941, loss: 0.35793834924697876, mean loss: 0.36140159257999405
Epoch: 14, step: 942, loss: 0.348703533411026, mean loss: 0.3614009924543185
Epoch: 14, step: 943, loss: 0.34474825859069824, mean loss: 0.36140020546311513
Epoch: 14, step: 944, loss: 0.3160596489906311, mean loss: 0.36139806281595893
Epoch: 14, step: 945, loss: 0.33767470717430115, mean loss: 0.361396941780346
Epoch: 14, step: 946, loss: 0.3247019350528717, mean loss: 0.36139520785761636
Epoch: 14, step: 947, loss: 0.34793373942375183, mean loss: 0.3613945718025968
Epoch: 14, step: 948, loss: 0.31182369589805603, mean loss: 0.36139222968703316
Epoch: 14, step: 949, loss: 0.2990635931491852, mean loss: 0.3613892849342911
Epoch: 14, step: 950, loss: 0.31916964054107666, mean loss: 0.36138729033683314
Epoch: 14, step: 951, loss: 0.3632451295852661, mean loss: 0.36138737810323757
Epoch: 14, step: 952, loss: 0.30665323138237, mean loss: 0.3613847925230627
Epoch: 14, step: 953, loss: 0.3560750186443329, mean loss: 0.36138454170710244
Epoch: 14, step: 954, loss: 0.3026801645755768, mean loss: 0.361381768839636
Epoch: 14, step: 955, loss: 0.34519273042678833, mean loss: 0.36138100419584174
Epoch: 14, step: 956, loss: 0.3506883978843689, mean loss: 0.3613804991844446
Epoch: 14, step: 957, loss: 0.3630222976207733, mean loss: 0.36138057672286134
Epoch: 14, step: 958, loss: 0.336862713098526, mean loss: 0.3613794188544493
Epoch: 14, step: 959, loss: 0.34962910413742065, mean loss: 0.3613788639661457
Epoch: 14, step: 960, loss: 0.34786999225616455, mean loss: 0.36137822606315145
Epoch: 14, step: 961, loss: 0.3114987313747406, mean loss: 0.36137587081267036
Epoch: 14, step: 962, loss: 0.3109351098537445, mean loss: 0.36137348917232104
Epoch: 14, step: 963, loss: 0.338382363319397, mean loss: 0.3613724036611854
Epoch: 14, step: 964, loss: 0.3243873715400696, mean loss: 0.36137065751926
Epoch: 14, step: 965, loss: 0.3640260696411133, mean loss: 0.36137078288098795
Epoch: 14, step: 966, loss: 0.342250257730484, mean loss: 0.36136988024561284
Epoch: 14, step: 967, loss: 0.33917036652565, mean loss: 0.36136883230784284
Epoch: 14, step: 968, loss: 0.319500595331192, mean loss: 0.3613668559926681
Epoch: 14, step: 969, loss: 0.2978639602661133, mean loss: 0.3613638585936439
Epoch: 14, step: 970, loss: 0.30451998114585876, mean loss: 0.3613611756334585
Epoch: 14, step: 971, loss: 0.3649906814098358, mean loss: 0.36136134693352345
Epoch: 14, step: 972, loss: 0.4103463590145111, mean loss: 0.36136365874682663
Epoch: 14, step: 973, loss: 0.3216885030269623, mean loss: 0.36136178639403194
Epoch: 14, step: 974, loss: 0.3472473621368408, mean loss: 0.36136112033654255
Epoch: 14, step: 975, loss: 0.37439101934432983, mean loss: 0.3613617351864391
Epoch: 14, step: 976, loss: 0.3534892201423645, mean loss: 0.36136136371873545
Epoch: 14, step: 977, loss: 0.33917075395584106, mean loss: 0.36136031669553254
Epoch: 14, step: 978, loss: 0.3176639974117279, mean loss: 0.36135825506216224
Epoch: 14, step: 979, loss: 0.30972835421562195, mean loss: 0.3613558192298898
Epoch: 14, step: 980, loss: 0.349541038274765, mean loss: 0.36135526185002687
Epoch: 14, step: 981, loss: 0.4027668237686157, mean loss: 0.3613572154098872
Epoch: 14, step: 982, loss: 0.35278812050819397, mean loss: 0.36135681118823043
Epoch: 14, step: 983, loss: 0.3402281403541565, mean loss: 0.36135581455281374
Epoch: 14, step: 984, loss: 0.3735017478466034, mean loss: 0.3613563874471722
Epoch: 14, step: 985, loss: 0.3329317569732666, mean loss: 0.36135504678919306
Epoch: 14, step: 986, loss: 0.39637336134910583, mean loss: 0.3613566983627704
Epoch: 14, step: 987, loss: 0.3596649467945099, mean loss: 0.3613566185782218
Epoch: 14, step: 988, loss: 0.335666686296463, mean loss: 0.3613554070746952
Epoch: 14, step: 989, loss: 0.3396424651145935, mean loss: 0.36135438316910434
Epoch: 14, step: 990, loss: 0.3396882712841034, mean loss: 0.3613533615200316
Epoch: 14, step: 991, loss: 0.3411012887954712, mean loss: 0.3613524065939318
Epoch: 14, step: 992, loss: 0.31381991505622864, mean loss: 0.3613501654467048
Epoch: 14, step: 993, loss: 0.33569929003715515, mean loss: 0.3613489560702121
Epoch: 14, step: 994, loss: 0.330703467130661, mean loss: 0.36134751127793735
Epoch: 14, step: 995, loss: 0.36345723271369934, mean loss: 0.36134761073680194
Epoch: 14, step: 996, loss: 0.36364394426345825, mean loss: 0.36134771898804063
Epoch: 14, step: 997, loss: 0.3505474030971527, mean loss: 0.3613472098753843
Epoch: 14, step: 998, loss: 0.36485353112220764, mean loss: 0.3613473751509557
Epoch: 14, step: 999, loss: 0.3580653667449951, mean loss: 0.3613472204559894
Epoch: 14, step: 1000, loss: 0.3834962844848633, mean loss: 0.36134826438604684
Epoch: 14, step: 1001, loss: 0.31804752349853516, mean loss: 0.3613462236309857
Epoch: 14, step: 1002, loss: 0.31723639369010925, mean loss: 0.36134414484169586
Epoch: 14, step: 1003, loss: 0.336332768201828, mean loss: 0.36134296617173167
Epoch: 14, step: 1004, loss: 0.35352379083633423, mean loss: 0.3613425977076944
Epoch: 14, step: 1005, loss: 0.3595689535140991, mean loss: 0.36134251413196194
Epoch: 14, step: 1006, loss: 0.3020414412021637, mean loss: 0.3613397199429722
Epoch: 14, step: 1007, loss: 0.3182670772075653, mean loss: 0.3613376905120103
Epoch: 14, step: 1008, loss: 0.3420805335044861, mean loss: 0.3613367832254611
Epoch: 14, step: 1009, loss: 0.32585760951042175, mean loss: 0.361335111729479
Epoch: 14, step: 1010, loss: 0.34483271837234497, mean loss: 0.3613343343048143
Epoch: 14, step: 1011, loss: 0.34662818908691406, mean loss: 0.36133364153369985
Epoch: 14, step: 1012, loss: 0.3847775459289551, mean loss: 0.36133474586760134
Epoch: 14, step: 1013, loss: 0.3946789801120758, mean loss: 0.3613363164862657
Epoch: 14, step: 1014, loss: 0.3279661238193512, mean loss: 0.3613347447189129
Epoch: 14, step: 1015, loss: 0.32915472984313965, mean loss: 0.3613332290814376
Epoch: 14, step: 1016, loss: 0.3557341992855072, mean loss: 0.36133296538672677
Epoch: 14, step: 1017, loss: 0.32961729168891907, mean loss: 0.3613314717598219
Epoch: 14, step: 1018, loss: 0.3184424042701721, mean loss: 0.36132945202506844
Epoch: 14, step: 1019, loss: 0.3312491774559021, mean loss: 0.36132803554952836
Epoch: 14, step: 1020, loss: 0.3340231776237488, mean loss: 0.36132674982847895
Epoch: 14, step: 1021, loss: 0.28297945857048035, mean loss: 0.3613230608139174
Epoch: 14, step: 1022, loss: 0.4095836579799652, mean loss: 0.3613253330770732
Epoch: 14, step: 1023, loss: 0.3625820577144623, mean loss: 0.36132539224489985
Epoch: 14, step: 1024, loss: 0.3938567638397217, mean loss: 0.36132692378162573
Epoch: 14, step: 1025, loss: 0.3272216320037842, mean loss: 0.36132531822227265
Epoch: 14, step: 1026, loss: 0.33765101432800293, mean loss: 0.3613242037702699
Epoch: 14, step: 1027, loss: 0.37458187341690063, mean loss: 0.36132482783681324
Epoch: 14, step: 1028, loss: 0.30164751410484314, mean loss: 0.36132201883169524
Epoch: 14, step: 1029, loss: 0.3373076915740967, mean loss: 0.36132088853294453
Epoch: 14, step: 1030, loss: 0.35071614384651184, mean loss: 0.3613203894156721
Epoch: 14, step: 1031, loss: 0.28864026069641113, mean loss: 0.3613169688523853
Epoch: 14, step: 1032, loss: 0.34994253516197205, mean loss: 0.36131643355972726
Epoch: 14, step: 1033, loss: 0.36771783232688904, mean loss: 0.3613167348020222
Epoch: 14, step: 1034, loss: 0.3551253378391266, mean loss: 0.36131644345587555
Epoch: 14, step: 1035, loss: 0.3081634044647217, mean loss: 0.36131394237178976
Epoch: 14, step: 1036, loss: 0.344651997089386, mean loss: 0.3613131583909267
Epoch: 14, step: 1037, loss: 0.33259162306785583, mean loss: 0.3613118070436357
Epoch: 14, step: 1038, loss: 0.3313996493816376, mean loss: 0.36131039974381624
Epoch: 14, step: 1039, loss: 0.32229000329971313, mean loss: 0.3613085640081913
Epoch: 14, step: 1040, loss: 0.39696064591407776, mean loss: 0.3613102412007352
Epoch: 14, step: 1041, loss: 0.3154503405094147, mean loss: 0.3613080838999218
Epoch: 14, step: 1042, loss: 0.36880549788475037, mean loss: 0.3613084365700373
Epoch: 14, step: 1043, loss: 0.3386072814464569, mean loss: 0.3613073687828725
Epoch: 14, step: 1044, loss: 0.31332725286483765, mean loss: 0.3613051120632489
Epoch: 14, step: 1045, loss: 0.34904128313064575, mean loss: 0.36130453526760725
Epoch: 14, step: 1046, loss: 0.38613376021385193, mean loss: 0.36130570298735265
Epoch: 14, step: 1047, loss: 0.29410824179649353, mean loss: 0.361302542835867
Epoch: 14, step: 1048, loss: 0.33433908224105835, mean loss: 0.3613012748621734
Epoch: 14, step: 1049, loss: 0.3062116205692291, mean loss: 0.3612986843583507
Epoch: 14, step: 1050, loss: 0.302092045545578, mean loss: 0.36129590039075715
Epoch: 14, step: 1051, loss: 0.3324207067489624, mean loss: 0.3612945427081522
Epoch: 14, step: 1052, loss: 0.3375804126262665, mean loss: 0.3612934277459969
Epoch: 14, step: 1053, loss: 0.3570670783519745, mean loss: 0.3612932290459783
Epoch: 14, step: 1054, loss: 0.3088013231754303, mean loss: 0.36129076127737925
Epoch: 14, step: 1055, loss: 0.3446982502937317, mean loss: 0.36128998126087947
Epoch: 14, step: 1056, loss: 0.318145215511322, mean loss: 0.3612879531141324
Epoch: 14, step: 1057, loss: 0.32497769594192505, mean loss: 0.3612862463238169
Epoch: 14, step: 1058, loss: 0.30986830592155457, mean loss: 0.36128382949935617
Epoch: 14, step: 1059, loss: 0.36922794580459595, mean loss: 0.3612842028832773
Epoch: 14, step: 1060, loss: 0.3206160366535187, mean loss: 0.36128229151578045
Epoch: 14, step: 1061, loss: 0.34891676902770996, mean loss: 0.36128171037457885
Epoch: 14, step: 1062, loss: 0.35070836544036865, mean loss: 0.3612812134835156
Epoch: 14, step: 1063, loss: 0.32763171195983887, mean loss: 0.36127963220994774
Epoch: 14, step: 1064, loss: 0.3406356871128082, mean loss: 0.36127866214533155
Epoch: 14, step: 1065, loss: 0.3167225122451782, mean loss: 0.3612765685380625
Epoch: 14, step: 1066, loss: 0.34296682476997375, mean loss: 0.3612757082390554
Epoch: 14, step: 1067, loss: 0.3420107662677765, mean loss: 0.3612748031017705
Epoch: 14, step: 1068, loss: 0.3066968023777008, mean loss: 0.361272238948577
Epoch: 14, step: 1069, loss: 0.33708611130714417, mean loss: 0.3612711027027985
Epoch: 14, step: 1070, loss: 0.34005820751190186, mean loss: 0.3612701061840222
Epoch: 14, step: 1071, loss: 0.335487961769104, mean loss: 0.3612688950723906
Epoch: 14, step: 1072, loss: 0.3494510054588318, mean loss: 0.36126833995521207
Epoch: 14, step: 1073, loss: 0.29859891533851624, mean loss: 0.36126539634672844
Epoch: 14, step: 1074, loss: 0.3311362862586975, mean loss: 0.3612639812365839
Epoch: 14, step: 1075, loss: 0.3537169396877289, mean loss: 0.361263626782256
Epoch: 14, step: 1076, loss: 0.33681660890579224, mean loss: 0.3612624786576199
Epoch: 14, step: 1077, loss: 0.3328181803226471, mean loss: 0.3612611428682738
Epoch: 14, step: 1078, loss: 0.355307400226593, mean loss: 0.36126086328420987
Epoch: 14, step: 1079, loss: 0.34320080280303955, mean loss: 0.36126001523478835
Epoch: 14, step: 1080, loss: 0.33845219016075134, mean loss: 0.36125894429404204
Epoch: 14, step: 1081, loss: 0.31470590829849243, mean loss: 0.3612567585002588
Epoch: 14, step: 1082, loss: 0.3858409523963928, mean loss: 0.3612579127419554
Epoch: 14, step: 1083, loss: 0.3013674318790436, mean loss: 0.36125510098229047
Epoch: 14, step: 1084, loss: 0.3295159935951233, mean loss: 0.3612536109533065
Epoch: 14, step: 1085, loss: 0.35459911823272705, mean loss: 0.3612532985651401
Epoch: 14, step: 1086, loss: 0.36313846707344055, mean loss: 0.36125338705824006
Epoch: 14, step: 1087, loss: 0.3370281755924225, mean loss: 0.36125224993791216
Epoch: 14, step: 1088, loss: 0.35096198320388794, mean loss: 0.36125176694017763
Epoch: 14, step: 1089, loss: 0.33780714869499207, mean loss: 0.3612506665638402
Epoch: 14, step: 1090, loss: 0.3238963484764099, mean loss: 0.36124891341613813
Epoch: 14, step: 1091, loss: 0.3209691345691681, mean loss: 0.36124702305670287
Epoch: 14, step: 1092, loss: 0.3817392885684967, mean loss: 0.3612479847285557
Epoch: 14, step: 1093, loss: 0.34653210639953613, mean loss: 0.36124729416645673
Epoch: 14, step: 1094, loss: 0.3459891676902771, mean loss: 0.36124657819224265
Epoch: 14, step: 1095, loss: 0.3485502004623413, mean loss: 0.36124598245379813
Epoch: 14, step: 1096, loss: 0.3504609763622284, mean loss: 0.36124547642432825
Epoch: 14, step: 1097, loss: 0.3458971679210663, mean loss: 0.36124475631977243
Epoch: 14, step: 1098, loss: 0.31660720705986023, mean loss: 0.3612426621349608
Epoch: 14, step: 1099, loss: 0.2898977994918823, mean loss: 0.3612393151250789
Epoch: 14, step: 1100, loss: 0.32834693789482117, mean loss: 0.36123777211352803
Epoch: 14, step: 1101, loss: 0.33255302906036377, mean loss: 0.36123642654907295
Epoch: 14, step: 1102, loss: 0.3313179314136505, mean loss: 0.3612350231767227
Epoch: 14, step: 1103, loss: 0.3255998492240906, mean loss: 0.3612333517332915
Epoch: 14, step: 1104, loss: 0.3314478099346161, mean loss: 0.3612319547283762
Epoch: 14, step: 1105, loss: 0.32689693570137024, mean loss: 0.3612303444188824
Epoch: 14, step: 1106, loss: 0.31692612171173096, mean loss: 0.3612282666520247
Epoch: 14, step: 1107, loss: 0.3081563711166382, mean loss: 0.3612257778180566
Epoch: 14, step: 1108, loss: 0.3169386088848114, mean loss: 0.36122370104577367
Epoch: 14, step: 1109, loss: 0.31628164649009705, mean loss: 0.3612215936625534
Epoch: 14, step: 1110, loss: 0.32729604840278625, mean loss: 0.36122000293037076
Epoch: 14, step: 1111, loss: 0.34902772307395935, mean loss: 0.3612194312743385
Epoch: 14, step: 1112, loss: 0.3341861963272095, mean loss: 0.3612181638340015
Epoch: 14, step: 1113, loss: 0.32515084743499756, mean loss: 0.3612164729143391
Epoch: 14, step: 1114, loss: 0.3101223409175873, mean loss: 0.3612140776149159
Epoch: 14, step: 1115, loss: 0.337649941444397, mean loss: 0.36121297297699306
Epoch: 14, step: 1116, loss: 0.36954331398010254, mean loss: 0.361213363467829
Epoch: 14, step: 1117, loss: 0.35340237617492676, mean loss: 0.36121299733924117
Epoch: 14, step: 1118, loss: 0.4548914432525635, mean loss: 0.36121738817335947
Epoch: 14, step: 1119, loss: 0.366357684135437, mean loss: 0.3612176290946175
Epoch: 14, step: 1120, loss: 0.32040542364120483, mean loss: 0.36121571635123967
Epoch: 14, step: 1121, loss: 0.3169235587120056, mean loss: 0.3612136406104186
Epoch: 14, step: 1122, loss: 0.3665456473827362, mean loss: 0.361213890481864
Epoch: 14, step: 1123, loss: 0.32836949825286865, mean loss: 0.36121235138194696
Epoch: 14, step: 1124, loss: 0.3093368113040924, mean loss: 0.3612099205895718
Epoch: 14, step: 1125, loss: 0.31217944622039795, mean loss: 0.36120762321939237
Epoch: 14, step: 1126, loss: 0.3114328682422638, mean loss: 0.36120529108450145
Epoch: 14, step: 1127, loss: 0.3373042345046997, mean loss: 0.3612041712823753
Epoch: 14, step: 1128, loss: 0.3681677579879761, mean loss: 0.3612044975220898
Epoch: 14, step: 1129, loss: 0.3148220181465149, mean loss: 0.36120232463352164
Epoch: 14, step: 1130, loss: 0.39140206575393677, mean loss: 0.36120373934009026
Epoch: 14, step: 1131, loss: 0.3602094054222107, mean loss: 0.3612036927627098
Epoch: 14, step: 1132, loss: 0.32296323776245117, mean loss: 0.3612019015567985
Epoch: 14, step: 1133, loss: 0.3539260923862457, mean loss: 0.36120156076948373
Epoch: 14, step: 1134, loss: 0.3548356592655182, mean loss: 0.3612012626147601
Epoch: 14, step: 1135, loss: 0.30430370569229126, mean loss: 0.361198597873428
Epoch: 14, step: 1136, loss: 0.31008589267730713, mean loss: 0.3611962041720654
Epoch: 14, step: 1137, loss: 0.33673590421676636, mean loss: 0.36119505870517604
Epoch: 14, step: 1138, loss: 0.3278103172779083, mean loss: 0.3611934953831705
Epoch: 14, step: 1139, loss: 0.304995596408844, mean loss: 0.3611908639026042
Epoch: 14, step: 1140, loss: 0.35774025321006775, mean loss: 0.36119070233446765
Epoch: 14, step: 1141, loss: 0.3181926906108856, mean loss: 0.3611886891304353
Epoch: 14, step: 1142, loss: 0.32076045870780945, mean loss: 0.3611867963344044
Epoch: 14, step: 1143, loss: 0.37421250343322754, mean loss: 0.3611874061521525
Epoch: 14, step: 1144, loss: 0.312924861907959, mean loss: 0.3611851467755201
Epoch: 14, step: 1145, loss: 0.3282780945301056, mean loss: 0.36118360632742325
Epoch: 14, step: 1146, loss: 0.34186041355133057, mean loss: 0.3611827018106056
Epoch: 14, step: 1147, loss: 0.30089640617370605, mean loss: 0.36117987994692663
Epoch: 14, step: 1148, loss: 0.348703533411026, mean loss: 0.36117929598500126
Epoch: 14, step: 1149, loss: 0.344929575920105, mean loss: 0.3611785354439517
Epoch: 14, step: 1150, loss: 0.3524724841117859, mean loss: 0.36117812799080745
Epoch: 14, step: 1151, loss: 0.31325340270996094, mean loss: 0.36117588516390364
Epoch: 14, step: 1152, loss: 0.35072651505470276, mean loss: 0.3611753961672211
Epoch: 14, step: 1153, loss: 0.3710941672325134, mean loss: 0.36117586031186616
Epoch: 14, step: 1154, loss: 0.3185703754425049, mean loss: 0.36117386669973434
Epoch: 14, step: 1155, loss: 0.29613691568374634, mean loss: 0.36117082360825875
Epoch: 14, step: 1156, loss: 0.32937732338905334, mean loss: 0.3611693360538574
Epoch: 14, step: 1157, loss: 0.31830260157585144, mean loss: 0.36116733049876815
Epoch: 14, step: 1158, loss: 0.32095393538475037, mean loss: 0.36116544917034177
Epoch: 14, step: 1159, loss: 0.3099399507045746, mean loss: 0.36116305276790606
Epoch: 14, step: 1160, loss: 0.33600640296936035, mean loss: 0.36116187595872806
Epoch: 14, step: 1161, loss: 0.40204957127571106, mean loss: 0.3611637885649268
Epoch: 14, step: 1162, loss: 0.37582141160964966, mean loss: 0.36116447417337644
Epoch: 14, step: 1163, loss: 0.3200657069683075, mean loss: 0.3611625518736943
Epoch: 14, step: 1164, loss: 0.323566198348999, mean loss: 0.3611607934735481
Epoch: 14, step: 1165, loss: 0.33974653482437134, mean loss: 0.36115979196486564
Epoch: 14, step: 1166, loss: 0.3028634786605835, mean loss: 0.3611570656723293
Epoch: 14, step: 1167, loss: 0.3695420026779175, mean loss: 0.36115745778498387
Epoch: 14, step: 1168, loss: 0.3228539824485779, mean loss: 0.3611556666474886
Epoch: 14, step: 1169, loss: 0.3786119520664215, mean loss: 0.3611564828957547
Epoch: 14, step: 1170, loss: 0.34230726957321167, mean loss: 0.3611556015560005
Epoch: 14, step: 1171, loss: 0.3031885027885437, mean loss: 0.361152891293294
Epoch: 14, step: 1172, loss: 0.36728236079216003, mean loss: 0.36115317786440526
Epoch: 14, step: 1173, loss: 0.3445492088794708, mean loss: 0.36115240161527085
Epoch: 14, step: 1174, loss: 0.37948840856552124, mean loss: 0.36115325879852317
Epoch: 14, step: 1175, loss: 0.3426564037799835, mean loss: 0.3611523941362654
Epoch: 14, step: 1176, loss: 0.33838900923728943, mean loss: 0.3611513300786344
Epoch: 14, step: 1177, loss: 0.38033437728881836, mean loss: 0.3611522267341084
Epoch: 14, step: 1178, loss: 0.33484479784965515, mean loss: 0.3611509971277104
Epoch: 14, step: 1179, loss: 0.32030731439590454, mean loss: 0.36114908818759395
Epoch: 14, step: 1180, loss: 0.3273653984069824, mean loss: 0.3611475092891605
Epoch: 14, step: 1181, loss: 0.3358630836009979, mean loss: 0.3611463276635091
Epoch: 14, step: 1182, loss: 0.3303288221359253, mean loss: 0.3611448875258612
Epoch: 14, step: 1183, loss: 0.32895416021347046, mean loss: 0.36114338328626716
Epoch: 14, step: 1184, loss: 0.31518471240997314, mean loss: 0.3611412357851749
Epoch: 14, step: 1185, loss: 0.3336745798587799, mean loss: 0.3611399524165212
Epoch: 14, step: 1186, loss: 0.393468976020813, mean loss: 0.3611414629068078
Epoch: 14, step: 1187, loss: 0.34060782194137573, mean loss: 0.3611405035701901
Epoch: 14, step: 1188, loss: 0.30865195393562317, mean loss: 0.36113805140716115
Epoch: 14, step: 1189, loss: 0.3157811462879181, mean loss: 0.3611359325196941
Epoch: 14, step: 1190, loss: 0.3202238380908966, mean loss: 0.3611340213647248
Epoch: 14, step: 1191, loss: 0.3438388407230377, mean loss: 0.3611332134807262
Epoch: 14, step: 1192, loss: 0.34987199306488037, mean loss: 0.36113268747668975
Epoch: 14, step: 1193, loss: 0.328091561794281, mean loss: 0.3611311442200021
Epoch: 14, step: 1194, loss: 0.33451080322265625, mean loss: 0.3611299009179145
Epoch: 14, step: 1195, loss: 0.32765746116638184, mean loss: 0.3611283376618081
Epoch: 14, step: 1196, loss: 0.36417022347450256, mean loss: 0.3611284797197081
Epoch: 14, step: 1197, loss: 0.30688342452049255, mean loss: 0.361125946561251
Epoch: 14, step: 1198, loss: 0.32236525416374207, mean loss: 0.3611241365826193
Epoch: 14, step: 1199, loss: 0.3241368532180786, mean loss: 0.3611224094961716
Epoch: 14, step: 1200, loss: 0.3343714773654938, mean loss: 0.3611211604448511
Epoch: 14, step: 1201, loss: 0.3128999173641205, mean loss: 0.36111890900946586
Epoch: 14, step: 1202, loss: 0.30374380946159363, mean loss: 0.3611162303083338
Epoch: 14, step: 1203, loss: 0.39499738812446594, mean loss: 0.3611178120617332
Epoch: 14, step: 1204, loss: 0.34474480152130127, mean loss: 0.3611170477178398
Epoch: 14, step: 1205, loss: 0.32852986454963684, mean loss: 0.36111552651612344
Epoch: 14, step: 1206, loss: 0.3345850706100464, mean loss: 0.36111428810619456
Epoch: 14, step: 1207, loss: 0.38031503558158875, mean loss: 0.36111518433227163
Epoch: 14, step: 1208, loss: 0.3547055125236511, mean loss: 0.3611148851643926
Epoch: 14, step: 1209, loss: 0.3186761140823364, mean loss: 0.36111290445072314
Epoch: 14, step: 1210, loss: 0.30829429626464844, mean loss: 0.36111043940157084
Epoch: 14, step: 1211, loss: 0.3239355981349945, mean loss: 0.3611087045293818
Epoch: 14, step: 1212, loss: 0.31234636902809143, mean loss: 0.3611064289992357
Epoch: 14, step: 1213, loss: 0.3560246229171753, mean loss: 0.3611061918640942
Epoch: 14, step: 1214, loss: 0.3292681574821472, mean loss: 0.3611047062575251
Epoch: 14, step: 1215, loss: 0.3039066195487976, mean loss: 0.3611020374404894
Epoch: 14, step: 1216, loss: 0.3597109019756317, mean loss: 0.36110197253424836
Epoch: 14, step: 1217, loss: 0.3524520993232727, mean loss: 0.36110156897573337
Epoch: 14, step: 1218, loss: 0.3463931679725647, mean loss: 0.3611008827895424
Epoch: 14, step: 1219, loss: 0.3085845410823822, mean loss: 0.36109843287623267
Epoch: 14, step: 1220, loss: 0.3567749261856079, mean loss: 0.36109823119191625
Epoch: 14, step: 1221, loss: 0.3323410749435425, mean loss: 0.3610968897815119
Epoch: 14, step: 1222, loss: 0.31628939509391785, mean loss: 0.36109479978222614
Epoch: 14, step: 1223, loss: 0.32210227847099304, mean loss: 0.3610929811011948
Epoch: 14, step: 1224, loss: 0.309314101934433, mean loss: 0.3610905661541696
Epoch: 14, step: 1225, loss: 0.30264756083488464, mean loss: 0.3610878405219842
Epoch: 14, step: 1226, loss: 0.3174825608730316, mean loss: 0.36108580697818676
Epoch: 14, step: 1227, loss: 0.39319658279418945, mean loss: 0.36108730440291237
Epoch: 14, step: 1228, loss: 0.344066858291626, mean loss: 0.3610865107239144
Epoch: 14, step: 1229, loss: 0.3403421640396118, mean loss: 0.3610855434411258
Epoch: 14, step: 1230, loss: 0.3405238687992096, mean loss: 0.3610845847208087
Epoch: 14, step: 1231, loss: 0.34965166449546814, mean loss: 0.36108405166783286
Epoch: 14, step: 1232, loss: 0.3326604664325714, mean loss: 0.3610827264971846
Epoch: 14, step: 1233, loss: 0.3168218731880188, mean loss: 0.3610806630541399
Epoch: 14, step: 1234, loss: 0.31575480103492737, mean loss: 0.36107855005884737
Epoch: 14, step: 1235, loss: 0.32253164052963257, mean loss: 0.36107675316767035
Epoch: 14, step: 1236, loss: 0.3281479477882385, mean loss: 0.36107521823990363
Epoch: 14, step: 1237, loss: 0.30715441703796387, mean loss: 0.3610727049183225
Epoch: 14, step: 1238, loss: 0.29099375009536743, mean loss: 0.3610694385955622
Epoch: 14, step: 1239, loss: 0.35890674591064453, mean loss: 0.36106933779892325
Epoch: 14, step: 1240, loss: 0.33358076214790344, mean loss: 0.36106805669831965
Epoch: 14, step: 1241, loss: 0.33064714074134827, mean loss: 0.3610666390025439
Epoch: 14, step: 1242, loss: 0.3232713043689728, mean loss: 0.3610648777212804
Epoch: 14, step: 1243, loss: 0.30460357666015625, mean loss: 0.361062246719367
Epoch: 14, step: 1244, loss: 0.33264851570129395, mean loss: 0.36106092274886153
Epoch: 14, step: 1245, loss: 0.3181394338607788, mean loss: 0.3610589228658642
Epoch: 14, step: 1246, loss: 0.33313366770744324, mean loss: 0.3610576217777051
Epoch: 14, step: 1247, loss: 0.35105210542678833, mean loss: 0.3610571556243157
Epoch: 14, step: 1248, loss: 0.3184620440006256, mean loss: 0.3610551712259172
Epoch: 14, step: 1249, loss: 0.34720152616500854, mean loss: 0.3610545258497381
Epoch: 14, step: 1250, loss: 0.36463916301727295, mean loss: 0.3610546928333486
Epoch: 14, step: 1251, loss: 0.33548885583877563, mean loss: 0.3610535019521769
Epoch: 14, step: 1252, loss: 0.3418557643890381, mean loss: 0.3610526077448285
Epoch: 14, step: 1253, loss: 0.3207987844944, mean loss: 0.36105073285785827
Epoch: 14, step: 1254, loss: 0.3774281442165375, mean loss: 0.3610514956267726
Epoch: 14, step: 1255, loss: 0.348875492811203, mean loss: 0.361050928562558
Epoch: 14, step: 1256, loss: 0.32433995604515076, mean loss: 0.36104921892848185
Epoch: 14, step: 1257, loss: 0.32289910316467285, mean loss: 0.3610474423560797
Epoch: 14, step: 1258, loss: 0.3242051899433136, mean loss: 0.36104572676807445
Epoch: 14, step: 1259, loss: 0.3148306906223297, mean loss: 0.36104357482934535
Epoch: 14, step: 1260, loss: 0.354213684797287, mean loss: 0.36104325681984534
Epoch: 14, step: 1261, loss: 0.36571556329727173, mean loss: 0.3610434743590239
Epoch: 14, step: 1262, loss: 0.28997802734375, mean loss: 0.36104016575773823
Epoch: 14, step: 1263, loss: 0.3315945267677307, mean loss: 0.3610387949179342
Epoch: 14, step: 1264, loss: 0.3357063829898834, mean loss: 0.36103761562404996
Epoch: 14, step: 1265, loss: 0.34032103419303894, mean loss: 0.361036651254744
Epoch: 14, step: 1266, loss: 0.2990034818649292, mean loss: 0.3610337637078748
Epoch: 14, step: 1267, loss: 0.358084112405777, mean loss: 0.36103362641261777
Epoch: 14, step: 1268, loss: 0.31065618991851807, mean loss: 0.36103128164014886
Epoch: 14, step: 1269, loss: 0.3186458945274353, mean loss: 0.36102930894224733
Epoch: 14, step: 1270, loss: 0.32427695393562317, mean loss: 0.36102759849616334
Epoch: 14, step: 1271, loss: 0.28642573952674866, mean loss: 0.3610241267045136
Epoch: 14, step: 1272, loss: 0.4020140767097473, mean loss: 0.36102603418973883
Epoch: 14, step: 1273, loss: 0.35184305906295776, mean loss: 0.361025606875866
Epoch: 14, step: 1274, loss: 0.4110773205757141, mean loss: 0.36102793583746384
Epoch: 14, step: 1275, loss: 0.35579460859298706, mean loss: 0.36102769233628923
Epoch: 14, step: 1276, loss: 0.3242431879043579, mean loss: 0.36102598087188537
Epoch: 14, step: 1277, loss: 0.3228188455104828, mean loss: 0.36102420329975543
Epoch: 14, step: 1278, loss: 0.3315916955471039, mean loss: 0.36102283402747104
Epoch: 14, step: 1279, loss: 0.31986895203590393, mean loss: 0.3610209195372407
Epoch: 14, step: 1280, loss: 0.3203609883785248, mean loss: 0.3610190281137324
Epoch: 14, step: 1281, loss: 0.33312368392944336, mean loss: 0.36101773053515834
Epoch: 14, step: 1282, loss: 0.34876424074172974, mean loss: 0.36101716057889094
Epoch: 14, step: 1283, loss: 0.3138047456741333, mean loss: 0.3610149646526163
Epoch: 14, step: 1284, loss: 0.3124590814113617, mean loss: 0.36101270634447985
Epoch: 14, step: 1285, loss: 0.3230895400047302, mean loss: 0.3610109426403435
Epoch: 14, step: 1286, loss: 0.32344329357147217, mean loss: 0.3610091955516085
Epoch: 14, step: 1287, loss: 0.3241358995437622, mean loss: 0.3610074808336022
Epoch: 14, step: 1288, loss: 0.3378603756427765, mean loss: 0.36100640447437454
Epoch: 14, step: 1289, loss: 0.40383562445640564, mean loss: 0.36100839597535017
Epoch: 14, step: 1290, loss: 0.30616268515586853, mean loss: 0.3610058458423321
Epoch: 14, step: 1291, loss: 0.33045971393585205, mean loss: 0.3610044256204655
Epoch: 14, step: 1292, loss: 0.38061702251434326, mean loss: 0.36100533745257735
Epoch: 14, step: 1293, loss: 0.33521273732185364, mean loss: 0.36100413835447737
Epoch: 14, step: 1294, loss: 0.3642463684082031, mean loss: 0.3610042890787605
Epoch: 14, step: 1295, loss: 0.3875410556793213, mean loss: 0.36100552265846486
Epoch: 14, step: 1296, loss: 0.33053964376449585, mean loss: 0.3610041064971255
Epoch: 14, step: 1297, loss: 0.3760736286640167, mean loss: 0.36100480694902504
Epoch: 14, step: 1298, loss: 0.3142348825931549, mean loss: 0.3610026331203308
Epoch: 14, step: 1299, loss: 0.345419317483902, mean loss: 0.36100190885394134
Epoch: 14, step: 1300, loss: 0.36476999521255493, mean loss: 0.3610020839753039
Epoch: 14, step: 1301, loss: 0.3124917149543762, mean loss: 0.3609998295664824
Epoch: 14, step: 1302, loss: 0.29835888743400574, mean loss: 0.36099691860676625
Epoch: 14, step: 1303, loss: 0.3711526095867157, mean loss: 0.36099739052549207
Epoch: 14, step: 1304, loss: 0.3524382412433624, mean loss: 0.36099699281398784
Epoch: 14, step: 1305, loss: 0.31023481488227844, mean loss: 0.36099463419592576
Epoch: 14, step: 1306, loss: 0.3333992063999176, mean loss: 0.36099335205924427
Epoch: 14, step: 1307, loss: 0.31184983253479004, mean loss: 0.3609910688628345
Epoch: 14, step: 1308, loss: 0.2945329546928406, mean loss: 0.36098798137785565
Epoch: 14, step: 1309, loss: 0.3201088011264801, mean loss: 0.36098608231717316
Epoch: 14, step: 1310, loss: 0.3463013470172882, mean loss: 0.3609854001628878
Epoch: 14, step: 1311, loss: 0.35307827591896057, mean loss: 0.3609850328680047
Epoch: 14, step: 1312, loss: 0.3213944435119629, mean loss: 0.3609831939256778
Epoch: 14, step: 1313, loss: 0.2932196259498596, mean loss: 0.3609800465235424
Epoch: 14, step: 1314, loss: 0.3279411792755127, mean loss: 0.36097851204454706
Epoch: 14, step: 1315, loss: 0.3295292854309082, mean loss: 0.3609770514637086
Epoch: 14, step: 1316, loss: 0.3334389925003052, mean loss: 0.36097577258668434
Epoch: 14, step: 1317, loss: 0.3757704496383667, mean loss: 0.36097645962471964
Epoch: 14, step: 1318, loss: 0.3261157274246216, mean loss: 0.3609748408305613
Epoch: 14, step: 1319, loss: 0.30268195271492004, mean loss: 0.3609721340656971
Epoch: 14, step: 1320, loss: 0.31768572330474854, mean loss: 0.3609701242030997
Epoch: 14, step: 1321, loss: 0.3199354112148285, mean loss: 0.3609682189791705
Epoch: 14, step: 1322, loss: 0.3109125792980194, mean loss: 0.360965895025427
Epoch: 14, step: 1323, loss: 0.31322145462036133, mean loss: 0.36096367847759014
Epoch: 14, step: 1324, loss: 0.30329185724258423, mean loss: 0.360961001172858
Epoch: 14, step: 1325, loss: 0.38201576471328735, mean loss: 0.36096197855488105
Epoch: 14, step: 1326, loss: 0.3473624885082245, mean loss: 0.36096134728300405
Epoch: 14, step: 1327, loss: 0.3678014576435089, mean loss: 0.36096166477791497
Epoch: 14, step: 1328, loss: 0.338887482881546, mean loss: 0.3609606402162117
Epoch: 14, step: 1329, loss: 0.33627986907958984, mean loss: 0.3609594947241883
Epoch: 14, step: 1330, loss: 0.33152779936790466, mean loss: 0.36095812879411193
Epoch: 14, step: 1331, loss: 0.3468411862850189, mean loss: 0.36095747365477143
Epoch: 14, step: 1332, loss: 0.33483102917671204, mean loss: 0.36095626123449776
Epoch: 14, step: 1333, loss: 0.35359907150268555, mean loss: 0.3609559198335821
Epoch: 14, step: 1334, loss: 0.3553222417831421, mean loss: 0.3609556584221371
Epoch: 14, step: 1335, loss: 0.3414159119129181, mean loss: 0.360954751789504
Epoch: 14, step: 1336, loss: 0.3236025273799896, mean loss: 0.3609530187488874
Epoch: 14, step: 1337, loss: 0.3274894654750824, mean loss: 0.36095146620396423
Epoch: 14, step: 1338, loss: 0.3202129602432251, mean loss: 0.36094957622456453
Epoch: 14, step: 1339, loss: 0.2866809368133545, mean loss: 0.3609461308432595
Epoch: 14, step: 1340, loss: 0.3250805139541626, mean loss: 0.36094446708592365
Epoch: 14, step: 1341, loss: 0.34037286043167114, mean loss: 0.3609435128412509
Epoch: 14, step: 1342, loss: 0.30954888463020325, mean loss: 0.36094112893530855
Epoch: 14, step: 1343, loss: 0.3644220530986786, mean loss: 0.36094129038819184
Epoch: 14, step: 1344, loss: 0.3228094279766083, mean loss: 0.36093952183096295
Epoch: 14, step: 1345, loss: 0.3219471573829651, mean loss: 0.3609377134474898
Epoch: 14, step: 1346, loss: 0.3393644094467163, mean loss: 0.3609367129696342
Epoch: 14, step: 1347, loss: 0.31776344776153564, mean loss: 0.3609347108705242
Epoch: 14, step: 1348, loss: 0.3747042417526245, mean loss: 0.3609353493834332
Epoch: 14, step: 1349, loss: 0.3253718614578247, mean loss: 0.3609337003299265
Epoch: 14, step: 1350, loss: 0.35878968238830566, mean loss: 0.36093360091795723
Epoch: 14, step: 1351, loss: 0.3438214957714081, mean loss: 0.360932807515456
Epoch: 14, step: 1352, loss: 0.3488253057003021, mean loss: 0.3609322461773404
Epoch: 14, step: 1353, loss: 0.345389723777771, mean loss: 0.3609315256153376
Epoch: 14, step: 1354, loss: 0.3645320236682892, mean loss: 0.3609316925291595
Epoch: 14, step: 1355, loss: 0.32251179218292236, mean loss: 0.3609299115213556
Epoch: 14, step: 1356, loss: 0.323768675327301, mean loss: 0.360928188940528
Epoch: 14, step: 1357, loss: 0.2829921841621399, mean loss: 0.36092457644378295
Epoch: 14, step: 1358, loss: 0.3460466265678406, mean loss: 0.3609238868516682
Epoch: 14, step: 1359, loss: 0.3632131814956665, mean loss: 0.36092399295542443
Epoch: 14, step: 1360, loss: 0.3283510208129883, mean loss: 0.360922483339994
Epoch: 14, step: 1361, loss: 0.31294018030166626, mean loss: 0.36092025967222874
Epoch: 14, step: 1362, loss: 0.3363434374332428, mean loss: 0.360919120749098
Epoch: 14, step: 1363, loss: 0.33815905451774597, mean loss: 0.36091806606576937
Epoch: 14, step: 1364, loss: 0.3084813952445984, mean loss: 0.36091563630483053
Epoch: 14, step: 1365, loss: 0.31198495626449585, mean loss: 0.3609133691062372
Epoch: 14, step: 1366, loss: 0.3457854688167572, mean loss: 0.3609126681888351
Epoch: 14, step: 1367, loss: 0.3195345997810364, mean loss: 0.36091075111746707
Epoch: 14, step: 1368, loss: 0.3249284625053406, mean loss: 0.36090908411313016
Epoch: 14, step: 1369, loss: 0.31032195687294006, mean loss: 0.3609067405975534
Epoch: 14, step: 1370, loss: 0.3111650347709656, mean loss: 0.3609044363539889
Epoch: 14, step: 1371, loss: 0.33125388622283936, mean loss: 0.3609030628802937
Epoch: 14, step: 1372, loss: 0.35659998655319214, mean loss: 0.36090286356229256
Epoch: 14, step: 1373, loss: 0.3301101624965668, mean loss: 0.3609014373139801
Epoch: 14, step: 1374, loss: 0.34074917435646057, mean loss: 0.3609005039499415
Epoch: 14, step: 1375, loss: 0.31701356172561646, mean loss: 0.36089847139426234
Epoch: 14, step: 1376, loss: 0.35993918776512146, mean loss: 0.360898426968586
Epoch: 14, step: 1377, loss: 0.32035940885543823, mean loss: 0.3608965496407119
Epoch: 14, step: 1378, loss: 0.3398002088069916, mean loss: 0.36089557273212963
Epoch: 14, step: 1379, loss: 0.36434298753738403, mean loss: 0.3608957323642284
Epoch: 14, step: 1380, loss: 0.30645987391471863, mean loss: 0.36089321183552303
Epoch: 14, step: 1381, loss: 0.3180665373802185, mean loss: 0.36089122893551123
Epoch: 14, step: 1382, loss: 0.3435378074645996, mean loss: 0.36089042549917294
Epoch: 14, step: 1383, loss: 0.3122239410877228, mean loss: 0.3608881724211909
Epoch: 14, step: 1384, loss: 0.31200432777404785, mean loss: 0.36088590938500525
Epoch: 14, step: 1385, loss: 0.35464003682136536, mean loss: 0.36088562025101006
Epoch: 14, step: 1386, loss: 0.33264902234077454, mean loss: 0.3608843131826441
Epoch: 14, step: 1387, loss: 0.33584192395210266, mean loss: 0.36088315402743065
Epoch: 14, step: 1388, loss: 0.31561562418937683, mean loss: 0.36088105879346455
Epoch: 14, step: 1389, loss: 0.304433137178421, mean loss: 0.3608784461894835
Epoch: 14, step: 1390, loss: 0.3720436990261078, mean loss: 0.3608789629318742
Epoch: 14, step: 1391, loss: 0.3345249891281128, mean loss: 0.3608777432922128
Epoch: 14, step: 1392, loss: 0.4012765884399414, mean loss: 0.36087961283014364
Epoch: 14, step: 1393, loss: 0.3113079369068146, mean loss: 0.3608773189071486
Epoch: 14, step: 1394, loss: 0.3232399523258209, mean loss: 0.36087557732339115
Epoch: 14, step: 1395, loss: 0.36498817801475525, mean loss: 0.36087576761585327
Epoch: 14, step: 1396, loss: 0.31894350051879883, mean loss: 0.3608738274748688
Epoch: 14, step: 1397, loss: 0.2876250743865967, mean loss: 0.36087043852543377
Epoch: 14, step: 1398, loss: 0.3093026876449585, mean loss: 0.36086805278632295
Epoch: 14, step: 1399, loss: 0.33461928367614746, mean loss: 0.36086683846502804
Epoch: 14, step: 1400, loss: 0.3390146791934967, mean loss: 0.3608658275865865
Epoch: 14, step: 1401, loss: 0.30771559476852417, mean loss: 0.36086336897650145
Epoch: 14, step: 1402, loss: 0.3112648129463196, mean loss: 0.3608610747651119
Epoch: 14, step: 1403, loss: 0.36101025342941284, mean loss: 0.36086108166514264
Epoch: 14, step: 1404, loss: 0.40715092420578003, mean loss: 0.36086322263191295
Epoch: 14, step: 1405, loss: 0.3163163363933563, mean loss: 0.3608611623744789
Epoch: 14, step: 1406, loss: 0.31025516986846924, mean loss: 0.3608588219965246
Epoch: 14, step: 1407, loss: 0.31157901883125305, mean loss: 0.3608565430563116
Epoch: 14, step: 1408, loss: 0.4023316502571106, mean loss: 0.360858460980344
Epoch: 14, step: 1409, loss: 0.31224605441093445, mean loss: 0.3608562131117336
Epoch: 14, step: 1410, loss: 0.3789708912372589, mean loss: 0.36085705070724505
Epoch: 14, step: 1411, loss: 0.34746745228767395, mean loss: 0.3608564316209486
Epoch: 14, step: 1412, loss: 0.35239261388778687, mean loss: 0.36085604030291574
Epoch: 14, step: 1413, loss: 0.30637913942337036, mean loss: 0.3608535217222001
Epoch: 14, step: 1414, loss: 0.33541566133499146, mean loss: 0.36085234573124325
Epoch: 14, step: 1415, loss: 0.3418205678462982, mean loss: 0.36085146593381884
Epoch: 14, step: 1416, loss: 0.3254135251045227, mean loss: 0.36084982779112806
Epoch: 14, step: 1417, loss: 0.40488964319229126, mean loss: 0.36085186346716586
Epoch: 14, step: 1418, loss: 0.3255644738674164, mean loss: 0.3608502324345983
Epoch: 14, step: 1419, loss: 0.415955126285553, mean loss: 0.3608527793422453
Epoch: 14, step: 1420, loss: 0.3500864803791046, mean loss: 0.3608522817548273
Epoch: 14, step: 1421, loss: 0.31741803884506226, mean loss: 0.3608502744416325
Epoch: 14, step: 1422, loss: 0.30878138542175293, mean loss: 0.36084786818954045
Epoch: 14, step: 1423, loss: 0.3295598328113556, mean loss: 0.3608464223468705
Epoch: 14, step: 1424, loss: 0.38063541054725647, mean loss: 0.3608473367680248
Epoch: 14, step: 1425, loss: 0.3120136857032776, mean loss: 0.360845080338348
Epoch: 14, step: 1426, loss: 0.3284343183040619, mean loss: 0.36084358282127393
Epoch: 14, step: 1427, loss: 0.2962574064731598, mean loss: 0.3608405987990808
Epoch: 14, step: 1428, loss: 0.33461546897888184, mean loss: 0.36083938719687153
Epoch: 14, step: 1429, loss: 0.33795231580734253, mean loss: 0.36083832986196485
Epoch: 14, step: 1430, loss: 0.2744397222995758, mean loss: 0.3608343386110958
Epoch: 14, step: 1431, loss: 0.30197766423225403, mean loss: 0.36083161980684697
Epoch: 14, step: 1432, loss: 0.31293436884880066, mean loss: 0.36082940736050034
Epoch: 14, step: 1433, loss: 0.30722230672836304, mean loss: 0.3608269312819492
Epoch: 14, step: 1434, loss: 0.31786665320396423, mean loss: 0.3608249470651427
Epoch: 14, step: 1435, loss: 0.3123049736022949, mean loss: 0.36082270616483497
Epoch: 14, step: 1436, loss: 0.3709099590778351, mean loss: 0.3608231720242038
Epoch: 14, step: 1437, loss: 0.3413938879966736, mean loss: 0.36082227476346546
Epoch: 14, step: 1438, loss: 0.35961201786994934, mean loss: 0.36082221887536137
Epoch: 14, step: 1439, loss: 0.28993988037109375, mean loss: 0.3608189457714408
Epoch: 14, step: 1440, loss: 0.3374994695186615, mean loss: 0.36081786900751905
Epoch: 14, step: 1441, loss: 0.3121969401836395, mean loss: 0.36081562406667395
Epoch: 14, step: 1442, loss: 0.3214244246482849, mean loss: 0.3608138053677766
Epoch: 14, step: 1443, loss: 0.35433220863342285, mean loss: 0.3608135061250834
Valid: 14, mean loss: 0.19203306237856546
Epoch: 15, step: 0, loss: 0.3148835599422455, mean loss: 0.36081138572684773
Epoch: 15, step: 1, loss: 0.30408135056495667, mean loss: 0.3608087668534675
Epoch: 15, step: 2, loss: 0.33588141202926636, mean loss: 0.3608076161654361
Epoch: 15, step: 3, loss: 0.36064085364341736, mean loss: 0.3608076084677569
Epoch: 15, step: 4, loss: 0.3604103922843933, mean loss: 0.36080759013329194
Epoch: 15, step: 5, loss: 0.3390301764011383, mean loss: 0.36080658499096147
Epoch: 15, step: 6, loss: 0.32338228821754456, mean loss: 0.3608048577422988
Epoch: 15, step: 7, loss: 0.31908515095710754, mean loss: 0.3608029323358568
Epoch: 15, step: 8, loss: 0.30649685859680176, mean loss: 0.36080042617157887
Epoch: 15, step: 9, loss: 0.31750744581222534, mean loss: 0.3607984283413823
Epoch: 15, step: 10, loss: 0.3295917510986328, mean loss: 0.36079698832120594
Epoch: 15, step: 11, loss: 0.3398083448410034, mean loss: 0.36079601985297594
Epoch: 15, step: 12, loss: 0.37481099367141724, mean loss: 0.3607966665088989
Epoch: 15, step: 13, loss: 0.33648696541786194, mean loss: 0.3607955449023154
Epoch: 15, step: 14, loss: 0.33395934104919434, mean loss: 0.3607943067844906
Epoch: 15, step: 15, loss: 0.3072696924209595, mean loss: 0.3607918374813736
Epoch: 15, step: 16, loss: 0.3022299110889435, mean loss: 0.36078913591167333
Epoch: 15, step: 17, loss: 0.30970337986946106, mean loss: 0.36078677934021647
Epoch: 15, step: 18, loss: 0.3429209291934967, mean loss: 0.3607859552316254
Epoch: 15, step: 19, loss: 0.37650880217552185, mean loss: 0.3607866804551929
Epoch: 15, step: 20, loss: 0.3801432251930237, mean loss: 0.360787573243567
Epoch: 15, step: 21, loss: 0.32108113169670105, mean loss: 0.3607857419345758
Epoch: 15, step: 22, loss: 0.36417803168296814, mean loss: 0.3607858983838563
Epoch: 15, step: 23, loss: 0.366426944732666, mean loss: 0.3607861585317233
Epoch: 15, step: 24, loss: 0.3081699311733246, mean loss: 0.3607837321435583
Epoch: 15, step: 25, loss: 0.37650880217552185, mean loss: 0.36078445726898634
Epoch: 15, step: 26, loss: 0.31168702244758606, mean loss: 0.36078219335812634
Epoch: 15, step: 27, loss: 0.3042241632938385, mean loss: 0.36077958555519085
Epoch: 15, step: 28, loss: 0.3458099961280823, mean loss: 0.36077889536249286
Epoch: 15, step: 29, loss: 0.35012418031692505, mean loss: 0.3607784041354276
Epoch: 15, step: 30, loss: 0.3372374176979065, mean loss: 0.3607773188472234
Epoch: 15, step: 31, loss: 0.32027119398117065, mean loss: 0.3607754515171079
Epoch: 15, step: 32, loss: 0.3077462613582611, mean loss: 0.3607730069870678
Epoch: 15, step: 33, loss: 0.3366394340991974, mean loss: 0.36077189453326086
Epoch: 15, step: 34, loss: 0.38372960686683655, mean loss: 0.36077295273618015
Epoch: 15, step: 35, loss: 0.37673473358154297, mean loss: 0.3607736884377309
Epoch: 15, step: 36, loss: 0.3543224632740021, mean loss: 0.3607733911051428
Epoch: 15, step: 37, loss: 0.32874301075935364, mean loss: 0.36077191491469457
Epoch: 15, step: 38, loss: 0.30684882402420044, mean loss: 0.36076942986511207
Epoch: 15, step: 39, loss: 0.3296743929386139, mean loss: 0.3607679969141016
Epoch: 15, step: 40, loss: 0.3694722354412079, mean loss: 0.36076839801260063
Epoch: 15, step: 41, loss: 0.330147385597229, mean loss: 0.3607669870360816
Epoch: 15, step: 42, loss: 0.32080331444740295, mean loss: 0.3607651456467535
Epoch: 15, step: 43, loss: 0.35316693782806396, mean loss: 0.36076479556345925
Epoch: 15, step: 44, loss: 0.356405645608902, mean loss: 0.3607645947272485
Epoch: 15, step: 45, loss: 0.35005730390548706, mean loss: 0.36076410144010107
Epoch: 15, step: 46, loss: 0.35116690397262573, mean loss: 0.3607636593155575
Epoch: 15, step: 47, loss: 0.3075529932975769, mean loss: 0.36076120811480117
Epoch: 15, step: 48, loss: 0.34375670552253723, mean loss: 0.36076042482203813
Epoch: 15, step: 49, loss: 0.3240886628627777, mean loss: 0.36075873565750755
Epoch: 15, step: 50, loss: 0.3369174599647522, mean loss: 0.36075763753785883
Epoch: 15, step: 51, loss: 0.3490677773952484, mean loss: 0.3607570991323622
Epoch: 15, step: 52, loss: 0.3630875051021576, mean loss: 0.36075720646004467
Epoch: 15, step: 53, loss: 0.3548037111759186, mean loss: 0.36075693228231215
Epoch: 15, step: 54, loss: 0.3217897415161133, mean loss: 0.3607551377996612
Epoch: 15, step: 55, loss: 0.31803566217422485, mean loss: 0.36075317061069334
Epoch: 15, step: 56, loss: 0.33066388964653015, mean loss: 0.3607517850933123
Epoch: 15, step: 57, loss: 0.35090044140815735, mean loss: 0.36075133149060096
Epoch: 15, step: 58, loss: 0.329622745513916, mean loss: 0.3607498982484638
Epoch: 15, step: 59, loss: 0.3095785677433014, mean loss: 0.3607475422940207
Epoch: 15, step: 60, loss: 0.35401585698127747, mean loss: 0.36074723237802636
Epoch: 15, step: 61, loss: 0.3526197075843811, mean loss: 0.360746858217047
Epoch: 15, step: 62, loss: 0.32130661606788635, mean loss: 0.3607450426187342
Epoch: 15, step: 63, loss: 0.3361748158931732, mean loss: 0.3607439116011166
Epoch: 15, step: 64, loss: 0.32431864738464355, mean loss: 0.3607422349491388
Epoch: 15, step: 65, loss: 0.32357174158096313, mean loss: 0.3607405240730747
Epoch: 15, step: 66, loss: 0.32169008255004883, mean loss: 0.3607387267498583
Epoch: 15, step: 67, loss: 0.370064914226532, mean loss: 0.3607391559742451
Epoch: 15, step: 68, loss: 0.33293718099594116, mean loss: 0.3607378764871551
Epoch: 15, step: 69, loss: 0.33456990122795105, mean loss: 0.3607366722545155
Epoch: 15, step: 70, loss: 0.30349189043045044, mean loss: 0.3607340380093439
Epoch: 15, step: 71, loss: 0.34278520941734314, mean loss: 0.3607332120923279
Epoch: 15, step: 72, loss: 0.3077526390552521, mean loss: 0.3607307742985103
Epoch: 15, step: 73, loss: 0.3563489317893982, mean loss: 0.36073057268617437
Epoch: 15, step: 74, loss: 0.33720389008522034, mean loss: 0.36072949025311246
Epoch: 15, step: 75, loss: 0.36065977811813354, mean loss: 0.3607294870458924
Epoch: 15, step: 76, loss: 0.31517085433006287, mean loss: 0.36072739114338903
Epoch: 15, step: 77, loss: 0.3484324514865875, mean loss: 0.3607268255467538
Epoch: 15, step: 78, loss: 0.3238868713378906, mean loss: 0.3607251308986923
Epoch: 15, step: 79, loss: 0.33714529871940613, mean loss: 0.3607240462697972
Epoch: 15, step: 80, loss: 0.28833192586898804, mean loss: 0.36072071651861737
Epoch: 15, step: 81, loss: 0.30992934107780457, mean loss: 0.3607183804237116
Epoch: 15, step: 82, loss: 0.32136961817741394, mean loss: 0.3607165707027786
Epoch: 15, step: 83, loss: 0.38701698184013367, mean loss: 0.3607177802507522
Epoch: 15, step: 84, loss: 0.3200666010379791, mean loss: 0.36071591080125975
Epoch: 15, step: 85, loss: 0.4008696675300598, mean loss: 0.36071775729057864
Epoch: 15, step: 86, loss: 0.35410141944885254, mean loss: 0.3607174530491733
Epoch: 15, step: 87, loss: 0.30352848768234253, mean loss: 0.36071482342965117
Epoch: 15, step: 88, loss: 0.3090055286884308, mean loss: 0.3607124458814999
Epoch: 15, step: 89, loss: 0.3382066786289215, mean loss: 0.36071141113358024
Epoch: 15, step: 90, loss: 0.34714850783348083, mean loss: 0.3607107875804884
Epoch: 15, step: 91, loss: 0.31050875782966614, mean loss: 0.3607084796534127
Epoch: 15, step: 92, loss: 0.33881592750549316, mean loss: 0.36070747323810687
Epoch: 15, step: 93, loss: 0.3387296795845032, mean loss: 0.3607064629506354
Epoch: 15, step: 94, loss: 0.2996964454650879, mean loss: 0.360703658537053
Epoch: 15, step: 95, loss: 0.32291388511657715, mean loss: 0.36070192155537345
Epoch: 15, step: 96, loss: 0.3761303126811981, mean loss: 0.36070263067846603
Epoch: 15, step: 97, loss: 0.36273032426834106, mean loss: 0.3607027238714796
Epoch: 15, step: 98, loss: 0.3291114866733551, mean loss: 0.3607012720015776
Epoch: 15, step: 99, loss: 0.35877346992492676, mean loss: 0.36070118340773216
Epoch: 15, step: 100, loss: 0.3197110593318939, mean loss: 0.36069929975697734
Epoch: 15, step: 101, loss: 0.30726736783981323, mean loss: 0.3606968444710699
Epoch: 15, step: 102, loss: 0.3125017583370209, mean loss: 0.3606946299286753
Epoch: 15, step: 103, loss: 0.31887945532798767, mean loss: 0.3606927086286109
Epoch: 15, step: 104, loss: 0.34031492471694946, mean loss: 0.360691772364705
Epoch: 15, step: 105, loss: 0.34947332739830017, mean loss: 0.3606912569532851
Epoch: 15, step: 106, loss: 0.35936328768730164, mean loss: 0.36069119594491156
Epoch: 15, step: 107, loss: 0.34319913387298584, mean loss: 0.3606903923771942
Epoch: 15, step: 108, loss: 0.3088062107563019, mean loss: 0.3606880089796279
Epoch: 15, step: 109, loss: 0.32037779688835144, mean loss: 0.36068615733920106
Epoch: 15, step: 110, loss: 0.3626248240470886, mean loss: 0.36068624638732505
Epoch: 15, step: 111, loss: 0.34996095299720764, mean loss: 0.3606857537686685
Epoch: 15, step: 112, loss: 0.3511815071105957, mean loss: 0.360685317253413
Epoch: 15, step: 113, loss: 0.29324182868003845, mean loss: 0.3606822198212199
Epoch: 15, step: 114, loss: 0.35808736085891724, mean loss: 0.360682100654333
Epoch: 15, step: 115, loss: 0.3398257791996002, mean loss: 0.3606811428879179
Epoch: 15, step: 116, loss: 0.35014569759368896, mean loss: 0.3606806591001926
Epoch: 15, step: 117, loss: 0.32997316122055054, mean loss: 0.36067924907641263
Epoch: 15, step: 118, loss: 0.3192456066608429, mean loss: 0.3606773466179703
Epoch: 15, step: 119, loss: 0.32614240050315857, mean loss: 0.3606757609914269
Epoch: 15, step: 120, loss: 0.3226337432861328, mean loss: 0.3606740144225042
Epoch: 15, step: 121, loss: 0.3455163836479187, mean loss: 0.36067331854376145
Epoch: 15, step: 122, loss: 0.3284631371498108, mean loss: 0.3606718398594024
Epoch: 15, step: 123, loss: 0.29571855068206787, mean loss: 0.36066885816232297
Epoch: 15, step: 124, loss: 0.3244110345840454, mean loss: 0.36066719381421286
Epoch: 15, step: 125, loss: 0.3196509778499603, mean loss: 0.3606653111273514
Epoch: 15, step: 126, loss: 0.3465731739997864, mean loss: 0.360664664313328
Epoch: 15, step: 127, loss: 0.30199724435806274, mean loss: 0.3606619716650833
Epoch: 15, step: 128, loss: 0.3266161382198334, mean loss: 0.36066040914117464
Epoch: 15, step: 129, loss: 0.34063106775283813, mean loss: 0.36065948994239594
Epoch: 15, step: 130, loss: 0.33306172490119934, mean loss: 0.3606582234670143
Epoch: 15, step: 131, loss: 0.3383947014808655, mean loss: 0.3606572018296251
Epoch: 15, step: 132, loss: 0.37473785877227783, mean loss: 0.3606578479387859
Epoch: 15, step: 133, loss: 0.33041056990623474, mean loss: 0.3606564600669848
Epoch: 15, step: 134, loss: 0.3539138734340668, mean loss: 0.360656150703065
Epoch: 15, step: 135, loss: 0.3740687072277069, mean loss: 0.360656766070863
Epoch: 15, step: 136, loss: 0.31898272037506104, mean loss: 0.36065485415428294
Epoch: 15, step: 137, loss: 0.31003671884536743, mean loss: 0.3606525320084297
Epoch: 15, step: 138, loss: 0.3069919943809509, mean loss: 0.3606500704029603
Epoch: 15, step: 139, loss: 0.3125537037849426, mean loss: 0.36064786414761085
Epoch: 15, step: 140, loss: 0.3111700415611267, mean loss: 0.36064559462682805
Epoch: 15, step: 141, loss: 0.30732184648513794, mean loss: 0.36064314880772236
Epoch: 15, step: 142, loss: 0.309498131275177, mean loss: 0.3606408030288143
Epoch: 15, step: 143, loss: 0.34072446823120117, mean loss: 0.360639889603076
Epoch: 15, step: 144, loss: 0.31488344073295593, mean loss: 0.3606377911646963
Epoch: 15, step: 145, loss: 0.3387831151485443, mean loss: 0.36063678893246587
Epoch: 15, step: 146, loss: 0.32668328285217285, mean loss: 0.3606352319321412
Epoch: 15, step: 147, loss: 0.31544217467308044, mean loss: 0.3606331596166029
Epoch: 15, step: 148, loss: 0.3235498368740082, mean loss: 0.3606314592487391
Epoch: 15, step: 149, loss: 0.3380464017391205, mean loss: 0.3606304237119436
Epoch: 15, step: 150, loss: 0.339088499546051, mean loss: 0.36062943604864683
Epoch: 15, step: 151, loss: 0.35891249775886536, mean loss: 0.36062935733333923
Epoch: 15, step: 152, loss: 0.37461769580841064, mean loss: 0.3606299986178244
Epoch: 15, step: 153, loss: 0.31422388553619385, mean loss: 0.36062787126323187
Epoch: 15, step: 154, loss: 0.3072497248649597, mean loss: 0.36062542440802225
Epoch: 15, step: 155, loss: 0.30565792322158813, mean loss: 0.3606229048122583
Epoch: 15, step: 156, loss: 0.34050309658050537, mean loss: 0.36062198260442807
Epoch: 15, step: 157, loss: 0.32620537281036377, mean loss: 0.3606204051633338
Epoch: 15, step: 158, loss: 0.3355248272418976, mean loss: 0.36061925499247716
Epoch: 15, step: 159, loss: 0.35003548860549927, mean loss: 0.36061876994360514
Epoch: 15, step: 160, loss: 0.334541916847229, mean loss: 0.36061757490886354
Epoch: 15, step: 161, loss: 0.3354906141757965, mean loss: 0.3606164234580005
Epoch: 15, step: 162, loss: 0.3653777539730072, mean loss: 0.3606166416374678
Epoch: 15, step: 163, loss: 0.32952311635017395, mean loss: 0.3606152168974895
Epoch: 15, step: 164, loss: 0.3143908381462097, mean loss: 0.3606130989419912
Epoch: 15, step: 165, loss: 0.3372545838356018, mean loss: 0.36061202872687587
Epoch: 15, step: 166, loss: 0.2939984202384949, mean loss: 0.3606089768366258
Epoch: 15, step: 167, loss: 0.3737126290798187, mean loss: 0.3606095771505457
Epoch: 15, step: 168, loss: 0.33690693974494934, mean loss: 0.36060849131805656
Epoch: 15, step: 169, loss: 0.3309912085533142, mean loss: 0.3606071345941553
Epoch: 15, step: 170, loss: 0.3692361116409302, mean loss: 0.36060752985671984
Epoch: 15, step: 171, loss: 0.3526248633861542, mean loss: 0.360607164216079
Epoch: 15, step: 172, loss: 0.32437658309936523, mean loss: 0.360605504774815
Epoch: 15, step: 173, loss: 0.3381580114364624, mean loss: 0.36060447667674145
Epoch: 15, step: 174, loss: 0.3079237937927246, mean loss: 0.3606020640052102
Epoch: 15, step: 175, loss: 0.34731873869895935, mean loss: 0.3606014556829302
Epoch: 15, step: 176, loss: 0.2995555102825165, mean loss: 0.36059866015490893
Epoch: 15, step: 177, loss: 0.34113600850105286, mean loss: 0.36059776892624085
Epoch: 15, step: 178, loss: 0.3239496946334839, mean loss: 0.36059609082402494
Epoch: 15, step: 179, loss: 0.348757803440094, mean loss: 0.3605955487778993
Epoch: 15, step: 180, loss: 0.3387443423271179, mean loss: 0.36059454831059234
Epoch: 15, step: 181, loss: 0.3259211480617523, mean loss: 0.36059296084606307
Epoch: 15, step: 182, loss: 0.31678029894828796, mean loss: 0.36059095504732214
Epoch: 15, step: 183, loss: 0.32007455825805664, mean loss: 0.36058910024065716
Epoch: 15, step: 184, loss: 0.3552037477493286, mean loss: 0.3605888537150224
Epoch: 15, step: 185, loss: 0.33793914318084717, mean loss: 0.36058781692519665
Epoch: 15, step: 186, loss: 0.382399320602417, mean loss: 0.3605888153004279
Epoch: 15, step: 187, loss: 0.3914172053337097, mean loss: 0.36059022633988386
Epoch: 15, step: 188, loss: 0.31635206937789917, mean loss: 0.36058820161760996
Epoch: 15, step: 189, loss: 0.40534743666648865, mean loss: 0.3605902500951866
Epoch: 15, step: 190, loss: 0.3359082043170929, mean loss: 0.36058912053380365
Epoch: 15, step: 191, loss: 0.33386537432670593, mean loss: 0.3605878975909972
Epoch: 15, step: 192, loss: 0.33446887135505676, mean loss: 0.3605867023763248
Epoch: 15, step: 193, loss: 0.35174787044525146, mean loss: 0.3605862979271653
Epoch: 15, step: 194, loss: 0.34566906094551086, mean loss: 0.3605856153722817
Epoch: 15, step: 195, loss: 0.33455607295036316, mean loss: 0.3605844244159117
Epoch: 15, step: 196, loss: 0.3229210376739502, mean loss: 0.3605827012431642
Epoch: 15, step: 197, loss: 0.33366450667381287, mean loss: 0.36058146974007294
Epoch: 15, step: 198, loss: 0.339970201253891, mean loss: 0.36058052682097846
Epoch: 15, step: 199, loss: 0.31585052609443665, mean loss: 0.36057848061783454
Epoch: 15, step: 200, loss: 0.3256206214427948, mean loss: 0.36057688152085016
Epoch: 15, step: 201, loss: 0.3112107813358307, mean loss: 0.36057462344289826
Epoch: 15, step: 202, loss: 0.32357484102249146, mean loss: 0.3605729310959001
Epoch: 15, step: 203, loss: 0.3641569912433624, mean loss: 0.36057309502108065
Epoch: 15, step: 204, loss: 0.28732120990753174, mean loss: 0.3605697448319604
Epoch: 15, step: 205, loss: 0.3663194179534912, mean loss: 0.36057000778234555
Epoch: 15, step: 206, loss: 0.3276244103908539, mean loss: 0.36056850114689526
Epoch: 15, step: 207, loss: 0.34785687923431396, mean loss: 0.3605679198581669
Epoch: 15, step: 208, loss: 0.34015730023384094, mean loss: 0.36056698654527536
Epoch: 15, step: 209, loss: 0.3607969582080841, mean loss: 0.3605669970606692
Epoch: 15, step: 210, loss: 0.3780823051929474, mean loss: 0.36056779790690996
Epoch: 15, step: 211, loss: 0.32279473543167114, mean loss: 0.36056607090149323
Epoch: 15, step: 212, loss: 0.32290181517601013, mean loss: 0.36056434894951017
Epoch: 15, step: 213, loss: 0.34203076362609863, mean loss: 0.3605635016611622
Epoch: 15, step: 214, loss: 0.3528865575790405, mean loss: 0.360563150715147
Epoch: 15, step: 215, loss: 0.3444382846355438, mean loss: 0.36056241361210806
Epoch: 15, step: 216, loss: 0.35981297492980957, mean loss: 0.3605623793551861
Epoch: 15, step: 217, loss: 0.3256230056285858, mean loss: 0.36056078234569133
Epoch: 15, step: 218, loss: 0.3507601320743561, mean loss: 0.3605603343978751
Epoch: 15, step: 219, loss: 0.36180976033210754, mean loss: 0.360560391501437
Epoch: 15, step: 220, loss: 0.32868269085884094, mean loss: 0.3605589346347196
Epoch: 15, step: 221, loss: 0.30730560421943665, mean loss: 0.3605565009755287
Epoch: 15, step: 222, loss: 0.3486882746219635, mean loss: 0.3605559586263831
Epoch: 15, step: 223, loss: 0.33915892243385315, mean loss: 0.36055498087843063
Epoch: 15, step: 224, loss: 0.3288958966732025, mean loss: 0.36055353426731773
Epoch: 15, step: 225, loss: 0.3279857933521271, mean loss: 0.3605520462045874
Epoch: 15, step: 226, loss: 0.37548384070396423, mean loss: 0.36055272842665986
Epoch: 15, step: 227, loss: 0.326249897480011, mean loss: 0.3605511612286086
Epoch: 15, step: 228, loss: 0.3356601893901825, mean loss: 0.3605500240833832
Epoch: 15, step: 229, loss: 0.361263245344162, mean loss: 0.3605500566654417
Epoch: 15, step: 230, loss: 0.34721001982688904, mean loss: 0.3605494472809075
Epoch: 15, step: 231, loss: 0.3771897852420807, mean loss: 0.360550207391357
Epoch: 15, step: 232, loss: 0.3504965603351593, mean loss: 0.36054974817393337
Epoch: 15, step: 233, loss: 0.3715384304523468, mean loss: 0.3605502500777554
Epoch: 15, step: 234, loss: 0.3258328139781952, mean loss: 0.3605486644446839
Epoch: 15, step: 235, loss: 0.33352479338645935, mean loss: 0.3605474302525457
Epoch: 15, step: 236, loss: 0.3430599272251129, mean loss: 0.360546631627025
Epoch: 15, step: 237, loss: 0.3669801950454712, mean loss: 0.36054692542387484
Epoch: 15, step: 238, loss: 0.3562218248844147, mean loss: 0.3605467279216812
Epoch: 15, step: 239, loss: 0.3467450439929962, mean loss: 0.36054609770780316
Epoch: 15, step: 240, loss: 0.3518444001674652, mean loss: 0.36054570038815836
Epoch: 15, step: 241, loss: 0.3133496642112732, mean loss: 0.3605435455148054
Epoch: 15, step: 242, loss: 0.3362315595149994, mean loss: 0.360542435530511
Epoch: 15, step: 243, loss: 0.3276965618133545, mean loss: 0.36054093599281395
Epoch: 15, step: 244, loss: 0.3131050765514374, mean loss: 0.3605387704662473
Epoch: 15, step: 245, loss: 0.3453637361526489, mean loss: 0.36053807773209623
Epoch: 15, step: 246, loss: 0.35528287291526794, mean loss: 0.3605378378450822
Epoch: 15, step: 247, loss: 0.3154950439929962, mean loss: 0.3605357818475538
Epoch: 15, step: 248, loss: 0.35477402806282043, mean loss: 0.36053551886185
Epoch: 15, step: 249, loss: 0.3038482666015625, mean loss: 0.360532931584248
Epoch: 15, step: 250, loss: 0.34967660903930664, mean loss: 0.36053243611062535
Epoch: 15, step: 251, loss: 0.333997905254364, mean loss: 0.36053122515175096
Epoch: 15, step: 252, loss: 0.3246476650238037, mean loss: 0.3605295876050833
Epoch: 15, step: 253, loss: 0.33451759815216064, mean loss: 0.3605284006018227
Epoch: 15, step: 254, loss: 0.33218204975128174, mean loss: 0.3605271071338395
Epoch: 15, step: 255, loss: 0.385641872882843, mean loss: 0.36052825308956815
Epoch: 15, step: 256, loss: 0.32778459787368774, mean loss: 0.36052675910520826
Epoch: 15, step: 257, loss: 0.3233320713043213, mean loss: 0.360525062112426
Epoch: 15, step: 258, loss: 0.3439021408557892, mean loss: 0.3605243037328806
Epoch: 15, step: 259, loss: 0.34397006034851074, mean loss: 0.36052354852104734
Epoch: 15, step: 260, loss: 0.35900789499282837, mean loss: 0.36052347937942386
Epoch: 15, step: 261, loss: 0.33963435888290405, mean loss: 0.36052252649554023
Epoch: 15, step: 262, loss: 0.31834736466407776, mean loss: 0.3605206027094785
Epoch: 15, step: 263, loss: 0.3516046702861786, mean loss: 0.3605201960349472
Epoch: 15, step: 264, loss: 0.36639684438705444, mean loss: 0.3605204640690796
Epoch: 15, step: 265, loss: 0.34232696890830994, mean loss: 0.3605196343009887
Epoch: 15, step: 266, loss: 0.3066083490848541, mean loss: 0.360517175629706
Epoch: 15, step: 267, loss: 0.32985952496528625, mean loss: 0.3605157775245133
Epoch: 15, step: 268, loss: 0.37435582280158997, mean loss: 0.3605164086543084
Epoch: 15, step: 269, loss: 0.3128085732460022, mean loss: 0.36051423319441744
Epoch: 15, step: 270, loss: 0.32919225096702576, mean loss: 0.3605128049885797
Epoch: 15, step: 271, loss: 0.32436761260032654, mean loss: 0.36051115693129404
Epoch: 15, step: 272, loss: 0.3134204149246216, mean loss: 0.36050900990434803
Epoch: 15, step: 273, loss: 0.3714531362056732, mean loss: 0.36050950886150596
Epoch: 15, step: 274, loss: 0.30670827627182007, mean loss: 0.3605070561041506
Epoch: 15, step: 275, loss: 0.34148380160331726, mean loss: 0.3605061888879535
Epoch: 15, step: 276, loss: 0.321449339389801, mean loss: 0.36050440847816645
Epoch: 15, step: 277, loss: 0.3401007056236267, mean loss: 0.36050347841604347
Epoch: 15, step: 278, loss: 0.3183055520057678, mean loss: 0.36050155499535835
Epoch: 15, step: 279, loss: 0.3175090551376343, mean loss: 0.3604995954465955
Epoch: 15, step: 280, loss: 0.3538670539855957, mean loss: 0.3604992931567518
Epoch: 15, step: 281, loss: 0.35726404190063477, mean loss: 0.36049914571115627
Epoch: 15, step: 282, loss: 0.32050591707229614, mean loss: 0.36049732311494614
Epoch: 15, step: 283, loss: 0.32346829771995544, mean loss: 0.3604956356821447
Epoch: 15, step: 284, loss: 0.38165247440338135, mean loss: 0.3604965997668438
Epoch: 15, step: 285, loss: 0.3267507553100586, mean loss: 0.3604950620905266
Epoch: 15, step: 286, loss: 0.3043151795864105, mean loss: 0.36049250229271806
Epoch: 15, step: 287, loss: 0.3677468001842499, mean loss: 0.36049283281476524
Epoch: 15, step: 288, loss: 0.3162948191165924, mean loss: 0.3604908191460925
Epoch: 15, step: 289, loss: 0.3740435838699341, mean loss: 0.3604914365841209
Epoch: 15, step: 290, loss: 0.32462093234062195, mean loss: 0.3604898024670309
Epoch: 15, step: 291, loss: 0.3315621316432953, mean loss: 0.3604884846977696
Epoch: 15, step: 292, loss: 0.3140715956687927, mean loss: 0.3604863703221021
Epoch: 15, step: 293, loss: 0.38162317872047424, mean loss: 0.3604873330991996
Epoch: 15, step: 294, loss: 0.32113713026046753, mean loss: 0.360485540787524
Epoch: 15, step: 295, loss: 0.38084766268730164, mean loss: 0.360486468193331
Epoch: 15, step: 296, loss: 0.320867121219635, mean loss: 0.3604846637871292
Epoch: 15, step: 297, loss: 0.3456595242023468, mean loss: 0.3604839886282083
Epoch: 15, step: 298, loss: 0.3347693085670471, mean loss: 0.3604828175967378
Epoch: 15, step: 299, loss: 0.31489822268486023, mean loss: 0.36048074179551226
Epoch: 15, step: 300, loss: 0.32239845395088196, mean loss: 0.36047900770836483
Epoch: 15, step: 301, loss: 0.3398093581199646, mean loss: 0.36047806655320647
Epoch: 15, step: 302, loss: 0.31845518946647644, mean loss: 0.3604761532045252
Epoch: 15, step: 303, loss: 0.34576040506362915, mean loss: 0.36047548321052864
Epoch: 15, step: 304, loss: 0.35749709606170654, mean loss: 0.3604753476135722
Epoch: 15, step: 305, loss: 0.40453410148620605, mean loss: 0.36047735338402986
Epoch: 15, step: 306, loss: 0.33886364102363586, mean loss: 0.36047636946668293
Epoch: 15, step: 307, loss: 0.33684760332107544, mean loss: 0.36047529386735
Epoch: 15, step: 308, loss: 0.34784919023513794, mean loss: 0.36047471914371065
Epoch: 15, step: 309, loss: 0.3356596529483795, mean loss: 0.36047358964593207
Epoch: 15, step: 310, loss: 0.3410474956035614, mean loss: 0.3604727054761609
Epoch: 15, step: 311, loss: 0.33815327286720276, mean loss: 0.36047168966364457
Epoch: 15, step: 312, loss: 0.34447112679481506, mean loss: 0.36047096147164215
Epoch: 15, step: 313, loss: 0.3155291676521301, mean loss: 0.360468916245747
Epoch: 15, step: 314, loss: 0.29485321044921875, mean loss: 0.36046593032056856
Epoch: 15, step: 315, loss: 0.3721907436847687, mean loss: 0.3604664638486612
Epoch: 15, step: 316, loss: 0.32282504439353943, mean loss: 0.3604647510844325
Epoch: 15, step: 317, loss: 0.3166920840740204, mean loss: 0.36046275942609185
Epoch: 15, step: 318, loss: 0.3405313193798065, mean loss: 0.3604618525859241
Epoch: 15, step: 319, loss: 0.32921987771987915, mean loss: 0.36046043120399207
Epoch: 15, step: 320, loss: 0.34056907892227173, mean loss: 0.3604595262700818
Epoch: 15, step: 321, loss: 0.3398808538913727, mean loss: 0.3604585901099336
Epoch: 15, step: 322, loss: 0.34664663672447205, mean loss: 0.36045796180836487
Epoch: 15, step: 323, loss: 0.34435924887657166, mean loss: 0.36045722951611
Epoch: 15, step: 324, loss: 0.3700403869152069, mean loss: 0.3604576654113749
Epoch: 15, step: 325, loss: 0.3423600494861603, mean loss: 0.3604568422686511
Epoch: 15, step: 326, loss: 0.34894299507141113, mean loss: 0.36045631860252125
Epoch: 15, step: 327, loss: 0.35174235701560974, mean loss: 0.36045592229719164
Epoch: 15, step: 328, loss: 0.35119616985321045, mean loss: 0.3604555011887991
Epoch: 15, step: 329, loss: 0.30304673314094543, mean loss: 0.36045289051267143
Epoch: 15, step: 330, loss: 0.33261168003082275, mean loss: 0.36045162448518375
Epoch: 15, step: 331, loss: 0.33873090147972107, mean loss: 0.36045063682044176
Epoch: 15, step: 332, loss: 0.30715739727020264, mean loss: 0.3604482136294469
Epoch: 15, step: 333, loss: 0.30557724833488464, mean loss: 0.36044571881425663
Epoch: 15, step: 334, loss: 0.3942752182483673, mean loss: 0.3604472568683341
Epoch: 15, step: 335, loss: 0.35784095525741577, mean loss: 0.3604471383785355
Epoch: 15, step: 336, loss: 0.3189700245857239, mean loss: 0.36044525279805667
Epoch: 15, step: 337, loss: 0.35252073407173157, mean loss: 0.3604448925599111
Epoch: 15, step: 338, loss: 0.3113709092140198, mean loss: 0.3604426618229073
Epoch: 15, step: 339, loss: 0.3433273434638977, mean loss: 0.360441883853891
Epoch: 15, step: 340, loss: 0.37393826246261597, mean loss: 0.3604424972977621
Epoch: 15, step: 341, loss: 0.32916533946990967, mean loss: 0.36044107573800266
Epoch: 15, step: 342, loss: 0.38435330986976624, mean loss: 0.3604421625095398
Epoch: 15, step: 343, loss: 0.3661693334579468, mean loss: 0.3604424227881686
Epoch: 15, step: 344, loss: 0.351416677236557, mean loss: 0.3604420126202272
Epoch: 15, step: 345, loss: 0.34239357709884644, mean loss: 0.36044119246047435
Epoch: 15, step: 346, loss: 0.36260831356048584, mean loss: 0.3604412909346462
Epoch: 15, step: 347, loss: 0.3428764343261719, mean loss: 0.3604404928222958
Epoch: 15, step: 348, loss: 0.3202207684516907, mean loss: 0.36043866540058783
Epoch: 15, step: 349, loss: 0.34816816449165344, mean loss: 0.3604381079039541
Epoch: 15, step: 350, loss: 0.35101065039634705, mean loss: 0.3604376795973116
Epoch: 15, step: 351, loss: 0.31092774868011475, mean loss: 0.36043543037275605
Epoch: 15, step: 352, loss: 0.3757045269012451, mean loss: 0.36043612401272007
Epoch: 15, step: 353, loss: 0.3150465488433838, mean loss: 0.360434062162299
Epoch: 15, step: 354, loss: 0.33943185210227966, mean loss: 0.36043310816683866
Epoch: 15, step: 355, loss: 0.33223527669906616, mean loss: 0.36043182737870877
Epoch: 15, step: 356, loss: 0.33111271262168884, mean loss: 0.3604304957206828
Epoch: 15, step: 357, loss: 0.3627544343471527, mean loss: 0.36043060126789994
Epoch: 15, step: 358, loss: 0.325639009475708, mean loss: 0.3604290211965165
Epoch: 15, step: 359, loss: 0.3391265571117401, mean loss: 0.36042805378216203
Epoch: 15, step: 360, loss: 0.32953134179115295, mean loss: 0.36042665072544383
Epoch: 15, step: 361, loss: 0.3549141585826874, mean loss: 0.36042640040793666
Epoch: 15, step: 362, loss: 0.31575387716293335, mean loss: 0.36042437195934907
Epoch: 15, step: 363, loss: 0.318488746881485, mean loss: 0.36042246787175924
Epoch: 15, step: 364, loss: 0.33224502205848694, mean loss: 0.3604211885325623
Epoch: 15, step: 365, loss: 0.3484456539154053, mean loss: 0.36042064483263414
Epoch: 15, step: 366, loss: 0.35720160603523254, mean loss: 0.3604204986920432
Epoch: 15, step: 367, loss: 0.3415376543998718, mean loss: 0.3604196414719464
Epoch: 15, step: 368, loss: 0.30911198258399963, mean loss: 0.3604173123758055
Epoch: 15, step: 369, loss: 0.3525082767009735, mean loss: 0.3604169533637458
Epoch: 15, step: 370, loss: 0.32015445828437805, mean loss: 0.3604151258255006
Epoch: 15, step: 371, loss: 0.32151803374290466, mean loss: 0.3604133603438338
Epoch: 15, step: 372, loss: 0.35109037160873413, mean loss: 0.36041293720632483
Epoch: 15, step: 373, loss: 0.3327927589416504, mean loss: 0.36041168368094295
Epoch: 15, step: 374, loss: 0.3623666763305664, mean loss: 0.36041177240309635
Epoch: 15, step: 375, loss: 0.31641218066215515, mean loss: 0.3604097756890039
Epoch: 15, step: 376, loss: 0.3743972182273865, mean loss: 0.3604104104143539
Epoch: 15, step: 377, loss: 0.33438417315483093, mean loss: 0.36040922944342824
Epoch: 15, step: 378, loss: 0.32160502672195435, mean loss: 0.36040746873728363
Epoch: 15, step: 379, loss: 0.37157684564590454, mean loss: 0.36040797551482034
Epoch: 15, step: 380, loss: 0.3012276887893677, mean loss: 0.36040529050566805
Epoch: 15, step: 381, loss: 0.3496898412704468, mean loss: 0.360404804367875
Epoch: 15, step: 382, loss: 0.33366188406944275, mean loss: 0.3604035911518745
Epoch: 15, step: 383, loss: 0.32360929250717163, mean loss: 0.360401922022014
Epoch: 15, step: 384, loss: 0.3638680875301361, mean loss: 0.360402079253382
Epoch: 15, step: 385, loss: 0.3522126376628876, mean loss: 0.3604017077827483
Epoch: 15, step: 386, loss: 0.31343144178390503, mean loss: 0.36039957732209615
Epoch: 15, step: 387, loss: 0.3195536732673645, mean loss: 0.3603977247321082
Epoch: 15, step: 388, loss: 0.295808345079422, mean loss: 0.3603947953756905
Epoch: 15, step: 389, loss: 0.367068350315094, mean loss: 0.3603950980312433
Epoch: 15, step: 390, loss: 0.3452313244342804, mean loss: 0.3603944103629472
Epoch: 15, step: 391, loss: 0.3806283175945282, mean loss: 0.3603953279172385
Epoch: 15, step: 392, loss: 0.34000861644744873, mean loss: 0.36039440347559926
Epoch: 15, step: 393, loss: 0.3157859742641449, mean loss: 0.36039238078451324
Epoch: 15, step: 394, loss: 0.3013453185558319, mean loss: 0.36038970352029975
Epoch: 15, step: 395, loss: 0.29023832082748413, mean loss: 0.36038652291716716
Epoch: 15, step: 396, loss: 0.3368498980998993, mean loss: 0.3603854558352967
Epoch: 15, step: 397, loss: 0.32146385312080383, mean loss: 0.36038369132343184
Epoch: 15, step: 398, loss: 0.350730836391449, mean loss: 0.36038325373084235
Epoch: 15, step: 399, loss: 0.3454391062259674, mean loss: 0.3603825762989518
Epoch: 15, step: 400, loss: 0.3072725832462311, mean loss: 0.3603801688834651
Epoch: 15, step: 401, loss: 0.28913387656211853, mean loss: 0.36037693951657535
Epoch: 15, step: 402, loss: 0.2971075773239136, mean loss: 0.36037407184843445
Epoch: 15, step: 403, loss: 0.3434089422225952, mean loss: 0.3603733029429946
Epoch: 15, step: 404, loss: 0.30504968762397766, mean loss: 0.36037079564114466
Epoch: 15, step: 405, loss: 0.3137798607349396, mean loss: 0.3603686842056826
Epoch: 15, step: 406, loss: 0.34530380368232727, mean loss: 0.36036800151748194
Epoch: 15, step: 407, loss: 0.32995790243148804, mean loss: 0.3603666234995788
Epoch: 15, step: 408, loss: 0.4180377125740051, mean loss: 0.36036923671671933
Epoch: 15, step: 409, loss: 0.32552680373191833, mean loss: 0.3603676579929774
Epoch: 15, step: 410, loss: 0.3148227035999298, mean loss: 0.3603655944274664
Epoch: 15, step: 411, loss: 0.34052127599716187, mean loss: 0.36036469535540994
Epoch: 15, step: 412, loss: 0.31993722915649414, mean loss: 0.3603628638206752
Epoch: 15, step: 413, loss: 0.3670390248298645, mean loss: 0.3603631662652258
Epoch: 15, step: 414, loss: 0.3408227860927582, mean loss: 0.36036228108379104
Epoch: 15, step: 415, loss: 0.32832756638526917, mean loss: 0.3603608299733227
Epoch: 15, step: 416, loss: 0.34709692001342773, mean loss: 0.3603602291711322
Epoch: 15, step: 417, loss: 0.36172837018966675, mean loss: 0.36036029113965373
Epoch: 15, step: 418, loss: 0.36030319333076477, mean loss: 0.3603602885535851
Epoch: 15, step: 419, loss: 0.3459213674068451, mean loss: 0.360359634616939
Epoch: 15, step: 420, loss: 0.3394026756286621, mean loss: 0.360358685522288
Epoch: 15, step: 421, loss: 0.3139019012451172, mean loss: 0.36035658169182533
Epoch: 15, step: 422, loss: 0.35251015424728394, mean loss: 0.3603562263765401
Epoch: 15, step: 423, loss: 0.3598713278770447, mean loss: 0.36035620441953503
Epoch: 15, step: 424, loss: 0.3579839766025543, mean loss: 0.36035609700600474
Epoch: 15, step: 425, loss: 0.30516165494918823, mean loss: 0.3603535979368181
Epoch: 15, step: 426, loss: 0.33092108368873596, mean loss: 0.3603522653649773
Epoch: 15, step: 427, loss: 0.3565736711025238, mean loss: 0.3603520942949726
Epoch: 15, step: 428, loss: 0.334777295589447, mean loss: 0.36035093648797795
Epoch: 15, step: 429, loss: 0.3354305922985077, mean loss: 0.3603498083601287
Epoch: 15, step: 430, loss: 0.36554038524627686, mean loss: 0.3603500433235476
Epoch: 15, step: 431, loss: 0.31709352135658264, mean loss: 0.3603480853060767
Epoch: 15, step: 432, loss: 0.304318904876709, mean loss: 0.36034554924576667
Epoch: 15, step: 433, loss: 0.3021724820137024, mean loss: 0.3603429162654448
Epoch: 15, step: 434, loss: 0.3525923192501068, mean loss: 0.36034256548033433
Epoch: 15, step: 435, loss: 0.3425407111644745, mean loss: 0.3603417598207436
Epoch: 15, step: 436, loss: 0.34124496579170227, mean loss: 0.3603408955951008
Epoch: 15, step: 437, loss: 0.334815114736557, mean loss: 0.3603397404778568
Epoch: 15, step: 438, loss: 0.35651829838752747, mean loss: 0.36033956755410046
Epoch: 15, step: 439, loss: 0.3669355809688568, mean loss: 0.3603398660162459
Epoch: 15, step: 440, loss: 0.3634307384490967, mean loss: 0.36034000586839887
Epoch: 15, step: 441, loss: 0.33586129546165466, mean loss: 0.3603388983346731
Epoch: 15, step: 442, loss: 0.3291968107223511, mean loss: 0.3603374893816978
Epoch: 15, step: 443, loss: 0.3334437310695648, mean loss: 0.3603362726897727
Epoch: 15, step: 444, loss: 0.3535187542438507, mean loss: 0.36033596427455233
Epoch: 15, step: 445, loss: 0.3145400285720825, mean loss: 0.36033389262270654
Epoch: 15, step: 446, loss: 0.3591451346874237, mean loss: 0.36033383884978687
Epoch: 15, step: 447, loss: 0.3123955726623535, mean loss: 0.36033167048240006
Epoch: 15, step: 448, loss: 0.3620997965335846, mean loss: 0.3603317504555355
Epoch: 15, step: 449, loss: 0.36868757009506226, mean loss: 0.3603321283759172
Epoch: 15, step: 450, loss: 0.32809707522392273, mean loss: 0.36033067050186574
Epoch: 15, step: 451, loss: 0.33084866404533386, mean loss: 0.36032933719838994
Epoch: 15, step: 452, loss: 0.34490835666656494, mean loss: 0.36032863982668406
Epoch: 15, step: 453, loss: 0.40181463956832886, mean loss: 0.36033051583282233
Epoch: 15, step: 454, loss: 0.30898821353912354, mean loss: 0.3603281942274733
Epoch: 15, step: 455, loss: 0.3143519461154938, mean loss: 0.36032611535931847
Epoch: 15, step: 456, loss: 0.3328281044960022, mean loss: 0.36032487206181596
Epoch: 15, step: 457, loss: 0.3650883436203003, mean loss: 0.360325087428104
Epoch: 15, step: 458, loss: 0.3116161525249481, mean loss: 0.36032288529713496
Epoch: 15, step: 459, loss: 0.34822314977645874, mean loss: 0.3603223382928167
Epoch: 15, step: 460, loss: 0.3287194073200226, mean loss: 0.3603209096534707
Epoch: 15, step: 461, loss: 0.311352401971817, mean loss: 0.3603186960874422
Epoch: 15, step: 462, loss: 0.3078215420246124, mean loss: 0.3603163231202107
Epoch: 15, step: 463, loss: 0.31564807891845703, mean loss: 0.360314304125264
Epoch: 15, step: 464, loss: 0.3709907531738281, mean loss: 0.3603147866766334
Epoch: 15, step: 465, loss: 0.3484521806240082, mean loss: 0.36031425053788024
Epoch: 15, step: 466, loss: 0.30001071095466614, mean loss: 0.36031152520052845
Epoch: 15, step: 467, loss: 0.3381149172782898, mean loss: 0.36031052210002584
Epoch: 15, step: 468, loss: 0.2955683171749115, mean loss: 0.3603075964276084
Epoch: 15, step: 469, loss: 0.3109194040298462, mean loss: 0.3603053646972696
Epoch: 15, step: 470, loss: 0.3282563388347626, mean loss: 0.36030391654644667
Epoch: 15, step: 471, loss: 0.32818469405174255, mean loss: 0.3603024652893305
Epoch: 15, step: 472, loss: 0.3767518997192383, mean loss: 0.3603032084978621
Epoch: 15, step: 473, loss: 0.3896596431732178, mean loss: 0.36030453480285335
Epoch: 15, step: 474, loss: 0.33767369389533997, mean loss: 0.3603035124020895
Epoch: 15, step: 475, loss: 0.30886340141296387, mean loss: 0.3603011885806679
Epoch: 15, step: 476, loss: 0.32560110092163086, mean loss: 0.36029962106530183
Epoch: 15, step: 477, loss: 0.3826526999473572, mean loss: 0.36030063078067276
Epoch: 15, step: 478, loss: 0.331133633852005, mean loss: 0.3602993133319656
Epoch: 15, step: 479, loss: 0.3350829780101776, mean loss: 0.36029817438276407
Epoch: 15, step: 480, loss: 0.3660033643245697, mean loss: 0.36029843205811485
Epoch: 15, step: 481, loss: 0.34760943055152893, mean loss: 0.3602978589842504
Epoch: 15, step: 482, loss: 0.29987719655036926, mean loss: 0.36029513032677696
Epoch: 15, step: 483, loss: 0.326653391122818, mean loss: 0.36029361110083746
Epoch: 15, step: 484, loss: 0.34634289145469666, mean loss: 0.3602929811293023
Epoch: 15, step: 485, loss: 0.38057518005371094, mean loss: 0.3602938969695861
Epoch: 15, step: 486, loss: 0.34604814648628235, mean loss: 0.36029325373346005
Epoch: 15, step: 487, loss: 0.35394060611724854, mean loss: 0.3602929669063147
Epoch: 15, step: 488, loss: 0.32616785168647766, mean loss: 0.36029142619950083
Epoch: 15, step: 489, loss: 0.31892314553260803, mean loss: 0.3602895585570328
Epoch: 15, step: 490, loss: 0.37818244099617004, mean loss: 0.360290366325641
Epoch: 15, step: 491, loss: 0.3108905851840973, mean loss: 0.3602881362885725
Epoch: 15, step: 492, loss: 0.34211307764053345, mean loss: 0.3602873158552836
Epoch: 15, step: 493, loss: 0.35503095388412476, mean loss: 0.36028707859059234
Epoch: 15, step: 494, loss: 0.3053688108921051, mean loss: 0.36028459977011396
Epoch: 15, step: 495, loss: 0.33681830763816833, mean loss: 0.36028354063073265
Epoch: 15, step: 496, loss: 0.3594058156013489, mean loss: 0.36028350101683954
Epoch: 15, step: 497, loss: 0.34706059098243713, mean loss: 0.36028290426126436
Epoch: 15, step: 498, loss: 0.33025622367858887, mean loss: 0.3602815492055045
Epoch: 15, step: 499, loss: 0.29761552810668945, mean loss: 0.3602787213164657
Epoch: 15, step: 500, loss: 0.34468647837638855, mean loss: 0.36027801772714485
Epoch: 15, step: 501, loss: 0.31988826394081116, mean loss: 0.36027619524930954
Epoch: 15, step: 502, loss: 0.33772286772727966, mean loss: 0.36027517763763595
Epoch: 15, step: 503, loss: 0.32842573523521423, mean loss: 0.3602737406478145
Epoch: 15, step: 504, loss: 0.3501616418361664, mean loss: 0.3602732844286035
Epoch: 15, step: 505, loss: 0.40590614080429077, mean loss: 0.36027534311561854
Epoch: 15, step: 506, loss: 0.2797355651855469, mean loss: 0.36027170979681444
Epoch: 15, step: 507, loss: 0.3053242266178131, mean loss: 0.36026923111208065
Epoch: 15, step: 508, loss: 0.3293611705303192, mean loss: 0.36026783691024106
Epoch: 15, step: 509, loss: 0.3220854699611664, mean loss: 0.3602661146564319
Epoch: 15, step: 510, loss: 0.34462326765060425, mean loss: 0.36026540910201366
Epoch: 15, step: 511, loss: 0.3252260088920593, mean loss: 0.36026382875742546
Epoch: 15, step: 512, loss: 0.32084453105926514, mean loss: 0.36026205095118824
Epoch: 15, step: 513, loss: 0.39839237928390503, mean loss: 0.3602637705474872
Epoch: 15, step: 514, loss: 0.32467007637023926, mean loss: 0.36026216542035405
Epoch: 15, step: 515, loss: 0.3319370746612549, mean loss: 0.36026088813451534
Epoch: 15, step: 516, loss: 0.33106034994125366, mean loss: 0.3602595714308046
Epoch: 15, step: 517, loss: 0.3167569041252136, mean loss: 0.3602576099073442
Epoch: 15, step: 518, loss: 0.3508748412132263, mean loss: 0.3602571868599257
Epoch: 15, step: 519, loss: 0.34775644540786743, mean loss: 0.36025662325571234
Epoch: 15, step: 520, loss: 0.31269970536231995, mean loss: 0.3602544792172157
Epoch: 15, step: 521, loss: 0.33205661177635193, mean loss: 0.3602532080123
Epoch: 15, step: 522, loss: 0.30650001764297485, mean loss: 0.3602507848418375
Epoch: 15, step: 523, loss: 0.346823126077652, mean loss: 0.3602501795561016
Epoch: 15, step: 524, loss: 0.3271297514438629, mean loss: 0.36024868663619575
Epoch: 15, step: 525, loss: 0.34239640831947327, mean loss: 0.360247881972069
Epoch: 15, step: 526, loss: 0.31021127104759216, mean loss: 0.36024562675005045
Epoch: 15, step: 527, loss: 0.3552119731903076, mean loss: 0.36024539988627
Epoch: 15, step: 528, loss: 0.33482539653778076, mean loss: 0.36024425427342815
Epoch: 15, step: 529, loss: 0.3173842132091522, mean loss: 0.3602423227709016
Epoch: 15, step: 530, loss: 0.3333801329135895, mean loss: 0.36024111227160655
Epoch: 15, step: 531, loss: 0.3066052198410034, mean loss: 0.36023869536946024
Epoch: 15, step: 532, loss: 0.37422746419906616, mean loss: 0.36023932569293293
Epoch: 15, step: 533, loss: 0.3605484366416931, mean loss: 0.3602393396206138
Epoch: 15, step: 534, loss: 0.36716318130493164, mean loss: 0.3602396515756345
Epoch: 15, step: 535, loss: 0.34697145223617554, mean loss: 0.36023905380129045
Epoch: 15, step: 536, loss: 0.3111061453819275, mean loss: 0.36023684030809683
Epoch: 15, step: 537, loss: 0.38225868344306946, mean loss: 0.360237832372388
Epoch: 15, step: 538, loss: 0.3419678807258606, mean loss: 0.3602370093645207
Epoch: 15, step: 539, loss: 0.3370164930820465, mean loss: 0.36023596339531877
Epoch: 15, step: 540, loss: 0.3375351130962372, mean loss: 0.3602349408805537
Epoch: 15, step: 541, loss: 0.3239441215991974, mean loss: 0.3602333063062234
Epoch: 15, step: 542, loss: 0.3524235785007477, mean loss: 0.36023295456421534
Epoch: 15, step: 543, loss: 0.3161908984184265, mean loss: 0.3602309710452032
Epoch: 15, step: 544, loss: 0.39579489827156067, mean loss: 0.3602325726631823
Epoch: 15, step: 545, loss: 0.3220513164997101, mean loss: 0.3602308532514844
Epoch: 15, step: 546, loss: 0.3487319052219391, mean loss: 0.360230335444125
Epoch: 15, step: 547, loss: 0.3201110064983368, mean loss: 0.36022852891814583
Epoch: 15, step: 548, loss: 0.33817747235298157, mean loss: 0.3602275360298319
Epoch: 15, step: 549, loss: 0.35411837697029114, mean loss: 0.3602272609663893
Epoch: 15, step: 550, loss: 0.3503660261631012, mean loss: 0.36022681698661335
Epoch: 15, step: 551, loss: 0.3179289698600769, mean loss: 0.36022491270752427
Epoch: 15, step: 552, loss: 0.32291632890701294, mean loss: 0.36022323312422616
Epoch: 15, step: 553, loss: 0.3150007426738739, mean loss: 0.3602211973589227
Epoch: 15, step: 554, loss: 0.3305707573890686, mean loss: 0.3602198626553454
Epoch: 15, step: 555, loss: 0.3086727559566498, mean loss: 0.3602175423858685
Epoch: 15, step: 556, loss: 0.31942394375801086, mean loss: 0.36021570624243654
Epoch: 15, step: 557, loss: 0.3194088935852051, mean loss: 0.36021386958690244
Epoch: 15, step: 558, loss: 0.3788015842437744, mean loss: 0.36021470615536444
Epoch: 15, step: 559, loss: 0.3281909227371216, mean loss: 0.3602132649409892
Epoch: 15, step: 560, loss: 0.31169500946998596, mean loss: 0.36021108149940373
Epoch: 15, step: 561, loss: 0.38003623485565186, mean loss: 0.36021197364022617
Epoch: 15, step: 562, loss: 0.3762913942337036, mean loss: 0.3602126971888287
Epoch: 15, step: 563, loss: 0.3065444529056549, mean loss: 0.3602102823110262
Epoch: 15, step: 564, loss: 0.38340863585472107, mean loss: 0.3602113261064612
Epoch: 15, step: 565, loss: 0.34626442193984985, mean loss: 0.3602106986024494
Epoch: 15, step: 566, loss: 0.3133719265460968, mean loss: 0.3602085913107746
Epoch: 15, step: 567, loss: 0.31714701652526855, mean loss: 0.3602066540435987
Epoch: 15, step: 568, loss: 0.3655633330345154, mean loss: 0.3602068950206553
Epoch: 15, step: 569, loss: 0.3823392391204834, mean loss: 0.36020789062767733
Epoch: 15, step: 570, loss: 0.3383026719093323, mean loss: 0.3602069052820465
Epoch: 15, step: 571, loss: 0.31072312593460083, mean loss: 0.3602046794913238
Epoch: 15, step: 572, loss: 0.32724177837371826, mean loss: 0.36020319687984004
Epoch: 15, step: 573, loss: 0.37654051184654236, mean loss: 0.360203931669575
Epoch: 15, step: 574, loss: 0.3532956838607788, mean loss: 0.36020362097707176
Epoch: 15, step: 575, loss: 0.31435713171958923, mean loss: 0.36020155916337965
Epoch: 15, step: 576, loss: 0.3095814287662506, mean loss: 0.3601992827713125
Epoch: 15, step: 577, loss: 0.346689909696579, mean loss: 0.3601986752808424
Epoch: 15, step: 578, loss: 0.29990848898887634, mean loss: 0.360195964269273
Epoch: 15, step: 579, loss: 0.37145206332206726, mean loss: 0.3601964703888347
Epoch: 15, step: 580, loss: 0.33246102929115295, mean loss: 0.360195223347735
Epoch: 15, step: 581, loss: 0.3269748389720917, mean loss: 0.36019372975973146
Epoch: 15, step: 582, loss: 0.33775147795677185, mean loss: 0.360192720801776
Epoch: 15, step: 583, loss: 0.36868205666542053, mean loss: 0.36019310244787667
Epoch: 15, step: 584, loss: 0.3274202048778534, mean loss: 0.36019162917758807
Epoch: 15, step: 585, loss: 0.327714741230011, mean loss: 0.36019016927972114
Epoch: 15, step: 586, loss: 0.3111084997653961, mean loss: 0.36018796306452294
Epoch: 15, step: 587, loss: 0.30620211362838745, mean loss: 0.3601855365160945
Epoch: 15, step: 588, loss: 0.3600729703903198, mean loss: 0.3601855314567154
Epoch: 15, step: 589, loss: 0.33430910110473633, mean loss: 0.3601843684710816
Epoch: 15, step: 590, loss: 0.3451637327671051, mean loss: 0.3601836934166704
Epoch: 15, step: 591, loss: 0.38067781925201416, mean loss: 0.36018461441819094
Epoch: 15, step: 592, loss: 0.3454635739326477, mean loss: 0.360183952887589
Epoch: 15, step: 593, loss: 0.2935836911201477, mean loss: 0.36018096015541645
Epoch: 15, step: 594, loss: 0.36577174067497253, mean loss: 0.3601812113699983
Epoch: 15, step: 595, loss: 0.37650591135025024, mean loss: 0.3601819448665826
Epoch: 15, step: 596, loss: 0.33649736642837524, mean loss: 0.360180880725933
Epoch: 15, step: 597, loss: 0.3360827565193176, mean loss: 0.3601797980534464
Epoch: 15, step: 598, loss: 0.3342372179031372, mean loss: 0.360178632566221
Epoch: 15, step: 599, loss: 0.29687657952308655, mean loss: 0.36017578880822265
Epoch: 15, step: 600, loss: 0.31236064434051514, mean loss: 0.3601736408748653
Epoch: 15, step: 601, loss: 0.3440264165401459, mean loss: 0.36017291554810515
Epoch: 15, step: 602, loss: 0.3458213806152344, mean loss: 0.36017227091194054
Epoch: 15, step: 603, loss: 0.3008383512496948, mean loss: 0.3601696058957861
Epoch: 15, step: 604, loss: 0.33922961354255676, mean loss: 0.36016866540657194
Epoch: 15, step: 605, loss: 0.3470557928085327, mean loss: 0.3601680764874757
Epoch: 15, step: 606, loss: 0.34487974643707275, mean loss: 0.36016738989610503
Epoch: 15, step: 607, loss: 0.33880993723869324, mean loss: 0.36016643078650123
Epoch: 15, step: 608, loss: 0.3690407872200012, mean loss: 0.3601668292936831
Epoch: 15, step: 609, loss: 0.3671347498893738, mean loss: 0.3601671421774099
Epoch: 15, step: 610, loss: 0.3462979197502136, mean loss: 0.3601665194293327
Epoch: 15, step: 611, loss: 0.3540104925632477, mean loss: 0.36016624302726435
Epoch: 15, step: 612, loss: 0.3251112997531891, mean loss: 0.360164669151124
Epoch: 15, step: 613, loss: 0.358227014541626, mean loss: 0.36016458215935737
Epoch: 15, step: 614, loss: 0.3007030785083771, mean loss: 0.36016191273158404
Epoch: 15, step: 615, loss: 0.31873252987861633, mean loss: 0.3601600529101236
Epoch: 15, step: 616, loss: 0.3289448618888855, mean loss: 0.3601586516805585
Epoch: 15, step: 617, loss: 0.3460511267185211, mean loss: 0.3601580184313906
Epoch: 15, step: 618, loss: 0.39982083439826965, mean loss: 0.36015979870949855
Epoch: 15, step: 619, loss: 0.344234436750412, mean loss: 0.3601590839266458
Epoch: 15, step: 620, loss: 0.30501267313957214, mean loss: 0.36015660888464646
Epoch: 15, step: 621, loss: 0.36085087060928345, mean loss: 0.36015664004260917
Epoch: 15, step: 622, loss: 0.31465259194374084, mean loss: 0.3601545979455801
Epoch: 15, step: 623, loss: 0.3319873809814453, mean loss: 0.36015333393476673
Epoch: 15, step: 624, loss: 0.3043699562549591, mean loss: 0.3601508307542561
Epoch: 15, step: 625, loss: 0.3013344705104828, mean loss: 0.36014819159243955
Epoch: 15, step: 626, loss: 0.3116275370121002, mean loss: 0.36014601450918116
Epoch: 15, step: 627, loss: 0.3495539426803589, mean loss: 0.360145539272649
Epoch: 15, step: 628, loss: 0.32541757822036743, mean loss: 0.36014398119642066
Epoch: 15, step: 629, loss: 0.38159897923469543, mean loss: 0.3601449437355879
Epoch: 15, step: 630, loss: 0.34084072709083557, mean loss: 0.36014407772613816
Epoch: 15, step: 631, loss: 0.3509047031402588, mean loss: 0.3601436632557189
Epoch: 15, step: 632, loss: 0.32377180457115173, mean loss: 0.36014203171852405
Epoch: 15, step: 633, loss: 0.33006522059440613, mean loss: 0.36014068261961296
Epoch: 15, step: 634, loss: 0.3500230610370636, mean loss: 0.36014022881285884
Epoch: 15, step: 635, loss: 0.3347338140010834, mean loss: 0.3601390893073506
Epoch: 15, step: 636, loss: 0.34571412205696106, mean loss: 0.3601384423607995
Epoch: 15, step: 637, loss: 0.317752867937088, mean loss: 0.3601365414919133
Epoch: 15, step: 638, loss: 0.3581494987010956, mean loss: 0.3601364523828595
Epoch: 15, step: 639, loss: 0.32498493790626526, mean loss: 0.3601348760817619
Epoch: 15, step: 640, loss: 0.3514680564403534, mean loss: 0.36013448745256854
Epoch: 15, step: 641, loss: 0.3124465346336365, mean loss: 0.3601323491711221
Epoch: 15, step: 642, loss: 0.32557791471481323, mean loss: 0.3601307998533417
Epoch: 15, step: 643, loss: 0.29966306686401367, mean loss: 0.36012808878209934
Epoch: 15, step: 644, loss: 0.3593592643737793, mean loss: 0.3601280543133969
Epoch: 15, step: 645, loss: 0.3803829252719879, mean loss: 0.3601289623592571
Epoch: 15, step: 646, loss: 0.3418991267681122, mean loss: 0.36012814513436847
Epoch: 15, step: 647, loss: 0.325507253408432, mean loss: 0.36012659318476625
Epoch: 15, step: 648, loss: 0.3600779175758362, mean loss: 0.3601265910028841
Epoch: 15, step: 649, loss: 0.3091517686843872, mean loss: 0.36012430616100516
Epoch: 15, step: 650, loss: 0.35302573442459106, mean loss: 0.3601239879963448
Epoch: 15, step: 651, loss: 0.34846940636634827, mean loss: 0.3601234656504489
Epoch: 15, step: 652, loss: 0.3395025134086609, mean loss: 0.36012254148282274
Epoch: 15, step: 653, loss: 0.3342186510562897, mean loss: 0.36012138060219057
Epoch: 15, step: 654, loss: 0.3366432785987854, mean loss: 0.3601203284802097
Epoch: 15, step: 655, loss: 0.34406110644340515, mean loss: 0.36011960885204886
Epoch: 15, step: 656, loss: 0.32903555035591125, mean loss: 0.36011821600988836
Epoch: 15, step: 657, loss: 0.30381515622138977, mean loss: 0.3601156932453132
Epoch: 15, step: 658, loss: 0.3465326428413391, mean loss: 0.36011508465844083
Epoch: 15, step: 659, loss: 0.2881815731525421, mean loss: 0.3601118618308644
Epoch: 15, step: 660, loss: 0.30688706040382385, mean loss: 0.36010947731397774
Epoch: 15, step: 661, loss: 0.32794854044914246, mean loss: 0.36010803654088996
Epoch: 15, step: 662, loss: 0.3607134521007538, mean loss: 0.36010806366159775
Epoch: 15, step: 663, loss: 0.3818068504333496, mean loss: 0.36010903565527147
Epoch: 15, step: 664, loss: 0.3149811923503876, mean loss: 0.360107014251316
Epoch: 15, step: 665, loss: 0.35100340843200684, mean loss: 0.3601066064932842
Epoch: 15, step: 666, loss: 0.3557262122631073, mean loss: 0.36010641030059237
Epoch: 15, step: 667, loss: 0.35344836115837097, mean loss: 0.36010611210777876
Epoch: 15, step: 668, loss: 0.31880807876586914, mean loss: 0.3601042625832438
Epoch: 15, step: 669, loss: 0.3287495970726013, mean loss: 0.36010285843342243
Epoch: 15, step: 670, loss: 0.3459831178188324, mean loss: 0.36010222614017023
Epoch: 15, step: 671, loss: 0.3598997890949249, mean loss: 0.3601022170752837
Epoch: 15, step: 672, loss: 0.2994841933250427, mean loss: 0.36009950279490266
Epoch: 15, step: 673, loss: 0.3165202736854553, mean loss: 0.36009755154438283
Epoch: 15, step: 674, loss: 0.3126879334449768, mean loss: 0.3600954288840694
Epoch: 15, step: 675, loss: 0.3706198036670685, mean loss: 0.36009590006847053
Epoch: 15, step: 676, loss: 0.3171437382698059, mean loss: 0.36009397715304775
Epoch: 15, step: 677, loss: 0.3102530241012573, mean loss: 0.3600917459348075
Epoch: 15, step: 678, loss: 0.3302780091762543, mean loss: 0.3600904113300016
Epoch: 15, step: 679, loss: 0.36468759179115295, mean loss: 0.3600906171124752
Epoch: 15, step: 680, loss: 0.35237690806388855, mean loss: 0.3600902718410438
Epoch: 15, step: 681, loss: 0.3416939973831177, mean loss: 0.36008944844678825
Epoch: 15, step: 682, loss: 0.3211372196674347, mean loss: 0.3600877050717366
Epoch: 15, step: 683, loss: 0.31864532828330994, mean loss: 0.36008585032877255
Epoch: 15, step: 684, loss: 0.33960625529289246, mean loss: 0.36008493381075796
Epoch: 15, step: 685, loss: 0.3406559228897095, mean loss: 0.3600840643481731
Epoch: 15, step: 686, loss: 0.33633434772491455, mean loss: 0.3600830015783774
Epoch: 15, step: 687, loss: 0.3605833351612091, mean loss: 0.3600830239666709
Epoch: 15, step: 688, loss: 0.2997225821018219, mean loss: 0.36008032315491806
Epoch: 15, step: 689, loss: 0.36463719606399536, mean loss: 0.3600805270418491
Epoch: 15, step: 690, loss: 0.34234392642974854, mean loss: 0.36007973349343464
Epoch: 15, step: 691, loss: 0.36613214015960693, mean loss: 0.36008000427039716
Epoch: 15, step: 692, loss: 0.3463347554206848, mean loss: 0.3600793893529879
Epoch: 15, step: 693, loss: 0.34676891565322876, mean loss: 0.3600787939126327
Epoch: 15, step: 694, loss: 0.32701170444488525, mean loss: 0.36007731473171267
Epoch: 15, step: 695, loss: 0.35458365082740784, mean loss: 0.360077068996165
Epoch: 15, step: 696, loss: 0.3209637999534607, mean loss: 0.3600753195096935
Epoch: 15, step: 697, loss: 0.33246415853500366, mean loss: 0.36007408455303486
Epoch: 15, step: 698, loss: 0.30859115719795227, mean loss: 0.36007178199355744
Epoch: 15, step: 699, loss: 0.34128841757774353, mean loss: 0.36007094195042616
Epoch: 15, step: 700, loss: 0.31409040093421936, mean loss: 0.3600688856675669
Epoch: 15, step: 701, loss: 0.34454411268234253, mean loss: 0.3600681914196023
Epoch: 15, step: 702, loss: 0.3503846526145935, mean loss: 0.36006775840351296
Epoch: 15, step: 703, loss: 0.3278340995311737, mean loss: 0.3600663170844791
Epoch: 15, step: 704, loss: 0.38974615931510925, mean loss: 0.36006764415097725
Epoch: 15, step: 705, loss: 0.3352521061897278, mean loss: 0.36006653463036736
Epoch: 15, step: 706, loss: 0.3089495301246643, mean loss: 0.3600642492543891
Epoch: 15, step: 707, loss: 0.33061718940734863, mean loss: 0.36006293277281515
Epoch: 15, step: 708, loss: 0.3280392587184906, mean loss: 0.3600615011632638
Epoch: 15, step: 709, loss: 0.33128252625465393, mean loss: 0.36006021466460897
Epoch: 15, step: 710, loss: 0.31922709941864014, mean loss: 0.36005838939460555
Epoch: 15, step: 711, loss: 0.32413578033447266, mean loss: 0.3600567836995823
Epoch: 15, step: 712, loss: 0.3257174789905548, mean loss: 0.3600552488448597
Epoch: 15, step: 713, loss: 0.3156368136405945, mean loss: 0.3600532635746709
Epoch: 15, step: 714, loss: 0.3424779176712036, mean loss: 0.36005247808435115
Epoch: 15, step: 715, loss: 0.34726518392562866, mean loss: 0.36005190661071157
Epoch: 15, step: 716, loss: 0.2978578209877014, mean loss: 0.36004912723520893
Epoch: 15, step: 717, loss: 0.3904666006565094, mean loss: 0.360050486493115
Epoch: 15, step: 718, loss: 0.342294842004776, mean loss: 0.360049693086596
Epoch: 15, step: 719, loss: 0.30047255754470825, mean loss: 0.36004703101619645
Epoch: 15, step: 720, loss: 0.3393792510032654, mean loss: 0.36004610756416067
Epoch: 15, step: 721, loss: 0.37782740592956543, mean loss: 0.3600469020105178
Epoch: 15, step: 722, loss: 0.3353837728500366, mean loss: 0.36004580014172627
Epoch: 15, step: 723, loss: 0.3442050516605377, mean loss: 0.3600450924599678
Epoch: 15, step: 724, loss: 0.33632466197013855, mean loss: 0.36004403280258607
Epoch: 15, step: 725, loss: 0.3487577438354492, mean loss: 0.3600435286352955
Epoch: 15, step: 726, loss: 0.35255733132362366, mean loss: 0.36004319423598735
Epoch: 15, step: 727, loss: 0.3014971911907196, mean loss: 0.3600405791742112
Epoch: 15, step: 728, loss: 0.34712016582489014, mean loss: 0.3600400020866526
Epoch: 15, step: 729, loss: 0.3379417061805725, mean loss: 0.360039015114973
Epoch: 15, step: 730, loss: 0.32524001598358154, mean loss: 0.3600374609637903
Epoch: 15, step: 731, loss: 0.3203265368938446, mean loss: 0.3600356875213077
Epoch: 15, step: 732, loss: 0.368052214384079, mean loss: 0.3600360455138439
Epoch: 15, step: 733, loss: 0.33471915125846863, mean loss: 0.36003491499253215
Epoch: 15, step: 734, loss: 0.35367679595947266, mean loss: 0.36003463108456013
Epoch: 15, step: 735, loss: 0.3398311138153076, mean loss: 0.36003372898073494
Epoch: 15, step: 736, loss: 0.35596179962158203, mean loss: 0.36003354717382513
Epoch: 15, step: 737, loss: 0.32169607281684875, mean loss: 0.36003183552660856
Epoch: 15, step: 738, loss: 0.3259308636188507, mean loss: 0.3600303130938255
Epoch: 15, step: 739, loss: 0.34183424711227417, mean loss: 0.36002950076945134
Epoch: 15, step: 740, loss: 0.32004785537719727, mean loss: 0.360027715954247
Epoch: 15, step: 741, loss: 0.32790717482566833, mean loss: 0.3600262821295381
Epoch: 15, step: 742, loss: 0.3232173025608063, mean loss: 0.36002463909157134
Epoch: 15, step: 743, loss: 0.3802649676799774, mean loss: 0.36002554251634317
Epoch: 15, step: 744, loss: 0.37726983428001404, mean loss: 0.3600263121789972
Epoch: 15, step: 745, loss: 0.35727304220199585, mean loss: 0.3600261892980735
Epoch: 15, step: 746, loss: 0.37061792612075806, mean loss: 0.36002666199574934
Epoch: 15, step: 747, loss: 0.32770130038261414, mean loss: 0.36002521941445637
Epoch: 15, step: 748, loss: 0.3646165132522583, mean loss: 0.36002542430061096
Epoch: 15, step: 749, loss: 0.3420305848121643, mean loss: 0.36002462131803675
Epoch: 15, step: 750, loss: 0.3046998381614685, mean loss: 0.3600221526739264
Epoch: 15, step: 751, loss: 0.3260687589645386, mean loss: 0.3600206377090099
Epoch: 15, step: 752, loss: 0.3699726164340973, mean loss: 0.3600210817360801
Epoch: 15, step: 753, loss: 0.33250272274017334, mean loss: 0.36001985400524245
Epoch: 15, step: 754, loss: 0.3322734832763672, mean loss: 0.36001861615689407
Epoch: 15, step: 755, loss: 0.3355545401573181, mean loss: 0.3600175247901917
Epoch: 15, step: 756, loss: 0.3425207734107971, mean loss: 0.36001674427757274
Epoch: 15, step: 757, loss: 0.2973145544528961, mean loss: 0.36001394732022485
Epoch: 15, step: 758, loss: 0.3027087450027466, mean loss: 0.36001139122038467
Epoch: 15, step: 759, loss: 0.3555740714073181, mean loss: 0.36001119330246256
Epoch: 15, step: 760, loss: 0.3408155143260956, mean loss: 0.36001033715514635
Epoch: 15, step: 761, loss: 0.3126889765262604, mean loss: 0.36000822666720467
Epoch: 15, step: 762, loss: 0.3160986304283142, mean loss: 0.36000626842806455
Epoch: 15, step: 763, loss: 0.3540153503417969, mean loss: 0.36000600126261295
Epoch: 15, step: 764, loss: 0.3206842541694641, mean loss: 0.3600042477844817
Epoch: 15, step: 765, loss: 0.3383468985557556, mean loss: 0.3600032820594648
Epoch: 15, step: 766, loss: 0.3363446295261383, mean loss: 0.36000222714117286
Epoch: 15, step: 767, loss: 0.30520957708358765, mean loss: 0.35999978409453215
Epoch: 15, step: 768, loss: 0.36910879611968994, mean loss: 0.3600001902210659
Epoch: 15, step: 769, loss: 0.37741145491600037, mean loss: 0.36000096647004914
Epoch: 15, step: 770, loss: 0.33680951595306396, mean loss: 0.359999932568283
Epoch: 15, step: 771, loss: 0.33178791403770447, mean loss: 0.3599986748998392
Epoch: 15, step: 772, loss: 0.33583247661590576, mean loss: 0.359997597638738
Epoch: 15, step: 773, loss: 0.3075309991836548, mean loss: 0.35999525892970463
Epoch: 15, step: 774, loss: 0.3074060380458832, mean loss: 0.35999291485923957
Epoch: 15, step: 775, loss: 0.3426624536514282, mean loss: 0.3599921424193569
Epoch: 15, step: 776, loss: 0.3335605561733246, mean loss: 0.35999096438369055
Epoch: 15, step: 777, loss: 0.3257640302181244, mean loss: 0.359989438983291
Epoch: 15, step: 778, loss: 0.34690025448799133, mean loss: 0.3599888556603044
Epoch: 15, step: 779, loss: 0.385618656873703, mean loss: 0.3599899978083086
Epoch: 15, step: 780, loss: 0.3243817389011383, mean loss: 0.35998841105821244
Epoch: 15, step: 781, loss: 0.32207807898521423, mean loss: 0.35998672180003255
Epoch: 15, step: 782, loss: 0.34487012028694153, mean loss: 0.35998604824473635
Epoch: 15, step: 783, loss: 0.31525665521621704, mean loss: 0.3599840553115235
Epoch: 15, step: 784, loss: 0.33212175965309143, mean loss: 0.35998281395283965
Epoch: 15, step: 785, loss: 0.36393213272094727, mean loss: 0.35998298990039235
Epoch: 15, step: 786, loss: 0.33046379685401917, mean loss: 0.35998167483855575
Epoch: 15, step: 787, loss: 0.3127739429473877, mean loss: 0.35997957185691415
Epoch: 15, step: 788, loss: 0.3448674976825714, mean loss: 0.3599788986833129
Epoch: 15, step: 789, loss: 0.3655567169189453, mean loss: 0.3599791471384682
Epoch: 15, step: 790, loss: 0.36571940779685974, mean loss: 0.35997940281797725
Epoch: 15, step: 791, loss: 0.30987483263015747, mean loss: 0.35997717118737915
Epoch: 15, step: 792, loss: 0.3574085235595703, mean loss: 0.3599770567862912
Epoch: 15, step: 793, loss: 0.30854180455207825, mean loss: 0.35997476609188334
Epoch: 15, step: 794, loss: 0.3887653052806854, mean loss: 0.35997604823569046
Epoch: 15, step: 795, loss: 0.30374205112457275, mean loss: 0.35997354404985543
Epoch: 15, step: 796, loss: 0.32967767119407654, mean loss: 0.3599721949884111
Epoch: 15, step: 797, loss: 0.3630475699901581, mean loss: 0.3599723319273639
Epoch: 15, step: 798, loss: 0.31623244285583496, mean loss: 0.3599703843834362
Epoch: 15, step: 799, loss: 0.3738517761230469, mean loss: 0.35997100243293484
Epoch: 15, step: 800, loss: 0.33902785181999207, mean loss: 0.3599700700100412
Epoch: 15, step: 801, loss: 0.2884357273578644, mean loss: 0.3599668853273481
Epoch: 15, step: 802, loss: 0.3008359670639038, mean loss: 0.35996425295775086
Epoch: 15, step: 803, loss: 0.36339160799980164, mean loss: 0.35996440552875525
Epoch: 15, step: 804, loss: 0.33603838086128235, mean loss: 0.3599633404931591
Epoch: 15, step: 805, loss: 0.3247508406639099, mean loss: 0.3599617731246988
Epoch: 15, step: 806, loss: 0.43975645303726196, mean loss: 0.35996532476398807
Epoch: 15, step: 807, loss: 0.326469361782074, mean loss: 0.359963833934231
Epoch: 15, step: 808, loss: 0.3060908913612366, mean loss: 0.35996143627779
Epoch: 15, step: 809, loss: 0.3300105929374695, mean loss: 0.35996010335196266
Epoch: 15, step: 810, loss: 0.32134705781936646, mean loss: 0.3599583850018433
Epoch: 15, step: 811, loss: 0.3249320685863495, mean loss: 0.35995682633699744
Epoch: 15, step: 812, loss: 0.30516454577445984, mean loss: 0.35995438819876213
Epoch: 15, step: 813, loss: 0.3156062662601471, mean loss: 0.3599524148908535
Epoch: 15, step: 814, loss: 0.3359794616699219, mean loss: 0.35995134824109953
Epoch: 15, step: 815, loss: 0.3748086094856262, mean loss: 0.35995200926891785
Epoch: 15, step: 816, loss: 0.30339646339416504, mean loss: 0.35994949311703484
Epoch: 15, step: 817, loss: 0.33174705505371094, mean loss: 0.35994823844855617
Epoch: 15, step: 818, loss: 0.3400925099849701, mean loss: 0.35994735514732107
Epoch: 15, step: 819, loss: 0.3184119462966919, mean loss: 0.359945507486785
Epoch: 15, step: 820, loss: 0.3075976073741913, mean loss: 0.3599431789471243
Epoch: 15, step: 821, loss: 0.3672869801521301, mean loss: 0.35994350559961097
Epoch: 15, step: 822, loss: 0.328380823135376, mean loss: 0.3599421017530396
Epoch: 15, step: 823, loss: 0.3642086088657379, mean loss: 0.3599422915105166
Epoch: 15, step: 824, loss: 0.31556621193885803, mean loss: 0.35994031792458947
Epoch: 15, step: 825, loss: 0.3557969927787781, mean loss: 0.35994013366215305
Epoch: 15, step: 826, loss: 0.3515251576900482, mean loss: 0.35993975944700773
Epoch: 15, step: 827, loss: 0.32085171341896057, mean loss: 0.3599380212734917
Epoch: 15, step: 828, loss: 0.32381319999694824, mean loss: 0.3599364149405611
Epoch: 15, step: 829, loss: 0.3470710813999176, mean loss: 0.3599358428937163
Epoch: 15, step: 830, loss: 0.3051208257675171, mean loss: 0.35993340569585375
Epoch: 15, step: 831, loss: 0.3447185754776001, mean loss: 0.35993272924066
Epoch: 15, step: 832, loss: 0.3645012676715851, mean loss: 0.35993293235000207
Epoch: 15, step: 833, loss: 0.3400416076183319, mean loss: 0.3599320480553132
Epoch: 15, step: 834, loss: 0.4355788230895996, mean loss: 0.35993541088149833
Epoch: 15, step: 835, loss: 0.37252429127693176, mean loss: 0.35993597048677906
Epoch: 15, step: 836, loss: 0.31265681982040405, mean loss: 0.3599338689109838
Epoch: 15, step: 837, loss: 0.30979683995246887, mean loss: 0.3599316404004958
Epoch: 15, step: 838, loss: 0.3201298117637634, mean loss: 0.3599298713517098
Epoch: 15, step: 839, loss: 0.30370596051216125, mean loss: 0.359927372511228
Epoch: 15, step: 840, loss: 0.3509010970592499, mean loss: 0.35992697136125906
Epoch: 15, step: 841, loss: 0.34760037064552307, mean loss: 0.3599264235610317
Epoch: 15, step: 842, loss: 0.3386765718460083, mean loss: 0.35992547924908597
Epoch: 15, step: 843, loss: 0.3218117952346802, mean loss: 0.35992378560866584
Epoch: 15, step: 844, loss: 0.3543124794960022, mean loss: 0.359923536272691
Epoch: 15, step: 845, loss: 0.34081515669822693, mean loss: 0.3599226872377859
Epoch: 15, step: 846, loss: 0.34956061840057373, mean loss: 0.3599222268446266
Epoch: 15, step: 847, loss: 0.31099873781204224, mean loss: 0.3599200532401734
Epoch: 15, step: 848, loss: 0.3690283000469208, mean loss: 0.35992045788928295
Epoch: 15, step: 849, loss: 0.331647664308548, mean loss: 0.3599192018789062
Epoch: 15, step: 850, loss: 0.3253697454929352, mean loss: 0.35991766709784867
Epoch: 15, step: 851, loss: 0.3724580705165863, mean loss: 0.3599182241520162
Epoch: 15, step: 852, loss: 0.3476201593875885, mean loss: 0.3599176778869798
Epoch: 15, step: 853, loss: 0.3686339259147644, mean loss: 0.359918065034889
Epoch: 15, step: 854, loss: 0.33569127321243286, mean loss: 0.3599169890059384
Epoch: 15, step: 855, loss: 0.3338411748409271, mean loss: 0.35991583090440327
Epoch: 15, step: 856, loss: 0.38190168142318726, mean loss: 0.35991680731558234
Epoch: 15, step: 857, loss: 0.39303576946258545, mean loss: 0.3599182780928337
Epoch: 15, step: 858, loss: 0.32510027289390564, mean loss: 0.35991673193158324
Epoch: 15, step: 859, loss: 0.33513686060905457, mean loss: 0.35991563158205736
Epoch: 15, step: 860, loss: 0.3583190441131592, mean loss: 0.35991556068878133
Epoch: 15, step: 861, loss: 0.3406464457511902, mean loss: 0.35991470512022894
Epoch: 15, step: 862, loss: 0.31552016735076904, mean loss: 0.3599127340445388
Epoch: 15, step: 863, loss: 0.36281171441078186, mean loss: 0.3599128627508239
Epoch: 15, step: 864, loss: 0.3490326404571533, mean loss: 0.35991237972208723
Epoch: 15, step: 865, loss: 0.32039061188697815, mean loss: 0.3599106252264895
Epoch: 15, step: 866, loss: 0.37418022751808167, mean loss: 0.35991125867090246
Epoch: 15, step: 867, loss: 0.33026671409606934, mean loss: 0.3599099427731497
Epoch: 15, step: 868, loss: 0.32929694652557373, mean loss: 0.3599085839469147
Epoch: 15, step: 869, loss: 0.34076210856437683, mean loss: 0.35990773412554844
Epoch: 15, step: 870, loss: 0.31383877992630005, mean loss: 0.359905689433604
Epoch: 15, step: 871, loss: 0.3206495940685272, mean loss: 0.35990394719610336
Epoch: 15, step: 872, loss: 0.33394747972488403, mean loss: 0.35990279526482605
Epoch: 15, step: 873, loss: 0.3188474178314209, mean loss: 0.3599009733345237
Epoch: 15, step: 874, loss: 0.3127118647098541, mean loss: 0.3598988792981969
Epoch: 15, step: 875, loss: 0.32317936420440674, mean loss: 0.35989724992674266
Epoch: 15, step: 876, loss: 0.3095647990703583, mean loss: 0.3598950166015061
Epoch: 15, step: 877, loss: 0.4029912054538727, mean loss: 0.359896928758257
Epoch: 15, step: 878, loss: 0.302649587392807, mean loss: 0.3598943888345086
Epoch: 15, step: 879, loss: 0.36728566884994507, mean loss: 0.3598947167528766
Epoch: 15, step: 880, loss: 0.3456577658653259, mean loss: 0.35989408515042387
Epoch: 15, step: 881, loss: 0.320943683385849, mean loss: 0.3598923572468765
Epoch: 15, step: 882, loss: 0.2968757450580597, mean loss: 0.3598895618508694
Epoch: 15, step: 883, loss: 0.31334230303764343, mean loss: 0.35988749712150403
Epoch: 15, step: 884, loss: 0.33398517966270447, mean loss: 0.3598863482052273
Epoch: 15, step: 885, loss: 0.35758155584335327, mean loss: 0.35988624597900704
Epoch: 15, step: 886, loss: 0.30709612369537354, mean loss: 0.35988390464214254
Epoch: 15, step: 887, loss: 0.33606335520744324, mean loss: 0.35988284820478955
Epoch: 15, step: 888, loss: 0.4151171147823334, mean loss: 0.3598852977265678
Epoch: 15, step: 889, loss: 0.34860947728157043, mean loss: 0.35988479769018444
Epoch: 15, step: 890, loss: 0.33754611015319824, mean loss: 0.35988380710495377
Epoch: 15, step: 891, loss: 0.3702934980392456, mean loss: 0.3598842686911073
Epoch: 15, step: 892, loss: 0.35636964440345764, mean loss: 0.35988411285266947
Epoch: 15, step: 893, loss: 0.33713921904563904, mean loss: 0.35988310438881355
Epoch: 15, step: 894, loss: 0.37697818875312805, mean loss: 0.359883862317626
Epoch: 15, step: 895, loss: 0.35077759623527527, mean loss: 0.35988345859949855
Epoch: 15, step: 896, loss: 0.3117981553077698, mean loss: 0.35988132687527585
Epoch: 15, step: 897, loss: 0.3135438859462738, mean loss: 0.35987927272859044
Epoch: 15, step: 898, loss: 0.34292516112327576, mean loss: 0.359878521183238
Epoch: 15, step: 899, loss: 0.30606627464294434, mean loss: 0.35987613588862183
Epoch: 15, step: 900, loss: 0.32725822925567627, mean loss: 0.3598746901235124
Epoch: 15, step: 901, loss: 0.3284440338611603, mean loss: 0.3598732970441639
Epoch: 15, step: 902, loss: 0.3726511001586914, mean loss: 0.3598738633608378
Epoch: 15, step: 903, loss: 0.33322811126708984, mean loss: 0.35987268246418413
Epoch: 15, step: 904, loss: 0.3324282467365265, mean loss: 0.35987146622506483
Epoch: 15, step: 905, loss: 0.32860812544822693, mean loss: 0.3598700808071451
Epoch: 15, step: 906, loss: 0.3115219175815582, mean loss: 0.3598679383795639
Epoch: 15, step: 907, loss: 0.30972346663475037, mean loss: 0.3598657164515355
Epoch: 15, step: 908, loss: 0.34354355931282043, mean loss: 0.35986499324017746
Epoch: 15, step: 909, loss: 0.3360743522644043, mean loss: 0.35986393915772397
Epoch: 15, step: 910, loss: 0.3185616433620453, mean loss: 0.35986210927443146
Epoch: 15, step: 911, loss: 0.3321433961391449, mean loss: 0.3598608812612676
Epoch: 15, step: 912, loss: 0.31020522117614746, mean loss: 0.35985868148010935
Epoch: 15, step: 913, loss: 0.38815557956695557, mean loss: 0.3598599349973454
Epoch: 15, step: 914, loss: 0.3378288447856903, mean loss: 0.3598589590908023
Epoch: 15, step: 915, loss: 0.3320057988166809, mean loss: 0.35985772533990423
Epoch: 15, step: 916, loss: 0.3155064880847931, mean loss: 0.3598557608965657
Epoch: 15, step: 917, loss: 0.32516050338745117, mean loss: 0.35985422421229296
Epoch: 15, step: 918, loss: 0.3432665467262268, mean loss: 0.3598534895616226
Epoch: 15, step: 919, loss: 0.3316209018230438, mean loss: 0.35985223922558457
Epoch: 15, step: 920, loss: 0.33262965083122253, mean loss: 0.3598510336727572
Epoch: 15, step: 921, loss: 0.332501083612442, mean loss: 0.3598498225333515
Epoch: 15, step: 922, loss: 0.33013129234313965, mean loss: 0.3598485065642513
Epoch: 15, step: 923, loss: 0.3123953938484192, mean loss: 0.35984640538143536
Epoch: 15, step: 924, loss: 0.36363381147384644, mean loss: 0.3598465730770782
Epoch: 15, step: 925, loss: 0.3258645236492157, mean loss: 0.3598450685145426
Epoch: 15, step: 926, loss: 0.3504461646080017, mean loss: 0.3598446523944777
Epoch: 15, step: 927, loss: 0.3249267041683197, mean loss: 0.3598431065317087
Epoch: 15, step: 928, loss: 0.3287213146686554, mean loss: 0.3598417287906904
Epoch: 15, step: 929, loss: 0.3222280442714691, mean loss: 0.3598400637316147
Epoch: 15, step: 930, loss: 0.3441557288169861, mean loss: 0.3598393694580139
Epoch: 15, step: 931, loss: 0.34193965792655945, mean loss: 0.3598385771549185
Epoch: 15, step: 932, loss: 0.362345427274704, mean loss: 0.3598386881118574
Epoch: 15, step: 933, loss: 0.3350995182991028, mean loss: 0.3598375931676327
Epoch: 15, step: 934, loss: 0.39690205454826355, mean loss: 0.3598392335509644
Epoch: 15, step: 935, loss: 0.3449261486530304, mean loss: 0.35983857356313925
Epoch: 15, step: 936, loss: 0.3465993106365204, mean loss: 0.3598379876772727
Epoch: 15, step: 937, loss: 0.32465749979019165, mean loss: 0.359836430880747
Epoch: 15, step: 938, loss: 0.30629467964172363, mean loss: 0.35983406167187765
Epoch: 15, step: 939, loss: 0.32314589619636536, mean loss: 0.35983243830172384
Epoch: 15, step: 940, loss: 0.34285491704940796, mean loss: 0.3598316871172076
Epoch: 15, step: 941, loss: 0.32630887627601624, mean loss: 0.35983020393824816
Epoch: 15, step: 942, loss: 0.3390219211578369, mean loss: 0.35982928333997444
Epoch: 15, step: 943, loss: 0.3725411295890808, mean loss: 0.3598298457115126
Epoch: 15, step: 944, loss: 0.3970523178577423, mean loss: 0.3598314923592519
Epoch: 15, step: 945, loss: 0.37707993388175964, mean loss: 0.35983225536206187
Epoch: 15, step: 946, loss: 0.3293501138687134, mean loss: 0.3598309070123696
Epoch: 15, step: 947, loss: 0.3638857901096344, mean loss: 0.35983108636848676
Epoch: 15, step: 948, loss: 0.3160449266433716, mean loss: 0.359829149699031
Epoch: 15, step: 949, loss: 0.3694135248661041, mean loss: 0.3598295735988615
Epoch: 15, step: 950, loss: 0.32797959446907043, mean loss: 0.35982816499335396
Epoch: 15, step: 951, loss: 0.3426039218902588, mean loss: 0.35982740326316187
Epoch: 15, step: 952, loss: 0.31975647807121277, mean loss: 0.3598256312326842
Epoch: 15, step: 953, loss: 0.3730888366699219, mean loss: 0.35982621773686024
Epoch: 15, step: 954, loss: 0.36976882815361023, mean loss: 0.35982665738357333
Epoch: 15, step: 955, loss: 0.28100115060806274, mean loss: 0.3598231719968217
Epoch: 15, step: 956, loss: 0.3074829876422882, mean loss: 0.3598208578002282
Epoch: 15, step: 957, loss: 0.37420567870140076, mean loss: 0.3598214937901876
Epoch: 15, step: 958, loss: 0.34787365794181824, mean loss: 0.3598209655689643
Epoch: 15, step: 959, loss: 0.33737483620643616, mean loss: 0.35981997325555304
Epoch: 15, step: 960, loss: 0.33624863624572754, mean loss: 0.3598189312442799
Epoch: 15, step: 961, loss: 0.3526422381401062, mean loss: 0.35981861400030923
Epoch: 15, step: 962, loss: 0.31432199478149414, mean loss: 0.35981660292223744
Epoch: 15, step: 963, loss: 0.3283904194831848, mean loss: 0.35981521385825943
Epoch: 15, step: 964, loss: 0.3206639885902405, mean loss: 0.35981348341736363
Epoch: 15, step: 965, loss: 0.30982473492622375, mean loss: 0.35981127406756735
Epoch: 15, step: 966, loss: 0.3371541500091553, mean loss: 0.35981027273623495
Epoch: 15, step: 967, loss: 0.3207930028438568, mean loss: 0.35980854844465404
Epoch: 15, step: 968, loss: 0.3643297851085663, mean loss: 0.3598087482429953
Epoch: 15, step: 969, loss: 0.3260071873664856, mean loss: 0.3598072545814453
Epoch: 15, step: 970, loss: 0.3353916108608246, mean loss: 0.35980617572307755
Epoch: 15, step: 971, loss: 0.3245367109775543, mean loss: 0.35980461733386115
Epoch: 15, step: 972, loss: 0.3689025044441223, mean loss: 0.3598050193082839
Epoch: 15, step: 973, loss: 0.33654657006263733, mean loss: 0.3598039917192919
Epoch: 15, step: 974, loss: 0.31184840202331543, mean loss: 0.3598018730716358
Epoch: 15, step: 975, loss: 0.33854275941848755, mean loss: 0.35980093389891743
Epoch: 15, step: 976, loss: 0.3848802149295807, mean loss: 0.3598020417878175
Epoch: 15, step: 977, loss: 0.312790185213089, mean loss: 0.35979996510893353
Epoch: 15, step: 978, loss: 0.3297138810157776, mean loss: 0.3597986361595942
Epoch: 15, step: 979, loss: 0.3308989703655243, mean loss: 0.35979735967258913
Epoch: 15, step: 980, loss: 0.3700959086418152, mean loss: 0.35979781453540305
Epoch: 15, step: 981, loss: 0.3156628906726837, mean loss: 0.3597958652851662
Epoch: 15, step: 982, loss: 0.3381337523460388, mean loss: 0.3597949086048262
Epoch: 15, step: 983, loss: 0.3205415606498718, mean loss: 0.3597931751059764
Epoch: 15, step: 984, loss: 0.3491973280906677, mean loss: 0.35979270719486955
Epoch: 15, step: 985, loss: 0.32432740926742554, mean loss: 0.3597911411214823
Epoch: 15, step: 986, loss: 0.3559400141239166, mean loss: 0.3597909710712771
Epoch: 15, step: 987, loss: 0.33999502658843994, mean loss: 0.3597900970009626
Epoch: 15, step: 988, loss: 0.31637901067733765, mean loss: 0.35978818031208787
Epoch: 15, step: 989, loss: 0.33424389362335205, mean loss: 0.3597870525290111
Epoch: 15, step: 990, loss: 0.3367125391960144, mean loss: 0.3597860338316762
Epoch: 15, step: 991, loss: 0.3223779797554016, mean loss: 0.3597843824077809
Epoch: 15, step: 992, loss: 0.3452473282814026, mean loss: 0.35978374068023367
Epoch: 15, step: 993, loss: 0.3179432153701782, mean loss: 0.35978189374259306
Epoch: 15, step: 994, loss: 0.31354382634162903, mean loss: 0.35977985277735797
Epoch: 15, step: 995, loss: 0.3495349586009979, mean loss: 0.35977940058393565
Epoch: 15, step: 996, loss: 0.3063616156578064, mean loss: 0.35977704291147566
Epoch: 15, step: 997, loss: 0.2949097454547882, mean loss: 0.3597741800243075
Epoch: 15, step: 998, loss: 0.35068029165267944, mean loss: 0.3597737786876037
Epoch: 15, step: 999, loss: 0.32015466690063477, mean loss: 0.359772030271373
Epoch: 15, step: 1000, loss: 0.3538724184036255, mean loss: 0.35977176992929333
Epoch: 15, step: 1001, loss: 0.31859585642814636, mean loss: 0.35976995297079445
Epoch: 15, step: 1002, loss: 0.3228176236152649, mean loss: 0.3597683224572104
Epoch: 15, step: 1003, loss: 0.351951539516449, mean loss: 0.35976797755856316
Epoch: 15, step: 1004, loss: 0.31707990169525146, mean loss: 0.3597660941226107
Epoch: 15, step: 1005, loss: 0.31582021713256836, mean loss: 0.3597641552768951
Epoch: 15, step: 1006, loss: 0.3598118722438812, mean loss: 0.35976415738202444
Epoch: 15, step: 1007, loss: 0.32930630445480347, mean loss: 0.35976281373225705
Epoch: 15, step: 1008, loss: 0.40192896127700806, mean loss: 0.35976467381199345
Epoch: 15, step: 1009, loss: 0.3197449743747711, mean loss: 0.35976290849662346
Epoch: 15, step: 1010, loss: 0.3500983715057373, mean loss: 0.3597624822014891
Epoch: 15, step: 1011, loss: 0.3297349214553833, mean loss: 0.35976115776779355
Epoch: 15, step: 1012, loss: 0.30936673283576965, mean loss: 0.3597589351053787
Epoch: 15, step: 1013, loss: 0.3319283127784729, mean loss: 0.35975770768091336
Epoch: 15, step: 1014, loss: 0.38926810026168823, mean loss: 0.3597590091315233
Epoch: 15, step: 1015, loss: 0.3327259123325348, mean loss: 0.35975781698578335
Epoch: 15, step: 1016, loss: 0.34123530983924866, mean loss: 0.35975700018871376
Epoch: 15, step: 1017, loss: 0.3188757002353668, mean loss: 0.3597551975032938
Epoch: 15, step: 1018, loss: 0.34087884426116943, mean loss: 0.35975436517588777
Epoch: 15, step: 1019, loss: 0.3718107044696808, mean loss: 0.3597548967605127
Epoch: 15, step: 1020, loss: 0.3579809069633484, mean loss: 0.3597548185457163
Epoch: 15, step: 1021, loss: 0.3293178081512451, mean loss: 0.3597534766441911
Epoch: 15, step: 1022, loss: 0.35073378682136536, mean loss: 0.35975307900323433
Epoch: 15, step: 1023, loss: 0.31655943393707275, mean loss: 0.3597511748573577
Epoch: 15, step: 1024, loss: 0.32327231764793396, mean loss: 0.35974956679664755
Epoch: 15, step: 1025, loss: 0.3472377061843872, mean loss: 0.35974901527321407
Epoch: 15, step: 1026, loss: 0.32030636072158813, mean loss: 0.35974727671568985
Epoch: 15, step: 1027, loss: 0.35491225123405457, mean loss: 0.35974706360631564
Epoch: 15, step: 1028, loss: 0.3126924932003021, mean loss: 0.35974498971278107
Epoch: 15, step: 1029, loss: 0.31519582867622375, mean loss: 0.3597430263297473
Epoch: 15, step: 1030, loss: 0.34485480189323425, mean loss: 0.3597423702006901
Epoch: 15, step: 1031, loss: 0.31665241718292236, mean loss: 0.3597404712956567
Epoch: 15, step: 1032, loss: 0.29493504762649536, mean loss: 0.35973761555055167
Epoch: 15, step: 1033, loss: 0.35316288471221924, mean loss: 0.35973732583825596
Epoch: 15, step: 1034, loss: 0.3573496639728546, mean loss: 0.35973722063174063
Epoch: 15, step: 1035, loss: 0.3567095696926117, mean loss: 0.35973708723154063
Epoch: 15, step: 1036, loss: 0.3205474019050598, mean loss: 0.3597353605854937
Epoch: 15, step: 1037, loss: 0.32054227590560913, mean loss: 0.35973363386575274
Epoch: 15, step: 1038, loss: 0.31809985637664795, mean loss: 0.35973179969783836
Epoch: 15, step: 1039, loss: 0.3642268478870392, mean loss: 0.35973199771758235
Epoch: 15, step: 1040, loss: 0.32573986053466797, mean loss: 0.3597305003325692
Epoch: 15, step: 1041, loss: 0.3296913504600525, mean loss: 0.3597291771385831
Epoch: 15, step: 1042, loss: 0.31418576836586, mean loss: 0.35972717108613306
Epoch: 15, step: 1043, loss: 0.3264169692993164, mean loss: 0.35972570393489156
Epoch: 15, step: 1044, loss: 0.3149625062942505, mean loss: 0.35972373242211286
Epoch: 15, step: 1045, loss: 0.3345224857330322, mean loss: 0.35972262252839804
Epoch: 15, step: 1046, loss: 0.34875836968421936, mean loss: 0.3597221396705637
Epoch: 15, step: 1047, loss: 0.3222455084323883, mean loss: 0.35972048929927436
Epoch: 15, step: 1048, loss: 0.3422642946243286, mean loss: 0.3597197206086814
Epoch: 15, step: 1049, loss: 0.30543023347854614, mean loss: 0.35971733005442647
Epoch: 15, step: 1050, loss: 0.32274729013442993, mean loss: 0.35971570220713134
Epoch: 15, step: 1051, loss: 0.34125009179115295, mean loss: 0.3597148891739147
Epoch: 15, step: 1052, loss: 0.32702335715293884, mean loss: 0.3597134498426057
Epoch: 15, step: 1053, loss: 0.33608272671699524, mean loss: 0.3597124094832183
Epoch: 15, step: 1054, loss: 0.35234299302101135, mean loss: 0.35971208505370206
Epoch: 15, step: 1055, loss: 0.31353405117988586, mean loss: 0.3597100522119221
Epoch: 15, step: 1056, loss: 0.3278113305568695, mean loss: 0.3597086480334806
Epoch: 15, step: 1057, loss: 0.3114175796508789, mean loss: 0.3597065223591967
Epoch: 15, step: 1058, loss: 0.3218630254268646, mean loss: 0.35970485663900953
Epoch: 15, step: 1059, loss: 0.400358647108078, mean loss: 0.35970664597837876
Epoch: 15, step: 1060, loss: 0.3583386242389679, mean loss: 0.3597065857688044
Epoch: 15, step: 1061, loss: 0.37459680438041687, mean loss: 0.35970724109045793
Epoch: 15, step: 1062, loss: 0.3653506338596344, mean loss: 0.3597074894464307
Epoch: 15, step: 1063, loss: 0.38457930088043213, mean loss: 0.35970858396374433
Epoch: 15, step: 1064, loss: 0.3728155493736267, mean loss: 0.35970916072789877
Epoch: 15, step: 1065, loss: 0.3491504192352295, mean loss: 0.3597086961172549
Epoch: 15, step: 1066, loss: 0.3313981890678406, mean loss: 0.35970745043999663
Epoch: 15, step: 1067, loss: 0.3157009780406952, mean loss: 0.3597055142171702
Epoch: 15, step: 1068, loss: 0.332333505153656, mean loss: 0.3597043099402964
Epoch: 15, step: 1069, loss: 0.3418121933937073, mean loss: 0.35970352278162737
Epoch: 15, step: 1070, loss: 0.3520054817199707, mean loss: 0.3597031841233606
Epoch: 15, step: 1071, loss: 0.2949539124965668, mean loss: 0.35970033574787114
Epoch: 15, step: 1072, loss: 0.40956348180770874, mean loss: 0.3597025291735545
Epoch: 15, step: 1073, loss: 0.35308945178985596, mean loss: 0.35970223828425285
Epoch: 15, step: 1074, loss: 0.35647833347320557, mean loss: 0.3597020964806544
Epoch: 15, step: 1075, loss: 0.28472015261650085, mean loss: 0.35969879854153297
Epoch: 15, step: 1076, loss: 0.3187577724456787, mean loss: 0.35969699790705634
Epoch: 15, step: 1077, loss: 0.3187493681907654, mean loss: 0.359695197061348
Epoch: 15, step: 1078, loss: 0.34306782484054565, mean loss: 0.35969446583428344
Epoch: 15, step: 1079, loss: 0.3213873505592346, mean loss: 0.3596927812645704
Epoch: 15, step: 1080, loss: 0.30356737971305847, mean loss: 0.35969031323759043
Epoch: 15, step: 1081, loss: 0.3423670828342438, mean loss: 0.3596895515090528
Epoch: 15, step: 1082, loss: 0.3320646286010742, mean loss: 0.35968833685298685
Epoch: 15, step: 1083, loss: 0.32342085242271423, mean loss: 0.35968674225729436
Epoch: 15, step: 1084, loss: 0.3365834951400757, mean loss: 0.35968572650670666
Epoch: 15, step: 1085, loss: 0.36703619360923767, mean loss: 0.35968604966098006
Epoch: 15, step: 1086, loss: 0.32481124997138977, mean loss: 0.3596845165005769
Epoch: 15, step: 1087, loss: 0.3238898813724518, mean loss: 0.3596829429716896
Epoch: 15, step: 1088, loss: 0.3436349332332611, mean loss: 0.3596822375336599
Epoch: 15, step: 1089, loss: 0.35064980387687683, mean loss: 0.3596818405036091
Epoch: 15, step: 1090, loss: 0.36017268896102905, mean loss: 0.3596818620784171
Epoch: 15, step: 1091, loss: 0.3076612055301666, mean loss: 0.35967957565715536
Epoch: 15, step: 1092, loss: 0.3562082350254059, mean loss: 0.3596794230908726
Epoch: 15, step: 1093, loss: 0.3155660033226013, mean loss: 0.3596774843803264
Epoch: 15, step: 1094, loss: 0.3166486918926239, mean loss: 0.359675593420428
Epoch: 15, step: 1095, loss: 0.3428778350353241, mean loss: 0.3596748552521038
Epoch: 15, step: 1096, loss: 0.3417809307575226, mean loss: 0.35967406894791193
Epoch: 15, step: 1097, loss: 0.31461623311042786, mean loss: 0.3596720890799166
Epoch: 15, step: 1098, loss: 0.3829098641872406, mean loss: 0.35967311011665404
Epoch: 15, step: 1099, loss: 0.34717947244644165, mean loss: 0.35967256118705515
Epoch: 15, step: 1100, loss: 0.319754958152771, mean loss: 0.3596708074151192
Epoch: 15, step: 1101, loss: 0.3658038079738617, mean loss: 0.359671076855439
Epoch: 15, step: 1102, loss: 0.3530746102333069, mean loss: 0.3596707870664559
Epoch: 15, step: 1103, loss: 0.43204012513160706, mean loss: 0.35967396617988345
Epoch: 15, step: 1104, loss: 0.31136631965637207, mean loss: 0.3596718441659795
Epoch: 15, step: 1105, loss: 0.31518033146858215, mean loss: 0.35966988986954196
Epoch: 15, step: 1106, loss: 0.33022964000701904, mean loss: 0.3596685967589054
Epoch: 15, step: 1107, loss: 0.30861979722976685, mean loss: 0.35966635462962177
Epoch: 15, step: 1108, loss: 0.33043086528778076, mean loss: 0.3596650706255223
Epoch: 15, step: 1109, loss: 0.32668206095695496, mean loss: 0.35966362209633174
Epoch: 15, step: 1110, loss: 0.3543209433555603, mean loss: 0.3596633874698884
Epoch: 15, step: 1111, loss: 0.3037581741809845, mean loss: 0.35966093247193964
Epoch: 15, step: 1112, loss: 0.3372838497161865, mean loss: 0.35965994985731903
Epoch: 15, step: 1113, loss: 0.32647016644477844, mean loss: 0.359658492503169
Epoch: 15, step: 1114, loss: 0.3001672923564911, mean loss: 0.35965588037582996
Epoch: 15, step: 1115, loss: 0.34759780764579773, mean loss: 0.3596553509557066
Epoch: 15, step: 1116, loss: 0.3157598376274109, mean loss: 0.3596534237698029
Epoch: 15, step: 1117, loss: 0.3196272552013397, mean loss: 0.35965166654052166
Epoch: 15, step: 1118, loss: 0.31091824173927307, mean loss: 0.359649527139108
Epoch: 15, step: 1119, loss: 0.31446540355682373, mean loss: 0.3596475436393898
Epoch: 15, step: 1120, loss: 0.3136310577392578, mean loss: 0.35964552368917246
Epoch: 15, step: 1121, loss: 0.33936819434165955, mean loss: 0.3596446336299438
Epoch: 15, step: 1122, loss: 0.3345257341861725, mean loss: 0.3596435311017674
Epoch: 15, step: 1123, loss: 0.2948448359966278, mean loss: 0.35964068705791624
Epoch: 15, step: 1124, loss: 0.3668465316295624, mean loss: 0.35964100331179255
Epoch: 15, step: 1125, loss: 0.29931843280792236, mean loss: 0.3596383559594488
Epoch: 15, step: 1126, loss: 0.33814021944999695, mean loss: 0.35963741252079917
Epoch: 15, step: 1127, loss: 0.300498366355896, mean loss: 0.3596348173370988
Epoch: 15, step: 1128, loss: 0.3006886839866638, mean loss: 0.3596322307324496
Epoch: 15, step: 1129, loss: 0.3041543662548065, mean loss: 0.35962979642510084
Epoch: 15, step: 1130, loss: 0.34469306468963623, mean loss: 0.35962914104658583
Epoch: 15, step: 1131, loss: 0.2877405285835266, mean loss: 0.3596259869305599
Epoch: 15, step: 1132, loss: 0.3469603955745697, mean loss: 0.35962543125156393
Epoch: 15, step: 1133, loss: 0.354208379983902, mean loss: 0.3596251935990559
Epoch: 15, step: 1134, loss: 0.3585045039653778, mean loss: 0.35962514443522026
Epoch: 15, step: 1135, loss: 0.3765007555484772, mean loss: 0.35962588472347756
Epoch: 15, step: 1136, loss: 0.30868539214134216, mean loss: 0.35962365019733017
Epoch: 15, step: 1137, loss: 0.35331931710243225, mean loss: 0.3596233736672356
Epoch: 15, step: 1138, loss: 0.3496473729610443, mean loss: 0.35962293610415363
Epoch: 15, step: 1139, loss: 0.3639742136001587, mean loss: 0.35962312694965787
Epoch: 15, step: 1140, loss: 0.40197092294692993, mean loss: 0.35962498422767186
Epoch: 15, step: 1141, loss: 0.3053654432296753, mean loss: 0.3596226046319786
Epoch: 15, step: 1142, loss: 0.37487101554870605, mean loss: 0.359623273333944
Epoch: 15, step: 1143, loss: 0.35341310501098633, mean loss: 0.3596230010059172
Epoch: 15, step: 1144, loss: 0.32457149028778076, mean loss: 0.35962146399601946
Epoch: 15, step: 1145, loss: 0.35653936862945557, mean loss: 0.35962132885196235
Epoch: 15, step: 1146, loss: 0.31464844942092896, mean loss: 0.35961935696265507
Epoch: 15, step: 1147, loss: 0.3152860105037689, mean loss: 0.35961741319965707
Epoch: 15, step: 1148, loss: 0.3581830859184265, mean loss: 0.3596173503153885
Epoch: 15, step: 1149, loss: 0.3346126973628998, mean loss: 0.3596162541008794
Epoch: 15, step: 1150, loss: 0.3686823546886444, mean loss: 0.3596166515451207
Epoch: 15, step: 1151, loss: 0.3013210892677307, mean loss: 0.3596140960672022
Epoch: 15, step: 1152, loss: 0.3687863349914551, mean loss: 0.3596144981291372
Epoch: 15, step: 1153, loss: 0.32744115591049194, mean loss: 0.35961308788357665
Epoch: 15, step: 1154, loss: 0.34317120909690857, mean loss: 0.35961236722266116
Epoch: 15, step: 1155, loss: 0.3456524610519409, mean loss: 0.3596117553754412
Epoch: 15, step: 1156, loss: 0.33993932604789734, mean loss: 0.35961089319244927
Epoch: 15, step: 1157, loss: 0.31410497426986694, mean loss: 0.35960889889325903
Epoch: 15, step: 1158, loss: 0.40141555666923523, mean loss: 0.35961073099185126
Epoch: 15, step: 1159, loss: 0.36113241314888, mean loss: 0.3596107976738038
Epoch: 15, step: 1160, loss: 0.3583362400531769, mean loss: 0.3596107418235947
Epoch: 15, step: 1161, loss: 0.3105289041996002, mean loss: 0.3596085911865943
Epoch: 15, step: 1162, loss: 0.3532783091068268, mean loss: 0.3596083138224406
Epoch: 15, step: 1163, loss: 0.30612215399742126, mean loss: 0.3596059704049929
Epoch: 15, step: 1164, loss: 0.29599109292030334, mean loss: 0.35960318333478547
Epoch: 15, step: 1165, loss: 0.3098101317882538, mean loss: 0.35960100191659805
Epoch: 15, step: 1166, loss: 0.3140808939933777, mean loss: 0.35959900778211157
Epoch: 15, step: 1167, loss: 0.34643682837486267, mean loss: 0.3595984312016224
Epoch: 15, step: 1168, loss: 0.3354094922542572, mean loss: 0.359597371630947
Epoch: 15, step: 1169, loss: 0.3386911451816559, mean loss: 0.3595964558961047
Epoch: 15, step: 1170, loss: 0.32517150044441223, mean loss: 0.35959494807973874
Epoch: 15, step: 1171, loss: 0.33782505989074707, mean loss: 0.3595939945983009
Epoch: 15, step: 1172, loss: 0.3347732424736023, mean loss: 0.3595929075421924
Epoch: 15, step: 1173, loss: 0.33111435174942017, mean loss: 0.3595916603425869
Epoch: 15, step: 1174, loss: 0.2924458682537079, mean loss: 0.35958871986559593
Epoch: 15, step: 1175, loss: 0.3415903151035309, mean loss: 0.3595879317063403
Epoch: 15, step: 1176, loss: 0.39670443534851074, mean loss: 0.35958955698565204
Epoch: 15, step: 1177, loss: 0.34595566987991333, mean loss: 0.3595889600031183
Epoch: 15, step: 1178, loss: 0.31681114435195923, mean loss: 0.359587086986977
Epoch: 15, step: 1179, loss: 0.3537663519382477, mean loss: 0.3595868321386824
Epoch: 15, step: 1180, loss: 0.32463228702545166, mean loss: 0.3595853017965296
Epoch: 15, step: 1181, loss: 0.357463538646698, mean loss: 0.35958520890785306
Epoch: 15, step: 1182, loss: 0.3429042100906372, mean loss: 0.35958447866231535
Epoch: 15, step: 1183, loss: 0.314656138420105, mean loss: 0.35958251191655094
Epoch: 15, step: 1184, loss: 0.3008161783218384, mean loss: 0.35957993952287204
Epoch: 15, step: 1185, loss: 0.30791175365448, mean loss: 0.3595776779372173
Epoch: 15, step: 1186, loss: 0.3187115490436554, mean loss: 0.3595758892503484
Epoch: 15, step: 1187, loss: 0.29049333930015564, mean loss: 0.3595728656793597
Epoch: 15, step: 1188, loss: 0.2893106937408447, mean loss: 0.3595697906138453
Epoch: 15, step: 1189, loss: 0.3232247233390808, mean loss: 0.3595682000200915
Epoch: 15, step: 1190, loss: 0.3237830102443695, mean loss: 0.35956663399717015
Epoch: 15, step: 1191, loss: 0.39130669832229614, mean loss: 0.35956802293749596
Epoch: 15, step: 1192, loss: 0.3206227123737335, mean loss: 0.35956631877127865
Epoch: 15, step: 1193, loss: 0.34263402223587036, mean loss: 0.3595655778814329
Epoch: 15, step: 1194, loss: 0.3143482208251953, mean loss: 0.3595635994365825
Epoch: 15, step: 1195, loss: 0.32570040225982666, mean loss: 0.3595621178476266
Epoch: 15, step: 1196, loss: 0.33620011806488037, mean loss: 0.359561095753748
Epoch: 15, step: 1197, loss: 0.3202551007270813, mean loss: 0.3595593761809496
Epoch: 15, step: 1198, loss: 0.41392263770103455, mean loss: 0.3595617543804124
Epoch: 15, step: 1199, loss: 0.3199663460254669, mean loss: 0.3595600222978072
Epoch: 15, step: 1200, loss: 0.3712974488735199, mean loss: 0.35956053572357927
Epoch: 15, step: 1201, loss: 0.3383464217185974, mean loss: 0.3595596078032746
Epoch: 15, step: 1202, loss: 0.31556037068367004, mean loss: 0.359557683329797
Epoch: 15, step: 1203, loss: 0.31607234477996826, mean loss: 0.35955578141680933
Epoch: 15, step: 1204, loss: 0.2853486239910126, mean loss: 0.35955253596929454
Epoch: 15, step: 1205, loss: 0.3074004352092743, mean loss: 0.3595502551986849
Epoch: 15, step: 1206, loss: 0.33399784564971924, mean loss: 0.3595491377626614
Epoch: 15, step: 1207, loss: 0.2979055345058441, mean loss: 0.35954644213544185
Epoch: 15, step: 1208, loss: 0.3596644103527069, mean loss: 0.3595464472938754
Epoch: 15, step: 1209, loss: 0.3120523691177368, mean loss: 0.35954437059609773
Epoch: 15, step: 1210, loss: 0.3124151825904846, mean loss: 0.3595423099433932
Epoch: 15, step: 1211, loss: 0.3349352180957794, mean loss: 0.3595412340824345
Epoch: 15, step: 1212, loss: 0.3115434944629669, mean loss: 0.3595391356371226
Epoch: 15, step: 1213, loss: 0.3200300931930542, mean loss: 0.35953740839036014
Epoch: 15, step: 1214, loss: 0.31428784132003784, mean loss: 0.3595354302672095
Epoch: 15, step: 1215, loss: 0.2926517724990845, mean loss: 0.3595325065192742
Epoch: 15, step: 1216, loss: 0.3709902763366699, mean loss: 0.35953300736159693
Epoch: 15, step: 1217, loss: 0.3611614406108856, mean loss: 0.35953307854060074
Epoch: 15, step: 1218, loss: 0.3028480112552643, mean loss: 0.3595306009381144
Epoch: 15, step: 1219, loss: 0.3362959921360016, mean loss: 0.35952958543947794
Epoch: 15, step: 1220, loss: 0.30452364683151245, mean loss: 0.3595271814388395
Epoch: 15, step: 1221, loss: 0.32832369208335876, mean loss: 0.359525817769171
Epoch: 15, step: 1222, loss: 0.3258143663406372, mean loss: 0.35952434455973914
Epoch: 15, step: 1223, loss: 0.3377190828323364, mean loss: 0.35952339169914976
Epoch: 15, step: 1224, loss: 0.3122163414955139, mean loss: 0.3595213245350596
Epoch: 15, step: 1225, loss: 0.3569835126399994, mean loss: 0.3595212136457869
Epoch: 15, step: 1226, loss: 0.3467201888561249, mean loss: 0.35952065433155656
Epoch: 15, step: 1227, loss: 0.3294382095336914, mean loss: 0.3595193399989457
Epoch: 15, step: 1228, loss: 0.34932973980903625, mean loss: 0.3595188948243994
Epoch: 15, step: 1229, loss: 0.3503972291946411, mean loss: 0.3595184963243719
Epoch: 15, step: 1230, loss: 0.3241913914680481, mean loss: 0.3595169530495103
Epoch: 15, step: 1231, loss: 0.32417091727256775, mean loss: 0.35951540901509754
Epoch: 15, step: 1232, loss: 0.3362097442150116, mean loss: 0.3595143909892905
Epoch: 15, step: 1233, loss: 0.33905279636383057, mean loss: 0.3595134972357033
Epoch: 15, step: 1234, loss: 0.32046738266944885, mean loss: 0.35951179179283077
Epoch: 15, step: 1235, loss: 0.37838155031204224, mean loss: 0.3595126159437095
Epoch: 15, step: 1236, loss: 0.37318724393844604, mean loss: 0.35951321316727564
Epoch: 15, step: 1237, loss: 0.3550061583518982, mean loss: 0.35951301633546434
Epoch: 15, step: 1238, loss: 0.32178762555122375, mean loss: 0.359511368866545
Epoch: 15, step: 1239, loss: 0.3342505693435669, mean loss: 0.3595102657748628
Epoch: 15, step: 1240, loss: 0.3208877742290497, mean loss: 0.3595085792768258
Epoch: 15, step: 1241, loss: 0.32925108075141907, mean loss: 0.3595072581040668
Epoch: 15, step: 1242, loss: 0.3497968912124634, mean loss: 0.35950683412612106
Epoch: 15, step: 1243, loss: 0.36945512890815735, mean loss: 0.3595072684736054
Epoch: 15, step: 1244, loss: 0.2998647689819336, mean loss: 0.35950466456618385
Epoch: 15, step: 1245, loss: 0.3122951090335846, mean loss: 0.3595026035535438
Epoch: 15, step: 1246, loss: 0.3185829520225525, mean loss: 0.35950081721523974
Epoch: 15, step: 1247, loss: 0.3537108302116394, mean loss: 0.35950056446567613
Epoch: 15, step: 1248, loss: 0.31694212555885315, mean loss: 0.3594987067486694
Epoch: 15, step: 1249, loss: 0.3034808039665222, mean loss: 0.3594962616197832
Epoch: 15, step: 1250, loss: 0.3549404442310333, mean loss: 0.3594960627713092
Epoch: 15, step: 1251, loss: 0.3909066617488861, mean loss: 0.3594974336947981
Epoch: 15, step: 1252, loss: 0.35510721802711487, mean loss: 0.3594972420910942
Epoch: 15, step: 1253, loss: 0.30109167098999023, mean loss: 0.35949469318775557
Epoch: 15, step: 1254, loss: 0.3051656484603882, mean loss: 0.35949232229337513
Epoch: 15, step: 1255, loss: 0.3022140562534332, mean loss: 0.35948982280541736
Epoch: 15, step: 1256, loss: 0.350478857755661, mean loss: 0.359489429605389
Epoch: 15, step: 1257, loss: 0.319616436958313, mean loss: 0.3594876897942079
Epoch: 15, step: 1258, loss: 0.30392685532569885, mean loss: 0.3594852655682614
Epoch: 15, step: 1259, loss: 0.32470929622650146, mean loss: 0.3594837482921121
Epoch: 15, step: 1260, loss: 0.331835001707077, mean loss: 0.35948254202944535
Epoch: 15, step: 1261, loss: 0.3492610454559326, mean loss: 0.3594820961042829
Epoch: 15, step: 1262, loss: 0.34604257345199585, mean loss: 0.3594815098144145
Epoch: 15, step: 1263, loss: 0.33602985739707947, mean loss: 0.35948048679694733
Epoch: 15, step: 1264, loss: 0.32744747400283813, mean loss: 0.3594790895008603
Epoch: 15, step: 1265, loss: 0.3110026717185974, mean loss: 0.35947697502743353
Epoch: 15, step: 1266, loss: 0.34172341227531433, mean loss: 0.3594762006756757
Epoch: 15, step: 1267, loss: 0.31584280729293823, mean loss: 0.35947429761420574
Epoch: 15, step: 1268, loss: 0.3185500502586365, mean loss: 0.3594725127894268
Epoch: 15, step: 1269, loss: 0.33718568086624146, mean loss: 0.35947154083862337
Epoch: 15, step: 1270, loss: 0.31168505549430847, mean loss: 0.3594694569135724
Epoch: 15, step: 1271, loss: 0.3167709708213806, mean loss: 0.3594675949527276
Epoch: 15, step: 1272, loss: 0.3212052583694458, mean loss: 0.35946592651263765
Epoch: 15, step: 1273, loss: 0.3302559554576874, mean loss: 0.35946465285906415
Epoch: 15, step: 1274, loss: 0.3118351995944977, mean loss: 0.3594625761442935
Epoch: 15, step: 1275, loss: 0.3387768566608429, mean loss: 0.3594616742555822
Epoch: 15, step: 1276, loss: 0.35332900285720825, mean loss: 0.3594614068853333
Epoch: 15, step: 1277, loss: 0.3026130497455597, mean loss: 0.3594589285368661
Epoch: 15, step: 1278, loss: 0.3289993405342102, mean loss: 0.35945760068525956
Epoch: 15, step: 1279, loss: 0.31186261773109436, mean loss: 0.3594555259257585
Epoch: 15, step: 1280, loss: 0.3572918772697449, mean loss: 0.3594554316121429
Epoch: 15, step: 1281, loss: 0.3580671548843384, mean loss: 0.3594553710996885
Epoch: 15, step: 1282, loss: 0.34186097979545593, mean loss: 0.3594546042256396
Epoch: 15, step: 1283, loss: 0.3302961587905884, mean loss: 0.3594533333728922
Epoch: 15, step: 1284, loss: 0.3227696716785431, mean loss: 0.3594517346079458
Epoch: 15, step: 1285, loss: 0.356784850358963, mean loss: 0.35945161838358214
Epoch: 15, step: 1286, loss: 0.3343258202075958, mean loss: 0.3594505234344308
Epoch: 15, step: 1287, loss: 0.32642412185668945, mean loss: 0.3594490842501194
Epoch: 15, step: 1288, loss: 0.3243349492549896, mean loss: 0.35944755415578
Epoch: 15, step: 1289, loss: 0.3331446349620819, mean loss: 0.3594464080590831
Epoch: 15, step: 1290, loss: 0.3458908498287201, mean loss: 0.3594458174286866
Epoch: 15, step: 1291, loss: 0.33332741260528564, mean loss: 0.35944467947099995
Epoch: 15, step: 1292, loss: 0.32861214876174927, mean loss: 0.359443336181203
Epoch: 15, step: 1293, loss: 0.34133490920066833, mean loss: 0.35944254728048936
Epoch: 15, step: 1294, loss: 0.3757026791572571, mean loss: 0.35944325562864343
Epoch: 15, step: 1295, loss: 0.3459587097167969, mean loss: 0.35944266822030085
Epoch: 15, step: 1296, loss: 0.3041348457336426, mean loss: 0.35944025902822496
Epoch: 15, step: 1297, loss: 0.33871111273765564, mean loss: 0.35943935611219174
Epoch: 15, step: 1298, loss: 0.3046456277370453, mean loss: 0.3594369695218187
Epoch: 15, step: 1299, loss: 0.39569413661956787, mean loss: 0.35943854866672714
Epoch: 15, step: 1300, loss: 0.3051406145095825, mean loss: 0.35943618387712056
Epoch: 15, step: 1301, loss: 0.28275635838508606, mean loss: 0.3594328444543572
Epoch: 15, step: 1302, loss: 0.2912580072879791, mean loss: 0.35942987555494654
Epoch: 15, step: 1303, loss: 0.3799532353878021, mean loss: 0.3594307692738036
Epoch: 15, step: 1304, loss: 0.3459412753582001, mean loss: 0.3594301818802083
Epoch: 15, step: 1305, loss: 0.30968785285949707, mean loss: 0.3594280159684683
Epoch: 15, step: 1306, loss: 0.3112235367298126, mean loss: 0.35942591711013944
Epoch: 15, step: 1307, loss: 0.3240838944911957, mean loss: 0.35942437835959
Epoch: 15, step: 1308, loss: 0.32858267426490784, mean loss: 0.3594230356061356
Epoch: 15, step: 1309, loss: 0.3121213912963867, mean loss: 0.3594209763268883
Epoch: 15, step: 1310, loss: 0.3105434477329254, mean loss: 0.35941884853408024
Epoch: 15, step: 1311, loss: 0.3248080015182495, mean loss: 0.35941734188045776
Epoch: 15, step: 1312, loss: 0.33525407314300537, mean loss: 0.35941629006882075
Epoch: 15, step: 1313, loss: 0.3077428340911865, mean loss: 0.35941404085423134
Epoch: 15, step: 1314, loss: 0.32138562202453613, mean loss: 0.35941238564557715
Epoch: 15, step: 1315, loss: 0.3305118978023529, mean loss: 0.35941112779008255
Epoch: 15, step: 1316, loss: 0.37644585967063904, mean loss: 0.359411869171981
Epoch: 15, step: 1317, loss: 0.38299599289894104, mean loss: 0.35941289555041805
Epoch: 15, step: 1318, loss: 0.35652872920036316, mean loss: 0.35941277003728217
Epoch: 15, step: 1319, loss: 0.3318790793418884, mean loss: 0.35941157187841816
Epoch: 15, step: 1320, loss: 0.31951087713241577, mean loss: 0.359409835631312
Epoch: 15, step: 1321, loss: 0.37458592653274536, mean loss: 0.3594104959781444
Epoch: 15, step: 1322, loss: 0.305871844291687, mean loss: 0.35940816648888335
Epoch: 15, step: 1323, loss: 0.3260178864002228, mean loss: 0.35940671372695815
Epoch: 15, step: 1324, loss: 0.3421557545661926, mean loss: 0.35940596319577867
Epoch: 15, step: 1325, loss: 0.3383171558380127, mean loss: 0.35940504573265514
Epoch: 15, step: 1326, loss: 0.33670443296432495, mean loss: 0.35940405819131577
Epoch: 15, step: 1327, loss: 0.3321388065814972, mean loss: 0.3594028721267773
Epoch: 15, step: 1328, loss: 0.3038918077945709, mean loss: 0.35940045744739446
Epoch: 15, step: 1329, loss: 0.334940642118454, mean loss: 0.3593993935145833
Epoch: 15, step: 1330, loss: 0.2972962558269501, mean loss: 0.3593966923211733
Epoch: 15, step: 1331, loss: 0.3789539635181427, mean loss: 0.3593975429331774
Epoch: 15, step: 1332, loss: 0.3423856794834137, mean loss: 0.3593968030617622
Epoch: 15, step: 1333, loss: 0.31086599826812744, mean loss: 0.3593946924761836
Epoch: 15, step: 1334, loss: 0.3395340144634247, mean loss: 0.35939382878068404
Epoch: 15, step: 1335, loss: 0.3272238075733185, mean loss: 0.35939242984081593
Epoch: 15, step: 1336, loss: 0.3223065137863159, mean loss: 0.3593908171993386
Epoch: 15, step: 1337, loss: 0.3487482964992523, mean loss: 0.3593903544408074
Epoch: 15, step: 1338, loss: 0.3517783582210541, mean loss: 0.35939002347006
Epoch: 15, step: 1339, loss: 0.31217077374458313, mean loss: 0.35938797045920234
Epoch: 15, step: 1340, loss: 0.3888302445411682, mean loss: 0.35938925050242143
Epoch: 15, step: 1341, loss: 0.31725576519966125, mean loss: 0.3593874187710371
Epoch: 15, step: 1342, loss: 0.3281441032886505, mean loss: 0.3593860605431763
Epoch: 15, step: 1343, loss: 0.32042762637138367, mean loss: 0.3593843669927428
Epoch: 15, step: 1344, loss: 0.3306245505809784, mean loss: 0.3593831168377151
Epoch: 15, step: 1345, loss: 0.3262759745121002, mean loss: 0.35938167777215285
Epoch: 15, step: 1346, loss: 0.3522976040840149, mean loss: 0.3593813698626606
Epoch: 15, step: 1347, loss: 0.3459525406360626, mean loss: 0.3593807862035322
Epoch: 15, step: 1348, loss: 0.36583080887794495, mean loss: 0.35938106652960783
Epoch: 15, step: 1349, loss: 0.3642807602882385, mean loss: 0.3593812794671897
Epoch: 15, step: 1350, loss: 0.33894261717796326, mean loss: 0.3593803912544962
Epoch: 15, step: 1351, loss: 0.32870814204216003, mean loss: 0.3593790583738595
Epoch: 15, step: 1352, loss: 0.35160183906555176, mean loss: 0.35937872042490415
Epoch: 15, step: 1353, loss: 0.33082592487335205, mean loss: 0.3593774797542015
Epoch: 15, step: 1354, loss: 0.32349762320518494, mean loss: 0.3593759207771626
Epoch: 15, step: 1355, loss: 0.3023606240749359, mean loss: 0.35937344357449047
Epoch: 15, step: 1356, loss: 0.3137637972831726, mean loss: 0.3593714620110247
Epoch: 15, step: 1357, loss: 0.3041236400604248, mean loss: 0.3593690618102275
Epoch: 15, step: 1358, loss: 0.3324683606624603, mean loss: 0.3593678931799157
Epoch: 15, step: 1359, loss: 0.3459465205669403, mean loss: 0.35936731014895945
Epoch: 15, step: 1360, loss: 0.3588630259037018, mean loss: 0.35936728824355807
Epoch: 15, step: 1361, loss: 0.317049503326416, mean loss: 0.3593654500980921
Epoch: 15, step: 1362, loss: 0.36357027292251587, mean loss: 0.35936563273384003
Epoch: 15, step: 1363, loss: 0.3242475688457489, mean loss: 0.3593641074530944
Epoch: 15, step: 1364, loss: 0.3599281311035156, mean loss: 0.35936413194923555
Epoch: 15, step: 1365, loss: 0.36545881628990173, mean loss: 0.35936439663629977
Epoch: 15, step: 1366, loss: 0.33660534024238586, mean loss: 0.359363408272362
Epoch: 15, step: 1367, loss: 0.37096908688545227, mean loss: 0.35936391225354203
Epoch: 15, step: 1368, loss: 0.33000895380973816, mean loss: 0.3593626375582255
Epoch: 15, step: 1369, loss: 0.3164740800857544, mean loss: 0.3593607752674104
Epoch: 15, step: 1370, loss: 0.38647979497909546, mean loss: 0.35936195276815774
Epoch: 15, step: 1371, loss: 0.3661392033100128, mean loss: 0.3593622470218284
Epoch: 15, step: 1372, loss: 0.3388544023036957, mean loss: 0.3593613566538903
Epoch: 15, step: 1373, loss: 0.31953638792037964, mean loss: 0.3593596276893712
Epoch: 15, step: 1374, loss: 0.31765055656433105, mean loss: 0.3593578170068826
Epoch: 15, step: 1375, loss: 0.319354772567749, mean loss: 0.3593560804621509
Epoch: 15, step: 1376, loss: 0.3709780275821686, mean loss: 0.35935658495262796
Epoch: 15, step: 1377, loss: 0.3260400593280792, mean loss: 0.3593551387973356
Epoch: 15, step: 1378, loss: 0.312304824590683, mean loss: 0.35935309659436643
Epoch: 15, step: 1379, loss: 0.36471423506736755, mean loss: 0.3593533292826682
Epoch: 15, step: 1380, loss: 0.39578747749328613, mean loss: 0.3593549105572748
Epoch: 15, step: 1381, loss: 0.3348926305770874, mean loss: 0.359353848918529
Epoch: 15, step: 1382, loss: 0.37142443656921387, mean loss: 0.3593543727473556
Epoch: 15, step: 1383, loss: 0.3473929166793823, mean loss: 0.35935385367705236
Epoch: 15, step: 1384, loss: 0.3392767906188965, mean loss: 0.35935298246581093
Epoch: 15, step: 1385, loss: 0.3255966305732727, mean loss: 0.3593515177278133
Epoch: 15, step: 1386, loss: 0.31474000215530396, mean loss: 0.35934958205221246
Epoch: 15, step: 1387, loss: 0.36677899956703186, mean loss: 0.35934990439764436
Epoch: 15, step: 1388, loss: 0.31914448738098145, mean loss: 0.35934816005224907
Epoch: 15, step: 1389, loss: 0.34205594658851624, mean loss: 0.3593474098477604
Epoch: 15, step: 1390, loss: 0.2988528609275818, mean loss: 0.35934478546925536
Epoch: 15, step: 1391, loss: 0.36919233202934265, mean loss: 0.3593452126576364
Epoch: 15, step: 1392, loss: 0.3138596713542938, mean loss: 0.35934323957208125
Epoch: 15, step: 1393, loss: 0.3368591070175171, mean loss: 0.3593422642908912
Epoch: 15, step: 1394, loss: 0.4253231883049011, mean loss: 0.35934512618306275
Epoch: 15, step: 1395, loss: 0.3783821165561676, mean loss: 0.3593459518679332
Epoch: 15, step: 1396, loss: 0.3127819001674652, mean loss: 0.3593439323488414
Epoch: 15, step: 1397, loss: 0.45696204900741577, mean loss: 0.35934816593877367
Epoch: 15, step: 1398, loss: 0.31699585914611816, mean loss: 0.35934632924564763
Epoch: 15, step: 1399, loss: 0.33329540491104126, mean loss: 0.3593451995438118
Epoch: 15, step: 1400, loss: 0.42344528436660767, mean loss: 0.35934797913207
Epoch: 15, step: 1401, loss: 0.3681236505508423, mean loss: 0.35934835965723777
Epoch: 15, step: 1402, loss: 0.3576883375644684, mean loss: 0.35934828767952054
Epoch: 15, step: 1403, loss: 0.3508964478969574, mean loss: 0.3593479212279171
Epoch: 15, step: 1404, loss: 0.34448638558387756, mean loss: 0.3593472768951339
Epoch: 15, step: 1405, loss: 0.31846746802330017, mean loss: 0.3593455045978621
Epoch: 15, step: 1406, loss: 0.376170814037323, mean loss: 0.35934623400825094
Epoch: 15, step: 1407, loss: 0.2975333631038666, mean loss: 0.35934355441440213
Epoch: 15, step: 1408, loss: 0.29762494564056396, mean loss: 0.35934087902280415
Epoch: 15, step: 1409, loss: 0.3117225468158722, mean loss: 0.35933881494251774
Epoch: 15, step: 1410, loss: 0.32008230686187744, mean loss: 0.3593371133904359
Epoch: 15, step: 1411, loss: 0.35095900297164917, mean loss: 0.3593367502615169
Epoch: 15, step: 1412, loss: 0.38121524453163147, mean loss: 0.35933769849080094
Epoch: 15, step: 1413, loss: 0.3240070343017578, mean loss: 0.3593361673014021
Epoch: 15, step: 1414, loss: 0.3119438588619232, mean loss: 0.35933411346354993
Epoch: 15, step: 1415, loss: 0.39385107159614563, mean loss: 0.35933560925823416
Epoch: 15, step: 1416, loss: 0.40637093782424927, mean loss: 0.35933764744901137
Epoch: 15, step: 1417, loss: 0.364871621131897, mean loss: 0.3593378872433472
Epoch: 15, step: 1418, loss: 0.3391910195350647, mean loss: 0.35933701429097886
Epoch: 15, step: 1419, loss: 0.37288376688957214, mean loss: 0.3593376012386651
Epoch: 15, step: 1420, loss: 0.34996604919433594, mean loss: 0.3593371952098083
Epoch: 15, step: 1421, loss: 0.2981475591659546, mean loss: 0.35933454424212596
Epoch: 15, step: 1422, loss: 0.3333110809326172, mean loss: 0.35933341685559433
Epoch: 15, step: 1423, loss: 0.30403080582618713, mean loss: 0.35933102114380133
Epoch: 15, step: 1424, loss: 0.32959339022636414, mean loss: 0.3593297329639912
Epoch: 15, step: 1425, loss: 0.34349313378334045, mean loss: 0.3593290469811799
Epoch: 15, step: 1426, loss: 0.3663816452026367, mean loss: 0.3593293524603769
Epoch: 15, step: 1427, loss: 0.3517920672893524, mean loss: 0.35932902600138644
Epoch: 15, step: 1428, loss: 0.3329218924045563, mean loss: 0.3593278822908058
Epoch: 15, step: 1429, loss: 0.32285651564598083, mean loss: 0.35932630275998534
Epoch: 15, step: 1430, loss: 0.32978615164756775, mean loss: 0.3593250234671391
Epoch: 15, step: 1431, loss: 0.35427045822143555, mean loss: 0.3593248045789854
Epoch: 15, step: 1432, loss: 0.33631017804145813, mean loss: 0.35932380797280444
Epoch: 15, step: 1433, loss: 0.3503129780292511, mean loss: 0.35932341779224053
Epoch: 15, step: 1434, loss: 0.31769755482673645, mean loss: 0.3593216154167062
Epoch: 15, step: 1435, loss: 0.3542618453502655, mean loss: 0.3593213963411058
Epoch: 15, step: 1436, loss: 0.33644989132881165, mean loss: 0.3593204061040615
Epoch: 15, step: 1437, loss: 0.3783235251903534, mean loss: 0.3593212288211403
Epoch: 15, step: 1438, loss: 0.3422631323337555, mean loss: 0.3593204903434362
Epoch: 15, step: 1439, loss: 0.3316386938095093, mean loss: 0.3593192919972659
Epoch: 15, step: 1440, loss: 0.3502538204193115, mean loss: 0.35931889956959706
Epoch: 15, step: 1441, loss: 0.34893926978111267, mean loss: 0.35931845027387427
Epoch: 15, step: 1442, loss: 0.3097301721572876, mean loss: 0.35931630387392116
Epoch: 15, step: 1443, loss: 0.3316883146762848, mean loss: 0.3593151080641394
Valid: 15, mean loss: 0.18923287093639374
Epoch: 16, step: 0, loss: 0.36965805292129517, mean loss: 0.35931555571377616
Epoch: 16, step: 1, loss: 0.3322262763977051, mean loss: 0.35931438332221916
Epoch: 16, step: 2, loss: 0.3268027901649475, mean loss: 0.3593129763203082
Epoch: 16, step: 3, loss: 0.3299841284751892, mean loss: 0.3593117071127677
Epoch: 16, step: 4, loss: 0.33334997296333313, mean loss: 0.3593105836658791
Epoch: 16, step: 5, loss: 0.34059664607048035, mean loss: 0.3593097738892631
Epoch: 16, step: 6, loss: 0.30665597319602966, mean loss: 0.35930749558885666
Epoch: 16, step: 7, loss: 0.3448925018310547, mean loss: 0.35930687188715377
Epoch: 16, step: 8, loss: 0.3600323498249054, mean loss: 0.35930690327546067
Epoch: 16, step: 9, loss: 0.3043135404586792, mean loss: 0.3593045240523571
Epoch: 16, step: 10, loss: 0.31855127215385437, mean loss: 0.3593027609871657
Epoch: 16, step: 11, loss: 0.3488684296607971, mean loss: 0.3593023095971619
Epoch: 16, step: 12, loss: 0.34816259145736694, mean loss: 0.35930182771291486
Epoch: 16, step: 13, loss: 0.32201793789863586, mean loss: 0.3593002149484104
Epoch: 16, step: 14, loss: 0.37610408663749695, mean loss: 0.35930094179090744
Epoch: 16, step: 15, loss: 0.3188387155532837, mean loss: 0.3592991916946169
Epoch: 16, step: 16, loss: 0.338749498128891, mean loss: 0.3592983029054829
Epoch: 16, step: 17, loss: 0.3144061863422394, mean loss: 0.35929636137289217
Epoch: 16, step: 18, loss: 0.36710286140441895, mean loss: 0.3592966989804704
Epoch: 16, step: 19, loss: 0.32618483901023865, mean loss: 0.35929526705433434
Epoch: 16, step: 20, loss: 0.2983258366584778, mean loss: 0.35929263053842536
Epoch: 16, step: 21, loss: 0.31082233786582947, mean loss: 0.3592905346164037
Epoch: 16, step: 22, loss: 0.31384924054145813, mean loss: 0.3592885697574045
Epoch: 16, step: 23, loss: 0.36830273270606995, mean loss: 0.3592889595084832
Epoch: 16, step: 24, loss: 0.3294947147369385, mean loss: 0.3592876713315291
Epoch: 16, step: 25, loss: 0.32099971175193787, mean loss: 0.35928601599389054
Epoch: 16, step: 26, loss: 0.3402542769908905, mean loss: 0.3592851932132497
Epoch: 16, step: 27, loss: 0.33863595128059387, mean loss: 0.35928430054327165
Epoch: 16, step: 28, loss: 0.3258334994316101, mean loss: 0.35928285452238756
Epoch: 16, step: 29, loss: 0.3699309527873993, mean loss: 0.35928331480155523
Epoch: 16, step: 30, loss: 0.3252228796482086, mean loss: 0.3592818425545203
Epoch: 16, step: 31, loss: 0.3371882140636444, mean loss: 0.3592808876086139
Epoch: 16, step: 32, loss: 0.37033671140670776, mean loss: 0.3592813654503305
Epoch: 16, step: 33, loss: 0.3489392101764679, mean loss: 0.35928091847326793
Epoch: 16, step: 34, loss: 0.3710860013961792, mean loss: 0.3592814286544738
Epoch: 16, step: 35, loss: 0.3253205418586731, mean loss: 0.35927996102755955
Epoch: 16, step: 36, loss: 0.2909105718135834, mean loss: 0.3592770065576052
Epoch: 16, step: 37, loss: 0.31684547662734985, mean loss: 0.3592751730285269
Epoch: 16, step: 38, loss: 0.32385846972465515, mean loss: 0.3592736426865961
Epoch: 16, step: 39, loss: 0.33189329504966736, mean loss: 0.3592724596435769
Epoch: 16, step: 40, loss: 0.334952175617218, mean loss: 0.359271408864401
Epoch: 16, step: 41, loss: 0.322061151266098, mean loss: 0.35926980123208446
Epoch: 16, step: 42, loss: 0.30635637044906616, mean loss: 0.3592675152584903
Epoch: 16, step: 43, loss: 0.32919880747795105, mean loss: 0.3592662162820007
Epoch: 16, step: 44, loss: 0.3133595287799835, mean loss: 0.3592642331860786
Epoch: 16, step: 45, loss: 0.2973827123641968, mean loss: 0.3592615601182245
Epoch: 16, step: 46, loss: 0.35770365595817566, mean loss: 0.3592614928250553
Epoch: 16, step: 47, loss: 0.3062833845615387, mean loss: 0.35925920455154703
Epoch: 16, step: 48, loss: 0.37078219652175903, mean loss: 0.35925970224048454
Epoch: 16, step: 49, loss: 0.3381027579307556, mean loss: 0.3592587884914861
Epoch: 16, step: 50, loss: 0.3023552894592285, mean loss: 0.35925633098774906
Epoch: 16, step: 51, loss: 0.317486435174942, mean loss: 0.3592545271401151
Epoch: 16, step: 52, loss: 0.3416130542755127, mean loss: 0.3592537653198074
Epoch: 16, step: 53, loss: 0.3607231676578522, mean loss: 0.3592538287709836
Epoch: 16, step: 54, loss: 0.33380094170570374, mean loss: 0.3592527297214968
Epoch: 16, step: 55, loss: 0.30173343420028687, mean loss: 0.359250246159514
Epoch: 16, step: 56, loss: 0.32046788930892944, mean loss: 0.35924857169136276
Epoch: 16, step: 57, loss: 0.3433755338191986, mean loss: 0.3592478863862133
Epoch: 16, step: 58, loss: 0.3640984892845154, mean loss: 0.35924809579789996
Epoch: 16, step: 59, loss: 0.30785515904426575, mean loss: 0.3592458771423675
Epoch: 16, step: 60, loss: 0.29486241936683655, mean loss: 0.3592430978003526
Epoch: 16, step: 61, loss: 0.34660154581069946, mean loss: 0.359242552106146
Epoch: 16, step: 62, loss: 0.3254050612449646, mean loss: 0.35924109151604533
Epoch: 16, step: 63, loss: 0.32307538390159607, mean loss: 0.359239530496207
Epoch: 16, step: 64, loss: 0.3183177709579468, mean loss: 0.35923776426721404
Epoch: 16, step: 65, loss: 0.3280181288719177, mean loss: 0.35923641685092594
Epoch: 16, step: 66, loss: 0.3632819950580597, mean loss: 0.3592365914475427
Epoch: 16, step: 67, loss: 0.34344279766082764, mean loss: 0.35923590985796106
Epoch: 16, step: 68, loss: 0.33025163412094116, mean loss: 0.35923465908008434
Epoch: 16, step: 69, loss: 0.30238139629364014, mean loss: 0.35923220575900094
Epoch: 16, step: 70, loss: 0.3229026198387146, mean loss: 0.359230638139328
Epoch: 16, step: 71, loss: 0.3142252266407013, mean loss: 0.35922869624204207
Epoch: 16, step: 72, loss: 0.34622451663017273, mean loss: 0.3592281351608145
Epoch: 16, step: 73, loss: 0.30134204030036926, mean loss: 0.3592256377022391
Epoch: 16, step: 74, loss: 0.3317622244358063, mean loss: 0.3592244528619411
Epoch: 16, step: 75, loss: 0.3284687399864197, mean loss: 0.3592231260408507
Epoch: 16, step: 76, loss: 0.34571343660354614, mean loss: 0.3592225432493647
Epoch: 16, step: 77, loss: 0.348725289106369, mean loss: 0.3592220904301885
Epoch: 16, step: 78, loss: 0.3604887127876282, mean loss: 0.35922214506601463
Epoch: 16, step: 79, loss: 0.3113847076892853, mean loss: 0.35922008168448527
Epoch: 16, step: 80, loss: 0.28918156027793884, mean loss: 0.35921706082956156
Epoch: 16, step: 81, loss: 0.33799126744270325, mean loss: 0.35921614537224306
Epoch: 16, step: 82, loss: 0.3742964565753937, mean loss: 0.35921679575009285
Epoch: 16, step: 83, loss: 0.31191009283065796, mean loss: 0.35921475561282706
Epoch: 16, step: 84, loss: 0.3178834617137909, mean loss: 0.3592129732464508
Epoch: 16, step: 85, loss: 0.3514305055141449, mean loss: 0.3592126376506021
Epoch: 16, step: 86, loss: 0.3643578588962555, mean loss: 0.3592128595134474
Epoch: 16, step: 87, loss: 0.30981284379959106, mean loss: 0.35921072946792676
Epoch: 16, step: 88, loss: 0.3490917980670929, mean loss: 0.35921029317545056
Epoch: 16, step: 89, loss: 0.31735244393348694, mean loss: 0.3592084884910821
Epoch: 16, step: 90, loss: 0.31188908219337463, mean loss: 0.3592064484218302
Epoch: 16, step: 91, loss: 0.29897746443748474, mean loss: 0.3592038518972577
Epoch: 16, step: 92, loss: 0.3269810378551483, mean loss: 0.3592024628032351
Epoch: 16, step: 93, loss: 0.3531593680381775, mean loss: 0.3592022023025555
Epoch: 16, step: 94, loss: 0.34294596314430237, mean loss: 0.3592015015723879
Epoch: 16, step: 95, loss: 0.3309635818004608, mean loss: 0.3592002844206736
Epoch: 16, step: 96, loss: 0.28927794098854065, mean loss: 0.3591972706564638
Epoch: 16, step: 97, loss: 0.37182509899139404, mean loss: 0.35919781491249064
Epoch: 16, step: 98, loss: 0.3807506561279297, mean loss: 0.3591987437941532
Epoch: 16, step: 99, loss: 0.39291536808013916, mean loss: 0.35920019684639787
Epoch: 16, step: 100, loss: 0.32908743619918823, mean loss: 0.3591988991622502
Epoch: 16, step: 101, loss: 0.31713607907295227, mean loss: 0.3591970865784318
Epoch: 16, step: 102, loss: 0.3467685282230377, mean loss: 0.3591965510262986
Epoch: 16, step: 103, loss: 0.3417063057422638, mean loss: 0.3591957973962881
Epoch: 16, step: 104, loss: 0.3748379051685333, mean loss: 0.35919647136361854
Epoch: 16, step: 105, loss: 0.3163314759731293, mean loss: 0.3591946245305556
Epoch: 16, step: 106, loss: 0.3418225646018982, mean loss: 0.35919387608973324
Epoch: 16, step: 107, loss: 0.3166253864765167, mean loss: 0.35919204218961204
Epoch: 16, step: 108, loss: 0.3597657084465027, mean loss: 0.359192066902758
Epoch: 16, step: 109, loss: 0.35760805010795593, mean loss: 0.3591919986673486
Epoch: 16, step: 110, loss: 0.3653198480606079, mean loss: 0.35919226262812365
Epoch: 16, step: 111, loss: 0.3426602780818939, mean loss: 0.35919155053368246
Epoch: 16, step: 112, loss: 0.29836925864219666, mean loss: 0.3591889308028003
Epoch: 16, step: 113, loss: 0.3168907165527344, mean loss: 0.3591871090173644
Epoch: 16, step: 114, loss: 0.36855003237724304, mean loss: 0.35918751226140416
Epoch: 16, step: 115, loss: 0.3582841157913208, mean loss: 0.35918747335544077
Epoch: 16, step: 116, loss: 0.31118619441986084, mean loss: 0.3591854062059237
Epoch: 16, step: 117, loss: 0.3394416868686676, mean loss: 0.35918455598977794
Epoch: 16, step: 118, loss: 0.3276579678058624, mean loss: 0.3591831984309706
Epoch: 16, step: 119, loss: 0.3634475767612457, mean loss: 0.3591833820504302
Epoch: 16, step: 120, loss: 0.3200967013835907, mean loss: 0.35918169909324327
Epoch: 16, step: 121, loss: 0.3246821463108063, mean loss: 0.35918021370821
Epoch: 16, step: 122, loss: 0.33001241087913513, mean loss: 0.35917895793678756
Epoch: 16, step: 123, loss: 0.33219921588897705, mean loss: 0.3591777964187039
Epoch: 16, step: 124, loss: 0.30763283371925354, mean loss: 0.35917557742681017
Epoch: 16, step: 125, loss: 0.3222162127494812, mean loss: 0.3591739864080983
Epoch: 16, step: 126, loss: 0.3590511381626129, mean loss: 0.3591739811199813
Epoch: 16, step: 127, loss: 0.34831956028938293, mean loss: 0.3591735139014538
Epoch: 16, step: 128, loss: 0.3252250850200653, mean loss: 0.35917205268555913
Epoch: 16, step: 129, loss: 0.3626265823841095, mean loss: 0.359172201369802
Epoch: 16, step: 130, loss: 0.3150806725025177, mean loss: 0.35917030373567815
Epoch: 16, step: 131, loss: 0.3185894191265106, mean loss: 0.3591685572696509
Epoch: 16, step: 132, loss: 0.40345990657806396, mean loss: 0.35917046333968183
Epoch: 16, step: 133, loss: 0.3140384554862976, mean loss: 0.35916852117564646
Epoch: 16, step: 134, loss: 0.37363380193710327, mean loss: 0.3591691436327557
Epoch: 16, step: 135, loss: 0.3236134350299835, mean loss: 0.3591676136969294
Epoch: 16, step: 136, loss: 0.33246976137161255, mean loss: 0.3591664649575324
Epoch: 16, step: 137, loss: 0.32415708899497986, mean loss: 0.35916495865962506
Epoch: 16, step: 138, loss: 0.30319836735725403, mean loss: 0.3591625507694516
Epoch: 16, step: 139, loss: 0.35064804553985596, mean loss: 0.3591621844596413
Epoch: 16, step: 140, loss: 0.41909611225128174, mean loss: 0.3591647628174727
Epoch: 16, step: 141, loss: 0.31264153122901917, mean loss: 0.35916276147394743
Epoch: 16, step: 142, loss: 0.3473799228668213, mean loss: 0.3591622546197896
Epoch: 16, step: 143, loss: 0.3388656973838806, mean loss: 0.35916138157448524
Epoch: 16, step: 144, loss: 0.3330007493495941, mean loss: 0.3591602563376052
Epoch: 16, step: 145, loss: 0.33652329444885254, mean loss: 0.35915928270483577
Epoch: 16, step: 146, loss: 0.3265001177787781, mean loss: 0.35915787806998456
Epoch: 16, step: 147, loss: 0.3194085359573364, mean loss: 0.3591561685679154
Epoch: 16, step: 148, loss: 0.329236775636673, mean loss: 0.3591548818783299
Epoch: 16, step: 149, loss: 0.3271160423755646, mean loss: 0.35915350410076463
Epoch: 16, step: 150, loss: 0.3125932216644287, mean loss: 0.35915150193854417
Epoch: 16, step: 151, loss: 0.3227560818195343, mean loss: 0.35914993694799896
Epoch: 16, step: 152, loss: 0.37422558665275574, mean loss: 0.35915058516787707
Epoch: 16, step: 153, loss: 0.3335055410861969, mean loss: 0.3591494825346291
Epoch: 16, step: 154, loss: 0.3696504831314087, mean loss: 0.3591499340158018
Epoch: 16, step: 155, loss: 0.3716064989566803, mean loss: 0.3591504695516978
Epoch: 16, step: 156, loss: 0.34302178025245667, mean loss: 0.35914977617268146
Epoch: 16, step: 157, loss: 0.3397013247013092, mean loss: 0.35914894011166043
Epoch: 16, step: 158, loss: 0.329140305519104, mean loss: 0.3591476501389745
Epoch: 16, step: 159, loss: 0.33141136169433594, mean loss: 0.3591464578982401
Epoch: 16, step: 160, loss: 0.3576328158378601, mean loss: 0.3591463928373306
Epoch: 16, step: 161, loss: 0.28348273038864136, mean loss: 0.3591431407242708
Epoch: 16, step: 162, loss: 0.3374718129634857, mean loss: 0.35914220930518964
Epoch: 16, step: 163, loss: 0.32377660274505615, mean loss: 0.35914068938054805
Epoch: 16, step: 164, loss: 0.34129205346107483, mean loss: 0.3591399223241245
Epoch: 16, step: 165, loss: 0.3218100368976593, mean loss: 0.35913831811761715
Epoch: 16, step: 166, loss: 0.33241593837738037, mean loss: 0.3591371698051364
Epoch: 16, step: 167, loss: 0.32155242562294006, mean loss: 0.35913555478519044
Epoch: 16, step: 168, loss: 0.35002627968788147, mean loss: 0.3591351633756129
Epoch: 16, step: 169, loss: 0.33402377367019653, mean loss: 0.3591340844295914
Epoch: 16, step: 170, loss: 0.32003629207611084, mean loss: 0.35913240461037105
Epoch: 16, step: 171, loss: 0.3452269732952118, mean loss: 0.3591318071953807
Epoch: 16, step: 172, loss: 0.34066343307495117, mean loss: 0.35913101377809664
Epoch: 16, step: 173, loss: 0.30950847268104553, mean loss: 0.3591288820425052
Epoch: 16, step: 174, loss: 0.3524029850959778, mean loss: 0.35912859311699524
Epoch: 16, step: 175, loss: 0.4134994447231293, mean loss: 0.35913092863467594
Epoch: 16, step: 176, loss: 0.3496248722076416, mean loss: 0.3591305203164582
Epoch: 16, step: 177, loss: 0.3633228540420532, mean loss: 0.3591307003840523
Epoch: 16, step: 178, loss: 0.30290281772613525, mean loss: 0.3591282854082048
Epoch: 16, step: 179, loss: 0.32671043276786804, mean loss: 0.3591268931279849
Epoch: 16, step: 180, loss: 0.34427475929260254, mean loss: 0.35912625528672076
Epoch: 16, step: 181, loss: 0.3262963891029358, mean loss: 0.3591248454324657
Epoch: 16, step: 182, loss: 0.3771428167819977, mean loss: 0.35912561916765484
Epoch: 16, step: 183, loss: 0.3009483218193054, mean loss: 0.35912312100133104
Epoch: 16, step: 184, loss: 0.3124251961708069, mean loss: 0.35912111585191153
Epoch: 16, step: 185, loss: 0.2997307777404785, mean loss: 0.35911856581592566
Epoch: 16, step: 186, loss: 0.32832229137420654, mean loss: 0.3591172435766727
Epoch: 16, step: 187, loss: 0.36825940012931824, mean loss: 0.35911763607867137
Epoch: 16, step: 188, loss: 0.31601303815841675, mean loss: 0.3591157855399722
Epoch: 16, step: 189, loss: 0.42526817321777344, mean loss: 0.35911862542954365
Epoch: 16, step: 190, loss: 0.33486294746398926, mean loss: 0.35911758418987993
Epoch: 16, step: 191, loss: 0.3331783711910248, mean loss: 0.35911647072778347
Epoch: 16, step: 192, loss: 0.33738642930984497, mean loss: 0.35911553798788487
Epoch: 16, step: 193, loss: 0.3154788315296173, mean loss: 0.3591136650070943
Epoch: 16, step: 194, loss: 0.33213767409324646, mean loss: 0.3591125071895522
Epoch: 16, step: 195, loss: 0.3231942355632782, mean loss: 0.35911096563283
Epoch: 16, step: 196, loss: 0.32482656836509705, mean loss: 0.35910949426261984
Epoch: 16, step: 197, loss: 0.30290326476097107, mean loss: 0.35910708218513715
Epoch: 16, step: 198, loss: 0.3053424656391144, mean loss: 0.3591047749879288
Epoch: 16, step: 199, loss: 0.3532942235469818, mean loss: 0.3591045256508433
Epoch: 16, step: 200, loss: 0.31801074743270874, mean loss: 0.3591027623477659
Epoch: 16, step: 201, loss: 0.3815251588821411, mean loss: 0.3591037244346334
Epoch: 16, step: 202, loss: 0.2944093644618988, mean loss: 0.35910094868657605
Epoch: 16, step: 203, loss: 0.3283851146697998, mean loss: 0.35909963086290964
Epoch: 16, step: 204, loss: 0.34486284852027893, mean loss: 0.3590990200781337
Epoch: 16, step: 205, loss: 0.3029744327068329, mean loss: 0.3590966123309277
Epoch: 16, step: 206, loss: 0.33943745493888855, mean loss: 0.35909576898841167
Epoch: 16, step: 207, loss: 0.31435537338256836, mean loss: 0.35909384978818837
Epoch: 16, step: 208, loss: 0.3125567138195038, mean loss: 0.35909185359996854
Epoch: 16, step: 209, loss: 0.32874876260757446, mean loss: 0.3590905521034003
Epoch: 16, step: 210, loss: 0.3290152847766876, mean loss: 0.35908926214983705
Epoch: 16, step: 211, loss: 0.32360705733299255, mean loss: 0.359087740353439
Epoch: 16, step: 212, loss: 0.39746779203414917, mean loss: 0.3590893863650048
Epoch: 16, step: 213, loss: 0.34605157375335693, mean loss: 0.35908882723417834
Epoch: 16, step: 214, loss: 0.35223883390426636, mean loss: 0.35908853348258823
Epoch: 16, step: 215, loss: 0.310156911611557, mean loss: 0.3590864352140689
Epoch: 16, step: 216, loss: 0.3523786664009094, mean loss: 0.35908614758623075
Epoch: 16, step: 217, loss: 0.3270155191421509, mean loss: 0.3590847724628089
Epoch: 16, step: 218, loss: 0.2910885810852051, mean loss: 0.35908185704920953
Epoch: 16, step: 219, loss: 0.36378246545791626, mean loss: 0.35908205858446973
Epoch: 16, step: 220, loss: 0.3269381523132324, mean loss: 0.3590806804963123
Epoch: 16, step: 221, loss: 0.3434123396873474, mean loss: 0.3590800087848826
Epoch: 16, step: 222, loss: 0.34624114632606506, mean loss: 0.3590794583985295
Epoch: 16, step: 223, loss: 0.34130480885505676, mean loss: 0.35907869645367596
Epoch: 16, step: 224, loss: 0.337181955575943, mean loss: 0.3590777578476115
Epoch: 16, step: 225, loss: 0.344407856464386, mean loss: 0.35907712904772365
Epoch: 16, step: 226, loss: 0.3548555076122284, mean loss: 0.35907694810299623
Epoch: 16, step: 227, loss: 0.31722232699394226, mean loss: 0.35907515423101316
Epoch: 16, step: 228, loss: 0.3412165641784668, mean loss: 0.35907438885193405
Epoch: 16, step: 229, loss: 0.3146926760673523, mean loss: 0.3590724868328724
Epoch: 16, step: 230, loss: 0.3062301576137543, mean loss: 0.3590702223233708
Epoch: 16, step: 231, loss: 0.34894654154777527, mean loss: 0.3590697885009173
Epoch: 16, step: 232, loss: 0.2792997658252716, mean loss: 0.35906637032280203
Epoch: 16, step: 233, loss: 0.320158451795578, mean loss: 0.3590647031740092
Epoch: 16, step: 234, loss: 0.34204399585723877, mean loss: 0.3590639738922355
Epoch: 16, step: 235, loss: 0.3007383346557617, mean loss: 0.35906147493597
Epoch: 16, step: 236, loss: 0.30689623951911926, mean loss: 0.359059240017354
Epoch: 16, step: 237, loss: 0.3175911605358124, mean loss: 0.3590574634738067
Epoch: 16, step: 238, loss: 0.3748714327812195, mean loss: 0.3590581409346861
Epoch: 16, step: 239, loss: 0.3342887759208679, mean loss: 0.3590570798755268
Epoch: 16, step: 240, loss: 0.333941787481308, mean loss: 0.35905600404376864
Epoch: 16, step: 241, loss: 0.329685240983963, mean loss: 0.3590547459797294
Epoch: 16, step: 242, loss: 0.34621813893318176, mean loss: 0.35905419616146383
Epoch: 16, step: 243, loss: 0.29973679780960083, mean loss: 0.35905165558418306
Epoch: 16, step: 244, loss: 0.34032392501831055, mean loss: 0.3590508535056972
Epoch: 16, step: 245, loss: 0.32214829325675964, mean loss: 0.3590492730962647
Epoch: 16, step: 246, loss: 0.33360159397125244, mean loss: 0.35904818330657157
Epoch: 16, step: 247, loss: 0.3604263365268707, mean loss: 0.3590482423230678
Epoch: 16, step: 248, loss: 0.35341042280197144, mean loss: 0.35904800090571154
Epoch: 16, step: 249, loss: 0.29649069905281067, mean loss: 0.359045322251012
Epoch: 16, step: 250, loss: 0.3805833160877228, mean loss: 0.35904624445156164
Epoch: 16, step: 251, loss: 0.35868650674819946, mean loss: 0.3590462290491938
Epoch: 16, step: 252, loss: 0.33140331506729126, mean loss: 0.3590450455532833
Epoch: 16, step: 253, loss: 0.31890714168548584, mean loss: 0.3590433271739757
Epoch: 16, step: 254, loss: 0.33067435026168823, mean loss: 0.3590421126966046
Epoch: 16, step: 255, loss: 0.32308855652809143, mean loss: 0.3590405735888919
Epoch: 16, step: 256, loss: 0.31805315613746643, mean loss: 0.3590388190656501
Epoch: 16, step: 257, loss: 0.29864248633384705, mean loss: 0.35903623382753985
Epoch: 16, step: 258, loss: 0.3445838689804077, mean loss: 0.3590356152269814
Epoch: 16, step: 259, loss: 0.3358462154865265, mean loss: 0.35903462270002795
Epoch: 16, step: 260, loss: 0.31980642676353455, mean loss: 0.3590329437701783
Epoch: 16, step: 261, loss: 0.3121608793735504, mean loss: 0.3590309377758106
Epoch: 16, step: 262, loss: 0.38501980900764465, mean loss: 0.35903204997982613
Epoch: 16, step: 263, loss: 0.3109806776046753, mean loss: 0.35902999369035443
Epoch: 16, step: 264, loss: 0.3249094784259796, mean loss: 0.3590285336143878
Epoch: 16, step: 265, loss: 0.351453572511673, mean loss: 0.3590282094825477
Epoch: 16, step: 266, loss: 0.2966623902320862, mean loss: 0.35902554096946526
Epoch: 16, step: 267, loss: 0.31326824426651, mean loss: 0.3590235831867893
Epoch: 16, step: 268, loss: 0.328498512506485, mean loss: 0.3590222771896695
Epoch: 16, step: 269, loss: 0.3682089149951935, mean loss: 0.35902267021772655
Epoch: 16, step: 270, loss: 0.3310673236846924, mean loss: 0.3590214742670727
Epoch: 16, step: 271, loss: 0.3237718939781189, mean loss: 0.35901996632814864
Epoch: 16, step: 272, loss: 0.3327924311161041, mean loss: 0.3590188443905513
Epoch: 16, step: 273, loss: 0.3914632797241211, mean loss: 0.359020232209669
Epoch: 16, step: 274, loss: 0.37367600202560425, mean loss: 0.35902085908720077
Epoch: 16, step: 275, loss: 0.2960754632949829, mean loss: 0.35901816681193166
Epoch: 16, step: 276, loss: 0.33555909991264343, mean loss: 0.3590171634730283
Epoch: 16, step: 277, loss: 0.35415521264076233, mean loss: 0.35901695553740126
Epoch: 16, step: 278, loss: 0.40091076493263245, mean loss: 0.3590187471727515
Epoch: 16, step: 279, loss: 0.3518396317958832, mean loss: 0.3590184401630279
Epoch: 16, step: 280, loss: 0.3291710615158081, mean loss: 0.35901716381585463
Epoch: 16, step: 281, loss: 0.3161681592464447, mean loss: 0.3590153315655951
Epoch: 16, step: 282, loss: 0.32685187458992004, mean loss: 0.35901395629484745
Epoch: 16, step: 283, loss: 0.3220193386077881, mean loss: 0.35901237451711154
Epoch: 16, step: 284, loss: 0.3500622510910034, mean loss: 0.3590119918533198
Epoch: 16, step: 285, loss: 0.33397746086120605, mean loss: 0.3590109215441709
Epoch: 16, step: 286, loss: 0.34243085980415344, mean loss: 0.3590102127219
Epoch: 16, step: 287, loss: 0.36148110032081604, mean loss: 0.35901031835149977
Epoch: 16, step: 288, loss: 0.3979577422142029, mean loss: 0.35901198326937533
Epoch: 16, step: 289, loss: 0.3463749289512634, mean loss: 0.3590114430858104
Epoch: 16, step: 290, loss: 0.3359121084213257, mean loss: 0.3590104557237816
Epoch: 16, step: 291, loss: 0.335377037525177, mean loss: 0.3590094455759701
Epoch: 16, step: 292, loss: 0.38330817222595215, mean loss: 0.3590104841162381
Epoch: 16, step: 293, loss: 0.35844290256500244, mean loss: 0.35901045985854296
Epoch: 16, step: 294, loss: 0.3083086311817169, mean loss: 0.3590082930211278
Epoch: 16, step: 295, loss: 0.33148640394210815, mean loss: 0.35900711687202186
Epoch: 16, step: 296, loss: 0.3412749469280243, mean loss: 0.3590063591193641
Epoch: 16, step: 297, loss: 0.31552979350090027, mean loss: 0.35900450130526196
Epoch: 16, step: 298, loss: 0.33847174048423767, mean loss: 0.35900362394933233
Epoch: 16, step: 299, loss: 0.3431532680988312, mean loss: 0.3590029466994669
Epoch: 16, step: 300, loss: 0.3513604402542114, mean loss: 0.3590026201663994
Epoch: 16, step: 301, loss: 0.3033958077430725, mean loss: 0.3590002444160609
Epoch: 16, step: 302, loss: 0.3304451107978821, mean loss: 0.3589990244761447
Epoch: 16, step: 303, loss: 0.3227764368057251, mean loss: 0.35899747703135354
Epoch: 16, step: 304, loss: 0.34357795119285583, mean loss: 0.3589968183306043
Epoch: 16, step: 305, loss: 0.34020474553108215, mean loss: 0.35899601559362015
Epoch: 16, step: 306, loss: 0.33736035227775574, mean loss: 0.35899509142706104
Epoch: 16, step: 307, loss: 0.3223632574081421, mean loss: 0.35899352676645885
Epoch: 16, step: 308, loss: 0.3102976679801941, mean loss: 0.35899144690233264
Epoch: 16, step: 309, loss: 0.2950434386730194, mean loss: 0.35898871571551155
Epoch: 16, step: 310, loss: 0.3400048315525055, mean loss: 0.3589879049581268
Epoch: 16, step: 311, loss: 0.3372877538204193, mean loss: 0.3589869782348975
Epoch: 16, step: 312, loss: 0.37049099802970886, mean loss: 0.35898746950277105
Epoch: 16, step: 313, loss: 0.3451615869998932, mean loss: 0.35898687910724186
Epoch: 16, step: 314, loss: 0.3464581072330475, mean loss: 0.35898634412402847
Epoch: 16, step: 315, loss: 0.33431476354599, mean loss: 0.3589852906833548
Epoch: 16, step: 316, loss: 0.3198654055595398, mean loss: 0.3589836203923713
Epoch: 16, step: 317, loss: 0.3407881259918213, mean loss: 0.35898284353751686
Epoch: 16, step: 318, loss: 0.3219340741634369, mean loss: 0.3589812618114624
Epoch: 16, step: 319, loss: 0.35006454586982727, mean loss: 0.358980881145652
Epoch: 16, step: 320, loss: 0.2933051586151123, mean loss: 0.3589780774862057
Epoch: 16, step: 321, loss: 0.3477885127067566, mean loss: 0.35897759983040534
Epoch: 16, step: 322, loss: 0.3559974730014801, mean loss: 0.3589774726213376
Epoch: 16, step: 323, loss: 0.35444724559783936, mean loss: 0.3589772792532728
Epoch: 16, step: 324, loss: 0.34663885831832886, mean loss: 0.3589767526229883
Epoch: 16, step: 325, loss: 0.33014237880706787, mean loss: 0.3589755219625608
Epoch: 16, step: 326, loss: 0.3370043635368347, mean loss: 0.35897458426641354
Epoch: 16, step: 327, loss: 0.368556410074234, mean loss: 0.35897499318694137
Epoch: 16, step: 328, loss: 0.3764614462852478, mean loss: 0.35897573941888344
Epoch: 16, step: 329, loss: 0.35087963938713074, mean loss: 0.35897539393368966
Epoch: 16, step: 330, loss: 0.3555160462856293, mean loss: 0.3589752463191111
Epoch: 16, step: 331, loss: 0.3258041739463806, mean loss: 0.35897383092943824
Epoch: 16, step: 332, loss: 0.3219423294067383, mean loss: 0.358972250884999
Epoch: 16, step: 333, loss: 0.3701642155647278, mean loss: 0.35897272839863836
Epoch: 16, step: 334, loss: 0.35212597250938416, mean loss: 0.3589724362890821
Epoch: 16, step: 335, loss: 0.3356783390045166, mean loss: 0.3589714425136007
Epoch: 16, step: 336, loss: 0.3616574704647064, mean loss: 0.35897155710034834
Epoch: 16, step: 337, loss: 0.34056535363197327, mean loss: 0.358970771919755
Epoch: 16, step: 338, loss: 0.32296544313430786, mean loss: 0.3589692360528103
Epoch: 16, step: 339, loss: 0.35276347398757935, mean loss: 0.3589689713470406
Epoch: 16, step: 340, loss: 0.3182539641857147, mean loss: 0.35896723472911946
Epoch: 16, step: 341, loss: 0.319316029548645, mean loss: 0.3589655435576966
Epoch: 16, step: 342, loss: 0.3177952170372009, mean loss: 0.3589637876688187
Epoch: 16, step: 343, loss: 0.3083292245864868, mean loss: 0.35896162822822325
Epoch: 16, step: 344, loss: 0.3131740093231201, mean loss: 0.35895967558124875
Epoch: 16, step: 345, loss: 0.316843181848526, mean loss: 0.3589578795687228
Epoch: 16, step: 346, loss: 0.31197381019592285, mean loss: 0.35895587606911206
Epoch: 16, step: 347, loss: 0.29952889680862427, mean loss: 0.358953342085688
Epoch: 16, step: 348, loss: 0.32487624883651733, mean loss: 0.3589518890906235
Epoch: 16, step: 349, loss: 0.35329344868659973, mean loss: 0.3589516478336778
Epoch: 16, step: 350, loss: 0.33037933707237244, mean loss: 0.3589504296579898
Epoch: 16, step: 351, loss: 0.3866177797317505, mean loss: 0.3589516092005407
Epoch: 16, step: 352, loss: 0.37729519605636597, mean loss: 0.358952391209615
Epoch: 16, step: 353, loss: 0.3801768720149994, mean loss: 0.3589532959960761
Epoch: 16, step: 354, loss: 0.3298845589160919, mean loss: 0.35895205686665543
Epoch: 16, step: 355, loss: 0.3650347590446472, mean loss: 0.3589523161463732
Epoch: 16, step: 356, loss: 0.32663294672966003, mean loss: 0.3589509385678635
Epoch: 16, step: 357, loss: 0.35502034425735474, mean loss: 0.3589507710376312
Epoch: 16, step: 358, loss: 0.3510546088218689, mean loss: 0.358950434500862
Epoch: 16, step: 359, loss: 0.3398793935775757, mean loss: 0.3589496217220978
Epoch: 16, step: 360, loss: 0.348810076713562, mean loss: 0.35894918960852407
Epoch: 16, step: 361, loss: 0.3393484950065613, mean loss: 0.35894835432792227
Epoch: 16, step: 362, loss: 0.32913485169410706, mean loss: 0.3589470838842084
Epoch: 16, step: 363, loss: 0.3536551594734192, mean loss: 0.3589468583888781
Epoch: 16, step: 364, loss: 0.31766876578330994, mean loss: 0.3589450995541341
Epoch: 16, step: 365, loss: 0.32085922360420227, mean loss: 0.35894347680696964
Epoch: 16, step: 366, loss: 0.3304154872894287, mean loss: 0.3589422613500433
Epoch: 16, step: 367, loss: 0.34568122029304504, mean loss: 0.3589416963772648
Epoch: 16, step: 368, loss: 0.3174516260623932, mean loss: 0.3589399288115376
Epoch: 16, step: 369, loss: 0.31631070375442505, mean loss: 0.3589381127927484
Epoch: 16, step: 370, loss: 0.3241245448589325, mean loss: 0.35893662978665963
Epoch: 16, step: 371, loss: 0.32999131083488464, mean loss: 0.35893539681175113
Epoch: 16, step: 372, loss: 0.3122175931930542, mean loss: 0.3589334068725077
Epoch: 16, step: 373, loss: 0.3163711428642273, mean loss: 0.3589315940151941
Epoch: 16, step: 374, loss: 0.3268653154373169, mean loss: 0.3589302282722503
Epoch: 16, step: 375, loss: 0.4013608396053314, mean loss: 0.3589320353681333
Epoch: 16, step: 376, loss: 0.33307555317878723, mean loss: 0.3589309342019909
Epoch: 16, step: 377, loss: 0.34337157011032104, mean loss: 0.35893027159386165
Epoch: 16, step: 378, loss: 0.33619973063468933, mean loss: 0.35892930363657516
Epoch: 16, step: 379, loss: 0.3020921051502228, mean loss: 0.3589268833845531
Epoch: 16, step: 380, loss: 0.32508760690689087, mean loss: 0.3589254424956249
Epoch: 16, step: 381, loss: 0.37217897176742554, mean loss: 0.35892600681178227
Epoch: 16, step: 382, loss: 0.3225732147693634, mean loss: 0.35892445902824066
Epoch: 16, step: 383, loss: 0.3171720802783966, mean loss: 0.35892268142355954
Epoch: 16, step: 384, loss: 0.32357582449913025, mean loss: 0.3589211765976017
Epoch: 16, step: 385, loss: 0.36704298853874207, mean loss: 0.35892152235375074
Epoch: 16, step: 386, loss: 0.29407158493995667, mean loss: 0.35891876172468373
Epoch: 16, step: 387, loss: 0.31757214665412903, mean loss: 0.3589170016950962
Epoch: 16, step: 388, loss: 0.35336849093437195, mean loss: 0.3589167655179047
Epoch: 16, step: 389, loss: 0.2986726462841034, mean loss: 0.35891420128366475
Epoch: 16, step: 390, loss: 0.3144480586051941, mean loss: 0.3589123087047042
Epoch: 16, step: 391, loss: 0.33060985803604126, mean loss: 0.358911104140069
Epoch: 16, step: 392, loss: 0.33136188983917236, mean loss: 0.35890993168340213
Epoch: 16, step: 393, loss: 0.31235456466674805, mean loss: 0.35890795043533774
Epoch: 16, step: 394, loss: 0.3080022931098938, mean loss: 0.3589057841449711
Epoch: 16, step: 395, loss: 0.3160196840763092, mean loss: 0.35890395920454266
Epoch: 16, step: 396, loss: 0.2890684902667999, mean loss: 0.3589009876089111
Epoch: 16, step: 397, loss: 0.3016245365142822, mean loss: 0.3588985505205316
Epoch: 16, step: 398, loss: 0.335801899433136, mean loss: 0.35889756780976756
Epoch: 16, step: 399, loss: 0.34392473101615906, mean loss: 0.3588969307762076
Epoch: 16, step: 400, loss: 0.31238314509391785, mean loss: 0.35889495188721876
Epoch: 16, step: 401, loss: 0.3428279161453247, mean loss: 0.35889426835808824
Epoch: 16, step: 402, loss: 0.37727776169776917, mean loss: 0.3588950504014515
Epoch: 16, step: 403, loss: 0.32005423307418823, mean loss: 0.3588933981631782
Epoch: 16, step: 404, loss: 0.36074912548065186, mean loss: 0.35889347710006697
Epoch: 16, step: 405, loss: 0.3101368248462677, mean loss: 0.35889140323140456
Epoch: 16, step: 406, loss: 0.3333338499069214, mean loss: 0.3588903161847743
Epoch: 16, step: 407, loss: 0.329575777053833, mean loss: 0.3588890693942362
Epoch: 16, step: 408, loss: 0.31357541680336, mean loss: 0.3588871422197969
Epoch: 16, step: 409, loss: 0.3529950678348541, mean loss: 0.3588868916425074
Epoch: 16, step: 410, loss: 0.3368230164051056, mean loss: 0.3588859533531076
Epoch: 16, step: 411, loss: 0.3133171796798706, mean loss: 0.3588840155756933
Epoch: 16, step: 412, loss: 0.30861422419548035, mean loss: 0.35888187798197896
Epoch: 16, step: 413, loss: 0.33341696858406067, mean loss: 0.3588807951981794
Epoch: 16, step: 414, loss: 0.34064966440200806, mean loss: 0.35888002003210956
Epoch: 16, step: 415, loss: 0.3369026482105255, mean loss: 0.35887908562004234
Epoch: 16, step: 416, loss: 0.35781100392341614, mean loss: 0.3588790402103363
Epoch: 16, step: 417, loss: 0.3227604627609253, mean loss: 0.3588775046871049
Epoch: 16, step: 418, loss: 0.3525565266609192, mean loss: 0.35887723597231397
Epoch: 16, step: 419, loss: 0.3376403748989105, mean loss: 0.35887633319808027
Epoch: 16, step: 420, loss: 0.28574907779693604, mean loss: 0.3588732247068836
Epoch: 16, step: 421, loss: 0.3475721776485443, mean loss: 0.3588727443427308
Epoch: 16, step: 422, loss: 0.351940393447876, mean loss: 0.3588724496876156
Epoch: 16, step: 423, loss: 0.3183225989341736, mean loss: 0.3588707262155503
Epoch: 16, step: 424, loss: 0.3666253685951233, mean loss: 0.358871055793619
Epoch: 16, step: 425, loss: 0.3092591166496277, mean loss: 0.3588689473389167
Epoch: 16, step: 426, loss: 0.3299073278903961, mean loss: 0.3588677165531682
Epoch: 16, step: 427, loss: 0.314644455909729, mean loss: 0.3588658372713118
Epoch: 16, step: 428, loss: 0.33708715438842773, mean loss: 0.3588649118184209
Epoch: 16, step: 429, loss: 0.3635270297527313, mean loss: 0.35886510991980336
Epoch: 16, step: 430, loss: 0.32487404346466064, mean loss: 0.3588636656424949
Epoch: 16, step: 431, loss: 0.32253551483154297, mean loss: 0.3588621221282694
Epoch: 16, step: 432, loss: 0.35798490047454834, mean loss: 0.3588620848583687
Epoch: 16, step: 433, loss: 0.34148433804512024, mean loss: 0.3588613465736031
Epoch: 16, step: 434, loss: 0.3107467591762543, mean loss: 0.35885930253658377
Epoch: 16, step: 435, loss: 0.36183252930641174, mean loss: 0.3588594288418841
Epoch: 16, step: 436, loss: 0.2920289933681488, mean loss: 0.3588565899465324
Epoch: 16, step: 437, loss: 0.3199184834957123, mean loss: 0.35885493596189005
Epoch: 16, step: 438, loss: 0.3461708426475525, mean loss: 0.3588543971990597
Epoch: 16, step: 439, loss: 0.33296480774879456, mean loss: 0.35885329757327605
Epoch: 16, step: 440, loss: 0.3444352447986603, mean loss: 0.35885268521172264
Epoch: 16, step: 441, loss: 0.28818178176879883, mean loss: 0.3588496838143115
Epoch: 16, step: 442, loss: 0.37579435110092163, mean loss: 0.3588504034247624
Epoch: 16, step: 443, loss: 0.29658275842666626, mean loss: 0.3588477591388358
Epoch: 16, step: 444, loss: 0.3392795920372009, mean loss: 0.35884692818350433
Epoch: 16, step: 445, loss: 0.31889548897743225, mean loss: 0.3588452317317334
Epoch: 16, step: 446, loss: 0.3288654386997223, mean loss: 0.35884395875848246
Epoch: 16, step: 447, loss: 0.3440585434436798, mean loss: 0.35884333098099797
Epoch: 16, step: 448, loss: 0.38597726821899414, mean loss: 0.3588444830184131
Epoch: 16, step: 449, loss: 0.3091047406196594, mean loss: 0.3588423712861214
Epoch: 16, step: 450, loss: 0.36159005761146545, mean loss: 0.35884248793593354
Epoch: 16, step: 451, loss: 0.4015159606933594, mean loss: 0.3588442995114454
Epoch: 16, step: 452, loss: 0.29992610216140747, mean loss: 0.35884179842058705
Epoch: 16, step: 453, loss: 0.3480668365955353, mean loss: 0.35884134104042636
Epoch: 16, step: 454, loss: 0.324055016040802, mean loss: 0.3588398644783906
Epoch: 16, step: 455, loss: 0.37566834688186646, mean loss: 0.35884057876032627
Epoch: 16, step: 456, loss: 0.35242190957069397, mean loss: 0.35884030633261993
Epoch: 16, step: 457, loss: 0.329374223947525, mean loss: 0.3588390557561669
Epoch: 16, step: 458, loss: 0.31936827301979065, mean loss: 0.3588373806391302
Epoch: 16, step: 459, loss: 0.4178195893764496, mean loss: 0.3588398837034969
Epoch: 16, step: 460, loss: 0.3367321193218231, mean loss: 0.3588389455424792
Epoch: 16, step: 461, loss: 0.3072546124458313, mean loss: 0.3588367566121093
Epoch: 16, step: 462, loss: 0.3462812900543213, mean loss: 0.35883622385585867
Epoch: 16, step: 463, loss: 0.33231228590011597, mean loss: 0.3588350984341871
Epoch: 16, step: 464, loss: 0.3260855972766876, mean loss: 0.35883370891824845
Epoch: 16, step: 465, loss: 0.3168315291404724, mean loss: 0.3588319268995901
Epoch: 16, step: 466, loss: 0.32673555612564087, mean loss: 0.35883056521061746
Epoch: 16, step: 467, loss: 0.3311708867549896, mean loss: 0.35882939179815965
Epoch: 16, step: 468, loss: 0.3183116018772125, mean loss: 0.35882767297620566
Epoch: 16, step: 469, loss: 0.3535557687282562, mean loss: 0.358827449344058
Epoch: 16, step: 470, loss: 0.3521362245082855, mean loss: 0.35882716551691757
Epoch: 16, step: 471, loss: 0.3100903034210205, mean loss: 0.3588250982933811
Epoch: 16, step: 472, loss: 0.3638041913509369, mean loss: 0.35882530947771574
Epoch: 16, step: 473, loss: 0.3471539616584778, mean loss: 0.35882481446762926
Epoch: 16, step: 474, loss: 0.3471272885799408, mean loss: 0.35882431836830836
Epoch: 16, step: 475, loss: 0.32543349266052246, mean loss: 0.3588229023027567
Epoch: 16, step: 476, loss: 0.30874761939048767, mean loss: 0.3588207787591024
Epoch: 16, step: 477, loss: 0.34472787380218506, mean loss: 0.3588201811463063
Epoch: 16, step: 478, loss: 0.32737067341804504, mean loss: 0.35881884757942645
Epoch: 16, step: 479, loss: 0.31701281666755676, mean loss: 0.35881707493564624
Epoch: 16, step: 480, loss: 0.30556127429008484, mean loss: 0.358814816898731
Epoch: 16, step: 481, loss: 0.3444027304649353, mean loss: 0.35881420585461865
Epoch: 16, step: 482, loss: 0.3216933012008667, mean loss: 0.35881263206801356
Epoch: 16, step: 483, loss: 0.33927032351493835, mean loss: 0.35881180358282816
Epoch: 16, step: 484, loss: 0.33984699845314026, mean loss: 0.3588109996146595
Epoch: 16, step: 485, loss: 0.383912593126297, mean loss: 0.3588120636923836
Epoch: 16, step: 486, loss: 0.31625697016716003, mean loss: 0.3588102598225381
Epoch: 16, step: 487, loss: 0.34143301844596863, mean loss: 0.35880952324906507
Epoch: 16, step: 488, loss: 0.31938859820365906, mean loss: 0.358807852375287
Epoch: 16, step: 489, loss: 0.3271869719028473, mean loss: 0.35880651216673937
Epoch: 16, step: 490, loss: 0.3388836979866028, mean loss: 0.35880566780080675
Epoch: 16, step: 491, loss: 0.31414899230003357, mean loss: 0.35880377524802237
Epoch: 16, step: 492, loss: 0.3412742018699646, mean loss: 0.3588030323750564
Epoch: 16, step: 493, loss: 0.33146825432777405, mean loss: 0.35880187402358393
Epoch: 16, step: 494, loss: 0.3740352988243103, mean loss: 0.35880251953503783
Epoch: 16, step: 495, loss: 0.3149304986000061, mean loss: 0.3588006605510999
Epoch: 16, step: 496, loss: 0.31308209896087646, mean loss: 0.3587987234059963
Epoch: 16, step: 497, loss: 0.31476011872291565, mean loss: 0.35879685752155077
Epoch: 16, step: 498, loss: 0.297624409198761, mean loss: 0.35879426579811213
Epoch: 16, step: 499, loss: 0.3227977752685547, mean loss: 0.3587927407815671
Epoch: 16, step: 500, loss: 0.3223611116409302, mean loss: 0.3587911973954565
Epoch: 16, step: 501, loss: 0.30781713128089905, mean loss: 0.35878903802639295
Epoch: 16, step: 502, loss: 0.3086767792701721, mean loss: 0.3587869152552337
Epoch: 16, step: 503, loss: 0.34457188844680786, mean loss: 0.3587863131277003
Epoch: 16, step: 504, loss: 0.3243744671344757, mean loss: 0.358784855554487
Epoch: 16, step: 505, loss: 0.3919968605041504, mean loss: 0.3587862622467763
Epoch: 16, step: 506, loss: 0.33808714151382446, mean loss: 0.35878538557400796
Epoch: 16, step: 507, loss: 0.3078693747520447, mean loss: 0.3587832292123774
Epoch: 16, step: 508, loss: 0.3177945613861084, mean loss: 0.35878149336060816
Epoch: 16, step: 509, loss: 0.3136891722679138, mean loss: 0.35877958380182556
Epoch: 16, step: 510, loss: 0.36037904024124146, mean loss: 0.3587796515323544
Epoch: 16, step: 511, loss: 0.3108002841472626, mean loss: 0.3587776198857002
Epoch: 16, step: 512, loss: 0.3468644917011261, mean loss: 0.35877711545549384
Epoch: 16, step: 513, loss: 0.30775272846221924, mean loss: 0.35877495505296214
Epoch: 16, step: 514, loss: 0.33487918972969055, mean loss: 0.35877394333505186
Epoch: 16, step: 515, loss: 0.3240529000759125, mean loss: 0.3587724733501552
Epoch: 16, step: 516, loss: 0.39455121755599976, mean loss: 0.3587739880508117
Epoch: 16, step: 517, loss: 0.3216593563556671, mean loss: 0.3587724168615942
Epoch: 16, step: 518, loss: 0.33066999912261963, mean loss: 0.358771227240558
Epoch: 16, step: 519, loss: 0.31808796525001526, mean loss: 0.35876950512482864
Epoch: 16, step: 520, loss: 0.2892496585845947, mean loss: 0.3587665624858216
Epoch: 16, step: 521, loss: 0.3372606635093689, mean loss: 0.3587656522217491
Epoch: 16, step: 522, loss: 0.3529798090457916, mean loss: 0.3587654073390651
Epoch: 16, step: 523, loss: 0.30649110674858093, mean loss: 0.3587631949511952
Epoch: 16, step: 524, loss: 0.3203434646129608, mean loss: 0.35876156899451744
Epoch: 16, step: 525, loss: 0.37114009261131287, mean loss: 0.3587620928423218
Epoch: 16, step: 526, loss: 0.31069067120552063, mean loss: 0.35876005858978754
Epoch: 16, step: 527, loss: 0.290842741727829, mean loss: 0.358757184634267
Epoch: 16, step: 528, loss: 0.3611263334751129, mean loss: 0.3587572848817532
Epoch: 16, step: 529, loss: 0.31638237833976746, mean loss: 0.35875549191794925
Epoch: 16, step: 530, loss: 0.3416535258293152, mean loss: 0.35875476833148473
Epoch: 16, step: 531, loss: 0.3256470561027527, mean loss: 0.35875336759903304
Epoch: 16, step: 532, loss: 0.3734545409679413, mean loss: 0.35875398955500754
Epoch: 16, step: 533, loss: 0.3188326954841614, mean loss: 0.3587523006941026
Epoch: 16, step: 534, loss: 0.2847820818424225, mean loss: 0.3587491715338652
Epoch: 16, step: 535, loss: 0.3034036457538605, mean loss: 0.35874683035257166
Epoch: 16, step: 536, loss: 0.35113897919654846, mean loss: 0.3587465085450696
Epoch: 16, step: 537, loss: 0.3601888120174408, mean loss: 0.35874656955105355
Epoch: 16, step: 538, loss: 0.32204920053482056, mean loss: 0.35874501740585135
Epoch: 16, step: 539, loss: 0.32738038897514343, mean loss: 0.3587436908693757
Epoch: 16, step: 540, loss: 0.3331994116306305, mean loss: 0.3587426105446035
Epoch: 16, step: 541, loss: 0.33488962054252625, mean loss: 0.358741601790903
Epoch: 16, step: 542, loss: 0.3366401195526123, mean loss: 0.35874066714878183
Epoch: 16, step: 543, loss: 0.3080865442752838, mean loss: 0.35873852514426247
Epoch: 16, step: 544, loss: 0.36964479088783264, mean loss: 0.3587389863166479
Epoch: 16, step: 545, loss: 0.372002512216568, mean loss: 0.35873954714226736
Epoch: 16, step: 546, loss: 0.34274595975875854, mean loss: 0.35873887090923773
Epoch: 16, step: 547, loss: 0.31411242485046387, mean loss: 0.3587369841154757
Epoch: 16, step: 548, loss: 0.3866705298423767, mean loss: 0.35873816508811035
Epoch: 16, step: 549, loss: 0.3349732458591461, mean loss: 0.35873716039887266
Epoch: 16, step: 550, loss: 0.35322922468185425, mean loss: 0.358736927554412
Epoch: 16, step: 551, loss: 0.35820960998535156, mean loss: 0.3587369052633413
Epoch: 16, step: 552, loss: 0.3535064458847046, mean loss: 0.35873668416770876
Epoch: 16, step: 553, loss: 0.3557804226875305, mean loss: 0.3587365592094925
Epoch: 16, step: 554, loss: 0.351218044757843, mean loss: 0.3587362414228383
Epoch: 16, step: 555, loss: 0.3233377933502197, mean loss: 0.3587347452923196
Epoch: 16, step: 556, loss: 0.3340059518814087, mean loss: 0.35873370016348266
Epoch: 16, step: 557, loss: 0.31577184796333313, mean loss: 0.35873188451593807
Epoch: 16, step: 558, loss: 0.36967355012893677, mean loss: 0.35873234691147593
Epoch: 16, step: 559, loss: 0.3329768180847168, mean loss: 0.35873125852705967
Epoch: 16, step: 560, loss: 0.33140334486961365, mean loss: 0.3587301037451599
Epoch: 16, step: 561, loss: 0.3521086573600769, mean loss: 0.35872982395785386
Epoch: 16, step: 562, loss: 0.333132803440094, mean loss: 0.35872874240883973
Epoch: 16, step: 563, loss: 0.32488274574279785, mean loss: 0.3587273123768697
Epoch: 16, step: 564, loss: 0.35415053367614746, mean loss: 0.35872711901091847
Epoch: 16, step: 565, loss: 0.35247349739074707, mean loss: 0.3587268548105965
Epoch: 16, step: 566, loss: 0.35663309693336487, mean loss: 0.3587267663581493
Epoch: 16, step: 567, loss: 0.34639057517051697, mean loss: 0.3587262452280721
Epoch: 16, step: 568, loss: 0.3258833587169647, mean loss: 0.3587248578717374
Epoch: 16, step: 569, loss: 0.31310203671455383, mean loss: 0.35872293074403794
Epoch: 16, step: 570, loss: 0.34248846769332886, mean loss: 0.3587222450222618
Epoch: 16, step: 571, loss: 0.33134713768959045, mean loss: 0.35872108878356723
Epoch: 16, step: 572, loss: 0.32370874285697937, mean loss: 0.35871961003432
Epoch: 16, step: 573, loss: 0.3391169309616089, mean loss: 0.358718782148558
Epoch: 16, step: 574, loss: 0.31380611658096313, mean loss: 0.35871688541873126
Epoch: 16, step: 575, loss: 0.37029165029525757, mean loss: 0.35871737421792366
Epoch: 16, step: 576, loss: 0.3345088064670563, mean loss: 0.35871635193982093
Epoch: 16, step: 577, loss: 0.3444436192512512, mean loss: 0.3587157492570793
Epoch: 16, step: 578, loss: 0.3182010352611542, mean loss: 0.35871403854838546
Epoch: 16, step: 579, loss: 0.31594714522361755, mean loss: 0.35871223281906084
Epoch: 16, step: 580, loss: 0.35276761651039124, mean loss: 0.35871198183251624
Epoch: 16, step: 581, loss: 0.3033684194087982, mean loss: 0.35870964528086446
Epoch: 16, step: 582, loss: 0.3677802085876465, mean loss: 0.35871002821510295
Epoch: 16, step: 583, loss: 0.3731708228588104, mean loss: 0.35871063868431285
Epoch: 16, step: 584, loss: 0.34259268641471863, mean loss: 0.358709958286142
Epoch: 16, step: 585, loss: 0.33349454402923584, mean loss: 0.3587088938955022
Epoch: 16, step: 586, loss: 0.329363614320755, mean loss: 0.3587076552276716
Epoch: 16, step: 587, loss: 0.3158831298351288, mean loss: 0.35870584767552777
Epoch: 16, step: 588, loss: 0.38732489943504333, mean loss: 0.3587070555872215
Epoch: 16, step: 589, loss: 0.3833489418029785, mean loss: 0.3587080955925484
Epoch: 16, step: 590, loss: 0.31837332248687744, mean loss: 0.35870639334426374
Epoch: 16, step: 591, loss: 0.3113681674003601, mean loss: 0.35870439561359424
Epoch: 16, step: 592, loss: 0.3564276695251465, mean loss: 0.35870429953704075
Epoch: 16, step: 593, loss: 0.31983470916748047, mean loss: 0.35870265933152257
Epoch: 16, step: 594, loss: 0.36462682485580444, mean loss: 0.3587029093068601
Epoch: 16, step: 595, loss: 0.34727275371551514, mean loss: 0.35870242702181404
Epoch: 16, step: 596, loss: 0.3255425989627838, mean loss: 0.3587010279319841
Epoch: 16, step: 597, loss: 0.3805749714374542, mean loss: 0.35870195080530726
Epoch: 16, step: 598, loss: 0.31009209156036377, mean loss: 0.35869990001598756
Epoch: 16, step: 599, loss: 0.345705509185791, mean loss: 0.3586993518219768
Epoch: 16, step: 600, loss: 0.3267562687397003, mean loss: 0.35869800429685206
Epoch: 16, step: 601, loss: 0.32555779814720154, mean loss: 0.3586966063298332
Epoch: 16, step: 602, loss: 0.33298662304878235, mean loss: 0.3586955218407253
Epoch: 16, step: 603, loss: 0.31530147790908813, mean loss: 0.3586936914862487
Epoch: 16, step: 604, loss: 0.3629232347011566, mean loss: 0.35869386988024315
Epoch: 16, step: 605, loss: 0.33471429347991943, mean loss: 0.35869285851050886
Epoch: 16, step: 606, loss: 0.3218276798725128, mean loss: 0.3586913037393631
Epoch: 16, step: 607, loss: 0.34254589676856995, mean loss: 0.3586906228433201
Epoch: 16, step: 608, loss: 0.3139983117580414, mean loss: 0.3586887381256089
Epoch: 16, step: 609, loss: 0.33067139983177185, mean loss: 0.3586875566573499
Epoch: 16, step: 610, loss: 0.32800841331481934, mean loss: 0.35868626299749995
Epoch: 16, step: 611, loss: 0.32452234625816345, mean loss: 0.3586848224545442
Epoch: 16, step: 612, loss: 0.33605581521987915, mean loss: 0.35868386832850657
Epoch: 16, step: 613, loss: 0.38116681575775146, mean loss: 0.3586848162561324
Epoch: 16, step: 614, loss: 0.35545843839645386, mean loss: 0.3586846802310951
Epoch: 16, step: 615, loss: 0.37221869826316833, mean loss: 0.35868525080521113
Epoch: 16, step: 616, loss: 0.33033105731010437, mean loss: 0.35868405548488336
Epoch: 16, step: 617, loss: 0.3035689890384674, mean loss: 0.35868173211137155
Epoch: 16, step: 618, loss: 0.37775886058807373, mean loss: 0.35868253627309127
Epoch: 16, step: 619, loss: 0.3108382523059845, mean loss: 0.35868051956916414
Epoch: 16, step: 620, loss: 0.3174647092819214, mean loss: 0.3586787823379613
Epoch: 16, step: 621, loss: 0.31590381264686584, mean loss: 0.3586769794647551
Epoch: 16, step: 622, loss: 0.3432827591896057, mean loss: 0.3586763306587419
Epoch: 16, step: 623, loss: 0.31318214535713196, mean loss: 0.35867441333805317
Epoch: 16, step: 624, loss: 0.32920873165130615, mean loss: 0.3586731715797959
Epoch: 16, step: 625, loss: 0.34209632873535156, mean loss: 0.3586724730192041
Epoch: 16, step: 626, loss: 0.3287256062030792, mean loss: 0.35867121108895184
Epoch: 16, step: 627, loss: 0.33769428730010986, mean loss: 0.35867032718014563
Epoch: 16, step: 628, loss: 0.3499175012111664, mean loss: 0.3586699583761188
Epoch: 16, step: 629, loss: 0.3560192584991455, mean loss: 0.35866984669246343
Epoch: 16, step: 630, loss: 0.3156264126300812, mean loss: 0.35866803319197627
Epoch: 16, step: 631, loss: 0.3345372676849365, mean loss: 0.35866701656046684
Epoch: 16, step: 632, loss: 0.3301609754562378, mean loss: 0.35866581564876343
Epoch: 16, step: 633, loss: 0.32878217101097107, mean loss: 0.3586645567539687
Epoch: 16, step: 634, loss: 0.3486674726009369, mean loss: 0.3586641356290623
Epoch: 16, step: 635, loss: 0.34529879689216614, mean loss: 0.3586635726409099
Epoch: 16, step: 636, loss: 0.3137846887111664, mean loss: 0.3586616822873473
Epoch: 16, step: 637, loss: 0.3344850242137909, mean loss: 0.35866066397978796
Epoch: 16, step: 638, loss: 0.3297519385814667, mean loss: 0.35865944641143527
Epoch: 16, step: 639, loss: 0.31005892157554626, mean loss: 0.3586573995564472
Epoch: 16, step: 640, loss: 0.3224172592163086, mean loss: 0.35865587333449145
Epoch: 16, step: 641, loss: 0.3066945970058441, mean loss: 0.3586536851227367
Epoch: 16, step: 642, loss: 0.33296340703964233, mean loss: 0.3586526032901649
Epoch: 16, step: 643, loss: 0.32937538623809814, mean loss: 0.35865137046141926
Epoch: 16, step: 644, loss: 0.34731346368789673, mean loss: 0.35865089305576964
Epoch: 16, step: 645, loss: 0.34694135189056396, mean loss: 0.3586504000224574
Epoch: 16, step: 646, loss: 0.336129367351532, mean loss: 0.358649451808375
Epoch: 16, step: 647, loss: 0.30645114183425903, mean loss: 0.35864725416986143
Epoch: 16, step: 648, loss: 0.3257666826248169, mean loss: 0.35864586989959896
Epoch: 16, step: 649, loss: 0.3362017869949341, mean loss: 0.35864492504471535
Epoch: 16, step: 650, loss: 0.39952313899993896, mean loss: 0.35864664587039224
Epoch: 16, step: 651, loss: 0.31960442662239075, mean loss: 0.3586450024026684
Epoch: 16, step: 652, loss: 0.3579798638820648, mean loss: 0.35864497440508786
Epoch: 16, step: 653, loss: 0.31121334433555603, mean loss: 0.3586429779563098
Epoch: 16, step: 654, loss: 0.3153226971626282, mean loss: 0.35864115463542956
Epoch: 16, step: 655, loss: 0.3524318337440491, mean loss: 0.3586408933003752
Epoch: 16, step: 656, loss: 0.36271893978118896, mean loss: 0.3586410649281047
Epoch: 16, step: 657, loss: 0.3075905740261078, mean loss: 0.3586389165192628
Epoch: 16, step: 658, loss: 0.35096266865730286, mean loss: 0.35863859348564486
Epoch: 16, step: 659, loss: 0.3523297607898712, mean loss: 0.3586383280070766
Epoch: 16, step: 660, loss: 0.3321349024772644, mean loss: 0.3586372127777255
Epoch: 16, step: 661, loss: 0.3538026809692383, mean loss: 0.3586370093555338
Epoch: 16, step: 662, loss: 0.32934632897377014, mean loss: 0.35863577694587406
Epoch: 16, step: 663, loss: 0.36796826124191284, mean loss: 0.35863616959499456
Epoch: 16, step: 664, loss: 0.3436183035373688, mean loss: 0.3586355377692527
Epoch: 16, step: 665, loss: 0.3114067316055298, mean loss: 0.35863355086112636
Epoch: 16, step: 666, loss: 0.34459978342056274, mean loss: 0.3586329604876696
Epoch: 16, step: 667, loss: 0.3163358271121979, mean loss: 0.3586311812039167
Epoch: 16, step: 668, loss: 0.3519554138183594, mean loss: 0.3586309003909193
Epoch: 16, step: 669, loss: 0.3276505172252655, mean loss: 0.3586295972705708
Epoch: 16, step: 670, loss: 0.3751608431339264, mean loss: 0.35863029259111184
Epoch: 16, step: 671, loss: 0.27673694491386414, mean loss: 0.35862684822083607
Epoch: 16, step: 672, loss: 0.32117995619773865, mean loss: 0.3586252733000293
Epoch: 16, step: 673, loss: 0.33549243211746216, mean loss: 0.35862430043262317
Epoch: 16, step: 674, loss: 0.31229570508003235, mean loss: 0.35862235213389937
Epoch: 16, step: 675, loss: 0.3197622001171112, mean loss: 0.3586207179811653
Epoch: 16, step: 676, loss: 0.31122249364852905, mean loss: 0.35861872486799373
Epoch: 16, step: 677, loss: 0.3829999566078186, mean loss: 0.35861975006485436
Epoch: 16, step: 678, loss: 0.34573614597320557, mean loss: 0.35861920835001215
Epoch: 16, step: 679, loss: 0.3098576068878174, mean loss: 0.3586171581649524
Epoch: 16, step: 680, loss: 0.351278156042099, mean loss: 0.35861684960905066
Epoch: 16, step: 681, loss: 0.3413255512714386, mean loss: 0.35861612265629117
Epoch: 16, step: 682, loss: 0.3394812047481537, mean loss: 0.3586153182287506
Epoch: 16, step: 683, loss: 0.3453003466129303, mean loss: 0.3586147584939425
Epoch: 16, step: 684, loss: 0.33220672607421875, mean loss: 0.3586136483996796
Epoch: 16, step: 685, loss: 0.3364044427871704, mean loss: 0.3586127148475311
Epoch: 16, step: 686, loss: 0.3500567376613617, mean loss: 0.3586123552166965
Epoch: 16, step: 687, loss: 0.34877148270606995, mean loss: 0.3586119415956259
Epoch: 16, step: 688, loss: 0.32528629899024963, mean loss: 0.35861054094658606
Epoch: 16, step: 689, loss: 0.3352452218532562, mean loss: 0.3586095589629308
Epoch: 16, step: 690, loss: 0.32818636298179626, mean loss: 0.35860828040878157
Epoch: 16, step: 691, loss: 0.36244648694992065, mean loss: 0.3586084417050726
Epoch: 16, step: 692, loss: 0.30666765570640564, mean loss: 0.3586062590439809
Epoch: 16, step: 693, loss: 0.3105829954147339, mean loss: 0.3586042410902189
Epoch: 16, step: 694, loss: 0.3391292095184326, mean loss: 0.35860342277719853
Epoch: 16, step: 695, loss: 0.3628181517124176, mean loss: 0.3586035998666496
Epoch: 16, step: 696, loss: 0.32682305574417114, mean loss: 0.35860226460577305
Epoch: 16, step: 697, loss: 0.3379153609275818, mean loss: 0.3586013954811752
Epoch: 16, step: 698, loss: 0.35668495297431946, mean loss: 0.3586013149685294
Epoch: 16, step: 699, loss: 0.3267778158187866, mean loss: 0.358599978071405
Epoch: 16, step: 700, loss: 0.34976330399513245, mean loss: 0.3585996068605637
Epoch: 16, step: 701, loss: 0.34582966566085815, mean loss: 0.3585990704436436
Epoch: 16, step: 702, loss: 0.3715435266494751, mean loss: 0.35859961416843905
Epoch: 16, step: 703, loss: 0.29921719431877136, mean loss: 0.3585971199471752
Epoch: 16, step: 704, loss: 0.35319599509239197, mean loss: 0.3585968930949405
Epoch: 16, step: 705, loss: 0.34391647577285767, mean loss: 0.3585962765297443
Epoch: 16, step: 706, loss: 0.349191278219223, mean loss: 0.35859588154430433
Epoch: 16, step: 707, loss: 0.3265562653541565, mean loss: 0.35859453602035885
Epoch: 16, step: 708, loss: 0.2970646321773529, mean loss: 0.35859195214164374
Epoch: 16, step: 709, loss: 0.3597196936607361, mean loss: 0.35859199949788456
Epoch: 16, step: 710, loss: 0.3130796551704407, mean loss: 0.35859008841897094
Epoch: 16, step: 711, loss: 0.33778420090675354, mean loss: 0.35858921480931727
Epoch: 16, step: 712, loss: 0.3731372654438019, mean loss: 0.35858982563564445
Epoch: 16, step: 713, loss: 0.2946960926055908, mean loss: 0.3585871430538563
Epoch: 16, step: 714, loss: 0.3373253047466278, mean loss: 0.3585862504119189
Epoch: 16, step: 715, loss: 0.35027816891670227, mean loss: 0.3585859016259619
Epoch: 16, step: 716, loss: 0.28621706366539, mean loss: 0.35858286359909647
Epoch: 16, step: 717, loss: 0.3389405906200409, mean loss: 0.3585820390556921
Epoch: 16, step: 718, loss: 0.30777642130851746, mean loss: 0.35857990642681464
Epoch: 16, step: 719, loss: 0.35404491424560547, mean loss: 0.35857971607287825
Epoch: 16, step: 720, loss: 0.3239791989326477, mean loss: 0.3585782637951389
Epoch: 16, step: 721, loss: 0.30386194586753845, mean loss: 0.3585759672989613
Epoch: 16, step: 722, loss: 0.3064529597759247, mean loss: 0.35857377973831484
Epoch: 16, step: 723, loss: 0.3455498218536377, mean loss: 0.35857323315623135
Epoch: 16, step: 724, loss: 0.3756856620311737, mean loss: 0.35857395129081
Epoch: 16, step: 725, loss: 0.3418348431587219, mean loss: 0.3585732488523655
Epoch: 16, step: 726, loss: 0.30566656589508057, mean loss: 0.35857102877419184
Epoch: 16, step: 727, loss: 0.29265302419662476, mean loss: 0.3585682628290518
Epoch: 16, step: 728, loss: 0.34212297201156616, mean loss: 0.35856757280719903
Epoch: 16, step: 729, loss: 0.33341100811958313, mean loss: 0.35856651731652656
Epoch: 16, step: 730, loss: 0.36838972568511963, mean loss: 0.3585669294502949
Epoch: 16, step: 731, loss: 0.34868207573890686, mean loss: 0.35856651474758844
Epoch: 16, step: 732, loss: 0.37811094522476196, mean loss: 0.3585673346674809
Epoch: 16, step: 733, loss: 0.32528430223464966, mean loss: 0.35856593844999485
Epoch: 16, step: 734, loss: 0.3918439745903015, mean loss: 0.3585673343993275
Epoch: 16, step: 735, loss: 0.33402374386787415, mean loss: 0.3585663048863018
Epoch: 16, step: 736, loss: 0.3143864870071411, mean loss: 0.35856445178375246
Epoch: 16, step: 737, loss: 0.3557463586330414, mean loss: 0.3585643335850631
Epoch: 16, step: 738, loss: 0.3556953966617584, mean loss: 0.35856421325889093
Epoch: 16, step: 739, loss: 0.33319440484046936, mean loss: 0.35856314926759675
Epoch: 16, step: 740, loss: 0.32461389899253845, mean loss: 0.35856172552046844
Epoch: 16, step: 741, loss: 0.30923905968666077, mean loss: 0.3585596571372665
Epoch: 16, step: 742, loss: 0.2950681447982788, mean loss: 0.358556994684449
Epoch: 16, step: 743, loss: 0.32600343227386475, mean loss: 0.3585556296407384
Epoch: 16, step: 744, loss: 0.36433711647987366, mean loss: 0.35855587206125245
Epoch: 16, step: 745, loss: 0.3837105929851532, mean loss: 0.3585569267665323
Epoch: 16, step: 746, loss: 0.32588449120521545, mean loss: 0.3585555569105279
Epoch: 16, step: 747, loss: 0.3568897843360901, mean loss: 0.3585554870726705
Epoch: 16, step: 748, loss: 0.3478901982307434, mean loss: 0.3585550399469906
Epoch: 16, step: 749, loss: 0.32434573769569397, mean loss: 0.35855360583521684
Epoch: 16, step: 750, loss: 0.3005184233188629, mean loss: 0.35855117300425826
Epoch: 16, step: 751, loss: 0.28978046774864197, mean loss: 0.3585482902617509
Epoch: 16, step: 752, loss: 0.3346620500087738, mean loss: 0.3585472890361042
Epoch: 16, step: 753, loss: 0.358582079410553, mean loss: 0.358547290494331
Epoch: 16, step: 754, loss: 0.31366416811943054, mean loss: 0.3585454093122875
Epoch: 16, step: 755, loss: 0.324311226606369, mean loss: 0.35854397451837694
Epoch: 16, step: 756, loss: 0.2963797450065613, mean loss: 0.3585413692533205
Epoch: 16, step: 757, loss: 0.3089504837989807, mean loss: 0.3585392910165652
Epoch: 16, step: 758, loss: 0.34369733929634094, mean loss: 0.3585386690515264
Epoch: 16, step: 759, loss: 0.35274598002433777, mean loss: 0.3585384263139708
Epoch: 16, step: 760, loss: 0.4284297227859497, mean loss: 0.3585413549247595
Epoch: 16, step: 761, loss: 0.34261658787727356, mean loss: 0.35854068766727826
Epoch: 16, step: 762, loss: 0.3843088448047638, mean loss: 0.3585417673235877
Epoch: 16, step: 763, loss: 0.3079547882080078, mean loss: 0.3585396478758286
Epoch: 16, step: 764, loss: 0.31042420864105225, mean loss: 0.3585376320628815
Epoch: 16, step: 765, loss: 0.3520898222923279, mean loss: 0.35853736194098074
Epoch: 16, step: 766, loss: 0.3157584071159363, mean loss: 0.3585355698520517
Epoch: 16, step: 767, loss: 0.3756338953971863, mean loss: 0.358536286102284
Epoch: 16, step: 768, loss: 0.32073065638542175, mean loss: 0.3585347024877522
Epoch: 16, step: 769, loss: 0.32816505432128906, mean loss: 0.358533430407323
Epoch: 16, step: 770, loss: 0.3190420866012573, mean loss: 0.3585317763196243
Epoch: 16, step: 771, loss: 0.3440295159816742, mean loss: 0.3585311689205483
Epoch: 16, step: 772, loss: 0.3332612216472626, mean loss: 0.358530110582094
Epoch: 16, step: 773, loss: 0.3356493413448334, mean loss: 0.35852915234567395
Epoch: 16, step: 774, loss: 0.3172678053379059, mean loss: 0.3585274244112124
Epoch: 16, step: 775, loss: 0.3278287649154663, mean loss: 0.3585261388727075
Epoch: 16, step: 776, loss: 0.32428646087646484, mean loss: 0.35852470511038614
Epoch: 16, step: 777, loss: 0.3270963728427887, mean loss: 0.3585233891262865
Epoch: 16, step: 778, loss: 0.3495205342769623, mean loss: 0.358523012169671
Epoch: 16, step: 779, loss: 0.34355488419532776, mean loss: 0.3585223854686169
Epoch: 16, step: 780, loss: 0.3518467843532562, mean loss: 0.358522105979351
Epoch: 16, step: 781, loss: 0.36106234788894653, mean loss: 0.35852221232791964
Epoch: 16, step: 782, loss: 0.3759714663028717, mean loss: 0.35852294281956676
Epoch: 16, step: 783, loss: 0.3632310926914215, mean loss: 0.35852313991224394
Epoch: 16, step: 784, loss: 0.34306904673576355, mean loss: 0.3585224929997245
Epoch: 16, step: 785, loss: 0.3854326605796814, mean loss: 0.35852361941946415
Epoch: 16, step: 786, loss: 0.28750577569007874, mean loss: 0.35852064684218693
Epoch: 16, step: 787, loss: 0.33840715885162354, mean loss: 0.35851980499186087
Epoch: 16, step: 788, loss: 0.34682929515838623, mean loss: 0.3585193157058845
Epoch: 16, step: 789, loss: 0.3478984832763672, mean loss: 0.35851887120800097
Epoch: 16, step: 790, loss: 0.30772313475608826, mean loss: 0.35851674541865375
Epoch: 16, step: 791, loss: 0.3615345060825348, mean loss: 0.3585168717059263
Epoch: 16, step: 792, loss: 0.33691778779029846, mean loss: 0.35851596786511297
Epoch: 16, step: 793, loss: 0.33364546298980713, mean loss: 0.35851492717112704
Epoch: 16, step: 794, loss: 0.3078935146331787, mean loss: 0.35851280903176813
Epoch: 16, step: 795, loss: 0.3993220329284668, mean loss: 0.35851451653067595
Epoch: 16, step: 796, loss: 0.330095112323761, mean loss: 0.35851332748401654
Epoch: 16, step: 797, loss: 0.39646801352500916, mean loss: 0.3585149154133129
Epoch: 16, step: 798, loss: 0.3303285241127014, mean loss: 0.3585137362144131
Epoch: 16, step: 799, loss: 0.3071783483028412, mean loss: 0.35851158864965776
Epoch: 16, step: 800, loss: 0.38667944073677063, mean loss: 0.35851276697436335
Epoch: 16, step: 801, loss: 0.33766382932662964, mean loss: 0.35851189485281865
Epoch: 16, step: 802, loss: 0.3281078040599823, mean loss: 0.3585106230876121
Epoch: 16, step: 803, loss: 0.31452953815460205, mean loss: 0.3585087834906181
Epoch: 16, step: 804, loss: 0.34372758865356445, mean loss: 0.3585081652633883
Epoch: 16, step: 805, loss: 0.35079771280288696, mean loss: 0.3585078427852427
Epoch: 16, step: 806, loss: 0.2896038591861725, mean loss: 0.35850496109967545
Epoch: 16, step: 807, loss: 0.36497658491134644, mean loss: 0.35850523174302656
Epoch: 16, step: 808, loss: 0.3205065131187439, mean loss: 0.3585036427028131
Epoch: 16, step: 809, loss: 0.33790284395217896, mean loss: 0.3585027812493235
Epoch: 16, step: 810, loss: 0.3153243362903595, mean loss: 0.358500975752984
Epoch: 16, step: 811, loss: 0.3292945623397827, mean loss: 0.3584997545448634
Epoch: 16, step: 812, loss: 0.27518126368522644, mean loss: 0.35849627089344976
Epoch: 16, step: 813, loss: 0.3135802745819092, mean loss: 0.3584943929773902
Epoch: 16, step: 814, loss: 0.3367879390716553, mean loss: 0.3584934854790038
Epoch: 16, step: 815, loss: 0.3385849595069885, mean loss: 0.3584926531827675
Epoch: 16, step: 816, loss: 0.31471243500709534, mean loss: 0.3584908229826013
Epoch: 16, step: 817, loss: 0.3384561538696289, mean loss: 0.35848998548284744
Epoch: 16, step: 818, loss: 0.31051504611968994, mean loss: 0.3584879800930818
Epoch: 16, step: 819, loss: 0.3101091980934143, mean loss: 0.35848595790690896
Epoch: 16, step: 820, loss: 0.32469451427459717, mean loss: 0.3584845455163705
Epoch: 16, step: 821, loss: 0.3518141508102417, mean loss: 0.35848426672364686
Epoch: 16, step: 822, loss: 0.35452204942703247, mean loss: 0.35848410112757145
Epoch: 16, step: 823, loss: 0.3386135399341583, mean loss: 0.3584832706962277
Epoch: 16, step: 824, loss: 0.32772335410118103, mean loss: 0.35848198523019925
Epoch: 16, step: 825, loss: 0.3630245327949524, mean loss: 0.358482175056675
Epoch: 16, step: 826, loss: 0.3198941946029663, mean loss: 0.35848056258830957
Epoch: 16, step: 827, loss: 0.3338455259799957, mean loss: 0.35847953321188436
Epoch: 16, step: 828, loss: 0.3493711054325104, mean loss: 0.35847915263160696
Epoch: 16, step: 829, loss: 0.37787967920303345, mean loss: 0.3584799632159878
Epoch: 16, step: 830, loss: 0.32095617055892944, mean loss: 0.35847839547867183
Epoch: 16, step: 831, loss: 0.30685245990753174, mean loss: 0.3584762386464705
Epoch: 16, step: 832, loss: 0.38239994645118713, mean loss: 0.3584772380911714
Epoch: 16, step: 833, loss: 0.39134860038757324, mean loss: 0.3584786112786681
Epoch: 16, step: 834, loss: 0.349870890378952, mean loss: 0.3584782517097262
Epoch: 16, step: 835, loss: 0.3237640857696533, mean loss: 0.3584768016610236
Epoch: 16, step: 836, loss: 0.3138350546360016, mean loss: 0.35847493700428307
Epoch: 16, step: 837, loss: 0.3442152440547943, mean loss: 0.3584743414110599
Epoch: 16, step: 838, loss: 0.340503990650177, mean loss: 0.35847359086389535
Epoch: 16, step: 839, loss: 0.3361901044845581, mean loss: 0.35847266021377927
Epoch: 16, step: 840, loss: 0.41541123390197754, mean loss: 0.35847503810368064
Epoch: 16, step: 841, loss: 0.3741883635520935, mean loss: 0.3584756943020206
Epoch: 16, step: 842, loss: 0.35656797885894775, mean loss: 0.3584756146379523
Epoch: 16, step: 843, loss: 0.34837856888771057, mean loss: 0.35847519301419456
Epoch: 16, step: 844, loss: 0.34048786759376526, mean loss: 0.35847444194628275
Epoch: 16, step: 845, loss: 0.3671529293060303, mean loss: 0.3584748043048364
Epoch: 16, step: 846, loss: 0.31496819853782654, mean loss: 0.3584729878209415
Epoch: 16, step: 847, loss: 0.3059481978416443, mean loss: 0.3584707949021882
Epoch: 16, step: 848, loss: 0.37025949358940125, mean loss: 0.3584712870617794
Epoch: 16, step: 849, loss: 0.33178621530532837, mean loss: 0.35847017304859763
Epoch: 16, step: 850, loss: 0.31753796339035034, mean loss: 0.3584684643360258
Epoch: 16, step: 851, loss: 0.2941300868988037, mean loss: 0.35846577864653517
Epoch: 16, step: 852, loss: 0.3375055193901062, mean loss: 0.3584649037348494
Epoch: 16, step: 853, loss: 0.3204796314239502, mean loss: 0.3584633182405548
Epoch: 16, step: 854, loss: 0.3381219208240509, mean loss: 0.35846246923193936
Epoch: 16, step: 855, loss: 0.3245888650417328, mean loss: 0.35846105547550405
Epoch: 16, step: 856, loss: 0.316854864358902, mean loss: 0.3584593190625365
Epoch: 16, step: 857, loss: 0.3119489252567291, mean loss: 0.3584573780562012
Epoch: 16, step: 858, loss: 0.31509581208229065, mean loss: 0.3584555685346065
Epoch: 16, step: 859, loss: 0.35955575108528137, mean loss: 0.35845561444441076
Epoch: 16, step: 860, loss: 0.3204748332500458, mean loss: 0.3584540296006305
Epoch: 16, step: 861, loss: 0.37844744324684143, mean loss: 0.3584548638413735
Epoch: 16, step: 862, loss: 0.3449903726577759, mean loss: 0.3584543020484422
Epoch: 16, step: 863, loss: 0.29642197489738464, mean loss: 0.35845171391730274
Epoch: 16, step: 864, loss: 0.3047727346420288, mean loss: 0.358449474400457
Epoch: 16, step: 865, loss: 0.3355591297149658, mean loss: 0.35844851944239753
Epoch: 16, step: 866, loss: 0.3398377299308777, mean loss: 0.3584477430546994
Epoch: 16, step: 867, loss: 0.34976840019226074, mean loss: 0.35844738099300816
Epoch: 16, step: 868, loss: 0.3328075110912323, mean loss: 0.35844631146187306
Epoch: 16, step: 869, loss: 0.3524304926395416, mean loss: 0.3584460605309136
Epoch: 16, step: 870, loss: 0.33821460604667664, mean loss: 0.3584452166746265
Epoch: 16, step: 871, loss: 0.313078373670578, mean loss: 0.358443324497324
Epoch: 16, step: 872, loss: 0.3284298777580261, mean loss: 0.35844207273744
Epoch: 16, step: 873, loss: 0.34642723202705383, mean loss: 0.3584415716597559
Epoch: 16, step: 874, loss: 0.30679044127464294, mean loss: 0.3584394176445599
Epoch: 16, step: 875, loss: 0.35796114802360535, mean loss: 0.3584393977000386
Epoch: 16, step: 876, loss: 0.34812402725219727, mean loss: 0.35843896755240306
Epoch: 16, step: 877, loss: 0.30568572878837585, mean loss: 0.35843676785101186
Epoch: 16, step: 878, loss: 0.33568739891052246, mean loss: 0.3584358192887411
Epoch: 16, step: 879, loss: 0.3489179313182831, mean loss: 0.35843542244551346
Epoch: 16, step: 880, loss: 0.33715543150901794, mean loss: 0.3584345352247114
Epoch: 16, step: 881, loss: 0.31078073382377625, mean loss: 0.35843254849072487
Epoch: 16, step: 882, loss: 0.3541930019855499, mean loss: 0.35843237174721776
Epoch: 16, step: 883, loss: 0.31384190917015076, mean loss: 0.35843051288184435
Epoch: 16, step: 884, loss: 0.34051647782325745, mean loss: 0.3584297661214517
Epoch: 16, step: 885, loss: 0.3207198977470398, mean loss: 0.358428194221978
Epoch: 16, step: 886, loss: 0.364901602268219, mean loss: 0.3584284640484982
Epoch: 16, step: 887, loss: 0.334966778755188, mean loss: 0.35842748615231224
Epoch: 16, step: 888, loss: 0.3524094820022583, mean loss: 0.3584272353289825
Epoch: 16, step: 889, loss: 0.34099510312080383, mean loss: 0.3584265088085104
Epoch: 16, step: 890, loss: 0.3694567382335663, mean loss: 0.3584269684971716
Epoch: 16, step: 891, loss: 0.283296674489975, mean loss: 0.3584238375464295
Epoch: 16, step: 892, loss: 0.3420355021953583, mean loss: 0.3584231546137566
Epoch: 16, step: 893, loss: 0.34230345487594604, mean loss: 0.35842248290362505
Epoch: 16, step: 894, loss: 0.33374783396720886, mean loss: 0.358421454750413
Epoch: 16, step: 895, loss: 0.35091790556907654, mean loss: 0.3584211421025304
Epoch: 16, step: 896, loss: 0.3098607659339905, mean loss: 0.35841911883782607
Epoch: 16, step: 897, loss: 0.34319788217544556, mean loss: 0.3584184846724789
Epoch: 16, step: 898, loss: 0.36151039600372314, mean loss: 0.358418613486016
Epoch: 16, step: 899, loss: 0.34754008054733276, mean loss: 0.358418160289343
Epoch: 16, step: 900, loss: 0.32706737518310547, mean loss: 0.3584168542787158
Epoch: 16, step: 901, loss: 0.3594425618648529, mean loss: 0.3584168970058501
Epoch: 16, step: 902, loss: 0.3188095688819885, mean loss: 0.3584152471817103
Epoch: 16, step: 903, loss: 0.30489322543144226, mean loss: 0.35841301784058444
Epoch: 16, step: 904, loss: 0.359294593334198, mean loss: 0.3584130545591272
Epoch: 16, step: 905, loss: 0.3594852685928345, mean loss: 0.35841309921610487
Epoch: 16, step: 906, loss: 0.35694584250450134, mean loss: 0.35841303810841624
Epoch: 16, step: 907, loss: 0.3420059382915497, mean loss: 0.35841235482090095
Epoch: 16, step: 908, loss: 0.3378202021121979, mean loss: 0.3584114972790399
Epoch: 16, step: 909, loss: 0.3737162947654724, mean loss: 0.3584121346071605
Epoch: 16, step: 910, loss: 0.37604930996894836, mean loss: 0.35841286903045266
Epoch: 16, step: 911, loss: 0.381030797958374, mean loss: 0.35841381081630075
Epoch: 16, step: 912, loss: 0.32013559341430664, mean loss: 0.35841221701951503
Epoch: 16, step: 913, loss: 0.34068772196769714, mean loss: 0.35841147905236326
Epoch: 16, step: 914, loss: 0.31892406940460205, mean loss: 0.3584098350451337
Epoch: 16, step: 915, loss: 0.3740845322608948, mean loss: 0.3584104876137105
Epoch: 16, step: 916, loss: 0.36422795057296753, mean loss: 0.3584107297960909
Epoch: 16, step: 917, loss: 0.3107471764087677, mean loss: 0.35840874563351544
Epoch: 16, step: 918, loss: 0.3710649907588959, mean loss: 0.3584092724721753
Epoch: 16, step: 919, loss: 0.36161375045776367, mean loss: 0.35840940585870484
Epoch: 16, step: 920, loss: 0.2924403250217438, mean loss: 0.35840666000726523
Epoch: 16, step: 921, loss: 0.31979453563690186, mean loss: 0.3584050529097721
Epoch: 16, step: 922, loss: 0.34827524423599243, mean loss: 0.35840463130871186
Epoch: 16, step: 923, loss: 0.2914135456085205, mean loss: 0.3584018432661906
Epoch: 16, step: 924, loss: 0.3380913734436035, mean loss: 0.3584009980179563
Epoch: 16, step: 925, loss: 0.32200494408607483, mean loss: 0.3583994834089703
Epoch: 16, step: 926, loss: 0.33695414662361145, mean loss: 0.35839859100595817
Epoch: 16, step: 927, loss: 0.34799957275390625, mean loss: 0.35839815829048494
Epoch: 16, step: 928, loss: 0.3226131796836853, mean loss: 0.3583966692970756
Epoch: 16, step: 929, loss: 0.37930160760879517, mean loss: 0.3583975391039455
Epoch: 16, step: 930, loss: 0.3234672546386719, mean loss: 0.35839608579483523
Epoch: 16, step: 931, loss: 0.3286883234977722, mean loss: 0.3583948498253604
Epoch: 16, step: 932, loss: 0.33306196331977844, mean loss: 0.3583937959132039
Epoch: 16, step: 933, loss: 0.3214212954044342, mean loss: 0.3583922578276515
Epoch: 16, step: 934, loss: 0.3708430230617523, mean loss: 0.35839277576788336
Epoch: 16, step: 935, loss: 0.3067494332790375, mean loss: 0.35839062754232226
Epoch: 16, step: 936, loss: 0.3199392259120941, mean loss: 0.35838902813291207
Epoch: 16, step: 937, loss: 0.33436718583106995, mean loss: 0.3583880289713489
Epoch: 16, step: 938, loss: 0.3473827838897705, mean loss: 0.35838757123957327
Epoch: 16, step: 939, loss: 0.2919252812862396, mean loss: 0.3583848070451816
Epoch: 16, step: 940, loss: 0.36506494879722595, mean loss: 0.3583850848635119
Epoch: 16, step: 941, loss: 0.2971682846546173, mean loss: 0.3583825390429925
Epoch: 16, step: 942, loss: 0.322704553604126, mean loss: 0.3583810553658004
Epoch: 16, step: 943, loss: 0.32049664855003357, mean loss: 0.3583794799995822
Epoch: 16, step: 944, loss: 0.3067820072174072, mean loss: 0.3583773344853079
Epoch: 16, step: 945, loss: 0.3349032700061798, mean loss: 0.3583763584327308
Epoch: 16, step: 946, loss: 0.3200381398200989, mean loss: 0.35837476439428695
Epoch: 16, step: 947, loss: 0.3245087265968323, mean loss: 0.3583733563601194
Epoch: 16, step: 948, loss: 0.31168457865715027, mean loss: 0.35837141528093164
Epoch: 16, step: 949, loss: 0.34318676590919495, mean loss: 0.3583707840075729
Epoch: 16, step: 950, loss: 0.3439770042896271, mean loss: 0.35837018563801487
Epoch: 16, step: 951, loss: 0.35966989398002625, mean loss: 0.35837023966646275
Epoch: 16, step: 952, loss: 0.3154885172843933, mean loss: 0.3583684571614795
Epoch: 16, step: 953, loss: 0.3236081004142761, mean loss: 0.35836701230501816
Epoch: 16, step: 954, loss: 0.29487502574920654, mean loss: 0.3583643732931492
Epoch: 16, step: 955, loss: 0.3351374566555023, mean loss: 0.35836340791839283
Epoch: 16, step: 956, loss: 0.35877272486686707, mean loss: 0.35836342493002776
Epoch: 16, step: 957, loss: 0.32095375657081604, mean loss: 0.35836187021020566
Epoch: 16, step: 958, loss: 0.3543855845928192, mean loss: 0.35836170496540587
Epoch: 16, step: 959, loss: 0.30029022693634033, mean loss: 0.35835929175571385
Epoch: 16, step: 960, loss: 0.3387686014175415, mean loss: 0.35835847768173346
Epoch: 16, step: 961, loss: 0.36989814043045044, mean loss: 0.35835895718238786
Epoch: 16, step: 962, loss: 0.3749485909938812, mean loss: 0.3583596464928051
Epoch: 16, step: 963, loss: 0.3608211278915405, mean loss: 0.3583597487647595
Epoch: 16, step: 964, loss: 0.3992226719856262, mean loss: 0.35836144650555557
Epoch: 16, step: 965, loss: 0.35380318760871887, mean loss: 0.3583612571304456
Epoch: 16, step: 966, loss: 0.3199995458126068, mean loss: 0.3583596634404735
Epoch: 16, step: 967, loss: 0.3669995367527008, mean loss: 0.35836002235844094
Epoch: 16, step: 968, loss: 0.2938501834869385, mean loss: 0.35835734259942165
Epoch: 16, step: 969, loss: 0.36394017934799194, mean loss: 0.35835757450258476
Epoch: 16, step: 970, loss: 0.3314785659313202, mean loss: 0.3583564580328622
Epoch: 16, step: 971, loss: 0.33664849400520325, mean loss: 0.35835555638956484
Epoch: 16, step: 972, loss: 0.30712080001831055, mean loss: 0.35835342843523615
Epoch: 16, step: 973, loss: 0.3287484347820282, mean loss: 0.3583521988898564
Epoch: 16, step: 974, loss: 0.31662020087242126, mean loss: 0.3583504657614866
Epoch: 16, step: 975, loss: 0.3353988826274872, mean loss: 0.35834951262265213
Epoch: 16, step: 976, loss: 0.3507877290248871, mean loss: 0.3583491986081346
Epoch: 16, step: 977, loss: 0.3288115859031677, mean loss: 0.35834797206496105
Epoch: 16, step: 978, loss: 0.3224373161792755, mean loss: 0.35834648094442434
Epoch: 16, step: 979, loss: 0.33995622396469116, mean loss: 0.35834571735627535
Epoch: 16, step: 980, loss: 0.3418395221233368, mean loss: 0.35834503202535434
Epoch: 16, step: 981, loss: 0.33187153935432434, mean loss: 0.3583439329016862
Epoch: 16, step: 982, loss: 0.33065149188041687, mean loss: 0.35834278321758184
Epoch: 16, step: 983, loss: 0.35544103384017944, mean loss: 0.35834266275306104
Epoch: 16, step: 984, loss: 0.3191831111907959, mean loss: 0.3583410371334188
Epoch: 16, step: 985, loss: 0.3590007424354553, mean loss: 0.3583410645184459
Epoch: 16, step: 986, loss: 0.32736626267433167, mean loss: 0.3583397787768061
Epoch: 16, step: 987, loss: 0.32112470269203186, mean loss: 0.358338234070012
Epoch: 16, step: 988, loss: 0.38700011372566223, mean loss: 0.3583394237051614
Epoch: 16, step: 989, loss: 0.3129502832889557, mean loss: 0.3583375398693344
Epoch: 16, step: 990, loss: 0.34627220034599304, mean loss: 0.35833703912895165
Epoch: 16, step: 991, loss: 0.3495312035083771, mean loss: 0.35833667368092625
Epoch: 16, step: 992, loss: 0.31506481766700745, mean loss: 0.35833487794469293
Epoch: 16, step: 993, loss: 0.31220558285713196, mean loss: 0.3583329637072007
Epoch: 16, step: 994, loss: 0.38193458318710327, mean loss: 0.3583339430681484
Epoch: 16, step: 995, loss: 0.31915998458862305, mean loss: 0.35833231759269285
Epoch: 16, step: 996, loss: 0.31592661142349243, mean loss: 0.35833055809283104
Epoch: 16, step: 997, loss: 0.30013200640678406, mean loss: 0.35832814341555586
Epoch: 16, step: 998, loss: 0.31654348969459534, mean loss: 0.3583264098282961
Epoch: 16, step: 999, loss: 0.316127747297287, mean loss: 0.3583246591370195
Epoch: 16, step: 1000, loss: 0.34605666995048523, mean loss: 0.35832415019741415
Epoch: 16, step: 1001, loss: 0.3516499102115631, mean loss: 0.35832387332692606
Epoch: 16, step: 1002, loss: 0.28936710953712463, mean loss: 0.3583210128812551
Epoch: 16, step: 1003, loss: 0.3396979570388794, mean loss: 0.3583202403967752
Epoch: 16, step: 1004, loss: 0.3382394015789032, mean loss: 0.35831940747799723
Epoch: 16, step: 1005, loss: 0.3129372298717499, mean loss: 0.3583175251811243
Epoch: 16, step: 1006, loss: 0.3157402575016022, mean loss: 0.3583157592955252
Epoch: 16, step: 1007, loss: 0.32704946398735046, mean loss: 0.35831446258453864
Epoch: 16, step: 1008, loss: 0.3332041800022125, mean loss: 0.3583134212258283
Epoch: 16, step: 1009, loss: 0.3426520526409149, mean loss: 0.3583127717537961
Epoch: 16, step: 1010, loss: 0.33012714982032776, mean loss: 0.3583116029533842
Epoch: 16, step: 1011, loss: 0.3818555176258087, mean loss: 0.358312579231153
Epoch: 16, step: 1012, loss: 0.315133661031723, mean loss: 0.3583107888377293
Epoch: 16, step: 1013, loss: 0.36104777455329895, mean loss: 0.3583109023208422
Epoch: 16, step: 1014, loss: 0.34658747911453247, mean loss: 0.35831041625495197
Epoch: 16, step: 1015, loss: 0.29397740960121155, mean loss: 0.3583077490490376
Epoch: 16, step: 1016, loss: 0.33338040113449097, mean loss: 0.3583067156197472
Epoch: 16, step: 1017, loss: 0.40313881635665894, mean loss: 0.3583085741762822
Epoch: 16, step: 1018, loss: 0.3738270699977875, mean loss: 0.35830921748332617
Epoch: 16, step: 1019, loss: 0.294816255569458, mean loss: 0.35830658554161193
Epoch: 16, step: 1020, loss: 0.33606284856796265, mean loss: 0.3583056635214265
Epoch: 16, step: 1021, loss: 0.4000069499015808, mean loss: 0.3583073920005105
Epoch: 16, step: 1022, loss: 0.3427075147628784, mean loss: 0.3583067454270767
Epoch: 16, step: 1023, loss: 0.3837921917438507, mean loss: 0.35830780168728543
Epoch: 16, step: 1024, loss: 0.33588746190071106, mean loss: 0.35830687250083815
Epoch: 16, step: 1025, loss: 0.3239559531211853, mean loss: 0.3583054489235742
Epoch: 16, step: 1026, loss: 0.34049075841903687, mean loss: 0.35830471067441316
Epoch: 16, step: 1027, loss: 0.3316522538661957, mean loss: 0.3583036062298247
Epoch: 16, step: 1028, loss: 0.32833331823349, mean loss: 0.3583023643499094
Epoch: 16, step: 1029, loss: 0.315676212310791, mean loss: 0.3583005981216821
Epoch: 16, step: 1030, loss: 0.3293384909629822, mean loss: 0.3582993981172421
Epoch: 16, step: 1031, loss: 0.34657007455825806, mean loss: 0.3582989121492458
Epoch: 16, step: 1032, loss: 0.31504347920417786, mean loss: 0.3582971200693293
Epoch: 16, step: 1033, loss: 0.31288546323776245, mean loss: 0.3582952387346358
Epoch: 16, step: 1034, loss: 0.33253607153892517, mean loss: 0.3582941716163958
Epoch: 16, step: 1035, loss: 0.34600117802619934, mean loss: 0.3582936623788817
Epoch: 16, step: 1036, loss: 0.3862869441509247, mean loss: 0.35829482195312357
Epoch: 16, step: 1037, loss: 0.36866992712020874, mean loss: 0.3582952517064649
Epoch: 16, step: 1038, loss: 0.3219677805900574, mean loss: 0.3582937470272156
Epoch: 16, step: 1039, loss: 0.3226340711116791, mean loss: 0.3582922700691343
Epoch: 16, step: 1040, loss: 0.3482930660247803, mean loss: 0.35829185593767665
Epoch: 16, step: 1041, loss: 0.362064927816391, mean loss: 0.3582920121984188
Epoch: 16, step: 1042, loss: 0.34199970960617065, mean loss: 0.3582913374850965
Epoch: 16, step: 1043, loss: 0.3377872705459595, mean loss: 0.35829048838509076
Epoch: 16, step: 1044, loss: 0.37579548358917236, mean loss: 0.35829121325962815
Epoch: 16, step: 1045, loss: 0.3315369784832001, mean loss: 0.3582901054238196
Epoch: 16, step: 1046, loss: 0.3220714330673218, mean loss: 0.3582886057479322
Epoch: 16, step: 1047, loss: 0.30227720737457275, mean loss: 0.35828628662742984
Epoch: 16, step: 1048, loss: 0.3134665787220001, mean loss: 0.35828443096942025
Epoch: 16, step: 1049, loss: 0.3739137649536133, mean loss: 0.3582850780396357
Epoch: 16, step: 1050, loss: 0.3335428535938263, mean loss: 0.35828405372895694
Epoch: 16, step: 1051, loss: 0.32701775431632996, mean loss: 0.35828275937975124
Epoch: 16, step: 1052, loss: 0.32641518115997314, mean loss: 0.3582814401936677
Epoch: 16, step: 1053, loss: 0.34221547842025757, mean loss: 0.3582807751567535
Epoch: 16, step: 1054, loss: 0.3131648600101471, mean loss: 0.3582789076988642
Epoch: 16, step: 1055, loss: 0.307417094707489, mean loss: 0.35827680249137284
Epoch: 16, step: 1056, loss: 0.32236024737358093, mean loss: 0.35827531594052153
Epoch: 16, step: 1057, loss: 0.3906887173652649, mean loss: 0.3582766574437673
Epoch: 16, step: 1058, loss: 0.3626657724380493, mean loss: 0.3582768390898789
Epoch: 16, step: 1059, loss: 0.299458771944046, mean loss: 0.35827440497023205
Epoch: 16, step: 1060, loss: 0.3384665846824646, mean loss: 0.3582735852797587
Epoch: 16, step: 1061, loss: 0.3521234691143036, mean loss: 0.3582733307851727
Epoch: 16, step: 1062, loss: 0.3444312512874603, mean loss: 0.3582727580173696
Epoch: 16, step: 1063, loss: 0.32736778259277344, mean loss: 0.35827147926135233
Epoch: 16, step: 1064, loss: 0.34050747752189636, mean loss: 0.3582707442701761
Epoch: 16, step: 1065, loss: 0.3513006865978241, mean loss: 0.3582704558937726
Epoch: 16, step: 1066, loss: 0.320468932390213, mean loss: 0.35826889197322714
Epoch: 16, step: 1067, loss: 0.3066776394844055, mean loss: 0.35826675763380594
Epoch: 16, step: 1068, loss: 0.33550530672073364, mean loss: 0.3582658160274305
Epoch: 16, step: 1069, loss: 0.37698137760162354, mean loss: 0.3582665902295309
Epoch: 16, step: 1070, loss: 0.3389420509338379, mean loss: 0.3582657908690636
Epoch: 16, step: 1071, loss: 0.37635597586631775, mean loss: 0.35826653913945566
Epoch: 16, step: 1072, loss: 0.33393827080726624, mean loss: 0.3582655328827517
Epoch: 16, step: 1073, loss: 0.3431021273136139, mean loss: 0.3582649057256018
Epoch: 16, step: 1074, loss: 0.3515925109386444, mean loss: 0.3582646297673411
Epoch: 16, step: 1075, loss: 0.3052345812320709, mean loss: 0.35826243663051166
Epoch: 16, step: 1076, loss: 0.35580548644065857, mean loss: 0.3582623350238705
Epoch: 16, step: 1077, loss: 0.3464946746826172, mean loss: 0.3582618483949589
Epoch: 16, step: 1078, loss: 0.3356049954891205, mean loss: 0.35826091150322065
Epoch: 16, step: 1079, loss: 0.34555909037590027, mean loss: 0.35826038628732887
Epoch: 16, step: 1080, loss: 0.35160472989082336, mean loss: 0.35826011108962796
Epoch: 16, step: 1081, loss: 0.3473478853702545, mean loss: 0.3582596599101969
Epoch: 16, step: 1082, loss: 0.30176669359207153, mean loss: 0.3582573242353998
Epoch: 16, step: 1083, loss: 0.2988007962703705, mean loss: 0.35825486613518626
Epoch: 16, step: 1084, loss: 0.34009286761283875, mean loss: 0.35825411529809
Epoch: 16, step: 1085, loss: 0.32453590631484985, mean loss: 0.35825272140768144
Epoch: 16, step: 1086, loss: 0.3225475251674652, mean loss: 0.35825124543743464
Epoch: 16, step: 1087, loss: 0.34164315462112427, mean loss: 0.35825055892574414
Epoch: 16, step: 1088, loss: 0.3601740896701813, mean loss: 0.35825063843348376
Epoch: 16, step: 1089, loss: 0.33917495608329773, mean loss: 0.3582498499866643
Epoch: 16, step: 1090, loss: 0.38786742091178894, mean loss: 0.3582510741061487
Epoch: 16, step: 1091, loss: 0.3322778344154358, mean loss: 0.35825000065435125
Epoch: 16, step: 1092, loss: 0.32797694206237793, mean loss: 0.35824874954642083
Epoch: 16, step: 1093, loss: 0.34807702898979187, mean loss: 0.3582483291926496
Epoch: 16, step: 1094, loss: 0.32057836651802063, mean loss: 0.35824677251829634
Epoch: 16, step: 1095, loss: 0.32348668575286865, mean loss: 0.3582453361510746
Epoch: 16, step: 1096, loss: 0.3080354332923889, mean loss: 0.35824326144743185
Epoch: 16, step: 1097, loss: 0.3498629331588745, mean loss: 0.3582429151814915
Epoch: 16, step: 1098, loss: 0.36470651626586914, mean loss: 0.35824318223933904
Epoch: 16, step: 1099, loss: 0.34661611914634705, mean loss: 0.35824270186158774
Epoch: 16, step: 1100, loss: 0.34346625208854675, mean loss: 0.35824209139062
Epoch: 16, step: 1101, loss: 0.3431882858276367, mean loss: 0.35824146948672997
Epoch: 16, step: 1102, loss: 0.32988446950912476, mean loss: 0.3582402980487171
Epoch: 16, step: 1103, loss: 0.3563770055770874, mean loss: 0.3582402210786051
Epoch: 16, step: 1104, loss: 0.34621644020080566, mean loss: 0.358239724412866
Epoch: 16, step: 1105, loss: 0.3070293366909027, mean loss: 0.35823760915521535
Epoch: 16, step: 1106, loss: 0.325378954410553, mean loss: 0.3582362519764642
Epoch: 16, step: 1107, loss: 0.3312767744064331, mean loss: 0.35823513850060223
Epoch: 16, step: 1108, loss: 0.33938610553741455, mean loss: 0.3582343600331276
Epoch: 16, step: 1109, loss: 0.33056366443634033, mean loss: 0.3582332172770527
Epoch: 16, step: 1110, loss: 0.33150750398635864, mean loss: 0.3582321135928367
Epoch: 16, step: 1111, loss: 0.3031020164489746, mean loss: 0.3582298369948377
Epoch: 16, step: 1112, loss: 0.3269318640232086, mean loss: 0.3582285445980515
Epoch: 16, step: 1113, loss: 0.32822099328041077, mean loss: 0.3582273055382068
Epoch: 16, step: 1114, loss: 0.32815033197402954, mean loss: 0.35822606366308546
Epoch: 16, step: 1115, loss: 0.3678496181964874, mean loss: 0.3582264610022487
Epoch: 16, step: 1116, loss: 0.33702489733695984, mean loss: 0.35822558566416746
Epoch: 16, step: 1117, loss: 0.32774481177330017, mean loss: 0.3582243272720491
Epoch: 16, step: 1118, loss: 0.30736321210861206, mean loss: 0.3582222275686613
Epoch: 16, step: 1119, loss: 0.33278900384902954, mean loss: 0.35822117765024486
Epoch: 16, step: 1120, loss: 0.349107950925827, mean loss: 0.3582208014592552
Epoch: 16, step: 1121, loss: 0.2938462197780609, mean loss: 0.3582181442074728
Epoch: 16, step: 1122, loss: 0.35200634598731995, mean loss: 0.35821788780766184
Epoch: 16, step: 1123, loss: 0.3377732038497925, mean loss: 0.35821704396236065
Epoch: 16, step: 1124, loss: 0.328073650598526, mean loss: 0.35821579985846186
Epoch: 16, step: 1125, loss: 0.3707068860530853, mean loss: 0.35821631537997217
Epoch: 16, step: 1126, loss: 0.370303213596344, mean loss: 0.35821681419959234
Epoch: 16, step: 1127, loss: 0.3555149734020233, mean loss: 0.35821670270071493
Epoch: 16, step: 1128, loss: 0.33305245637893677, mean loss: 0.35821566427186496
Epoch: 16, step: 1129, loss: 0.3285379707813263, mean loss: 0.3582144396414494
Epoch: 16, step: 1130, loss: 0.3094647228717804, mean loss: 0.35821242809959797
Epoch: 16, step: 1131, loss: 0.36830490827560425, mean loss: 0.3582128445247579
Epoch: 16, step: 1132, loss: 0.33124110102653503, mean loss: 0.3582117316913421
Epoch: 16, step: 1133, loss: 0.3010006248950958, mean loss: 0.35820937130241576
Epoch: 16, step: 1134, loss: 0.3550775945186615, mean loss: 0.35820924209837335
Epoch: 16, step: 1135, loss: 0.37557047605514526, mean loss: 0.3582099583208963
Epoch: 16, step: 1136, loss: 0.3544465899467468, mean loss: 0.35820980307283007
Epoch: 16, step: 1137, loss: 0.3341224789619446, mean loss: 0.3582088094533222
Epoch: 16, step: 1138, loss: 0.3282340168952942, mean loss: 0.3582075730224944
Epoch: 16, step: 1139, loss: 0.3426404297351837, mean loss: 0.3582069309195705
Epoch: 16, step: 1140, loss: 0.39978256821632385, mean loss: 0.3582086457324101
Epoch: 16, step: 1141, loss: 0.3665344715118408, mean loss: 0.35820898912207355
Epoch: 16, step: 1142, loss: 0.32961198687553406, mean loss: 0.3582078097183433
Epoch: 16, step: 1143, loss: 0.30933523178100586, mean loss: 0.35820579418807535
Epoch: 16, step: 1144, loss: 0.32972368597984314, mean loss: 0.35820461961971345
Epoch: 16, step: 1145, loss: 0.3326508700847626, mean loss: 0.35820356585684604
Epoch: 16, step: 1146, loss: 0.2987092137336731, mean loss: 0.3582011125826667
Epoch: 16, step: 1147, loss: 0.31361526250839233, mean loss: 0.358199274142535
Epoch: 16, step: 1148, loss: 0.2961883544921875, mean loss: 0.3581967173075187
Epoch: 16, step: 1149, loss: 0.32696282863616943, mean loss: 0.3581954295245274
Epoch: 16, step: 1150, loss: 0.33551162481307983, mean loss: 0.3581944943027293
Epoch: 16, step: 1151, loss: 0.3649098873138428, mean loss: 0.35819477115765225
Epoch: 16, step: 1152, loss: 0.3577826917171478, mean loss: 0.3581947541695894
Epoch: 16, step: 1153, loss: 0.34390467405319214, mean loss: 0.3581941650822732
Epoch: 16, step: 1154, loss: 0.350988507270813, mean loss: 0.35819386805198294
Epoch: 16, step: 1155, loss: 0.33692505955696106, mean loss: 0.358192991349242
Epoch: 16, step: 1156, loss: 0.3628838062286377, mean loss: 0.3581931846972029
Epoch: 16, step: 1157, loss: 0.3543403744697571, mean loss: 0.3581930258970122
Epoch: 16, step: 1158, loss: 0.355624258518219, mean loss: 0.3581929200252165
Epoch: 16, step: 1159, loss: 0.3482164144515991, mean loss: 0.3581925088602984
Epoch: 16, step: 1160, loss: 0.35078808665275574, mean loss: 0.3581922037120516
Epoch: 16, step: 1161, loss: 0.33667218685150146, mean loss: 0.35819131687380634
Epoch: 16, step: 1162, loss: 0.36156314611434937, mean loss: 0.3581914558209049
Epoch: 16, step: 1163, loss: 0.3370024263858795, mean loss: 0.358190582694589
Epoch: 16, step: 1164, loss: 0.35900217294692993, mean loss: 0.3581906161360267
Epoch: 16, step: 1165, loss: 0.3259408473968506, mean loss: 0.3581892873445665
Epoch: 16, step: 1166, loss: 0.3559474050998688, mean loss: 0.3581891949758036
Epoch: 16, step: 1167, loss: 0.3817773163318634, mean loss: 0.3581901668001838
Epoch: 16, step: 1168, loss: 0.3725128769874573, mean loss: 0.3581907568677563
Epoch: 16, step: 1169, loss: 0.37734198570251465, mean loss: 0.35819154582832463
Epoch: 16, step: 1170, loss: 0.34377557039260864, mean loss: 0.35819095196733863
Epoch: 16, step: 1171, loss: 0.32062745094299316, mean loss: 0.35818940461600296
Epoch: 16, step: 1172, loss: 0.3131888806819916, mean loss: 0.35818755098812743
Epoch: 16, step: 1173, loss: 0.3119388520717621, mean loss: 0.3581856460248308
Epoch: 16, step: 1174, loss: 0.3589475750923157, mean loss: 0.35818567740705687
Epoch: 16, step: 1175, loss: 0.3571818768978119, mean loss: 0.35818563606436704
Epoch: 16, step: 1176, loss: 0.3371172845363617, mean loss: 0.3581847683755763
Epoch: 16, step: 1177, loss: 0.35610711574554443, mean loss: 0.3581846828120877
Epoch: 16, step: 1178, loss: 0.3000839650630951, mean loss: 0.35818229016217834
Epoch: 16, step: 1179, loss: 0.32078585028648376, mean loss: 0.3581807502000685
Epoch: 16, step: 1180, loss: 0.3178207576274872, mean loss: 0.3581790882691411
Epoch: 16, step: 1181, loss: 0.40684449672698975, mean loss: 0.35818109211532645
Epoch: 16, step: 1182, loss: 0.28081679344177246, mean loss: 0.35817790669519745
Epoch: 16, step: 1183, loss: 0.31781160831451416, mean loss: 0.35817624470992154
Epoch: 16, step: 1184, loss: 0.3215946853160858, mean loss: 0.358174738614183
Epoch: 16, step: 1185, loss: 0.3492579460144043, mean loss: 0.3581743715169166
Epoch: 16, step: 1186, loss: 0.3347010314464569, mean loss: 0.35817340517794044
Epoch: 16, step: 1187, loss: 0.30786848068237305, mean loss: 0.35817133433467946
Epoch: 16, step: 1188, loss: 0.35898566246032715, mean loss: 0.35817136785578124
Epoch: 16, step: 1189, loss: 0.3360424041748047, mean loss: 0.3581704569739305
Epoch: 16, step: 1190, loss: 0.33009663224220276, mean loss: 0.35816930143473596
Epoch: 16, step: 1191, loss: 0.3262893855571747, mean loss: 0.3581679892880502
Epoch: 16, step: 1192, loss: 0.3405216634273529, mean loss: 0.3581672630121371
Epoch: 16, step: 1193, loss: 0.31658032536506653, mean loss: 0.3581655514746588
Epoch: 16, step: 1194, loss: 0.29841727018356323, mean loss: 0.3581630925964625
Epoch: 16, step: 1195, loss: 0.3450668454170227, mean loss: 0.3581625536562494
Epoch: 16, step: 1196, loss: 0.32947275042533875, mean loss: 0.3581613730544951
Epoch: 16, step: 1197, loss: 0.3126581907272339, mean loss: 0.35815950064965896
Epoch: 16, step: 1198, loss: 0.3306940197944641, mean loss: 0.35815837052247895
Epoch: 16, step: 1199, loss: 0.33861637115478516, mean loss: 0.3581575664573305
Epoch: 16, step: 1200, loss: 0.35101059079170227, mean loss: 0.35815727240361045
Epoch: 16, step: 1201, loss: 0.3260551393032074, mean loss: 0.35815595165428515
Epoch: 16, step: 1202, loss: 0.35630542039871216, mean loss: 0.3581558755226665
Epoch: 16, step: 1203, loss: 0.3239865303039551, mean loss: 0.358154469839549
Epoch: 16, step: 1204, loss: 0.3195295035839081, mean loss: 0.35815288092325237
Epoch: 16, step: 1205, loss: 0.383253276348114, mean loss: 0.35815391343643316
Epoch: 16, step: 1206, loss: 0.3258300721645355, mean loss: 0.3581525838390792
Epoch: 16, step: 1207, loss: 0.33775627613067627, mean loss: 0.35815174489914386
Epoch: 16, step: 1208, loss: 0.32820865511894226, mean loss: 0.35815051333209
Epoch: 16, step: 1209, loss: 0.32378149032592773, mean loss: 0.35814909978339354
Epoch: 16, step: 1210, loss: 0.34168049693107605, mean loss: 0.3581484224811993
Epoch: 16, step: 1211, loss: 0.3508085310459137, mean loss: 0.3581481206268057
Epoch: 16, step: 1212, loss: 0.3439950942993164, mean loss: 0.3581475386049145
Epoch: 16, step: 1213, loss: 0.35318562388420105, mean loss: 0.35814733456203596
Epoch: 16, step: 1214, loss: 0.3135475516319275, mean loss: 0.35814550061397354
Epoch: 16, step: 1215, loss: 0.293361634016037, mean loss: 0.3581428368036694
Epoch: 16, step: 1216, loss: 0.3125162124633789, mean loss: 0.3581409607860574
Epoch: 16, step: 1217, loss: 0.3888510763645172, mean loss: 0.3581422234336842
Epoch: 16, step: 1218, loss: 0.310604989528656, mean loss: 0.35814026901877216
Epoch: 16, step: 1219, loss: 0.3145294189453125, mean loss: 0.3581384761043636
Epoch: 16, step: 1220, loss: 0.354819118976593, mean loss: 0.3581383396456944
Epoch: 16, step: 1221, loss: 0.3404024541378021, mean loss: 0.358137610553961
Epoch: 16, step: 1222, loss: 0.32192692160606384, mean loss: 0.358136122056039
Epoch: 16, step: 1223, loss: 0.3088971674442291, mean loss: 0.35813409809374813
Epoch: 16, step: 1224, loss: 0.3580145239830017, mean loss: 0.35813409317886835
Epoch: 16, step: 1225, loss: 0.349713534116745, mean loss: 0.3581337470810853
Epoch: 16, step: 1226, loss: 0.33175432682037354, mean loss: 0.35813266289135776
Epoch: 16, step: 1227, loss: 0.3750631809234619, mean loss: 0.35813335870419816
Epoch: 16, step: 1228, loss: 0.34379705786705017, mean loss: 0.3581327695330792
Epoch: 16, step: 1229, loss: 0.3252609670162201, mean loss: 0.3581314186740952
Epoch: 16, step: 1230, loss: 0.3323845863342285, mean loss: 0.3581303606575618
Epoch: 16, step: 1231, loss: 0.3162214756011963, mean loss: 0.35812863856333693
Epoch: 16, step: 1232, loss: 0.3322165608406067, mean loss: 0.3581275738438677
Epoch: 16, step: 1233, loss: 0.36516228318214417, mean loss: 0.35812786288607895
Epoch: 16, step: 1234, loss: 0.3301999568939209, mean loss: 0.35812671543113045
Epoch: 16, step: 1235, loss: 0.3590848445892334, mean loss: 0.3581267547955166
Epoch: 16, step: 1236, loss: 0.3257176876068115, mean loss: 0.35812542333554415
Epoch: 16, step: 1237, loss: 0.33464550971984863, mean loss: 0.35812445875113796
Epoch: 16, step: 1238, loss: 0.34050703048706055, mean loss: 0.3581237350347405
Epoch: 16, step: 1239, loss: 0.3484242856502533, mean loss: 0.35812333660188705
Epoch: 16, step: 1240, loss: 0.31636330485343933, mean loss: 0.3581216212586236
Epoch: 16, step: 1241, loss: 0.3266443908214569, mean loss: 0.3581203283468337
Epoch: 16, step: 1242, loss: 0.30210959911346436, mean loss: 0.35811802782811547
Epoch: 16, step: 1243, loss: 0.3156008720397949, mean loss: 0.3581162816002615
Epoch: 16, step: 1244, loss: 0.33339911699295044, mean loss: 0.3581152664799441
Epoch: 16, step: 1245, loss: 0.30727720260620117, mean loss: 0.35811317867444625
Epoch: 16, step: 1246, loss: 0.32454854249954224, mean loss: 0.3581118003065692
Epoch: 16, step: 1247, loss: 0.3498457670211792, mean loss: 0.3581114608669632
Epoch: 16, step: 1248, loss: 0.36892464756965637, mean loss: 0.35811190488563455
Epoch: 16, step: 1249, loss: 0.30601248145103455, mean loss: 0.35810976563034036
Epoch: 16, step: 1250, loss: 0.37370890378952026, mean loss: 0.3581104061205132
Epoch: 16, step: 1251, loss: 0.3574620187282562, mean loss: 0.3581103794992539
Epoch: 16, step: 1252, loss: 0.353439599275589, mean loss: 0.35811018773589126
Epoch: 16, step: 1253, loss: 0.3638947904109955, mean loss: 0.358110425218553
Epoch: 16, step: 1254, loss: 0.3620940148830414, mean loss: 0.3581105887552197
Epoch: 16, step: 1255, loss: 0.3153379261493683, mean loss: 0.3581088328987909
Epoch: 16, step: 1256, loss: 0.31087756156921387, mean loss: 0.3581068940920371
Epoch: 16, step: 1257, loss: 0.36211854219436646, mean loss: 0.35810705876029514
Epoch: 16, step: 1258, loss: 0.32758238911628723, mean loss: 0.3581058058493382
Epoch: 16, step: 1259, loss: 0.31264835596084595, mean loss: 0.3581039400863318
Epoch: 16, step: 1260, loss: 0.3431210219860077, mean loss: 0.3581033251502308
Epoch: 16, step: 1261, loss: 0.3212139308452606, mean loss: 0.3581018111801781
Epoch: 16, step: 1262, loss: 0.35508376359939575, mean loss: 0.3581016873221906
Epoch: 16, step: 1263, loss: 0.3573060929775238, mean loss: 0.35810165467304644
Epoch: 16, step: 1264, loss: 0.3444471061229706, mean loss: 0.3581010943485132
Epoch: 16, step: 1265, loss: 0.31711089611053467, mean loss: 0.3580994123543303
Epoch: 16, step: 1266, loss: 0.33997195959091187, mean loss: 0.358098668541899
Epoch: 16, step: 1267, loss: 0.3555479049682617, mean loss: 0.3580985638823071
Epoch: 16, step: 1268, loss: 0.3217708468437195, mean loss: 0.358097073392132
Epoch: 16, step: 1269, loss: 0.32184898853302, mean loss: 0.35809558623020293
Epoch: 16, step: 1270, loss: 0.35409095883369446, mean loss: 0.3580954219377969
Epoch: 16, step: 1271, loss: 0.33644187450408936, mean loss: 0.3580945336235766
Epoch: 16, step: 1272, loss: 0.37115678191185, mean loss: 0.35809506946671926
Epoch: 16, step: 1273, loss: 0.3438492715358734, mean loss: 0.35809448509564984
Epoch: 16, step: 1274, loss: 0.3231138288974762, mean loss: 0.3580930502272714
Epoch: 16, step: 1275, loss: 0.328624963760376, mean loss: 0.3580918415280726
Epoch: 16, step: 1276, loss: 0.3576427102088928, mean loss: 0.35809182310670684
Epoch: 16, step: 1277, loss: 0.32873037457466125, mean loss: 0.3580906188802885
Epoch: 16, step: 1278, loss: 0.3230975568294525, mean loss: 0.3580891837385073
Epoch: 16, step: 1279, loss: 0.3207939565181732, mean loss: 0.35808765424264033
Epoch: 16, step: 1280, loss: 0.4452367424964905, mean loss: 0.35809122812364313
Epoch: 16, step: 1281, loss: 0.306927889585495, mean loss: 0.3580891300617003
Epoch: 16, step: 1282, loss: 0.3242640197277069, mean loss: 0.35808774304770374
Epoch: 16, step: 1283, loss: 0.3465762138366699, mean loss: 0.3580872710315806
Epoch: 16, step: 1284, loss: 0.31489527225494385, mean loss: 0.35808550006931167
Epoch: 16, step: 1285, loss: 0.3515540361404419, mean loss: 0.35808523227661265
Epoch: 16, step: 1286, loss: 0.29376181960105896, mean loss: 0.3580825950984455
Epoch: 16, step: 1287, loss: 0.31525543332099915, mean loss: 0.3580808393112293
Epoch: 16, step: 1288, loss: 0.3228178322315216, mean loss: 0.3580793936912941
Epoch: 16, step: 1289, loss: 0.34321311116218567, mean loss: 0.3580787842675617
Epoch: 16, step: 1290, loss: 0.3447549343109131, mean loss: 0.35807823809621686
Epoch: 16, step: 1291, loss: 0.352970689535141, mean loss: 0.3580780287361348
Epoch: 16, step: 1292, loss: 0.30745264887809753, mean loss: 0.35807595367035383
Epoch: 16, step: 1293, loss: 0.33414289355278015, mean loss: 0.35807497272682903
Epoch: 16, step: 1294, loss: 0.32439616322517395, mean loss: 0.35807359239118
Epoch: 16, step: 1295, loss: 0.3362813889980316, mean loss: 0.3580726992680901
Epoch: 16, step: 1296, loss: 0.3644961714744568, mean loss: 0.35807296251435894
Epoch: 16, step: 1297, loss: 0.30549758672714233, mean loss: 0.35807080796244567
Epoch: 16, step: 1298, loss: 0.30145666003227234, mean loss: 0.3580684879957231
Epoch: 16, step: 1299, loss: 0.33627867698669434, mean loss: 0.3580675951170553
Epoch: 16, step: 1300, loss: 0.37868013978004456, mean loss: 0.3580684397204015
Epoch: 16, step: 1301, loss: 0.32429808378219604, mean loss: 0.3580670560296722
Epoch: 16, step: 1302, loss: 0.34921228885650635, mean loss: 0.3580666932334591
Epoch: 16, step: 1303, loss: 0.331974059343338, mean loss: 0.35806562421371596
Epoch: 16, step: 1304, loss: 0.34265589714050293, mean loss: 0.3580649929003859
Epoch: 16, step: 1305, loss: 0.3443349599838257, mean loss: 0.3580644304246417
Epoch: 16, step: 1306, loss: 0.3626292645931244, mean loss: 0.3580646174237064
Epoch: 16, step: 1307, loss: 0.34391388297080994, mean loss: 0.35806403776065326
Epoch: 16, step: 1308, loss: 0.3223838210105896, mean loss: 0.3580625762353696
Epoch: 16, step: 1309, loss: 0.3677729666233063, mean loss: 0.35806297397397807
Epoch: 16, step: 1310, loss: 0.33705055713653564, mean loss: 0.3580621133384328
Epoch: 16, step: 1311, loss: 0.37671589851379395, mean loss: 0.35806287733684267
Epoch: 16, step: 1312, loss: 0.3646332621574402, mean loss: 0.3580631464274279
Epoch: 16, step: 1313, loss: 0.3780982196331024, mean loss: 0.3580639669316955
Epoch: 16, step: 1314, loss: 0.33721214532852173, mean loss: 0.358063113013779
Epoch: 16, step: 1315, loss: 0.3240091800689697, mean loss: 0.3580617185038304
Epoch: 16, step: 1316, loss: 0.3521173596382141, mean loss: 0.35806147509205916
Epoch: 16, step: 1317, loss: 0.3792361319065094, mean loss: 0.3580623421241128
Epoch: 16, step: 1318, loss: 0.34899646043777466, mean loss: 0.3580619709214888
Epoch: 16, step: 1319, loss: 0.3270222544670105, mean loss: 0.3580607000519975
Epoch: 16, step: 1320, loss: 0.42888784408569336, mean loss: 0.3580635998327154
Epoch: 16, step: 1321, loss: 0.30046314001083374, mean loss: 0.3580612416709279
Epoch: 16, step: 1322, loss: 0.32828742265701294, mean loss: 0.3580600227812151
Epoch: 16, step: 1323, loss: 0.312953919172287, mean loss: 0.35805817628933656
Epoch: 16, step: 1324, loss: 0.3639741539955139, mean loss: 0.35805841845961395
Epoch: 16, step: 1325, loss: 0.33485713601112366, mean loss: 0.358057468755052
Epoch: 16, step: 1326, loss: 0.34227272868156433, mean loss: 0.3580568226603333
Epoch: 16, step: 1327, loss: 0.3453553318977356, mean loss: 0.35805630278923134
Epoch: 16, step: 1328, loss: 0.33287203311920166, mean loss: 0.3580552720410764
Epoch: 16, step: 1329, loss: 0.3396860659122467, mean loss: 0.35805452025233414
Epoch: 16, step: 1330, loss: 0.33661192655563354, mean loss: 0.35805364271627127
Epoch: 16, step: 1331, loss: 0.36276909708976746, mean loss: 0.35805383568788585
Epoch: 16, step: 1332, loss: 0.34433645009994507, mean loss: 0.35805327435115925
Epoch: 16, step: 1333, loss: 0.3438360393047333, mean loss: 0.35805269258362316
Epoch: 16, step: 1334, loss: 0.2781654894351959, mean loss: 0.35804942374270704
Epoch: 16, step: 1335, loss: 0.3215709924697876, mean loss: 0.35804793117186934
Epoch: 16, step: 1336, loss: 0.3524007797241211, mean loss: 0.35804770011948
Epoch: 16, step: 1337, loss: 0.3082383871078491, mean loss: 0.35804566226198015
Epoch: 16, step: 1338, loss: 0.37288716435432434, mean loss: 0.3580462694502178
Epoch: 16, step: 1339, loss: 0.30514153838157654, mean loss: 0.3580441051264136
Epoch: 16, step: 1340, loss: 0.3266531527042389, mean loss: 0.3580428209802724
Epoch: 16, step: 1341, loss: 0.3539092540740967, mean loss: 0.35804265189056833
Epoch: 16, step: 1342, loss: 0.32443520426750183, mean loss: 0.3580412771841576
Epoch: 16, step: 1343, loss: 0.35400792956352234, mean loss: 0.35804111220756973
Epoch: 16, step: 1344, loss: 0.3486500084400177, mean loss: 0.3580407280976361
Epoch: 16, step: 1345, loss: 0.34841617941856384, mean loss: 0.3580403344555633
Epoch: 16, step: 1346, loss: 0.3270409405231476, mean loss: 0.3580390666385443
Epoch: 16, step: 1347, loss: 0.32519352436065674, mean loss: 0.35803772337246065
Epoch: 16, step: 1348, loss: 0.3379606306552887, mean loss: 0.35803690232421637
Epoch: 16, step: 1349, loss: 0.32118839025497437, mean loss: 0.35803539547412766
Epoch: 16, step: 1350, loss: 0.308515340089798, mean loss: 0.35803337052808865
Epoch: 16, step: 1351, loss: 0.35254859924316406, mean loss: 0.35803314625710053
Epoch: 16, step: 1352, loss: 0.36286601424217224, mean loss: 0.3580333438638383
Epoch: 16, step: 1353, loss: 0.3550538718700409, mean loss: 0.3580332220439023
Epoch: 16, step: 1354, loss: 0.33159688115119934, mean loss: 0.35803214120082233
Epoch: 16, step: 1355, loss: 0.3164856731891632, mean loss: 0.3580304426534793
Epoch: 16, step: 1356, loss: 0.3091203272342682, mean loss: 0.3580284431393376
Epoch: 16, step: 1357, loss: 0.36114707589149475, mean loss: 0.3580285706282082
Epoch: 16, step: 1358, loss: 0.3225034773349762, mean loss: 0.3580271184312866
Epoch: 16, step: 1359, loss: 0.35669204592704773, mean loss: 0.3580270638583425
Epoch: 16, step: 1360, loss: 0.3356499671936035, mean loss: 0.3580261492008046
Epoch: 16, step: 1361, loss: 0.30290818214416504, mean loss: 0.35802389636147425
Epoch: 16, step: 1362, loss: 0.3191097378730774, mean loss: 0.35802230588620193
Epoch: 16, step: 1363, loss: 0.36214402318000793, mean loss: 0.3580224743395816
Epoch: 16, step: 1364, loss: 0.316775381565094, mean loss: 0.3580207886518635
Epoch: 16, step: 1365, loss: 0.35831284523010254, mean loss: 0.3580208005871548
Epoch: 16, step: 1366, loss: 0.34715649485588074, mean loss: 0.3580203566205931
Epoch: 16, step: 1367, loss: 0.35617339611053467, mean loss: 0.3580202811481957
Epoch: 16, step: 1368, loss: 0.2984085977077484, mean loss: 0.3580178453338925
Epoch: 16, step: 1369, loss: 0.37654176354408264, mean loss: 0.35801860221540804
Epoch: 16, step: 1370, loss: 0.3480464220046997, mean loss: 0.3580181947718856
Epoch: 16, step: 1371, loss: 0.33837971091270447, mean loss: 0.35801739241513375
Epoch: 16, step: 1372, loss: 0.33839690685272217, mean loss: 0.3580165908264765
Epoch: 16, step: 1373, loss: 0.30960163474082947, mean loss: 0.35801461292974945
Epoch: 16, step: 1374, loss: 0.31573569774627686, mean loss: 0.35801288577932733
Epoch: 16, step: 1375, loss: 0.31332698464393616, mean loss: 0.3580110603748692
Epoch: 16, step: 1376, loss: 0.3271985352039337, mean loss: 0.35800980174470004
Epoch: 16, step: 1377, loss: 0.31993257999420166, mean loss: 0.3580082464297033
Epoch: 16, step: 1378, loss: 0.32444557547569275, mean loss: 0.3580068755735601
Epoch: 16, step: 1379, loss: 0.3292315602302551, mean loss: 0.35800570030336964
Epoch: 16, step: 1380, loss: 0.31479957699775696, mean loss: 0.358003935707768
Epoch: 16, step: 1381, loss: 0.3202695846557617, mean loss: 0.35800239464956934
Epoch: 16, step: 1382, loss: 0.3798077404499054, mean loss: 0.35800328513618673
Epoch: 16, step: 1383, loss: 0.3328022360801697, mean loss: 0.3580022560178816
Epoch: 16, step: 1384, loss: 0.3408709168434143, mean loss: 0.35800155646546317
Epoch: 16, step: 1385, loss: 0.317388117313385, mean loss: 0.3579998980971842
Epoch: 16, step: 1386, loss: 0.2895408570766449, mean loss: 0.3579971028237768
Epoch: 16, step: 1387, loss: 0.33560213446617126, mean loss: 0.357996188444863
Epoch: 16, step: 1388, loss: 0.35341164469718933, mean loss: 0.35799600126714903
Epoch: 16, step: 1389, loss: 0.3314729928970337, mean loss: 0.35799491843019426
Epoch: 16, step: 1390, loss: 0.32082992792129517, mean loss: 0.3579934011821637
Epoch: 16, step: 1391, loss: 0.3413067162036896, mean loss: 0.3579927199817645
Epoch: 16, step: 1392, loss: 0.37966689467430115, mean loss: 0.35799360475029507
Epoch: 16, step: 1393, loss: 0.3044447898864746, mean loss: 0.357991418905946
Epoch: 16, step: 1394, loss: 0.3598211705684662, mean loss: 0.35799149359273574
Epoch: 16, step: 1395, loss: 0.3180076479911804, mean loss: 0.35798986159903773
Epoch: 16, step: 1396, loss: 0.33848726749420166, mean loss: 0.357989065607278
Epoch: 16, step: 1397, loss: 0.31858140230178833, mean loss: 0.3579874572625182
Epoch: 16, step: 1398, loss: 0.32956379652023315, mean loss: 0.35798629725514186
Epoch: 16, step: 1399, loss: 0.3068329393863678, mean loss: 0.3579842097038087
Epoch: 16, step: 1400, loss: 0.33820128440856934, mean loss: 0.35798340240222554
Epoch: 16, step: 1401, loss: 0.39845919609069824, mean loss: 0.357985054070947
Epoch: 16, step: 1402, loss: 0.35718467831611633, mean loss: 0.35798502141188
Epoch: 16, step: 1403, loss: 0.35594063997268677, mean loss: 0.35798493799497777
Epoch: 16, step: 1404, loss: 0.3699629306793213, mean loss: 0.35798542671310923
Epoch: 16, step: 1405, loss: 0.3159439265727997, mean loss: 0.35798371143362573
Epoch: 16, step: 1406, loss: 0.3380460739135742, mean loss: 0.3579828980177096
Epoch: 16, step: 1407, loss: 0.3003503084182739, mean loss: 0.3579805468187214
Epoch: 16, step: 1408, loss: 0.28305965662002563, mean loss: 0.3579774904449524
Epoch: 16, step: 1409, loss: 0.33500051498413086, mean loss: 0.3579765531448194
Epoch: 16, step: 1410, loss: 0.3061424493789673, mean loss: 0.357974438761635
Epoch: 16, step: 1411, loss: 0.3158573806285858, mean loss: 0.3579727208199588
Epoch: 16, step: 1412, loss: 0.3646501302719116, mean loss: 0.3579729931783
Epoch: 16, step: 1413, loss: 0.3279438018798828, mean loss: 0.35797176839686196
Epoch: 16, step: 1414, loss: 0.36666637659072876, mean loss: 0.35797212300382775
Epoch: 16, step: 1415, loss: 0.32385918498039246, mean loss: 0.35797073177470773
Epoch: 16, step: 1416, loss: 0.3660476505756378, mean loss: 0.35797106116253047
Epoch: 16, step: 1417, loss: 0.3913935124874115, mean loss: 0.3579724241203367
Epoch: 16, step: 1418, loss: 0.31000056862831116, mean loss: 0.3579704679218499
Epoch: 16, step: 1419, loss: 0.3142468333244324, mean loss: 0.3579686850302092
Epoch: 16, step: 1420, loss: 0.3833366334438324, mean loss: 0.35796971940119443
Epoch: 16, step: 1421, loss: 0.31981897354125977, mean loss: 0.35796816387865266
Epoch: 16, step: 1422, loss: 0.3395351469516754, mean loss: 0.3579674123388424
Epoch: 16, step: 1423, loss: 0.3468376696109772, mean loss: 0.357966958582208
Epoch: 16, step: 1424, loss: 0.33697763085365295, mean loss: 0.35796610288781655
Epoch: 16, step: 1425, loss: 0.3148729205131531, mean loss: 0.35796434613354117
Epoch: 16, step: 1426, loss: 0.33223846554756165, mean loss: 0.3579632974245368
Epoch: 16, step: 1427, loss: 0.33176031708717346, mean loss: 0.35796222931022337
Epoch: 16, step: 1428, loss: 0.3330128788948059, mean loss: 0.3579612123391878
Epoch: 16, step: 1429, loss: 0.34361425042152405, mean loss: 0.3579606275604352
Epoch: 16, step: 1430, loss: 0.3594547212123871, mean loss: 0.35796068845685464
Epoch: 16, step: 1431, loss: 0.3578740358352661, mean loss: 0.35796068492520233
Epoch: 16, step: 1432, loss: 0.32122063636779785, mean loss: 0.3579591875926614
Epoch: 16, step: 1433, loss: 0.30333733558654785, mean loss: 0.3579569615819023
Epoch: 16, step: 1434, loss: 0.3766961395740509, mean loss: 0.35795772523070596
Epoch: 16, step: 1435, loss: 0.3378158509731293, mean loss: 0.35795690445343387
Epoch: 16, step: 1436, loss: 0.3968864977359772, mean loss: 0.35795849076178654
Epoch: 16, step: 1437, loss: 0.34653881192207336, mean loss: 0.3579580254501233
Epoch: 16, step: 1438, loss: 0.3465975224971771, mean loss: 0.3579575625685296
Epoch: 16, step: 1439, loss: 0.31529700756073, mean loss: 0.3579558244429182
Epoch: 16, step: 1440, loss: 0.38787567615509033, mean loss: 0.35795704342241347
Epoch: 16, step: 1441, loss: 0.3497655391693115, mean loss: 0.35795670970187843
Epoch: 16, step: 1442, loss: 0.3509489893913269, mean loss: 0.35795642422013685
Epoch: 16, step: 1443, loss: 0.3396105170249939, mean loss: 0.357955676871791
Valid: 16, mean loss: 0.18906777600447336
Epoch: 17, step: 0, loss: 0.311335951089859, mean loss: 0.3579537778239364
Epoch: 17, step: 1, loss: 0.3170730173587799, mean loss: 0.3579521126198441
Epoch: 17, step: 2, loss: 0.30277034640312195, mean loss: 0.3579498649816128
Epoch: 17, step: 3, loss: 0.36540383100509644, mean loss: 0.3579501685807503
Epoch: 17, step: 4, loss: 0.35840559005737305, mean loss: 0.35795018712925664
Epoch: 17, step: 5, loss: 0.32755303382873535, mean loss: 0.35794894915771225
Epoch: 17, step: 6, loss: 0.34722164273262024, mean loss: 0.35794851228919566
Epoch: 17, step: 7, loss: 0.3078572452068329, mean loss: 0.3579464724102625
Epoch: 17, step: 8, loss: 0.3405945301055908, mean loss: 0.3579457658116428
Epoch: 17, step: 9, loss: 0.3264879882335663, mean loss: 0.3579444848531943
Epoch: 17, step: 10, loss: 0.33379846811294556, mean loss: 0.3579435016691583
Epoch: 17, step: 11, loss: 0.4029054641723633, mean loss: 0.3579453323679573
Epoch: 17, step: 12, loss: 0.33297351002693176, mean loss: 0.3579443156413443
Epoch: 17, step: 13, loss: 0.33949190378189087, mean loss: 0.3579435643828206
Epoch: 17, step: 14, loss: 0.3268211781978607, mean loss: 0.35794229733945515
Epoch: 17, step: 15, loss: 0.34893369674682617, mean loss: 0.35794193059948637
Epoch: 17, step: 16, loss: 0.34821611642837524, mean loss: 0.35794153467788364
Epoch: 17, step: 17, loss: 0.3060573935508728, mean loss: 0.3579394226473892
Epoch: 17, step: 18, loss: 0.3661506772041321, mean loss: 0.3579397568865945
Epoch: 17, step: 19, loss: 0.36104440689086914, mean loss: 0.3579398832562625
Epoch: 17, step: 20, loss: 0.3461446464061737, mean loss: 0.35793940317010314
Epoch: 17, step: 21, loss: 0.343212366104126, mean loss: 0.35793880377909515
Epoch: 17, step: 22, loss: 0.37933337688446045, mean loss: 0.35793967450365277
Epoch: 17, step: 23, loss: 0.3228260278701782, mean loss: 0.35793824549312725
Epoch: 17, step: 24, loss: 0.32481488585472107, mean loss: 0.35793689753562763
Epoch: 17, step: 25, loss: 0.3138359487056732, mean loss: 0.35793510291737946
Epoch: 17, step: 26, loss: 0.30933883786201477, mean loss: 0.35793312544982886
Epoch: 17, step: 27, loss: 0.3203970491886139, mean loss: 0.35793159810297576
Epoch: 17, step: 28, loss: 0.3657349646091461, mean loss: 0.3579319156098524
Epoch: 17, step: 29, loss: 0.28704577684402466, mean loss: 0.3579290314801931
Epoch: 17, step: 30, loss: 0.4115837812423706, mean loss: 0.3579312144310765
Epoch: 17, step: 31, loss: 0.3418969213962555, mean loss: 0.3579305621001963
Epoch: 17, step: 32, loss: 0.3362058401107788, mean loss: 0.3579296782988054
Epoch: 17, step: 33, loss: 0.34975922107696533, mean loss: 0.35792934592319636
Epoch: 17, step: 34, loss: 0.3093191683292389, mean loss: 0.35792736853322793
Epoch: 17, step: 35, loss: 0.32991451025009155, mean loss: 0.3579262290580293
Epoch: 17, step: 36, loss: 0.3360385596752167, mean loss: 0.3579253387725144
Epoch: 17, step: 37, loss: 0.3686654269695282, mean loss: 0.35792577561007227
Epoch: 17, step: 38, loss: 0.3230411112308502, mean loss: 0.35792435678449863
Epoch: 17, step: 39, loss: 0.33214232325553894, mean loss: 0.35792330822286167
Epoch: 17, step: 40, loss: 0.322541743516922, mean loss: 0.3579218693044548
Epoch: 17, step: 41, loss: 0.30700796842575073, mean loss: 0.35791979879201563
Epoch: 17, step: 42, loss: 0.31744638085365295, mean loss: 0.3579181529289788
Epoch: 17, step: 43, loss: 0.29899683594703674, mean loss: 0.3579157569743195
Epoch: 17, step: 44, loss: 0.345443457365036, mean loss: 0.35791524982595985
Epoch: 17, step: 45, loss: 0.35485753417015076, mean loss: 0.3579151254982516
Epoch: 17, step: 46, loss: 0.3628735840320587, mean loss: 0.3579153271025831
Epoch: 17, step: 47, loss: 0.2934585213661194, mean loss: 0.3579127064811107
Epoch: 17, step: 48, loss: 0.33129677176475525, mean loss: 0.35791162440058394
Epoch: 17, step: 49, loss: 0.3401750922203064, mean loss: 0.3579109033447184
Epoch: 17, step: 50, loss: 0.33395734429359436, mean loss: 0.357909929583222
Epoch: 17, step: 51, loss: 0.3195454478263855, mean loss: 0.35790837005144327
Epoch: 17, step: 52, loss: 0.30916449427604675, mean loss: 0.35790638867362223
Epoch: 17, step: 53, loss: 0.3200019299983978, mean loss: 0.35790484796722943
Epoch: 17, step: 54, loss: 0.36703017354011536, mean loss: 0.3579052188701914
Epoch: 17, step: 55, loss: 0.35539254546165466, mean loss: 0.35790511674560155
Epoch: 17, step: 56, loss: 0.3619271516799927, mean loss: 0.35790528020973217
Epoch: 17, step: 57, loss: 0.31169211864471436, mean loss: 0.35790340208400817
Epoch: 17, step: 58, loss: 0.3192591071128845, mean loss: 0.3579018316245872
Epoch: 17, step: 59, loss: 0.31732481718063354, mean loss: 0.35790018268869467
Epoch: 17, step: 60, loss: 0.3238198459148407, mean loss: 0.35789879781581185
Epoch: 17, step: 61, loss: 0.31932640075683594, mean loss: 0.3578972304693243
Epoch: 17, step: 62, loss: 0.29631298780441284, mean loss: 0.35789472816374285
Epoch: 17, step: 63, loss: 0.33243459463119507, mean loss: 0.3578936937035798
Epoch: 17, step: 64, loss: 0.3285352885723114, mean loss: 0.35789250090281877
Epoch: 17, step: 65, loss: 0.3328491449356079, mean loss: 0.3578914834592514
Epoch: 17, step: 66, loss: 0.32614147663116455, mean loss: 0.3578901935950699
Epoch: 17, step: 67, loss: 0.29151085019111633, mean loss: 0.35788749700165895
Epoch: 17, step: 68, loss: 0.356934130191803, mean loss: 0.3578874582736738
Epoch: 17, step: 69, loss: 0.30769747495651245, mean loss: 0.35788541952221886
Epoch: 17, step: 70, loss: 0.34820422530174255, mean loss: 0.3578850262814609
Epoch: 17, step: 71, loss: 0.3134301006793976, mean loss: 0.35788322063866634
Epoch: 17, step: 72, loss: 0.3584686517715454, mean loss: 0.3578832444163818
Epoch: 17, step: 73, loss: 0.33211272954940796, mean loss: 0.3578821977705014
Epoch: 17, step: 74, loss: 0.34403425455093384, mean loss: 0.3578816353718002
Epoch: 17, step: 75, loss: 0.3681560158729553, mean loss: 0.3578820526224703
Epoch: 17, step: 76, loss: 0.32449108362197876, mean loss: 0.3578806966440337
Epoch: 17, step: 77, loss: 0.32143929600715637, mean loss: 0.3578792168502939
Epoch: 17, step: 78, loss: 0.3765367269515991, mean loss: 0.35787997445414743
Epoch: 17, step: 79, loss: 0.3492386043071747, mean loss: 0.3578796235783091
Epoch: 17, step: 80, loss: 0.35529467463493347, mean loss: 0.3578795186228118
Epoch: 17, step: 81, loss: 0.30375662446022034, mean loss: 0.3578773211849652
Epoch: 17, step: 82, loss: 0.3655037581920624, mean loss: 0.3578776308125486
Epoch: 17, step: 83, loss: 0.3351778984069824, mean loss: 0.35787670925796894
Epoch: 17, step: 84, loss: 0.3505084812641144, mean loss: 0.3578764101377646
Epoch: 17, step: 85, loss: 0.33888599276542664, mean loss: 0.35787563923505405
Epoch: 17, step: 86, loss: 0.31607359647750854, mean loss: 0.357873942379249
Epoch: 17, step: 87, loss: 0.3078112304210663, mean loss: 0.35787191028345594
Epoch: 17, step: 88, loss: 0.32497864961624146, mean loss: 0.3578705751671403
Epoch: 17, step: 89, loss: 0.3656870126724243, mean loss: 0.35787089241843933
Epoch: 17, step: 90, loss: 0.3476189970970154, mean loss: 0.3578704763343726
Epoch: 17, step: 91, loss: 0.3401924669742584, mean loss: 0.357869758882694
Epoch: 17, step: 92, loss: 0.31813493371009827, mean loss: 0.3578681463334804
Epoch: 17, step: 93, loss: 0.3324171304702759, mean loss: 0.3578671135027092
Epoch: 17, step: 94, loss: 0.33503487706184387, mean loss: 0.35786618698254363
Epoch: 17, step: 95, loss: 0.33602550625801086, mean loss: 0.35786530073515177
Epoch: 17, step: 96, loss: 0.34354323148727417, mean loss: 0.3578647196002665
Epoch: 17, step: 97, loss: 0.30151158571243286, mean loss: 0.35786243309803945
Epoch: 17, step: 98, loss: 0.2914988100528717, mean loss: 0.357859740534115
Epoch: 17, step: 99, loss: 0.3304471969604492, mean loss: 0.35785862837314564
Epoch: 17, step: 100, loss: 0.3355865776538849, mean loss: 0.35785772480502037
Epoch: 17, step: 101, loss: 0.34209275245666504, mean loss: 0.35785708525238963
Epoch: 17, step: 102, loss: 0.3121265470981598, mean loss: 0.3578552301334024
Epoch: 17, step: 103, loss: 0.29754725098609924, mean loss: 0.35785278376072893
Epoch: 17, step: 104, loss: 0.3356780707836151, mean loss: 0.35785188428752174
Epoch: 17, step: 105, loss: 0.30376243591308594, mean loss: 0.3578496903454282
Epoch: 17, step: 106, loss: 0.3048842251300812, mean loss: 0.35784754208076724
Epoch: 17, step: 107, loss: 0.33196377754211426, mean loss: 0.3578464922849959
Epoch: 17, step: 108, loss: 0.298570454120636, mean loss: 0.35784408826024977
Epoch: 17, step: 109, loss: 0.3610190153121948, mean loss: 0.3578442170187481
Epoch: 17, step: 110, loss: 0.31522417068481445, mean loss: 0.3578424886418336
Epoch: 17, step: 111, loss: 0.34067195653915405, mean loss: 0.35784179235099406
Epoch: 17, step: 112, loss: 0.32186636328697205, mean loss: 0.35784033355252426
Epoch: 17, step: 113, loss: 0.3284757435321808, mean loss: 0.357839142870908
Epoch: 17, step: 114, loss: 0.3627176582813263, mean loss: 0.3578393406779635
Epoch: 17, step: 115, loss: 0.3223739564418793, mean loss: 0.357837902736663
Epoch: 17, step: 116, loss: 0.354073703289032, mean loss: 0.357837750123671
Epoch: 17, step: 117, loss: 0.3660362660884857, mean loss: 0.3578380825049231
Epoch: 17, step: 118, loss: 0.32652413845062256, mean loss: 0.35783681303785964
Epoch: 17, step: 119, loss: 0.3762661814689636, mean loss: 0.35783756013403406
Epoch: 17, step: 120, loss: 0.35861676931381226, mean loss: 0.3578375917206075
Epoch: 17, step: 121, loss: 0.3331342041492462, mean loss: 0.3578365903672402
Epoch: 17, step: 122, loss: 0.35951754450798035, mean loss: 0.35783665850206003
Epoch: 17, step: 123, loss: 0.32483139634132385, mean loss: 0.3578353207401372
Epoch: 17, step: 124, loss: 0.35900840163230896, mean loss: 0.35783536828526313
Epoch: 17, step: 125, loss: 0.38044387102127075, mean loss: 0.35783628457377475
Epoch: 17, step: 126, loss: 0.3616885244846344, mean loss: 0.3578364406929201
Epoch: 17, step: 127, loss: 0.32954835891723633, mean loss: 0.3578352943125596
Epoch: 17, step: 128, loss: 0.3351028859615326, mean loss: 0.35783437311434463
Epoch: 17, step: 129, loss: 0.33088552951812744, mean loss: 0.35783328109539675
Epoch: 17, step: 130, loss: 0.3091585338115692, mean loss: 0.3578313087809884
Epoch: 17, step: 131, loss: 0.36472970247268677, mean loss: 0.3578315882945091
Epoch: 17, step: 132, loss: 0.32609081268310547, mean loss: 0.3578303022536027
Epoch: 17, step: 133, loss: 0.31508392095565796, mean loss: 0.35782857036877574
Epoch: 17, step: 134, loss: 0.3122137486934662, mean loss: 0.35782672234294116
Epoch: 17, step: 135, loss: 0.3269138038158417, mean loss: 0.3578254699965416
Epoch: 17, step: 136, loss: 0.3975074589252472, mean loss: 0.3578270775310333
Epoch: 17, step: 137, loss: 0.34486737847328186, mean loss: 0.35782655254930046
Epoch: 17, step: 138, loss: 0.323810875415802, mean loss: 0.3578251746711811
Epoch: 17, step: 139, loss: 0.30256274342536926, mean loss: 0.35782293623828876
Epoch: 17, step: 140, loss: 0.3524148464202881, mean loss: 0.35782271718973196
Epoch: 17, step: 141, loss: 0.3310103714466095, mean loss: 0.3578216312300016
Epoch: 17, step: 142, loss: 0.30591505765914917, mean loss: 0.3578195289832894
Epoch: 17, step: 143, loss: 0.33871856331825256, mean loss: 0.35781875541429276
Epoch: 17, step: 144, loss: 0.3481106162071228, mean loss: 0.35781836226079955
Epoch: 17, step: 145, loss: 0.33333057165145874, mean loss: 0.35781737061138635
Epoch: 17, step: 146, loss: 0.33581221103668213, mean loss: 0.35781647953385753
Epoch: 17, step: 147, loss: 0.3334135115146637, mean loss: 0.35781549139942204
Epoch: 17, step: 148, loss: 0.35622304677963257, mean loss: 0.35781542692014845
Epoch: 17, step: 149, loss: 0.31863629817962646, mean loss: 0.3578138405921567
Epoch: 17, step: 150, loss: 0.35957393050193787, mean loss: 0.3578139118537426
Epoch: 17, step: 151, loss: 0.355616956949234, mean loss: 0.3578138229081999
Epoch: 17, step: 152, loss: 0.30923524498939514, mean loss: 0.35781185624377665
Epoch: 17, step: 153, loss: 0.31414085626602173, mean loss: 0.3578100883302483
Epoch: 17, step: 154, loss: 0.3543993830680847, mean loss: 0.35780995026178447
Epoch: 17, step: 155, loss: 0.3173593580722809, mean loss: 0.35780831285115505
Epoch: 17, step: 156, loss: 0.2888402044773102, mean loss: 0.35780552118516135
Epoch: 17, step: 157, loss: 0.34383127093315125, mean loss: 0.35780495556343983
Epoch: 17, step: 158, loss: 0.3231835663318634, mean loss: 0.3578035542848859
Epoch: 17, step: 159, loss: 0.351602703332901, mean loss: 0.357803303319573
Epoch: 17, step: 160, loss: 0.30421191453933716, mean loss: 0.35780113441800754
Epoch: 17, step: 161, loss: 0.3108590841293335, mean loss: 0.3577992346992585
Epoch: 17, step: 162, loss: 0.32544955611228943, mean loss: 0.3577979255786812
Epoch: 17, step: 163, loss: 0.38024574518203735, mean loss: 0.3577988339559717
Epoch: 17, step: 164, loss: 0.323089599609375, mean loss: 0.35779742946301873
Epoch: 17, step: 165, loss: 0.3321247696876526, mean loss: 0.3577963906728684
Epoch: 17, step: 166, loss: 0.31537431478500366, mean loss: 0.3577946742222964
Epoch: 17, step: 167, loss: 0.3517288267612457, mean loss: 0.35779442880040524
Epoch: 17, step: 168, loss: 0.3538377285003662, mean loss: 0.3577942687202863
Epoch: 17, step: 169, loss: 0.3188376724720001, mean loss: 0.35779269267868713
Epoch: 17, step: 170, loss: 0.32784226536750793, mean loss: 0.3577914810428074
Epoch: 17, step: 171, loss: 0.36143070459365845, mean loss: 0.3577916282605886
Epoch: 17, step: 172, loss: 0.3608153760433197, mean loss: 0.3577917505755347
Epoch: 17, step: 173, loss: 0.34735700488090515, mean loss: 0.35779132849213957
Epoch: 17, step: 174, loss: 0.31519049406051636, mean loss: 0.35778960536653054
Epoch: 17, step: 175, loss: 0.31819969415664673, mean loss: 0.35778800409201145
Epoch: 17, step: 176, loss: 0.30158179998397827, mean loss: 0.3577857308380536
Epoch: 17, step: 177, loss: 0.33478280901908875, mean loss: 0.3577848005249492
Epoch: 17, step: 178, loss: 0.3183857202529907, mean loss: 0.3577832071622173
Epoch: 17, step: 179, loss: 0.3101294934749603, mean loss: 0.35778128004665244
Epoch: 17, step: 180, loss: 0.34545785188674927, mean loss: 0.35778078170752997
Epoch: 17, step: 181, loss: 0.32607701420783997, mean loss: 0.3577794997112704
Epoch: 17, step: 182, loss: 0.2980668842792511, mean loss: 0.3577770852268002
Epoch: 17, step: 183, loss: 0.34829163551330566, mean loss: 0.35777670169737624
Epoch: 17, step: 184, loss: 0.3890220522880554, mean loss: 0.3577779650035094
Epoch: 17, step: 185, loss: 0.31829896569252014, mean loss: 0.3577763688605761
Epoch: 17, step: 186, loss: 0.3140813410282135, mean loss: 0.35777460233428415
Epoch: 17, step: 187, loss: 0.3441278636455536, mean loss: 0.3577740506388326
Epoch: 17, step: 188, loss: 0.36186373233795166, mean loss: 0.3577742159653354
Epoch: 17, step: 189, loss: 0.3402610421180725, mean loss: 0.357773508019105
Epoch: 17, step: 190, loss: 0.34177476167678833, mean loss: 0.35777286131768854
Epoch: 17, step: 191, loss: 0.31960082054138184, mean loss: 0.3577713183896054
Epoch: 17, step: 192, loss: 0.2998136281967163, mean loss: 0.35776897581290307
Epoch: 17, step: 193, loss: 0.30367934703826904, mean loss: 0.3577667896667235
Epoch: 17, step: 194, loss: 0.32668259739875793, mean loss: 0.357765533384451
Epoch: 17, step: 195, loss: 0.33451130986213684, mean loss: 0.3577645935920358
Epoch: 17, step: 196, loss: 0.34476956725120544, mean loss: 0.35776406843437397
Epoch: 17, step: 197, loss: 0.32216957211494446, mean loss: 0.3577626300404388
Epoch: 17, step: 198, loss: 0.3850350081920624, mean loss: 0.3577637320882891
Epoch: 17, step: 199, loss: 0.3175545632839203, mean loss: 0.3577621073441157
Epoch: 17, step: 200, loss: 0.3744511008262634, mean loss: 0.3577627816741283
Epoch: 17, step: 201, loss: 0.3181864619255066, mean loss: 0.3577611826309061
Epoch: 17, step: 202, loss: 0.3169146478176117, mean loss: 0.3577595323325419
Epoch: 17, step: 203, loss: 0.3505499064922333, mean loss: 0.35775924105806545
Epoch: 17, step: 204, loss: 0.3196432292461395, mean loss: 0.35775770120383316
Epoch: 17, step: 205, loss: 0.3362511694431305, mean loss: 0.3577568323934687
Epoch: 17, step: 206, loss: 0.3347288966178894, mean loss: 0.35775590215974723
Epoch: 17, step: 207, loss: 0.32877424359321594, mean loss: 0.35775473146744774
Epoch: 17, step: 208, loss: 0.31848791241645813, mean loss: 0.35775314537789527
Epoch: 17, step: 209, loss: 0.3419720530509949, mean loss: 0.357752507964036
Epoch: 17, step: 210, loss: 0.31893378496170044, mean loss: 0.35775094010091546
Epoch: 17, step: 211, loss: 0.31822702288627625, mean loss: 0.3577493438199294
Epoch: 17, step: 212, loss: 0.30337849259376526, mean loss: 0.3577471479937824
Epoch: 17, step: 213, loss: 0.32590457797050476, mean loss: 0.35774586204878506
Epoch: 17, step: 214, loss: 0.33275580406188965, mean loss: 0.35774485287954116
Epoch: 17, step: 215, loss: 0.36065366864204407, mean loss: 0.3577449703410079
Epoch: 17, step: 216, loss: 0.31113797426223755, mean loss: 0.3577430883706433
Epoch: 17, step: 217, loss: 0.3205564320087433, mean loss: 0.35774158685015706
Epoch: 17, step: 218, loss: 0.37503114342689514, mean loss: 0.35774228493860444
Epoch: 17, step: 219, loss: 0.30826663970947266, mean loss: 0.3577402873754088
Epoch: 17, step: 220, loss: 0.33507877588272095, mean loss: 0.3577393724611413
Epoch: 17, step: 221, loss: 0.31702089309692383, mean loss: 0.3577377285984298
Epoch: 17, step: 222, loss: 0.32393670082092285, mean loss: 0.35773636405812953
Epoch: 17, step: 223, loss: 0.3491612374782562, mean loss: 0.35773601789606835
Epoch: 17, step: 224, loss: 0.32770493626594543, mean loss: 0.3577348056455686
Epoch: 17, step: 225, loss: 0.31556329131126404, mean loss: 0.35773310339666514
Epoch: 17, step: 226, loss: 0.3395259976387024, mean loss: 0.35773236849835
Epoch: 17, step: 227, loss: 0.40800055861473083, mean loss: 0.3577343974049579
Epoch: 17, step: 228, loss: 0.3373497426509857, mean loss: 0.3577335746800617
Epoch: 17, step: 229, loss: 0.36547091603279114, mean loss: 0.35773388694664304
Epoch: 17, step: 230, loss: 0.3092058002948761, mean loss: 0.35773192851060237
Epoch: 17, step: 231, loss: 0.3268809914588928, mean loss: 0.3577306835171782
Epoch: 17, step: 232, loss: 0.36856943368911743, mean loss: 0.3577311208986467
Epoch: 17, step: 233, loss: 0.3432932496070862, mean loss: 0.35773053830356594
Epoch: 17, step: 234, loss: 0.29267996549606323, mean loss: 0.35772791349733557
Epoch: 17, step: 235, loss: 0.3373200297355652, mean loss: 0.35772709006755177
Epoch: 17, step: 236, loss: 0.3300835192203522, mean loss: 0.35772597473283935
Epoch: 17, step: 237, loss: 0.31032413244247437, mean loss: 0.35772406228862524
Epoch: 17, step: 238, loss: 0.2996726334095001, mean loss: 0.35772172027753557
Epoch: 17, step: 239, loss: 0.40721946954727173, mean loss: 0.3577237171207367
Epoch: 17, step: 240, loss: 0.3454431891441345, mean loss: 0.3577232217184221
Epoch: 17, step: 241, loss: 0.3345637917518616, mean loss: 0.3577222874937361
Epoch: 17, step: 242, loss: 0.34596601128578186, mean loss: 0.35772181327824626
Epoch: 17, step: 243, loss: 0.32726290822029114, mean loss: 0.35772058470027523
Epoch: 17, step: 244, loss: 0.33905133605003357, mean loss: 0.35771983169544924
Epoch: 17, step: 245, loss: 0.3558973968029022, mean loss: 0.3577197581923883
Epoch: 17, step: 246, loss: 0.37063971161842346, mean loss: 0.3577202792633069
Epoch: 17, step: 247, loss: 0.3630116581916809, mean loss: 0.35772049265977923
Epoch: 17, step: 248, loss: 0.33951589465141296, mean loss: 0.35771975851460003
Epoch: 17, step: 249, loss: 0.30979958176612854, mean loss: 0.35771782609356817
Epoch: 17, step: 250, loss: 0.33480212092399597, mean loss: 0.35771690203593803
Epoch: 17, step: 251, loss: 0.33837053179740906, mean loss: 0.3577161219403639
Epoch: 17, step: 252, loss: 0.32964736223220825, mean loss: 0.3577149901811724
Epoch: 17, step: 253, loss: 0.3145528733730316, mean loss: 0.3577132499135808
Epoch: 17, step: 254, loss: 0.3425056040287018, mean loss: 0.357712636776223
Epoch: 17, step: 255, loss: 0.3204694092273712, mean loss: 0.35771113527535425
Epoch: 17, step: 256, loss: 0.3721981942653656, mean loss: 0.3577117193132091
Epoch: 17, step: 257, loss: 0.3092626929283142, mean loss: 0.3577097661959639
Epoch: 17, step: 258, loss: 0.3288237154483795, mean loss: 0.3577086017645233
Epoch: 17, step: 259, loss: 0.3153649866580963, mean loss: 0.35770689491128616
Epoch: 17, step: 260, loss: 0.3131459355354309, mean loss: 0.35770509875024076
Epoch: 17, step: 261, loss: 0.30359387397766113, mean loss: 0.35770291772546153
Epoch: 17, step: 262, loss: 0.34029620885849, mean loss: 0.35770221615322073
Epoch: 17, step: 263, loss: 0.3243969976902008, mean loss: 0.35770087385036475
Epoch: 17, step: 264, loss: 0.36453723907470703, mean loss: 0.3577011493658294
Epoch: 17, step: 265, loss: 0.31990355253219604, mean loss: 0.35769962612907463
Epoch: 17, step: 266, loss: 0.33066198229789734, mean loss: 0.35769853656051404
Epoch: 17, step: 267, loss: 0.34379842877388, mean loss: 0.357697976433669
Epoch: 17, step: 268, loss: 0.3026272654533386, mean loss: 0.3576957573616224
Epoch: 17, step: 269, loss: 0.3364467918872833, mean loss: 0.3576949011699279
Epoch: 17, step: 270, loss: 0.3177061378955841, mean loss: 0.357693289954195
Epoch: 17, step: 271, loss: 0.32306474447250366, mean loss: 0.3576918947670282
Epoch: 17, step: 272, loss: 0.3221288025379181, mean loss: 0.35769046198461696
Epoch: 17, step: 273, loss: 0.3693796992301941, mean loss: 0.35769093290707465
Epoch: 17, step: 274, loss: 0.32603850960731506, mean loss: 0.357689657782259
Epoch: 17, step: 275, loss: 0.3009416162967682, mean loss: 0.3576873717670525
Epoch: 17, step: 276, loss: 0.3468691110610962, mean loss: 0.35768693598615803
Epoch: 17, step: 277, loss: 0.37621498107910156, mean loss: 0.35768768230232223
Epoch: 17, step: 278, loss: 0.3618699610233307, mean loss: 0.3576878507591926
Epoch: 17, step: 279, loss: 0.3775959610939026, mean loss: 0.35768865260027266
Epoch: 17, step: 280, loss: 0.30487650632858276, mean loss: 0.35768652556550395
Epoch: 17, step: 281, loss: 0.3496628701686859, mean loss: 0.3576862024219117
Epoch: 17, step: 282, loss: 0.3267851769924164, mean loss: 0.3576849579683887
Epoch: 17, step: 283, loss: 0.33297625184059143, mean loss: 0.3576839629335092
Epoch: 17, step: 284, loss: 0.33134859800338745, mean loss: 0.35768290243478046
Epoch: 17, step: 285, loss: 0.31776073575019836, mean loss: 0.3576812948739089
Epoch: 17, step: 286, loss: 0.33661481738090515, mean loss: 0.357680446616309
Epoch: 17, step: 287, loss: 0.3115585744380951, mean loss: 0.35767858955912674
Epoch: 17, step: 288, loss: 0.3191334307193756, mean loss: 0.35767703763422276
Epoch: 17, step: 289, loss: 0.3559642434120178, mean loss: 0.357676968675602
Epoch: 17, step: 290, loss: 0.35118409991264343, mean loss: 0.3576767072774474
Epoch: 17, step: 291, loss: 0.34148186445236206, mean loss: 0.3576760553111501
Epoch: 17, step: 292, loss: 0.3053446114063263, mean loss: 0.3576739486550612
Epoch: 17, step: 293, loss: 0.3235757648944855, mean loss: 0.3576725760528649
Epoch: 17, step: 294, loss: 0.34904831647872925, mean loss: 0.3576722289023769
Epoch: 17, step: 295, loss: 0.3522997796535492, mean loss: 0.35767201265502346
Epoch: 17, step: 296, loss: 0.3325527012348175, mean loss: 0.357671001614113
Epoch: 17, step: 297, loss: 0.2930205464363098, mean loss: 0.3576683995672975
Epoch: 17, step: 298, loss: 0.3522432744503021, mean loss: 0.3576681812260444
Epoch: 17, step: 299, loss: 0.3063904047012329, mean loss: 0.35766611756794214
Epoch: 17, step: 300, loss: 0.3637007176876068, mean loss: 0.3576663604187659
Epoch: 17, step: 301, loss: 0.34396451711654663, mean loss: 0.35766580903674167
Epoch: 17, step: 302, loss: 0.3222968876361847, mean loss: 0.357664385797379
Epoch: 17, step: 303, loss: 0.3353980481624603, mean loss: 0.3576634898398048
Epoch: 17, step: 304, loss: 0.32940730452537537, mean loss: 0.35766235290722864
Epoch: 17, step: 305, loss: 0.34376853704452515, mean loss: 0.35766179388993313
Epoch: 17, step: 306, loss: 0.33240675926208496, mean loss: 0.35766077779519856
Epoch: 17, step: 307, loss: 0.3790976405143738, mean loss: 0.35766164023737423
Epoch: 17, step: 308, loss: 0.337507039308548, mean loss: 0.3576608294154356
Epoch: 17, step: 309, loss: 0.32696446776390076, mean loss: 0.3576595945469163
Epoch: 17, step: 310, loss: 0.34448638558387756, mean loss: 0.3576590646298254
Epoch: 17, step: 311, loss: 0.31180086731910706, mean loss: 0.3576572199718483
Epoch: 17, step: 312, loss: 0.33368393778800964, mean loss: 0.3576562556790932
Epoch: 17, step: 313, loss: 0.33631953597068787, mean loss: 0.3576553974730073
Epoch: 17, step: 314, loss: 0.32574623823165894, mean loss: 0.3576541140736089
Epoch: 17, step: 315, loss: 0.2996022701263428, mean loss: 0.35765177929867537
Epoch: 17, step: 316, loss: 0.3772745132446289, mean loss: 0.35765256846955595
Epoch: 17, step: 317, loss: 0.34371745586395264, mean loss: 0.3576520080612633
Epoch: 17, step: 318, loss: 0.3188360631465912, mean loss: 0.3576504471192552
Epoch: 17, step: 319, loss: 0.3294123411178589, mean loss: 0.35764931159947067
Epoch: 17, step: 320, loss: 0.34476011991500854, mean loss: 0.3576487933159979
Epoch: 17, step: 321, loss: 0.3604883849620819, mean loss: 0.3576489074933862
Epoch: 17, step: 322, loss: 0.30284082889556885, mean loss: 0.3576467037991802
Epoch: 17, step: 323, loss: 0.347569078207016, mean loss: 0.3576462986196372
Epoch: 17, step: 324, loss: 0.3507002592086792, mean loss: 0.35764601935941887
Epoch: 17, step: 325, loss: 0.3657904863357544, mean loss: 0.3576463467883397
Epoch: 17, step: 326, loss: 0.3291431665420532, mean loss: 0.3576452009318474
Epoch: 17, step: 327, loss: 0.32768601179122925, mean loss: 0.3576439965907499
Epoch: 17, step: 328, loss: 0.313711941242218, mean loss: 0.3576422306199597
Epoch: 17, step: 329, loss: 0.3332653045654297, mean loss: 0.3576412507612068
Epoch: 17, step: 330, loss: 0.35064083337783813, mean loss: 0.3576409693826392
Epoch: 17, step: 331, loss: 0.3633838891983032, mean loss: 0.3576412002073906
Epoch: 17, step: 332, loss: 0.3407976031303406, mean loss: 0.3576405232411482
Epoch: 17, step: 333, loss: 0.3742857277393341, mean loss: 0.3576411922068462
Epoch: 17, step: 334, loss: 0.3393397033214569, mean loss: 0.35764045670514283
Epoch: 17, step: 335, loss: 0.3535195589065552, mean loss: 0.35764029110082685
Epoch: 17, step: 336, loss: 0.34914612770080566, mean loss: 0.3576399497641421
Epoch: 17, step: 337, loss: 0.33017292618751526, mean loss: 0.35763884605026375
Epoch: 17, step: 338, loss: 0.326352059841156, mean loss: 0.3576375888964803
Epoch: 17, step: 339, loss: 0.31297338008880615, mean loss: 0.35763579428828324
Epoch: 17, step: 340, loss: 0.3339754641056061, mean loss: 0.35763484365426085
Epoch: 17, step: 341, loss: 0.3029659688472748, mean loss: 0.3576326472350239
Epoch: 17, step: 342, loss: 0.32168909907341003, mean loss: 0.3576312031970921
Epoch: 17, step: 343, loss: 0.31137263774871826, mean loss: 0.35762934482631237
Epoch: 17, step: 344, loss: 0.3444008529186249, mean loss: 0.3576288134121836
Epoch: 17, step: 345, loss: 0.3239523470401764, mean loss: 0.35762746061768
Epoch: 17, step: 346, loss: 0.33521345257759094, mean loss: 0.35762656027592304
Epoch: 17, step: 347, loss: 0.3284798860549927, mean loss: 0.35762538953868733
Epoch: 17, step: 348, loss: 0.301155686378479, mean loss: 0.3576231214058537
Epoch: 17, step: 349, loss: 0.32114818692207336, mean loss: 0.35762165643137844
Epoch: 17, step: 350, loss: 0.3475933372974396, mean loss: 0.357621253671463
Epoch: 17, step: 351, loss: 0.3331669569015503, mean loss: 0.35762027157119114
Epoch: 17, step: 352, loss: 0.36053645610809326, mean loss: 0.35762038868233276
Epoch: 17, step: 353, loss: 0.35286518931388855, mean loss: 0.35762019772580844
Epoch: 17, step: 354, loss: 0.3330625891685486, mean loss: 0.3576192115952797
Epoch: 17, step: 355, loss: 0.2796494960784912, mean loss: 0.35761608078434504
Epoch: 17, step: 356, loss: 0.31728893518447876, mean loss: 0.3576144615454131
Epoch: 17, step: 357, loss: 0.3116355240345001, mean loss: 0.3576126154465811
Epoch: 17, step: 358, loss: 0.37515631318092346, mean loss: 0.35761331981474
Epoch: 17, step: 359, loss: 0.386129766702652, mean loss: 0.35761446468574076
Epoch: 17, step: 360, loss: 0.3386734127998352, mean loss: 0.35761370427577305
Epoch: 17, step: 361, loss: 0.33578282594680786, mean loss: 0.3576128278856354
Epoch: 17, step: 362, loss: 0.33819475769996643, mean loss: 0.35761204838781574
Epoch: 17, step: 363, loss: 0.31814464926719666, mean loss: 0.35761046411521136
Epoch: 17, step: 364, loss: 0.36909395456314087, mean loss: 0.35761092505891334
Epoch: 17, step: 365, loss: 0.3483898341655731, mean loss: 0.35761055494207566
Epoch: 17, step: 366, loss: 0.35518956184387207, mean loss: 0.35761045777197337
Epoch: 17, step: 367, loss: 0.32512912154197693, mean loss: 0.35760915413831507
Epoch: 17, step: 368, loss: 0.34769392013549805, mean loss: 0.35760875620782573
Epoch: 17, step: 369, loss: 0.3306838572025299, mean loss: 0.35760767566769386
Epoch: 17, step: 370, loss: 0.3103056848049164, mean loss: 0.3576057774377945
Epoch: 17, step: 371, loss: 0.3488672077655792, mean loss: 0.3576054267728799
Epoch: 17, step: 372, loss: 0.34246861934661865, mean loss: 0.3576048193812252
Epoch: 17, step: 373, loss: 0.3397086262702942, mean loss: 0.3576041012930657
Epoch: 17, step: 374, loss: 0.3087054491043091, mean loss: 0.357602139304052
Epoch: 17, step: 375, loss: 0.2922428846359253, mean loss: 0.35759951696194525
Epoch: 17, step: 376, loss: 0.3802628815174103, mean loss: 0.3576004262243146
Epoch: 17, step: 377, loss: 0.33626797795295715, mean loss: 0.3575995703931234
Epoch: 17, step: 378, loss: 0.34680721163749695, mean loss: 0.3575991374345341
Epoch: 17, step: 379, loss: 0.332838237285614, mean loss: 0.35759814413783364
Epoch: 17, step: 380, loss: 0.3451457917690277, mean loss: 0.3575976446251228
Epoch: 17, step: 381, loss: 0.32211726903915405, mean loss: 0.35759622142513936
Epoch: 17, step: 382, loss: 0.33498644828796387, mean loss: 0.35759531453118654
Epoch: 17, step: 383, loss: 0.36507391929626465, mean loss: 0.3575956144912686
Epoch: 17, step: 384, loss: 0.37110304832458496, mean loss: 0.3575961562405099
Epoch: 17, step: 385, loss: 0.33483144640922546, mean loss: 0.35759524324180003
Epoch: 17, step: 386, loss: 0.38094958662986755, mean loss: 0.35759617985071873
Epoch: 17, step: 387, loss: 0.3397711515426636, mean loss: 0.3575954650196188
Epoch: 17, step: 388, loss: 0.33256784081459045, mean loss: 0.3575944613854926
Epoch: 17, step: 389, loss: 0.31024277210235596, mean loss: 0.3575925626089555
Epoch: 17, step: 390, loss: 0.3139488101005554, mean loss: 0.357590812588806
Epoch: 17, step: 391, loss: 0.3476340174674988, mean loss: 0.3575904133588492
Epoch: 17, step: 392, loss: 0.3033389747142792, mean loss: 0.3575882381678527
Epoch: 17, step: 393, loss: 0.310107946395874, mean loss: 0.3575863345397646
Epoch: 17, step: 394, loss: 0.3211623728275299, mean loss: 0.35758487425183966
Epoch: 17, step: 395, loss: 0.3537366986274719, mean loss: 0.35758471997924407
Epoch: 17, step: 396, loss: 0.32724374532699585, mean loss: 0.35758350366436525
Epoch: 17, step: 397, loss: 0.3505703806877136, mean loss: 0.3575832225322007
Epoch: 17, step: 398, loss: 0.35170191526412964, mean loss: 0.3575829867801156
Epoch: 17, step: 399, loss: 0.359285444021225, mean loss: 0.3575830550203449
Epoch: 17, step: 400, loss: 0.3062012195587158, mean loss: 0.3575809955455979
Epoch: 17, step: 401, loss: 0.30917128920555115, mean loss: 0.3575790552768067
Epoch: 17, step: 402, loss: 0.33817818760871887, mean loss: 0.3575782777180849
Epoch: 17, step: 403, loss: 0.30136948823928833, mean loss: 0.3575760250413665
Epoch: 17, step: 404, loss: 0.3535272181034088, mean loss: 0.3575758627840452
Epoch: 17, step: 405, loss: 0.3322690725326538, mean loss: 0.3575748486464219
Epoch: 17, step: 406, loss: 0.30794379115104675, mean loss: 0.3575728598242422
Epoch: 17, step: 407, loss: 0.3494623005390167, mean loss: 0.3575725348298807
Epoch: 17, step: 408, loss: 0.31343865394592285, mean loss: 0.35757076643300273
Epoch: 17, step: 409, loss: 0.3624510169029236, mean loss: 0.35757096197152627
Epoch: 17, step: 410, loss: 0.33640655875205994, mean loss: 0.35757011400473193
Epoch: 17, step: 411, loss: 0.3282765746116638, mean loss: 0.35756894038536524
Epoch: 17, step: 412, loss: 0.3266201913356781, mean loss: 0.3575677005011839
Epoch: 17, step: 413, loss: 0.32686883211135864, mean loss: 0.3575664706771157
Epoch: 17, step: 414, loss: 0.3719014525413513, mean loss: 0.35756704492627905
Epoch: 17, step: 415, loss: 0.3111610412597656, mean loss: 0.35756518600929194
Epoch: 17, step: 416, loss: 0.3031180202960968, mean loss: 0.35756300506934746
Epoch: 17, step: 417, loss: 0.36252060532569885, mean loss: 0.3575632036434184
Epoch: 17, step: 418, loss: 0.34489884972572327, mean loss: 0.3575626963997
Epoch: 17, step: 419, loss: 0.3554297387599945, mean loss: 0.357562610972047
Epoch: 17, step: 420, loss: 0.3331729769706726, mean loss: 0.35756163417545916
Epoch: 17, step: 421, loss: 0.32281002402305603, mean loss: 0.3575602424409717
Epoch: 17, step: 422, loss: 0.3342748284339905, mean loss: 0.3575593099427134
Epoch: 17, step: 423, loss: 0.33801180124282837, mean loss: 0.3575585271656551
Epoch: 17, step: 424, loss: 0.3551357388496399, mean loss: 0.35755843014934485
Epoch: 17, step: 425, loss: 0.3551269769668579, mean loss: 0.3575583327899638
Epoch: 17, step: 426, loss: 0.3663746118545532, mean loss: 0.3575586857941305
Epoch: 17, step: 427, loss: 0.34476014971733093, mean loss: 0.3575581733607514
Epoch: 17, step: 428, loss: 0.3648551404476166, mean loss: 0.3575584655082105
Epoch: 17, step: 429, loss: 0.37079429626464844, mean loss: 0.3575589954077524
Epoch: 17, step: 430, loss: 0.320333331823349, mean loss: 0.3575575051293752
Epoch: 17, step: 431, loss: 0.3300016522407532, mean loss: 0.35755640201276634
Epoch: 17, step: 432, loss: 0.3514159023761749, mean loss: 0.3575561562059677
Epoch: 17, step: 433, loss: 0.3223385214805603, mean loss: 0.35755474648558
Epoch: 17, step: 434, loss: 0.31824344396591187, mean loss: 0.3575531729634842
Epoch: 17, step: 435, loss: 0.3597273528575897, mean loss: 0.3575532599863746
Epoch: 17, step: 436, loss: 0.3633444607257843, mean loss: 0.35755349177347645
Epoch: 17, step: 437, loss: 0.3256879448890686, mean loss: 0.35755221643741286
Epoch: 17, step: 438, loss: 0.304624080657959, mean loss: 0.3575500982105037
Epoch: 17, step: 439, loss: 0.36234718561172485, mean loss: 0.3575502901861481
Epoch: 17, step: 440, loss: 0.36879777908325195, mean loss: 0.3575507402837469
Epoch: 17, step: 441, loss: 0.31229034066200256, mean loss: 0.3575489291433058
Epoch: 17, step: 442, loss: 0.36190930008888245, mean loss: 0.3575491036209556
Epoch: 17, step: 443, loss: 0.31727197766304016, mean loss: 0.357547492020205
Epoch: 17, step: 444, loss: 0.34494733810424805, mean loss: 0.35754698787288713
Epoch: 17, step: 445, loss: 0.29863086342811584, mean loss: 0.3575446306621788
Epoch: 17, step: 446, loss: 0.35638171434402466, mean loss: 0.35754458413622087
Epoch: 17, step: 447, loss: 0.460252046585083, mean loss: 0.35754869309215176
Epoch: 17, step: 448, loss: 0.35704076290130615, mean loss: 0.3575486727725058
Epoch: 17, step: 449, loss: 0.3211060166358948, mean loss: 0.3575472149496345
Epoch: 17, step: 450, loss: 0.33511221408843994, mean loss: 0.3575463175137026
Epoch: 17, step: 451, loss: 0.3057152330875397, mean loss: 0.35754424427032555
Epoch: 17, step: 452, loss: 0.32323259115219116, mean loss: 0.3575428718590973
Epoch: 17, step: 453, loss: 0.32643190026283264, mean loss: 0.3575416275197806
Epoch: 17, step: 454, loss: 0.3358978033065796, mean loss: 0.35754076187068995
Epoch: 17, step: 455, loss: 0.3292519152164459, mean loss: 0.35753963049784343
Epoch: 17, step: 456, loss: 0.3121255338191986, mean loss: 0.3575378142972164
Epoch: 17, step: 457, loss: 0.356001079082489, mean loss: 0.35753775284255696
Epoch: 17, step: 458, loss: 0.338288277387619, mean loss: 0.35753698307907256
Epoch: 17, step: 459, loss: 0.3425978720188141, mean loss: 0.3575363857057896
Epoch: 17, step: 460, loss: 0.3562663197517395, mean loss: 0.35753633492143383
Epoch: 17, step: 461, loss: 0.3422711491584778, mean loss: 0.35753572455814864
Epoch: 17, step: 462, loss: 0.3281066119670868, mean loss: 0.35753454791136957
Epoch: 17, step: 463, loss: 0.34248366951942444, mean loss: 0.3575339461650721
Epoch: 17, step: 464, loss: 0.3143707811832428, mean loss: 0.3575322205358001
Epoch: 17, step: 465, loss: 0.3264402747154236, mean loss: 0.35753097755403707
Epoch: 17, step: 466, loss: 0.32526811957359314, mean loss: 0.35752968781356215
Epoch: 17, step: 467, loss: 0.32606834173202515, mean loss: 0.3575284301646142
Epoch: 17, step: 468, loss: 0.33410584926605225, mean loss: 0.35752749389803956
Epoch: 17, step: 469, loss: 0.31491321325302124, mean loss: 0.35752579055322203
Epoch: 17, step: 470, loss: 0.3573179244995117, mean loss: 0.35752578224489423
Epoch: 17, step: 471, loss: 0.3147568702697754, mean loss: 0.3575240728559264
Epoch: 17, step: 472, loss: 0.3171197175979614, mean loss: 0.357522458038163
Epoch: 17, step: 473, loss: 0.34963029623031616, mean loss: 0.35752214262925053
Epoch: 17, step: 474, loss: 0.29739218950271606, mean loss: 0.35751973964187383
Epoch: 17, step: 475, loss: 0.32184121012687683, mean loss: 0.3575183138694348
Epoch: 17, step: 476, loss: 0.3584679961204529, mean loss: 0.3575183518187755
Epoch: 17, step: 477, loss: 0.29932549595832825, mean loss: 0.35751602652284886
Epoch: 17, step: 478, loss: 0.3352818489074707, mean loss: 0.3575151381152245
Epoch: 17, step: 479, loss: 0.33374878764152527, mean loss: 0.35751418852474687
Epoch: 17, step: 480, loss: 0.37023043632507324, mean loss: 0.35751469658530866
Epoch: 17, step: 481, loss: 0.3611370325088501, mean loss: 0.3575148413050819
Epoch: 17, step: 482, loss: 0.37352609634399414, mean loss: 0.3575154809621087
Epoch: 17, step: 483, loss: 0.3379825949668884, mean loss: 0.3575147006454742
Epoch: 17, step: 484, loss: 0.3440854549407959, mean loss: 0.35751416418377546
Epoch: 17, step: 485, loss: 0.3511715531349182, mean loss: 0.35751391082390294
Epoch: 17, step: 486, loss: 0.30451706051826477, mean loss: 0.3575117939135652
Epoch: 17, step: 487, loss: 0.3203868567943573, mean loss: 0.35751031105140196
Epoch: 17, step: 488, loss: 0.37691494822502136, mean loss: 0.357511086089832
Epoch: 17, step: 489, loss: 0.34370139241218567, mean loss: 0.35751053454043996
Epoch: 17, step: 490, loss: 0.31937333941459656, mean loss: 0.35750901142868924
Epoch: 17, step: 491, loss: 0.32617366313934326, mean loss: 0.35750776001701634
Epoch: 17, step: 492, loss: 0.32378801703453064, mean loss: 0.3575064134356904
Epoch: 17, step: 493, loss: 0.35573938488960266, mean loss: 0.35750634287309374
Epoch: 17, step: 494, loss: 0.34313586354255676, mean loss: 0.35750576904091186
Epoch: 17, step: 495, loss: 0.3001978099346161, mean loss: 0.3575034807499397
Epoch: 17, step: 496, loss: 0.35151737928390503, mean loss: 0.357503241736106
Epoch: 17, step: 497, loss: 0.373002290725708, mean loss: 0.3575038605594307
Epoch: 17, step: 498, loss: 0.33608219027519226, mean loss: 0.3575030053005061
Epoch: 17, step: 499, loss: 0.37239184975624084, mean loss: 0.3575035997130123
Epoch: 17, step: 500, loss: 0.3403763175010681, mean loss: 0.35750291596187606
Epoch: 17, step: 501, loss: 0.35155564546585083, mean loss: 0.3575026785458882
Epoch: 17, step: 502, loss: 0.332618772983551, mean loss: 0.3575016852160585
Epoch: 17, step: 503, loss: 0.3664831221103668, mean loss: 0.3575020437278298
Epoch: 17, step: 504, loss: 0.32361945509910583, mean loss: 0.3575006912914498
Epoch: 17, step: 505, loss: 0.3331736922264099, mean loss: 0.35749972030880967
Epoch: 17, step: 506, loss: 0.335103303194046, mean loss: 0.35749882641868336
Epoch: 17, step: 507, loss: 0.3014717102050781, mean loss: 0.3574965903428447
Epoch: 17, step: 508, loss: 0.35020601749420166, mean loss: 0.35749629938331845
Epoch: 17, step: 509, loss: 0.3421657383441925, mean loss: 0.35749568758025996
Epoch: 17, step: 510, loss: 0.3441728949546814, mean loss: 0.3574951559232654
Epoch: 17, step: 511, loss: 0.3018063008785248, mean loss: 0.3574929337023937
Epoch: 17, step: 512, loss: 0.34478241205215454, mean loss: 0.35749242651905505
Epoch: 17, step: 513, loss: 0.3363941013813019, mean loss: 0.3574915846738257
Epoch: 17, step: 514, loss: 0.3095240890979767, mean loss: 0.3574896707969723
Epoch: 17, step: 515, loss: 0.302185982465744, mean loss: 0.3574874642980762
Epoch: 17, step: 516, loss: 0.3383609652519226, mean loss: 0.35748670122211185
Epoch: 17, step: 517, loss: 0.29613032937049866, mean loss: 0.35748425342941054
Epoch: 17, step: 518, loss: 0.34198543429374695, mean loss: 0.3574836351336777
Epoch: 17, step: 519, loss: 0.3961763083934784, mean loss: 0.35748517864226476
Epoch: 17, step: 520, loss: 0.30745822191238403, mean loss: 0.3574831830717701
Epoch: 17, step: 521, loss: 0.33847230672836304, mean loss: 0.35748242475998937
Epoch: 17, step: 522, loss: 0.30514103174209595, mean loss: 0.35748033703341214
Epoch: 17, step: 523, loss: 0.3372008502483368, mean loss: 0.3574795281834287
Epoch: 17, step: 524, loss: 0.3375493288040161, mean loss: 0.3574787332965233
Epoch: 17, step: 525, loss: 0.3425029516220093, mean loss: 0.35747813603315587
Epoch: 17, step: 526, loss: 0.31560906767845154, mean loss: 0.3574764662796821
Epoch: 17, step: 527, loss: 0.3332383632659912, mean loss: 0.35747549969398207
Epoch: 17, step: 528, loss: 0.329039990901947, mean loss: 0.3574743657661282
Epoch: 17, step: 529, loss: 0.33828258514404297, mean loss: 0.3574736004825879
Epoch: 17, step: 530, loss: 0.3539074659347534, mean loss: 0.3574734582865455
Epoch: 17, step: 531, loss: 0.32490673661231995, mean loss: 0.3574721597729221
Epoch: 17, step: 532, loss: 0.35946449637413025, mean loss: 0.3574722392090132
Epoch: 17, step: 533, loss: 0.2922472059726715, mean loss: 0.3574696387372312
Epoch: 17, step: 534, loss: 0.3207288980484009, mean loss: 0.35746817397062874
Epoch: 17, step: 535, loss: 0.323836088180542, mean loss: 0.3574668331922126
Epoch: 17, step: 536, loss: 0.39869850873947144, mean loss: 0.3574684768707276
Epoch: 17, step: 537, loss: 0.34307920932769775, mean loss: 0.3574679032732013
Epoch: 17, step: 538, loss: 0.35407555103302, mean loss: 0.35746776804968955
Epoch: 17, step: 539, loss: 0.3401908874511719, mean loss: 0.35746707939851774
Epoch: 17, step: 540, loss: 0.33649781346321106, mean loss: 0.35746624360331125
Epoch: 17, step: 541, loss: 0.3817625641822815, mean loss: 0.3574672119700143
Epoch: 17, step: 542, loss: 0.3069493770599365, mean loss: 0.3574651985853381
Epoch: 17, step: 543, loss: 0.31058835983276367, mean loss: 0.35746333038675876
Epoch: 17, step: 544, loss: 0.3177328407764435, mean loss: 0.35746174705716044
Epoch: 17, step: 545, loss: 0.35549789667129517, mean loss: 0.3574616687974017
Epoch: 17, step: 546, loss: 0.35153117775917053, mean loss: 0.3574614324757823
Epoch: 17, step: 547, loss: 0.3153332471847534, mean loss: 0.3574597537945068
Epoch: 17, step: 548, loss: 0.3193107545375824, mean loss: 0.35745823373237756
Epoch: 17, step: 549, loss: 0.37087228894233704, mean loss: 0.3574587681994749
Epoch: 17, step: 550, loss: 0.41003885865211487, mean loss: 0.3574608631072582
Epoch: 17, step: 551, loss: 0.33379435539245605, mean loss: 0.35745992021850465
Epoch: 17, step: 552, loss: 0.3198467791080475, mean loss: 0.35745842174668635
Epoch: 17, step: 553, loss: 0.3212791681289673, mean loss: 0.3574569804570035
Epoch: 17, step: 554, loss: 0.3046344518661499, mean loss: 0.35745487622529454
Epoch: 17, step: 555, loss: 0.3725067973136902, mean loss: 0.35745547580787457
Epoch: 17, step: 556, loss: 0.33725494146347046, mean loss: 0.35745467116599666
Epoch: 17, step: 557, loss: 0.3084975481033325, mean loss: 0.3574527211491456
Epoch: 17, step: 558, loss: 0.3353477418422699, mean loss: 0.35745184071821773
Epoch: 17, step: 559, loss: 0.32986685633659363, mean loss: 0.35745074206502425
Epoch: 17, step: 560, loss: 0.3404534161090851, mean loss: 0.3574500651234513
Epoch: 17, step: 561, loss: 0.34683361649513245, mean loss: 0.3574496423258158
Epoch: 17, step: 562, loss: 0.31879448890686035, mean loss: 0.3574481029544877
Epoch: 17, step: 563, loss: 0.3603360056877136, mean loss: 0.357448217955393
Epoch: 17, step: 564, loss: 0.33932116627693176, mean loss: 0.3574474961359497
Epoch: 17, step: 565, loss: 0.3460950553417206, mean loss: 0.3574470440996037
Epoch: 17, step: 566, loss: 0.32831716537475586, mean loss: 0.3574458842398098
Epoch: 17, step: 567, loss: 0.3280198276042938, mean loss: 0.35744471263379624
Epoch: 17, step: 568, loss: 0.29840925335884094, mean loss: 0.3574423622153834
Epoch: 17, step: 569, loss: 0.3437497913837433, mean loss: 0.3574418170855629
Epoch: 17, step: 570, loss: 0.32607948780059814, mean loss: 0.35744056853548983
Epoch: 17, step: 571, loss: 0.3064456284046173, mean loss: 0.3574385384821407
Epoch: 17, step: 572, loss: 0.3138876259326935, mean loss: 0.3574368048364837
Epoch: 17, step: 573, loss: 0.3800995945930481, mean loss: 0.3574377069457806
Epoch: 17, step: 574, loss: 0.3428383469581604, mean loss: 0.35743712583046844
Epoch: 17, step: 575, loss: 0.3219931125640869, mean loss: 0.35743571506732297
Epoch: 17, step: 576, loss: 0.3452107608318329, mean loss: 0.3574352285019803
Epoch: 17, step: 577, loss: 0.34313273429870605, mean loss: 0.3574346592711356
Epoch: 17, step: 578, loss: 0.3234822452068329, mean loss: 0.3574333080388331
Epoch: 17, step: 579, loss: 0.3081660270690918, mean loss: 0.35743134738613613
Epoch: 17, step: 580, loss: 0.29528722167015076, mean loss: 0.3574288743818098
Epoch: 17, step: 581, loss: 0.32339441776275635, mean loss: 0.3574275200460908
Epoch: 17, step: 582, loss: 0.34590238332748413, mean loss: 0.35742706144369857
Epoch: 17, step: 583, loss: 0.3561302721500397, mean loss: 0.3574270098445702
Epoch: 17, step: 584, loss: 0.31902259588241577, mean loss: 0.3574254817972236
Epoch: 17, step: 585, loss: 0.3482382893562317, mean loss: 0.35742511626875856
Epoch: 17, step: 586, loss: 0.3315686285495758, mean loss: 0.3574240875642541
Epoch: 17, step: 587, loss: 0.35162508487701416, mean loss: 0.3574238568591822
Epoch: 17, step: 588, loss: 0.30489757657051086, mean loss: 0.3574217672589798
Epoch: 17, step: 589, loss: 0.3329755365848541, mean loss: 0.35742079477784866
Epoch: 17, step: 590, loss: 0.3841370940208435, mean loss: 0.35742185752096667
Epoch: 17, step: 591, loss: 0.3841116428375244, mean loss: 0.3574229191671606
Epoch: 17, step: 592, loss: 0.33829838037490845, mean loss: 0.3574221584759076
Epoch: 17, step: 593, loss: 0.3294292390346527, mean loss: 0.3574210450832005
Epoch: 17, step: 594, loss: 0.321674644947052, mean loss: 0.3574196233594549
Epoch: 17, step: 595, loss: 0.34065866470336914, mean loss: 0.35741895676071733
Epoch: 17, step: 596, loss: 0.32852932810783386, mean loss: 0.35741780783931537
Epoch: 17, step: 597, loss: 0.317905992269516, mean loss: 0.3574162365430627
Epoch: 17, step: 598, loss: 0.2986502945423126, mean loss: 0.3574138996463354
Epoch: 17, step: 599, loss: 0.36205658316612244, mean loss: 0.3574140842607588
Epoch: 17, step: 600, loss: 0.40600159764289856, mean loss: 0.35741601624665814
Epoch: 17, step: 601, loss: 0.33693933486938477, mean loss: 0.357415202064496
Epoch: 17, step: 602, loss: 0.3671656548976898, mean loss: 0.357415589741043
Epoch: 17, step: 603, loss: 0.3155764937400818, mean loss: 0.35741392629097934
Epoch: 17, step: 604, loss: 0.3556324243545532, mean loss: 0.3574138554643608
Epoch: 17, step: 605, loss: 0.373579740524292, mean loss: 0.35741449814087584
Epoch: 17, step: 606, loss: 0.35125699639320374, mean loss: 0.35741425335845695
Epoch: 17, step: 607, loss: 0.33950307965278625, mean loss: 0.35741354135441394
Epoch: 17, step: 608, loss: 0.33245912194252014, mean loss: 0.3574125494070668
Epoch: 17, step: 609, loss: 0.34641924500465393, mean loss: 0.3574121124365444
Epoch: 17, step: 610, loss: 0.32660388946533203, mean loss: 0.3574108878957053
Epoch: 17, step: 611, loss: 0.3086312711238861, mean loss: 0.357408949119204
Epoch: 17, step: 612, loss: 0.3270152807235718, mean loss: 0.3574077411517784
Epoch: 17, step: 613, loss: 0.35045358538627625, mean loss: 0.35740746477645985
Epoch: 17, step: 614, loss: 0.32842427492141724, mean loss: 0.35740631295871733
Epoch: 17, step: 615, loss: 0.33863565325737, mean loss: 0.3574055670256502
Epoch: 17, step: 616, loss: 0.36891335248947144, mean loss: 0.3574060243189331
Epoch: 17, step: 617, loss: 0.3192547559738159, mean loss: 0.357404508334337
Epoch: 17, step: 618, loss: 0.3108336329460144, mean loss: 0.3574026578604868
Epoch: 17, step: 619, loss: 0.3214357793331146, mean loss: 0.35740122878870806
Epoch: 17, step: 620, loss: 0.3103957176208496, mean loss: 0.3573993611932069
Epoch: 17, step: 621, loss: 0.39953991770744324, mean loss: 0.3574010354306529
Epoch: 17, step: 622, loss: 0.31554996967315674, mean loss: 0.3573993727606852
Epoch: 17, step: 623, loss: 0.30426672101020813, mean loss: 0.3573972619768082
Epoch: 17, step: 624, loss: 0.32980430126190186, mean loss: 0.35739616584362127
Epoch: 17, step: 625, loss: 0.37539783120155334, mean loss: 0.35739688093321204
Epoch: 17, step: 626, loss: 0.32320767641067505, mean loss: 0.35739552287146337
Epoch: 17, step: 627, loss: 0.3349686563014984, mean loss: 0.35739463206805655
Epoch: 17, step: 628, loss: 0.31488120555877686, mean loss: 0.357392943486156
Epoch: 17, step: 629, loss: 0.3559844195842743, mean loss: 0.35739288754351156
Epoch: 17, step: 630, loss: 0.3796526789665222, mean loss: 0.3573937716052862
Epoch: 17, step: 631, loss: 0.3309601843357086, mean loss: 0.35739272182024767
Epoch: 17, step: 632, loss: 0.348278671503067, mean loss: 0.35739235987869183
Epoch: 17, step: 633, loss: 0.3481832444667816, mean loss: 0.3573919941763881
Epoch: 17, step: 634, loss: 0.3120659291744232, mean loss: 0.35739019430881863
Epoch: 17, step: 635, loss: 0.3147788345813751, mean loss: 0.3573885023075588
Epoch: 17, step: 636, loss: 0.3560488820075989, mean loss: 0.3573884491163617
Epoch: 17, step: 637, loss: 0.3511303961277008, mean loss: 0.3573882006428848
Epoch: 17, step: 638, loss: 0.34302452206611633, mean loss: 0.3573876303614469
Epoch: 17, step: 639, loss: 0.33673471212387085, mean loss: 0.35738681041074666
Epoch: 17, step: 640, loss: 0.3505307137966156, mean loss: 0.3573865382246093
Epoch: 17, step: 641, loss: 0.30037635564804077, mean loss: 0.35738427501767894
Epoch: 17, step: 642, loss: 0.37240323424339294, mean loss: 0.35738487122105417
Epoch: 17, step: 643, loss: 0.366688996553421, mean loss: 0.35738524054962406
Epoch: 17, step: 644, loss: 0.40248286724090576, mean loss: 0.3573870306352308
Epoch: 17, step: 645, loss: 0.35452648997306824, mean loss: 0.357386917094679
Epoch: 17, step: 646, loss: 0.3555832505226135, mean loss: 0.35738684550640465
Epoch: 17, step: 647, loss: 0.32064682245254517, mean loss: 0.3573853873375265
Epoch: 17, step: 648, loss: 0.34655189514160156, mean loss: 0.3573849573858578
Epoch: 17, step: 649, loss: 0.37315618991851807, mean loss: 0.3573855832780926
Epoch: 17, step: 650, loss: 0.3038278818130493, mean loss: 0.357383457888138
Epoch: 17, step: 651, loss: 0.3597511947154999, mean loss: 0.3573835518459486
Epoch: 17, step: 652, loss: 0.32940635085105896, mean loss: 0.357382441683614
Epoch: 17, step: 653, loss: 0.3227323591709137, mean loss: 0.35738106678945825
Epoch: 17, step: 654, loss: 0.3294641077518463, mean loss: 0.3573799591054906
Epoch: 17, step: 655, loss: 0.37401145696640015, mean loss: 0.3573806189808223
Epoch: 17, step: 656, loss: 0.42662566900253296, mean loss: 0.3573833662551735
Epoch: 17, step: 657, loss: 0.3429868221282959, mean loss: 0.35738279509972926
Epoch: 17, step: 658, loss: 0.3065950870513916, mean loss: 0.35738078027416303
Epoch: 17, step: 659, loss: 0.3570661246776581, mean loss: 0.3573807677917925
Epoch: 17, step: 660, loss: 0.3364221751689911, mean loss: 0.3573799363985352
Epoch: 17, step: 661, loss: 0.34975796937942505, mean loss: 0.35737963405950235
Epoch: 17, step: 662, loss: 0.3267545998096466, mean loss: 0.357378419310613
Epoch: 17, step: 663, loss: 0.32085978984832764, mean loss: 0.3573769708483941
Epoch: 17, step: 664, loss: 0.359770804643631, mean loss: 0.3573770657928194
Epoch: 17, step: 665, loss: 0.3084692358970642, mean loss: 0.35737512608353506
Epoch: 17, step: 666, loss: 0.37769824266433716, mean loss: 0.3573759320766574
Epoch: 17, step: 667, loss: 0.35182833671569824, mean loss: 0.3573757120736688
Epoch: 17, step: 668, loss: 0.32973212003707886, mean loss: 0.35737461584525004
Epoch: 17, step: 669, loss: 0.2890572249889374, mean loss: 0.3573719067727282
Epoch: 17, step: 670, loss: 0.3398991525173187, mean loss: 0.3573712139318441
Epoch: 17, step: 671, loss: 0.33615854382514954, mean loss: 0.35737037282676454
Epoch: 17, step: 672, loss: 0.35354718565940857, mean loss: 0.35737022123931095
Epoch: 17, step: 673, loss: 0.33256515860557556, mean loss: 0.35736923777001295
Epoch: 17, step: 674, loss: 0.3450963497161865, mean loss: 0.3573687511947422
Epoch: 17, step: 675, loss: 0.34999680519104004, mean loss: 0.3573684589355445
Epoch: 17, step: 676, loss: 0.3377014696598053, mean loss: 0.3573676792729369
Epoch: 17, step: 677, loss: 0.34507161378860474, mean loss: 0.3573671918367407
Epoch: 17, step: 678, loss: 0.34904375672340393, mean loss: 0.35736686189520533
Epoch: 17, step: 679, loss: 0.35455846786499023, mean loss: 0.35736675057468725
Epoch: 17, step: 680, loss: 0.339182049036026, mean loss: 0.3573660297890224
Epoch: 17, step: 681, loss: 0.3299134075641632, mean loss: 0.35736494169460203
Epoch: 17, step: 682, loss: 0.3483075499534607, mean loss: 0.35736458271589566
Epoch: 17, step: 683, loss: 0.3374998867511749, mean loss: 0.35736379543403274
Epoch: 17, step: 684, loss: 0.32955411076545715, mean loss: 0.357362693318364
Epoch: 17, step: 685, loss: 0.320634663105011, mean loss: 0.3573612378206144
Epoch: 17, step: 686, loss: 0.2860485315322876, mean loss: 0.35735841187624
Epoch: 17, step: 687, loss: 0.3240602910518646, mean loss: 0.3573570924071948
Epoch: 17, step: 688, loss: 0.31147313117980957, mean loss: 0.35735527428454844
Epoch: 17, step: 689, loss: 0.3392910659313202, mean loss: 0.35735455853019576
Epoch: 17, step: 690, loss: 0.3351619839668274, mean loss: 0.35735367923329164
Epoch: 17, step: 691, loss: 0.4071390926837921, mean loss: 0.35735565171401473
Epoch: 17, step: 692, loss: 0.3314903676509857, mean loss: 0.3573546269810777
Epoch: 17, step: 693, loss: 0.3599841594696045, mean loss: 0.35735473115398353
Epoch: 17, step: 694, loss: 0.37412962317466736, mean loss: 0.35735539569037067
Epoch: 17, step: 695, loss: 0.33749663829803467, mean loss: 0.3573546090179973
Epoch: 17, step: 696, loss: 0.31616291403770447, mean loss: 0.35735297734063626
Epoch: 17, step: 697, loss: 0.33443164825439453, mean loss: 0.35735206942139813
Epoch: 17, step: 698, loss: 0.3049823045730591, mean loss: 0.35734999512485405
Epoch: 17, step: 699, loss: 0.3323226571083069, mean loss: 0.35734900386463475
Epoch: 17, step: 700, loss: 0.3359020948410034, mean loss: 0.3573481544484589
Epoch: 17, step: 701, loss: 0.3301565647125244, mean loss: 0.3573470775538159
Epoch: 17, step: 702, loss: 0.34055328369140625, mean loss: 0.35734641247940846
Epoch: 17, step: 703, loss: 0.3357791304588318, mean loss: 0.35734555839727555
Epoch: 17, step: 704, loss: 0.3288009762763977, mean loss: 0.35734442805307404
Epoch: 17, step: 705, loss: 0.36179810762405396, mean loss: 0.35734460440848587
Epoch: 17, step: 706, loss: 0.3281745910644531, mean loss: 0.35734344938914936
Epoch: 17, step: 707, loss: 0.32383519411087036, mean loss: 0.35734212264480036
Epoch: 17, step: 708, loss: 0.3424098491668701, mean loss: 0.35734153143153363
Epoch: 17, step: 709, loss: 0.3511247932910919, mean loss: 0.35734128530206416
Epoch: 17, step: 710, loss: 0.34174078702926636, mean loss: 0.35734066768069067
Epoch: 17, step: 711, loss: 0.3625742197036743, mean loss: 0.35734087486802335
Epoch: 17, step: 712, loss: 0.3767026662826538, mean loss: 0.35734164133773616
Epoch: 17, step: 713, loss: 0.37531623244285583, mean loss: 0.35734235286457905
Epoch: 17, step: 714, loss: 0.3298128843307495, mean loss: 0.3573412631496389
Epoch: 17, step: 715, loss: 0.31886357069015503, mean loss: 0.35733974012507985
Epoch: 17, step: 716, loss: 0.3163452446460724, mean loss: 0.35733811754461364
Epoch: 17, step: 717, loss: 0.32897868752479553, mean loss: 0.3573369951101159
Epoch: 17, step: 718, loss: 0.33004438877105713, mean loss: 0.3573359149420572
Epoch: 17, step: 719, loss: 0.3095824420452118, mean loss: 0.35733402506264855
Epoch: 17, step: 720, loss: 0.3596801459789276, mean loss: 0.3573341179084642
Epoch: 17, step: 721, loss: 0.3488195836544037, mean loss: 0.3573337809660719
Epoch: 17, step: 722, loss: 0.3639366924762726, mean loss: 0.3573340422502122
Epoch: 17, step: 723, loss: 0.3001108169555664, mean loss: 0.35733177795671367
Epoch: 17, step: 724, loss: 0.36611035466194153, mean loss: 0.3573321253067198
Epoch: 17, step: 725, loss: 0.3028281629085541, mean loss: 0.35732996878371603
Epoch: 17, step: 726, loss: 0.3203749656677246, mean loss: 0.35732850666687666
Epoch: 17, step: 727, loss: 0.33091893792152405, mean loss: 0.3573274618192447
Epoch: 17, step: 728, loss: 0.3201541006565094, mean loss: 0.3573259911794867
Epoch: 17, step: 729, loss: 0.3407822251319885, mean loss: 0.3573253367065835
Epoch: 17, step: 730, loss: 0.3242206871509552, mean loss: 0.3573240271354155
Epoch: 17, step: 731, loss: 0.3782973885536194, mean loss: 0.3573248567778767
Epoch: 17, step: 732, loss: 0.34673210978507996, mean loss: 0.3573244377775605
Epoch: 17, step: 733, loss: 0.35314661264419556, mean loss: 0.35732427252856386
Epoch: 17, step: 734, loss: 0.35422784090042114, mean loss: 0.35732415005766927
Epoch: 17, step: 735, loss: 0.3385954201221466, mean loss: 0.35732340932321527
Epoch: 17, step: 736, loss: 0.33585771918296814, mean loss: 0.35732256037363486
Epoch: 17, step: 737, loss: 0.38150349259376526, mean loss: 0.35732351667088313
Epoch: 17, step: 738, loss: 0.3012267053127289, mean loss: 0.35732129826572007
Epoch: 17, step: 739, loss: 0.31446558237075806, mean loss: 0.35731960356009307
Epoch: 17, step: 740, loss: 0.3462198078632355, mean loss: 0.3573191646421565
Epoch: 17, step: 741, loss: 0.3239096403121948, mean loss: 0.3573178435854412
Epoch: 17, step: 742, loss: 0.308056503534317, mean loss: 0.35731589580401496
Epoch: 17, step: 743, loss: 0.33461299538612366, mean loss: 0.35731499817233625
Epoch: 17, step: 744, loss: 0.35099124908447266, mean loss: 0.357314748152604
Epoch: 17, step: 745, loss: 0.3563411831855774, mean loss: 0.3573147096626472
Epoch: 17, step: 746, loss: 0.356534868478775, mean loss: 0.35731467883279217
Epoch: 17, step: 747, loss: 0.31132757663726807, mean loss: 0.3573128608733442
Epoch: 17, step: 748, loss: 0.34662389755249023, mean loss: 0.357312438334572
Epoch: 17, step: 749, loss: 0.30610397458076477, mean loss: 0.3573104141246046
Epoch: 17, step: 750, loss: 0.3222956955432892, mean loss: 0.35730903008892806
Epoch: 17, step: 751, loss: 0.35464224219322205, mean loss: 0.35730892468229186
Epoch: 17, step: 752, loss: 0.2967110574245453, mean loss: 0.3573065296043401
Epoch: 17, step: 753, loss: 0.3317873477935791, mean loss: 0.35730552102075736
Epoch: 17, step: 754, loss: 0.34061944484710693, mean loss: 0.35730486157025054
Epoch: 17, step: 755, loss: 0.3887229561805725, mean loss: 0.3573061031958675
Epoch: 17, step: 756, loss: 0.3707835078239441, mean loss: 0.3573066357943511
Epoch: 17, step: 757, loss: 0.3088882863521576, mean loss: 0.3573047224793491
Epoch: 17, step: 758, loss: 0.3558827340602875, mean loss: 0.3573046662898197
Epoch: 17, step: 759, loss: 0.3247970938682556, mean loss: 0.35730338181169335
Epoch: 17, step: 760, loss: 0.32214590907096863, mean loss: 0.3573019926824215
Epoch: 17, step: 761, loss: 0.36049365997314453, mean loss: 0.3573021187854358
Epoch: 17, step: 762, loss: 0.31878241896629333, mean loss: 0.3573005969293329
Epoch: 17, step: 763, loss: 0.34658074378967285, mean loss: 0.35730017342059633
Epoch: 17, step: 764, loss: 0.33314287662506104, mean loss: 0.35729921907710505
Epoch: 17, step: 765, loss: 0.3234013020992279, mean loss: 0.357297879979492
Epoch: 17, step: 766, loss: 0.31259310245513916, mean loss: 0.3572961140392382
Epoch: 17, step: 767, loss: 0.33535557985305786, mean loss: 0.35729524737253787
Epoch: 17, step: 768, loss: 0.303333580493927, mean loss: 0.3572931159325221
Epoch: 17, step: 769, loss: 0.308150053024292, mean loss: 0.3572911748999402
Epoch: 17, step: 770, loss: 0.3245025873184204, mean loss: 0.3572898798808802
Epoch: 17, step: 771, loss: 0.32122278213500977, mean loss: 0.35728845542994236
Epoch: 17, step: 772, loss: 0.3907551169395447, mean loss: 0.3572897771258276
Epoch: 17, step: 773, loss: 0.30606311559677124, mean loss: 0.35728775411573643
Epoch: 17, step: 774, loss: 0.34626054763793945, mean loss: 0.3572873186536475
Epoch: 17, step: 775, loss: 0.3019631505012512, mean loss: 0.35728513400003226
Epoch: 17, step: 776, loss: 0.31037238240242004, mean loss: 0.35728328157153877
Epoch: 17, step: 777, loss: 0.3210614323616028, mean loss: 0.35728185134768936
Epoch: 17, step: 778, loss: 0.37400728464126587, mean loss: 0.3572825117272564
Epoch: 17, step: 779, loss: 0.33100590109825134, mean loss: 0.35728147427421514
Epoch: 17, step: 780, loss: 0.3883403539657593, mean loss: 0.3572827004923719
Epoch: 17, step: 781, loss: 0.34729018807411194, mean loss: 0.3572823059991852
Epoch: 17, step: 782, loss: 0.36527955532073975, mean loss: 0.35728262170915803
Epoch: 17, step: 783, loss: 0.32075193524360657, mean loss: 0.35728117963247774
Epoch: 17, step: 784, loss: 0.34054335951805115, mean loss: 0.3572805189203586
Epoch: 17, step: 785, loss: 0.39221763610839844, mean loss: 0.3572818979807987
Epoch: 17, step: 786, loss: 0.3332580626010895, mean loss: 0.357280949733892
Epoch: 17, step: 787, loss: 0.30528977513313293, mean loss: 0.3572788976666912
Epoch: 17, step: 788, loss: 0.3174275755882263, mean loss: 0.35727732481583757
Epoch: 17, step: 789, loss: 0.3439435362815857, mean loss: 0.357276798579018
Epoch: 17, step: 790, loss: 0.36203932762145996, mean loss: 0.35727698653154344
Epoch: 17, step: 791, loss: 0.33767837285995483, mean loss: 0.35727621310558955
Epoch: 17, step: 792, loss: 0.32413798570632935, mean loss: 0.35727490541341483
Epoch: 17, step: 793, loss: 0.36157456040382385, mean loss: 0.3572750750785948
Epoch: 17, step: 794, loss: 0.4008290469646454, mean loss: 0.3572767936585532
Epoch: 17, step: 795, loss: 0.3429066836833954, mean loss: 0.3572762266561078
Epoch: 17, step: 796, loss: 0.3513611853122711, mean loss: 0.3572759932751118
Epoch: 17, step: 797, loss: 0.3500155806541443, mean loss: 0.3572757068231027
Epoch: 17, step: 798, loss: 0.3319630026817322, mean loss: 0.3572747081761567
Epoch: 17, step: 799, loss: 0.37007108330726624, mean loss: 0.3572752130039589
Epoch: 17, step: 800, loss: 0.31210166215896606, mean loss: 0.35727343093954433
Epoch: 17, step: 801, loss: 0.3591791093349457, mean loss: 0.3572735061142345
Epoch: 17, step: 802, loss: 0.33786478638648987, mean loss: 0.3572727405144661
Epoch: 17, step: 803, loss: 0.3128533363342285, mean loss: 0.3572709884079585
Epoch: 17, step: 804, loss: 0.3016766905784607, mean loss: 0.35726879559851465
Epoch: 17, step: 805, loss: 0.32868656516075134, mean loss: 0.3572676682722372
Epoch: 17, step: 806, loss: 0.309323787689209, mean loss: 0.3572657773678561
Epoch: 17, step: 807, loss: 0.30511611700057983, mean loss: 0.35726372066883544
Epoch: 17, step: 808, loss: 0.31061217188835144, mean loss: 0.3572618808790819
Epoch: 17, step: 809, loss: 0.35744771361351013, mean loss: 0.35726188820744903
Epoch: 17, step: 810, loss: 0.31735485792160034, mean loss: 0.3572603145243272
Epoch: 17, step: 811, loss: 0.3491485118865967, mean loss: 0.3572599946582926
Epoch: 17, step: 812, loss: 0.3670274019241333, mean loss: 0.35726037979323466
Epoch: 17, step: 813, loss: 0.28531205654144287, mean loss: 0.35725754293796885
Epoch: 17, step: 814, loss: 0.3188364505767822, mean loss: 0.35725602808986884
Epoch: 17, step: 815, loss: 0.3519231975078583, mean loss: 0.35725581783791405
Epoch: 17, step: 816, loss: 0.3214854300022125, mean loss: 0.3572544076117033
Epoch: 17, step: 817, loss: 0.33908894658088684, mean loss: 0.3572536914774673
Epoch: 17, step: 818, loss: 0.34549885988235474, mean loss: 0.3572532280867788
Epoch: 17, step: 819, loss: 0.32470154762268066, mean loss: 0.35725194490795253
Epoch: 17, step: 820, loss: 0.3469294607639313, mean loss: 0.35725153801433657
Epoch: 17, step: 821, loss: 0.35060742497444153, mean loss: 0.3572512761257658
Epoch: 17, step: 822, loss: 0.35491374135017395, mean loss: 0.3572511839916451
Epoch: 17, step: 823, loss: 0.3223780691623688, mean loss: 0.35724980951920193
Epoch: 17, step: 824, loss: 0.32573115825653076, mean loss: 0.3572485673069581
Epoch: 17, step: 825, loss: 0.3493206799030304, mean loss: 0.35724825486558487
Epoch: 17, step: 826, loss: 0.3497202396392822, mean loss: 0.3572479581950341
Epoch: 17, step: 827, loss: 0.35629838705062866, mean loss: 0.35724792077498585
Epoch: 17, step: 828, loss: 0.35796308517456055, mean loss: 0.35724794895658335
Epoch: 17, step: 829, loss: 0.3206174671649933, mean loss: 0.35724650556144616
Epoch: 17, step: 830, loss: 0.34477224946022034, mean loss: 0.3572460140426274
Epoch: 17, step: 831, loss: 0.3514699935913086, mean loss: 0.3572457864610493
Epoch: 17, step: 832, loss: 0.33215466141700745, mean loss: 0.35724479788199237
Epoch: 17, step: 833, loss: 0.31993961334228516, mean loss: 0.3572433281323848
Epoch: 17, step: 834, loss: 0.30801355838775635, mean loss: 0.35724138865439775
Epoch: 17, step: 835, loss: 0.31000474095344543, mean loss: 0.35723952777164875
Epoch: 17, step: 836, loss: 0.3023566007614136, mean loss: 0.35723736574970627
Epoch: 17, step: 837, loss: 0.37582269310951233, mean loss: 0.35723809785903266
Epoch: 17, step: 838, loss: 0.33344390988349915, mean loss: 0.35723716060027916
Epoch: 17, step: 839, loss: 0.32522639632225037, mean loss: 0.3572358997382862
Epoch: 17, step: 840, loss: 0.33904483914375305, mean loss: 0.35723518324450565
Epoch: 17, step: 841, loss: 0.3216562271118164, mean loss: 0.35723378194650907
Epoch: 17, step: 842, loss: 0.3602192997932434, mean loss: 0.3572338995282446
Epoch: 17, step: 843, loss: 0.3348519504070282, mean loss: 0.35723301807152114
Epoch: 17, step: 844, loss: 0.31800904870033264, mean loss: 0.35723147339506023
Epoch: 17, step: 845, loss: 0.3326634168624878, mean loss: 0.35723050592020267
Epoch: 17, step: 846, loss: 0.3109024465084076, mean loss: 0.3572286816217419
Epoch: 17, step: 847, loss: 0.3221665620803833, mean loss: 0.35722730100591493
Epoch: 17, step: 848, loss: 0.3286330997943878, mean loss: 0.35722617511698274
Epoch: 17, step: 849, loss: 0.31927788257598877, mean loss: 0.3572246809720681
Epoch: 17, step: 850, loss: 0.2980405390262604, mean loss: 0.35722235079600034
Epoch: 17, step: 851, loss: 0.3528759479522705, mean loss: 0.35722217967777814
Epoch: 17, step: 852, loss: 0.3401494324207306, mean loss: 0.3572215075488361
Epoch: 17, step: 853, loss: 0.3317246735095978, mean loss: 0.35722050381550646
Epoch: 17, step: 854, loss: 0.32995015382766724, mean loss: 0.3572194303064726
Epoch: 17, step: 855, loss: 0.31875184178352356, mean loss: 0.35721791607294545
Epoch: 17, step: 856, loss: 0.33271560072898865, mean loss: 0.357216951604717
Epoch: 17, step: 857, loss: 0.3180781900882721, mean loss: 0.35721541107249954
Epoch: 17, step: 858, loss: 0.2931565046310425, mean loss: 0.35721288976315796
Epoch: 17, step: 859, loss: 0.32130444049835205, mean loss: 0.35721147648980844
Epoch: 17, step: 860, loss: 0.34164443612098694, mean loss: 0.3572108638312871
Epoch: 17, step: 861, loss: 0.37168189883232117, mean loss: 0.3572114333328613
Epoch: 17, step: 862, loss: 0.32454967498779297, mean loss: 0.35721014799350653
Epoch: 17, step: 863, loss: 0.3244890570640564, mean loss: 0.3572088603699063
Epoch: 17, step: 864, loss: 0.30839574337005615, mean loss: 0.35720693957672955
Epoch: 17, step: 865, loss: 0.3245498538017273, mean loss: 0.35720565457296094
Epoch: 17, step: 866, loss: 0.3404780924320221, mean loss: 0.3572049963962094
Epoch: 17, step: 867, loss: 0.32095852494239807, mean loss: 0.3572035702681226
Epoch: 17, step: 868, loss: 0.2935276925563812, mean loss: 0.3572010650205438
Epoch: 17, step: 869, loss: 0.3830779194831848, mean loss: 0.3572020830728871
Epoch: 17, step: 870, loss: 0.32362452149391174, mean loss: 0.35720076210976587
Epoch: 17, step: 871, loss: 0.3512374758720398, mean loss: 0.35720052751943393
Epoch: 17, step: 872, loss: 0.3271891474723816, mean loss: 0.35719934694510375
Epoch: 17, step: 873, loss: 0.3194470703601837, mean loss: 0.35719786192124314
Epoch: 17, step: 874, loss: 0.3311825394630432, mean loss: 0.3571968386225586
Epoch: 17, step: 875, loss: 0.3629366457462311, mean loss: 0.3571970643858973
Epoch: 17, step: 876, loss: 0.3178468942642212, mean loss: 0.357195516689924
Epoch: 17, step: 877, loss: 0.37002313137054443, mean loss: 0.3571960211976987
Epoch: 17, step: 878, loss: 0.3127155601978302, mean loss: 0.3571942718579811
Epoch: 17, step: 879, loss: 0.3043845295906067, mean loss: 0.35719219502369337
Epoch: 17, step: 880, loss: 0.31368303298950195, mean loss: 0.3571904840180685
Epoch: 17, step: 881, loss: 0.28896868228912354, mean loss: 0.35718780128894034
Epoch: 17, step: 882, loss: 0.30585941672325134, mean loss: 0.35718578294972575
Epoch: 17, step: 883, loss: 0.35806888341903687, mean loss: 0.357185817673714
Epoch: 17, step: 884, loss: 0.4019598662853241, mean loss: 0.3571875781443078
Epoch: 17, step: 885, loss: 0.3857171833515167, mean loss: 0.3571886998556079
Epoch: 17, step: 886, loss: 0.3149394989013672, mean loss: 0.35718703879010943
Epoch: 17, step: 887, loss: 0.3661038279533386, mean loss: 0.35718738934794725
Epoch: 17, step: 888, loss: 0.27979031205177307, mean loss: 0.35718434665119464
Epoch: 17, step: 889, loss: 0.33287498354911804, mean loss: 0.35718339101934066
Epoch: 17, step: 890, loss: 0.3083673417568207, mean loss: 0.3571814720740495
Epoch: 17, step: 891, loss: 0.31642070412635803, mean loss: 0.357179869842605
Epoch: 17, step: 892, loss: 0.34147343039512634, mean loss: 0.3571792524753849
Epoch: 17, step: 893, loss: 0.3311064839363098, mean loss: 0.3571782276829732
Epoch: 17, step: 894, loss: 0.34061214327812195, mean loss: 0.35717757657719146
Epoch: 17, step: 895, loss: 0.3386061489582062, mean loss: 0.3571768466830074
Epoch: 17, step: 896, loss: 0.3818824291229248, mean loss: 0.3571778176235631
Epoch: 17, step: 897, loss: 0.34279197454452515, mean loss: 0.3571772522756468
Epoch: 17, step: 898, loss: 0.3394377529621124, mean loss: 0.3571765551601002
Epoch: 17, step: 899, loss: 0.3063219487667084, mean loss: 0.3571745567866959
Epoch: 17, step: 900, loss: 0.3320631682872772, mean loss: 0.357173570052895
Epoch: 17, step: 901, loss: 0.3608742356300354, mean loss: 0.3571737154621515
Epoch: 17, step: 902, loss: 0.2971978485584259, mean loss: 0.35717135893915025
Epoch: 17, step: 903, loss: 0.34774672985076904, mean loss: 0.3571709886488356
Epoch: 17, step: 904, loss: 0.35921943187713623, mean loss: 0.3571710691282773
Epoch: 17, step: 905, loss: 0.3413810133934021, mean loss: 0.35717044879136617
Epoch: 17, step: 906, loss: 0.34097903966903687, mean loss: 0.35716981271165205
Epoch: 17, step: 907, loss: 0.33881905674934387, mean loss: 0.3571690918302896
Epoch: 17, step: 908, loss: 0.34519317746162415, mean loss: 0.35716862139330297
Epoch: 17, step: 909, loss: 0.3212054371833801, mean loss: 0.3571672087456398
Epoch: 17, step: 910, loss: 0.3398311138153076, mean loss: 0.3571665278039323
Epoch: 17, step: 911, loss: 0.3289659023284912, mean loss: 0.3571654201595696
Epoch: 17, step: 912, loss: 0.3086830973625183, mean loss: 0.3571635159797339
Epoch: 17, step: 913, loss: 0.3456704914569855, mean loss: 0.35716306460024594
Epoch: 17, step: 914, loss: 0.32276198267936707, mean loss: 0.3571617135779029
Epoch: 17, step: 915, loss: 0.3874197006225586, mean loss: 0.3571629018431811
Epoch: 17, step: 916, loss: 0.32557937502861023, mean loss: 0.35716166157116797
Epoch: 17, step: 917, loss: 0.3004230558872223, mean loss: 0.35715943355712243
Epoch: 17, step: 918, loss: 0.32829663157463074, mean loss: 0.3571583002158579
Epoch: 17, step: 919, loss: 0.35109901428222656, mean loss: 0.35715806229823843
Epoch: 17, step: 920, loss: 0.32010987401008606, mean loss: 0.3571566076597254
Epoch: 17, step: 921, loss: 0.3397558927536011, mean loss: 0.35715592447500194
Epoch: 17, step: 922, loss: 0.332243412733078, mean loss: 0.3571549464014382
Epoch: 17, step: 923, loss: 0.33515867590904236, mean loss: 0.3571540828543868
Epoch: 17, step: 924, loss: 0.3420991897583008, mean loss: 0.357153491840643
Epoch: 17, step: 925, loss: 0.34475472569465637, mean loss: 0.35715300511825365
Epoch: 17, step: 926, loss: 0.37563028931617737, mean loss: 0.35715373042872267
Epoch: 17, step: 927, loss: 0.3152320384979248, mean loss: 0.3571520848920634
Epoch: 17, step: 928, loss: 0.37282830476760864, mean loss: 0.35715270020076834
Epoch: 17, step: 929, loss: 0.3266448974609375, mean loss: 0.3571515027832811
Epoch: 17, step: 930, loss: 0.31601014733314514, mean loss: 0.3571498880670265
Epoch: 17, step: 931, loss: 0.3311687707901001, mean loss: 0.3571488683999434
Epoch: 17, step: 932, loss: 0.2911970317363739, mean loss: 0.3571462801248889
Epoch: 17, step: 933, loss: 0.31919625401496887, mean loss: 0.35714479083730905
Epoch: 17, step: 934, loss: 0.3475915193557739, mean loss: 0.35714441594928636
Epoch: 17, step: 935, loss: 0.31803470849990845, mean loss: 0.3571428812723342
Epoch: 17, step: 936, loss: 0.34980687499046326, mean loss: 0.35714259341648635
Epoch: 17, step: 937, loss: 0.32048165798187256, mean loss: 0.35714115494299364
Epoch: 17, step: 938, loss: 0.32707443833351135, mean loss: 0.357139975254658
Epoch: 17, step: 939, loss: 0.32389405369758606, mean loss: 0.3571386708792046
Epoch: 17, step: 940, loss: 0.3024083971977234, mean loss: 0.3571365236677141
Epoch: 17, step: 941, loss: 0.36876070499420166, mean loss: 0.35713697969679714
Epoch: 17, step: 942, loss: 0.3428798019886017, mean loss: 0.35713642039438814
Epoch: 17, step: 943, loss: 0.35338497161865234, mean loss: 0.35713627323258146
Epoch: 17, step: 944, loss: 0.3534853458404541, mean loss: 0.3571361300196449
Epoch: 17, step: 945, loss: 0.3072890341281891, mean loss: 0.3571341747715123
Epoch: 17, step: 946, loss: 0.40125057101249695, mean loss: 0.3571359051655598
Epoch: 17, step: 947, loss: 0.3365488052368164, mean loss: 0.3571350977016467
Epoch: 17, step: 948, loss: 0.3115633428096771, mean loss: 0.3571333103637288
Epoch: 17, step: 949, loss: 0.34415698051452637, mean loss: 0.3571328014481335
Epoch: 17, step: 950, loss: 0.30765506625175476, mean loss: 0.3571308610686991
Epoch: 17, step: 951, loss: 0.33079463243484497, mean loss: 0.3571298282754194
Epoch: 17, step: 952, loss: 0.34789592027664185, mean loss: 0.3571294661755802
Epoch: 17, step: 953, loss: 0.37695977091789246, mean loss: 0.35713024377360164
Epoch: 17, step: 954, loss: 0.326107919216156, mean loss: 0.3571290273549624
Epoch: 17, step: 955, loss: 0.32704389095306396, mean loss: 0.3571278477307308
Epoch: 17, step: 956, loss: 0.3365391790866852, mean loss: 0.3571270404902429
Epoch: 17, step: 957, loss: 0.33887434005737305, mean loss: 0.35712632486645113
Epoch: 17, step: 958, loss: 0.3379077613353729, mean loss: 0.3571255714041258
Epoch: 17, step: 959, loss: 0.3567999005317688, mean loss: 0.3571255586367245
Epoch: 17, step: 960, loss: 0.3070068359375, mean loss: 0.35712359389005865
Epoch: 17, step: 961, loss: 0.310151606798172, mean loss: 0.3571217525734341
Epoch: 17, step: 962, loss: 0.2954164743423462, mean loss: 0.3571193338019931
Epoch: 17, step: 963, loss: 0.3051539361476898, mean loss: 0.3571172969018028
Epoch: 17, step: 964, loss: 0.325430691242218, mean loss: 0.3571160549229819
Epoch: 17, step: 965, loss: 0.32734718918800354, mean loss: 0.35711488815705983
Epoch: 17, step: 966, loss: 0.2974534332752228, mean loss: 0.35711254986762686
Epoch: 17, step: 967, loss: 0.34904274344444275, mean loss: 0.3571122336030704
Epoch: 17, step: 968, loss: 0.3532995581626892, mean loss: 0.3571120841859978
Epoch: 17, step: 969, loss: 0.3582145869731903, mean loss: 0.35711212739090364
Epoch: 17, step: 970, loss: 0.30176037549972534, mean loss: 0.3571099583501148
Epoch: 17, step: 971, loss: 0.34034958481788635, mean loss: 0.357109301595666
Epoch: 17, step: 972, loss: 0.3215193450450897, mean loss: 0.35710790705953693
Epoch: 17, step: 973, loss: 0.36194702982902527, mean loss: 0.3571080966654757
Epoch: 17, step: 974, loss: 0.365962952375412, mean loss: 0.3571084436017963
Epoch: 17, step: 975, loss: 0.3351345360279083, mean loss: 0.3571075826902004
Epoch: 17, step: 976, loss: 0.3326301872730255, mean loss: 0.35710662373249547
Epoch: 17, step: 977, loss: 0.3052661418914795, mean loss: 0.357104592843134
Epoch: 17, step: 978, loss: 0.34240421652793884, mean loss: 0.35710401696753896
Epoch: 17, step: 979, loss: 0.3148149847984314, mean loss: 0.3571023603931043
Epoch: 17, step: 980, loss: 0.32823777198791504, mean loss: 0.3571012297343082
Epoch: 17, step: 981, loss: 0.33785274624824524, mean loss: 0.357100475778825
Epoch: 17, step: 982, loss: 0.312240868806839, mean loss: 0.3570987187145904
Epoch: 17, step: 983, loss: 0.3270629346370697, mean loss: 0.3570975423169687
Epoch: 17, step: 984, loss: 0.3299809694290161, mean loss: 0.3570964802963332
Epoch: 17, step: 985, loss: 0.33593007922172546, mean loss: 0.35709565134665533
Epoch: 17, step: 986, loss: 0.37857359647750854, mean loss: 0.3570964924645379
Epoch: 17, step: 987, loss: 0.39802220463752747, mean loss: 0.3570980951318379
Epoch: 17, step: 988, loss: 0.327125608921051, mean loss: 0.3570969214432209
Epoch: 17, step: 989, loss: 0.3986872434616089, mean loss: 0.35709855000935836
Epoch: 17, step: 990, loss: 0.3533749282360077, mean loss: 0.35709840420796546
Epoch: 17, step: 991, loss: 0.3420664668083191, mean loss: 0.3570978156434627
Epoch: 17, step: 992, loss: 0.3242972493171692, mean loss: 0.3570965314115874
Epoch: 17, step: 993, loss: 0.33045685291290283, mean loss: 0.35709548843615485
Epoch: 17, step: 994, loss: 0.3311421275138855, mean loss: 0.3570944723706605
Epoch: 17, step: 995, loss: 0.34342676401138306, mean loss: 0.35709393730534733
Epoch: 17, step: 996, loss: 0.33856454491615295, mean loss: 0.3570932119425605
Epoch: 17, step: 997, loss: 0.3320973515510559, mean loss: 0.3570922334778149
Epoch: 17, step: 998, loss: 0.3399876654148102, mean loss: 0.3570915639444817
Epoch: 17, step: 999, loss: 0.3516210615634918, mean loss: 0.35709134981803814
Epoch: 17, step: 1000, loss: 0.32030102610588074, mean loss: 0.35708990982728656
Epoch: 17, step: 1001, loss: 0.3445439636707306, mean loss: 0.35708941879221195
Epoch: 17, step: 1002, loss: 0.31042230129241943, mean loss: 0.3570875923620331
Epoch: 17, step: 1003, loss: 0.34225988388061523, mean loss: 0.35708701206661664
Epoch: 17, step: 1004, loss: 0.3802991211414337, mean loss: 0.35708792045737603
Epoch: 17, step: 1005, loss: 0.34729495644569397, mean loss: 0.35708753723110964
Epoch: 17, step: 1006, loss: 0.3336085081100464, mean loss: 0.35708661846651873
Epoch: 17, step: 1007, loss: 0.32996854186058044, mean loss: 0.35708555734284503
Epoch: 17, step: 1008, loss: 0.3663334846496582, mean loss: 0.3570859191978087
Epoch: 17, step: 1009, loss: 0.3583846092224121, mean loss: 0.3570859700112536
Epoch: 17, step: 1010, loss: 0.32770416140556335, mean loss: 0.3570848204432499
Epoch: 17, step: 1011, loss: 0.3206881880760193, mean loss: 0.35708339647484744
Epoch: 17, step: 1012, loss: 0.35888227820396423, mean loss: 0.35708346685087844
Epoch: 17, step: 1013, loss: 0.3022279739379883, mean loss: 0.35708132087275024
Epoch: 17, step: 1014, loss: 0.31997063755989075, mean loss: 0.3570798691384736
Epoch: 17, step: 1015, loss: 0.304123193025589, mean loss: 0.3570777976052193
Epoch: 17, step: 1016, loss: 0.33652329444885254, mean loss: 0.357076993595708
Epoch: 17, step: 1017, loss: 0.3501015901565552, mean loss: 0.35707672075664676
Epoch: 17, step: 1018, loss: 0.32007837295532227, mean loss: 0.3570752736432662
Epoch: 17, step: 1019, loss: 0.31055229902267456, mean loss: 0.3570734540650974
Epoch: 17, step: 1020, loss: 0.3306463658809662, mean loss: 0.357072420505389
Epoch: 17, step: 1021, loss: 0.3489591181278229, mean loss: 0.3570721032076816
Epoch: 17, step: 1022, loss: 0.3084808588027954, mean loss: 0.35707020295957226
Epoch: 17, step: 1023, loss: 0.3293567895889282, mean loss: 0.35706911921902124
Epoch: 17, step: 1024, loss: 0.33589205145835876, mean loss: 0.35706829111642235
Epoch: 17, step: 1025, loss: 0.3405570983886719, mean loss: 0.35706764549224435
Epoch: 17, step: 1026, loss: 0.3295348584651947, mean loss: 0.35706656894143196
Epoch: 17, step: 1027, loss: 0.3202158510684967, mean loss: 0.3570651281094851
Epoch: 17, step: 1028, loss: 0.3032509982585907, mean loss: 0.357063024104721
Epoch: 17, step: 1029, loss: 0.3318101465702057, mean loss: 0.35706203681574084
Epoch: 17, step: 1030, loss: 0.35292503237724304, mean loss: 0.3570618750813322
Epoch: 17, step: 1031, loss: 0.31135109066963196, mean loss: 0.357060088107743
Epoch: 17, step: 1032, loss: 0.3208197057247162, mean loss: 0.3570586714163555
Epoch: 17, step: 1033, loss: 0.3471865952014923, mean loss: 0.3570582855170429
Epoch: 17, step: 1034, loss: 0.32977643609046936, mean loss: 0.35705721911163985
Epoch: 17, step: 1035, loss: 0.32949158549308777, mean loss: 0.3570561416556666
Epoch: 17, step: 1036, loss: 0.3193456828594208, mean loss: 0.35705466772724
Epoch: 17, step: 1037, loss: 0.3268626034259796, mean loss: 0.3570534877044032
Epoch: 17, step: 1038, loss: 0.3038761615753174, mean loss: 0.35705140940971725
Epoch: 17, step: 1039, loss: 0.32993510365486145, mean loss: 0.35705034968227645
Epoch: 17, step: 1040, loss: 0.3386147618293762, mean loss: 0.35704962923255773
Epoch: 17, step: 1041, loss: 0.358115017414093, mean loss: 0.35704967086554645
Epoch: 17, step: 1042, loss: 0.33788588643074036, mean loss: 0.3570489220169499
Epoch: 17, step: 1043, loss: 0.3447611331939697, mean loss: 0.35704844187515467
Epoch: 17, step: 1044, loss: 0.3515278100967407, mean loss: 0.357048226166493
Epoch: 17, step: 1045, loss: 0.3229887783527374, mean loss: 0.35704689540741613
Epoch: 17, step: 1046, loss: 0.2855505645275116, mean loss: 0.35704410203641085
Epoch: 17, step: 1047, loss: 0.327298104763031, mean loss: 0.35704293990180885
Epoch: 17, step: 1048, loss: 0.39479440450668335, mean loss: 0.3570444147412277
Epoch: 17, step: 1049, loss: 0.34266138076782227, mean loss: 0.3570438528600662
Epoch: 17, step: 1050, loss: 0.31863102316856384, mean loss: 0.35704235230029074
Epoch: 17, step: 1051, loss: 0.3126698136329651, mean loss: 0.35704061899799905
Epoch: 17, step: 1052, loss: 0.38358989357948303, mean loss: 0.357041656038528
Epoch: 17, step: 1053, loss: 0.3516363501548767, mean loss: 0.3570414449102613
Epoch: 17, step: 1054, loss: 0.37431469559669495, mean loss: 0.3570421195675548
Epoch: 17, step: 1055, loss: 0.3219619393348694, mean loss: 0.35704074946209347
Epoch: 17, step: 1056, loss: 0.3049064576625824, mean loss: 0.35703871336399545
Epoch: 17, step: 1057, loss: 0.360333114862442, mean loss: 0.3570388420213999
Epoch: 17, step: 1058, loss: 0.32046985626220703, mean loss: 0.35703741393588584
Epoch: 17, step: 1059, loss: 0.3072618246078491, mean loss: 0.35703547018435006
Epoch: 17, step: 1060, loss: 0.3570972681045532, mean loss: 0.357035472597483
Epoch: 17, step: 1061, loss: 0.30151674151420593, mean loss: 0.35703330474386785
Epoch: 17, step: 1062, loss: 0.3142077922821045, mean loss: 0.35703163259079057
Epoch: 17, step: 1063, loss: 0.33764997124671936, mean loss: 0.3570308758493669
Epoch: 17, step: 1064, loss: 0.33821800351142883, mean loss: 0.3570301413445319
Epoch: 17, step: 1065, loss: 0.3119297921657562, mean loss: 0.3570283805750629
Epoch: 17, step: 1066, loss: 0.4304252564907074, mean loss: 0.35703124596159097
Epoch: 17, step: 1067, loss: 0.3764955997467041, mean loss: 0.3570320058130036
Epoch: 17, step: 1068, loss: 0.3656747043132782, mean loss: 0.35703234319437144
Epoch: 17, step: 1069, loss: 0.3116095960140228, mean loss: 0.3570305701150061
Epoch: 17, step: 1070, loss: 0.331836074590683, mean loss: 0.3570295866849142
Epoch: 17, step: 1071, loss: 0.34091246128082275, mean loss: 0.35702895760117476
Epoch: 17, step: 1072, loss: 0.33366087079048157, mean loss: 0.35702804553346423
Epoch: 17, step: 1073, loss: 0.3622850775718689, mean loss: 0.3570282507099547
Epoch: 17, step: 1074, loss: 0.32781344652175903, mean loss: 0.3570271105310456
Epoch: 17, step: 1075, loss: 0.3320782482624054, mean loss: 0.3570261368789121
Epoch: 17, step: 1076, loss: 0.34132006764411926, mean loss: 0.3570255239591371
Epoch: 17, step: 1077, loss: 0.36610910296440125, mean loss: 0.3570258784264362
Epoch: 17, step: 1078, loss: 0.316945880651474, mean loss: 0.3570243144510284
Epoch: 17, step: 1079, loss: 0.3223336637020111, mean loss: 0.35702296082800866
Epoch: 17, step: 1080, loss: 0.31849944591522217, mean loss: 0.35702145770596283
Epoch: 17, step: 1081, loss: 0.2949835956096649, mean loss: 0.3570190371885186
Epoch: 17, step: 1082, loss: 0.32370254397392273, mean loss: 0.3570177373370413
Epoch: 17, step: 1083, loss: 0.30910348892211914, mean loss: 0.35701586802335467
Epoch: 17, step: 1084, loss: 0.3599031865596771, mean loss: 0.3570159806640341
Epoch: 17, step: 1085, loss: 0.33153268694877625, mean loss: 0.3570149865431901
Epoch: 17, step: 1086, loss: 0.3312460780143738, mean loss: 0.3570139813195299
Epoch: 17, step: 1087, loss: 0.3512476980686188, mean loss: 0.357013756390397
Epoch: 17, step: 1088, loss: 0.3322194814682007, mean loss: 0.3570127892618359
Epoch: 17, step: 1089, loss: 0.3546932637691498, mean loss: 0.35701269878966596
Epoch: 17, step: 1090, loss: 0.3410828113555908, mean loss: 0.35701207747497216
Epoch: 17, step: 1091, loss: 0.34478652477264404, mean loss: 0.3570116006593441
Epoch: 17, step: 1092, loss: 0.3129621148109436, mean loss: 0.3570098827276781
Epoch: 17, step: 1093, loss: 0.3912547528743744, mean loss: 0.3570112182268648
Epoch: 17, step: 1094, loss: 0.2958860397338867, mean loss: 0.3570088345284484
Epoch: 17, step: 1095, loss: 0.3131153881549835, mean loss: 0.35700712288259073
Epoch: 17, step: 1096, loss: 0.31809738278388977, mean loss: 0.3570056056378998
Epoch: 17, step: 1097, loss: 0.328974187374115, mean loss: 0.35700451262463206
Epoch: 17, step: 1098, loss: 0.32481294870376587, mean loss: 0.35700325744609573
Epoch: 17, step: 1099, loss: 0.33970537781715393, mean loss: 0.3570025830122362
Epoch: 17, step: 1100, loss: 0.3161475658416748, mean loss: 0.357000990161943
Epoch: 17, step: 1101, loss: 0.3546816110610962, mean loss: 0.35700089973780647
Epoch: 17, step: 1102, loss: 0.39537739753723145, mean loss: 0.3570023958392372
Epoch: 17, step: 1103, loss: 0.3672339618206024, mean loss: 0.3570027946995982
Epoch: 17, step: 1104, loss: 0.30349305272102356, mean loss: 0.3570007087937791
Epoch: 17, step: 1105, loss: 0.34463775157928467, mean loss: 0.35700022688229494
Epoch: 17, step: 1106, loss: 0.3474740982055664, mean loss: 0.3569998555656441
Epoch: 17, step: 1107, loss: 0.33161115646362305, mean loss: 0.35699886598429464
Epoch: 17, step: 1108, loss: 0.3499603867530823, mean loss: 0.3569985916545121
Epoch: 17, step: 1109, loss: 0.3414458632469177, mean loss: 0.3569979854993789
Epoch: 17, step: 1110, loss: 0.3312476575374603, mean loss: 0.35699698194008345
Epoch: 17, step: 1111, loss: 0.32105112075805664, mean loss: 0.3569955810881278
Epoch: 17, step: 1112, loss: 0.342646986246109, mean loss: 0.3569950219285143
Epoch: 17, step: 1113, loss: 0.3689345419406891, mean loss: 0.35699548718921154
Epoch: 17, step: 1114, loss: 0.31987911462783813, mean loss: 0.3569940408901599
Epoch: 17, step: 1115, loss: 0.3811289370059967, mean loss: 0.3569949813084936
Epoch: 17, step: 1116, loss: 0.33120107650756836, mean loss: 0.3569939762859025
Epoch: 17, step: 1117, loss: 0.3275468349456787, mean loss: 0.35699282896488094
Epoch: 17, step: 1118, loss: 0.2960743308067322, mean loss: 0.35699045554772435
Epoch: 17, step: 1119, loss: 0.35516825318336487, mean loss: 0.3569903845565149
Epoch: 17, step: 1120, loss: 0.33291465044021606, mean loss: 0.3569894466261664
Epoch: 17, step: 1121, loss: 0.3531668186187744, mean loss: 0.35698929771194715
Epoch: 17, step: 1122, loss: 0.3603423833847046, mean loss: 0.35698942832959635
Epoch: 17, step: 1123, loss: 0.33894747495651245, mean loss: 0.35698872554238176
Epoch: 17, step: 1124, loss: 0.42154189944267273, mean loss: 0.35699123998065935
Epoch: 17, step: 1125, loss: 0.3234163820743561, mean loss: 0.35698993224295167
Epoch: 17, step: 1126, loss: 0.3498436212539673, mean loss: 0.35698965390562004
Epoch: 17, step: 1127, loss: 0.30818483233451843, mean loss: 0.35698775311026365
Epoch: 17, step: 1128, loss: 0.34042584896087646, mean loss: 0.3569871081009499
Epoch: 17, step: 1129, loss: 0.3236863315105438, mean loss: 0.3569858112407353
Epoch: 17, step: 1130, loss: 0.3536967635154724, mean loss: 0.3569856831575652
Epoch: 17, step: 1131, loss: 0.3399102985858917, mean loss: 0.35698501822825945
Epoch: 17, step: 1132, loss: 0.34560447931289673, mean loss: 0.3569845750781128
Epoch: 17, step: 1133, loss: 0.3706183433532715, mean loss: 0.3569851059467475
Epoch: 17, step: 1134, loss: 0.3560015559196472, mean loss: 0.3569850676509866
Epoch: 17, step: 1135, loss: 0.3063885271549225, mean loss: 0.3569830976875659
Epoch: 17, step: 1136, loss: 0.3709211051464081, mean loss: 0.35698364033920926
Epoch: 17, step: 1137, loss: 0.30617189407348633, mean loss: 0.3569816621508473
Epoch: 17, step: 1138, loss: 0.31014004349708557, mean loss: 0.3569798385973512
Epoch: 17, step: 1139, loss: 0.3236447274684906, mean loss: 0.3569785409053889
Epoch: 17, step: 1140, loss: 0.33921241760253906, mean loss: 0.35697784932053533
Epoch: 17, step: 1141, loss: 0.3658445179462433, mean loss: 0.3569781944613927
Epoch: 17, step: 1142, loss: 0.3270846903324127, mean loss: 0.3569770308825468
Epoch: 17, step: 1143, loss: 0.3237541913986206, mean loss: 0.3569757377625295
Epoch: 17, step: 1144, loss: 0.31941044330596924, mean loss: 0.3569742756796876
Epoch: 17, step: 1145, loss: 0.3400329351425171, mean loss: 0.3569736163296239
Epoch: 17, step: 1146, loss: 0.3427414894104004, mean loss: 0.3569730624426062
Epoch: 17, step: 1147, loss: 0.31683483719825745, mean loss: 0.3569715004008392
Epoch: 17, step: 1148, loss: 0.31811362504959106, mean loss: 0.35696998824473725
Epoch: 17, step: 1149, loss: 0.3519066274166107, mean loss: 0.3569697912114729
Epoch: 17, step: 1150, loss: 0.3186127841472626, mean loss: 0.3569682986628498
Epoch: 17, step: 1151, loss: 0.34145548939704895, mean loss: 0.3569676950515943
Epoch: 17, step: 1152, loss: 0.33092573285102844, mean loss: 0.3569666817850988
Epoch: 17, step: 1153, loss: 0.36905407905578613, mean loss: 0.35696715207524243
Epoch: 17, step: 1154, loss: 0.3257908821105957, mean loss: 0.35696593913239666
Epoch: 17, step: 1155, loss: 0.3037078082561493, mean loss: 0.35696386715407125
Epoch: 17, step: 1156, loss: 0.3627966344356537, mean loss: 0.35696409406585033
Epoch: 17, step: 1157, loss: 0.3342898488044739, mean loss: 0.35696321200542624
Epoch: 17, step: 1158, loss: 0.34162870049476624, mean loss: 0.3569626154943005
Epoch: 17, step: 1159, loss: 0.3471371829509735, mean loss: 0.3569622333007209
Epoch: 17, step: 1160, loss: 0.3141888380050659, mean loss: 0.3569605695489104
Epoch: 17, step: 1161, loss: 0.3066728413105011, mean loss: 0.3569586135890412
Epoch: 17, step: 1162, loss: 0.3237532675266266, mean loss: 0.3569573221050047
Epoch: 17, step: 1163, loss: 0.3872869610786438, mean loss: 0.3569585016958173
Epoch: 17, step: 1164, loss: 0.35924121737480164, mean loss: 0.35695859047253253
Epoch: 17, step: 1165, loss: 0.3389558792114258, mean loss: 0.3569578903593156
Epoch: 17, step: 1166, loss: 0.3505244255065918, mean loss: 0.35695764017596526
Epoch: 17, step: 1167, loss: 0.3144155442714691, mean loss: 0.35695598587141153
Epoch: 17, step: 1168, loss: 0.34755003452301025, mean loss: 0.3569556201230214
Epoch: 17, step: 1169, loss: 0.34600138664245605, mean loss: 0.35695519418657684
Epoch: 17, step: 1170, loss: 0.33991295099258423, mean loss: 0.35695453155415746
Epoch: 17, step: 1171, loss: 0.3094290792942047, mean loss: 0.3569526837527477
Epoch: 17, step: 1172, loss: 0.31172725558280945, mean loss: 0.3569509254452103
Epoch: 17, step: 1173, loss: 0.3730095624923706, mean loss: 0.35695154976046756
Epoch: 17, step: 1174, loss: 0.33450767397880554, mean loss: 0.35695067723876395
Epoch: 17, step: 1175, loss: 0.3557729423046112, mean loss: 0.35695063145525696
Epoch: 17, step: 1176, loss: 0.40041545033454895, mean loss: 0.3569523210497712
Epoch: 17, step: 1177, loss: 0.3374347984790802, mean loss: 0.35695156238062054
Epoch: 17, step: 1178, loss: 0.3296164870262146, mean loss: 0.3569504998752622
Epoch: 17, step: 1179, loss: 0.3391247093677521, mean loss: 0.3569498070195988
Epoch: 17, step: 1180, loss: 0.3590143620967865, mean loss: 0.35694988726193533
Epoch: 17, step: 1181, loss: 0.30910107493400574, mean loss: 0.35694802761124245
Epoch: 17, step: 1182, loss: 0.33394381403923035, mean loss: 0.35694713358405455
Epoch: 17, step: 1183, loss: 0.3090721666812897, mean loss: 0.35694527306147944
Epoch: 17, step: 1184, loss: 0.3492628037929535, mean loss: 0.3569449745160604
Epoch: 17, step: 1185, loss: 0.32495906949043274, mean loss: 0.3569437315726771
Epoch: 17, step: 1186, loss: 0.33022481203079224, mean loss: 0.35694269333993794
Epoch: 17, step: 1187, loss: 0.336444616317749, mean loss: 0.356941896865077
Epoch: 17, step: 1188, loss: 0.3354537785053253, mean loss: 0.35694106195353487
Epoch: 17, step: 1189, loss: 0.34302273392677307, mean loss: 0.35694052118393244
Epoch: 17, step: 1190, loss: 0.33882007002830505, mean loss: 0.3569398171763503
Epoch: 17, step: 1191, loss: 0.3288942873477936, mean loss: 0.3569387276064269
Epoch: 17, step: 1192, loss: 0.33213353157043457, mean loss: 0.3569377639610349
Epoch: 17, step: 1193, loss: 0.33208200335502625, mean loss: 0.3569367983887947
Epoch: 17, step: 1194, loss: 0.38209614157676697, mean loss: 0.3569377757163474
Epoch: 17, step: 1195, loss: 0.3334326148033142, mean loss: 0.35693686268181846
Epoch: 17, step: 1196, loss: 0.298933744430542, mean loss: 0.3569346096960639
Epoch: 17, step: 1197, loss: 0.34061914682388306, mean loss: 0.35693397598741505
Epoch: 17, step: 1198, loss: 0.3019198179244995, mean loss: 0.3569318392663189
Epoch: 17, step: 1199, loss: 0.37793782353401184, mean loss: 0.35693265509606364
Epoch: 17, step: 1200, loss: 0.3137599229812622, mean loss: 0.3569309784199941
Epoch: 17, step: 1201, loss: 0.4141468405723572, mean loss: 0.3569332003952233
Epoch: 17, step: 1202, loss: 0.3397446274757385, mean loss: 0.3569325329037504
Epoch: 17, step: 1203, loss: 0.307674765586853, mean loss: 0.35693062012931276
Epoch: 17, step: 1204, loss: 0.3746701180934906, mean loss: 0.35693130896160274
Epoch: 17, step: 1205, loss: 0.3349514603614807, mean loss: 0.3569304555078247
Epoch: 17, step: 1206, loss: 0.4058879613876343, mean loss: 0.3569323564010835
Epoch: 17, step: 1207, loss: 0.3388371765613556, mean loss: 0.35693165383935654
Epoch: 17, step: 1208, loss: 0.36353984475135803, mean loss: 0.3569319103983856
Epoch: 17, step: 1209, loss: 0.3333796262741089, mean loss: 0.35693099603065037
Epoch: 17, step: 1210, loss: 0.33716312050819397, mean loss: 0.3569302286143872
Epoch: 17, step: 1211, loss: 0.32947343587875366, mean loss: 0.356929162745104
Epoch: 17, step: 1212, loss: 0.31859272718429565, mean loss: 0.3569276745872079
Epoch: 17, step: 1213, loss: 0.34298864006996155, mean loss: 0.356927133517628
Epoch: 17, step: 1214, loss: 0.3232406973838806, mean loss: 0.35692582596663885
Epoch: 17, step: 1215, loss: 0.33921462297439575, mean loss: 0.35692513852668417
Epoch: 17, step: 1216, loss: 0.3371593952178955, mean loss: 0.35692437137188854
Epoch: 17, step: 1217, loss: 0.3479684293270111, mean loss: 0.3569240237842907
Epoch: 17, step: 1218, loss: 0.34130430221557617, mean loss: 0.35692341759336554
Epoch: 17, step: 1219, loss: 0.32729265093803406, mean loss: 0.35692226768779833
Epoch: 17, step: 1220, loss: 0.3617333173751831, mean loss: 0.35692245438692083
Epoch: 17, step: 1221, loss: 0.32639190554618835, mean loss: 0.35692126965471904
Epoch: 17, step: 1222, loss: 0.34451979398727417, mean loss: 0.35692078843646335
Epoch: 17, step: 1223, loss: 0.31620773673057556, mean loss: 0.35691920869675725
Epoch: 17, step: 1224, loss: 0.33378419280052185, mean loss: 0.3569183110513184
Epoch: 17, step: 1225, loss: 0.34208375215530396, mean loss: 0.3569177354883908
Epoch: 17, step: 1226, loss: 0.3832198977470398, mean loss: 0.35691875594085476
Epoch: 17, step: 1227, loss: 0.3890198767185211, mean loss: 0.3569200013288427
Epoch: 17, step: 1228, loss: 0.3050036132335663, mean loss: 0.35691798727025964
Epoch: 17, step: 1229, loss: 0.3326353430747986, mean loss: 0.356917045279252
Epoch: 17, step: 1230, loss: 0.29988420009613037, mean loss: 0.356914832903086
Epoch: 17, step: 1231, loss: 0.3197828233242035, mean loss: 0.35691339256136456
Epoch: 17, step: 1232, loss: 0.3429773151874542, mean loss: 0.35691285200524286
Epoch: 17, step: 1233, loss: 0.3354288339614868, mean loss: 0.35691201870999645
Epoch: 17, step: 1234, loss: 0.31897738575935364, mean loss: 0.35691054740592204
Epoch: 17, step: 1235, loss: 0.3465092182159424, mean loss: 0.3569101440034558
Epoch: 17, step: 1236, loss: 0.3259376883506775, mean loss: 0.3569089428223174
Epoch: 17, step: 1237, loss: 0.33969101309776306, mean loss: 0.3569082750983693
Epoch: 17, step: 1238, loss: 0.28860700130462646, mean loss: 0.3569056264275742
Epoch: 17, step: 1239, loss: 0.34704461693763733, mean loss: 0.35690524404004936
Epoch: 17, step: 1240, loss: 0.318803995847702, mean loss: 0.35690376661757495
Epoch: 17, step: 1241, loss: 0.33491548895835876, mean loss: 0.35690291402829
Epoch: 17, step: 1242, loss: 0.34579211473464966, mean loss: 0.356902483226875
Epoch: 17, step: 1243, loss: 0.3442201614379883, mean loss: 0.3569019915115451
Epoch: 17, step: 1244, loss: 0.3229494094848633, mean loss: 0.3569006751628448
Epoch: 17, step: 1245, loss: 0.3505536615848541, mean loss: 0.35690042909734204
Epoch: 17, step: 1246, loss: 0.3515165448188782, mean loss: 0.3569002203792076
Epoch: 17, step: 1247, loss: 0.32777026295661926, mean loss: 0.356899091136014
Epoch: 17, step: 1248, loss: 0.35276877880096436, mean loss: 0.35689893102777137
Epoch: 17, step: 1249, loss: 0.31830209493637085, mean loss: 0.3568974349103944
Epoch: 17, step: 1250, loss: 0.3439164161682129, mean loss: 0.35689693175063075
Epoch: 17, step: 1251, loss: 0.3234519362449646, mean loss: 0.3568956354329755
Epoch: 17, step: 1252, loss: 0.3096178472042084, mean loss: 0.3568938030315868
Epoch: 17, step: 1253, loss: 0.29948747158050537, mean loss: 0.3568915781524514
Epoch: 17, step: 1254, loss: 0.29836419224739075, mean loss: 0.35688930991287054
Epoch: 17, step: 1255, loss: 0.35686296224594116, mean loss: 0.3568893088918014
Epoch: 17, step: 1256, loss: 0.29164308309555054, mean loss: 0.35688678045832745
Epoch: 17, step: 1257, loss: 0.3794001042842865, mean loss: 0.3568876528648928
Epoch: 17, step: 1258, loss: 0.32722434401512146, mean loss: 0.35688650343610023
Epoch: 17, step: 1259, loss: 0.3650359809398651, mean loss: 0.3568868192094071
Epoch: 17, step: 1260, loss: 0.337469220161438, mean loss: 0.35688606685173935
Epoch: 17, step: 1261, loss: 0.32692280411720276, mean loss: 0.35688490593493444
Epoch: 17, step: 1262, loss: 0.36933833360671997, mean loss: 0.35688538842021866
Epoch: 17, step: 1263, loss: 0.3717646598815918, mean loss: 0.3568859648680515
Epoch: 17, step: 1264, loss: 0.32382428646087646, mean loss: 0.35688468405302004
Epoch: 17, step: 1265, loss: 0.3481154441833496, mean loss: 0.35688434434433985
Epoch: 17, step: 1266, loss: 0.3514707684516907, mean loss: 0.3568841346377393
Epoch: 17, step: 1267, loss: 0.33796706795692444, mean loss: 0.3568834018725286
Epoch: 17, step: 1268, loss: 0.3112312853336334, mean loss: 0.356881633575804
Epoch: 17, step: 1269, loss: 0.31592512130737305, mean loss: 0.35688004722084743
Epoch: 17, step: 1270, loss: 0.36382678151130676, mean loss: 0.3568803162759731
Epoch: 17, step: 1271, loss: 0.31231051683425903, mean loss: 0.35687859010248585
Epoch: 17, step: 1272, loss: 0.3165636658668518, mean loss: 0.3568770287793676
Epoch: 17, step: 1273, loss: 0.29327914118766785, mean loss: 0.3568745658451413
Epoch: 17, step: 1274, loss: 0.343800812959671, mean loss: 0.3568740595618712
Epoch: 17, step: 1275, loss: 0.2827320098876953, mean loss: 0.35687118850976174
Epoch: 17, step: 1276, loss: 0.31145182251930237, mean loss: 0.35686942977342134
Epoch: 17, step: 1277, loss: 0.32173484563827515, mean loss: 0.3568680693388153
Epoch: 17, step: 1278, loss: 0.3214395344257355, mean loss: 0.3568666975753541
Epoch: 17, step: 1279, loss: 0.30838972330093384, mean loss: 0.35686482065982544
Epoch: 17, step: 1280, loss: 0.2983283996582031, mean loss: 0.3568625543536966
Epoch: 17, step: 1281, loss: 0.3123200833797455, mean loss: 0.3568608299065045
Epoch: 17, step: 1282, loss: 0.32628288865089417, mean loss: 0.3568596461373412
Epoch: 17, step: 1283, loss: 0.284970223903656, mean loss: 0.35685686317736004
Epoch: 17, step: 1284, loss: 0.3246455788612366, mean loss: 0.3568556162728458
Epoch: 17, step: 1285, loss: 0.302404522895813, mean loss: 0.35685350854297904
Epoch: 17, step: 1286, loss: 0.3332124650478363, mean loss: 0.35685259346484877
Epoch: 17, step: 1287, loss: 0.3238328993320465, mean loss: 0.3568513154150681
Epoch: 17, step: 1288, loss: 0.35632720589637756, mean loss: 0.3568512951298369
Epoch: 17, step: 1289, loss: 0.3367515802383423, mean loss: 0.35685051721688343
Epoch: 17, step: 1290, loss: 0.31680184602737427, mean loss: 0.3568489672857255
Epoch: 17, step: 1291, loss: 0.31810277700424194, mean loss: 0.35684746782015736
Epoch: 17, step: 1292, loss: 0.3612162172794342, mean loss: 0.3568476368828662
Epoch: 17, step: 1293, loss: 0.34326109290122986, mean loss: 0.35684711112851353
Epoch: 17, step: 1294, loss: 0.34112900495529175, mean loss: 0.3568465029132841
Epoch: 17, step: 1295, loss: 0.31490540504455566, mean loss: 0.3568448800569976
Epoch: 17, step: 1296, loss: 0.32021257281303406, mean loss: 0.35684346267231026
Epoch: 17, step: 1297, loss: 0.3572691082954407, mean loss: 0.35684347914084014
Epoch: 17, step: 1298, loss: 0.3148166239261627, mean loss: 0.35684185315503075
Epoch: 17, step: 1299, loss: 0.33421725034713745, mean loss: 0.3568409778608955
Epoch: 17, step: 1300, loss: 0.3278926908969879, mean loss: 0.35683985796121026
Epoch: 17, step: 1301, loss: 0.317464143037796, mean loss: 0.3568383347227219
Epoch: 17, step: 1302, loss: 0.34186774492263794, mean loss: 0.35683775561205694
Epoch: 17, step: 1303, loss: 0.3194669187068939, mean loss: 0.35683631004355526
Epoch: 17, step: 1304, loss: 0.3354702591896057, mean loss: 0.3568354835997826
Epoch: 17, step: 1305, loss: 0.3678392171859741, mean loss: 0.35683590921027175
Epoch: 17, step: 1306, loss: 0.3471153676509857, mean loss: 0.356835533246568
Epoch: 17, step: 1307, loss: 0.3380012810230255, mean loss: 0.35683480481787744
Epoch: 17, step: 1308, loss: 0.34358876943588257, mean loss: 0.3568342925374357
Epoch: 17, step: 1309, loss: 0.33224183320999146, mean loss: 0.35683334147937523
Epoch: 17, step: 1310, loss: 0.3458369970321655, mean loss: 0.3568329162369278
Epoch: 17, step: 1311, loss: 0.3217707872390747, mean loss: 0.3568315603928057
Epoch: 17, step: 1312, loss: 0.3570738732814789, mean loss: 0.3568315697626247
Epoch: 17, step: 1313, loss: 0.3241189420223236, mean loss: 0.35683030487097905
Epoch: 17, step: 1314, loss: 0.3583938181400299, mean loss: 0.3568303653246491
Epoch: 17, step: 1315, loss: 0.3239043653011322, mean loss: 0.3568290922810355
Epoch: 17, step: 1316, loss: 0.34863075613975525, mean loss: 0.35682877531462753
Epoch: 17, step: 1317, loss: 0.3126768171787262, mean loss: 0.35682706836503597
Epoch: 17, step: 1318, loss: 0.32185420393943787, mean loss: 0.35682571633873117
Epoch: 17, step: 1319, loss: 0.3150409162044525, mean loss: 0.3568241010302367
Epoch: 17, step: 1320, loss: 0.32726529240608215, mean loss: 0.3568229583958626
Epoch: 17, step: 1321, loss: 0.31363239884376526, mean loss: 0.3568212888728803
Epoch: 17, step: 1322, loss: 0.3634049892425537, mean loss: 0.35682154335474686
Epoch: 17, step: 1323, loss: 0.3648401200771332, mean loss: 0.356821853287366
Epoch: 17, step: 1324, loss: 0.3464677631855011, mean loss: 0.35682145309836194
Epoch: 17, step: 1325, loss: 0.350179523229599, mean loss: 0.35682119639549925
Epoch: 17, step: 1326, loss: 0.31980738043785095, mean loss: 0.35681976590985837
Epoch: 17, step: 1327, loss: 0.3298279643058777, mean loss: 0.3568187227887576
Epoch: 17, step: 1328, loss: 0.3106214106082916, mean loss: 0.35681693752337984
Epoch: 17, step: 1329, loss: 0.3440498113632202, mean loss: 0.356816444165077
Epoch: 17, step: 1330, loss: 0.3240707218647003, mean loss: 0.3568151788255237
Epoch: 17, step: 1331, loss: 0.3608594238758087, mean loss: 0.3568153350946524
Epoch: 17, step: 1332, loss: 0.3171095848083496, mean loss: 0.35681380092865084
Epoch: 17, step: 1333, loss: 0.301279753446579, mean loss: 0.3568116552657391
Epoch: 17, step: 1334, loss: 0.336923211812973, mean loss: 0.35681088686781565
Epoch: 17, step: 1335, loss: 0.34657543897628784, mean loss: 0.356810491432493
Epoch: 17, step: 1336, loss: 0.3449040353298187, mean loss: 0.3568100314573683
Epoch: 17, step: 1337, loss: 0.38127613067626953, mean loss: 0.35681097660529454
Epoch: 17, step: 1338, loss: 0.326540470123291, mean loss: 0.356809807272947
Epoch: 17, step: 1339, loss: 0.2918008863925934, mean loss: 0.35680729611252976
Epoch: 17, step: 1340, loss: 0.29602792859077454, mean loss: 0.3568049484217143
Epoch: 17, step: 1341, loss: 0.3166252076625824, mean loss: 0.3568033964811674
Epoch: 17, step: 1342, loss: 0.32436543703079224, mean loss: 0.35680214361494167
Epoch: 17, step: 1343, loss: 0.32057201862335205, mean loss: 0.35680074433620723
Epoch: 17, step: 1344, loss: 0.32082170248031616, mean loss: 0.356799354808464
Epoch: 17, step: 1345, loss: 0.3140016794204712, mean loss: 0.3567977020056762
Epoch: 17, step: 1346, loss: 0.32368940114974976, mean loss: 0.35679642344607565
Epoch: 17, step: 1347, loss: 0.2734120190143585, mean loss: 0.356793203473708
Epoch: 17, step: 1348, loss: 0.34156110882759094, mean loss: 0.3567926152938167
Epoch: 17, step: 1349, loss: 0.3218011260032654, mean loss: 0.35679126416673
Epoch: 17, step: 1350, loss: 0.3503398597240448, mean loss: 0.3567910150681377
Epoch: 17, step: 1351, loss: 0.35230541229248047, mean loss: 0.35679084187884136
Epoch: 17, step: 1352, loss: 0.3010617792606354, mean loss: 0.356788690260656
Epoch: 17, step: 1353, loss: 0.3132956922054291, mean loss: 0.3567870111239849
Epoch: 17, step: 1354, loss: 0.3185773491859436, mean loss: 0.35678553601832386
Epoch: 17, step: 1355, loss: 0.3288710117340088, mean loss: 0.3567844584038904
Epoch: 17, step: 1356, loss: 0.3480645716190338, mean loss: 0.3567841217937076
Epoch: 17, step: 1357, loss: 0.32887640595436096, mean loss: 0.3567830445252818
Epoch: 17, step: 1358, loss: 0.3339819610118866, mean loss: 0.3567821644124353
Epoch: 17, step: 1359, loss: 0.2954481840133667, mean loss: 0.35677979703631985
Epoch: 17, step: 1360, loss: 0.3502179980278015, mean loss: 0.35677954377301335
Epoch: 17, step: 1361, loss: 0.2955849766731262, mean loss: 0.3567771819603117
Epoch: 17, step: 1362, loss: 0.33225905895233154, mean loss: 0.35677623571651534
Epoch: 17, step: 1363, loss: 0.36135947704315186, mean loss: 0.3567764125936891
Epoch: 17, step: 1364, loss: 0.3745322525501251, mean loss: 0.3567770978034277
Epoch: 17, step: 1365, loss: 0.37894687056541443, mean loss: 0.35677795331677037
Epoch: 17, step: 1366, loss: 0.3277921974658966, mean loss: 0.3567768348233939
Epoch: 17, step: 1367, loss: 0.3198835849761963, mean loss: 0.35677541125301854
Epoch: 17, step: 1368, loss: 0.3297754228115082, mean loss: 0.3567743694662206
Epoch: 17, step: 1369, loss: 0.31157585978507996, mean loss: 0.35677262556199646
Epoch: 17, step: 1370, loss: 0.35074567794799805, mean loss: 0.3567723930318983
Epoch: 17, step: 1371, loss: 0.3747914433479309, mean loss: 0.3567730882113086
Epoch: 17, step: 1372, loss: 0.29896995425224304, mean loss: 0.356770858238161
Epoch: 17, step: 1373, loss: 0.35144367814064026, mean loss: 0.3567706527300946
Epoch: 17, step: 1374, loss: 0.34705862402915955, mean loss: 0.3567702780809915
Epoch: 17, step: 1375, loss: 0.3336088955402374, mean loss: 0.3567693846470098
Epoch: 17, step: 1376, loss: 0.3439253866672516, mean loss: 0.35676888921796523
Epoch: 17, step: 1377, loss: 0.2972998023033142, mean loss: 0.3567665954168808
Epoch: 17, step: 1378, loss: 0.32581958174705505, mean loss: 0.35676540179580357
Epoch: 17, step: 1379, loss: 0.353669673204422, mean loss: 0.3567652823986811
Epoch: 17, step: 1380, loss: 0.3248131275177002, mean loss: 0.35676405010453627
Epoch: 17, step: 1381, loss: 0.343797892332077, mean loss: 0.35676355005988636
Epoch: 17, step: 1382, loss: 0.3466184437274933, mean loss: 0.3567631588252123
Epoch: 17, step: 1383, loss: 0.3385792374610901, mean loss: 0.35676245760967307
Epoch: 17, step: 1384, loss: 0.3213525116443634, mean loss: 0.3567610921700415
Epoch: 17, step: 1385, loss: 0.3095279633998871, mean loss: 0.3567592708879882
Epoch: 17, step: 1386, loss: 0.28107595443725586, mean loss: 0.356756352695721
Epoch: 17, step: 1387, loss: 0.34758761525154114, mean loss: 0.35675599918178497
Epoch: 17, step: 1388, loss: 0.3677181601524353, mean loss: 0.35675642182746375
Epoch: 17, step: 1389, loss: 0.3479733169078827, mean loss: 0.3567560832082595
Epoch: 17, step: 1390, loss: 0.3354012370109558, mean loss: 0.356755259936499
Epoch: 17, step: 1391, loss: 0.39806780219078064, mean loss: 0.35675685255570694
Epoch: 17, step: 1392, loss: 0.33266693353652954, mean loss: 0.35675592391305555
Epoch: 17, step: 1393, loss: 0.32853856682777405, mean loss: 0.3567548362036621
Epoch: 17, step: 1394, loss: 0.3515995442867279, mean loss: 0.3567546374875569
Epoch: 17, step: 1395, loss: 0.30784672498703003, mean loss: 0.35675275235371096
Epoch: 17, step: 1396, loss: 0.28702327609062195, mean loss: 0.356750064765495
Epoch: 17, step: 1397, loss: 0.2934071123600006, mean loss: 0.3567476234276238
Epoch: 17, step: 1398, loss: 0.3058215379714966, mean loss: 0.35674566073114805
Epoch: 17, step: 1399, loss: 0.32669058442115784, mean loss: 0.3567445024501125
Epoch: 17, step: 1400, loss: 0.3421526551246643, mean loss: 0.3567439401221875
Epoch: 17, step: 1401, loss: 0.32960614562034607, mean loss: 0.3567428943497597
Epoch: 17, step: 1402, loss: 0.34534138441085815, mean loss: 0.3567424550021454
Epoch: 17, step: 1403, loss: 0.36112505197525024, mean loss: 0.35674262387533334
Epoch: 17, step: 1404, loss: 0.3249809443950653, mean loss: 0.35674140005999483
Epoch: 17, step: 1405, loss: 0.2911391854286194, mean loss: 0.35673887242592567
Epoch: 17, step: 1406, loss: 0.29962584376335144, mean loss: 0.3567366719624827
Epoch: 17, step: 1407, loss: 0.31648290157318115, mean loss: 0.3567351211160353
Epoch: 17, step: 1408, loss: 0.34974539279937744, mean loss: 0.3567348518349814
Epoch: 17, step: 1409, loss: 0.3238169848918915, mean loss: 0.35673358371467384
Epoch: 17, step: 1410, loss: 0.35351482033729553, mean loss: 0.3567334597205532
Epoch: 17, step: 1411, loss: 0.304235577583313, mean loss: 0.35673143746007024
Epoch: 17, step: 1412, loss: 0.31351783871650696, mean loss: 0.3567297729017426
Epoch: 17, step: 1413, loss: 0.3207499086856842, mean loss: 0.3567283870353142
Epoch: 17, step: 1414, loss: 0.3360232412815094, mean loss: 0.35672758954866957
Epoch: 17, step: 1415, loss: 0.33348140120506287, mean loss: 0.35672669422482334
Epoch: 17, step: 1416, loss: 0.30661827325820923, mean loss: 0.35672476437999506
Epoch: 17, step: 1417, loss: 0.3385522663593292, mean loss: 0.35672406452256533
Epoch: 17, step: 1418, loss: 0.3791065216064453, mean loss: 0.3567249264803226
Epoch: 17, step: 1419, loss: 0.350406289100647, mean loss: 0.3567246831563323
Epoch: 17, step: 1420, loss: 0.34355977177619934, mean loss: 0.3567241762091499
Epoch: 17, step: 1421, loss: 0.3263644874095917, mean loss: 0.3567230071799316
Epoch: 17, step: 1422, loss: 0.32737618684768677, mean loss: 0.35672187719570564
Epoch: 17, step: 1423, loss: 0.3508080542087555, mean loss: 0.35672164949576
Epoch: 17, step: 1424, loss: 0.3354182839393616, mean loss: 0.35672082928378773
Epoch: 17, step: 1425, loss: 0.36362409591674805, mean loss: 0.35672109505981886
Epoch: 17, step: 1426, loss: 0.39194029569625854, mean loss: 0.35672245094819754
Epoch: 17, step: 1427, loss: 0.32879334688186646, mean loss: 0.3567213757594053
Epoch: 17, step: 1428, loss: 0.33725929260253906, mean loss: 0.3567206265549877
Epoch: 17, step: 1429, loss: 0.31298723816871643, mean loss: 0.35671894307710694
Epoch: 17, step: 1430, loss: 0.3354059159755707, mean loss: 0.35671812268266906
Epoch: 17, step: 1431, loss: 0.33941057324409485, mean loss: 0.3567174564952388
Epoch: 17, step: 1432, loss: 0.34774982929229736, mean loss: 0.3567171113342672
Epoch: 17, step: 1433, loss: 0.3167872130870819, mean loss: 0.35671557450499125
Epoch: 17, step: 1434, loss: 0.3253623843193054, mean loss: 0.35671436782407734
Epoch: 17, step: 1435, loss: 0.31267836689949036, mean loss: 0.3567126730888201
Epoch: 17, step: 1436, loss: 0.3424871265888214, mean loss: 0.35671212563657845
Epoch: 17, step: 1437, loss: 0.3050059676170349, mean loss: 0.3567101358667786
Epoch: 17, step: 1438, loss: 0.3496445119380951, mean loss: 0.35670986397606674
Epoch: 17, step: 1439, loss: 0.35216856002807617, mean loss: 0.35670968922987817
Epoch: 17, step: 1440, loss: 0.3531801700592041, mean loss: 0.35670955342168353
Epoch: 17, step: 1441, loss: 0.3123584985733032, mean loss: 0.3567078469555485
Epoch: 17, step: 1442, loss: 0.3451785445213318, mean loss: 0.35670740336728973
Epoch: 17, step: 1443, loss: 0.380374014377594, mean loss: 0.3567083139017238
Valid: 17, mean loss: 0.19009617964426678
Epoch: 18, step: 0, loss: 0.42134684324264526, mean loss: 0.3567108006685203
Epoch: 18, step: 1, loss: 0.3000045716762543, mean loss: 0.356708619156287
Epoch: 18, step: 2, loss: 0.3358621597290039, mean loss: 0.3567078172151665
Epoch: 18, step: 3, loss: 0.33206650614738464, mean loss: 0.3567068693266041
Epoch: 18, step: 4, loss: 0.36639171838760376, mean loss: 0.35670724186378383
Epoch: 18, step: 5, loss: 0.3462505638599396, mean loss: 0.3567068396529213
Epoch: 18, step: 6, loss: 0.3239222466945648, mean loss: 0.3567055786585385
Epoch: 18, step: 7, loss: 0.35170233249664307, mean loss: 0.35670538622599385
Epoch: 18, step: 8, loss: 0.36118775606155396, mean loss: 0.3567055586182032
Epoch: 18, step: 9, loss: 0.3402811288833618, mean loss: 0.35670492695795647
Epoch: 18, step: 10, loss: 0.331817626953125, mean loss: 0.356703969864544
Epoch: 18, step: 11, loss: 0.38347193598747253, mean loss: 0.3567049992433366
Epoch: 18, step: 12, loss: 0.3521583080291748, mean loss: 0.3567048244042205
Epoch: 18, step: 13, loss: 0.3183481991291046, mean loss: 0.3567033494897671
Epoch: 18, step: 14, loss: 0.3214047849178314, mean loss: 0.3567019922180875
Epoch: 18, step: 15, loss: 0.30112403631210327, mean loss: 0.35669985526192377
Epoch: 18, step: 16, loss: 0.3422657549381256, mean loss: 0.35669930029632246
Epoch: 18, step: 17, loss: 0.3577168881893158, mean loss: 0.35669933941927107
Epoch: 18, step: 18, loss: 0.30982494354248047, mean loss: 0.35669753732031767
Epoch: 18, step: 19, loss: 0.38600414991378784, mean loss: 0.35669866397772937
Epoch: 18, step: 20, loss: 0.28864333033561707, mean loss: 0.35669604777299935
Epoch: 18, step: 21, loss: 0.31104782223701477, mean loss: 0.3566942930168859
Epoch: 18, step: 22, loss: 0.3236270546913147, mean loss: 0.3566930219333446
Epoch: 18, step: 23, loss: 0.3394078016281128, mean loss: 0.35669235752604506
Epoch: 18, step: 24, loss: 0.36718231439590454, mean loss: 0.35669276072229633
Epoch: 18, step: 25, loss: 0.33013561367988586, mean loss: 0.3566917400002177
Epoch: 18, step: 26, loss: 0.3311779201030731, mean loss: 0.3566907594160332
Epoch: 18, step: 27, loss: 0.38112491369247437, mean loss: 0.35669169846884935
Epoch: 18, step: 28, loss: 0.3277147710323334, mean loss: 0.3566905848710846
Epoch: 18, step: 29, loss: 0.344015508890152, mean loss: 0.356690097780316
Epoch: 18, step: 30, loss: 0.30053141713142395, mean loss: 0.3566879397400959
Epoch: 18, step: 31, loss: 0.34069445729255676, mean loss: 0.35668732517344787
Epoch: 18, step: 32, loss: 0.35640808939933777, mean loss: 0.35668731444392726
Epoch: 18, step: 33, loss: 0.29674503207206726, mean loss: 0.3566850112746976
Epoch: 18, step: 34, loss: 0.39202752709388733, mean loss: 0.35668636919208413
Epoch: 18, step: 35, loss: 0.3238104283809662, mean loss: 0.3566851060930826
Epoch: 18, step: 36, loss: 0.32563522458076477, mean loss: 0.3566839131974081
Epoch: 18, step: 37, loss: 0.31760311126708984, mean loss: 0.3566824118219978
Epoch: 18, step: 38, loss: 0.33023276925086975, mean loss: 0.35668139573953567
Epoch: 18, step: 39, loss: 0.3296981751918793, mean loss: 0.35668035919910285
Epoch: 18, step: 40, loss: 0.3427218794822693, mean loss: 0.35667982301503964
Epoch: 18, step: 41, loss: 0.31866833567619324, mean loss: 0.35667836294408095
Epoch: 18, step: 42, loss: 0.30150890350341797, mean loss: 0.3566762438943617
Epoch: 18, step: 43, loss: 0.3255918323993683, mean loss: 0.3566750499931674
Epoch: 18, step: 44, loss: 0.3860396444797516, mean loss: 0.3566761777956979
Epoch: 18, step: 45, loss: 0.34954795241355896, mean loss: 0.35667590403329746
Epoch: 18, step: 46, loss: 0.35238468647003174, mean loss: 0.3566757392336676
Epoch: 18, step: 47, loss: 0.3056751787662506, mean loss: 0.3566737806867986
Epoch: 18, step: 48, loss: 0.3392893671989441, mean loss: 0.3566731131082307
Epoch: 18, step: 49, loss: 0.3042604923248291, mean loss: 0.35667110048935413
Epoch: 18, step: 50, loss: 0.3562248945236206, mean loss: 0.3566710833559223
Epoch: 18, step: 51, loss: 0.34212812781333923, mean loss: 0.35667052495646207
Epoch: 18, step: 52, loss: 0.31582820415496826, mean loss: 0.3566689568120658
Epoch: 18, step: 53, loss: 0.3164745569229126, mean loss: 0.35666741360389986
Epoch: 18, step: 54, loss: 0.2980646789073944, mean loss: 0.35666516371966384
Epoch: 18, step: 55, loss: 0.3077554404735565, mean loss: 0.3566632860429422
Epoch: 18, step: 56, loss: 0.368940144777298, mean loss: 0.3566637573415999
Epoch: 18, step: 57, loss: 0.3269650936126709, mean loss: 0.35666261727773313
Epoch: 18, step: 58, loss: 0.31492388248443604, mean loss: 0.3566610150845431
Epoch: 18, step: 59, loss: 0.32360100746154785, mean loss: 0.3566597460837899
Epoch: 18, step: 60, loss: 0.33276936411857605, mean loss: 0.3566588290921972
Epoch: 18, step: 61, loss: 0.3588878810405731, mean loss: 0.3566589146472731
Epoch: 18, step: 62, loss: 0.30317422747612, mean loss: 0.35665686188629936
Epoch: 18, step: 63, loss: 0.30686846375465393, mean loss: 0.35665495106352796
Epoch: 18, step: 64, loss: 0.3969404697418213, mean loss: 0.3566564971171288
Epoch: 18, step: 65, loss: 0.33419883251190186, mean loss: 0.35665563528335015
Epoch: 18, step: 66, loss: 0.3241134583950043, mean loss: 0.3566543864949512
Epoch: 18, step: 67, loss: 0.3130875825881958, mean loss: 0.35665271470662013
Epoch: 18, step: 68, loss: 0.32778701186180115, mean loss: 0.35665160708592847
Epoch: 18, step: 69, loss: 0.3602341115474701, mean loss: 0.35665174454677034
Epoch: 18, step: 70, loss: 0.3132564127445221, mean loss: 0.3566500795300109
Epoch: 18, step: 71, loss: 0.31766176223754883, mean loss: 0.3566485836614837
Epoch: 18, step: 72, loss: 0.30489885807037354, mean loss: 0.35664659825094885
Epoch: 18, step: 73, loss: 0.3223803639411926, mean loss: 0.356645283655909
Epoch: 18, step: 74, loss: 0.29891130328178406, mean loss: 0.3566430688256495
Epoch: 18, step: 75, loss: 0.3409635126590729, mean loss: 0.3566424673389161
Epoch: 18, step: 76, loss: 0.39703047275543213, mean loss: 0.35664401661220685
Epoch: 18, step: 77, loss: 0.3353186547756195, mean loss: 0.35664319860830057
Epoch: 18, step: 78, loss: 0.3561529517173767, mean loss: 0.3566431798040011
Epoch: 18, step: 79, loss: 0.3227155804634094, mean loss: 0.3566418784999454
Epoch: 18, step: 80, loss: 0.32043880224227905, mean loss: 0.3566404899724933
Epoch: 18, step: 81, loss: 0.3067888915538788, mean loss: 0.35663857804496324
Epoch: 18, step: 82, loss: 0.35542306303977966, mean loss: 0.35663853142885565
Epoch: 18, step: 83, loss: 0.3484259843826294, mean loss: 0.3566382164822747
Epoch: 18, step: 84, loss: 0.2947484850883484, mean loss: 0.35663584313674435
Epoch: 18, step: 85, loss: 0.34526678919792175, mean loss: 0.35663540717332926
Epoch: 18, step: 86, loss: 0.365225613117218, mean loss: 0.35663573656502157
Epoch: 18, step: 87, loss: 0.32390761375427246, mean loss: 0.35663448165233713
Epoch: 18, step: 88, loss: 0.3429243266582489, mean loss: 0.3566339559763663
Epoch: 18, step: 89, loss: 0.29719266295433044, mean loss: 0.3566316769604541
Epoch: 18, step: 90, loss: 0.38361385464668274, mean loss: 0.3566327114341606
Epoch: 18, step: 91, loss: 0.3292689025402069, mean loss: 0.356631662369259
Epoch: 18, step: 92, loss: 0.32994213700294495, mean loss: 0.35663063919404847
Epoch: 18, step: 93, loss: 0.34691596031188965, mean loss: 0.35663026678436965
Epoch: 18, step: 94, loss: 0.3210693895816803, mean loss: 0.35662890361968214
Epoch: 18, step: 95, loss: 0.3525809347629547, mean loss: 0.35662874845374926
Epoch: 18, step: 96, loss: 0.33366501331329346, mean loss: 0.35662786824618514
Epoch: 18, step: 97, loss: 0.31363168358802795, mean loss: 0.35662622025137264
Epoch: 18, step: 98, loss: 0.32858583331108093, mean loss: 0.3566251455364541
Epoch: 18, step: 99, loss: 0.31385964155197144, mean loss: 0.3566235065090133
Epoch: 18, step: 100, loss: 0.3330239951610565, mean loss: 0.35662260207060653
Epoch: 18, step: 101, loss: 0.31033700704574585, mean loss: 0.35662082826839053
Epoch: 18, step: 102, loss: 0.31709951162338257, mean loss: 0.3566193137515618
Epoch: 18, step: 103, loss: 0.3217513859272003, mean loss: 0.35661797761085734
Epoch: 18, step: 104, loss: 0.3372212052345276, mean loss: 0.3566172343540701
Epoch: 18, step: 105, loss: 0.3401409685611725, mean loss: 0.3566166030311414
Epoch: 18, step: 106, loss: 0.33542120456695557, mean loss: 0.35661579091579354
Epoch: 18, step: 107, loss: 0.4085044264793396, mean loss: 0.3566177789861216
Epoch: 18, step: 108, loss: 0.3166173994541168, mean loss: 0.3566162464632477
Epoch: 18, step: 109, loss: 0.3213028907775879, mean loss: 0.35661489356478454
Epoch: 18, step: 110, loss: 0.35397323966026306, mean loss: 0.3566147923636236
Epoch: 18, step: 111, loss: 0.32441920042037964, mean loss: 0.35661355900506003
Epoch: 18, step: 112, loss: 0.33957570791244507, mean loss: 0.3566129063388623
Epoch: 18, step: 113, loss: 0.32157331705093384, mean loss: 0.35661156413441547
Epoch: 18, step: 114, loss: 0.3719254732131958, mean loss: 0.35661215071690594
Epoch: 18, step: 115, loss: 0.3761415183544159, mean loss: 0.35661289873926066
Epoch: 18, step: 116, loss: 0.3159518241882324, mean loss: 0.35661134138070416
Epoch: 18, step: 117, loss: 0.37753206491470337, mean loss: 0.3566121426339992
Epoch: 18, step: 118, loss: 0.29293081164360046, mean loss: 0.3566097037641363
Epoch: 18, step: 119, loss: 0.3466896712779999, mean loss: 0.3566093238609314
Epoch: 18, step: 120, loss: 0.3460911810398102, mean loss: 0.35660892106757863
Epoch: 18, step: 121, loss: 0.3349899351596832, mean loss: 0.3566080931980103
Epoch: 18, step: 122, loss: 0.28935328125953674, mean loss: 0.3566055178653686
Epoch: 18, step: 123, loss: 0.32528403401374817, mean loss: 0.35660431854373237
Epoch: 18, step: 124, loss: 0.295925110578537, mean loss: 0.35660199518316393
Epoch: 18, step: 125, loss: 0.3053447902202606, mean loss: 0.35660003265904405
Epoch: 18, step: 126, loss: 0.33087557554244995, mean loss: 0.3565990477646332
Epoch: 18, step: 127, loss: 0.38966843485832214, mean loss: 0.35660031382080065
Epoch: 18, step: 128, loss: 0.3249923288822174, mean loss: 0.3565991037605067
Epoch: 18, step: 129, loss: 0.31587478518486023, mean loss: 0.35659754475589084
Epoch: 18, step: 130, loss: 0.3619760274887085, mean loss: 0.35659775064658994
Epoch: 18, step: 131, loss: 0.32304465770721436, mean loss: 0.3565964662685108
Epoch: 18, step: 132, loss: 0.31241506338119507, mean loss: 0.3565947751143333
Epoch: 18, step: 133, loss: 0.3407585322856903, mean loss: 0.35659416896556084
Epoch: 18, step: 134, loss: 0.3281712234020233, mean loss: 0.35659308108920446
Epoch: 18, step: 135, loss: 0.35107576847076416, mean loss: 0.35659286992445327
Epoch: 18, step: 136, loss: 0.36493730545043945, mean loss: 0.3565931892797874
Epoch: 18, step: 137, loss: 0.38102686405181885, mean loss: 0.3565941243611028
Epoch: 18, step: 138, loss: 0.36147618293762207, mean loss: 0.35659431119125
Epoch: 18, step: 139, loss: 0.29243770241737366, mean loss: 0.3565918560937154
Epoch: 18, step: 140, loss: 0.2947828769683838, mean loss: 0.3565894909240401
Epoch: 18, step: 141, loss: 0.3408224582672119, mean loss: 0.3565888876090995
Epoch: 18, step: 142, loss: 0.32019051909446716, mean loss: 0.35658749490320646
Epoch: 18, step: 143, loss: 0.3422195613384247, mean loss: 0.3565869451659259
Epoch: 18, step: 144, loss: 0.312677800655365, mean loss: 0.35658526520477846
Epoch: 18, step: 145, loss: 0.3237820267677307, mean loss: 0.35658401020292535
Epoch: 18, step: 146, loss: 0.3155055344104767, mean loss: 0.35658243866324163
Epoch: 18, step: 147, loss: 0.34098920226097107, mean loss: 0.3565818421354527
Epoch: 18, step: 148, loss: 0.31905338168144226, mean loss: 0.35658040651858824
Epoch: 18, step: 149, loss: 0.35695523023605347, mean loss: 0.3565804208565776
Epoch: 18, step: 150, loss: 0.3413758873939514, mean loss: 0.3565798392655795
Epoch: 18, step: 151, loss: 0.3229730427265167, mean loss: 0.3565785538158955
Epoch: 18, step: 152, loss: 0.3868165910243988, mean loss: 0.3565797103673282
Epoch: 18, step: 153, loss: 0.3362743854522705, mean loss: 0.356578933754274
Epoch: 18, step: 154, loss: 0.33114370703697205, mean loss: 0.3565779609762606
Epoch: 18, step: 155, loss: 0.327823281288147, mean loss: 0.35657686128681254
Epoch: 18, step: 156, loss: 0.35945427417755127, mean loss: 0.3565769713259303
Epoch: 18, step: 157, loss: 0.3379635810852051, mean loss: 0.3565762595328045
Epoch: 18, step: 158, loss: 0.33273711800575256, mean loss: 0.3565753479370136
Epoch: 18, step: 159, loss: 0.31753888726234436, mean loss: 0.35657385526109303
Epoch: 18, step: 160, loss: 0.30983996391296387, mean loss: 0.35657206831919924
Epoch: 18, step: 161, loss: 0.30895310640335083, mean loss: 0.3565702476048949
Epoch: 18, step: 162, loss: 0.2978135645389557, mean loss: 0.3565680011249459
Epoch: 18, step: 163, loss: 0.3343140184879303, mean loss: 0.3565671503074418
Epoch: 18, step: 164, loss: 0.3055686354637146, mean loss: 0.35656520059933905
Epoch: 18, step: 165, loss: 0.31962576508522034, mean loss: 0.3565637884334428
Epoch: 18, step: 166, loss: 0.32688257098197937, mean loss: 0.35656265378695584
Epoch: 18, step: 167, loss: 0.33781492710113525, mean loss: 0.356561937130737
Epoch: 18, step: 168, loss: 0.3254663050174713, mean loss: 0.3565607485052214
Epoch: 18, step: 169, loss: 0.340769499540329, mean loss: 0.3565601449103523
Epoch: 18, step: 170, loss: 0.3188546299934387, mean loss: 0.35655870373331155
Epoch: 18, step: 171, loss: 0.276617169380188, mean loss: 0.3565556483314482
Epoch: 18, step: 172, loss: 0.34269392490386963, mean loss: 0.356555118550312
Epoch: 18, step: 173, loss: 0.3254812955856323, mean loss: 0.35655393098542
Epoch: 18, step: 174, loss: 0.33878305554389954, mean loss: 0.3565532518523347
Epoch: 18, step: 175, loss: 0.32755008339881897, mean loss: 0.3565521435074687
Epoch: 18, step: 176, loss: 0.31176450848579407, mean loss: 0.3565504320307206
Epoch: 18, step: 177, loss: 0.30947554111480713, mean loss: 0.3565486332194514
Epoch: 18, step: 178, loss: 0.3313269317150116, mean loss: 0.3565476694923678
Epoch: 18, step: 179, loss: 0.40813517570495605, mean loss: 0.35654964058766864
Epoch: 18, step: 180, loss: 0.31347301602363586, mean loss: 0.3565479947455961
Epoch: 18, step: 181, loss: 0.3345288634300232, mean loss: 0.3565471534858989
Epoch: 18, step: 182, loss: 0.3123965859413147, mean loss: 0.35654546674024296
Epoch: 18, step: 183, loss: 0.34163764119148254, mean loss: 0.35654489721756766
Epoch: 18, step: 184, loss: 0.3231496512889862, mean loss: 0.35654362146992935
Epoch: 18, step: 185, loss: 0.328937828540802, mean loss: 0.3565425669282176
Epoch: 18, step: 186, loss: 0.3635055422782898, mean loss: 0.3565428329038221
Epoch: 18, step: 187, loss: 0.30809280276298523, mean loss: 0.35654098225332015
Epoch: 18, step: 188, loss: 0.34578534960746765, mean loss: 0.3565405714350685
Epoch: 18, step: 189, loss: 0.3694241940975189, mean loss: 0.3565410635144613
Epoch: 18, step: 190, loss: 0.3310062885284424, mean loss: 0.35654008827193806
Epoch: 18, step: 191, loss: 0.33358609676361084, mean loss: 0.3565392116300381
Epoch: 18, step: 192, loss: 0.3080363869667053, mean loss: 0.3565373593167036
Epoch: 18, step: 193, loss: 0.31021028757095337, mean loss: 0.3565355901625088
Epoch: 18, step: 194, loss: 0.36058366298675537, mean loss: 0.3565357447458068
Epoch: 18, step: 195, loss: 0.33857885003089905, mean loss: 0.35653505905408867
Epoch: 18, step: 196, loss: 0.30194130539894104, mean loss: 0.35653297444781673
Epoch: 18, step: 197, loss: 0.30011624097824097, mean loss: 0.35653082031519095
Epoch: 18, step: 198, loss: 0.3137066960334778, mean loss: 0.35652918524496524
Epoch: 18, step: 199, loss: 0.3626348078250885, mean loss: 0.3565294183551737
Epoch: 18, step: 200, loss: 0.30282920598983765, mean loss: 0.35652736818099107
Epoch: 18, step: 201, loss: 0.34156182408332825, mean loss: 0.35652679684617783
Epoch: 18, step: 202, loss: 0.31935200095176697, mean loss: 0.35652537769000703
Epoch: 18, step: 203, loss: 0.3173363506793976, mean loss: 0.3565238816972215
Epoch: 18, step: 204, loss: 0.3296196758747101, mean loss: 0.3565228547015417
Epoch: 18, step: 205, loss: 0.3278263509273529, mean loss: 0.3565217593315221
Epoch: 18, step: 206, loss: 0.3440161347389221, mean loss: 0.35652128199938754
Epoch: 18, step: 207, loss: 0.329610139131546, mean loss: 0.35652025485653
Epoch: 18, step: 208, loss: 0.3428935110569, mean loss: 0.3565197347716554
Epoch: 18, step: 209, loss: 0.3898971974849701, mean loss: 0.3565210086233733
Epoch: 18, step: 210, loss: 0.3378881514072418, mean loss: 0.35652029752704023
Epoch: 18, step: 211, loss: 0.32646721601486206, mean loss: 0.35651915063795797
Epoch: 18, step: 212, loss: 0.3292285203933716, mean loss: 0.35651810920959526
Epoch: 18, step: 213, loss: 0.298115998506546, mean loss: 0.3565158806317618
Epoch: 18, step: 214, loss: 0.31471067667007446, mean loss: 0.35651428543948643
Epoch: 18, step: 215, loss: 0.31230971217155457, mean loss: 0.356512598757051
Epoch: 18, step: 216, loss: 0.28928327560424805, mean loss: 0.3565100336334998
Epoch: 18, step: 217, loss: 0.3057400584220886, mean loss: 0.3565080965875169
Epoch: 18, step: 218, loss: 0.31982630491256714, mean loss: 0.3565066971067007
Epoch: 18, step: 219, loss: 0.3382786810398102, mean loss: 0.3565060016994038
Epoch: 18, step: 220, loss: 0.332588255405426, mean loss: 0.35650508926106045
Epoch: 18, step: 221, loss: 0.35619214177131653, mean loss: 0.35650507732287895
Epoch: 18, step: 222, loss: 0.34655293822288513, mean loss: 0.35650469768758997
Epoch: 18, step: 223, loss: 0.36348339915275574, mean loss: 0.3565049638876764
Epoch: 18, step: 224, loss: 0.31671613454818726, mean loss: 0.35650344621481755
Epoch: 18, step: 225, loss: 0.33767518401145935, mean loss: 0.356502728072236
Epoch: 18, step: 226, loss: 0.34042108058929443, mean loss: 0.3565021147136989
Epoch: 18, step: 227, loss: 0.3594294786453247, mean loss: 0.35650222635992057
Epoch: 18, step: 228, loss: 0.3671133518218994, mean loss: 0.356502631040347
Epoch: 18, step: 229, loss: 0.3232142925262451, mean loss: 0.35650136155905215
Epoch: 18, step: 230, loss: 0.2952783703804016, mean loss: 0.3564990268532146
Epoch: 18, step: 231, loss: 0.35210782289505005, mean loss: 0.35649885940339926
Epoch: 18, step: 232, loss: 0.3248620331287384, mean loss: 0.35649765304205416
Epoch: 18, step: 233, loss: 0.33693844079971313, mean loss: 0.3564969072473374
Epoch: 18, step: 234, loss: 0.3044092357158661, mean loss: 0.3564949212149459
Epoch: 18, step: 235, loss: 0.32946109771728516, mean loss: 0.3564938904911584
Epoch: 18, step: 236, loss: 0.3060746192932129, mean loss: 0.3564919682192
Epoch: 18, step: 237, loss: 0.30890825390815735, mean loss: 0.3564901541241062
Epoch: 18, step: 238, loss: 0.33766719698905945, mean loss: 0.356489436539678
Epoch: 18, step: 239, loss: 0.3267798125743866, mean loss: 0.3564883039678587
Epoch: 18, step: 240, loss: 0.3142339885234833, mean loss: 0.356486693236511
Epoch: 18, step: 241, loss: 0.28215447068214417, mean loss: 0.35648385980575115
Epoch: 18, step: 242, loss: 0.32038524746894836, mean loss: 0.35648248383424985
Epoch: 18, step: 243, loss: 0.350369393825531, mean loss: 0.3564822508303617
Epoch: 18, step: 244, loss: 0.3420858681201935, mean loss: 0.35648170212499486
Epoch: 18, step: 245, loss: 0.31793174147605896, mean loss: 0.3564802328834121
Epoch: 18, step: 246, loss: 0.33262622356414795, mean loss: 0.35647932377828917
Epoch: 18, step: 247, loss: 0.3497164249420166, mean loss: 0.356479066045864
Epoch: 18, step: 248, loss: 0.32417115569114685, mean loss: 0.35647783484620105
Epoch: 18, step: 249, loss: 0.3563898503780365, mean loss: 0.35647783149338996
Epoch: 18, step: 250, loss: 0.31040817499160767, mean loss: 0.3564760759907225
Epoch: 18, step: 251, loss: 0.31804290413856506, mean loss: 0.35647461153515736
Epoch: 18, step: 252, loss: 0.3506472408771515, mean loss: 0.35647438949779187
Epoch: 18, step: 253, loss: 0.3708498477935791, mean loss: 0.35647493721776047
Epoch: 18, step: 254, loss: 0.35323530435562134, mean loss: 0.3564748137890691
Epoch: 18, step: 255, loss: 0.3240659832954407, mean loss: 0.3564735790728814
Epoch: 18, step: 256, loss: 0.35451728105545044, mean loss: 0.35647350454440346
Epoch: 18, step: 257, loss: 0.3230850100517273, mean loss: 0.35647223260175614
Epoch: 18, step: 258, loss: 0.302961528301239, mean loss: 0.3564701941763895
Epoch: 18, step: 259, loss: 0.335168719291687, mean loss: 0.3564693827534547
Epoch: 18, step: 260, loss: 0.3378772735595703, mean loss: 0.35646867456356424
Epoch: 18, step: 261, loss: 0.33308765292167664, mean loss: 0.3564677839936838
Epoch: 18, step: 262, loss: 0.3212145268917084, mean loss: 0.3564664412682181
Epoch: 18, step: 263, loss: 0.29970237612724304, mean loss: 0.35646427932180047
Epoch: 18, step: 264, loss: 0.30769628286361694, mean loss: 0.3564624219886528
Epoch: 18, step: 265, loss: 0.3731369972229004, mean loss: 0.356463057017034
Epoch: 18, step: 266, loss: 0.3510203957557678, mean loss: 0.35646284974862086
Epoch: 18, step: 267, loss: 0.3628779947757721, mean loss: 0.3564630940420339
Epoch: 18, step: 268, loss: 0.32827848196029663, mean loss: 0.3564620207922688
Epoch: 18, step: 269, loss: 0.332614541053772, mean loss: 0.35646111273196346
Epoch: 18, step: 270, loss: 0.3165501356124878, mean loss: 0.35645959306638375
Epoch: 18, step: 271, loss: 0.3295060098171234, mean loss: 0.35645856681054877
Epoch: 18, step: 272, loss: 0.3472636640071869, mean loss: 0.3564582167285841
Epoch: 18, step: 273, loss: 0.3551689684391022, mean loss: 0.35645816764428156
Epoch: 18, step: 274, loss: 0.3400516211986542, mean loss: 0.35645754303749566
Epoch: 18, step: 275, loss: 0.30369630455970764, mean loss: 0.356455534462862
Epoch: 18, step: 276, loss: 0.33428066968917847, mean loss: 0.35645469031710947
Epoch: 18, step: 277, loss: 0.3018627166748047, mean loss: 0.35645261220619806
Epoch: 18, step: 278, loss: 0.3308291435241699, mean loss: 0.3564516368543393
Epoch: 18, step: 279, loss: 0.3489728569984436, mean loss: 0.35645135218701834
Epoch: 18, step: 280, loss: 0.31470775604248047, mean loss: 0.35644976334691086
Epoch: 18, step: 281, loss: 0.3478584885597229, mean loss: 0.3564494363592125
Epoch: 18, step: 282, loss: 0.34876367449760437, mean loss: 0.3564491438468676
Epoch: 18, step: 283, loss: 0.3430781960487366, mean loss: 0.35644863498144674
Epoch: 18, step: 284, loss: 0.35012945532798767, mean loss: 0.3564483944981475
Epoch: 18, step: 285, loss: 0.325996994972229, mean loss: 0.356447235680904
Epoch: 18, step: 286, loss: 0.3367198407649994, mean loss: 0.3564464849904319
Epoch: 18, step: 287, loss: 0.3273913562297821, mean loss: 0.35644537939192505
Epoch: 18, step: 288, loss: 0.32983171939849854, mean loss: 0.3564443667341117
Epoch: 18, step: 289, loss: 0.3219938576221466, mean loss: 0.3564430559316951
Epoch: 18, step: 290, loss: 0.3210374712944031, mean loss: 0.3564417088410039
Epoch: 18, step: 291, loss: 0.29931461811065674, mean loss: 0.3564395353860225
Epoch: 18, step: 292, loss: 0.3476825952529907, mean loss: 0.35643920223250786
Epoch: 18, step: 293, loss: 0.34053802490234375, mean loss: 0.3564385973029891
Epoch: 18, step: 294, loss: 0.33345121145248413, mean loss: 0.35643772282564856
Epoch: 18, step: 295, loss: 0.35094723105430603, mean loss: 0.3564375139664059
Epoch: 18, step: 296, loss: 0.34397366642951965, mean loss: 0.35643703985755665
Epoch: 18, step: 297, loss: 0.32959386706352234, mean loss: 0.3564360188163701
Epoch: 18, step: 298, loss: 0.29951202869415283, mean loss: 0.35643385366517305
Epoch: 18, step: 299, loss: 0.3145105540752411, mean loss: 0.35643225913833637
Epoch: 18, step: 300, loss: 0.3103443682193756, mean loss: 0.35643050628050654
Epoch: 18, step: 301, loss: 0.30954501032829285, mean loss: 0.3564287231552326
Epoch: 18, step: 302, loss: 0.375802606344223, mean loss: 0.3564294599448576
Epoch: 18, step: 303, loss: 0.4268389642238617, mean loss: 0.3564321375195564
Epoch: 18, step: 304, loss: 0.3140367865562439, mean loss: 0.35643052534512726
Epoch: 18, step: 305, loss: 0.33027562499046326, mean loss: 0.35642953078659223
Epoch: 18, step: 306, loss: 0.3459728956222534, mean loss: 0.35642913318078345
Epoch: 18, step: 307, loss: 0.3489774167537689, mean loss: 0.3564288498455581
Epoch: 18, step: 308, loss: 0.33317551016807556, mean loss: 0.3564279657217728
Epoch: 18, step: 309, loss: 0.3195814788341522, mean loss: 0.35642656482119917
Epoch: 18, step: 310, loss: 0.30018529295921326, mean loss: 0.35642442661369955
Epoch: 18, step: 311, loss: 0.36562222242355347, mean loss: 0.3564247762865938
Epoch: 18, step: 312, loss: 0.3248649537563324, mean loss: 0.3564235765214339
Epoch: 18, step: 313, loss: 0.37532687187194824, mean loss: 0.35642429511397367
Epoch: 18, step: 314, loss: 0.3154703378677368, mean loss: 0.356422738343637
Epoch: 18, step: 315, loss: 0.3185517489910126, mean loss: 0.3564212988199426
Epoch: 18, step: 316, loss: 0.2811161279678345, mean loss: 0.3564184364849678
Epoch: 18, step: 317, loss: 0.36220312118530273, mean loss: 0.356418656351357
Epoch: 18, step: 318, loss: 0.3277556896209717, mean loss: 0.3564175669603521
Epoch: 18, step: 319, loss: 0.3282521069049835, mean loss: 0.3564164965187264
Epoch: 18, step: 320, loss: 0.363729864358902, mean loss: 0.3564167744561657
Epoch: 18, step: 321, loss: 0.3297709822654724, mean loss: 0.356415761847205
Epoch: 18, step: 322, loss: 0.3192373216152191, mean loss: 0.3564143490240915
Epoch: 18, step: 323, loss: 0.37532782554626465, mean loss: 0.35641506773044973
Epoch: 18, step: 324, loss: 0.3180038630962372, mean loss: 0.35641360817181333
Epoch: 18, step: 325, loss: 0.3626214861869812, mean loss: 0.356413844051364
Epoch: 18, step: 326, loss: 0.34211722016334534, mean loss: 0.3564133008459273
Epoch: 18, step: 327, loss: 0.3511122167110443, mean loss: 0.35641309943695565
Epoch: 18, step: 328, loss: 0.34080082178115845, mean loss: 0.35641250628784826
Epoch: 18, step: 329, loss: 0.3010205924510956, mean loss: 0.35641040189175993
Epoch: 18, step: 330, loss: 0.29683104157447815, mean loss: 0.35640813849623826
Epoch: 18, step: 331, loss: 0.32015082240104675, mean loss: 0.35640676114795933
Epoch: 18, step: 332, loss: 0.35094356536865234, mean loss: 0.3564065536191548
Epoch: 18, step: 333, loss: 0.304505854845047, mean loss: 0.3564045821575285
Epoch: 18, step: 334, loss: 0.36207902431488037, mean loss: 0.3564047976945117
Epoch: 18, step: 335, loss: 0.32794472575187683, mean loss: 0.35640371671335314
Epoch: 18, step: 336, loss: 0.2949466109275818, mean loss: 0.3564013825151008
Epoch: 18, step: 337, loss: 0.28543752431869507, mean loss: 0.3563986873438818
Epoch: 18, step: 338, loss: 0.3291950523853302, mean loss: 0.35639765420290886
Epoch: 18, step: 339, loss: 0.3514867424964905, mean loss: 0.3563974677031479
Epoch: 18, step: 340, loss: 0.3237699270248413, mean loss: 0.3563962286669318
Epoch: 18, step: 341, loss: 0.32585689425468445, mean loss: 0.35639506897473117
Epoch: 18, step: 342, loss: 0.2983020842075348, mean loss: 0.35639286305163387
Epoch: 18, step: 343, loss: 0.3208622932434082, mean loss: 0.35639151392610957
Epoch: 18, step: 344, loss: 0.33082571625709534, mean loss: 0.3563905432081968
Epoch: 18, step: 345, loss: 0.3236405551433563, mean loss: 0.35638929975812217
Epoch: 18, step: 346, loss: 0.3223397433757782, mean loss: 0.3563880070151789
Epoch: 18, step: 347, loss: 0.3137074112892151, mean loss: 0.3563863866432835
Epoch: 18, step: 348, loss: 0.3144373297691345, mean loss: 0.35638479410477414
Epoch: 18, step: 349, loss: 0.32890069484710693, mean loss: 0.3563837507481855
Epoch: 18, step: 350, loss: 0.35382184386253357, mean loss: 0.3563836534962823
Epoch: 18, step: 351, loss: 0.3147736191749573, mean loss: 0.35638207400818933
Epoch: 18, step: 352, loss: 0.34004831314086914, mean loss: 0.3563814540134705
Epoch: 18, step: 353, loss: 0.3619626462459564, mean loss: 0.35638166585558056
Epoch: 18, step: 354, loss: 0.3455335199832916, mean loss: 0.3563812541143625
Epoch: 18, step: 355, loss: 0.38508033752441406, mean loss: 0.3563823433463122
Epoch: 18, step: 356, loss: 0.3515549600124359, mean loss: 0.35638216013695573
Epoch: 18, step: 357, loss: 0.35190820693969727, mean loss: 0.3563819903474606
Epoch: 18, step: 358, loss: 0.30873847007751465, mean loss: 0.3563801823128407
Epoch: 18, step: 359, loss: 0.30964627861976624, mean loss: 0.3563784088647649
Epoch: 18, step: 360, loss: 0.34327104687690735, mean loss: 0.35637791148829967
Epoch: 18, step: 361, loss: 0.3502122461795807, mean loss: 0.3563776775327214
Epoch: 18, step: 362, loss: 0.3939613997936249, mean loss: 0.356379103589343
Epoch: 18, step: 363, loss: 0.36882033944129944, mean loss: 0.3563795756350196
Epoch: 18, step: 364, loss: 0.34813380241394043, mean loss: 0.3563792627855594
Epoch: 18, step: 365, loss: 0.3771141767501831, mean loss: 0.3563800494504796
Epoch: 18, step: 366, loss: 0.32380178570747375, mean loss: 0.35637881350587836
Epoch: 18, step: 367, loss: 0.33699697256088257, mean loss: 0.35637807823118395
Epoch: 18, step: 368, loss: 0.34570184350013733, mean loss: 0.3563776732300561
Epoch: 18, step: 369, loss: 0.3343864679336548, mean loss: 0.3563768390291117
Epoch: 18, step: 370, loss: 0.30193695425987244, mean loss: 0.3563747740181202
Epoch: 18, step: 371, loss: 0.32186540961265564, mean loss: 0.3563734650602835
Epoch: 18, step: 372, loss: 0.3277598023414612, mean loss: 0.3563723797705919
Epoch: 18, step: 373, loss: 0.3083382546901703, mean loss: 0.35637055794987277
Epoch: 18, step: 374, loss: 0.3554201126098633, mean loss: 0.35637052190309687
Epoch: 18, step: 375, loss: 0.3483537435531616, mean loss: 0.35637021786872375
Epoch: 18, step: 376, loss: 0.31554800271987915, mean loss: 0.3563686697548344
Epoch: 18, step: 377, loss: 0.32076457142829895, mean loss: 0.3563673195804572
Epoch: 18, step: 378, loss: 0.35324904322624207, mean loss: 0.3563672013340367
Epoch: 18, step: 379, loss: 0.3319877088069916, mean loss: 0.35636627688793754
Epoch: 18, step: 380, loss: 0.3457094132900238, mean loss: 0.35636587280559584
Epoch: 18, step: 381, loss: 0.3003765046596527, mean loss: 0.3563637499054614
Epoch: 18, step: 382, loss: 0.33001068234443665, mean loss: 0.35636275073702306
Epoch: 18, step: 383, loss: 0.34872308373451233, mean loss: 0.3563624610923839
Epoch: 18, step: 384, loss: 0.3652542233467102, mean loss: 0.3563627981952483
Epoch: 18, step: 385, loss: 0.3091427981853485, mean loss: 0.35636100806711085
Epoch: 18, step: 386, loss: 0.3089706003665924, mean loss: 0.3563592115468599
Epoch: 18, step: 387, loss: 0.357221394777298, mean loss: 0.3563592442300756
Epoch: 18, step: 388, loss: 0.3668520152568817, mean loss: 0.35635964196977565
Epoch: 18, step: 389, loss: 0.30811917781829834, mean loss: 0.3563578134327371
Epoch: 18, step: 390, loss: 0.3147165775299072, mean loss: 0.35635623509684267
Epoch: 18, step: 391, loss: 0.3087739646434784, mean loss: 0.3563544316451123
Epoch: 18, step: 392, loss: 0.37014877796173096, mean loss: 0.3563549544552816
Epoch: 18, step: 393, loss: 0.3265419006347656, mean loss: 0.3563538245737603
Epoch: 18, step: 394, loss: 0.31236958503723145, mean loss: 0.3563521576832636
Epoch: 18, step: 395, loss: 0.3449704051017761, mean loss: 0.35635172636021595
Epoch: 18, step: 396, loss: 0.3040461242198944, mean loss: 0.35634974426153315
Epoch: 18, step: 397, loss: 0.3333032727241516, mean loss: 0.3563488709583298
Epoch: 18, step: 398, loss: 0.3381745517253876, mean loss: 0.35634818230237764
Epoch: 18, step: 399, loss: 0.3693382143974304, mean loss: 0.3563486744981981
Epoch: 18, step: 400, loss: 0.30936381220817566, mean loss: 0.35634689429654276
Epoch: 18, step: 401, loss: 0.3146810531616211, mean loss: 0.35634531568620953
Epoch: 18, step: 402, loss: 0.32891109585762024, mean loss: 0.35634427631436527
Epoch: 18, step: 403, loss: 0.35355842113494873, mean loss: 0.35634417077355685
Epoch: 18, step: 404, loss: 0.35573315620422363, mean loss: 0.35634414762643524
Epoch: 18, step: 405, loss: 0.3713597059249878, mean loss: 0.3563447164406749
Epoch: 18, step: 406, loss: 0.35595962405204773, mean loss: 0.3563447018532894
Epoch: 18, step: 407, loss: 0.3396826684474945, mean loss: 0.35634407071566043
Epoch: 18, step: 408, loss: 0.33845075964927673, mean loss: 0.3563433929643985
Epoch: 18, step: 409, loss: 0.3267407715320587, mean loss: 0.356342271737922
Epoch: 18, step: 410, loss: 0.35143154859542847, mean loss: 0.3563420857468171
Epoch: 18, step: 411, loss: 0.33763307332992554, mean loss: 0.356341377179463
Epoch: 18, step: 412, loss: 0.34362444281578064, mean loss: 0.356340895568618
Epoch: 18, step: 413, loss: 0.3133911192417145, mean loss: 0.3563392690528137
Epoch: 18, step: 414, loss: 0.337881863117218, mean loss: 0.35633857009397946
Epoch: 18, step: 415, loss: 0.33516862988471985, mean loss: 0.35633776844522874
Epoch: 18, step: 416, loss: 0.3812817335128784, mean loss: 0.35633871297039316
Epoch: 18, step: 417, loss: 0.32991957664489746, mean loss: 0.35633771262445124
Epoch: 18, step: 418, loss: 0.32245615124702454, mean loss: 0.356336429766499
Epoch: 18, step: 419, loss: 0.32824328541755676, mean loss: 0.356335366115721
Epoch: 18, step: 420, loss: 0.34701207280158997, mean loss: 0.35633501313448773
Epoch: 18, step: 421, loss: 0.3232116103172302, mean loss: 0.35633375912514353
Epoch: 18, step: 422, loss: 0.31414711475372314, mean loss: 0.35633216205361706
Epoch: 18, step: 423, loss: 0.3088250756263733, mean loss: 0.3563303636327196
Epoch: 18, step: 424, loss: 0.3665558695793152, mean loss: 0.3563307507132339
Epoch: 18, step: 425, loss: 0.3078903257846832, mean loss: 0.3563289170988449
Epoch: 18, step: 426, loss: 0.3406386077404022, mean loss: 0.35632832319637475
Epoch: 18, step: 427, loss: 0.3605897128582001, mean loss: 0.35632848449045734
Epoch: 18, step: 428, loss: 0.3542892634868622, mean loss: 0.35632840730863213
Epoch: 18, step: 429, loss: 0.3454549312591553, mean loss: 0.356327995777482
Epoch: 18, step: 430, loss: 0.34282737970352173, mean loss: 0.3563274848356482
Epoch: 18, step: 431, loss: 0.335195928812027, mean loss: 0.35632668512492977
Epoch: 18, step: 432, loss: 0.34466394782066345, mean loss: 0.3563262437725247
Epoch: 18, step: 433, loss: 0.34206756949424744, mean loss: 0.3563257042026209
Epoch: 18, step: 434, loss: 0.3433111608028412, mean loss: 0.3563252117311561
Epoch: 18, step: 435, loss: 0.35549646615982056, mean loss: 0.3563251803725376
Epoch: 18, step: 436, loss: 0.38578829169273376, mean loss: 0.356326295174888
Epoch: 18, step: 437, loss: 0.3429437577724457, mean loss: 0.3563257888359776
Epoch: 18, step: 438, loss: 0.3285399377346039, mean loss: 0.3563247375760517
Epoch: 18, step: 439, loss: 0.31045740842819214, mean loss: 0.35632300228060876
Epoch: 18, step: 440, loss: 0.3262867033481598, mean loss: 0.35632186596241056
Epoch: 18, step: 441, loss: 0.37874314188957214, mean loss: 0.3563227141607887
Epoch: 18, step: 442, loss: 0.32041844725608826, mean loss: 0.35632135595133513
Epoch: 18, step: 443, loss: 0.32663702964782715, mean loss: 0.35632023307622906
Epoch: 18, step: 444, loss: 0.3232872486114502, mean loss: 0.35631898357800823
Epoch: 18, step: 445, loss: 0.36974549293518066, mean loss: 0.3563194914269135
Epoch: 18, step: 446, loss: 0.337199866771698, mean loss: 0.35631876826701125
Epoch: 18, step: 447, loss: 0.30600032210350037, mean loss: 0.35631686514877514
Epoch: 18, step: 448, loss: 0.3438456058502197, mean loss: 0.3563163934850976
Epoch: 18, step: 449, loss: 0.3068534731864929, mean loss: 0.35631452286561727
Epoch: 18, step: 450, loss: 0.3534165322780609, mean loss: 0.3563144132717517
Epoch: 18, step: 451, loss: 0.33347880840301514, mean loss: 0.35631354972596174
Epoch: 18, step: 452, loss: 0.33859726786613464, mean loss: 0.3563128797966042
Epoch: 18, step: 453, loss: 0.32475611567497253, mean loss: 0.35631168654378254
Epoch: 18, step: 454, loss: 0.3182535767555237, mean loss: 0.3563102475106299
Epoch: 18, step: 455, loss: 0.2914460003376007, mean loss: 0.3563077949906975
Epoch: 18, step: 456, loss: 0.34367337822914124, mean loss: 0.3563073173009262
Epoch: 18, step: 457, loss: 0.3531339168548584, mean loss: 0.3563071973235936
Epoch: 18, step: 458, loss: 0.33061620593070984, mean loss: 0.3563062260562921
Epoch: 18, step: 459, loss: 0.33409765362739563, mean loss: 0.3563053864762063
Epoch: 18, step: 460, loss: 0.3262467682361603, mean loss: 0.356304250173396
Epoch: 18, step: 461, loss: 0.29968369007110596, mean loss: 0.35630210983317895
Epoch: 18, step: 462, loss: 0.31963804364204407, mean loss: 0.35630072393009105
Epoch: 18, step: 463, loss: 0.30252915620803833, mean loss: 0.3562986914396268
Epoch: 18, step: 464, loss: 0.354247510433197, mean loss: 0.3562986139107684
Epoch: 18, step: 465, loss: 0.3383699059486389, mean loss: 0.3562979362817729
Epoch: 18, step: 466, loss: 0.3175090551376343, mean loss: 0.3562964702822588
Epoch: 18, step: 467, loss: 0.3796848952770233, mean loss: 0.35629735419854736
Epoch: 18, step: 468, loss: 0.33988329768180847, mean loss: 0.3562967338872773
Epoch: 18, step: 469, loss: 0.29806604981422424, mean loss: 0.3562945333474816
Epoch: 18, step: 470, loss: 0.303608775138855, mean loss: 0.3562925424258851
Epoch: 18, step: 471, loss: 0.34241974353790283, mean loss: 0.3562920182119005
Epoch: 18, step: 472, loss: 0.3622508645057678, mean loss: 0.35629224337140525
Epoch: 18, step: 473, loss: 0.37312638759613037, mean loss: 0.3562928794382164
Epoch: 18, step: 474, loss: 0.32430049777030945, mean loss: 0.3562916706732764
Epoch: 18, step: 475, loss: 0.3404034674167633, mean loss: 0.35629107039357044
Epoch: 18, step: 476, loss: 0.323550283908844, mean loss: 0.35628983344519743
Epoch: 18, step: 477, loss: 0.30910032987594604, mean loss: 0.3562880506910014
Epoch: 18, step: 478, loss: 0.3485989570617676, mean loss: 0.3562877602186494
Epoch: 18, step: 479, loss: 0.3353392481803894, mean loss: 0.35628696887262196
Epoch: 18, step: 480, loss: 0.31917309761047363, mean loss: 0.35628556692077434
Epoch: 18, step: 481, loss: 0.3706326186656952, mean loss: 0.3562861088506582
Epoch: 18, step: 482, loss: 0.3061144948005676, mean loss: 0.35628421379441455
Epoch: 18, step: 483, loss: 0.33034560084342957, mean loss: 0.35628323409155344
Epoch: 18, step: 484, loss: 0.31992870569229126, mean loss: 0.3562818610308442
Epoch: 18, step: 485, loss: 0.31362923979759216, mean loss: 0.35628025016064124
Epoch: 18, step: 486, loss: 0.3061222434043884, mean loss: 0.3562783559045607
Epoch: 18, step: 487, loss: 0.3075101673603058, mean loss: 0.3562765142055975
Epoch: 18, step: 488, loss: 0.30326738953590393, mean loss: 0.3562745124260322
Epoch: 18, step: 489, loss: 0.34801653027534485, mean loss: 0.3562742005922526
Epoch: 18, step: 490, loss: 0.3399883806705475, mean loss: 0.3562735856385117
Epoch: 18, step: 491, loss: 0.336008757352829, mean loss: 0.3562728204660194
Epoch: 18, step: 492, loss: 0.34309589862823486, mean loss: 0.35627232294206856
Epoch: 18, step: 493, loss: 0.336421400308609, mean loss: 0.35627157345469285
Epoch: 18, step: 494, loss: 0.3222048878669739, mean loss: 0.3562702872884382
Epoch: 18, step: 495, loss: 0.3561176359653473, mean loss: 0.35627028152540124
Epoch: 18, step: 496, loss: 0.3184967637062073, mean loss: 0.35626885551770676
Epoch: 18, step: 497, loss: 0.30234789848327637, mean loss: 0.3562668199964899
Epoch: 18, step: 498, loss: 0.3702136278152466, mean loss: 0.35626734646992686
Epoch: 18, step: 499, loss: 0.326933890581131, mean loss: 0.3562662392127968
Epoch: 18, step: 500, loss: 0.3178825080394745, mean loss: 0.35626479038740244
Epoch: 18, step: 501, loss: 0.34921208024024963, mean loss: 0.3562645241871251
Epoch: 18, step: 502, loss: 0.31744006276130676, mean loss: 0.35626305883662784
Epoch: 18, step: 503, loss: 0.31887903809547424, mean loss: 0.3562616479058934
Epoch: 18, step: 504, loss: 0.3021180331707001, mean loss: 0.35625960451929356
Epoch: 18, step: 505, loss: 0.3465365469455719, mean loss: 0.3562592375837673
Epoch: 18, step: 506, loss: 0.33891433477401733, mean loss: 0.35625858303443303
Epoch: 18, step: 507, loss: 0.3143884539604187, mean loss: 0.3562570030295623
Epoch: 18, step: 508, loss: 0.3322741687297821, mean loss: 0.35625609805109737
Epoch: 18, step: 509, loss: 0.3444689214229584, mean loss: 0.35625565328554654
Epoch: 18, step: 510, loss: 0.3240694999694824, mean loss: 0.35625443885120645
Epoch: 18, step: 511, loss: 0.3448227643966675, mean loss: 0.3562540075323695
Epoch: 18, step: 512, loss: 0.3434910476207733, mean loss: 0.35625352600209553
Epoch: 18, step: 513, loss: 0.3345053791999817, mean loss: 0.3562527055030839
Epoch: 18, step: 514, loss: 0.3560642898082733, mean loss: 0.35625269839493534
Epoch: 18, step: 515, loss: 0.33358538150787354, mean loss: 0.3562518432826339
Epoch: 18, step: 516, loss: 0.35494235157966614, mean loss: 0.3562517938846293
Epoch: 18, step: 517, loss: 0.33024877309799194, mean loss: 0.35625081300870376
Epoch: 18, step: 518, loss: 0.3336855173110962, mean loss: 0.3562499618414261
Epoch: 18, step: 519, loss: 0.34508606791496277, mean loss: 0.3562495407530915
Epoch: 18, step: 520, loss: 0.37612906098365784, mean loss: 0.3562502905558385
Epoch: 18, step: 521, loss: 0.34512022137641907, mean loss: 0.356249870774999
Epoch: 18, step: 522, loss: 0.31275734305381775, mean loss: 0.35624823047600895
Epoch: 18, step: 523, loss: 0.3306821584701538, mean loss: 0.35624726630071835
Epoch: 18, step: 524, loss: 0.32268840074539185, mean loss: 0.35624600074030216
Epoch: 18, step: 525, loss: 0.3161586821079254, mean loss: 0.35624448903811373
Epoch: 18, step: 526, loss: 0.3164253830909729, mean loss: 0.3562429875069117
Epoch: 18, step: 527, loss: 0.35288625955581665, mean loss: 0.3562428609334595
Epoch: 18, step: 528, loss: 0.3364061117172241, mean loss: 0.3562421129696114
Epoch: 18, step: 529, loss: 0.33951088786125183, mean loss: 0.3562414821263451
Epoch: 18, step: 530, loss: 0.35494109988212585, mean loss: 0.35624143309787004
Epoch: 18, step: 531, loss: 0.3327910304069519, mean loss: 0.3562405489777264
Epoch: 18, step: 532, loss: 0.3683535158634186, mean loss: 0.35624100564000294
Epoch: 18, step: 533, loss: 0.35897722840309143, mean loss: 0.3562411087924859
Epoch: 18, step: 534, loss: 0.3648497462272644, mean loss: 0.35624143331608205
Epoch: 18, step: 535, loss: 0.3289305865764618, mean loss: 0.35624040380587624
Epoch: 18, step: 536, loss: 0.357492595911026, mean loss: 0.3562404510067547
Epoch: 18, step: 537, loss: 0.36714687943458557, mean loss: 0.35624086210469774
Epoch: 18, step: 538, loss: 0.32343265414237976, mean loss: 0.35623962550570176
Epoch: 18, step: 539, loss: 0.33678773045539856, mean loss: 0.35623889235723766
Epoch: 18, step: 540, loss: 0.41264986991882324, mean loss: 0.35624101842581496
Epoch: 18, step: 541, loss: 0.31885722279548645, mean loss: 0.35623960952419326
Epoch: 18, step: 542, loss: 0.3815280497074127, mean loss: 0.35624056254624653
Epoch: 18, step: 543, loss: 0.2853895127773285, mean loss: 0.35623789254889315
Epoch: 18, step: 544, loss: 0.32658112049102783, mean loss: 0.35623677498579037
Epoch: 18, step: 545, loss: 0.3615436255931854, mean loss: 0.3562369749575519
Epoch: 18, step: 546, loss: 0.34025007486343384, mean loss: 0.3562363725648433
Epoch: 18, step: 547, loss: 0.3340774476528168, mean loss: 0.3562355376392626
Epoch: 18, step: 548, loss: 0.3154808282852173, mean loss: 0.3562340021014398
Epoch: 18, step: 549, loss: 0.34306600689888, mean loss: 0.35623350598226255
Epoch: 18, step: 550, loss: 0.38704097270965576, mean loss: 0.35623466664483755
Epoch: 18, step: 551, loss: 0.30286985635757446, mean loss: 0.3562326562164813
Epoch: 18, step: 552, loss: 0.32330188155174255, mean loss: 0.35623141565235755
Epoch: 18, step: 553, loss: 0.36116790771484375, mean loss: 0.3562316016122785
Epoch: 18, step: 554, loss: 0.3225433826446533, mean loss: 0.3562303326094169
Epoch: 18, step: 555, loss: 0.3719092309474945, mean loss: 0.3562309231962158
Epoch: 18, step: 556, loss: 0.31289997696876526, mean loss: 0.3562292910840373
Epoch: 18, step: 557, loss: 0.3120722472667694, mean loss: 0.3562276279185451
Epoch: 18, step: 558, loss: 0.3291826546192169, mean loss: 0.35622660931384853
Epoch: 18, step: 559, loss: 0.32930293679237366, mean loss: 0.35622559531593795
Epoch: 18, step: 560, loss: 0.3531824052333832, mean loss: 0.35622548070779264
Epoch: 18, step: 561, loss: 0.36822277307510376, mean loss: 0.35622593251514245
Epoch: 18, step: 562, loss: 0.31856679916381836, mean loss: 0.3562245143591134
Epoch: 18, step: 563, loss: 0.326850026845932, mean loss: 0.3562234082253766
Epoch: 18, step: 564, loss: 0.29800131916999817, mean loss: 0.3562212158810209
Epoch: 18, step: 565, loss: 0.30171701312065125, mean loss: 0.35621916361041467
Epoch: 18, step: 566, loss: 0.3479595482349396, mean loss: 0.3562188526192111
Epoch: 18, step: 567, loss: 0.3324669301509857, mean loss: 0.3562179583450218
Epoch: 18, step: 568, loss: 0.34614503383636475, mean loss: 0.3562175791076245
Epoch: 18, step: 569, loss: 0.32161861658096313, mean loss: 0.356216276533928
Epoch: 18, step: 570, loss: 0.3523659408092499, mean loss: 0.356216131582841
Epoch: 18, step: 571, loss: 0.3337002694606781, mean loss: 0.35621528397472013
Epoch: 18, step: 572, loss: 0.3353829085826874, mean loss: 0.3562144997708657
Epoch: 18, step: 573, loss: 0.39167049527168274, mean loss: 0.35621583440895577
Epoch: 18, step: 574, loss: 0.3268934190273285, mean loss: 0.3562147306932415
Epoch: 18, step: 575, loss: 0.34778547286987305, mean loss: 0.35621441342217014
Epoch: 18, step: 576, loss: 0.3464567959308624, mean loss: 0.3562140461664401
Epoch: 18, step: 577, loss: 0.30063945055007935, mean loss: 0.35621195453694754
Epoch: 18, step: 578, loss: 0.2970355749130249, mean loss: 0.35620972743297613
Epoch: 18, step: 579, loss: 0.3463612496852875, mean loss: 0.3562093567993111
Epoch: 18, step: 580, loss: 0.32994771003723145, mean loss: 0.3562083685162131
Epoch: 18, step: 581, loss: 0.3138507604598999, mean loss: 0.3562067745669373
Epoch: 18, step: 582, loss: 0.32530808448791504, mean loss: 0.3562056118692861
Epoch: 18, step: 583, loss: 0.32913947105407715, mean loss: 0.3562045934262994
Epoch: 18, step: 584, loss: 0.36935704946517944, mean loss: 0.3562050883074387
Epoch: 18, step: 585, loss: 0.36544299125671387, mean loss: 0.356205435884493
Epoch: 18, step: 586, loss: 0.33465978503227234, mean loss: 0.3562046252576503
Epoch: 18, step: 587, loss: 0.31550705432891846, mean loss: 0.3562030941225514
Epoch: 18, step: 588, loss: 0.3519134819507599, mean loss: 0.3562029327436653
Epoch: 18, step: 589, loss: 0.35293468832969666, mean loss: 0.35620280979413504
Epoch: 18, step: 590, loss: 0.35859179496765137, mean loss: 0.35620289966304275
Epoch: 18, step: 591, loss: 0.38836297392845154, mean loss: 0.35620410941606206
Epoch: 18, step: 592, loss: 0.33849528431892395, mean loss: 0.35620344329512554
Epoch: 18, step: 593, loss: 0.3171856701374054, mean loss: 0.356201975689124
Epoch: 18, step: 594, loss: 0.3819655776023865, mean loss: 0.356202944719173
Epoch: 18, step: 595, loss: 0.32472801208496094, mean loss: 0.3562017609169828
Epoch: 18, step: 596, loss: 0.35031911730766296, mean loss: 0.35620153967347573
Epoch: 18, step: 597, loss: 0.37217092514038086, mean loss: 0.3562021402520943
Epoch: 18, step: 598, loss: 0.31973350048065186, mean loss: 0.3562007687865694
Epoch: 18, step: 599, loss: 0.3661956787109375, mean loss: 0.3562011446481039
Epoch: 18, step: 600, loss: 0.36427733302116394, mean loss: 0.35620144834412815
Epoch: 18, step: 601, loss: 0.34134429693222046, mean loss: 0.3562008896785866
Epoch: 18, step: 602, loss: 0.36021390557289124, mean loss: 0.35620104057220925
Epoch: 18, step: 603, loss: 0.2800193428993225, mean loss: 0.356198176167875
Epoch: 18, step: 604, loss: 0.3846951723098755, mean loss: 0.35619924760435817
Epoch: 18, step: 605, loss: 0.3282718062400818, mean loss: 0.35619819762160143
Epoch: 18, step: 606, loss: 0.3739126920700073, mean loss: 0.3561988636050763
Epoch: 18, step: 607, loss: 0.3656553030014038, mean loss: 0.35619921911031677
Epoch: 18, step: 608, loss: 0.3018707036972046, mean loss: 0.3561971767617053
Epoch: 18, step: 609, loss: 0.3310031294822693, mean loss: 0.3561962296882793
Epoch: 18, step: 610, loss: 0.29424604773521423, mean loss: 0.35619390099670495
Epoch: 18, step: 611, loss: 0.3261553943157196, mean loss: 0.3561927718993256
Epoch: 18, step: 612, loss: 0.36881694197654724, mean loss: 0.3561932464029932
Epoch: 18, step: 613, loss: 0.31266653537750244, mean loss: 0.35619161042949005
Epoch: 18, step: 614, loss: 0.355647474527359, mean loss: 0.3561915899786349
Epoch: 18, step: 615, loss: 0.3581550121307373, mean loss: 0.3561916637693051
Epoch: 18, step: 616, loss: 0.4124349355697632, mean loss: 0.35619377746285996
Epoch: 18, step: 617, loss: 0.31521135568618774, mean loss: 0.356192237349302
Epoch: 18, step: 618, loss: 0.3482288122177124, mean loss: 0.35619193809616867
Epoch: 18, step: 619, loss: 0.34002628922462463, mean loss: 0.3561913306390489
Epoch: 18, step: 620, loss: 0.31189054250717163, mean loss: 0.35618966600942686
Epoch: 18, step: 621, loss: 0.31547656655311584, mean loss: 0.3561881362469163
Epoch: 18, step: 622, loss: 0.35857638716697693, mean loss: 0.356188225980184
Epoch: 18, step: 623, loss: 0.31722694635391235, mean loss: 0.35618676215092243
Epoch: 18, step: 624, loss: 0.29941651225090027, mean loss: 0.3561846292941054
Epoch: 18, step: 625, loss: 0.334684282541275, mean loss: 0.3561838215569819
Epoch: 18, step: 626, loss: 0.3583548069000244, mean loss: 0.3561839031147167
Epoch: 18, step: 627, loss: 0.2897336483001709, mean loss: 0.3561814068617184
Epoch: 18, step: 628, loss: 0.3321102559566498, mean loss: 0.3561805026450885
Epoch: 18, step: 629, loss: 0.32602372765541077, mean loss: 0.3561793698686258
Epoch: 18, step: 630, loss: 0.3301207423210144, mean loss: 0.3561783910673056
Epoch: 18, step: 631, loss: 0.38118746876716614, mean loss: 0.35617933041066874
Epoch: 18, step: 632, loss: 0.3393940031528473, mean loss: 0.3561786999758422
Epoch: 18, step: 633, loss: 0.3008861541748047, mean loss: 0.3561766233385027
Epoch: 18, step: 634, loss: 0.32556024193763733, mean loss: 0.356175473513836
Epoch: 18, step: 635, loss: 0.34746697545051575, mean loss: 0.35617514647094645
Epoch: 18, step: 636, loss: 0.38369494676589966, mean loss: 0.3561761799232088
Epoch: 18, step: 637, loss: 0.3481294810771942, mean loss: 0.35617587775652293
Epoch: 18, step: 638, loss: 0.3379148542881012, mean loss: 0.3561751920510117
Epoch: 18, step: 639, loss: 0.31130510568618774, mean loss: 0.356173507232509
Epoch: 18, step: 640, loss: 0.2957533597946167, mean loss: 0.3561712386128478
Epoch: 18, step: 641, loss: 0.325324684381485, mean loss: 0.35617008044831255
Epoch: 18, step: 642, loss: 0.351787805557251, mean loss: 0.3561699159176239
Epoch: 18, step: 643, loss: 0.32296445965766907, mean loss: 0.3561686692793802
Epoch: 18, step: 644, loss: 0.32181286811828613, mean loss: 0.35616737950195926
Epoch: 18, step: 645, loss: 0.31610792875289917, mean loss: 0.35616587565592167
Epoch: 18, step: 646, loss: 0.37503111362457275, mean loss: 0.35616658383708344
Epoch: 18, step: 647, loss: 0.35359111428260803, mean loss: 0.35616648716029836
Epoch: 18, step: 648, loss: 0.3501947820186615, mean loss: 0.35616626300560666
Epoch: 18, step: 649, loss: 0.3664054274559021, mean loss: 0.3561666473297734
Epoch: 18, step: 650, loss: 0.3176751136779785, mean loss: 0.35616520261507717
Epoch: 18, step: 651, loss: 0.30223390460014343, mean loss: 0.356163178470879
Epoch: 18, step: 652, loss: 0.3416711688041687, mean loss: 0.35616263457860403
Epoch: 18, step: 653, loss: 0.32159262895584106, mean loss: 0.35616133719792314
Epoch: 18, step: 654, loss: 0.33785900473594666, mean loss: 0.35616065035390837
Epoch: 18, step: 655, loss: 0.3305014669895172, mean loss: 0.3561596874605068
Epoch: 18, step: 656, loss: 0.30982524156570435, mean loss: 0.3561579487669012
Epoch: 18, step: 657, loss: 0.3224813640117645, mean loss: 0.35615668510518433
Epoch: 18, step: 658, loss: 0.30241426825523376, mean loss: 0.35615466857984385
Epoch: 18, step: 659, loss: 0.32233646512031555, mean loss: 0.35615339969932985
Epoch: 18, step: 660, loss: 0.30244824290275574, mean loss: 0.35615138472327473
Epoch: 18, step: 661, loss: 0.3307449519634247, mean loss: 0.3561504315292791
Epoch: 18, step: 662, loss: 0.30105122923851013, mean loss: 0.3561483644048263
Epoch: 18, step: 663, loss: 0.32763421535491943, mean loss: 0.35614729469635353
Epoch: 18, step: 664, loss: 0.32972437143325806, mean loss: 0.3561463034774143
Epoch: 18, step: 665, loss: 0.3098272979259491, mean loss: 0.35614456595000976
Epoch: 18, step: 666, loss: 0.332853764295578, mean loss: 0.3561436922937716
Epoch: 18, step: 667, loss: 0.34992101788520813, mean loss: 0.3561434588851291
Epoch: 18, step: 668, loss: 0.3273831307888031, mean loss: 0.3561423801435929
Epoch: 18, step: 669, loss: 0.32407599687576294, mean loss: 0.3561411774437479
Epoch: 18, step: 670, loss: 0.3252940773963928, mean loss: 0.3561400205184189
Epoch: 18, step: 671, loss: 0.3141513168811798, mean loss: 0.35613844578455917
Epoch: 18, step: 672, loss: 0.32782307267189026, mean loss: 0.35613738389169913
Epoch: 18, step: 673, loss: 0.33640891313552856, mean loss: 0.3561366440555499
Epoch: 18, step: 674, loss: 0.3274734318256378, mean loss: 0.356135569198527
Epoch: 18, step: 675, loss: 0.3673887848854065, mean loss: 0.35613599117301653
Epoch: 18, step: 676, loss: 0.34007886052131653, mean loss: 0.35613538908329995
Epoch: 18, step: 677, loss: 0.3081570565700531, mean loss: 0.356133590120701
Epoch: 18, step: 678, loss: 0.33286193013191223, mean loss: 0.35613271757524007
Epoch: 18, step: 679, loss: 0.3362845480442047, mean loss: 0.35613197341771413
Epoch: 18, step: 680, loss: 0.32770678400993347, mean loss: 0.3561309077262131
Epoch: 18, step: 681, loss: 0.3363131880760193, mean loss: 0.35613016476604026
Epoch: 18, step: 682, loss: 0.3446158766746521, mean loss: 0.35612973311512774
Epoch: 18, step: 683, loss: 0.36653393507003784, mean loss: 0.3561301231361937
Epoch: 18, step: 684, loss: 0.32736822962760925, mean loss: 0.3561290449829715
Epoch: 18, step: 685, loss: 0.3173118233680725, mean loss: 0.3561275899555476
Epoch: 18, step: 686, loss: 0.37772488594055176, mean loss: 0.3561283994797421
Epoch: 18, step: 687, loss: 0.335214227437973, mean loss: 0.3561276155902353
Epoch: 18, step: 688, loss: 0.3601694703102112, mean loss: 0.35612776707836247
Epoch: 18, step: 689, loss: 0.33644065260887146, mean loss: 0.35612702923582934
Epoch: 18, step: 690, loss: 0.2751387655735016, mean loss: 0.3561239940350025
Epoch: 18, step: 691, loss: 0.31116026639938354, mean loss: 0.3561223089904951
Epoch: 18, step: 692, loss: 0.3221821188926697, mean loss: 0.35612103710778575
Epoch: 18, step: 693, loss: 0.3370913565158844, mean loss: 0.3561203240117582
Epoch: 18, step: 694, loss: 0.3121163547039032, mean loss: 0.35611867512018897
Epoch: 18, step: 695, loss: 0.3965378403663635, mean loss: 0.35612018962728004
Epoch: 18, step: 696, loss: 0.3242799639701843, mean loss: 0.3561189966179632
Epoch: 18, step: 697, loss: 0.31657323241233826, mean loss: 0.3561175149482665
Epoch: 18, step: 698, loss: 0.3033751845359802, mean loss: 0.35611553891400727
Epoch: 18, step: 699, loss: 0.3369223177433014, mean loss: 0.35611481985132293
Epoch: 18, step: 700, loss: 0.31576746702194214, mean loss: 0.35611330831823074
Epoch: 18, step: 701, loss: 0.29828688502311707, mean loss: 0.3561111420477844
Epoch: 18, step: 702, loss: 0.32152849435806274, mean loss: 0.35610984657493594
Epoch: 18, step: 703, loss: 0.35711660981178284, mean loss: 0.35610988428707396
Epoch: 18, step: 704, loss: 0.3059408962726593, mean loss: 0.3561080050876128
Epoch: 18, step: 705, loss: 0.374783992767334, mean loss: 0.3561087046152059
Epoch: 18, step: 706, loss: 0.3369008004665375, mean loss: 0.35610798519110204
Epoch: 18, step: 707, loss: 0.3348322808742523, mean loss: 0.35610718834824373
Epoch: 18, step: 708, loss: 0.3563518524169922, mean loss: 0.35610719751134884
Epoch: 18, step: 709, loss: 0.34145358204841614, mean loss: 0.35610664872790704
Epoch: 18, step: 710, loss: 0.356252521276474, mean loss: 0.3561066541906846
Epoch: 18, step: 711, loss: 0.3257043957710266, mean loss: 0.35610551569988097
Epoch: 18, step: 712, loss: 0.38218191266059875, mean loss: 0.356106492161104
Epoch: 18, step: 713, loss: 0.3271729648113251, mean loss: 0.35610540875185703
Epoch: 18, step: 714, loss: 0.35295143723487854, mean loss: 0.3561052906565443
Epoch: 18, step: 715, loss: 0.37744832038879395, mean loss: 0.35610608978151553
Epoch: 18, step: 716, loss: 0.3222525417804718, mean loss: 0.35610482228561524
Epoch: 18, step: 717, loss: 0.3084472417831421, mean loss: 0.35610303802576865
Epoch: 18, step: 718, loss: 0.3401802182197571, mean loss: 0.3561024419110666
Epoch: 18, step: 719, loss: 0.3547140061855316, mean loss: 0.35610238993308946
Epoch: 18, step: 720, loss: 0.3441658318042755, mean loss: 0.35610194308855203
Epoch: 18, step: 721, loss: 0.32789769768714905, mean loss: 0.3561008873033682
Epoch: 18, step: 722, loss: 0.32029977440834045, mean loss: 0.35609954719058906
Epoch: 18, step: 723, loss: 0.3270854353904724, mean loss: 0.3560984611705337
Epoch: 18, step: 724, loss: 0.3491753041744232, mean loss: 0.35609820204125286
Epoch: 18, step: 725, loss: 0.32832375168800354, mean loss: 0.3560971625004806
Epoch: 18, step: 726, loss: 0.3351035416126251, mean loss: 0.3560963767816705
Epoch: 18, step: 727, loss: 0.32949692010879517, mean loss: 0.35609538129302254
Epoch: 18, step: 728, loss: 0.33730003237724304, mean loss: 0.35609467790060023
Epoch: 18, step: 729, loss: 0.3478541374206543, mean loss: 0.3560943695202215
Epoch: 18, step: 730, loss: 0.3060873746871948, mean loss: 0.3560924982110559
Epoch: 18, step: 731, loss: 0.34023618698120117, mean loss: 0.35609190487505715
Epoch: 18, step: 732, loss: 0.33418604731559753, mean loss: 0.3560910851984413
Epoch: 18, step: 733, loss: 0.31363624334335327, mean loss: 0.35608949667633344
Epoch: 18, step: 734, loss: 0.30351492762565613, mean loss: 0.35608752958054823
Epoch: 18, step: 735, loss: 0.30934223532676697, mean loss: 0.35608578065454355
Epoch: 18, step: 736, loss: 0.30682310461997986, mean loss: 0.3560839376123035
Epoch: 18, step: 737, loss: 0.34779229760169983, mean loss: 0.3560836274125276
Epoch: 18, step: 738, loss: 0.30437010526657104, mean loss: 0.3560816928226452
Epoch: 18, step: 739, loss: 0.3415127396583557, mean loss: 0.3560811478221527
Epoch: 18, step: 740, loss: 0.3322622776031494, mean loss: 0.35608025683086036
Epoch: 18, step: 741, loss: 0.3400450348854065, mean loss: 0.35607965702454836
Epoch: 18, step: 742, loss: 0.29876241087913513, mean loss: 0.35607751312156927
Epoch: 18, step: 743, loss: 0.346028596162796, mean loss: 0.3560771372644119
Epoch: 18, step: 744, loss: 0.32596340775489807, mean loss: 0.3560760109701564
Epoch: 18, step: 745, loss: 0.3361913561820984, mean loss: 0.35607526728495975
Epoch: 18, step: 746, loss: 0.32631149888038635, mean loss: 0.35607415416298793
Epoch: 18, step: 747, loss: 0.3298349380493164, mean loss: 0.356073172890882
Epoch: 18, step: 748, loss: 0.37059566378593445, mean loss: 0.35607371597045623
Epoch: 18, step: 749, loss: 0.29854851961135864, mean loss: 0.35607156485250097
Epoch: 18, step: 750, loss: 0.3735545873641968, mean loss: 0.35607221859450866
Epoch: 18, step: 751, loss: 0.3558112680912018, mean loss: 0.3560722088371611
Epoch: 18, step: 752, loss: 0.37331435084342957, mean loss: 0.3560728535237196
Epoch: 18, step: 753, loss: 0.3242577314376831, mean loss: 0.35607166399548784
Epoch: 18, step: 754, loss: 0.3528918921947479, mean loss: 0.35607154511218125
Epoch: 18, step: 755, loss: 0.33541613817214966, mean loss: 0.35607077288969957
Epoch: 18, step: 756, loss: 0.32114753127098083, mean loss: 0.3560694672991497
Epoch: 18, step: 757, loss: 0.33280280232429504, mean loss: 0.3560685975172815
Epoch: 18, step: 758, loss: 0.314093679189682, mean loss: 0.356067028420114
Epoch: 18, step: 759, loss: 0.3225193917751312, mean loss: 0.356065774396615
Epoch: 18, step: 760, loss: 0.34665581583976746, mean loss: 0.35606542266191027
Epoch: 18, step: 761, loss: 0.3243314027786255, mean loss: 0.35606423652077684
Epoch: 18, step: 762, loss: 0.330733060836792, mean loss: 0.35606328973790696
Epoch: 18, step: 763, loss: 0.34623944759368896, mean loss: 0.3560629225738262
Epoch: 18, step: 764, loss: 0.31492990255355835, mean loss: 0.3560613852931139
Epoch: 18, step: 765, loss: 0.3366478979587555, mean loss: 0.3560606597722478
Epoch: 18, step: 766, loss: 0.324429988861084, mean loss: 0.356059477714962
Epoch: 18, step: 767, loss: 0.3249526619911194, mean loss: 0.35605831527790205
Epoch: 18, step: 768, loss: 0.3032723665237427, mean loss: 0.3560563427825262
Epoch: 18, step: 769, loss: 0.3561854064464569, mean loss: 0.35605634760517263
Epoch: 18, step: 770, loss: 0.32795894145965576, mean loss: 0.35605529774506184
Epoch: 18, step: 771, loss: 0.3073336184024811, mean loss: 0.35605347732661385
Epoch: 18, step: 772, loss: 0.33712565898895264, mean loss: 0.3560527701411725
Epoch: 18, step: 773, loss: 0.3266911804676056, mean loss: 0.3560516731677856
Epoch: 18, step: 774, loss: 0.36466458439826965, mean loss: 0.3560519949412839
Epoch: 18, step: 775, loss: 0.35792553424835205, mean loss: 0.35605206493303926
Epoch: 18, step: 776, loss: 0.36461079120635986, mean loss: 0.3560523846583287
Epoch: 18, step: 777, loss: 0.31870806217193604, mean loss: 0.3560509896518855
Epoch: 18, step: 778, loss: 0.3369556665420532, mean loss: 0.3560502763679921
Epoch: 18, step: 779, loss: 0.34359046816825867, mean loss: 0.3560498109635322
Epoch: 18, step: 780, loss: 0.3221743106842041, mean loss: 0.3560485456775994
Epoch: 18, step: 781, loss: 0.32232189178466797, mean loss: 0.35604728599828767
Epoch: 18, step: 782, loss: 0.35868242383003235, mean loss: 0.35604738441613387
Epoch: 18, step: 783, loss: 0.3300516903400421, mean loss: 0.3560464135581239
Epoch: 18, step: 784, loss: 0.34671109914779663, mean loss: 0.3560460649262977
Epoch: 18, step: 785, loss: 0.368883341550827, mean loss: 0.35604654432269117
Epoch: 18, step: 786, loss: 0.32869240641593933, mean loss: 0.35604552284549235
Epoch: 18, step: 787, loss: 0.33690834045410156, mean loss: 0.35604480823823353
Epoch: 18, step: 788, loss: 0.33477500081062317, mean loss: 0.3560440140256415
Epoch: 18, step: 789, loss: 0.3336924612522125, mean loss: 0.35604317945194375
Epoch: 18, step: 790, loss: 0.3186993896961212, mean loss: 0.35604178514250284
Epoch: 18, step: 791, loss: 0.32955387234687805, mean loss: 0.35604079619713264
Epoch: 18, step: 792, loss: 0.32138147950172424, mean loss: 0.3560395022148031
Epoch: 18, step: 793, loss: 0.32111138105392456, mean loss: 0.35603819824552213
Epoch: 18, step: 794, loss: 0.3740384578704834, mean loss: 0.3560388702229599
Epoch: 18, step: 795, loss: 0.35187336802482605, mean loss: 0.35603871472414705
Epoch: 18, step: 796, loss: 0.2897054851055145, mean loss: 0.3560362385873141
Epoch: 18, step: 797, loss: 0.36581388115882874, mean loss: 0.35603660356090766
Epoch: 18, step: 798, loss: 0.3156309127807617, mean loss: 0.3560350953793997
Epoch: 18, step: 799, loss: 0.3443339467048645, mean loss: 0.35603465863900424
Epoch: 18, step: 800, loss: 0.34742817282676697, mean loss: 0.3560343374175728
Epoch: 18, step: 801, loss: 0.3021596670150757, mean loss: 0.35603232671852064
Epoch: 18, step: 802, loss: 0.3693926930427551, mean loss: 0.35603282533267716
Epoch: 18, step: 803, loss: 0.29092833399772644, mean loss: 0.3560303956979804
Epoch: 18, step: 804, loss: 0.32527974247932434, mean loss: 0.3560292481570908
Epoch: 18, step: 805, loss: 0.3276748061180115, mean loss: 0.35602819007656095
Epoch: 18, step: 806, loss: 0.3428259491920471, mean loss: 0.3560276974372504
Epoch: 18, step: 807, loss: 0.3508211672306061, mean loss: 0.3560275031637352
Epoch: 18, step: 808, loss: 0.33260083198547363, mean loss: 0.3560266290668292
Epoch: 18, step: 809, loss: 0.31132426857948303, mean loss: 0.35602496119277177
Epoch: 18, step: 810, loss: 0.3685242831707001, mean loss: 0.3560254275331806
Epoch: 18, step: 811, loss: 0.334391713142395, mean loss: 0.35602462042549554
Epoch: 18, step: 812, loss: 0.3145108222961426, mean loss: 0.35602307169212005
Epoch: 18, step: 813, loss: 0.3048001229763031, mean loss: 0.3560211608158716
Epoch: 18, step: 814, loss: 0.30686885118484497, mean loss: 0.35601932725338303
Epoch: 18, step: 815, loss: 0.3435434401035309, mean loss: 0.35601886187412496
Epoch: 18, step: 816, loss: 0.35136494040489197, mean loss: 0.3560186882786358
Epoch: 18, step: 817, loss: 0.35435745120048523, mean loss: 0.3560186263152983
Epoch: 18, step: 818, loss: 0.34070396423339844, mean loss: 0.3560180551071344
Epoch: 18, step: 819, loss: 0.29316115379333496, mean loss: 0.3560157107500811
Epoch: 18, step: 820, loss: 0.32467222213745117, mean loss: 0.3560145417839597
Epoch: 18, step: 821, loss: 0.3081016540527344, mean loss: 0.35601275492307616
Epoch: 18, step: 822, loss: 0.3324575126171112, mean loss: 0.356011876487786
Epoch: 18, step: 823, loss: 0.31391724944114685, mean loss: 0.3560103067299158
Epoch: 18, step: 824, loss: 0.31915944814682007, mean loss: 0.356008932569548
Epoch: 18, step: 825, loss: 0.3371431231498718, mean loss: 0.356008229093919
Epoch: 18, step: 826, loss: 0.38876697421073914, mean loss: 0.3560094505691834
Epoch: 18, step: 827, loss: 0.36015933752059937, mean loss: 0.3560096053002405
Epoch: 18, step: 828, loss: 0.34034258127212524, mean loss: 0.35600902116750766
Epoch: 18, step: 829, loss: 0.33974406123161316, mean loss: 0.35600841476381156
Epoch: 18, step: 830, loss: 0.3031720221042633, mean loss: 0.35600644494713707
Epoch: 18, step: 831, loss: 0.33878493309020996, mean loss: 0.35600580292835327
Epoch: 18, step: 832, loss: 0.3274393677711487, mean loss: 0.35600473800998766
Epoch: 18, step: 833, loss: 0.3817235231399536, mean loss: 0.3560056967360419
Epoch: 18, step: 834, loss: 0.35404351353645325, mean loss: 0.3560056235939388
Epoch: 18, step: 835, loss: 0.3195042908191681, mean loss: 0.3560042630253994
Epoch: 18, step: 836, loss: 0.38274818658828735, mean loss: 0.35600525985433684
Epoch: 18, step: 837, loss: 0.30874475836753845, mean loss: 0.3560034983745945
Epoch: 18, step: 838, loss: 0.3047967255115509, mean loss: 0.3560015898816996
Epoch: 18, step: 839, loss: 0.32021233439445496, mean loss: 0.35600025605434843
Epoch: 18, step: 840, loss: 0.29735344648361206, mean loss: 0.3559980704318101
Epoch: 18, step: 841, loss: 0.3574841320514679, mean loss: 0.35599812581161255
Epoch: 18, step: 842, loss: 0.34605497121810913, mean loss: 0.3559977552822817
Epoch: 18, step: 843, loss: 0.3933615982532501, mean loss: 0.3559991475852692
Epoch: 18, step: 844, loss: 0.3913891613483429, mean loss: 0.3560004662875743
Epoch: 18, step: 845, loss: 0.3129759430885315, mean loss: 0.3559988631679976
Epoch: 18, step: 846, loss: 0.3745585083961487, mean loss: 0.3559995546857601
Epoch: 18, step: 847, loss: 0.3326590657234192, mean loss: 0.35599868506992693
Epoch: 18, step: 848, loss: 0.40400514006614685, mean loss: 0.35600047361934745
Epoch: 18, step: 849, loss: 0.33833277225494385, mean loss: 0.355999815408284
Epoch: 18, step: 850, loss: 0.3651975691318512, mean loss: 0.35600015805827556
Epoch: 18, step: 851, loss: 0.30954188108444214, mean loss: 0.35599842738188703
Epoch: 18, step: 852, loss: 0.3608510494232178, mean loss: 0.3559986081463512
Epoch: 18, step: 853, loss: 0.3222339451313019, mean loss: 0.35599735042963304
Epoch: 18, step: 854, loss: 0.3196856677532196, mean loss: 0.35599599788809483
Epoch: 18, step: 855, loss: 0.3391697108745575, mean loss: 0.3559953711640553
Epoch: 18, step: 856, loss: 0.3332161009311676, mean loss: 0.35599452274250387
Epoch: 18, step: 857, loss: 0.3617599308490753, mean loss: 0.3559947374690628
Epoch: 18, step: 858, loss: 0.3414386510848999, mean loss: 0.35599419536313065
Epoch: 18, step: 859, loss: 0.32328009605407715, mean loss: 0.3559929770516712
Epoch: 18, step: 860, loss: 0.3406658470630646, mean loss: 0.3559924062726153
Epoch: 18, step: 861, loss: 0.3475167155265808, mean loss: 0.355992090651451
Epoch: 18, step: 862, loss: 0.32093346118927, mean loss: 0.3559907851727892
Epoch: 18, step: 863, loss: 0.37298327684402466, mean loss: 0.3559914178988717
Epoch: 18, step: 864, loss: 0.3297055959701538, mean loss: 0.3559904391662534
Epoch: 18, step: 865, loss: 0.36370939016342163, mean loss: 0.355990726564831
Epoch: 18, step: 866, loss: 0.32727333903312683, mean loss: 0.355989657374335
Epoch: 18, step: 867, loss: 0.3046402931213379, mean loss: 0.35598774563329805
Epoch: 18, step: 868, loss: 0.32336729764938354, mean loss: 0.3559865312165606
Epoch: 18, step: 869, loss: 0.33694979548454285, mean loss: 0.35598582253009897
Epoch: 18, step: 870, loss: 0.3169090449810028, mean loss: 0.35598436786094256
Epoch: 18, step: 871, loss: 0.32223471999168396, mean loss: 0.3559831115458789
Epoch: 18, step: 872, loss: 0.341970831155777, mean loss: 0.35598258996462484
Epoch: 18, step: 873, loss: 0.37431976199150085, mean loss: 0.3559832725065748
Epoch: 18, step: 874, loss: 0.3509674668312073, mean loss: 0.3559830858163721
Epoch: 18, step: 875, loss: 0.31865158677101135, mean loss: 0.355981696375437
Epoch: 18, step: 876, loss: 0.3099955916404724, mean loss: 0.35597998488246235
Epoch: 18, step: 877, loss: 0.3312062919139862, mean loss: 0.3559790628990992
Epoch: 18, step: 878, loss: 0.32877621054649353, mean loss: 0.35597805054926657
Epoch: 18, step: 879, loss: 0.3005636930465698, mean loss: 0.3559759883894905
Epoch: 18, step: 880, loss: 0.31837132573127747, mean loss: 0.35597458904209134
Epoch: 18, step: 881, loss: 0.32484179735183716, mean loss: 0.3559734305695271
Epoch: 18, step: 882, loss: 0.338128924369812, mean loss: 0.3559727665879011
Epoch: 18, step: 883, loss: 0.318464457988739, mean loss: 0.35597137098183623
Epoch: 18, step: 884, loss: 0.3250334560871124, mean loss: 0.3559702198892703
Epoch: 18, step: 885, loss: 0.3514206111431122, mean loss: 0.3559700506203981
Epoch: 18, step: 886, loss: 0.34334689378738403, mean loss: 0.35596958099143744
Epoch: 18, step: 887, loss: 0.32849329710006714, mean loss: 0.35596855880825695
Epoch: 18, step: 888, loss: 0.32221636176109314, mean loss: 0.3559673031928763
Epoch: 18, step: 889, loss: 0.36089345812797546, mean loss: 0.35596748644393406
Epoch: 18, step: 890, loss: 0.33193761110305786, mean loss: 0.35596659257511953
Epoch: 18, step: 891, loss: 0.321468323469162, mean loss: 0.35596530934832643
Epoch: 18, step: 892, loss: 0.3450264632701874, mean loss: 0.35596490247289114
Epoch: 18, step: 893, loss: 0.3745702803134918, mean loss: 0.3559655944827788
Epoch: 18, step: 894, loss: 0.3797122836112976, mean loss: 0.35596647768615325
Epoch: 18, step: 895, loss: 0.32097941637039185, mean loss: 0.35596517647143605
Epoch: 18, step: 896, loss: 0.34879806637763977, mean loss: 0.35596490992712077
Epoch: 18, step: 897, loss: 0.3191590905189514, mean loss: 0.3559635411722153
Epoch: 18, step: 898, loss: 0.31854110956192017, mean loss: 0.3559621495381515
Epoch: 18, step: 899, loss: 0.3105275630950928, mean loss: 0.35596046001760845
Epoch: 18, step: 900, loss: 0.3253619372844696, mean loss: 0.35595932222997845
Epoch: 18, step: 901, loss: 0.336496502161026, mean loss: 0.3559585985436518
Epoch: 18, step: 902, loss: 0.3408827483654022, mean loss: 0.3559580379989343
Epoch: 18, step: 903, loss: 0.356752872467041, mean loss: 0.3559580675510784
Epoch: 18, step: 904, loss: 0.3978056311607361, mean loss: 0.3559596233961024
Epoch: 18, step: 905, loss: 0.34182843565940857, mean loss: 0.3559590980340778
Epoch: 18, step: 906, loss: 0.35698655247688293, mean loss: 0.3559591362308302
Epoch: 18, step: 907, loss: 0.32824593782424927, mean loss: 0.35595810600040617
Epoch: 18, step: 908, loss: 0.33544450998306274, mean loss: 0.35595734344154156
Epoch: 18, step: 909, loss: 0.34703925251960754, mean loss: 0.35595701193864504
Epoch: 18, step: 910, loss: 0.33396467566490173, mean loss: 0.35595619447084315
Epoch: 18, step: 911, loss: 0.31259286403656006, mean loss: 0.3559545826907943
Epoch: 18, step: 912, loss: 0.311077743768692, mean loss: 0.3559529147168518
Epoch: 18, step: 913, loss: 0.3151352107524872, mean loss: 0.35595139766846245
Epoch: 18, step: 914, loss: 0.3205902576446533, mean loss: 0.35595008346992585
Epoch: 18, step: 915, loss: 0.3142993748188019, mean loss: 0.35594853557678435
Epoch: 18, step: 916, loss: 0.33796969056129456, mean loss: 0.3559478674417732
Epoch: 18, step: 917, loss: 0.38772404193878174, mean loss: 0.3559490482732298
Epoch: 18, step: 918, loss: 0.33552810549736023, mean loss: 0.35594828944067897
Epoch: 18, step: 919, loss: 0.33398905396461487, mean loss: 0.35594747347622163
Epoch: 18, step: 920, loss: 0.3555511236190796, mean loss: 0.35594745874914335
Epoch: 18, step: 921, loss: 0.36075061559677124, mean loss: 0.35594763721227957
Epoch: 18, step: 922, loss: 0.3276385962963104, mean loss: 0.3559465854180787
Epoch: 18, step: 923, loss: 0.33116888999938965, mean loss: 0.35594566486170265
Epoch: 18, step: 924, loss: 0.31809693574905396, mean loss: 0.3559442587343812
Epoch: 18, step: 925, loss: 0.3187675476074219, mean loss: 0.3559428776246729
Epoch: 18, step: 926, loss: 0.32628369331359863, mean loss: 0.355941775830984
Epoch: 18, step: 927, loss: 0.3642779290676117, mean loss: 0.35594208549492296
Epoch: 18, step: 928, loss: 0.3171936571598053, mean loss: 0.35594064615655013
Epoch: 18, step: 929, loss: 0.342650830745697, mean loss: 0.3559401525150892
Epoch: 18, step: 930, loss: 0.3121662437915802, mean loss: 0.3559385266224055
Epoch: 18, step: 931, loss: 0.296074241399765, mean loss: 0.35593630316804425
Epoch: 18, step: 932, loss: 0.33828678727149963, mean loss: 0.35593564766141855
Epoch: 18, step: 933, loss: 0.3399489223957062, mean loss: 0.3559350539332277
Epoch: 18, step: 934, loss: 0.3149276375770569, mean loss: 0.35593353102253006
Epoch: 18, step: 935, loss: 0.3273012042045593, mean loss: 0.35593246773053594
Epoch: 18, step: 936, loss: 0.372229665517807, mean loss: 0.3559330729218831
Epoch: 18, step: 937, loss: 0.34043562412261963, mean loss: 0.3559324974503347
Epoch: 18, step: 938, loss: 0.29202383756637573, mean loss: 0.35593012439846566
Epoch: 18, step: 939, loss: 0.38549572229385376, mean loss: 0.3559312221854067
Epoch: 18, step: 940, loss: 0.30354011058807373, mean loss: 0.35592927694679244
Epoch: 18, step: 941, loss: 0.3085586130619049, mean loss: 0.3559275181785484
Epoch: 18, step: 942, loss: 0.3712140917778015, mean loss: 0.35592808571423057
Epoch: 18, step: 943, loss: 0.29767459630966187, mean loss: 0.35592592305127374
Epoch: 18, step: 944, loss: 0.3098539710044861, mean loss: 0.3559242126918407
Epoch: 18, step: 945, loss: 0.3137441873550415, mean loss: 0.3559226468730963
Epoch: 18, step: 946, loss: 0.36088353395462036, mean loss: 0.3559228310257034
Epoch: 18, step: 947, loss: 0.373005211353302, mean loss: 0.3559234651155448
Epoch: 18, step: 948, loss: 0.36553525924682617, mean loss: 0.3559238218875329
Epoch: 18, step: 949, loss: 0.3390662670135498, mean loss: 0.35592319618955676
Epoch: 18, step: 950, loss: 0.32213494181632996, mean loss: 0.35592194212525907
Epoch: 18, step: 951, loss: 0.32259854674339294, mean loss: 0.35592070536028797
Epoch: 18, step: 952, loss: 0.3001669645309448, mean loss: 0.3559186361919514
Epoch: 18, step: 953, loss: 0.3138059079647064, mean loss: 0.35591707333556355
Epoch: 18, step: 954, loss: 0.31879401206970215, mean loss: 0.3559156957031271
Epoch: 18, step: 955, loss: 0.31292667984962463, mean loss: 0.35591410044500577
Epoch: 18, step: 956, loss: 0.34963542222976685, mean loss: 0.3559138674612878
Epoch: 18, step: 957, loss: 0.31939855217933655, mean loss: 0.35591251253307693
Epoch: 18, step: 958, loss: 0.3446130156517029, mean loss: 0.35591209327231177
Epoch: 18, step: 959, loss: 0.3047178387641907, mean loss: 0.3559101938119931
Epoch: 18, step: 960, loss: 0.32228919863700867, mean loss: 0.355908946418561
Epoch: 18, step: 961, loss: 0.37541720271110535, mean loss: 0.3559096701796463
Epoch: 18, step: 962, loss: 0.38011208176612854, mean loss: 0.35591056806173077
Epoch: 18, step: 963, loss: 0.32138898968696594, mean loss: 0.35590928739774597
Epoch: 18, step: 964, loss: 0.31137916445732117, mean loss: 0.35590763550313825
Epoch: 18, step: 965, loss: 0.3222244083881378, mean loss: 0.35590638603258723
Epoch: 18, step: 966, loss: 0.3483774662017822, mean loss: 0.3559061067596234
Epoch: 18, step: 967, loss: 0.3484000861644745, mean loss: 0.3559058283463966
Epoch: 18, step: 968, loss: 0.361408531665802, mean loss: 0.3559060324450324
Epoch: 18, step: 969, loss: 0.2833300828933716, mean loss: 0.35590334065846047
Epoch: 18, step: 970, loss: 0.3708969056606293, mean loss: 0.35590389673771733
Epoch: 18, step: 971, loss: 0.3353966772556305, mean loss: 0.3559031361970156
Epoch: 18, step: 972, loss: 0.32522377371788025, mean loss: 0.35590199844947323
Epoch: 18, step: 973, loss: 0.3322157859802246, mean loss: 0.35590112007624514
Epoch: 18, step: 974, loss: 0.3618234097957611, mean loss: 0.35590133968872406
Epoch: 18, step: 975, loss: 0.32213515043258667, mean loss: 0.3559000876051711
Epoch: 18, step: 976, loss: 0.39319875836372375, mean loss: 0.35590147062533345
Epoch: 18, step: 977, loss: 0.3885762095451355, mean loss: 0.3559026821469842
Epoch: 18, step: 978, loss: 0.31436780095100403, mean loss: 0.3559011421639952
Epoch: 18, step: 979, loss: 0.3410528302192688, mean loss: 0.3559005916556182
Epoch: 18, step: 980, loss: 0.3285995423793793, mean loss: 0.3558995794934829
Epoch: 18, step: 981, loss: 0.3171570301055908, mean loss: 0.35589814320115
Epoch: 18, step: 982, loss: 0.32693758606910706, mean loss: 0.35589706959384204
Epoch: 18, step: 983, loss: 0.37058794498443604, mean loss: 0.3558976141844185
Epoch: 18, step: 984, loss: 0.3155459463596344, mean loss: 0.35589611840401947
Epoch: 18, step: 985, loss: 0.34381699562072754, mean loss: 0.3558956706642766
Epoch: 18, step: 986, loss: 0.37801364064216614, mean loss: 0.3558964904859889
Epoch: 18, step: 987, loss: 0.3191148340702057, mean loss: 0.355895127192571
Epoch: 18, step: 988, loss: 0.32653287053108215, mean loss: 0.3558940389357732
Epoch: 18, step: 989, loss: 0.3534054756164551, mean loss: 0.35589394670527436
Epoch: 18, step: 990, loss: 0.29855456948280334, mean loss: 0.3558918216866618
Epoch: 18, step: 991, loss: 0.32100725173950195, mean loss: 0.3558905288994565
Epoch: 18, step: 992, loss: 0.37562933564186096, mean loss: 0.35589126037274693
Epoch: 18, step: 993, loss: 0.32874035835266113, mean loss: 0.3558902542620962
Epoch: 18, step: 994, loss: 0.38942450284957886, mean loss: 0.35589149686959565
Epoch: 18, step: 995, loss: 0.32662513852119446, mean loss: 0.3558904124484326
Epoch: 18, step: 996, loss: 0.32470864057540894, mean loss: 0.35588925709729424
Epoch: 18, step: 997, loss: 0.3124777376651764, mean loss: 0.3558876486675265
Epoch: 18, step: 998, loss: 0.39926764369010925, mean loss: 0.35588925586974285
Epoch: 18, step: 999, loss: 0.31814172863960266, mean loss: 0.355887857398817
Epoch: 18, step: 1000, loss: 0.3328250050544739, mean loss: 0.35588700299758913
Epoch: 18, step: 1001, loss: 0.35996687412261963, mean loss: 0.35588715413751376
Epoch: 18, step: 1002, loss: 0.32137149572372437, mean loss: 0.355885875543018
Epoch: 18, step: 1003, loss: 0.34810593724250793, mean loss: 0.3558855873544604
Epoch: 18, step: 1004, loss: 0.357994943857193, mean loss: 0.35588566548745676
Epoch: 18, step: 1005, loss: 0.3445717692375183, mean loss: 0.3558852464232205
Epoch: 18, step: 1006, loss: 0.3389326333999634, mean loss: 0.3558846185254086
Epoch: 18, step: 1007, loss: 0.31188908219337463, mean loss: 0.3558829890611
Epoch: 18, step: 1008, loss: 0.3056764602661133, mean loss: 0.3558811296289014
Epoch: 18, step: 1009, loss: 0.3357459604740143, mean loss: 0.35588038393713206
Epoch: 18, step: 1010, loss: 0.3285640776157379, mean loss: 0.3558793723344834
Epoch: 18, step: 1011, loss: 0.32760104537010193, mean loss: 0.3558783251441796
Epoch: 18, step: 1012, loss: 0.36267322301864624, mean loss: 0.35587857676046825
Epoch: 18, step: 1013, loss: 0.34193155169487, mean loss: 0.35587806031874913
Epoch: 18, step: 1014, loss: 0.38378170132637024, mean loss: 0.3558790935190679
Epoch: 18, step: 1015, loss: 0.33717668056488037, mean loss: 0.3558784010422849
Epoch: 18, step: 1016, loss: 0.3449975550174713, mean loss: 0.3558779981822744
Epoch: 18, step: 1017, loss: 0.36064964532852173, mean loss: 0.355878174844516
Epoch: 18, step: 1018, loss: 0.33670175075531006, mean loss: 0.3558774648958251
Epoch: 18, step: 1019, loss: 0.328517347574234, mean loss: 0.35587645200831874
Epoch: 18, step: 1020, loss: 0.32798174023628235, mean loss: 0.3558754193680429
Epoch: 18, step: 1021, loss: 0.348671019077301, mean loss: 0.3558751526766869
Epoch: 18, step: 1022, loss: 0.3306754231452942, mean loss: 0.35587421987159595
Epoch: 18, step: 1023, loss: 0.3174743354320526, mean loss: 0.35587279849595044
Epoch: 18, step: 1024, loss: 0.34342458844184875, mean loss: 0.35587233774123844
Epoch: 18, step: 1025, loss: 0.37613263726234436, mean loss: 0.35587308762278114
Epoch: 18, step: 1026, loss: 0.3992527425289154, mean loss: 0.3558746931468533
Epoch: 18, step: 1027, loss: 0.34212568402290344, mean loss: 0.35587418430121587
Epoch: 18, step: 1028, loss: 0.2990383207798004, mean loss: 0.3558720809052083
Epoch: 18, step: 1029, loss: 0.3290442228317261, mean loss: 0.3558710880897959
Epoch: 18, step: 1030, loss: 0.3524835407733917, mean loss: 0.35587096273186686
Epoch: 18, step: 1031, loss: 0.37617194652557373, mean loss: 0.3558717139524039
Epoch: 18, step: 1032, loss: 0.31774288415908813, mean loss: 0.3558703030798861
Epoch: 18, step: 1033, loss: 0.3384123742580414, mean loss: 0.3558696571119729
Epoch: 18, step: 1034, loss: 0.3039533495903015, mean loss: 0.35586773620667367
Epoch: 18, step: 1035, loss: 0.3170899450778961, mean loss: 0.35586630148005205
Epoch: 18, step: 1036, loss: 0.34032493829727173, mean loss: 0.35586572649158843
Epoch: 18, step: 1037, loss: 0.3428034484386444, mean loss: 0.3558652432404581
Epoch: 18, step: 1038, loss: 0.29723310470581055, mean loss: 0.35586307417018564
Epoch: 18, step: 1039, loss: 0.3214039206504822, mean loss: 0.35586179941606016
Epoch: 18, step: 1040, loss: 0.36150529980659485, mean loss: 0.3558620081794379
Epoch: 18, step: 1041, loss: 0.45976534485816956, mean loss: 0.3558658516112896
Epoch: 18, step: 1042, loss: 0.31915292143821716, mean loss: 0.35586449363347666
Epoch: 18, step: 1043, loss: 0.3227248191833496, mean loss: 0.3558632678724747
Epoch: 18, step: 1044, loss: 0.32830703258514404, mean loss: 0.35586224866785554
Epoch: 18, step: 1045, loss: 0.3507843613624573, mean loss: 0.3558620608622743
Epoch: 18, step: 1046, loss: 0.3203088045120239, mean loss: 0.3558607459742847
Epoch: 18, step: 1047, loss: 0.33412057161331177, mean loss: 0.3558599419737536
Epoch: 18, step: 1048, loss: 0.32757824659347534, mean loss: 0.35585889609174554
Epoch: 18, step: 1049, loss: 0.2938230633735657, mean loss: 0.3558566020368414
Epoch: 18, step: 1050, loss: 0.32224783301353455, mean loss: 0.3558553592468764
Epoch: 18, step: 1051, loss: 0.3552255630493164, mean loss: 0.35585533595904184
Epoch: 18, step: 1052, loss: 0.31993815302848816, mean loss: 0.3558540079064284
Epoch: 18, step: 1053, loss: 0.33107659220695496, mean loss: 0.35585309178516467
Epoch: 18, step: 1054, loss: 0.3325088322162628, mean loss: 0.35585222868539135
Epoch: 18, step: 1055, loss: 0.35067760944366455, mean loss: 0.35585203737293786
Epoch: 18, step: 1056, loss: 0.3370877802371979, mean loss: 0.35585134365941296
Epoch: 18, step: 1057, loss: 0.3370216190814972, mean loss: 0.3558506475512955
Epoch: 18, step: 1058, loss: 0.3274032473564148, mean loss: 0.3558495959302761
Epoch: 18, step: 1059, loss: 0.3823685944080353, mean loss: 0.3558505762274252
Epoch: 18, step: 1060, loss: 0.3683132827281952, mean loss: 0.35585103690485476
Epoch: 18, step: 1061, loss: 0.35668712854385376, mean loss: 0.3558510678094027
Epoch: 18, step: 1062, loss: 0.33429279923439026, mean loss: 0.3558502709781857
Epoch: 18, step: 1063, loss: 0.31297147274017334, mean loss: 0.35584868616157433
Epoch: 18, step: 1064, loss: 0.32726141810417175, mean loss: 0.35584762960437816
Epoch: 18, step: 1065, loss: 0.2865305244922638, mean loss: 0.35584506780730846
Epoch: 18, step: 1066, loss: 0.3728755712509155, mean loss: 0.35584569719137454
Epoch: 18, step: 1067, loss: 0.3406081199645996, mean loss: 0.3558451340880033
Epoch: 18, step: 1068, loss: 0.37814977765083313, mean loss: 0.35584595832375077
Epoch: 18, step: 1069, loss: 0.350394070148468, mean loss: 0.3558457568645765
Epoch: 18, step: 1070, loss: 0.3063965141773224, mean loss: 0.35584392967458695
Epoch: 18, step: 1071, loss: 0.37618327140808105, mean loss: 0.3558446812021414
Epoch: 18, step: 1072, loss: 0.318111777305603, mean loss: 0.35584328704349016
Epoch: 18, step: 1073, loss: 0.3306814432144165, mean loss: 0.35584235739582043
Epoch: 18, step: 1074, loss: 0.34100139141082764, mean loss: 0.3558418090910218
Epoch: 18, step: 1075, loss: 0.2881926894187927, mean loss: 0.3558393098624245
Epoch: 18, step: 1076, loss: 0.37866050004959106, mean loss: 0.35584015293716637
Epoch: 18, step: 1077, loss: 0.29261842370033264, mean loss: 0.3558378174466146
Epoch: 18, step: 1078, loss: 0.35849207639694214, mean loss: 0.35583791549467153
Epoch: 18, step: 1079, loss: 0.3522208333015442, mean loss: 0.35583778188495696
Epoch: 18, step: 1080, loss: 0.3309021294116974, mean loss: 0.35583686083252564
Epoch: 18, step: 1081, loss: 0.3149072229862213, mean loss: 0.3558353490633801
Epoch: 18, step: 1082, loss: 0.32219773530960083, mean loss: 0.3558341066769072
Epoch: 18, step: 1083, loss: 0.33619168400764465, mean loss: 0.3558333812217931
Epoch: 18, step: 1084, loss: 0.3074989318847656, mean loss: 0.3558315961477695
Epoch: 18, step: 1085, loss: 0.34396225214004517, mean loss: 0.3558311578087486
Epoch: 18, step: 1086, loss: 0.34856322407722473, mean loss: 0.35583088941132873
Epoch: 18, step: 1087, loss: 0.3247113525867462, mean loss: 0.35582974024084035
Epoch: 18, step: 1088, loss: 0.322695791721344, mean loss: 0.35582851672810006
Epoch: 18, step: 1089, loss: 0.3039558529853821, mean loss: 0.35582660133545024
Epoch: 18, step: 1090, loss: 0.3657872974872589, mean loss: 0.35582696911952705
Epoch: 18, step: 1091, loss: 0.32640716433525085, mean loss: 0.3558258828765502
Epoch: 18, step: 1092, loss: 0.3167651295661926, mean loss: 0.355824440722099
Epoch: 18, step: 1093, loss: 0.33496585488319397, mean loss: 0.35582367063475356
Epoch: 18, step: 1094, loss: 0.31558647751808167, mean loss: 0.35582218515488806
Epoch: 18, step: 1095, loss: 0.390487939119339, mean loss: 0.35582346490067823
Epoch: 18, step: 1096, loss: 0.29889747500419617, mean loss: 0.3558213634576609
Epoch: 18, step: 1097, loss: 0.3224020004272461, mean loss: 0.3558201298156147
Epoch: 18, step: 1098, loss: 0.32944703102111816, mean loss: 0.35581915631523475
Epoch: 18, step: 1099, loss: 0.325033962726593, mean loss: 0.35581801999478635
Epoch: 18, step: 1100, loss: 0.3214041590690613, mean loss: 0.35581674978252026
Epoch: 18, step: 1101, loss: 0.35643091797828674, mean loss: 0.3558167724505721
Epoch: 18, step: 1102, loss: 0.3417213261127472, mean loss: 0.3558162522274188
Epoch: 18, step: 1103, loss: 0.36245596408843994, mean loss: 0.3558164972714054
Epoch: 18, step: 1104, loss: 0.3116656541824341, mean loss: 0.3558148679086313
Epoch: 18, step: 1105, loss: 0.3796651363372803, mean loss: 0.35581574805729277
Epoch: 18, step: 1106, loss: 0.3113926649093628, mean loss: 0.35581410876864195
Epoch: 18, step: 1107, loss: 0.3031291663646698, mean loss: 0.3558121646748263
Epoch: 18, step: 1108, loss: 0.3310093581676483, mean loss: 0.35581124947588505
Epoch: 18, step: 1109, loss: 0.31320685148239136, mean loss: 0.3558096774738928
Epoch: 18, step: 1110, loss: 0.3665520250797272, mean loss: 0.35581007382660673
Epoch: 18, step: 1111, loss: 0.3470785915851593, mean loss: 0.3558097516792395
Epoch: 18, step: 1112, loss: 0.33999526500701904, mean loss: 0.3558091682264938
Epoch: 18, step: 1113, loss: 0.31828010082244873, mean loss: 0.3558077836965962
Epoch: 18, step: 1114, loss: 0.3625941872596741, mean loss: 0.35580803405272426
Epoch: 18, step: 1115, loss: 0.3371894359588623, mean loss: 0.35580734722233864
Epoch: 18, step: 1116, loss: 0.32393553853034973, mean loss: 0.355806171531288
Epoch: 18, step: 1117, loss: 0.3740637004375458, mean loss: 0.3558068449923321
Epoch: 18, step: 1118, loss: 0.32977622747421265, mean loss: 0.35580588484266895
Epoch: 18, step: 1119, loss: 0.3453414738178253, mean loss: 0.3558054988729498
Epoch: 18, step: 1120, loss: 0.3405081629753113, mean loss: 0.35580493466626306
Epoch: 18, step: 1121, loss: 0.32066285610198975, mean loss: 0.3558036385801613
Epoch: 18, step: 1122, loss: 0.34306299686431885, mean loss: 0.35580316870585865
Epoch: 18, step: 1123, loss: 0.36568713188171387, mean loss: 0.35580353321254016
Epoch: 18, step: 1124, loss: 0.3254510462284088, mean loss: 0.3558024138967241
Epoch: 18, step: 1125, loss: 0.3054821789264679, mean loss: 0.35580055829398904
Epoch: 18, step: 1126, loss: 0.32432863116264343, mean loss: 0.3557993977819078
Epoch: 18, step: 1127, loss: 0.37699830532073975, mean loss: 0.3558001794525397
Epoch: 18, step: 1128, loss: 0.36276599764823914, mean loss: 0.35580043629477254
Epoch: 18, step: 1129, loss: 0.33051031827926636, mean loss: 0.3557995038370624
Epoch: 18, step: 1130, loss: 0.3239166736602783, mean loss: 0.35579832834651276
Epoch: 18, step: 1131, loss: 0.40152227878570557, mean loss: 0.355800014084252
Epoch: 18, step: 1132, loss: 0.33237332105636597, mean loss: 0.35579915042736615
Epoch: 18, step: 1133, loss: 0.32623180747032166, mean loss: 0.35579806042725715
Epoch: 18, step: 1134, loss: 0.3066246807575226, mean loss: 0.355796247717423
Epoch: 18, step: 1135, loss: 0.3352118730545044, mean loss: 0.35579548893038887
Epoch: 18, step: 1136, loss: 0.3576626181602478, mean loss: 0.355795557754497
Epoch: 18, step: 1137, loss: 0.3037707507610321, mean loss: 0.35579364014273906
Epoch: 18, step: 1138, loss: 0.34417617321014404, mean loss: 0.3557932119437441
Epoch: 18, step: 1139, loss: 0.3417072892189026, mean loss: 0.35579269278103126
Epoch: 18, step: 1140, loss: 0.3541606068611145, mean loss: 0.35579263262970556
Epoch: 18, step: 1141, loss: 0.31144189834594727, mean loss: 0.3557909981219189
Epoch: 18, step: 1142, loss: 0.34220317006111145, mean loss: 0.35579049737277346
Epoch: 18, step: 1143, loss: 0.30532220005989075, mean loss: 0.3557886375446001
Epoch: 18, step: 1144, loss: 0.3550192713737488, mean loss: 0.35578860919341276
Epoch: 18, step: 1145, loss: 0.321537584066391, mean loss: 0.35578734708768917
Epoch: 18, step: 1146, loss: 0.3426920473575592, mean loss: 0.3557868645607084
Epoch: 18, step: 1147, loss: 0.3174397945404053, mean loss: 0.35578545162518815
Epoch: 18, step: 1148, loss: 0.3333960771560669, mean loss: 0.35578462669705474
Epoch: 18, step: 1149, loss: 0.33591437339782715, mean loss: 0.35578389461197263
Epoch: 18, step: 1150, loss: 0.33442825078964233, mean loss: 0.35578310782923595
Epoch: 18, step: 1151, loss: 0.3473733365535736, mean loss: 0.35578279800860246
Epoch: 18, step: 1152, loss: 0.34943217039108276, mean loss: 0.3557825640565812
Epoch: 18, step: 1153, loss: 0.31812918186187744, mean loss: 0.35578117698731887
Epoch: 18, step: 1154, loss: 0.3779227137565613, mean loss: 0.3557819926036584
Epoch: 18, step: 1155, loss: 0.30838873982429504, mean loss: 0.35578024686722187
Epoch: 18, step: 1156, loss: 0.33860331773757935, mean loss: 0.35577961417617876
Epoch: 18, step: 1157, loss: 0.34342125058174133, mean loss: 0.35577915898783274
Epoch: 18, step: 1158, loss: 0.3048570454120636, mean loss: 0.3557772834726187
Epoch: 18, step: 1159, loss: 0.34924113750457764, mean loss: 0.35577704274832705
Epoch: 18, step: 1160, loss: 0.32468587160110474, mean loss: 0.3557758977120089
Epoch: 18, step: 1161, loss: 0.35559216141700745, mean loss: 0.3557758909455548
Epoch: 18, step: 1162, loss: 0.3336888253688812, mean loss: 0.35577507757543597
Epoch: 18, step: 1163, loss: 0.3171539604663849, mean loss: 0.3557736553808157
Epoch: 18, step: 1164, loss: 0.32712027430534363, mean loss: 0.35577260027969715
Epoch: 18, step: 1165, loss: 0.3576000928878784, mean loss: 0.3557726675708308
Epoch: 18, step: 1166, loss: 0.3165270984172821, mean loss: 0.3557712225408535
Epoch: 18, step: 1167, loss: 0.35470500588417053, mean loss: 0.35577118328398105
Epoch: 18, step: 1168, loss: 0.3282221555709839, mean loss: 0.3557701689977724
Epoch: 18, step: 1169, loss: 0.36711743474006653, mean loss: 0.3557705867602988
Epoch: 18, step: 1170, loss: 0.32967790961265564, mean loss: 0.3557696261640043
Epoch: 18, step: 1171, loss: 0.31843364238739014, mean loss: 0.35576825169839627
Epoch: 18, step: 1172, loss: 0.3112555742263794, mean loss: 0.35576661309440316
Epoch: 18, step: 1173, loss: 0.3657747805118561, mean loss: 0.3557669815022445
Epoch: 18, step: 1174, loss: 0.3712705075740814, mean loss: 0.35576755217718364
Epoch: 18, step: 1175, loss: 0.3180379271507263, mean loss: 0.35576616342479017
Epoch: 18, step: 1176, loss: 0.2971278131008148, mean loss: 0.35576400514328094
Epoch: 18, step: 1177, loss: 0.32240819931030273, mean loss: 0.35576277747284174
Epoch: 18, step: 1178, loss: 0.32613492012023926, mean loss: 0.3557616870507979
Epoch: 18, step: 1179, loss: 0.30474555492401123, mean loss: 0.35575980952495784
Epoch: 18, step: 1180, loss: 0.3227091431617737, mean loss: 0.3557585932195678
Epoch: 18, step: 1181, loss: 0.3501840829849243, mean loss: 0.3557583880782476
Epoch: 18, step: 1182, loss: 0.36344268918037415, mean loss: 0.3557586708492173
Epoch: 18, step: 1183, loss: 0.3565909266471863, mean loss: 0.3557587014738787
Epoch: 18, step: 1184, loss: 0.3480556309223175, mean loss: 0.3557584180330813
Epoch: 18, step: 1185, loss: 0.32752493023872375, mean loss: 0.3557573791969714
Epoch: 18, step: 1186, loss: 0.299113392829895, mean loss: 0.35575529508841824
Epoch: 18, step: 1187, loss: 0.35525500774383545, mean loss: 0.355755276681967
Epoch: 18, step: 1188, loss: 0.31406185030937195, mean loss: 0.3557537427639223
Epoch: 18, step: 1189, loss: 0.31421777606010437, mean loss: 0.3557522146951009
Epoch: 18, step: 1190, loss: 0.32268226146698, mean loss: 0.3557509981276422
Epoch: 18, step: 1191, loss: 0.31125202775001526, mean loss: 0.3557493611731698
Epoch: 18, step: 1192, loss: 0.33563798666000366, mean loss: 0.35574862137642477
Epoch: 18, step: 1193, loss: 0.34837672114372253, mean loss: 0.3557483502111105
Epoch: 18, step: 1194, loss: 0.3211507201194763, mean loss: 0.3557470776311976
Epoch: 18, step: 1195, loss: 0.3346557319164276, mean loss: 0.355746301871829
Epoch: 18, step: 1196, loss: 0.33906224370002747, mean loss: 0.3557456882391771
Epoch: 18, step: 1197, loss: 0.3022877275943756, mean loss: 0.3557437221501501
Epoch: 18, step: 1198, loss: 0.31585344672203064, mean loss: 0.3557422551104889
Epoch: 18, step: 1199, loss: 0.3473387360572815, mean loss: 0.3557419460666873
Epoch: 18, step: 1200, loss: 0.3369685113430023, mean loss: 0.3557412556892106
Epoch: 18, step: 1201, loss: 0.4031430780887604, mean loss: 0.35574299878777643
Epoch: 18, step: 1202, loss: 0.4216533303260803, mean loss: 0.3557454224072483
Epoch: 18, step: 1203, loss: 0.32912734150886536, mean loss: 0.35574444365739916
Epoch: 18, step: 1204, loss: 0.3604961037635803, mean loss: 0.35574461837005517
Epoch: 18, step: 1205, loss: 0.3403885066509247, mean loss: 0.3557440537656093
Epoch: 18, step: 1206, loss: 0.31689316034317017, mean loss: 0.35574262537142487
Epoch: 18, step: 1207, loss: 0.3809780478477478, mean loss: 0.35574355314431005
Epoch: 18, step: 1208, loss: 0.33010855317115784, mean loss: 0.3557426107157239
Epoch: 18, step: 1209, loss: 0.3049646019935608, mean loss: 0.35574074401442535
Epoch: 18, step: 1210, loss: 0.36499565839767456, mean loss: 0.35574108423110673
Epoch: 18, step: 1211, loss: 0.3112852871417999, mean loss: 0.3557394500671202
Epoch: 18, step: 1212, loss: 0.31131690740585327, mean loss: 0.3557378171855668
Epoch: 18, step: 1213, loss: 0.3192268908023834, mean loss: 0.35573647516813006
Epoch: 18, step: 1214, loss: 0.33781886100769043, mean loss: 0.3557358166017993
Epoch: 18, step: 1215, loss: 0.3086998462677002, mean loss: 0.3557340878466415
Epoch: 18, step: 1216, loss: 0.3507786989212036, mean loss: 0.35573390572348645
Epoch: 18, step: 1217, loss: 0.40673795342445374, mean loss: 0.3557357801831594
Epoch: 18, step: 1218, loss: 0.30076074600219727, mean loss: 0.3557337598592396
Epoch: 18, step: 1219, loss: 0.33786240220069885, mean loss: 0.3557331031137722
Epoch: 18, step: 1220, loss: 0.28655970096588135, mean loss: 0.3557305611888779
Epoch: 18, step: 1221, loss: 0.34346771240234375, mean loss: 0.35573011058077963
Epoch: 18, step: 1222, loss: 0.3186173439025879, mean loss: 0.355728746892862
Epoch: 18, step: 1223, loss: 0.3204769492149353, mean loss: 0.3557274516328062
Epoch: 18, step: 1224, loss: 0.34618079662323, mean loss: 0.3557271008720681
Epoch: 18, step: 1225, loss: 0.32518264651298523, mean loss: 0.3557259786568297
Epoch: 18, step: 1226, loss: 0.34705114364624023, mean loss: 0.35572565995169686
Epoch: 18, step: 1227, loss: 0.3394821286201477, mean loss: 0.3557250632018316
Epoch: 18, step: 1228, loss: 0.3482431173324585, mean loss: 0.3557247883424999
Epoch: 18, step: 1229, loss: 0.3108162581920624, mean loss: 0.35572313862792526
Epoch: 18, step: 1230, loss: 0.3227446973323822, mean loss: 0.35572192720959167
Epoch: 18, step: 1231, loss: 0.3643985688686371, mean loss: 0.35572224592255297
Epoch: 18, step: 1232, loss: 0.3302837908267975, mean loss: 0.3557213115440371
Epoch: 18, step: 1233, loss: 0.32389992475509644, mean loss: 0.3557201427573336
Epoch: 18, step: 1234, loss: 0.29549750685691833, mean loss: 0.3557179308854454
Epoch: 18, step: 1235, loss: 0.3213081657886505, mean loss: 0.35571666712148564
Epoch: 18, step: 1236, loss: 0.36317139863967896, mean loss: 0.35571694090060046
Epoch: 18, step: 1237, loss: 0.3236626088619232, mean loss: 0.3557157637308598
Epoch: 18, step: 1238, loss: 0.3168801963329315, mean loss: 0.3557143375780414
Epoch: 18, step: 1239, loss: 0.30229651927948, mean loss: 0.35571237599540706
Epoch: 18, step: 1240, loss: 0.36197954416275024, mean loss: 0.35571260612679795
Epoch: 18, step: 1241, loss: 0.2586217522621155, mean loss: 0.3557090410664372
Epoch: 18, step: 1242, loss: 0.3493276834487915, mean loss: 0.3557088067591995
Epoch: 18, step: 1243, loss: 0.32396399974823, mean loss: 0.3557076412133407
Epoch: 18, step: 1244, loss: 0.2952674925327301, mean loss: 0.3557054221676058
Epoch: 18, step: 1245, loss: 0.3354671597480774, mean loss: 0.3557046791518771
Epoch: 18, step: 1246, loss: 0.3567539155483246, mean loss: 0.35570471767151424
Epoch: 18, step: 1247, loss: 0.41344910860061646, mean loss: 0.3557068375096541
Epoch: 18, step: 1248, loss: 0.28120100498199463, mean loss: 0.3557041024473389
Epoch: 18, step: 1249, loss: 0.3300172984600067, mean loss: 0.35570315953551207
Epoch: 18, step: 1250, loss: 0.31196072697639465, mean loss: 0.35570155389617136
Epoch: 18, step: 1251, loss: 0.33246946334838867, mean loss: 0.3557007011546302
Epoch: 18, step: 1252, loss: 0.3403084874153137, mean loss: 0.3557001361990883
Epoch: 18, step: 1253, loss: 0.36931413412094116, mean loss: 0.35570063586868833
Epoch: 18, step: 1254, loss: 0.29438918828964233, mean loss: 0.35569838565957984
Epoch: 18, step: 1255, loss: 0.32482627034187317, mean loss: 0.3556972526547605
Epoch: 18, step: 1256, loss: 0.34738633036613464, mean loss: 0.35569694765559395
Epoch: 18, step: 1257, loss: 0.37353086471557617, mean loss: 0.3556976021112659
Epoch: 18, step: 1258, loss: 0.3408774435520172, mean loss: 0.3556970582721936
Epoch: 18, step: 1259, loss: 0.3108524978160858, mean loss: 0.3556954127210247
Epoch: 18, step: 1260, loss: 0.33883339166641235, mean loss: 0.35569479399937737
Epoch: 18, step: 1261, loss: 0.32985156774520874, mean loss: 0.3556938457632926
Epoch: 18, step: 1262, loss: 0.3000187873840332, mean loss: 0.35569180301670006
Epoch: 18, step: 1263, loss: 0.3246834874153137, mean loss: 0.3556906653473575
Epoch: 18, step: 1264, loss: 0.33950075507164, mean loss: 0.35569007137478986
Epoch: 18, step: 1265, loss: 0.32765570282936096, mean loss: 0.3556890428925628
Epoch: 18, step: 1266, loss: 0.37104833126068115, mean loss: 0.35568960635007657
Epoch: 18, step: 1267, loss: 0.3124300539493561, mean loss: 0.35568801942592393
Epoch: 18, step: 1268, loss: 0.35141095519065857, mean loss: 0.35568786253277124
Epoch: 18, step: 1269, loss: 0.2989906370639801, mean loss: 0.35568578281648233
Epoch: 18, step: 1270, loss: 0.37281471490859985, mean loss: 0.355686411101414
Epoch: 18, step: 1271, loss: 0.3751783072948456, mean loss: 0.3556871260330526
Epoch: 18, step: 1272, loss: 0.307563841342926, mean loss: 0.3556853610125248
Epoch: 18, step: 1273, loss: 0.31286996603012085, mean loss: 0.3556837907273718
Epoch: 18, step: 1274, loss: 0.33530211448669434, mean loss: 0.35568304324227107
Epoch: 18, step: 1275, loss: 0.3796183466911316, mean loss: 0.3556839210222127
Epoch: 18, step: 1276, loss: 0.37668362259864807, mean loss: 0.35568469111651674
Epoch: 18, step: 1277, loss: 0.3170224726200104, mean loss: 0.3556832733600629
Epoch: 18, step: 1278, loss: 0.30001989006996155, mean loss: 0.3556812322400713
Epoch: 18, step: 1279, loss: 0.34151625633239746, mean loss: 0.3556807128437708
Epoch: 18, step: 1280, loss: 0.31062841415405273, mean loss: 0.35567906094267115
Epoch: 18, step: 1281, loss: 0.3483825922012329, mean loss: 0.35567879341796843
Epoch: 18, step: 1282, loss: 0.35055506229400635, mean loss: 0.35567860556348174
Epoch: 18, step: 1283, loss: 0.3345035910606384, mean loss: 0.3556778292394422
Epoch: 18, step: 1284, loss: 0.347333699464798, mean loss: 0.355677523335942
Epoch: 18, step: 1285, loss: 0.31785017251968384, mean loss: 0.3556761366011808
Epoch: 18, step: 1286, loss: 0.31588014960289, mean loss: 0.3556746777505265
Epoch: 18, step: 1287, loss: 0.322933167219162, mean loss: 0.3556734775485276
Epoch: 18, step: 1288, loss: 0.38021183013916016, mean loss: 0.3556743770152843
Epoch: 18, step: 1289, loss: 0.3132372796535492, mean loss: 0.3556728215172504
Epoch: 18, step: 1290, loss: 0.35987451672554016, mean loss: 0.3556729755213998
Epoch: 18, step: 1291, loss: 0.38498640060424805, mean loss: 0.3556740499029085
Epoch: 18, step: 1292, loss: 0.353246808052063, mean loss: 0.3556739609440721
Epoch: 18, step: 1293, loss: 0.3473128378391266, mean loss: 0.35567365451868527
Epoch: 18, step: 1294, loss: 0.39558589458465576, mean loss: 0.3556751172020167
Epoch: 18, step: 1295, loss: 0.33213740587234497, mean loss: 0.35567425463563845
Epoch: 18, step: 1296, loss: 0.3199816942214966, mean loss: 0.35567294668883154
Epoch: 18, step: 1297, loss: 0.39262983202934265, mean loss: 0.35567430091694957
Epoch: 18, step: 1298, loss: 0.32609865069389343, mean loss: 0.35567321720253003
Epoch: 18, step: 1299, loss: 0.3247600495815277, mean loss: 0.35567208452014615
Epoch: 18, step: 1300, loss: 0.38320618867874146, mean loss: 0.35567309335406544
Epoch: 18, step: 1301, loss: 0.30749237537384033, mean loss: 0.35567132810463403
Epoch: 18, step: 1302, loss: 0.3315906524658203, mean loss: 0.35567044586702135
Epoch: 18, step: 1303, loss: 0.33123600482940674, mean loss: 0.3556695507013913
Epoch: 18, step: 1304, loss: 0.3696042597293854, mean loss: 0.35567006118639066
Epoch: 18, step: 1305, loss: 0.40219646692276, mean loss: 0.3556717655752007
Epoch: 18, step: 1306, loss: 0.35279855132102966, mean loss: 0.35567166032540204
Epoch: 18, step: 1307, loss: 0.34691768884658813, mean loss: 0.3556713396671061
Epoch: 18, step: 1308, loss: 0.36047711968421936, mean loss: 0.3556715156965562
Epoch: 18, step: 1309, loss: 0.312090665102005, mean loss: 0.35566991944534404
Epoch: 18, step: 1310, loss: 0.3392614424228668, mean loss: 0.3556693184682711
Epoch: 18, step: 1311, loss: 0.3302344083786011, mean loss: 0.35566838692307295
Epoch: 18, step: 1312, loss: 0.3244406580924988, mean loss: 0.3556672432596842
Epoch: 18, step: 1313, loss: 0.3121926486492157, mean loss: 0.35566565113360893
Epoch: 18, step: 1314, loss: 0.3052453398704529, mean loss: 0.3556638047092026
Epoch: 18, step: 1315, loss: 0.32528796792030334, mean loss: 0.3556626923671494
Epoch: 18, step: 1316, loss: 0.3222992718219757, mean loss: 0.35566147066659115
Epoch: 18, step: 1317, loss: 0.35671141743659973, mean loss: 0.3556615091120972
Epoch: 18, step: 1318, loss: 0.3213061988353729, mean loss: 0.35566025118268135
Epoch: 18, step: 1319, loss: 0.31689226627349854, mean loss: 0.3556588317339076
Epoch: 18, step: 1320, loss: 0.3408287465572357, mean loss: 0.35565828876590055
Epoch: 18, step: 1321, loss: 0.32972079515457153, mean loss: 0.3556573391615361
Epoch: 18, step: 1322, loss: 0.3105795979499817, mean loss: 0.35565568886897847
Epoch: 18, step: 1323, loss: 0.320515900850296, mean loss: 0.35565440245120067
Epoch: 18, step: 1324, loss: 0.3055116534233093, mean loss: 0.355652566863507
Epoch: 18, step: 1325, loss: 0.3932066559791565, mean loss: 0.3556539415647705
Epoch: 18, step: 1326, loss: 0.33515065908432007, mean loss: 0.3556531910511177
Epoch: 18, step: 1327, loss: 0.3129355013370514, mean loss: 0.3556516274460769
Epoch: 18, step: 1328, loss: 0.3651913106441498, mean loss: 0.35565197661642933
Epoch: 18, step: 1329, loss: 0.35273903608322144, mean loss: 0.3556518700012279
Epoch: 18, step: 1330, loss: 0.32418733835220337, mean loss: 0.35565071842447393
Epoch: 18, step: 1331, loss: 0.3420368432998657, mean loss: 0.3556502201857415
Epoch: 18, step: 1332, loss: 0.3352331519126892, mean loss: 0.3556494729920261
Epoch: 18, step: 1333, loss: 0.34160158038139343, mean loss: 0.35564895890681014
Epoch: 18, step: 1334, loss: 0.36610808968544006, mean loss: 0.3556493416466198
Epoch: 18, step: 1335, loss: 0.3338031768798828, mean loss: 0.3556485422407077
Epoch: 18, step: 1336, loss: 0.3272321820259094, mean loss: 0.3556475024529286
Epoch: 18, step: 1337, loss: 0.3174547553062439, mean loss: 0.3556461049868786
Epoch: 18, step: 1338, loss: 0.3561895489692688, mean loss: 0.35564612487067293
Epoch: 18, step: 1339, loss: 0.32550469040870667, mean loss: 0.3556450220814712
Epoch: 18, step: 1340, loss: 0.348739892244339, mean loss: 0.355644769451689
Epoch: 18, step: 1341, loss: 0.3349928855895996, mean loss: 0.35564401391339007
Epoch: 18, step: 1342, loss: 0.3272078335285187, mean loss: 0.3556429736287592
Epoch: 18, step: 1343, loss: 0.34141984581947327, mean loss: 0.35564245332118644
Epoch: 18, step: 1344, loss: 0.3837207555770874, mean loss: 0.355643480438363
Epoch: 18, step: 1345, loss: 0.33457377552986145, mean loss: 0.3556427097270854
Epoch: 18, step: 1346, loss: 0.31848153471946716, mean loss: 0.35564135045370276
Epoch: 18, step: 1347, loss: 0.3423265218734741, mean loss: 0.3556408634446106
Epoch: 18, step: 1348, loss: 0.30505141615867615, mean loss: 0.35563901313016394
Epoch: 18, step: 1349, loss: 0.32331565022468567, mean loss: 0.35563783094294626
Epoch: 18, step: 1350, loss: 0.30975469946861267, mean loss: 0.3556361528852542
Epoch: 18, step: 1351, loss: 0.3178865313529968, mean loss: 0.35563477234028884
Epoch: 18, step: 1352, loss: 0.3711705803871155, mean loss: 0.355635340481011
Epoch: 18, step: 1353, loss: 0.3299885094165802, mean loss: 0.3556344026169334
Epoch: 18, step: 1354, loss: 0.31428253650665283, mean loss: 0.3556328904998416
Epoch: 18, step: 1355, loss: 0.3270178735256195, mean loss: 0.35563184417042176
Epoch: 18, step: 1356, loss: 0.3201308250427246, mean loss: 0.35563054609666667
Epoch: 18, step: 1357, loss: 0.3133794963359833, mean loss: 0.35562900126852187
Epoch: 18, step: 1358, loss: 0.3619499206542969, mean loss: 0.35562923237229815
Epoch: 18, step: 1359, loss: 0.359464168548584, mean loss: 0.3556293725790902
Epoch: 18, step: 1360, loss: 0.2950171232223511, mean loss: 0.3556271566521587
Epoch: 18, step: 1361, loss: 0.32915574312210083, mean loss: 0.35562618891751185
Epoch: 18, step: 1362, loss: 0.35979780554771423, mean loss: 0.3556263414167489
Epoch: 18, step: 1363, loss: 0.3109300136566162, mean loss: 0.35562470754016756
Epoch: 18, step: 1364, loss: 0.33186668157577515, mean loss: 0.3556238390960412
Epoch: 18, step: 1365, loss: 0.3032219111919403, mean loss: 0.3556219236808828
Epoch: 18, step: 1366, loss: 0.32109054923057556, mean loss: 0.35562066152311206
Epoch: 18, step: 1367, loss: 0.3049403727054596, mean loss: 0.3556188091733746
Epoch: 18, step: 1368, loss: 0.34711769223213196, mean loss: 0.35561849847139215
Epoch: 18, step: 1369, loss: 0.293995201587677, mean loss: 0.3556162463225403
Epoch: 18, step: 1370, loss: 0.35083526372909546, mean loss: 0.3556160715981828
Epoch: 18, step: 1371, loss: 0.3440319895744324, mean loss: 0.35561564826526276
Epoch: 18, step: 1372, loss: 0.327715665102005, mean loss: 0.3556146287153573
Epoch: 18, step: 1373, loss: 0.3632306456565857, mean loss: 0.3556149070175184
Epoch: 18, step: 1374, loss: 0.36410537362098694, mean loss: 0.3556152172622147
Epoch: 18, step: 1375, loss: 0.3291662633419037, mean loss: 0.35561425084326115
Epoch: 18, step: 1376, loss: 0.35463500022888184, mean loss: 0.3556142150637071
Epoch: 18, step: 1377, loss: 0.32045215368270874, mean loss: 0.35561293037019664
Epoch: 18, step: 1378, loss: 0.3221432566642761, mean loss: 0.35561170755503807
Epoch: 18, step: 1379, loss: 0.30240339040756226, mean loss: 0.3556097636591902
Epoch: 18, step: 1380, loss: 0.31646928191185, mean loss: 0.35560833376543555
Epoch: 18, step: 1381, loss: 0.34235870838165283, mean loss: 0.35560784974317416
Epoch: 18, step: 1382, loss: 0.33637017011642456, mean loss: 0.35560714699688645
Epoch: 18, step: 1383, loss: 0.3054640293121338, mean loss: 0.35560531535173434
Epoch: 18, step: 1384, loss: 0.3145574927330017, mean loss: 0.35560381599743623
Epoch: 18, step: 1385, loss: 0.2972821593284607, mean loss: 0.3556016857594105
Epoch: 18, step: 1386, loss: 0.37383243441581726, mean loss: 0.3556023516255362
Epoch: 18, step: 1387, loss: 0.33857622742652893, mean loss: 0.3556017297802404
Epoch: 18, step: 1388, loss: 0.30891135334968567, mean loss: 0.3556000245694581
Epoch: 18, step: 1389, loss: 0.32863736152648926, mean loss: 0.3555990398837871
Epoch: 18, step: 1390, loss: 0.3354215919971466, mean loss: 0.3555983030234034
Epoch: 18, step: 1391, loss: 0.3100436329841614, mean loss: 0.35559663947278847
Epoch: 18, step: 1392, loss: 0.32522454857826233, mean loss: 0.35559553039515857
Epoch: 18, step: 1393, loss: 0.3048803210258484, mean loss: 0.35559367852889956
Epoch: 18, step: 1394, loss: 0.3573346436023712, mean loss: 0.3555937420979313
Epoch: 18, step: 1395, loss: 0.3432152569293976, mean loss: 0.35559329013045765
Epoch: 18, step: 1396, loss: 0.3601313531398773, mean loss: 0.3555934558197128
Epoch: 18, step: 1397, loss: 0.32943934202194214, mean loss: 0.35559250094151645
Epoch: 18, step: 1398, loss: 0.3379874527454376, mean loss: 0.35559185821039324
Epoch: 18, step: 1399, loss: 0.3387855887413025, mean loss: 0.3555912446637567
Epoch: 18, step: 1400, loss: 0.315147340297699, mean loss: 0.35558976823166216
Epoch: 18, step: 1401, loss: 0.374800443649292, mean loss: 0.3555904695047664
Epoch: 18, step: 1402, loss: 0.3604147136211395, mean loss: 0.3555906456042049
Epoch: 18, step: 1403, loss: 0.3492550849914551, mean loss: 0.3555904143456046
Epoch: 18, step: 1404, loss: 0.33998093008995056, mean loss: 0.35558984459401666
Epoch: 18, step: 1405, loss: 0.3584316074848175, mean loss: 0.3555899483155617
Epoch: 18, step: 1406, loss: 0.3419375419616699, mean loss: 0.3555894500343706
Epoch: 18, step: 1407, loss: 0.3301709294319153, mean loss: 0.3555885223511369
Epoch: 18, step: 1408, loss: 0.328321248292923, mean loss: 0.35558752723146764
Epoch: 18, step: 1409, loss: 0.33655276894569397, mean loss: 0.3555868325829644
Epoch: 18, step: 1410, loss: 0.32407060265541077, mean loss: 0.35558568248151834
Epoch: 18, step: 1411, loss: 0.3447403013706207, mean loss: 0.35558528672246453
Epoch: 18, step: 1412, loss: 0.30517277121543884, mean loss: 0.35558344718531776
Epoch: 18, step: 1413, loss: 0.3311556875705719, mean loss: 0.35558255585642573
Epoch: 18, step: 1414, loss: 0.2925419807434082, mean loss: 0.35558025569314217
Epoch: 18, step: 1415, loss: 0.3389401435852051, mean loss: 0.35557964856704366
Epoch: 18, step: 1416, loss: 0.34269261360168457, mean loss: 0.3555791783917375
Epoch: 18, step: 1417, loss: 0.3123374283313751, mean loss: 0.3555776008014398
Epoch: 18, step: 1418, loss: 0.36992451548576355, mean loss: 0.3555781242013407
Epoch: 18, step: 1419, loss: 0.38485187292099, mean loss: 0.3555791921186295
Epoch: 18, step: 1420, loss: 0.36975547671318054, mean loss: 0.3555797092559218
Epoch: 18, step: 1421, loss: 0.3191544711589813, mean loss: 0.3555783805465727
Epoch: 18, step: 1422, loss: 0.3184863030910492, mean loss: 0.3555770275618032
Epoch: 18, step: 1423, loss: 0.35493403673171997, mean loss: 0.3555770041086798
Epoch: 18, step: 1424, loss: 0.3372775912284851, mean loss: 0.35557633666100574
Epoch: 18, step: 1425, loss: 0.3347949683666229, mean loss: 0.35557557871482826
Epoch: 18, step: 1426, loss: 0.31956273317337036, mean loss: 0.35557426528817004
Epoch: 18, step: 1427, loss: 0.3605495095252991, mean loss: 0.3555744467339847
Epoch: 18, step: 1428, loss: 0.3391028046607971, mean loss: 0.3555738460395507
Epoch: 18, step: 1429, loss: 0.3557089567184448, mean loss: 0.35557385096664135
Epoch: 18, step: 1430, loss: 0.33886370062828064, mean loss: 0.35557324161863646
Epoch: 18, step: 1431, loss: 0.3155745267868042, mean loss: 0.35557178308906995
Epoch: 18, step: 1432, loss: 0.3452807366847992, mean loss: 0.35557140784581
Epoch: 18, step: 1433, loss: 0.3068503141403198, mean loss: 0.3555696313893925
Epoch: 18, step: 1434, loss: 0.3511256277561188, mean loss: 0.35556946935914374
Epoch: 18, step: 1435, loss: 0.3403102457523346, mean loss: 0.3555689130216927
Epoch: 18, step: 1436, loss: 0.35205239057540894, mean loss: 0.3555687848171484
Epoch: 18, step: 1437, loss: 0.334497332572937, mean loss: 0.35556801662712856
Epoch: 18, step: 1438, loss: 0.3534824252128601, mean loss: 0.35556794059667346
Epoch: 18, step: 1439, loss: 0.3074716627597809, mean loss: 0.3555661873057054
Epoch: 18, step: 1440, loss: 0.33876508474349976, mean loss: 0.35556557486439155
Epoch: 18, step: 1441, loss: 0.37680020928382874, mean loss: 0.35556634889057875
Epoch: 18, step: 1442, loss: 0.32238638401031494, mean loss: 0.35556513948781293
Epoch: 18, step: 1443, loss: 0.34038251638412476, mean loss: 0.35556458610455355
Valid: 18, mean loss: 0.18850411474704742
Epoch: 19, step: 0, loss: 0.31823667883872986, mean loss: 0.3555632256093367
Epoch: 19, step: 1, loss: 0.3152291178703308, mean loss: 0.3555617556003076
Epoch: 19, step: 2, loss: 0.3138526678085327, mean loss: 0.35556023553442356
Epoch: 19, step: 3, loss: 0.3145991563796997, mean loss: 0.3555587427837255
Epoch: 19, step: 4, loss: 0.3127085566520691, mean loss: 0.3555571812449284
Epoch: 19, step: 5, loss: 0.3182828426361084, mean loss: 0.35555582294966537
Epoch: 19, step: 6, loss: 0.301207959651947, mean loss: 0.35555384255891737
Epoch: 19, step: 7, loss: 0.3659036457538605, mean loss: 0.3555542196833597
Epoch: 19, step: 8, loss: 0.3140818476676941, mean loss: 0.35555270857488763
Epoch: 19, step: 9, loss: 0.3727235198020935, mean loss: 0.3555533341965165
Epoch: 19, step: 10, loss: 0.31620290875434875, mean loss: 0.35555190050884783
Epoch: 19, step: 11, loss: 0.3630025386810303, mean loss: 0.3555521719544239
Epoch: 19, step: 12, loss: 0.3678617477416992, mean loss: 0.3555526204070374
Epoch: 19, step: 13, loss: 0.31887736916542053, mean loss: 0.3555512843323109
Epoch: 19, step: 14, loss: 0.29827988147735596, mean loss: 0.35554919801841145
Epoch: 19, step: 15, loss: 0.324224054813385, mean loss: 0.35554805693057795
Epoch: 19, step: 16, loss: 0.3454112708568573, mean loss: 0.35554768768910805
Epoch: 19, step: 17, loss: 0.3880205750465393, mean loss: 0.3555488704998955
Epoch: 19, step: 18, loss: 0.30793100595474243, mean loss: 0.35554713610308086
Epoch: 19, step: 19, loss: 0.3476608693599701, mean loss: 0.35554684887017207
Epoch: 19, step: 20, loss: 0.3367621898651123, mean loss: 0.3555461647219037
Epoch: 19, step: 21, loss: 0.32063356041908264, mean loss: 0.35554489323074256
Epoch: 19, step: 22, loss: 0.3291461169719696, mean loss: 0.35554393184189886
Epoch: 19, step: 23, loss: 0.3061753511428833, mean loss: 0.35554213400574813
Epoch: 19, step: 24, loss: 0.3208252489566803, mean loss: 0.3555408697806635
Epoch: 19, step: 25, loss: 0.308151513338089, mean loss: 0.35553914414682614
Epoch: 19, step: 26, loss: 0.3335084617137909, mean loss: 0.35553834195178435
Epoch: 19, step: 27, loss: 0.3165489137172699, mean loss: 0.3555369222959354
Epoch: 19, step: 28, loss: 0.3390515446662903, mean loss: 0.3555363220637261
Epoch: 19, step: 29, loss: 0.3467622399330139, mean loss: 0.35553600261123464
Epoch: 19, step: 30, loss: 0.3298380374908447, mean loss: 0.3555350670170627
Epoch: 19, step: 31, loss: 0.293544739484787, mean loss: 0.35553281019721666
Epoch: 19, step: 32, loss: 0.3445708155632019, mean loss: 0.3555324111293717
Epoch: 19, step: 33, loss: 0.34145477414131165, mean loss: 0.3555318986562378
Epoch: 19, step: 34, loss: 0.32945314049720764, mean loss: 0.35553094933665863
Epoch: 19, step: 35, loss: 0.36833110451698303, mean loss: 0.35553141527125315
Epoch: 19, step: 36, loss: 0.33217960596084595, mean loss: 0.3555305652800141
Epoch: 19, step: 37, loss: 0.36164137721061707, mean loss: 0.3555307877016466
Epoch: 19, step: 38, loss: 0.36775416135787964, mean loss: 0.3555312325924075
Epoch: 19, step: 39, loss: 0.341383695602417, mean loss: 0.35553071768714506
Epoch: 19, step: 40, loss: 0.35285916924476624, mean loss: 0.35553062045861056
Epoch: 19, step: 41, loss: 0.30809009075164795, mean loss: 0.3555288939672463
Epoch: 19, step: 42, loss: 0.3417949378490448, mean loss: 0.35552839416899606
Epoch: 19, step: 43, loss: 0.33880019187927246, mean loss: 0.3555277854280103
Epoch: 19, step: 44, loss: 0.35037851333618164, mean loss: 0.3555275980522928
Epoch: 19, step: 45, loss: 0.32844653725624084, mean loss: 0.35552661264144947
Epoch: 19, step: 46, loss: 0.33643195033073425, mean loss: 0.35552591786059184
Epoch: 19, step: 47, loss: 0.30795344710350037, mean loss: 0.35552418694548643
Epoch: 19, step: 48, loss: 0.4280831515789032, mean loss: 0.3555268268932628
Epoch: 19, step: 49, loss: 0.29999470710754395, mean loss: 0.35552480651489615
Epoch: 19, step: 50, loss: 0.3224419057369232, mean loss: 0.35552360293135565
Epoch: 19, step: 51, loss: 0.35410308837890625, mean loss: 0.3555235512537308
Epoch: 19, step: 52, loss: 0.33995503187179565, mean loss: 0.35552298489921147
Epoch: 19, step: 53, loss: 0.358354389667511, mean loss: 0.35552308789683856
Epoch: 19, step: 54, loss: 0.3219183087348938, mean loss: 0.35552186550481346
Epoch: 19, step: 55, loss: 0.30882248282432556, mean loss: 0.3555201668512895
Epoch: 19, step: 56, loss: 0.34432196617126465, mean loss: 0.3555197595403129
Epoch: 19, step: 57, loss: 0.3259443938732147, mean loss: 0.35551868383777174
Epoch: 19, step: 58, loss: 0.34330180287361145, mean loss: 0.3555182395067674
Epoch: 19, step: 59, loss: 0.33208128809928894, mean loss: 0.3555173871300069
Epoch: 19, step: 60, loss: 0.35894113779067993, mean loss: 0.3555175116436142
Epoch: 19, step: 61, loss: 0.34651979804039, mean loss: 0.35551718443023134
Epoch: 19, step: 62, loss: 0.3229255676269531, mean loss: 0.3555159992374315
Epoch: 19, step: 63, loss: 0.39140546321868896, mean loss: 0.355517304308849
Epoch: 19, step: 64, loss: 0.3423078954219818, mean loss: 0.355516823984174
Epoch: 19, step: 65, loss: 0.33672210574150085, mean loss: 0.3555161405895757
Epoch: 19, step: 66, loss: 0.3369169235229492, mean loss: 0.3555154643281836
Epoch: 19, step: 67, loss: 0.3989807665348053, mean loss: 0.3555170446547618
Epoch: 19, step: 68, loss: 0.35106614232063293, mean loss: 0.35551688283318994
Epoch: 19, step: 69, loss: 0.3313824534416199, mean loss: 0.3555160054090137
Epoch: 19, step: 70, loss: 0.31382331252098083, mean loss: 0.35551448969690813
Epoch: 19, step: 71, loss: 0.30719396471977234, mean loss: 0.3555127330979196
Epoch: 19, step: 72, loss: 0.3588498830795288, mean loss: 0.35551285440912617
Epoch: 19, step: 73, loss: 0.334879606962204, mean loss: 0.3555121043819562
Epoch: 19, step: 74, loss: 0.3305381238460541, mean loss: 0.3555111966003221
Epoch: 19, step: 75, loss: 0.3286290168762207, mean loss: 0.3555102194928881
Epoch: 19, step: 76, loss: 0.3102356195449829, mean loss: 0.35550857392170543
Epoch: 19, step: 77, loss: 0.32513853907585144, mean loss: 0.355507470118738
Epoch: 19, step: 78, loss: 0.338452011346817, mean loss: 0.3555068502583429
Epoch: 19, step: 79, loss: 0.33642274141311646, mean loss: 0.3555061566942767
Epoch: 19, step: 80, loss: 0.34019389748573303, mean loss: 0.35550560022884775
Epoch: 19, step: 81, loss: 0.3527768552303314, mean loss: 0.35550550106666307
Epoch: 19, step: 82, loss: 0.3187868297100067, mean loss: 0.3555041667641318
Epoch: 19, step: 83, loss: 0.3017931580543518, mean loss: 0.3555022150559665
Epoch: 19, step: 84, loss: 0.32768720388412476, mean loss: 0.35550120437280924
Epoch: 19, step: 85, loss: 0.317484974861145, mean loss: 0.355499823069506
Epoch: 19, step: 86, loss: 0.2850382626056671, mean loss: 0.35549726297211603
Epoch: 19, step: 87, loss: 0.3836468458175659, mean loss: 0.35549828570074726
Epoch: 19, step: 88, loss: 0.3103621304035187, mean loss: 0.3554966458767583
Epoch: 19, step: 89, loss: 0.3767518401145935, mean loss: 0.3554974180628455
Epoch: 19, step: 90, loss: 0.3148089051246643, mean loss: 0.3554959399318128
Epoch: 19, step: 91, loss: 0.32284092903137207, mean loss: 0.3554947536846862
Epoch: 19, step: 92, loss: 0.42107540369033813, mean loss: 0.3554971359234165
Epoch: 19, step: 93, loss: 0.3597400486469269, mean loss: 0.3554972900430214
Epoch: 19, step: 94, loss: 0.3145354390144348, mean loss: 0.3554958021983725
Epoch: 19, step: 95, loss: 0.4129515290260315, mean loss: 0.3554978890691711
Epoch: 19, step: 96, loss: 0.3346000611782074, mean loss: 0.35549713005896916
Epoch: 19, step: 97, loss: 0.29469048976898193, mean loss: 0.3554949216388235
Epoch: 19, step: 98, loss: 0.3246123194694519, mean loss: 0.355493800062569
Epoch: 19, step: 99, loss: 0.320906400680542, mean loss: 0.35549254398327707
Epoch: 19, step: 100, loss: 0.38548001646995544, mean loss: 0.3554936329716377
Epoch: 19, step: 101, loss: 0.30869260430336, mean loss: 0.3554919334644597
Epoch: 19, step: 102, loss: 0.3527164161205292, mean loss: 0.3554918326794877
Epoch: 19, step: 103, loss: 0.3471033573150635, mean loss: 0.3554915280870634
Epoch: 19, step: 104, loss: 0.31102612614631653, mean loss: 0.35548991357045395
Epoch: 19, step: 105, loss: 0.3293958306312561, mean loss: 0.35548896614169284
Epoch: 19, step: 106, loss: 0.30448204278945923, mean loss: 0.3554871142401806
Epoch: 19, step: 107, loss: 0.3411746323108673, mean loss: 0.3554865946176882
Epoch: 19, step: 108, loss: 0.3602994978427887, mean loss: 0.3554867693464312
Epoch: 19, step: 109, loss: 0.32681870460510254, mean loss: 0.3554857286122142
Epoch: 19, step: 110, loss: 0.3302443325519562, mean loss: 0.35548481230931156
Epoch: 19, step: 111, loss: 0.3453492224216461, mean loss: 0.3554844443846024
Epoch: 19, step: 112, loss: 0.35304343700408936, mean loss: 0.3554843557785775
Epoch: 19, step: 113, loss: 0.33381950855255127, mean loss: 0.3554835693957381
Epoch: 19, step: 114, loss: 0.3110116422176361, mean loss: 0.35548195522829673
Epoch: 19, step: 115, loss: 0.3413447439670563, mean loss: 0.35548144211813193
Epoch: 19, step: 116, loss: 0.4001237452030182, mean loss: 0.35548306235197524
Epoch: 19, step: 117, loss: 0.35471585392951965, mean loss: 0.35548303450816227
Epoch: 19, step: 118, loss: 0.33586153388023376, mean loss: 0.3554823224232184
Epoch: 19, step: 119, loss: 0.3285980522632599, mean loss: 0.35548134680011784
Epoch: 19, step: 120, loss: 0.3413705825805664, mean loss: 0.35548083474277414
Epoch: 19, step: 121, loss: 0.32681360840797424, mean loss: 0.35547979449216327
Epoch: 19, step: 122, loss: 0.371127188205719, mean loss: 0.35548036227015645
Epoch: 19, step: 123, loss: 0.3780446946620941, mean loss: 0.35548118100500375
Epoch: 19, step: 124, loss: 0.3353568911552429, mean loss: 0.3554804508323014
Epoch: 19, step: 125, loss: 0.3315490782260895, mean loss: 0.35547958255813383
Epoch: 19, step: 126, loss: 0.37684205174446106, mean loss: 0.3554803575996455
Epoch: 19, step: 127, loss: 0.31024783849716187, mean loss: 0.3554787165998232
Epoch: 19, step: 128, loss: 0.34734731912612915, mean loss: 0.3554784216098913
Epoch: 19, step: 129, loss: 0.3069285452365875, mean loss: 0.35547666038677683
Epoch: 19, step: 130, loss: 0.30833977460861206, mean loss: 0.3554749504841477
Epoch: 19, step: 131, loss: 0.3273281455039978, mean loss: 0.3554739294886101
Epoch: 19, step: 132, loss: 0.3119713366031647, mean loss: 0.3554723515353697
Epoch: 19, step: 133, loss: 0.32991668581962585, mean loss: 0.35547142459791176
Epoch: 19, step: 134, loss: 0.31451794505119324, mean loss: 0.3554699392154611
Epoch: 19, step: 135, loss: 0.34018659591674805, mean loss: 0.3554693849087986
Epoch: 19, step: 136, loss: 0.327293336391449, mean loss: 0.3554683630378191
Epoch: 19, step: 137, loss: 0.3172230124473572, mean loss: 0.3554669760301093
Epoch: 19, step: 138, loss: 0.3214486539363861, mean loss: 0.35546574236475686
Epoch: 19, step: 139, loss: 0.32445624470710754, mean loss: 0.3554646178543979
Epoch: 19, step: 140, loss: 0.389367938041687, mean loss: 0.35546584726006886
Epoch: 19, step: 141, loss: 0.29261088371276855, mean loss: 0.35546356808958707
Epoch: 19, step: 142, loss: 0.33229175209999084, mean loss: 0.35546272789175576
Epoch: 19, step: 143, loss: 0.3216366767883301, mean loss: 0.35546150142144745
Epoch: 19, step: 144, loss: 0.34141993522644043, mean loss: 0.3554609923185797
Epoch: 19, step: 145, loss: 0.34668979048728943, mean loss: 0.3554606743140176
Epoch: 19, step: 146, loss: 0.3167639374732971, mean loss: 0.35545927139421774
Epoch: 19, step: 147, loss: 0.3515884280204773, mean loss: 0.3554591310649191
Epoch: 19, step: 148, loss: 0.3615571856498718, mean loss: 0.3554593521290694
Epoch: 19, step: 149, loss: 0.3022908568382263, mean loss: 0.3554574247566598
Epoch: 19, step: 150, loss: 0.40715235471725464, mean loss: 0.3554592986439966
Epoch: 19, step: 151, loss: 0.31991663575172424, mean loss: 0.3554580103062087
Epoch: 19, step: 152, loss: 0.33219650387763977, mean loss: 0.355457167161969
Epoch: 19, step: 153, loss: 0.31613603234291077, mean loss: 0.35545574196679613
Epoch: 19, step: 154, loss: 0.3028987646102905, mean loss: 0.3554538371073363
Epoch: 19, step: 155, loss: 0.3595614731311798, mean loss: 0.35545398597787936
Epoch: 19, step: 156, loss: 0.33514633774757385, mean loss: 0.3554532500068639
Epoch: 19, step: 157, loss: 0.2997882068157196, mean loss: 0.35545123271893203
Epoch: 19, step: 158, loss: 0.3194120228290558, mean loss: 0.35544992671386266
Epoch: 19, step: 159, loss: 0.32845765352249146, mean loss: 0.355448948591193
Epoch: 19, step: 160, loss: 0.3435494899749756, mean loss: 0.35544851740452
Epoch: 19, step: 161, loss: 0.313366174697876, mean loss: 0.355446992571463
Epoch: 19, step: 162, loss: 0.35738837718963623, mean loss: 0.35544706291403405
Epoch: 19, step: 163, loss: 0.312845915555954, mean loss: 0.3554455193942022
Epoch: 19, step: 164, loss: 0.32478073239326477, mean loss: 0.35544440839144864
Epoch: 19, step: 165, loss: 0.31403547525405884, mean loss: 0.3554429081764955
Epoch: 19, step: 166, loss: 0.3526122570037842, mean loss: 0.355442805627817
Epoch: 19, step: 167, loss: 0.36412978172302246, mean loss: 0.355443120327719
Epoch: 19, step: 168, loss: 0.3247915208339691, mean loss: 0.35544200996367287
Epoch: 19, step: 169, loss: 0.329802542924881, mean loss: 0.3554410811993811
Epoch: 19, step: 170, loss: 0.31897464394569397, mean loss: 0.3554397602866686
Epoch: 19, step: 171, loss: 0.3625076115131378, mean loss: 0.35544001629402977
Epoch: 19, step: 172, loss: 0.31032460927963257, mean loss: 0.35543838221068685
Epoch: 19, step: 173, loss: 0.34862908720970154, mean loss: 0.3554381355864565
Epoch: 19, step: 174, loss: 0.3759765028953552, mean loss: 0.3554388794337387
Epoch: 19, step: 175, loss: 0.36284926533699036, mean loss: 0.35543914780929653
Epoch: 19, step: 176, loss: 0.3785027861595154, mean loss: 0.3554399830549544
Epoch: 19, step: 177, loss: 0.32317933440208435, mean loss: 0.3554388147834742
Epoch: 19, step: 178, loss: 0.31976673007011414, mean loss: 0.35543752301868287
Epoch: 19, step: 179, loss: 0.32211530208587646, mean loss: 0.3554363163913316
Epoch: 19, step: 180, loss: 0.361421138048172, mean loss: 0.35543653309921647
Epoch: 19, step: 181, loss: 0.2951529026031494, mean loss: 0.35543435033324877
Epoch: 19, step: 182, loss: 0.30521661043167114, mean loss: 0.3554325321016002
Epoch: 19, step: 183, loss: 0.29877427220344543, mean loss: 0.35543048075258143
Epoch: 19, step: 184, loss: 0.34016403555870056, mean loss: 0.35542992804105056
Epoch: 19, step: 185, loss: 0.31391623616218567, mean loss: 0.3554284251197603
Epoch: 19, step: 186, loss: 0.33963367342948914, mean loss: 0.3554278533226459
Epoch: 19, step: 187, loss: 0.3124299943447113, mean loss: 0.3554262967827177
Epoch: 19, step: 188, loss: 0.3211400806903839, mean loss: 0.3554250556527234
Epoch: 19, step: 189, loss: 0.3341699540615082, mean loss: 0.35542428626513234
Epoch: 19, step: 190, loss: 0.34350618720054626, mean loss: 0.3554238548719639
Epoch: 19, step: 191, loss: 0.3002336025238037, mean loss: 0.35542185725171094
Epoch: 19, step: 192, loss: 0.32520878314971924, mean loss: 0.3554207637241094
Epoch: 19, step: 193, loss: 0.3177421987056732, mean loss: 0.3554194000409745
Epoch: 19, step: 194, loss: 0.30712196230888367, mean loss: 0.3554176520970806
Epoch: 19, step: 195, loss: 0.3387516140937805, mean loss: 0.3554170489544198
Epoch: 19, step: 196, loss: 0.31338366866111755, mean loss: 0.3554155278246006
Epoch: 19, step: 197, loss: 0.2999840974807739, mean loss: 0.35541352191049685
Epoch: 19, step: 198, loss: 0.3397088348865509, mean loss: 0.3554129536207547
Epoch: 19, step: 199, loss: 0.3496062755584717, mean loss: 0.3554127435079286
Epoch: 19, step: 200, loss: 0.3057345747947693, mean loss: 0.3554109459840037
Epoch: 19, step: 201, loss: 0.3505145311355591, mean loss: 0.3554107688215879
Epoch: 19, step: 202, loss: 0.32199063897132874, mean loss: 0.35540955965592164
Epoch: 19, step: 203, loss: 0.3371729254722595, mean loss: 0.3554088998645257
Epoch: 19, step: 204, loss: 0.36872705817222595, mean loss: 0.355409381690737
Epoch: 19, step: 205, loss: 0.33637163043022156, mean loss: 0.35540869296520117
Epoch: 19, step: 206, loss: 0.32459893822669983, mean loss: 0.35540757840619025
Epoch: 19, step: 207, loss: 0.30577293038368225, mean loss: 0.3554057829117603
Epoch: 19, step: 208, loss: 0.37378910183906555, mean loss: 0.3554064478898369
Epoch: 19, step: 209, loss: 0.3338165581226349, mean loss: 0.35540566694902204
Epoch: 19, step: 210, loss: 0.3803881108760834, mean loss: 0.3554065705712569
Epoch: 19, step: 211, loss: 0.30219048261642456, mean loss: 0.35540464579955716
Epoch: 19, step: 212, loss: 0.36430707573890686, mean loss: 0.35540496777973507
Epoch: 19, step: 213, loss: 0.31073346734046936, mean loss: 0.35540335217393254
Epoch: 19, step: 214, loss: 0.34033912420272827, mean loss: 0.3554028073752645
Epoch: 19, step: 215, loss: 0.3105805516242981, mean loss: 0.35540118643443736
Epoch: 19, step: 216, loss: 0.33067166805267334, mean loss: 0.3554002921546709
Epoch: 19, step: 217, loss: 0.32542884349823, mean loss: 0.35539920835309946
Epoch: 19, step: 218, loss: 0.35603851079940796, mean loss: 0.35539923147016494
Epoch: 19, step: 219, loss: 0.3268206715583801, mean loss: 0.3553981981117649
Epoch: 19, step: 220, loss: 0.3481418490409851, mean loss: 0.3553979357424164
Epoch: 19, step: 221, loss: 0.3033376634120941, mean loss: 0.35539605345619435
Epoch: 19, step: 222, loss: 0.3410991132259369, mean loss: 0.3553955365560812
Epoch: 19, step: 223, loss: 0.33194372057914734, mean loss: 0.35539468869577834
Epoch: 19, step: 224, loss: 0.29945477843284607, mean loss: 0.35539266635709704
Epoch: 19, step: 225, loss: 0.3496789336204529, mean loss: 0.355392459801796
Epoch: 19, step: 226, loss: 0.33013153076171875, mean loss: 0.355391546635146
Epoch: 19, step: 227, loss: 0.3538908362388611, mean loss: 0.35539149238737283
Epoch: 19, step: 228, loss: 0.32701408863067627, mean loss: 0.3553904666362882
Epoch: 19, step: 229, loss: 0.3701454997062683, mean loss: 0.35539099996358775
Epoch: 19, step: 230, loss: 0.30951422452926636, mean loss: 0.3553893417868633
Epoch: 19, step: 231, loss: 0.34486690163612366, mean loss: 0.3553889614760295
Epoch: 19, step: 232, loss: 0.336754709482193, mean loss: 0.3553882880056477
Epoch: 19, step: 233, loss: 0.3180292546749115, mean loss: 0.35538693784181213
Epoch: 19, step: 234, loss: 0.2956830859184265, mean loss: 0.35538478020920317
Epoch: 19, step: 235, loss: 0.3194257915019989, mean loss: 0.35538348073722037
Epoch: 19, step: 236, loss: 0.34759801626205444, mean loss: 0.3553831993992926
Epoch: 19, step: 237, loss: 0.3392546772956848, mean loss: 0.35538261659514053
Epoch: 19, step: 238, loss: 0.3326111435890198, mean loss: 0.35538179377768775
Epoch: 19, step: 239, loss: 0.33283764123916626, mean loss: 0.3553809792035969
Epoch: 19, step: 240, loss: 0.3202435374259949, mean loss: 0.3553797096497516
Epoch: 19, step: 241, loss: 0.30604055523872375, mean loss: 0.35537792703704796
Epoch: 19, step: 242, loss: 0.3086000382900238, mean loss: 0.3553762370233644
Epoch: 19, step: 243, loss: 0.3332626521587372, mean loss: 0.3553754381221771
Epoch: 19, step: 244, loss: 0.3470008969306946, mean loss: 0.35537513558465345
Epoch: 19, step: 245, loss: 0.33775728940963745, mean loss: 0.3553744991477567
Epoch: 19, step: 246, loss: 0.31975850462913513, mean loss: 0.35537321258219234
Epoch: 19, step: 247, loss: 0.3729257583618164, mean loss: 0.3553738466143329
Epoch: 19, step: 248, loss: 0.32519885897636414, mean loss: 0.3553727566743785
Epoch: 19, step: 249, loss: 0.3767877519130707, mean loss: 0.3553735301698361
Epoch: 19, step: 250, loss: 0.33943918347358704, mean loss: 0.3553729546525646
Epoch: 19, step: 251, loss: 0.3507556617259979, mean loss: 0.355372787891046
Epoch: 19, step: 252, loss: 0.31838566064834595, mean loss: 0.35537145208522986
Epoch: 19, step: 253, loss: 0.2981981635093689, mean loss: 0.3553693873221899
Epoch: 19, step: 254, loss: 0.3295406103134155, mean loss: 0.355368454572307
Epoch: 19, step: 255, loss: 0.3049386739730835, mean loss: 0.35536663347666203
Epoch: 19, step: 256, loss: 0.33959630131721497, mean loss: 0.3553660640066819
Epoch: 19, step: 257, loss: 0.3158513605594635, mean loss: 0.35536463717403055
Epoch: 19, step: 258, loss: 0.323529988527298, mean loss: 0.35536348770125037
Epoch: 19, step: 259, loss: 0.3138965666294098, mean loss: 0.355361990484285
Epoch: 19, step: 260, loss: 0.3303661346435547, mean loss: 0.35536108800907684
Epoch: 19, step: 261, loss: 0.3544285297393799, mean loss: 0.35536105434028237
Epoch: 19, step: 262, loss: 0.3119787573814392, mean loss: 0.35535948813583607
Epoch: 19, step: 263, loss: 0.3740707337856293, mean loss: 0.3553601636320689
Epoch: 19, step: 264, loss: 0.3183501660823822, mean loss: 0.35535882757930726
Epoch: 19, step: 265, loss: 0.29963791370391846, mean loss: 0.3553568161391991
Epoch: 19, step: 266, loss: 0.37562260031700134, mean loss: 0.35535754767672856
Epoch: 19, step: 267, loss: 0.32090744376182556, mean loss: 0.3553563041702344
Epoch: 19, step: 268, loss: 0.34360724687576294, mean loss: 0.35535588009308966
Epoch: 19, step: 269, loss: 0.362148642539978, mean loss: 0.3553561252660647
Epoch: 19, step: 270, loss: 0.386154443025589, mean loss: 0.3553572368377888
Epoch: 19, step: 271, loss: 0.3383498787879944, mean loss: 0.3553566230310164
Epoch: 19, step: 272, loss: 0.3512648642063141, mean loss: 0.3553564753620704
Epoch: 19, step: 273, loss: 0.3830215632915497, mean loss: 0.3553574737412811
Epoch: 19, step: 274, loss: 0.3278835415840149, mean loss: 0.3553564822962897
Epoch: 19, step: 275, loss: 0.3013702929019928, mean loss: 0.3553545341803329
Epoch: 19, step: 276, loss: 0.31120601296424866, mean loss: 0.35535294111854904
Epoch: 19, step: 277, loss: 0.32297879457473755, mean loss: 0.35535177296719794
Epoch: 19, step: 278, loss: 0.3308980166912079, mean loss: 0.3553508906379078
Epoch: 19, step: 279, loss: 0.3192567527294159, mean loss: 0.35534958835266073
Epoch: 19, step: 280, loss: 0.39406833052635193, mean loss: 0.35535098528386444
Epoch: 19, step: 281, loss: 0.328946977853775, mean loss: 0.3553500326896141
Epoch: 19, step: 282, loss: 0.3309701979160309, mean loss: 0.3553491531544659
Epoch: 19, step: 283, loss: 0.3077070116996765, mean loss: 0.3553474344624942
Epoch: 19, step: 284, loss: 0.3196239471435547, mean loss: 0.35534614578288964
Epoch: 19, step: 285, loss: 0.3045111894607544, mean loss: 0.355344312042311
Epoch: 19, step: 286, loss: 0.3394511044025421, mean loss: 0.355343738756316
Epoch: 19, step: 287, loss: 0.3176770806312561, mean loss: 0.3553423801263158
Epoch: 19, step: 288, loss: 0.3322087228298187, mean loss: 0.3553415457292988
Epoch: 19, step: 289, loss: 0.365415096282959, mean loss: 0.35534190905435664
Epoch: 19, step: 290, loss: 0.3549553453922272, mean loss: 0.35534189511257924
Epoch: 19, step: 291, loss: 0.30293765664100647, mean loss: 0.35534000517322295
Epoch: 19, step: 292, loss: 0.3504268527030945, mean loss: 0.3553398279885978
Epoch: 19, step: 293, loss: 0.3062540292739868, mean loss: 0.35533805785521466
Epoch: 19, step: 294, loss: 0.36717501282691956, mean loss: 0.3553384847044077
Epoch: 19, step: 295, loss: 0.3554629683494568, mean loss: 0.3553384891932165
Epoch: 19, step: 296, loss: 0.3411710560321808, mean loss: 0.3553379783421307
Epoch: 19, step: 297, loss: 0.3057534694671631, mean loss: 0.3553361904821439
Epoch: 19, step: 298, loss: 0.3256828784942627, mean loss: 0.35533512131639705
Epoch: 19, step: 299, loss: 0.3544240891933441, mean loss: 0.3553350884698394
Epoch: 19, step: 300, loss: 0.32762131094932556, mean loss: 0.3553340893070777
Epoch: 19, step: 301, loss: 0.340166300535202, mean loss: 0.35533354248363075
Epoch: 19, step: 302, loss: 0.324309766292572, mean loss: 0.3553324240663774
Epoch: 19, step: 303, loss: 0.3155483901500702, mean loss: 0.35533098989067746
Epoch: 19, step: 304, loss: 0.3651849031448364, mean loss: 0.3553313451018542
Epoch: 19, step: 305, loss: 0.34357234835624695, mean loss: 0.35533092123202703
Epoch: 19, step: 306, loss: 0.30696019530296326, mean loss: 0.3553291777029952
Epoch: 19, step: 307, loss: 0.380814790725708, mean loss: 0.3553300963020805
Epoch: 19, step: 308, loss: 0.3058511018753052, mean loss: 0.3553283129539303
Epoch: 19, step: 309, loss: 0.3127206563949585, mean loss: 0.35532677732153073
Epoch: 19, step: 310, loss: 0.33051979541778564, mean loss: 0.3553258832795837
Epoch: 19, step: 311, loss: 0.3336869776248932, mean loss: 0.3553251034429953
Epoch: 19, step: 312, loss: 0.3439067304134369, mean loss: 0.35532469195526495
Epoch: 19, step: 313, loss: 0.2921234965324402, mean loss: 0.3553224144347092
Epoch: 19, step: 314, loss: 0.33879342675209045, mean loss: 0.3553218188169771
Epoch: 19, step: 315, loss: 0.35698065161705017, mean loss: 0.3553218785904277
Epoch: 19, step: 316, loss: 0.3741457462310791, mean loss: 0.35532255685467445
Epoch: 19, step: 317, loss: 0.33022376894950867, mean loss: 0.355321652524203
Epoch: 19, step: 318, loss: 0.32415860891342163, mean loss: 0.355320529733945
Epoch: 19, step: 319, loss: 0.31639954447746277, mean loss: 0.355319127479108
Epoch: 19, step: 320, loss: 0.31548190116882324, mean loss: 0.355317692265421
Epoch: 19, step: 321, loss: 0.36016643047332764, mean loss: 0.3553178669443679
Epoch: 19, step: 322, loss: 0.33899423480033875, mean loss: 0.3553172788960901
Epoch: 19, step: 323, loss: 0.33605143427848816, mean loss: 0.3553165848815145
Epoch: 19, step: 324, loss: 0.37678930163383484, mean loss: 0.3553173583665025
Epoch: 19, step: 325, loss: 0.324668288230896, mean loss: 0.35531625437290926
Epoch: 19, step: 326, loss: 0.3224758207798004, mean loss: 0.3553150714880051
Epoch: 19, step: 327, loss: 0.30844610929489136, mean loss: 0.3553133833680587
Epoch: 19, step: 328, loss: 0.29970261454582214, mean loss: 0.3553113804590429
Epoch: 19, step: 329, loss: 0.2989710569381714, mean loss: 0.3553093513470527
Epoch: 19, step: 330, loss: 0.3898090422153473, mean loss: 0.35531059381800273
Epoch: 19, step: 331, loss: 0.32034242153167725, mean loss: 0.3553093345205277
Epoch: 19, step: 332, loss: 0.3204822242259979, mean loss: 0.3553080803482387
Epoch: 19, step: 333, loss: 0.3273545205593109, mean loss: 0.3553070737382355
Epoch: 19, step: 334, loss: 0.34374845027923584, mean loss: 0.35530665752623525
Epoch: 19, step: 335, loss: 0.3272140920162201, mean loss: 0.35530564598347597
Epoch: 19, step: 336, loss: 0.33325281739234924, mean loss: 0.3553048519450721
Epoch: 19, step: 337, loss: 0.373790979385376, mean loss: 0.35530551753618034
Epoch: 19, step: 338, loss: 0.325147807598114, mean loss: 0.35530443175004395
Epoch: 19, step: 339, loss: 0.3306301236152649, mean loss: 0.35530354341809783
Epoch: 19, step: 340, loss: 0.38457292318344116, mean loss: 0.35530459714527374
Epoch: 19, step: 341, loss: 0.3185644745826721, mean loss: 0.35530327451144256
Epoch: 19, step: 342, loss: 0.3170509338378906, mean loss: 0.35530189748776736
Epoch: 19, step: 343, loss: 0.3509630560874939, mean loss: 0.35530174130197184
Epoch: 19, step: 344, loss: 0.31919118762016296, mean loss: 0.3553004414728195
Epoch: 19, step: 345, loss: 0.3676985800266266, mean loss: 0.3553008877379751
Epoch: 19, step: 346, loss: 0.3035854399204254, mean loss: 0.355299026331798
Epoch: 19, step: 347, loss: 0.36303430795669556, mean loss: 0.35529930473957316
Epoch: 19, step: 348, loss: 0.33586785197257996, mean loss: 0.3552986053891047
Epoch: 19, step: 349, loss: 0.31779929995536804, mean loss: 0.3552972558135834
Epoch: 19, step: 350, loss: 0.42075616121292114, mean loss: 0.3552996115520726
Epoch: 19, step: 351, loss: 0.32016128301620483, mean loss: 0.35529834703758667
Epoch: 19, step: 352, loss: 0.35743120312690735, mean loss: 0.35529842378939813
Epoch: 19, step: 353, loss: 0.32588231563568115, mean loss: 0.3552973652752508
Epoch: 19, step: 354, loss: 0.3274903893470764, mean loss: 0.355296364700391
Epoch: 19, step: 355, loss: 0.3628617823123932, mean loss: 0.3552966369160506
Epoch: 19, step: 356, loss: 0.32104867696762085, mean loss: 0.35529540466476617
Epoch: 19, step: 357, loss: 0.33729809522628784, mean loss: 0.355294757139781
Epoch: 19, step: 358, loss: 0.3157069981098175, mean loss: 0.35529333286350717
Epoch: 19, step: 359, loss: 0.3512147068977356, mean loss: 0.3552931861292301
Epoch: 19, step: 360, loss: 0.34390613436698914, mean loss: 0.3552927764788447
Epoch: 19, step: 361, loss: 0.3375069797039032, mean loss: 0.3552921366559519
Epoch: 19, step: 362, loss: 0.31842631101608276, mean loss: 0.35529081049941247
Epoch: 19, step: 363, loss: 0.3365235924720764, mean loss: 0.35529013541962734
Epoch: 19, step: 364, loss: 0.3470665216445923, mean loss: 0.3552898396168226
Epoch: 19, step: 365, loss: 0.313914030790329, mean loss: 0.3552883513854426
Epoch: 19, step: 366, loss: 0.45628097653388977, mean loss: 0.35529198382169586
Epoch: 19, step: 367, loss: 0.32781484723091125, mean loss: 0.35529099557768096
Epoch: 19, step: 368, loss: 0.3331364095211029, mean loss: 0.3552901987934315
Epoch: 19, step: 369, loss: 0.3439972996711731, mean loss: 0.3552897926616929
Epoch: 19, step: 370, loss: 0.33550140261650085, mean loss: 0.35528908102828965
Epoch: 19, step: 371, loss: 0.29929009079933167, mean loss: 0.3552870672556261
Epoch: 19, step: 372, loss: 0.3403739333152771, mean loss: 0.3552865309855718
Epoch: 19, step: 373, loss: 0.30539342761039734, mean loss: 0.35528473691497214
Epoch: 19, step: 374, loss: 0.3534226417541504, mean loss: 0.35528466995962493
Epoch: 19, step: 375, loss: 0.31465408205986023, mean loss: 0.35528320905829097
Epoch: 19, step: 376, loss: 0.3358939588069916, mean loss: 0.35528251192924154
Epoch: 19, step: 377, loss: 0.3416264057159424, mean loss: 0.3552820209496552
Epoch: 19, step: 378, loss: 0.3512408137321472, mean loss: 0.3552818756608823
Epoch: 19, step: 379, loss: 0.32037392258644104, mean loss: 0.3552806207013959
Epoch: 19, step: 380, loss: 0.3074234127998352, mean loss: 0.35527890027115894
Epoch: 19, step: 381, loss: 0.3166654407978058, mean loss: 0.3552775121965499
Epoch: 19, step: 382, loss: 0.35255298018455505, mean loss: 0.3552774142587372
Epoch: 19, step: 383, loss: 0.34033912420272827, mean loss: 0.35527687729647783
Epoch: 19, step: 384, loss: 0.3196307122707367, mean loss: 0.35527559602819037
Epoch: 19, step: 385, loss: 0.4002186954021454, mean loss: 0.35527721140808305
Epoch: 19, step: 386, loss: 0.3091704845428467, mean loss: 0.3552755542637469
Epoch: 19, step: 387, loss: 0.3389440178871155, mean loss: 0.35527496730513647
Epoch: 19, step: 388, loss: 0.34271878004074097, mean loss: 0.3552745160495295
Epoch: 19, step: 389, loss: 0.3101361095905304, mean loss: 0.35527289388297806
Epoch: 19, step: 390, loss: 0.3414880335330963, mean loss: 0.3552723985058138
Epoch: 19, step: 391, loss: 0.3615242540836334, mean loss: 0.3552726231664282
Epoch: 19, step: 392, loss: 0.3435188829898834, mean loss: 0.355272200810606
Epoch: 19, step: 393, loss: 0.30055710673332214, mean loss: 0.355270234763388
Epoch: 19, step: 394, loss: 0.3301975727081299, mean loss: 0.3552693338736587
Epoch: 19, step: 395, loss: 0.34565261006355286, mean loss: 0.3552689883460714
Epoch: 19, step: 396, loss: 0.32709404826164246, mean loss: 0.3552679760606518
Epoch: 19, step: 397, loss: 0.31951749324798584, mean loss: 0.355266691642932
Epoch: 19, step: 398, loss: 0.33731168508529663, mean loss: 0.3552660465915019
Epoch: 19, step: 399, loss: 0.3072410821914673, mean loss: 0.3552643213089757
Epoch: 19, step: 400, loss: 0.3450755178928375, mean loss: 0.3552639552924
Epoch: 19, step: 401, loss: 0.296284019947052, mean loss: 0.3552618366080353
Epoch: 19, step: 402, loss: 0.31456276774406433, mean loss: 0.35526037466368154
Epoch: 19, step: 403, loss: 0.28884151577949524, mean loss: 0.35525798892880783
Epoch: 19, step: 404, loss: 0.3290296494960785, mean loss: 0.35525704685275333
Epoch: 19, step: 405, loss: 0.2776917517185211, mean loss: 0.3552542609431515
Epoch: 19, step: 406, loss: 0.3150290250778198, mean loss: 0.35525281622685423
Epoch: 19, step: 407, loss: 0.32697609066963196, mean loss: 0.3552518006857841
Epoch: 19, step: 408, loss: 0.3552951514720917, mean loss: 0.3552518022426448
Epoch: 19, step: 409, loss: 0.337167352437973, mean loss: 0.35525115279748914
Epoch: 19, step: 410, loss: 0.3952259123325348, mean loss: 0.3552525883115314
Epoch: 19, step: 411, loss: 0.3040867745876312, mean loss: 0.35525075098699377
Epoch: 19, step: 412, loss: 0.3252074420452118, mean loss: 0.35524967219389736
Epoch: 19, step: 413, loss: 0.31596359610557556, mean loss: 0.35524826156279904
Epoch: 19, step: 414, loss: 0.31461387872695923, mean loss: 0.35524680257091956
Epoch: 19, step: 415, loss: 0.3702368140220642, mean loss: 0.35524734077325515
Epoch: 19, step: 416, loss: 0.3135365843772888, mean loss: 0.35524584324134134
Epoch: 19, step: 417, loss: 0.3406871259212494, mean loss: 0.3552453205617506
Epoch: 19, step: 418, loss: 0.33864864706993103, mean loss: 0.35524472473789526
Epoch: 19, step: 419, loss: 0.32792580127716064, mean loss: 0.3552437440183569
Epoch: 19, step: 420, loss: 0.3553350269794464, mean loss: 0.355243747295198
Epoch: 19, step: 421, loss: 0.32456496357917786, mean loss: 0.3552426460394109
Epoch: 19, step: 422, loss: 0.34070339798927307, mean loss: 0.3552421241524785
Epoch: 19, step: 423, loss: 0.34203487634658813, mean loss: 0.3552416500947683
Epoch: 19, step: 424, loss: 0.32659482955932617, mean loss: 0.3552406218897313
Epoch: 19, step: 425, loss: 0.35969558358192444, mean loss: 0.35524078178355417
Epoch: 19, step: 426, loss: 0.31674349308013916, mean loss: 0.3552394001201043
Epoch: 19, step: 427, loss: 0.32697969675064087, mean loss: 0.35523838591886364
Epoch: 19, step: 428, loss: 0.3065674901008606, mean loss: 0.3552366392511508
Epoch: 19, step: 429, loss: 0.32663801312446594, mean loss: 0.3552356129601106
Epoch: 19, step: 430, loss: 0.31980109214782715, mean loss: 0.35523434140160726
Epoch: 19, step: 431, loss: 0.3140581548213959, mean loss: 0.35523286385795216
Epoch: 19, step: 432, loss: 0.2741842269897461, mean loss: 0.355229955657555
Epoch: 19, step: 433, loss: 0.3528446853160858, mean loss: 0.3552298700719669
Epoch: 19, step: 434, loss: 0.32787200808525085, mean loss: 0.35522888848314743
Epoch: 19, step: 435, loss: 0.33571356534957886, mean loss: 0.35522818830651376
Epoch: 19, step: 436, loss: 0.31121179461479187, mean loss: 0.3552266091297588
Epoch: 19, step: 437, loss: 0.3146735727787018, mean loss: 0.3552251542601186
Epoch: 19, step: 438, loss: 0.3101668059825897, mean loss: 0.35522353781713106
Epoch: 19, step: 439, loss: 0.36512696743011475, mean loss: 0.3552238930843722
Epoch: 19, step: 440, loss: 0.3540296256542206, mean loss: 0.35522385024377134
Epoch: 19, step: 441, loss: 0.34473130106925964, mean loss: 0.3552234738699578
Epoch: 19, step: 442, loss: 0.35301607847213745, mean loss: 0.35522339469224706
Epoch: 19, step: 443, loss: 0.34126219153404236, mean loss: 0.35522289393173206
Epoch: 19, step: 444, loss: 0.29684963822364807, mean loss: 0.35522080027455666
Epoch: 19, step: 445, loss: 0.3109585642814636, mean loss: 0.35521921279030183
Epoch: 19, step: 446, loss: 0.318435937166214, mean loss: 0.35521789358951195
Epoch: 19, step: 447, loss: 0.30773094296455383, mean loss: 0.35521619057162984
Epoch: 19, step: 448, loss: 0.35982921719551086, mean loss: 0.35521635600202695
Epoch: 19, step: 449, loss: 0.3750443458557129, mean loss: 0.3552170670394598
Epoch: 19, step: 450, loss: 0.33993107080459595, mean loss: 0.3552165188988841
Epoch: 19, step: 451, loss: 0.3963908851146698, mean loss: 0.35521799531763826
Epoch: 19, step: 452, loss: 0.34961867332458496, mean loss: 0.3552177945459364
Epoch: 19, step: 453, loss: 0.3336105942726135, mean loss: 0.35521701981663295
Epoch: 19, step: 454, loss: 0.309836745262146, mean loss: 0.3552153927586374
Epoch: 19, step: 455, loss: 0.3196890652179718, mean loss: 0.35521411904834266
Epoch: 19, step: 456, loss: 0.3136347532272339, mean loss: 0.35521262837448825
Epoch: 19, step: 457, loss: 0.3897915184497833, mean loss: 0.3552138680278214
Epoch: 19, step: 458, loss: 0.3353705406188965, mean loss: 0.35521315666996484
Epoch: 19, step: 459, loss: 0.34193676710128784, mean loss: 0.355212680745475
Epoch: 19, step: 460, loss: 0.3208049237728119, mean loss: 0.35521144735991483
Epoch: 19, step: 461, loss: 0.3537445366382599, mean loss: 0.35521139477870034
Epoch: 19, step: 462, loss: 0.31649136543273926, mean loss: 0.35521000691428417
Epoch: 19, step: 463, loss: 0.30331864953041077, mean loss: 0.3552081470090016
Epoch: 19, step: 464, loss: 0.31855398416519165, mean loss: 0.35520683328681085
Epoch: 19, step: 465, loss: 0.3327413499355316, mean loss: 0.3552060281300711
Epoch: 19, step: 466, loss: 0.31607601046562195, mean loss: 0.3552046257712687
Epoch: 19, step: 467, loss: 0.38618743419647217, mean loss: 0.35520573610700645
Epoch: 19, step: 468, loss: 0.34191542863845825, mean loss: 0.35520525983725304
Epoch: 19, step: 469, loss: 0.34947311878204346, mean loss: 0.3552050544283426
Epoch: 19, step: 470, loss: 0.37721267342567444, mean loss: 0.35520584303403285
Epoch: 19, step: 471, loss: 0.320365846157074, mean loss: 0.35520459464658566
Epoch: 19, step: 472, loss: 0.33829376101493835, mean loss: 0.35520398871897696
Epoch: 19, step: 473, loss: 0.31799325346946716, mean loss: 0.35520265547873153
Epoch: 19, step: 474, loss: 0.3202711343765259, mean loss: 0.35520140394632127
Epoch: 19, step: 475, loss: 0.34025564789772034, mean loss: 0.35520086848644566
Epoch: 19, step: 476, loss: 0.38763031363487244, mean loss: 0.3552020302908074
Epoch: 19, step: 477, loss: 0.31355535984039307, mean loss: 0.3552005383272604
Epoch: 19, step: 478, loss: 0.3293834924697876, mean loss: 0.3551996134823434
Epoch: 19, step: 479, loss: 0.37795454263687134, mean loss: 0.35520042860374884
Epoch: 19, step: 480, loss: 0.331775039434433, mean loss: 0.35519958949535
Epoch: 19, step: 481, loss: 0.2962900996208191, mean loss: 0.3551974794054484
Epoch: 19, step: 482, loss: 0.3273538053035736, mean loss: 0.355196482103464
Epoch: 19, step: 483, loss: 0.3377609848976135, mean loss: 0.35519585762290506
Epoch: 19, step: 484, loss: 0.3229145109653473, mean loss: 0.3551947014556239
Epoch: 19, step: 485, loss: 0.3481128513813019, mean loss: 0.3551944478258669
Epoch: 19, step: 486, loss: 0.3630119562149048, mean loss: 0.35519472779250333
Epoch: 19, step: 487, loss: 0.32594338059425354, mean loss: 0.3551936802582246
Epoch: 19, step: 488, loss: 0.30664753913879395, mean loss: 0.35519194181091507
Epoch: 19, step: 489, loss: 0.3342944085597992, mean loss: 0.3551911934927438
Epoch: 19, step: 490, loss: 0.3164721429347992, mean loss: 0.35518980705486797
Epoch: 19, step: 491, loss: 0.3206001818180084, mean loss: 0.3551885685263218
Epoch: 19, step: 492, loss: 0.32705873250961304, mean loss: 0.3551875613353727
Epoch: 19, step: 493, loss: 0.3796972930431366, mean loss: 0.35518843887678725
Epoch: 19, step: 494, loss: 0.37336266040802, mean loss: 0.355189089559596
Epoch: 19, step: 495, loss: 0.2820189893245697, mean loss: 0.35518646997989406
Epoch: 19, step: 496, loss: 0.3786619007587433, mean loss: 0.35518731039913937
Epoch: 19, step: 497, loss: 0.35443273186683655, mean loss: 0.3551872833862328
Epoch: 19, step: 498, loss: 0.33406195044517517, mean loss: 0.3551865271545184
Epoch: 19, step: 499, loss: 0.3575834631919861, mean loss: 0.3551866129554934
Epoch: 19, step: 500, loss: 0.35376742482185364, mean loss: 0.35518656215590383
Epoch: 19, step: 501, loss: 0.3480992317199707, mean loss: 0.3551863084752382
Epoch: 19, step: 502, loss: 0.3473289906978607, mean loss: 0.35518602724406395
Epoch: 19, step: 503, loss: 0.328402042388916, mean loss: 0.35518506861897964
Epoch: 19, step: 504, loss: 0.32310888171195984, mean loss: 0.3551839206218819
Epoch: 19, step: 505, loss: 0.31616896390914917, mean loss: 0.35518252433826897
Epoch: 19, step: 506, loss: 0.34282177686691284, mean loss: 0.3551820819824922
Epoch: 19, step: 507, loss: 0.3136965334415436, mean loss: 0.3551805973865667
Epoch: 19, step: 508, loss: 0.3409324586391449, mean loss: 0.35518008752295077
Epoch: 19, step: 509, loss: 0.34613776206970215, mean loss: 0.3551797639587393
Epoch: 19, step: 510, loss: 0.3547399640083313, mean loss: 0.3551797482218104
Epoch: 19, step: 511, loss: 0.3034815192222595, mean loss: 0.3551778984211449
Epoch: 19, step: 512, loss: 0.33931687474250793, mean loss: 0.355177330922355
Epoch: 19, step: 513, loss: 0.31437137722969055, mean loss: 0.35517587095979
Epoch: 19, step: 514, loss: 0.3393540382385254, mean loss: 0.35517530490373755
Epoch: 19, step: 515, loss: 0.3376521170139313, mean loss: 0.3551746780009081
Epoch: 19, step: 516, loss: 0.3265148103237152, mean loss: 0.3551736527131866
Epoch: 19, step: 517, loss: 0.32660722732543945, mean loss: 0.3551726308048591
Epoch: 19, step: 518, loss: 0.3282506465911865, mean loss: 0.3551716677576685
Epoch: 19, step: 519, loss: 0.3375962972640991, mean loss: 0.3551710390779399
Epoch: 19, step: 520, loss: 0.2912626266479492, mean loss: 0.3551687531240668
Epoch: 19, step: 521, loss: 0.3063195049762726, mean loss: 0.35516700588720623
Epoch: 19, step: 522, loss: 0.31230252981185913, mean loss: 0.3551654727681363
Epoch: 19, step: 523, loss: 0.2973672151565552, mean loss: 0.35516340559154075
Epoch: 19, step: 524, loss: 0.31720128655433655, mean loss: 0.3551620479105194
Epoch: 19, step: 525, loss: 0.34068214893341064, mean loss: 0.3551615300684846
Epoch: 19, step: 526, loss: 0.3035443127155304, mean loss: 0.3551596841571964
Epoch: 19, step: 527, loss: 0.333402156829834, mean loss: 0.35515890610229267
Epoch: 19, step: 528, loss: 0.30699169635772705, mean loss: 0.35515718369178867
Epoch: 19, step: 529, loss: 0.32877233624458313, mean loss: 0.35515624023017645
Epoch: 19, step: 530, loss: 0.35336291790008545, mean loss: 0.3551561761073771
Epoch: 19, step: 531, loss: 0.2816004455089569, mean loss: 0.35515354611128874
Epoch: 19, step: 532, loss: 0.32043150067329407, mean loss: 0.3551523046637776
Epoch: 19, step: 533, loss: 0.30088096857070923, mean loss: 0.3551503643228376
Epoch: 19, step: 534, loss: 0.35215169191360474, mean loss: 0.3551502571163591
Epoch: 19, step: 535, loss: 0.30326583981513977, mean loss: 0.3551484022465857
Epoch: 19, step: 536, loss: 0.33174458146095276, mean loss: 0.35514756558906646
Epoch: 19, step: 537, loss: 0.3222332298755646, mean loss: 0.35514638898451534
Epoch: 19, step: 538, loss: 0.37297526001930237, mean loss: 0.3551470262989402
Epoch: 19, step: 539, loss: 0.292657732963562, mean loss: 0.3551447926238853
Epoch: 19, step: 540, loss: 0.30090075731277466, mean loss: 0.3551428537442588
Epoch: 19, step: 541, loss: 0.34407272934913635, mean loss: 0.35514245807178774
Epoch: 19, step: 542, loss: 0.31606605648994446, mean loss: 0.355141061438542
Epoch: 19, step: 543, loss: 0.3622142970561981, mean loss: 0.35514131423466844
Epoch: 19, step: 544, loss: 0.3586336076259613, mean loss: 0.35514143904412454
Epoch: 19, step: 545, loss: 0.3204478323459625, mean loss: 0.3551401991896932
Epoch: 19, step: 546, loss: 0.34787657856941223, mean loss: 0.3551399396170734
Epoch: 19, step: 547, loss: 0.3426429331302643, mean loss: 0.3551394930402264
Epoch: 19, step: 548, loss: 0.35453444719314575, mean loss: 0.3551394714198638
Epoch: 19, step: 549, loss: 0.3172113299369812, mean loss: 0.3551381161657552
Epoch: 19, step: 550, loss: 0.36980772018432617, mean loss: 0.3551386403235434
Epoch: 19, step: 551, loss: 0.3407781422138214, mean loss: 0.35513812722871313
Epoch: 19, step: 552, loss: 0.34271278977394104, mean loss: 0.3551376832922576
Epoch: 19, step: 553, loss: 0.3168458342552185, mean loss: 0.3551363152376296
Epoch: 19, step: 554, loss: 0.318752259016037, mean loss: 0.35513501538924186
Epoch: 19, step: 555, loss: 0.31643691658973694, mean loss: 0.35513363291929334
Epoch: 19, step: 556, loss: 0.369138240814209, mean loss: 0.35513413320893344
Epoch: 19, step: 557, loss: 0.29876255989074707, mean loss: 0.35513211950695023
Epoch: 19, step: 558, loss: 0.3455948531627655, mean loss: 0.3551317788294598
Epoch: 19, step: 559, loss: 0.3240343928337097, mean loss: 0.35513066804984855
Epoch: 19, step: 560, loss: 0.3690228760242462, mean loss: 0.355131164253298
Epoch: 19, step: 561, loss: 0.30139490962028503, mean loss: 0.35512924496425474
Epoch: 19, step: 562, loss: 0.31131061911582947, mean loss: 0.3551276799574385
Epoch: 19, step: 563, loss: 0.31386131048202515, mean loss: 0.35512620615852863
Epoch: 19, step: 564, loss: 0.32400014996528625, mean loss: 0.3551250945533648
Epoch: 19, step: 565, loss: 0.30800482630729675, mean loss: 0.3551234118068379
Epoch: 19, step: 566, loss: 0.30695992708206177, mean loss: 0.3551216918666627
Epoch: 19, step: 567, loss: 0.32728680968284607, mean loss: 0.355120697905722
Epoch: 19, step: 568, loss: 0.3204100728034973, mean loss: 0.35511945846186904
Epoch: 19, step: 569, loss: 0.3475835621356964, mean loss: 0.35511918938037484
Epoch: 19, step: 570, loss: 0.3773733377456665, mean loss: 0.3551199839727398
Epoch: 19, step: 571, loss: 0.32693180441856384, mean loss: 0.35511897753959376
Epoch: 19, step: 572, loss: 0.31896263360977173, mean loss: 0.355117686656523
Epoch: 19, step: 573, loss: 0.3736777901649475, mean loss: 0.35511834928071107
Epoch: 19, step: 574, loss: 0.3584021031856537, mean loss: 0.35511846651158124
Epoch: 19, step: 575, loss: 0.377157598733902, mean loss: 0.35511925328625715
Epoch: 19, step: 576, loss: 0.3542667627334595, mean loss: 0.3551192228542951
Epoch: 19, step: 577, loss: 0.3393045663833618, mean loss: 0.35511865832739886
Epoch: 19, step: 578, loss: 0.3097841143608093, mean loss: 0.3551170401034486
Epoch: 19, step: 579, loss: 0.3020118474960327, mean loss: 0.35511514457258736
Epoch: 19, step: 580, loss: 0.34599992632865906, mean loss: 0.35511481922661015
Epoch: 19, step: 581, loss: 0.34201857447624207, mean loss: 0.35511435180406925
Epoch: 19, step: 582, loss: 0.3169441819190979, mean loss: 0.3551129895081313
Epoch: 19, step: 583, loss: 0.3116772174835205, mean loss: 0.3551114393378235
Epoch: 19, step: 584, loss: 0.2934635281562805, mean loss: 0.3551092392767557
Epoch: 19, step: 585, loss: 0.30891507863998413, mean loss: 0.3551075907805514
Epoch: 19, step: 586, loss: 0.31818294525146484, mean loss: 0.35510627312557047
Epoch: 19, step: 587, loss: 0.3435479402542114, mean loss: 0.3551058606814914
Epoch: 19, step: 588, loss: 0.3377358019351959, mean loss: 0.35510524087564854
Epoch: 19, step: 589, loss: 0.3361981511116028, mean loss: 0.3551045662488818
Epoch: 19, step: 590, loss: 0.3268929421901703, mean loss: 0.3551035596615175
Epoch: 19, step: 591, loss: 0.34382107853889465, mean loss: 0.35510315711830637
Epoch: 19, step: 592, loss: 0.3389253616333008, mean loss: 0.3551025799376904
Epoch: 19, step: 593, loss: 0.34811267256736755, mean loss: 0.35510233056532614
Epoch: 19, step: 594, loss: 0.3215045630931854, mean loss: 0.3551011319720732
Epoch: 19, step: 595, loss: 0.31727540493011475, mean loss: 0.35509978259539504
Epoch: 19, step: 596, loss: 0.3340492248535156, mean loss: 0.35509903167477497
Epoch: 19, step: 597, loss: 0.35020315647125244, mean loss: 0.3550988570341527
Epoch: 19, step: 598, loss: 0.32641783356666565, mean loss: 0.35509783399069034
Epoch: 19, step: 599, loss: 0.3182813227176666, mean loss: 0.35509652080367105
Epoch: 19, step: 600, loss: 0.31652870774269104, mean loss: 0.3550951451995386
Epoch: 19, step: 601, loss: 0.33230310678482056, mean loss: 0.3550943323013856
Epoch: 19, step: 602, loss: 0.32930147647857666, mean loss: 0.3550934124092417
Epoch: 19, step: 603, loss: 0.3395388722419739, mean loss: 0.3550928576824169
Epoch: 19, step: 604, loss: 0.3199315667152405, mean loss: 0.35509160375812865
Epoch: 19, step: 605, loss: 0.33683207631111145, mean loss: 0.3550909526088723
Epoch: 19, step: 606, loss: 0.32352861762046814, mean loss: 0.3550898271110658
Epoch: 19, step: 607, loss: 0.3076806664466858, mean loss: 0.35508813658329996
Epoch: 19, step: 608, loss: 0.3459242880344391, mean loss: 0.35508780982813687
Epoch: 19, step: 609, loss: 0.32968226075172424, mean loss: 0.35508690397528525
Epoch: 19, step: 610, loss: 0.3116358816623688, mean loss: 0.35508535475353914
Epoch: 19, step: 611, loss: 0.34955301880836487, mean loss: 0.3550851575082473
Epoch: 19, step: 612, loss: 0.3313761353492737, mean loss: 0.3550843122366812
Epoch: 19, step: 613, loss: 0.34029990434646606, mean loss: 0.3550837851633161
Epoch: 19, step: 614, loss: 0.34743189811706543, mean loss: 0.35508351237849395
Epoch: 19, step: 615, loss: 0.41289007663726807, mean loss: 0.35508557307164446
Epoch: 19, step: 616, loss: 0.33650973439216614, mean loss: 0.3550849109022266
Epoch: 19, step: 617, loss: 0.31895768642425537, mean loss: 0.35508362312777453
Epoch: 19, step: 618, loss: 0.3378032445907593, mean loss: 0.3550830071812931
Epoch: 19, step: 619, loss: 0.3294283449649811, mean loss: 0.35508209277217506
Epoch: 19, step: 620, loss: 0.32686635851860046, mean loss: 0.3550810871146118
Epoch: 19, step: 621, loss: 0.3119357228279114, mean loss: 0.35507954939402275
Epoch: 19, step: 622, loss: 0.32558441162109375, mean loss: 0.35507849821123744
Epoch: 19, step: 623, loss: 0.36250460147857666, mean loss: 0.35507876286210227
Epoch: 19, step: 624, loss: 0.3251630961894989, mean loss: 0.35507769676799755
Epoch: 19, step: 625, loss: 0.3088911175727844, mean loss: 0.35507605089175226
Epoch: 19, step: 626, loss: 0.344841331243515, mean loss: 0.35507568618663704
Epoch: 19, step: 627, loss: 0.2855052947998047, mean loss: 0.35507320719606594
Epoch: 19, step: 628, loss: 0.39991217851638794, mean loss: 0.355074804878992
Epoch: 19, step: 629, loss: 0.3140544593334198, mean loss: 0.3550733433117738
Epoch: 19, step: 630, loss: 0.32011678814888, mean loss: 0.35507209784360255
Epoch: 19, step: 631, loss: 0.35177600383758545, mean loss: 0.35507198041115257
Epoch: 19, step: 632, loss: 0.3445405066013336, mean loss: 0.3550716052116866
Epoch: 19, step: 633, loss: 0.33807891607284546, mean loss: 0.3550709998433525
Epoch: 19, step: 634, loss: 0.33728793263435364, mean loss: 0.35507036634019234
Epoch: 19, step: 635, loss: 0.3080798089504242, mean loss: 0.3550686924103908
Epoch: 19, step: 636, loss: 0.33174630999565125, mean loss: 0.35506786163411413
Epoch: 19, step: 637, loss: 0.38397017121315, mean loss: 0.3550688911386229
Epoch: 19, step: 638, loss: 0.31840780377388, mean loss: 0.3550675853118245
Epoch: 19, step: 639, loss: 0.35704997181892395, mean loss: 0.35506765591969264
Epoch: 19, step: 640, loss: 0.35683682560920715, mean loss: 0.3550677189310432
Epoch: 19, step: 641, loss: 0.34919220209121704, mean loss: 0.3550675096740862
Epoch: 19, step: 642, loss: 0.3756864666938782, mean loss: 0.35506824399357834
Epoch: 19, step: 643, loss: 0.31941431760787964, mean loss: 0.3550669742668552
Epoch: 19, step: 644, loss: 0.33121049404144287, mean loss: 0.35506612470735854
Epoch: 19, step: 645, loss: 0.33925992250442505, mean loss: 0.35506556184850935
Epoch: 19, step: 646, loss: 0.33651357889175415, mean loss: 0.35506490123593387
Epoch: 19, step: 647, loss: 0.30838629603385925, mean loss: 0.3550632391292111
Epoch: 19, step: 648, loss: 0.3704962730407715, mean loss: 0.3550637886408334
Epoch: 19, step: 649, loss: 0.34080269932746887, mean loss: 0.35506328087577915
Epoch: 19, step: 650, loss: 0.3647286593914032, mean loss: 0.35506362499863015
Epoch: 19, step: 651, loss: 0.31995847821235657, mean loss: 0.35506237517141614
Epoch: 19, step: 652, loss: 0.33413589000701904, mean loss: 0.3550616301650021
Epoch: 19, step: 653, loss: 0.3237396478652954, mean loss: 0.35506051510689246
Epoch: 19, step: 654, loss: 0.3300403952598572, mean loss: 0.3550596244258969
Epoch: 19, step: 655, loss: 0.35062193870544434, mean loss: 0.35505946645616454
Epoch: 19, step: 656, loss: 0.37730246782302856, mean loss: 0.35506025821928583
Epoch: 19, step: 657, loss: 0.33155322074890137, mean loss: 0.35505942149124886
Epoch: 19, step: 658, loss: 0.3672591745853424, mean loss: 0.35505985572342874
Epoch: 19, step: 659, loss: 0.3083624541759491, mean loss: 0.35505819365759916
Epoch: 19, step: 660, loss: 0.3319065272808075, mean loss: 0.3550573696669106
Epoch: 19, step: 661, loss: 0.3507044315338135, mean loss: 0.35505721474705393
Epoch: 19, step: 662, loss: 0.36262962222099304, mean loss: 0.35505748423733735
Epoch: 19, step: 663, loss: 0.37355703115463257, mean loss: 0.3550581425842027
Epoch: 19, step: 664, loss: 0.31282544136047363, mean loss: 0.3550566396945823
Epoch: 19, step: 665, loss: 0.32607507705688477, mean loss: 0.3550556083956485
Epoch: 19, step: 666, loss: 0.34299734234809875, mean loss: 0.3550551793216689
Epoch: 19, step: 667, loss: 0.294502317905426, mean loss: 0.35505302472227324
Epoch: 19, step: 668, loss: 0.3192204535007477, mean loss: 0.35505174976866277
Epoch: 19, step: 669, loss: 0.3266008496284485, mean loss: 0.3550507374972567
Epoch: 19, step: 670, loss: 0.3155859708786011, mean loss: 0.3550493334069369
Epoch: 19, step: 671, loss: 0.32363060116767883, mean loss: 0.3550482156208177
Epoch: 19, step: 672, loss: 0.29347264766693115, mean loss: 0.35504602502108257
Epoch: 19, step: 673, loss: 0.3224025070667267, mean loss: 0.3550448637433183
Epoch: 19, step: 674, loss: 0.2928880751132965, mean loss: 0.3550426526235207
Epoch: 19, step: 675, loss: 0.35409045219421387, mean loss: 0.35504261875184917
Epoch: 19, step: 676, loss: 0.3560163676738739, mean loss: 0.3550426533888115
Epoch: 19, step: 677, loss: 0.32457593083381653, mean loss: 0.35504156970372386
Epoch: 19, step: 678, loss: 0.32070645689964294, mean loss: 0.35504034846549504
Epoch: 19, step: 679, loss: 0.31363341212272644, mean loss: 0.3550388757475998
Epoch: 19, step: 680, loss: 0.3163584768772125, mean loss: 0.3550375000532202
Epoch: 19, step: 681, loss: 0.32529929280281067, mean loss: 0.3550364424315099
Epoch: 19, step: 682, loss: 0.36386507749557495, mean loss: 0.3550367564055155
Epoch: 19, step: 683, loss: 0.3856363892555237, mean loss: 0.3550378445859156
Epoch: 19, step: 684, loss: 0.3440215587615967, mean loss: 0.35503745284003796
Epoch: 19, step: 685, loss: 0.33173438906669617, mean loss: 0.3550366241982709
Epoch: 19, step: 686, loss: 0.34939295053482056, mean loss: 0.355036423520048
Epoch: 19, step: 687, loss: 0.33682191371917725, mean loss: 0.3550357758700053
Epoch: 19, step: 688, loss: 0.3007144331932068, mean loss: 0.3550338444444879
Epoch: 19, step: 689, loss: 0.33571290969848633, mean loss: 0.35503315750234377
Epoch: 19, step: 690, loss: 0.3654254078865051, mean loss: 0.3550335269783058
Epoch: 19, step: 691, loss: 0.32554998993873596, mean loss: 0.35503247878657374
Epoch: 19, step: 692, loss: 0.30877789855003357, mean loss: 0.35503083441314287
Epoch: 19, step: 693, loss: 0.3114315867424011, mean loss: 0.35502928449321147
Epoch: 19, step: 694, loss: 0.31721213459968567, mean loss: 0.3550279401702264
Epoch: 19, step: 695, loss: 0.31940582394599915, mean loss: 0.35502667392124926
Epoch: 19, step: 696, loss: 0.3637171983718872, mean loss: 0.3550269828298068
Epoch: 19, step: 697, loss: 0.3163091838359833, mean loss: 0.3550256066373353
Epoch: 19, step: 698, loss: 0.3501957058906555, mean loss: 0.35502543496856875
Epoch: 19, step: 699, loss: 0.3643378019332886, mean loss: 0.35502576594550095
Epoch: 19, step: 700, loss: 0.29732075333595276, mean loss: 0.35502371508675235
Epoch: 19, step: 701, loss: 0.3042190968990326, mean loss: 0.3550219095348941
Epoch: 19, step: 702, loss: 0.3310924470424652, mean loss: 0.35502105913287224
Epoch: 19, step: 703, loss: 0.340349406003952, mean loss: 0.355020537752164
Epoch: 19, step: 704, loss: 0.33641400933265686, mean loss: 0.35501987656285233
Epoch: 19, step: 705, loss: 0.3160419166088104, mean loss: 0.35501849151701503
Epoch: 19, step: 706, loss: 0.3242538571357727, mean loss: 0.35501739836296675
Epoch: 19, step: 707, loss: 0.3241622745990753, mean loss: 0.3550163020325317
Epoch: 19, step: 708, loss: 0.3606923520565033, mean loss: 0.35501650370423266
Epoch: 19, step: 709, loss: 0.35669752955436707, mean loss: 0.3550165634294458
Epoch: 19, step: 710, loss: 0.380258172750473, mean loss: 0.3550174602074087
Epoch: 19, step: 711, loss: 0.35012349486351013, mean loss: 0.35501728634193536
Epoch: 19, step: 712, loss: 0.37811437249183655, mean loss: 0.35501810687147994
Epoch: 19, step: 713, loss: 0.3637864589691162, mean loss: 0.35501841835823295
Epoch: 19, step: 714, loss: 0.40776392817497253, mean loss: 0.35502029202203944
Epoch: 19, step: 715, loss: 0.36707931756973267, mean loss: 0.35502072037617227
Epoch: 19, step: 716, loss: 0.33168405294418335, mean loss: 0.35501989145323576
Epoch: 19, step: 717, loss: 0.308794766664505, mean loss: 0.3550182495861906
Epoch: 19, step: 718, loss: 0.3527718484401703, mean loss: 0.35501816979925593
Epoch: 19, step: 719, loss: 0.3514007329940796, mean loss: 0.3550180413208923
Epoch: 19, step: 720, loss: 0.35816001892089844, mean loss: 0.3550181529086893
Epoch: 19, step: 721, loss: 0.3436667323112488, mean loss: 0.3550177497756331
Epoch: 19, step: 722, loss: 0.333842933177948, mean loss: 0.3550169978023174
Epoch: 19, step: 723, loss: 0.33024129271507263, mean loss: 0.3550161179832447
Epoch: 19, step: 724, loss: 0.32124149799346924, mean loss: 0.35501491864302276
Epoch: 19, step: 725, loss: 0.33357787132263184, mean loss: 0.3550141574383029
Epoch: 19, step: 726, loss: 0.30283093452453613, mean loss: 0.3550123045382953
Epoch: 19, step: 727, loss: 0.3580961525440216, mean loss: 0.3550124140343898
Epoch: 19, step: 728, loss: 0.3066946268081665, mean loss: 0.3550106985084808
Epoch: 19, step: 729, loss: 0.31536200642585754, mean loss: 0.3550092908292902
Epoch: 19, step: 730, loss: 0.3010769486427307, mean loss: 0.35500737609423905
Epoch: 19, step: 731, loss: 0.3602572977542877, mean loss: 0.3550075624731676
Epoch: 19, step: 732, loss: 0.3113444745540619, mean loss: 0.35500601243277147
Epoch: 19, step: 733, loss: 0.33729088306427, mean loss: 0.3550053835676892
Epoch: 19, step: 734, loss: 0.3062308132648468, mean loss: 0.3550036521925054
Epoch: 19, step: 735, loss: 0.3222060203552246, mean loss: 0.3550024879999796
Epoch: 19, step: 736, loss: 0.3090176582336426, mean loss: 0.3550008557694835
Epoch: 19, step: 737, loss: 0.31608378887176514, mean loss: 0.3549994744581007
Epoch: 19, step: 738, loss: 0.3355066478252411, mean loss: 0.354998782609773
Epoch: 19, step: 739, loss: 0.32357341051101685, mean loss: 0.3549976672856639
Epoch: 19, step: 740, loss: 0.3255601227283478, mean loss: 0.35499662254901493
Epoch: 19, step: 741, loss: 0.3589490056037903, mean loss: 0.3549967628138689
Epoch: 19, step: 742, loss: 0.3159743547439575, mean loss: 0.35499537800929565
Epoch: 19, step: 743, loss: 0.36632898449897766, mean loss: 0.3549957801954734
Epoch: 19, step: 744, loss: 0.34877076745033264, mean loss: 0.35499555930151133
Epoch: 19, step: 745, loss: 0.32256177067756653, mean loss: 0.35499440843256574
Epoch: 19, step: 746, loss: 0.2979196608066559, mean loss: 0.35499238328451105
Epoch: 19, step: 747, loss: 0.362225741147995, mean loss: 0.35499263993217867
Epoch: 19, step: 748, loss: 0.34301966428756714, mean loss: 0.35499221513261703
Epoch: 19, step: 749, loss: 0.32419073581695557, mean loss: 0.35499112233905583
Epoch: 19, step: 750, loss: 0.41116389632225037, mean loss: 0.35499311520009047
Epoch: 19, step: 751, loss: 0.3272537887096405, mean loss: 0.3549921311172719
Epoch: 19, step: 752, loss: 0.30409330129623413, mean loss: 0.3549903254899059
Epoch: 19, step: 753, loss: 0.32860538363456726, mean loss: 0.3549893895217663
Epoch: 19, step: 754, loss: 0.35272446274757385, mean loss: 0.3549893091795729
Epoch: 19, step: 755, loss: 0.3247555196285248, mean loss: 0.3549882367551422
Epoch: 19, step: 756, loss: 0.2901303172111511, mean loss: 0.3549859362578718
Epoch: 19, step: 757, loss: 0.37575864791870117, mean loss: 0.3549866730356139
Epoch: 19, step: 758, loss: 0.3474310338497162, mean loss: 0.35498640505763246
Epoch: 19, step: 759, loss: 0.34504473209381104, mean loss: 0.354986052466025
Epoch: 19, step: 760, loss: 0.35052916407585144, mean loss: 0.35498589440352224
Epoch: 19, step: 761, loss: 0.30428001284599304, mean loss: 0.3549840961950834
Epoch: 19, step: 762, loss: 0.3241439759731293, mean loss: 0.3549830025350167
Epoch: 19, step: 763, loss: 0.34936240315437317, mean loss: 0.3549828032229819
Epoch: 19, step: 764, loss: 0.32152894139289856, mean loss: 0.354981616957891
Epoch: 19, step: 765, loss: 0.30453965067863464, mean loss: 0.3549798283625332
Epoch: 19, step: 766, loss: 0.3001077473163605, mean loss: 0.35497788275103637
Epoch: 19, step: 767, loss: 0.2948792576789856, mean loss: 0.3549757518963678
Epoch: 19, step: 768, loss: 0.2866792380809784, mean loss: 0.3549733304635079
Epoch: 19, step: 769, loss: 0.3071434497833252, mean loss: 0.3549716347292428
Epoch: 19, step: 770, loss: 0.3242661952972412, mean loss: 0.3549705461540866
Epoch: 19, step: 771, loss: 0.30729615688323975, mean loss: 0.3549688560523682
Epoch: 19, step: 772, loss: 0.3825112581253052, mean loss: 0.35496983242168556
Epoch: 19, step: 773, loss: 0.31858423352241516, mean loss: 0.3549685426096012
Epoch: 19, step: 774, loss: 0.35396620631217957, mean loss: 0.3549685070796201
Epoch: 19, step: 775, loss: 0.35097381472587585, mean loss: 0.35496836548411626
Epoch: 19, step: 776, loss: 0.345588743686676, mean loss: 0.35496803302667473
Epoch: 19, step: 777, loss: 0.33224478363990784, mean loss: 0.35496722763752797
Epoch: 19, step: 778, loss: 0.332986056804657, mean loss: 0.3549664485777784
Epoch: 19, step: 779, loss: 0.3723142147064209, mean loss: 0.3549670633979559
Epoch: 19, step: 780, loss: 0.3248160183429718, mean loss: 0.35496599485611746
Epoch: 19, step: 781, loss: 0.33094435930252075, mean loss: 0.35496514356844455
Epoch: 19, step: 782, loss: 0.31446966528892517, mean loss: 0.35496370852544945
Epoch: 19, step: 783, loss: 0.2856746315956116, mean loss: 0.35496125320734423
Epoch: 19, step: 784, loss: 0.28699371218681335, mean loss: 0.35495884480434575
Epoch: 19, step: 785, loss: 0.32926660776138306, mean loss: 0.3549579344423217
Epoch: 19, step: 786, loss: 0.3267687261104584, mean loss: 0.35495693563963127
Epoch: 19, step: 787, loss: 0.3842684030532837, mean loss: 0.35495797416951413
Epoch: 19, step: 788, loss: 0.3562842905521393, mean loss: 0.3549580211603514
Epoch: 19, step: 789, loss: 0.31689703464508057, mean loss: 0.35495667272321846
Epoch: 19, step: 790, loss: 0.3186562657356262, mean loss: 0.35495538670603677
Epoch: 19, step: 791, loss: 0.33680108189582825, mean loss: 0.35495474357493256
Epoch: 19, step: 792, loss: 0.3447973430156708, mean loss: 0.35495438375345256
Epoch: 19, step: 793, loss: 0.3305225372314453, mean loss: 0.3549535182966151
Epoch: 19, step: 794, loss: 0.3288020193576813, mean loss: 0.3549525919568135
Epoch: 19, step: 795, loss: 0.32394173741340637, mean loss: 0.354951493527565
Epoch: 19, step: 796, loss: 0.3475522994995117, mean loss: 0.35495123145148283
Epoch: 19, step: 797, loss: 0.3403202295303345, mean loss: 0.3549507132464137
Epoch: 19, step: 798, loss: 0.3348459303379059, mean loss: 0.3549500011946018
Epoch: 19, step: 799, loss: 0.30522581934928894, mean loss: 0.3549482401738536
Epoch: 19, step: 800, loss: 0.2763660252094269, mean loss: 0.354945457221877
Epoch: 19, step: 801, loss: 0.36519402265548706, mean loss: 0.35494582015712145
Epoch: 19, step: 802, loss: 0.3162839114665985, mean loss: 0.3549444510608825
Epoch: 19, step: 803, loss: 0.3494977653026581, mean loss: 0.3549442581895738
Epoch: 19, step: 804, loss: 0.3237244486808777, mean loss: 0.35494315271138577
Epoch: 19, step: 805, loss: 0.340213418006897, mean loss: 0.3549426311571508
Epoch: 19, step: 806, loss: 0.36706864833831787, mean loss: 0.35494306050308366
Epoch: 19, step: 807, loss: 0.30731090903282166, mean loss: 0.3549413740510418
Epoch: 19, step: 808, loss: 0.3088778853416443, mean loss: 0.35493974319642296
Epoch: 19, step: 809, loss: 0.360267698764801, mean loss: 0.3549399318233283
Epoch: 19, step: 810, loss: 0.35039108991622925, mean loss: 0.35493977078527444
Epoch: 19, step: 811, loss: 0.3695407211780548, mean loss: 0.35494028766966956
Epoch: 19, step: 812, loss: 0.32688015699386597, mean loss: 0.35493929435554605
Epoch: 19, step: 813, loss: 0.3128166198730469, mean loss: 0.3549378032874228
Epoch: 19, step: 814, loss: 0.33005833625793457, mean loss: 0.35493692262949816
Epoch: 19, step: 815, loss: 0.3352327048778534, mean loss: 0.3549362251844411
Epoch: 19, step: 816, loss: 0.3147364556789398, mean loss: 0.35493480233484975
Epoch: 19, step: 817, loss: 0.35558512806892395, mean loss: 0.3549348253519707
Epoch: 19, step: 818, loss: 0.32901880145072937, mean loss: 0.3549339081329333
Epoch: 19, step: 819, loss: 0.30938827991485596, mean loss: 0.3549322962406549
Epoch: 19, step: 820, loss: 0.3326199948787689, mean loss: 0.3549315066203356
Epoch: 19, step: 821, loss: 0.34890255331993103, mean loss: 0.3549312932664783
Epoch: 19, step: 822, loss: 0.31307119131088257, mean loss: 0.3549298119648769
Epoch: 19, step: 823, loss: 0.31947553157806396, mean loss: 0.35492855739019935
Epoch: 19, step: 824, loss: 0.3126833736896515, mean loss: 0.35492706256752143
Epoch: 19, step: 825, loss: 0.34161266684532166, mean loss: 0.35492659146159394
Epoch: 19, step: 826, loss: 0.3510332703590393, mean loss: 0.35492645370830866
Epoch: 19, step: 827, loss: 0.32524171471595764, mean loss: 0.35492540344157386
Epoch: 19, step: 828, loss: 0.33318281173706055, mean loss: 0.35492463420075643
Epoch: 19, step: 829, loss: 0.36498787999153137, mean loss: 0.354924990220207
Epoch: 19, step: 830, loss: 0.33788183331489563, mean loss: 0.35492438728544545
Epoch: 19, step: 831, loss: 0.2851707637310028, mean loss: 0.35492191970289433
Epoch: 19, step: 832, loss: 0.3571939766407013, mean loss: 0.35492200007563257
Epoch: 19, step: 833, loss: 0.3762282729148865, mean loss: 0.35492275374640864
Epoch: 19, step: 834, loss: 0.35216623544692993, mean loss: 0.35492265624302005
Epoch: 19, step: 835, loss: 0.345672070980072, mean loss: 0.3549223290434847
Epoch: 19, step: 836, loss: 0.30802085995674133, mean loss: 0.3549206701650817
Epoch: 19, step: 837, loss: 0.37957045435905457, mean loss: 0.3549215419831546
Epoch: 19, step: 838, loss: 0.3180775046348572, mean loss: 0.3549202389225941
Epoch: 19, step: 839, loss: 0.3765759766101837, mean loss: 0.3549210047925081
Epoch: 19, step: 840, loss: 0.3371213674545288, mean loss: 0.3549203753184713
Epoch: 19, step: 841, loss: 0.31627529859542847, mean loss: 0.35491900870567256
Epoch: 19, step: 842, loss: 0.3440868854522705, mean loss: 0.3549186256608954
Epoch: 19, step: 843, loss: 0.3201389014720917, mean loss: 0.3549173958262352
Epoch: 19, step: 844, loss: 0.33294785022735596, mean loss: 0.3549166189956564
Epoch: 19, step: 845, loss: 0.3462778925895691, mean loss: 0.35491631354602743
Epoch: 19, step: 846, loss: 0.34113889932632446, mean loss: 0.3549158264189822
Epoch: 19, step: 847, loss: 0.32590624690055847, mean loss: 0.3549148007656263
Epoch: 19, step: 848, loss: 0.3222740888595581, mean loss: 0.3549136467719227
Epoch: 19, step: 849, loss: 0.38771694898605347, mean loss: 0.3549148064729131
Epoch: 19, step: 850, loss: 0.32526251673698425, mean loss: 0.35491375820728804
Epoch: 19, step: 851, loss: 0.3212412893772125, mean loss: 0.3549125678626603
Epoch: 19, step: 852, loss: 0.32438719272613525, mean loss: 0.35491148880807594
Epoch: 19, step: 853, loss: 0.3253887891769409, mean loss: 0.35491044523438803
Epoch: 19, step: 854, loss: 0.3807241916656494, mean loss: 0.35491135767107923
Epoch: 19, step: 855, loss: 0.31334763765335083, mean loss: 0.35490988857310035
Epoch: 19, step: 856, loss: 0.3650219142436981, mean loss: 0.35491024597689885
Epoch: 19, step: 857, loss: 0.3101601004600525, mean loss: 0.35490866436434787
Epoch: 19, step: 858, loss: 0.32299110293388367, mean loss: 0.3549075363360238
Epoch: 19, step: 859, loss: 0.3216564655303955, mean loss: 0.3549063612204313
Epoch: 19, step: 860, loss: 0.39704814553260803, mean loss: 0.3549078504872904
Epoch: 19, step: 861, loss: 0.33085936307907104, mean loss: 0.35490700065735864
Epoch: 19, step: 862, loss: 0.41320037841796875, mean loss: 0.3549090605668169
Epoch: 19, step: 863, loss: 0.35371166467666626, mean loss: 0.35490901825600807
Epoch: 19, step: 864, loss: 0.3140413761138916, mean loss: 0.35490757422073926
Epoch: 19, step: 865, loss: 0.3721785843372345, mean loss: 0.35490818446065575
Epoch: 19, step: 866, loss: 0.32642796635627747, mean loss: 0.3549071781991957
Epoch: 19, step: 867, loss: 0.3456380367279053, mean loss: 0.3549068507139826
Epoch: 19, step: 868, loss: 0.3158845901489258, mean loss: 0.35490547207909245
Epoch: 19, step: 869, loss: 0.3217843472957611, mean loss: 0.35490430196940603
Epoch: 19, step: 870, loss: 0.3466441035270691, mean loss: 0.35490401016178097
Epoch: 19, step: 871, loss: 0.32788798213005066, mean loss: 0.354903055801599
Epoch: 19, step: 872, loss: 0.32611992955207825, mean loss: 0.35490203905334755
Epoch: 19, step: 873, loss: 0.3650696873664856, mean loss: 0.35490239820729713
Epoch: 19, step: 874, loss: 0.36425134539604187, mean loss: 0.35490272843043263
Epoch: 19, step: 875, loss: 0.33970171213150024, mean loss: 0.35490219151971286
Epoch: 19, step: 876, loss: 0.40730369091033936, mean loss: 0.3549040423126133
Epoch: 19, step: 877, loss: 0.347262978553772, mean loss: 0.3549037724438643
Epoch: 19, step: 878, loss: 0.3610195219516754, mean loss: 0.354903988433605
Epoch: 19, step: 879, loss: 0.32652202248573303, mean loss: 0.35490298610396986
Epoch: 19, step: 880, loss: 0.2999021112918854, mean loss: 0.35490104377692916
Epoch: 19, step: 881, loss: 0.3247476816177368, mean loss: 0.35489997896436615
Epoch: 19, step: 882, loss: 0.36875519156455994, mean loss: 0.35490046821937515
Epoch: 19, step: 883, loss: 0.3544559180736542, mean loss: 0.354900452521983
Epoch: 19, step: 884, loss: 0.35292699933052063, mean loss: 0.3549003828403619
Epoch: 19, step: 885, loss: 0.32891562581062317, mean loss: 0.35489946536429984
Epoch: 19, step: 886, loss: 0.347144216299057, mean loss: 0.3548991915497652
Epoch: 19, step: 887, loss: 0.3825625777244568, mean loss: 0.3549001682263001
Epoch: 19, step: 888, loss: 0.3211238384246826, mean loss: 0.3548989757698199
Epoch: 19, step: 889, loss: 0.34187817573547363, mean loss: 0.3548985160931965
Epoch: 19, step: 890, loss: 0.3232293128967285, mean loss: 0.3548973981067102
Epoch: 19, step: 891, loss: 0.3448694348335266, mean loss: 0.3548970441119604
Epoch: 19, step: 892, loss: 0.2941875457763672, mean loss: 0.35489490109602845
Epoch: 19, step: 893, loss: 0.33796238899230957, mean loss: 0.3548943034076379
Epoch: 19, step: 894, loss: 0.3161584734916687, mean loss: 0.35489293614810186
Epoch: 19, step: 895, loss: 0.34734153747558594, mean loss: 0.354892669615606
Epoch: 19, step: 896, loss: 0.3516509234905243, mean loss: 0.3548925551996908
Epoch: 19, step: 897, loss: 0.31151241064071655, mean loss: 0.3548910241717894
Epoch: 19, step: 898, loss: 0.300691157579422, mean loss: 0.3548891113478405
Epoch: 19, step: 899, loss: 0.36024805903434753, mean loss: 0.35488930046937095
Epoch: 19, step: 900, loss: 0.35510918498039246, mean loss: 0.35488930822899656
Epoch: 19, step: 901, loss: 0.38645070791244507, mean loss: 0.3548904219773092
Epoch: 19, step: 902, loss: 0.3335384130477905, mean loss: 0.35488966852768394
Epoch: 19, step: 903, loss: 0.33270925283432007, mean loss: 0.3548888858736369
Epoch: 19, step: 904, loss: 0.34605586528778076, mean loss: 0.3548885742043032
Epoch: 19, step: 905, loss: 0.33718472719192505, mean loss: 0.35488794955371356
Epoch: 19, step: 906, loss: 0.29767659306526184, mean loss: 0.3548859310180438
Epoch: 19, step: 907, loss: 0.3145677149295807, mean loss: 0.3548845085576963
Epoch: 19, step: 908, loss: 0.31982189416885376, mean loss: 0.3548832715630098
Epoch: 19, step: 909, loss: 0.3314320147037506, mean loss: 0.35488244424145265
Epoch: 19, step: 910, loss: 0.339738667011261, mean loss: 0.3548819100128842
Epoch: 19, step: 911, loss: 0.3424997627735138, mean loss: 0.35488147322202634
Epoch: 19, step: 912, loss: 0.35311636328697205, mean loss: 0.3548814109584567
Epoch: 19, step: 913, loss: 0.34166210889816284, mean loss: 0.35488094466914244
Epoch: 19, step: 914, loss: 0.3148146867752075, mean loss: 0.35487953144710815
Epoch: 19, step: 915, loss: 0.3177105784416199, mean loss: 0.35487822046541356
Epoch: 19, step: 916, loss: 0.3192131519317627, mean loss: 0.35487696257141527
Epoch: 19, step: 917, loss: 0.33697018027305603, mean loss: 0.3548763310279894
Epoch: 19, step: 918, loss: 0.29732370376586914, mean loss: 0.35487430131092845
Epoch: 19, step: 919, loss: 0.3012130558490753, mean loss: 0.35487240889854793
Epoch: 19, step: 920, loss: 0.30825427174568176, mean loss: 0.3548707649257316
Epoch: 19, step: 921, loss: 0.3140077292919159, mean loss: 0.3548693239554363
Epoch: 19, step: 922, loss: 0.3238978683948517, mean loss: 0.35486823183457306
Epoch: 19, step: 923, loss: 0.32352495193481445, mean loss: 0.3548671266413467
Epoch: 19, step: 924, loss: 0.3098139762878418, mean loss: 0.35486553808133986
Epoch: 19, step: 925, loss: 0.32869184017181396, mean loss: 0.35486461523746743
Epoch: 19, step: 926, loss: 0.3618345558643341, mean loss: 0.354864860978067
Epoch: 19, step: 927, loss: 0.34843122959136963, mean loss: 0.3548646341542274
Epoch: 19, step: 928, loss: 0.32615387439727783, mean loss: 0.3548636219645656
Epoch: 19, step: 929, loss: 0.30126523971557617, mean loss: 0.3548617324354727
Epoch: 19, step: 930, loss: 0.28926151990890503, mean loss: 0.3548594198817121
Epoch: 19, step: 931, loss: 0.3353774845600128, mean loss: 0.3548587331242628
Epoch: 19, step: 932, loss: 0.33330947160720825, mean loss: 0.35485797351830145
Epoch: 19, step: 933, loss: 0.343883216381073, mean loss: 0.35485758667455325
Epoch: 19, step: 934, loss: 0.3482539653778076, mean loss: 0.3548573539149996
Epoch: 19, step: 935, loss: 0.3561859130859375, mean loss: 0.354857400741419
Epoch: 19, step: 936, loss: 0.32891684770584106, mean loss: 0.35485648647246487
Epoch: 19, step: 937, loss: 0.37972521781921387, mean loss: 0.35485736293441406
Epoch: 19, step: 938, loss: 0.32536235451698303, mean loss: 0.35485632346275175
Epoch: 19, step: 939, loss: 0.3758822977542877, mean loss: 0.35485706444013726
Epoch: 19, step: 940, loss: 0.29731860756874084, mean loss: 0.3548550367960286
Epoch: 19, step: 941, loss: 0.31496095657348633, mean loss: 0.3548536309858861
Epoch: 19, step: 942, loss: 0.32533419132232666, mean loss: 0.35485259079984494
Epoch: 19, step: 943, loss: 0.35196077823638916, mean loss: 0.354852488903701
Epoch: 19, step: 944, loss: 0.34342634677886963, mean loss: 0.35485208630540904
Epoch: 19, step: 945, loss: 0.33001551032066345, mean loss: 0.35485121122345625
Epoch: 19, step: 946, loss: 0.343397855758667, mean loss: 0.35485080769474314
Epoch: 19, step: 947, loss: 0.38254624605178833, mean loss: 0.3548517834359479
Epoch: 19, step: 948, loss: 0.3660065829753876, mean loss: 0.3548521764181406
Epoch: 19, step: 949, loss: 0.33098188042640686, mean loss: 0.35485133550022363
Epoch: 19, step: 950, loss: 0.40969982743263245, mean loss: 0.3548532676695946
Epoch: 19, step: 951, loss: 0.3446817398071289, mean loss: 0.3548529093658091
Epoch: 19, step: 952, loss: 0.3148269057273865, mean loss: 0.35485149945339095
Epoch: 19, step: 953, loss: 0.3755764663219452, mean loss: 0.35485222946279105
Epoch: 19, step: 954, loss: 0.35080400109291077, mean loss: 0.3548520868743521
Epoch: 19, step: 955, loss: 0.3390568792819977, mean loss: 0.3548515305483591
Epoch: 19, step: 956, loss: 0.3715561628341675, mean loss: 0.35485211888464924
Epoch: 19, step: 957, loss: 0.3247028589248657, mean loss: 0.3548510570666609
Epoch: 19, step: 958, loss: 0.3251791000366211, mean loss: 0.35485001209546774
Epoch: 19, step: 959, loss: 0.30354684591293335, mean loss: 0.3548482053914889
Epoch: 19, step: 960, loss: 0.31796303391456604, mean loss: 0.3548469064806365
Epoch: 19, step: 961, loss: 0.3901350200176239, mean loss: 0.35484814910735446
Epoch: 19, step: 962, loss: 0.35904017090797424, mean loss: 0.35484829671895346
Epoch: 19, step: 963, loss: 0.3245270848274231, mean loss: 0.3548472290706474
Epoch: 19, step: 964, loss: 0.3776935935020447, mean loss: 0.3548480334917745
Epoch: 19, step: 965, loss: 0.3106149137020111, mean loss: 0.35484647609723224
Epoch: 19, step: 966, loss: 0.2946251928806305, mean loss: 0.3548443558534828
Epoch: 19, step: 967, loss: 0.3099846839904785, mean loss: 0.35484277651001483
Epoch: 19, step: 968, loss: 0.33335185050964355, mean loss: 0.3548420199204707
Epoch: 19, step: 969, loss: 0.37470144033432007, mean loss: 0.35484271904813436
Epoch: 19, step: 970, loss: 0.34153464436531067, mean loss: 0.3548422505694255
Epoch: 19, step: 971, loss: 0.3632674813270569, mean loss: 0.3548425471489368
Epoch: 19, step: 972, loss: 0.3316836953163147, mean loss: 0.35484173195474367
Epoch: 19, step: 973, loss: 0.3204639256000519, mean loss: 0.3548405218946819
Epoch: 19, step: 974, loss: 0.3129976987838745, mean loss: 0.35483904912627845
Epoch: 19, step: 975, loss: 0.3489134907722473, mean loss: 0.35483884056798076
Epoch: 19, step: 976, loss: 0.30918142199516296, mean loss: 0.3548372336479592
Epoch: 19, step: 977, loss: 0.3211778402328491, mean loss: 0.35483604904201094
Epoch: 19, step: 978, loss: 0.41612508893013, mean loss: 0.3548382059675745
Epoch: 19, step: 979, loss: 0.3256309926509857, mean loss: 0.3548371781236374
Epoch: 19, step: 980, loss: 0.34037041664123535, mean loss: 0.35483666903536343
Epoch: 19, step: 981, loss: 0.3211711347103119, mean loss: 0.35483548438006307
Epoch: 19, step: 982, loss: 0.3581891357898712, mean loss: 0.3548356023874317
Epoch: 19, step: 983, loss: 0.3159584701061249, mean loss: 0.35483423443766815
Epoch: 19, step: 984, loss: 0.3359130918979645, mean loss: 0.35483356869253113
Epoch: 19, step: 985, loss: 0.3261299133300781, mean loss: 0.3548325587827654
Epoch: 19, step: 986, loss: 0.35203588008880615, mean loss: 0.3548324603878495
Epoch: 19, step: 987, loss: 0.281170129776001, mean loss: 0.3548298688338595
Epoch: 19, step: 988, loss: 0.3238169550895691, mean loss: 0.3548287777902801
Epoch: 19, step: 989, loss: 0.3179108202457428, mean loss: 0.35482747905118406
Epoch: 19, step: 990, loss: 0.3454396426677704, mean loss: 0.35482714880752897
Epoch: 19, step: 991, loss: 0.32082486152648926, mean loss: 0.35482595272313044
Epoch: 19, step: 992, loss: 0.32187744975090027, mean loss: 0.35482479374803555
Epoch: 19, step: 993, loss: 0.3332354724407196, mean loss: 0.35482403436283305
Epoch: 19, step: 994, loss: 0.338781476020813, mean loss: 0.354823470099939
Epoch: 19, step: 995, loss: 0.3189731240272522, mean loss: 0.35482220918455937
Epoch: 19, step: 996, loss: 0.3519301116466522, mean loss: 0.3548221074683304
Epoch: 19, step: 997, loss: 0.317538321018219, mean loss: 0.35482079622874224
Epoch: 19, step: 998, loss: 0.31991782784461975, mean loss: 0.35481956876370324
Epoch: 19, step: 999, loss: 0.34515514969825745, mean loss: 0.3548192288980729
Epoch: 19, step: 1000, loss: 0.3483119606971741, mean loss: 0.3548190000670358
Epoch: 19, step: 1001, loss: 0.3074515759944916, mean loss: 0.3548173344286621
Epoch: 19, step: 1002, loss: 0.2990935444831848, mean loss: 0.35481537501412763
Epoch: 19, step: 1003, loss: 0.3488064110279083, mean loss: 0.3548151637284741
Epoch: 19, step: 1004, loss: 0.3179476857185364, mean loss: 0.354813867449229
Epoch: 19, step: 1005, loss: 0.3433612883090973, mean loss: 0.3548134647848896
Epoch: 19, step: 1006, loss: 0.3228221833705902, mean loss: 0.35481234003428613
Epoch: 19, step: 1007, loss: 0.4005906581878662, mean loss: 0.3548139494534309
Epoch: 19, step: 1008, loss: 0.3280082046985626, mean loss: 0.35481300708237257
Epoch: 19, step: 1009, loss: 0.33505043387413025, mean loss: 0.3548123123424018
Epoch: 19, step: 1010, loss: 0.3066951334476471, mean loss: 0.3548106208747991
Epoch: 19, step: 1011, loss: 0.34193551540374756, mean loss: 0.35481016829094536
Epoch: 19, step: 1012, loss: 0.30602696537971497, mean loss: 0.3548084535310975
Epoch: 19, step: 1013, loss: 0.3368368446826935, mean loss: 0.35480782184010107
Epoch: 19, step: 1014, loss: 0.3763616383075714, mean loss: 0.3548085794168635
Epoch: 19, step: 1015, loss: 0.317982017993927, mean loss: 0.35480728507687254
Epoch: 19, step: 1016, loss: 0.33713090419769287, mean loss: 0.35480666382846715
Epoch: 19, step: 1017, loss: 0.31143900752067566, mean loss: 0.3548051396963132
Epoch: 19, step: 1018, loss: 0.30679449439048767, mean loss: 0.35480345244819145
Epoch: 19, step: 1019, loss: 0.36557695269584656, mean loss: 0.3548038310502524
Epoch: 19, step: 1020, loss: 0.3385527431964874, mean loss: 0.35480325997502127
Epoch: 19, step: 1021, loss: 0.3166067898273468, mean loss: 0.3548019177700122
Epoch: 19, step: 1022, loss: 0.344479501247406, mean loss: 0.35480155505816274
Epoch: 19, step: 1023, loss: 0.31273412704467773, mean loss: 0.3548000769334961
Epoch: 19, step: 1024, loss: 0.31448429822921753, mean loss: 0.35479866040636404
Epoch: 19, step: 1025, loss: 0.3519562780857086, mean loss: 0.3547985605404965
Epoch: 19, step: 1026, loss: 0.3573468029499054, mean loss: 0.35479865006874056
Epoch: 19, step: 1027, loss: 0.34869274497032166, mean loss: 0.3547984355554923
Epoch: 19, step: 1028, loss: 0.38324880599975586, mean loss: 0.3547994350415434
Epoch: 19, step: 1029, loss: 0.3331909477710724, mean loss: 0.3547986759434168
Epoch: 19, step: 1030, loss: 0.3296159505844116, mean loss: 0.3547977913147113
Epoch: 19, step: 1031, loss: 0.3449470102787018, mean loss: 0.35479744528474655
Epoch: 19, step: 1032, loss: 0.39233893156051636, mean loss: 0.35479876396423216
Epoch: 19, step: 1033, loss: 0.3366025984287262, mean loss: 0.3547981248295102
Epoch: 19, step: 1034, loss: 0.3365267515182495, mean loss: 0.35479748307567954
Epoch: 19, step: 1035, loss: 0.3575358986854553, mean loss: 0.35479757925492966
Epoch: 19, step: 1036, loss: 0.3471963703632355, mean loss: 0.3547973122929344
Epoch: 19, step: 1037, loss: 0.35978102684020996, mean loss: 0.3547974873197851
Epoch: 19, step: 1038, loss: 0.3277546465396881, mean loss: 0.3547965376151045
Epoch: 19, step: 1039, loss: 0.343505322933197, mean loss: 0.3547961410982242
Epoch: 19, step: 1040, loss: 0.3623160421848297, mean loss: 0.35479640516751126
Epoch: 19, step: 1041, loss: 0.3241259753704071, mean loss: 0.35479532818072157
Epoch: 19, step: 1042, loss: 0.32090601325035095, mean loss: 0.35479413820512795
Epoch: 19, step: 1043, loss: 0.3066798150539398, mean loss: 0.35479244879771393
Epoch: 19, step: 1044, loss: 0.3143105208873749, mean loss: 0.35479102743161334
Epoch: 19, step: 1045, loss: 0.28789788484573364, mean loss: 0.35478867882046994
Epoch: 19, step: 1046, loss: 0.3323175013065338, mean loss: 0.3547878898875094
Epoch: 19, step: 1047, loss: 0.3157719373703003, mean loss: 0.35478652013773704
Epoch: 19, step: 1048, loss: 0.3242727220058441, mean loss: 0.3547854489143517
Epoch: 19, step: 1049, loss: 0.3137512803077698, mean loss: 0.3547840084113465
Epoch: 19, step: 1050, loss: 0.3554031550884247, mean loss: 0.3547840301457052
Epoch: 19, step: 1051, loss: 0.3489413559436798, mean loss: 0.35478382505323813
Epoch: 19, step: 1052, loss: 0.3259440064430237, mean loss: 0.35478281273906037
Epoch: 19, step: 1053, loss: 0.3479399085044861, mean loss: 0.35478257255288154
Epoch: 19, step: 1054, loss: 0.33218175172805786, mean loss: 0.3547817792911208
Epoch: 19, step: 1055, loss: 0.3197101354598999, mean loss: 0.35478054836160267
Epoch: 19, step: 1056, loss: 0.33311381936073303, mean loss: 0.35477978793872683
Epoch: 19, step: 1057, loss: 0.30651381611824036, mean loss: 0.35477809403924554
Epoch: 19, step: 1058, loss: 0.33952200412750244, mean loss: 0.35477755864391614
Epoch: 19, step: 1059, loss: 0.352751761674881, mean loss: 0.3547774875533431
Epoch: 19, step: 1060, loss: 0.3332849144935608, mean loss: 0.3547767333485826
Epoch: 19, step: 1061, loss: 0.32685837149620056, mean loss: 0.3547757536881906
Epoch: 19, step: 1062, loss: 0.42138025164604187, mean loss: 0.3547780907701218
Epoch: 19, step: 1063, loss: 0.3710194528102875, mean loss: 0.3547786606424741
Epoch: 19, step: 1064, loss: 0.30871203541755676, mean loss: 0.354777044326372
Epoch: 19, step: 1065, loss: 0.34851542115211487, mean loss: 0.35477682463571264
Epoch: 19, step: 1066, loss: 0.34307897090911865, mean loss: 0.3547764142279055
Epoch: 19, step: 1067, loss: 0.3392805755138397, mean loss: 0.3547758705905664
Epoch: 19, step: 1068, loss: 0.3134044408798218, mean loss: 0.3547744192160809
Epoch: 19, step: 1069, loss: 0.3346054255962372, mean loss: 0.354773711681049
Epoch: 19, step: 1070, loss: 0.3075258135795593, mean loss: 0.3547720542671471
Epoch: 19, step: 1071, loss: 0.3414331078529358, mean loss: 0.35477158636528044
Epoch: 19, step: 1072, loss: 0.363101065158844, mean loss: 0.35477187853543
Epoch: 19, step: 1073, loss: 0.37214595079421997, mean loss: 0.35477248793817495
Epoch: 19, step: 1074, loss: 0.34024912118911743, mean loss: 0.3547719785429679
Epoch: 19, step: 1075, loss: 0.3328835666179657, mean loss: 0.3547712108517528
Epoch: 19, step: 1076, loss: 0.38272228837013245, mean loss: 0.3547721911441639
Epoch: 19, step: 1077, loss: 0.3326808214187622, mean loss: 0.3547714163889656
Epoch: 19, step: 1078, loss: 0.31638672947883606, mean loss: 0.3547700702663315
Epoch: 19, step: 1079, loss: 0.2799113988876343, mean loss: 0.3547674451200495
Epoch: 19, step: 1080, loss: 0.32453587651252747, mean loss: 0.35476638499561114
Epoch: 19, step: 1081, loss: 0.3418147563934326, mean loss: 0.35476593083933783
Epoch: 19, step: 1082, loss: 0.3259301483631134, mean loss: 0.35476491973156843
Epoch: 19, step: 1083, loss: 0.31039929389953613, mean loss: 0.35476336413458975
Epoch: 19, step: 1084, loss: 0.35179439187049866, mean loss: 0.35476326003682795
Epoch: 19, step: 1085, loss: 0.3488750159740448, mean loss: 0.3547630535911347
Epoch: 19, step: 1086, loss: 0.39539822936058044, mean loss: 0.3547644782370615
Epoch: 19, step: 1087, loss: 0.366745263338089, mean loss: 0.35476489826178104
Epoch: 19, step: 1088, loss: 0.30316171050071716, mean loss: 0.3547630892105011
Epoch: 19, step: 1089, loss: 0.30156275629997253, mean loss: 0.35476122423353584
Epoch: 19, step: 1090, loss: 0.30226194858551025, mean loss: 0.3547593838971651
Epoch: 19, step: 1091, loss: 0.3659048080444336, mean loss: 0.35475977458084945
Epoch: 19, step: 1092, loss: 0.3285451829433441, mean loss: 0.3547588557056124
Epoch: 19, step: 1093, loss: 0.3489282727241516, mean loss: 0.35475865133887624
Epoch: 19, step: 1094, loss: 0.3487117886543274, mean loss: 0.35475843939878704
Epoch: 19, step: 1095, loss: 0.35451871156692505, mean loss: 0.35475843099671805
Epoch: 19, step: 1096, loss: 0.2992367446422577, mean loss: 0.3547564851204921
Epoch: 19, step: 1097, loss: 0.37659209966659546, mean loss: 0.3547572503694774
Epoch: 19, step: 1098, loss: 0.34737294912338257, mean loss: 0.35475699158898866
Epoch: 19, step: 1099, loss: 0.3565891683101654, mean loss: 0.3547570557947891
Epoch: 19, step: 1100, loss: 0.34716346859931946, mean loss: 0.35475678969859137
Epoch: 19, step: 1101, loss: 0.37724173069000244, mean loss: 0.35475757759336296
Epoch: 19, step: 1102, loss: 0.32317113876342773, mean loss: 0.35475647081180683
Epoch: 19, step: 1103, loss: 0.3289335072040558, mean loss: 0.35475556601280167
Epoch: 19, step: 1104, loss: 0.35293394327163696, mean loss: 0.35475550218803237
Epoch: 19, step: 1105, loss: 0.3642108738422394, mean loss: 0.35475583346725786
Epoch: 19, step: 1106, loss: 0.3131328225135803, mean loss: 0.3547543752109094
Epoch: 19, step: 1107, loss: 0.3403618335723877, mean loss: 0.35475387098789796
Epoch: 19, step: 1108, loss: 0.3328999876976013, mean loss: 0.3547531053938083
Epoch: 19, step: 1109, loss: 0.2979797124862671, mean loss: 0.35475111655499
Epoch: 19, step: 1110, loss: 0.38013720512390137, mean loss: 0.35475200582841865
Epoch: 19, step: 1111, loss: 0.34702351689338684, mean loss: 0.35475173510931624
Epoch: 19, step: 1112, loss: 0.39149001240730286, mean loss: 0.35475302195919883
Epoch: 19, step: 1113, loss: 0.3218252956867218, mean loss: 0.3547518686237777
Epoch: 19, step: 1114, loss: 0.34501349925994873, mean loss: 0.3547515275369729
Epoch: 19, step: 1115, loss: 0.3171190023422241, mean loss: 0.35475020950232755
Epoch: 19, step: 1116, loss: 0.3558538854122162, mean loss: 0.35475024815591594
Epoch: 19, step: 1117, loss: 0.3351379930973053, mean loss: 0.35474956130801166
Epoch: 19, step: 1118, loss: 0.3373628556728363, mean loss: 0.35474895242320564
Epoch: 19, step: 1119, loss: 0.34702134132385254, mean loss: 0.3547486818106864
Epoch: 19, step: 1120, loss: 0.35368260741233826, mean loss: 0.3547486444792301
Epoch: 19, step: 1121, loss: 0.31835493445396423, mean loss: 0.3547473701004212
Epoch: 19, step: 1122, loss: 0.4068261981010437, mean loss: 0.3547491936526464
Epoch: 19, step: 1123, loss: 0.3268737196922302, mean loss: 0.354748217620645
Epoch: 19, step: 1124, loss: 0.3385031223297119, mean loss: 0.35474764883470294
Epoch: 19, step: 1125, loss: 0.30758559703826904, mean loss: 0.35474599761798853
Epoch: 19, step: 1126, loss: 0.3163589537143707, mean loss: 0.3547446536749887
Epoch: 19, step: 1127, loss: 0.3515763282775879, mean loss: 0.35474454275476053
Epoch: 19, step: 1128, loss: 0.3533298373222351, mean loss: 0.3547444932289271
Epoch: 19, step: 1129, loss: 0.3357076644897461, mean loss: 0.35474382681330224
Epoch: 19, step: 1130, loss: 0.35352566838264465, mean loss: 0.35474378417114766
Epoch: 19, step: 1131, loss: 0.320801705121994, mean loss: 0.3547425960558071
Epoch: 19, step: 1132, loss: 0.33305487036705017, mean loss: 0.3547418369208815
Epoch: 19, step: 1133, loss: 0.29500019550323486, mean loss: 0.3547397458588788
Epoch: 19, step: 1134, loss: 0.32554978132247925, mean loss: 0.3547387241947951
Epoch: 19, step: 1135, loss: 0.3959246575832367, mean loss: 0.3547401656736341
Epoch: 19, step: 1136, loss: 0.30845749378204346, mean loss: 0.3547385458692071
Epoch: 19, step: 1137, loss: 0.32284581661224365, mean loss: 0.3547374297241362
Epoch: 19, step: 1138, loss: 0.3311923146247864, mean loss: 0.3547366057481047
Epoch: 19, step: 1139, loss: 0.32023128867149353, mean loss: 0.3547353982552059
Epoch: 19, step: 1140, loss: 0.3419593572616577, mean loss: 0.3547349511809506
Epoch: 19, step: 1141, loss: 0.29942378401756287, mean loss: 0.3547330157352524
Epoch: 19, step: 1142, loss: 0.33456891775131226, mean loss: 0.3547323101787954
Epoch: 19, step: 1143, loss: 0.33704331517219543, mean loss: 0.35473169124964893
Epoch: 19, step: 1144, loss: 0.35089850425720215, mean loss: 0.3547315571330333
Epoch: 19, step: 1145, loss: 0.3570246696472168, mean loss: 0.35473163736228647
Epoch: 19, step: 1146, loss: 0.3376065790653229, mean loss: 0.3547310382278955
Epoch: 19, step: 1147, loss: 0.33645227551460266, mean loss: 0.3547303987525697
Epoch: 19, step: 1148, loss: 0.3237377107143402, mean loss: 0.35472931452349715
Epoch: 19, step: 1149, loss: 0.32152795791625977, mean loss: 0.35472815306835803
Epoch: 19, step: 1150, loss: 0.3785052001476288, mean loss: 0.35472898481170567
Epoch: 19, step: 1151, loss: 0.33518198132514954, mean loss: 0.3547283010631578
Epoch: 19, step: 1152, loss: 0.3486484885215759, mean loss: 0.35472808840050635
Epoch: 19, step: 1153, loss: 0.31418880820274353, mean loss: 0.35472667044736894
Epoch: 19, step: 1154, loss: 0.33201053738594055, mean loss: 0.35472587592695826
Epoch: 19, step: 1155, loss: 0.3431777358055115, mean loss: 0.35472547203285776
Epoch: 19, step: 1156, loss: 0.3242836892604828, mean loss: 0.35472440737427796
Epoch: 19, step: 1157, loss: 0.33744651079177856, mean loss: 0.3547238031252543
Epoch: 19, step: 1158, loss: 0.3301771879196167, mean loss: 0.35472294470192134
Epoch: 19, step: 1159, loss: 0.3757645785808563, mean loss: 0.35472368052629816
Epoch: 19, step: 1160, loss: 0.3089800179004669, mean loss: 0.35472208092974516
Epoch: 19, step: 1161, loss: 0.3283390700817108, mean loss: 0.3547211583823346
Epoch: 19, step: 1162, loss: 0.3400290310382843, mean loss: 0.35472064465362574
Epoch: 19, step: 1163, loss: 0.34292009472846985, mean loss: 0.354720232046985
Epoch: 19, step: 1164, loss: 0.37009647488594055, mean loss: 0.35472076965905586
Epoch: 19, step: 1165, loss: 0.36608144640922546, mean loss: 0.3547211668577395
Epoch: 19, step: 1166, loss: 0.3247494101524353, mean loss: 0.3547201190041331
Epoch: 19, step: 1167, loss: 0.3531295955181122, mean loss: 0.3547200633992007
Epoch: 19, step: 1168, loss: 0.3032948076725006, mean loss: 0.35471826562763187
Epoch: 19, step: 1169, loss: 0.3111492395401001, mean loss: 0.35471674255463714
Epoch: 19, step: 1170, loss: 0.3373776376247406, mean loss: 0.3547161364405766
Epoch: 19, step: 1171, loss: 0.3584606349468231, mean loss: 0.3547162673304852
Epoch: 19, step: 1172, loss: 0.3354799449443817, mean loss: 0.3547155949433907
Epoch: 19, step: 1173, loss: 0.36318662762641907, mean loss: 0.35471589102981793
Epoch: 19, step: 1174, loss: 0.3560131788253784, mean loss: 0.3547159363720917
Epoch: 19, step: 1175, loss: 0.31986430287361145, mean loss: 0.3547147182945893
Epoch: 19, step: 1176, loss: 0.35744041204452515, mean loss: 0.35471481355526624
Epoch: 19, step: 1177, loss: 0.3163159489631653, mean loss: 0.35471347159452704
Epoch: 19, step: 1178, loss: 0.36063534021377563, mean loss: 0.3547136785443303
Epoch: 19, step: 1179, loss: 0.33312246203422546, mean loss: 0.3547129240287967
Epoch: 19, step: 1180, loss: 0.31989815831184387, mean loss: 0.35471170745243585
Epoch: 19, step: 1181, loss: 0.33422282338142395, mean loss: 0.354710991508482
Epoch: 19, step: 1182, loss: 0.3427141010761261, mean loss: 0.3547105723152736
Epoch: 19, step: 1183, loss: 0.38146349787712097, mean loss: 0.35471150707857063
Epoch: 19, step: 1184, loss: 0.32057905197143555, mean loss: 0.35471031451174534
Epoch: 19, step: 1185, loss: 0.34365206956863403, mean loss: 0.3547099281570202
Epoch: 19, step: 1186, loss: 0.32376745343208313, mean loss: 0.3547088471216736
Epoch: 19, step: 1187, loss: 0.3138422966003418, mean loss: 0.3547074194193776
Epoch: 19, step: 1188, loss: 0.33301109075546265, mean loss: 0.3547066614690313
Epoch: 19, step: 1189, loss: 0.30064964294433594, mean loss: 0.3547047730802056
Epoch: 19, step: 1190, loss: 0.33355674147605896, mean loss: 0.354704034335957
Epoch: 19, step: 1191, loss: 0.32477593421936035, mean loss: 0.3547029889223718
Epoch: 19, step: 1192, loss: 0.3290187120437622, mean loss: 0.35470209178042206
Epoch: 19, step: 1193, loss: 0.3209463059902191, mean loss: 0.35470091274494214
Epoch: 19, step: 1194, loss: 0.34885460138320923, mean loss: 0.35470070854979135
Epoch: 19, step: 1195, loss: 0.3181896209716797, mean loss: 0.3546994333651176
Epoch: 19, step: 1196, loss: 0.30749210715293884, mean loss: 0.35469778466165613
Epoch: 19, step: 1197, loss: 0.3466600477695465, mean loss: 0.35469750395561117
Epoch: 19, step: 1198, loss: 0.2997743487358093, mean loss: 0.3546955859128237
Epoch: 19, step: 1199, loss: 0.366356760263443, mean loss: 0.354695993133607
Epoch: 19, step: 1200, loss: 0.3215283453464508, mean loss: 0.3546948349240254
Epoch: 19, step: 1201, loss: 0.3413538932800293, mean loss: 0.35469436907649265
Epoch: 19, step: 1202, loss: 0.3375055193901062, mean loss: 0.3546937688862037
Epoch: 19, step: 1203, loss: 0.3098318874835968, mean loss: 0.35469220247973016
Epoch: 19, step: 1204, loss: 0.3241332173347473, mean loss: 0.3546911355133133
Epoch: 19, step: 1205, loss: 0.3621175289154053, mean loss: 0.35469139479665257
Epoch: 19, step: 1206, loss: 0.3256072700023651, mean loss: 0.35469037939586373
Epoch: 19, step: 1207, loss: 0.3487585186958313, mean loss: 0.3546901723067456
Epoch: 19, step: 1208, loss: 0.32335466146469116, mean loss: 0.3546890783807256
Epoch: 19, step: 1209, loss: 0.2875702381134033, mean loss: 0.3546867353366613
Epoch: 19, step: 1210, loss: 0.35534417629241943, mean loss: 0.3546867582863927
Epoch: 19, step: 1211, loss: 0.3369170129299164, mean loss: 0.35468613800765225
Epoch: 19, step: 1212, loss: 0.3711197078227997, mean loss: 0.3546867116252241
Epoch: 19, step: 1213, loss: 0.35553497076034546, mean loss: 0.3546867412328728
Epoch: 19, step: 1214, loss: 0.328033983707428, mean loss: 0.3546858109771217
Epoch: 19, step: 1215, loss: 0.31811434030532837, mean loss: 0.3546845345751019
Epoch: 19, step: 1216, loss: 0.3243277668952942, mean loss: 0.3546834751129974
Epoch: 19, step: 1217, loss: 0.31226760149002075, mean loss: 0.3546819948354228
Epoch: 19, step: 1218, loss: 0.32947787642478943, mean loss: 0.35468111526402474
Epoch: 19, step: 1219, loss: 0.3666069507598877, mean loss: 0.35468153143639686
Epoch: 19, step: 1220, loss: 0.3626003861427307, mean loss: 0.35468180776869634
Epoch: 19, step: 1221, loss: 0.333812415599823, mean loss: 0.35468107954648376
Epoch: 19, step: 1222, loss: 0.2959878742694855, mean loss: 0.3546790315613734
Epoch: 19, step: 1223, loss: 0.3181734085083008, mean loss: 0.35467775781318595
Epoch: 19, step: 1224, loss: 0.3032667636871338, mean loss: 0.3546759640518334
Epoch: 19, step: 1225, loss: 0.3268343210220337, mean loss: 0.35467499267359637
Epoch: 19, step: 1226, loss: 0.328850656747818, mean loss: 0.3546740917094291
Epoch: 19, step: 1227, loss: 0.35454583168029785, mean loss: 0.3546740872348258
Epoch: 19, step: 1228, loss: 0.3381959795951843, mean loss: 0.3546735123836959
Epoch: 19, step: 1229, loss: 0.3378421664237976, mean loss: 0.35467292523006577
Epoch: 19, step: 1230, loss: 0.3209553360939026, mean loss: 0.3546717490487724
Epoch: 19, step: 1231, loss: 0.3293193280696869, mean loss: 0.3546708647031264
Epoch: 19, step: 1232, loss: 0.34340015053749084, mean loss: 0.35467047157067794
Epoch: 19, step: 1233, loss: 0.30831485986709595, mean loss: 0.3546688547024637
Epoch: 19, step: 1234, loss: 0.3278823494911194, mean loss: 0.3546679204307183
Epoch: 19, step: 1235, loss: 0.33700844645500183, mean loss: 0.35466730451714495
Epoch: 19, step: 1236, loss: 0.31693196296691895, mean loss: 0.35466598845877817
Epoch: 19, step: 1237, loss: 0.36766165494918823, mean loss: 0.354666441680041
Epoch: 19, step: 1238, loss: 0.3466576933860779, mean loss: 0.35466616238629056
Epoch: 19, step: 1239, loss: 0.3259018063545227, mean loss: 0.35466515930510656
Epoch: 19, step: 1240, loss: 0.3643476665019989, mean loss: 0.354665496945278
Epoch: 19, step: 1241, loss: 0.3160994350910187, mean loss: 0.35466415214920244
Epoch: 19, step: 1242, loss: 0.3536147475242615, mean loss: 0.3546641155578072
Epoch: 19, step: 1243, loss: 0.34132617712020874, mean loss: 0.35466365049719223
Epoch: 19, step: 1244, loss: 0.3138367235660553, mean loss: 0.3546622270138084
Epoch: 19, step: 1245, loss: 0.36551862955093384, mean loss: 0.3546626055230664
Epoch: 19, step: 1246, loss: 0.3413996994495392, mean loss: 0.3546621431270104
Epoch: 19, step: 1247, loss: 0.35850751399993896, mean loss: 0.3546622771867954
Epoch: 19, step: 1248, loss: 0.3316067159175873, mean loss: 0.3546614734370562
Epoch: 19, step: 1249, loss: 0.32300400733947754, mean loss: 0.35466036985112237
Epoch: 19, step: 1250, loss: 0.3686574399471283, mean loss: 0.35466085777492395
Epoch: 19, step: 1251, loss: 0.3363375961780548, mean loss: 0.35466021906669765
Epoch: 19, step: 1252, loss: 0.33184486627578735, mean loss: 0.35465942380186477
Epoch: 19, step: 1253, loss: 0.36247730255126953, mean loss: 0.35465969629676714
Epoch: 19, step: 1254, loss: 0.365960955619812, mean loss: 0.35466009019239025
Epoch: 19, step: 1255, loss: 0.28543782234191895, mean loss: 0.35465767759417993
Epoch: 19, step: 1256, loss: 0.3260927200317383, mean loss: 0.35465668205667733
Epoch: 19, step: 1257, loss: 0.35794374346733093, mean loss: 0.35465679661238275
Epoch: 19, step: 1258, loss: 0.32044586539268494, mean loss: 0.35465560438616844
Epoch: 19, step: 1259, loss: 0.3040951192378998, mean loss: 0.3546538424512246
Epoch: 19, step: 1260, loss: 0.31623128056526184, mean loss: 0.3546525035460469
Epoch: 19, step: 1261, loss: 0.33669906854629517, mean loss: 0.3546518779472247
Epoch: 19, step: 1262, loss: 0.29829496145248413, mean loss: 0.35464991422317527
Epoch: 19, step: 1263, loss: 0.28790920972824097, mean loss: 0.35464758876308833
Epoch: 19, step: 1264, loss: 0.32833853363990784, mean loss: 0.35464667210321155
Epoch: 19, step: 1265, loss: 0.3261300027370453, mean loss: 0.35464567856027496
Epoch: 19, step: 1266, loss: 0.3414486050605774, mean loss: 0.35464521877999067
Epoch: 19, step: 1267, loss: 0.3631824553012848, mean loss: 0.3546455162032251
Epoch: 19, step: 1268, loss: 0.3251827359199524, mean loss: 0.35464448980433
Epoch: 19, step: 1269, loss: 0.36574485898017883, mean loss: 0.3546448764959337
Epoch: 19, step: 1270, loss: 0.35647690296173096, mean loss: 0.35464494031404303
Epoch: 19, step: 1271, loss: 0.34513139724731445, mean loss: 0.35464460892407973
Epoch: 19, step: 1272, loss: 0.3491686284542084, mean loss: 0.3546444181831807
Epoch: 19, step: 1273, loss: 0.33580195903778076, mean loss: 0.35464376188018015
Epoch: 19, step: 1274, loss: 0.31192630529403687, mean loss: 0.354642274037312
Epoch: 19, step: 1275, loss: 0.32781052589416504, mean loss: 0.35464133952393284
Epoch: 19, step: 1276, loss: 0.30539366602897644, mean loss: 0.3546396243540274
Epoch: 19, step: 1277, loss: 0.3230433464050293, mean loss: 0.3546385239751896
Epoch: 19, step: 1278, loss: 0.34016910195350647, mean loss: 0.35463802007750467
Epoch: 19, step: 1279, loss: 0.3381306827068329, mean loss: 0.35463744522942797
Epoch: 19, step: 1280, loss: 0.30352434515953064, mean loss: 0.3546356653394649
Epoch: 19, step: 1281, loss: 0.3518795371055603, mean loss: 0.35463556936731383
Epoch: 19, step: 1282, loss: 0.316681832075119, mean loss: 0.35463424781234004
Epoch: 19, step: 1283, loss: 0.34862327575683594, mean loss: 0.35463403851665565
Epoch: 19, step: 1284, loss: 0.3287879526615143, mean loss: 0.3546331386146378
Epoch: 19, step: 1285, loss: 0.35018062591552734, mean loss: 0.3546329835936539
Epoch: 19, step: 1286, loss: 0.31585848331451416, mean loss: 0.3546316336476079
Epoch: 19, step: 1287, loss: 0.3335435092449188, mean loss: 0.35463089948368914
Epoch: 19, step: 1288, loss: 0.30013230443000793, mean loss: 0.3546290022305976
Epoch: 19, step: 1289, loss: 0.33039388060569763, mean loss: 0.35462815856556856
Epoch: 19, step: 1290, loss: 0.3289507329463959, mean loss: 0.3546272647226466
Epoch: 19, step: 1291, loss: 0.31023404002189636, mean loss: 0.35462571942799676
Epoch: 19, step: 1292, loss: 0.34426936507225037, mean loss: 0.35462535894366537
Epoch: 19, step: 1293, loss: 0.3078429102897644, mean loss: 0.35462373059529595
Epoch: 19, step: 1294, loss: 0.3274403512477875, mean loss: 0.35462278446117784
Epoch: 19, step: 1295, loss: 0.3497372567653656, mean loss: 0.35462261442332127
Epoch: 19, step: 1296, loss: 0.3230117857456207, mean loss: 0.35462151426570887
Epoch: 19, step: 1297, loss: 0.30758020281791687, mean loss: 0.3546198771350815
Epoch: 19, step: 1298, loss: 0.3248845338821411, mean loss: 0.3546188423223704
Epoch: 19, step: 1299, loss: 0.3438034951686859, mean loss: 0.354618465953107
Epoch: 19, step: 1300, loss: 0.33592361211776733, mean loss: 0.3546178154031597
Epoch: 19, step: 1301, loss: 0.3156207799911499, mean loss: 0.3546164584181429
Epoch: 19, step: 1302, loss: 0.32812970876693726, mean loss: 0.35461553678727015
Epoch: 19, step: 1303, loss: 0.33091437816619873, mean loss: 0.3546147121123007
Epoch: 19, step: 1304, loss: 0.32355034351348877, mean loss: 0.35461363127417406
Epoch: 19, step: 1305, loss: 0.34956642985343933, mean loss: 0.3546134556704784
Epoch: 19, step: 1306, loss: 0.30428001284599304, mean loss: 0.3546117045156642
Epoch: 19, step: 1307, loss: 0.35528630018234253, mean loss: 0.3546117279847592
Epoch: 19, step: 1308, loss: 0.34810176491737366, mean loss: 0.35461150151187465
Epoch: 19, step: 1309, loss: 0.33599892258644104, mean loss: 0.35461085402774034
Epoch: 19, step: 1310, loss: 0.33577558398246765, mean loss: 0.35461019881954314
Epoch: 19, step: 1311, loss: 0.3337149918079376, mean loss: 0.35460947197917125
Epoch: 19, step: 1312, loss: 0.3633778393268585, mean loss: 0.3546097769764702
Epoch: 19, step: 1313, loss: 0.3252067267894745, mean loss: 0.3546087542616811
Epoch: 19, step: 1314, loss: 0.3166106641292572, mean loss: 0.3546074326349505
Epoch: 19, step: 1315, loss: 0.324875146150589, mean loss: 0.3546063985404011
Epoch: 19, step: 1316, loss: 0.31060341000556946, mean loss: 0.35460486816136116
Epoch: 19, step: 1317, loss: 0.32482340931892395, mean loss: 0.3546038324286338
Epoch: 19, step: 1318, loss: 0.33298376202583313, mean loss: 0.3546030805569453
Epoch: 19, step: 1319, loss: 0.3339858949184418, mean loss: 0.3546023635870733
Epoch: 19, step: 1320, loss: 0.35506966710090637, mean loss: 0.35460237983715204
Epoch: 19, step: 1321, loss: 0.3454897403717041, mean loss: 0.35460206296395275
Epoch: 19, step: 1322, loss: 0.3160663843154907, mean loss: 0.3546007230119847
Epoch: 19, step: 1323, loss: 0.3557465672492981, mean loss: 0.3546007628535785
Epoch: 19, step: 1324, loss: 0.30992329120635986, mean loss: 0.3545992094489108
Epoch: 19, step: 1325, loss: 0.3294505476951599, mean loss: 0.3545983350778047
Epoch: 19, step: 1326, loss: 0.37263011932373047, mean loss: 0.3545989619868283
Epoch: 19, step: 1327, loss: 0.33199891448020935, mean loss: 0.354598176280824
Epoch: 19, step: 1328, loss: 0.2724972665309906, mean loss: 0.3545953220861517
Epoch: 19, step: 1329, loss: 0.3603750169277191, mean loss: 0.3545955230071988
Epoch: 19, step: 1330, loss: 0.3219907581806183, mean loss: 0.35459438959861167
Epoch: 19, step: 1331, loss: 0.28713512420654297, mean loss: 0.3545920446575177
Epoch: 19, step: 1332, loss: 0.33037224411964417, mean loss: 0.3545912027860401
Epoch: 19, step: 1333, loss: 0.29583612084388733, mean loss: 0.3545891605517008
Epoch: 19, step: 1334, loss: 0.33026692271232605, mean loss: 0.3545883151783096
Epoch: 19, step: 1335, loss: 0.39761945605278015, mean loss: 0.35458981076919216
Epoch: 19, step: 1336, loss: 0.383629709482193, mean loss: 0.35459082004520487
Epoch: 19, step: 1337, loss: 0.3098788261413574, mean loss: 0.3545892661425878
Epoch: 19, step: 1338, loss: 0.3196137845516205, mean loss: 0.35458805066103816
Epoch: 19, step: 1339, loss: 0.36073538661003113, mean loss: 0.3545882642882257
Epoch: 19, step: 1340, loss: 0.3397631049156189, mean loss: 0.3545877491143239
Epoch: 19, step: 1341, loss: 0.356336772441864, mean loss: 0.35458780989072697
Epoch: 19, step: 1342, loss: 0.3261762261390686, mean loss: 0.3545868226575447
Epoch: 19, step: 1343, loss: 0.34210434556007385, mean loss: 0.3545863889370062
Epoch: 19, step: 1344, loss: 0.3788527548313141, mean loss: 0.35458723207539244
Epoch: 19, step: 1345, loss: 0.3111913502216339, mean loss: 0.3545857243315993
Epoch: 19, step: 1346, loss: 0.3721567690372467, mean loss: 0.35458633479766277
Epoch: 19, step: 1347, loss: 0.35611578822135925, mean loss: 0.3545863879332042
Epoch: 19, step: 1348, loss: 0.33850404620170593, mean loss: 0.3545858292275682
Epoch: 19, step: 1349, loss: 0.3801288902759552, mean loss: 0.3545867165707575
Epoch: 19, step: 1350, loss: 0.34294477105140686, mean loss: 0.35458631215398884
Epoch: 19, step: 1351, loss: 0.3497214913368225, mean loss: 0.35458614316618775
Epoch: 19, step: 1352, loss: 0.3225984275341034, mean loss: 0.3545850320572353
Epoch: 19, step: 1353, loss: 0.302080899477005, mean loss: 0.3545832083638494
Epoch: 19, step: 1354, loss: 0.2976405620574951, mean loss: 0.35458123057057
Epoch: 19, step: 1355, loss: 0.3698734939098358, mean loss: 0.35458176169947175
Epoch: 19, step: 1356, loss: 0.34121695160865784, mean loss: 0.354581297530747
Epoch: 19, step: 1357, loss: 0.3331836760044098, mean loss: 0.35458055440295905
Epoch: 19, step: 1358, loss: 0.3140217959880829, mean loss: 0.354579145868199
Epoch: 19, step: 1359, loss: 0.3341812491416931, mean loss: 0.35457843750951284
Epoch: 19, step: 1360, loss: 0.3233240246772766, mean loss: 0.3545773521737893
Epoch: 19, step: 1361, loss: 0.36838069558143616, mean loss: 0.3545778314898323
Epoch: 19, step: 1362, loss: 0.3649144172668457, mean loss: 0.3545781904115232
Epoch: 19, step: 1363, loss: 0.35370320081710815, mean loss: 0.3545781600299401
Epoch: 19, step: 1364, loss: 0.30442747473716736, mean loss: 0.35457641874716195
Epoch: 19, step: 1365, loss: 0.40443021059036255, mean loss: 0.35457814966139856
Epoch: 19, step: 1366, loss: 0.3325251042842865, mean loss: 0.3545773840104116
Epoch: 19, step: 1367, loss: 0.3254692852497101, mean loss: 0.35457637345289317
Epoch: 19, step: 1368, loss: 0.40657904744148254, mean loss: 0.35457817878786935
Epoch: 19, step: 1369, loss: 0.3206069767475128, mean loss: 0.35457699947793253
Epoch: 19, step: 1370, loss: 0.33780860900878906, mean loss: 0.3545764173836336
Epoch: 19, step: 1371, loss: 0.34915101528167725, mean loss: 0.35457622905393
Epoch: 19, step: 1372, loss: 0.2992745041847229, mean loss: 0.3545743094550245
Epoch: 19, step: 1373, loss: 0.34155163168907166, mean loss: 0.35457385743566433
Epoch: 19, step: 1374, loss: 0.3328385055065155, mean loss: 0.3545731030240879
Epoch: 19, step: 1375, loss: 0.3340674638748169, mean loss: 0.3545723913192722
Epoch: 19, step: 1376, loss: 0.35064008831977844, mean loss: 0.35457225484257765
Epoch: 19, step: 1377, loss: 0.33169203996658325, mean loss: 0.3545714607766765
Epoch: 19, step: 1378, loss: 0.3001718819141388, mean loss: 0.354569572885687
Epoch: 19, step: 1379, loss: 0.36152684688568115, mean loss: 0.35456981432356877
Epoch: 19, step: 1380, loss: 0.34714698791503906, mean loss: 0.35456955673858737
Epoch: 19, step: 1381, loss: 0.32182982563972473, mean loss: 0.3545684206524225
Epoch: 19, step: 1382, loss: 0.3315132260322571, mean loss: 0.35456762065260916
Epoch: 19, step: 1383, loss: 0.3331138789653778, mean loss: 0.35456687624797045
Epoch: 19, step: 1384, loss: 0.3565767705440521, mean loss: 0.35456694598511684
Epoch: 19, step: 1385, loss: 0.30327528715133667, mean loss: 0.3545651663841581
Epoch: 19, step: 1386, loss: 0.3069929778575897, mean loss: 0.35456351589015933
Epoch: 19, step: 1387, loss: 0.33500245213508606, mean loss: 0.3545628372520884
Epoch: 19, step: 1388, loss: 0.32751575112342834, mean loss: 0.3545618989316677
Epoch: 19, step: 1389, loss: 0.3530789613723755, mean loss: 0.3545618474872231
Epoch: 19, step: 1390, loss: 0.2869024872779846, mean loss: 0.35455950040427275
Epoch: 19, step: 1391, loss: 0.3699095547199249, mean loss: 0.35456003287459037
Epoch: 19, step: 1392, loss: 0.3375629484653473, mean loss: 0.35455944329172556
Epoch: 19, step: 1393, loss: 0.3204442858695984, mean loss: 0.3545582599702749
Epoch: 19, step: 1394, loss: 0.36242806911468506, mean loss: 0.354558532933722
Epoch: 19, step: 1395, loss: 0.32561755180358887, mean loss: 0.35455752915385486
Epoch: 19, step: 1396, loss: 0.37182092666625977, mean loss: 0.35455812789132624
Epoch: 19, step: 1397, loss: 0.35806626081466675, mean loss: 0.3545582495578631
Epoch: 19, step: 1398, loss: 0.3167530298233032, mean loss: 0.3545569384699583
Epoch: 19, step: 1399, loss: 0.32742616534233093, mean loss: 0.3545559976053055
Epoch: 19, step: 1400, loss: 0.35615119338035583, mean loss: 0.3545560529229798
Epoch: 19, step: 1401, loss: 0.3239648640155792, mean loss: 0.3545549921285798
Epoch: 19, step: 1402, loss: 0.3493145704269409, mean loss: 0.3545548104155627
Epoch: 19, step: 1403, loss: 0.3186452090740204, mean loss: 0.35455356528375476
Epoch: 19, step: 1404, loss: 0.3271757662296295, mean loss: 0.35455261601711857
Epoch: 19, step: 1405, loss: 0.3473542034626007, mean loss: 0.35455236643621035
Epoch: 19, step: 1406, loss: 0.35301917791366577, mean loss: 0.35455231327986314
Epoch: 19, step: 1407, loss: 0.3461880683898926, mean loss: 0.3545520232977216
Epoch: 19, step: 1408, loss: 0.34009161591529846, mean loss: 0.35455152198354645
Epoch: 19, step: 1409, loss: 0.33211004734039307, mean loss: 0.3545507440082763
Epoch: 19, step: 1410, loss: 0.3584279716014862, mean loss: 0.35455087841489025
Epoch: 19, step: 1411, loss: 0.30632075667381287, mean loss: 0.35454920654433625
Epoch: 19, step: 1412, loss: 0.3265150487422943, mean loss: 0.3545482347894123
Epoch: 19, step: 1413, loss: 0.31373700499534607, mean loss: 0.3545468201887262
Epoch: 19, step: 1414, loss: 0.35102638602256775, mean loss: 0.354546698167508
Epoch: 19, step: 1415, loss: 0.3052314221858978, mean loss: 0.35454498891768194
Epoch: 19, step: 1416, loss: 0.3541208505630493, mean loss: 0.35454497421770775
Epoch: 19, step: 1417, loss: 0.38039934635162354, mean loss: 0.3545458702588852
Epoch: 19, step: 1418, loss: 0.35252636671066284, mean loss: 0.35454580027089183
Epoch: 19, step: 1419, loss: 0.37731122970581055, mean loss: 0.3545465892031567
Epoch: 19, step: 1420, loss: 0.34791475534439087, mean loss: 0.35454635938599416
Epoch: 19, step: 1421, loss: 0.3424530029296875, mean loss: 0.35454594032173276
Epoch: 19, step: 1422, loss: 0.3582114279270172, mean loss: 0.35454606733540633
Epoch: 19, step: 1423, loss: 0.3081705868244171, mean loss: 0.3545444604233997
Epoch: 19, step: 1424, loss: 0.31840062141418457, mean loss: 0.35454320808151935
Epoch: 19, step: 1425, loss: 0.35333696007728577, mean loss: 0.3545431662878805
Epoch: 19, step: 1426, loss: 0.3282639682292938, mean loss: 0.35454225580740173
Epoch: 19, step: 1427, loss: 0.2921465039253235, mean loss: 0.35454009409205106
Epoch: 19, step: 1428, loss: 0.35290437936782837, mean loss: 0.3545400374242969
Epoch: 19, step: 1429, loss: 0.34004440903663635, mean loss: 0.3545395352546722
Epoch: 19, step: 1430, loss: 0.37647056579589844, mean loss: 0.35454029498136846
Epoch: 19, step: 1431, loss: 0.3627201020717621, mean loss: 0.3545405783334223
Epoch: 19, step: 1432, loss: 0.329145610332489, mean loss: 0.35453969867122404
Epoch: 19, step: 1433, loss: 0.3113226890563965, mean loss: 0.3545382017190379
Epoch: 19, step: 1434, loss: 0.3675844371318817, mean loss: 0.35453865359931264
Epoch: 19, step: 1435, loss: 0.34014925360679626, mean loss: 0.3545381552133334
Epoch: 19, step: 1436, loss: 0.3231724500656128, mean loss: 0.35453706887990255
Epoch: 19, step: 1437, loss: 0.31344538927078247, mean loss: 0.3545356457421451
Epoch: 19, step: 1438, loss: 0.3293202817440033, mean loss: 0.3545347724827858
Epoch: 19, step: 1439, loss: 0.36904409527778625, mean loss: 0.3545352749527538
Epoch: 19, step: 1440, loss: 0.3051896393299103, mean loss: 0.3545335661313519
Epoch: 19, step: 1441, loss: 0.33541497588157654, mean loss: 0.35453290408445637
Epoch: 19, step: 1442, loss: 0.3351917564868927, mean loss: 0.3545322343539395
Epoch: 19, step: 1443, loss: 0.316965252161026, mean loss: 0.3545309335581572
Valid: 19, mean loss: 0.18793796251217523
Epoch: 20, step: 0, loss: 0.3435899615287781, mean loss: 0.3545305547287527
Epoch: 20, step: 1, loss: 0.3577321171760559, mean loss: 0.3545306655785016
Epoch: 20, step: 2, loss: 0.31109896302223206, mean loss: 0.35452916186688727
Epoch: 20, step: 3, loss: 0.3634766638278961, mean loss: 0.3545294716405322
Epoch: 20, step: 4, loss: 0.36068156361579895, mean loss: 0.3545296846262333
Epoch: 20, step: 5, loss: 0.30980443954467773, mean loss: 0.35452813628983915
Epoch: 20, step: 6, loss: 0.2923266887664795, mean loss: 0.3545259830220189
Epoch: 20, step: 7, loss: 0.3509353995323181, mean loss: 0.35452585872876596
Epoch: 20, step: 8, loss: 0.3470494747161865, mean loss: 0.35452559993185323
Epoch: 20, step: 9, loss: 0.30378907918930054, mean loss: 0.3545238437352197
Epoch: 20, step: 10, loss: 0.34163129329681396, mean loss: 0.35452339748723805
Epoch: 20, step: 11, loss: 0.33369317650794983, mean loss: 0.35452267651877
Epoch: 20, step: 12, loss: 0.3200417757034302, mean loss: 0.35452148311895637
Epoch: 20, step: 13, loss: 0.3495037853717804, mean loss: 0.3545213094601432
Epoch: 20, step: 14, loss: 0.32645946741104126, mean loss: 0.3545203382941266
Epoch: 20, step: 15, loss: 0.29154807329177856, mean loss: 0.35451815902138983
Epoch: 20, step: 16, loss: 0.3431991934776306, mean loss: 0.3545177673210215
Epoch: 20, step: 17, loss: 0.37790948152542114, mean loss: 0.35451857677891496
Epoch: 20, step: 18, loss: 0.3465724587440491, mean loss: 0.3545183018172196
Epoch: 20, step: 19, loss: 0.3229456841945648, mean loss: 0.3545172093391012
Epoch: 20, step: 20, loss: 0.3319651782512665, mean loss: 0.35451642901900543
Epoch: 20, step: 21, loss: 0.32909095287323, mean loss: 0.3545155493056241
Epoch: 20, step: 22, loss: 0.2927161753177643, mean loss: 0.35451341114093576
Epoch: 20, step: 23, loss: 0.3717803955078125, mean loss: 0.3545140085317594
Epoch: 20, step: 24, loss: 0.3032832741737366, mean loss: 0.3545122361486299
Epoch: 20, step: 25, loss: 0.3206127882003784, mean loss: 0.3545110634008285
Epoch: 20, step: 26, loss: 0.3197023570537567, mean loss: 0.3545098592389872
Epoch: 20, step: 27, loss: 0.31019023060798645, mean loss: 0.35450832611221844
Epoch: 20, step: 28, loss: 0.3371524512767792, mean loss: 0.3545077257498802
Epoch: 20, step: 29, loss: 0.32663068175315857, mean loss: 0.35450676147993915
Epoch: 20, step: 30, loss: 0.2996164560317993, mean loss: 0.35450486288406047
Epoch: 20, step: 31, loss: 0.3374882638454437, mean loss: 0.3545042743187921
Epoch: 20, step: 32, loss: 0.4174899160861969, mean loss: 0.3545064527728359
Epoch: 20, step: 33, loss: 0.341070294380188, mean loss: 0.35450598807897155
Epoch: 20, step: 34, loss: 0.3208639919757843, mean loss: 0.35450482459994326
Epoch: 20, step: 35, loss: 0.37375152111053467, mean loss: 0.3545054902070988
Epoch: 20, step: 36, loss: 0.3372950255870819, mean loss: 0.35450489503939053
Epoch: 20, step: 37, loss: 0.3279511034488678, mean loss: 0.35450397679498946
Epoch: 20, step: 38, loss: 0.33615851402282715, mean loss: 0.3545033424209526
Epoch: 20, step: 39, loss: 0.34751060605049133, mean loss: 0.35450310062508916
Epoch: 20, step: 40, loss: 0.3932689130306244, mean loss: 0.35450444102868534
Epoch: 20, step: 41, loss: 0.35433685779571533, mean loss: 0.3545044352343685
Epoch: 20, step: 42, loss: 0.33735036849975586, mean loss: 0.35450384214005826
Epoch: 20, step: 43, loss: 0.34417596459388733, mean loss: 0.3545034850705815
Epoch: 20, step: 44, loss: 0.33019959926605225, mean loss: 0.3545026448325243
Epoch: 20, step: 45, loss: 0.361795574426651, mean loss: 0.35450289695620524
Epoch: 20, step: 46, loss: 0.31838086247444153, mean loss: 0.3545016482254526
Epoch: 20, step: 47, loss: 0.3142542839050293, mean loss: 0.35450025693105547
Epoch: 20, step: 48, loss: 0.37762999534606934, mean loss: 0.3545010564657236
Epoch: 20, step: 49, loss: 0.32858753204345703, mean loss: 0.3545001607338044
Epoch: 20, step: 50, loss: 0.3297724425792694, mean loss: 0.3544993060202392
Epoch: 20, step: 51, loss: 0.3622157573699951, mean loss: 0.3544995727301573
Epoch: 20, step: 52, loss: 0.29417890310287476, mean loss: 0.3544974878903679
Epoch: 20, step: 53, loss: 0.35176295042037964, mean loss: 0.3544973933808818
Epoch: 20, step: 54, loss: 0.34823185205459595, mean loss: 0.35449717684238774
Epoch: 20, step: 55, loss: 0.33558183908462524, mean loss: 0.3544965231467229
Epoch: 20, step: 56, loss: 0.3286934196949005, mean loss: 0.354495631447395
Epoch: 20, step: 57, loss: 0.31159836053848267, mean loss: 0.35449414906191884
Epoch: 20, step: 58, loss: 0.3620026111602783, mean loss: 0.354494408520162
Epoch: 20, step: 59, loss: 0.3425563871860504, mean loss: 0.35449399601078624
Epoch: 20, step: 60, loss: 0.31966516375541687, mean loss: 0.35449279256818733
Epoch: 20, step: 61, loss: 0.33419084548950195, mean loss: 0.35449209109810653
Epoch: 20, step: 62, loss: 0.328179270029068, mean loss: 0.35449118197254703
Epoch: 20, step: 63, loss: 0.30594518780708313, mean loss: 0.35448950473394264
Epoch: 20, step: 64, loss: 0.33689379692077637, mean loss: 0.3544888968324808
Epoch: 20, step: 65, loss: 0.342966228723526, mean loss: 0.3544884987578553
Epoch: 20, step: 66, loss: 0.33897629380226135, mean loss: 0.3544879628748638
Epoch: 20, step: 67, loss: 0.30353844165802, mean loss: 0.35448620283889526
Epoch: 20, step: 68, loss: 0.3506256341934204, mean loss: 0.3544860694813131
Epoch: 20, step: 69, loss: 0.3817726671695709, mean loss: 0.3544870120235476
Epoch: 20, step: 70, loss: 0.30988675355911255, mean loss: 0.3544854714806142
Epoch: 20, step: 71, loss: 0.3442915081977844, mean loss: 0.3544851193818548
Epoch: 20, step: 72, loss: 0.3279324173927307, mean loss: 0.3544842022851122
Epoch: 20, step: 73, loss: 0.378744900226593, mean loss: 0.35448504018999377
Epoch: 20, step: 74, loss: 0.32883432507514954, mean loss: 0.35448415430793145
Epoch: 20, step: 75, loss: 0.2976272702217102, mean loss: 0.354482190746525
Epoch: 20, step: 76, loss: 0.287243127822876, mean loss: 0.35447986871513626
Epoch: 20, step: 77, loss: 0.36598411202430725, mean loss: 0.3544802659885429
Epoch: 20, step: 78, loss: 0.3291979432106018, mean loss: 0.3544793929500133
Epoch: 20, step: 79, loss: 0.3344558775424957, mean loss: 0.3544787015302824
Epoch: 20, step: 80, loss: 0.36029648780822754, mean loss: 0.35447890241375596
Epoch: 20, step: 81, loss: 0.34917470812797546, mean loss: 0.35447871927052393
Epoch: 20, step: 82, loss: 0.2930396795272827, mean loss: 0.35447659797646797
Epoch: 20, step: 83, loss: 0.3521323800086975, mean loss: 0.3544765170408939
Epoch: 20, step: 84, loss: 0.37347811460494995, mean loss: 0.3544771730601435
Epoch: 20, step: 85, loss: 0.31314074993133545, mean loss: 0.3544757459931294
Epoch: 20, step: 86, loss: 0.3469991385936737, mean loss: 0.3544754878853723
Epoch: 20, step: 87, loss: 0.32244014739990234, mean loss: 0.35447438199816966
Epoch: 20, step: 88, loss: 0.32145896553993225, mean loss: 0.3544732423172536
Epoch: 20, step: 89, loss: 0.3344511091709137, mean loss: 0.3544725511839037
Epoch: 20, step: 90, loss: 0.340374231338501, mean loss: 0.35447206454830793
Epoch: 20, step: 91, loss: 0.3423650562763214, mean loss: 0.35447164666178743
Epoch: 20, step: 92, loss: 0.3492228090763092, mean loss: 0.3544714654987189
Epoch: 20, step: 93, loss: 0.30449584126472473, mean loss: 0.3544697406549198
Epoch: 20, step: 94, loss: 0.29171571135520935, mean loss: 0.3544675748558068
Epoch: 20, step: 95, loss: 0.3525059223175049, mean loss: 0.3544675071565889
Epoch: 20, step: 96, loss: 0.3138332962989807, mean loss: 0.35446610486474167
Epoch: 20, step: 97, loss: 0.34072139859199524, mean loss: 0.3544656305495276
Epoch: 20, step: 98, loss: 0.3276163935661316, mean loss: 0.35446470404285096
Epoch: 20, step: 99, loss: 0.31784942746162415, mean loss: 0.3544634405757502
Epoch: 20, step: 100, loss: 0.32230040431022644, mean loss: 0.35446233077842554
Epoch: 20, step: 101, loss: 0.31929856538772583, mean loss: 0.35446111748171066
Epoch: 20, step: 102, loss: 0.32931068539619446, mean loss: 0.35446024971674206
Epoch: 20, step: 103, loss: 0.32611000537872314, mean loss: 0.35445927158244944
Epoch: 20, step: 104, loss: 0.37348657846450806, mean loss: 0.35445992803602483
Epoch: 20, step: 105, loss: 0.3360053598880768, mean loss: 0.35445929136424714
Epoch: 20, step: 106, loss: 0.3721810281276703, mean loss: 0.35445990273268
Epoch: 20, step: 107, loss: 0.33931243419647217, mean loss: 0.3544593801899542
Epoch: 20, step: 108, loss: 0.4414351284503937, mean loss: 0.35446238049173284
Epoch: 20, step: 109, loss: 0.31315696239471436, mean loss: 0.354460955675655
Epoch: 20, step: 110, loss: 0.34771716594696045, mean loss: 0.35446072305899023
Epoch: 20, step: 111, loss: 0.3393484055995941, mean loss: 0.35446020180079973
Epoch: 20, step: 112, loss: 0.310332715511322, mean loss: 0.354458679795961
Epoch: 20, step: 113, loss: 0.3640572726726532, mean loss: 0.3544590108504163
Epoch: 20, step: 114, loss: 0.4066048264503479, mean loss: 0.35446080929206486
Epoch: 20, step: 115, loss: 0.3445603847503662, mean loss: 0.3544604678510198
Epoch: 20, step: 116, loss: 0.2946249544620514, mean loss: 0.35445840434398845
Epoch: 20, step: 117, loss: 0.4066062569618225, mean loss: 0.3544602026698253
Epoch: 20, step: 118, loss: 0.33537715673446655, mean loss: 0.3544595446110669
Epoch: 20, step: 119, loss: 0.3168927729129791, mean loss: 0.35445824920514624
Epoch: 20, step: 120, loss: 0.35538703203201294, mean loss: 0.3544582812310359
Epoch: 20, step: 121, loss: 0.33419671654701233, mean loss: 0.3544575826045728
Epoch: 20, step: 122, loss: 0.395832896232605, mean loss: 0.35445900919194745
Epoch: 20, step: 123, loss: 0.32665178179740906, mean loss: 0.354458050454277
Epoch: 20, step: 124, loss: 0.3472108542919159, mean loss: 0.35445780059404036
Epoch: 20, step: 125, loss: 0.294497013092041, mean loss: 0.35445573340837183
Epoch: 20, step: 126, loss: 0.31858205795288086, mean loss: 0.3544544966836
Epoch: 20, step: 127, loss: 0.34775838255882263, mean loss: 0.35445426584679207
Epoch: 20, step: 128, loss: 0.31501248478889465, mean loss: 0.35445290620733333
Epoch: 20, step: 129, loss: 0.37851107120513916, mean loss: 0.35445373551326226
Epoch: 20, step: 130, loss: 0.31635040044784546, mean loss: 0.35445242210334654
Epoch: 20, step: 131, loss: 0.329898476600647, mean loss: 0.35445157576577924
Epoch: 20, step: 132, loss: 0.3095126450061798, mean loss: 0.3544500268418224
Epoch: 20, step: 133, loss: 0.3157677948474884, mean loss: 0.35444869361538023
Epoch: 20, step: 134, loss: 0.34336206316947937, mean loss: 0.35444831151541656
Epoch: 20, step: 135, loss: 0.3550854027271271, mean loss: 0.3544483334719651
Epoch: 20, step: 136, loss: 0.311006098985672, mean loss: 0.35444683634150753
Epoch: 20, step: 137, loss: 0.34476417303085327, mean loss: 0.35444650266367617
Epoch: 20, step: 138, loss: 0.35578128695487976, mean loss: 0.3544465486605848
Epoch: 20, step: 139, loss: 0.2949574291706085, mean loss: 0.35444449872538525
Epoch: 20, step: 140, loss: 0.32363250851631165, mean loss: 0.3544434370117913
Epoch: 20, step: 141, loss: 0.31352782249450684, mean loss: 0.35444202719804596
Epoch: 20, step: 142, loss: 0.3338182270526886, mean loss: 0.35444131659610456
Epoch: 20, step: 143, loss: 0.3479379117488861, mean loss: 0.35444109252620215
Epoch: 20, step: 144, loss: 0.34150123596191406, mean loss: 0.3544406467085772
Epoch: 20, step: 145, loss: 0.35399001836776733, mean loss: 0.3544406311835879
Epoch: 20, step: 146, loss: 0.33649972081184387, mean loss: 0.3544400131069567
Epoch: 20, step: 147, loss: 0.3342515230178833, mean loss: 0.3544393176236272
Epoch: 20, step: 148, loss: 0.39046984910964966, mean loss: 0.35444055881455644
Epoch: 20, step: 149, loss: 0.3416285216808319, mean loss: 0.3544401174767289
Epoch: 20, step: 150, loss: 0.350935161113739, mean loss: 0.3544399967452225
Epoch: 20, step: 151, loss: 0.33979785442352295, mean loss: 0.35443949240028166
Epoch: 20, step: 152, loss: 0.3232826590538025, mean loss: 0.3544384192478914
Epoch: 20, step: 153, loss: 0.34282195568084717, mean loss: 0.3544380191492633
Epoch: 20, step: 154, loss: 0.31044185161590576, mean loss: 0.35443650386882475
Epoch: 20, step: 155, loss: 0.341982901096344, mean loss: 0.3544360749666766
Epoch: 20, step: 156, loss: 0.35692107677459717, mean loss: 0.35443616054720517
Epoch: 20, step: 157, loss: 0.35026344656944275, mean loss: 0.3544360168488107
Epoch: 20, step: 158, loss: 0.3153758645057678, mean loss: 0.3544346717559238
Epoch: 20, step: 159, loss: 0.3350493013858795, mean loss: 0.3544340042156218
Epoch: 20, step: 160, loss: 0.3429083526134491, mean loss: 0.35443360734045903
Epoch: 20, step: 161, loss: 0.32774588465690613, mean loss: 0.3544326884050316
Epoch: 20, step: 162, loss: 0.33463501930236816, mean loss: 0.35443200673753505
Epoch: 20, step: 163, loss: 0.3168346881866455, mean loss: 0.35443071224233635
Epoch: 20, step: 164, loss: 0.38622593879699707, mean loss: 0.3544318069308044
Epoch: 20, step: 165, loss: 0.3032057583332062, mean loss: 0.35443004331279854
Epoch: 20, step: 166, loss: 0.31604018807411194, mean loss: 0.35442872166666506
Epoch: 20, step: 167, loss: 0.29501479864120483, mean loss: 0.35442667629613955
Epoch: 20, step: 168, loss: 0.34934893250465393, mean loss: 0.35442650149687654
Epoch: 20, step: 169, loss: 0.31809931993484497, mean loss: 0.35442525099148714
Epoch: 20, step: 170, loss: 0.3372904360294342, mean loss: 0.35442466117306565
Epoch: 20, step: 171, loss: 0.3397704064846039, mean loss: 0.3544241567584061
Epoch: 20, step: 172, loss: 0.2892972230911255, mean loss: 0.35442191509889875
Epoch: 20, step: 173, loss: 0.41916051506996155, mean loss: 0.35442414331532235
Epoch: 20, step: 174, loss: 0.3165130317211151, mean loss: 0.35442283851024253
Epoch: 20, step: 175, loss: 0.3970699608325958, mean loss: 0.3544243062663797
Epoch: 20, step: 176, loss: 0.3317873477935791, mean loss: 0.3544235272128479
Epoch: 20, step: 177, loss: 0.352905809879303, mean loss: 0.3544234749822287
Epoch: 20, step: 178, loss: 0.32860812544822693, mean loss: 0.35442258660514986
Epoch: 20, step: 179, loss: 0.352510541677475, mean loss: 0.35442252080869674
Epoch: 20, step: 180, loss: 0.2868303060531616, mean loss: 0.35442019493502563
Epoch: 20, step: 181, loss: 0.3883359134197235, mean loss: 0.35442136194756724
Epoch: 20, step: 182, loss: 0.340347021818161, mean loss: 0.3544208776775287
Epoch: 20, step: 183, loss: 0.3653549551963806, mean loss: 0.3544212538844348
Epoch: 20, step: 184, loss: 0.331022709608078, mean loss: 0.3544204488424848
Epoch: 20, step: 185, loss: 0.31966760754585266, mean loss: 0.3544192531897876
Epoch: 20, step: 186, loss: 0.31196871399879456, mean loss: 0.3544177927522058
Epoch: 20, step: 187, loss: 0.3259349465370178, mean loss: 0.3544168128827199
Epoch: 20, step: 188, loss: 0.3406183123588562, mean loss: 0.3544163382017703
Epoch: 20, step: 189, loss: 0.34224316477775574, mean loss: 0.3544159194479546
Epoch: 20, step: 190, loss: 0.334816038608551, mean loss: 0.3544152452406401
Epoch: 20, step: 191, loss: 0.3567957282066345, mean loss: 0.3544153271229656
Epoch: 20, step: 192, loss: 0.33327576518058777, mean loss: 0.35441460000289055
Epoch: 20, step: 193, loss: 0.3756626844406128, mean loss: 0.3544153308305867
Epoch: 20, step: 194, loss: 0.3021939694881439, mean loss: 0.35441353473905296
Epoch: 20, step: 195, loss: 0.34353896975517273, mean loss: 0.35441316073420415
Epoch: 20, step: 196, loss: 0.348410040140152, mean loss: 0.35441295427822195
Epoch: 20, step: 197, loss: 0.3585507869720459, mean loss: 0.3544130965793669
Epoch: 20, step: 198, loss: 0.31469252705574036, mean loss: 0.3544117306256022
Epoch: 20, step: 199, loss: 0.3604303300380707, mean loss: 0.3544119375925696
Epoch: 20, step: 200, loss: 0.3067066967487335, mean loss: 0.35441029716614536
Epoch: 20, step: 201, loss: 0.3336259126663208, mean loss: 0.3544095824840568
Epoch: 20, step: 202, loss: 0.3283761441707611, mean loss: 0.3544086873412478
Epoch: 20, step: 203, loss: 0.30814576148986816, mean loss: 0.3544070966753885
Epoch: 20, step: 204, loss: 0.3421619236469269, mean loss: 0.3544066756620473
Epoch: 20, step: 205, loss: 0.3134177625179291, mean loss: 0.35440526643035014
Epoch: 20, step: 206, loss: 0.32330843806266785, mean loss: 0.3544041973332151
Epoch: 20, step: 207, loss: 0.3076636493206024, mean loss: 0.35440259046619044
Epoch: 20, step: 208, loss: 0.32827654480934143, mean loss: 0.3544016923244304
Epoch: 20, step: 209, loss: 0.31210166215896606, mean loss: 0.3544002382154526
Epoch: 20, step: 210, loss: 0.363453209400177, mean loss: 0.3544005494103646
Epoch: 20, step: 211, loss: 0.35322514176368713, mean loss: 0.35440050900724185
Epoch: 20, step: 212, loss: 0.3505761921405792, mean loss: 0.3544003775557976
Epoch: 20, step: 213, loss: 0.30922630429267883, mean loss: 0.3543988248620029
Epoch: 20, step: 214, loss: 0.3576968014240265, mean loss: 0.3543989382140071
Epoch: 20, step: 215, loss: 0.3609298765659332, mean loss: 0.3543991626757321
Epoch: 20, step: 216, loss: 0.3305968940258026, mean loss: 0.3543983446440227
Epoch: 20, step: 217, loss: 0.3987812101840973, mean loss: 0.3543998699332364
Epoch: 20, step: 218, loss: 0.34948205947875977, mean loss: 0.35439970093050593
Epoch: 20, step: 219, loss: 0.3578155040740967, mean loss: 0.35439981831205725
Epoch: 20, step: 220, loss: 0.3483023941516876, mean loss: 0.35439960878578114
Epoch: 20, step: 221, loss: 0.3315570056438446, mean loss: 0.35439882387054705
Epoch: 20, step: 222, loss: 0.3566284477710724, mean loss: 0.354398900482027
Epoch: 20, step: 223, loss: 0.2971304655075073, mean loss: 0.35439693276504736
Epoch: 20, step: 224, loss: 0.3174651265144348, mean loss: 0.3543956638488388
Epoch: 20, step: 225, loss: 0.330220490694046, mean loss: 0.35439483325813054
Epoch: 20, step: 226, loss: 0.33725622296333313, mean loss: 0.3543942444440894
Epoch: 20, step: 227, loss: 0.2824952006340027, mean loss: 0.3543917743656295
Epoch: 20, step: 228, loss: 0.3179107904434204, mean loss: 0.3543905211111748
Epoch: 20, step: 229, loss: 0.32638683915138245, mean loss: 0.35438955911591685
Epoch: 20, step: 230, loss: 0.3101654648780823, mean loss: 0.3543880399618432
Epoch: 20, step: 231, loss: 0.3503270447254181, mean loss: 0.3543879004662662
Epoch: 20, step: 232, loss: 0.34935057163238525, mean loss: 0.35438772743947977
Epoch: 20, step: 233, loss: 0.306184858083725, mean loss: 0.35438607178002535
Epoch: 20, step: 234, loss: 0.32129478454589844, mean loss: 0.35438493520825015
Epoch: 20, step: 235, loss: 0.3295027017593384, mean loss: 0.35438408061855897
Epoch: 20, step: 236, loss: 0.32252874970436096, mean loss: 0.3543829865727811
Epoch: 20, step: 237, loss: 0.3366275429725647, mean loss: 0.3543823767972608
Epoch: 20, step: 238, loss: 0.33588600158691406, mean loss: 0.3543817415977275
Epoch: 20, step: 239, loss: 0.306275874376297, mean loss: 0.35438008961052897
Epoch: 20, step: 240, loss: 0.33780577778816223, mean loss: 0.354379520457278
Epoch: 20, step: 241, loss: 0.3505372405052185, mean loss: 0.3543793885199127
Epoch: 20, step: 242, loss: 0.3238573968410492, mean loss: 0.35437834048256495
Epoch: 20, step: 243, loss: 0.3497661054134369, mean loss: 0.35437818211712513
Epoch: 20, step: 244, loss: 0.33396315574645996, mean loss: 0.3543774811720137
Epoch: 20, step: 245, loss: 0.35929495096206665, mean loss: 0.3543776500063813
Epoch: 20, step: 246, loss: 0.3429184854030609, mean loss: 0.3543772565856856
Epoch: 20, step: 247, loss: 0.3188302516937256, mean loss: 0.3543760362133671
Epoch: 20, step: 248, loss: 0.3398914635181427, mean loss: 0.3543755389572754
Epoch: 20, step: 249, loss: 0.33742836117744446, mean loss: 0.3543749571798027
Epoch: 20, step: 250, loss: 0.3432053327560425, mean loss: 0.3543745737523741
Epoch: 20, step: 251, loss: 0.35037872195243835, mean loss: 0.35437443658871215
Epoch: 20, step: 252, loss: 0.3252604603767395, mean loss: 0.35437343724171005
Epoch: 20, step: 253, loss: 0.33529359102249146, mean loss: 0.3543727823420664
Epoch: 20, step: 254, loss: 0.3521978259086609, mean loss: 0.35437270769108187
Epoch: 20, step: 255, loss: 0.3741181194782257, mean loss: 0.35437338538918
Epoch: 20, step: 256, loss: 0.36836251616477966, mean loss: 0.3543738655048671
Epoch: 20, step: 257, loss: 0.3549697697162628, mean loss: 0.35437388595596914
Epoch: 20, step: 258, loss: 0.32405808568000793, mean loss: 0.35437284557022236
Epoch: 20, step: 259, loss: 0.35258930921554565, mean loss: 0.3543727843644449
Epoch: 20, step: 260, loss: 0.2915504574775696, mean loss: 0.3543706285589857
Epoch: 20, step: 261, loss: 0.31665369868278503, mean loss: 0.35436933431254153
Epoch: 20, step: 262, loss: 0.33537137508392334, mean loss: 0.3543686824249792
Epoch: 20, step: 263, loss: 0.3906659483909607, mean loss: 0.3543699278705586
Epoch: 20, step: 264, loss: 0.3450285494327545, mean loss: 0.35436960735663037
Epoch: 20, step: 265, loss: 0.33599504828453064, mean loss: 0.3543689769250421
Epoch: 20, step: 266, loss: 0.3240188956260681, mean loss: 0.3543679356487084
Epoch: 20, step: 267, loss: 0.34136173129081726, mean loss: 0.3543674894361258
Epoch: 20, step: 268, loss: 0.3551718592643738, mean loss: 0.35436751703123465
Epoch: 20, step: 269, loss: 0.33888500928878784, mean loss: 0.3543669858988936
Epoch: 20, step: 270, loss: 0.34895816445350647, mean loss: 0.35436680035392276
Epoch: 20, step: 271, loss: 0.33854013681411743, mean loss: 0.35436625745245665
Epoch: 20, step: 272, loss: 0.34184423089027405, mean loss: 0.35436582792456717
Epoch: 20, step: 273, loss: 0.3056226372718811, mean loss: 0.35436415600336757
Epoch: 20, step: 274, loss: 0.3191206157207489, mean loss: 0.35436294716988165
Epoch: 20, step: 275, loss: 0.33991092443466187, mean loss: 0.35436245149068235
Epoch: 20, step: 276, loss: 0.32227009534835815, mean loss: 0.354361350816534
Epoch: 20, step: 277, loss: 0.3390960693359375, mean loss: 0.3543608272798895
Epoch: 20, step: 278, loss: 0.35416823625564575, mean loss: 0.35436082067503255
Epoch: 20, step: 279, loss: 0.3601168990135193, mean loss: 0.354361018071409
Epoch: 20, step: 280, loss: 0.3566240966320038, mean loss: 0.35436109567775176
Epoch: 20, step: 281, loss: 0.2888857424259186, mean loss: 0.35435885044926085
Epoch: 20, step: 282, loss: 0.35018599033355713, mean loss: 0.35435870736178304
Epoch: 20, step: 283, loss: 0.367061585187912, mean loss: 0.35435914292884607
Epoch: 20, step: 284, loss: 0.29957154393196106, mean loss: 0.35435726438953535
Epoch: 20, step: 285, loss: 0.2896696925163269, mean loss: 0.35435504647923316
Epoch: 20, step: 286, loss: 0.34049397706985474, mean loss: 0.3543545712479989
Epoch: 20, step: 287, loss: 0.31396961212158203, mean loss: 0.3543531866841232
Epoch: 20, step: 288, loss: 0.3840039372444153, mean loss: 0.35435420319996397
Epoch: 20, step: 289, loss: 0.36760851740837097, mean loss: 0.3543546575816646
Epoch: 20, step: 290, loss: 0.35413414239883423, mean loss: 0.3543546500222672
Epoch: 20, step: 291, loss: 0.3164593279361725, mean loss: 0.3543533509916184
Epoch: 20, step: 292, loss: 0.34243714809417725, mean loss: 0.35435294252478616
Epoch: 20, step: 293, loss: 0.3024705648422241, mean loss: 0.3543511641475433
Epoch: 20, step: 294, loss: 0.28614678978919983, mean loss: 0.35434882637978465
Epoch: 20, step: 295, loss: 0.3022364675998688, mean loss: 0.3543470402419049
Epoch: 20, step: 296, loss: 0.36732664704322815, mean loss: 0.35434748509938857
Epoch: 20, step: 297, loss: 0.32501721382141113, mean loss: 0.3543464798806869
Epoch: 20, step: 298, loss: 0.3699594736099243, mean loss: 0.35434701495706816
Epoch: 20, step: 299, loss: 0.3154617249965668, mean loss: 0.3543456823563156
Epoch: 20, step: 300, loss: 0.3206107020378113, mean loss: 0.35434452629653973
Epoch: 20, step: 301, loss: 0.32659995555877686, mean loss: 0.3543435755539334
Epoch: 20, step: 302, loss: 0.3339516520500183, mean loss: 0.35434287679357623
Epoch: 20, step: 303, loss: 0.3521531820297241, mean loss: 0.3543428017629168
Epoch: 20, step: 304, loss: 0.32279300689697266, mean loss: 0.35434172073516745
Epoch: 20, step: 305, loss: 0.33632296323776245, mean loss: 0.3543411033584287
Epoch: 20, step: 306, loss: 0.3494234085083008, mean loss: 0.3543409348692092
Epoch: 20, step: 307, loss: 0.37295985221862793, mean loss: 0.35434157276551415
Epoch: 20, step: 308, loss: 0.3069894015789032, mean loss: 0.3543399505046903
Epoch: 20, step: 309, loss: 0.36134305596351624, mean loss: 0.35434019041923154
Epoch: 20, step: 310, loss: 0.34480562806129456, mean loss: 0.35433986379245075
Epoch: 20, step: 311, loss: 0.33534249663352966, mean loss: 0.35433921301939103
Epoch: 20, step: 312, loss: 0.31920284032821655, mean loss: 0.3543380094304248
Epoch: 20, step: 313, loss: 0.32944056391716003, mean loss: 0.3543371566029427
Epoch: 20, step: 314, loss: 0.3565441370010376, mean loss: 0.3543372321974074
Epoch: 20, step: 315, loss: 0.3350078761577606, mean loss: 0.35433657014246706
Epoch: 20, step: 316, loss: 0.29787003993988037, mean loss: 0.35433463615848915
Epoch: 20, step: 317, loss: 0.33179163932800293, mean loss: 0.35433386408516804
Epoch: 20, step: 318, loss: 0.3867339789867401, mean loss: 0.3543349737161452
Epoch: 20, step: 319, loss: 0.3623295724391937, mean loss: 0.3543352475037727
Epoch: 20, step: 320, loss: 0.38051387667655945, mean loss: 0.35433614400146707
Epoch: 20, step: 321, loss: 0.3446260988712311, mean loss: 0.3543358114884498
Epoch: 20, step: 322, loss: 0.30843889713287354, mean loss: 0.3543342398377853
Epoch: 20, step: 323, loss: 0.30810546875, mean loss: 0.3543326568775371
Epoch: 20, step: 324, loss: 0.3706200122833252, mean loss: 0.35433321456818617
Epoch: 20, step: 325, loss: 0.3441564738750458, mean loss: 0.35433286612126796
Epoch: 20, step: 326, loss: 0.36232131719589233, mean loss: 0.3543331396327917
Epoch: 20, step: 327, loss: 0.37194883823394775, mean loss: 0.35433374274490487
Epoch: 20, step: 328, loss: 0.3143914043903351, mean loss: 0.35433237527808453
Epoch: 20, step: 329, loss: 0.33630186319351196, mean loss: 0.35433175800618844
Epoch: 20, step: 330, loss: 0.34228065609931946, mean loss: 0.354331345452633
Epoch: 20, step: 331, loss: 0.35613399744033813, mean loss: 0.3543314071619301
Epoch: 20, step: 332, loss: 0.2944430112838745, mean loss: 0.3543293571021664
Epoch: 20, step: 333, loss: 0.308731347322464, mean loss: 0.3543277962748309
Epoch: 20, step: 334, loss: 0.3156745135784149, mean loss: 0.3543264732119284
Epoch: 20, step: 335, loss: 0.3516279458999634, mean loss: 0.3543263808472203
Epoch: 20, step: 336, loss: 0.3057190179824829, mean loss: 0.3543247171800791
Epoch: 20, step: 337, loss: 0.31097540259361267, mean loss: 0.3543232335290904
Epoch: 20, step: 338, loss: 0.3305438458919525, mean loss: 0.354322419696049
Epoch: 20, step: 339, loss: 0.31842443346977234, mean loss: 0.3543211911544259
Epoch: 20, step: 340, loss: 0.3543514311313629, mean loss: 0.3543211921892973
Epoch: 20, step: 341, loss: 0.28663498163223267, mean loss: 0.3543188759135271
Epoch: 20, step: 342, loss: 0.3435441255569458, mean loss: 0.35431850720564784
Epoch: 20, step: 343, loss: 0.3566434383392334, mean loss: 0.35431858676118894
Epoch: 20, step: 344, loss: 0.3572913408279419, mean loss: 0.3543186884807464
Epoch: 20, step: 345, loss: 0.31468063592910767, mean loss: 0.35431733222082196
Epoch: 20, step: 346, loss: 0.32025694847106934, mean loss: 0.3543161668468955
Epoch: 20, step: 347, loss: 0.35244622826576233, mean loss: 0.3543161028692514
Epoch: 20, step: 348, loss: 0.31616130471229553, mean loss: 0.35431479749451544
Epoch: 20, step: 349, loss: 0.33031514286994934, mean loss: 0.35431397643209245
Epoch: 20, step: 350, loss: 0.3750833570957184, mean loss: 0.3543146869579268
Epoch: 20, step: 351, loss: 0.3623611330986023, mean loss: 0.35431496221949427
Epoch: 20, step: 352, loss: 0.36858639121055603, mean loss: 0.3543154504153343
Epoch: 20, step: 353, loss: 0.3469824492931366, mean loss: 0.3543151995772306
Epoch: 20, step: 354, loss: 0.3667699992656708, mean loss: 0.3543156256008218
Epoch: 20, step: 355, loss: 0.33927738666534424, mean loss: 0.3543151112267988
Epoch: 20, step: 356, loss: 0.35634562373161316, mean loss: 0.35431518067689644
Epoch: 20, step: 357, loss: 0.32138723134994507, mean loss: 0.35431405447300673
Epoch: 20, step: 358, loss: 0.3567107319831848, mean loss: 0.35431413644152515
Epoch: 20, step: 359, loss: 0.37276920676231384, mean loss: 0.35431476759988084
Epoch: 20, step: 360, loss: 0.33543115854263306, mean loss: 0.3543141218077035
Epoch: 20, step: 361, loss: 0.3279518783092499, mean loss: 0.35431322028785195
Epoch: 20, step: 362, loss: 0.33146512508392334, mean loss: 0.3543124389694098
Epoch: 20, step: 363, loss: 0.3193499445915222, mean loss: 0.35431124342521686
Epoch: 20, step: 364, loss: 0.32153618335723877, mean loss: 0.354310122718769
Epoch: 20, step: 365, loss: 0.31781673431396484, mean loss: 0.35430887491091817
Epoch: 20, step: 366, loss: 0.3293988108634949, mean loss: 0.35430802319744165
Epoch: 20, step: 367, loss: 0.373288094997406, mean loss: 0.3543086721331569
Epoch: 20, step: 368, loss: 0.3270929753780365, mean loss: 0.3543077416501744
Epoch: 20, step: 369, loss: 0.33775025606155396, mean loss: 0.3543071755822911
Epoch: 20, step: 370, loss: 0.307778537273407, mean loss: 0.35430558491399566
Epoch: 20, step: 371, loss: 0.36472591757774353, mean loss: 0.35430594114032765
Epoch: 20, step: 372, loss: 0.34531307220458984, mean loss: 0.354305633723347
Epoch: 20, step: 373, loss: 0.3769550025463104, mean loss: 0.35430640795486484
Epoch: 20, step: 374, loss: 0.3117474615573883, mean loss: 0.354304953196827
Epoch: 20, step: 375, loss: 0.3517816662788391, mean loss: 0.35430486694829955
Epoch: 20, step: 376, loss: 0.33154383301734924, mean loss: 0.3543040889794739
Epoch: 20, step: 377, loss: 0.3202556371688843, mean loss: 0.35430292524812484
Epoch: 20, step: 378, loss: 0.3098236918449402, mean loss: 0.3543014050583233
Epoch: 20, step: 379, loss: 0.3207489550113678, mean loss: 0.3543002583580483
Epoch: 20, step: 380, loss: 0.3227851092815399, mean loss: 0.35429918132209337
Epoch: 20, step: 381, loss: 0.33157432079315186, mean loss: 0.3542984047223897
Epoch: 20, step: 382, loss: 0.34331831336021423, mean loss: 0.3542980295014157
Epoch: 20, step: 383, loss: 0.3275950253009796, mean loss: 0.3542971170149408
Epoch: 20, step: 384, loss: 0.315858393907547, mean loss: 0.35429580354413587
Epoch: 20, step: 385, loss: 0.3092886805534363, mean loss: 0.35429426568030103
Epoch: 20, step: 386, loss: 0.3176570534706116, mean loss: 0.35429301385359485
Epoch: 20, step: 387, loss: 0.3249317705631256, mean loss: 0.35429201066775057
Epoch: 20, step: 388, loss: 0.3360338509082794, mean loss: 0.35429138686236744
Epoch: 20, step: 389, loss: 0.3567446172237396, mean loss: 0.35429147067618233
Epoch: 20, step: 390, loss: 0.31426766514778137, mean loss: 0.3542901033226403
Epoch: 20, step: 391, loss: 0.35274145007133484, mean loss: 0.3542900504170223
Epoch: 20, step: 392, loss: 0.2943711578845978, mean loss: 0.35428800351740375
Epoch: 20, step: 393, loss: 0.32498112320899963, mean loss: 0.35428700239421224
Epoch: 20, step: 394, loss: 0.33362966775894165, mean loss: 0.35428629676365253
Epoch: 20, step: 395, loss: 0.3567163646221161, mean loss: 0.3542863797691129
Epoch: 20, step: 396, loss: 0.31904932856559753, mean loss: 0.35428517619459354
Epoch: 20, step: 397, loss: 0.3132379353046417, mean loss: 0.3542837742121873
Epoch: 20, step: 398, loss: 0.3075695335865021, mean loss: 0.35428217872598133
Epoch: 20, step: 399, loss: 0.3022266626358032, mean loss: 0.35428040087365587
Epoch: 20, step: 400, loss: 0.3244379460811615, mean loss: 0.35427938169894213
Epoch: 20, step: 401, loss: 0.28426194190979004, mean loss: 0.3542769905562678
Epoch: 20, step: 402, loss: 0.3521091341972351, mean loss: 0.3542769165250429
Epoch: 20, step: 403, loss: 0.36672157049179077, mean loss: 0.3542773414893226
Epoch: 20, step: 404, loss: 0.36828503012657166, mean loss: 0.3542778198123083
Epoch: 20, step: 405, loss: 0.40572789311408997, mean loss: 0.35427957662693993
Epoch: 20, step: 406, loss: 0.3418434262275696, mean loss: 0.3542791519965442
Epoch: 20, step: 407, loss: 0.33507975935935974, mean loss: 0.35427849645869125
Epoch: 20, step: 408, loss: 0.336355984210968, mean loss: 0.35427788453912257
Epoch: 20, step: 409, loss: 0.3500610291957855, mean loss: 0.35427774057000877
Epoch: 20, step: 410, loss: 0.3235218822956085, mean loss: 0.35427669055948424
Epoch: 20, step: 411, loss: 0.33603689074516296, mean loss: 0.3542760678707018
Epoch: 20, step: 412, loss: 0.42058897018432617, mean loss: 0.3542783316505234
Epoch: 20, step: 413, loss: 0.3349439799785614, mean loss: 0.354277671639884
Epoch: 20, step: 414, loss: 0.35705476999282837, mean loss: 0.3542777664375748
Epoch: 20, step: 415, loss: 0.41049855947494507, mean loss: 0.35427968549795974
Epoch: 20, step: 416, loss: 0.33449241518974304, mean loss: 0.3542790100953483
Epoch: 20, step: 417, loss: 0.31146591901779175, mean loss: 0.3542775487979533
Epoch: 20, step: 418, loss: 0.3535732328891754, mean loss: 0.3542775247590472
Epoch: 20, step: 419, loss: 0.31482571363449097, mean loss: 0.35427617828085184
Epoch: 20, step: 420, loss: 0.3238406479358673, mean loss: 0.35427513956100115
Epoch: 20, step: 421, loss: 0.32357165217399597, mean loss: 0.3542740917319319
Epoch: 20, step: 422, loss: 0.3584514856338501, mean loss: 0.3542742342905062
Epoch: 20, step: 423, loss: 0.322398841381073, mean loss: 0.3542731465416354
Epoch: 20, step: 424, loss: 0.3303149938583374, mean loss: 0.35427232899675626
Epoch: 20, step: 425, loss: 0.3455241918563843, mean loss: 0.3542720304866511
Epoch: 20, step: 426, loss: 0.31945914030075073, mean loss: 0.35427084261719377
Epoch: 20, step: 427, loss: 0.34018653631210327, mean loss: 0.3542703620553572
Epoch: 20, step: 428, loss: 0.3341856598854065, mean loss: 0.3542696767811353
Epoch: 20, step: 429, loss: 0.3756687343120575, mean loss: 0.3542704068752169
Epoch: 20, step: 430, loss: 0.3183246850967407, mean loss: 0.35426918051918066
Epoch: 20, step: 431, loss: 0.31457677483558655, mean loss: 0.35426782638416143
Epoch: 20, step: 432, loss: 0.3260939121246338, mean loss: 0.3542668652435665
Epoch: 20, step: 433, loss: 0.32211461663246155, mean loss: 0.35426576842127644
Epoch: 20, step: 434, loss: 0.345094233751297, mean loss: 0.35426545555978334
Epoch: 20, step: 435, loss: 0.32076403498649597, mean loss: 0.3542643127906275
Epoch: 20, step: 436, loss: 0.3517080247402191, mean loss: 0.3542642255958923
Epoch: 20, step: 437, loss: 0.3449714779853821, mean loss: 0.35426390863199264
Epoch: 20, step: 438, loss: 0.3269170820713043, mean loss: 0.35426297589804673
Epoch: 20, step: 439, loss: 0.2938230335712433, mean loss: 0.35426091450847214
Epoch: 20, step: 440, loss: 0.3404226303100586, mean loss: 0.3542604425503466
Epoch: 20, step: 441, loss: 0.3248821496963501, mean loss: 0.3542594406305303
Epoch: 20, step: 442, loss: 0.33724552392959595, mean loss: 0.35425886040624555
Epoch: 20, step: 443, loss: 0.3329976201057434, mean loss: 0.35425813536053896
Epoch: 20, step: 444, loss: 0.33346980810165405, mean loss: 0.3542574264661738
Epoch: 20, step: 445, loss: 0.30260542035102844, mean loss: 0.3542556651620029
Epoch: 20, step: 446, loss: 0.3138986825942993, mean loss: 0.3542542890586658
Epoch: 20, step: 447, loss: 0.2996178865432739, mean loss: 0.3542524261153176
Epoch: 20, step: 448, loss: 0.32846373319625854, mean loss: 0.35425154682543664
Epoch: 20, step: 449, loss: 0.32362475991249084, mean loss: 0.3542505026117676
Epoch: 20, step: 450, loss: 0.33712682127952576, mean loss: 0.3542499188034647
Epoch: 20, step: 451, loss: 0.27308669686317444, mean loss: 0.3542471517496688
Epoch: 20, step: 452, loss: 0.38041695952415466, mean loss: 0.35424804391234477
Epoch: 20, step: 453, loss: 0.3138444721698761, mean loss: 0.35424666654915726
Epoch: 20, step: 454, loss: 0.3500869572162628, mean loss: 0.35424652474894136
Epoch: 20, step: 455, loss: 0.3278011977672577, mean loss: 0.35424562328565457
Epoch: 20, step: 456, loss: 0.32638660073280334, mean loss: 0.35424467366495194
Epoch: 20, step: 457, loss: 0.3002106845378876, mean loss: 0.35424283189015043
Epoch: 20, step: 458, loss: 0.30575376749038696, mean loss: 0.35424117917313896
Epoch: 20, step: 459, loss: 0.34788650274276733, mean loss: 0.3542409625856669
Epoch: 20, step: 460, loss: 0.33058491349220276, mean loss: 0.35424015634017103
Epoch: 20, step: 461, loss: 0.344204306602478, mean loss: 0.35423981430998436
Epoch: 20, step: 462, loss: 0.40730077028274536, mean loss: 0.35424162261029357
Epoch: 20, step: 463, loss: 0.3409249186515808, mean loss: 0.35424116879677264
Epoch: 20, step: 464, loss: 0.3169264793395996, mean loss: 0.354239897210831
Epoch: 20, step: 465, loss: 0.326292484998703, mean loss: 0.3542389448693803
Epoch: 20, step: 466, loss: 0.3409818112850189, mean loss: 0.354238493132113
Epoch: 20, step: 467, loss: 0.32627397775650024, mean loss: 0.3542375402727912
Epoch: 20, step: 468, loss: 0.32013121247291565, mean loss: 0.3542363781777351
Epoch: 20, step: 469, loss: 0.3296634256839752, mean loss: 0.35423554093914933
Epoch: 20, step: 470, loss: 0.3566729724407196, mean loss: 0.35423562398338976
Epoch: 20, step: 471, loss: 0.3805842995643616, mean loss: 0.35423652166244335
Epoch: 20, step: 472, loss: 0.3479539155960083, mean loss: 0.3542363076261927
Epoch: 20, step: 473, loss: 0.31548064947128296, mean loss: 0.35423498734077485
Epoch: 20, step: 474, loss: 0.3375082314014435, mean loss: 0.3542344175313407
Epoch: 20, step: 475, loss: 0.343098521232605, mean loss: 0.3542340381916385
Epoch: 20, step: 476, loss: 0.3597313463687897, mean loss: 0.35423422544878935
Epoch: 20, step: 477, loss: 0.307221382856369, mean loss: 0.3542326240848479
Epoch: 20, step: 478, loss: 0.34783321619033813, mean loss: 0.3542324061139397
Epoch: 20, step: 479, loss: 0.3253325819969177, mean loss: 0.35423142178750516
Epoch: 20, step: 480, loss: 0.31134340167045593, mean loss: 0.35422996107362903
Epoch: 20, step: 481, loss: 0.34492790699005127, mean loss: 0.35422964426775466
Epoch: 20, step: 482, loss: 0.32949721813201904, mean loss: 0.3542288019687343
Epoch: 20, step: 483, loss: 0.3419799506664276, mean loss: 0.3542283848303573
Epoch: 20, step: 484, loss: 0.35714659094810486, mean loss: 0.35422848420737474
Epoch: 20, step: 485, loss: 0.33209148049354553, mean loss: 0.3542277303762873
Epoch: 20, step: 486, loss: 0.3274318277835846, mean loss: 0.3542268179268511
Epoch: 20, step: 487, loss: 0.36070021986961365, mean loss: 0.35422703835050756
Epoch: 20, step: 488, loss: 0.34373724460601807, mean loss: 0.3542266811781917
Epoch: 20, step: 489, loss: 0.34797540307044983, mean loss: 0.35422646833249516
Epoch: 20, step: 490, loss: 0.3079051375389099, mean loss: 0.3542248912213722
Epoch: 20, step: 491, loss: 0.36271926760673523, mean loss: 0.3542251804211674
Epoch: 20, step: 492, loss: 0.3179052174091339, mean loss: 0.35422394391270684
Epoch: 20, step: 493, loss: 0.32088375091552734, mean loss: 0.3542228088887742
Epoch: 20, step: 494, loss: 0.36099615693092346, mean loss: 0.3542230394708352
Epoch: 20, step: 495, loss: 0.30841341614723206, mean loss: 0.3542214800473833
Epoch: 20, step: 496, loss: 0.32971036434173584, mean loss: 0.35422064568323086
Epoch: 20, step: 497, loss: 0.30789506435394287, mean loss: 0.3542190688032074
Epoch: 20, step: 498, loss: 0.3046417534351349, mean loss: 0.3542173812946003
Epoch: 20, step: 499, loss: 0.3187943398952484, mean loss: 0.35421617560905233
Epoch: 20, step: 500, loss: 0.30864641070365906, mean loss: 0.3542146246147055
Epoch: 20, step: 501, loss: 0.3132742941379547, mean loss: 0.35421323123336734
Epoch: 20, step: 502, loss: 0.33812111616134644, mean loss: 0.3542126835658361
Epoch: 20, step: 503, loss: 0.30364179611206055, mean loss: 0.35421096253100576
Epoch: 20, step: 504, loss: 0.3274027705192566, mean loss: 0.3542100502222764
Epoch: 20, step: 505, loss: 0.3366784453392029, mean loss: 0.35420945362509126
Epoch: 20, step: 506, loss: 0.33578935265541077, mean loss: 0.35420882681388327
Epoch: 20, step: 507, loss: 0.33250075578689575, mean loss: 0.35420808814262195
Epoch: 20, step: 508, loss: 0.29449018836021423, mean loss: 0.35420605616127576
Epoch: 20, step: 509, loss: 0.31787946820259094, mean loss: 0.3542048201426314
Epoch: 20, step: 510, loss: 0.3408421277999878, mean loss: 0.35420436549010703
Epoch: 20, step: 511, loss: 0.3690303862094879, mean loss: 0.3542048699137842
Epoch: 20, step: 512, loss: 0.3666740953922272, mean loss: 0.3542052941381056
Epoch: 20, step: 513, loss: 0.3502456545829773, mean loss: 0.3542051594289964
Epoch: 20, step: 514, loss: 0.3396081328392029, mean loss: 0.3542046628470406
Epoch: 20, step: 515, loss: 0.33565789461135864, mean loss: 0.354204031918743
Epoch: 20, step: 516, loss: 0.3494654595851898, mean loss: 0.3542038707263651
Epoch: 20, step: 517, loss: 0.3050307333469391, mean loss: 0.3542021980568849
Epoch: 20, step: 518, loss: 0.34028854966163635, mean loss: 0.35420172478744055
Epoch: 20, step: 519, loss: 0.3260836601257324, mean loss: 0.3542007683906834
Epoch: 20, step: 520, loss: 0.3172890841960907, mean loss: 0.3541995129339236
Epoch: 20, step: 521, loss: 0.31975728273391724, mean loss: 0.3541983415091838
Epoch: 20, step: 522, loss: 0.36881548166275024, mean loss: 0.354198838640094
Epoch: 20, step: 523, loss: 0.35809293389320374, mean loss: 0.3541989710742952
Epoch: 20, step: 524, loss: 0.319297730922699, mean loss: 0.35419778415913955
Epoch: 20, step: 525, loss: 0.3026238679885864, mean loss: 0.3541960303022338
Epoch: 20, step: 526, loss: 0.4133642315864563, mean loss: 0.35419804234702873
Epoch: 20, step: 527, loss: 0.2944915294647217, mean loss: 0.3541960120657147
Epoch: 20, step: 528, loss: 0.3077433407306671, mean loss: 0.35419443252641264
Epoch: 20, step: 529, loss: 0.3084414601325989, mean loss: 0.35419287683200956
Epoch: 20, step: 530, loss: 0.3349021375179291, mean loss: 0.35419222092981945
Epoch: 20, step: 531, loss: 0.31668561697006226, mean loss: 0.35419094571548654
Epoch: 20, step: 532, loss: 0.29289063811302185, mean loss: 0.35418886159256124
Epoch: 20, step: 533, loss: 0.3104190230369568, mean loss: 0.35418737353114305
Epoch: 20, step: 534, loss: 0.3216642737388611, mean loss: 0.3541862678673731
Epoch: 20, step: 535, loss: 0.31267252564430237, mean loss: 0.3541848566033596
Epoch: 20, step: 536, loss: 0.35835161805152893, mean loss: 0.35418499824803606
Epoch: 20, step: 537, loss: 0.3591175079345703, mean loss: 0.3541851659178194
Epoch: 20, step: 538, loss: 0.30522263050079346, mean loss: 0.3541835016010372
Epoch: 20, step: 539, loss: 0.32062843441963196, mean loss: 0.35418236104810785
Epoch: 20, step: 540, loss: 0.31013980507850647, mean loss: 0.3541808640712556
Epoch: 20, step: 541, loss: 0.35341259837150574, mean loss: 0.35418083795930877
Epoch: 20, step: 542, loss: 0.31415238976478577, mean loss: 0.3541794775117611
Epoch: 20, step: 543, loss: 0.3122144043445587, mean loss: 0.3541780512925806
Epoch: 20, step: 544, loss: 0.32825079560279846, mean loss: 0.35417717016239575
Epoch: 20, step: 545, loss: 0.31836941838264465, mean loss: 0.35417595328780255
Epoch: 20, step: 546, loss: 0.346385657787323, mean loss: 0.3541756885548872
Epoch: 20, step: 547, loss: 0.3562663197517395, mean loss: 0.35417575959713254
Epoch: 20, step: 548, loss: 0.34612250328063965, mean loss: 0.3541754859467769
Epoch: 20, step: 549, loss: 0.36261051893234253, mean loss: 0.35417577256019805
Epoch: 20, step: 550, loss: 0.3491900861263275, mean loss: 0.35417560315764857
Epoch: 20, step: 551, loss: 0.34649351239204407, mean loss: 0.35417534214613844
Epoch: 20, step: 552, loss: 0.3025417923927307, mean loss: 0.35417358787203274
Epoch: 20, step: 553, loss: 0.31039148569107056, mean loss: 0.3541721004050836
Epoch: 20, step: 554, loss: 0.3860923945903778, mean loss: 0.3541731848383836
Epoch: 20, step: 555, loss: 0.3261899948120117, mean loss: 0.35417223419325433
Epoch: 20, step: 556, loss: 0.3591969907283783, mean loss: 0.35417240488852
Epoch: 20, step: 557, loss: 0.3569853603839874, mean loss: 0.3541725004437715
Epoch: 20, step: 558, loss: 0.340192973613739, mean loss: 0.35417202557958355
Epoch: 20, step: 559, loss: 0.32760897278785706, mean loss: 0.35417112330197514
Epoch: 20, step: 560, loss: 0.3182319700717926, mean loss: 0.3541699025841588
Epoch: 20, step: 561, loss: 0.3143858313560486, mean loss: 0.35416855131484193
Epoch: 20, step: 562, loss: 0.337568074464798, mean loss: 0.35416798749740314
Epoch: 20, step: 563, loss: 0.37302857637405396, mean loss: 0.3541686280553734
Epoch: 20, step: 564, loss: 0.33233627676963806, mean loss: 0.35416788659328186
Epoch: 20, step: 565, loss: 0.30518367886543274, mean loss: 0.3541662230665642
Epoch: 20, step: 566, loss: 0.37842512130737305, mean loss: 0.35416704688217326
Epoch: 20, step: 567, loss: 0.3208014667034149, mean loss: 0.35416591384834484
Epoch: 20, step: 568, loss: 0.34402668476104736, mean loss: 0.35416556955043704
Epoch: 20, step: 569, loss: 0.3176630139350891, mean loss: 0.35416433007486436
Epoch: 20, step: 570, loss: 0.32624533772468567, mean loss: 0.35416338209373127
Epoch: 20, step: 571, loss: 0.32914161682128906, mean loss: 0.35416253251593444
Epoch: 20, step: 572, loss: 0.35709646344184875, mean loss: 0.3541626321299271
Epoch: 20, step: 573, loss: 0.3698258101940155, mean loss: 0.3541631639143389
Epoch: 20, step: 574, loss: 0.3196145296096802, mean loss: 0.3541619909849787
Epoch: 20, step: 575, loss: 0.3149269223213196, mean loss: 0.3541606589959556
Epoch: 20, step: 576, loss: 0.35386723279953003, mean loss: 0.3541606490347852
Epoch: 20, step: 577, loss: 0.3264985680580139, mean loss: 0.3541597100001944
Epoch: 20, step: 578, loss: 0.37018516659736633, mean loss: 0.3541602539920678
Epoch: 20, step: 579, loss: 0.3339376151561737, mean loss: 0.35415956754811545
Epoch: 20, step: 580, loss: 0.35461708903312683, mean loss: 0.35415958307784917
Epoch: 20, step: 581, loss: 0.3316424787044525, mean loss: 0.35415881880168415
Epoch: 20, step: 582, loss: 0.3034617006778717, mean loss: 0.35415709809713525
Epoch: 20, step: 583, loss: 0.32074305415153503, mean loss: 0.35415596403373767
Epoch: 20, step: 584, loss: 0.33198368549346924, mean loss: 0.35415521153828405
Epoch: 20, step: 585, loss: 0.33139923214912415, mean loss: 0.3541544392590677
Epoch: 20, step: 586, loss: 0.3519035875797272, mean loss: 0.35415436287356256
Epoch: 20, step: 587, loss: 0.32669797539711, mean loss: 0.354153431137867
Epoch: 20, step: 588, loss: 0.29828548431396484, mean loss: 0.35415153531694255
Epoch: 20, step: 589, loss: 0.32126280665397644, mean loss: 0.354150419309862
Epoch: 20, step: 590, loss: 0.3344666063785553, mean loss: 0.35414975140538196
Epoch: 20, step: 591, loss: 0.3605254888534546, mean loss: 0.3541499677374072
Epoch: 20, step: 592, loss: 0.3191216289997101, mean loss: 0.3541487792483244
Epoch: 20, step: 593, loss: 0.3355993628501892, mean loss: 0.3541481498998682
Epoch: 20, step: 594, loss: 0.29057249426841736, mean loss: 0.3541459929649867
Epoch: 20, step: 595, loss: 0.32799509167671204, mean loss: 0.35414510577197245
Epoch: 20, step: 596, loss: 0.30811190605163574, mean loss: 0.354143544106955
Epoch: 20, step: 597, loss: 0.3291158080101013, mean loss: 0.35414269507594553
Epoch: 20, step: 598, loss: 0.3454819321632385, mean loss: 0.35414240128162033
Epoch: 20, step: 599, loss: 0.3233320713043213, mean loss: 0.3541413561550946
Epoch: 20, step: 600, loss: 0.3232761323451996, mean loss: 0.3541403092020126
Epoch: 20, step: 601, loss: 0.3419681191444397, mean loss: 0.3541398963334807
Epoch: 20, step: 602, loss: 0.3323843777179718, mean loss: 0.3541391584330426
Epoch: 20, step: 603, loss: 0.29446470737457275, mean loss: 0.35413713447255357
Epoch: 20, step: 604, loss: 0.35946595668792725, mean loss: 0.35413731520249137
Epoch: 20, step: 605, loss: 0.32326963543891907, mean loss: 0.35413626834365114
Epoch: 20, step: 606, loss: 0.3214566707611084, mean loss: 0.35413516007229145
Epoch: 20, step: 607, loss: 0.3072778582572937, mean loss: 0.3541335710427942
Epoch: 20, step: 608, loss: 0.37338510155677795, mean loss: 0.3541342238804799
Epoch: 20, step: 609, loss: 0.345427930355072, mean loss: 0.35413392865180826
Epoch: 20, step: 610, loss: 0.3728684186935425, mean loss: 0.35413456391307585
Epoch: 20, step: 611, loss: 0.319049209356308, mean loss: 0.35413337425640434
Epoch: 20, step: 612, loss: 0.323321133852005, mean loss: 0.3541323295257766
Epoch: 20, step: 613, loss: 0.3378128707408905, mean loss: 0.35413177621124536
Epoch: 20, step: 614, loss: 0.33491095900535583, mean loss: 0.35413112454766826
Epoch: 20, step: 615, loss: 0.32348400354385376, mean loss: 0.3541300855213256
Epoch: 20, step: 616, loss: 0.3084300756454468, mean loss: 0.3541285362108914
Epoch: 20, step: 617, loss: 0.3242223560810089, mean loss: 0.3541275223733387
Epoch: 20, step: 618, loss: 0.33190351724624634, mean loss: 0.3541267689916944
Epoch: 20, step: 619, loss: 0.38629016280174255, mean loss: 0.3541278592762303
Epoch: 20, step: 620, loss: 0.3775070309638977, mean loss: 0.3541286517636608
Epoch: 20, step: 621, loss: 0.3220215141773224, mean loss: 0.3541275634598988
Epoch: 20, step: 622, loss: 0.34120866656303406, mean loss: 0.35412712557572107
Epoch: 20, step: 623, loss: 0.3759235441684723, mean loss: 0.35412786433719723
Epoch: 20, step: 624, loss: 0.3550599217414856, mean loss: 0.3541278959270093
Epoch: 20, step: 625, loss: 0.34859320521354675, mean loss: 0.35412770834852647
Epoch: 20, step: 626, loss: 0.3528338074684143, mean loss: 0.3541276644978849
Epoch: 20, step: 627, loss: 0.3152841627597809, mean loss: 0.35412634812599464
Epoch: 20, step: 628, loss: 0.342026025056839, mean loss: 0.35412593807065323
Epoch: 20, step: 629, loss: 0.30643942952156067, mean loss: 0.35412432212661565
Epoch: 20, step: 630, loss: 0.29372215270996094, mean loss: 0.3541222753586506
Epoch: 20, step: 631, loss: 0.3230462074279785, mean loss: 0.3541212223609571
Epoch: 20, step: 632, loss: 0.3487757742404938, mean loss: 0.3541210412391423
Epoch: 20, step: 633, loss: 0.321440726518631, mean loss: 0.3541199339573533
Epoch: 20, step: 634, loss: 0.3620671331882477, mean loss: 0.3541202032170257
Epoch: 20, step: 635, loss: 0.32283079624176025, mean loss: 0.35411914313412235
Epoch: 20, step: 636, loss: 0.34572634100914, mean loss: 0.35411885879621113
Epoch: 20, step: 637, loss: 0.34508150815963745, mean loss: 0.3541185526321541
Epoch: 20, step: 638, loss: 0.32484859228134155, mean loss: 0.35411756106874237
Epoch: 20, step: 639, loss: 0.34040045738220215, mean loss: 0.3541170963972083
Epoch: 20, step: 640, loss: 0.3593440353870392, mean loss: 0.3541172734555393
Epoch: 20, step: 641, loss: 0.3361617922782898, mean loss: 0.35411666524873836
Epoch: 20, step: 642, loss: 0.3479730784893036, mean loss: 0.3541164571538036
Epoch: 20, step: 643, loss: 0.3504273295402527, mean loss: 0.3541163322002873
Epoch: 20, step: 644, loss: 0.3532068729400635, mean loss: 0.35411630139726413
Epoch: 20, step: 645, loss: 0.3257230222225189, mean loss: 0.35411533976076837
Epoch: 20, step: 646, loss: 0.3682505786418915, mean loss: 0.35411581848325563
Epoch: 20, step: 647, loss: 0.33714890480041504, mean loss: 0.3541152438790263
Epoch: 20, step: 648, loss: 0.3343702256679535, mean loss: 0.3541145752137071
Epoch: 20, step: 649, loss: 0.3238828480243683, mean loss: 0.3541135514505107
Epoch: 20, step: 650, loss: 0.3696599304676056, mean loss: 0.35411407789319865
Epoch: 20, step: 651, loss: 0.3125128149986267, mean loss: 0.3541126692089614
Epoch: 20, step: 652, loss: 0.31392452120780945, mean loss: 0.35411130842109695
Epoch: 20, step: 653, loss: 0.3389013111591339, mean loss: 0.35411079342152824
Epoch: 20, step: 654, loss: 0.3036046028137207, mean loss: 0.3541090833761378
Epoch: 20, step: 655, loss: 0.3308141827583313, mean loss: 0.35410829468096516
Epoch: 20, step: 656, loss: 0.32837626338005066, mean loss: 0.3541074235013836
Epoch: 20, step: 657, loss: 0.31332308053970337, mean loss: 0.35410604275986546
Epoch: 20, step: 658, loss: 0.30913829803466797, mean loss: 0.3541045204420915
Epoch: 20, step: 659, loss: 0.3119506239891052, mean loss: 0.3541030934313788
Epoch: 20, step: 660, loss: 0.35042399168014526, mean loss: 0.35410296888915777
Epoch: 20, step: 661, loss: 0.3297215700149536, mean loss: 0.35410214357608233
Epoch: 20, step: 662, loss: 0.3477177023887634, mean loss: 0.3541019274693502
Epoch: 20, step: 663, loss: 0.40138792991638184, mean loss: 0.35410352799745903
Epoch: 20, step: 664, loss: 0.3451985716819763, mean loss: 0.3541032265943006
Epoch: 20, step: 665, loss: 0.328435480594635, mean loss: 0.35410235785585886
Epoch: 20, step: 666, loss: 0.33355021476745605, mean loss: 0.35410166228124595
Epoch: 20, step: 667, loss: 0.3426043391227722, mean loss: 0.35410127317460055
Epoch: 20, step: 668, loss: 0.32492658495903015, mean loss: 0.3541002858420947
Epoch: 20, step: 669, loss: 0.33013996481895447, mean loss: 0.35409947500212774
Epoch: 20, step: 670, loss: 0.29938796162605286, mean loss: 0.3540976235753274
Epoch: 20, step: 671, loss: 0.3270685076713562, mean loss: 0.3540967089463377
Epoch: 20, step: 672, loss: 0.3383001685142517, mean loss: 0.35409617443070707
Epoch: 20, step: 673, loss: 0.30827751755714417, mean loss: 0.35409462409380266
Epoch: 20, step: 674, loss: 0.31878721714019775, mean loss: 0.3540934294598337
Epoch: 20, step: 675, loss: 0.36131271719932556, mean loss: 0.3540936737177759
Epoch: 20, step: 676, loss: 0.33988064527511597, mean loss: 0.3540931928493372
Epoch: 20, step: 677, loss: 0.34472477436065674, mean loss: 0.35409287589898575
Epoch: 20, step: 678, loss: 0.3186280429363251, mean loss: 0.35409167610085446
Epoch: 20, step: 679, loss: 0.3464615046977997, mean loss: 0.35409141797597615
Epoch: 20, step: 680, loss: 0.3060116171836853, mean loss: 0.35408979151541015
Epoch: 20, step: 681, loss: 0.323588490486145, mean loss: 0.3540887597414764
Epoch: 20, step: 682, loss: 0.42887988686561584, mean loss: 0.35409128963110614
Epoch: 20, step: 683, loss: 0.32900166511535645, mean loss: 0.3540904409765088
Epoch: 20, step: 684, loss: 0.3474850654602051, mean loss: 0.354090217557753
Epoch: 20, step: 685, loss: 0.3398517966270447, mean loss: 0.3540897359768516
Epoch: 20, step: 686, loss: 0.3014764189720154, mean loss: 0.35408795651606745
Epoch: 20, step: 687, loss: 0.3236645758152008, mean loss: 0.3540869275867959
Epoch: 20, step: 688, loss: 0.39433401823043823, mean loss: 0.35408828871130615
Epoch: 20, step: 689, loss: 0.3794059157371521, mean loss: 0.3540891449043067
Epoch: 20, step: 690, loss: 0.3159034252166748, mean loss: 0.3540878535810614
Epoch: 20, step: 691, loss: 0.3204616606235504, mean loss: 0.35408671648539797
Epoch: 20, step: 692, loss: 0.31670159101486206, mean loss: 0.3540854523212797
Epoch: 20, step: 693, loss: 0.309498131275177, mean loss: 0.35408394466857646
Epoch: 20, step: 694, loss: 0.35976818203926086, mean loss: 0.35408413686595164
Epoch: 20, step: 695, loss: 0.34157857298851013, mean loss: 0.35408371403785194
Epoch: 20, step: 696, loss: 0.3624736964702606, mean loss: 0.35408399770362037
Epoch: 20, step: 697, loss: 0.3426562547683716, mean loss: 0.3540836113440648
Epoch: 20, step: 698, loss: 0.32153892517089844, mean loss: 0.35408251108083166
Epoch: 20, step: 699, loss: 0.30414915084838867, mean loss: 0.3540808230023924
Epoch: 20, step: 700, loss: 0.32275038957595825, mean loss: 0.35407976386195
Epoch: 20, step: 701, loss: 0.334311842918396, mean loss: 0.3540790956204199
Epoch: 20, step: 702, loss: 0.32846179604530334, mean loss: 0.3540782296737757
Epoch: 20, step: 703, loss: 0.32705697417259216, mean loss: 0.35407731629980665
Epoch: 20, step: 704, loss: 0.32874372601509094, mean loss: 0.35407646000133497
Epoch: 20, step: 705, loss: 0.3481973111629486, mean loss: 0.3540762612874555
Epoch: 20, step: 706, loss: 0.3172568380832672, mean loss: 0.3540750168414757
Epoch: 20, step: 707, loss: 0.3512529730796814, mean loss: 0.3540749214634927
Epoch: 20, step: 708, loss: 0.3364252746105194, mean loss: 0.35407432496996966
Epoch: 20, step: 709, loss: 0.2985956072807312, mean loss: 0.3540724500555496
Epoch: 20, step: 710, loss: 0.31669798493385315, mean loss: 0.35407118702067003
Epoch: 20, step: 711, loss: 0.33328840136528015, mean loss: 0.35407048470971925
Epoch: 20, step: 712, loss: 0.36432746052742004, mean loss: 0.3540708313111391
Epoch: 20, step: 713, loss: 0.3276865780353546, mean loss: 0.35406993977051343
Epoch: 20, step: 714, loss: 0.3038095533847809, mean loss: 0.35406824149761645
Epoch: 20, step: 715, loss: 0.3348974287509918, mean loss: 0.35406759374748986
Epoch: 20, step: 716, loss: 0.37286850810050964, mean loss: 0.35406822897789675
Epoch: 20, step: 717, loss: 0.33086442947387695, mean loss: 0.3540674450127807
Epoch: 20, step: 718, loss: 0.330329567193985, mean loss: 0.354066643030355
Epoch: 20, step: 719, loss: 0.3333609998226166, mean loss: 0.3540659435153818
Epoch: 20, step: 720, loss: 0.3125579357147217, mean loss: 0.35406454126519427
Epoch: 20, step: 721, loss: 0.30011487007141113, mean loss: 0.3540627187643094
Epoch: 20, step: 722, loss: 0.32778114080429077, mean loss: 0.3540618309631419
Epoch: 20, step: 723, loss: 0.30740970373153687, mean loss: 0.3540602550907182
Epoch: 20, step: 724, loss: 0.36672666668891907, mean loss: 0.3540606829377575
Epoch: 20, step: 725, loss: 0.33273011445999146, mean loss: 0.3540599624564876
Epoch: 20, step: 726, loss: 0.3373529314994812, mean loss: 0.3540593981632138
Epoch: 20, step: 727, loss: 0.3290933668613434, mean loss: 0.35405855494410743
Epoch: 20, step: 728, loss: 0.36252468824386597, mean loss: 0.3540588408751858
Epoch: 20, step: 729, loss: 0.356710284948349, mean loss: 0.3540589304207472
Epoch: 20, step: 730, loss: 0.3090250492095947, mean loss: 0.35405740957102205
Epoch: 20, step: 731, loss: 0.3523944020271301, mean loss: 0.3540573534111023
Epoch: 20, step: 732, loss: 0.3597468137741089, mean loss: 0.3540575455382209
Epoch: 20, step: 733, loss: 0.3358055055141449, mean loss: 0.35405692920675524
Epoch: 20, step: 734, loss: 0.3416405916213989, mean loss: 0.3540565099483529
Epoch: 20, step: 735, loss: 0.3382274806499481, mean loss: 0.3540559754727553
Epoch: 20, step: 736, loss: 0.32650133967399597, mean loss: 0.3540550451072288
Epoch: 20, step: 737, loss: 0.31353381276130676, mean loss: 0.35405367697864665
Epoch: 20, step: 738, loss: 0.36889150738716125, mean loss: 0.3540541779351411
Epoch: 20, step: 739, loss: 0.33552658557891846, mean loss: 0.3540535524256085
Epoch: 20, step: 740, loss: 0.34258344769477844, mean loss: 0.3540531651967934
Epoch: 20, step: 741, loss: 0.33237165212631226, mean loss: 0.35405243325725283
Epoch: 20, step: 742, loss: 0.3003368675708771, mean loss: 0.3540506199511837
Epoch: 20, step: 743, loss: 0.3111685812473297, mean loss: 0.3540491724073441
Epoch: 20, step: 744, loss: 0.34401625394821167, mean loss: 0.3540488337434299
Epoch: 20, step: 745, loss: 0.3281359374523163, mean loss: 0.3540479590760333
Epoch: 20, step: 746, loss: 0.38316231966018677, mean loss: 0.3540489417729174
Epoch: 20, step: 747, loss: 0.41274723410606384, mean loss: 0.35405092294924834
Epoch: 20, step: 748, loss: 0.36071521043777466, mean loss: 0.3540511478737307
Epoch: 20, step: 749, loss: 0.3199462890625, mean loss: 0.35404999684913363
Epoch: 20, step: 750, loss: 0.3641040325164795, mean loss: 0.35405033615714443
Epoch: 20, step: 751, loss: 0.3285730481147766, mean loss: 0.35404947636745615
Epoch: 20, step: 752, loss: 0.3136930465698242, mean loss: 0.3540481144928637
Epoch: 20, step: 753, loss: 0.3216700255870819, mean loss: 0.35404702189352155
Epoch: 20, step: 754, loss: 0.3050185441970825, mean loss: 0.35404536748226134
Epoch: 20, step: 755, loss: 0.3669784665107727, mean loss: 0.3540458038805279
Epoch: 20, step: 756, loss: 0.3402833044528961, mean loss: 0.354045339511684
Epoch: 20, step: 757, loss: 0.3152426779270172, mean loss: 0.35404403029171017
Epoch: 20, step: 758, loss: 0.3498663604259491, mean loss: 0.3540438893399282
Epoch: 20, step: 759, loss: 0.3415334224700928, mean loss: 0.3540434672593995
Epoch: 20, step: 760, loss: 0.30729955434799194, mean loss: 0.3540418902575132
Epoch: 20, step: 761, loss: 0.331464022397995, mean loss: 0.35404112857247644
Epoch: 20, step: 762, loss: 0.31950870156288147, mean loss: 0.35403996362874574
Epoch: 20, step: 763, loss: 0.3736724257469177, mean loss: 0.3540406259031391
Epoch: 20, step: 764, loss: 0.3637029230594635, mean loss: 0.3540409518365902
Epoch: 20, step: 765, loss: 0.3619566857814789, mean loss: 0.3540412188450886
Epoch: 20, step: 766, loss: 0.30156630277633667, mean loss: 0.35403944885432836
Epoch: 20, step: 767, loss: 0.3766668140888214, mean loss: 0.3540402120547208
Epoch: 20, step: 768, loss: 0.35034382343292236, mean loss: 0.3540400873831089
Epoch: 20, step: 769, loss: 0.35326826572418213, mean loss: 0.35404006135202426
Epoch: 20, step: 770, loss: 0.3496430218219757, mean loss: 0.35403991305889654
Epoch: 20, step: 771, loss: 0.32214057445526123, mean loss: 0.3540388372684405
Epoch: 20, step: 772, loss: 0.3272806704044342, mean loss: 0.3540379348920582
Epoch: 20, step: 773, loss: 0.3515161871910095, mean loss: 0.3540378498530179
Epoch: 20, step: 774, loss: 0.3156105875968933, mean loss: 0.35403655404245454
Epoch: 20, step: 775, loss: 0.32093918323516846, mean loss: 0.3540354379994681
Epoch: 20, step: 776, loss: 0.3385778069496155, mean loss: 0.35403491678589116
Epoch: 20, step: 777, loss: 0.3096141517162323, mean loss: 0.35403341901918167
Epoch: 20, step: 778, loss: 0.31967994570732117, mean loss: 0.354032260737604
Epoch: 20, step: 779, loss: 0.3425508141517639, mean loss: 0.3540318736355613
Epoch: 20, step: 780, loss: 0.3092252016067505, mean loss: 0.35403036300975543
Epoch: 20, step: 781, loss: 0.339368611574173, mean loss: 0.3540298687156608
Epoch: 20, step: 782, loss: 0.32325559854507446, mean loss: 0.3540288312524854
Epoch: 20, step: 783, loss: 0.35629865527153015, mean loss: 0.3540289077702854
Epoch: 20, step: 784, loss: 0.3541461229324341, mean loss: 0.35402891172158024
Epoch: 20, step: 785, loss: 0.3651025593280792, mean loss: 0.35402928499898895
Epoch: 20, step: 786, loss: 0.34855613112449646, mean loss: 0.35402910051272896
Epoch: 20, step: 787, loss: 0.33011394739151, mean loss: 0.35402829442020095
Epoch: 20, step: 788, loss: 0.3330099582672119, mean loss: 0.35402758599267886
Epoch: 20, step: 789, loss: 0.3169727921485901, mean loss: 0.3540263370950097
Epoch: 20, step: 790, loss: 0.30605238676071167, mean loss: 0.35402472023173126
Epoch: 20, step: 791, loss: 0.3567344546318054, mean loss: 0.35402481155467547
Epoch: 20, step: 792, loss: 0.3174740970134735, mean loss: 0.35402357977108295
Epoch: 20, step: 793, loss: 0.3108097016811371, mean loss: 0.3540221234834881
Epoch: 20, step: 794, loss: 0.3375970125198364, mean loss: 0.3540215699835399
Epoch: 20, step: 795, loss: 0.34716883301734924, mean loss: 0.35402133906505473
Epoch: 20, step: 796, loss: 0.36895957589149475, mean loss: 0.35402184242579965
Epoch: 20, step: 797, loss: 0.3193964958190918, mean loss: 0.35402067572499074
Epoch: 20, step: 798, loss: 0.32800042629241943, mean loss: 0.3540197990024114
Epoch: 20, step: 799, loss: 0.3077617585659027, mean loss: 0.3540182404430975
Epoch: 20, step: 800, loss: 0.37774229049682617, mean loss: 0.35401903974399884
Epoch: 20, step: 801, loss: 0.34091660380363464, mean loss: 0.35401859831700805
Epoch: 20, step: 802, loss: 0.3273082673549652, mean loss: 0.35401769846419795
Epoch: 20, step: 803, loss: 0.32827329635620117, mean loss: 0.3540168311820895
Epoch: 20, step: 804, loss: 0.37654635310173035, mean loss: 0.3540175901351607
Epoch: 20, step: 805, loss: 0.36141669750213623, mean loss: 0.3540178393808444
Epoch: 20, step: 806, loss: 0.34134215116500854, mean loss: 0.3540174124031028
Epoch: 20, step: 807, loss: 0.33138251304626465, mean loss: 0.3540166499772285
Epoch: 20, step: 808, loss: 0.33633020520210266, mean loss: 0.35401605425339894
Epoch: 20, step: 809, loss: 0.30819573998451233, mean loss: 0.35401451096224806
Epoch: 20, step: 810, loss: 0.32332316040992737, mean loss: 0.35401347727020155
Epoch: 20, step: 811, loss: 0.3713415861129761, mean loss: 0.3540140608654071
Epoch: 20, step: 812, loss: 0.3010011613368988, mean loss: 0.3540122754985015
Epoch: 20, step: 813, loss: 0.2987764775753021, mean loss: 0.3540104153315343
Epoch: 20, step: 814, loss: 0.35706812143325806, mean loss: 0.3540105183019368
Epoch: 20, step: 815, loss: 0.34309035539627075, mean loss: 0.35401015057015794
Epoch: 20, step: 816, loss: 0.3424761891365051, mean loss: 0.354009762182057
Epoch: 20, step: 817, loss: 0.37055450677871704, mean loss: 0.35401031928167975
Epoch: 20, step: 818, loss: 0.3257949948310852, mean loss: 0.3540093692387675
Epoch: 20, step: 819, loss: 0.33010998368263245, mean loss: 0.35400856454565116
Epoch: 20, step: 820, loss: 0.33604758977890015, mean loss: 0.35400795981938715
Epoch: 20, step: 821, loss: 0.3035320043563843, mean loss: 0.35400626040670574
Epoch: 20, step: 822, loss: 0.3261849284172058, mean loss: 0.3540053237561321
Epoch: 20, step: 823, loss: 0.3469904661178589, mean loss: 0.3540050875974451
Epoch: 20, step: 824, loss: 0.3340291380882263, mean loss: 0.35400441511976427
Epoch: 20, step: 825, loss: 0.31913453340530396, mean loss: 0.3540032412868108
Epoch: 20, step: 826, loss: 0.3517206907272339, mean loss: 0.354003164451366
Epoch: 20, step: 827, loss: 0.33144938945770264, mean loss: 0.354002405269496
Epoch: 20, step: 828, loss: 0.3379102945327759, mean loss: 0.35400186361172437
Epoch: 20, step: 829, loss: 0.3281514048576355, mean loss: 0.35400099351886827
Epoch: 20, step: 830, loss: 0.30423641204833984, mean loss: 0.35399931856408823
Epoch: 20, step: 831, loss: 0.33640047907829285, mean loss: 0.35399872624988904
Epoch: 20, step: 832, loss: 0.32954421639442444, mean loss: 0.35399790322596497
Epoch: 20, step: 833, loss: 0.33200743794441223, mean loss: 0.3539971631551135
Epoch: 20, step: 834, loss: 0.38341236114501953, mean loss: 0.3539981530658653
Epoch: 20, step: 835, loss: 0.34387779235839844, mean loss: 0.35399781249645124
Epoch: 20, step: 836, loss: 0.27049320936203003, mean loss: 0.3539950025020664
Epoch: 20, step: 837, loss: 0.33811694383621216, mean loss: 0.3539944682111092
Epoch: 20, step: 838, loss: 0.3499112129211426, mean loss: 0.3539943308156622
Epoch: 20, step: 839, loss: 0.34996306896209717, mean loss: 0.3539941951742808
Epoch: 20, step: 840, loss: 0.3510858118534088, mean loss: 0.3539940973181077
Epoch: 20, step: 841, loss: 0.3369278013706207, mean loss: 0.35399352312067994
Epoch: 20, step: 842, loss: 0.30563727021217346, mean loss: 0.35399189622390276
Epoch: 20, step: 843, loss: 0.3340207636356354, mean loss: 0.35399122433813407
Epoch: 20, step: 844, loss: 0.3514463007450104, mean loss: 0.353991138722538
Epoch: 20, step: 845, loss: 0.3149779438972473, mean loss: 0.3539898262958804
Epoch: 20, step: 846, loss: 0.35676518082618713, mean loss: 0.3539899196572869
Epoch: 20, step: 847, loss: 0.38843852281570435, mean loss: 0.3539910784504502
Epoch: 20, step: 848, loss: 0.3448113203048706, mean loss: 0.3539907696691879
Epoch: 20, step: 849, loss: 0.35424306988716125, mean loss: 0.3539907781555726
Epoch: 20, step: 850, loss: 0.3545362949371338, mean loss: 0.35399079650398946
Epoch: 20, step: 851, loss: 0.3278115689754486, mean loss: 0.3539899159972113
Epoch: 20, step: 852, loss: 0.281607449054718, mean loss: 0.353987481582018
Epoch: 20, step: 853, loss: 0.31836652755737305, mean loss: 0.3539862835947299
Epoch: 20, step: 854, loss: 0.3554195165634155, mean loss: 0.3539863317949306
Epoch: 20, step: 855, loss: 0.30658215284347534, mean loss: 0.35398473762695404
Epoch: 20, step: 856, loss: 0.3485051095485687, mean loss: 0.3539845533572537
Epoch: 20, step: 857, loss: 0.2926194965839386, mean loss: 0.35398248983392416
Epoch: 20, step: 858, loss: 0.28834208846092224, mean loss: 0.3539802826177645
Epoch: 20, step: 859, loss: 0.3435860574245453, mean loss: 0.35397993311456366
Epoch: 20, step: 860, loss: 0.39526912569999695, mean loss: 0.35398132140657085
Epoch: 20, step: 861, loss: 0.3326861262321472, mean loss: 0.35398060540915394
Epoch: 20, step: 862, loss: 0.34520113468170166, mean loss: 0.3539803102314406
Epoch: 20, step: 863, loss: 0.32543718814849854, mean loss: 0.3539793506052275
Epoch: 20, step: 864, loss: 0.3468913435935974, mean loss: 0.35397911231284185
Epoch: 20, step: 865, loss: 0.3219144642353058, mean loss: 0.3539780343646109
Epoch: 20, step: 866, loss: 0.33398106694221497, mean loss: 0.3539773621298503
Epoch: 20, step: 867, loss: 0.32142558693885803, mean loss: 0.3539762678789699
Epoch: 20, step: 868, loss: 0.3059978187084198, mean loss: 0.35397465510377846
Epoch: 20, step: 869, loss: 0.29187992215156555, mean loss: 0.3539725678858641
Epoch: 20, step: 870, loss: 0.3113861083984375, mean loss: 0.3539711364563496
Epoch: 20, step: 871, loss: 0.3391539752483368, mean loss: 0.3539706384339912
Epoch: 20, step: 872, loss: 0.33677351474761963, mean loss: 0.35397006043769885
Epoch: 20, step: 873, loss: 0.3536522388458252, mean loss: 0.35397004975605634
Epoch: 20, step: 874, loss: 0.30901601910591125, mean loss: 0.35396853895011954
Epoch: 20, step: 875, loss: 0.325666218996048, mean loss: 0.3539675878034616
Epoch: 20, step: 876, loss: 0.33858704566955566, mean loss: 0.3539670709320655
Epoch: 20, step: 877, loss: 0.306607186794281, mean loss: 0.35396547943115353
Epoch: 20, step: 878, loss: 0.32540464401245117, mean loss: 0.3539645196934131
Epoch: 20, step: 879, loss: 0.32323408126831055, mean loss: 0.353963487084595
Epoch: 20, step: 880, loss: 0.3035799562931061, mean loss: 0.3539617941464951
Epoch: 20, step: 881, loss: 0.3217926025390625, mean loss: 0.3539607132651159
Epoch: 20, step: 882, loss: 0.32706761360168457, mean loss: 0.3539598096902188
Epoch: 20, step: 883, loss: 0.3032723665237427, mean loss: 0.35395810671201805
Epoch: 20, step: 884, loss: 0.32986021041870117, mean loss: 0.35395729710690155
Epoch: 20, step: 885, loss: 0.32431578636169434, mean loss: 0.35395630128916505
Epoch: 20, step: 886, loss: 0.3479682505130768, mean loss: 0.35395610012509826
Epoch: 20, step: 887, loss: 0.34466123580932617, mean loss: 0.3539557878816047
Epoch: 20, step: 888, loss: 0.3525694012641907, mean loss: 0.353955741310117
Epoch: 20, step: 889, loss: 0.3390558362007141, mean loss: 0.35395524080944146
Epoch: 20, step: 890, loss: 0.3376948833465576, mean loss: 0.35395469462834367
Epoch: 20, step: 891, loss: 0.34831851720809937, mean loss: 0.35395450531699674
Epoch: 20, step: 892, loss: 0.3610928952693939, mean loss: 0.3539547450775164
Epoch: 20, step: 893, loss: 0.32734358310699463, mean loss: 0.35395385130570306
Epoch: 20, step: 894, loss: 0.2972904145717621, mean loss: 0.3539519482515726
Epoch: 20, step: 895, loss: 0.3950817883014679, mean loss: 0.35395332956001063
Epoch: 20, step: 896, loss: 0.33789023756980896, mean loss: 0.35395279011372693
Epoch: 20, step: 897, loss: 0.33876970410346985, mean loss: 0.3539522802377779
Epoch: 20, step: 898, loss: 0.33014094829559326, mean loss: 0.35395148063631576
Epoch: 20, step: 899, loss: 0.31934458017349243, mean loss: 0.35395031855100806
Epoch: 20, step: 900, loss: 0.3177414536476135, mean loss: 0.3539491027132288
Epoch: 20, step: 901, loss: 0.3413589298725128, mean loss: 0.35394867996885837
Epoch: 20, step: 902, loss: 0.3226287364959717, mean loss: 0.3539476283641351
Epoch: 20, step: 903, loss: 0.3350193500518799, mean loss: 0.3539469928457927
Epoch: 20, step: 904, loss: 0.3337043225765228, mean loss: 0.3539463132194617
Epoch: 20, step: 905, loss: 0.3023918867111206, mean loss: 0.35394458239200893
Epoch: 20, step: 906, loss: 0.3827204704284668, mean loss: 0.35394554844726916
Epoch: 20, step: 907, loss: 0.3117994964122772, mean loss: 0.353944133580476
Epoch: 20, step: 908, loss: 0.2839280962944031, mean loss: 0.3539417831814265
Epoch: 20, step: 909, loss: 0.4113841652870178, mean loss: 0.35394371142520314
Epoch: 20, step: 910, loss: 0.33633142709732056, mean loss: 0.35394312023040175
Epoch: 20, step: 911, loss: 0.35925787687301636, mean loss: 0.35394329862583146
Epoch: 20, step: 912, loss: 0.3290437161922455, mean loss: 0.3539424628730562
Epoch: 20, step: 913, loss: 0.3399174213409424, mean loss: 0.3539419921393
Epoch: 20, step: 914, loss: 0.34972381591796875, mean loss: 0.35394185056600846
Epoch: 20, step: 915, loss: 0.3203713893890381, mean loss: 0.3539407238892338
Epoch: 20, step: 916, loss: 0.328926146030426, mean loss: 0.35393988438935603
Epoch: 20, step: 917, loss: 0.33233052492141724, mean loss: 0.35393915919439434
Epoch: 20, step: 918, loss: 0.3362036347389221, mean loss: 0.35393856402259477
Epoch: 20, step: 919, loss: 0.3356465995311737, mean loss: 0.353937950198283
Epoch: 20, step: 920, loss: 0.33616021275520325, mean loss: 0.35393735364993084
Epoch: 20, step: 921, loss: 0.32533591985702515, mean loss: 0.3539363939346838
Epoch: 20, step: 922, loss: 0.36126577854156494, mean loss: 0.35393663986242957
Epoch: 20, step: 923, loss: 0.3477873206138611, mean loss: 0.35393643353712934
Epoch: 20, step: 924, loss: 0.33762407302856445, mean loss: 0.3539358862343107
Epoch: 20, step: 925, loss: 0.31434863805770874, mean loss: 0.3539345580705794
Epoch: 20, step: 926, loss: 0.2993498146533966, mean loss: 0.35393272679794485
Epoch: 20, step: 927, loss: 0.3427846431732178, mean loss: 0.35393235280158064
Epoch: 20, step: 928, loss: 0.35942715406417847, mean loss: 0.3539325371352135
Epoch: 20, step: 929, loss: 0.36035284399986267, mean loss: 0.35393275250947936
Epoch: 20, step: 930, loss: 0.32398319244384766, mean loss: 0.3539317478615284
Epoch: 20, step: 931, loss: 0.3083874583244324, mean loss: 0.3539302201448527
Epoch: 20, step: 932, loss: 0.32578232884407043, mean loss: 0.35392927599661866
Epoch: 20, step: 933, loss: 0.3459698557853699, mean loss: 0.3539290090274025
Epoch: 20, step: 934, loss: 0.32128259539604187, mean loss: 0.35392791406132396
Epoch: 20, step: 935, loss: 0.35157251358032227, mean loss: 0.3539278350634543
Epoch: 20, step: 936, loss: 0.3253340721130371, mean loss: 0.35392687608827406
Epoch: 20, step: 937, loss: 0.33398550748825073, mean loss: 0.3539262073187858
Epoch: 20, step: 938, loss: 0.2987790107727051, mean loss: 0.35392435792086685
Epoch: 20, step: 939, loss: 0.3771549463272095, mean loss: 0.3539251369479764
Epoch: 20, step: 940, loss: 0.3275691270828247, mean loss: 0.3539242531409322
Epoch: 20, step: 941, loss: 0.31698158383369446, mean loss: 0.3539230143685726
Epoch: 20, step: 942, loss: 0.3658994436264038, mean loss: 0.35392341595222476
Epoch: 20, step: 943, loss: 0.3394584357738495, mean loss: 0.35392293094081856
Epoch: 20, step: 944, loss: 0.3509975075721741, mean loss: 0.3539228328545363
Epoch: 20, step: 945, loss: 0.3452461063861847, mean loss: 0.35392254194303396
Epoch: 20, step: 946, loss: 0.3261069655418396, mean loss: 0.3539216093793701
Epoch: 20, step: 947, loss: 0.3487808406352997, mean loss: 0.35392143703228873
Epoch: 20, step: 948, loss: 0.31797319650650024, mean loss: 0.3539202318882837
Epoch: 20, step: 949, loss: 0.29680073261260986, mean loss: 0.3539183170542483
Epoch: 20, step: 950, loss: 0.3659985065460205, mean loss: 0.3539187220084735
Epoch: 20, step: 951, loss: 0.3107580244541168, mean loss: 0.3539172752165201
Epoch: 20, step: 952, loss: 0.32382476329803467, mean loss: 0.3539162665176994
Epoch: 20, step: 953, loss: 0.31868836283683777, mean loss: 0.3539150857204989
Epoch: 20, step: 954, loss: 0.31354567408561707, mean loss: 0.35391373263145465
Epoch: 20, step: 955, loss: 0.3157702088356018, mean loss: 0.35391245419185835
Epoch: 20, step: 956, loss: 0.30151548981666565, mean loss: 0.35391069808486453
Epoch: 20, step: 957, loss: 0.31448206305503845, mean loss: 0.3539093766613432
Epoch: 20, step: 958, loss: 0.34721678495407104, mean loss: 0.35390915237126286
Epoch: 20, step: 959, loss: 0.3606119155883789, mean loss: 0.35390937699469505
Epoch: 20, step: 960, loss: 0.33177390694618225, mean loss: 0.3539086352142571
Epoch: 20, step: 961, loss: 0.3436344861984253, mean loss: 0.3539082909293896
Epoch: 20, step: 962, loss: 0.35108110308647156, mean loss: 0.35390819619401304
Epoch: 20, step: 963, loss: 0.32759860157966614, mean loss: 0.3539073146233585
Epoch: 20, step: 964, loss: 0.3338649272918701, mean loss: 0.3539066430741097
Epoch: 20, step: 965, loss: 0.3597140908241272, mean loss: 0.3539068376545476
Epoch: 20, step: 966, loss: 0.3330058753490448, mean loss: 0.3539061373844265
Epoch: 20, step: 967, loss: 0.34758031368255615, mean loss: 0.3539059254498345
Epoch: 20, step: 968, loss: 0.326318621635437, mean loss: 0.35390500122108937
Epoch: 20, step: 969, loss: 0.33221912384033203, mean loss: 0.35390427472603475
Epoch: 20, step: 970, loss: 0.31482043862342834, mean loss: 0.35390296542865435
Epoch: 20, step: 971, loss: 0.3231460452079773, mean loss: 0.3539019351151001
Epoch: 20, step: 972, loss: 0.32022687792778015, mean loss: 0.35390080708585053
Epoch: 20, step: 973, loss: 0.35642436146736145, mean loss: 0.35390089161570853
Epoch: 20, step: 974, loss: 0.29936400055885315, mean loss: 0.35389906489016654
Epoch: 20, step: 975, loss: 0.28499430418014526, mean loss: 0.35389675698687373
Epoch: 20, step: 976, loss: 0.35843726992607117, mean loss: 0.3538969090621974
Epoch: 20, step: 977, loss: 0.35190120339393616, mean loss: 0.3538968422222996
Epoch: 20, step: 978, loss: 0.29729053378105164, mean loss: 0.35389494643515196
Epoch: 20, step: 979, loss: 0.32317420840263367, mean loss: 0.35389391760936384
Epoch: 20, step: 980, loss: 0.3599244952201843, mean loss: 0.35389411956434225
Epoch: 20, step: 981, loss: 0.3439457416534424, mean loss: 0.35389378641927793
Epoch: 20, step: 982, loss: 0.331171452999115, mean loss: 0.353893025533452
Epoch: 20, step: 983, loss: 0.30739495158195496, mean loss: 0.35389146853928
Epoch: 20, step: 984, loss: 0.3089485466480255, mean loss: 0.3538899636699717
Epoch: 20, step: 985, loss: 0.32538551092147827, mean loss: 0.3538890092585089
Epoch: 20, step: 986, loss: 0.329721063375473, mean loss: 0.3538882000729234
Epoch: 20, step: 987, loss: 0.3456900119781494, mean loss: 0.353887925592272
Epoch: 20, step: 988, loss: 0.32869434356689453, mean loss: 0.3538870821230556
Epoch: 20, step: 989, loss: 0.3457004129886627, mean loss: 0.35388680804641903
Epoch: 20, step: 990, loss: 0.3372707962989807, mean loss: 0.3538862517874472
Epoch: 20, step: 991, loss: 0.30940085649490356, mean loss: 0.3538847625870156
Epoch: 20, step: 992, loss: 0.32979822158813477, mean loss: 0.35388395628898733
Epoch: 20, step: 993, loss: 0.32444536685943604, mean loss: 0.3538829708638876
Epoch: 20, step: 994, loss: 0.3416612446308136, mean loss: 0.35388256176844884
Epoch: 20, step: 995, loss: 0.3080226480960846, mean loss: 0.35388102675995803
Epoch: 20, step: 996, loss: 0.35376283526420593, mean loss: 0.35388102280402217
Epoch: 20, step: 997, loss: 0.3471069931983948, mean loss: 0.35388079608102846
Epoch: 20, step: 998, loss: 0.39111220836639404, mean loss: 0.35388204215393204
Epoch: 20, step: 999, loss: 0.33960017561912537, mean loss: 0.35388156417981775
Epoch: 20, step: 1000, loss: 0.32858699560165405, mean loss: 0.35388071766970836
Epoch: 20, step: 1001, loss: 0.32365739345550537, mean loss: 0.3538797062473064
Epoch: 20, step: 1002, loss: 0.33467838168144226, mean loss: 0.35387906369720884
Epoch: 20, step: 1003, loss: 0.3158620297908783, mean loss: 0.35387779154375193
Epoch: 20, step: 1004, loss: 0.3195175528526306, mean loss: 0.3538766417950924
Epoch: 20, step: 1005, loss: 0.33891069889068604, mean loss: 0.3538761410274117
Epoch: 20, step: 1006, loss: 0.3434242308139801, mean loss: 0.35387579131314756
Epoch: 20, step: 1007, loss: 0.3233855366706848, mean loss: 0.3538747711627647
Epoch: 20, step: 1008, loss: 0.3153833746910095, mean loss: 0.3538734833513133
Epoch: 20, step: 1009, loss: 0.3481987714767456, mean loss: 0.35387329349812247
Epoch: 20, step: 1010, loss: 0.3495108485221863, mean loss: 0.35387314755302274
Epoch: 20, step: 1011, loss: 0.33944928646087646, mean loss: 0.35387266502053605
Epoch: 20, step: 1012, loss: 0.33646178245544434, mean loss: 0.3538720825804141
Epoch: 20, step: 1013, loss: 0.3484468162059784, mean loss: 0.35387190109696004
Epoch: 20, step: 1014, loss: 0.34158265590667725, mean loss: 0.3538714900166727
Epoch: 20, step: 1015, loss: 0.32953330874443054, mean loss: 0.3538706759217679
Epoch: 20, step: 1016, loss: 0.3094269931316376, mean loss: 0.3538691893618191
Epoch: 20, step: 1017, loss: 0.3244008421897888, mean loss: 0.35386820373244016
Epoch: 20, step: 1018, loss: 0.3081219494342804, mean loss: 0.35386667370620856
Epoch: 20, step: 1019, loss: 0.3678973317146301, mean loss: 0.35386714295898475
Epoch: 20, step: 1020, loss: 0.3264705240726471, mean loss: 0.3538662267147492
Epoch: 20, step: 1021, loss: 0.3140266239643097, mean loss: 0.35386489437568325
Epoch: 20, step: 1022, loss: 0.3187764286994934, mean loss: 0.3538637209661365
Epoch: 20, step: 1023, loss: 0.29239025712013245, mean loss: 0.35386166527245516
Epoch: 20, step: 1024, loss: 0.3388269245624542, mean loss: 0.35386116252238964
Epoch: 20, step: 1025, loss: 0.34279486536979675, mean loss: 0.3538607924863717
Epoch: 20, step: 1026, loss: 0.3320407569408417, mean loss: 0.3538600628901051
Epoch: 20, step: 1027, loss: 0.30366793274879456, mean loss: 0.3538583846725666
Epoch: 20, step: 1028, loss: 0.3551860451698303, mean loss: 0.35385842906256615
Epoch: 20, step: 1029, loss: 0.3503476083278656, mean loss: 0.35385831168306986
Epoch: 20, step: 1030, loss: 0.3230409026145935, mean loss: 0.35385728137953376
Epoch: 20, step: 1031, loss: 0.3376121520996094, mean loss: 0.35385673828213876
Epoch: 20, step: 1032, loss: 0.34803956747055054, mean loss: 0.35385654381248305
Epoch: 20, step: 1033, loss: 0.36348479986190796, mean loss: 0.35385686567702973
Epoch: 20, step: 1034, loss: 0.321256548166275, mean loss: 0.3538557759121121
Epoch: 20, step: 1035, loss: 0.3874821662902832, mean loss: 0.3538568999390668
Epoch: 20, step: 1036, loss: 0.325703501701355, mean loss: 0.3538559588888867
Epoch: 20, step: 1037, loss: 0.35317540168762207, mean loss: 0.3538559361414704
Epoch: 20, step: 1038, loss: 0.3506867587566376, mean loss: 0.3538558302162261
Epoch: 20, step: 1039, loss: 0.35325607657432556, mean loss: 0.35385581017098405
Epoch: 20, step: 1040, loss: 0.3437485992908478, mean loss: 0.3538554723744238
Epoch: 20, step: 1041, loss: 0.33235108852386475, mean loss: 0.3538547536930572
Epoch: 20, step: 1042, loss: 0.3248811960220337, mean loss: 0.3538537854225739
Epoch: 20, step: 1043, loss: 0.3242056369781494, mean loss: 0.353852794640979
Epoch: 20, step: 1044, loss: 0.3208038806915283, mean loss: 0.35385169024953544
Epoch: 20, step: 1045, loss: 0.35178783535957336, mean loss: 0.3538516212842581
Epoch: 20, step: 1046, loss: 0.30428677797317505, mean loss: 0.3538499650927484
Epoch: 20, step: 1047, loss: 0.3474541902542114, mean loss: 0.35384975138736086
Epoch: 20, step: 1048, loss: 0.31124573945999146, mean loss: 0.3538483278846736
Epoch: 20, step: 1049, loss: 0.3439275920391083, mean loss: 0.3538479964200613
Epoch: 20, step: 1050, loss: 0.33818262815475464, mean loss: 0.3538474730373389
Epoch: 20, step: 1051, loss: 0.391215443611145, mean loss: 0.35384872146612995
Epoch: 20, step: 1052, loss: 0.32717767357826233, mean loss: 0.3538478304412448
Epoch: 20, step: 1053, loss: 0.3307929039001465, mean loss: 0.3538470602492711
Epoch: 20, step: 1054, loss: 0.3241064250469208, mean loss: 0.3538460667421656
Epoch: 20, step: 1055, loss: 0.31850752234458923, mean loss: 0.3538448862723501
Epoch: 20, step: 1056, loss: 0.3493169844150543, mean loss: 0.35384473502466807
Epoch: 20, step: 1057, loss: 0.34044313430786133, mean loss: 0.35384428737951085
Epoch: 20, step: 1058, loss: 0.31106138229370117, mean loss: 0.3538428583770363
Epoch: 20, step: 1059, loss: 0.33989217877388, mean loss: 0.35384239242247373
Epoch: 20, step: 1060, loss: 0.41031140089035034, mean loss: 0.35384427843190785
Epoch: 20, step: 1061, loss: 0.32837843894958496, mean loss: 0.3538434279262809
Epoch: 20, step: 1062, loss: 0.33478885889053345, mean loss: 0.35384279156489307
Epoch: 20, step: 1063, loss: 0.3356580138206482, mean loss: 0.3538421842720216
Epoch: 20, step: 1064, loss: 0.3152627646923065, mean loss: 0.3538408959294075
Epoch: 20, step: 1065, loss: 0.3811093270778656, mean loss: 0.3538418065161686
Epoch: 20, step: 1066, loss: 0.3379110097885132, mean loss: 0.35384127454980374
Epoch: 20, step: 1067, loss: 0.32058414816856384, mean loss: 0.3538401640540651
Epoch: 20, step: 1068, loss: 0.31438595056533813, mean loss: 0.3538388466740695
Epoch: 20, step: 1069, loss: 0.3252286911010742, mean loss: 0.35383789141011046
Epoch: 20, step: 1070, loss: 0.33721214532852173, mean loss: 0.353837336311914
Epoch: 20, step: 1071, loss: 0.34962376952171326, mean loss: 0.353837195634604
Epoch: 20, step: 1072, loss: 0.32053783535957336, mean loss: 0.3538360839142329
Epoch: 20, step: 1073, loss: 0.35669443011283875, mean loss: 0.3538361793387571
Epoch: 20, step: 1074, loss: 0.33976542949676514, mean loss: 0.353835709609168
Epoch: 20, step: 1075, loss: 0.3532218635082245, mean loss: 0.35383568911757696
Epoch: 20, step: 1076, loss: 0.34945812821388245, mean loss: 0.3538355429894298
Epoch: 20, step: 1077, loss: 0.3377118408679962, mean loss: 0.3538350047791981
Epoch: 20, step: 1078, loss: 0.324446439743042, mean loss: 0.35383402381971896
Epoch: 20, step: 1079, loss: 0.3301140069961548, mean loss: 0.353833232096861
Epoch: 20, step: 1080, loss: 0.352183997631073, mean loss: 0.35383317705081896
Epoch: 20, step: 1081, loss: 0.29683157801628113, mean loss: 0.3538312745877312
Epoch: 20, step: 1082, loss: 0.3519512712955475, mean loss: 0.35383121184357036
Epoch: 20, step: 1083, loss: 0.305182546377182, mean loss: 0.35382958827310357
Epoch: 20, step: 1084, loss: 0.3243984282016754, mean loss: 0.35382860608855254
Epoch: 20, step: 1085, loss: 0.3062901794910431, mean loss: 0.35382701967639885
Epoch: 20, step: 1086, loss: 0.34979766607284546, mean loss: 0.3538268852167064
Epoch: 20, step: 1087, loss: 0.31355389952659607, mean loss: 0.3538255413503927
Epoch: 20, step: 1088, loss: 0.35785695910453796, mean loss: 0.3538256758699881
Epoch: 20, step: 1089, loss: 0.32767125964164734, mean loss: 0.35382480318342724
Epoch: 20, step: 1090, loss: 0.3311804533004761, mean loss: 0.3538240476414072
Epoch: 20, step: 1091, loss: 0.30138126015663147, mean loss: 0.3538222979154134
Epoch: 20, step: 1092, loss: 0.3213155269622803, mean loss: 0.35382121338030004
Epoch: 20, step: 1093, loss: 0.3204123377799988, mean loss: 0.3538200987851309
Epoch: 20, step: 1094, loss: 0.3530130684375763, mean loss: 0.35382007186168307
Epoch: 20, step: 1095, loss: 0.34224432706832886, mean loss: 0.3538196856945896
Epoch: 20, step: 1096, loss: 0.3181890547275543, mean loss: 0.3538184970956315
Epoch: 20, step: 1097, loss: 0.30452993512153625, mean loss: 0.35381685293785
Epoch: 20, step: 1098, loss: 0.3383360803127289, mean loss: 0.3538163365506248
Epoch: 20, step: 1099, loss: 0.4134949743747711, mean loss: 0.35381832716562894
Epoch: 20, step: 1100, loss: 0.33758994936943054, mean loss: 0.3538177858768862
Epoch: 20, step: 1101, loss: 0.32809388637542725, mean loss: 0.35381692789878266
Epoch: 20, step: 1102, loss: 0.3299010097980499, mean loss: 0.35381613024951136
Epoch: 20, step: 1103, loss: 0.3489692211151123, mean loss: 0.3538159685996603
Epoch: 20, step: 1104, loss: 0.3200015425682068, mean loss: 0.3538148408882702
Epoch: 20, step: 1105, loss: 0.32361653447151184, mean loss: 0.35381383380808556
Epoch: 20, step: 1106, loss: 0.2652794122695923, mean loss: 0.353810881381316
Epoch: 20, step: 1107, loss: 0.32762467861175537, mean loss: 0.35381000815860125
Epoch: 20, step: 1108, loss: 0.3078433871269226, mean loss: 0.35380847537587984
Epoch: 20, step: 1109, loss: 0.33789417147636414, mean loss: 0.3538079447221986
Epoch: 20, step: 1110, loss: 0.3164686858654022, mean loss: 0.35380669970673206
Epoch: 20, step: 1111, loss: 0.3321893811225891, mean loss: 0.35380597893724075
Epoch: 20, step: 1112, loss: 0.31045886874198914, mean loss: 0.3538045336963447
Epoch: 20, step: 1113, loss: 0.325302392244339, mean loss: 0.35380358343491064
Epoch: 20, step: 1114, loss: 0.31216832995414734, mean loss: 0.3538021953617824
Epoch: 20, step: 1115, loss: 0.31884562969207764, mean loss: 0.35380102998754354
Epoch: 20, step: 1116, loss: 0.3132766783237457, mean loss: 0.35379967904072673
Epoch: 20, step: 1117, loss: 0.3256951868534088, mean loss: 0.3537987421618619
Epoch: 20, step: 1118, loss: 0.3104003667831421, mean loss: 0.35379729550112726
Epoch: 20, step: 1119, loss: 0.3384726941585541, mean loss: 0.3537967846810825
Epoch: 20, step: 1120, loss: 0.31515657901763916, mean loss: 0.3537954967171592
Epoch: 20, step: 1121, loss: 0.33155357837677, mean loss: 0.3537947553693044
Epoch: 20, step: 1122, loss: 0.34386393427848816, mean loss: 0.3537944243750341
Epoch: 20, step: 1123, loss: 0.3258390724658966, mean loss: 0.3537934926541999
Epoch: 20, step: 1124, loss: 0.33006352186203003, mean loss: 0.3537927017869847
Epoch: 20, step: 1125, loss: 0.3428015410900116, mean loss: 0.3537923354882212
Epoch: 20, step: 1126, loss: 0.3046151101589203, mean loss: 0.3537906966297772
Epoch: 20, step: 1127, loss: 0.31546592712402344, mean loss: 0.3537894194780341
Epoch: 20, step: 1128, loss: 0.3204832077026367, mean loss: 0.35378830960393715
Epoch: 20, step: 1129, loss: 0.3050232529640198, mean loss: 0.35378668464370255
Epoch: 20, step: 1130, loss: 0.3214201033115387, mean loss: 0.3537856061531047
Epoch: 20, step: 1131, loss: 0.3628401756286621, mean loss: 0.3537859078514079
Epoch: 20, step: 1132, loss: 0.32742685079574585, mean loss: 0.35378502959674973
Epoch: 20, step: 1133, loss: 0.31636562943458557, mean loss: 0.35378378286521905
Epoch: 20, step: 1134, loss: 0.31220871210098267, mean loss: 0.35378239772209846
Epoch: 20, step: 1135, loss: 0.3599448502063751, mean loss: 0.35378260302768494
Epoch: 20, step: 1136, loss: 0.29724565148353577, mean loss: 0.35378071952994883
Epoch: 20, step: 1137, loss: 0.35064154863357544, mean loss: 0.3537806149536647
Epoch: 20, step: 1138, loss: 0.36255744099617004, mean loss: 0.3537809073293615
Epoch: 20, step: 1139, loss: 0.33509182929992676, mean loss: 0.35378028477513
Epoch: 20, step: 1140, loss: 0.3741036355495453, mean loss: 0.35378096174627605
Epoch: 20, step: 1141, loss: 0.3613820970058441, mean loss: 0.353781214931782
Epoch: 20, step: 1142, loss: 0.30980661511421204, mean loss: 0.35377975023472247
Epoch: 20, step: 1143, loss: 0.3341820240020752, mean loss: 0.35377909749936964
Epoch: 20, step: 1144, loss: 0.3554418683052063, mean loss: 0.35377915287891354
Epoch: 20, step: 1145, loss: 0.32849597930908203, mean loss: 0.3537783108362315
Epoch: 20, step: 1146, loss: 0.3064294159412384, mean loss: 0.3537767339589246
Epoch: 20, step: 1147, loss: 0.33002424240112305, mean loss: 0.3537759429474834
Epoch: 20, step: 1148, loss: 0.3095110058784485, mean loss: 0.3537744688745183
Epoch: 20, step: 1149, loss: 0.3778092563152313, mean loss: 0.3537752692337404
Epoch: 20, step: 1150, loss: 0.2895570695400238, mean loss: 0.3537731308367608
Epoch: 20, step: 1151, loss: 0.33775198459625244, mean loss: 0.3537725973675866
Epoch: 20, step: 1152, loss: 0.3016667068004608, mean loss: 0.3537708624130177
Epoch: 20, step: 1153, loss: 0.3270498216152191, mean loss: 0.35376997271997657
Epoch: 20, step: 1154, loss: 0.2978905439376831, mean loss: 0.35376811224290705
Epoch: 20, step: 1155, loss: 0.38145968317985535, mean loss: 0.3537690341889364
Epoch: 20, step: 1156, loss: 0.3209591507911682, mean loss: 0.3537679418733457
Epoch: 20, step: 1157, loss: 0.31814223527908325, mean loss: 0.35376675585208617
Epoch: 20, step: 1158, loss: 0.33685463666915894, mean loss: 0.3537661928466871
Epoch: 20, step: 1159, loss: 0.3385716378688812, mean loss: 0.35376568703593547
Epoch: 20, step: 1160, loss: 0.38350391387939453, mean loss: 0.3537666769572711
Epoch: 20, step: 1161, loss: 0.34921228885650635, mean loss: 0.3537665253565754
Epoch: 20, step: 1162, loss: 0.3937833309173584, mean loss: 0.35376785734091654
Epoch: 20, step: 1163, loss: 0.3307640850543976, mean loss: 0.3537670916714888
Epoch: 20, step: 1164, loss: 0.2961914539337158, mean loss: 0.35376517535803437
Epoch: 20, step: 1165, loss: 0.32266050577163696, mean loss: 0.3537641401230751
Epoch: 20, step: 1166, loss: 0.342879056930542, mean loss: 0.35376377785452273
Epoch: 20, step: 1167, loss: 0.3316909372806549, mean loss: 0.3537630432685079
Epoch: 20, step: 1168, loss: 0.3092724680900574, mean loss: 0.35376156266765
Epoch: 20, step: 1169, loss: 0.29354798793792725, mean loss: 0.3537595588881249
Epoch: 20, step: 1170, loss: 0.3237471282482147, mean loss: 0.35375856017158835
Epoch: 20, step: 1171, loss: 0.3153323829174042, mean loss: 0.3537572815153507
Epoch: 20, step: 1172, loss: 0.30143222212791443, mean loss: 0.3537555404226349
Epoch: 20, step: 1173, loss: 0.35512563586235046, mean loss: 0.3537555860104249
Epoch: 20, step: 1174, loss: 0.3565737307071686, mean loss: 0.35375567977667666
Epoch: 20, step: 1175, loss: 0.34554895758628845, mean loss: 0.3537554067289594
Epoch: 20, step: 1176, loss: 0.3220890164375305, mean loss: 0.3537543531843511
Epoch: 20, step: 1177, loss: 0.30896133184432983, mean loss: 0.353752862964731
Epoch: 20, step: 1178, loss: 0.3245369493961334, mean loss: 0.3537518910124515
Epoch: 20, step: 1179, loss: 0.34221789240837097, mean loss: 0.35375150731322985
Epoch: 20, step: 1180, loss: 0.3075464367866516, mean loss: 0.3537499702695345
Epoch: 20, step: 1181, loss: 0.3165857493877411, mean loss: 0.35374873401709345
Epoch: 20, step: 1182, loss: 0.3348061442375183, mean loss: 0.3537481039206367
Epoch: 20, step: 1183, loss: 0.36440837383270264, mean loss: 0.35374845850651726
Epoch: 20, step: 1184, loss: 0.32530391216278076, mean loss: 0.3537475124048594
Epoch: 20, step: 1185, loss: 0.3078218996524811, mean loss: 0.3537459849115862
Epoch: 20, step: 1186, loss: 0.32716336846351624, mean loss: 0.35374510079888966
Epoch: 20, step: 1187, loss: 0.3211956024169922, mean loss: 0.3537440182693439
Epoch: 20, step: 1188, loss: 0.3229133188724518, mean loss: 0.3537429929376269
Epoch: 20, step: 1189, loss: 0.34181198477745056, mean loss: 0.353742596163162
Epoch: 20, step: 1190, loss: 0.33989500999450684, mean loss: 0.3537421356667978
Epoch: 20, step: 1191, loss: 0.35733020305633545, mean loss: 0.35374225498268597
Epoch: 20, step: 1192, loss: 0.3432042598724365, mean loss: 0.35374190456885596
Epoch: 20, step: 1193, loss: 0.3347841799259186, mean loss: 0.353741274199612
Epoch: 20, step: 1194, loss: 0.3388344347476959, mean loss: 0.35374077854410235
Epoch: 20, step: 1195, loss: 0.3402435779571533, mean loss: 0.35374032977429964
Epoch: 20, step: 1196, loss: 0.3432367444038391, mean loss: 0.35373998055112676
Epoch: 20, step: 1197, loss: 0.3048834800720215, mean loss: 0.3537383562243604
Epoch: 20, step: 1198, loss: 0.34232211112976074, mean loss: 0.35373797668231793
Epoch: 20, step: 1199, loss: 0.31343957781791687, mean loss: 0.35373663697490887
Epoch: 20, step: 1200, loss: 0.2926900386810303, mean loss: 0.35373460756769853
Epoch: 20, step: 1201, loss: 0.3175598680973053, mean loss: 0.35373340502998596
Epoch: 20, step: 1202, loss: 0.3115208148956299, mean loss: 0.35373200182584624
Epoch: 20, step: 1203, loss: 0.31442418694496155, mean loss: 0.3537306952238358
Epoch: 20, step: 1204, loss: 0.31906071305274963, mean loss: 0.3537295428228994
Epoch: 20, step: 1205, loss: 0.33237677812576294, mean loss: 0.35372883309861913
Epoch: 20, step: 1206, loss: 0.3159242272377014, mean loss: 0.3537275765889684
Epoch: 20, step: 1207, loss: 0.36422404646873474, mean loss: 0.353727925447978
Epoch: 20, step: 1208, loss: 0.32102906703948975, mean loss: 0.3537268387100203
Epoch: 20, step: 1209, loss: 0.32911932468414307, mean loss: 0.35372602091294403
Epoch: 20, step: 1210, loss: 0.35157787799835205, mean loss: 0.35372594952472447
Epoch: 20, step: 1211, loss: 0.34949791431427, mean loss: 0.35372580902109524
Epoch: 20, step: 1212, loss: 0.3290926218032837, mean loss: 0.35372499045241756
Epoch: 20, step: 1213, loss: 0.3193027973175049, mean loss: 0.35372384662995676
Epoch: 20, step: 1214, loss: 0.31286218762397766, mean loss: 0.3537224888742164
Epoch: 20, step: 1215, loss: 0.3226490020751953, mean loss: 0.3537214563952558
Epoch: 20, step: 1216, loss: 0.3851500451564789, mean loss: 0.3537225006384947
Epoch: 20, step: 1217, loss: 0.355133593082428, mean loss: 0.3537225475217575
Epoch: 20, step: 1218, loss: 0.332954466342926, mean loss: 0.3537218575293598
Epoch: 20, step: 1219, loss: 0.34226205945014954, mean loss: 0.35372147680517113
Epoch: 20, step: 1220, loss: 0.30598434805870056, mean loss: 0.35371989090673767
Epoch: 20, step: 1221, loss: 0.3535062074661255, mean loss: 0.3537198838080917
Epoch: 20, step: 1222, loss: 0.32674530148506165, mean loss: 0.35371898773187593
Epoch: 20, step: 1223, loss: 0.36162203550338745, mean loss: 0.3537192502567155
Epoch: 20, step: 1224, loss: 0.3157755732536316, mean loss: 0.35371798987880476
Epoch: 20, step: 1225, loss: 0.28732410073280334, mean loss: 0.3537157845413589
Epoch: 20, step: 1226, loss: 0.28767138719558716, mean loss: 0.35371359088548665
Epoch: 20, step: 1227, loss: 0.3205716609954834, mean loss: 0.353712490117256
Epoch: 20, step: 1228, loss: 0.3758756220340729, mean loss: 0.3537132262138356
Epoch: 20, step: 1229, loss: 0.33108022809028625, mean loss: 0.3537124745367143
Epoch: 20, step: 1230, loss: 0.3102884888648987, mean loss: 0.35371103240640733
Epoch: 20, step: 1231, loss: 0.32223495841026306, mean loss: 0.3537099871063942
Epoch: 20, step: 1232, loss: 0.3235015869140625, mean loss: 0.35370898393832084
Epoch: 20, step: 1233, loss: 0.38942113518714905, mean loss: 0.3537101698369477
Epoch: 20, step: 1234, loss: 0.36197343468666077, mean loss: 0.35371044422727976
Epoch: 20, step: 1235, loss: 0.3104148507118225, mean loss: 0.35370900659965604
Epoch: 20, step: 1236, loss: 0.35180044174194336, mean loss: 0.353708943227977
Epoch: 20, step: 1237, loss: 0.37896305322647095, mean loss: 0.35370978173352186
Epoch: 20, step: 1238, loss: 0.39771586656570435, mean loss: 0.3537112428074231
Epoch: 20, step: 1239, loss: 0.3419066369533539, mean loss: 0.35371085088823806
Epoch: 20, step: 1240, loss: 0.2967053949832916, mean loss: 0.3537089583396539
Epoch: 20, step: 1241, loss: 0.3324854373931885, mean loss: 0.35370825375426956
Epoch: 20, step: 1242, loss: 0.3402310609817505, mean loss: 0.3537078063488726
Epoch: 20, step: 1243, loss: 0.3117276132106781, mean loss: 0.35370641276923054
Epoch: 20, step: 1244, loss: 0.3387131989002228, mean loss: 0.3537059150691851
Epoch: 20, step: 1245, loss: 0.34645411372184753, mean loss: 0.3537056743534795
Epoch: 20, step: 1246, loss: 0.34351733326911926, mean loss: 0.35370533617373756
Epoch: 20, step: 1247, loss: 0.3220565915107727, mean loss: 0.3537042856976136
Epoch: 20, step: 1248, loss: 0.37138915061950684, mean loss: 0.3537048726691334
Epoch: 20, step: 1249, loss: 0.32693102955818176, mean loss: 0.35370398405834313
Epoch: 20, step: 1250, loss: 0.32545119524002075, mean loss: 0.35370304639318706
Epoch: 20, step: 1251, loss: 0.3022666871547699, mean loss: 0.3537013393588303
Epoch: 20, step: 1252, loss: 0.32348933815956116, mean loss: 0.35370033673708007
Epoch: 20, step: 1253, loss: 0.31287881731987, mean loss: 0.35369898207060974
Epoch: 20, step: 1254, loss: 0.2996155321598053, mean loss: 0.35369718736512074
Epoch: 20, step: 1255, loss: 0.3190002143383026, mean loss: 0.35369603601878985
Epoch: 20, step: 1256, loss: 0.3293173909187317, mean loss: 0.35369522709138834
Epoch: 20, step: 1257, loss: 0.36456626653671265, mean loss: 0.35369558780010973
Epoch: 20, step: 1258, loss: 0.3297501504421234, mean loss: 0.3536947933000481
Epoch: 20, step: 1259, loss: 0.32703039050102234, mean loss: 0.353693908615151
Epoch: 20, step: 1260, loss: 0.3383709788322449, mean loss: 0.3536934002401872
Epoch: 20, step: 1261, loss: 0.3124196529388428, mean loss: 0.353692030930012
Epoch: 20, step: 1262, loss: 0.3204660415649414, mean loss: 0.3536909286512287
Epoch: 20, step: 1263, loss: 0.3225238025188446, mean loss: 0.35368989470994244
Epoch: 20, step: 1264, loss: 0.32418569922447205, mean loss: 0.3536889159673488
Epoch: 20, step: 1265, loss: 0.2961072027683258, mean loss: 0.3536870058727028
Epoch: 20, step: 1266, loss: 0.36434483528137207, mean loss: 0.3536873594013925
Epoch: 20, step: 1267, loss: 0.33013442158699036, mean loss: 0.3536865781576014
Epoch: 20, step: 1268, loss: 0.3581683337688446, mean loss: 0.35368672681114255
Epoch: 20, step: 1269, loss: 0.34513017535209656, mean loss: 0.3536864430117575
Epoch: 20, step: 1270, loss: 0.32321587204933167, mean loss: 0.3536854324127405
Epoch: 20, step: 1271, loss: 0.3332121968269348, mean loss: 0.3536847534118256
Epoch: 20, step: 1272, loss: 0.30897119641304016, mean loss: 0.35368327052266035
Epoch: 20, step: 1273, loss: 0.3169002830982208, mean loss: 0.3536820506849133
Epoch: 20, step: 1274, loss: 0.33233773708343506, mean loss: 0.3536813428648635
Epoch: 20, step: 1275, loss: 0.3279581665992737, mean loss: 0.3536804898612733
Epoch: 20, step: 1276, loss: 0.2927330732345581, mean loss: 0.3536784688573065
Epoch: 20, step: 1277, loss: 0.3485538065433502, mean loss: 0.35367829893017894
Epoch: 20, step: 1278, loss: 0.32276999950408936, mean loss: 0.3536772740852097
Epoch: 20, step: 1279, loss: 0.3477301299571991, mean loss: 0.35367707689873334
Epoch: 20, step: 1280, loss: 0.3436378836631775, mean loss: 0.3536767440452724
Epoch: 20, step: 1281, loss: 0.348905086517334, mean loss: 0.35367658584430667
Epoch: 20, step: 1282, loss: 0.3486391007900238, mean loss: 0.3536764188355524
Epoch: 20, step: 1283, loss: 0.2975893020629883, mean loss: 0.3536745594297451
Epoch: 20, step: 1284, loss: 0.3138505518436432, mean loss: 0.3536732392239574
Epoch: 20, step: 1285, loss: 0.3056747317314148, mean loss: 0.35367164807804835
Epoch: 20, step: 1286, loss: 0.3490079343318939, mean loss: 0.3536714934815109
Epoch: 20, step: 1287, loss: 0.3863028883934021, mean loss: 0.35367257513740163
Epoch: 20, step: 1288, loss: 0.3132542073726654, mean loss: 0.3536712354056318
Epoch: 20, step: 1289, loss: 0.2959655523300171, mean loss: 0.35366932272140655
Epoch: 20, step: 1290, loss: 0.32622218132019043, mean loss: 0.3536684130020933
Epoch: 20, step: 1291, loss: 0.34106364846229553, mean loss: 0.3536679952384535
Epoch: 20, step: 1292, loss: 0.37902408838272095, mean loss: 0.35366883559549933
Epoch: 20, step: 1293, loss: 0.39209991693496704, mean loss: 0.35367010924438047
Epoch: 20, step: 1294, loss: 0.3594081699848175, mean loss: 0.3536702994038085
Epoch: 20, step: 1295, loss: 0.3601089417934418, mean loss: 0.3536705127734529
Epoch: 20, step: 1296, loss: 0.3306867182254791, mean loss: 0.3536697511406018
Epoch: 20, step: 1297, loss: 0.35205841064453125, mean loss: 0.35366969774605955
Epoch: 20, step: 1298, loss: 0.3975205421447754, mean loss: 0.3536711507711564
Epoch: 20, step: 1299, loss: 0.30237534642219543, mean loss: 0.35366945110898446
Epoch: 20, step: 1300, loss: 0.34551987051963806, mean loss: 0.3536691810854402
Epoch: 20, step: 1301, loss: 0.3721995949745178, mean loss: 0.353669795041238
Epoch: 20, step: 1302, loss: 0.3208100199699402, mean loss: 0.3536687063563799
Epoch: 20, step: 1303, loss: 0.3604462742805481, mean loss: 0.3536689308981214
Epoch: 20, step: 1304, loss: 0.34648874402046204, mean loss: 0.35366869302544035
Epoch: 20, step: 1305, loss: 0.36013925075531006, mean loss: 0.35366890738168927
Epoch: 20, step: 1306, loss: 0.3367892801761627, mean loss: 0.3536683482129343
Epoch: 20, step: 1307, loss: 0.32804837822914124, mean loss: 0.3536674995323333
Epoch: 20, step: 1308, loss: 0.32497313618659973, mean loss: 0.3536665490416464
Epoch: 20, step: 1309, loss: 0.3481108844280243, mean loss: 0.3536663650183071
Epoch: 20, step: 1310, loss: 0.4035976231098175, mean loss: 0.353668018864092
Epoch: 20, step: 1311, loss: 0.4252014458179474, mean loss: 0.3536703881482386
Epoch: 20, step: 1312, loss: 0.32620251178741455, mean loss: 0.35366947840504115
Epoch: 20, step: 1313, loss: 0.3545730412006378, mean loss: 0.35366950833028443
Epoch: 20, step: 1314, loss: 0.3218955993652344, mean loss: 0.3536684560398733
Epoch: 20, step: 1315, loss: 0.3323895037174225, mean loss: 0.353667751345466
Epoch: 20, step: 1316, loss: 0.29998481273651123, mean loss: 0.35366597358811896
Epoch: 20, step: 1317, loss: 0.3196498155593872, mean loss: 0.3536648471506718
Epoch: 20, step: 1318, loss: 0.319916307926178, mean loss: 0.3536637296123684
Epoch: 20, step: 1319, loss: 0.3386956453323364, mean loss: 0.35366323398043864
Epoch: 20, step: 1320, loss: 0.3142930567264557, mean loss: 0.35366193037535093
Epoch: 20, step: 1321, loss: 0.3238571882247925, mean loss: 0.35366094352871325
Epoch: 20, step: 1322, loss: 0.30255749821662903, mean loss: 0.3536592515297293
Epoch: 20, step: 1323, loss: 0.32485201954841614, mean loss: 0.3536582977742009
Epoch: 20, step: 1324, loss: 0.32953211665153503, mean loss: 0.3536574990262743
Epoch: 20, step: 1325, loss: 0.3468666970729828, mean loss: 0.35365727420994797
Epoch: 20, step: 1326, loss: 0.31898367404937744, mean loss: 0.3536561263435541
Epoch: 20, step: 1327, loss: 0.31981050968170166, mean loss: 0.35365500592457033
Epoch: 20, step: 1328, loss: 0.30128347873687744, mean loss: 0.35365327228468857
Epoch: 20, step: 1329, loss: 0.3545590937137604, mean loss: 0.3536533022688471
Epoch: 20, step: 1330, loss: 0.3638649880886078, mean loss: 0.35365364028102214
Epoch: 20, step: 1331, loss: 0.341632217168808, mean loss: 0.35365324237876106
Epoch: 20, step: 1332, loss: 0.33069896697998047, mean loss: 0.3536524826304607
Epoch: 20, step: 1333, loss: 0.3520744740962982, mean loss: 0.353652430402734
Epoch: 20, step: 1334, loss: 0.36641940474510193, mean loss: 0.3536528529403591
Epoch: 20, step: 1335, loss: 0.33320316672325134, mean loss: 0.35365217615699207
Epoch: 20, step: 1336, loss: 0.330966979265213, mean loss: 0.3536514254141357
Epoch: 20, step: 1337, loss: 0.36019232869148254, mean loss: 0.3536516418713227
Epoch: 20, step: 1338, loss: 0.3407171964645386, mean loss: 0.3536512138477148
Epoch: 20, step: 1339, loss: 0.363323837518692, mean loss: 0.35365153392129756
Epoch: 20, step: 1340, loss: 0.3344002366065979, mean loss: 0.3536508969040806
Epoch: 20, step: 1341, loss: 0.31332266330718994, mean loss: 0.35364956250418655
Epoch: 20, step: 1342, loss: 0.3258665204048157, mean loss: 0.35364864323601003
Epoch: 20, step: 1343, loss: 0.35787540674209595, mean loss: 0.3536487830839291
Epoch: 20, step: 1344, loss: 0.3436712920665741, mean loss: 0.35364845297669945
Epoch: 20, step: 1345, loss: 0.33811330795288086, mean loss: 0.35364793901041136
Epoch: 20, step: 1346, loss: 0.3321032226085663, mean loss: 0.3536472262464453
Epoch: 20, step: 1347, loss: 0.3641674518585205, mean loss: 0.3536475742756107
Epoch: 20, step: 1348, loss: 0.31047338247299194, mean loss: 0.35364614603809696
Epoch: 20, step: 1349, loss: 0.36456966400146484, mean loss: 0.3536465073850359
Epoch: 20, step: 1350, loss: 0.33544957637786865, mean loss: 0.3536459054555262
Epoch: 20, step: 1351, loss: 0.310178279876709, mean loss: 0.3536444676536746
Epoch: 20, step: 1352, loss: 0.34781792759895325, mean loss: 0.3536442749324741
Epoch: 20, step: 1353, loss: 0.31688809394836426, mean loss: 0.35364305920908373
Epoch: 20, step: 1354, loss: 0.3485548198223114, mean loss: 0.35364289091937356
Epoch: 20, step: 1355, loss: 0.3775475323200226, mean loss: 0.35364368152135134
Epoch: 20, step: 1356, loss: 0.36298924684524536, mean loss: 0.3536439905984861
Epoch: 20, step: 1357, loss: 0.30235958099365234, mean loss: 0.3536422945732991
Epoch: 20, step: 1358, loss: 0.3119219243526459, mean loss: 0.3536409148858021
Epoch: 20, step: 1359, loss: 0.3672761619091034, mean loss: 0.35364136578682803
Epoch: 20, step: 1360, loss: 0.293253630399704, mean loss: 0.353639368903941
Epoch: 20, step: 1361, loss: 0.3383078873157501, mean loss: 0.3536388619440313
Epoch: 20, step: 1362, loss: 0.2988929748535156, mean loss: 0.3536370517437506
Epoch: 20, step: 1363, loss: 0.2875959873199463, mean loss: 0.35363486813495465
Epoch: 20, step: 1364, loss: 0.3440822660923004, mean loss: 0.3536345522942523
Epoch: 20, step: 1365, loss: 0.28634947538375854, mean loss: 0.3536323277000279
Epoch: 20, step: 1366, loss: 0.3383486568927765, mean loss: 0.3536318224046
Epoch: 20, step: 1367, loss: 0.30782684683799744, mean loss: 0.35363030809041174
Epoch: 20, step: 1368, loss: 0.34262174367904663, mean loss: 0.35362994415889626
Epoch: 20, step: 1369, loss: 0.3191571533679962, mean loss: 0.3536288045625065
Epoch: 20, step: 1370, loss: 0.32803580164909363, mean loss: 0.3536279585407911
Epoch: 20, step: 1371, loss: 0.3203928470611572, mean loss: 0.35362685993205517
Epoch: 20, step: 1372, loss: 0.33796054124832153, mean loss: 0.353626342088579
Epoch: 20, step: 1373, loss: 0.3379819393157959, mean loss: 0.35362582498661654
Epoch: 20, step: 1374, loss: 0.35041284561157227, mean loss: 0.3536257187899755
Epoch: 20, step: 1375, loss: 0.33581894636154175, mean loss: 0.3536251302530761
Epoch: 20, step: 1376, loss: 0.35172727704048157, mean loss: 0.3536250675286417
Epoch: 20, step: 1377, loss: 0.3386443853378296, mean loss: 0.35362457243041345
Epoch: 20, step: 1378, loss: 0.32890382409095764, mean loss: 0.3536237554586583
Epoch: 20, step: 1379, loss: 0.3183151185512543, mean loss: 0.35362258861672485
Epoch: 20, step: 1380, loss: 0.38567033410072327, mean loss: 0.35362364766122056
Epoch: 20, step: 1381, loss: 0.34488558769226074, mean loss: 0.3536233589142782
Epoch: 20, step: 1382, loss: 0.325779527425766, mean loss: 0.3536224388524374
Epoch: 20, step: 1383, loss: 0.34600532054901123, mean loss: 0.35362218716335786
Epoch: 20, step: 1384, loss: 0.36239486932754517, mean loss: 0.3536224770256465
Epoch: 20, step: 1385, loss: 0.32968413829803467, mean loss: 0.35362168609394995
Epoch: 20, step: 1386, loss: 0.3505615293979645, mean loss: 0.35362158498856466
Epoch: 20, step: 1387, loss: 0.31944936513900757, mean loss: 0.3536204560001991
Epoch: 20, step: 1388, loss: 0.3157980144023895, mean loss: 0.35361920645638867
Epoch: 20, step: 1389, loss: 0.30868756771087646, mean loss: 0.35361772209435544
Epoch: 20, step: 1390, loss: 0.3272751271724701, mean loss: 0.3536168518688947
Epoch: 20, step: 1391, loss: 0.3312523066997528, mean loss: 0.3536161130823867
Epoch: 20, step: 1392, loss: 0.3220599889755249, mean loss: 0.35361507069728754
Epoch: 20, step: 1393, loss: 0.33009853959083557, mean loss: 0.3536142939075965
Epoch: 20, step: 1394, loss: 0.3172420561313629, mean loss: 0.3536130925124594
Epoch: 20, step: 1395, loss: 0.322689414024353, mean loss: 0.3536120711199872
Epoch: 20, step: 1396, loss: 0.34922298789024353, mean loss: 0.35361192615571635
Epoch: 20, step: 1397, loss: 0.3676600456237793, mean loss: 0.353612390126899
Epoch: 20, step: 1398, loss: 0.3108925521373749, mean loss: 0.35361097925342266
Epoch: 20, step: 1399, loss: 0.36508068442344666, mean loss: 0.3536113580415723
Epoch: 20, step: 1400, loss: 0.32623687386512756, mean loss: 0.3536104540263754
Epoch: 20, step: 1401, loss: 0.3529907166957855, mean loss: 0.35361043356084043
Epoch: 20, step: 1402, loss: 0.34480229020118713, mean loss: 0.35361014269985047
Epoch: 20, step: 1403, loss: 0.3006233274936676, mean loss: 0.3536083930361599
Epoch: 20, step: 1404, loss: 0.32821229100227356, mean loss: 0.3536075544658434
Epoch: 20, step: 1405, loss: 0.33825990557670593, mean loss: 0.3536070477086325
Epoch: 20, step: 1406, loss: 0.3425288796424866, mean loss: 0.35360668193559236
Epoch: 20, step: 1407, loss: 0.3233893811702728, mean loss: 0.35360568426982486
Epoch: 20, step: 1408, loss: 0.3129833936691284, mean loss: 0.35360434311327954
Epoch: 20, step: 1409, loss: 0.33348721265792847, mean loss: 0.35360367896238964
Epoch: 20, step: 1410, loss: 0.3115217983722687, mean loss: 0.3536022897087965
Epoch: 20, step: 1411, loss: 0.31959229707717896, mean loss: 0.35360116697036287
Epoch: 20, step: 1412, loss: 0.34253132343292236, mean loss: 0.3536008015445702
Epoch: 20, step: 1413, loss: 0.3450169563293457, mean loss: 0.3536005181932394
Epoch: 20, step: 1414, loss: 0.34008270502090454, mean loss: 0.3536000719871601
Epoch: 20, step: 1415, loss: 0.3467061519622803, mean loss: 0.3535998444350072
Epoch: 20, step: 1416, loss: 0.34944260120391846, mean loss: 0.3535997072186745
Epoch: 20, step: 1417, loss: 0.3297581970691681, mean loss: 0.3535989203182141
Epoch: 20, step: 1418, loss: 0.35886695981025696, mean loss: 0.3535990941866418
Epoch: 20, step: 1419, loss: 0.31073248386383057, mean loss: 0.3535976794470272
Epoch: 20, step: 1420, loss: 0.343194842338562, mean loss: 0.3535973361304004
Epoch: 20, step: 1421, loss: 0.3446616232395172, mean loss: 0.35359704124184876
Epoch: 20, step: 1422, loss: 0.30746540427207947, mean loss: 0.3535955188963064
Epoch: 20, step: 1423, loss: 0.31089043617248535, mean loss: 0.35359410967367166
Epoch: 20, step: 1424, loss: 0.3401874899864197, mean loss: 0.35359366728397734
Epoch: 20, step: 1425, loss: 0.35419762134552, mean loss: 0.3535936872125084
Epoch: 20, step: 1426, loss: 0.3879019320011139, mean loss: 0.3535948192362913
Epoch: 20, step: 1427, loss: 0.34971553087234497, mean loss: 0.3535946912407666
Epoch: 20, step: 1428, loss: 0.3192341923713684, mean loss: 0.3535935575676375
Epoch: 20, step: 1429, loss: 0.3310896158218384, mean loss: 0.3535928151083255
Epoch: 20, step: 1430, loss: 0.3856610357761383, mean loss: 0.35359387308136064
Epoch: 20, step: 1431, loss: 0.3240380585193634, mean loss: 0.35359289802809585
Epoch: 20, step: 1432, loss: 0.34364962577819824, mean loss: 0.3535925700080302
Epoch: 20, step: 1433, loss: 0.3226022720336914, mean loss: 0.35359154769827317
Epoch: 20, step: 1434, loss: 0.32589754462242126, mean loss: 0.35359063415702047
Epoch: 20, step: 1435, loss: 0.32628899812698364, mean loss: 0.3535897335884748
Epoch: 20, step: 1436, loss: 0.3183281421661377, mean loss: 0.35358857049214526
Epoch: 20, step: 1437, loss: 0.319192498922348, mean loss: 0.35358743598223136
Epoch: 20, step: 1438, loss: 0.3275896906852722, mean loss: 0.3535865785085252
Epoch: 20, step: 1439, loss: 0.3444899618625641, mean loss: 0.3535862784881873
Epoch: 20, step: 1440, loss: 0.31717821955680847, mean loss: 0.3535850777342896
Epoch: 20, step: 1441, loss: 0.28488779067993164, mean loss: 0.35358281214207754
Epoch: 20, step: 1442, loss: 0.3135043680667877, mean loss: 0.353581490424435
Epoch: 20, step: 1443, loss: 0.30248358845710754, mean loss: 0.3535798053597348
Valid: 20, mean loss: 0.18774635841449103
Epoch: 21, step: 0, loss: 0.36080068349838257, mean loss: 0.3535800434760791
Epoch: 21, step: 1, loss: 0.3223147690296173, mean loss: 0.35357901250349955
Epoch: 21, step: 2, loss: 0.33355778455734253, mean loss: 0.35357835232517837
Epoch: 21, step: 3, loss: 0.31602030992507935, mean loss: 0.3535771139302166
Epoch: 21, step: 4, loss: 0.33798080682754517, mean loss: 0.3535765996927837
Epoch: 21, step: 5, loss: 0.30161404609680176, mean loss: 0.3535748864532982
Epoch: 21, step: 6, loss: 0.3306788206100464, mean loss: 0.35357413157987355
Epoch: 21, step: 7, loss: 0.2971390187740326, mean loss: 0.35357227099986543
Epoch: 21, step: 8, loss: 0.3242596983909607, mean loss: 0.3535713046406986
Epoch: 21, step: 9, loss: 0.31429246068000793, mean loss: 0.3535700097622137
Epoch: 21, step: 10, loss: 0.30064657330513, mean loss: 0.35356826512939826
Epoch: 21, step: 11, loss: 0.3995833396911621, mean loss: 0.3535697819765291
Epoch: 21, step: 12, loss: 0.351859986782074, mean loss: 0.3535697256164673
Epoch: 21, step: 13, loss: 0.33210843801498413, mean loss: 0.35356901821032316
Epoch: 21, step: 14, loss: 0.3299637734889984, mean loss: 0.35356824016079214
Epoch: 21, step: 15, loss: 0.3051590323448181, mean loss: 0.3535666446035141
Epoch: 21, step: 16, loss: 0.32449039816856384, mean loss: 0.3535656862881509
Epoch: 21, step: 17, loss: 0.33859649300575256, mean loss: 0.3535651929392193
Epoch: 21, step: 18, loss: 0.32100459933280945, mean loss: 0.35356411985502834
Epoch: 21, step: 19, loss: 0.37740227580070496, mean loss: 0.3535649054520474
Epoch: 21, step: 20, loss: 0.32432350516319275, mean loss: 0.3535639418204676
Epoch: 21, step: 21, loss: 0.32188430428504944, mean loss: 0.35356289787274675
Epoch: 21, step: 22, loss: 0.3586581349372864, mean loss: 0.3535630657719481
Epoch: 21, step: 23, loss: 0.37832677364349365, mean loss: 0.3535638817633766
Epoch: 21, step: 24, loss: 0.35204017162323, mean loss: 0.3535638315571049
Epoch: 21, step: 25, loss: 0.3312874138355255, mean loss: 0.3535630975729955
Epoch: 21, step: 26, loss: 0.3507792055606842, mean loss: 0.353563005849757
Epoch: 21, step: 27, loss: 0.3600544333457947, mean loss: 0.353563219721248
Epoch: 21, step: 28, loss: 0.34807905554771423, mean loss: 0.3535630390417707
Epoch: 21, step: 29, loss: 0.30627742409706116, mean loss: 0.35356148123670567
Epoch: 21, step: 30, loss: 0.29373568296432495, mean loss: 0.35355951036540695
Epoch: 21, step: 31, loss: 0.3292643129825592, mean loss: 0.353558710022892
Epoch: 21, step: 32, loss: 0.35180094838142395, mean loss: 0.35355865211988313
Epoch: 21, step: 33, loss: 0.337404727935791, mean loss: 0.3535581200056403
Epoch: 21, step: 34, loss: 0.39775362610816956, mean loss: 0.3535595757685476
Epoch: 21, step: 35, loss: 0.3358248770236969, mean loss: 0.3535589916216851
Epoch: 21, step: 36, loss: 0.34901630878448486, mean loss: 0.3535588419993789
Epoch: 21, step: 37, loss: 0.34767428040504456, mean loss: 0.35355864818600713
Epoch: 21, step: 38, loss: 0.3022470772266388, mean loss: 0.3535569582485517
Epoch: 21, step: 39, loss: 0.33673763275146484, mean loss: 0.3535564043253039
Epoch: 21, step: 40, loss: 0.37159380316734314, mean loss: 0.353556998344696
Epoch: 21, step: 41, loss: 0.34831002354621887, mean loss: 0.3535568255535876
Epoch: 21, step: 42, loss: 0.3229401409626007, mean loss: 0.3535558173313532
Epoch: 21, step: 43, loss: 0.3343876898288727, mean loss: 0.35355518613642756
Epoch: 21, step: 44, loss: 0.4009769558906555, mean loss: 0.3535567476554026
Epoch: 21, step: 45, loss: 0.356045126914978, mean loss: 0.3535568295908409
Epoch: 21, step: 46, loss: 0.318679541349411, mean loss: 0.3535556812161334
Epoch: 21, step: 47, loss: 0.31842249631881714, mean loss: 0.3535545244538228
Epoch: 21, step: 48, loss: 0.3254742920398712, mean loss: 0.35355359994085356
Epoch: 21, step: 49, loss: 0.32626044750213623, mean loss: 0.35355270137127304
Epoch: 21, step: 50, loss: 0.3305457830429077, mean loss: 0.35355194394186307
Epoch: 21, step: 51, loss: 0.32567575573921204, mean loss: 0.3535510262374845
Epoch: 21, step: 52, loss: 0.36043885350227356, mean loss: 0.35355125298230017
Epoch: 21, step: 53, loss: 0.3561380207538605, mean loss: 0.3535513381349689
Epoch: 21, step: 54, loss: 0.3219296634197235, mean loss: 0.35355029722925396
Epoch: 21, step: 55, loss: 0.33894068002700806, mean loss: 0.35354981633336185
Epoch: 21, step: 56, loss: 0.33516013622283936, mean loss: 0.3535492110313603
Epoch: 21, step: 57, loss: 0.30058935284614563, mean loss: 0.353547467898644
Epoch: 21, step: 58, loss: 0.3965770900249481, mean loss: 0.3535488841387166
Epoch: 21, step: 59, loss: 0.36735424399375916, mean loss: 0.35354933850153436
Epoch: 21, step: 60, loss: 0.3235104978084564, mean loss: 0.35354834989397493
Epoch: 21, step: 61, loss: 0.3239004909992218, mean loss: 0.35354737418611953
Epoch: 21, step: 62, loss: 0.31111353635787964, mean loss: 0.3535459777390261
Epoch: 21, step: 63, loss: 0.3446958661079407, mean loss: 0.35354568650197093
Epoch: 21, step: 64, loss: 0.31357988715171814, mean loss: 0.35354437136164546
Epoch: 21, step: 65, loss: 0.3390238583087921, mean loss: 0.3535438935560169
Epoch: 21, step: 66, loss: 0.34084609150886536, mean loss: 0.353543475741465
Epoch: 21, step: 67, loss: 0.3337405323982239, mean loss: 0.3535428241573855
Epoch: 21, step: 68, loss: 0.3180396556854248, mean loss: 0.35354165602102283
Epoch: 21, step: 69, loss: 0.3060782551765442, mean loss: 0.35354009441673107
Epoch: 21, step: 70, loss: 0.37642377614974976, mean loss: 0.35354084729324803
Epoch: 21, step: 71, loss: 0.32337039709091187, mean loss: 0.35353985471362565
Epoch: 21, step: 72, loss: 0.3592684268951416, mean loss: 0.3535400431720979
Epoch: 21, step: 73, loss: 0.31573885679244995, mean loss: 0.3535387996302077
Epoch: 21, step: 74, loss: 0.3225044906139374, mean loss: 0.3535377787311973
Epoch: 21, step: 75, loss: 0.3237651288509369, mean loss: 0.35353679936771437
Epoch: 21, step: 76, loss: 0.36338335275650024, mean loss: 0.35353712325684267
Epoch: 21, step: 77, loss: 0.3229599893093109, mean loss: 0.35353611749623653
Epoch: 21, step: 78, loss: 0.34255436062812805, mean loss: 0.35353575628987965
Epoch: 21, step: 79, loss: 0.3212222158908844, mean loss: 0.35353469348431465
Epoch: 21, step: 80, loss: 0.3119858503341675, mean loss: 0.35353332697080864
Epoch: 21, step: 81, loss: 0.33590197563171387, mean loss: 0.35353274710659305
Epoch: 21, step: 82, loss: 0.3313289284706116, mean loss: 0.35353201688596503
Epoch: 21, step: 83, loss: 0.3696999251842499, mean loss: 0.35353254858513294
Epoch: 21, step: 84, loss: 0.3283883035182953, mean loss: 0.35353172171660496
Epoch: 21, step: 85, loss: 0.3070034384727478, mean loss: 0.3535301916842721
Epoch: 21, step: 86, loss: 0.36233559250831604, mean loss: 0.35353048123084485
Epoch: 21, step: 87, loss: 0.33542025089263916, mean loss: 0.353529885734648
Epoch: 21, step: 88, loss: 0.3172388970851898, mean loss: 0.35352869246240753
Epoch: 21, step: 89, loss: 0.36708372831344604, mean loss: 0.3535291381464955
Epoch: 21, step: 90, loss: 0.3290810286998749, mean loss: 0.35352833432898945
Epoch: 21, step: 91, loss: 0.31092607975006104, mean loss: 0.35352693367622184
Epoch: 21, step: 92, loss: 0.4237103760242462, mean loss: 0.35352924105177985
Epoch: 21, step: 93, loss: 0.3380111753940582, mean loss: 0.35352873089116255
Epoch: 21, step: 94, loss: 0.3203313648700714, mean loss: 0.3535276395546288
Epoch: 21, step: 95, loss: 0.336704820394516, mean loss: 0.3535270865362475
Epoch: 21, step: 96, loss: 0.32373666763305664, mean loss: 0.3535261072647277
Epoch: 21, step: 97, loss: 0.33391597867012024, mean loss: 0.35352546266119755
Epoch: 21, step: 98, loss: 0.35075756907463074, mean loss: 0.3535253716809002
Epoch: 21, step: 99, loss: 0.2980034649372101, mean loss: 0.35352354674312925
Epoch: 21, step: 100, loss: 0.3876955807209015, mean loss: 0.35352466989954595
Epoch: 21, step: 101, loss: 0.3359438180923462, mean loss: 0.3535240920762433
Epoch: 21, step: 102, loss: 0.3141951560974121, mean loss: 0.3535227995092476
Epoch: 21, step: 103, loss: 0.3315656781196594, mean loss: 0.3535220779001576
Epoch: 21, step: 104, loss: 0.355994313955307, mean loss: 0.3535221591462076
Epoch: 21, step: 105, loss: 0.32349976897239685, mean loss: 0.3535211725412068
Epoch: 21, step: 106, loss: 0.3329518735408783, mean loss: 0.3535204966088023
Epoch: 21, step: 107, loss: 0.35191237926483154, mean loss: 0.35352044376582964
Epoch: 21, step: 108, loss: 0.38921964168548584, mean loss: 0.35352161680818234
Epoch: 21, step: 109, loss: 0.3163895010948181, mean loss: 0.3535203967215781
Epoch: 21, step: 110, loss: 0.35949134826660156, mean loss: 0.3535205929085847
Epoch: 21, step: 111, loss: 0.3772604465484619, mean loss: 0.35352137290114743
Epoch: 21, step: 112, loss: 0.3551924526691437, mean loss: 0.35352142780405404
Epoch: 21, step: 113, loss: 0.3330790400505066, mean loss: 0.3535207561965978
Epoch: 21, step: 114, loss: 0.31115320324897766, mean loss: 0.3535193643127334
Epoch: 21, step: 115, loss: 0.36069631576538086, mean loss: 0.3535196000864342
Epoch: 21, step: 116, loss: 0.32274696230888367, mean loss: 0.3535185891919899
Epoch: 21, step: 117, loss: 0.31731081008911133, mean loss: 0.3535173997898776
Epoch: 21, step: 118, loss: 0.37983933091163635, mean loss: 0.35351826441987866
Epoch: 21, step: 119, loss: 0.3825927972793579, mean loss: 0.35351921943672465
Epoch: 21, step: 120, loss: 0.3421236276626587, mean loss: 0.35351884513579596
Epoch: 21, step: 121, loss: 0.3037225902080536, mean loss: 0.35351720957595467
Epoch: 21, step: 122, loss: 0.33158692717552185, mean loss: 0.3535164892986728
Epoch: 21, step: 123, loss: 0.30094462633132935, mean loss: 0.35351476268730364
Epoch: 21, step: 124, loss: 0.31606853008270264, mean loss: 0.35351353288558257
Epoch: 21, step: 125, loss: 0.3494926989078522, mean loss: 0.3535134008384897
Epoch: 21, step: 126, loss: 0.30269476771354675, mean loss: 0.3535117319726684
Epoch: 21, step: 127, loss: 0.3909280002117157, mean loss: 0.35351296066924787
Epoch: 21, step: 128, loss: 0.3120889365673065, mean loss: 0.35351160040838353
Epoch: 21, step: 129, loss: 0.27750298380851746, mean loss: 0.35350910455836054
Epoch: 21, step: 130, loss: 0.309336394071579, mean loss: 0.35350765413279867
Epoch: 21, step: 131, loss: 0.3945208787918091, mean loss: 0.35350900077138087
Epoch: 21, step: 132, loss: 0.3729742765426636, mean loss: 0.3535096398781797
Epoch: 21, step: 133, loss: 0.29819321632385254, mean loss: 0.3535078237240148
Epoch: 21, step: 134, loss: 0.33529070019721985, mean loss: 0.35350722563729076
Epoch: 21, step: 135, loss: 0.3035825490951538, mean loss: 0.3535055866131101
Epoch: 21, step: 136, loss: 0.3345261812210083, mean loss: 0.35350496354080807
Epoch: 21, step: 137, loss: 0.3684593737125397, mean loss: 0.35350545446097653
Epoch: 21, step: 138, loss: 0.32493260502815247, mean loss: 0.3535045165083969
Epoch: 21, step: 139, loss: 0.34924307465553284, mean loss: 0.35350437662388234
Epoch: 21, step: 140, loss: 0.31425172090530396, mean loss: 0.3535030881730135
Epoch: 21, step: 141, loss: 0.3511449098587036, mean loss: 0.35350301076940577
Epoch: 21, step: 142, loss: 0.2841693162918091, mean loss: 0.3535007350712905
Epoch: 21, step: 143, loss: 0.3351644277572632, mean loss: 0.3535001332494671
Epoch: 21, step: 144, loss: 0.3476599454879761, mean loss: 0.3534999415730825
Epoch: 21, step: 145, loss: 0.3260137438774109, mean loss: 0.3534990394989868
Epoch: 21, step: 146, loss: 0.33205273747444153, mean loss: 0.35349833567233113
Epoch: 21, step: 147, loss: 0.3069731891155243, mean loss: 0.35349680885602247
Epoch: 21, step: 148, loss: 0.3139983117580414, mean loss: 0.3534955126758926
Epoch: 21, step: 149, loss: 0.35890212655067444, mean loss: 0.35349569009316223
Epoch: 21, step: 150, loss: 0.33907797932624817, mean loss: 0.35349521699354725
Epoch: 21, step: 151, loss: 0.3536613881587982, mean loss: 0.3534952224460727
Epoch: 21, step: 152, loss: 0.3391968011856079, mean loss: 0.35349475329158697
Epoch: 21, step: 153, loss: 0.4011980891227722, mean loss: 0.3534963184643618
Epoch: 21, step: 154, loss: 0.3015608787536621, mean loss: 0.35349461448983144
Epoch: 21, step: 155, loss: 0.30638253688812256, mean loss: 0.35349306881799414
Epoch: 21, step: 156, loss: 0.36372214555740356, mean loss: 0.3534934044066146
Epoch: 21, step: 157, loss: 0.3316819965839386, mean loss: 0.3534926888561972
Epoch: 21, step: 158, loss: 0.347468763589859, mean loss: 0.35349249124030424
Epoch: 21, step: 159, loss: 0.40466490387916565, mean loss: 0.35349416990493615
Epoch: 21, step: 160, loss: 0.3558444380760193, mean loss: 0.353494247000825
Epoch: 21, step: 161, loss: 0.343306303024292, mean loss: 0.35349391281647885
Epoch: 21, step: 162, loss: 0.30294376611709595, mean loss: 0.3534922547278936
Epoch: 21, step: 163, loss: 0.3225927948951721, mean loss: 0.35349124123209746
Epoch: 21, step: 164, loss: 0.32512980699539185, mean loss: 0.3534903110135191
Epoch: 21, step: 165, loss: 0.31908154487609863, mean loss: 0.35348918248724365
Epoch: 21, step: 166, loss: 0.3039204776287079, mean loss: 0.3534875568040959
Epoch: 21, step: 167, loss: 0.3526524603366852, mean loss: 0.35348752941670025
Epoch: 21, step: 168, loss: 0.34979012608528137, mean loss: 0.3534874081625327
Epoch: 21, step: 169, loss: 0.33973854780197144, mean loss: 0.35348695729152985
Epoch: 21, step: 170, loss: 0.3190936744213104, mean loss: 0.35348582945802043
Epoch: 21, step: 171, loss: 0.33508479595184326, mean loss: 0.3534852260663131
Epoch: 21, step: 172, loss: 0.30746182799339294, mean loss: 0.3534837169540046
Epoch: 21, step: 173, loss: 0.34620168805122375, mean loss: 0.3534834781833015
Epoch: 21, step: 174, loss: 0.32589033246040344, mean loss: 0.35348257346033607
Epoch: 21, step: 175, loss: 0.30579426884651184, mean loss: 0.35348100990936515
Epoch: 21, step: 176, loss: 0.30119258165359497, mean loss: 0.35347929559087543
Epoch: 21, step: 177, loss: 0.3376573920249939, mean loss: 0.35347877687395307
Epoch: 21, step: 178, loss: 0.35396599769592285, mean loss: 0.35347879284683514
Epoch: 21, step: 179, loss: 0.3512084186077118, mean loss: 0.35347871841809664
Epoch: 21, step: 180, loss: 0.3170168995857239, mean loss: 0.3534775231445732
Epoch: 21, step: 181, loss: 0.3291091322898865, mean loss: 0.35347672433808086
Epoch: 21, step: 182, loss: 0.35656771063804626, mean loss: 0.3534768256586401
Epoch: 21, step: 183, loss: 0.31065529584884644, mean loss: 0.3534754220422178
Epoch: 21, step: 184, loss: 0.34359773993492126, mean loss: 0.35347509827932466
Epoch: 21, step: 185, loss: 0.316569447517395, mean loss: 0.35347388865458645
Epoch: 21, step: 186, loss: 0.32344850897789, mean loss: 0.353472904570824
Epoch: 21, step: 187, loss: 0.3391225337982178, mean loss: 0.3534724342519077
Epoch: 21, step: 188, loss: 0.3564203083515167, mean loss: 0.3534725308623393
Epoch: 21, step: 189, loss: 0.30423396825790405, mean loss: 0.35347091722392404
Epoch: 21, step: 190, loss: 0.34163698554039, mean loss: 0.3534705294168887
Epoch: 21, step: 191, loss: 0.33894583582878113, mean loss: 0.3534700534471159
Epoch: 21, step: 192, loss: 0.34585532546043396, mean loss: 0.3534698039229823
Epoch: 21, step: 193, loss: 0.3156650960445404, mean loss: 0.35346856515543923
Epoch: 21, step: 194, loss: 0.38628891110420227, mean loss: 0.3534696405624299
Epoch: 21, step: 195, loss: 0.33754676580429077, mean loss: 0.35346911884307347
Epoch: 21, step: 196, loss: 0.37905603647232056, mean loss: 0.3534699571811892
Epoch: 21, step: 197, loss: 0.3504795730113983, mean loss: 0.35346985920647683
Epoch: 21, step: 198, loss: 0.3289872109889984, mean loss: 0.35346905710156523
Epoch: 21, step: 199, loss: 0.3326236605644226, mean loss: 0.35346837418331933
Epoch: 21, step: 200, loss: 0.33146828413009644, mean loss: 0.3534676534596485
Epoch: 21, step: 201, loss: 0.3053377568721771, mean loss: 0.3534660767743118
Epoch: 21, step: 202, loss: 0.39168787002563477, mean loss: 0.35346732883947546
Epoch: 21, step: 203, loss: 0.3290470838546753, mean loss: 0.3534665289100669
Epoch: 21, step: 204, loss: 0.36380666494369507, mean loss: 0.35346686760887897
Epoch: 21, step: 205, loss: 0.33714812994003296, mean loss: 0.35346633309405195
Epoch: 21, step: 206, loss: 0.3438357710838318, mean loss: 0.3534660176585271
Epoch: 21, step: 207, loss: 0.33046954870224, mean loss: 0.35346526446617293
Epoch: 21, step: 208, loss: 0.33165085315704346, mean loss: 0.353464550012588
Epoch: 21, step: 209, loss: 0.3653121888637543, mean loss: 0.3534649380272225
Epoch: 21, step: 210, loss: 0.3087815046310425, mean loss: 0.353463474675875
Epoch: 21, step: 211, loss: 0.31175827980041504, mean loss: 0.35346210890449453
Epoch: 21, step: 212, loss: 0.3187648057937622, mean loss: 0.3534609726663863
Epoch: 21, step: 213, loss: 0.3476620316505432, mean loss: 0.3534607827737602
Epoch: 21, step: 214, loss: 0.32505613565444946, mean loss: 0.35345985266317637
Epoch: 21, step: 215, loss: 0.3100730776786804, mean loss: 0.35345843200911664
Epoch: 21, step: 216, loss: 0.34100502729415894, mean loss: 0.353458024248902
Epoch: 21, step: 217, loss: 0.3228154480457306, mean loss: 0.35345702095585624
Epoch: 21, step: 218, loss: 0.3034326434135437, mean loss: 0.35345538312140834
Epoch: 21, step: 219, loss: 0.3860088288784027, mean loss: 0.3534564489099677
Epoch: 21, step: 220, loss: 0.33020201325416565, mean loss: 0.35345568759270934
Epoch: 21, step: 221, loss: 0.3154982030391693, mean loss: 0.3534544449591549
Epoch: 21, step: 222, loss: 0.3223288059234619, mean loss: 0.3534534260165734
Epoch: 21, step: 223, loss: 0.31276431679725647, mean loss: 0.3534520940436384
Epoch: 21, step: 224, loss: 0.3104833960533142, mean loss: 0.3534506874935716
Epoch: 21, step: 225, loss: 0.3213503360748291, mean loss: 0.353449636745571
Epoch: 21, step: 226, loss: 0.33228471875190735, mean loss: 0.35344894397224136
Epoch: 21, step: 227, loss: 0.3178682327270508, mean loss: 0.3534477793770841
Epoch: 21, step: 228, loss: 0.3407834470272064, mean loss: 0.3534473648733578
Epoch: 21, step: 229, loss: 0.3893057703971863, mean loss: 0.3534485384809223
Epoch: 21, step: 230, loss: 0.36033302545547485, mean loss: 0.3534487637955017
Epoch: 21, step: 231, loss: 0.3519041836261749, mean loss: 0.35344871324634053
Epoch: 21, step: 232, loss: 0.3821776807308197, mean loss: 0.3534496534226499
Epoch: 21, step: 233, loss: 0.33349406719207764, mean loss: 0.35344900038298005
Epoch: 21, step: 234, loss: 0.32982900738716125, mean loss: 0.35344822745215787
Epoch: 21, step: 235, loss: 0.35230395197868347, mean loss: 0.35344819000858874
Epoch: 21, step: 236, loss: 0.33430346846580505, mean loss: 0.35344756356568624
Epoch: 21, step: 237, loss: 0.34214627742767334, mean loss: 0.35344719378340306
Epoch: 21, step: 238, loss: 0.3313184380531311, mean loss: 0.353446469745981
Epoch: 21, step: 239, loss: 0.33614686131477356, mean loss: 0.35344590373340307
Epoch: 21, step: 240, loss: 0.35180431604385376, mean loss: 0.3534458500253157
Epoch: 21, step: 241, loss: 0.31473687291145325, mean loss: 0.35344458361894543
Epoch: 21, step: 242, loss: 0.3074188828468323, mean loss: 0.35344307788724877
Epoch: 21, step: 243, loss: 0.33243733644485474, mean loss: 0.35344239070648975
Epoch: 21, step: 244, loss: 0.3155376613140106, mean loss: 0.35344115073366134
Epoch: 21, step: 245, loss: 0.3612174093723297, mean loss: 0.35344140510914834
Epoch: 21, step: 246, loss: 0.3205298185348511, mean loss: 0.35344032854683194
Epoch: 21, step: 247, loss: 0.3127092719078064, mean loss: 0.3534389962474521
Epoch: 21, step: 248, loss: 0.3230496048927307, mean loss: 0.3534380022530337
Epoch: 21, step: 249, loss: 0.3096346855163574, mean loss: 0.35343656955476926
Epoch: 21, step: 250, loss: 0.3100879490375519, mean loss: 0.35343515177486684
Epoch: 21, step: 251, loss: 0.3252872824668884, mean loss: 0.35343423118782774
Epoch: 21, step: 252, loss: 0.3327889144420624, mean loss: 0.3534335559967774
Epoch: 21, step: 253, loss: 0.32406505942344666, mean loss: 0.35343259555147116
Epoch: 21, step: 254, loss: 0.3029184341430664, mean loss: 0.3534309436282098
Epoch: 21, step: 255, loss: 0.34455692768096924, mean loss: 0.3534306534380219
Epoch: 21, step: 256, loss: 0.30038943886756897, mean loss: 0.3534289189880506
Epoch: 21, step: 257, loss: 0.3556571304798126, mean loss: 0.3534289918482786
Epoch: 21, step: 258, loss: 0.3422611653804779, mean loss: 0.3534286266837601
Epoch: 21, step: 259, loss: 0.3263252079486847, mean loss: 0.3534277404877513
Epoch: 21, step: 260, loss: 0.31635069847106934, mean loss: 0.3534265282254653
Epoch: 21, step: 261, loss: 0.3324250280857086, mean loss: 0.35342584158778334
Epoch: 21, step: 262, loss: 0.32887619733810425, mean loss: 0.35342503897084643
Epoch: 21, step: 263, loss: 0.33252623677253723, mean loss: 0.3534243557355189
Epoch: 21, step: 264, loss: 0.3449093699455261, mean loss: 0.3534240773679426
Epoch: 21, step: 265, loss: 0.3153868317604065, mean loss: 0.35342283391434315
Epoch: 21, step: 266, loss: 0.3252367675304413, mean loss: 0.3534219125300673
Epoch: 21, step: 267, loss: 0.34730470180511475, mean loss: 0.3534217125689426
Epoch: 21, step: 268, loss: 0.32752692699432373, mean loss: 0.3534208661404925
Epoch: 21, step: 269, loss: 0.3182729184627533, mean loss: 0.3534197172894865
Epoch: 21, step: 270, loss: 0.34464752674102783, mean loss: 0.3534194305697431
Epoch: 21, step: 271, loss: 0.32674461603164673, mean loss: 0.3534185587298118
Epoch: 21, step: 272, loss: 0.3062852621078491, mean loss: 0.3534170182749757
Epoch: 21, step: 273, loss: 0.36312761902809143, mean loss: 0.3534173356356121
Epoch: 21, step: 274, loss: 0.3259469270706177, mean loss: 0.35341643788050364
Epoch: 21, step: 275, loss: 0.33865612745285034, mean loss: 0.3534159555174178
Epoch: 21, step: 276, loss: 0.3263385593891144, mean loss: 0.35341507066410816
Epoch: 21, step: 277, loss: 0.2956104278564453, mean loss: 0.3534131817469522
Epoch: 21, step: 278, loss: 0.3184516131877899, mean loss: 0.3534120393240342
Epoch: 21, step: 279, loss: 0.3146330714225769, mean loss: 0.3534107722031382
Epoch: 21, step: 280, loss: 0.32608768343925476, mean loss: 0.3534098794376174
Epoch: 21, step: 281, loss: 0.3302690088748932, mean loss: 0.3534091233482701
Epoch: 21, step: 282, loss: 0.39087939262390137, mean loss: 0.35341034758681933
Epoch: 21, step: 283, loss: 0.34640008211135864, mean loss: 0.35341011855305443
Epoch: 21, step: 284, loss: 0.3664180040359497, mean loss: 0.3534105435223603
Epoch: 21, step: 285, loss: 0.3244682848453522, mean loss: 0.35340959800590566
Epoch: 21, step: 286, loss: 0.31052666902542114, mean loss: 0.35340819710658905
Epoch: 21, step: 287, loss: 0.35248973965644836, mean loss: 0.35340816710340567
Epoch: 21, step: 288, loss: 0.340768963098526, mean loss: 0.35340775423292564
Epoch: 21, step: 289, loss: 0.3096071779727936, mean loss: 0.35340632349613005
Epoch: 21, step: 290, loss: 0.40207594633102417, mean loss: 0.35340791322740017
Epoch: 21, step: 291, loss: 0.3228451907634735, mean loss: 0.3534069149675862
Epoch: 21, step: 292, loss: 0.3658587634563446, mean loss: 0.35340732166479655
Epoch: 21, step: 293, loss: 0.3666047155857086, mean loss: 0.3534077526986303
Epoch: 21, step: 294, loss: 0.3312036395072937, mean loss: 0.3534070275242878
Epoch: 21, step: 295, loss: 0.4039756655693054, mean loss: 0.35340867901475304
Epoch: 21, step: 296, loss: 0.31680354475975037, mean loss: 0.3534074835889258
Epoch: 21, step: 297, loss: 0.34889188408851624, mean loss: 0.35340733612633357
Epoch: 21, step: 298, loss: 0.3386172652244568, mean loss: 0.35340685315370185
Epoch: 21, step: 299, loss: 0.33769965171813965, mean loss: 0.3534063402487438
Epoch: 21, step: 300, loss: 0.2998383343219757, mean loss: 0.3534045910893666
Epoch: 21, step: 301, loss: 0.3329177796840668, mean loss: 0.35340392215410227
Epoch: 21, step: 302, loss: 0.307835191488266, mean loss: 0.3534024342927164
Epoch: 21, step: 303, loss: 0.3318955600261688, mean loss: 0.35340173209622083
Epoch: 21, step: 304, loss: 0.30337175726890564, mean loss: 0.3534000986777342
Epoch: 21, step: 305, loss: 0.3599069118499756, mean loss: 0.3534003111104202
Epoch: 21, step: 306, loss: 0.3221482038497925, mean loss: 0.35339929083333943
Epoch: 21, step: 307, loss: 0.35411226749420166, mean loss: 0.35339931410888986
Epoch: 21, step: 308, loss: 0.3432283401489258, mean loss: 0.35339898208218795
Epoch: 21, step: 309, loss: 0.3337741494178772, mean loss: 0.35339834145959004
Epoch: 21, step: 310, loss: 0.3171674907207489, mean loss: 0.353397158797578
Epoch: 21, step: 311, loss: 0.3182646334171295, mean loss: 0.3533960120249778
Epoch: 21, step: 312, loss: 0.34043505787849426, mean loss: 0.35339558897591467
Epoch: 21, step: 313, loss: 0.30301451683044434, mean loss: 0.3533939445777116
Epoch: 21, step: 314, loss: 0.38273948431015015, mean loss: 0.3533949023615731
Epoch: 21, step: 315, loss: 0.3219388723373413, mean loss: 0.3533938757287394
Epoch: 21, step: 316, loss: 0.3534601926803589, mean loss: 0.35339387789306015
Epoch: 21, step: 317, loss: 0.3395482301712036, mean loss: 0.35339342604110136
Epoch: 21, step: 318, loss: 0.33599182963371277, mean loss: 0.3533928581594838
Epoch: 21, step: 319, loss: 0.3341578543186188, mean loss: 0.3533922304671512
Epoch: 21, step: 320, loss: 0.32176485657691956, mean loss: 0.3533911984105713
Epoch: 21, step: 321, loss: 0.3307252526283264, mean loss: 0.3533904588052139
Epoch: 21, step: 322, loss: 0.32372233271598816, mean loss: 0.3533894907454988
Epoch: 21, step: 323, loss: 0.37800222635269165, mean loss: 0.3533902938235335
Epoch: 21, step: 324, loss: 0.37066757678985596, mean loss: 0.35339085753794397
Epoch: 21, step: 325, loss: 0.3287739157676697, mean loss: 0.35339005437508036
Epoch: 21, step: 326, loss: 0.3245871067047119, mean loss: 0.3533891146684584
Epoch: 21, step: 327, loss: 0.31796911358833313, mean loss: 0.35338795911576754
Epoch: 21, step: 328, loss: 0.2895874083042145, mean loss: 0.353385877735452
Epoch: 21, step: 329, loss: 0.3722100853919983, mean loss: 0.3533864918219548
Epoch: 21, step: 330, loss: 0.31872543692588806, mean loss: 0.35338536114001395
Epoch: 21, step: 331, loss: 0.2970882058143616, mean loss: 0.3533835247244566
Epoch: 21, step: 332, loss: 0.31049659848213196, mean loss: 0.353382125796765
Epoch: 21, step: 333, loss: 0.37190333008766174, mean loss: 0.35338272991980924
Epoch: 21, step: 334, loss: 0.359447181224823, mean loss: 0.353382927723107
Epoch: 21, step: 335, loss: 0.33028554916381836, mean loss: 0.3533821743839498
Epoch: 21, step: 336, loss: 0.3595696687698364, mean loss: 0.35338237618736085
Epoch: 21, step: 337, loss: 0.3582729995250702, mean loss: 0.3533825356884807
Epoch: 21, step: 338, loss: 0.33676978945732117, mean loss: 0.35338199390371633
Epoch: 21, step: 339, loss: 0.3381924629211426, mean loss: 0.3533814985498492
Epoch: 21, step: 340, loss: 0.3291529417037964, mean loss: 0.3533807084452724
Epoch: 21, step: 341, loss: 0.29531392455101013, mean loss: 0.3533788149220254
Epoch: 21, step: 342, loss: 0.326236367225647, mean loss: 0.35337792985182953
Epoch: 21, step: 343, loss: 0.3212927281856537, mean loss: 0.3533768836407409
Epoch: 21, step: 344, loss: 0.299751341342926, mean loss: 0.3533751351147929
Epoch: 21, step: 345, loss: 0.34679320454597473, mean loss: 0.3533749205099488
Epoch: 21, step: 346, loss: 0.3114769458770752, mean loss: 0.35337355446467367
Epoch: 21, step: 347, loss: 0.31982484459877014, mean loss: 0.3533724606752284
Epoch: 21, step: 348, loss: 0.330215722322464, mean loss: 0.3533717057201098
Epoch: 21, step: 349, loss: 0.3279525935649872, mean loss: 0.3533708770341818
Epoch: 21, step: 350, loss: 0.3127327561378479, mean loss: 0.35336955223806454
Epoch: 21, step: 351, loss: 0.3362065553665161, mean loss: 0.35336899274540345
Epoch: 21, step: 352, loss: 0.3107149302959442, mean loss: 0.3533676023205754
Epoch: 21, step: 353, loss: 0.36300528049468994, mean loss: 0.35336791647658866
Epoch: 21, step: 354, loss: 0.3345943093299866, mean loss: 0.35336730453985193
Epoch: 21, step: 355, loss: 0.3205924928188324, mean loss: 0.35336623626046076
Epoch: 21, step: 356, loss: 0.3545362055301666, mean loss: 0.3533662743938094
Epoch: 21, step: 357, loss: 0.3169998824596405, mean loss: 0.35336508912583686
Epoch: 21, step: 358, loss: 0.3305297791957855, mean loss: 0.35336434489255036
Epoch: 21, step: 359, loss: 0.35073110461235046, mean loss: 0.35336425907452534
Epoch: 21, step: 360, loss: 0.29983192682266235, mean loss: 0.35336251449794875
Epoch: 21, step: 361, loss: 0.3546273112297058, mean loss: 0.3533625557153356
Epoch: 21, step: 362, loss: 0.37152886390686035, mean loss: 0.3533631477024373
Epoch: 21, step: 363, loss: 0.3318287134170532, mean loss: 0.3533624459807779
Epoch: 21, step: 364, loss: 0.2959331274032593, mean loss: 0.353360574648425
Epoch: 21, step: 365, loss: 0.36081069707870483, mean loss: 0.35336081740249575
Epoch: 21, step: 366, loss: 0.33134767413139343, mean loss: 0.35336010015172936
Epoch: 21, step: 367, loss: 0.31234920024871826, mean loss: 0.3533587639436001
Epoch: 21, step: 368, loss: 0.3716795742511749, mean loss: 0.3533593608487677
Epoch: 21, step: 369, loss: 0.2992576062679291, mean loss: 0.3533575982321462
Epoch: 21, step: 370, loss: 0.32034361362457275, mean loss: 0.35335652268288387
Epoch: 21, step: 371, loss: 0.3220462203025818, mean loss: 0.35335550267042687
Epoch: 21, step: 372, loss: 0.33199265599250793, mean loss: 0.3533548067442231
Epoch: 21, step: 373, loss: 0.32131415605545044, mean loss: 0.35335376300682364
Epoch: 21, step: 374, loss: 0.33343982696533203, mean loss: 0.3533531143232821
Epoch: 21, step: 375, loss: 0.3493114411830902, mean loss: 0.3533529826726912
Epoch: 21, step: 376, loss: 0.3486451208591461, mean loss: 0.3533528293271385
Epoch: 21, step: 377, loss: 0.33932340145111084, mean loss: 0.35335237237228617
Epoch: 21, step: 378, loss: 0.32366126775741577, mean loss: 0.3533514053298273
Epoch: 21, step: 379, loss: 0.3458218276500702, mean loss: 0.35335116009866263
Epoch: 21, step: 380, loss: 0.33519303798675537, mean loss: 0.3533505687252019
Epoch: 21, step: 381, loss: 0.3664945065975189, mean loss: 0.35335099678284115
Epoch: 21, step: 382, loss: 0.3245847523212433, mean loss: 0.35335005998522295
Epoch: 21, step: 383, loss: 0.3064154088497162, mean loss: 0.3533485315675098
Epoch: 21, step: 384, loss: 0.3161400854587555, mean loss: 0.3533473199212136
Epoch: 21, step: 385, loss: 0.34553882479667664, mean loss: 0.3533470656556609
Epoch: 21, step: 386, loss: 0.3367510735988617, mean loss: 0.35334652526322635
Epoch: 21, step: 387, loss: 0.2980899512767792, mean loss: 0.3533447260780874
Epoch: 21, step: 388, loss: 0.3360700309276581, mean loss: 0.3533441636226076
Epoch: 21, step: 389, loss: 0.3525952994823456, mean loss: 0.35334413924075764
Epoch: 21, step: 390, loss: 0.36084431409835815, mean loss: 0.35334438342681845
Epoch: 21, step: 391, loss: 0.3643418550491333, mean loss: 0.3533447414640506
Epoch: 21, step: 392, loss: 0.34566813707351685, mean loss: 0.3533444915501791
Epoch: 21, step: 393, loss: 0.30251261591911316, mean loss: 0.35334283675899375
Epoch: 21, step: 394, loss: 0.33394527435302734, mean loss: 0.35334220530737076
Epoch: 21, step: 395, loss: 0.29186689853668213, mean loss: 0.35334020415806183
Epoch: 21, step: 396, loss: 0.33244675397872925, mean loss: 0.35333952405486924
Epoch: 21, step: 397, loss: 0.3432345688343048, mean loss: 0.35333919513893863
Epoch: 21, step: 398, loss: 0.35126781463623047, mean loss: 0.353339127717772
Epoch: 21, step: 399, loss: 0.35806167125701904, mean loss: 0.35333928142638865
Epoch: 21, step: 400, loss: 0.34147679805755615, mean loss: 0.35333889534068097
Epoch: 21, step: 401, loss: 0.362505704164505, mean loss: 0.3533391936811361
Epoch: 21, step: 402, loss: 0.366001695394516, mean loss: 0.3533396057780448
Epoch: 21, step: 403, loss: 0.4135417938232422, mean loss: 0.3533415649744795
Epoch: 21, step: 404, loss: 0.3310128152370453, mean loss: 0.3533408383400385
Epoch: 21, step: 405, loss: 0.3644765317440033, mean loss: 0.3533412007120985
Epoch: 21, step: 406, loss: 0.31073513627052307, mean loss: 0.35333981429237765
Epoch: 21, step: 407, loss: 0.31701239943504333, mean loss: 0.3533386322210885
Epoch: 21, step: 408, loss: 0.29138457775115967, mean loss: 0.35333661634061897
Epoch: 21, step: 409, loss: 0.3552272319793701, mean loss: 0.35333667785606243
Epoch: 21, step: 410, loss: 0.31886163353919983, mean loss: 0.35333555616924556
Epoch: 21, step: 411, loss: 0.310606986284256, mean loss: 0.35333416598933
Epoch: 21, step: 412, loss: 0.2900351881980896, mean loss: 0.3533321066153575
Epoch: 21, step: 413, loss: 0.33749210834503174, mean loss: 0.3533315912923609
Epoch: 21, step: 414, loss: 0.31718891859054565, mean loss: 0.3533304155002824
Epoch: 21, step: 415, loss: 0.32170233130455017, mean loss: 0.3533293866101003
Epoch: 21, step: 416, loss: 0.32342296838760376, mean loss: 0.35332841375891716
Epoch: 21, step: 417, loss: 0.32160279154777527, mean loss: 0.3533273817628788
Epoch: 21, step: 418, loss: 0.3226354718208313, mean loss: 0.3533263834247224
Epoch: 21, step: 419, loss: 0.3479909300804138, mean loss: 0.35332620988018215
Epoch: 21, step: 420, loss: 0.39020171761512756, mean loss: 0.35332740927870987
Epoch: 21, step: 421, loss: 0.3319467604160309, mean loss: 0.3533267138825978
Epoch: 21, step: 422, loss: 0.3308945298194885, mean loss: 0.3533259843094992
Epoch: 21, step: 423, loss: 0.33334651589393616, mean loss: 0.35332533452842674
Epoch: 21, step: 424, loss: 0.33075860142707825, mean loss: 0.3533246006270608
Epoch: 21, step: 425, loss: 0.329571008682251, mean loss: 0.353323828152526
Epoch: 21, step: 426, loss: 0.3205517828464508, mean loss: 0.35332276242961275
Epoch: 21, step: 427, loss: 0.3329322040081024, mean loss: 0.35332209936514797
Epoch: 21, step: 428, loss: 0.3326075077056885, mean loss: 0.3533214257856058
Epoch: 21, step: 429, loss: 0.3689894676208496, mean loss: 0.3533219352491499
Epoch: 21, step: 430, loss: 0.3464437425136566, mean loss: 0.3533217116044503
Epoch: 21, step: 431, loss: 0.34566476941108704, mean loss: 0.3533214626467772
Epoch: 21, step: 432, loss: 0.3560238182544708, mean loss: 0.3533215505082594
Epoch: 21, step: 433, loss: 0.2878958582878113, mean loss: 0.3533194233968666
Epoch: 21, step: 434, loss: 0.33816710114479065, mean loss: 0.3533189307825992
Epoch: 21, step: 435, loss: 0.3631118834018707, mean loss: 0.35331924914906926
Epoch: 21, step: 436, loss: 0.3396764397621155, mean loss: 0.35331880563912527
Epoch: 21, step: 437, loss: 0.34200116991996765, mean loss: 0.3533184377295056
Epoch: 21, step: 438, loss: 0.30542218685150146, mean loss: 0.35331688078607104
Epoch: 21, step: 439, loss: 0.34821125864982605, mean loss: 0.35331671482513827
Epoch: 21, step: 440, loss: 0.33861038088798523, mean loss: 0.35331623680355734
Epoch: 21, step: 441, loss: 0.32466205954551697, mean loss: 0.3533153054450038
Epoch: 21, step: 442, loss: 0.29421985149383545, mean loss: 0.3533133847034966
Epoch: 21, step: 443, loss: 0.3325973153114319, mean loss: 0.35331271140430937
Epoch: 21, step: 444, loss: 0.37247422337532043, mean loss: 0.35331333415811905
Epoch: 21, step: 445, loss: 0.3134121596813202, mean loss: 0.35331203740236744
Epoch: 21, step: 446, loss: 0.33089473843574524, mean loss: 0.35331130888204093
Epoch: 21, step: 447, loss: 0.31165382266044617, mean loss: 0.3533099551355759
Epoch: 21, step: 448, loss: 0.31959131360054016, mean loss: 0.3533088594139519
Epoch: 21, step: 449, loss: 0.3553926348686218, mean loss: 0.3533089271261588
Epoch: 21, step: 450, loss: 0.3363940119743347, mean loss: 0.3533083774944723
Epoch: 21, step: 451, loss: 0.3373906910419464, mean loss: 0.353307860283449
Epoch: 21, step: 452, loss: 0.33764684200286865, mean loss: 0.3533073514288407
Epoch: 21, step: 453, loss: 0.3331052362918854, mean loss: 0.3533066950471675
Epoch: 21, step: 454, loss: 0.3481679856777191, mean loss: 0.3533065280921212
Epoch: 21, step: 455, loss: 0.29608482122421265, mean loss: 0.35330466903731716
Epoch: 21, step: 456, loss: 0.3552509844303131, mean loss: 0.35330473226838155
Epoch: 21, step: 457, loss: 0.2967175543308258, mean loss: 0.3533028939480015
Epoch: 21, step: 458, loss: 0.32501736283302307, mean loss: 0.35330197507943395
Epoch: 21, step: 459, loss: 0.3029789328575134, mean loss: 0.35330034036522456
Epoch: 21, step: 460, loss: 0.3454262316226959, mean loss: 0.3533000845877764
Epoch: 21, step: 461, loss: 0.2943335175514221, mean loss: 0.3532981692182241
Epoch: 21, step: 462, loss: 0.3148628771305084, mean loss: 0.35329692079219727
Epoch: 21, step: 463, loss: 0.3078237473964691, mean loss: 0.353295443815018
Epoch: 21, step: 464, loss: 0.3135378360748291, mean loss: 0.3532941525224219
Epoch: 21, step: 465, loss: 0.32935187220573425, mean loss: 0.3532933749231911
Epoch: 21, step: 466, loss: 0.3409263491630554, mean loss: 0.3532929732790171
Epoch: 21, step: 467, loss: 0.2930774390697479, mean loss: 0.35329101772126803
Epoch: 21, step: 468, loss: 0.3054312765598297, mean loss: 0.3532894634803314
Epoch: 21, step: 469, loss: 0.3256997764110565, mean loss: 0.35328856753673626
Epoch: 21, step: 470, loss: 0.31587255001068115, mean loss: 0.35328735253373167
Epoch: 21, step: 471, loss: 0.3090372085571289, mean loss: 0.3532859156541377
Epoch: 21, step: 472, loss: 0.34252867102622986, mean loss: 0.3532855663589262
Epoch: 21, step: 473, loss: 0.3824233114719391, mean loss: 0.35328651245104625
Epoch: 21, step: 474, loss: 0.35254746675491333, mean loss: 0.35328648845527705
Epoch: 21, step: 475, loss: 0.3111426830291748, mean loss: 0.3532851201499061
Epoch: 21, step: 476, loss: 0.35192862153053284, mean loss: 0.35328507610917304
Epoch: 21, step: 477, loss: 0.3527207374572754, mean loss: 0.3532850577876792
Epoch: 21, step: 478, loss: 0.3234533369541168, mean loss: 0.3532840893196458
Epoch: 21, step: 479, loss: 0.3674269914627075, mean loss: 0.3532845484451536
Epoch: 21, step: 480, loss: 0.35059982538223267, mean loss: 0.3532844612929685
Epoch: 21, step: 481, loss: 0.34287023544311523, mean loss: 0.3532841232346081
Epoch: 21, step: 482, loss: 0.3574467897415161, mean loss: 0.35328425835540883
Epoch: 21, step: 483, loss: 0.3174167573451996, mean loss: 0.35328309412855186
Epoch: 21, step: 484, loss: 0.3191896677017212, mean loss: 0.35328198752248136
Epoch: 21, step: 485, loss: 0.2894165813922882, mean loss: 0.35327991464334696
Epoch: 21, step: 486, loss: 0.3575063645839691, mean loss: 0.35328005181675715
Epoch: 21, step: 487, loss: 0.3377818763256073, mean loss: 0.35327954882521195
Epoch: 21, step: 488, loss: 0.32115796208381653, mean loss: 0.3532785063565545
Epoch: 21, step: 489, loss: 0.3375031054019928, mean loss: 0.35327799440091895
Epoch: 21, step: 490, loss: 0.37876585125923157, mean loss: 0.3532788215259184
Epoch: 21, step: 491, loss: 0.3675965964794159, mean loss: 0.35327928614737975
Epoch: 21, step: 492, loss: 0.36338499188423157, mean loss: 0.35327961407371056
Epoch: 21, step: 493, loss: 0.3320685029029846, mean loss: 0.3532789258035058
Epoch: 21, step: 494, loss: 0.32544711232185364, mean loss: 0.3532780227302886
Epoch: 21, step: 495, loss: 0.3564433753490448, mean loss: 0.35327812543478626
Epoch: 21, step: 496, loss: 0.30407944321632385, mean loss: 0.35327652916334085
Epoch: 21, step: 497, loss: 0.32148101925849915, mean loss: 0.35327549757843707
Epoch: 21, step: 498, loss: 0.33003589510917664, mean loss: 0.35327474360891853
Epoch: 21, step: 499, loss: 0.3233768343925476, mean loss: 0.35327377365338986
Epoch: 21, step: 500, loss: 0.36214178800582886, mean loss: 0.35327406134241995
Epoch: 21, step: 501, loss: 0.4062981903553009, mean loss: 0.35327578145300886
Epoch: 21, step: 502, loss: 0.3106972575187683, mean loss: 0.35327440024420054
Epoch: 21, step: 503, loss: 0.3186543881893158, mean loss: 0.3532732772387492
Epoch: 21, step: 504, loss: 0.3334655165672302, mean loss: 0.3532726347345917
Epoch: 21, step: 505, loss: 0.3383452296257019, mean loss: 0.35327215055018985
Epoch: 21, step: 506, loss: 0.3755900263786316, mean loss: 0.3532728744279696
Epoch: 21, step: 507, loss: 0.3188745081424713, mean loss: 0.35327175875703404
Epoch: 21, step: 508, loss: 0.3183051347732544, mean loss: 0.35327062469210413
Epoch: 21, step: 509, loss: 0.32860371470451355, mean loss: 0.35326982470150975
Epoch: 21, step: 510, loss: 0.372683584690094, mean loss: 0.35327045430293635
Epoch: 21, step: 511, loss: 0.3037516176700592, mean loss: 0.3532688484254998
Epoch: 21, step: 512, loss: 0.358856737613678, mean loss: 0.3532690296327894
Epoch: 21, step: 513, loss: 0.330793559551239, mean loss: 0.35326830080893307
Epoch: 21, step: 514, loss: 0.3046359717845917, mean loss: 0.35326672383403035
Epoch: 21, step: 515, loss: 0.3384915292263031, mean loss: 0.353266244742117
Epoch: 21, step: 516, loss: 0.3362613618373871, mean loss: 0.3532656933694992
Epoch: 21, step: 517, loss: 0.2954781651496887, mean loss: 0.35326381970604614
Epoch: 21, step: 518, loss: 0.3215700685977936, mean loss: 0.35326279212276607
Epoch: 21, step: 519, loss: 0.30390068888664246, mean loss: 0.3532611917433329
Epoch: 21, step: 520, loss: 0.32409512996673584, mean loss: 0.35326024617478774
Epoch: 21, step: 521, loss: 0.32738834619522095, mean loss: 0.3532594074307049
Epoch: 21, step: 522, loss: 0.3533931374549866, mean loss: 0.3532594117659733
Epoch: 21, step: 523, loss: 0.3664948344230652, mean loss: 0.3532598408188343
Epoch: 21, step: 524, loss: 0.3033340275287628, mean loss: 0.3532582224255869
Epoch: 21, step: 525, loss: 0.3331594467163086, mean loss: 0.3532575709255639
Epoch: 21, step: 526, loss: 0.32754838466644287, mean loss: 0.35325673759159554
Epoch: 21, step: 527, loss: 0.3126199245452881, mean loss: 0.35325542043831387
Epoch: 21, step: 528, loss: 0.3318134546279907, mean loss: 0.35325472546648584
Epoch: 21, step: 529, loss: 0.3678686022758484, mean loss: 0.3532551991125871
Epoch: 21, step: 530, loss: 0.3034707009792328, mean loss: 0.35325358561402503
Epoch: 21, step: 531, loss: 0.3338859975337982, mean loss: 0.35325295793746037
Epoch: 21, step: 532, loss: 0.2933576703071594, mean loss: 0.35325101687748595
Epoch: 21, step: 533, loss: 0.31684961915016174, mean loss: 0.35324983723532744
Epoch: 21, step: 534, loss: 0.348964124917984, mean loss: 0.35324969835486086
Epoch: 21, step: 535, loss: 0.3493817448616028, mean loss: 0.3532495730161216
Epoch: 21, step: 536, loss: 0.32382485270500183, mean loss: 0.3532486195564051
Epoch: 21, step: 537, loss: 0.33502396941185, mean loss: 0.3532480290356953
Epoch: 21, step: 538, loss: 0.3640385568141937, mean loss: 0.35324837866236086
Epoch: 21, step: 539, loss: 0.31621646881103516, mean loss: 0.3532471788208027
Epoch: 21, step: 540, loss: 0.3103821873664856, mean loss: 0.3532457900311881
Epoch: 21, step: 541, loss: 0.3099121153354645, mean loss: 0.35324438610211745
Epoch: 21, step: 542, loss: 0.33373838663101196, mean loss: 0.35324375416511444
Epoch: 21, step: 543, loss: 0.3092367947101593, mean loss: 0.35324232851526816
Epoch: 21, step: 544, loss: 0.31759414076805115, mean loss: 0.35324117369367536
Epoch: 21, step: 545, loss: 0.34048178791999817, mean loss: 0.35324076036728164
Epoch: 21, step: 546, loss: 0.32694482803344727, mean loss: 0.35323990856681087
Epoch: 21, step: 547, loss: 0.3243435323238373, mean loss: 0.3532389725608429
Epoch: 21, step: 548, loss: 0.315120667219162, mean loss: 0.35323773787988083
Epoch: 21, step: 549, loss: 0.33325156569480896, mean loss: 0.3532370905334992
Epoch: 21, step: 550, loss: 0.3447849750518799, mean loss: 0.35323681678077107
Epoch: 21, step: 551, loss: 0.30942612886428833, mean loss: 0.35323539785707897
Epoch: 21, step: 552, loss: 0.3269880414009094, mean loss: 0.3532345477953354
Epoch: 21, step: 553, loss: 0.35665884613990784, mean loss: 0.35323465869300835
Epoch: 21, step: 554, loss: 0.35936906933784485, mean loss: 0.3532348573526361
Epoch: 21, step: 555, loss: 0.32950350642204285, mean loss: 0.35323408885033913
Epoch: 21, step: 556, loss: 0.34267154335975647, mean loss: 0.35323374681007197
Epoch: 21, step: 557, loss: 0.3436412811279297, mean loss: 0.35323343619334757
Epoch: 21, step: 558, loss: 0.3669764995574951, mean loss: 0.35323388119750404
Epoch: 21, step: 559, loss: 0.3092409670352936, mean loss: 0.35323245674101644
Epoch: 21, step: 560, loss: 0.31709909439086914, mean loss: 0.35323128680861077
Epoch: 21, step: 561, loss: 0.4182506501674652, mean loss: 0.3532333919489125
Epoch: 21, step: 562, loss: 0.3107956349849701, mean loss: 0.3532320179806746
Epoch: 21, step: 563, loss: 0.3773767948150635, mean loss: 0.3532327996686063
Epoch: 21, step: 564, loss: 0.3682743012905121, mean loss: 0.3532332866219432
Epoch: 21, step: 565, loss: 0.30902689695358276, mean loss: 0.3532318555313097
Epoch: 21, step: 566, loss: 0.3613962233066559, mean loss: 0.35323211982731095
Epoch: 21, step: 567, loss: 0.3410017788410187, mean loss: 0.3532317239208955
Epoch: 21, step: 568, loss: 0.3484249711036682, mean loss: 0.3532315683273042
Epoch: 21, step: 569, loss: 0.34933027625083923, mean loss: 0.3532314420473768
Epoch: 21, step: 570, loss: 0.33649012446403503, mean loss: 0.3532309001694812
Epoch: 21, step: 571, loss: 0.3489964008331299, mean loss: 0.3532307631129258
Epoch: 21, step: 572, loss: 0.3378310203552246, mean loss: 0.3532302646909833
Epoch: 21, step: 573, loss: 0.33050817251205444, mean loss: 0.35322952930059626
Epoch: 21, step: 574, loss: 0.3467150926589966, mean loss: 0.353229318470581
Epoch: 21, step: 575, loss: 0.34259170293807983, mean loss: 0.3532289742111786
Epoch: 21, step: 576, loss: 0.37696194648742676, mean loss: 0.3532297422436784
Epoch: 21, step: 577, loss: 0.35056692361831665, mean loss: 0.3532296560738957
Epoch: 21, step: 578, loss: 0.31765955686569214, mean loss: 0.35322850504974895
Epoch: 21, step: 579, loss: 0.33989930152893066, mean loss: 0.3532280737397722
Epoch: 21, step: 580, loss: 0.327310711145401, mean loss: 0.35322723512587173
Epoch: 21, step: 581, loss: 0.33409324288368225, mean loss: 0.35322661602303596
Epoch: 21, step: 582, loss: 0.32111048698425293, mean loss: 0.35322557690150885
Epoch: 21, step: 583, loss: 0.3447438180446625, mean loss: 0.3532253024819781
Epoch: 21, step: 584, loss: 0.39470741152763367, mean loss: 0.3532266445541592
Epoch: 21, step: 585, loss: 0.2886609435081482, mean loss: 0.3532245557252674
Epoch: 21, step: 586, loss: 0.3336380422115326, mean loss: 0.35322392208308456
Epoch: 21, step: 587, loss: 0.33413589000701904, mean loss: 0.3532233045872229
Epoch: 21, step: 588, loss: 0.31835347414016724, mean loss: 0.3532221765883083
Epoch: 21, step: 589, loss: 0.3314570486545563, mean loss: 0.3532214725342249
Epoch: 21, step: 590, loss: 0.36033910512924194, mean loss: 0.35322170276655857
Epoch: 21, step: 591, loss: 0.3025868833065033, mean loss: 0.3532200649473239
Epoch: 21, step: 592, loss: 0.2850794196128845, mean loss: 0.3532178609609949
Epoch: 21, step: 593, loss: 0.31908440589904785, mean loss: 0.35321675696154275
Epoch: 21, step: 594, loss: 0.37840530276298523, mean loss: 0.3532175716239122
Epoch: 21, step: 595, loss: 0.308969110250473, mean loss: 0.3532161405611252
Epoch: 21, step: 596, loss: 0.3196928799152374, mean loss: 0.35321505640276535
Epoch: 21, step: 597, loss: 0.3239632546901703, mean loss: 0.3532141104160338
Epoch: 21, step: 598, loss: 0.33211278915405273, mean loss: 0.35321342803330047
Epoch: 21, step: 599, loss: 0.327593594789505, mean loss: 0.35321259955596107
Epoch: 21, step: 600, loss: 0.34151491522789, mean loss: 0.35321222129616064
Epoch: 21, step: 601, loss: 0.32787084579467773, mean loss: 0.35321140187640054
Epoch: 21, step: 602, loss: 0.3211023211479187, mean loss: 0.35321036365475833
Epoch: 21, step: 603, loss: 0.3223344385623932, mean loss: 0.3532093653385047
Epoch: 21, step: 604, loss: 0.32112735509872437, mean loss: 0.3532083280592445
Epoch: 21, step: 605, loss: 0.31976282596588135, mean loss: 0.35320724673036985
Epoch: 21, step: 606, loss: 0.3287714421749115, mean loss: 0.3532064567202003
Epoch: 21, step: 607, loss: 0.3347109854221344, mean loss: 0.3532058587804842
Epoch: 21, step: 608, loss: 0.33874911069869995, mean loss: 0.3532053914236782
Epoch: 21, step: 609, loss: 0.3442729711532593, mean loss: 0.35320510266631505
Epoch: 21, step: 610, loss: 0.32248154282569885, mean loss: 0.35320410950129677
Epoch: 21, step: 611, loss: 0.3333446979522705, mean loss: 0.35320346754979853
Epoch: 21, step: 612, loss: 0.36594682931900024, mean loss: 0.3532038794630988
Epoch: 21, step: 613, loss: 0.31509125232696533, mean loss: 0.353202647559707
Epoch: 21, step: 614, loss: 0.29916250705718994, mean loss: 0.35320090089237766
Epoch: 21, step: 615, loss: 0.35511183738708496, mean loss: 0.353200962655031
Epoch: 21, step: 616, loss: 0.37799033522605896, mean loss: 0.353201763837041
Epoch: 21, step: 617, loss: 0.34563514590263367, mean loss: 0.35320151929506133
Epoch: 21, step: 618, loss: 0.3283943235874176, mean loss: 0.35320071758883675
Epoch: 21, step: 619, loss: 0.39399489760398865, mean loss: 0.35320203591161387
Epoch: 21, step: 620, loss: 0.3129555881023407, mean loss: 0.3532007353316233
Epoch: 21, step: 621, loss: 0.33831125497817993, mean loss: 0.3532002541876837
Epoch: 21, step: 622, loss: 0.3420085608959198, mean loss: 0.3531998925470306
Epoch: 21, step: 623, loss: 0.3199487030506134, mean loss: 0.35319881812575954
Epoch: 21, step: 624, loss: 0.3586180806159973, mean loss: 0.35319899322875126
Epoch: 21, step: 625, loss: 0.3573944568634033, mean loss: 0.3531991287849269
Epoch: 21, step: 626, loss: 0.3257063031196594, mean loss: 0.35319824051554416
Epoch: 21, step: 627, loss: 0.3515505790710449, mean loss: 0.35319818728275
Epoch: 21, step: 628, loss: 0.33004990220069885, mean loss: 0.3531974394300352
Epoch: 21, step: 629, loss: 0.3249008357524872, mean loss: 0.3531965252798873
Epoch: 21, step: 630, loss: 0.3286181390285492, mean loss: 0.3531957312761318
Epoch: 21, step: 631, loss: 0.34943434596061707, mean loss: 0.3531956097686594
Epoch: 21, step: 632, loss: 0.30311617255210876, mean loss: 0.3531939920590229
Epoch: 21, step: 633, loss: 0.3581969439983368, mean loss: 0.35319415366351736
Epoch: 21, step: 634, loss: 0.3284377157688141, mean loss: 0.3531933540111418
Epoch: 21, step: 635, loss: 0.3442326486110687, mean loss: 0.35319306458267286
Epoch: 21, step: 636, loss: 0.34167930483818054, mean loss: 0.35319269270321985
Epoch: 21, step: 637, loss: 0.3861410319805145, mean loss: 0.3531937568573209
Epoch: 21, step: 638, loss: 0.3157147467136383, mean loss: 0.35319254641226894
Epoch: 21, step: 639, loss: 0.3324090242385864, mean loss: 0.3531918751965935
Epoch: 21, step: 640, loss: 0.3097526729106903, mean loss: 0.3531904723481425
Epoch: 21, step: 641, loss: 0.3466668128967285, mean loss: 0.3531902616764558
Epoch: 21, step: 642, loss: 0.3082154393196106, mean loss: 0.35318880932968805
Epoch: 21, step: 643, loss: 0.37755897641181946, mean loss: 0.3531895962764422
Epoch: 21, step: 644, loss: 0.3491261601448059, mean loss: 0.3531894650666475
Epoch: 21, step: 645, loss: 0.3268676698207855, mean loss: 0.35318861515398214
Epoch: 21, step: 646, loss: 0.3192822337150574, mean loss: 0.35318752037559464
Epoch: 21, step: 647, loss: 0.33685916662216187, mean loss: 0.35318699317832764
Epoch: 21, step: 648, loss: 0.36192262172698975, mean loss: 0.3531872752184448
Epoch: 21, step: 649, loss: 0.3162866532802582, mean loss: 0.3531860838766117
Epoch: 21, step: 650, loss: 0.38326847553253174, mean loss: 0.3531870550595546
Epoch: 21, step: 651, loss: 0.3317827880382538, mean loss: 0.3531863640643641
Epoch: 21, step: 652, loss: 0.30686265230178833, mean loss: 0.3531848686415742
Epoch: 21, step: 653, loss: 0.3431738615036011, mean loss: 0.3531845454765172
Epoch: 21, step: 654, loss: 0.3258664906024933, mean loss: 0.35318366365157533
Epoch: 21, step: 655, loss: 0.2935293912887573, mean loss: 0.3531817380779032
Epoch: 21, step: 656, loss: 0.31790778040885925, mean loss: 0.3531805995104693
Epoch: 21, step: 657, loss: 0.32239991426467896, mean loss: 0.3531796060082666
Epoch: 21, step: 658, loss: 0.33323240280151367, mean loss: 0.35317896219704087
Epoch: 21, step: 659, loss: 0.2947872579097748, mean loss: 0.3531770776209924
Epoch: 21, step: 660, loss: 0.32337164878845215, mean loss: 0.3531761156900957
Epoch: 21, step: 661, loss: 0.33262425661087036, mean loss: 0.3531754524273616
Epoch: 21, step: 662, loss: 0.3275134265422821, mean loss: 0.35317462427278434
Epoch: 21, step: 663, loss: 0.33616429567337036, mean loss: 0.3531740753400168
Epoch: 21, step: 664, loss: 0.3458119034767151, mean loss: 0.3531738377663015
Epoch: 21, step: 665, loss: 0.317048579454422, mean loss: 0.3531726720593537
Epoch: 21, step: 666, loss: 0.30647024512290955, mean loss: 0.35317116509194585
Epoch: 21, step: 667, loss: 0.31519007682800293, mean loss: 0.3531699395792889
Epoch: 21, step: 668, loss: 0.34469401836395264, mean loss: 0.35316966610072226
Epoch: 21, step: 669, loss: 0.3225083351135254, mean loss: 0.35316867683405817
Epoch: 21, step: 670, loss: 0.42388617992401123, mean loss: 0.35317095841183166
Epoch: 21, step: 671, loss: 0.3681029975414276, mean loss: 0.3531714401526734
Epoch: 21, step: 672, loss: 0.30969947576522827, mean loss: 0.35317003769551986
Epoch: 21, step: 673, loss: 0.34875619411468506, mean loss: 0.35316989530428233
Epoch: 21, step: 674, loss: 0.3323167562484741, mean loss: 0.3531692226006772
Epoch: 21, step: 675, loss: 0.3408697843551636, mean loss: 0.35316882584460474
Epoch: 21, step: 676, loss: 0.3532555401325226, mean loss: 0.3531688286417496
Epoch: 21, step: 677, loss: 0.3626667261123657, mean loss: 0.3531691350057735
Epoch: 21, step: 678, loss: 0.2952229976654053, mean loss: 0.35316726595641246
Epoch: 21, step: 679, loss: 0.3307703137397766, mean loss: 0.3531665435672944
Epoch: 21, step: 680, loss: 0.2999343276023865, mean loss: 0.3531648266759554
Epoch: 21, step: 681, loss: 0.3092913031578064, mean loss: 0.35316341167487436
Epoch: 21, step: 682, loss: 0.3644251227378845, mean loss: 0.35316377487386375
Epoch: 21, step: 683, loss: 0.32575786113739014, mean loss: 0.3531628910402164
Epoch: 21, step: 684, loss: 0.3197566270828247, mean loss: 0.35316181373156547
Epoch: 21, step: 685, loss: 0.3561429977416992, mean loss: 0.3531619098677799
Epoch: 21, step: 686, loss: 0.35865068435668945, mean loss: 0.353162086862217
Epoch: 21, step: 687, loss: 0.3980386555194855, mean loss: 0.35316353393330746
Epoch: 21, step: 688, loss: 0.30933651328086853, mean loss: 0.3531621207510725
Epoch: 21, step: 689, loss: 0.349595844745636, mean loss: 0.35316200576184165
Epoch: 21, step: 690, loss: 0.3344756066799164, mean loss: 0.3531614032663046
Epoch: 21, step: 691, loss: 0.4224573075771332, mean loss: 0.35316363746492174
Epoch: 21, step: 692, loss: 0.2963142693042755, mean loss: 0.35316180461944474
Epoch: 21, step: 693, loss: 0.3193255066871643, mean loss: 0.3531607137593657
Epoch: 21, step: 694, loss: 0.3815181851387024, mean loss: 0.35316162795619277
Epoch: 21, step: 695, loss: 0.34713414311408997, mean loss: 0.35316143364655894
Epoch: 21, step: 696, loss: 0.32989487051963806, mean loss: 0.3531606836203468
Epoch: 21, step: 697, loss: 0.3331852853298187, mean loss: 0.3531600397096289
Epoch: 21, step: 698, loss: 0.3378573954105377, mean loss: 0.35315954644191466
Epoch: 21, step: 699, loss: 0.3323156237602234, mean loss: 0.35315887457746514
Epoch: 21, step: 700, loss: 0.3661716878414154, mean loss: 0.353159294007385
Epoch: 21, step: 701, loss: 0.32248640060424805, mean loss: 0.353158305388375
Epoch: 21, step: 702, loss: 0.33550798892974854, mean loss: 0.353157736518795
Epoch: 21, step: 703, loss: 0.34058427810668945, mean loss: 0.35315733128937604
Epoch: 21, step: 704, loss: 0.31431323289871216, mean loss: 0.35315607942504296
Epoch: 21, step: 705, loss: 0.3540273606777191, mean loss: 0.3531561075037169
Epoch: 21, step: 706, loss: 0.3122493624687195, mean loss: 0.35315478924955057
Epoch: 21, step: 707, loss: 0.3490346074104309, mean loss: 0.353154656477514
Epoch: 21, step: 708, loss: 0.33412182331085205, mean loss: 0.3531540431680316
Epoch: 21, step: 709, loss: 0.347504198551178, mean loss: 0.3531538611146509
Epoch: 21, step: 710, loss: 0.3127308189868927, mean loss: 0.3531525586161129
Epoch: 21, step: 711, loss: 0.32338252663612366, mean loss: 0.35315159940642155
Epoch: 21, step: 712, loss: 0.4050041139125824, mean loss: 0.35315327007415703
Epoch: 21, step: 713, loss: 0.322176456451416, mean loss: 0.35315227204549465
Epoch: 21, step: 714, loss: 0.3134753704071045, mean loss: 0.35315099375361547
Epoch: 21, step: 715, loss: 0.3231015205383301, mean loss: 0.35315002566491654
Epoch: 21, step: 716, loss: 0.30533257126808167, mean loss: 0.35314848520377173
Epoch: 21, step: 717, loss: 0.35369986295700073, mean loss: 0.3531485029660858
Epoch: 21, step: 718, loss: 0.355684757232666, mean loss: 0.3531485846674119
Epoch: 21, step: 719, loss: 0.31576189398765564, mean loss: 0.3531473803544793
Epoch: 21, step: 720, loss: 0.3253589868545532, mean loss: 0.3531464852540283
Epoch: 21, step: 721, loss: 0.32062920928001404, mean loss: 0.35314543786383396
Epoch: 21, step: 722, loss: 0.35709020495414734, mean loss: 0.3531455649217491
Epoch: 21, step: 723, loss: 0.34578022360801697, mean loss: 0.3531453276974089
Epoch: 21, step: 724, loss: 0.31284523010253906, mean loss: 0.3531440297458615
Epoch: 21, step: 725, loss: 0.3789062201976776, mean loss: 0.3531448594460371
Epoch: 21, step: 726, loss: 0.30397114157676697, mean loss: 0.3531432758024227
Epoch: 21, step: 727, loss: 0.33662909269332886, mean loss: 0.3531427439789296
Epoch: 21, step: 728, loss: 0.3770264983177185, mean loss: 0.3531435131076559
Epoch: 21, step: 729, loss: 0.34567931294441223, mean loss: 0.3531432727457005
Epoch: 21, step: 730, loss: 0.2841545045375824, mean loss: 0.35314105124294065
Epoch: 21, step: 731, loss: 0.3151439130306244, mean loss: 0.35313982773900543
Epoch: 21, step: 732, loss: 0.36904439330101013, mean loss: 0.3531403398478879
Epoch: 21, step: 733, loss: 0.319213330745697, mean loss: 0.3531392474720394
Epoch: 21, step: 734, loss: 0.35683584213256836, mean loss: 0.3531393664905094
Epoch: 21, step: 735, loss: 0.3621767461299896, mean loss: 0.3531396574557264
Epoch: 21, step: 736, loss: 0.32409417629241943, mean loss: 0.35313872234477817
Epoch: 21, step: 737, loss: 0.3151267170906067, mean loss: 0.35313749859855276
Epoch: 21, step: 738, loss: 0.3335285186767578, mean loss: 0.3531368673337064
Epoch: 21, step: 739, loss: 0.35294875502586365, mean loss: 0.3531368612780694
Epoch: 21, step: 740, loss: 0.30777251720428467, mean loss: 0.3531354009740593
Epoch: 21, step: 741, loss: 0.3407615125179291, mean loss: 0.35313500266438136
Epoch: 21, step: 742, loss: 0.357965350151062, mean loss: 0.3531351581460013
Epoch: 21, step: 743, loss: 0.3228335380554199, mean loss: 0.3531341828138238
Epoch: 21, step: 744, loss: 0.3193727135658264, mean loss: 0.3531330961528676
Epoch: 21, step: 745, loss: 0.3248402774333954, mean loss: 0.3531321855375242
Epoch: 21, step: 746, loss: 0.34063369035720825, mean loss: 0.3531317832815562
Epoch: 21, step: 747, loss: 0.3250699043273926, mean loss: 0.35313088015723354
Epoch: 21, step: 748, loss: 0.35717475414276123, mean loss: 0.35313101029832017
Epoch: 21, step: 749, loss: 0.38815566897392273, mean loss: 0.35313213743543403
Epoch: 21, step: 750, loss: 0.3364221453666687, mean loss: 0.353131599704394
Epoch: 21, step: 751, loss: 0.3125711977481842, mean loss: 0.3531302945041766
Epoch: 21, step: 752, loss: 0.35821253061294556, mean loss: 0.35313045804107235
Epoch: 21, step: 753, loss: 0.3409935235977173, mean loss: 0.3531300675096854
Epoch: 21, step: 754, loss: 0.32405829429626465, mean loss: 0.3531291320943499
Epoch: 21, step: 755, loss: 0.3218071758747101, mean loss: 0.3531281243094007
Epoch: 21, step: 756, loss: 0.30392253398895264, mean loss: 0.3531265411688866
Epoch: 21, step: 757, loss: 0.3071158826351166, mean loss: 0.3531250608697252
Epoch: 21, step: 758, loss: 0.32107827067375183, mean loss: 0.3531240298627376
Epoch: 21, step: 759, loss: 0.32090914249420166, mean loss: 0.35312299348108245
Epoch: 21, step: 760, loss: 0.36342868208885193, mean loss: 0.35312332501360966
Epoch: 21, step: 761, loss: 0.3783074915409088, mean loss: 0.3531241351585793
Epoch: 21, step: 762, loss: 0.37980857491493225, mean loss: 0.35312499353795834
Epoch: 21, step: 763, loss: 0.3465419411659241, mean loss: 0.35312478178254236
Epoch: 21, step: 764, loss: 0.35240378975868225, mean loss: 0.3531247585913164
Epoch: 21, step: 765, loss: 0.33595356345176697, mean loss: 0.353124206285265
Epoch: 21, step: 766, loss: 0.31353211402893066, mean loss: 0.35312293285912055
Epoch: 21, step: 767, loss: 0.353392094373703, mean loss: 0.3531229415160585
Epoch: 21, step: 768, loss: 0.32837915420532227, mean loss: 0.3531221457167689
Epoch: 21, step: 769, loss: 0.32044172286987305, mean loss: 0.35312109469654485
Epoch: 21, step: 770, loss: 0.32399678230285645, mean loss: 0.35312015807289493
Epoch: 21, step: 771, loss: 0.3410710394382477, mean loss: 0.3531197705915908
Epoch: 21, step: 772, loss: 0.3261467516422272, mean loss: 0.35311890320827566
Epoch: 21, step: 773, loss: 0.3608781397342682, mean loss: 0.35311915271745714
Epoch: 21, step: 774, loss: 0.37135398387908936, mean loss: 0.35311973906528704
Epoch: 21, step: 775, loss: 0.312381774187088, mean loss: 0.3531184291628794
Epoch: 21, step: 776, loss: 0.29765209555625916, mean loss: 0.35311664573682855
Epoch: 21, step: 777, loss: 0.30101078748703003, mean loss: 0.3531149704150406
Epoch: 21, step: 778, loss: 0.3202020525932312, mean loss: 0.35311391222393934
Epoch: 21, step: 779, loss: 0.3668191134929657, mean loss: 0.35311435284898013
Epoch: 21, step: 780, loss: 0.32644394040107727, mean loss: 0.3531134954172988
Epoch: 21, step: 781, loss: 0.30918535590171814, mean loss: 0.3531120832093802
Epoch: 21, step: 782, loss: 0.393363356590271, mean loss: 0.35311337717129815
Epoch: 21, step: 783, loss: 0.3516556918621063, mean loss: 0.35311333031244163
Epoch: 21, step: 784, loss: 0.36234283447265625, mean loss: 0.3531136269952074
Epoch: 21, step: 785, loss: 0.3180083632469177, mean loss: 0.3531124985714289
Epoch: 21, step: 786, loss: 0.29524165391921997, mean loss: 0.3531106384304932
Epoch: 21, step: 787, loss: 0.31108418107032776, mean loss: 0.35310928761867266
Epoch: 21, step: 788, loss: 0.35385122895240784, mean loss: 0.35310931146533914
Epoch: 21, step: 789, loss: 0.3650944232940674, mean loss: 0.35310969666530795
Epoch: 21, step: 790, loss: 0.342252641916275, mean loss: 0.3531093477321648
Epoch: 21, step: 791, loss: 0.40783166885375977, mean loss: 0.353111106387555
Epoch: 21, step: 792, loss: 0.35848090052604675, mean loss: 0.3531112789554162
Epoch: 21, step: 793, loss: 0.301535040140152, mean loss: 0.35310962151474473
Epoch: 21, step: 794, loss: 0.33166590332984924, mean loss: 0.35310893242710745
Epoch: 21, step: 795, loss: 0.33597078919410706, mean loss: 0.35310838171556397
Epoch: 21, step: 796, loss: 0.3344804644584656, mean loss: 0.3531077831513386
Epoch: 21, step: 797, loss: 0.37363487482070923, mean loss: 0.35310844271986475
Epoch: 21, step: 798, loss: 0.30051425099372864, mean loss: 0.3531067528380498
Epoch: 21, step: 799, loss: 0.3058624267578125, mean loss: 0.35310523489928614
Epoch: 21, step: 800, loss: 0.3036445677280426, mean loss: 0.3531036458015457
Epoch: 21, step: 801, loss: 0.33786582946777344, mean loss: 0.353103156248878
Epoch: 21, step: 802, loss: 0.3716471493244171, mean loss: 0.3531037520015389
Epoch: 21, step: 803, loss: 0.3328537344932556, mean loss: 0.3531031014612694
Epoch: 21, step: 804, loss: 0.2952958345413208, mean loss: 0.3531012444383351
Epoch: 21, step: 805, loss: 0.3480842709541321, mean loss: 0.3531010832763215
Epoch: 21, step: 806, loss: 0.38577020168304443, mean loss: 0.35310213268425594
Epoch: 21, step: 807, loss: 0.33159416913986206, mean loss: 0.35310144182072184
Epoch: 21, step: 808, loss: 0.35681432485580444, mean loss: 0.35310156107948376
Epoch: 21, step: 809, loss: 0.31979021430015564, mean loss: 0.35310049114478925
Epoch: 21, step: 810, loss: 0.3159821033477783, mean loss: 0.35309929896917347
Epoch: 21, step: 811, loss: 0.34960049390792847, mean loss: 0.3530991865974796
Epoch: 21, step: 812, loss: 0.3125448226928711, mean loss: 0.35309788414817794
Epoch: 21, step: 813, loss: 0.31502678990364075, mean loss: 0.35309666149115937
Epoch: 21, step: 814, loss: 0.29406648874282837, mean loss: 0.3530947657921084
Epoch: 21, step: 815, loss: 0.35154759883880615, mean loss: 0.3530947161078774
Epoch: 21, step: 816, loss: 0.35969826579093933, mean loss: 0.35309492816110893
Epoch: 21, step: 817, loss: 0.36556127667427063, mean loss: 0.353095328467721
Epoch: 21, step: 818, loss: 0.3161799907684326, mean loss: 0.35309414311827814
Epoch: 21, step: 819, loss: 0.34431084990501404, mean loss: 0.35309386109627666
Epoch: 21, step: 820, loss: 0.2869206666946411, mean loss: 0.35309173641512714
Epoch: 21, step: 821, loss: 0.39267972111701965, mean loss: 0.3530930074606772
Epoch: 21, step: 822, loss: 0.41368597745895386, mean loss: 0.3530949528477128
Epoch: 21, step: 823, loss: 0.3386373817920685, mean loss: 0.35309448869042964
Epoch: 21, step: 824, loss: 0.35008183121681213, mean loss: 0.3530943919727991
Epoch: 21, step: 825, loss: 0.3544211685657501, mean loss: 0.3530944345659482
Epoch: 21, step: 826, loss: 0.34785300493240356, mean loss: 0.35309426630715607
Epoch: 21, step: 827, loss: 0.3564226031303406, mean loss: 0.3530943731489904
Epoch: 21, step: 828, loss: 0.3071866035461426, mean loss: 0.35309289952623807
Epoch: 21, step: 829, loss: 0.31467655301094055, mean loss: 0.353091666415032
Epoch: 21, step: 830, loss: 0.33321720361709595, mean loss: 0.3530910284929393
Epoch: 21, step: 831, loss: 0.3271562457084656, mean loss: 0.35309019607597997
Epoch: 21, step: 832, loss: 0.3579515814781189, mean loss: 0.35309035210465417
Epoch: 21, step: 833, loss: 0.3353559672832489, mean loss: 0.3530897829286858
Epoch: 21, step: 834, loss: 0.34996461868286133, mean loss: 0.35308968263136414
Epoch: 21, step: 835, loss: 0.3226274251937866, mean loss: 0.35308870502361583
Epoch: 21, step: 836, loss: 0.2986547350883484, mean loss: 0.35308695816151464
Epoch: 21, step: 837, loss: 0.31238672137260437, mean loss: 0.35308565207600057
Epoch: 21, step: 838, loss: 0.3409734070301056, mean loss: 0.35308526340209095
Epoch: 21, step: 839, loss: 0.32838574051856995, mean loss: 0.3530844708362174
Epoch: 21, step: 840, loss: 0.2988753914833069, mean loss: 0.3530827314144509
Epoch: 21, step: 841, loss: 0.3594614863395691, mean loss: 0.3530829360847623
Epoch: 21, step: 842, loss: 0.3549497425556183, mean loss: 0.35308299598165555
Epoch: 21, step: 843, loss: 0.32348793745040894, mean loss: 0.3530820464482068
Epoch: 21, step: 844, loss: 0.3395070731639862, mean loss: 0.35308161092017304
Epoch: 21, step: 845, loss: 0.34499529004096985, mean loss: 0.35308135149377334
Epoch: 21, step: 846, loss: 0.34010180830955505, mean loss: 0.35308093509573724
Epoch: 21, step: 847, loss: 0.34148961305618286, mean loss: 0.35308056324529324
Epoch: 21, step: 848, loss: 0.32455673813819885, mean loss: 0.3530796482282879
Epoch: 21, step: 849, loss: 0.29069045186042786, mean loss: 0.3530776469067903
Epoch: 21, step: 850, loss: 0.3047177195549011, mean loss: 0.35307609566613746
Epoch: 21, step: 851, loss: 0.3651246130466461, mean loss: 0.3530764821338492
Epoch: 21, step: 852, loss: 0.32445037364959717, mean loss: 0.3530755639535084
Epoch: 21, step: 853, loss: 0.3318907916545868, mean loss: 0.353074884475277
Epoch: 21, step: 854, loss: 0.35528379678726196, mean loss: 0.35307495532143346
Epoch: 21, step: 855, loss: 0.313689261674881, mean loss: 0.35307369214973217
Epoch: 21, step: 856, loss: 0.36129987239837646, mean loss: 0.3530739559700153
Epoch: 21, step: 857, loss: 0.3181157410144806, mean loss: 0.35307283486761787
Epoch: 21, step: 858, loss: 0.3337264060974121, mean loss: 0.35307221445172554
Epoch: 21, step: 859, loss: 0.33808839321136475, mean loss: 0.353071733954636
Epoch: 21, step: 860, loss: 0.2833699584007263, mean loss: 0.3530694988487981
Epoch: 21, step: 861, loss: 0.3152679204940796, mean loss: 0.3530682867158425
Epoch: 21, step: 862, loss: 0.3127300441265106, mean loss: 0.3530669932845221
Epoch: 21, step: 863, loss: 0.32701683044433594, mean loss: 0.3530661580221507
Epoch: 21, step: 864, loss: 0.36435654759407043, mean loss: 0.3530665200212392
Epoch: 21, step: 865, loss: 0.3437855541706085, mean loss: 0.35306622245901254
Epoch: 21, step: 866, loss: 0.31342583894729614, mean loss: 0.3530649515672966
Epoch: 21, step: 867, loss: 0.33381763100624084, mean loss: 0.3530643345077762
Epoch: 21, step: 868, loss: 0.31223517656326294, mean loss: 0.35306302558725094
Epoch: 21, step: 869, loss: 0.397254079580307, mean loss: 0.35306444223961975
Epoch: 21, step: 870, loss: 0.29030200839042664, mean loss: 0.3530624303007241
Epoch: 21, step: 871, loss: 0.3220802843570709, mean loss: 0.35306143715589966
Epoch: 21, step: 872, loss: 0.29108479619026184, mean loss: 0.35305945053407817
Epoch: 21, step: 873, loss: 0.3399611711502075, mean loss: 0.3530590306905182
Epoch: 21, step: 874, loss: 0.3429708778858185, mean loss: 0.3530587073419235
Epoch: 21, step: 875, loss: 0.33691835403442383, mean loss: 0.3530581900229072
Epoch: 21, step: 876, loss: 0.3290897011756897, mean loss: 0.3530574218267325
Epoch: 21, step: 877, loss: 0.3453645706176758, mean loss: 0.3530571752767931
Epoch: 21, step: 878, loss: 0.34483057260513306, mean loss: 0.3530569116289813
Epoch: 21, step: 879, loss: 0.32591691613197327, mean loss: 0.35305604186883843
Epoch: 21, step: 880, loss: 0.3376592695713043, mean loss: 0.3530555484616185
Epoch: 21, step: 881, loss: 0.3602232038974762, mean loss: 0.35305577814999367
Epoch: 21, step: 882, loss: 0.33048298954963684, mean loss: 0.3530550548254639
Epoch: 21, step: 883, loss: 0.382663369178772, mean loss: 0.35305600356663136
Epoch: 21, step: 884, loss: 0.35276171565055847, mean loss: 0.3530559941370464
Epoch: 21, step: 885, loss: 0.32879823446273804, mean loss: 0.35305521689386554
Epoch: 21, step: 886, loss: 0.32453975081443787, mean loss: 0.3530543032587344
Epoch: 21, step: 887, loss: 0.3077491521835327, mean loss: 0.3530528517288396
Epoch: 21, step: 888, loss: 0.3038520812988281, mean loss: 0.3530512754378573
Epoch: 21, step: 889, loss: 0.3069441616535187, mean loss: 0.35304979830856326
Epoch: 21, step: 890, loss: 0.3403366804122925, mean loss: 0.35304939103264155
Epoch: 21, step: 891, loss: 0.3334425091743469, mean loss: 0.35304876292904536
Epoch: 21, step: 892, loss: 0.3959706723690033, mean loss: 0.3530501378820979
Epoch: 21, step: 893, loss: 0.3338031470775604, mean loss: 0.35304952134706025
Epoch: 21, step: 894, loss: 0.36539286375045776, mean loss: 0.3530499167262333
Epoch: 21, step: 895, loss: 0.3381134569644928, mean loss: 0.353049438300232
Epoch: 21, step: 896, loss: 0.3157607913017273, mean loss: 0.3530482439551758
Epoch: 21, step: 897, loss: 0.3632734715938568, mean loss: 0.3530485714559009
Epoch: 21, step: 898, loss: 0.3683050870895386, mean loss: 0.3530490600865781
Epoch: 21, step: 899, loss: 0.35188451409339905, mean loss: 0.3530490227900756
Epoch: 21, step: 900, loss: 0.34414270520210266, mean loss: 0.3530487375597285
Epoch: 21, step: 901, loss: 0.3773621618747711, mean loss: 0.3530495161872925
Epoch: 21, step: 902, loss: 0.3384639322757721, mean loss: 0.35304904910483464
Epoch: 21, step: 903, loss: 0.3218996524810791, mean loss: 0.3530480516219147
Epoch: 21, step: 904, loss: 0.31082481145858765, mean loss: 0.35304669956965035
Epoch: 21, step: 905, loss: 0.30960965156555176, mean loss: 0.3530453086939538
Epoch: 21, step: 906, loss: 0.3641560971736908, mean loss: 0.35304566445548813
Epoch: 21, step: 907, loss: 0.30981478095054626, mean loss: 0.35304428026992507
Epoch: 21, step: 908, loss: 0.30848339200019836, mean loss: 0.3530428535453623
Epoch: 21, step: 909, loss: 0.3066319525241852, mean loss: 0.3530413676357439
Epoch: 21, step: 910, loss: 0.33834731578826904, mean loss: 0.35304089720027576
Epoch: 21, step: 911, loss: 0.3415910303592682, mean loss: 0.353040530640318
Epoch: 21, step: 912, loss: 0.3541540503501892, mean loss: 0.353040566287778
Epoch: 21, step: 913, loss: 0.3158630132675171, mean loss: 0.3530393761490681
Epoch: 21, step: 914, loss: 0.28325992822647095, mean loss: 0.35303714242046214
Epoch: 21, step: 915, loss: 0.30697473883628845, mean loss: 0.3530356679517174
Epoch: 21, step: 916, loss: 0.3133692145347595, mean loss: 0.35303439825953675
Epoch: 21, step: 917, loss: 0.34221306443214417, mean loss: 0.3530340518881832
Epoch: 21, step: 918, loss: 0.35918769240379333, mean loss: 0.35303424884879886
Epoch: 21, step: 919, loss: 0.4050138592720032, mean loss: 0.35303591251575644
Epoch: 21, step: 920, loss: 0.31032031774520874, mean loss: 0.35303454539798496
Epoch: 21, step: 921, loss: 0.34943538904190063, mean loss: 0.3530344302102375
Epoch: 21, step: 922, loss: 0.3280266225337982, mean loss: 0.3530336298835605
Epoch: 21, step: 923, loss: 0.3351271450519562, mean loss: 0.3530330568393711
Epoch: 21, step: 924, loss: 0.34107574820518494, mean loss: 0.35303267419325013
Epoch: 21, step: 925, loss: 0.3439718186855316, mean loss: 0.3530323842458739
Epoch: 21, step: 926, loss: 0.3359014093875885, mean loss: 0.35303183607222
Epoch: 21, step: 927, loss: 0.31624460220336914, mean loss: 0.3530306589560716
Epoch: 21, step: 928, loss: 0.32586371898651123, mean loss: 0.3530297896974414
Epoch: 21, step: 929, loss: 0.3378252387046814, mean loss: 0.35302930321407955
Epoch: 21, step: 930, loss: 0.3247445225715637, mean loss: 0.3530283982458939
Epoch: 21, step: 931, loss: 0.28820592164993286, mean loss: 0.35302632432483566
Epoch: 21, step: 932, loss: 0.31335917115211487, mean loss: 0.3530250552602046
Epoch: 21, step: 933, loss: 0.31887584924697876, mean loss: 0.3530239627652909
Epoch: 21, step: 934, loss: 0.31590691208839417, mean loss: 0.3530227753616415
Epoch: 21, step: 935, loss: 0.359476238489151, mean loss: 0.35302298180639924
Epoch: 21, step: 936, loss: 0.3345487415790558, mean loss: 0.3530223908387326
Epoch: 21, step: 937, loss: 0.3778765797615051, mean loss: 0.3530231858674871
Epoch: 21, step: 938, loss: 0.3383047878742218, mean loss: 0.35302271507460115
Epoch: 21, step: 939, loss: 0.31517672538757324, mean loss: 0.35302150454524833
Epoch: 21, step: 940, loss: 0.34984326362609863, mean loss: 0.3530214028903333
Epoch: 21, step: 941, loss: 0.34184184670448303, mean loss: 0.3530210453276075
Epoch: 21, step: 942, loss: 0.3352067768573761, mean loss: 0.3530204755809586
Epoch: 21, step: 943, loss: 0.34328025579452515, mean loss: 0.35302016407335385
Epoch: 21, step: 944, loss: 0.37411442399024963, mean loss: 0.3530208386795106
Epoch: 21, step: 945, loss: 0.3031952381134033, mean loss: 0.3530192452800682
Epoch: 21, step: 946, loss: 0.34222137928009033, mean loss: 0.35301889998039754
Epoch: 21, step: 947, loss: 0.3246634602546692, mean loss: 0.35301799324466826
Epoch: 21, step: 948, loss: 0.316670686006546, mean loss: 0.35301683098625886
Epoch: 21, step: 949, loss: 0.29453763365745544, mean loss: 0.35301496108802616
Epoch: 21, step: 950, loss: 0.3309592306613922, mean loss: 0.35301425586882784
Epoch: 21, step: 951, loss: 0.3164346516132355, mean loss: 0.35301308629457745
Epoch: 21, step: 952, loss: 0.3023989200592041, mean loss: 0.35301146803943034
Epoch: 21, step: 953, loss: 0.34429770708084106, mean loss: 0.35301118944869697
Epoch: 21, step: 954, loss: 0.3204647898674011, mean loss: 0.35301014892951216
Epoch: 21, step: 955, loss: 0.3296358287334442, mean loss: 0.3530094016686363
Epoch: 21, step: 956, loss: 0.33359307050704956, mean loss: 0.35300878096178034
Epoch: 21, step: 957, loss: 0.3896484971046448, mean loss: 0.3530099522333149
Epoch: 21, step: 958, loss: 0.31785136461257935, mean loss: 0.3530088283453367
Epoch: 21, step: 959, loss: 0.3234587609767914, mean loss: 0.35300788377087794
Epoch: 21, step: 960, loss: 0.3099243640899658, mean loss: 0.35300650664063404
Epoch: 21, step: 961, loss: 0.33428919315338135, mean loss: 0.35300590837580353
Epoch: 21, step: 962, loss: 0.30812129378318787, mean loss: 0.35300447376671373
Epoch: 21, step: 963, loss: 0.33599555492401123, mean loss: 0.353003930142358
Epoch: 21, step: 964, loss: 0.34730297327041626, mean loss: 0.3530037479391277
Epoch: 21, step: 965, loss: 0.3269931972026825, mean loss: 0.35300291666553435
Epoch: 21, step: 966, loss: 0.32938480377197266, mean loss: 0.35300216187620537
Epoch: 21, step: 967, loss: 0.44924354553222656, mean loss: 0.3530052374668885
Epoch: 21, step: 968, loss: 0.29506102204322815, mean loss: 0.3530033857998887
Epoch: 21, step: 969, loss: 0.3296029269695282, mean loss: 0.3530026380380548
Epoch: 21, step: 970, loss: 0.3415040075778961, mean loss: 0.3530022706109751
Epoch: 21, step: 971, loss: 0.333663672208786, mean loss: 0.35300165268541267
Epoch: 21, step: 972, loss: 0.3088057339191437, mean loss: 0.35300024053987905
Epoch: 21, step: 973, loss: 0.3339345157146454, mean loss: 0.35299963137236595
Epoch: 21, step: 974, loss: 0.32169002294540405, mean loss: 0.35299863103342777
Epoch: 21, step: 975, loss: 0.36274999380111694, mean loss: 0.3529989425785641
Epoch: 21, step: 976, loss: 0.3448045253753662, mean loss: 0.3529986807844616
Epoch: 21, step: 977, loss: 0.29329001903533936, mean loss: 0.3529967732813708
Epoch: 21, step: 978, loss: 0.3157825171947479, mean loss: 0.3529955844414485
Epoch: 21, step: 979, loss: 0.3405543863773346, mean loss: 0.3529951870098722
Epoch: 21, step: 980, loss: 0.33806636929512024, mean loss: 0.35299471012701916
Epoch: 21, step: 981, loss: 0.3696519732475281, mean loss: 0.3529952422059536
Epoch: 21, step: 982, loss: 0.3473280370235443, mean loss: 0.3529950611855689
Epoch: 21, step: 983, loss: 0.3138613700866699, mean loss: 0.3529938112273761
Epoch: 21, step: 984, loss: 0.3055122494697571, mean loss: 0.3529922946806401
Epoch: 21, step: 985, loss: 0.38194793462753296, mean loss: 0.35299321948549306
Epoch: 21, step: 986, loss: 0.3245840072631836, mean loss: 0.35299231216179777
Epoch: 21, step: 987, loss: 0.3175564110279083, mean loss: 0.3529911804582613
Epoch: 21, step: 988, loss: 0.35142087936401367, mean loss: 0.35299113030972573
Epoch: 21, step: 989, loss: 0.3182128667831421, mean loss: 0.3529900196798628
Epoch: 21, step: 990, loss: 0.3577623963356018, mean loss: 0.35299017207892575
Epoch: 21, step: 991, loss: 0.37661173939704895, mean loss: 0.3529909263760045
Epoch: 21, step: 992, loss: 0.3815494775772095, mean loss: 0.3529918382944897
Epoch: 21, step: 993, loss: 0.36612191796302795, mean loss: 0.35299225754475055
Epoch: 21, step: 994, loss: 0.30165496468544006, mean loss: 0.3529906183706754
Epoch: 21, step: 995, loss: 0.3395431637763977, mean loss: 0.3529901890138876
Epoch: 21, step: 996, loss: 0.34634771943092346, mean loss: 0.3529899769367003
Epoch: 21, step: 997, loss: 0.32773739099502563, mean loss: 0.35298917071149305
Epoch: 21, step: 998, loss: 0.3290395140647888, mean loss: 0.3529884061085927
Epoch: 21, step: 999, loss: 0.3317320942878723, mean loss: 0.3529877275135276
Epoch: 21, step: 1000, loss: 0.3200334310531616, mean loss: 0.3529866755008712
Epoch: 21, step: 1001, loss: 0.33575892448425293, mean loss: 0.35298612555031844
Epoch: 21, step: 1002, loss: 0.35613158345222473, mean loss: 0.35298622595756785
Epoch: 21, step: 1003, loss: 0.3062179684638977, mean loss: 0.3529847330995018
Epoch: 21, step: 1004, loss: 0.3272915780544281, mean loss: 0.3529839129917727
Epoch: 21, step: 1005, loss: 0.32951170206069946, mean loss: 0.3529831637989565
Epoch: 21, step: 1006, loss: 0.34765326976776123, mean loss: 0.35298299368328734
Epoch: 21, step: 1007, loss: 0.3125925660133362, mean loss: 0.3529817045722293
Epoch: 21, step: 1008, loss: 0.29368776082992554, mean loss: 0.35297981219219093
Epoch: 21, step: 1009, loss: 0.31185460090637207, mean loss: 0.35297849971337286
Epoch: 21, step: 1010, loss: 0.3480685353279114, mean loss: 0.35297834302071657
Epoch: 21, step: 1011, loss: 0.3709457218647003, mean loss: 0.35297891639890283
Epoch: 21, step: 1012, loss: 0.37177035212516785, mean loss: 0.3529795160554024
Epoch: 21, step: 1013, loss: 0.37141549587249756, mean loss: 0.3529801043501186
Epoch: 21, step: 1014, loss: 0.3073762357234955, mean loss: 0.3529786491706736
Epoch: 21, step: 1015, loss: 0.30910447239875793, mean loss: 0.3529772492288494
Epoch: 21, step: 1016, loss: 0.32539132237434387, mean loss: 0.3529763690422933
Epoch: 21, step: 1017, loss: 0.33877599239349365, mean loss: 0.3529759159641027
Epoch: 21, step: 1018, loss: 0.3102662265300751, mean loss: 0.3529745533093015
Epoch: 21, step: 1019, loss: 0.3273411989212036, mean loss: 0.3529737355019257
Epoch: 21, step: 1020, loss: 0.34224581718444824, mean loss: 0.35297339324898847
Epoch: 21, step: 1021, loss: 0.3340347707271576, mean loss: 0.35297278906910834
Epoch: 21, step: 1022, loss: 0.3627890944480896, mean loss: 0.35297310221886363
Epoch: 21, step: 1023, loss: 0.3368794620037079, mean loss: 0.3529725888323568
Epoch: 21, step: 1024, loss: 0.3269691467285156, mean loss: 0.3529717593500096
Epoch: 21, step: 1025, loss: 0.30922621488571167, mean loss: 0.35297036395784165
Epoch: 21, step: 1026, loss: 0.31649014353752136, mean loss: 0.3529692003515637
Epoch: 21, step: 1027, loss: 0.3355966806411743, mean loss: 0.3529686462395546
Epoch: 21, step: 1028, loss: 0.3603375554084778, mean loss: 0.3529688812699877
Epoch: 21, step: 1029, loss: 0.33285000920295715, mean loss: 0.3529682396015541
Epoch: 21, step: 1030, loss: 0.3003232479095459, mean loss: 0.35296656060325426
Epoch: 21, step: 1031, loss: 0.3124344050884247, mean loss: 0.35296526795892735
Epoch: 21, step: 1032, loss: 0.3352542817592621, mean loss: 0.3529647031413045
Epoch: 21, step: 1033, loss: 0.3252338171005249, mean loss: 0.35296381880920297
Epoch: 21, step: 1034, loss: 0.3327338993549347, mean loss: 0.35296317370191466
Epoch: 21, step: 1035, loss: 0.3247188329696655, mean loss: 0.35296227305329436
Epoch: 21, step: 1036, loss: 0.42155691981315613, mean loss: 0.35296446031284473
Epoch: 21, step: 1037, loss: 0.3478335738182068, mean loss: 0.3529642967108265
Epoch: 21, step: 1038, loss: 0.31938499212265015, mean loss: 0.3529632260446087
Epoch: 21, step: 1039, loss: 0.32169845700263977, mean loss: 0.35296222920845766
Epoch: 21, step: 1040, loss: 0.3496881127357483, mean loss: 0.35296212482087685
Epoch: 21, step: 1041, loss: 0.31847092509269714, mean loss: 0.3529610251843364
Epoch: 21, step: 1042, loss: 0.35500556230545044, mean loss: 0.35296109036548606
Epoch: 21, step: 1043, loss: 0.30023816227912903, mean loss: 0.3529594095784392
Epoch: 21, step: 1044, loss: 0.3838456869125366, mean loss: 0.3529603941899134
Epoch: 21, step: 1045, loss: 0.3547559976577759, mean loss: 0.3529604514294246
Epoch: 21, step: 1046, loss: 0.34002310037612915, mean loss: 0.3529600390309976
Epoch: 21, step: 1047, loss: 0.34977051615715027, mean loss: 0.3529599373631768
Epoch: 21, step: 1048, loss: 0.3121754229068756, mean loss: 0.35295863737546584
Epoch: 21, step: 1049, loss: 0.3156532943248749, mean loss: 0.3529574483226498
Epoch: 21, step: 1050, loss: 0.29146912693977356, mean loss: 0.3529554885355141
Epoch: 21, step: 1051, loss: 0.3445151448249817, mean loss: 0.35295521952914904
Epoch: 21, step: 1052, loss: 0.31535089015960693, mean loss: 0.352954021061183
Epoch: 21, step: 1053, loss: 0.35907626152038574, mean loss: 0.3529542161736968
Epoch: 21, step: 1054, loss: 0.2760595381259918, mean loss: 0.352951765659721
Epoch: 21, step: 1055, loss: 0.29518750309944153, mean loss: 0.35294992486104154
Epoch: 21, step: 1056, loss: 0.34072884917259216, mean loss: 0.35294953541915985
Epoch: 21, step: 1057, loss: 0.3340757489204407, mean loss: 0.3529489339983932
Epoch: 21, step: 1058, loss: 0.3895636796951294, mean loss: 0.35295010070475324
Epoch: 21, step: 1059, loss: 0.363426148891449, mean loss: 0.3529504345069514
Epoch: 21, step: 1060, loss: 0.33227819204330444, mean loss: 0.3529497758406311
Epoch: 21, step: 1061, loss: 0.33094537258148193, mean loss: 0.35294907475086945
Epoch: 21, step: 1062, loss: 0.3377736508846283, mean loss: 0.3529485912569431
Epoch: 21, step: 1063, loss: 0.3514384925365448, mean loss: 0.3529485431462409
Epoch: 21, step: 1064, loss: 0.32920363545417786, mean loss: 0.35294778667398335
Epoch: 21, step: 1065, loss: 0.35651665925979614, mean loss: 0.35294790036855445
Epoch: 21, step: 1066, loss: 0.3407500386238098, mean loss: 0.352947511790244
Epoch: 21, step: 1067, loss: 0.3226310908794403, mean loss: 0.35294654605308445
Epoch: 21, step: 1068, loss: 0.29986339807510376, mean loss: 0.3529448551300131
Epoch: 21, step: 1069, loss: 0.3324350118637085, mean loss: 0.352944201825456
Epoch: 21, step: 1070, loss: 0.35296374559402466, mean loss: 0.35294420244796815
Epoch: 21, step: 1071, loss: 0.313757061958313, mean loss: 0.3529429542908625
Epoch: 21, step: 1072, loss: 0.3690915107727051, mean loss: 0.35294346862524095
Epoch: 21, step: 1073, loss: 0.3334169089794159, mean loss: 0.35294284672067233
Epoch: 21, step: 1074, loss: 0.3238176703453064, mean loss: 0.3529419191377437
Epoch: 21, step: 1075, loss: 0.3296189308166504, mean loss: 0.352941176367415
Epoch: 21, step: 1076, loss: 0.33852431178092957, mean loss: 0.35294071724622184
Epoch: 21, step: 1077, loss: 0.2954005002975464, mean loss: 0.35293888487194797
Epoch: 21, step: 1078, loss: 0.34011438488960266, mean loss: 0.3529384764873993
Epoch: 21, step: 1079, loss: 0.3279578387737274, mean loss: 0.3529376810270212
Epoch: 21, step: 1080, loss: 0.3265341520309448, mean loss: 0.3529368402841779
Epoch: 21, step: 1081, loss: 0.3465273380279541, mean loss: 0.35293663619889937
Epoch: 21, step: 1082, loss: 0.3306266665458679, mean loss: 0.35293592584867
Epoch: 21, step: 1083, loss: 0.3153746724128723, mean loss: 0.35293472993509906
Epoch: 21, step: 1084, loss: 0.35440173745155334, mean loss: 0.3529347766416964
Epoch: 21, step: 1085, loss: 0.3784107565879822, mean loss: 0.35293558772033207
Epoch: 21, step: 1086, loss: 0.3135681748390198, mean loss: 0.35293433442012256
Epoch: 21, step: 1087, loss: 0.33005058765411377, mean loss: 0.35293360591678735
Epoch: 21, step: 1088, loss: 0.33609673380851746, mean loss: 0.35293306993257356
Epoch: 21, step: 1089, loss: 0.32327353954315186, mean loss: 0.35293212578250066
Epoch: 21, step: 1090, loss: 0.3327134847640991, mean loss: 0.3529314821841872
Epoch: 21, step: 1091, loss: 0.2931869924068451, mean loss: 0.35292958046246015
Epoch: 21, step: 1092, loss: 0.2868417203426361, mean loss: 0.35292747689241466
Epoch: 21, step: 1093, loss: 0.3732519745826721, mean loss: 0.35292812379857325
Epoch: 21, step: 1094, loss: 0.35600727796554565, mean loss: 0.35292822180150674
Epoch: 21, step: 1095, loss: 0.3459862470626831, mean loss: 0.3529280008602356
Epoch: 21, step: 1096, loss: 0.3078663647174835, mean loss: 0.3529265667354101
Epoch: 21, step: 1097, loss: 0.3228154480457306, mean loss: 0.35292560845399296
Epoch: 21, step: 1098, loss: 0.37004348635673523, mean loss: 0.35292615321031484
Epoch: 21, step: 1099, loss: 0.3142940104007721, mean loss: 0.3529249238269515
Epoch: 21, step: 1100, loss: 0.3579760491847992, mean loss: 0.352925084562842
Epoch: 21, step: 1101, loss: 0.3247244954109192, mean loss: 0.3529241871979482
Epoch: 21, step: 1102, loss: 0.326598584651947, mean loss: 0.3529233495232562
Epoch: 21, step: 1103, loss: 0.27168336510658264, mean loss: 0.35292076456766197
Epoch: 21, step: 1104, loss: 0.3363877236843109, mean loss: 0.3529202385235345
Epoch: 21, step: 1105, loss: 0.3061726987361908, mean loss: 0.352918751169421
Epoch: 21, step: 1106, loss: 0.3922557234764099, mean loss: 0.3529200027036486
Epoch: 21, step: 1107, loss: 0.3545999228954315, mean loss: 0.3529200561498242
Epoch: 21, step: 1108, loss: 0.3367256224155426, mean loss: 0.35291954094498423
Epoch: 21, step: 1109, loss: 0.3395380675792694, mean loss: 0.3529191152443618
Epoch: 21, step: 1110, loss: 0.3588019013404846, mean loss: 0.3529193023856405
Epoch: 21, step: 1111, loss: 0.3480278551578522, mean loss: 0.3529191467854615
Epoch: 21, step: 1112, loss: 0.35914331674575806, mean loss: 0.352919344774136
Epoch: 21, step: 1113, loss: 0.2970940172672272, mean loss: 0.3529175690464336
Epoch: 21, step: 1114, loss: 0.3660494089126587, mean loss: 0.3529179867391041
Epoch: 21, step: 1115, loss: 0.29476305842399597, mean loss: 0.3529161370276437
Epoch: 21, step: 1116, loss: 0.33141231536865234, mean loss: 0.35291545308560435
Epoch: 21, step: 1117, loss: 0.3102821409702301, mean loss: 0.35291409715048205
Epoch: 21, step: 1118, loss: 0.35902419686317444, mean loss: 0.3529142914735337
Epoch: 21, step: 1119, loss: 0.30617496371269226, mean loss: 0.3529128050428073
Epoch: 21, step: 1120, loss: 0.31930267810821533, mean loss: 0.35291173618839694
Epoch: 21, step: 1121, loss: 0.3164924085140228, mean loss: 0.3529105780338566
Epoch: 21, step: 1122, loss: 0.3317664563655853, mean loss: 0.3529099056606042
Epoch: 21, step: 1123, loss: 0.3261801302433014, mean loss: 0.3529090556931844
Epoch: 21, step: 1124, loss: 0.32011809945106506, mean loss: 0.3529080130223128
Epoch: 21, step: 1125, loss: 0.31817173957824707, mean loss: 0.35290690853031137
Epoch: 21, step: 1126, loss: 0.33490437269210815, mean loss: 0.35290633613083794
Epoch: 21, step: 1127, loss: 0.29532989859580994, mean loss: 0.35290450551791874
Epoch: 21, step: 1128, loss: 0.3621487319469452, mean loss: 0.35290479942395087
Epoch: 21, step: 1129, loss: 0.36911630630493164, mean loss: 0.35290531482761595
Epoch: 21, step: 1130, loss: 0.3405184745788574, mean loss: 0.35290492103202703
Epoch: 21, step: 1131, loss: 0.38303104043006897, mean loss: 0.35290587875454094
Epoch: 21, step: 1132, loss: 0.32513493299484253, mean loss: 0.3529049959320925
Epoch: 21, step: 1133, loss: 0.3455158472061157, mean loss: 0.3529047610427567
Epoch: 21, step: 1134, loss: 0.34171533584594727, mean loss: 0.352904405359957
Epoch: 21, step: 1135, loss: 0.31314364075660706, mean loss: 0.352903141508571
Epoch: 21, step: 1136, loss: 0.34090521931648254, mean loss: 0.35290276014999394
Epoch: 21, step: 1137, loss: 0.3007723391056061, mean loss: 0.3529011032171529
Epoch: 21, step: 1138, loss: 0.342428058385849, mean loss: 0.3529007703485507
Epoch: 21, step: 1139, loss: 0.3132598400115967, mean loss: 0.35289951046645257
Epoch: 21, step: 1140, loss: 0.3097391128540039, mean loss: 0.35289813877099374
Epoch: 21, step: 1141, loss: 0.3286091089248657, mean loss: 0.3528973668575047
Epoch: 21, step: 1142, loss: 0.3389696776866913, mean loss: 0.35289692424495284
Epoch: 21, step: 1143, loss: 0.3090076446533203, mean loss: 0.35289552951762376
Epoch: 21, step: 1144, loss: 0.34985604882240295, mean loss: 0.35289543293111975
Epoch: 21, step: 1145, loss: 0.3696785271167755, mean loss: 0.35289596623566966
Epoch: 21, step: 1146, loss: 0.2971407473087311, mean loss: 0.3528941945976878
Epoch: 21, step: 1147, loss: 0.3244517743587494, mean loss: 0.3528932908603899
Epoch: 21, step: 1148, loss: 0.363884836435318, mean loss: 0.3528936400976909
Epoch: 21, step: 1149, loss: 0.3229139745235443, mean loss: 0.35289268757606757
Epoch: 21, step: 1150, loss: 0.32959336042404175, mean loss: 0.3528919473273892
Epoch: 21, step: 1151, loss: 0.3257196247577667, mean loss: 0.3528910840562439
Epoch: 21, step: 1152, loss: 0.3266175091266632, mean loss: 0.35289024936504304
Epoch: 21, step: 1153, loss: 0.26853230595588684, mean loss: 0.3528875694634162
Epoch: 21, step: 1154, loss: 0.3923596739768982, mean loss: 0.3528888233820449
Epoch: 21, step: 1155, loss: 0.2960546612739563, mean loss: 0.35288701797664124
Epoch: 21, step: 1156, loss: 0.42131587862968445, mean loss: 0.3528891916325179
Epoch: 21, step: 1157, loss: 0.3503805696964264, mean loss: 0.3528891119481924
Epoch: 21, step: 1158, loss: 0.3605332374572754, mean loss: 0.3528893547498793
Epoch: 21, step: 1159, loss: 0.36800315976142883, mean loss: 0.3528898347970465
Epoch: 21, step: 1160, loss: 0.2985357940196991, mean loss: 0.3528881084498724
Epoch: 21, step: 1161, loss: 0.3289511799812317, mean loss: 0.35288734820949674
Epoch: 21, step: 1162, loss: 0.33744552731513977, mean loss: 0.3528868577905653
Epoch: 21, step: 1163, loss: 0.32813066244125366, mean loss: 0.35288607158009305
Epoch: 21, step: 1164, loss: 0.3236798346042633, mean loss: 0.35288514407407584
Epoch: 21, step: 1165, loss: 0.3389729857444763, mean loss: 0.3528847022780031
Epoch: 21, step: 1166, loss: 0.32590627670288086, mean loss: 0.35288384557527613
Epoch: 21, step: 1167, loss: 0.31124135851860046, mean loss: 0.3528825232557329
Epoch: 21, step: 1168, loss: 0.37519893050193787, mean loss: 0.35288323187057574
Epoch: 21, step: 1169, loss: 0.30716925859451294, mean loss: 0.3528817803568501
Epoch: 21, step: 1170, loss: 0.3169797658920288, mean loss: 0.3528806404294183
Epoch: 21, step: 1171, loss: 0.3119942545890808, mean loss: 0.3528793422840716
Epoch: 21, step: 1172, loss: 0.31424954533576965, mean loss: 0.3528781158245056
Epoch: 21, step: 1173, loss: 0.3490784764289856, mean loss: 0.35287799519337365
Epoch: 21, step: 1174, loss: 0.34241974353790283, mean loss: 0.3528776631748443
Epoch: 21, step: 1175, loss: 0.300859272480011, mean loss: 0.35287601179736194
Epoch: 21, step: 1176, loss: 0.33599451184272766, mean loss: 0.3528754758937413
Epoch: 21, step: 1177, loss: 0.30980944633483887, mean loss: 0.35287410880499903
Epoch: 21, step: 1178, loss: 0.33591750264167786, mean loss: 0.35287357055130375
Epoch: 21, step: 1179, loss: 0.39891210198402405, mean loss: 0.3528750319064152
Epoch: 21, step: 1180, loss: 0.32147490978240967, mean loss: 0.3528740352353432
Epoch: 21, step: 1181, loss: 0.3045923411846161, mean loss: 0.35287250277504834
Epoch: 21, step: 1182, loss: 0.3421228229999542, mean loss: 0.35287216159119156
Epoch: 21, step: 1183, loss: 0.32155516743659973, mean loss: 0.3528711676533296
Epoch: 21, step: 1184, loss: 0.31694814562797546, mean loss: 0.3528700275656713
Epoch: 21, step: 1185, loss: 0.3432714343070984, mean loss: 0.35286972294512997
Epoch: 21, step: 1186, loss: 0.36265239119529724, mean loss: 0.3528700333976148
Epoch: 21, step: 1187, loss: 0.31807002425193787, mean loss: 0.3528689290561212
Epoch: 21, step: 1188, loss: 0.3320738971233368, mean loss: 0.3528682691687118
Epoch: 21, step: 1189, loss: 0.3552089333534241, mean loss: 0.35286834344250073
Epoch: 21, step: 1190, loss: 0.3692058026790619, mean loss: 0.3528688618451419
Epoch: 21, step: 1191, loss: 0.32051366567611694, mean loss: 0.3528678352175188
Epoch: 21, step: 1192, loss: 0.33425620198249817, mean loss: 0.3528672446907163
Epoch: 21, step: 1193, loss: 0.295837938785553, mean loss: 0.35286543527051495
Epoch: 21, step: 1194, loss: 0.35262539982795715, mean loss: 0.35286542765493567
Epoch: 21, step: 1195, loss: 0.34791016578674316, mean loss: 0.352865270444851
Epoch: 21, step: 1196, loss: 0.3245910108089447, mean loss: 0.35286437344730537
Epoch: 21, step: 1197, loss: 0.34012308716773987, mean loss: 0.35286396924432717
Epoch: 21, step: 1198, loss: 0.3608075976371765, mean loss: 0.3528642212390102
Epoch: 21, step: 1199, loss: 0.3904545307159424, mean loss: 0.35286541367364654
Epoch: 21, step: 1200, loss: 0.36120375990867615, mean loss: 0.3528656781731306
Epoch: 21, step: 1201, loss: 0.3202744126319885, mean loss: 0.3528646443830671
Epoch: 21, step: 1202, loss: 0.32791510224342346, mean loss: 0.35286385301242795
Epoch: 21, step: 1203, loss: 0.36041831970214844, mean loss: 0.35286409262377944
Epoch: 21, step: 1204, loss: 0.32970502972602844, mean loss: 0.3528633580916694
Epoch: 21, step: 1205, loss: 0.299343466758728, mean loss: 0.3528616606640978
Epoch: 21, step: 1206, loss: 0.35488075017929077, mean loss: 0.352861724699159
Epoch: 21, step: 1207, loss: 0.3425082862377167, mean loss: 0.3528613963521318
Epoch: 21, step: 1208, loss: 0.338007390499115, mean loss: 0.3528609252898842
Epoch: 21, step: 1209, loss: 0.34638264775276184, mean loss: 0.35286071985202233
Epoch: 21, step: 1210, loss: 0.32998111844062805, mean loss: 0.35285999432161447
Epoch: 21, step: 1211, loss: 0.3404256999492645, mean loss: 0.35285960003272643
Epoch: 21, step: 1212, loss: 0.3003537058830261, mean loss: 0.3528579351345386
Epoch: 21, step: 1213, loss: 0.2974376976490021, mean loss: 0.3528561778817805
Epoch: 21, step: 1214, loss: 0.3194776773452759, mean loss: 0.3528551195571495
Epoch: 21, step: 1215, loss: 0.3805031180381775, mean loss: 0.35285599615824276
Epoch: 21, step: 1216, loss: 0.37540769577026367, mean loss: 0.3528567111545844
Epoch: 21, step: 1217, loss: 0.3092601001262665, mean loss: 0.35285532897808863
Epoch: 21, step: 1218, loss: 0.30458304286003113, mean loss: 0.35285379861363003
Epoch: 21, step: 1219, loss: 0.3539472818374634, mean loss: 0.35285383327896175
Epoch: 21, step: 1220, loss: 0.32658153772354126, mean loss: 0.35285300042762063
Epoch: 21, step: 1221, loss: 0.32321467995643616, mean loss: 0.3528520609005658
Epoch: 21, step: 1222, loss: 0.31815972924232483, mean loss: 0.3528509611975304
Epoch: 21, step: 1223, loss: 0.36976903676986694, mean loss: 0.3528514974621295
Epoch: 21, step: 1224, loss: 0.32931721210479736, mean loss: 0.35285075150234135
Epoch: 21, step: 1225, loss: 0.3283511996269226, mean loss: 0.3528499749713786
Epoch: 21, step: 1226, loss: 0.34798216819763184, mean loss: 0.352849820687623
Epoch: 21, step: 1227, loss: 0.3111453652381897, mean loss: 0.35284849891862424
Epoch: 21, step: 1228, loss: 0.3328396677970886, mean loss: 0.35284786478459196
Epoch: 21, step: 1229, loss: 0.35913965106010437, mean loss: 0.35284806418201464
Epoch: 21, step: 1230, loss: 0.3146474063396454, mean loss: 0.3528468535764738
Epoch: 21, step: 1231, loss: 0.3292211890220642, mean loss: 0.3528461048863814
Epoch: 21, step: 1232, loss: 0.3661820590496063, mean loss: 0.3528465274853028
Epoch: 21, step: 1233, loss: 0.32455721497535706, mean loss: 0.35284563106244615
Epoch: 21, step: 1234, loss: 0.3415452837944031, mean loss: 0.3528452729919348
Epoch: 21, step: 1235, loss: 0.3595566749572754, mean loss: 0.3528454856472569
Epoch: 21, step: 1236, loss: 0.34244343638420105, mean loss: 0.35284515606171574
Epoch: 21, step: 1237, loss: 0.35366758704185486, mean loss: 0.3528451821193477
Epoch: 21, step: 1238, loss: 0.3025270402431488, mean loss: 0.3528435879064441
Epoch: 21, step: 1239, loss: 0.3145888149738312, mean loss: 0.35284237593163315
Epoch: 21, step: 1240, loss: 0.33912038803100586, mean loss: 0.3528419412100142
Epoch: 21, step: 1241, loss: 0.33553314208984375, mean loss: 0.352841392873224
Epoch: 21, step: 1242, loss: 0.3352000415325165, mean loss: 0.3528408340189984
Epoch: 21, step: 1243, loss: 0.32158663868904114, mean loss: 0.35283984395959234
Epoch: 21, step: 1244, loss: 0.32382774353027344, mean loss: 0.35283892495359187
Epoch: 21, step: 1245, loss: 0.3448841869831085, mean loss: 0.35283867298216426
Epoch: 21, step: 1246, loss: 0.3282625079154968, mean loss: 0.3528378945410295
Epoch: 21, step: 1247, loss: 0.3354300856590271, mean loss: 0.35283734317244714
Epoch: 21, step: 1248, loss: 0.3314228951931, mean loss: 0.3528366649205237
Epoch: 21, step: 1249, loss: 0.3262661397457123, mean loss: 0.3528358233887198
Epoch: 21, step: 1250, loss: 0.3290015161037445, mean loss: 0.35283506854129987
Epoch: 21, step: 1251, loss: 0.3209131956100464, mean loss: 0.3528340575876347
Epoch: 21, step: 1252, loss: 0.30516666173934937, mean loss: 0.3528325480270099
Epoch: 21, step: 1253, loss: 0.29024478793144226, mean loss: 0.3528305660218134
Epoch: 21, step: 1254, loss: 0.33492663502693176, mean loss: 0.3528299990649435
Epoch: 21, step: 1255, loss: 0.31927597522735596, mean loss: 0.3528289365562723
Epoch: 21, step: 1256, loss: 0.41045787930488586, mean loss: 0.3528307613541808
Epoch: 21, step: 1257, loss: 0.3526581823825836, mean loss: 0.35283075588970825
Epoch: 21, step: 1258, loss: 0.38175785541534424, mean loss: 0.3528316717969851
Epoch: 21, step: 1259, loss: 0.3360581398010254, mean loss: 0.35283114072011085
Epoch: 21, step: 1260, loss: 0.3357407748699188, mean loss: 0.3528305996289014
Epoch: 21, step: 1261, loss: 0.3063347339630127, mean loss: 0.35282912758857765
Epoch: 21, step: 1262, loss: 0.29352736473083496, mean loss: 0.35282725017816013
Epoch: 21, step: 1263, loss: 0.3154543340206146, mean loss: 0.3528260670416476
Epoch: 21, step: 1264, loss: 0.33768340945243835, mean loss: 0.3528255876767551
Epoch: 21, step: 1265, loss: 0.3471754491329193, mean loss: 0.35282540881830166
Epoch: 21, step: 1266, loss: 0.29583391547203064, mean loss: 0.35282360477622177
Epoch: 21, step: 1267, loss: 0.3405807614326477, mean loss: 0.35282321724636156
Epoch: 21, step: 1268, loss: 0.3162081837654114, mean loss: 0.3528220582860387
Epoch: 21, step: 1269, loss: 0.3266908824443817, mean loss: 0.35282123119305137
Epoch: 21, step: 1270, loss: 0.3393820524215698, mean loss: 0.35282080583528047
Epoch: 21, step: 1271, loss: 0.3393403887748718, mean loss: 0.3528203791857976
Epoch: 21, step: 1272, loss: 0.3203413486480713, mean loss: 0.3528193512707887
Epoch: 21, step: 1273, loss: 0.34775787591934204, mean loss: 0.35281919108737986
Epoch: 21, step: 1274, loss: 0.3198220431804657, mean loss: 0.3528181468407927
Epoch: 21, step: 1275, loss: 0.3123207092285156, mean loss: 0.3528168652763113
Epoch: 21, step: 1276, loss: 0.3419092297554016, mean loss: 0.352816520108895
Epoch: 21, step: 1277, loss: 0.31415411829948425, mean loss: 0.3528152966925983
Epoch: 21, step: 1278, loss: 0.3088221549987793, mean loss: 0.35281390463672724
Epoch: 21, step: 1279, loss: 0.3538225591182709, mean loss: 0.35281393655213295
Epoch: 21, step: 1280, loss: 0.34315067529678345, mean loss: 0.35281363080110445
Epoch: 21, step: 1281, loss: 0.3037846088409424, mean loss: 0.35281207954431903
Epoch: 21, step: 1282, loss: 0.368332177400589, mean loss: 0.352812570577883
Epoch: 21, step: 1283, loss: 0.3472881615161896, mean loss: 0.35281239579905926
Epoch: 21, step: 1284, loss: 0.3529013693332672, mean loss: 0.35281239861387576
Epoch: 21, step: 1285, loss: 0.32676100730895996, mean loss: 0.3528115744635656
Epoch: 21, step: 1286, loss: 0.28697043657302856, mean loss: 0.35280949160829717
Epoch: 21, step: 1287, loss: 0.32035139203071594, mean loss: 0.35280846484315803
Epoch: 21, step: 1288, loss: 0.36054757237434387, mean loss: 0.35280870965091216
Epoch: 21, step: 1289, loss: 0.3510236442089081, mean loss: 0.35280865318651533
Epoch: 21, step: 1290, loss: 0.3202546238899231, mean loss: 0.3528076234844974
Epoch: 21, step: 1291, loss: 0.3149574100971222, mean loss: 0.3528064262991043
Epoch: 21, step: 1292, loss: 0.3153553605079651, mean loss: 0.3528052417760379
Epoch: 21, step: 1293, loss: 0.35946428775787354, mean loss: 0.35280545238537375
Epoch: 21, step: 1294, loss: 0.3459341526031494, mean loss: 0.3528052350698425
Epoch: 21, step: 1295, loss: 0.34998220205307007, mean loss: 0.35280514578986094
Epoch: 21, step: 1296, loss: 0.34603092074394226, mean loss: 0.3528049315580199
Epoch: 21, step: 1297, loss: 0.3226492702960968, mean loss: 0.35280397792886103
Epoch: 21, step: 1298, loss: 0.33335763216018677, mean loss: 0.3528033629857573
Epoch: 21, step: 1299, loss: 0.34205421805381775, mean loss: 0.35280302308109845
Epoch: 21, step: 1300, loss: 0.32772913575172424, mean loss: 0.35280223023090623
Epoch: 21, step: 1301, loss: 0.37139707803726196, mean loss: 0.35280281819169185
Epoch: 21, step: 1302, loss: 0.3472122848033905, mean loss: 0.3528026414271113
Epoch: 21, step: 1303, loss: 0.28728801012039185, mean loss: 0.3528005700147139
Epoch: 21, step: 1304, loss: 0.33237558603286743, mean loss: 0.3527999242470961
Epoch: 21, step: 1305, loss: 0.30806389451026917, mean loss: 0.35279850989269407
Epoch: 21, step: 1306, loss: 0.3194437026977539, mean loss: 0.3527974553952961
Epoch: 21, step: 1307, loss: 0.3232586681842804, mean loss: 0.3527965215691956
Epoch: 21, step: 1308, loss: 0.3056553900241852, mean loss: 0.35279503131751083
Epoch: 21, step: 1309, loss: 0.3827008903026581, mean loss: 0.35279597668828233
Epoch: 21, step: 1310, loss: 0.34198907017707825, mean loss: 0.35279563507593803
Epoch: 21, step: 1311, loss: 0.31812193989753723, mean loss: 0.3527945390557339
Epoch: 21, step: 1312, loss: 0.328864187002182, mean loss: 0.3527937826517748
Epoch: 21, step: 1313, loss: 0.35803505778312683, mean loss: 0.35279394831569577
Epoch: 21, step: 1314, loss: 0.34786540269851685, mean loss: 0.3527937925413155
Epoch: 21, step: 1315, loss: 0.3488338887691498, mean loss: 0.352793667386329
Epoch: 21, step: 1316, loss: 0.32385537028312683, mean loss: 0.35279275280407485
Epoch: 21, step: 1317, loss: 0.3368363082408905, mean loss: 0.3527922485235438
Epoch: 21, step: 1318, loss: 0.33168825507164, mean loss: 0.3527915815831952
Epoch: 21, step: 1319, loss: 0.31195032596588135, mean loss: 0.35279029093550157
Epoch: 21, step: 1320, loss: 0.3407893180847168, mean loss: 0.3527899116979332
Epoch: 21, step: 1321, loss: 0.30935096740722656, mean loss: 0.3527885390459617
Epoch: 21, step: 1322, loss: 0.30186906456947327, mean loss: 0.35278693006329426
Epoch: 21, step: 1323, loss: 0.3306271731853485, mean loss: 0.35278622986875185
Epoch: 21, step: 1324, loss: 0.3358836770057678, mean loss: 0.3527856958059738
Epoch: 21, step: 1325, loss: 0.32735803723335266, mean loss: 0.3527848924044391
Epoch: 21, step: 1326, loss: 0.34614133834838867, mean loss: 0.35278468250414985
Epoch: 21, step: 1327, loss: 0.3277987539768219, mean loss: 0.35278389310921343
Epoch: 21, step: 1328, loss: 0.3486108183860779, mean loss: 0.3527837612710078
Epoch: 21, step: 1329, loss: 0.3782941997051239, mean loss: 0.3527845671861665
Epoch: 21, step: 1330, loss: 0.3643700182437897, mean loss: 0.35278493317735454
Epoch: 21, step: 1331, loss: 0.3716971278190613, mean loss: 0.3527855306057928
Epoch: 21, step: 1332, loss: 0.3425479531288147, mean loss: 0.3527852072151532
Epoch: 21, step: 1333, loss: 0.3564012050628662, mean loss: 0.3527853214358193
Epoch: 21, step: 1334, loss: 0.3259182572364807, mean loss: 0.352784472796753
Epoch: 21, step: 1335, loss: 0.3298199474811554, mean loss: 0.3527837474485118
Epoch: 21, step: 1336, loss: 0.2980785667896271, mean loss: 0.3527820196072984
Epoch: 21, step: 1337, loss: 0.310305655002594, mean loss: 0.35278067805071306
Epoch: 21, step: 1338, loss: 0.37715259194374084, mean loss: 0.3527814477792256
Epoch: 21, step: 1339, loss: 0.3578009605407715, mean loss: 0.3527816063035043
Epoch: 21, step: 1340, loss: 0.33049577474594116, mean loss: 0.35278090250336036
Epoch: 21, step: 1341, loss: 0.32622721791267395, mean loss: 0.3527800639482984
Epoch: 21, step: 1342, loss: 0.29253822565078735, mean loss: 0.3527781615944822
Epoch: 21, step: 1343, loss: 0.32797807455062866, mean loss: 0.3527773784668125
Epoch: 21, step: 1344, loss: 0.3538636267185211, mean loss: 0.35277741276686153
Epoch: 21, step: 1345, loss: 0.3166520595550537, mean loss: 0.3527762720863054
Epoch: 21, step: 1346, loss: 0.33455386757850647, mean loss: 0.35277569672068676
Epoch: 21, step: 1347, loss: 0.37062203884124756, mean loss: 0.35277626019448444
Epoch: 21, step: 1348, loss: 0.3439349830150604, mean loss: 0.3527759810520862
Epoch: 21, step: 1349, loss: 0.34906336665153503, mean loss: 0.35277586383877557
Epoch: 21, step: 1350, loss: 0.3334786593914032, mean loss: 0.35277525461369436
Epoch: 21, step: 1351, loss: 0.31886276602745056, mean loss: 0.35277418400854893
Epoch: 21, step: 1352, loss: 0.33773601055145264, mean loss: 0.35277370927377427
Epoch: 21, step: 1353, loss: 0.32362374663352966, mean loss: 0.3527727890779715
Epoch: 21, step: 1354, loss: 0.30879390239715576, mean loss: 0.3527714008117169
Epoch: 21, step: 1355, loss: 0.3286202549934387, mean loss: 0.35277063846494233
Epoch: 21, step: 1356, loss: 0.3836880326271057, mean loss: 0.3527716143619835
Epoch: 21, step: 1357, loss: 0.33105704188346863, mean loss: 0.3527709289705159
Epoch: 21, step: 1358, loss: 0.36743107438087463, mean loss: 0.35277139168381355
Epoch: 21, step: 1359, loss: 0.35137900710105896, mean loss: 0.35277134773782876
Epoch: 21, step: 1360, loss: 0.3237801790237427, mean loss: 0.35277043275696357
Epoch: 21, step: 1361, loss: 0.3705376386642456, mean loss: 0.35277099348428503
Epoch: 21, step: 1362, loss: 0.3419972360134125, mean loss: 0.3527706534786843
Epoch: 21, step: 1363, loss: 0.3415909707546234, mean loss: 0.3527703006737511
Epoch: 21, step: 1364, loss: 0.32839739322662354, mean loss: 0.35276953154542745
Epoch: 21, step: 1365, loss: 0.3344880938529968, mean loss: 0.3527689546619408
Epoch: 21, step: 1366, loss: 0.33462411165237427, mean loss: 0.3527683821068618
Epoch: 21, step: 1367, loss: 0.31495827436447144, mean loss: 0.35276718905789856
Epoch: 21, step: 1368, loss: 0.31964513659477234, mean loss: 0.35276614396742234
Epoch: 21, step: 1369, loss: 0.35489580035209656, mean loss: 0.3527662111617299
Epoch: 21, step: 1370, loss: 0.31565845012664795, mean loss: 0.3527650403852341
Epoch: 21, step: 1371, loss: 0.3304705023765564, mean loss: 0.3527643369987497
Epoch: 21, step: 1372, loss: 0.3329150080680847, mean loss: 0.35276371077769
Epoch: 21, step: 1373, loss: 0.3412284255027771, mean loss: 0.35276334686560484
Epoch: 21, step: 1374, loss: 0.3266673684120178, mean loss: 0.3527625236226491
Epoch: 21, step: 1375, loss: 0.3059605360031128, mean loss: 0.35276104721925416
Epoch: 21, step: 1376, loss: 0.3542086184024811, mean loss: 0.3527610928825198
Epoch: 21, step: 1377, loss: 0.3163071274757385, mean loss: 0.35275994298770535
Epoch: 21, step: 1378, loss: 0.3597898781299591, mean loss: 0.35276016473123567
Epoch: 21, step: 1379, loss: 0.3372327387332916, mean loss: 0.35275967496887134
Epoch: 21, step: 1380, loss: 0.3655562698841095, mean loss: 0.3527600785832828
Epoch: 21, step: 1381, loss: 0.3544967770576477, mean loss: 0.3527601333583561
Epoch: 21, step: 1382, loss: 0.30398935079574585, mean loss: 0.35275859518752434
Epoch: 21, step: 1383, loss: 0.3448803126811981, mean loss: 0.35275834672396605
Epoch: 21, step: 1384, loss: 0.3609197437763214, mean loss: 0.3527586041082119
Epoch: 21, step: 1385, loss: 0.3301886320114136, mean loss: 0.35275789234624105
Epoch: 21, step: 1386, loss: 0.32689720392227173, mean loss: 0.35275707683463864
Epoch: 21, step: 1387, loss: 0.4109867811203003, mean loss: 0.3527589130387344
Epoch: 21, step: 1388, loss: 0.3287133574485779, mean loss: 0.35275815481480133
Epoch: 21, step: 1389, loss: 0.3119693994522095, mean loss: 0.3527568686712886
Epoch: 21, step: 1390, loss: 0.3235723674297333, mean loss: 0.3527559484599929
Epoch: 21, step: 1391, loss: 0.3357571065425873, mean loss: 0.35275541248944436
Epoch: 21, step: 1392, loss: 0.33091408014297485, mean loss: 0.3527547238577217
Epoch: 21, step: 1393, loss: 0.30362552404403687, mean loss: 0.3527531749202158
Epoch: 21, step: 1394, loss: 0.34791138768196106, mean loss: 0.3527530222739395
Epoch: 21, step: 1395, loss: 0.32659855484962463, mean loss: 0.3527521977320913
Epoch: 21, step: 1396, loss: 0.3576957881450653, mean loss: 0.3527523535780739
Epoch: 21, step: 1397, loss: 0.39372023940086365, mean loss: 0.3527536450441171
Epoch: 21, step: 1398, loss: 0.31961309909820557, mean loss: 0.35275260035900075
Epoch: 21, step: 1399, loss: 0.3326095640659332, mean loss: 0.35275196541270476
Epoch: 21, step: 1400, loss: 0.30454176664352417, mean loss: 0.35275044578468995
Epoch: 21, step: 1401, loss: 0.3427143096923828, mean loss: 0.35275012944679385
Epoch: 21, step: 1402, loss: 0.3278031647205353, mean loss: 0.35274934314601764
Epoch: 21, step: 1403, loss: 0.339801162481308, mean loss: 0.3527489350465262
Epoch: 21, step: 1404, loss: 0.2856719493865967, mean loss: 0.35274682098728516
Epoch: 21, step: 1405, loss: 0.30268362164497375, mean loss: 0.35274524319972317
Epoch: 21, step: 1406, loss: 0.3182052671909332, mean loss: 0.3527441546750625
Epoch: 21, step: 1407, loss: 0.30576762557029724, mean loss: 0.35274267426005224
Epoch: 21, step: 1408, loss: 0.32043391466140747, mean loss: 0.3527416561161768
Epoch: 21, step: 1409, loss: 0.29143932461738586, mean loss: 0.35273972436059925
Epoch: 21, step: 1410, loss: 0.3725878596305847, mean loss: 0.35274034979419844
Epoch: 21, step: 1411, loss: 0.31247246265411377, mean loss: 0.3527390809548003
Epoch: 21, step: 1412, loss: 0.3358374536037445, mean loss: 0.35273854840202745
Epoch: 21, step: 1413, loss: 0.3180801570415497, mean loss: 0.3527374563864196
Epoch: 21, step: 1414, loss: 0.35778993368148804, mean loss: 0.3527376155747146
Epoch: 21, step: 1415, loss: 0.32418614625930786, mean loss: 0.35273671603251816
Epoch: 21, step: 1416, loss: 0.3238062858581543, mean loss: 0.3527358045795024
Epoch: 21, step: 1417, loss: 0.3210696876049042, mean loss: 0.3527348069701213
Epoch: 21, step: 1418, loss: 0.3778512179851532, mean loss: 0.3527355982126319
Epoch: 21, step: 1419, loss: 0.31822699308395386, mean loss: 0.35273451112199655
Epoch: 21, step: 1420, loss: 0.3254457116127014, mean loss: 0.3527336514968742
Epoch: 21, step: 1421, loss: 0.362274706363678, mean loss: 0.35273395204040303
Epoch: 21, step: 1422, loss: 0.3950852155685425, mean loss: 0.35273528606451643
Epoch: 21, step: 1423, loss: 0.32495492696762085, mean loss: 0.35273441103745656
Epoch: 21, step: 1424, loss: 0.40041887760162354, mean loss: 0.3527359129577238
Epoch: 21, step: 1425, loss: 0.31171154975891113, mean loss: 0.35273462085179624
Epoch: 21, step: 1426, loss: 0.3775445222854614, mean loss: 0.35273540224140393
Epoch: 21, step: 1427, loss: 0.3773423135280609, mean loss: 0.3527361772134147
Epoch: 21, step: 1428, loss: 0.32595276832580566, mean loss: 0.3527353337211813
Epoch: 21, step: 1429, loss: 0.37896522879600525, mean loss: 0.35273615975554157
Epoch: 21, step: 1430, loss: 0.35870635509490967, mean loss: 0.3527363477635825
Epoch: 21, step: 1431, loss: 0.350201815366745, mean loss: 0.35273626795087315
Epoch: 21, step: 1432, loss: 0.3102869689464569, mean loss: 0.3527349312597813
Epoch: 21, step: 1433, loss: 0.35905587673187256, mean loss: 0.3527351302945276
Epoch: 21, step: 1434, loss: 0.31697890162467957, mean loss: 0.3527340044332388
Epoch: 21, step: 1435, loss: 0.3393746018409729, mean loss: 0.35273358379713704
Epoch: 21, step: 1436, loss: 0.312550812959671, mean loss: 0.35273231863637894
Epoch: 21, step: 1437, loss: 0.30796363949775696, mean loss: 0.3527309091319668
Epoch: 21, step: 1438, loss: 0.33282753825187683, mean loss: 0.35273028251071314
Epoch: 21, step: 1439, loss: 0.3289983868598938, mean loss: 0.35272953537887675
Epoch: 21, step: 1440, loss: 0.307071715593338, mean loss: 0.3527280980163776
Epoch: 21, step: 1441, loss: 0.33562958240509033, mean loss: 0.35272755975170433
Epoch: 21, step: 1442, loss: 0.3207603991031647, mean loss: 0.35272655345080567
Epoch: 21, step: 1443, loss: 0.3102421164512634, mean loss: 0.35272521611647556
Valid: 21, mean loss: 0.18670879552761713
Epoch: 22, step: 0, loss: 0.3216300308704376, mean loss: 0.352724237326295
Epoch: 22, step: 1, loss: 0.3656662702560425, mean loss: 0.3527246446927706
Epoch: 22, step: 2, loss: 0.3597854971885681, mean loss: 0.35272486693483085
Epoch: 22, step: 3, loss: 0.3076464831829071, mean loss: 0.352723448126328
Epoch: 22, step: 4, loss: 0.350260466337204, mean loss: 0.35272337060825326
Epoch: 22, step: 5, loss: 0.31879138946533203, mean loss: 0.35272230269168175
Epoch: 22, step: 6, loss: 0.3231317400932312, mean loss: 0.3527213714387282
Epoch: 22, step: 7, loss: 0.34422415494918823, mean loss: 0.3527211040288437
Epoch: 22, step: 8, loss: 0.350987046957016, mean loss: 0.35272104945927857
Epoch: 22, step: 9, loss: 0.35855695605278015, mean loss: 0.3527212331054046
Epoch: 22, step: 10, loss: 0.35033681988716125, mean loss: 0.35272115807430804
Epoch: 22, step: 11, loss: 0.35901230573654175, mean loss: 0.3527213560336429
Epoch: 22, step: 12, loss: 0.3688253164291382, mean loss: 0.35272186275024703
Epoch: 22, step: 13, loss: 0.3593518137931824, mean loss: 0.352722071357353
Epoch: 22, step: 14, loss: 0.3262190818786621, mean loss: 0.3527212374842297
Epoch: 22, step: 15, loss: 0.39657384157180786, mean loss: 0.35272261719112896
Epoch: 22, step: 16, loss: 0.3318452835083008, mean loss: 0.3527219603613765
Epoch: 22, step: 17, loss: 0.35513579845428467, mean loss: 0.3527220363016676
Epoch: 22, step: 18, loss: 0.3403007388114929, mean loss: 0.35272164553508095
Epoch: 22, step: 19, loss: 0.36112913489341736, mean loss: 0.3527219100213449
Epoch: 22, step: 20, loss: 0.2941240966320038, mean loss: 0.35272006668517863
Epoch: 22, step: 21, loss: 0.3103071451187134, mean loss: 0.3527187325259598
Epoch: 22, step: 22, loss: 0.29642781615257263, mean loss: 0.3527169618702279
Epoch: 22, step: 23, loss: 0.3603475093841553, mean loss: 0.3527172018849333
Epoch: 22, step: 24, loss: 0.32086238265037537, mean loss: 0.3527161999405042
Epoch: 22, step: 25, loss: 0.33456575870513916, mean loss: 0.35271562906419934
Epoch: 22, step: 26, loss: 0.3184904158115387, mean loss: 0.35271455263038104
Epoch: 22, step: 27, loss: 0.3191758394241333, mean loss: 0.3527134978211847
Epoch: 22, step: 28, loss: 0.351665198802948, mean loss: 0.35271346485269656
Epoch: 22, step: 29, loss: 0.32887911796569824, mean loss: 0.352712715297791
Epoch: 22, step: 30, loss: 0.32766789197921753, mean loss: 0.35271192769996346
Epoch: 22, step: 31, loss: 0.3321179151535034, mean loss: 0.35271128008950603
Epoch: 22, step: 32, loss: 0.33949822187423706, mean loss: 0.3527108645975965
Epoch: 22, step: 33, loss: 0.31863129138946533, mean loss: 0.3527097929803017
Epoch: 22, step: 34, loss: 0.34711360931396484, mean loss: 0.3527096170162836
Epoch: 22, step: 35, loss: 0.32260075211524963, mean loss: 0.35270867031571446
Epoch: 22, step: 36, loss: 0.3585599660873413, mean loss: 0.3527088542897994
Epoch: 22, step: 37, loss: 0.3598446547985077, mean loss: 0.3527090786437109
Epoch: 22, step: 38, loss: 0.32832735776901245, mean loss: 0.3527083120916666
Epoch: 22, step: 39, loss: 0.33550333976745605, mean loss: 0.3527077711908767
Epoch: 22, step: 40, loss: 0.3759150505065918, mean loss: 0.35270850077304894
Epoch: 22, step: 41, loss: 0.31168273091316223, mean loss: 0.35270721106007
Epoch: 22, step: 42, loss: 0.3575957715511322, mean loss: 0.3527073647352293
Epoch: 22, step: 43, loss: 0.3623723089694977, mean loss: 0.3527076685496463
Epoch: 22, step: 44, loss: 0.34983325004577637, mean loss: 0.3527075781960643
Epoch: 22, step: 45, loss: 0.34220069646835327, mean loss: 0.35270724793637587
Epoch: 22, step: 46, loss: 0.3139649033546448, mean loss: 0.352706030198058
Epoch: 22, step: 47, loss: 0.29537516832351685, mean loss: 0.3527042282474082
Epoch: 22, step: 48, loss: 0.3476170599460602, mean loss: 0.35270406835903717
Epoch: 22, step: 49, loss: 0.323667049407959, mean loss: 0.35270315576179817
Epoch: 22, step: 50, loss: 0.3650588095188141, mean loss: 0.3527035440723597
Epoch: 22, step: 51, loss: 0.3586502969264984, mean loss: 0.35270373095962726
Epoch: 22, step: 52, loss: 0.35625502467155457, mean loss: 0.35270384256183057
Epoch: 22, step: 53, loss: 0.4091434180736542, mean loss: 0.35270561616422863
Epoch: 22, step: 54, loss: 0.31432509422302246, mean loss: 0.35270441010188563
Epoch: 22, step: 55, loss: 0.32967332005500793, mean loss: 0.3527036863999611
Epoch: 22, step: 56, loss: 0.31457850337028503, mean loss: 0.35270248843662944
Epoch: 22, step: 57, loss: 0.3996705710887909, mean loss: 0.3527039642137504
Epoch: 22, step: 58, loss: 0.3061802089214325, mean loss: 0.35270250244370316
Epoch: 22, step: 59, loss: 0.3132970631122589, mean loss: 0.3527012643690729
Epoch: 22, step: 60, loss: 0.33138400316238403, mean loss: 0.3527005946257191
Epoch: 22, step: 61, loss: 0.33604979515075684, mean loss: 0.3527000715091789
Epoch: 22, step: 62, loss: 0.30545705556869507, mean loss: 0.3526985873265915
Epoch: 22, step: 63, loss: 0.3707634508609772, mean loss: 0.35269915483298553
Epoch: 22, step: 64, loss: 0.30511200428009033, mean loss: 0.35269765993302155
Epoch: 22, step: 65, loss: 0.3462632894515991, mean loss: 0.35269745781043305
Epoch: 22, step: 66, loss: 0.3377329409122467, mean loss: 0.35269698774550773
Epoch: 22, step: 67, loss: 0.3381984829902649, mean loss: 0.35269653233324627
Epoch: 22, step: 68, loss: 0.3560241758823395, mean loss: 0.35269663685451236
Epoch: 22, step: 69, loss: 0.35944968461990356, mean loss: 0.35269684896104436
Epoch: 22, step: 70, loss: 0.35379815101623535, mean loss: 0.3526968835507631
Epoch: 22, step: 71, loss: 0.32533615827560425, mean loss: 0.352696024231502
Epoch: 22, step: 72, loss: 0.3431954085826874, mean loss: 0.3526957258547032
Epoch: 22, step: 73, loss: 0.3019251525402069, mean loss: 0.3526941314016753
Epoch: 22, step: 74, loss: 0.33792877197265625, mean loss: 0.35269366770920196
Epoch: 22, step: 75, loss: 0.34098005294799805, mean loss: 0.35269329986550263
Epoch: 22, step: 76, loss: 0.3019906282424927, mean loss: 0.35269170769493824
Epoch: 22, step: 77, loss: 0.3517249822616577, mean loss: 0.35269167733867895
Epoch: 22, step: 78, loss: 0.38253307342529297, mean loss: 0.3526926143624516
Epoch: 22, step: 79, loss: 0.3187307119369507, mean loss: 0.35269154798772084
Epoch: 22, step: 80, loss: 0.3185250759124756, mean loss: 0.35269047522336167
Epoch: 22, step: 81, loss: 0.30986225605010986, mean loss: 0.35268913053830125
Epoch: 22, step: 82, loss: 0.31680163741111755, mean loss: 0.35268800380780213
Epoch: 22, step: 83, loss: 0.33647263050079346, mean loss: 0.3526874947228685
Epoch: 22, step: 84, loss: 0.291655033826828, mean loss: 0.35268557865653577
Epoch: 22, step: 85, loss: 0.3287602365016937, mean loss: 0.35268482756272795
Epoch: 22, step: 86, loss: 0.3168141841888428, mean loss: 0.35268370150266287
Epoch: 22, step: 87, loss: 0.3280870318412781, mean loss: 0.35268292938219387
Epoch: 22, step: 88, loss: 0.35169005393981934, mean loss: 0.3526828982155604
Epoch: 22, step: 89, loss: 0.33308809995651245, mean loss: 0.3526822831487559
Epoch: 22, step: 90, loss: 0.32895970344543457, mean loss: 0.35268153853719547
Epoch: 22, step: 91, loss: 0.3351919651031494, mean loss: 0.3526809895863658
Epoch: 22, step: 92, loss: 0.34175822138786316, mean loss: 0.35268064676071065
Epoch: 22, step: 93, loss: 0.3424243927001953, mean loss: 0.3526803248645943
Epoch: 22, step: 94, loss: 0.32351529598236084, mean loss: 0.35267940953870275
Epoch: 22, step: 95, loss: 0.3084735870361328, mean loss: 0.3526780222106051
Epoch: 22, step: 96, loss: 0.3286256790161133, mean loss: 0.3526772673904829
Epoch: 22, step: 97, loss: 0.32984021306037903, mean loss: 0.3526765507315257
Epoch: 22, step: 98, loss: 0.3445775806903839, mean loss: 0.3526762965824046
Epoch: 22, step: 99, loss: 0.3646939694881439, mean loss: 0.3526766736902528
Epoch: 22, step: 100, loss: 0.33638033270835876, mean loss: 0.3526761623362416
Epoch: 22, step: 101, loss: 0.34693196415901184, mean loss: 0.35267598209783
Epoch: 22, step: 102, loss: 0.32875069975852966, mean loss: 0.3526752314065326
Epoch: 22, step: 103, loss: 0.31639209389686584, mean loss: 0.35267409300487884
Epoch: 22, step: 104, loss: 0.3204466700553894, mean loss: 0.35267308188502977
Epoch: 22, step: 105, loss: 0.34683120250701904, mean loss: 0.35267289860463263
Epoch: 22, step: 106, loss: 0.3410438001155853, mean loss: 0.3526725337701702
Epoch: 22, step: 107, loss: 0.3381006419658661, mean loss: 0.352672076627122
Epoch: 22, step: 108, loss: 0.3523569703102112, mean loss: 0.35267206674205387
Epoch: 22, step: 109, loss: 0.3297100365161896, mean loss: 0.35267134643242887
Epoch: 22, step: 110, loss: 0.3474760055541992, mean loss: 0.3526711834617937
Epoch: 22, step: 111, loss: 0.33142414689064026, mean loss: 0.35267051699264157
Epoch: 22, step: 112, loss: 0.287811815738678, mean loss: 0.352668482592803
Epoch: 22, step: 113, loss: 0.2771851122379303, mean loss: 0.3526661150070068
Epoch: 22, step: 114, loss: 0.32813289761543274, mean loss: 0.35266534553056506
Epoch: 22, step: 115, loss: 0.33771950006484985, mean loss: 0.35266487677365044
Epoch: 22, step: 116, loss: 0.32291218638420105, mean loss: 0.35266394364865783
Epoch: 22, step: 117, loss: 0.3189154863357544, mean loss: 0.35266288523878164
Epoch: 22, step: 118, loss: 0.37214693427085876, mean loss: 0.35266349627302856
Epoch: 22, step: 119, loss: 0.34038490056991577, mean loss: 0.3526631112192245
Epoch: 22, step: 120, loss: 0.3054015338420868, mean loss: 0.3526616291540178
Epoch: 22, step: 121, loss: 0.3320866823196411, mean loss: 0.35266098396910606
Epoch: 22, step: 122, loss: 0.2985592782497406, mean loss: 0.3526592875122461
Epoch: 22, step: 123, loss: 0.3337344527244568, mean loss: 0.3526586941084211
Epoch: 22, step: 124, loss: 0.35283297300338745, mean loss: 0.35265869957290846
Epoch: 22, step: 125, loss: 0.3436528742313385, mean loss: 0.3526584172055246
Epoch: 22, step: 126, loss: 0.33372434973716736, mean loss: 0.3526578235680432
Epoch: 22, step: 127, loss: 0.321628600358963, mean loss: 0.35265685074313696
Epoch: 22, step: 128, loss: 0.3122381567955017, mean loss: 0.3526555835802706
Epoch: 22, step: 129, loss: 0.3142516314983368, mean loss: 0.3526543796191419
Epoch: 22, step: 130, loss: 0.3010827600955963, mean loss: 0.35265276290327235
Epoch: 22, step: 131, loss: 0.329966276884079, mean loss: 0.35265205172816205
Epoch: 22, step: 132, loss: 0.35022684931755066, mean loss: 0.35265197570539125
Epoch: 22, step: 133, loss: 0.39248111844062805, mean loss: 0.35265322418958456
Epoch: 22, step: 134, loss: 0.36494389176368713, mean loss: 0.3526536094407388
Epoch: 22, step: 135, loss: 0.2884179353713989, mean loss: 0.35265159603570906
Epoch: 22, step: 136, loss: 0.3201947808265686, mean loss: 0.35265057874013755
Epoch: 22, step: 137, loss: 0.3224853575229645, mean loss: 0.35264963329974336
Epoch: 22, step: 138, loss: 0.3683747351169586, mean loss: 0.3526501261414965
Epoch: 22, step: 139, loss: 0.3381175994873047, mean loss: 0.35264967069061726
Epoch: 22, step: 140, loss: 0.3737250864505768, mean loss: 0.35265033117561395
Epoch: 22, step: 141, loss: 0.38208675384521484, mean loss: 0.35265125365830496
Epoch: 22, step: 142, loss: 0.3250858783721924, mean loss: 0.3526503898378266
Epoch: 22, step: 143, loss: 0.3117731809616089, mean loss: 0.352649108902477
Epoch: 22, step: 144, loss: 0.37790966033935547, mean loss: 0.35264990044672034
Epoch: 22, step: 145, loss: 0.3323696553707123, mean loss: 0.35264926498124827
Epoch: 22, step: 146, loss: 0.34334415197372437, mean loss: 0.35264897342201257
Epoch: 22, step: 147, loss: 0.3479245603084564, mean loss: 0.35264882539553327
Epoch: 22, step: 148, loss: 0.35890060663223267, mean loss: 0.35264902127175085
Epoch: 22, step: 149, loss: 0.31287238001823425, mean loss: 0.3526477750582897
Epoch: 22, step: 150, loss: 0.3323659598827362, mean loss: 0.35264713964317096
Epoch: 22, step: 151, loss: 0.328154593706131, mean loss: 0.3526463723328346
Epoch: 22, step: 152, loss: 0.37446531653404236, mean loss: 0.35264705586230427
Epoch: 22, step: 153, loss: 0.42257967591285706, mean loss: 0.3526492465965957
Epoch: 22, step: 154, loss: 0.3272345960140228, mean loss: 0.3526484504730928
Epoch: 22, step: 155, loss: 0.29534560441970825, mean loss: 0.3526466554960832
Epoch: 22, step: 156, loss: 0.33380264043807983, mean loss: 0.3526460652371934
Epoch: 22, step: 157, loss: 0.3149377405643463, mean loss: 0.3526448841207155
Epoch: 22, step: 158, loss: 0.3108973801136017, mean loss: 0.35264357652827
Epoch: 22, step: 159, loss: 0.37129953503608704, mean loss: 0.35264416084167854
Epoch: 22, step: 160, loss: 0.32757818698883057, mean loss: 0.35264337578815813
Epoch: 22, step: 161, loss: 0.34367480874061584, mean loss: 0.3526430949060082
Epoch: 22, step: 162, loss: 0.3030196726322174, mean loss: 0.3526415408230708
Epoch: 22, step: 163, loss: 0.3286310136318207, mean loss: 0.3526407888962516
Epoch: 22, step: 164, loss: 0.32342106103897095, mean loss: 0.3526398738639071
Epoch: 22, step: 165, loss: 0.3486945331096649, mean loss: 0.3526397503171934
Epoch: 22, step: 166, loss: 0.3255382776260376, mean loss: 0.352638901672362
Epoch: 22, step: 167, loss: 0.35447731614112854, mean loss: 0.3526389592379453
Epoch: 22, step: 168, loss: 0.2901247441768646, mean loss: 0.3526370018150483
Epoch: 22, step: 169, loss: 0.30601388216018677, mean loss: 0.35263554201419495
Epoch: 22, step: 170, loss: 0.3246022164821625, mean loss: 0.3526346642996287
Epoch: 22, step: 171, loss: 0.33963656425476074, mean loss: 0.35263425734596415
Epoch: 22, step: 172, loss: 0.3416779637336731, mean loss: 0.35263391432935187
Epoch: 22, step: 173, loss: 0.3442174792289734, mean loss: 0.3526336508381772
Epoch: 22, step: 174, loss: 0.30870988965034485, mean loss: 0.35263227577130224
Epoch: 22, step: 175, loss: 0.3314751088619232, mean loss: 0.35263161345077537
Epoch: 22, step: 176, loss: 0.34489256143569946, mean loss: 0.3526313711890125
Epoch: 22, step: 177, loss: 0.3927459418773651, mean loss: 0.35263262688833913
Epoch: 22, step: 178, loss: 0.34960511326789856, mean loss: 0.352632532121581
Epoch: 22, step: 179, loss: 0.3227629065513611, mean loss: 0.35263159717649617
Epoch: 22, step: 180, loss: 0.3038789927959442, mean loss: 0.35263007122562506
Epoch: 22, step: 181, loss: 0.2939276099205017, mean loss: 0.3526282339028925
Epoch: 22, step: 182, loss: 0.32654231786727905, mean loss: 0.3526274174678502
Epoch: 22, step: 183, loss: 0.3486156761646271, mean loss: 0.3526272919126016
Epoch: 22, step: 184, loss: 0.3474681079387665, mean loss: 0.3526271304509556
Epoch: 22, step: 185, loss: 0.3114948272705078, mean loss: 0.3526258432160811
Epoch: 22, step: 186, loss: 0.3020442724227905, mean loss: 0.3526242603160406
Epoch: 22, step: 187, loss: 0.3303986191749573, mean loss: 0.352623564808432
Epoch: 22, step: 188, loss: 0.40424492955207825, mean loss: 0.35262518014669103
Epoch: 22, step: 189, loss: 0.3080180287361145, mean loss: 0.3526237843412148
Epoch: 22, step: 190, loss: 0.30030232667922974, mean loss: 0.35262214719807317
Epoch: 22, step: 191, loss: 0.34364891052246094, mean loss: 0.3526218664334713
Epoch: 22, step: 192, loss: 0.3164623975753784, mean loss: 0.35262073507122177
Epoch: 22, step: 193, loss: 0.31749409437179565, mean loss: 0.35261963605862245
Epoch: 22, step: 194, loss: 0.3209383189678192, mean loss: 0.35261864487140315
Epoch: 22, step: 195, loss: 0.315168172121048, mean loss: 0.35261747322602865
Epoch: 22, step: 196, loss: 0.3475872576236725, mean loss: 0.35261731585967165
Epoch: 22, step: 197, loss: 0.31297534704208374, mean loss: 0.35261607573050885
Epoch: 22, step: 198, loss: 0.32055673003196716, mean loss: 0.3526150728417267
Epoch: 22, step: 199, loss: 0.3024470806121826, mean loss: 0.3526135035226505
Epoch: 22, step: 200, loss: 0.34622812271118164, mean loss: 0.35261330378600525
Epoch: 22, step: 201, loss: 0.32061487436294556, mean loss: 0.3526123028967521
Epoch: 22, step: 202, loss: 0.3057352602481842, mean loss: 0.3526108366603926
Epoch: 22, step: 203, loss: 0.2976769804954529, mean loss: 0.35260911847397436
Epoch: 22, step: 204, loss: 0.289305180311203, mean loss: 0.3526071385553504
Epoch: 22, step: 205, loss: 0.33892667293548584, mean loss: 0.3526067106931618
Epoch: 22, step: 206, loss: 0.30679965019226074, mean loss: 0.3526052781033103
Epoch: 22, step: 207, loss: 0.32377859950065613, mean loss: 0.3526043765934716
Epoch: 22, step: 208, loss: 0.3217301070690155, mean loss: 0.3526034110785851
Epoch: 22, step: 209, loss: 0.32904502749443054, mean loss: 0.3526026743726128
Epoch: 22, step: 210, loss: 0.3032350540161133, mean loss: 0.3526011306213899
Epoch: 22, step: 211, loss: 0.2915712594985962, mean loss: 0.3525992222451822
Epoch: 22, step: 212, loss: 0.2878565788269043, mean loss: 0.3525971978355822
Epoch: 22, step: 213, loss: 0.32788196206092834, mean loss: 0.35259642504977223
Epoch: 22, step: 214, loss: 0.33005762100219727, mean loss: 0.3525957203377675
Epoch: 22, step: 215, loss: 0.34674331545829773, mean loss: 0.3525955373586254
Epoch: 22, step: 216, loss: 0.3153449594974518, mean loss: 0.3525943727321486
Epoch: 22, step: 217, loss: 0.33402761816978455, mean loss: 0.35259379226711507
Epoch: 22, step: 218, loss: 0.34111809730529785, mean loss: 0.3525934335059008
Epoch: 22, step: 219, loss: 0.33139917254447937, mean loss: 0.3525927709367823
Epoch: 22, step: 220, loss: 0.30563297867774963, mean loss: 0.3525913029386499
Epoch: 22, step: 221, loss: 0.338151752948761, mean loss: 0.35259085156165737
Epoch: 22, step: 222, loss: 0.3382560610771179, mean loss: 0.3525904034734299
Epoch: 22, step: 223, loss: 0.34402430057525635, mean loss: 0.3525901357157749
Epoch: 22, step: 224, loss: 0.3474467396736145, mean loss: 0.35258997494948097
Epoch: 22, step: 225, loss: 0.3120374381542206, mean loss: 0.35258870744504905
Epoch: 22, step: 226, loss: 0.3736591637134552, mean loss: 0.3525893659997066
Epoch: 22, step: 227, loss: 0.3346708416938782, mean loss: 0.35258880597581904
Epoch: 22, step: 228, loss: 0.3063080310821533, mean loss: 0.3525873595660027
Epoch: 22, step: 229, loss: 0.30345311760902405, mean loss: 0.3525858240249702
Epoch: 22, step: 230, loss: 0.3201615512371063, mean loss: 0.35258481073478026
Epoch: 22, step: 231, loss: 0.3410813510417938, mean loss: 0.3525844512516649
Epoch: 22, step: 232, loss: 0.33719754219055176, mean loss: 0.35258397042578254
Epoch: 22, step: 233, loss: 0.3510041832923889, mean loss: 0.35258392106051994
Epoch: 22, step: 234, loss: 0.35351988673210144, mean loss: 0.35258395030670536
Epoch: 22, step: 235, loss: 0.2862233519554138, mean loss: 0.35258187679719555
Epoch: 22, step: 236, loss: 0.31001126766204834, mean loss: 0.3525805466734919
Epoch: 22, step: 237, loss: 0.3042053282260895, mean loss: 0.35257903523131084
Epoch: 22, step: 238, loss: 0.31583312153816223, mean loss: 0.35257788717264577
Epoch: 22, step: 239, loss: 0.3523235023021698, mean loss: 0.3525778792251055
Epoch: 22, step: 240, loss: 0.33507975935935974, mean loss: 0.3525773325626085
Epoch: 22, step: 241, loss: 0.3833935558795929, mean loss: 0.35257829526874146
Epoch: 22, step: 242, loss: 0.30102741718292236, mean loss: 0.3525766848573802
Epoch: 22, step: 243, loss: 0.3266191780567169, mean loss: 0.3525758739893682
Epoch: 22, step: 244, loss: 0.30659791827201843, mean loss: 0.3525744377617195
Epoch: 22, step: 245, loss: 0.3312506377696991, mean loss: 0.3525737716843786
Epoch: 22, step: 246, loss: 0.331887423992157, mean loss: 0.3525731255388939
Epoch: 22, step: 247, loss: 0.3880655765533447, mean loss: 0.3525742341236957
Epoch: 22, step: 248, loss: 0.3143100440502167, mean loss: 0.35257303900266396
Epoch: 22, step: 249, loss: 0.32868492603302, mean loss: 0.3525722929188058
Epoch: 22, step: 250, loss: 0.34000054001808167, mean loss: 0.3525719002846542
Epoch: 22, step: 251, loss: 0.35217201709747314, mean loss: 0.35257188779610993
Epoch: 22, step: 252, loss: 0.32247212529182434, mean loss: 0.35257094779540715
Epoch: 22, step: 253, loss: 0.2831670045852661, mean loss: 0.35256878041225775
Epoch: 22, step: 254, loss: 0.32528939843177795, mean loss: 0.35256792854385127
Epoch: 22, step: 255, loss: 0.3099048137664795, mean loss: 0.3525665963206819
Epoch: 22, step: 256, loss: 0.30616775155067444, mean loss: 0.35256514748868284
Epoch: 22, step: 257, loss: 0.3834509551525116, mean loss: 0.35256611188659903
Epoch: 22, step: 258, loss: 0.34942710399627686, mean loss: 0.3525660138752995
Epoch: 22, step: 259, loss: 0.3476322293281555, mean loss: 0.35256585982932265
Epoch: 22, step: 260, loss: 0.3530774712562561, mean loss: 0.3525658758027039
Epoch: 22, step: 261, loss: 0.29614901542663574, mean loss: 0.3525641144271067
Epoch: 22, step: 262, loss: 0.3448289632797241, mean loss: 0.35256387293757635
Epoch: 22, step: 263, loss: 0.38202062249183655, mean loss: 0.3525647925413961
Epoch: 22, step: 264, loss: 0.36311233043670654, mean loss: 0.35256512181239463
Epoch: 22, step: 265, loss: 0.3350948095321655, mean loss: 0.35256457644458916
Epoch: 22, step: 266, loss: 0.3278277814388275, mean loss: 0.3525638042643174
Epoch: 22, step: 267, loss: 0.32876279950141907, mean loss: 0.35256306131873233
Epoch: 22, step: 268, loss: 0.33070141077041626, mean loss: 0.3525623789311633
Epoch: 22, step: 269, loss: 0.3162994086742401, mean loss: 0.35256124705744285
Epoch: 22, step: 270, loss: 0.3269423246383667, mean loss: 0.35256044744065024
Epoch: 22, step: 271, loss: 0.3784441351890564, mean loss: 0.3525612552960731
Epoch: 22, step: 272, loss: 0.34971949458122253, mean loss: 0.35256116660468656
Epoch: 22, step: 273, loss: 0.32786184549331665, mean loss: 0.35256039576263204
Epoch: 22, step: 274, loss: 0.35629212856292725, mean loss: 0.3525605122227887
Epoch: 22, step: 275, loss: 0.32634320855140686, mean loss: 0.3525596940570269
Epoch: 22, step: 276, loss: 0.2980155944824219, mean loss: 0.3525579919475067
Epoch: 22, step: 277, loss: 0.32764679193496704, mean loss: 0.35255721458995776
Epoch: 22, step: 278, loss: 0.36845657229423523, mean loss: 0.3525577107162006
Epoch: 22, step: 279, loss: 0.3330846130847931, mean loss: 0.35255710309333393
Epoch: 22, step: 280, loss: 0.3492806553840637, mean loss: 0.3525570008608865
Epoch: 22, step: 281, loss: 0.32217323780059814, mean loss: 0.35255605284955854
Epoch: 22, step: 282, loss: 0.3229827284812927, mean loss: 0.35255513015371853
Epoch: 22, step: 283, loss: 0.35898691415786743, mean loss: 0.3525553308208845
Epoch: 22, step: 284, loss: 0.3222697377204895, mean loss: 0.3525543859610243
Epoch: 22, step: 285, loss: 0.34702691435813904, mean loss: 0.3525542135185334
Epoch: 22, step: 286, loss: 0.35180628299713135, mean loss: 0.3525541901858077
Epoch: 22, step: 287, loss: 0.3338799774646759, mean loss: 0.3525536076361221
Epoch: 22, step: 288, loss: 0.3058825731277466, mean loss: 0.35255215175957383
Epoch: 22, step: 289, loss: 0.3175835609436035, mean loss: 0.35255106096817024
Epoch: 22, step: 290, loss: 0.3677781820297241, mean loss: 0.3525515359399741
Epoch: 22, step: 291, loss: 0.3714660704135895, mean loss: 0.352552125912977
Epoch: 22, step: 292, loss: 0.33871057629585266, mean loss: 0.35255169418752813
Epoch: 22, step: 293, loss: 0.3679533004760742, mean loss: 0.35255217455700877
Epoch: 22, step: 294, loss: 0.3474491238594055, mean loss: 0.3525520154000148
Epoch: 22, step: 295, loss: 0.3019472658634186, mean loss: 0.35255043715807566
Epoch: 22, step: 296, loss: 0.3298700153827667, mean loss: 0.352549729831652
Epoch: 22, step: 297, loss: 0.33280104398727417, mean loss: 0.352549113955464
Epoch: 22, step: 298, loss: 0.32670149207115173, mean loss: 0.3525483079049484
Epoch: 22, step: 299, loss: 0.31161946058273315, mean loss: 0.3525470315906375
Epoch: 22, step: 300, loss: 0.3679724335670471, mean loss: 0.3525475125972787
Epoch: 22, step: 301, loss: 0.3600672483444214, mean loss: 0.3525477470760984
Epoch: 22, step: 302, loss: 0.31432151794433594, mean loss: 0.3525465551510218
Epoch: 22, step: 303, loss: 0.3442399203777313, mean loss: 0.3525462961514342
Epoch: 22, step: 304, loss: 0.3989683985710144, mean loss: 0.352547743540279
Epoch: 22, step: 305, loss: 0.3947480320930481, mean loss: 0.35254905925670205
Epoch: 22, step: 306, loss: 0.32563385367393494, mean loss: 0.3525482201232466
Epoch: 22, step: 307, loss: 0.3538835048675537, mean loss: 0.3525482617520265
Epoch: 22, step: 308, loss: 0.33144545555114746, mean loss: 0.35254760387235573
Epoch: 22, step: 309, loss: 0.3019125461578369, mean loss: 0.35254602537439095
Epoch: 22, step: 310, loss: 0.3954611122608185, mean loss: 0.35254736316817775
Epoch: 22, step: 311, loss: 0.30937859416007996, mean loss: 0.35254601750829595
Epoch: 22, step: 312, loss: 0.32491469383239746, mean loss: 0.3525451562095934
Epoch: 22, step: 313, loss: 0.3367076814174652, mean loss: 0.3525446625534999
Epoch: 22, step: 314, loss: 0.345525324344635, mean loss: 0.3525444437666593
Epoch: 22, step: 315, loss: 0.3148823082447052, mean loss: 0.35254326990630763
Epoch: 22, step: 316, loss: 0.3540690839290619, mean loss: 0.3525433174616769
Epoch: 22, step: 317, loss: 0.31445831060409546, mean loss: 0.352542130495185
Epoch: 22, step: 318, loss: 0.3156951069831848, mean loss: 0.3525409821477698
Epoch: 22, step: 319, loss: 0.33199119567871094, mean loss: 0.35254034172809673
Epoch: 22, step: 320, loss: 0.3377895951271057, mean loss: 0.352539882045757
Epoch: 22, step: 321, loss: 0.3423498868942261, mean loss: 0.3525395645015017
Epoch: 22, step: 322, loss: 0.3270600736141205, mean loss: 0.3525387705252813
Epoch: 22, step: 323, loss: 0.32551300525665283, mean loss: 0.35253792839125203
Epoch: 22, step: 324, loss: 0.3092595040798187, mean loss: 0.35253657985966225
Epoch: 22, step: 325, loss: 0.335722953081131, mean loss: 0.35253605597274323
Epoch: 22, step: 326, loss: 0.3667707145214081, mean loss: 0.35253649948913357
Epoch: 22, step: 327, loss: 0.36476507782936096, mean loss: 0.3525368804892065
Epoch: 22, step: 328, loss: 0.3698110282421112, mean loss: 0.35253741867494826
Epoch: 22, step: 329, loss: 0.30028846859931946, mean loss: 0.3525357908803793
Epoch: 22, step: 330, loss: 0.2986716032028198, mean loss: 0.352534112816026
Epoch: 22, step: 331, loss: 0.32745829224586487, mean loss: 0.3525333316378151
Epoch: 22, step: 332, loss: 0.3256157636642456, mean loss: 0.352532493110418
Epoch: 22, step: 333, loss: 0.340341180562973, mean loss: 0.3525321133424114
Epoch: 22, step: 334, loss: 0.3340420126914978, mean loss: 0.352531537380643
Epoch: 22, step: 335, loss: 0.34378793835639954, mean loss: 0.35253126502831855
Epoch: 22, step: 336, loss: 0.37245744466781616, mean loss: 0.35253188568490285
Epoch: 22, step: 337, loss: 0.3347480297088623, mean loss: 0.3525313317742327
Epoch: 22, step: 338, loss: 0.32606568932533264, mean loss: 0.3525305074791429
Epoch: 22, step: 339, loss: 0.3092583417892456, mean loss: 0.35252915977247506
Epoch: 22, step: 340, loss: 0.3015541136264801, mean loss: 0.352527572209918
Epoch: 22, step: 341, loss: 0.3065384328365326, mean loss: 0.35252613997262827
Epoch: 22, step: 342, loss: 0.3524065315723419, mean loss: 0.3525261362477863
Epoch: 22, step: 343, loss: 0.3667981028556824, mean loss: 0.35252658069119086
Epoch: 22, step: 344, loss: 0.33380329608917236, mean loss: 0.3525259976474204
Epoch: 22, step: 345, loss: 0.43703773617744446, mean loss: 0.352528629264115
Epoch: 22, step: 346, loss: 0.345580518245697, mean loss: 0.3525284129131569
Epoch: 22, step: 347, loss: 0.30300217866897583, mean loss: 0.3525268708084663
Epoch: 22, step: 348, loss: 0.3260842263698578, mean loss: 0.3525260474861
Epoch: 22, step: 349, loss: 0.326030433177948, mean loss: 0.35252522254014107
Epoch: 22, step: 350, loss: 0.3959856629371643, mean loss: 0.3525265756470372
Epoch: 22, step: 351, loss: 0.3000720739364624, mean loss: 0.3525249425679055
Epoch: 22, step: 352, loss: 0.350737601518631, mean loss: 0.3525248869239016
Epoch: 22, step: 353, loss: 0.3345789313316345, mean loss: 0.3525243282427612
Epoch: 22, step: 354, loss: 0.30473220348358154, mean loss: 0.35252284045753696
Epoch: 22, step: 355, loss: 0.3757195472717285, mean loss: 0.3525235625564915
Epoch: 22, step: 356, loss: 0.27905210852622986, mean loss: 0.3525212755073388
Epoch: 22, step: 357, loss: 0.3369659185409546, mean loss: 0.3525207913089647
Epoch: 22, step: 358, loss: 0.36823153495788574, mean loss: 0.35252128032890584
Epoch: 22, step: 359, loss: 0.32498234510421753, mean loss: 0.3525204231658324
Epoch: 22, step: 360, loss: 0.36007243394851685, mean loss: 0.35252065821861284
Epoch: 22, step: 361, loss: 0.3155243694782257, mean loss: 0.35251950676238064
Epoch: 22, step: 362, loss: 0.3078649640083313, mean loss: 0.3525181169972705
Epoch: 22, step: 363, loss: 0.3465625047683716, mean loss: 0.3525179316489501
Epoch: 22, step: 364, loss: 0.3615070879459381, mean loss: 0.35251821139738
Epoch: 22, step: 365, loss: 0.33403724431991577, mean loss: 0.35251763627548177
Epoch: 22, step: 366, loss: 0.36116915941238403, mean loss: 0.35251790549978973
Epoch: 22, step: 367, loss: 0.3176378309726715, mean loss: 0.35251682011036584
Epoch: 22, step: 368, loss: 0.3462137281894684, mean loss: 0.35251662397843314
Epoch: 22, step: 369, loss: 0.3362811505794525, mean loss: 0.352516118798478
Epoch: 22, step: 370, loss: 0.3278651833534241, mean loss: 0.3525153517884452
Epoch: 22, step: 371, loss: 0.3304811120033264, mean loss: 0.35251466621782335
Epoch: 22, step: 372, loss: 0.3821811079978943, mean loss: 0.3525155892271193
Epoch: 22, step: 373, loss: 0.3116198778152466, mean loss: 0.3525143168821684
Epoch: 22, step: 374, loss: 0.3084603250026703, mean loss: 0.35251294631962354
Epoch: 22, step: 375, loss: 0.3401460349559784, mean loss: 0.3525125615849495
Epoch: 22, step: 376, loss: 0.3379552960395813, mean loss: 0.35251210872243444
Epoch: 22, step: 377, loss: 0.32184985280036926, mean loss: 0.3525111548788482
Epoch: 22, step: 378, loss: 0.2862650454044342, mean loss: 0.35250909415438014
Epoch: 22, step: 379, loss: 0.3248157501220703, mean loss: 0.35250823272150617
Epoch: 22, step: 380, loss: 0.33012935519218445, mean loss: 0.352507536622793
Epoch: 22, step: 381, loss: 0.32180655002593994, mean loss: 0.3525065816931943
Epoch: 22, step: 382, loss: 0.32934582233428955, mean loss: 0.35250586131873135
Epoch: 22, step: 383, loss: 0.4222465753555298, mean loss: 0.35250803041284795
Epoch: 22, step: 384, loss: 0.38012370467185974, mean loss: 0.35250888929613283
Epoch: 22, step: 385, loss: 0.3435078263282776, mean loss: 0.3525086093601072
Epoch: 22, step: 386, loss: 0.3349592089653015, mean loss: 0.3525080635849433
Epoch: 22, step: 387, loss: 0.34771728515625, mean loss: 0.3525079145994218
Epoch: 22, step: 388, loss: 0.3243258595466614, mean loss: 0.3525070382099871
Epoch: 22, step: 389, loss: 0.31758350133895874, mean loss: 0.352505952211577
Epoch: 22, step: 390, loss: 0.34160682559013367, mean loss: 0.3525056132978477
Epoch: 22, step: 391, loss: 0.32371097803115845, mean loss: 0.35250471794227345
Epoch: 22, step: 392, loss: 0.3363054394721985, mean loss: 0.3525042142490279
Epoch: 22, step: 393, loss: 0.3083304464817047, mean loss: 0.35250284077201255
Epoch: 22, step: 394, loss: 0.343919575214386, mean loss: 0.35250257390432116
Epoch: 22, step: 395, loss: 0.34571316838264465, mean loss: 0.35250236281722
Epoch: 22, step: 396, loss: 0.3643828332424164, mean loss: 0.35250273217740735
Epoch: 22, step: 397, loss: 0.33024924993515015, mean loss: 0.35250204034496807
Epoch: 22, step: 398, loss: 0.3142333924770355, mean loss: 0.352500850658399
Epoch: 22, step: 399, loss: 0.335187166929245, mean loss: 0.3525003124314738
Epoch: 22, step: 400, loss: 0.33642396330833435, mean loss: 0.35249981268485053
Epoch: 22, step: 401, loss: 0.3077142536640167, mean loss: 0.35249842053194347
Epoch: 22, step: 402, loss: 0.33367279171943665, mean loss: 0.352497835358066
Epoch: 22, step: 403, loss: 0.32927271723747253, mean loss: 0.35249711345336254
Epoch: 22, step: 404, loss: 0.30900827050209045, mean loss: 0.35249576173474906
Epoch: 22, step: 405, loss: 0.3533081114292145, mean loss: 0.3524957869833875
Epoch: 22, step: 406, loss: 0.3367840051651001, mean loss: 0.35249529866072027
Epoch: 22, step: 407, loss: 0.338838666677475, mean loss: 0.35249487422536524
Epoch: 22, step: 408, loss: 0.3233090043067932, mean loss: 0.35249396718400283
Epoch: 22, step: 409, loss: 0.35967734456062317, mean loss: 0.35249419042278013
Epoch: 22, step: 410, loss: 0.2939605712890625, mean loss: 0.3524923714222166
Epoch: 22, step: 411, loss: 0.36119386553764343, mean loss: 0.35249264182290385
Epoch: 22, step: 412, loss: 0.3477051258087158, mean loss: 0.3524924930544997
Epoch: 22, step: 413, loss: 0.3276267945766449, mean loss: 0.352491720395918
Epoch: 22, step: 414, loss: 0.29951211810112, mean loss: 0.3524900741975432
Epoch: 22, step: 415, loss: 0.3377610445022583, mean loss: 0.3524896165468567
Epoch: 22, step: 416, loss: 0.3358536958694458, mean loss: 0.35248909966257275
Epoch: 22, step: 417, loss: 0.36473721265792847, mean loss: 0.3524894802042056
Epoch: 22, step: 418, loss: 0.3326614201068878, mean loss: 0.3524888641772352
Epoch: 22, step: 419, loss: 0.33760103583335876, mean loss: 0.35248840164994727
Epoch: 22, step: 420, loss: 0.2871684432029724, mean loss: 0.35248637238658254
Epoch: 22, step: 421, loss: 0.3589039444923401, mean loss: 0.3524865717519788
Epoch: 22, step: 422, loss: 0.3931126296520233, mean loss: 0.3524878337835373
Epoch: 22, step: 423, loss: 0.3207639753818512, mean loss: 0.35248684832570926
Epoch: 22, step: 424, loss: 0.41577932238578796, mean loss: 0.35248881435789203
Epoch: 22, step: 425, loss: 0.3328200578689575, mean loss: 0.35248820341310455
Epoch: 22, step: 426, loss: 0.3792661428451538, mean loss: 0.3524890351552829
Epoch: 22, step: 427, loss: 0.346646249294281, mean loss: 0.3524888536797623
Epoch: 22, step: 428, loss: 0.3537937104701996, mean loss: 0.35248889420704094
Epoch: 22, step: 429, loss: 0.3125351667404175, mean loss: 0.35248765333097826
Epoch: 22, step: 430, loss: 0.3248215913772583, mean loss: 0.35248679410982375
Epoch: 22, step: 431, loss: 0.35060158371925354, mean loss: 0.3524867355629172
Epoch: 22, step: 432, loss: 0.34505128860473633, mean loss: 0.35248650465558645
Epoch: 22, step: 433, loss: 0.31938350200653076, mean loss: 0.3524854766758756
Epoch: 22, step: 434, loss: 0.30724000930786133, mean loss: 0.3524840716680388
Epoch: 22, step: 435, loss: 0.37904784083366394, mean loss: 0.35248489652734716
Epoch: 22, step: 436, loss: 0.3025336265563965, mean loss: 0.3524833454865159
Epoch: 22, step: 437, loss: 0.34539273381233215, mean loss: 0.35248312532220877
Epoch: 22, step: 438, loss: 0.33516228199005127, mean loss: 0.35248258752473205
Epoch: 22, step: 439, loss: 0.3269712030887604, mean loss: 0.3524817954425029
Epoch: 22, step: 440, loss: 0.32599666714668274, mean loss: 0.3524809731528231
Epoch: 22, step: 441, loss: 0.3430618643760681, mean loss: 0.3524806807247332
Epoch: 22, step: 442, loss: 0.337013304233551, mean loss: 0.35248020053546586
Epoch: 22, step: 443, loss: 0.31749585270881653, mean loss: 0.3524791144697814
Epoch: 22, step: 444, loss: 0.34478113055229187, mean loss: 0.352478875498437
Epoch: 22, step: 445, loss: 0.31610995531082153, mean loss: 0.35247774651972624
Epoch: 22, step: 446, loss: 0.38968625664711, mean loss: 0.35247890152547284
Epoch: 22, step: 447, loss: 0.3136308789253235, mean loss: 0.3524776956643293
Epoch: 22, step: 448, loss: 0.3122508227825165, mean loss: 0.35247644704177344
Epoch: 22, step: 449, loss: 0.3792881369590759, mean loss: 0.3524772792377483
Epoch: 22, step: 450, loss: 0.3480442464351654, mean loss: 0.35247714164710914
Epoch: 22, step: 451, loss: 0.2834651470184326, mean loss: 0.3524749997478345
Epoch: 22, step: 452, loss: 0.31731849908828735, mean loss: 0.3524739086426342
Epoch: 22, step: 453, loss: 0.3107626438140869, mean loss: 0.3524726141461775
Epoch: 22, step: 454, loss: 0.33005496859550476, mean loss: 0.35247191844293596
Epoch: 22, step: 455, loss: 0.36213722825050354, mean loss: 0.35247221838427806
Epoch: 22, step: 456, loss: 0.3604464828968048, mean loss: 0.3524724658401202
Epoch: 22, step: 457, loss: 0.386306494474411, mean loss: 0.35247351573860697
Epoch: 22, step: 458, loss: 0.3302079141139984, mean loss: 0.3524728248396209
Epoch: 22, step: 459, loss: 0.3485338091850281, mean loss: 0.3524727026162234
Epoch: 22, step: 460, loss: 0.3540751338005066, mean loss: 0.352472752336388
Epoch: 22, step: 461, loss: 0.3475579619407654, mean loss: 0.3524725998452184
Epoch: 22, step: 462, loss: 0.3635232150554657, mean loss: 0.3524729427019467
Epoch: 22, step: 463, loss: 0.3239835202693939, mean loss: 0.3524720588156712
Epoch: 22, step: 464, loss: 0.3295357823371887, mean loss: 0.35247134723820467
Epoch: 22, step: 465, loss: 0.35606086254119873, mean loss: 0.3524714585962522
Epoch: 22, step: 466, loss: 0.33566683530807495, mean loss: 0.35247093728018924
Epoch: 22, step: 467, loss: 0.33400866389274597, mean loss: 0.35247036455797226
Epoch: 22, step: 468, loss: 0.30785906314849854, mean loss: 0.3524689807039719
Epoch: 22, step: 469, loss: 0.34991949796676636, mean loss: 0.35246890162081734
Epoch: 22, step: 470, loss: 0.3212759792804718, mean loss: 0.3524679340684013
Epoch: 22, step: 471, loss: 0.3845946192741394, mean loss: 0.35246893055367445
Epoch: 22, step: 472, loss: 0.34236419200897217, mean loss: 0.35246861714098426
Epoch: 22, step: 473, loss: 0.338392972946167, mean loss: 0.3524681805786062
Epoch: 22, step: 474, loss: 0.3351476490497589, mean loss: 0.3524676433912623
Epoch: 22, step: 475, loss: 0.2954650819301605, mean loss: 0.35246587554107434
Epoch: 22, step: 476, loss: 0.3507804274559021, mean loss: 0.35246582327101433
Epoch: 22, step: 477, loss: 0.3121378421783447, mean loss: 0.3524645726358629
Epoch: 22, step: 478, loss: 0.30296286940574646, mean loss: 0.3524630375565305
Epoch: 22, step: 479, loss: 0.3494708836078644, mean loss: 0.352462944770809
Epoch: 22, step: 480, loss: 0.3582051396369934, mean loss: 0.35246312282888415
Epoch: 22, step: 481, loss: 0.3972441554069519, mean loss: 0.35246451138803386
Epoch: 22, step: 482, loss: 0.37686240673065186, mean loss: 0.35246526788846305
Epoch: 22, step: 483, loss: 0.3508750796318054, mean loss: 0.3524652185833577
Epoch: 22, step: 484, loss: 0.33066174387931824, mean loss: 0.3524645425695077
Epoch: 22, step: 485, loss: 0.2974129021167755, mean loss: 0.3524628357535949
Epoch: 22, step: 486, loss: 0.32065582275390625, mean loss: 0.3524618496425113
Epoch: 22, step: 487, loss: 0.35236626863479614, mean loss: 0.3524618466793104
Epoch: 22, step: 488, loss: 0.3357657790184021, mean loss: 0.3524613290841323
Epoch: 22, step: 489, loss: 0.30687883496284485, mean loss: 0.3524599160239884
Epoch: 22, step: 490, loss: 0.3360557556152344, mean loss: 0.3524594075097626
Epoch: 22, step: 491, loss: 0.34195640683174133, mean loss: 0.352459081936276
Epoch: 22, step: 492, loss: 0.3539198040962219, mean loss: 0.35245912721454264
Epoch: 22, step: 493, loss: 0.3687054216861725, mean loss: 0.3524596307882353
Epoch: 22, step: 494, loss: 0.32520630955696106, mean loss: 0.35245878606451986
Epoch: 22, step: 495, loss: 0.3383771479129791, mean loss: 0.35245834961404404
Epoch: 22, step: 496, loss: 0.37002742290496826, mean loss: 0.3524588941382434
Epoch: 22, step: 497, loss: 0.31824034452438354, mean loss: 0.35245783362409183
Epoch: 22, step: 498, loss: 0.39594969153404236, mean loss: 0.3524591814983259
Epoch: 22, step: 499, loss: 0.31452566385269165, mean loss: 0.35245800592135657
Epoch: 22, step: 500, loss: 0.3357069194316864, mean loss: 0.3524574868136529
Epoch: 22, step: 501, loss: 0.3324107527732849, mean loss: 0.35245686559474865
Epoch: 22, step: 502, loss: 0.3206888437271118, mean loss: 0.3524558811808207
Epoch: 22, step: 503, loss: 0.3198099434375763, mean loss: 0.35245486959375627
Epoch: 22, step: 504, loss: 0.3246611952781677, mean loss: 0.3524540083885905
Epoch: 22, step: 505, loss: 0.31675857305526733, mean loss: 0.35245290237646515
Epoch: 22, step: 506, loss: 0.36545905470848083, mean loss: 0.35245330535562336
Epoch: 22, step: 507, loss: 0.3581404685974121, mean loss: 0.3524534815597144
Epoch: 22, step: 508, loss: 0.3207724392414093, mean loss: 0.35245250002356426
Epoch: 22, step: 509, loss: 0.34763720631599426, mean loss: 0.35245235084165377
Epoch: 22, step: 510, loss: 0.34529995918273926, mean loss: 0.35245212926131797
Epoch: 22, step: 511, loss: 0.34120839834213257, mean loss: 0.3524517809425163
Epoch: 22, step: 512, loss: 0.32189199328422546, mean loss: 0.3524508342621886
Epoch: 22, step: 513, loss: 0.3262244760990143, mean loss: 0.3524500218478969
Epoch: 22, step: 514, loss: 0.32597559690475464, mean loss: 0.3524492017746403
Epoch: 22, step: 515, loss: 0.32797446846961975, mean loss: 0.352448443667426
Epoch: 22, step: 516, loss: 0.3284769654273987, mean loss: 0.3524477011715846
Epoch: 22, step: 517, loss: 0.34175848960876465, mean loss: 0.3524473700927404
Epoch: 22, step: 518, loss: 0.3352205455303192, mean loss: 0.352446836539776
Epoch: 22, step: 519, loss: 0.3531322479248047, mean loss: 0.3524468577678293
Epoch: 22, step: 520, loss: 0.37734630703926086, mean loss: 0.3524476289112302
Epoch: 22, step: 521, loss: 0.3320537209510803, mean loss: 0.35244699732535345
Epoch: 22, step: 522, loss: 0.3072074055671692, mean loss: 0.3524455963284268
Epoch: 22, step: 523, loss: 0.3368673622608185, mean loss: 0.3524451139106742
Epoch: 22, step: 524, loss: 0.37756502628326416, mean loss: 0.35244589178551927
Epoch: 22, step: 525, loss: 0.29310742020606995, mean loss: 0.35244405433981485
Epoch: 22, step: 526, loss: 0.3640647232532501, mean loss: 0.35244441416854727
Epoch: 22, step: 527, loss: 0.3596818149089813, mean loss: 0.35244463826443345
Epoch: 22, step: 528, loss: 0.31360703706741333, mean loss: 0.35244343575023096
Epoch: 22, step: 529, loss: 0.3222600221633911, mean loss: 0.3524425012213565
Epoch: 22, step: 530, loss: 0.28517818450927734, mean loss: 0.35244041867029574
Epoch: 22, step: 531, loss: 0.32947251200675964, mean loss: 0.3524397075895941
Epoch: 22, step: 532, loss: 0.36187949776649475, mean loss: 0.3524399998341121
Epoch: 22, step: 533, loss: 0.38085314631462097, mean loss: 0.35244087944362484
Epoch: 22, step: 534, loss: 0.37362438440322876, mean loss: 0.3524415352187838
Epoch: 22, step: 535, loss: 0.312359094619751, mean loss: 0.35244029443000846
Epoch: 22, step: 536, loss: 0.31287410855293274, mean loss: 0.3524390696602862
Epoch: 22, step: 537, loss: 0.3187757730484009, mean loss: 0.3524380276465237
Epoch: 22, step: 538, loss: 0.3239695131778717, mean loss: 0.35243714645933616
Epoch: 22, step: 539, loss: 0.34007740020751953, mean loss: 0.35243676389940515
Epoch: 22, step: 540, loss: 0.3034909665584564, mean loss: 0.3524352489717583
Epoch: 22, step: 541, loss: 0.34662696719169617, mean loss: 0.3524350692044485
Epoch: 22, step: 542, loss: 0.30494174361228943, mean loss: 0.3524335993234299
Epoch: 22, step: 543, loss: 0.3176749050617218, mean loss: 0.35243252360251315
Epoch: 22, step: 544, loss: 0.3193936347961426, mean loss: 0.35243150113821686
Epoch: 22, step: 545, loss: 0.3122152090072632, mean loss: 0.3524302565912053
Epoch: 22, step: 546, loss: 0.3247143626213074, mean loss: 0.3524293989122955
Epoch: 22, step: 547, loss: 0.3527805507183075, mean loss: 0.3524294097784858
Epoch: 22, step: 548, loss: 0.3873060345649719, mean loss: 0.35243048898214907
Epoch: 22, step: 549, loss: 0.3084505796432495, mean loss: 0.35242912813341654
Epoch: 22, step: 550, loss: 0.31361255049705505, mean loss: 0.3524279270882841
Epoch: 22, step: 551, loss: 0.2999550998210907, mean loss: 0.35242630354783644
Epoch: 22, step: 552, loss: 0.3217909336090088, mean loss: 0.3524253557006183
Epoch: 22, step: 553, loss: 0.33573007583618164, mean loss: 0.3524248391707048
Epoch: 22, step: 554, loss: 0.3451599180698395, mean loss: 0.35242461441059275
Epoch: 22, step: 555, loss: 0.3519481420516968, mean loss: 0.3524245996700792
Epoch: 22, step: 556, loss: 0.3600160479545593, mean loss: 0.3524248345176673
Epoch: 22, step: 557, loss: 0.39035916328430176, mean loss: 0.35242600801048324
Epoch: 22, step: 558, loss: 0.4067651629447937, mean loss: 0.3524276889321566
Epoch: 22, step: 559, loss: 0.3394124209880829, mean loss: 0.3524272863316881
Epoch: 22, step: 560, loss: 0.3295290768146515, mean loss: 0.35242657804471617
Epoch: 22, step: 561, loss: 0.32039451599121094, mean loss: 0.35242558726024187
Epoch: 22, step: 562, loss: 0.3326711356639862, mean loss: 0.3524249762537281
Epoch: 22, step: 563, loss: 0.3615320324897766, mean loss: 0.35242525792687657
Epoch: 22, step: 564, loss: 0.32224926352500916, mean loss: 0.3524243246390777
Epoch: 22, step: 565, loss: 0.35279569029808044, mean loss: 0.35242433612437674
Epoch: 22, step: 566, loss: 0.30586370825767517, mean loss: 0.35242289617918215
Epoch: 22, step: 567, loss: 0.3184768557548523, mean loss: 0.35242184638822394
Epoch: 22, step: 568, loss: 0.3246159851551056, mean loss: 0.35242098651064613
Epoch: 22, step: 569, loss: 0.34825599193573, mean loss: 0.35242085771497
Epoch: 22, step: 570, loss: 0.31999292969703674, mean loss: 0.35241985496510086
Epoch: 22, step: 571, loss: 0.3422681987285614, mean loss: 0.35241954106107376
Epoch: 22, step: 572, loss: 0.33197250962257385, mean loss: 0.3524189088285689
Epoch: 22, step: 573, loss: 0.31500932574272156, mean loss: 0.3524177521411938
Epoch: 22, step: 574, loss: 0.32227903604507446, mean loss: 0.3524168202945471
Epoch: 22, step: 575, loss: 0.37395212054252625, mean loss: 0.35241748611510876
Epoch: 22, step: 576, loss: 0.3387104868888855, mean loss: 0.3524170623402061
Epoch: 22, step: 577, loss: 0.30085766315460205, mean loss: 0.35241546834406484
Epoch: 22, step: 578, loss: 0.3730761706829071, mean loss: 0.352416107064884
Epoch: 22, step: 579, loss: 0.34430158138275146, mean loss: 0.35241585621396027
Epoch: 22, step: 580, loss: 0.33383676409721375, mean loss: 0.35241528188114885
Epoch: 22, step: 581, loss: 0.2935987710952759, mean loss: 0.3524134637509854
Epoch: 22, step: 582, loss: 0.34066757559776306, mean loss: 0.3524131006744761
Epoch: 22, step: 583, loss: 0.31567326188087463, mean loss: 0.3524119650464224
Epoch: 22, step: 584, loss: 0.3561234474182129, mean loss: 0.35241207976475986
Epoch: 22, step: 585, loss: 0.3193790912628174, mean loss: 0.35241105877852935
Epoch: 22, step: 586, loss: 0.3174298107624054, mean loss: 0.35240997760875603
Epoch: 22, step: 587, loss: 0.3668450713157654, mean loss: 0.35241042374219983
Epoch: 22, step: 588, loss: 0.28604936599731445, mean loss: 0.35240837283952825
Epoch: 22, step: 589, loss: 0.3237757980823517, mean loss: 0.3524074879710334
Epoch: 22, step: 590, loss: 0.3497345745563507, mean loss: 0.35240740536917875
Epoch: 22, step: 591, loss: 0.3461731970310211, mean loss: 0.3524072127174996
Epoch: 22, step: 592, loss: 0.33496004343032837, mean loss: 0.3524066735756533
Epoch: 22, step: 593, loss: 0.3722020387649536, mean loss: 0.3524072852611236
Epoch: 22, step: 594, loss: 0.30618348717689514, mean loss: 0.35240585696961524
Epoch: 22, step: 595, loss: 0.33348461985588074, mean loss: 0.3524052723312172
Epoch: 22, step: 596, loss: 0.319399893283844, mean loss: 0.35240425254505786
Epoch: 22, step: 597, loss: 0.32613062858581543, mean loss: 0.35240344077888475
Epoch: 22, step: 598, loss: 0.35901975631713867, mean loss: 0.3524036451943554
Epoch: 22, step: 599, loss: 0.30542534589767456, mean loss: 0.35240219381338356
Epoch: 22, step: 600, loss: 0.36515894532203674, mean loss: 0.35240258791735674
Epoch: 22, step: 601, loss: 0.33652687072753906, mean loss: 0.3524020974719693
Epoch: 22, step: 602, loss: 0.3059289753437042, mean loss: 0.3524006618313611
Epoch: 22, step: 603, loss: 0.3507503569126129, mean loss: 0.35240061085196783
Epoch: 22, step: 604, loss: 0.36188793182373047, mean loss: 0.35240090391473533
Epoch: 22, step: 605, loss: 0.3110648989677429, mean loss: 0.35239962708749906
Epoch: 22, step: 606, loss: 0.278570294380188, mean loss: 0.35239734664478994
Epoch: 22, step: 607, loss: 0.35216668248176575, mean loss: 0.3523973395202482
Epoch: 22, step: 608, loss: 0.3107750713825226, mean loss: 0.3523960539697606
Epoch: 22, step: 609, loss: 0.3910553455352783, mean loss: 0.35239724796851174
Epoch: 22, step: 610, loss: 0.3357286751270294, mean loss: 0.3523967331727231
Epoch: 22, step: 611, loss: 0.32661476731300354, mean loss: 0.3523959369415353
Epoch: 22, step: 612, loss: 0.3378100097179413, mean loss: 0.35239548649444524
Epoch: 22, step: 613, loss: 0.32944318652153015, mean loss: 0.35239477769634836
Epoch: 22, step: 614, loss: 0.36687377095222473, mean loss: 0.35239522481345475
Epoch: 22, step: 615, loss: 0.29009583592414856, mean loss: 0.3523933010427998
Epoch: 22, step: 616, loss: 0.3593306243419647, mean loss: 0.35239351525688967
Epoch: 22, step: 617, loss: 0.31236976385116577, mean loss: 0.3523922794219176
Epoch: 22, step: 618, loss: 0.4220317304134369, mean loss: 0.35239442965043494
Epoch: 22, step: 619, loss: 0.31666839122772217, mean loss: 0.35239332658638584
Epoch: 22, step: 620, loss: 0.34481576085090637, mean loss: 0.35239309263147106
Epoch: 22, step: 621, loss: 0.36744600534439087, mean loss: 0.35239355737098055
Epoch: 22, step: 622, loss: 0.3579319715499878, mean loss: 0.35239372835718596
Epoch: 22, step: 623, loss: 0.31894683837890625, mean loss: 0.3523926957908122
Epoch: 22, step: 624, loss: 0.30652132630348206, mean loss: 0.35239127970185824
Epoch: 22, step: 625, loss: 0.33311641216278076, mean loss: 0.35239068468835144
Epoch: 22, step: 626, loss: 0.33160439133644104, mean loss: 0.3523900430370672
Epoch: 22, step: 627, loss: 0.34078890085220337, mean loss: 0.35238968493291284
Epoch: 22, step: 628, loss: 0.30524569749832153, mean loss: 0.35238822973683187
Epoch: 22, step: 629, loss: 0.33275771141052246, mean loss: 0.3523876238192343
Epoch: 22, step: 630, loss: 0.35371920466423035, mean loss: 0.352387664918677
Epoch: 22, step: 631, loss: 0.34514614939689636, mean loss: 0.3523874414151115
Epoch: 22, step: 632, loss: 0.33785679936408997, mean loss: 0.35238699295234643
Epoch: 22, step: 633, loss: 0.3077505826950073, mean loss: 0.3523856153703991
Epoch: 22, step: 634, loss: 0.3788255453109741, mean loss: 0.35238643134206654
Epoch: 22, step: 635, loss: 0.30524542927742004, mean loss: 0.3523849765524707
Epoch: 22, step: 636, loss: 0.2974812686443329, mean loss: 0.3523832822550503
Epoch: 22, step: 637, loss: 0.3509432077407837, mean loss: 0.35238323781653536
Epoch: 22, step: 638, loss: 0.3957093060016632, mean loss: 0.35238457475201795
Epoch: 22, step: 639, loss: 0.37127935886383057, mean loss: 0.35238515778040946
Epoch: 22, step: 640, loss: 0.3265197277069092, mean loss: 0.3523843596863592
Epoch: 22, step: 641, loss: 0.3379766643047333, mean loss: 0.35238391514160816
Epoch: 22, step: 642, loss: 0.29693537950515747, mean loss: 0.35238220434787654
Epoch: 22, step: 643, loss: 0.3279151916503906, mean loss: 0.352381449472747
Epoch: 22, step: 644, loss: 0.32287102937698364, mean loss: 0.352380539022616
Epoch: 22, step: 645, loss: 0.3677831292152405, mean loss: 0.3523810142058761
Epoch: 22, step: 646, loss: 0.3229179382324219, mean loss: 0.35238010527248187
Epoch: 22, step: 647, loss: 0.34420084953308105, mean loss: 0.35237985295092034
Epoch: 22, step: 648, loss: 0.3132959306240082, mean loss: 0.3523786472896214
Epoch: 22, step: 649, loss: 0.33030790090560913, mean loss: 0.3523779664719774
Epoch: 22, step: 650, loss: 0.3250774145126343, mean loss: 0.35237712435618235
Epoch: 22, step: 651, loss: 0.32941609621047974, mean loss: 0.3523764161196572
Epoch: 22, step: 652, loss: 0.32124677300453186, mean loss: 0.3523754559505349
Epoch: 22, step: 653, loss: 0.324174702167511, mean loss: 0.3523745861475066
Epoch: 22, step: 654, loss: 0.3588893413543701, mean loss: 0.35237478707756265
Epoch: 22, step: 655, loss: 0.30647388100624084, mean loss: 0.3523733714315575
Epoch: 22, step: 656, loss: 0.3492914140224457, mean loss: 0.3523732763827554
Epoch: 22, step: 657, loss: 0.30828776955604553, mean loss: 0.35237191680997965
Epoch: 22, step: 658, loss: 0.3486887514591217, mean loss: 0.3523718032266895
Epoch: 22, step: 659, loss: 0.3447297513484955, mean loss: 0.3523715675645494
Epoch: 22, step: 660, loss: 0.3184514045715332, mean loss: 0.3523705215821573
Epoch: 22, step: 661, loss: 0.30351904034614563, mean loss: 0.352369015215175
Epoch: 22, step: 662, loss: 0.32520627975463867, mean loss: 0.3523681776605063
Epoch: 22, step: 663, loss: 0.3312668204307556, mean loss: 0.35236752702665
Epoch: 22, step: 664, loss: 0.30958497524261475, mean loss: 0.35236620792105433
Epoch: 22, step: 665, loss: 0.34740522503852844, mean loss: 0.35236605496480833
Epoch: 22, step: 666, loss: 0.32212501764297485, mean loss: 0.35236512260663594
Epoch: 22, step: 667, loss: 0.3138207197189331, mean loss: 0.35236393428492896
Epoch: 22, step: 668, loss: 0.3266690969467163, mean loss: 0.35236314213900494
Epoch: 22, step: 669, loss: 0.3006078898906708, mean loss: 0.35236154662595703
Epoch: 22, step: 670, loss: 0.3701241910457611, mean loss: 0.35236209419661024
Epoch: 22, step: 671, loss: 0.39761990308761597, mean loss: 0.3523634893201889
Epoch: 22, step: 672, loss: 0.38062673807144165, mean loss: 0.3523643605402114
Epoch: 22, step: 673, loss: 0.3518405556678772, mean loss: 0.35236434439432424
Epoch: 22, step: 674, loss: 0.3037048578262329, mean loss: 0.3523628445488547
Epoch: 22, step: 675, loss: 0.3828754723072052, mean loss: 0.3523637850194427
Epoch: 22, step: 676, loss: 0.3277992904186249, mean loss: 0.35236302790757335
Epoch: 22, step: 677, loss: 0.320663183927536, mean loss: 0.3523620509044303
Epoch: 22, step: 678, loss: 0.32593977451324463, mean loss: 0.3523612365833408
Epoch: 22, step: 679, loss: 0.3221508860588074, mean loss: 0.3523603055444316
Epoch: 22, step: 680, loss: 0.2937925457954407, mean loss: 0.35235850062718455
Epoch: 22, step: 681, loss: 0.3819824457168579, mean loss: 0.352359413537665
Epoch: 22, step: 682, loss: 0.30872562527656555, mean loss: 0.3523580689323135
Epoch: 22, step: 683, loss: 0.3440876305103302, mean loss: 0.3523578140808892
Epoch: 22, step: 684, loss: 0.30681464076042175, mean loss: 0.35235641072300794
Epoch: 22, step: 685, loss: 0.3103163242340088, mean loss: 0.35235511534843195
Epoch: 22, step: 686, loss: 0.3382534384727478, mean loss: 0.3523546808490674
Epoch: 22, step: 687, loss: 0.3316301107406616, mean loss: 0.3523540423054974
Epoch: 22, step: 688, loss: 0.34901687502861023, mean loss: 0.3523539394873911
Epoch: 22, step: 689, loss: 0.336803138256073, mean loss: 0.35235346038204785
Epoch: 22, step: 690, loss: 0.31789836287498474, mean loss: 0.3523523988860835
Epoch: 22, step: 691, loss: 0.3671551048755646, mean loss: 0.3523528549152267
Epoch: 22, step: 692, loss: 0.355829656124115, mean loss: 0.3523529620222539
Epoch: 22, step: 693, loss: 0.3182210624217987, mean loss: 0.3523519105805806
Epoch: 22, step: 694, loss: 0.3315403163433075, mean loss: 0.3523512694939824
Epoch: 22, step: 695, loss: 0.3569372296333313, mean loss: 0.35235141075692405
Epoch: 22, step: 696, loss: 0.3247130513191223, mean loss: 0.3523505594290498
Epoch: 22, step: 697, loss: 0.3814430236816406, mean loss: 0.35235145551924424
Epoch: 22, step: 698, loss: 0.31357821822166443, mean loss: 0.35235026128395003
Epoch: 22, step: 699, loss: 0.3351535201072693, mean loss: 0.35234973163194877
Epoch: 22, step: 700, loss: 0.3492414951324463, mean loss: 0.35234963590259155
Epoch: 22, step: 701, loss: 0.3613128066062927, mean loss: 0.35234991194726983
Epoch: 22, step: 702, loss: 0.34744471311569214, mean loss: 0.35234976088327946
Epoch: 22, step: 703, loss: 0.3425971269607544, mean loss: 0.35234946054348143
Epoch: 22, step: 704, loss: 0.36012059450149536, mean loss: 0.3523496998541074
Epoch: 22, step: 705, loss: 0.34350070357322693, mean loss: 0.3523494273593029
Epoch: 22, step: 706, loss: 0.328866183757782, mean loss: 0.35234870424171705
Epoch: 22, step: 707, loss: 0.341950923204422, mean loss: 0.35234838407356095
Epoch: 22, step: 708, loss: 0.32018959522247314, mean loss: 0.35234739387160724
Epoch: 22, step: 709, loss: 0.32435011863708496, mean loss: 0.3523465318334511
Epoch: 22, step: 710, loss: 0.3031870722770691, mean loss: 0.35234501825669207
Epoch: 22, step: 711, loss: 0.3016597032546997, mean loss: 0.35234345774822523
Epoch: 22, step: 712, loss: 0.33199378848075867, mean loss: 0.35234283123828813
Epoch: 22, step: 713, loss: 0.3554154932498932, mean loss: 0.3523429258341262
Epoch: 22, step: 714, loss: 0.35667097568511963, mean loss: 0.35234305907458585
Epoch: 22, step: 715, loss: 0.31765830516815186, mean loss: 0.35234199132572774
Epoch: 22, step: 716, loss: 0.34806254506111145, mean loss: 0.3523418595896568
Epoch: 22, step: 717, loss: 0.30236753821372986, mean loss: 0.35234032125556286
Epoch: 22, step: 718, loss: 0.35245075821876526, mean loss: 0.35234032465498305
Epoch: 22, step: 719, loss: 0.30361124873161316, mean loss: 0.35233882474498784
Epoch: 22, step: 720, loss: 0.3482740819454193, mean loss: 0.35233869963363323
Epoch: 22, step: 721, loss: 0.3116026222705841, mean loss: 0.35233744583008253
Epoch: 22, step: 722, loss: 0.2806127071380615, mean loss: 0.35233523830373087
Epoch: 22, step: 723, loss: 0.33423739671707153, mean loss: 0.3523346813099605
Epoch: 22, step: 724, loss: 0.4271603524684906, mean loss: 0.35233698413429676
Epoch: 22, step: 725, loss: 0.35018470883369446, mean loss: 0.35233691789821314
Epoch: 22, step: 726, loss: 0.3462003469467163, mean loss: 0.3523367290515921
Epoch: 22, step: 727, loss: 0.32303905487060547, mean loss: 0.35233582747373077
Epoch: 22, step: 728, loss: 0.3308098614215851, mean loss: 0.3523351650751693
Epoch: 22, step: 729, loss: 0.315287321805954, mean loss: 0.3523340250713762
Epoch: 22, step: 730, loss: 0.3118954002857208, mean loss: 0.3523327807677119
Epoch: 22, step: 731, loss: 0.3127146363258362, mean loss: 0.35233156174788294
Epoch: 22, step: 732, loss: 0.38450637459754944, mean loss: 0.35233255171166405
Epoch: 22, step: 733, loss: 0.3303976058959961, mean loss: 0.3523318768317854
Epoch: 22, step: 734, loss: 0.3500259518623352, mean loss: 0.35233180588679663
Epoch: 22, step: 735, loss: 0.34851309657096863, mean loss: 0.35233168840250806
Epoch: 22, step: 736, loss: 0.3441959321498871, mean loss: 0.35233143811005296
Epoch: 22, step: 737, loss: 0.3237265944480896, mean loss: 0.35233055812347625
Epoch: 22, step: 738, loss: 0.33749106526374817, mean loss: 0.35233010162201933
Epoch: 22, step: 739, loss: 0.3271734118461609, mean loss: 0.35232932776051523
Epoch: 22, step: 740, loss: 0.3213786482810974, mean loss: 0.35232837569556463
Epoch: 22, step: 741, loss: 0.3332747519016266, mean loss: 0.352327789610551
Epoch: 22, step: 742, loss: 0.35528045892715454, mean loss: 0.3523278804311753
Epoch: 22, step: 743, loss: 0.287661075592041, mean loss: 0.35232589141773907
Epoch: 22, step: 744, loss: 0.33597424626350403, mean loss: 0.3523253884913664
Epoch: 22, step: 745, loss: 0.34002771973609924, mean loss: 0.35232501026448704
Epoch: 22, step: 746, loss: 0.3117523491382599, mean loss: 0.3523237624508279
Epoch: 22, step: 747, loss: 0.38343316316604614, mean loss: 0.35232471919214653
Epoch: 22, step: 748, loss: 0.3223326802253723, mean loss: 0.35232379684263804
Epoch: 22, step: 749, loss: 0.3136266767978668, mean loss: 0.3523226068211101
Epoch: 22, step: 750, loss: 0.3387531638145447, mean loss: 0.3523221895437336
Epoch: 22, step: 751, loss: 0.3367125988006592, mean loss: 0.35232170954401826
Epoch: 22, step: 752, loss: 0.2994498908519745, mean loss: 0.35232008376932833
Epoch: 22, step: 753, loss: 0.3227577805519104, mean loss: 0.3523191747753176
Epoch: 22, step: 754, loss: 0.36468610167503357, mean loss: 0.35231955502704404
Epoch: 22, step: 755, loss: 0.34082499146461487, mean loss: 0.3523192016091507
Epoch: 22, step: 756, loss: 0.36815324425697327, mean loss: 0.35231968843598077
Epoch: 22, step: 757, loss: 0.2952689528465271, mean loss: 0.3523179344319351
Epoch: 22, step: 758, loss: 0.3357938528060913, mean loss: 0.3523174264206944
Epoch: 22, step: 759, loss: 0.3654963970184326, mean loss: 0.35231783157842306
Epoch: 22, step: 760, loss: 0.3365219533443451, mean loss: 0.3523173459846995
Epoch: 22, step: 761, loss: 0.34164655208587646, mean loss: 0.35231701795537584
Epoch: 22, step: 762, loss: 0.37661468982696533, mean loss: 0.35231776486361327
Epoch: 22, step: 763, loss: 0.32666832208633423, mean loss: 0.3523169764262969
Epoch: 22, step: 764, loss: 0.32179880142211914, mean loss: 0.3523160383580276
Epoch: 22, step: 765, loss: 0.3587138056755066, mean loss: 0.35231623500668185
Epoch: 22, step: 766, loss: 0.35435551404953003, mean loss: 0.3523162976862283
Epoch: 22, step: 767, loss: 0.36051732301712036, mean loss: 0.3523165497462643
Epoch: 22, step: 768, loss: 0.31119734048843384, mean loss: 0.35231528597857653
Epoch: 22, step: 769, loss: 0.31580233573913574, mean loss: 0.35231416381525243
Epoch: 22, step: 770, loss: 0.3277691602706909, mean loss: 0.35231340948956497
Epoch: 22, step: 771, loss: 0.30766069889068604, mean loss: 0.35231203724891963
Epoch: 22, step: 772, loss: 0.35692113637924194, mean loss: 0.3523121788886704
Epoch: 22, step: 773, loss: 0.3223036229610443, mean loss: 0.3523112567401876
Epoch: 22, step: 774, loss: 0.33108609914779663, mean loss: 0.3523106045213512
Epoch: 22, step: 775, loss: 0.33704888820648193, mean loss: 0.35231013556497476
Epoch: 22, step: 776, loss: 0.3419751822948456, mean loss: 0.3523098180061095
Epoch: 22, step: 777, loss: 0.3324373960494995, mean loss: 0.35230920741119903
Epoch: 22, step: 778, loss: 0.3277861475944519, mean loss: 0.3523084539451402
Epoch: 22, step: 779, loss: 0.3162575364112854, mean loss: 0.3523073463220133
Epoch: 22, step: 780, loss: 0.3196849226951599, mean loss: 0.35230634406622585
Epoch: 22, step: 781, loss: 0.33375900983810425, mean loss: 0.35230577425565046
Epoch: 22, step: 782, loss: 0.3223772346973419, mean loss: 0.3523048548203164
Epoch: 22, step: 783, loss: 0.3234093189239502, mean loss: 0.35230396714718126
Epoch: 22, step: 784, loss: 0.3075387477874756, mean loss: 0.3523025919983667
Epoch: 22, step: 785, loss: 0.3554888367652893, mean loss: 0.35230268987404306
Epoch: 22, step: 786, loss: 0.35962170362472534, mean loss: 0.3523029146940016
Epoch: 22, step: 787, loss: 0.2836340367794037, mean loss: 0.35230080543985753
Epoch: 22, step: 788, loss: 0.36353445053100586, mean loss: 0.35230115048531907
Epoch: 22, step: 789, loss: 0.32720747590065, mean loss: 0.3523003797477251
Epoch: 22, step: 790, loss: 0.31313759088516235, mean loss: 0.35229917692242757
Epoch: 22, step: 791, loss: 0.3710256516933441, mean loss: 0.3522997520598591
Epoch: 22, step: 792, loss: 0.3658740818500519, mean loss: 0.35230016894907595
Epoch: 22, step: 793, loss: 0.31636303663253784, mean loss: 0.3522990652965879
Epoch: 22, step: 794, loss: 0.3481576144695282, mean loss: 0.3522989381138705
Epoch: 22, step: 795, loss: 0.3531690835952759, mean loss: 0.3522989648349576
Epoch: 22, step: 796, loss: 0.29800647497177124, mean loss: 0.3522972976312154
Epoch: 22, step: 797, loss: 0.31322404742240906, mean loss: 0.3522960978139149
Epoch: 22, step: 798, loss: 0.2982020080089569, mean loss: 0.35229443680461703
Epoch: 22, step: 799, loss: 0.34297963976860046, mean loss: 0.35229415079389986
Epoch: 22, step: 800, loss: 0.32138586044311523, mean loss: 0.35229320178440154
Epoch: 22, step: 801, loss: 0.3480394780635834, mean loss: 0.35229307118189246
Epoch: 22, step: 802, loss: 0.31626051664352417, mean loss: 0.35229196490469683
Epoch: 22, step: 803, loss: 0.3566082715988159, mean loss: 0.35229209742055995
Epoch: 22, step: 804, loss: 0.3243222236633301, mean loss: 0.35229123873779333
Epoch: 22, step: 805, loss: 0.3344937860965729, mean loss: 0.3522906923679081
Epoch: 22, step: 806, loss: 0.3115233778953552, mean loss: 0.35228944087705705
Epoch: 22, step: 807, loss: 0.31505391001701355, mean loss: 0.35228829784136023
Epoch: 22, step: 808, loss: 0.33384501934051514, mean loss: 0.3522877316971941
Epoch: 22, step: 809, loss: 0.31185564398765564, mean loss: 0.35228649061156236
Epoch: 22, step: 810, loss: 0.3350217640399933, mean loss: 0.35228596067735407
Epoch: 22, step: 811, loss: 0.29343974590301514, mean loss: 0.3522841544706391
Epoch: 22, step: 812, loss: 0.3355890214443207, mean loss: 0.3522836420513448
Epoch: 22, step: 813, loss: 0.3484322726726532, mean loss: 0.35228352384591305
Epoch: 22, step: 814, loss: 0.3052729070186615, mean loss: 0.3522820810500739
Epoch: 22, step: 815, loss: 0.34442055225372314, mean loss: 0.3522818397804693
Epoch: 22, step: 816, loss: 0.3280869126319885, mean loss: 0.35228109726314083
Epoch: 22, step: 817, loss: 0.32785874605178833, mean loss: 0.3522803477894033
Epoch: 22, step: 818, loss: 0.35351303219795227, mean loss: 0.35228038561689307
Epoch: 22, step: 819, loss: 0.34313949942588806, mean loss: 0.35228010511836017
Epoch: 22, step: 820, loss: 0.3368366062641144, mean loss: 0.35227963123150097
Epoch: 22, step: 821, loss: 0.33728495240211487, mean loss: 0.3522791711308925
Epoch: 22, step: 822, loss: 0.3686574101448059, mean loss: 0.35227967366959995
Epoch: 22, step: 823, loss: 0.36840546131134033, mean loss: 0.3522801684470804
Epoch: 22, step: 824, loss: 0.30102476477622986, mean loss: 0.3522785958577615
Epoch: 22, step: 825, loss: 0.3654778003692627, mean loss: 0.35227900081586766
Epoch: 22, step: 826, loss: 0.3429144620895386, mean loss: 0.35227871351601414
Epoch: 22, step: 827, loss: 0.340716689825058, mean loss: 0.35227835880918845
Epoch: 22, step: 828, loss: 0.3276473879814148, mean loss: 0.3522776031884004
Epoch: 22, step: 829, loss: 0.3444065451622009, mean loss: 0.3522773617300893
Epoch: 22, step: 830, loss: 0.3301691710948944, mean loss: 0.3522766835439291
Epoch: 22, step: 831, loss: 0.3031193017959595, mean loss: 0.35227517564878347
Epoch: 22, step: 832, loss: 0.3403060734272003, mean loss: 0.3522748085096705
Epoch: 22, step: 833, loss: 0.3306021988391876, mean loss: 0.3522741437464759
Epoch: 22, step: 834, loss: 0.28903260827064514, mean loss: 0.35227220400057907
Epoch: 22, step: 835, loss: 0.3501114249229431, mean loss: 0.352272137727144
Epoch: 22, step: 836, loss: 0.2782760560512543, mean loss: 0.352269868256766
Epoch: 22, step: 837, loss: 0.31975093483924866, mean loss: 0.3522688709270286
Epoch: 22, step: 838, loss: 0.35850024223327637, mean loss: 0.35226906203235275
Epoch: 22, step: 839, loss: 0.29005998373031616, mean loss: 0.3522671542465854
Epoch: 22, step: 840, loss: 0.3538474440574646, mean loss: 0.35226720270835393
Epoch: 22, step: 841, loss: 0.3371325135231018, mean loss: 0.3522667385964501
Epoch: 22, step: 842, loss: 0.3194798529148102, mean loss: 0.35226573320300364
Epoch: 22, step: 843, loss: 0.29390180110931396, mean loss: 0.35226394355710355
Epoch: 22, step: 844, loss: 0.3337312340736389, mean loss: 0.3522633752956899
Epoch: 22, step: 845, loss: 0.3108813762664795, mean loss: 0.35226210645411793
Epoch: 22, step: 846, loss: 0.30817562341690063, mean loss: 0.3522607547299715
Epoch: 22, step: 847, loss: 0.3279505968093872, mean loss: 0.35226000938541907
Epoch: 22, step: 848, loss: 0.3257085680961609, mean loss: 0.3522591953485276
Epoch: 22, step: 849, loss: 0.3379564881324768, mean loss: 0.35225875685728913
Epoch: 22, step: 850, loss: 0.3561214804649353, mean loss: 0.3522588752767259
Epoch: 22, step: 851, loss: 0.34898847341537476, mean loss: 0.3522587750191581
Epoch: 22, step: 852, loss: 0.3369898796081543, mean loss: 0.3522583069496504
Epoch: 22, step: 853, loss: 0.3618994355201721, mean loss: 0.35225860249034596
Epoch: 22, step: 854, loss: 0.32382673025131226, mean loss: 0.35225773096190777
Epoch: 22, step: 855, loss: 0.3348408639431, mean loss: 0.35225719709521397
Epoch: 22, step: 856, loss: 0.31664368510246277, mean loss: 0.3522561054933138
Epoch: 22, step: 857, loss: 0.31829190254211426, mean loss: 0.35225506447685606
Epoch: 22, step: 858, loss: 0.3084836006164551, mean loss: 0.3522537229050333
Epoch: 22, step: 859, loss: 0.3258262574672699, mean loss: 0.35225291294225786
Epoch: 22, step: 860, loss: 0.32124459743499756, mean loss: 0.35225196261232106
Epoch: 22, step: 861, loss: 0.3582419455051422, mean loss: 0.3522521461851955
Epoch: 22, step: 862, loss: 0.3719179034233093, mean loss: 0.3522527488561905
Epoch: 22, step: 863, loss: 0.35658976435661316, mean loss: 0.3522528817630151
Epoch: 22, step: 864, loss: 0.3215760290622711, mean loss: 0.35225194170685414
Epoch: 22, step: 865, loss: 0.3731653392314911, mean loss: 0.3522525825537477
Epoch: 22, step: 866, loss: 0.3382784426212311, mean loss: 0.352252154358867
Epoch: 22, step: 867, loss: 0.3093935251235962, mean loss: 0.3522508411271831
Epoch: 22, step: 868, loss: 0.3467037081718445, mean loss: 0.35225067116263503
Epoch: 22, step: 869, loss: 0.3611871004104614, mean loss: 0.35225094496707304
Epoch: 22, step: 870, loss: 0.3483303487300873, mean loss: 0.35225082484708664
Epoch: 22, step: 871, loss: 0.3503303825855255, mean loss: 0.35225076601000754
Epoch: 22, step: 872, loss: 0.3348175287246704, mean loss: 0.3522502319198361
Epoch: 22, step: 873, loss: 0.34240633249282837, mean loss: 0.3522499303482588
Epoch: 22, step: 874, loss: 0.40889954566955566, mean loss: 0.35225166577745715
Epoch: 22, step: 875, loss: 0.29664066433906555, mean loss: 0.3522499622178003
Epoch: 22, step: 876, loss: 0.34036383032798767, mean loss: 0.35224959811512335
Epoch: 22, step: 877, loss: 0.3508201241493225, mean loss: 0.3522495543280142
Epoch: 22, step: 878, loss: 0.3813333809375763, mean loss: 0.3522504451855695
Epoch: 22, step: 879, loss: 0.27673500776290894, mean loss: 0.3522481321667805
Epoch: 22, step: 880, loss: 0.317813515663147, mean loss: 0.35224707747547285
Epoch: 22, step: 881, loss: 0.3791995346546173, mean loss: 0.35224790297186426
Epoch: 22, step: 882, loss: 0.33718669414520264, mean loss: 0.35224744169322575
Epoch: 22, step: 883, loss: 0.2910928726196289, mean loss: 0.35224556877367796
Epoch: 22, step: 884, loss: 0.3335484564304352, mean loss: 0.3522449961735388
Epoch: 22, step: 885, loss: 0.30537256598472595, mean loss: 0.3522435607466328
Epoch: 22, step: 886, loss: 0.334857702255249, mean loss: 0.35224302833632837
Epoch: 22, step: 887, loss: 0.3409232795238495, mean loss: 0.3522426817002182
Epoch: 22, step: 888, loss: 0.33686336874961853, mean loss: 0.3522422107655656
Epoch: 22, step: 889, loss: 0.3904650807380676, mean loss: 0.3522433811639358
Epoch: 22, step: 890, loss: 0.3251851499080658, mean loss: 0.3522425526562884
Epoch: 22, step: 891, loss: 0.34433513879776, mean loss: 0.352242310543188
Epoch: 22, step: 892, loss: 0.3632071614265442, mean loss: 0.35224264626012514
Epoch: 22, step: 893, loss: 0.3094539940357208, mean loss: 0.3522413362162753
Epoch: 22, step: 894, loss: 0.3448202610015869, mean loss: 0.3522411090150012
Epoch: 22, step: 895, loss: 0.3172941505908966, mean loss: 0.3522400391228134
Epoch: 22, step: 896, loss: 0.3055947721004486, mean loss: 0.3522386111336194
Epoch: 22, step: 897, loss: 0.39278680086135864, mean loss: 0.35223985243006606
Epoch: 22, step: 898, loss: 0.33996570110321045, mean loss: 0.3522394766945738
Epoch: 22, step: 899, loss: 0.33754804730415344, mean loss: 0.35223902697529524
Epoch: 22, step: 900, loss: 0.34082695841789246, mean loss: 0.3522386776512095
Epoch: 22, step: 901, loss: 0.33796653151512146, mean loss: 0.3522382407933541
Epoch: 22, step: 902, loss: 0.35170549154281616, mean loss: 0.35223822448686665
Epoch: 22, step: 903, loss: 0.3247262239456177, mean loss: 0.3522373824202487
Epoch: 22, step: 904, loss: 0.30536743998527527, mean loss: 0.352235947904213
Epoch: 22, step: 905, loss: 0.33650508522987366, mean loss: 0.3522354664552727
Epoch: 22, step: 906, loss: 0.3342755436897278, mean loss: 0.35223491680193636
Epoch: 22, step: 907, loss: 0.3584086000919342, mean loss: 0.35223510573825934
Epoch: 22, step: 908, loss: 0.3282865285873413, mean loss: 0.3522343728503825
Epoch: 22, step: 909, loss: 0.4012225568294525, mean loss: 0.3522358719685654
Epoch: 22, step: 910, loss: 0.3404630422592163, mean loss: 0.3522355117118345
Epoch: 22, step: 911, loss: 0.3266255557537079, mean loss: 0.3522347280534514
Epoch: 22, step: 912, loss: 0.334002822637558, mean loss: 0.35223417017867964
Epoch: 22, step: 913, loss: 0.32198143005371094, mean loss: 0.35223324450888815
Epoch: 22, step: 914, loss: 0.32892686128616333, mean loss: 0.3522325314047293
Epoch: 22, step: 915, loss: 0.3666306734085083, mean loss: 0.35223297193043007
Epoch: 22, step: 916, loss: 0.3536069989204407, mean loss: 0.3522330139688878
Epoch: 22, step: 917, loss: 0.37069666385650635, mean loss: 0.35223357884834344
Epoch: 22, step: 918, loss: 0.3013554811477661, mean loss: 0.3522320223244134
Epoch: 22, step: 919, loss: 0.316482812166214, mean loss: 0.3522309286750571
Epoch: 22, step: 920, loss: 0.3276185989379883, mean loss: 0.3522301757511458
Epoch: 22, step: 921, loss: 0.35887715220451355, mean loss: 0.3522303790847785
Epoch: 22, step: 922, loss: 0.3250866234302521, mean loss: 0.35222954877198126
Epoch: 22, step: 923, loss: 0.3225747346878052, mean loss: 0.35222864167501305
Epoch: 22, step: 924, loss: 0.3210518956184387, mean loss: 0.3522276880535633
Epoch: 22, step: 925, loss: 0.330731064081192, mean loss: 0.352227030543807
Epoch: 22, step: 926, loss: 0.32505279779434204, mean loss: 0.3522261994004288
Epoch: 22, step: 927, loss: 0.3342331051826477, mean loss: 0.3522256490855824
Epoch: 22, step: 928, loss: 0.3626929819583893, mean loss: 0.352225969216875
Epoch: 22, step: 929, loss: 0.33636534214019775, mean loss: 0.3522254841527403
Epoch: 22, step: 930, loss: 0.3293588161468506, mean loss: 0.35222478484487135
Epoch: 22, step: 931, loss: 0.2893955707550049, mean loss: 0.35222286346217746
Epoch: 22, step: 932, loss: 0.33609792590141296, mean loss: 0.35222237035990045
Epoch: 22, step: 933, loss: 0.32414790987968445, mean loss: 0.35222151186621564
Epoch: 22, step: 934, loss: 0.3311227262020111, mean loss: 0.3522208667026018
Epoch: 22, step: 935, loss: 0.3035631477832794, mean loss: 0.3522193788809616
Epoch: 22, step: 936, loss: 0.33666738867759705, mean loss: 0.3522189033576409
Epoch: 22, step: 937, loss: 0.30400392413139343, mean loss: 0.3522174291639386
Epoch: 22, step: 938, loss: 0.3729623556137085, mean loss: 0.35221806342958356
Epoch: 22, step: 939, loss: 0.353325217962265, mean loss: 0.3522180972792391
Epoch: 22, step: 940, loss: 0.32201048731803894, mean loss: 0.3522171737532994
Epoch: 22, step: 941, loss: 0.33194097876548767, mean loss: 0.3522165538757394
Epoch: 22, step: 942, loss: 0.3240519165992737, mean loss: 0.35221569286148496
Epoch: 22, step: 943, loss: 0.34158384799957275, mean loss: 0.3522153678478856
Epoch: 22, step: 944, loss: 0.32111966609954834, mean loss: 0.35221441728689307
Epoch: 22, step: 945, loss: 0.34981900453567505, mean loss: 0.35221434406402974
Epoch: 22, step: 946, loss: 0.33822497725486755, mean loss: 0.3522139164508001
Epoch: 22, step: 947, loss: 0.3005821108818054, mean loss: 0.3522123382687005
Epoch: 22, step: 948, loss: 0.35062098503112793, mean loss: 0.35221228962875073
Epoch: 22, step: 949, loss: 0.3231937289237976, mean loss: 0.35221140269921025
Epoch: 22, step: 950, loss: 0.3356446325778961, mean loss: 0.3522108963643552
Epoch: 22, step: 951, loss: 0.34104517102241516, mean loss: 0.3522105551135807
Epoch: 22, step: 952, loss: 0.3104170858860016, mean loss: 0.35220927784610023
Epoch: 22, step: 953, loss: 0.3251728117465973, mean loss: 0.35220845159874065
Epoch: 22, step: 954, loss: 0.3410792648792267, mean loss: 0.35220811149585524
Epoch: 22, step: 955, loss: 0.3357102572917938, mean loss: 0.3522076073443394
Epoch: 22, step: 956, loss: 0.3244554400444031, mean loss: 0.3522067593025579
Epoch: 22, step: 957, loss: 0.2987328767776489, mean loss: 0.3522051253148257
Epoch: 22, step: 958, loss: 0.3293408155441284, mean loss: 0.3522044266773163
Epoch: 22, step: 959, loss: 0.33287522196769714, mean loss: 0.35220383607585243
Epoch: 22, step: 960, loss: 0.3287737965583801, mean loss: 0.35220312019576083
Epoch: 22, step: 961, loss: 0.34412118792533875, mean loss: 0.3522028732684076
Epoch: 22, step: 962, loss: 0.3317037522792816, mean loss: 0.3522022469777049
Epoch: 22, step: 963, loss: 0.33582887053489685, mean loss: 0.35220174675234617
Epoch: 22, step: 964, loss: 0.31431442499160767, mean loss: 0.35220058928673775
Epoch: 22, step: 965, loss: 0.308695524930954, mean loss: 0.3521992602385201
Epoch: 22, step: 966, loss: 0.379737913608551, mean loss: 0.3522001014987422
Epoch: 22, step: 967, loss: 0.3088132441043854, mean loss: 0.352198776142639
Epoch: 22, step: 968, loss: 0.32834506034851074, mean loss: 0.3521980474956709
Epoch: 22, step: 969, loss: 0.341377317905426, mean loss: 0.35219771697060553
Epoch: 22, step: 970, loss: 0.3405434191226959, mean loss: 0.35219736099461824
Epoch: 22, step: 971, loss: 0.335287481546402, mean loss: 0.3521968445047145
Epoch: 22, step: 972, loss: 0.34642869234085083, mean loss: 0.3521966683295163
Epoch: 22, step: 973, loss: 0.3553178012371063, mean loss: 0.35219676365457
Epoch: 22, step: 974, loss: 0.38224470615386963, mean loss: 0.35219768134514506
Epoch: 22, step: 975, loss: 0.32297655940055847, mean loss: 0.35219678893365153
Epoch: 22, step: 976, loss: 0.3811352550983429, mean loss: 0.352197672685863
Epoch: 22, step: 977, loss: 0.3206009268760681, mean loss: 0.3521967077818805
Epoch: 22, step: 978, loss: 0.32306402921676636, mean loss: 0.35219581815295065
Epoch: 22, step: 979, loss: 0.3428190350532532, mean loss: 0.352195531821477
Epoch: 22, step: 980, loss: 0.3251756429672241, mean loss: 0.35219470676151016
Epoch: 22, step: 981, loss: 0.34388744831085205, mean loss: 0.35219445310476355
Epoch: 22, step: 982, loss: 0.35385438799858093, mean loss: 0.3521945037882509
Epoch: 22, step: 983, loss: 0.31527408957481384, mean loss: 0.3521933765161999
Epoch: 22, step: 984, loss: 0.3144579827785492, mean loss: 0.35219222439597464
Epoch: 22, step: 985, loss: 0.3540022075176239, mean loss: 0.35219227965588557
Epoch: 22, step: 986, loss: 0.3542337119579315, mean loss: 0.3521923419801812
Epoch: 22, step: 987, loss: 0.3599390685558319, mean loss: 0.3521925784781228
Epoch: 22, step: 988, loss: 0.3149876892566681, mean loss: 0.3521914426937341
Epoch: 22, step: 989, loss: 0.36681222915649414, mean loss: 0.35219188902093546
Epoch: 22, step: 990, loss: 0.31000006198883057, mean loss: 0.3521906010748128
Epoch: 22, step: 991, loss: 0.2952924966812134, mean loss: 0.35218886425843937
Epoch: 22, step: 992, loss: 0.31726157665252686, mean loss: 0.3521877981344625
Epoch: 22, step: 993, loss: 0.3413047790527344, mean loss: 0.3521874659502527
Epoch: 22, step: 994, loss: 0.2998438775539398, mean loss: 0.35218586830692344
Epoch: 22, step: 995, loss: 0.34781622886657715, mean loss: 0.3521857349398303
Epoch: 22, step: 996, loss: 0.3091185390949249, mean loss: 0.3521844205129771
Epoch: 22, step: 997, loss: 0.35852885246276855, mean loss: 0.35218461414149294
Epoch: 22, step: 998, loss: 0.38994672894477844, mean loss: 0.3521857665849514
Epoch: 22, step: 999, loss: 0.31201979517936707, mean loss: 0.352184540816781
Epoch: 22, step: 1000, loss: 0.3191072642803192, mean loss: 0.3521835314092148
Epoch: 22, step: 1001, loss: 0.29845502972602844, mean loss: 0.3521818918455382
Epoch: 22, step: 1002, loss: 0.3137704133987427, mean loss: 0.35218071972755444
Epoch: 22, step: 1003, loss: 0.317437082529068, mean loss: 0.3521796595653062
Epoch: 22, step: 1004, loss: 0.34281882643699646, mean loss: 0.35217937393893306
Epoch: 22, step: 1005, loss: 0.3303840458393097, mean loss: 0.35217870892007364
Epoch: 22, step: 1006, loss: 0.3387402892112732, mean loss: 0.3521782988996401
Epoch: 22, step: 1007, loss: 0.3247010409832001, mean loss: 0.35217746056494653
Epoch: 22, step: 1008, loss: 0.3419075310230255, mean loss: 0.35217714723762733
Epoch: 22, step: 1009, loss: 0.3107011318206787, mean loss: 0.35217588187624416
Epoch: 22, step: 1010, loss: 0.3447299003601074, mean loss: 0.35217565471917667
Epoch: 22, step: 1011, loss: 0.325987309217453, mean loss: 0.3521748558068673
Epoch: 22, step: 1012, loss: 0.2982729375362396, mean loss: 0.3521732115032075
Epoch: 22, step: 1013, loss: 0.3108849823474884, mean loss: 0.3521719520245559
Epoch: 22, step: 1014, loss: 0.33910346031188965, mean loss: 0.3521715533883203
Epoch: 22, step: 1015, loss: 0.35804814100265503, mean loss: 0.35217173264001667
Epoch: 22, step: 1016, loss: 0.3582761883735657, mean loss: 0.35217191883662285
Epoch: 22, step: 1017, loss: 0.34385186433792114, mean loss: 0.3521716650681089
Epoch: 22, step: 1018, loss: 0.3524666726589203, mean loss: 0.3521716740658089
Epoch: 22, step: 1019, loss: 0.31323641538619995, mean loss: 0.35217048658079364
Epoch: 22, step: 1020, loss: 0.30939337611198425, mean loss: 0.3521691819630722
Epoch: 22, step: 1021, loss: 0.39842820167541504, mean loss: 0.35217059272915063
Epoch: 22, step: 1022, loss: 0.3358854651451111, mean loss: 0.35217009609508687
Epoch: 22, step: 1023, loss: 0.33619603514671326, mean loss: 0.35216960896222066
Epoch: 22, step: 1024, loss: 0.35461556911468506, mean loss: 0.35216968355009465
Epoch: 22, step: 1025, loss: 0.36124223470687866, mean loss: 0.3521699602028713
Epoch: 22, step: 1026, loss: 0.31987205147743225, mean loss: 0.35216897536040365
Epoch: 22, step: 1027, loss: 0.32103610038757324, mean loss: 0.35216802607161923
Epoch: 22, step: 1028, loss: 0.3218974769115448, mean loss: 0.3521671031046052
Epoch: 22, step: 1029, loss: 0.3044450283050537, mean loss: 0.352165648074579
Epoch: 22, step: 1030, loss: 0.30447423458099365, mean loss: 0.3521641940237392
Epoch: 22, step: 1031, loss: 0.3508511185646057, mean loss: 0.35216415399095086
Epoch: 22, step: 1032, loss: 0.3190743029117584, mean loss: 0.352163145184784
Epoch: 22, step: 1033, loss: 0.34731346368789673, mean loss: 0.3521629973376558
Epoch: 22, step: 1034, loss: 0.32638996839523315, mean loss: 0.3521622116464403
Epoch: 22, step: 1035, loss: 0.3239861726760864, mean loss: 0.3521613527256084
Epoch: 22, step: 1036, loss: 0.3220504820346832, mean loss: 0.35216043485117793
Epoch: 22, step: 1037, loss: 0.3531113862991333, mean loss: 0.3521604638382976
Epoch: 22, step: 1038, loss: 0.3359617292881012, mean loss: 0.35215997007981464
Epoch: 22, step: 1039, loss: 0.3434489965438843, mean loss: 0.3521597045661126
Epoch: 22, step: 1040, loss: 0.3607613444328308, mean loss: 0.35215996673929273
Epoch: 22, step: 1041, loss: 0.2912851572036743, mean loss: 0.3521581113656403
Epoch: 22, step: 1042, loss: 0.3563406765460968, mean loss: 0.3521582388401208
Epoch: 22, step: 1043, loss: 0.32478511333465576, mean loss: 0.3521574045988217
Epoch: 22, step: 1044, loss: 0.36332324147224426, mean loss: 0.35215774488580776
Epoch: 22, step: 1045, loss: 0.3179183006286621, mean loss: 0.3521567014456829
Epoch: 22, step: 1046, loss: 0.3264940679073334, mean loss: 0.35215591940595903
Epoch: 22, step: 1047, loss: 0.2834163308143616, mean loss: 0.35215382470859824
Epoch: 22, step: 1048, loss: 0.31078362464904785, mean loss: 0.35215256407538803
Epoch: 22, step: 1049, loss: 0.2991563379764557, mean loss: 0.35215094922298695
Epoch: 22, step: 1050, loss: 0.34518691897392273, mean loss: 0.35215073702790944
Epoch: 22, step: 1051, loss: 0.340806782245636, mean loss: 0.35215039138638654
Epoch: 22, step: 1052, loss: 0.33217746019363403, mean loss: 0.3521497828451723
Epoch: 22, step: 1053, loss: 0.3533971905708313, mean loss: 0.3521498208504043
Epoch: 22, step: 1054, loss: 0.3673290014266968, mean loss: 0.352150283306017
Epoch: 22, step: 1055, loss: 0.3474208414554596, mean loss: 0.35215013922114463
Epoch: 22, step: 1056, loss: 0.3327105939388275, mean loss: 0.35214954700346657
Epoch: 22, step: 1057, loss: 0.3087255656719208, mean loss: 0.3521482241501999
Epoch: 22, step: 1058, loss: 0.323377400636673, mean loss: 0.3521473477124044
Epoch: 22, step: 1059, loss: 0.3251887559890747, mean loss: 0.35214652650515077
Epoch: 22, step: 1060, loss: 0.37058115005493164, mean loss: 0.35214708803987765
Epoch: 22, step: 1061, loss: 0.30609598755836487, mean loss: 0.35214568532588186
Epoch: 22, step: 1062, loss: 0.3484782874584198, mean loss: 0.35214557362054644
Epoch: 22, step: 1063, loss: 0.33824536204338074, mean loss: 0.3521451502466558
Epoch: 22, step: 1064, loss: 0.3443566858768463, mean loss: 0.35214491303213474
Epoch: 22, step: 1065, loss: 0.2976249158382416, mean loss: 0.3521432525583212
Epoch: 22, step: 1066, loss: 0.3505713939666748, mean loss: 0.3521432046868855
Epoch: 22, step: 1067, loss: 0.33188560605049133, mean loss: 0.3521425877542921
Epoch: 22, step: 1068, loss: 0.3696914613246918, mean loss: 0.35214312217806926
Epoch: 22, step: 1069, loss: 0.3766443729400635, mean loss: 0.3521438683030087
Epoch: 22, step: 1070, loss: 0.34927549958229065, mean loss: 0.3521437809565998
Epoch: 22, step: 1071, loss: 0.3487795293331146, mean loss: 0.35214367851288414
Epoch: 22, step: 1072, loss: 0.32008594274520874, mean loss: 0.3521427023630785
Epoch: 22, step: 1073, loss: 0.3696027994155884, mean loss: 0.352143234002353
Epoch: 22, step: 1074, loss: 0.3367030620574951, mean loss: 0.3521427638817201
Epoch: 22, step: 1075, loss: 0.3102132976055145, mean loss: 0.35214148725687916
Epoch: 22, step: 1076, loss: 0.33121299743652344, mean loss: 0.35214085006735807
Epoch: 22, step: 1077, loss: 0.3594827651977539, mean loss: 0.35214107359275326
Epoch: 22, step: 1078, loss: 0.3094554841518402, mean loss: 0.3521397740649595
Epoch: 22, step: 1079, loss: 0.32300081849098206, mean loss: 0.35213888698034024
Epoch: 22, step: 1080, loss: 0.3284335434436798, mean loss: 0.35213816533452036
Epoch: 22, step: 1081, loss: 0.31058523058891296, mean loss: 0.35213690040499995
Epoch: 22, step: 1082, loss: 0.3709705173969269, mean loss: 0.3521374737092218
Epoch: 22, step: 1083, loss: 0.3037395179271698, mean loss: 0.3521360004973692
Epoch: 22, step: 1084, loss: 0.31057894229888916, mean loss: 0.3521347355578447
Epoch: 22, step: 1085, loss: 0.33479830622673035, mean loss: 0.35213420787691296
Epoch: 22, step: 1086, loss: 0.3378760814666748, mean loss: 0.3521337739056328
Epoch: 22, step: 1087, loss: 0.30437374114990234, mean loss: 0.3521323202888579
Epoch: 22, step: 1088, loss: 0.34558212757110596, mean loss: 0.3521321209342997
Epoch: 22, step: 1089, loss: 0.32254618406295776, mean loss: 0.3521312205162319
Epoch: 22, step: 1090, loss: 0.3332514464855194, mean loss: 0.35213064594688925
Epoch: 22, step: 1091, loss: 0.35287585854530334, mean loss: 0.3521306686253006
Epoch: 22, step: 1092, loss: 0.36157089471817017, mean loss: 0.35213095590280563
Epoch: 22, step: 1093, loss: 0.3224380910396576, mean loss: 0.35213005234048855
Epoch: 22, step: 1094, loss: 0.3343501687049866, mean loss: 0.35212951131003983
Epoch: 22, step: 1095, loss: 0.33194494247436523, mean loss: 0.35212889712525297
Epoch: 22, step: 1096, loss: 0.31822046637535095, mean loss: 0.35212786537625707
Epoch: 22, step: 1097, loss: 0.356692910194397, mean loss: 0.35212800427496144
Epoch: 22, step: 1098, loss: 0.3297557830810547, mean loss: 0.35212732358547977
Epoch: 22, step: 1099, loss: 0.35592183470726013, mean loss: 0.3521274390324532
Epoch: 22, step: 1100, loss: 0.3226272165775299, mean loss: 0.35212654152347955
Epoch: 22, step: 1101, loss: 0.30372539162635803, mean loss: 0.35212506902120094
Epoch: 22, step: 1102, loss: 0.35625025629997253, mean loss: 0.35212519451745233
Epoch: 22, step: 1103, loss: 0.3540782630443573, mean loss: 0.3521252539318028
Epoch: 22, step: 1104, loss: 0.31016626954078674, mean loss: 0.35212397753523444
Epoch: 22, step: 1105, loss: 0.3345165550708771, mean loss: 0.3521234419319472
Epoch: 22, step: 1106, loss: 0.3484607934951782, mean loss: 0.3521233305205879
Epoch: 22, step: 1107, loss: 0.33560168743133545, mean loss: 0.35212282797638883
Epoch: 22, step: 1108, loss: 0.3926449418067932, mean loss: 0.35212406051323314
Epoch: 22, step: 1109, loss: 0.31357526779174805, mean loss: 0.35212288803337666
Epoch: 22, step: 1110, loss: 0.3216434419155121, mean loss: 0.352121961014729
Epoch: 22, step: 1111, loss: 0.34501153230667114, mean loss: 0.3521217447608145
Epoch: 22, step: 1112, loss: 0.318816602230072, mean loss: 0.3521207318614948
Epoch: 22, step: 1113, loss: 0.29002609848976135, mean loss: 0.3521188434534487
Epoch: 22, step: 1114, loss: 0.3288481831550598, mean loss: 0.3521181357728752
Epoch: 22, step: 1115, loss: 0.312355101108551, mean loss: 0.3521169265819415
Epoch: 22, step: 1116, loss: 0.3621188700199127, mean loss: 0.35211723073105017
Epoch: 22, step: 1117, loss: 0.3160005807876587, mean loss: 0.3521161324931999
Epoch: 22, step: 1118, loss: 0.33448338508605957, mean loss: 0.3521155963315735
Epoch: 22, step: 1119, loss: 0.3707982897758484, mean loss: 0.352116164401795
Epoch: 22, step: 1120, loss: 0.3100075423717499, mean loss: 0.3521148840763965
Epoch: 22, step: 1121, loss: 0.3116011917591095, mean loss: 0.3521136522827718
Epoch: 22, step: 1122, loss: 0.324908584356308, mean loss: 0.3521128251547451
Epoch: 22, step: 1123, loss: 0.2968612313270569, mean loss: 0.3521111453665344
Epoch: 22, step: 1124, loss: 0.3196544945240021, mean loss: 0.3521101586322492
Epoch: 22, step: 1125, loss: 0.3408629298210144, mean loss: 0.35210981670883423
Epoch: 22, step: 1126, loss: 0.32296162843704224, mean loss: 0.35210893061099957
Epoch: 22, step: 1127, loss: 0.3554496467113495, mean loss: 0.35210903216486933
Epoch: 22, step: 1128, loss: 0.3095962107181549, mean loss: 0.3521077398640077
Epoch: 22, step: 1129, loss: 0.319058895111084, mean loss: 0.35210673527878206
Epoch: 22, step: 1130, loss: 0.4132244884967804, mean loss: 0.3521085930177169
Epoch: 22, step: 1131, loss: 0.3433355987071991, mean loss: 0.35210832636135486
Epoch: 22, step: 1132, loss: 0.3425566852092743, mean loss: 0.35210803604673974
Epoch: 22, step: 1133, loss: 0.32506728172302246, mean loss: 0.35210721418927443
Epoch: 22, step: 1134, loss: 0.33165106177330017, mean loss: 0.35210659247841475
Epoch: 22, step: 1135, loss: 0.32574865221977234, mean loss: 0.3521057914226082
Epoch: 22, step: 1136, loss: 0.3289206027984619, mean loss: 0.35210508681271235
Epoch: 22, step: 1137, loss: 0.3447023034095764, mean loss: 0.3521048618451258
Epoch: 22, step: 1138, loss: 0.31157514452934265, mean loss: 0.35210363020087637
Epoch: 22, step: 1139, loss: 0.31873267889022827, mean loss: 0.3521026161328288
Epoch: 22, step: 1140, loss: 0.3426501154899597, mean loss: 0.3521023289013528
Epoch: 22, step: 1141, loss: 0.3155091404914856, mean loss: 0.3521012169843546
Epoch: 22, step: 1142, loss: 0.30454352498054504, mean loss: 0.3520997719449452
Epoch: 22, step: 1143, loss: 0.3433827757835388, mean loss: 0.3520995070872592
Epoch: 22, step: 1144, loss: 0.2948099970817566, mean loss: 0.3520977664525554
Epoch: 22, step: 1145, loss: 0.30545279383659363, mean loss: 0.3520963492752869
Epoch: 22, step: 1146, loss: 0.35433098673820496, mean loss: 0.3520964171664448
Epoch: 22, step: 1147, loss: 0.3357613682746887, mean loss: 0.35209592090174396
Epoch: 22, step: 1148, loss: 0.3377767503261566, mean loss: 0.35209548589337214
Epoch: 22, step: 1149, loss: 0.30021747946739197, mean loss: 0.35209390991650763
Epoch: 22, step: 1150, loss: 0.3656609058380127, mean loss: 0.35209432204919455
Epoch: 22, step: 1151, loss: 0.31613266468048096, mean loss: 0.3520932296537702
Epoch: 22, step: 1152, loss: 0.30739203095436096, mean loss: 0.3520918718214231
Epoch: 22, step: 1153, loss: 0.3147558271884918, mean loss: 0.3520907377455883
Epoch: 22, step: 1154, loss: 0.3557423949241638, mean loss: 0.3520908486606683
Epoch: 22, step: 1155, loss: 0.34031346440315247, mean loss: 0.3520904909464095
Epoch: 22, step: 1156, loss: 0.3073038160800934, mean loss: 0.35208913068293596
Epoch: 22, step: 1157, loss: 0.3368316888809204, mean loss: 0.3520886672971071
Epoch: 22, step: 1158, loss: 0.3260502517223358, mean loss: 0.3520878765048826
Epoch: 22, step: 1159, loss: 0.33518052101135254, mean loss: 0.3520873630404908
Epoch: 22, step: 1160, loss: 0.312393456697464, mean loss: 0.35208615760132345
Epoch: 22, step: 1161, loss: 0.38692981004714966, mean loss: 0.35208721571406093
Epoch: 22, step: 1162, loss: 0.34263551235198975, mean loss: 0.35208692869868446
Epoch: 22, step: 1163, loss: 0.3357981741428375, mean loss: 0.35208643408084905
Epoch: 22, step: 1164, loss: 0.3800014853477478, mean loss: 0.3520872817124425
Epoch: 22, step: 1165, loss: 0.3354765772819519, mean loss: 0.352086777349036
Epoch: 22, step: 1166, loss: 0.33554181456565857, mean loss: 0.3520862749970462
Epoch: 22, step: 1167, loss: 0.3399995267391205, mean loss: 0.3520859080202349
Epoch: 22, step: 1168, loss: 0.3617895543575287, mean loss: 0.3520862026325656
Epoch: 22, step: 1169, loss: 0.33177608251571655, mean loss: 0.35208558601588835
Epoch: 22, step: 1170, loss: 0.3095647394657135, mean loss: 0.3520842951191838
Epoch: 22, step: 1171, loss: 0.3367742896080017, mean loss: 0.3520838303345599
Epoch: 22, step: 1172, loss: 0.3324364125728607, mean loss: 0.35208323389189694
Epoch: 22, step: 1173, loss: 0.36936500668525696, mean loss: 0.3520837585040272
Epoch: 22, step: 1174, loss: 0.3425535559654236, mean loss: 0.35208346921032174
Epoch: 22, step: 1175, loss: 0.3446195721626282, mean loss: 0.3520832426471525
Epoch: 22, step: 1176, loss: 0.3207481801509857, mean loss: 0.3520822915145832
Epoch: 22, step: 1177, loss: 0.31669679284095764, mean loss: 0.35208121746921583
Epoch: 22, step: 1178, loss: 0.34449461102485657, mean loss: 0.35208098720222814
Epoch: 22, step: 1179, loss: 0.30389806628227234, mean loss: 0.35207952480933874
Epoch: 22, step: 1180, loss: 0.33557194471359253, mean loss: 0.35207902380536
Epoch: 22, step: 1181, loss: 0.33905932307243347, mean loss: 0.3520786286702846
Epoch: 22, step: 1182, loss: 0.3578616976737976, mean loss: 0.3520788041753984
Epoch: 22, step: 1183, loss: 0.32377976179122925, mean loss: 0.3520779453795018
Epoch: 22, step: 1184, loss: 0.33679285645484924, mean loss: 0.352077481534361
Epoch: 22, step: 1185, loss: 0.3601723313331604, mean loss: 0.35207772717524827
Epoch: 22, step: 1186, loss: 0.30548912286758423, mean loss: 0.3520763134715824
Epoch: 22, step: 1187, loss: 0.35684290528297424, mean loss: 0.3520764581066052
Epoch: 22, step: 1188, loss: 0.3134912848472595, mean loss: 0.3520752873333777
Epoch: 22, step: 1189, loss: 0.34273895621299744, mean loss: 0.35207500405371506
Epoch: 22, step: 1190, loss: 0.3133537471294403, mean loss: 0.3520738292226545
Epoch: 22, step: 1191, loss: 0.30853521823883057, mean loss: 0.35207250826965136
Epoch: 22, step: 1192, loss: 0.3094564974308014, mean loss: 0.3520712153473845
Epoch: 22, step: 1193, loss: 0.3611397445201874, mean loss: 0.3520714904681045
Epoch: 22, step: 1194, loss: 0.30411702394485474, mean loss: 0.35207003567131645
Epoch: 22, step: 1195, loss: 0.32906487584114075, mean loss: 0.3520693377839293
Epoch: 22, step: 1196, loss: 0.3626788258552551, mean loss: 0.3520696596249143
Epoch: 22, step: 1197, loss: 0.3595021367073059, mean loss: 0.3520698850837835
Epoch: 22, step: 1198, loss: 0.3170051574707031, mean loss: 0.35206882145264895
Epoch: 22, step: 1199, loss: 0.29937899112701416, mean loss: 0.35206722324134326
Epoch: 22, step: 1200, loss: 0.3166654706001282, mean loss: 0.35206614945224923
Epoch: 22, step: 1201, loss: 0.33402350544929504, mean loss: 0.35206560220796645
Epoch: 22, step: 1202, loss: 0.3585173487663269, mean loss: 0.3520657978873986
Epoch: 22, step: 1203, loss: 0.30126020312309265, mean loss: 0.35206425701651534
Epoch: 22, step: 1204, loss: 0.33287790417671204, mean loss: 0.3520636751357996
Epoch: 22, step: 1205, loss: 0.35672199726104736, mean loss: 0.3520638164083818
Epoch: 22, step: 1206, loss: 0.32695451378822327, mean loss: 0.35206305494355633
Epoch: 22, step: 1207, loss: 0.33153030276298523, mean loss: 0.352062432286103
Epoch: 22, step: 1208, loss: 0.3078332245349884, mean loss: 0.3520610910722949
Epoch: 22, step: 1209, loss: 0.34151580929756165, mean loss: 0.3520607713051236
Epoch: 22, step: 1210, loss: 0.34305083751678467, mean loss: 0.3520604981029711
Epoch: 22, step: 1211, loss: 0.30639228224754333, mean loss: 0.3520591133784151
Epoch: 22, step: 1212, loss: 0.32962605357170105, mean loss: 0.35205843319710445
Epoch: 22, step: 1213, loss: 0.32080739736557007, mean loss: 0.3520574856791907
Epoch: 22, step: 1214, loss: 0.32006555795669556, mean loss: 0.35205651572716323
Epoch: 22, step: 1215, loss: 0.3342057764530182, mean loss: 0.35205597453327303
Epoch: 22, step: 1216, loss: 0.3225950002670288, mean loss: 0.352055081370494
Epoch: 22, step: 1217, loss: 0.3165130913257599, mean loss: 0.35205400388337693
Epoch: 22, step: 1218, loss: 0.3440427780151367, mean loss: 0.3520537610232845
Epoch: 22, step: 1219, loss: 0.3425338566303253, mean loss: 0.3520534724363925
Epoch: 22, step: 1220, loss: 0.3107364773750305, mean loss: 0.3520522199887566
Epoch: 22, step: 1221, loss: 0.3248175084590912, mean loss: 0.35205139444430283
Epoch: 22, step: 1222, loss: 0.34986963868141174, mean loss: 0.3520513283124559
Epoch: 22, step: 1223, loss: 0.3014664351940155, mean loss: 0.35204979506521056
Epoch: 22, step: 1224, loss: 0.35636085271835327, mean loss: 0.35204992573103827
Epoch: 22, step: 1225, loss: 0.3362431526184082, mean loss: 0.3520494466508082
Epoch: 22, step: 1226, loss: 0.3203926384449005, mean loss: 0.35204848720821974
Epoch: 22, step: 1227, loss: 0.33747512102127075, mean loss: 0.3520480455375267
Epoch: 22, step: 1228, loss: 0.31192073225975037, mean loss: 0.35204682944778287
Epoch: 22, step: 1229, loss: 0.3249357342720032, mean loss: 0.3520460078496504
Epoch: 22, step: 1230, loss: 0.28422781825065613, mean loss: 0.35204395269071836
Epoch: 22, step: 1231, loss: 0.3079211711883545, mean loss: 0.35204261563673345
Epoch: 22, step: 1232, loss: 0.29594916105270386, mean loss: 0.352040915886587
Epoch: 22, step: 1233, loss: 0.3267943859100342, mean loss: 0.3520401508865877
Epoch: 22, step: 1234, loss: 0.3571033477783203, mean loss: 0.3520403043028496
Epoch: 22, step: 1235, loss: 0.34747418761253357, mean loss: 0.3520401659524469
Epoch: 22, step: 1236, loss: 0.37343549728393555, mean loss: 0.35204081419760164
Epoch: 22, step: 1237, loss: 0.31519901752471924, mean loss: 0.35203969798246887
Epoch: 22, step: 1238, loss: 0.3092730939388275, mean loss: 0.3520384022996124
Epoch: 22, step: 1239, loss: 0.32778340578079224, mean loss: 0.35203766747785653
Epoch: 22, step: 1240, loss: 0.30901727080345154, mean loss: 0.35203636418491596
Epoch: 22, step: 1241, loss: 0.32674291729927063, mean loss: 0.35203559794902123
Epoch: 22, step: 1242, loss: 0.3203342854976654, mean loss: 0.35203463762329795
Epoch: 22, step: 1243, loss: 0.3499881625175476, mean loss: 0.3520345756314433
Epoch: 22, step: 1244, loss: 0.3876127004623413, mean loss: 0.3520356533318895
Epoch: 22, step: 1245, loss: 0.3732532262802124, mean loss: 0.3520362960159917
Epoch: 22, step: 1246, loss: 0.30984991788864136, mean loss: 0.3520350182217125
Epoch: 22, step: 1247, loss: 0.3344818651676178, mean loss: 0.3520344865657562
Epoch: 22, step: 1248, loss: 0.3197522759437561, mean loss: 0.35203350882063633
Epoch: 22, step: 1249, loss: 0.3488941490650177, mean loss: 0.3520334137403845
Epoch: 22, step: 1250, loss: 0.3344673216342926, mean loss: 0.35203288174086583
Epoch: 22, step: 1251, loss: 0.3219442665576935, mean loss: 0.3520319705169051
Epoch: 22, step: 1252, loss: 0.3453717827796936, mean loss: 0.352031768821386
Epoch: 22, step: 1253, loss: 0.35479098558425903, mean loss: 0.35203185237831053
Epoch: 22, step: 1254, loss: 0.30263766646385193, mean loss: 0.3520303566272911
Epoch: 22, step: 1255, loss: 0.3576454520225525, mean loss: 0.3520305266580383
Epoch: 22, step: 1256, loss: 0.35490232706069946, mean loss: 0.35203061361641536
Epoch: 22, step: 1257, loss: 0.3227752149105072, mean loss: 0.35202972778710795
Epoch: 22, step: 1258, loss: 0.31772109866142273, mean loss: 0.35202868898161166
Epoch: 22, step: 1259, loss: 0.33441904187202454, mean loss: 0.35202815580833113
Epoch: 22, step: 1260, loss: 0.2996596395969391, mean loss: 0.35202657027694323
Epoch: 22, step: 1261, loss: 0.3214253783226013, mean loss: 0.3520256438103385
Epoch: 22, step: 1262, loss: 0.358948290348053, mean loss: 0.35202585339062786
Epoch: 22, step: 1263, loss: 0.3144451379776001, mean loss: 0.35202471568430027
Epoch: 22, step: 1264, loss: 0.3291197121143341, mean loss: 0.3520240222866806
Epoch: 22, step: 1265, loss: 0.34775832295417786, mean loss: 0.3520238931561081
Epoch: 22, step: 1266, loss: 0.31513267755508423, mean loss: 0.3520227764248957
Epoch: 22, step: 1267, loss: 0.3109903335571289, mean loss: 0.35202153437250233
Epoch: 22, step: 1268, loss: 0.3224532902240753, mean loss: 0.3520206393685931
Epoch: 22, step: 1269, loss: 0.35644733905792236, mean loss: 0.3520207733567186
Epoch: 22, step: 1270, loss: 0.38111674785614014, mean loss: 0.35202165401214097
Epoch: 22, step: 1271, loss: 0.3320758044719696, mean loss: 0.3520210503242009
Epoch: 22, step: 1272, loss: 0.3333325982093811, mean loss: 0.3520204847102027
Epoch: 22, step: 1273, loss: 0.2913493514060974, mean loss: 0.3520186485279709
Epoch: 22, step: 1274, loss: 0.3485824763774872, mean loss: 0.3520185445370454
Epoch: 22, step: 1275, loss: 0.3361150920391083, mean loss: 0.35201806325595053
Epoch: 22, step: 1276, loss: 0.3299027681350708, mean loss: 0.352017394008103
Epoch: 22, step: 1277, loss: 0.3234005868434906, mean loss: 0.35201652803923644
Epoch: 22, step: 1278, loss: 0.3472681939601898, mean loss: 0.3520163843549662
Epoch: 22, step: 1279, loss: 0.3121778070926666, mean loss: 0.3520151788787721
Epoch: 22, step: 1280, loss: 0.35843417048454285, mean loss: 0.3520153731052723
Epoch: 22, step: 1281, loss: 0.3264538049697876, mean loss: 0.3520145996841487
Epoch: 22, step: 1282, loss: 0.37119990587234497, mean loss: 0.3520151801599645
Epoch: 22, step: 1283, loss: 0.35670673847198486, mean loss: 0.3520153221047277
Epoch: 22, step: 1284, loss: 0.34310251474380493, mean loss: 0.35201505245273357
Epoch: 22, step: 1285, loss: 0.32248547673225403, mean loss: 0.35201415907899
Epoch: 22, step: 1286, loss: 0.3096807599067688, mean loss: 0.352012878383205
Epoch: 22, step: 1287, loss: 0.33594217896461487, mean loss: 0.3520123922173223
Epoch: 22, step: 1288, loss: 0.35817739367485046, mean loss: 0.3520125787134186
Epoch: 22, step: 1289, loss: 0.3184286952018738, mean loss: 0.352011562805514
Epoch: 22, step: 1290, loss: 0.32521799206733704, mean loss: 0.35201075232816326
Epoch: 22, step: 1291, loss: 0.3030855059623718, mean loss: 0.3520092724356537
Epoch: 22, step: 1292, loss: 0.3321813941001892, mean loss: 0.35200867269945896
Epoch: 22, step: 1293, loss: 0.32000094652175903, mean loss: 0.3520077045872402
Epoch: 22, step: 1294, loss: 0.32931214570999146, mean loss: 0.3520070181534962
Epoch: 22, step: 1295, loss: 0.3010580837726593, mean loss: 0.35200547723484205
Epoch: 22, step: 1296, loss: 0.3292580246925354, mean loss: 0.35200478927317436
Epoch: 22, step: 1297, loss: 0.31105828285217285, mean loss: 0.35200355094660263
Epoch: 22, step: 1298, loss: 0.3407556116580963, mean loss: 0.35200321079057734
Epoch: 22, step: 1299, loss: 0.3452451825141907, mean loss: 0.35200300642296284
Epoch: 22, step: 1300, loss: 0.3644143044948578, mean loss: 0.3520033817381545
Epoch: 22, step: 1301, loss: 0.33292728662490845, mean loss: 0.35200280489826596
Epoch: 22, step: 1302, loss: 0.34956902265548706, mean loss: 0.3520027313056246
Epoch: 22, step: 1303, loss: 0.3377891778945923, mean loss: 0.35200230152957807
Epoch: 22, step: 1304, loss: 0.3109424114227295, mean loss: 0.3520010600368164
Epoch: 22, step: 1305, loss: 0.3420599400997162, mean loss: 0.3520007594647678
Epoch: 22, step: 1306, loss: 0.32618385553359985, mean loss: 0.3519999789083375
Epoch: 22, step: 1307, loss: 0.3480603098869324, mean loss: 0.35199985979874077
Epoch: 22, step: 1308, loss: 0.33044761419296265, mean loss: 0.35199920822073777
Epoch: 22, step: 1309, loss: 0.4069870710372925, mean loss: 0.35200087059037366
Epoch: 22, step: 1310, loss: 0.3182829022407532, mean loss: 0.3519998512739388
Epoch: 22, step: 1311, loss: 0.33410313725471497, mean loss: 0.3519993102608185
Epoch: 22, step: 1312, loss: 0.3243071734905243, mean loss: 0.35199847315986116
Epoch: 22, step: 1313, loss: 0.31402647495269775, mean loss: 0.35199732534539385
Epoch: 22, step: 1314, loss: 0.37595799565315247, mean loss: 0.3519980496046904
Epoch: 22, step: 1315, loss: 0.32146477699279785, mean loss: 0.35199712670320893
Epoch: 22, step: 1316, loss: 0.36105743050575256, mean loss: 0.35199740055250023
Epoch: 22, step: 1317, loss: 0.35156500339508057, mean loss: 0.35199738748361437
Epoch: 22, step: 1318, loss: 0.32599759101867676, mean loss: 0.3519966016826513
Epoch: 22, step: 1319, loss: 0.33657127618789673, mean loss: 0.3519961354917212
Epoch: 22, step: 1320, loss: 0.3369314968585968, mean loss: 0.3519956802153867
Epoch: 22, step: 1321, loss: 0.3794204592704773, mean loss: 0.35199650900895135
Epoch: 22, step: 1322, loss: 0.3148849308490753, mean loss: 0.3519953875082968
Epoch: 22, step: 1323, loss: 0.3346981108188629, mean loss: 0.3519948648056288
Epoch: 22, step: 1324, loss: 0.33803069591522217, mean loss: 0.35199444283817677
Epoch: 22, step: 1325, loss: 0.3184153735637665, mean loss: 0.351993428180859
Epoch: 22, step: 1326, loss: 0.32261088490486145, mean loss: 0.35199254035661737
Epoch: 22, step: 1327, loss: 0.3553561270236969, mean loss: 0.35199264198783164
Epoch: 22, step: 1328, loss: 0.34099432826042175, mean loss: 0.3519923096823741
Epoch: 22, step: 1329, loss: 0.32552072405815125, mean loss: 0.35199150988825895
Epoch: 22, step: 1330, loss: 0.3352242708206177, mean loss: 0.3519910033098406
Epoch: 22, step: 1331, loss: 0.31291648745536804, mean loss: 0.3519898228108722
Epoch: 22, step: 1332, loss: 0.33583176136016846, mean loss: 0.35198933466666354
Epoch: 22, step: 1333, loss: 0.3057760000228882, mean loss: 0.3519879385777673
Epoch: 22, step: 1334, loss: 0.31075963377952576, mean loss: 0.3519866931225276
Epoch: 22, step: 1335, loss: 0.2904694080352783, mean loss: 0.3519848348188457
Epoch: 22, step: 1336, loss: 0.3169393837451935, mean loss: 0.3519837762038004
Epoch: 22, step: 1337, loss: 0.3101744055747986, mean loss: 0.35198251330974406
Epoch: 22, step: 1338, loss: 0.3265921473503113, mean loss: 0.3519817463913896
Epoch: 22, step: 1339, loss: 0.3238905966281891, mean loss: 0.3519808979212385
Epoch: 22, step: 1340, loss: 0.3317854702472687, mean loss: 0.3519802879533242
Epoch: 22, step: 1341, loss: 0.3369014859199524, mean loss: 0.3519798325379804
Epoch: 22, step: 1342, loss: 0.351809024810791, mean loss: 0.3519798273793404
Epoch: 22, step: 1343, loss: 0.3354593515396118, mean loss: 0.35197932845218893
Epoch: 22, step: 1344, loss: 0.3263504207134247, mean loss: 0.3519785544689274
Epoch: 22, step: 1345, loss: 0.3258219063282013, mean loss: 0.3519777645719611
Epoch: 22, step: 1346, loss: 0.3407328724861145, mean loss: 0.3519774250010088
Epoch: 22, step: 1347, loss: 0.3109029531478882, mean loss: 0.35197618467996
Epoch: 22, step: 1348, loss: 0.359084814786911, mean loss: 0.3519763993319547
Epoch: 22, step: 1349, loss: 0.31753063201904297, mean loss: 0.3519753592399409
Epoch: 22, step: 1350, loss: 0.336088627576828, mean loss: 0.3519748795536079
Epoch: 22, step: 1351, loss: 0.34400269389152527, mean loss: 0.35197463884751906
Epoch: 22, step: 1352, loss: 0.3462707996368408, mean loss: 0.35197446663535126
Epoch: 22, step: 1353, loss: 0.3947264850139618, mean loss: 0.3519757573792187
Epoch: 22, step: 1354, loss: 0.30832988023757935, mean loss: 0.35197443968827463
Epoch: 22, step: 1355, loss: 0.32703644037246704, mean loss: 0.3519736868202842
Epoch: 22, step: 1356, loss: 0.35031434893608093, mean loss: 0.35197363672706505
Epoch: 22, step: 1357, loss: 0.31745022535324097, mean loss: 0.3519725945423348
Epoch: 22, step: 1358, loss: 0.29004013538360596, mean loss: 0.3519707249960687
Epoch: 22, step: 1359, loss: 0.33076298236846924, mean loss: 0.35197008482030717
Epoch: 22, step: 1360, loss: 0.3544885516166687, mean loss: 0.3519701608403137
Epoch: 22, step: 1361, loss: 0.35678830742836, mean loss: 0.35197030627184367
Epoch: 22, step: 1362, loss: 0.31353840231895447, mean loss: 0.35196914627353537
Epoch: 22, step: 1363, loss: 0.308432400226593, mean loss: 0.35196783223435735
Epoch: 22, step: 1364, loss: 0.3265560269355774, mean loss: 0.35196706527074706
Epoch: 22, step: 1365, loss: 0.35511934757232666, mean loss: 0.3519671604081377
Epoch: 22, step: 1366, loss: 0.3118436634540558, mean loss: 0.3519659494983156
Epoch: 22, step: 1367, loss: 0.3062078654766083, mean loss: 0.351964568580763
Epoch: 22, step: 1368, loss: 0.3119184374809265, mean loss: 0.3519633600787532
Epoch: 22, step: 1369, loss: 0.33235037326812744, mean loss: 0.3519627682208616
Epoch: 22, step: 1370, loss: 0.347551167011261, mean loss: 0.3519626350967115
Epoch: 22, step: 1371, loss: 0.36573678255081177, mean loss: 0.3519630507318187
Epoch: 22, step: 1372, loss: 0.3087301254272461, mean loss: 0.35196174621700915
Epoch: 22, step: 1373, loss: 0.31689080595970154, mean loss: 0.3519606880147203
Epoch: 22, step: 1374, loss: 0.36672937870025635, mean loss: 0.35196113361984616
Epoch: 22, step: 1375, loss: 0.3393593430519104, mean loss: 0.3519607534065174
Epoch: 22, step: 1376, loss: 0.3318798542022705, mean loss: 0.3519601475564886
Epoch: 22, step: 1377, loss: 0.35788553953170776, mean loss: 0.35196032632291513
Epoch: 22, step: 1378, loss: 0.3402476906776428, mean loss: 0.3519599729685951
Epoch: 22, step: 1379, loss: 0.3277552127838135, mean loss: 0.3519592427658624
Epoch: 22, step: 1380, loss: 0.3271467387676239, mean loss: 0.35195849425145775
Epoch: 22, step: 1381, loss: 0.33608201146125793, mean loss: 0.3519580153228668
Epoch: 22, step: 1382, loss: 0.33157750964164734, mean loss: 0.3519574005448607
Epoch: 22, step: 1383, loss: 0.3300541043281555, mean loss: 0.351956739851804
Epoch: 22, step: 1384, loss: 0.33126339316368103, mean loss: 0.35195611567460466
Epoch: 22, step: 1385, loss: 0.3334670662879944, mean loss: 0.351955558002849
Epoch: 22, step: 1386, loss: 0.3496766686439514, mean loss: 0.3519554892684391
Epoch: 22, step: 1387, loss: 0.2994018793106079, mean loss: 0.35195390422772377
Epoch: 22, step: 1388, loss: 0.3651092052459717, mean loss: 0.3519543009856035
Epoch: 22, step: 1389, loss: 0.30873310565948486, mean loss: 0.35195299749337455
Epoch: 22, step: 1390, loss: 0.3427536189556122, mean loss: 0.35195272006104733
Epoch: 22, step: 1391, loss: 0.34259268641471863, mean loss: 0.35195243779224017
Epoch: 22, step: 1392, loss: 0.3270152807235718, mean loss: 0.35195168578967484
Epoch: 22, step: 1393, loss: 0.3157048225402832, mean loss: 0.3519505927656338
Epoch: 22, step: 1394, loss: 0.34822356700897217, mean loss: 0.3519504803805734
Epoch: 22, step: 1395, loss: 0.4052464962005615, mean loss: 0.35195208742483286
Epoch: 22, step: 1396, loss: 0.33200421929359436, mean loss: 0.35195148595134784
Epoch: 22, step: 1397, loss: 0.3074193298816681, mean loss: 0.3519501432462863
Epoch: 22, step: 1398, loss: 0.3343159258365631, mean loss: 0.3519496115666828
Epoch: 22, step: 1399, loss: 0.33247876167297363, mean loss: 0.35194902452948146
Epoch: 22, step: 1400, loss: 0.33101215958595276, mean loss: 0.35194839331162914
Epoch: 22, step: 1401, loss: 0.313857764005661, mean loss: 0.35194724496585567
Epoch: 22, step: 1402, loss: 0.32051652669906616, mean loss: 0.3519462974298071
Epoch: 22, step: 1403, loss: 0.32329776883125305, mean loss: 0.3519454337939516
Epoch: 22, step: 1404, loss: 0.35456499457359314, mean loss: 0.3519455127606046
Epoch: 22, step: 1405, loss: 0.3077821135520935, mean loss: 0.3519441814951796
Epoch: 22, step: 1406, loss: 0.32102489471435547, mean loss: 0.3519432494895494
Epoch: 22, step: 1407, loss: 0.31434959173202515, mean loss: 0.3519421163313098
Epoch: 22, step: 1408, loss: 0.3713008761405945, mean loss: 0.3519426998307163
Epoch: 22, step: 1409, loss: 0.3903764486312866, mean loss: 0.351943858241374
Epoch: 22, step: 1410, loss: 0.3481893837451935, mean loss: 0.3519437450832168
Epoch: 22, step: 1411, loss: 0.30341511964797974, mean loss: 0.35194228249655507
Epoch: 22, step: 1412, loss: 0.3596390187740326, mean loss: 0.35194251445871044
Epoch: 22, step: 1413, loss: 0.31678473949432373, mean loss: 0.3519414549151337
Epoch: 22, step: 1414, loss: 0.32568421959877014, mean loss: 0.3519406636293754
Epoch: 22, step: 1415, loss: 0.3390180766582489, mean loss: 0.35194027420715474
Epoch: 22, step: 1416, loss: 0.32563966512680054, mean loss: 0.35193948166205663
Epoch: 22, step: 1417, loss: 0.33470940589904785, mean loss: 0.35193896246493245
Epoch: 22, step: 1418, loss: 0.3170504868030548, mean loss: 0.3519379111955902
Epoch: 22, step: 1419, loss: 0.33137694001197815, mean loss: 0.35193729166530263
Epoch: 22, step: 1420, loss: 0.40274369716644287, mean loss: 0.35193882248592095
Epoch: 22, step: 1421, loss: 0.3035174310207367, mean loss: 0.35193736357084215
Epoch: 22, step: 1422, loss: 0.3359927237033844, mean loss: 0.35193688318037886
Epoch: 22, step: 1423, loss: 0.3500388562679291, mean loss: 0.35193682599711446
Epoch: 22, step: 1424, loss: 0.33164140582084656, mean loss: 0.35193621456036045
Epoch: 22, step: 1425, loss: 0.3348630368709564, mean loss: 0.3519357002150664
Epoch: 22, step: 1426, loss: 0.3124881386756897, mean loss: 0.35193451185653235
Epoch: 22, step: 1427, loss: 0.31196317076683044, mean loss: 0.351933307755403
Epoch: 22, step: 1428, loss: 0.3152494430541992, mean loss: 0.35193220271986664
Epoch: 22, step: 1429, loss: 0.3404647409915924, mean loss: 0.35193185729358406
Epoch: 22, step: 1430, loss: 0.3535654544830322, mean loss: 0.3519319064998008
Epoch: 22, step: 1431, loss: 0.3115507960319519, mean loss: 0.3519306902012927
Epoch: 22, step: 1432, loss: 0.4422694742679596, mean loss: 0.35193341116704874
Epoch: 22, step: 1433, loss: 0.29875147342681885, mean loss: 0.35193180939794627
Epoch: 22, step: 1434, loss: 0.3518848121166229, mean loss: 0.3519318079824934
Epoch: 22, step: 1435, loss: 0.3463030755519867, mean loss: 0.351931638462784
Epoch: 22, step: 1436, loss: 0.36741769313812256, mean loss: 0.3519321048399765
Epoch: 22, step: 1437, loss: 0.3075406849384308, mean loss: 0.3519307679906149
Epoch: 22, step: 1438, loss: 0.3170447051525116, mean loss: 0.351929717427094
Epoch: 22, step: 1439, loss: 0.34556806087493896, mean loss: 0.35192952585709425
Epoch: 22, step: 1440, loss: 0.33099275827407837, mean loss: 0.351928895402471
Epoch: 22, step: 1441, loss: 0.3098942041397095, mean loss: 0.3519276296785546
Epoch: 22, step: 1442, loss: 0.2979726791381836, mean loss: 0.35192600506771665
Epoch: 22, step: 1443, loss: 0.32964861392974854, mean loss: 0.35192533430440404
Valid: 22, mean loss: 0.1864597275853157
Epoch: 23, step: 0, loss: 0.32949334383010864, mean loss: 0.3519246589065034
Epoch: 23, step: 1, loss: 0.3454614281654358, mean loss: 0.35192446431293617
Epoch: 23, step: 2, loss: 0.28866878151893616, mean loss: 0.35192255988172155
Epoch: 23, step: 3, loss: 0.3286685645580292, mean loss: 0.35192185979756563
Epoch: 23, step: 4, loss: 0.36361920833587646, mean loss: 0.3519222119470234
Epoch: 23, step: 5, loss: 0.3056274652481079, mean loss: 0.35192081828254335
Epoch: 23, step: 6, loss: 0.3678979277610779, mean loss: 0.3519212992455307
Epoch: 23, step: 7, loss: 0.37631693482398987, mean loss: 0.3519220336114422
Epoch: 23, step: 8, loss: 0.33499929308891296, mean loss: 0.35192152421255224
Epoch: 23, step: 9, loss: 0.337030827999115, mean loss: 0.3519210759946179
Epoch: 23, step: 10, loss: 0.3623471260070801, mean loss: 0.3519213898148633
Epoch: 23, step: 11, loss: 0.3478567600250244, mean loss: 0.3519212674746939
Epoch: 23, step: 12, loss: 0.3595358729362488, mean loss: 0.3519214966577025
Epoch: 23, step: 13, loss: 0.3088964819908142, mean loss: 0.35192020173761984
Epoch: 23, step: 14, loss: 0.3254585564136505, mean loss: 0.35191940534777655
Epoch: 23, step: 15, loss: 0.35020923614501953, mean loss: 0.3519193538800625
Epoch: 23, step: 16, loss: 0.2936439514160156, mean loss: 0.35191760012874695
Epoch: 23, step: 17, loss: 0.37333226203918457, mean loss: 0.3519182445663609
Epoch: 23, step: 18, loss: 0.3241586685180664, mean loss: 0.3519174092145494
Epoch: 23, step: 19, loss: 0.3427194058895111, mean loss: 0.35191713243303385
Epoch: 23, step: 20, loss: 0.2819596230983734, mean loss: 0.35191502737151864
Epoch: 23, step: 21, loss: 0.3521227538585663, mean loss: 0.3519150336219395
Epoch: 23, step: 22, loss: 0.3923076093196869, mean loss: 0.35191624898453006
Epoch: 23, step: 23, loss: 0.3556426167488098, mean loss: 0.35191636110294877
Epoch: 23, step: 24, loss: 0.3409616947174072, mean loss: 0.3519160315104348
Epoch: 23, step: 25, loss: 0.3199754059314728, mean loss: 0.35191507054330146
Epoch: 23, step: 26, loss: 0.3136763870716095, mean loss: 0.35191392012711953
Epoch: 23, step: 27, loss: 0.3617797791957855, mean loss: 0.3519142169339507
Epoch: 23, step: 28, loss: 0.3497553765773773, mean loss: 0.35191415198884207
Epoch: 23, step: 29, loss: 0.3342863619327545, mean loss: 0.35191362170215484
Epoch: 23, step: 30, loss: 0.33726006746292114, mean loss: 0.3519131809009564
Epoch: 23, step: 31, loss: 0.3120873272418976, mean loss: 0.35191198291474357
Epoch: 23, step: 32, loss: 0.330169141292572, mean loss: 0.35191132889634613
Epoch: 23, step: 33, loss: 0.32226258516311646, mean loss: 0.35191043709752123
Epoch: 23, step: 34, loss: 0.3736153841018677, mean loss: 0.35191108993678505
Epoch: 23, step: 35, loss: 0.3242286443710327, mean loss: 0.3519102573319497
Epoch: 23, step: 36, loss: 0.33221715688705444, mean loss: 0.3519096650404388
Epoch: 23, step: 37, loss: 0.35625991225242615, mean loss: 0.3519097958749414
Epoch: 23, step: 38, loss: 0.37308698892593384, mean loss: 0.35191043276384854
Epoch: 23, step: 39, loss: 0.355724573135376, mean loss: 0.35191054746793765
Epoch: 23, step: 40, loss: 0.3443754017353058, mean loss: 0.3519103208674585
Epoch: 23, step: 41, loss: 0.2916202247142792, mean loss: 0.3519085078495914
Epoch: 23, step: 42, loss: 0.31044241786003113, mean loss: 0.35190726093664626
Epoch: 23, step: 43, loss: 0.30897119641304016, mean loss: 0.35190596985941136
Epoch: 23, step: 44, loss: 0.3475564420223236, mean loss: 0.35190583907407785
Epoch: 23, step: 45, loss: 0.3986399471759796, mean loss: 0.35190724427307063
Epoch: 23, step: 46, loss: 0.33702346682548523, mean loss: 0.35190679676179704
Epoch: 23, step: 47, loss: 0.32563477754592896, mean loss: 0.3519060068634442
Epoch: 23, step: 48, loss: 0.3493250906467438, mean loss: 0.35190592926757464
Epoch: 23, step: 49, loss: 0.32323020696640015, mean loss: 0.3519050671509761
Epoch: 23, step: 50, loss: 0.32749247550964355, mean loss: 0.35190433322464226
Epoch: 23, step: 51, loss: 0.3036332130432129, mean loss: 0.35190288207264064
Epoch: 23, step: 52, loss: 0.3308284878730774, mean loss: 0.351902248542077
Epoch: 23, step: 53, loss: 0.3408002257347107, mean loss: 0.3519019148072485
Epoch: 23, step: 54, loss: 0.36787548661231995, mean loss: 0.35190239496992637
Epoch: 23, step: 55, loss: 0.32920709252357483, mean loss: 0.3519017127737485
Epoch: 23, step: 56, loss: 0.3540647327899933, mean loss: 0.35190177778983
Epoch: 23, step: 57, loss: 0.32624876499176025, mean loss: 0.3519010067344408
Epoch: 23, step: 58, loss: 0.33876627683639526, mean loss: 0.351900611954305
Epoch: 23, step: 59, loss: 0.3315196931362152, mean loss: 0.3518999993996399
Epoch: 23, step: 60, loss: 0.3179222047328949, mean loss: 0.35189897821746013
Epoch: 23, step: 61, loss: 0.3213227391242981, mean loss: 0.35189805929460466
Epoch: 23, step: 62, loss: 0.3123044967651367, mean loss: 0.3518968694054227
Epoch: 23, step: 63, loss: 0.3608783781528473, mean loss: 0.3518971393149295
Epoch: 23, step: 64, loss: 0.3238339424133301, mean loss: 0.3518962959938098
Epoch: 23, step: 65, loss: 0.3036080300807953, mean loss: 0.35189484493707823
Epoch: 23, step: 66, loss: 0.3703722357749939, mean loss: 0.351895400163823
Epoch: 23, step: 67, loss: 0.38487911224365234, mean loss: 0.35189639126094074
Epoch: 23, step: 68, loss: 0.3876831829547882, mean loss: 0.35189746655289994
Epoch: 23, step: 69, loss: 0.2978760600090027, mean loss: 0.3518958434110652
Epoch: 23, step: 70, loss: 0.3947506844997406, mean loss: 0.351897131000558
Epoch: 23, step: 71, loss: 0.3572766184806824, mean loss: 0.3518972926243857
Epoch: 23, step: 72, loss: 0.314637154340744, mean loss: 0.35189617319706756
Epoch: 23, step: 73, loss: 0.35629910230636597, mean loss: 0.35189630547277234
Epoch: 23, step: 74, loss: 0.35445737838745117, mean loss: 0.3518963824119052
Epoch: 23, step: 75, loss: 0.30122047662734985, mean loss: 0.35189486006433895
Epoch: 23, step: 76, loss: 0.35812103748321533, mean loss: 0.35189504709841685
Epoch: 23, step: 77, loss: 0.34585294127464294, mean loss: 0.3518948655992933
Epoch: 23, step: 78, loss: 0.2950664162635803, mean loss: 0.35189315857789605
Epoch: 23, step: 79, loss: 0.3076689839363098, mean loss: 0.351891830205475
Epoch: 23, step: 80, loss: 0.37406861782073975, mean loss: 0.35189249631509606
Epoch: 23, step: 81, loss: 0.3539915382862091, mean loss: 0.3518925593607491
Epoch: 23, step: 82, loss: 0.3507297933101654, mean loss: 0.35189252443760594
Epoch: 23, step: 83, loss: 0.30715084075927734, mean loss: 0.3518911806820894
Epoch: 23, step: 84, loss: 0.3516222834587097, mean loss: 0.35189117260637015
Epoch: 23, step: 85, loss: 0.3126218616962433, mean loss: 0.35188999327695364
Epoch: 23, step: 86, loss: 0.3291172683238983, mean loss: 0.3518893093908023
Epoch: 23, step: 87, loss: 0.33552980422973633, mean loss: 0.35188881811437106
Epoch: 23, step: 88, loss: 0.33313828706741333, mean loss: 0.3518882550522694
Epoch: 23, step: 89, loss: 0.34090811014175415, mean loss: 0.3518879253379907
Epoch: 23, step: 90, loss: 0.3266485035419464, mean loss: 0.351887167465673
Epoch: 23, step: 91, loss: 0.3474017083644867, mean loss: 0.35188703278337957
Epoch: 23, step: 92, loss: 0.3642804026603699, mean loss: 0.3518874049007757
Epoch: 23, step: 93, loss: 0.34163638949394226, mean loss: 0.35188709711793154
Epoch: 23, step: 94, loss: 0.30965498089790344, mean loss: 0.35188582915275246
Epoch: 23, step: 95, loss: 0.3411605954170227, mean loss: 0.3518855071510191
Epoch: 23, step: 96, loss: 0.3352576494216919, mean loss: 0.3518850079508711
Epoch: 23, step: 97, loss: 0.3308514356613159, mean loss: 0.35188437650168797
Epoch: 23, step: 98, loss: 0.34497687220573425, mean loss: 0.35188416913762516
Epoch: 23, step: 99, loss: 0.30656611919403076, mean loss: 0.35188280872546307
Epoch: 23, step: 100, loss: 0.32523950934410095, mean loss: 0.35188200893861166
Epoch: 23, step: 101, loss: 0.3495761454105377, mean loss: 0.3518819397225605
Epoch: 23, step: 102, loss: 0.29058822989463806, mean loss: 0.3518800998993629
Epoch: 23, step: 103, loss: 0.3161337673664093, mean loss: 0.351879026951454
Epoch: 23, step: 104, loss: 0.30965015292167664, mean loss: 0.35187775946416433
Epoch: 23, step: 105, loss: 0.35110101103782654, mean loss: 0.3518777361509875
Epoch: 23, step: 106, loss: 0.3041154742240906, mean loss: 0.3518763026667315
Epoch: 23, step: 107, loss: 0.38675186038017273, mean loss: 0.35187734935213705
Epoch: 23, step: 108, loss: 0.32236576080322266, mean loss: 0.3518764636767807
Epoch: 23, step: 109, loss: 0.3014383614063263, mean loss: 0.351874950019069
Epoch: 23, step: 110, loss: 0.3012234568595886, mean loss: 0.35187343000306925
Epoch: 23, step: 111, loss: 0.34630298614501953, mean loss: 0.3518732628429487
Epoch: 23, step: 112, loss: 0.32825514674186707, mean loss: 0.35187255412228546
Epoch: 23, step: 113, loss: 0.36119696497917175, mean loss: 0.3518728339161658
Epoch: 23, step: 114, loss: 0.32595929503440857, mean loss: 0.3518720563622641
Epoch: 23, step: 115, loss: 0.4422960579395294, mean loss: 0.35187476951641605
Epoch: 23, step: 116, loss: 0.32276007533073425, mean loss: 0.3518738959620284
Epoch: 23, step: 117, loss: 0.3750588595867157, mean loss: 0.351874591580499
Epoch: 23, step: 118, loss: 0.3309694230556488, mean loss: 0.35187396438153934
Epoch: 23, step: 119, loss: 0.3889479637145996, mean loss: 0.3518750766460099
Epoch: 23, step: 120, loss: 0.32319292426109314, mean loss: 0.35187421617283365
Epoch: 23, step: 121, loss: 0.3289671540260315, mean loss: 0.3518735289747132
Epoch: 23, step: 122, loss: 0.33376848697662354, mean loss: 0.35187298585060944
Epoch: 23, step: 123, loss: 0.31895536184310913, mean loss: 0.3518719984008852
Epoch: 23, step: 124, loss: 0.3181518018245697, mean loss: 0.3518709869062523
Epoch: 23, step: 125, loss: 0.28912922739982605, mean loss: 0.3518691049169456
Epoch: 23, step: 126, loss: 0.3828813135623932, mean loss: 0.3518700351250696
Epoch: 23, step: 127, loss: 0.3181743919849396, mean loss: 0.3518690244579088
Epoch: 23, step: 128, loss: 0.3165512979030609, mean loss: 0.35186796516974844
Epoch: 23, step: 129, loss: 0.33843398094177246, mean loss: 0.35186756225497945
Epoch: 23, step: 130, loss: 0.3289974331855774, mean loss: 0.3518668763500198
Epoch: 23, step: 131, loss: 0.32843706011772156, mean loss: 0.3518661736803871
Epoch: 23, step: 132, loss: 0.34648823738098145, mean loss: 0.35186601239874665
Epoch: 23, step: 133, loss: 0.31656613945961, mean loss: 0.3518649538048242
Epoch: 23, step: 134, loss: 0.3192434310913086, mean loss: 0.3518639755602231
Epoch: 23, step: 135, loss: 0.30481961369514465, mean loss: 0.3518625648500796
Epoch: 23, step: 136, loss: 0.29403626918792725, mean loss: 0.3518608308761775
Epoch: 23, step: 137, loss: 0.3476315140724182, mean loss: 0.3518607040600814
Epoch: 23, step: 138, loss: 0.3180360794067383, mean loss: 0.35185968985886845
Epoch: 23, step: 139, loss: 0.38067781925201416, mean loss: 0.35186055391887666
Epoch: 23, step: 140, loss: 0.3237258195877075, mean loss: 0.3518597103745379
Epoch: 23, step: 141, loss: 0.3384909927845001, mean loss: 0.3518593095615143
Epoch: 23, step: 142, loss: 0.3434126079082489, mean loss: 0.35185905632506836
Epoch: 23, step: 143, loss: 0.344143271446228, mean loss: 0.35185882500881704
Epoch: 23, step: 144, loss: 0.33190345764160156, mean loss: 0.3518582267725438
Epoch: 23, step: 145, loss: 0.37448668479919434, mean loss: 0.3518589051243043
Epoch: 23, step: 146, loss: 0.3278656303882599, mean loss: 0.35185818587988044
Epoch: 23, step: 147, loss: 0.30674636363983154, mean loss: 0.3518568336070315
Epoch: 23, step: 148, loss: 0.3670591413974762, mean loss: 0.35185728929804166
Epoch: 23, step: 149, loss: 0.2980099022388458, mean loss: 0.35185567526449874
Epoch: 23, step: 150, loss: 0.3363191783428192, mean loss: 0.3518552095840467
Epoch: 23, step: 151, loss: 0.3331778347492218, mean loss: 0.3518546497778234
Epoch: 23, step: 152, loss: 0.35415148735046387, mean loss: 0.3518547186175528
Epoch: 23, step: 153, loss: 0.3194728195667267, mean loss: 0.351853748111677
Epoch: 23, step: 154, loss: 0.30623573064804077, mean loss: 0.3518523809519844
Epoch: 23, step: 155, loss: 0.2989824414253235, mean loss: 0.351850796501627
Epoch: 23, step: 156, loss: 0.39769598841667175, mean loss: 0.35185217038732675
Epoch: 23, step: 157, loss: 0.31004616618156433, mean loss: 0.3518509175852828
Epoch: 23, step: 158, loss: 0.31621992588043213, mean loss: 0.3518498498620589
Epoch: 23, step: 159, loss: 0.3233172297477722, mean loss: 0.3518489948752402
Epoch: 23, step: 160, loss: 0.32574307918548584, mean loss: 0.35184821262864296
Epoch: 23, step: 161, loss: 0.34831732511520386, mean loss: 0.3518481068310906
Epoch: 23, step: 162, loss: 0.35555315017700195, mean loss: 0.3518482178436253
Epoch: 23, step: 163, loss: 0.3277609050273895, mean loss: 0.3518474961480112
Epoch: 23, step: 164, loss: 0.30593445897102356, mean loss: 0.3518461205589176
Epoch: 23, step: 165, loss: 0.301866352558136, mean loss: 0.3518446231723756
Epoch: 23, step: 166, loss: 0.32410773634910583, mean loss: 0.3518437922041973
Epoch: 23, step: 167, loss: 0.3142106235027313, mean loss: 0.35184266478751963
Epoch: 23, step: 168, loss: 0.32611939311027527, mean loss: 0.3518418941913219
Epoch: 23, step: 169, loss: 0.3033612370491028, mean loss: 0.3518404418919647
Epoch: 23, step: 170, loss: 0.36128467321395874, mean loss: 0.35184072479737527
Epoch: 23, step: 171, loss: 0.2914479970932007, mean loss: 0.35183891576527293
Epoch: 23, step: 172, loss: 0.3207184374332428, mean loss: 0.35183798359578566
Epoch: 23, step: 173, loss: 0.308979332447052, mean loss: 0.3518366998645466
Epoch: 23, step: 174, loss: 0.35338300466537476, mean loss: 0.35183674617912414
Epoch: 23, step: 175, loss: 0.3316943645477295, mean loss: 0.3518361428970578
Epoch: 23, step: 176, loss: 0.316691130399704, mean loss: 0.35183509030451243
Epoch: 23, step: 177, loss: 0.3550197184085846, mean loss: 0.35183518568121513
Epoch: 23, step: 178, loss: 0.3194037675857544, mean loss: 0.35183421441895596
Epoch: 23, step: 179, loss: 0.4070918560028076, mean loss: 0.35183586923572596
Epoch: 23, step: 180, loss: 0.33867591619491577, mean loss: 0.3518354751425615
Epoch: 23, step: 181, loss: 0.31749430298805237, mean loss: 0.35183444677901854
Epoch: 23, step: 182, loss: 0.29866549372673035, mean loss: 0.35183285465585484
Epoch: 23, step: 183, loss: 0.33184584975242615, mean loss: 0.35183225617085956
Epoch: 23, step: 184, loss: 0.32902732491493225, mean loss: 0.35183157332715337
Epoch: 23, step: 185, loss: 0.32962676882743835, mean loss: 0.35183090847283577
Epoch: 23, step: 186, loss: 0.3470555543899536, mean loss: 0.3518307654938818
Epoch: 23, step: 187, loss: 0.33970990777015686, mean loss: 0.35183040259395
Epoch: 23, step: 188, loss: 0.3418079614639282, mean loss: 0.3518301025298462
Epoch: 23, step: 189, loss: 0.332450270652771, mean loss: 0.35182952233010134
Epoch: 23, step: 190, loss: 0.2916533052921295, mean loss: 0.3518277208087698
Epoch: 23, step: 191, loss: 0.3327018618583679, mean loss: 0.3518271482468326
Epoch: 23, step: 192, loss: 0.3625833988189697, mean loss: 0.35182747024206
Epoch: 23, step: 193, loss: 0.3425554037094116, mean loss: 0.3518271926851381
Epoch: 23, step: 194, loss: 0.3647308051586151, mean loss: 0.3518275789398893
Epoch: 23, step: 195, loss: 0.3050497770309448, mean loss: 0.3518261787422747
Epoch: 23, step: 196, loss: 0.2925798296928406, mean loss: 0.3518244053773416
Epoch: 23, step: 197, loss: 0.33824342489242554, mean loss: 0.35182399888286436
Epoch: 23, step: 198, loss: 0.3300073444843292, mean loss: 0.35182334590467157
Epoch: 23, step: 199, loss: 0.32479143142700195, mean loss: 0.3518225368565907
Epoch: 23, step: 200, loss: 0.3510031998157501, mean loss: 0.3518225123350859
Epoch: 23, step: 201, loss: 0.2983629107475281, mean loss: 0.35182091241883556
Epoch: 23, step: 202, loss: 0.3538907468318939, mean loss: 0.35182097436210696
Epoch: 23, step: 203, loss: 0.34437307715415955, mean loss: 0.35182075147794345
Epoch: 23, step: 204, loss: 0.33365345001220703, mean loss: 0.3518202078234722
Epoch: 23, step: 205, loss: 0.3502276539802551, mean loss: 0.351820160167902
Epoch: 23, step: 206, loss: 0.325995534658432, mean loss: 0.35181938741511143
Epoch: 23, step: 207, loss: 0.31118303537368774, mean loss: 0.35181817148596595
Epoch: 23, step: 208, loss: 0.3265917897224426, mean loss: 0.35181741667965366
Epoch: 23, step: 209, loss: 0.3524188995361328, mean loss: 0.35181743467626836
Epoch: 23, step: 210, loss: 0.34679076075553894, mean loss: 0.35181728428061504
Epoch: 23, step: 211, loss: 0.3180180788040161, mean loss: 0.3518162730549845
Epoch: 23, step: 212, loss: 0.3935251832008362, mean loss: 0.35181752089074053
Epoch: 23, step: 213, loss: 0.3529258966445923, mean loss: 0.3518175540498309
Epoch: 23, step: 214, loss: 0.3102301061153412, mean loss: 0.351816309922391
Epoch: 23, step: 215, loss: 0.3228553831577301, mean loss: 0.3518154435550712
Epoch: 23, step: 216, loss: 0.30554336309432983, mean loss: 0.3518140593652821
Epoch: 23, step: 217, loss: 0.3458596169948578, mean loss: 0.3518138812485495
Epoch: 23, step: 218, loss: 0.35089293122291565, mean loss: 0.35181385370076373
Epoch: 23, step: 219, loss: 0.3279626667499542, mean loss: 0.35181314027688987
Epoch: 23, step: 220, loss: 0.31851938366889954, mean loss: 0.35181214444173875
Epoch: 23, step: 221, loss: 0.3254399299621582, mean loss: 0.351811355657433
Epoch: 23, step: 222, loss: 0.3319266736507416, mean loss: 0.35181076093088876
Epoch: 23, step: 223, loss: 0.32829684019088745, mean loss: 0.35181005767928153
Epoch: 23, step: 224, loss: 0.2923066318035126, mean loss: 0.3518082781109627
Epoch: 23, step: 225, loss: 0.2996341586112976, mean loss: 0.3518067177867956
Epoch: 23, step: 226, loss: 0.35202768445014954, mean loss: 0.351806724394848
Epoch: 23, step: 227, loss: 0.3437495529651642, mean loss: 0.3518064834507263
Epoch: 23, step: 228, loss: 0.3407997488975525, mean loss: 0.3518061543118084
Epoch: 23, step: 229, loss: 0.3265988826751709, mean loss: 0.3518054005509198
Epoch: 23, step: 230, loss: 0.34084537625312805, mean loss: 0.35180507282839796
Epoch: 23, step: 231, loss: 0.33549508452415466, mean loss: 0.35180458514784824
Epoch: 23, step: 232, loss: 0.3556126356124878, mean loss: 0.3518046990079309
Epoch: 23, step: 233, loss: 0.3054366707801819, mean loss: 0.35180331265296383
Epoch: 23, step: 234, loss: 0.3126831650733948, mean loss: 0.35180214303692714
Epoch: 23, step: 235, loss: 0.3422092795372009, mean loss: 0.3518018562376118
Epoch: 23, step: 236, loss: 0.3226141631603241, mean loss: 0.3518009836347514
Epoch: 23, step: 237, loss: 0.3225618898868561, mean loss: 0.3518001095213359
Epoch: 23, step: 238, loss: 0.32911860942840576, mean loss: 0.3517994314698548
Epoch: 23, step: 239, loss: 0.36897575855255127, mean loss: 0.351799944931743
Epoch: 23, step: 240, loss: 0.35440924763679504, mean loss: 0.3518000229308075
Epoch: 23, step: 241, loss: 0.3608212172985077, mean loss: 0.3518002925904705
Epoch: 23, step: 242, loss: 0.32990702986717224, mean loss: 0.3517996381811827
Epoch: 23, step: 243, loss: 0.32373863458633423, mean loss: 0.3517987994376511
Epoch: 23, step: 244, loss: 0.3545215427875519, mean loss: 0.35179888081803035
Epoch: 23, step: 245, loss: 0.380785197019577, mean loss: 0.35179974716736984
Epoch: 23, step: 246, loss: 0.3621293902397156, mean loss: 0.35180005589276725
Epoch: 23, step: 247, loss: 0.34732845425605774, mean loss: 0.35179992225255097
Epoch: 23, step: 248, loss: 0.3171573579311371, mean loss: 0.3517988869408651
Epoch: 23, step: 249, loss: 0.3104032576084137, mean loss: 0.35179764984716677
Epoch: 23, step: 250, loss: 0.34094053506851196, mean loss: 0.3517973253958391
Epoch: 23, step: 251, loss: 0.353877454996109, mean loss: 0.35179738755605905
Epoch: 23, step: 252, loss: 0.3396907448768616, mean loss: 0.3517970257857713
Epoch: 23, step: 253, loss: 0.3324798345565796, mean loss: 0.3517964485673637
Epoch: 23, step: 254, loss: 0.3243511915206909, mean loss: 0.3517956284981299
Epoch: 23, step: 255, loss: 0.3077542185783386, mean loss: 0.3517943125721732
Epoch: 23, step: 256, loss: 0.37831613421440125, mean loss: 0.3517951050016346
Epoch: 23, step: 257, loss: 0.3041962683200836, mean loss: 0.35179368286728496
Epoch: 23, step: 258, loss: 0.3335600793361664, mean loss: 0.3517931381090306
Epoch: 23, step: 259, loss: 0.3683507442474365, mean loss: 0.3517936327793861
Epoch: 23, step: 260, loss: 0.3340129256248474, mean loss: 0.3517931015838806
Epoch: 23, step: 261, loss: 0.3084413409233093, mean loss: 0.35179180649633024
Epoch: 23, step: 262, loss: 0.37065091729164124, mean loss: 0.3517923698752935
Epoch: 23, step: 263, loss: 0.32909131050109863, mean loss: 0.3517916917459061
Epoch: 23, step: 264, loss: 0.3147982954978943, mean loss: 0.35179058670673746
Epoch: 23, step: 265, loss: 0.3185802102088928, mean loss: 0.3517895947007485
Epoch: 23, step: 266, loss: 0.3371054530143738, mean loss: 0.3517891560932128
Epoch: 23, step: 267, loss: 0.30722132325172424, mean loss: 0.3517878249154099
Epoch: 23, step: 268, loss: 0.34763702750205994, mean loss: 0.35178770094069545
Epoch: 23, step: 269, loss: 0.36365067958831787, mean loss: 0.3517880552498361
Epoch: 23, step: 270, loss: 0.3043235242366791, mean loss: 0.35178663767879964
Epoch: 23, step: 271, loss: 0.3903003931045532, mean loss: 0.3517877878924965
Epoch: 23, step: 272, loss: 0.32697170972824097, mean loss: 0.3517870467822034
Epoch: 23, step: 273, loss: 0.3010735511779785, mean loss: 0.3517855323136015
Epoch: 23, step: 274, loss: 0.3160981237888336, mean loss: 0.35178446660426577
Epoch: 23, step: 275, loss: 0.3064136505126953, mean loss: 0.3517831117662315
Epoch: 23, step: 276, loss: 0.3406756818294525, mean loss: 0.3517827800922509
Epoch: 23, step: 277, loss: 0.30393698811531067, mean loss: 0.35178135143318917
Epoch: 23, step: 278, loss: 0.3362855613231659, mean loss: 0.35178088874798685
Epoch: 23, step: 279, loss: 0.38241472840309143, mean loss: 0.35178180340938825
Epoch: 23, step: 280, loss: 0.35065045952796936, mean loss: 0.3517817696308709
Epoch: 23, step: 281, loss: 0.3188987672328949, mean loss: 0.3517807878728725
Epoch: 23, step: 282, loss: 0.30879536271095276, mean loss: 0.3517795045343097
Epoch: 23, step: 283, loss: 0.3676013648509979, mean loss: 0.3517799768850476
Epoch: 23, step: 284, loss: 0.35356733202934265, mean loss: 0.35178003024371085
Epoch: 23, step: 285, loss: 0.3569219410419464, mean loss: 0.35178018374274955
Epoch: 23, step: 286, loss: 0.3118886351585388, mean loss: 0.3517789929147074
Epoch: 23, step: 287, loss: 0.33261653780937195, mean loss: 0.35177842090112216
Epoch: 23, step: 288, loss: 0.33503684401512146, mean loss: 0.3517779211674758
Epoch: 23, step: 289, loss: 0.31629130244255066, mean loss: 0.3517768619286625
Epoch: 23, step: 290, loss: 0.36398035287857056, mean loss: 0.351777226179355
Epoch: 23, step: 291, loss: 0.347552627325058, mean loss: 0.3517771000869823
Epoch: 23, step: 292, loss: 0.33669349551200867, mean loss: 0.3517766498973218
Epoch: 23, step: 293, loss: 0.34704354405403137, mean loss: 0.3517765086358808
Epoch: 23, step: 294, loss: 0.307890921831131, mean loss: 0.35177519889204206
Epoch: 23, step: 295, loss: 0.3502291142940521, mean loss: 0.3517751527512817
Epoch: 23, step: 296, loss: 0.36021074652671814, mean loss: 0.3517754044924192
Epoch: 23, step: 297, loss: 0.29488512873649597, mean loss: 0.35177370678201164
Epoch: 23, step: 298, loss: 0.34567928314208984, mean loss: 0.35177352491863423
Epoch: 23, step: 299, loss: 0.3386855721473694, mean loss: 0.3517731343733737
Epoch: 23, step: 300, loss: 0.3605564534664154, mean loss: 0.351773396460298
Epoch: 23, step: 301, loss: 0.37024518847465515, mean loss: 0.3517739476267363
Epoch: 23, step: 302, loss: 0.2900697588920593, mean loss: 0.3517721065350241
Epoch: 23, step: 303, loss: 0.3021382987499237, mean loss: 0.35177062563611655
Epoch: 23, step: 304, loss: 0.33803513646125793, mean loss: 0.3517702158294759
Epoch: 23, step: 305, loss: 0.3156464695930481, mean loss: 0.35176913808777777
Epoch: 23, step: 306, loss: 0.2933495044708252, mean loss: 0.3517673952066173
Epoch: 23, step: 307, loss: 0.3544033467769623, mean loss: 0.3517674738447907
Epoch: 23, step: 308, loss: 0.34824174642562866, mean loss: 0.3517673686651296
Epoch: 23, step: 309, loss: 0.36572715640068054, mean loss: 0.3517677851017305
Epoch: 23, step: 310, loss: 0.30798640847206116, mean loss: 0.3517664790916291
Epoch: 23, step: 311, loss: 0.3140864372253418, mean loss: 0.35176535511949375
Epoch: 23, step: 312, loss: 0.3757534623146057, mean loss: 0.3517660706484183
Epoch: 23, step: 313, loss: 0.31394311785697937, mean loss: 0.35176494248064427
Epoch: 23, step: 314, loss: 0.34705910086631775, mean loss: 0.351764802120886
Epoch: 23, step: 315, loss: 0.38295239210128784, mean loss: 0.35176573231624453
Epoch: 23, step: 316, loss: 0.31231698393821716, mean loss: 0.3517645557601773
Epoch: 23, step: 317, loss: 0.3482685685157776, mean loss: 0.3517644514957203
Epoch: 23, step: 318, loss: 0.31323519349098206, mean loss: 0.35176330243192844
Epoch: 23, step: 319, loss: 0.3484286665916443, mean loss: 0.35176320298555364
Epoch: 23, step: 320, loss: 0.28913217782974243, mean loss: 0.35176133524257935
Epoch: 23, step: 321, loss: 0.31807735562324524, mean loss: 0.351760330770115
Epoch: 23, step: 322, loss: 0.31099799275398254, mean loss: 0.3517591152538479
Epoch: 23, step: 323, loss: 0.34723106026649475, mean loss: 0.3517589802331243
Epoch: 23, step: 324, loss: 0.3253585994243622, mean loss: 0.35175819303150196
Epoch: 23, step: 325, loss: 0.3542756140232086, mean loss: 0.35175826809325256
Epoch: 23, step: 326, loss: 0.37643107771873474, mean loss: 0.35175900373860947
Epoch: 23, step: 327, loss: 0.3265720307826996, mean loss: 0.3517582527853311
Epoch: 23, step: 328, loss: 0.34154102206230164, mean loss: 0.3517579481661867
Epoch: 23, step: 329, loss: 0.3280273973941803, mean loss: 0.35175724067853625
Epoch: 23, step: 330, loss: 0.3137145936489105, mean loss: 0.3517561065329014
Epoch: 23, step: 331, loss: 0.3578226864337921, mean loss: 0.35175628738729864
Epoch: 23, step: 332, loss: 0.3662034571170807, mean loss: 0.3517567180675708
Epoch: 23, step: 333, loss: 0.3554384410381317, mean loss: 0.3517568278190455
Epoch: 23, step: 334, loss: 0.3378884494304657, mean loss: 0.35175641441759714
Epoch: 23, step: 335, loss: 0.3246386647224426, mean loss: 0.3517556060907313
Epoch: 23, step: 336, loss: 0.31846630573272705, mean loss: 0.3517546138316369
Epoch: 23, step: 337, loss: 0.3148380517959595, mean loss: 0.3517535134870159
Epoch: 23, step: 338, loss: 0.33019593358039856, mean loss: 0.35175287095535046
Epoch: 23, step: 339, loss: 0.3335767090320587, mean loss: 0.3517523292242488
Epoch: 23, step: 340, loss: 0.35297754406929016, mean loss: 0.35175236574005503
Epoch: 23, step: 341, loss: 0.31578436493873596, mean loss: 0.35175129379629866
Epoch: 23, step: 342, loss: 0.29676729440689087, mean loss: 0.35174965517316087
Epoch: 23, step: 343, loss: 0.315247505903244, mean loss: 0.35174856737517335
Epoch: 23, step: 344, loss: 0.3888303339481354, mean loss: 0.3517496724133643
Epoch: 23, step: 345, loss: 0.3242790102958679, mean loss: 0.3517488538108815
Epoch: 23, step: 346, loss: 0.3935921788215637, mean loss: 0.35175010066939966
Epoch: 23, step: 347, loss: 0.3734029531478882, mean loss: 0.35175074586762606
Epoch: 23, step: 348, loss: 0.307567298412323, mean loss: 0.351749429355977
Epoch: 23, step: 349, loss: 0.2975243031978607, mean loss: 0.3517478136856904
Epoch: 23, step: 350, loss: 0.3218993544578552, mean loss: 0.35174692435937194
Epoch: 23, step: 351, loss: 0.29860955476760864, mean loss: 0.35174534119379003
Epoch: 23, step: 352, loss: 0.36241307854652405, mean loss: 0.351745659017039
Epoch: 23, step: 353, loss: 0.33580273389816284, mean loss: 0.35174518404459315
Epoch: 23, step: 354, loss: 0.34769782423973083, mean loss: 0.35174506346903367
Epoch: 23, step: 355, loss: 0.3431251049041748, mean loss: 0.351744806678085
Epoch: 23, step: 356, loss: 0.3192335367202759, mean loss: 0.3517438381872167
Epoch: 23, step: 357, loss: 0.3205868899822235, mean loss: 0.35174291006841407
Epoch: 23, step: 358, loss: 0.354731947183609, mean loss: 0.3517429991046988
Epoch: 23, step: 359, loss: 0.3143293261528015, mean loss: 0.3517418846738352
Epoch: 23, step: 360, loss: 0.3330894708633423, mean loss: 0.35174132909602535
Epoch: 23, step: 361, loss: 0.3314925730228424, mean loss: 0.35174072598778466
Epoch: 23, step: 362, loss: 0.33936163783073425, mean loss: 0.35174035728821185
Epoch: 23, step: 363, loss: 0.324690580368042, mean loss: 0.3517395516598785
Epoch: 23, step: 364, loss: 0.33677878975868225, mean loss: 0.3517391060941073
Epoch: 23, step: 365, loss: 0.2963669002056122, mean loss: 0.3517374570320462
Epoch: 23, step: 366, loss: 0.2729811668395996, mean loss: 0.35173511162896115
Epoch: 23, step: 367, loss: 0.30808740854263306, mean loss: 0.3517338118164809
Epoch: 23, step: 368, loss: 0.3473520576953888, mean loss: 0.3517336813333469
Epoch: 23, step: 369, loss: 0.3630382716655731, mean loss: 0.3517340179598234
Epoch: 23, step: 370, loss: 0.30555662512779236, mean loss: 0.35173264293695966
Epoch: 23, step: 371, loss: 0.3395712077617645, mean loss: 0.35173228081704616
Epoch: 23, step: 372, loss: 0.38914230465888977, mean loss: 0.35173339470788556
Epoch: 23, step: 373, loss: 0.3718034625053406, mean loss: 0.35173399228032043
Epoch: 23, step: 374, loss: 0.33246657252311707, mean loss: 0.35173341862325797
Epoch: 23, step: 375, loss: 0.3056629002094269, mean loss: 0.3517320469870065
Epoch: 23, step: 376, loss: 0.3141472637653351, mean loss: 0.3517309280259412
Epoch: 23, step: 377, loss: 0.3284028470516205, mean loss: 0.3517302335311221
Epoch: 23, step: 378, loss: 0.3425111472606659, mean loss: 0.35172995908004084
Epoch: 23, step: 379, loss: 0.3133983314037323, mean loss: 0.35172881798609956
Epoch: 23, step: 380, loss: 0.3224843442440033, mean loss: 0.3517279474334921
Epoch: 23, step: 381, loss: 0.3634040653705597, mean loss: 0.35172829499906744
Epoch: 23, step: 382, loss: 0.3127138018608093, mean loss: 0.3517271336806231
Epoch: 23, step: 383, loss: 0.3471604287624359, mean loss: 0.35172699775060406
Epoch: 23, step: 384, loss: 0.3352337181568146, mean loss: 0.3517265068353559
Epoch: 23, step: 385, loss: 0.32017406821250916, mean loss: 0.3517255677187828
Epoch: 23, step: 386, loss: 0.30719634890556335, mean loss: 0.35172424240496947
Epoch: 23, step: 387, loss: 0.34038519859313965, mean loss: 0.3517239049334274
Epoch: 23, step: 388, loss: 0.3303081691265106, mean loss: 0.35172326757930683
Epoch: 23, step: 389, loss: 0.2960999310016632, mean loss: 0.35172161222139425
Epoch: 23, step: 390, loss: 0.2992190718650818, mean loss: 0.35172004978529164
Epoch: 23, step: 391, loss: 0.34598925709724426, mean loss: 0.3517198792462877
Epoch: 23, step: 392, loss: 0.32209503650665283, mean loss: 0.3517189976857241
Epoch: 23, step: 393, loss: 0.343626469373703, mean loss: 0.3517187568796683
Epoch: 23, step: 394, loss: 0.42167800664901733, mean loss: 0.3517208385665124
Epoch: 23, step: 395, loss: 0.37732425332069397, mean loss: 0.35172160039151695
Epoch: 23, step: 396, loss: 0.292616069316864, mean loss: 0.3517198417693897
Epoch: 23, step: 397, loss: 0.30835652351379395, mean loss: 0.351718551578427
Epoch: 23, step: 398, loss: 0.33857426047325134, mean loss: 0.3517181605073162
Epoch: 23, step: 399, loss: 0.3125097453594208, mean loss: 0.351716994006806
Epoch: 23, step: 400, loss: 0.38540348410606384, mean loss: 0.3517179961931654
Epoch: 23, step: 401, loss: 0.3474157154560089, mean loss: 0.35171786820242534
Epoch: 23, step: 402, loss: 0.3809652030467987, mean loss: 0.35171873827039635
Epoch: 23, step: 403, loss: 0.3416576683521271, mean loss: 0.3517184389763126
Epoch: 23, step: 404, loss: 0.3460925221443176, mean loss: 0.35171827162298447
Epoch: 23, step: 405, loss: 0.33611080050468445, mean loss: 0.35171780736362585
Epoch: 23, step: 406, loss: 0.32336464524269104, mean loss: 0.35171696399641916
Epoch: 23, step: 407, loss: 0.3128405511379242, mean loss: 0.3517158076486244
Epoch: 23, step: 408, loss: 0.3813885748386383, mean loss: 0.3517166902150915
Epoch: 23, step: 409, loss: 0.3133172392845154, mean loss: 0.351715548122089
Epoch: 23, step: 410, loss: 0.32466182112693787, mean loss: 0.35171474350242404
Epoch: 23, step: 411, loss: 0.2978851795196533, mean loss: 0.35171314257558656
Epoch: 23, step: 412, loss: 0.3472198247909546, mean loss: 0.3517130089453179
Epoch: 23, step: 413, loss: 0.30021223425865173, mean loss: 0.3517114773693146
Epoch: 23, step: 414, loss: 0.3181494176387787, mean loss: 0.35171047930050886
Epoch: 23, step: 415, loss: 0.4140722155570984, mean loss: 0.35171233375918187
Epoch: 23, step: 416, loss: 0.3646172285079956, mean loss: 0.35171271750222355
Epoch: 23, step: 417, loss: 0.3552687168121338, mean loss: 0.3517128232411266
Epoch: 23, step: 418, loss: 0.3366259038448334, mean loss: 0.35171237463955674
Epoch: 23, step: 419, loss: 0.3463239371776581, mean loss: 0.35171221442198236
Epoch: 23, step: 420, loss: 0.31709569692611694, mean loss: 0.35171118517934874
Epoch: 23, step: 421, loss: 0.36578378081321716, mean loss: 0.3517116035832149
Epoch: 23, step: 422, loss: 0.2936345934867859, mean loss: 0.35170987689940053
Epoch: 23, step: 423, loss: 0.31992465257644653, mean loss: 0.351708931923056
Epoch: 23, step: 424, loss: 0.3231704533100128, mean loss: 0.35170808349785126
Epoch: 23, step: 425, loss: 0.31613707542419434, mean loss: 0.35170702603283927
Epoch: 23, step: 426, loss: 0.29227712750434875, mean loss: 0.35170525933648894
Epoch: 23, step: 427, loss: 0.3301318287849426, mean loss: 0.35170461803355935
Epoch: 23, step: 428, loss: 0.3241291344165802, mean loss: 0.35170379833486975
Epoch: 23, step: 429, loss: 0.34929323196411133, mean loss: 0.3517037266813899
Epoch: 23, step: 430, loss: 0.35645127296447754, mean loss: 0.35170386779681606
Epoch: 23, step: 431, loss: 0.3143914043903351, mean loss: 0.351702758759145
Epoch: 23, step: 432, loss: 0.3142951428890228, mean loss: 0.3517016469263059
Epoch: 23, step: 433, loss: 0.314576119184494, mean loss: 0.3517005435105138
Epoch: 23, step: 434, loss: 0.32296690344810486, mean loss: 0.35169968953720077
Epoch: 23, step: 435, loss: 0.3116481304168701, mean loss: 0.35169849922695584
Epoch: 23, step: 436, loss: 0.37643498182296753, mean loss: 0.3516992343597264
Epoch: 23, step: 437, loss: 0.3179439306259155, mean loss: 0.3516982312303435
Epoch: 23, step: 438, loss: 0.3214588463306427, mean loss: 0.35169733261262337
Epoch: 23, step: 439, loss: 0.33748701214790344, mean loss: 0.35169691033993633
Epoch: 23, step: 440, loss: 0.356741338968277, mean loss: 0.3516970602352987
Epoch: 23, step: 441, loss: 0.3473247289657593, mean loss: 0.351696930315192
Epoch: 23, step: 442, loss: 0.32422736287117004, mean loss: 0.3516961141046009
Epoch: 23, step: 443, loss: 0.3512221872806549, mean loss: 0.35169610002310503
Epoch: 23, step: 444, loss: 0.3076172173023224, mean loss: 0.3516947903733228
Epoch: 23, step: 445, loss: 0.31421932578086853, mean loss: 0.3516936769540884
Epoch: 23, step: 446, loss: 0.3495764434337616, mean loss: 0.3516936140516397
Epoch: 23, step: 447, loss: 0.31538254022598267, mean loss: 0.3516925352912765
Epoch: 23, step: 448, loss: 0.30982136726379395, mean loss: 0.3516912913838457
Epoch: 23, step: 449, loss: 0.3499341905117035, mean loss: 0.3516912391854953
Epoch: 23, step: 450, loss: 0.38439491391181946, mean loss: 0.35169221068758144
Epoch: 23, step: 451, loss: 0.3205520808696747, mean loss: 0.3516912856599609
Epoch: 23, step: 452, loss: 0.3215939998626709, mean loss: 0.35169039163691623
Epoch: 23, step: 453, loss: 0.3388606011867523, mean loss: 0.35169001054648524
Epoch: 23, step: 454, loss: 0.3272828757762909, mean loss: 0.35168928558926393
Epoch: 23, step: 455, loss: 0.32543691992759705, mean loss: 0.35168850584690736
Epoch: 23, step: 456, loss: 0.31938326358795166, mean loss: 0.35168754635175575
Epoch: 23, step: 457, loss: 0.35501134395599365, mean loss: 0.3516876450686433
Epoch: 23, step: 458, loss: 0.3402845561504364, mean loss: 0.35168730640662205
Epoch: 23, step: 459, loss: 0.34185990691185, mean loss: 0.3516870145499015
Epoch: 23, step: 460, loss: 0.2992483973503113, mean loss: 0.35168545726016787
Epoch: 23, step: 461, loss: 0.3610556721687317, mean loss: 0.3516857355227713
Epoch: 23, step: 462, loss: 0.3587123155593872, mean loss: 0.35168594418142124
Epoch: 23, step: 463, loss: 0.3328014612197876, mean loss: 0.3516853834116457
Epoch: 23, step: 464, loss: 0.3987993597984314, mean loss: 0.3516867824072922
Epoch: 23, step: 465, loss: 0.343845933675766, mean loss: 0.3516865495891696
Epoch: 23, step: 466, loss: 0.3227475583553314, mean loss: 0.35168569032995073
Epoch: 23, step: 467, loss: 0.3246253728866577, mean loss: 0.3516848868763449
Epoch: 23, step: 468, loss: 0.288392573595047, mean loss: 0.35168300770668603
Epoch: 23, step: 469, loss: 0.3596173822879791, mean loss: 0.3516832432738905
Epoch: 23, step: 470, loss: 0.3039083778858185, mean loss: 0.3516818249066017
Epoch: 23, step: 471, loss: 0.3176637291908264, mean loss: 0.3516808149880732
Epoch: 23, step: 472, loss: 0.3107030391693115, mean loss: 0.35167959848886526
Epoch: 23, step: 473, loss: 0.358113169670105, mean loss: 0.35167978947536355
Epoch: 23, step: 474, loss: 0.36967265605926514, mean loss: 0.3516803235943585
Epoch: 23, step: 475, loss: 0.3269612193107605, mean loss: 0.3516795898284988
Epoch: 23, step: 476, loss: 0.3432256877422333, mean loss: 0.3516793388889611
Epoch: 23, step: 477, loss: 0.321524053812027, mean loss: 0.35167844380777746
Epoch: 23, step: 478, loss: 0.3209476172924042, mean loss: 0.35167753167021804
Epoch: 23, step: 479, loss: 0.3998076915740967, mean loss: 0.35167896020399175
Epoch: 23, step: 480, loss: 0.3187355101108551, mean loss: 0.3516779824504497
Epoch: 23, step: 481, loss: 0.33674895763397217, mean loss: 0.3516775393737946
Epoch: 23, step: 482, loss: 0.34858909249305725, mean loss: 0.3516774477148873
Epoch: 23, step: 483, loss: 0.32617679238319397, mean loss: 0.3516766909290572
Epoch: 23, step: 484, loss: 0.3097773492336273, mean loss: 0.35167544751445956
Epoch: 23, step: 485, loss: 0.3271010220050812, mean loss: 0.3516747182597409
Epoch: 23, step: 486, loss: 0.3768070936203003, mean loss: 0.351675464049686
Epoch: 23, step: 487, loss: 0.3309449553489685, mean loss: 0.3516748489010599
Epoch: 23, step: 488, loss: 0.3071921169757843, mean loss: 0.3516735289778551
Epoch: 23, step: 489, loss: 0.35987308621406555, mean loss: 0.35167377227371993
Epoch: 23, step: 490, loss: 0.3173062205314636, mean loss: 0.35167275255583896
Epoch: 23, step: 491, loss: 0.338876873254776, mean loss: 0.3516723729012193
Epoch: 23, step: 492, loss: 0.33260855078697205, mean loss: 0.3516718072930865
Epoch: 23, step: 493, loss: 0.33271151781082153, mean loss: 0.3516712447733724
Epoch: 23, step: 494, loss: 0.31484556198120117, mean loss: 0.3516701522500748
Epoch: 23, step: 495, loss: 0.3472291827201843, mean loss: 0.3516700205018391
Epoch: 23, step: 496, loss: 0.3085569441318512, mean loss: 0.35166874152363237
Epoch: 23, step: 497, loss: 0.3467247486114502, mean loss: 0.3516685948611313
Epoch: 23, step: 498, loss: 0.3223276138305664, mean loss: 0.3516677244929716
Epoch: 23, step: 499, loss: 0.32031500339508057, mean loss: 0.35166679447632776
Epoch: 23, step: 500, loss: 0.35175999999046326, mean loss: 0.3516667972410035
Epoch: 23, step: 501, loss: 0.35273802280426025, mean loss: 0.35166682901491236
Epoch: 23, step: 502, loss: 0.3167378306388855, mean loss: 0.3516657930072488
Epoch: 23, step: 503, loss: 0.3507413864135742, mean loss: 0.3516657655898033
Epoch: 23, step: 504, loss: 0.3183402717113495, mean loss: 0.35166477720133815
Epoch: 23, step: 505, loss: 0.3573293089866638, mean loss: 0.35166494519860325
Epoch: 23, step: 506, loss: 0.3001747727394104, mean loss: 0.35166341816125163
Epoch: 23, step: 507, loss: 0.28094279766082764, mean loss: 0.3516613208712012
Epoch: 23, step: 508, loss: 0.3276883363723755, mean loss: 0.3516606099496835
Epoch: 23, step: 509, loss: 0.3206996023654938, mean loss: 0.35165969182479223
Epoch: 23, step: 510, loss: 0.34934332966804504, mean loss: 0.35165962313688914
Epoch: 23, step: 511, loss: 0.32260358333587646, mean loss: 0.351658761553453
Epoch: 23, step: 512, loss: 0.34291693568229675, mean loss: 0.35165850234438345
Epoch: 23, step: 513, loss: 0.3091996908187866, mean loss: 0.35165724341028143
Epoch: 23, step: 514, loss: 0.34568169713020325, mean loss: 0.35165706623631754
Epoch: 23, step: 515, loss: 0.3186056315898895, mean loss: 0.35165608629577416
Epoch: 23, step: 516, loss: 0.31933513283729553, mean loss: 0.3516551280416469
Epoch: 23, step: 517, loss: 0.3417404890060425, mean loss: 0.35165483410037696
Epoch: 23, step: 518, loss: 0.3513161838054657, mean loss: 0.35165482406064213
Epoch: 23, step: 519, loss: 0.2934836745262146, mean loss: 0.351653099551288
Epoch: 23, step: 520, loss: 0.30379045009613037, mean loss: 0.35165168068402286
Epoch: 23, step: 521, loss: 0.32924970984458923, mean loss: 0.35165101660710224
Epoch: 23, step: 522, loss: 0.33729034662246704, mean loss: 0.3516505909165736
Epoch: 23, step: 523, loss: 0.3600907325744629, mean loss: 0.35165084109862416
Epoch: 23, step: 524, loss: 0.3378176689147949, mean loss: 0.35165043106891836
Epoch: 23, step: 525, loss: 0.31723493337631226, mean loss: 0.3516494109877727
Epoch: 23, step: 526, loss: 0.35444754362106323, mean loss: 0.35164949392243683
Epoch: 23, step: 527, loss: 0.332543283700943, mean loss: 0.35164892764471833
Epoch: 23, step: 528, loss: 0.330039918422699, mean loss: 0.35164828720699504
Epoch: 23, step: 529, loss: 0.3492518365383148, mean loss: 0.35164821618421427
Epoch: 23, step: 530, loss: 0.3882158696651459, mean loss: 0.351649299895013
Epoch: 23, step: 531, loss: 0.33066028356552124, mean loss: 0.35164867788765375
Epoch: 23, step: 532, loss: 0.3332423269748688, mean loss: 0.35164813243348536
Epoch: 23, step: 533, loss: 0.3476434051990509, mean loss: 0.3516480137608357
Epoch: 23, step: 534, loss: 0.4033888578414917, mean loss: 0.35164954695916684
Epoch: 23, step: 535, loss: 0.3354479670524597, mean loss: 0.3516490668839059
Epoch: 23, step: 536, loss: 0.33325955271720886, mean loss: 0.3516485219932672
Epoch: 23, step: 537, loss: 0.328460693359375, mean loss: 0.3516478349464928
Epoch: 23, step: 538, loss: 0.3014189898967743, mean loss: 0.35164634672851264
Epoch: 23, step: 539, loss: 0.37440696358680725, mean loss: 0.35164702107719886
Epoch: 23, step: 540, loss: 0.30890822410583496, mean loss: 0.35164575485502686
Epoch: 23, step: 541, loss: 0.37956345081329346, mean loss: 0.35164658194799236
Epoch: 23, step: 542, loss: 0.3444020748138428, mean loss: 0.35164636732772475
Epoch: 23, step: 543, loss: 0.3177238404750824, mean loss: 0.3516453623944728
Epoch: 23, step: 544, loss: 0.3323970437049866, mean loss: 0.3516447921921832
Epoch: 23, step: 545, loss: 0.30069878697395325, mean loss: 0.35164328303864273
Epoch: 23, step: 546, loss: 0.33896106481552124, mean loss: 0.35164290736939235
Epoch: 23, step: 547, loss: 0.3015630841255188, mean loss: 0.35164142396230574
Epoch: 23, step: 548, loss: 0.3876325488090515, mean loss: 0.3516424900185495
Epoch: 23, step: 549, loss: 0.33665230870246887, mean loss: 0.3516420460228942
Epoch: 23, step: 550, loss: 0.33731919527053833, mean loss: 0.3516416218055334
Epoch: 23, step: 551, loss: 0.3359842002391815, mean loss: 0.351641158074294
Epoch: 23, step: 552, loss: 0.32213839888572693, mean loss: 0.3516402843068073
Epoch: 23, step: 553, loss: 0.33994337916374207, mean loss: 0.35163993789606446
Epoch: 23, step: 554, loss: 0.32545533776283264, mean loss: 0.35163916244665727
Epoch: 23, step: 555, loss: 0.3059239983558655, mean loss: 0.3516378086453042
Epoch: 23, step: 556, loss: 0.350118488073349, mean loss: 0.35163776365372695
Epoch: 23, step: 557, loss: 0.3323555588722229, mean loss: 0.35163719266750304
Epoch: 23, step: 558, loss: 0.3576829731464386, mean loss: 0.3516373716903475
Epoch: 23, step: 559, loss: 0.378133624792099, mean loss: 0.3516381562530948
Epoch: 23, step: 560, loss: 0.34733399748802185, mean loss: 0.35163802880931533
Epoch: 23, step: 561, loss: 0.312367707490921, mean loss: 0.3516368660710753
Epoch: 23, step: 562, loss: 0.3128463625907898, mean loss: 0.35163571757356293
Epoch: 23, step: 563, loss: 0.3386741280555725, mean loss: 0.3516353338220969
Epoch: 23, step: 564, loss: 0.3294418156147003, mean loss: 0.35163467676202026
Epoch: 23, step: 565, loss: 0.3015165328979492, mean loss: 0.3516331930109437
Epoch: 23, step: 566, loss: 0.2987475097179413, mean loss: 0.3516316273730239
Epoch: 23, step: 567, loss: 0.32381415367126465, mean loss: 0.3516308038835715
Epoch: 23, step: 568, loss: 0.32966235280036926, mean loss: 0.3516301535638331
Epoch: 23, step: 569, loss: 0.297629177570343, mean loss: 0.3516285550505422
Epoch: 23, step: 570, loss: 0.2879205048084259, mean loss: 0.35162666924850444
Epoch: 23, step: 571, loss: 0.33129239082336426, mean loss: 0.3516260673577152
Epoch: 23, step: 572, loss: 0.35993218421936035, mean loss: 0.3516263132099236
Epoch: 23, step: 573, loss: 0.32470834255218506, mean loss: 0.3516255164902569
Epoch: 23, step: 574, loss: 0.3874681890010834, mean loss: 0.35162657733237107
Epoch: 23, step: 575, loss: 0.3111862540245056, mean loss: 0.3516253804481723
Epoch: 23, step: 576, loss: 0.29015782475471497, mean loss: 0.3516235612894019
Epoch: 23, step: 577, loss: 0.3454321324825287, mean loss: 0.35162337805682403
Epoch: 23, step: 578, loss: 0.3758140802383423, mean loss: 0.3516240939486941
Epoch: 23, step: 579, loss: 0.33878806233406067, mean loss: 0.35162371409453885
Epoch: 23, step: 580, loss: 0.34276288747787476, mean loss: 0.3516234518856016
Epoch: 23, step: 581, loss: 0.3383030891418457, mean loss: 0.3516230577220595
Epoch: 23, step: 582, loss: 0.32332634925842285, mean loss: 0.3516222204174741
Epoch: 23, step: 583, loss: 0.34093838930130005, mean loss: 0.3516219042903846
Epoch: 23, step: 584, loss: 0.31895947456359863, mean loss: 0.35162093786053206
Epoch: 23, step: 585, loss: 0.3432055413722992, mean loss: 0.3516206888695714
Epoch: 23, step: 586, loss: 0.33147895336151123, mean loss: 0.3516200929426058
Epoch: 23, step: 587, loss: 0.3174147307872772, mean loss: 0.35161908094964267
Epoch: 23, step: 588, loss: 0.34703829884529114, mean loss: 0.35161894542755445
Epoch: 23, step: 589, loss: 0.3532353937625885, mean loss: 0.35161899324864004
Epoch: 23, step: 590, loss: 0.3473711311817169, mean loss: 0.3516188675834013
Epoch: 23, step: 591, loss: 0.341321736574173, mean loss: 0.3516185629706037
Epoch: 23, step: 592, loss: 0.2869565486907959, mean loss: 0.35161665017621585
Epoch: 23, step: 593, loss: 0.34660106897354126, mean loss: 0.3516165018125762
Epoch: 23, step: 594, loss: 0.32504114508628845, mean loss: 0.3516157157222184
Epoch: 23, step: 595, loss: 0.35748428106307983, mean loss: 0.3516158893073267
Epoch: 23, step: 596, loss: 0.34680354595184326, mean loss: 0.3516157469682053
Epoch: 23, step: 597, loss: 0.3297087252140045, mean loss: 0.35161509902316673
Epoch: 23, step: 598, loss: 0.33111247420310974, mean loss: 0.3516144926339792
Epoch: 23, step: 599, loss: 0.3703753352165222, mean loss: 0.35161504749150263
Epoch: 23, step: 600, loss: 0.3693804144859314, mean loss: 0.3516155728919993
Epoch: 23, step: 601, loss: 0.34827059507369995, mean loss: 0.3516154739691325
Epoch: 23, step: 602, loss: 0.37857070565223694, mean loss: 0.35161627110743454
Epoch: 23, step: 603, loss: 0.317984014749527, mean loss: 0.35161527654106484
Epoch: 23, step: 604, loss: 0.305023193359375, mean loss: 0.35161389877002713
Epoch: 23, step: 605, loss: 0.3123100996017456, mean loss: 0.35161273655466346
Epoch: 23, step: 606, loss: 0.39784663915634155, mean loss: 0.35161410365311707
Epoch: 23, step: 607, loss: 0.35205894708633423, mean loss: 0.3516141168063824
Epoch: 23, step: 608, loss: 0.3103237748146057, mean loss: 0.35161289595714695
Epoch: 23, step: 609, loss: 0.35879749059677124, mean loss: 0.3516131083808546
Epoch: 23, step: 610, loss: 0.3209962546825409, mean loss: 0.35161220317275066
Epoch: 23, step: 611, loss: 0.28954821825027466, mean loss: 0.35161036826307346
Epoch: 23, step: 612, loss: 0.3207756280899048, mean loss: 0.3516094566669116
Epoch: 23, step: 613, loss: 0.3039652705192566, mean loss: 0.35160804815907304
Epoch: 23, step: 614, loss: 0.35378021001815796, mean loss: 0.3516081123729217
Epoch: 23, step: 615, loss: 0.3464219868183136, mean loss: 0.3516079590642557
Epoch: 23, step: 616, loss: 0.2820909321308136, mean loss: 0.35160590411060844
Epoch: 23, step: 617, loss: 0.2893334925174713, mean loss: 0.35160406336536476
Epoch: 23, step: 618, loss: 0.2883911430835724, mean loss: 0.3516021948743275
Epoch: 23, step: 619, loss: 0.35917145013809204, mean loss: 0.35160241860497493
Epoch: 23, step: 620, loss: 0.3394370973110199, mean loss: 0.35160205903528574
Epoch: 23, step: 621, loss: 0.334781289100647, mean loss: 0.35160156187946806
Epoch: 23, step: 622, loss: 0.33227425813674927, mean loss: 0.35160099065725015
Epoch: 23, step: 623, loss: 0.2962890565395355, mean loss: 0.3515993559506029
Epoch: 23, step: 624, loss: 0.3194998800754547, mean loss: 0.35159840730043074
Epoch: 23, step: 625, loss: 0.354343056678772, mean loss: 0.3515984884118847
Epoch: 23, step: 626, loss: 0.3309978246688843, mean loss: 0.35159787962723554
Epoch: 23, step: 627, loss: 0.30842411518096924, mean loss: 0.35159660380677316
Epoch: 23, step: 628, loss: 0.34396132826805115, mean loss: 0.3515963781847307
Epoch: 23, step: 629, loss: 0.3503451943397522, mean loss: 0.3515963412133979
Epoch: 23, step: 630, loss: 0.30181685090065, mean loss: 0.35159487031866893
Epoch: 23, step: 631, loss: 0.39685115218162537, mean loss: 0.3515962075211823
Epoch: 23, step: 632, loss: 0.3447616398334503, mean loss: 0.35159600558388915
Epoch: 23, step: 633, loss: 0.32649731636047363, mean loss: 0.35159526402833685
Epoch: 23, step: 634, loss: 0.32869166135787964, mean loss: 0.3515945873479022
Epoch: 23, step: 635, loss: 0.36460381746292114, mean loss: 0.3515949716905551
Epoch: 23, step: 636, loss: 0.33144837617874146, mean loss: 0.35159437650028325
Epoch: 23, step: 637, loss: 0.3447010815143585, mean loss: 0.35159417285789074
Epoch: 23, step: 638, loss: 0.2873016893863678, mean loss: 0.3515922735791849
Epoch: 23, step: 639, loss: 0.3291395902633667, mean loss: 0.35159161031901365
Epoch: 23, step: 640, loss: 0.3342418074607849, mean loss: 0.3515910978148675
Epoch: 23, step: 641, loss: 0.3192436397075653, mean loss: 0.3515901423160164
Epoch: 23, step: 642, loss: 0.3170698881149292, mean loss: 0.3515891226659144
Epoch: 23, step: 643, loss: 0.34134143590927124, mean loss: 0.35158881998140484
Epoch: 23, step: 644, loss: 0.37901607155799866, mean loss: 0.3515896300724223
Epoch: 23, step: 645, loss: 0.3363582193851471, mean loss: 0.35158918021092167
Epoch: 23, step: 646, loss: 0.31109583377838135, mean loss: 0.351587984270509
Epoch: 23, step: 647, loss: 0.3608287274837494, mean loss: 0.3515882571808225
Epoch: 23, step: 648, loss: 0.4124468266963959, mean loss: 0.35159005448655817
Epoch: 23, step: 649, loss: 0.3383016884326935, mean loss: 0.3515896620594702
Epoch: 23, step: 650, loss: 0.36184775829315186, mean loss: 0.35158996498880996
Epoch: 23, step: 651, loss: 0.32417580485343933, mean loss: 0.35158915545183456
Epoch: 23, step: 652, loss: 0.34174269437789917, mean loss: 0.35158886469556483
Epoch: 23, step: 653, loss: 0.3541228473186493, mean loss: 0.35158893951935927
Epoch: 23, step: 654, loss: 0.31631532311439514, mean loss: 0.3515878979858191
Epoch: 23, step: 655, loss: 0.3443398177623749, mean loss: 0.35158768397612783
Epoch: 23, step: 656, loss: 0.30893474817276, mean loss: 0.3515864246258133
Epoch: 23, step: 657, loss: 0.38776537775993347, mean loss: 0.3515874927968536
Epoch: 23, step: 658, loss: 0.3408215641975403, mean loss: 0.351587174945931
Epoch: 23, step: 659, loss: 0.320120632648468, mean loss: 0.35158624596204174
Epoch: 23, step: 660, loss: 0.32107827067375183, mean loss: 0.3515853453044298
Epoch: 23, step: 661, loss: 0.32245638966560364, mean loss: 0.35158448538367526
Epoch: 23, step: 662, loss: 0.34388554096221924, mean loss: 0.3515842581085632
Epoch: 23, step: 663, loss: 0.3233191668987274, mean loss: 0.3515834237393576
Epoch: 23, step: 664, loss: 0.33797672390937805, mean loss: 0.3515830220892755
Epoch: 23, step: 665, loss: 0.3661489188671112, mean loss: 0.3515834520407714
Epoch: 23, step: 666, loss: 0.2996777892112732, mean loss: 0.3515819199511929
Epoch: 23, step: 667, loss: 0.2941035032272339, mean loss: 0.3515802234217737
Epoch: 23, step: 668, loss: 0.33091744780540466, mean loss: 0.3515796135585578
Epoch: 23, step: 669, loss: 0.30758240818977356, mean loss: 0.3515783150164007
Epoch: 23, step: 670, loss: 0.31848663091659546, mean loss: 0.3515773383707642
Epoch: 23, step: 671, loss: 0.3136286735534668, mean loss: 0.35157621841252973
Epoch: 23, step: 672, loss: 0.3158133924007416, mean loss: 0.351575162994911
Epoch: 23, step: 673, loss: 0.3081050515174866, mean loss: 0.3515738801609537
Epoch: 23, step: 674, loss: 0.3527807891368866, mean loss: 0.3515739157766463
Epoch: 23, step: 675, loss: 0.36158353090286255, mean loss: 0.3515742111500861
Epoch: 23, step: 676, loss: 0.33407124876976013, mean loss: 0.3515736946709223
Epoch: 23, step: 677, loss: 0.32290661334991455, mean loss: 0.35157284878478123
Epoch: 23, step: 678, loss: 0.372699111700058, mean loss: 0.35157347214387114
Epoch: 23, step: 679, loss: 0.33982738852500916, mean loss: 0.35157312556994164
Epoch: 23, step: 680, loss: 0.3204742968082428, mean loss: 0.35157220801089517
Epoch: 23, step: 681, loss: 0.3189975619316101, mean loss: 0.35157124693677944
Epoch: 23, step: 682, loss: 0.3340160548686981, mean loss: 0.35157072900811537
Epoch: 23, step: 683, loss: 0.3021416664123535, mean loss: 0.3515692707516074
Epoch: 23, step: 684, loss: 0.31604769825935364, mean loss: 0.35156822282487366
Epoch: 23, step: 685, loss: 0.3576098084449768, mean loss: 0.3515684010532535
Epoch: 23, step: 686, loss: 0.3037722706794739, mean loss: 0.35156699109631157
Epoch: 23, step: 687, loss: 0.31523260474205017, mean loss: 0.3515659192855047
Epoch: 23, step: 688, loss: 0.31314727663993835, mean loss: 0.3515647860256408
Epoch: 23, step: 689, loss: 0.3009825050830841, mean loss: 0.3515632940109826
Epoch: 23, step: 690, loss: 0.34775134921073914, mean loss: 0.3515631815741835
Epoch: 23, step: 691, loss: 0.3382807970046997, mean loss: 0.3515627898096551
Epoch: 23, step: 692, loss: 0.31330859661102295, mean loss: 0.3515616615337902
Epoch: 23, step: 693, loss: 0.34756311774253845, mean loss: 0.35156154360351854
Epoch: 23, step: 694, loss: 0.308351993560791, mean loss: 0.3515602692486643
Epoch: 23, step: 695, loss: 0.34981784224510193, mean loss: 0.35156021786176433
Epoch: 23, step: 696, loss: 0.35839608311653137, mean loss: 0.3515604194561863
Epoch: 23, step: 697, loss: 0.3417368233203888, mean loss: 0.35156012976004547
Epoch: 23, step: 698, loss: 0.31543827056884766, mean loss: 0.35155906456411523
Epoch: 23, step: 699, loss: 0.3064131736755371, mean loss: 0.3515577332981655
Epoch: 23, step: 700, loss: 0.34133046865463257, mean loss: 0.35155743172459064
Epoch: 23, step: 701, loss: 0.3899820148944855, mean loss: 0.35155856472521485
Epoch: 23, step: 702, loss: 0.33279138803482056, mean loss: 0.3515580113660319
Epoch: 23, step: 703, loss: 0.31971481442451477, mean loss: 0.35155707248181967
Epoch: 23, step: 704, loss: 0.3071678876876831, mean loss: 0.3515557637226489
Epoch: 23, step: 705, loss: 0.344654381275177, mean loss: 0.3515555602500843
Epoch: 23, step: 706, loss: 0.2825773060321808, mean loss: 0.351553526633108
Epoch: 23, step: 707, loss: 0.3149479329586029, mean loss: 0.3515524474587662
Epoch: 23, step: 708, loss: 0.3104119598865509, mean loss: 0.3515512346263741
Epoch: 23, step: 709, loss: 0.30199912190437317, mean loss: 0.3515497738601244
Epoch: 23, step: 710, loss: 0.3056753873825073, mean loss: 0.3515484215508806
Epoch: 23, step: 711, loss: 0.32145026326179504, mean loss: 0.35154753432772623
Epoch: 23, step: 712, loss: 0.30795860290527344, mean loss: 0.3515462494660778
Epoch: 23, step: 713, loss: 0.3515393137931824, mean loss: 0.3515462492616425
Epoch: 23, step: 714, loss: 0.3263434171676636, mean loss: 0.3515455064069223
Epoch: 23, step: 715, loss: 0.32137712836265564, mean loss: 0.35154461721869884
Epoch: 23, step: 716, loss: 0.3887735605239868, mean loss: 0.35154571447895716
Epoch: 23, step: 717, loss: 0.28856581449508667, mean loss: 0.351543858307428
Epoch: 23, step: 718, loss: 0.3207966983318329, mean loss: 0.35154295214020703
Epoch: 23, step: 719, loss: 0.3371155560016632, mean loss: 0.3515425269546554
Epoch: 23, step: 720, loss: 0.3153592050075531, mean loss: 0.351541460638033
Epoch: 23, step: 721, loss: 0.34198907017707825, mean loss: 0.35154117913893296
Epoch: 23, step: 722, loss: 0.3600035309791565, mean loss: 0.35154142850836984
Epoch: 23, step: 723, loss: 0.3648245334625244, mean loss: 0.351541819924711
Epoch: 23, step: 724, loss: 0.34954962134361267, mean loss: 0.35154176122186215
Epoch: 23, step: 725, loss: 0.37212374806404114, mean loss: 0.35154236768031116
Epoch: 23, step: 726, loss: 0.30771395564079285, mean loss: 0.3515410762924671
Epoch: 23, step: 727, loss: 0.3139854967594147, mean loss: 0.351539969763901
Epoch: 23, step: 728, loss: 0.32060855627059937, mean loss: 0.3515390584350217
Epoch: 23, step: 729, loss: 0.3064819276332855, mean loss: 0.35153773096077734
Epoch: 23, step: 730, loss: 0.3296171724796295, mean loss: 0.351537085155796
Epoch: 23, step: 731, loss: 0.32195112109184265, mean loss: 0.35153621354478776
Epoch: 23, step: 732, loss: 0.31213998794555664, mean loss: 0.3515350529548452
Epoch: 23, step: 733, loss: 0.35720598697662354, mean loss: 0.35153522001234894
Epoch: 23, step: 734, loss: 0.34363579750061035, mean loss: 0.3515349873136565
Epoch: 23, step: 735, loss: 0.36735236644744873, mean loss: 0.3515354532432881
Epoch: 23, step: 736, loss: 0.33078041672706604, mean loss: 0.3515348418839987
Epoch: 23, step: 737, loss: 0.31938713788986206, mean loss: 0.35153389497077353
Epoch: 23, step: 738, loss: 0.306112676858902, mean loss: 0.35153255712452125
Epoch: 23, step: 739, loss: 0.34516680240631104, mean loss: 0.3515323696317456
Epoch: 23, step: 740, loss: 0.34960857033729553, mean loss: 0.3515323129710884
Epoch: 23, step: 741, loss: 0.29716354608535767, mean loss: 0.35153071172331535
Epoch: 23, step: 742, loss: 0.32546594738960266, mean loss: 0.35152994409662314
Epoch: 23, step: 743, loss: 0.33683985471725464, mean loss: 0.3515295114753079
Epoch: 23, step: 744, loss: 0.32214680314064026, mean loss: 0.35152864618366453
Epoch: 23, step: 745, loss: 0.3383867144584656, mean loss: 0.35152825917819525
Epoch: 23, step: 746, loss: 0.35825005173683167, mean loss: 0.3515284571166669
Epoch: 23, step: 747, loss: 0.29625844955444336, mean loss: 0.35152682961349957
Epoch: 23, step: 748, loss: 0.35124391317367554, mean loss: 0.3515268212828721
Epoch: 23, step: 749, loss: 0.36379843950271606, mean loss: 0.3515271826166634
Epoch: 23, step: 750, loss: 0.3297187387943268, mean loss: 0.35152654049306353
Epoch: 23, step: 751, loss: 0.3138785660266876, mean loss: 0.3515254320260259
Epoch: 23, step: 752, loss: 0.3289540708065033, mean loss: 0.3515247674783674
Epoch: 23, step: 753, loss: 0.3489897549152374, mean loss: 0.3515246928445406
Epoch: 23, step: 754, loss: 0.33629879355430603, mean loss: 0.3515242445889016
Epoch: 23, step: 755, loss: 0.3274260461330414, mean loss: 0.35152353515065216
Epoch: 23, step: 756, loss: 0.34509360790252686, mean loss: 0.3515233458625587
Epoch: 23, step: 757, loss: 0.32611188292503357, mean loss: 0.3515225978065405
Epoch: 23, step: 758, loss: 0.28977450728416443, mean loss: 0.35152078013586485
Epoch: 23, step: 759, loss: 0.3624446988105774, mean loss: 0.35152110169240186
Epoch: 23, step: 760, loss: 0.34260401129722595, mean loss: 0.35152083921660066
Epoch: 23, step: 761, loss: 0.31756916642189026, mean loss: 0.3515198398737857
Epoch: 23, step: 762, loss: 0.2947446405887604, mean loss: 0.35151816878624237
Epoch: 23, step: 763, loss: 0.3412252366542816, mean loss: 0.35151786583909933
Epoch: 23, step: 764, loss: 0.3480399250984192, mean loss: 0.35151776347748
Epoch: 23, step: 765, loss: 0.31510475277900696, mean loss: 0.3515166918131472
Epoch: 23, step: 766, loss: 0.3465016782283783, mean loss: 0.3515165442215882
Epoch: 23, step: 767, loss: 0.3499307930469513, mean loss: 0.35151649755439646
Epoch: 23, step: 768, loss: 0.3610970675945282, mean loss: 0.35151677949342236
Epoch: 23, step: 769, loss: 0.339275062084198, mean loss: 0.3515164192521944
Epoch: 23, step: 770, loss: 0.3457106053829193, mean loss: 0.35151624840754064
Epoch: 23, step: 771, loss: 0.32845956087112427, mean loss: 0.35151556995039795
Epoch: 23, step: 772, loss: 0.33575835824012756, mean loss: 0.3515151062984424
Epoch: 23, step: 773, loss: 0.3621027171611786, mean loss: 0.3515154178270384
Epoch: 23, step: 774, loss: 0.3276769518852234, mean loss: 0.351514716427505
Epoch: 23, step: 775, loss: 0.4001385569572449, mean loss: 0.3515161470453857
Epoch: 23, step: 776, loss: 0.3078320324420929, mean loss: 0.3515148618026718
Epoch: 23, step: 777, loss: 0.3264447748661041, mean loss: 0.3515141242302406
Epoch: 23, step: 778, loss: 0.3351096212863922, mean loss: 0.35151364161710935
Epoch: 23, step: 779, loss: 0.3814712166786194, mean loss: 0.35151452292962587
Epoch: 23, step: 780, loss: 0.32841548323631287, mean loss: 0.3515138434062036
Epoch: 23, step: 781, loss: 0.29535841941833496, mean loss: 0.35151219148457075
Epoch: 23, step: 782, loss: 0.3265676498413086, mean loss: 0.35151145771367376
Epoch: 23, step: 783, loss: 0.3335988521575928, mean loss: 0.35151093081034523
Epoch: 23, step: 784, loss: 0.3317384123802185, mean loss: 0.35151034921436825
Epoch: 23, step: 785, loss: 0.3319161534309387, mean loss: 0.35150977288059027
Epoch: 23, step: 786, loss: 0.3746342062950134, mean loss: 0.3515104530309892
Epoch: 23, step: 787, loss: 0.32478612661361694, mean loss: 0.3515096670213887
Epoch: 23, step: 788, loss: 0.34636932611465454, mean loss: 0.351509515839338
Epoch: 23, step: 789, loss: 0.3645978569984436, mean loss: 0.35150990076790567
Epoch: 23, step: 790, loss: 0.38323265314102173, mean loss: 0.3515108337077161
Epoch: 23, step: 791, loss: 0.309908926486969, mean loss: 0.3515096102661439
Epoch: 23, step: 792, loss: 0.36751747131347656, mean loss: 0.3515100810163585
Epoch: 23, step: 793, loss: 0.34986642003059387, mean loss: 0.35151003268191794
Epoch: 23, step: 794, loss: 0.3192913234233856, mean loss: 0.35150908526787794
Epoch: 23, step: 795, loss: 0.32946300506591797, mean loss: 0.3515084370062865
Epoch: 23, step: 796, loss: 0.3456137180328369, mean loss: 0.35150826367808
Epoch: 23, step: 797, loss: 0.34520620107650757, mean loss: 0.3515080783777977
Epoch: 23, step: 798, loss: 0.35172638297080994, mean loss: 0.3515080847964444
Epoch: 23, step: 799, loss: 0.3068135976791382, mean loss: 0.3515067707164986
Epoch: 23, step: 800, loss: 0.35574379563331604, mean loss: 0.35150689528724854
Epoch: 23, step: 801, loss: 0.3716434836387634, mean loss: 0.3515074872960788
Epoch: 23, step: 802, loss: 0.3240809440612793, mean loss: 0.35150668098876625
Epoch: 23, step: 803, loss: 0.32009848952293396, mean loss: 0.35150575765294
Epoch: 23, step: 804, loss: 0.2977500259876251, mean loss: 0.35150417739213907
Epoch: 23, step: 805, loss: 0.3373814523220062, mean loss: 0.35150376223765994
Epoch: 23, step: 806, loss: 0.33049285411834717, mean loss: 0.3515031446149162
Epoch: 23, step: 807, loss: 0.3243253827095032, mean loss: 0.3515023457389049
Epoch: 23, step: 808, loss: 0.33723777532577515, mean loss: 0.35150192645168776
Epoch: 23, step: 809, loss: 0.3414449691772461, mean loss: 0.3515016308500984
Epoch: 23, step: 810, loss: 0.35564717650413513, mean loss: 0.35150175269548695
Epoch: 23, step: 811, loss: 0.34384340047836304, mean loss: 0.3515015276087183
Epoch: 23, step: 812, loss: 0.3898213505744934, mean loss: 0.3515026538342279
Epoch: 23, step: 813, loss: 0.34966790676116943, mean loss: 0.3515025999123131
Epoch: 23, step: 814, loss: 0.30859461426734924, mean loss: 0.3515013389141162
Epoch: 23, step: 815, loss: 0.3731723725795746, mean loss: 0.3515019757729873
Epoch: 23, step: 816, loss: 0.3389572501182556, mean loss: 0.3515016071249032
Epoch: 23, step: 817, loss: 0.31681591272354126, mean loss: 0.351500587856775
Epoch: 23, step: 818, loss: 0.30095773935317993, mean loss: 0.3514991026565604
Epoch: 23, step: 819, loss: 0.3365029990673065, mean loss: 0.3514986620094169
Epoch: 23, step: 820, loss: 0.30245086550712585, mean loss: 0.3514972208259625
Epoch: 23, step: 821, loss: 0.3301618993282318, mean loss: 0.3514965939433893
Epoch: 23, step: 822, loss: 0.299068808555603, mean loss: 0.3514950535354155
Epoch: 23, step: 823, loss: 0.3148577809333801, mean loss: 0.3514939771083206
Epoch: 23, step: 824, loss: 0.3344863951206207, mean loss: 0.35149347742908954
Epoch: 23, step: 825, loss: 0.34673449397087097, mean loss: 0.35149333761525037
Epoch: 23, step: 826, loss: 0.33509472012519836, mean loss: 0.35149285585557793
Epoch: 23, step: 827, loss: 0.34738919138908386, mean loss: 0.3514927353013927
Epoch: 23, step: 828, loss: 0.36833396553993225, mean loss: 0.3514932300351032
Epoch: 23, step: 829, loss: 0.30781248211860657, mean loss: 0.3514919468922821
Epoch: 23, step: 830, loss: 0.4123506247997284, mean loss: 0.35149373459248207
Epoch: 23, step: 831, loss: 0.3512687087059021, mean loss: 0.35149372798262757
Epoch: 23, step: 832, loss: 0.31156277656555176, mean loss: 0.351492555095231
Epoch: 23, step: 833, loss: 0.31932520866394043, mean loss: 0.35149161027509257
Epoch: 23, step: 834, loss: 0.3247038424015045, mean loss: 0.35149082348718547
Epoch: 23, step: 835, loss: 0.2942008674144745, mean loss: 0.35148914086394556
Epoch: 23, step: 836, loss: 0.3009923994541168, mean loss: 0.3514876578030213
Epoch: 23, step: 837, loss: 0.37484657764434814, mean loss: 0.3514883438212252
Epoch: 23, step: 838, loss: 0.3439435660839081, mean loss: 0.3514881222483569
Epoch: 23, step: 839, loss: 0.32138770818710327, mean loss: 0.3514872382939912
Epoch: 23, step: 840, loss: 0.3187922537326813, mean loss: 0.3514862781734567
Epoch: 23, step: 841, loss: 0.31387338042259216, mean loss: 0.35148517366597587
Epoch: 23, step: 842, loss: 0.342965692281723, mean loss: 0.351484923497678
Epoch: 23, step: 843, loss: 0.33353814482688904, mean loss: 0.35148439651921104
Epoch: 23, step: 844, loss: 0.32717469334602356, mean loss: 0.3514836827245969
Epoch: 23, step: 845, loss: 0.32037660479545593, mean loss: 0.351482769368618
Epoch: 23, step: 846, loss: 0.4335957467556, mean loss: 0.35148518027256076
Epoch: 23, step: 847, loss: 0.2985508441925049, mean loss: 0.3514836261229401
Epoch: 23, step: 848, loss: 0.3085255026817322, mean loss: 0.351482364911483
Epoch: 23, step: 849, loss: 0.299196720123291, mean loss: 0.35148082989754403
Epoch: 23, step: 850, loss: 0.3417096734046936, mean loss: 0.3514805430421146
Epoch: 23, step: 851, loss: 0.30329224467277527, mean loss: 0.35147912840207324
Epoch: 23, step: 852, loss: 0.3642990291118622, mean loss: 0.35147950473850975
Epoch: 23, step: 853, loss: 0.3448806703090668, mean loss: 0.3514793110311643
Epoch: 23, step: 854, loss: 0.32966694235801697, mean loss: 0.35147867075263456
Epoch: 23, step: 855, loss: 0.3135233521461487, mean loss: 0.3514775566479437
Epoch: 23, step: 856, loss: 0.31982284784317017, mean loss: 0.35147662751269454
Epoch: 23, step: 857, loss: 0.32469651103019714, mean loss: 0.3514758414805113
Epoch: 23, step: 858, loss: 0.3558966815471649, mean loss: 0.3514759712342628
Epoch: 23, step: 859, loss: 0.3129311800003052, mean loss: 0.3514748399595729
Epoch: 23, step: 860, loss: 0.3133167028427124, mean loss: 0.3514737200659
Epoch: 23, step: 861, loss: 0.31264543533325195, mean loss: 0.35147258053767516
Epoch: 23, step: 862, loss: 0.34407851099967957, mean loss: 0.35147236354370487
Epoch: 23, step: 863, loss: 0.2760521471500397, mean loss: 0.35147015024941
Epoch: 23, step: 864, loss: 0.30427250266075134, mean loss: 0.3514687652199887
Epoch: 23, step: 865, loss: 0.3034837245941162, mean loss: 0.3514673571255986
Epoch: 23, step: 866, loss: 0.31951582431793213, mean loss: 0.3514664195531109
Epoch: 23, step: 867, loss: 0.35046184062957764, mean loss: 0.3514663900760298
Epoch: 23, step: 868, loss: 0.3542701303958893, mean loss: 0.35146647234299144
Epoch: 23, step: 869, loss: 0.306305468082428, mean loss: 0.3514651472739151
Epoch: 23, step: 870, loss: 0.3238321542739868, mean loss: 0.35146433651802506
Epoch: 23, step: 871, loss: 0.3409743010997772, mean loss: 0.3514640287479447
Epoch: 23, step: 872, loss: 0.3242199122905731, mean loss: 0.35146322944865005
Epoch: 23, step: 873, loss: 0.3521658182144165, mean loss: 0.3514632500608887
Epoch: 23, step: 874, loss: 0.3361017107963562, mean loss: 0.3514627994040616
Epoch: 23, step: 875, loss: 0.346147745847702, mean loss: 0.35146264348251866
Epoch: 23, step: 876, loss: 0.3572489321231842, mean loss: 0.3514628132231576
Epoch: 23, step: 877, loss: 0.3277396559715271, mean loss: 0.35146211732532096
Epoch: 23, step: 878, loss: 0.30751147866249084, mean loss: 0.35146082811002477
Epoch: 23, step: 879, loss: 0.3506042957305908, mean loss: 0.35146080298587895
Epoch: 23, step: 880, loss: 0.32311883568763733, mean loss: 0.3514599716724921
Epoch: 23, step: 881, loss: 0.3145844042301178, mean loss: 0.3514588900872442
Epoch: 23, step: 882, loss: 0.3917180895805359, mean loss: 0.35146007088206727
Epoch: 23, step: 883, loss: 0.3063066303730011, mean loss: 0.3514587465789083
Epoch: 23, step: 884, loss: 0.3114742338657379, mean loss: 0.35145757390938565
Epoch: 23, step: 885, loss: 0.31792449951171875, mean loss: 0.35145659047709055
Epoch: 23, step: 886, loss: 0.3583669364452362, mean loss: 0.3514567931324754
Epoch: 23, step: 887, loss: 0.3112809956073761, mean loss: 0.3514556149565949
Epoch: 23, step: 888, loss: 0.3242087960243225, mean loss: 0.3514548159530779
Epoch: 23, step: 889, loss: 0.38620832562446594, mean loss: 0.35145583505781286
Epoch: 23, step: 890, loss: 0.3020669221878052, mean loss: 0.3514543868300068
Epoch: 23, step: 891, loss: 0.32409024238586426, mean loss: 0.35145358445654784
Epoch: 23, step: 892, loss: 0.31086722016334534, mean loss: 0.35145239441507903
Epoch: 23, step: 893, loss: 0.3144966959953308, mean loss: 0.351451310860912
Epoch: 23, step: 894, loss: 0.3234592378139496, mean loss: 0.35145049014747937
Epoch: 23, step: 895, loss: 0.357604444026947, mean loss: 0.3514506705730065
Epoch: 23, step: 896, loss: 0.34805214405059814, mean loss: 0.3514505709357693
Epoch: 23, step: 897, loss: 0.3530612885951996, mean loss: 0.3514506181570434
Epoch: 23, step: 898, loss: 0.34005558490753174, mean loss: 0.35145028409960594
Epoch: 23, step: 899, loss: 0.3677595257759094, mean loss: 0.35145076220823857
Epoch: 23, step: 900, loss: 0.3671643137931824, mean loss: 0.35145122284059527
Epoch: 23, step: 901, loss: 0.30470871925354004, mean loss: 0.35144985265522893
Epoch: 23, step: 902, loss: 0.31825271248817444, mean loss: 0.35144887956010457
Epoch: 23, step: 903, loss: 0.3884119391441345, mean loss: 0.3514499630124315
Epoch: 23, step: 904, loss: 0.33177292346954346, mean loss: 0.3514493862606789
Epoch: 23, step: 905, loss: 0.3395283818244934, mean loss: 0.35144903685554274
Epoch: 23, step: 906, loss: 0.32606324553489685, mean loss: 0.35144829281875034
Epoch: 23, step: 907, loss: 0.3002220094203949, mean loss: 0.35144679146226154
Epoch: 23, step: 908, loss: 0.3243955373764038, mean loss: 0.3514459986585897
Epoch: 23, step: 909, loss: 0.3120032548904419, mean loss: 0.35144484272565
Epoch: 23, step: 910, loss: 0.32143041491508484, mean loss: 0.35144396313042653
Epoch: 23, step: 911, loss: 0.34887227416038513, mean loss: 0.3514438877673691
Epoch: 23, step: 912, loss: 0.35022208094596863, mean loss: 0.35144385196350625
Epoch: 23, step: 913, loss: 0.3694603741168976, mean loss: 0.3514443799047286
Epoch: 23, step: 914, loss: 0.3468552827835083, mean loss: 0.35144424543357317
Epoch: 23, step: 915, loss: 0.3444386124610901, mean loss: 0.3514440401583454
Epoch: 23, step: 916, loss: 0.31268948316574097, mean loss: 0.35144290462677424
Epoch: 23, step: 917, loss: 0.3279063105583191, mean loss: 0.3514422150107746
Epoch: 23, step: 918, loss: 0.3357812166213989, mean loss: 0.35144175616109574
Epoch: 23, step: 919, loss: 0.3143343925476074, mean loss: 0.3514406689888347
Epoch: 23, step: 920, loss: 0.31027111411094666, mean loss: 0.3514394628377528
Epoch: 23, step: 921, loss: 0.331504225730896, mean loss: 0.35143887880901
Epoch: 23, step: 922, loss: 0.31291958689689636, mean loss: 0.35143775036922936
Epoch: 23, step: 923, loss: 0.334366112947464, mean loss: 0.3514372502626726
Epoch: 23, step: 924, loss: 0.33085766434669495, mean loss: 0.351436647409876
Epoch: 23, step: 925, loss: 0.32741424441337585, mean loss: 0.3514359437247452
Epoch: 23, step: 926, loss: 0.3159184753894806, mean loss: 0.3514349033466341
Epoch: 23, step: 927, loss: 0.3639187812805176, mean loss: 0.35143526901382605
Epoch: 23, step: 928, loss: 0.30763235688209534, mean loss: 0.3514339860135586
Epoch: 23, step: 929, loss: 0.37975984811782837, mean loss: 0.35143481566214696
Epoch: 23, step: 930, loss: 0.3136802613735199, mean loss: 0.3514337098848489
Epoch: 23, step: 931, loss: 0.3738590180873871, mean loss: 0.35143436667105443
Epoch: 23, step: 932, loss: 0.31731531023979187, mean loss: 0.35143336743086023
Epoch: 23, step: 933, loss: 0.33243921399116516, mean loss: 0.3514328111679469
Epoch: 23, step: 934, loss: 0.33051279187202454, mean loss: 0.35143219852205426
Epoch: 23, step: 935, loss: 0.3330855667591095, mean loss: 0.3514316612539342
Epoch: 23, step: 936, loss: 0.3440742790699005, mean loss: 0.35143144580451596
Epoch: 23, step: 937, loss: 0.390852153301239, mean loss: 0.35143260014441335
Epoch: 23, step: 938, loss: 0.31533220410346985, mean loss: 0.35143154306274543
Epoch: 23, step: 939, loss: 0.3060864806175232, mean loss: 0.3514302153202283
Epoch: 23, step: 940, loss: 0.33110374212265015, mean loss: 0.3514296201609978
Epoch: 23, step: 941, loss: 0.3081212341785431, mean loss: 0.35142835212838136
Epoch: 23, step: 942, loss: 0.3097092807292938, mean loss: 0.35142713066530423
Epoch: 23, step: 943, loss: 0.31140127778053284, mean loss: 0.35142595881107996
Epoch: 23, step: 944, loss: 0.3067370057106018, mean loss: 0.3514246504715566
Epoch: 23, step: 945, loss: 0.3327800929546356, mean loss: 0.3514241046387351
Epoch: 23, step: 946, loss: 0.3484021723270416, mean loss: 0.3514240161720847
Epoch: 23, step: 947, loss: 0.3337904214859009, mean loss: 0.35142349996615124
Epoch: 23, step: 948, loss: 0.39594462513923645, mean loss: 0.35142480323962605
Epoch: 23, step: 949, loss: 0.31006908416748047, mean loss: 0.35142359266298906
Epoch: 23, step: 950, loss: 0.30148211121559143, mean loss: 0.35142213080421064
Epoch: 23, step: 951, loss: 0.3457256257534027, mean loss: 0.3514219640642197
Epoch: 23, step: 952, loss: 0.3152843713760376, mean loss: 0.35142090632698314
Epoch: 23, step: 953, loss: 0.3356384336948395, mean loss: 0.35142044439194153
Epoch: 23, step: 954, loss: 0.39585161209106445, mean loss: 0.35142174480367505
Epoch: 23, step: 955, loss: 0.3516350984573364, mean loss: 0.35142175104792855
Epoch: 23, step: 956, loss: 0.3543829023838043, mean loss: 0.35142183770985413
Epoch: 23, step: 957, loss: 0.3556101620197296, mean loss: 0.35142196028299755
Epoch: 23, step: 958, loss: 0.3345242142677307, mean loss: 0.35142146577753924
Epoch: 23, step: 959, loss: 0.34252873063087463, mean loss: 0.3514212055429862
Epoch: 23, step: 960, loss: 0.36718758940696716, mean loss: 0.3514216669126015
Epoch: 23, step: 961, loss: 0.32652541995048523, mean loss: 0.3514209383983228
Epoch: 23, step: 962, loss: 0.29998543858528137, mean loss: 0.3514194333361483
Epoch: 23, step: 963, loss: 0.3222537338733673, mean loss: 0.3514185799390432
Epoch: 23, step: 964, loss: 0.32346129417419434, mean loss: 0.35141776192442037
Epoch: 23, step: 965, loss: 0.351746141910553, mean loss: 0.3514177715323549
Epoch: 23, step: 966, loss: 0.31518226861953735, mean loss: 0.35141671136374514
Epoch: 23, step: 967, loss: 0.358853816986084, mean loss: 0.3514169289502174
Epoch: 23, step: 968, loss: 0.31206780672073364, mean loss: 0.3514157777515331
Epoch: 23, step: 969, loss: 0.386492520570755, mean loss: 0.3514168039273806
Epoch: 23, step: 970, loss: 0.29236337542533875, mean loss: 0.3514150763602127
Epoch: 23, step: 971, loss: 0.34070131182670593, mean loss: 0.35141476294561713
Epoch: 23, step: 972, loss: 0.3343328833580017, mean loss: 0.35141426325629177
Epoch: 23, step: 973, loss: 0.3053934872150421, mean loss: 0.35141291706849437
Epoch: 23, step: 974, loss: 0.3454440236091614, mean loss: 0.3514127424730792
Epoch: 23, step: 975, loss: 0.31119057536125183, mean loss: 0.35141156597351464
Epoch: 23, step: 976, loss: 0.3427402079105377, mean loss: 0.35141131234345635
Epoch: 23, step: 977, loss: 0.3409321904182434, mean loss: 0.3514110058467636
Epoch: 23, step: 978, loss: 0.3290386199951172, mean loss: 0.35141035151124106
Epoch: 23, step: 979, loss: 0.30980923771858215, mean loss: 0.35140913481979885
Epoch: 23, step: 980, loss: 0.37861889600753784, mean loss: 0.351409930589728
Epoch: 23, step: 981, loss: 0.2946368157863617, mean loss: 0.35140827026584653
Epoch: 23, step: 982, loss: 0.3272382318973541, mean loss: 0.3514075634362408
Epoch: 23, step: 983, loss: 0.3085707724094391, mean loss: 0.3514063107519787
Epoch: 23, step: 984, loss: 0.37365877628326416, mean loss: 0.35140696146594574
Epoch: 23, step: 985, loss: 0.36867716908454895, mean loss: 0.35140746647230925
Epoch: 23, step: 986, loss: 0.34041258692741394, mean loss: 0.35140714497520276
Epoch: 23, step: 987, loss: 0.3203648328781128, mean loss: 0.3514062373052584
Epoch: 23, step: 988, loss: 0.3325567841529846, mean loss: 0.35140568616777257
Epoch: 23, step: 989, loss: 0.338401198387146, mean loss: 0.3514053059418273
Epoch: 23, step: 990, loss: 0.3137807846069336, mean loss: 0.35140420590611887
Epoch: 23, step: 991, loss: 0.3074870705604553, mean loss: 0.3514029219295271
Epoch: 23, step: 992, loss: 0.33043766021728516, mean loss: 0.3514023089997884
Epoch: 23, step: 993, loss: 0.29856008291244507, mean loss: 0.35140076417648003
Epoch: 23, step: 994, loss: 0.3295997083187103, mean loss: 0.3514001268491535
Epoch: 23, step: 995, loss: 0.2936382293701172, mean loss: 0.3513984382997651
Epoch: 23, step: 996, loss: 0.35040757060050964, mean loss: 0.3513984093346477
Epoch: 23, step: 997, loss: 0.35457471013069153, mean loss: 0.3513985021817917
Epoch: 23, step: 998, loss: 0.33686164021492004, mean loss: 0.35139807726401767
Epoch: 23, step: 999, loss: 0.3365768790245056, mean loss: 0.35139764404765383
Epoch: 23, step: 1000, loss: 0.3152911365032196, mean loss: 0.35139658870297363
Epoch: 23, step: 1001, loss: 0.32206955552101135, mean loss: 0.35139573153826964
Epoch: 23, step: 1002, loss: 0.3321283161640167, mean loss: 0.3513951684105369
Epoch: 23, step: 1003, loss: 0.3337898254394531, mean loss: 0.35139465387514496
Epoch: 23, step: 1004, loss: 0.3307337760925293, mean loss: 0.35139405005605556
Epoch: 23, step: 1005, loss: 0.35203179717063904, mean loss: 0.35139406869382267
Epoch: 23, step: 1006, loss: 0.35171598196029663, mean loss: 0.35139407810126494
Epoch: 23, step: 1007, loss: 0.2987900674343109, mean loss: 0.351392540871263
Epoch: 23, step: 1008, loss: 0.2975527346134186, mean loss: 0.35139096757398186
Epoch: 23, step: 1009, loss: 0.30452144145965576, mean loss: 0.35138959800101377
Epoch: 23, step: 1010, loss: 0.31021642684936523, mean loss: 0.35138839491621254
Epoch: 23, step: 1011, loss: 0.33278825879096985, mean loss: 0.3513878514339742
Epoch: 23, step: 1012, loss: 0.34267130494117737, mean loss: 0.35138759675036596
Epoch: 23, step: 1013, loss: 0.29536592960357666, mean loss: 0.3513859599342862
Epoch: 23, step: 1014, loss: 0.31966760754585266, mean loss: 0.3513850332286915
Epoch: 23, step: 1015, loss: 0.3588525950908661, mean loss: 0.35138525139983395
Epoch: 23, step: 1016, loss: 0.3104071319103241, mean loss: 0.3513840542243544
Epoch: 23, step: 1017, loss: 0.2909368872642517, mean loss: 0.3513822883123778
Epoch: 23, step: 1018, loss: 0.3205083906650543, mean loss: 0.3513813863843696
Epoch: 23, step: 1019, loss: 0.3087608814239502, mean loss: 0.3513801413357321
Epoch: 23, step: 1020, loss: 0.3190136253833771, mean loss: 0.35137919585867916
Epoch: 23, step: 1021, loss: 0.3345823585987091, mean loss: 0.3513787052108653
Epoch: 23, step: 1022, loss: 0.30392810702323914, mean loss: 0.35137731918492143
Epoch: 23, step: 1023, loss: 0.31509822607040405, mean loss: 0.3513762595081743
Epoch: 23, step: 1024, loss: 0.33205676078796387, mean loss: 0.351375695221037
Epoch: 23, step: 1025, loss: 0.31757649779319763, mean loss: 0.3513747080372813
Epoch: 23, step: 1026, loss: 0.32232916355133057, mean loss: 0.3513738597197345
Epoch: 23, step: 1027, loss: 0.35831788182258606, mean loss: 0.35137406252411835
Epoch: 23, step: 1028, loss: 0.3387300968170166, mean loss: 0.3513736932602035
Epoch: 23, step: 1029, loss: 0.3366561532020569, mean loss: 0.35137326345061126
Epoch: 23, step: 1030, loss: 0.32684382796287537, mean loss: 0.3513725471163097
Epoch: 23, step: 1031, loss: 0.3645859658718109, mean loss: 0.3513729329771541
Epoch: 23, step: 1032, loss: 0.3335437774658203, mean loss: 0.35137241234186395
Epoch: 23, step: 1033, loss: 0.31095370650291443, mean loss: 0.3513712320958253
Epoch: 23, step: 1034, loss: 0.30169692635536194, mean loss: 0.35136978162408355
Epoch: 23, step: 1035, loss: 0.3303937017917633, mean loss: 0.35136916914803146
Epoch: 23, step: 1036, loss: 0.40584585070610046, mean loss: 0.35137075975451804
Epoch: 23, step: 1037, loss: 0.3290065824985504, mean loss: 0.351370106785839
Epoch: 23, step: 1038, loss: 0.33357515931129456, mean loss: 0.35136958724049805
Epoch: 23, step: 1039, loss: 0.3274875581264496, mean loss: 0.3513688899956915
Epoch: 23, step: 1040, loss: 0.33854612708091736, mean loss: 0.3513685156412433
Epoch: 23, step: 1041, loss: 0.3614296317100525, mean loss: 0.3513688093621538
Epoch: 23, step: 1042, loss: 0.3581273853778839, mean loss: 0.3513690066640372
Epoch: 23, step: 1043, loss: 0.3143590986728668, mean loss: 0.3513679262720477
Epoch: 23, step: 1044, loss: 0.30297571420669556, mean loss: 0.3513665136494577
Epoch: 23, step: 1045, loss: 0.36247771978378296, mean loss: 0.35136683798847734
Epoch: 23, step: 1046, loss: 0.330959290266037, mean loss: 0.3513662423041981
Epoch: 23, step: 1047, loss: 0.3763633668422699, mean loss: 0.3513669719342197
Epoch: 23, step: 1048, loss: 0.31648361682891846, mean loss: 0.35136595376910174
Epoch: 23, step: 1049, loss: 0.32457655668258667, mean loss: 0.3513651718708738
Epoch: 23, step: 1050, loss: 0.33506837487220764, mean loss: 0.3513646962325176
Epoch: 23, step: 1051, loss: 0.35553187131881714, mean loss: 0.35136481785215007
Epoch: 23, step: 1052, loss: 0.39633801579475403, mean loss: 0.3513661303633989
Epoch: 23, step: 1053, loss: 0.3291754722595215, mean loss: 0.35136548276350094
Epoch: 23, step: 1054, loss: 0.321227490901947, mean loss: 0.35136460325867525
Epoch: 23, step: 1055, loss: 0.31917423009872437, mean loss: 0.3513636638874496
Epoch: 23, step: 1056, loss: 0.3196013867855072, mean loss: 0.35136273703586063
Epoch: 23, step: 1057, loss: 0.3171141743659973, mean loss: 0.3513617376614028
Epoch: 23, step: 1058, loss: 0.34170863032341003, mean loss: 0.35136145599155544
Epoch: 23, step: 1059, loss: 0.3635746240615845, mean loss: 0.35136181235150143
Epoch: 23, step: 1060, loss: 0.3076162338256836, mean loss: 0.35136053596546796
Epoch: 23, step: 1061, loss: 0.3764265775680542, mean loss: 0.3513612673082235
Epoch: 23, step: 1062, loss: 0.2983939051628113, mean loss: 0.3513597219439012
Epoch: 23, step: 1063, loss: 0.33977043628692627, mean loss: 0.35135938382726983
Epoch: 23, step: 1064, loss: 0.3344666361808777, mean loss: 0.35135889099686907
Epoch: 23, step: 1065, loss: 0.3073292374610901, mean loss: 0.3513576065096313
Epoch: 23, step: 1066, loss: 0.3352392613887787, mean loss: 0.3513571362991491
Epoch: 23, step: 1067, loss: 0.37114623188972473, mean loss: 0.3513577135773169
Epoch: 23, step: 1068, loss: 0.3429321050643921, mean loss: 0.3513574677966071
Epoch: 23, step: 1069, loss: 0.330570250749588, mean loss: 0.3513568614370876
Epoch: 23, step: 1070, loss: 0.2990366518497467, mean loss: 0.3513553353101563
Epoch: 23, step: 1071, loss: 0.31694987416267395, mean loss: 0.35135433176736236
Epoch: 23, step: 1072, loss: 0.3325394093990326, mean loss: 0.35135378298736036
Epoch: 23, step: 1073, loss: 0.354872465133667, mean loss: 0.3513538856147344
Epoch: 23, step: 1074, loss: 0.33619728684425354, mean loss: 0.3513534435638472
Epoch: 23, step: 1075, loss: 0.32475271821022034, mean loss: 0.3513526677610779
Epoch: 23, step: 1076, loss: 0.3594497740268707, mean loss: 0.35135290390404694
Epoch: 23, step: 1077, loss: 0.36032721400260925, mean loss: 0.3513531656220434
Epoch: 23, step: 1078, loss: 0.32149478793144226, mean loss: 0.3513522948869324
Epoch: 23, step: 1079, loss: 0.3134039342403412, mean loss: 0.351351188262628
Epoch: 23, step: 1080, loss: 0.3431750535964966, mean loss: 0.3513509498426978
Epoch: 23, step: 1081, loss: 0.30991244316101074, mean loss: 0.35134974151159964
Epoch: 23, step: 1082, loss: 0.33976927399635315, mean loss: 0.35134940383941665
Epoch: 23, step: 1083, loss: 0.3075239360332489, mean loss: 0.35134812597996345
Epoch: 23, step: 1084, loss: 0.3253743052482605, mean loss: 0.3513473686594768
Epoch: 23, step: 1085, loss: 0.32726627588272095, mean loss: 0.3513466665458615
Epoch: 23, step: 1086, loss: 0.3216051161289215, mean loss: 0.3513457994199856
Epoch: 23, step: 1087, loss: 0.31634876132011414, mean loss: 0.35134477909817513
Epoch: 23, step: 1088, loss: 0.36154991388320923, mean loss: 0.3513450766152966
Epoch: 23, step: 1089, loss: 0.33880341053009033, mean loss: 0.3513447109903743
Epoch: 23, step: 1090, loss: 0.3291626572608948, mean loss: 0.35134406433982684
Epoch: 23, step: 1091, loss: 0.31307411193847656, mean loss: 0.35134294872787486
Epoch: 23, step: 1092, loss: 0.34274545311927795, mean loss: 0.3513426981085596
Epoch: 23, step: 1093, loss: 0.33017751574516296, mean loss: 0.3513420811557711
Epoch: 23, step: 1094, loss: 0.3072640895843506, mean loss: 0.3513407963453367
Epoch: 23, step: 1095, loss: 0.34391677379608154, mean loss: 0.35134057995200135
Epoch: 23, step: 1096, loss: 0.3360558748245239, mean loss: 0.35134013445067147
Epoch: 23, step: 1097, loss: 0.30211323499679565, mean loss: 0.3513386996823983
Epoch: 23, step: 1098, loss: 0.3182815611362457, mean loss: 0.3513377362264061
Epoch: 23, step: 1099, loss: 0.3403511047363281, mean loss: 0.35133741602847274
Epoch: 23, step: 1100, loss: 0.35722440481185913, mean loss: 0.35133758759577327
Epoch: 23, step: 1101, loss: 0.310989648103714, mean loss: 0.3513364117509434
Epoch: 23, step: 1102, loss: 0.3535255193710327, mean loss: 0.3513364755454245
Epoch: 23, step: 1103, loss: 0.39074552059173584, mean loss: 0.3513376239614709
Epoch: 23, step: 1104, loss: 0.3148460388183594, mean loss: 0.3513365605938938
Epoch: 23, step: 1105, loss: 0.35293227434158325, mean loss: 0.3513366070917593
Epoch: 23, step: 1106, loss: 0.326622873544693, mean loss: 0.3513358869736455
Epoch: 23, step: 1107, loss: 0.3306398093700409, mean loss: 0.35133528394108127
Epoch: 23, step: 1108, loss: 0.33206722140312195, mean loss: 0.3513347225337057
Epoch: 23, step: 1109, loss: 0.32198354601860046, mean loss: 0.3513338673627799
Epoch: 23, step: 1110, loss: 0.3267028331756592, mean loss: 0.351333149738033
Epoch: 23, step: 1111, loss: 0.3248670697212219, mean loss: 0.3513323786717232
Epoch: 23, step: 1112, loss: 0.3462354242801666, mean loss: 0.35133223018069937
Epoch: 23, step: 1113, loss: 0.3461615741252899, mean loss: 0.3513320795468925
Epoch: 23, step: 1114, loss: 0.3215233087539673, mean loss: 0.3513312111700814
Epoch: 23, step: 1115, loss: 0.3016681671142578, mean loss: 0.3513297644489192
Epoch: 23, step: 1116, loss: 0.3363068699836731, mean loss: 0.35132932683365325
Epoch: 23, step: 1117, loss: 0.31533196568489075, mean loss: 0.3513282782650209
Epoch: 23, step: 1118, loss: 0.309440553188324, mean loss: 0.3513270581512731
Epoch: 23, step: 1119, loss: 0.35507524013519287, mean loss: 0.3513271673258619
Epoch: 23, step: 1120, loss: 0.31512999534606934, mean loss: 0.35132611302906347
Epoch: 23, step: 1121, loss: 0.33314138650894165, mean loss: 0.35132558338711906
Epoch: 23, step: 1122, loss: 0.3694193959236145, mean loss: 0.3513261103657862
Epoch: 23, step: 1123, loss: 0.29638904333114624, mean loss: 0.35132451038130824
Epoch: 23, step: 1124, loss: 0.34827613830566406, mean loss: 0.3513244216032532
Epoch: 23, step: 1125, loss: 0.31980979442596436, mean loss: 0.35132350382623717
Epoch: 23, step: 1126, loss: 0.3421500325202942, mean loss: 0.35132323668184434
Epoch: 23, step: 1127, loss: 0.30441755056381226, mean loss: 0.3513218707620389
Epoch: 23, step: 1128, loss: 0.3088025152683258, mean loss: 0.3513206326106894
Epoch: 23, step: 1129, loss: 0.35427767038345337, mean loss: 0.3513207187162678
Epoch: 23, step: 1130, loss: 0.3311014771461487, mean loss: 0.35132012997208206
Epoch: 23, step: 1131, loss: 0.3203652799129486, mean loss: 0.3513192286545285
Epoch: 23, step: 1132, loss: 0.34511125087738037, mean loss: 0.3513190479010629
Epoch: 23, step: 1133, loss: 0.31846868991851807, mean loss: 0.3513180914473861
Epoch: 23, step: 1134, loss: 0.2987363338470459, mean loss: 0.35131656054926985
Epoch: 23, step: 1135, loss: 0.3742293119430542, mean loss: 0.3513172276259961
Epoch: 23, step: 1136, loss: 0.3932597041130066, mean loss: 0.3513184486943383
Epoch: 23, step: 1137, loss: 0.33180782198905945, mean loss: 0.3513178806993833
Epoch: 23, step: 1138, loss: 0.32512664794921875, mean loss: 0.3513171182402773
Epoch: 23, step: 1139, loss: 0.3191659450531006, mean loss: 0.35131618230719663
Epoch: 23, step: 1140, loss: 0.34955835342407227, mean loss: 0.35131613113760785
Epoch: 23, step: 1141, loss: 0.3745305836200714, mean loss: 0.35131680687995176
Epoch: 23, step: 1142, loss: 0.32546019554138184, mean loss: 0.35131605424972795
Epoch: 23, step: 1143, loss: 0.3171238601207733, mean loss: 0.351315059017625
Epoch: 23, step: 1144, loss: 0.316145658493042, mean loss: 0.35131403537177336
Epoch: 23, step: 1145, loss: 0.3582536578178406, mean loss: 0.3513142373515873
Epoch: 23, step: 1146, loss: 0.30458176136016846, mean loss: 0.35131287722830107
Epoch: 23, step: 1147, loss: 0.3154965937137604, mean loss: 0.3513118348451953
Epoch: 23, step: 1148, loss: 0.3768778145313263, mean loss: 0.35131257888581363
Epoch: 23, step: 1149, loss: 0.2970966100692749, mean loss: 0.35131100109730257
Epoch: 23, step: 1150, loss: 0.3288237452507019, mean loss: 0.35131034669414085
Epoch: 23, step: 1151, loss: 0.31223076581954956, mean loss: 0.3513092094696945
Epoch: 23, step: 1152, loss: 0.2892877757549286, mean loss: 0.3513074046847763
Epoch: 23, step: 1153, loss: 0.3292430341243744, mean loss: 0.35130676264408023
Epoch: 23, step: 1154, loss: 0.3464725613594055, mean loss: 0.35130662198003376
Epoch: 23, step: 1155, loss: 0.33949533104896545, mean loss: 0.3513062783088591
Epoch: 23, step: 1156, loss: 0.3107937276363373, mean loss: 0.3513050995561845
Epoch: 23, step: 1157, loss: 0.37034666538238525, mean loss: 0.3513056535732292
Epoch: 23, step: 1158, loss: 0.32185518741607666, mean loss: 0.35130479673269044
Epoch: 23, step: 1159, loss: 0.31520846486091614, mean loss: 0.3513037465659305
Epoch: 23, step: 1160, loss: 0.3246428370475769, mean loss: 0.35130297093070756
Epoch: 23, step: 1161, loss: 0.34684425592422485, mean loss: 0.3513028412188612
Epoch: 23, step: 1162, loss: 0.38263848423957825, mean loss: 0.35130375280120363
Epoch: 23, step: 1163, loss: 0.34571585059165955, mean loss: 0.3513035902487772
Epoch: 23, step: 1164, loss: 0.3234406113624573, mean loss: 0.3513027797365485
Epoch: 23, step: 1165, loss: 0.3604240417480469, mean loss: 0.351303045059197
Epoch: 23, step: 1166, loss: 0.3064570128917694, mean loss: 0.3513017405991439
Epoch: 23, step: 1167, loss: 0.3150525987148285, mean loss: 0.3513006862320152
Epoch: 23, step: 1168, loss: 0.28409484028816223, mean loss: 0.3512987314940511
Epoch: 23, step: 1169, loss: 0.32733726501464844, mean loss: 0.3512980345751261
Epoch: 23, step: 1170, loss: 0.3034530580043793, mean loss: 0.3512966430451092
Epoch: 23, step: 1171, loss: 0.30043473839759827, mean loss: 0.3512951638133547
Epoch: 23, step: 1172, loss: 0.36835339665412903, mean loss: 0.3512956599085369
Epoch: 23, step: 1173, loss: 0.3712335228919983, mean loss: 0.3512962397335524
Epoch: 23, step: 1174, loss: 0.3817536234855652, mean loss: 0.35129712545733616
Epoch: 23, step: 1175, loss: 0.34146422147750854, mean loss: 0.3512968395173577
Epoch: 23, step: 1176, loss: 0.3925924003124237, mean loss: 0.3512980403536947
Epoch: 23, step: 1177, loss: 0.3080618679523468, mean loss: 0.3512967831227438
Epoch: 23, step: 1178, loss: 0.31570449471473694, mean loss: 0.3512957481924304
Epoch: 23, step: 1179, loss: 0.3579445481300354, mean loss: 0.35129594151645743
Epoch: 23, step: 1180, loss: 0.35237249732017517, mean loss: 0.3512959728180538
Epoch: 23, step: 1181, loss: 0.3434032201766968, mean loss: 0.3512957433375444
Epoch: 23, step: 1182, loss: 0.3409971296787262, mean loss: 0.3512954439157197
Epoch: 23, step: 1183, loss: 0.3337019383907318, mean loss: 0.351294932417129
Epoch: 23, step: 1184, loss: 0.329005628824234, mean loss: 0.3512942844157454
Epoch: 23, step: 1185, loss: 0.33931154012680054, mean loss: 0.35129393605990233
Epoch: 23, step: 1186, loss: 0.352811723947525, mean loss: 0.3512939801829259
Epoch: 23, step: 1187, loss: 0.33867180347442627, mean loss: 0.3512936132591844
Epoch: 23, step: 1188, loss: 0.3168199956417084, mean loss: 0.3512926111482685
Epoch: 23, step: 1189, loss: 0.33469176292419434, mean loss: 0.35129212859352676
Epoch: 23, step: 1190, loss: 0.3386058211326599, mean loss: 0.35129175983767813
Epoch: 23, step: 1191, loss: 0.37255167961120605, mean loss: 0.3512923777867472
Epoch: 23, step: 1192, loss: 0.3823322057723999, mean loss: 0.351293279976196
Epoch: 23, step: 1193, loss: 0.3363862931728363, mean loss: 0.35129284670912625
Epoch: 23, step: 1194, loss: 0.3164326250553131, mean loss: 0.3512918335367586
Epoch: 23, step: 1195, loss: 0.32098904252052307, mean loss: 0.3512909528464826
Epoch: 23, step: 1196, loss: 0.3072297275066376, mean loss: 0.3512896723319271
Epoch: 23, step: 1197, loss: 0.3067578375339508, mean loss: 0.3512883781780533
Epoch: 23, step: 1198, loss: 0.37536492943763733, mean loss: 0.3512890778540656
Epoch: 23, step: 1199, loss: 0.37057170271873474, mean loss: 0.3512896382000166
Epoch: 23, step: 1200, loss: 0.3185798227787018, mean loss: 0.35128868769249266
Epoch: 23, step: 1201, loss: 0.3576481342315674, mean loss: 0.3512888724849184
Epoch: 23, step: 1202, loss: 0.3217197358608246, mean loss: 0.3512880132916415
Epoch: 23, step: 1203, loss: 0.3250634968280792, mean loss: 0.3512872513054588
Epoch: 23, step: 1204, loss: 0.3201007544994354, mean loss: 0.3512863451690493
Epoch: 23, step: 1205, loss: 0.36267390847206116, mean loss: 0.35128667602974145
Epoch: 23, step: 1206, loss: 0.31593573093414307, mean loss: 0.3512856489532693
Epoch: 23, step: 1207, loss: 0.29536253213882446, mean loss: 0.35128402422587784
Epoch: 23, step: 1208, loss: 0.31146129965782166, mean loss: 0.3512828672948018
Epoch: 23, step: 1209, loss: 0.31774038076400757, mean loss: 0.3512818928457131
Epoch: 23, step: 1210, loss: 0.30415526032447815, mean loss: 0.35128052380081515
Epoch: 23, step: 1211, loss: 0.3272085189819336, mean loss: 0.3512798245211028
Epoch: 23, step: 1212, loss: 0.3181086480617523, mean loss: 0.35127886094299215
Epoch: 23, step: 1213, loss: 0.36068007349967957, mean loss: 0.35127913402765365
Epoch: 23, step: 1214, loss: 0.320148229598999, mean loss: 0.35127822976923934
Epoch: 23, step: 1215, loss: 0.3169066905975342, mean loss: 0.35127723140920764
Epoch: 23, step: 1216, loss: 0.32119664549827576, mean loss: 0.35127635771011934
Epoch: 23, step: 1217, loss: 0.3046627938747406, mean loss: 0.35127500384535504
Epoch: 23, step: 1218, loss: 0.3432063162326813, mean loss: 0.35127476950166436
Epoch: 23, step: 1219, loss: 0.3151242733001709, mean loss: 0.3512737195918072
Epoch: 23, step: 1220, loss: 0.3263753354549408, mean loss: 0.35127299649523885
Epoch: 23, step: 1221, loss: 0.32857489585876465, mean loss: 0.35127233731824414
Epoch: 23, step: 1222, loss: 0.3493580222129822, mean loss: 0.35127228172611097
Epoch: 23, step: 1223, loss: 0.35085564851760864, mean loss: 0.351272269627342
Epoch: 23, step: 1224, loss: 0.4004404842853546, mean loss: 0.3512736974002217
Epoch: 23, step: 1225, loss: 0.31210294365882874, mean loss: 0.3512725599719813
Epoch: 23, step: 1226, loss: 0.3479368984699249, mean loss: 0.3512724631148861
Epoch: 23, step: 1227, loss: 0.32750973105430603, mean loss: 0.35127177314008756
Epoch: 23, step: 1228, loss: 0.34731578826904297, mean loss: 0.3512716582774276
Epoch: 23, step: 1229, loss: 0.33465442061424255, mean loss: 0.35127117580725564
Epoch: 23, step: 1230, loss: 0.36849939823150635, mean loss: 0.351271676002431
Epoch: 23, step: 1231, loss: 0.30468177795410156, mean loss: 0.3512703233750344
Epoch: 23, step: 1232, loss: 0.33570539951324463, mean loss: 0.35126987149743644
Epoch: 23, step: 1233, loss: 0.30986061692237854, mean loss: 0.351268669347562
Epoch: 23, step: 1234, loss: 0.335697203874588, mean loss: 0.3512682173062965
Epoch: 23, step: 1235, loss: 0.29918989539146423, mean loss: 0.35126670551107136
Epoch: 23, step: 1236, loss: 0.3339806795120239, mean loss: 0.3512662037250689
Epoch: 23, step: 1237, loss: 0.37908634543418884, mean loss: 0.3512670112763522
Epoch: 23, step: 1238, loss: 0.33387139439582825, mean loss: 0.35126650633841483
Epoch: 23, step: 1239, loss: 0.3010816276073456, mean loss: 0.35126504967759015
Epoch: 23, step: 1240, loss: 0.33415669202804565, mean loss: 0.3512645531066776
Epoch: 23, step: 1241, loss: 0.3228515088558197, mean loss: 0.3512637284406228
Epoch: 23, step: 1242, loss: 0.30930888652801514, mean loss: 0.3512625107699825
Epoch: 23, step: 1243, loss: 0.3733850121498108, mean loss: 0.35126315282075393
Epoch: 23, step: 1244, loss: 0.32393917441368103, mean loss: 0.3512623598330183
Epoch: 23, step: 1245, loss: 0.3232811689376831, mean loss: 0.35126154779543933
Epoch: 23, step: 1246, loss: 0.35972681641578674, mean loss: 0.3512617934574905
Epoch: 23, step: 1247, loss: 0.3570864200592041, mean loss: 0.3512619624832189
Epoch: 23, step: 1248, loss: 0.33791184425354004, mean loss: 0.35126157508534217
Epoch: 23, step: 1249, loss: 0.3395480811595917, mean loss: 0.35126123518940094
Epoch: 23, step: 1250, loss: 0.31372106075286865, mean loss: 0.35126014590017957
Epoch: 23, step: 1251, loss: 0.31542539596557617, mean loss: 0.35125910612679473
Epoch: 23, step: 1252, loss: 0.3208281099796295, mean loss: 0.35125822317318534
Epoch: 23, step: 1253, loss: 0.3493855893611908, mean loss: 0.35125816884039907
Epoch: 23, step: 1254, loss: 0.33740565180778503, mean loss: 0.3512577669337338
Epoch: 23, step: 1255, loss: 0.36943939328193665, mean loss: 0.35125829442666484
Epoch: 23, step: 1256, loss: 0.3092155158519745, mean loss: 0.35125707469941503
Epoch: 23, step: 1257, loss: 0.3352762460708618, mean loss: 0.35125661108384704
Epoch: 23, step: 1258, loss: 0.3529966473579407, mean loss: 0.35125666156211205
Epoch: 23, step: 1259, loss: 0.30288225412368774, mean loss: 0.3512552582664681
Epoch: 23, step: 1260, loss: 0.3666813373565674, mean loss: 0.35125570574939935
Epoch: 23, step: 1261, loss: 0.3067689836025238, mean loss: 0.35125441530668466
Epoch: 23, step: 1262, loss: 0.3588077127933502, mean loss: 0.35125463440160815
Epoch: 23, step: 1263, loss: 0.3669731616973877, mean loss: 0.35125509032826135
Epoch: 23, step: 1264, loss: 0.3614719808101654, mean loss: 0.351255386667574
Epoch: 23, step: 1265, loss: 0.3447123169898987, mean loss: 0.35125519689236434
Epoch: 23, step: 1266, loss: 0.35699209570884705, mean loss: 0.35125536328056634
Epoch: 23, step: 1267, loss: 0.3045584261417389, mean loss: 0.35125400896104375
Epoch: 23, step: 1268, loss: 0.32851293683052063, mean loss: 0.3512533494363162
Epoch: 23, step: 1269, loss: 0.3442783057689667, mean loss: 0.3512531471555997
Epoch: 23, step: 1270, loss: 0.31780436635017395, mean loss: 0.35125217714774637
Epoch: 23, step: 1271, loss: 0.3259369432926178, mean loss: 0.3512514430323927
Epoch: 23, step: 1272, loss: 0.36163511872291565, mean loss: 0.3512517441394158
Epoch: 23, step: 1273, loss: 0.3087310492992401, mean loss: 0.3512505111551659
Epoch: 23, step: 1274, loss: 0.3572924733161926, mean loss: 0.3512506863505196
Epoch: 23, step: 1275, loss: 0.36938104033470154, mean loss: 0.35125121205087867
Epoch: 23, step: 1276, loss: 0.3054683208465576, mean loss: 0.35124988458730466
Epoch: 23, step: 1277, loss: 0.38141459226608276, mean loss: 0.35125075918016285
Epoch: 23, step: 1278, loss: 0.42623287439346313, mean loss: 0.3512529331419272
Epoch: 23, step: 1279, loss: 0.3259698152542114, mean loss: 0.35125220012795616
Epoch: 23, step: 1280, loss: 0.30943962931632996, mean loss: 0.35125098792342735
Epoch: 23, step: 1281, loss: 0.3524341881275177, mean loss: 0.35125102222505095
Epoch: 23, step: 1282, loss: 0.32429036498069763, mean loss: 0.35125024064345234
Epoch: 23, step: 1283, loss: 0.3840332627296448, mean loss: 0.35125119098616125
Epoch: 23, step: 1284, loss: 0.2915566563606262, mean loss: 0.3512494605593234
Epoch: 23, step: 1285, loss: 0.3212992250919342, mean loss: 0.35124859238622735
Epoch: 23, step: 1286, loss: 0.380765825510025, mean loss: 0.35124944798300184
Epoch: 23, step: 1287, loss: 0.33162418007850647, mean loss: 0.3512488791346568
Epoch: 23, step: 1288, loss: 0.33494052290916443, mean loss: 0.3512484064423805
Epoch: 23, step: 1289, loss: 0.32248127460479736, mean loss: 0.3512475726608073
Epoch: 23, step: 1290, loss: 0.34497174620628357, mean loss: 0.35124739076861083
Epoch: 23, step: 1291, loss: 0.336929053068161, mean loss: 0.35124697579244285
Epoch: 23, step: 1292, loss: 0.3605506718158722, mean loss: 0.35124724542571406
Epoch: 23, step: 1293, loss: 0.36510297656059265, mean loss: 0.35124764697127525
Epoch: 23, step: 1294, loss: 0.3131280243396759, mean loss: 0.35124654227881774
Epoch: 23, step: 1295, loss: 0.3819757103919983, mean loss: 0.35124743277285136
Epoch: 23, step: 1296, loss: 0.3180159628391266, mean loss: 0.3512464697930509
Epoch: 23, step: 1297, loss: 0.3110646903514862, mean loss: 0.351245305441285
Epoch: 23, step: 1298, loss: 0.30791744589805603, mean loss: 0.35124404996159614
Epoch: 23, step: 1299, loss: 0.3468753695487976, mean loss: 0.3512439233772077
Epoch: 23, step: 1300, loss: 0.32993724942207336, mean loss: 0.35124330602508086
Epoch: 23, step: 1301, loss: 0.3272381126880646, mean loss: 0.35124261050461564
Epoch: 23, step: 1302, loss: 0.3258773982524872, mean loss: 0.3512418756005956
Epoch: 23, step: 1303, loss: 0.39380955696105957, mean loss: 0.351243108874479
Epoch: 23, step: 1304, loss: 0.3456995189189911, mean loss: 0.3512429482698507
Epoch: 23, step: 1305, loss: 0.3324279487133026, mean loss: 0.3512424031919332
Epoch: 23, step: 1306, loss: 0.2924308478832245, mean loss: 0.35124069944746467
Epoch: 23, step: 1307, loss: 0.3402218520641327, mean loss: 0.35124038024562854
Epoch: 23, step: 1308, loss: 0.4083840847015381, mean loss: 0.35124203557729494
Epoch: 23, step: 1309, loss: 0.3325897455215454, mean loss: 0.3512414952757465
Epoch: 23, step: 1310, loss: 0.3523760139942169, mean loss: 0.35124152813843856
Epoch: 23, step: 1311, loss: 0.3457712233066559, mean loss: 0.35124136968910386
Epoch: 23, step: 1312, loss: 0.30376434326171875, mean loss: 0.35123999453989524
Epoch: 23, step: 1313, loss: 0.3371025621891022, mean loss: 0.35123958506783504
Epoch: 23, step: 1314, loss: 0.3436203598976135, mean loss: 0.35123936439343034
Epoch: 23, step: 1315, loss: 0.31426072120666504, mean loss: 0.3512382934178978
Epoch: 23, step: 1316, loss: 0.35978275537490845, mean loss: 0.351238540875454
Epoch: 23, step: 1317, loss: 0.3290633261203766, mean loss: 0.35123789867404204
Epoch: 23, step: 1318, loss: 0.3519252836704254, mean loss: 0.351237918580358
Epoch: 23, step: 1319, loss: 0.3365768790245056, mean loss: 0.3512374940164881
Epoch: 23, step: 1320, loss: 0.3000057637691498, mean loss: 0.3512360104578559
Epoch: 23, step: 1321, loss: 0.3381190001964569, mean loss: 0.35123563062898405
Epoch: 23, step: 1322, loss: 0.33889898657798767, mean loss: 0.3512352734074971
Epoch: 23, step: 1323, loss: 0.30658870935440063, mean loss: 0.35123398065315226
Epoch: 23, step: 1324, loss: 0.33565154671669006, mean loss: 0.3512335294722756
Epoch: 23, step: 1325, loss: 0.3267291486263275, mean loss: 0.35123281998183475
Epoch: 23, step: 1326, loss: 0.34375277161598206, mean loss: 0.35123260341365486
Epoch: 23, step: 1327, loss: 0.336115300655365, mean loss: 0.35123216573841576
Epoch: 23, step: 1328, loss: 0.29425248503685, mean loss: 0.3512305161138912
Epoch: 23, step: 1329, loss: 0.32728514075279236, mean loss: 0.35122982288896615
Epoch: 23, step: 1330, loss: 0.30642858147621155, mean loss: 0.3512285259187721
Epoch: 23, step: 1331, loss: 0.3134125769138336, mean loss: 0.3512274312004707
Epoch: 23, step: 1332, loss: 0.33096587657928467, mean loss: 0.35122684467406684
Epoch: 23, step: 1333, loss: 0.31986427307128906, mean loss: 0.3512259368244865
Epoch: 23, step: 1334, loss: 0.3806644082069397, mean loss: 0.3512267889526418
Epoch: 23, step: 1335, loss: 0.3455192744731903, mean loss: 0.3512266237472904
Epoch: 23, step: 1336, loss: 0.37035679817199707, mean loss: 0.35122717745866916
Epoch: 23, step: 1337, loss: 0.29312238097190857, mean loss: 0.3512254956990024
Epoch: 23, step: 1338, loss: 0.30538052320480347, mean loss: 0.35122416882069224
Epoch: 23, step: 1339, loss: 0.3784079849720001, mean loss: 0.35122495557156486
Epoch: 23, step: 1340, loss: 0.3107735514640808, mean loss: 0.3512237848655738
Epoch: 23, step: 1341, loss: 0.3450269401073456, mean loss: 0.35122360552758813
Epoch: 23, step: 1342, loss: 0.3347242474555969, mean loss: 0.3512231280465269
Epoch: 23, step: 1343, loss: 0.38844025135040283, mean loss: 0.3512242050555356
Epoch: 23, step: 1344, loss: 0.2954813241958618, mean loss: 0.35122259198493166
Epoch: 23, step: 1345, loss: 0.3437628746032715, mean loss: 0.35122237612413587
Epoch: 23, step: 1346, loss: 0.3444671928882599, mean loss: 0.3512221806560021
Epoch: 23, step: 1347, loss: 0.31250467896461487, mean loss: 0.3512210603579207
Epoch: 23, step: 1348, loss: 0.30675452947616577, mean loss: 0.3512197737478434
Epoch: 23, step: 1349, loss: 0.30946090817451477, mean loss: 0.35121856551725567
Epoch: 23, step: 1350, loss: 0.2997124493122101, mean loss: 0.3512170753076036
Epoch: 23, step: 1351, loss: 0.31449469923973083, mean loss: 0.3512160128618199
Epoch: 23, step: 1352, loss: 0.31940677762031555, mean loss: 0.3512150925888489
Epoch: 23, step: 1353, loss: 0.3639109432697296, mean loss: 0.3512154598818733
Epoch: 23, step: 1354, loss: 0.2943650186061859, mean loss: 0.3512138152369439
Epoch: 23, step: 1355, loss: 0.38001298904418945, mean loss: 0.3512146483535201
Epoch: 23, step: 1356, loss: 0.36068883538246155, mean loss: 0.3512149224195049
Epoch: 23, step: 1357, loss: 0.35692882537841797, mean loss: 0.35121508770451965
Epoch: 23, step: 1358, loss: 0.30281704664230347, mean loss: 0.3512136877438283
Epoch: 23, step: 1359, loss: 0.34673869609832764, mean loss: 0.35121355830406065
Epoch: 23, step: 1360, loss: 0.30884718894958496, mean loss: 0.35121233288626774
Epoch: 23, step: 1361, loss: 0.34036579728126526, mean loss: 0.3512120191668368
Epoch: 23, step: 1362, loss: 0.32911208271980286, mean loss: 0.3512113799785086
Epoch: 23, step: 1363, loss: 0.3498629033565521, mean loss: 0.35121134097814355
Epoch: 23, step: 1364, loss: 0.32969605922698975, mean loss: 0.35121071873556176
Epoch: 23, step: 1365, loss: 0.3145328760147095, mean loss: 0.3512096580078528
Epoch: 23, step: 1366, loss: 0.3068183362483978, mean loss: 0.35120837424251083
Epoch: 23, step: 1367, loss: 0.3251895010471344, mean loss: 0.351207621817028
Epoch: 23, step: 1368, loss: 0.3356766700744629, mean loss: 0.35120717269896484
Epoch: 23, step: 1369, loss: 0.31439346075057983, mean loss: 0.35120610816504694
Epoch: 23, step: 1370, loss: 0.3389360308647156, mean loss: 0.3512057533642113
Epoch: 23, step: 1371, loss: 0.3141515552997589, mean loss: 0.3512046819381743
Epoch: 23, step: 1372, loss: 0.31276240944862366, mean loss: 0.3512035704079592
Epoch: 23, step: 1373, loss: 0.3266798257827759, mean loss: 0.3512028613423076
Epoch: 23, step: 1374, loss: 0.36715349555015564, mean loss: 0.3512033225165698
Epoch: 23, step: 1375, loss: 0.3259010314941406, mean loss: 0.35120259098277135
Epoch: 23, step: 1376, loss: 0.3944699764251709, mean loss: 0.3512038418829258
Epoch: 23, step: 1377, loss: 0.3491254448890686, mean loss: 0.3512037817962824
Epoch: 23, step: 1378, loss: 0.31393322348594666, mean loss: 0.35120270433225104
Epoch: 23, step: 1379, loss: 0.3897610306739807, mean loss: 0.3512038189924714
Epoch: 23, step: 1380, loss: 0.40297120809555054, mean loss: 0.3512053154625406
Epoch: 23, step: 1381, loss: 0.33386093378067017, mean loss: 0.3512048140928903
Epoch: 23, step: 1382, loss: 0.31627416610717773, mean loss: 0.3512038043906794
Epoch: 23, step: 1383, loss: 0.37807971239089966, mean loss: 0.3512045812408355
Epoch: 23, step: 1384, loss: 0.3217359185218811, mean loss: 0.35120372947152834
Epoch: 23, step: 1385, loss: 0.3263038992881775, mean loss: 0.3512030097816566
Epoch: 23, step: 1386, loss: 0.33249497413635254, mean loss: 0.35120246907135727
Epoch: 23, step: 1387, loss: 0.32083258032798767, mean loss: 0.35120159132890805
Epoch: 23, step: 1388, loss: 0.33427977561950684, mean loss: 0.35120110227322443
Epoch: 23, step: 1389, loss: 0.3124314844608307, mean loss: 0.3511999818288047
Epoch: 23, step: 1390, loss: 0.2989426553249359, mean loss: 0.351198471632391
Epoch: 23, step: 1391, loss: 0.31847041845321655, mean loss: 0.3511975258442399
Epoch: 23, step: 1392, loss: 0.33781003952026367, mean loss: 0.3511971389785753
Epoch: 23, step: 1393, loss: 0.33420926332473755, mean loss: 0.3511966480846363
Epoch: 23, step: 1394, loss: 0.34674715995788574, mean loss: 0.35119651951272524
Epoch: 23, step: 1395, loss: 0.3143611550331116, mean loss: 0.3511954551529102
Epoch: 23, step: 1396, loss: 0.33386677503585815, mean loss: 0.3511949544542446
Epoch: 23, step: 1397, loss: 0.3576087951660156, mean loss: 0.35119513977180344
Epoch: 23, step: 1398, loss: 0.3327207863330841, mean loss: 0.35119460600064867
Epoch: 23, step: 1399, loss: 0.3604210615158081, mean loss: 0.3511948725687613
Epoch: 23, step: 1400, loss: 0.3209626376628876, mean loss: 0.3511939991329162
Epoch: 23, step: 1401, loss: 0.3653232455253601, mean loss: 0.3511944073274731
Epoch: 23, step: 1402, loss: 0.3234690725803375, mean loss: 0.35119360636445857
Epoch: 23, step: 1403, loss: 0.3465927839279175, mean loss: 0.35119347345417323
Epoch: 23, step: 1404, loss: 0.30232587456703186, mean loss: 0.3511920617894164
Epoch: 23, step: 1405, loss: 0.3407116234302521, mean loss: 0.35119175904407124
Epoch: 23, step: 1406, loss: 0.31940996646881104, mean loss: 0.3511908409992815
Epoch: 23, step: 1407, loss: 0.3272453248500824, mean loss: 0.35119014933214837
Epoch: 23, step: 1408, loss: 0.28585585951805115, mean loss: 0.35118826220324356
Epoch: 23, step: 1409, loss: 0.2892175018787384, mean loss: 0.3511864722789086
Epoch: 23, step: 1410, loss: 0.33656489849090576, mean loss: 0.35118604997079583
Epoch: 23, step: 1411, loss: 0.3128942549228668, mean loss: 0.35118494403863754
Epoch: 23, step: 1412, loss: 0.3404574990272522, mean loss: 0.3511846342207311
Epoch: 23, step: 1413, loss: 0.3477461338043213, mean loss: 0.35118453491672785
Epoch: 23, step: 1414, loss: 0.33277469873428345, mean loss: 0.3511840032554178
Epoch: 23, step: 1415, loss: 0.33992835879325867, mean loss: 0.35118367821081625
Epoch: 23, step: 1416, loss: 0.33653849363327026, mean loss: 0.3511832552940535
Epoch: 23, step: 1417, loss: 0.3410564959049225, mean loss: 0.351182962866696
Epoch: 23, step: 1418, loss: 0.3514949381351471, mean loss: 0.351182971875251
Epoch: 23, step: 1419, loss: 0.3310184180736542, mean loss: 0.3511823896231777
Epoch: 23, step: 1420, loss: 0.31473249197006226, mean loss: 0.35118133716172034
Epoch: 23, step: 1421, loss: 0.2861490249633789, mean loss: 0.3511794594602652
Epoch: 23, step: 1422, loss: 0.3822242319583893, mean loss: 0.35118035580132184
Epoch: 23, step: 1423, loss: 0.3083748519420624, mean loss: 0.3511791199339047
Epoch: 23, step: 1424, loss: 0.3323611319065094, mean loss: 0.3511785766423948
Epoch: 23, step: 1425, loss: 0.3278317451477051, mean loss: 0.351177902618736
Epoch: 23, step: 1426, loss: 0.32997095584869385, mean loss: 0.35117729039128226
Epoch: 23, step: 1427, loss: 0.35695773363113403, mean loss: 0.35117745726320027
Epoch: 23, step: 1428, loss: 0.3030141592025757, mean loss: 0.351176066907897
Epoch: 23, step: 1429, loss: 0.3448437452316284, mean loss: 0.35117588411470735
Epoch: 23, step: 1430, loss: 0.3262406885623932, mean loss: 0.35117516433883483
Epoch: 23, step: 1431, loss: 0.3501693904399872, mean loss: 0.35117513530714395
Epoch: 23, step: 1432, loss: 0.3273178040981293, mean loss: 0.35117444668450837
Epoch: 23, step: 1433, loss: 0.3842127323150635, mean loss: 0.3511754002804684
Epoch: 23, step: 1434, loss: 0.34775179624557495, mean loss: 0.3511753014666018
Epoch: 23, step: 1435, loss: 0.3718796372413635, mean loss: 0.3511758990288211
Epoch: 23, step: 1436, loss: 0.34669363498687744, mean loss: 0.3511757696668181
Epoch: 23, step: 1437, loss: 0.2978728115558624, mean loss: 0.3511742313419087
Epoch: 23, step: 1438, loss: 0.38153064250946045, mean loss: 0.3511751074035279
Epoch: 23, step: 1439, loss: 0.31665369868278503, mean loss: 0.3511741111721785
Epoch: 23, step: 1440, loss: 0.31163832545280457, mean loss: 0.3511729702670413
Epoch: 23, step: 1441, loss: 0.3855763077735901, mean loss: 0.35117396303374954
Epoch: 23, step: 1442, loss: 0.3540618121623993, mean loss: 0.351174046365134
Epoch: 23, step: 1443, loss: 0.3473464548587799, mean loss: 0.3511739359198574
Valid: 23, mean loss: 0.18691740930080414
Epoch: 24, step: 0, loss: 0.2737720310688019, mean loss: 0.35117170254983543
Epoch: 24, step: 1, loss: 0.3286066949367523, mean loss: 0.3511710514733852
Epoch: 24, step: 2, loss: 0.30414918065071106, mean loss: 0.35116969477322585
Epoch: 24, step: 3, loss: 0.3429499864578247, mean loss: 0.35116945762064894
Epoch: 24, step: 4, loss: 0.3601868152618408, mean loss: 0.35116971777926065
Epoch: 24, step: 5, loss: 0.32428407669067383, mean loss: 0.3511689421275069
Epoch: 24, step: 6, loss: 0.29439640045166016, mean loss: 0.3511673042848021
Epoch: 24, step: 7, loss: 0.3030180037021637, mean loss: 0.3511659152558215
Epoch: 24, step: 8, loss: 0.342329740524292, mean loss: 0.3511656603539109
Epoch: 24, step: 9, loss: 0.31877127289772034, mean loss: 0.35116472588245595
Epoch: 24, step: 10, loss: 0.315248966217041, mean loss: 0.35116368986088886
Epoch: 24, step: 11, loss: 0.38736554980278015, mean loss: 0.35116473410514704
Epoch: 24, step: 12, loss: 0.33586692810058594, mean loss: 0.35116429285198125
Epoch: 24, step: 13, loss: 0.3357807993888855, mean loss: 0.35116384914002674
Epoch: 24, step: 14, loss: 0.33319592475891113, mean loss: 0.35116333089929586
Epoch: 24, step: 15, loss: 0.29123637080192566, mean loss: 0.35116160250289247
Epoch: 24, step: 16, loss: 0.30511173605918884, mean loss: 0.35116027438399755
Epoch: 24, step: 17, loss: 0.3210218548774719, mean loss: 0.3511594051903797
Epoch: 24, step: 18, loss: 0.3363640010356903, mean loss: 0.35115897850244443
Epoch: 24, step: 19, loss: 0.3332943320274353, mean loss: 0.35115846331480816
Epoch: 24, step: 20, loss: 0.33762791752815247, mean loss: 0.3511580731269088
Epoch: 24, step: 21, loss: 0.34383004903793335, mean loss: 0.35115786181068265
Epoch: 24, step: 22, loss: 0.3547763228416443, mean loss: 0.3511579661522447
Epoch: 24, step: 23, loss: 0.31721386313438416, mean loss: 0.3511569873718809
Epoch: 24, step: 24, loss: 0.31682002544403076, mean loss: 0.35115599729195446
Epoch: 24, step: 25, loss: 0.32334253191947937, mean loss: 0.351155195335165
Epoch: 24, step: 26, loss: 0.35350552201271057, mean loss: 0.3511552631011217
Epoch: 24, step: 27, loss: 0.3368687331676483, mean loss: 0.35115485119563405
Epoch: 24, step: 28, loss: 0.3516466021537781, mean loss: 0.35115486537326007
Epoch: 24, step: 29, loss: 0.3465822637081146, mean loss: 0.3511547335448087
Epoch: 24, step: 30, loss: 0.3569914698600769, mean loss: 0.35115490181350634
Epoch: 24, step: 31, loss: 0.31427404284477234, mean loss: 0.3511538385968617
Epoch: 24, step: 32, loss: 0.3312678635120392, mean loss: 0.35115326533227975
Epoch: 24, step: 33, loss: 0.35807791352272034, mean loss: 0.35115346494739047
Epoch: 24, step: 34, loss: 0.33422181010246277, mean loss: 0.3511529768768579
Epoch: 24, step: 35, loss: 0.2999702990055084, mean loss: 0.3511515015315947
Epoch: 24, step: 36, loss: 0.33696192502975464, mean loss: 0.35115109252757365
Epoch: 24, step: 37, loss: 0.3710425794124603, mean loss: 0.35115166586840735
Epoch: 24, step: 38, loss: 0.301191121339798, mean loss: 0.3511502258757707
Epoch: 24, step: 39, loss: 0.3225819766521454, mean loss: 0.3511494024883709
Epoch: 24, step: 40, loss: 0.3653770983219147, mean loss: 0.35114981254387523
Epoch: 24, step: 41, loss: 0.3258470594882965, mean loss: 0.3511490833158778
Epoch: 24, step: 42, loss: 0.32743415236473083, mean loss: 0.351148399868777
Epoch: 24, step: 43, loss: 0.2917172610759735, mean loss: 0.35114668715584346
Epoch: 24, step: 44, loss: 0.3045523166656494, mean loss: 0.35114534441729156
Epoch: 24, step: 45, loss: 0.3139355778694153, mean loss: 0.3511442721515274
Epoch: 24, step: 46, loss: 0.29612988233566284, mean loss: 0.351142686859483
Epoch: 24, step: 47, loss: 0.3069678246974945, mean loss: 0.3511414139554327
Epoch: 24, step: 48, loss: 0.4120834171772003, mean loss: 0.3511431699561018
Epoch: 24, step: 49, loss: 0.3359020948410034, mean loss: 0.3511427308079685
Epoch: 24, step: 50, loss: 0.32950446009635925, mean loss: 0.3511421073524491
Epoch: 24, step: 51, loss: 0.3369264006614685, mean loss: 0.3511416977723324
Epoch: 24, step: 52, loss: 0.3626368045806885, mean loss: 0.3511420289575238
Epoch: 24, step: 53, loss: 0.330610066652298, mean loss: 0.3511414374287913
Epoch: 24, step: 54, loss: 0.3548719882965088, mean loss: 0.35114154490339206
Epoch: 24, step: 55, loss: 0.32308095693588257, mean loss: 0.3511407365204707
Epoch: 24, step: 56, loss: 0.3697398602962494, mean loss: 0.3511412723175431
Epoch: 24, step: 57, loss: 0.3634923994541168, mean loss: 0.3511416281142573
Epoch: 24, step: 58, loss: 0.32184094190597534, mean loss: 0.3511407840789352
Epoch: 24, step: 59, loss: 0.3311801850795746, mean loss: 0.3511402091106497
Epoch: 24, step: 60, loss: 0.3254412114620209, mean loss: 0.3511394688681849
Epoch: 24, step: 61, loss: 0.3332560062408447, mean loss: 0.3511389537618243
Epoch: 24, step: 62, loss: 0.31302395462989807, mean loss: 0.3511378559479722
Epoch: 24, step: 63, loss: 0.3319512903690338, mean loss: 0.3511373033395166
Epoch: 24, step: 64, loss: 0.3361760377883911, mean loss: 0.35113687243990105
Epoch: 24, step: 65, loss: 0.31275901198387146, mean loss: 0.3511357671504461
Epoch: 24, step: 66, loss: 0.3219682574272156, mean loss: 0.3511349271449822
Epoch: 24, step: 67, loss: 0.34226301312446594, mean loss: 0.3511346716469399
Epoch: 24, step: 68, loss: 0.3752109110355377, mean loss: 0.3511353649871671
Epoch: 24, step: 69, loss: 0.3164176642894745, mean loss: 0.351134365226161
Epoch: 24, step: 70, loss: 0.3183848261833191, mean loss: 0.3511334221692012
Epoch: 24, step: 71, loss: 0.3154844343662262, mean loss: 0.3511323956491654
Epoch: 24, step: 72, loss: 0.31415852904319763, mean loss: 0.35113133100962474
Epoch: 24, step: 73, loss: 0.31119173765182495, mean loss: 0.35113018100693666
Epoch: 24, step: 74, loss: 0.3342962861061096, mean loss: 0.35112969631329405
Epoch: 24, step: 75, loss: 0.3771633207798004, mean loss: 0.3511304458706033
Epoch: 24, step: 76, loss: 0.3538110852241516, mean loss: 0.3511305230490605
Epoch: 24, step: 77, loss: 0.4418264627456665, mean loss: 0.3511331342064192
Epoch: 24, step: 78, loss: 0.3179555833339691, mean loss: 0.35113217904445365
Epoch: 24, step: 79, loss: 0.3352459669113159, mean loss: 0.3511317217030173
Epoch: 24, step: 80, loss: 0.28826969861984253, mean loss: 0.35112991204694216
Epoch: 24, step: 81, loss: 0.32418930530548096, mean loss: 0.35112913650987204
Epoch: 24, step: 82, loss: 0.28544944524765015, mean loss: 0.3511272458483313
Epoch: 24, step: 83, loss: 0.31528645753860474, mean loss: 0.35112621416185147
Epoch: 24, step: 84, loss: 0.35482490062713623, mean loss: 0.3511263206264456
Epoch: 24, step: 85, loss: 0.2997784912586212, mean loss: 0.35112484265081473
Epoch: 24, step: 86, loss: 0.3335202634334564, mean loss: 0.35112433594214776
Epoch: 24, step: 87, loss: 0.3123662769794464, mean loss: 0.35112322040971156
Epoch: 24, step: 88, loss: 0.31418749690055847, mean loss: 0.35112215735823626
Epoch: 24, step: 89, loss: 0.2909236550331116, mean loss: 0.35112042482780614
Epoch: 24, step: 90, loss: 0.3590904176235199, mean loss: 0.3511206541999187
Epoch: 24, step: 91, loss: 0.32762160897254944, mean loss: 0.35111997792947935
Epoch: 24, step: 92, loss: 0.31741610169410706, mean loss: 0.3511190080058489
Epoch: 24, step: 93, loss: 0.3484722375869751, mean loss: 0.35111893183979365
Epoch: 24, step: 94, loss: 0.3215028643608093, mean loss: 0.3511180796033838
Epoch: 24, step: 95, loss: 0.3128903806209564, mean loss: 0.35111697958902544
Epoch: 24, step: 96, loss: 0.3250446617603302, mean loss: 0.35111622937126497
Epoch: 24, step: 97, loss: 0.317109078168869, mean loss: 0.35111525086084305
Epoch: 24, step: 98, loss: 0.3436470925807953, mean loss: 0.3511150359807314
Epoch: 24, step: 99, loss: 0.3493022620677948, mean loss: 0.3511149838235812
Epoch: 24, step: 100, loss: 0.2950890064239502, mean loss: 0.3511133718899448
Epoch: 24, step: 101, loss: 0.36852461099624634, mean loss: 0.3511138728174753
Epoch: 24, step: 102, loss: 0.3410728871822357, mean loss: 0.3511135839430648
Epoch: 24, step: 103, loss: 0.3543178141117096, mean loss: 0.35111367612460015
Epoch: 24, step: 104, loss: 0.36149531602859497, mean loss: 0.35111397478228845
Epoch: 24, step: 105, loss: 0.3139232397079468, mean loss: 0.35111290491475855
Epoch: 24, step: 106, loss: 0.38105475902557373, mean loss: 0.35111376622862994
Epoch: 24, step: 107, loss: 0.3517296314239502, mean loss: 0.35111378394423215
Epoch: 24, step: 108, loss: 0.30517876148223877, mean loss: 0.3511124626434278
Epoch: 24, step: 109, loss: 0.3350019156932831, mean loss: 0.3511119992439298
Epoch: 24, step: 110, loss: 0.32457175850868225, mean loss: 0.3511112358694443
Epoch: 24, step: 111, loss: 0.3456416130065918, mean loss: 0.3511110785517136
Epoch: 24, step: 112, loss: 0.3044101893901825, mean loss: 0.35110973537563256
Epoch: 24, step: 113, loss: 0.32524555921554565, mean loss: 0.351108991510917
Epoch: 24, step: 114, loss: 0.3335460126399994, mean loss: 0.35110848640669595
Epoch: 24, step: 115, loss: 0.34986698627471924, mean loss: 0.35110845070267743
Epoch: 24, step: 116, loss: 0.31123000383377075, mean loss: 0.3511073038805203
Epoch: 24, step: 117, loss: 0.3382498025894165, mean loss: 0.35110693413584637
Epoch: 24, step: 118, loss: 0.3747231066226959, mean loss: 0.35110761324936146
Epoch: 24, step: 119, loss: 0.32598796486854553, mean loss: 0.35110689092222835
Epoch: 24, step: 120, loss: 0.37680795788764954, mean loss: 0.35110762994707134
Epoch: 24, step: 121, loss: 0.37074628472328186, mean loss: 0.3511081946332171
Epoch: 24, step: 122, loss: 0.3547585904598236, mean loss: 0.3511082995929867
Epoch: 24, step: 123, loss: 0.34016093611717224, mean loss: 0.35110798483267974
Epoch: 24, step: 124, loss: 0.3120884597301483, mean loss: 0.3511068629694469
Epoch: 24, step: 125, loss: 0.31179365515708923, mean loss: 0.35110573269494244
Epoch: 24, step: 126, loss: 0.3434011936187744, mean loss: 0.3511055111919359
Epoch: 24, step: 127, loss: 0.3307390511035919, mean loss: 0.35110492567962887
Epoch: 24, step: 128, loss: 0.3408762514591217, mean loss: 0.35110463162546124
Epoch: 24, step: 129, loss: 0.3241086006164551, mean loss: 0.3511038555652356
Epoch: 24, step: 130, loss: 0.3196924924850464, mean loss: 0.3511029526025461
Epoch: 24, step: 131, loss: 0.37231022119522095, mean loss: 0.3511035622170279
Epoch: 24, step: 132, loss: 0.3463123142719269, mean loss: 0.3511034244939561
Epoch: 24, step: 133, loss: 0.3255321979522705, mean loss: 0.35110268947738404
Epoch: 24, step: 134, loss: 0.3404000997543335, mean loss: 0.3511023818521441
Epoch: 24, step: 135, loss: 0.3408350348472595, mean loss: 0.35110208674559645
Epoch: 24, step: 136, loss: 0.3661360740661621, mean loss: 0.35110251884364263
Epoch: 24, step: 137, loss: 0.3364230692386627, mean loss: 0.35110209694763744
Epoch: 24, step: 138, loss: 0.32642507553100586, mean loss: 0.35110138773592836
Epoch: 24, step: 139, loss: 0.3195008337497711, mean loss: 0.3511004795696453
Epoch: 24, step: 140, loss: 0.31299394369125366, mean loss: 0.35109938445984046
Epoch: 24, step: 141, loss: 0.34369224309921265, mean loss: 0.3510991715987174
Epoch: 24, step: 142, loss: 0.3263797163963318, mean loss: 0.3510984612491326
Epoch: 24, step: 143, loss: 0.3308473229408264, mean loss: 0.35109787931987085
Epoch: 24, step: 144, loss: 0.3067292869091034, mean loss: 0.35109660439695456
Epoch: 24, step: 145, loss: 0.3172926902770996, mean loss: 0.35109563307593505
Epoch: 24, step: 146, loss: 0.3237060606479645, mean loss: 0.35109484608709995
Epoch: 24, step: 147, loss: 0.32594025135040283, mean loss: 0.3510941233369926
Epoch: 24, step: 148, loss: 0.353351354598999, mean loss: 0.3510941881906418
Epoch: 24, step: 149, loss: 0.31856492161750793, mean loss: 0.3510932536027382
Epoch: 24, step: 150, loss: 0.325935035943985, mean loss: 0.3510925308108383
Epoch: 24, step: 151, loss: 0.3262585401535034, mean loss: 0.35109181735443007
Epoch: 24, step: 152, loss: 0.37252646684646606, mean loss: 0.3510924331333807
Epoch: 24, step: 153, loss: 0.39543378353118896, mean loss: 0.3510937069440787
Epoch: 24, step: 154, loss: 0.37209972739219666, mean loss: 0.3510943103746164
Epoch: 24, step: 155, loss: 0.3377534747123718, mean loss: 0.3510939271494164
Epoch: 24, step: 156, loss: 0.35443100333213806, mean loss: 0.3510940230066014
Epoch: 24, step: 157, loss: 0.30662718415260315, mean loss: 0.35109274573771954
Epoch: 24, step: 158, loss: 0.3315250873565674, mean loss: 0.35109218369094713
Epoch: 24, step: 159, loss: 0.32322555780410767, mean loss: 0.3510913832938341
Epoch: 24, step: 160, loss: 0.36185070872306824, mean loss: 0.35109169231889165
Epoch: 24, step: 161, loss: 0.3235175311565399, mean loss: 0.3510909003675687
Epoch: 24, step: 162, loss: 0.39138883352279663, mean loss: 0.35109205772226454
Epoch: 24, step: 163, loss: 0.34184256196022034, mean loss: 0.3510917920848216
Epoch: 24, step: 164, loss: 0.30121222138404846, mean loss: 0.3510903596282379
Epoch: 24, step: 165, loss: 0.3700397312641144, mean loss: 0.3510909038063907
Epoch: 24, step: 166, loss: 0.31812524795532227, mean loss: 0.3510899571430977
Epoch: 24, step: 167, loss: 0.37739330530166626, mean loss: 0.3510907124655236
Epoch: 24, step: 168, loss: 0.33261892199516296, mean loss: 0.3510901820479939
Epoch: 24, step: 169, loss: 0.35960280895233154, mean loss: 0.3510904264810871
Epoch: 24, step: 170, loss: 0.3695451021194458, mean loss: 0.35109095637673243
Epoch: 24, step: 171, loss: 0.2799583077430725, mean loss: 0.351088913978414
Epoch: 24, step: 172, loss: 0.3498844504356384, mean loss: 0.3510888793962112
Epoch: 24, step: 173, loss: 0.34202566742897034, mean loss: 0.35108861918340706
Epoch: 24, step: 174, loss: 0.33204570412635803, mean loss: 0.3510880724602278
Epoch: 24, step: 175, loss: 0.303532212972641, mean loss: 0.3510867071679825
Epoch: 24, step: 176, loss: 0.33417990803718567, mean loss: 0.3510862218006834
Epoch: 24, step: 177, loss: 0.3323136866092682, mean loss: 0.3510856828865423
Epoch: 24, step: 178, loss: 0.3362356424331665, mean loss: 0.35108525658998846
Epoch: 24, step: 179, loss: 0.33605632185935974, mean loss: 0.3510848251703441
Epoch: 24, step: 180, loss: 0.34965673089027405, mean loss: 0.35108478417673733
Epoch: 24, step: 181, loss: 0.36253347992897034, mean loss: 0.35108511280340227
Epoch: 24, step: 182, loss: 0.3523092567920685, mean loss: 0.35108514794057577
Epoch: 24, step: 183, loss: 0.32042065262794495, mean loss: 0.3510842677885863
Epoch: 24, step: 184, loss: 0.311496376991272, mean loss: 0.3510831315441962
Epoch: 24, step: 185, loss: 0.3265720009803772, mean loss: 0.3510824280504081
Epoch: 24, step: 186, loss: 0.31523144245147705, mean loss: 0.35108139912105074
Epoch: 24, step: 187, loss: 0.3569965958595276, mean loss: 0.35108156888332653
Epoch: 24, step: 188, loss: 0.3686111867427826, mean loss: 0.3510820719574508
Epoch: 24, step: 189, loss: 0.3246520459651947, mean loss: 0.351081313476535
Epoch: 24, step: 190, loss: 0.3195805549621582, mean loss: 0.3510804095032083
Epoch: 24, step: 191, loss: 0.3709501028060913, mean loss: 0.35108097968494906
Epoch: 24, step: 192, loss: 0.28527697920799255, mean loss: 0.3510790914241531
Epoch: 24, step: 193, loss: 0.34314101934432983, mean loss: 0.3510788636459012
Epoch: 24, step: 194, loss: 0.30601048469543457, mean loss: 0.35107757047270816
Epoch: 24, step: 195, loss: 0.3515344560146332, mean loss: 0.3510775835820144
Epoch: 24, step: 196, loss: 0.37076953053474426, mean loss: 0.3510781485820704
Epoch: 24, step: 197, loss: 0.32196933031082153, mean loss: 0.35107731341771997
Epoch: 24, step: 198, loss: 0.31305360794067383, mean loss: 0.35107622250664616
Epoch: 24, step: 199, loss: 0.3155958652496338, mean loss: 0.35107520459417035
Epoch: 24, step: 200, loss: 0.34067246317863464, mean loss: 0.35107490615364434
Epoch: 24, step: 201, loss: 0.352971613407135, mean loss: 0.351074960566039
Epoch: 24, step: 202, loss: 0.3184780776500702, mean loss: 0.35107402545938315
Epoch: 24, step: 203, loss: 0.33842137455940247, mean loss: 0.3510736625032472
Epoch: 24, step: 204, loss: 0.3556725084781647, mean loss: 0.3510737944227554
Epoch: 24, step: 205, loss: 0.3319033682346344, mean loss: 0.35107324452813693
Epoch: 24, step: 206, loss: 0.3210945725440979, mean loss: 0.35107238462875984
Epoch: 24, step: 207, loss: 0.3184884488582611, mean loss: 0.35107145002757323
Epoch: 24, step: 208, loss: 0.30997806787490845, mean loss: 0.35107027138474656
Epoch: 24, step: 209, loss: 0.32138434052467346, mean loss: 0.35106941995553587
Epoch: 24, step: 210, loss: 0.3338119685649872, mean loss: 0.3510689250046829
Epoch: 24, step: 211, loss: 0.29825854301452637, mean loss: 0.351067410424495
Epoch: 24, step: 212, loss: 0.33247971534729004, mean loss: 0.35106687735227965
Epoch: 24, step: 213, loss: 0.3243951201438904, mean loss: 0.35106611246104913
Epoch: 24, step: 214, loss: 0.35112515091896057, mean loss: 0.3510661141541023
Epoch: 24, step: 215, loss: 0.35824158787727356, mean loss: 0.35106631992015314
Epoch: 24, step: 216, loss: 0.3497314751148224, mean loss: 0.35106628164283815
Epoch: 24, step: 217, loss: 0.326764851808548, mean loss: 0.3510655848076648
Epoch: 24, step: 218, loss: 0.32287201285362244, mean loss: 0.351064776389831
Epoch: 24, step: 219, loss: 0.3165235221385956, mean loss: 0.3510637859880002
Epoch: 24, step: 220, loss: 0.3223150968551636, mean loss: 0.35106296170009893
Epoch: 24, step: 221, loss: 0.3527904152870178, mean loss: 0.35106301122855776
Epoch: 24, step: 222, loss: 0.30700770020484924, mean loss: 0.3510617481387036
Epoch: 24, step: 223, loss: 0.36015549302101135, mean loss: 0.3510620088538665
Epoch: 24, step: 224, loss: 0.3520795404911041, mean loss: 0.35106203802538216
Epoch: 24, step: 225, loss: 0.35111507773399353, mean loss: 0.3510620395459288
Epoch: 24, step: 226, loss: 0.29796573519706726, mean loss: 0.35106051742041355
Epoch: 24, step: 227, loss: 0.30626916885375977, mean loss: 0.3510592334120267
Epoch: 24, step: 228, loss: 0.3265445828437805, mean loss: 0.3510585306844771
Epoch: 24, step: 229, loss: 0.304802805185318, mean loss: 0.351057204773639
Epoch: 24, step: 230, loss: 0.3889119625091553, mean loss: 0.3510582898413644
Epoch: 24, step: 231, loss: 0.33461451530456543, mean loss: 0.3510578185109775
Epoch: 24, step: 232, loss: 0.3576349914073944, mean loss: 0.3510580070280716
Epoch: 24, step: 233, loss: 0.3288736045360565, mean loss: 0.3510573711896511
Epoch: 24, step: 234, loss: 0.32711586356163025, mean loss: 0.3510566850096153
Epoch: 24, step: 235, loss: 0.34572848677635193, mean loss: 0.3510565323041747
Epoch: 24, step: 236, loss: 0.30500108003616333, mean loss: 0.35105521239897114
Epoch: 24, step: 237, loss: 0.34429967403411865, mean loss: 0.35105501879725265
Epoch: 24, step: 238, loss: 0.34627193212509155, mean loss: 0.35105488172642096
Epoch: 24, step: 239, loss: 0.324905127286911, mean loss: 0.35105413236390265
Epoch: 24, step: 240, loss: 0.3586284816265106, mean loss: 0.351054349412625
Epoch: 24, step: 241, loss: 0.3396386206150055, mean loss: 0.35105402229563265
Epoch: 24, step: 242, loss: 0.33608478307724, mean loss: 0.3510535933653132
Epoch: 24, step: 243, loss: 0.37494441866874695, mean loss: 0.3510542779161815
Epoch: 24, step: 244, loss: 0.31865355372428894, mean loss: 0.3510533495552694
Epoch: 24, step: 245, loss: 0.330127090215683, mean loss: 0.351052749983344
Epoch: 24, step: 246, loss: 0.351397305727005, mean loss: 0.35105275985515283
Epoch: 24, step: 247, loss: 0.34473487734794617, mean loss: 0.3510525788477466
Epoch: 24, step: 248, loss: 0.35594627261161804, mean loss: 0.35105271904811225
Epoch: 24, step: 249, loss: 0.313931941986084, mean loss: 0.3510516555983597
Epoch: 24, step: 250, loss: 0.3011897802352905, mean loss: 0.35105022717783196
Epoch: 24, step: 251, loss: 0.3163347542285919, mean loss: 0.3510492326931021
Epoch: 24, step: 252, loss: 0.32221466302871704, mean loss: 0.3510484067006743
Epoch: 24, step: 253, loss: 0.32202452421188354, mean loss: 0.35104757530902464
Epoch: 24, step: 254, loss: 0.3023260831832886, mean loss: 0.3510461797176029
Epoch: 24, step: 255, loss: 0.3212609589099884, mean loss: 0.3510453265662278
Epoch: 24, step: 256, loss: 0.32781240344047546, mean loss: 0.3510446611143008
Epoch: 24, step: 257, loss: 0.36120960116386414, mean loss: 0.3510449522565375
Epoch: 24, step: 258, loss: 0.3049205243587494, mean loss: 0.3510436312074784
Epoch: 24, step: 259, loss: 0.3217906057834625, mean loss: 0.35104279339600447
Epoch: 24, step: 260, loss: 0.31527042388916016, mean loss: 0.3510417688987823
Epoch: 24, step: 261, loss: 0.32748252153396606, mean loss: 0.35104109419669843
Epoch: 24, step: 262, loss: 0.31912803649902344, mean loss: 0.3510401802799855
Epoch: 24, step: 263, loss: 0.34342509508132935, mean loss: 0.3510399622076717
Epoch: 24, step: 264, loss: 0.3673638701438904, mean loss: 0.3510404296601483
Epoch: 24, step: 265, loss: 0.31659194827079773, mean loss: 0.3510394432194694
Epoch: 24, step: 266, loss: 0.33410802483558655, mean loss: 0.3510389583980513
Epoch: 24, step: 267, loss: 0.3411408066749573, mean loss: 0.3510386749782906
Epoch: 24, step: 268, loss: 0.3240269720554352, mean loss: 0.3510379015580208
Epoch: 24, step: 269, loss: 0.36264878511428833, mean loss: 0.3510382340004292
Epoch: 24, step: 270, loss: 0.3013267517089844, mean loss: 0.35103681070377357
Epoch: 24, step: 271, loss: 0.32377973198890686, mean loss: 0.35103603032474484
Epoch: 24, step: 272, loss: 0.30642735958099365, mean loss: 0.3510347532005574
Epoch: 24, step: 273, loss: 0.3320894241333008, mean loss: 0.3510342108206814
Epoch: 24, step: 274, loss: 0.307039737701416, mean loss: 0.3510329513527842
Epoch: 24, step: 275, loss: 0.3222063183784485, mean loss: 0.35103212613141194
Epoch: 24, step: 276, loss: 0.3296717405319214, mean loss: 0.3510315146641575
Epoch: 24, step: 277, loss: 0.3375262916088104, mean loss: 0.3510311280716386
Epoch: 24, step: 278, loss: 0.3559744656085968, mean loss: 0.3510312695726415
Epoch: 24, step: 279, loss: 0.3041212856769562, mean loss: 0.35102992683209033
Epoch: 24, step: 280, loss: 0.3334604501724243, mean loss: 0.35102942394184045
Epoch: 24, step: 281, loss: 0.33598828315734863, mean loss: 0.35102899343234406
Epoch: 24, step: 282, loss: 0.34128251671791077, mean loss: 0.3510287144753987
Epoch: 24, step: 283, loss: 0.3569265604019165, mean loss: 0.3510288832746524
Epoch: 24, step: 284, loss: 0.30938926339149475, mean loss: 0.3510276915623407
Epoch: 24, step: 285, loss: 0.34350553154945374, mean loss: 0.35102747628674075
Epoch: 24, step: 286, loss: 0.3040594160556793, mean loss: 0.35102613215314515
Epoch: 24, step: 287, loss: 0.31211021542549133, mean loss: 0.35102501848794576
Epoch: 24, step: 288, loss: 0.33405211567878723, mean loss: 0.3510245327846174
Epoch: 24, step: 289, loss: 0.34974807500839233, mean loss: 0.35102449625803994
Epoch: 24, step: 290, loss: 0.3569013178348541, mean loss: 0.35102466442187596
Epoch: 24, step: 291, loss: 0.30854690074920654, mean loss: 0.3510234489656647
Epoch: 24, step: 292, loss: 0.33660978078842163, mean loss: 0.35102303654561895
Epoch: 24, step: 293, loss: 0.35326918959617615, mean loss: 0.3510231008132313
Epoch: 24, step: 294, loss: 0.34916603565216064, mean loss: 0.35102304767983994
Epoch: 24, step: 295, loss: 0.3267921209335327, mean loss: 0.35102235441688656
Epoch: 24, step: 296, loss: 0.3256896436214447, mean loss: 0.3510216296518937
Epoch: 24, step: 297, loss: 0.3789001703262329, mean loss: 0.3510224272298726
Epoch: 24, step: 298, loss: 0.31947779655456543, mean loss: 0.3510215247944363
Epoch: 24, step: 299, loss: 0.33256959915161133, mean loss: 0.3510209969329635
Epoch: 24, step: 300, loss: 0.3051130473613739, mean loss: 0.35101968366381653
Epoch: 24, step: 301, loss: 0.33209529519081116, mean loss: 0.3510191423173873
Epoch: 24, step: 302, loss: 0.33627501130104065, mean loss: 0.3510187205624453
Epoch: 24, step: 303, loss: 0.3642723560333252, mean loss: 0.3510190996710114
Epoch: 24, step: 304, loss: 0.3204204738140106, mean loss: 0.3510182244493113
Epoch: 24, step: 305, loss: 0.3098013401031494, mean loss: 0.35101704554409
Epoch: 24, step: 306, loss: 0.30536895990371704, mean loss: 0.3510157399328541
Epoch: 24, step: 307, loss: 0.29753556847572327, mean loss: 0.35101421035467495
Epoch: 24, step: 308, loss: 0.35466381907463074, mean loss: 0.35101431473358874
Epoch: 24, step: 309, loss: 0.37649840116500854, mean loss: 0.3510150435583451
Epoch: 24, step: 310, loss: 0.3618331253528595, mean loss: 0.3510153529380973
Epoch: 24, step: 311, loss: 0.36353880167007446, mean loss: 0.35101571107836077
Epoch: 24, step: 312, loss: 0.30703648924827576, mean loss: 0.3510144534152354
Epoch: 24, step: 313, loss: 0.32709768414497375, mean loss: 0.35101376949275126
Epoch: 24, step: 314, loss: 0.31553035974502563, mean loss: 0.3510127548403322
Epoch: 24, step: 315, loss: 0.3595981001853943, mean loss: 0.35101300033230703
Epoch: 24, step: 316, loss: 0.30631276965141296, mean loss: 0.3510117221968688
Epoch: 24, step: 317, loss: 0.4107755720615387, mean loss: 0.3510134310048366
Epoch: 24, step: 318, loss: 0.3469369113445282, mean loss: 0.35101331444959255
Epoch: 24, step: 319, loss: 0.29889485239982605, mean loss: 0.3510118243288798
Epoch: 24, step: 320, loss: 0.3308364450931549, mean loss: 0.3510112475104209
Epoch: 24, step: 321, loss: 0.35429051518440247, mean loss: 0.35101134126271305
Epoch: 24, step: 322, loss: 0.3343588709831238, mean loss: 0.3510108651922056
Epoch: 24, step: 323, loss: 0.3542925715446472, mean loss: 0.35101095900885376
Epoch: 24, step: 324, loss: 0.4296640455722809, mean loss: 0.3510132074604865
Epoch: 24, step: 325, loss: 0.3427976667881012, mean loss: 0.3510129726099727
Epoch: 24, step: 326, loss: 0.33173877000808716, mean loss: 0.3510124216508611
Epoch: 24, step: 327, loss: 0.369832843542099, mean loss: 0.35101295962313106
Epoch: 24, step: 328, loss: 0.32759889960289, mean loss: 0.35101229036316195
Epoch: 24, step: 329, loss: 0.318552702665329, mean loss: 0.35101136257525545
Epoch: 24, step: 330, loss: 0.32858121395111084, mean loss: 0.3510107214757435
Epoch: 24, step: 331, loss: 0.32255157828330994, mean loss: 0.35100990807848753
Epoch: 24, step: 332, loss: 0.37665027379989624, mean loss: 0.3510106408906777
Epoch: 24, step: 333, loss: 0.33761629462242126, mean loss: 0.3510102580856972
Epoch: 24, step: 334, loss: 0.3706153333187103, mean loss: 0.3510108183747782
Epoch: 24, step: 335, loss: 0.3973519802093506, mean loss: 0.3510121427106788
Epoch: 24, step: 336, loss: 0.32554563879966736, mean loss: 0.35101141495072935
Epoch: 24, step: 337, loss: 0.30102941393852234, mean loss: 0.3510099866487058
Epoch: 24, step: 338, loss: 0.3507854640483856, mean loss: 0.35100998023285784
Epoch: 24, step: 339, loss: 0.4192337393760681, mean loss: 0.351011929705916
Epoch: 24, step: 340, loss: 0.31954172253608704, mean loss: 0.3510110304800632
Epoch: 24, step: 341, loss: 0.3025113046169281, mean loss: 0.35100964469442225
Epoch: 24, step: 342, loss: 0.3433924913406372, mean loss: 0.351009427055251
Epoch: 24, step: 343, loss: 0.32613134384155273, mean loss: 0.3510087162528735
Epoch: 24, step: 344, loss: 0.34209999442100525, mean loss: 0.35100846172523625
Epoch: 24, step: 345, loss: 0.342946857213974, mean loss: 0.35100823140683984
Epoch: 24, step: 346, loss: 0.2902248501777649, mean loss: 0.35100649488764923
Epoch: 24, step: 347, loss: 0.3339306712150574, mean loss: 0.3510060070627243
Epoch: 24, step: 348, loss: 0.3078482151031494, mean loss: 0.3510047741590831
Epoch: 24, step: 349, loss: 0.35592782497406006, mean loss: 0.35100491479356905
Epoch: 24, step: 350, loss: 0.33664989471435547, mean loss: 0.3510045047321505
Epoch: 24, step: 351, loss: 0.307018518447876, mean loss: 0.351003248276875
Epoch: 24, step: 352, loss: 0.3433930277824402, mean loss: 0.3510030308979012
Epoch: 24, step: 353, loss: 0.353472501039505, mean loss: 0.3510031014340378
Epoch: 24, step: 354, loss: 0.3672909736633301, mean loss: 0.3510035666556033
Epoch: 24, step: 355, loss: 0.3012472689151764, mean loss: 0.351002145534338
Epoch: 24, step: 356, loss: 0.3863614797592163, mean loss: 0.3510031554259276
Epoch: 24, step: 357, loss: 0.3222573697566986, mean loss: 0.3510023344461575
Epoch: 24, step: 358, loss: 0.3104127049446106, mean loss: 0.35100117523926044
Epoch: 24, step: 359, loss: 0.3690057694911957, mean loss: 0.3510016894211845
Epoch: 24, step: 360, loss: 0.30252209305763245, mean loss: 0.35100030496231127
Epoch: 24, step: 361, loss: 0.35242709517478943, mean loss: 0.3510003457067916
Epoch: 24, step: 362, loss: 0.33698785305023193, mean loss: 0.35099994556707725
Epoch: 24, step: 363, loss: 0.3173026144504547, mean loss: 0.3509989833360345
Epoch: 24, step: 364, loss: 0.3634461462497711, mean loss: 0.35099933875600864
Epoch: 24, step: 365, loss: 0.30445656180381775, mean loss: 0.35099800979772666
Epoch: 24, step: 366, loss: 0.30328771471977234, mean loss: 0.35099664754163556
Epoch: 24, step: 367, loss: 0.3457910716533661, mean loss: 0.3509964989128128
Epoch: 24, step: 368, loss: 0.3363686501979828, mean loss: 0.3509960812725926
Epoch: 24, step: 369, loss: 0.3539007604122162, mean loss: 0.35099616420182056
Epoch: 24, step: 370, loss: 0.3101694881916046, mean loss: 0.35099499862452277
Epoch: 24, step: 371, loss: 0.3830862045288086, mean loss: 0.3509959147831931
Epoch: 24, step: 372, loss: 0.3277552127838135, mean loss: 0.3509952513128685
Epoch: 24, step: 373, loss: 0.31632062792778015, mean loss: 0.35099426145779045
Epoch: 24, step: 374, loss: 0.31283801794052124, mean loss: 0.35099317224413634
Epoch: 24, step: 375, loss: 0.35459089279174805, mean loss: 0.3509932749422566
Epoch: 24, step: 376, loss: 0.3421895503997803, mean loss: 0.3509930236442078
Epoch: 24, step: 377, loss: 0.33991149067878723, mean loss: 0.3509927073362508
Epoch: 24, step: 378, loss: 0.33318793773651123, mean loss: 0.35099219913674745
Epoch: 24, step: 379, loss: 0.40501052141189575, mean loss: 0.3509937409315378
Epoch: 24, step: 380, loss: 0.30567413568496704, mean loss: 0.3509924474530651
Epoch: 24, step: 381, loss: 0.32066109776496887, mean loss: 0.35099158178294443
Epoch: 24, step: 382, loss: 0.32869645953178406, mean loss: 0.3509909454884654
Epoch: 24, step: 383, loss: 0.3012058734893799, mean loss: 0.3509895246816161
Epoch: 24, step: 384, loss: 0.37340816855430603, mean loss: 0.35099016446483783
Epoch: 24, step: 385, loss: 0.3285018801689148, mean loss: 0.35098952271253214
Epoch: 24, step: 386, loss: 0.36980894207954407, mean loss: 0.3509900597504389
Epoch: 24, step: 387, loss: 0.3578978180885315, mean loss: 0.35099025686715896
Epoch: 24, step: 388, loss: 0.3297182619571686, mean loss: 0.35098964987629266
Epoch: 24, step: 389, loss: 0.35959067940711975, mean loss: 0.35098989529744
Epoch: 24, step: 390, loss: 0.2998563349246979, mean loss: 0.3509884362978003
Epoch: 24, step: 391, loss: 0.33560794591903687, mean loss: 0.3509879974570568
Epoch: 24, step: 392, loss: 0.3585363030433655, mean loss: 0.35098821282142056
Epoch: 24, step: 393, loss: 0.33891162276268005, mean loss: 0.3509878682682092
Epoch: 24, step: 394, loss: 0.357554167509079, mean loss: 0.35098805560378427
Epoch: 24, step: 395, loss: 0.3233470618724823, mean loss: 0.35098726703269756
Epoch: 24, step: 396, loss: 0.33543726801872253, mean loss: 0.3509868234187697
Epoch: 24, step: 397, loss: 0.36507517099380493, mean loss: 0.35098722532290544
Epoch: 24, step: 398, loss: 0.30761364102363586, mean loss: 0.3509859880219698
Epoch: 24, step: 399, loss: 0.35072410106658936, mean loss: 0.3509859805514382
Epoch: 24, step: 400, loss: 0.3335985541343689, mean loss: 0.35098548457555845
Epoch: 24, step: 401, loss: 0.3360712230205536, mean loss: 0.3509850591587761
Epoch: 24, step: 402, loss: 0.32722562551498413, mean loss: 0.350984381460221
Epoch: 24, step: 403, loss: 0.3218814432621002, mean loss: 0.35098355137071163
Epoch: 24, step: 404, loss: 0.3572770655155182, mean loss: 0.3509837308725554
Epoch: 24, step: 405, loss: 0.3574018180370331, mean loss: 0.350983913922215
Epoch: 24, step: 406, loss: 0.3745688199996948, mean loss: 0.3509845865659157
Epoch: 24, step: 407, loss: 0.3289048671722412, mean loss: 0.35098395686823736
Epoch: 24, step: 408, loss: 0.3057973384857178, mean loss: 0.3509826682152106
Epoch: 24, step: 409, loss: 0.31639546155929565, mean loss: 0.3509816818692728
Epoch: 24, step: 410, loss: 0.31730395555496216, mean loss: 0.3509807214869671
Epoch: 24, step: 411, loss: 0.3111187517642975, mean loss: 0.3509795847820018
Epoch: 24, step: 412, loss: 0.3796803057193756, mean loss: 0.35098040318916873
Epoch: 24, step: 413, loss: 0.3215949237346649, mean loss: 0.3509795652798601
Epoch: 24, step: 414, loss: 0.33179739117622375, mean loss: 0.35097901832727524
Epoch: 24, step: 415, loss: 0.3165234625339508, mean loss: 0.35097803590380944
Epoch: 24, step: 416, loss: 0.3410404622554779, mean loss: 0.35097775256409947
Epoch: 24, step: 417, loss: 0.3347891569137573, mean loss: 0.35097729100865527
Epoch: 24, step: 418, loss: 0.348321795463562, mean loss: 0.3509772152995877
Epoch: 24, step: 419, loss: 0.35207992792129517, mean loss: 0.35097724673739766
Epoch: 24, step: 420, loss: 0.3262083828449249, mean loss: 0.35097654060905453
Epoch: 24, step: 421, loss: 0.3053503930568695, mean loss: 0.3509752399035539
Epoch: 24, step: 422, loss: 0.3405493199825287, mean loss: 0.35097494269097884
Epoch: 24, step: 423, loss: 0.33036378026008606, mean loss: 0.35097435514358916
Epoch: 24, step: 424, loss: 0.29823657870292664, mean loss: 0.3509728518290759
Epoch: 24, step: 425, loss: 0.3130217492580414, mean loss: 0.350971770046322
Epoch: 24, step: 426, loss: 0.31066927313804626, mean loss: 0.3509706212706498
Epoch: 24, step: 427, loss: 0.30007708072662354, mean loss: 0.3509691706509786
Epoch: 24, step: 428, loss: 0.3551638126373291, mean loss: 0.35096929020754086
Epoch: 24, step: 429, loss: 0.3755601644515991, mean loss: 0.35096999108179966
Epoch: 24, step: 430, loss: 0.31656986474990845, mean loss: 0.3509690106581005
Epoch: 24, step: 431, loss: 0.3385449945926666, mean loss: 0.3509686565764753
Epoch: 24, step: 432, loss: 0.3246690630912781, mean loss: 0.35096790706541814
Epoch: 24, step: 433, loss: 0.32602354884147644, mean loss: 0.3509671961974152
Epoch: 24, step: 434, loss: 0.3451344072818756, mean loss: 0.35096702997847257
Epoch: 24, step: 435, loss: 0.35760578513145447, mean loss: 0.3509672191599143
Epoch: 24, step: 436, loss: 0.3226380944252014, mean loss: 0.35096641190135175
Epoch: 24, step: 437, loss: 0.32783445715904236, mean loss: 0.3509657527586281
Epoch: 24, step: 438, loss: 0.3298507034778595, mean loss: 0.35096515110456683
Epoch: 24, step: 439, loss: 0.29149335622787476, mean loss: 0.3509634565583258
Epoch: 24, step: 440, loss: 0.3563551604747772, mean loss: 0.35096361018125416
Epoch: 24, step: 441, loss: 0.3142772316932678, mean loss: 0.35096256492572714
Epoch: 24, step: 442, loss: 0.3081414997577667, mean loss: 0.35096134491760245
Epoch: 24, step: 443, loss: 0.36275267601013184, mean loss: 0.3509616808529612
Epoch: 24, step: 444, loss: 0.3386487364768982, mean loss: 0.350961330066819
Epoch: 24, step: 445, loss: 0.31940004229545593, mean loss: 0.3509604309360637
Epoch: 24, step: 446, loss: 0.392534464597702, mean loss: 0.35096161528024117
Epoch: 24, step: 447, loss: 0.3206232190132141, mean loss: 0.35096075103695645
Epoch: 24, step: 448, loss: 0.30071771144866943, mean loss: 0.3509593198152049
Epoch: 24, step: 449, loss: 0.3384190499782562, mean loss: 0.3509589626036218
Epoch: 24, step: 450, loss: 0.3315791189670563, mean loss: 0.35095841058141436
Epoch: 24, step: 451, loss: 0.3664717972278595, mean loss: 0.3509588524575294
Epoch: 24, step: 452, loss: 0.335703045129776, mean loss: 0.35095841793056115
Epoch: 24, step: 453, loss: 0.33291324973106384, mean loss: 0.35095790396963267
Epoch: 24, step: 454, loss: 0.29216527938842773, mean loss: 0.35095622949084876
Epoch: 24, step: 455, loss: 0.33260011672973633, mean loss: 0.350955706703404
Epoch: 24, step: 456, loss: 0.3091849684715271, mean loss: 0.3509545170944776
Epoch: 24, step: 457, loss: 0.3528314530849457, mean loss: 0.3509545705471173
Epoch: 24, step: 458, loss: 0.3443812429904938, mean loss: 0.3509543833528255
Epoch: 24, step: 459, loss: 0.28838983178138733, mean loss: 0.3509526016991186
Epoch: 24, step: 460, loss: 0.33035439252853394, mean loss: 0.35095201513964114
Epoch: 24, step: 461, loss: 0.32074838876724243, mean loss: 0.35095115507852226
Epoch: 24, step: 462, loss: 0.3324935734272003, mean loss: 0.3509506295059931
Epoch: 24, step: 463, loss: 0.3951820433139801, mean loss: 0.35095188894260493
Epoch: 24, step: 464, loss: 0.3706338107585907, mean loss: 0.3509524493458342
Epoch: 24, step: 465, loss: 0.3609634041786194, mean loss: 0.350952734379569
Epoch: 24, step: 466, loss: 0.3592211902141571, mean loss: 0.3509529697938512
Epoch: 24, step: 467, loss: 0.3409670889377594, mean loss: 0.35095268549021674
Epoch: 24, step: 468, loss: 0.31288942694664, mean loss: 0.350951601838728
Epoch: 24, step: 469, loss: 0.34919506311416626, mean loss: 0.3509515518319317
Epoch: 24, step: 470, loss: 0.36826762557029724, mean loss: 0.35095204478816877
Epoch: 24, step: 471, loss: 0.3308298587799072, mean loss: 0.35095147196347026
Epoch: 24, step: 472, loss: 0.3325422704219818, mean loss: 0.3509509479177661
Epoch: 24, step: 473, loss: 0.2967139482498169, mean loss: 0.350949404023668
Epoch: 24, step: 474, loss: 0.327309787273407, mean loss: 0.35094873112461156
Epoch: 24, step: 475, loss: 0.3573216199874878, mean loss: 0.35094891252301935
Epoch: 24, step: 476, loss: 0.324913889169693, mean loss: 0.3509481714811683
Epoch: 24, step: 477, loss: 0.30445119738578796, mean loss: 0.35094684806299514
Epoch: 24, step: 478, loss: 0.34636545181274414, mean loss: 0.35094671766890806
Epoch: 24, step: 479, loss: 0.3355877697467804, mean loss: 0.35094628054038113
Epoch: 24, step: 480, loss: 0.3538433313369751, mean loss: 0.3509463629905276
Epoch: 24, step: 481, loss: 0.3190019428730011, mean loss: 0.3509454538773135
Epoch: 24, step: 482, loss: 0.31673911213874817, mean loss: 0.3509444804192829
Epoch: 24, step: 483, loss: 0.3179691731929779, mean loss: 0.35094354202124
Epoch: 24, step: 484, loss: 0.3261759579181671, mean loss: 0.3509428372153408
Epoch: 24, step: 485, loss: 0.3096962571144104, mean loss: 0.3509416635035401
Epoch: 24, step: 486, loss: 0.4057202637195587, mean loss: 0.35094322223786034
Epoch: 24, step: 487, loss: 0.3082685172557831, mean loss: 0.3509420079564757
Epoch: 24, step: 488, loss: 0.322733610868454, mean loss: 0.35094120532745054
Epoch: 24, step: 489, loss: 0.3094678223133087, mean loss: 0.35094002529606677
Epoch: 24, step: 490, loss: 0.33887094259262085, mean loss: 0.3509396819073649
Epoch: 24, step: 491, loss: 0.3410463035106659, mean loss: 0.3509394004296593
Epoch: 24, step: 492, loss: 0.31169262528419495, mean loss: 0.35093828384667985
Epoch: 24, step: 493, loss: 0.37321269512176514, mean loss: 0.35093891754259093
Epoch: 24, step: 494, loss: 0.34757211804389954, mean loss: 0.35093882176154634
Epoch: 24, step: 495, loss: 0.33789896965026855, mean loss: 0.3509384508053529
Epoch: 24, step: 496, loss: 0.33340510725975037, mean loss: 0.35093795203302774
Epoch: 24, step: 497, loss: 0.3458191752433777, mean loss: 0.3509378064229467
Epoch: 24, step: 498, loss: 0.31828761100769043, mean loss: 0.3509368776732549
Epoch: 24, step: 499, loss: 0.35790157318115234, mean loss: 0.3509370757815581
Epoch: 24, step: 500, loss: 0.3392845392227173, mean loss: 0.3509367443387001
Epoch: 24, step: 501, loss: 0.3543754518032074, mean loss: 0.3509368421459549
Epoch: 24, step: 502, loss: 0.3040692210197449, mean loss: 0.35093550912678123
Epoch: 24, step: 503, loss: 0.3200249671936035, mean loss: 0.35093462998736336
Epoch: 24, step: 504, loss: 0.30896416306495667, mean loss: 0.3509334363220261
Epoch: 24, step: 505, loss: 0.36196014285087585, mean loss: 0.3509337499192768
Epoch: 24, step: 506, loss: 0.34888094663619995, mean loss: 0.3509336915396367
Epoch: 24, step: 507, loss: 0.33838072419166565, mean loss: 0.3509333345561494
Epoch: 24, step: 508, loss: 0.31839871406555176, mean loss: 0.35093240935721604
Epoch: 24, step: 509, loss: 0.37481388449668884, mean loss: 0.3509330884641699
Epoch: 24, step: 510, loss: 0.297880083322525, mean loss: 0.35093157986220946
Epoch: 24, step: 511, loss: 0.34885820746421814, mean loss: 0.35093152090598795
Epoch: 24, step: 512, loss: 0.3294038474559784, mean loss: 0.3509309087852723
Epoch: 24, step: 513, loss: 0.34295856952667236, mean loss: 0.35093068210516826
Epoch: 24, step: 514, loss: 0.3326023817062378, mean loss: 0.35093016098548446
Epoch: 24, step: 515, loss: 0.305388867855072, mean loss: 0.35092886616878
Epoch: 24, step: 516, loss: 0.3595256209373474, mean loss: 0.35092911058224396
Epoch: 24, step: 517, loss: 0.34261471033096313, mean loss: 0.35092887420309316
Epoch: 24, step: 518, loss: 0.3474266231060028, mean loss: 0.35092877463660854
Epoch: 24, step: 519, loss: 0.3107709288597107, mean loss: 0.3509276330103356
Epoch: 24, step: 520, loss: 0.3064590096473694, mean loss: 0.35092636887117185
Epoch: 24, step: 521, loss: 0.35614001750946045, mean loss: 0.3509265170788198
Epoch: 24, step: 522, loss: 0.3101184666156769, mean loss: 0.35092535706715194
Epoch: 24, step: 523, loss: 0.2979760766029358, mean loss: 0.3509238519710614
Epoch: 24, step: 524, loss: 0.34517091512680054, mean loss: 0.3509236884470898
Epoch: 24, step: 525, loss: 0.33085837960243225, mean loss: 0.3509231181182613
Epoch: 24, step: 526, loss: 0.30717945098876953, mean loss: 0.35092187479997894
Epoch: 24, step: 527, loss: 0.3758459687232971, mean loss: 0.35092258319282577
Epoch: 24, step: 528, loss: 0.3299688994884491, mean loss: 0.350921987663944
Epoch: 24, step: 529, loss: 0.33256515860557556, mean loss: 0.35092146595562085
Epoch: 24, step: 530, loss: 0.3328045606613159, mean loss: 0.3509209510806587
Epoch: 24, step: 531, loss: 0.3219030797481537, mean loss: 0.3509201264281825
Epoch: 24, step: 532, loss: 0.2862303853034973, mean loss: 0.35091828807696124
Epoch: 24, step: 533, loss: 0.36956536769866943, mean loss: 0.35091881797408037
Epoch: 24, step: 534, loss: 0.32789960503578186, mean loss: 0.3509181638519202
Epoch: 24, step: 535, loss: 0.3732423782348633, mean loss: 0.3509187982067276
Epoch: 24, step: 536, loss: 0.3579173982143402, mean loss: 0.3509189970701382
Epoch: 24, step: 537, loss: 0.3530668020248413, mean loss: 0.35091905809772683
Epoch: 24, step: 538, loss: 0.2991092801094055, mean loss: 0.350917586019932
Epoch: 24, step: 539, loss: 0.3813086152076721, mean loss: 0.3509184494995657
Epoch: 24, step: 540, loss: 0.3175284266471863, mean loss: 0.35091750083851925
Epoch: 24, step: 541, loss: 0.34799087047576904, mean loss: 0.3509174176908869
Epoch: 24, step: 542, loss: 0.3512763977050781, mean loss: 0.3509174278894725
Epoch: 24, step: 543, loss: 0.3531252443790436, mean loss: 0.3509174906115319
Epoch: 24, step: 544, loss: 0.29255878925323486, mean loss: 0.35091583274097826
Epoch: 24, step: 545, loss: 0.3208900988101959, mean loss: 0.3509149797856368
Epoch: 24, step: 546, loss: 0.31275302171707153, mean loss: 0.35091389573149173
Epoch: 24, step: 547, loss: 0.3228455185890198, mean loss: 0.35091309842501683
Epoch: 24, step: 548, loss: 0.37373045086860657, mean loss: 0.3509137465531931
Epoch: 24, step: 549, loss: 0.3262387216091156, mean loss: 0.35091304567763365
Epoch: 24, step: 550, loss: 0.32808718085289, mean loss: 0.35091239734449464
Epoch: 24, step: 551, loss: 0.397647887468338, mean loss: 0.3509137247555979
Epoch: 24, step: 552, loss: 0.3244607448577881, mean loss: 0.35091297344258426
Epoch: 24, step: 553, loss: 0.3273007571697235, mean loss: 0.3509123028315001
Epoch: 24, step: 554, loss: 0.2889595925807953, mean loss: 0.350910543361157
Epoch: 24, step: 555, loss: 0.321083664894104, mean loss: 0.3509096962954275
Epoch: 24, step: 556, loss: 0.34463995695114136, mean loss: 0.3509095182435903
Epoch: 24, step: 557, loss: 0.3814984858036041, mean loss: 0.350910386902861
Epoch: 24, step: 558, loss: 0.3276601731777191, mean loss: 0.3509097266667763
Epoch: 24, step: 559, loss: 0.3334334194660187, mean loss: 0.3509092304063492
Epoch: 24, step: 560, loss: 0.35139572620391846, mean loss: 0.3509092442205809
Epoch: 24, step: 561, loss: 0.30720028281211853, mean loss: 0.35090800312337467
Epoch: 24, step: 562, loss: 0.31255093216896057, mean loss: 0.3509069140217263
Epoch: 24, step: 563, loss: 0.44357940554618835, mean loss: 0.35090954526793655
Epoch: 24, step: 564, loss: 0.35410258173942566, mean loss: 0.3509096359251147
Epoch: 24, step: 565, loss: 0.29257890582084656, mean loss: 0.3509079798371553
Epoch: 24, step: 566, loss: 0.32153260707855225, mean loss: 0.35090714585445204
Epoch: 24, step: 567, loss: 0.3488340377807617, mean loss: 0.3509070869994647
Epoch: 24, step: 568, loss: 0.3002358078956604, mean loss: 0.35090564849615447
Epoch: 24, step: 569, loss: 0.31366103887557983, mean loss: 0.35090459119161743
Epoch: 24, step: 570, loss: 0.34953221678733826, mean loss: 0.3509045522335908
Epoch: 24, step: 571, loss: 0.3527644872665405, mean loss: 0.35090460503065657
Epoch: 24, step: 572, loss: 0.3441711366176605, mean loss: 0.35090441389640886
Epoch: 24, step: 573, loss: 0.3101121187210083, mean loss: 0.3509032560112208
Epoch: 24, step: 574, loss: 0.35039520263671875, mean loss: 0.3509032415905863
Epoch: 24, step: 575, loss: 0.2908347547054291, mean loss: 0.3509015366494281
Epoch: 24, step: 576, loss: 0.3439393639564514, mean loss: 0.35090133904568466
Epoch: 24, step: 577, loss: 0.37128305435180664, mean loss: 0.35090191751294086
Epoch: 24, step: 578, loss: 0.3306334316730499, mean loss: 0.35090134227565295
Epoch: 24, step: 579, loss: 0.3072437345981598, mean loss: 0.3509001032698726
Epoch: 24, step: 580, loss: 0.34721696376800537, mean loss: 0.3508999987450974
Epoch: 24, step: 581, loss: 0.33163362741470337, mean loss: 0.35089945199524414
Epoch: 24, step: 582, loss: 0.324849009513855, mean loss: 0.35089871274491125
Epoch: 24, step: 583, loss: 0.30987152457237244, mean loss: 0.3508975485227724
Epoch: 24, step: 584, loss: 0.3484172523021698, mean loss: 0.3508974781417894
Epoch: 24, step: 585, loss: 0.3334640562534332, mean loss: 0.3508969834643622
Epoch: 24, step: 586, loss: 0.35198974609375, mean loss: 0.3508970144708778
Epoch: 24, step: 587, loss: 0.3353256285190582, mean loss: 0.3508965726542295
Epoch: 24, step: 588, loss: 0.30699360370635986, mean loss: 0.35089532700324505
Epoch: 24, step: 589, loss: 0.33333849906921387, mean loss: 0.3508948288806798
Epoch: 24, step: 590, loss: 0.35193005204200745, mean loss: 0.35089485825121236
Epoch: 24, step: 591, loss: 0.33238428831100464, mean loss: 0.350894333098865
Epoch: 24, step: 592, loss: 0.3463602364063263, mean loss: 0.35089420446835934
Epoch: 24, step: 593, loss: 0.3328757882118225, mean loss: 0.3508936933076145
Epoch: 24, step: 594, loss: 0.32227134704589844, mean loss: 0.35089288134919455
Epoch: 24, step: 595, loss: 0.33592790365219116, mean loss: 0.3508924568349061
Epoch: 24, step: 596, loss: 0.35825273394584656, mean loss: 0.35089266561932475
Epoch: 24, step: 597, loss: 0.30026975274086, mean loss: 0.35089122967126557
Epoch: 24, step: 598, loss: 0.39304929971694946, mean loss: 0.3508924254752663
Epoch: 24, step: 599, loss: 0.3490699827671051, mean loss: 0.35089237378356253
Epoch: 24, step: 600, loss: 0.3231065571308136, mean loss: 0.3508915856899456
Epoch: 24, step: 601, loss: 0.3514440655708313, mean loss: 0.3508916013595775
Epoch: 24, step: 602, loss: 0.358647882938385, mean loss: 0.35089182133976915
Epoch: 24, step: 603, loss: 0.32525569200515747, mean loss: 0.35089109427994686
Epoch: 24, step: 604, loss: 0.3154411017894745, mean loss: 0.35089008892013035
Epoch: 24, step: 605, loss: 0.3038977384567261, mean loss: 0.35088875625747756
Epoch: 24, step: 606, loss: 0.39622193574905396, mean loss: 0.35089004183101047
Epoch: 24, step: 607, loss: 0.3170452415943146, mean loss: 0.3508890820760128
Epoch: 24, step: 608, loss: 0.29527559876441956, mean loss: 0.3508875050596138
Epoch: 24, step: 609, loss: 0.3269956707954407, mean loss: 0.3508868275845879
Epoch: 24, step: 610, loss: 0.3224291503429413, mean loss: 0.3508860206637485
Epoch: 24, step: 611, loss: 0.2847537696361542, mean loss: 0.3508841455290364
Epoch: 24, step: 612, loss: 0.33128833770751953, mean loss: 0.35088358991907237
Epoch: 24, step: 613, loss: 0.3535192608833313, mean loss: 0.3508836646474808
Epoch: 24, step: 614, loss: 0.31340107321739197, mean loss: 0.35088260194465326
Epoch: 24, step: 615, loss: 0.33913835883140564, mean loss: 0.35088226898244207
Epoch: 24, step: 616, loss: 0.3481159508228302, mean loss: 0.3508821905565027
Epoch: 24, step: 617, loss: 0.30522942543029785, mean loss: 0.35088089632377817
Epoch: 24, step: 618, loss: 0.31867465376853943, mean loss: 0.3508799833190282
Epoch: 24, step: 619, loss: 0.32806864380836487, mean loss: 0.3508793366657934
Epoch: 24, step: 620, loss: 0.3433130979537964, mean loss: 0.3508791221850067
Epoch: 24, step: 621, loss: 0.39236465096473694, mean loss: 0.35088029814534405
Epoch: 24, step: 622, loss: 0.3375696539878845, mean loss: 0.3508799208488176
Epoch: 24, step: 623, loss: 0.34621235728263855, mean loss: 0.35087978854826296
Epoch: 24, step: 624, loss: 0.3605596423149109, mean loss: 0.3508800629127585
Epoch: 24, step: 625, loss: 0.32830095291137695, mean loss: 0.3508794229515884
Epoch: 24, step: 626, loss: 0.30549347400665283, mean loss: 0.35087813661117107
Epoch: 24, step: 627, loss: 0.35236209630966187, mean loss: 0.35087817866875237
Epoch: 24, step: 628, loss: 0.3445444107055664, mean loss: 0.3508779991656218
Epoch: 24, step: 629, loss: 0.34799718856811523, mean loss: 0.35087791752387726
Epoch: 24, step: 630, loss: 0.3751077950000763, mean loss: 0.35087860417554717
Epoch: 24, step: 631, loss: 0.3393526077270508, mean loss: 0.35087827754903256
Epoch: 24, step: 632, loss: 0.32896602153778076, mean loss: 0.35087765661174297
Epoch: 24, step: 633, loss: 0.3968183994293213, mean loss: 0.3508789584180002
Epoch: 24, step: 634, loss: 0.30453500151634216, mean loss: 0.35087764522322246
Epoch: 24, step: 635, loss: 0.3488246500492096, mean loss: 0.35087758705153554
Epoch: 24, step: 636, loss: 0.32420894503593445, mean loss: 0.35087683141608333
Epoch: 24, step: 637, loss: 0.3177476227283478, mean loss: 0.3508758927520416
Epoch: 24, step: 638, loss: 0.3013339638710022, mean loss: 0.350874489099148
Epoch: 24, step: 639, loss: 0.2866981029510498, mean loss: 0.3508726708651796
Epoch: 24, step: 640, loss: 0.32082614302635193, mean loss: 0.35087181961640945
Epoch: 24, step: 641, loss: 0.35341939330101013, mean loss: 0.3508718917897248
Epoch: 24, step: 642, loss: 0.37294477224349976, mean loss: 0.35087251710150286
Epoch: 24, step: 643, loss: 0.3664914071559906, mean loss: 0.3508729595629775
Epoch: 24, step: 644, loss: 0.38214579224586487, mean loss: 0.35087384545382144
Epoch: 24, step: 645, loss: 0.32803624868392944, mean loss: 0.3508731985330586
Epoch: 24, step: 646, loss: 0.3305938243865967, mean loss: 0.3508726240953579
Epoch: 24, step: 647, loss: 0.3317317068576813, mean loss: 0.3508720819211783
Epoch: 24, step: 648, loss: 0.30673301219940186, mean loss: 0.3508708316996878
Epoch: 24, step: 649, loss: 0.3127330243587494, mean loss: 0.35086975149214966
Epoch: 24, step: 650, loss: 0.3404247462749481, mean loss: 0.3508694556583145
Epoch: 24, step: 651, loss: 0.31685879826545715, mean loss: 0.35086849240190254
Epoch: 24, step: 652, loss: 0.34264400601387024, mean loss: 0.3508682594730066
Epoch: 24, step: 653, loss: 0.3271660804748535, mean loss: 0.3508675882133352
Epoch: 24, step: 654, loss: 0.3254968523979187, mean loss: 0.3508668697195
Epoch: 24, step: 655, loss: 0.31166958808898926, mean loss: 0.3508657596922676
Epoch: 24, step: 656, loss: 0.3467763662338257, mean loss: 0.35086564388807484
Epoch: 24, step: 657, loss: 0.33039727807044983, mean loss: 0.35086506427755726
Epoch: 24, step: 658, loss: 0.34752196073532104, mean loss: 0.3508649696123005
Epoch: 24, step: 659, loss: 0.339687317609787, mean loss: 0.3508646531083929
Epoch: 24, step: 660, loss: 0.3506797254085541, mean loss: 0.35086464787216953
Epoch: 24, step: 661, loss: 0.32554277777671814, mean loss: 0.3508639309043317
Epoch: 24, step: 662, loss: 0.32882994413375854, mean loss: 0.3508633070478587
Epoch: 24, step: 663, loss: 0.32706761360168457, mean loss: 0.3508626333306037
Epoch: 24, step: 664, loss: 0.31294623017311096, mean loss: 0.3508615598501485
Epoch: 24, step: 665, loss: 0.3176092803478241, mean loss: 0.3508606184459386
Epoch: 24, step: 666, loss: 0.31375059485435486, mean loss: 0.3508595678550037
Epoch: 24, step: 667, loss: 0.3172835409641266, mean loss: 0.350858617339012
Epoch: 24, step: 668, loss: 0.3288209140300751, mean loss: 0.35085799348329205
Epoch: 24, step: 669, loss: 0.34087032079696655, mean loss: 0.35085771075463085
Epoch: 24, step: 670, loss: 0.31529995799064636, mean loss: 0.3508567042227214
Epoch: 24, step: 671, loss: 0.37951967120170593, mean loss: 0.3508575155612342
Epoch: 24, step: 672, loss: 0.3361886739730835, mean loss: 0.3508571003544186
Epoch: 24, step: 673, loss: 0.3133257031440735, mean loss: 0.35085603804484566
Epoch: 24, step: 674, loss: 0.33013561367988586, mean loss: 0.3508554515790121
Epoch: 24, step: 675, loss: 0.3132782280445099, mean loss: 0.3508543880325518
Epoch: 24, step: 676, loss: 0.3221875727176666, mean loss: 0.350853576699936
Epoch: 24, step: 677, loss: 0.3184429407119751, mean loss: 0.3508526594350923
Epoch: 24, step: 678, loss: 0.32600143551826477, mean loss: 0.350851956131741
Epoch: 24, step: 679, loss: 0.31961944699287415, mean loss: 0.35085107225951045
Epoch: 24, step: 680, loss: 0.3585595190525055, mean loss: 0.35085129040046165
Epoch: 24, step: 681, loss: 0.3528929054737091, mean loss: 0.3508513481743898
Epoch: 24, step: 682, loss: 0.36802077293395996, mean loss: 0.35085183402358644
Epoch: 24, step: 683, loss: 0.3588815927505493, mean loss: 0.35085206123803825
Epoch: 24, step: 684, loss: 0.32996895909309387, mean loss: 0.35085147033506026
Epoch: 24, step: 685, loss: 0.4329809844493866, mean loss: 0.35085379418527
Epoch: 24, step: 686, loss: 0.35693442821502686, mean loss: 0.3508539662316167
Epoch: 24, step: 687, loss: 0.3543974757194519, mean loss: 0.3508540664893546
Epoch: 24, step: 688, loss: 0.2992466986179352, mean loss: 0.35085260638558113
Epoch: 24, step: 689, loss: 0.38161227107048035, mean loss: 0.35085347663015437
Epoch: 24, step: 690, loss: 0.35242053866386414, mean loss: 0.3508535209638187
Epoch: 24, step: 691, loss: 0.3272276520729065, mean loss: 0.3508528525845924
Epoch: 24, step: 692, loss: 0.3740141987800598, mean loss: 0.35085350780386865
Epoch: 24, step: 693, loss: 0.32743123173713684, mean loss: 0.3508528452218017
Epoch: 24, step: 694, loss: 0.3384978473186493, mean loss: 0.3508524957267972
Epoch: 24, step: 695, loss: 0.3173588812351227, mean loss: 0.3508515482948417
Epoch: 24, step: 696, loss: 0.3161866068840027, mean loss: 0.3508505677573651
Epoch: 24, step: 697, loss: 0.32621651887893677, mean loss: 0.35084987097485454
Epoch: 24, step: 698, loss: 0.35009822249412537, mean loss: 0.35084984971482114
Epoch: 24, step: 699, loss: 0.32010388374328613, mean loss: 0.3508489801038365
Epoch: 24, step: 700, loss: 0.32587623596191406, mean loss: 0.35084827380114847
Epoch: 24, step: 701, loss: 0.31327322125434875, mean loss: 0.3508472110981521
Epoch: 24, step: 702, loss: 0.331901878118515, mean loss: 0.3508466752986957
Epoch: 24, step: 703, loss: 0.35571491718292236, mean loss: 0.3508468129752195
Epoch: 24, step: 704, loss: 0.29837143421173096, mean loss: 0.3508453289849827
Epoch: 24, step: 705, loss: 0.3555753231048584, mean loss: 0.3508454627442192
Epoch: 24, step: 706, loss: 0.3123001158237457, mean loss: 0.3508443727533553
Epoch: 24, step: 707, loss: 0.31299230456352234, mean loss: 0.3508433023973947
Epoch: 24, step: 708, loss: 0.3301983177661896, mean loss: 0.35084271862856586
Epoch: 24, step: 709, loss: 0.33626502752304077, mean loss: 0.3508423064334885
Epoch: 24, step: 710, loss: 0.3211381733417511, mean loss: 0.3508414665507421
Epoch: 24, step: 711, loss: 0.32768672704696655, mean loss: 0.350840811870254
Epoch: 24, step: 712, loss: 0.3422442376613617, mean loss: 0.35084056881633086
Epoch: 24, step: 713, loss: 0.3467790186405182, mean loss: 0.35084045398596114
Epoch: 24, step: 714, loss: 0.35801345109939575, mean loss: 0.35084065677912823
Epoch: 24, step: 715, loss: 0.33840885758399963, mean loss: 0.35084030532037
Epoch: 24, step: 716, loss: 0.32518768310546875, mean loss: 0.3508395801169037
Epoch: 24, step: 717, loss: 0.36048123240470886, mean loss: 0.3508398526801504
Epoch: 24, step: 718, loss: 0.3573911190032959, mean loss: 0.3508400378749581
Epoch: 24, step: 719, loss: 0.359814316034317, mean loss: 0.3508402915576288
Epoch: 24, step: 720, loss: 0.3005533516407013, mean loss: 0.35083887009905634
Epoch: 24, step: 721, loss: 0.3102627396583557, mean loss: 0.35083772316790024
Epoch: 24, step: 722, loss: 0.3574100136756897, mean loss: 0.3508379089360256
Epoch: 24, step: 723, loss: 0.40316423773765564, mean loss: 0.3508393879164892
Epoch: 24, step: 724, loss: 0.3655906021595001, mean loss: 0.35083980484122973
Epoch: 24, step: 725, loss: 0.32642272114753723, mean loss: 0.35083911474220497
Epoch: 24, step: 726, loss: 0.3152061402797699, mean loss: 0.35083810767738677
Epoch: 24, step: 727, loss: 0.33134230971336365, mean loss: 0.3508375566996012
Epoch: 24, step: 728, loss: 0.3219231963157654, mean loss: 0.35083673956351574
Epoch: 24, step: 729, loss: 0.3271929919719696, mean loss: 0.3508360713967947
Epoch: 24, step: 730, loss: 0.3274419605731964, mean loss: 0.35083541030343207
Epoch: 24, step: 731, loss: 0.36316558718681335, mean loss: 0.35083575873162476
Epoch: 24, step: 732, loss: 0.3350833058357239, mean loss: 0.3508353136087647
Epoch: 24, step: 733, loss: 0.3500102758407593, mean loss: 0.3508352902960275
Epoch: 24, step: 734, loss: 0.34201890230178833, mean loss: 0.35083504118218517
Epoch: 24, step: 735, loss: 0.3298981487751007, mean loss: 0.35083444961085813
Epoch: 24, step: 736, loss: 0.327045738697052, mean loss: 0.35083377748046757
Epoch: 24, step: 737, loss: 0.3102506995201111, mean loss: 0.3508326308714954
Epoch: 24, step: 738, loss: 0.29915904998779297, mean loss: 0.35083117095961847
Epoch: 24, step: 739, loss: 0.3480004072189331, mean loss: 0.3508310909855044
Epoch: 24, step: 740, loss: 0.3227134346961975, mean loss: 0.35083029663411053
Epoch: 24, step: 741, loss: 0.29986801743507385, mean loss: 0.35082885694036514
Epoch: 24, step: 742, loss: 0.3110713064670563, mean loss: 0.3508277338139923
Epoch: 24, step: 743, loss: 0.35916924476623535, mean loss: 0.3508279694498949
Epoch: 24, step: 744, loss: 0.3854416012763977, mean loss: 0.3508289472084844
Epoch: 24, step: 745, loss: 0.32690536975860596, mean loss: 0.3508282714393908
Epoch: 24, step: 746, loss: 0.3579486310482025, mean loss: 0.3508284725624484
Epoch: 24, step: 747, loss: 0.2953008711338043, mean loss: 0.3508269041633571
Epoch: 24, step: 748, loss: 0.33118510246276855, mean loss: 0.3508263493885597
Epoch: 24, step: 749, loss: 0.4364587366580963, mean loss: 0.35082876797262086
Epoch: 24, step: 750, loss: 0.370303213596344, mean loss: 0.35082931798944306
Epoch: 24, step: 751, loss: 0.35451003909111023, mean loss: 0.35082942194112354
Epoch: 24, step: 752, loss: 0.32006072998046875, mean loss: 0.350828552989954
Epoch: 24, step: 753, loss: 0.3353523015975952, mean loss: 0.35082811593117424
Epoch: 24, step: 754, loss: 0.3345792591571808, mean loss: 0.3508276570665058
Epoch: 24, step: 755, loss: 0.31221431493759155, mean loss: 0.35082656666375733
Epoch: 24, step: 756, loss: 0.33446577191352844, mean loss: 0.350826104664075
Epoch: 24, step: 757, loss: 0.33051782846450806, mean loss: 0.35082553121074583
Epoch: 24, step: 758, loss: 0.3554302752017975, mean loss: 0.35082566123316544
Epoch: 24, step: 759, loss: 0.3167862296104431, mean loss: 0.3508247001017101
Epoch: 24, step: 760, loss: 0.33072638511657715, mean loss: 0.35082413262521617
Epoch: 24, step: 761, loss: 0.3485253155231476, mean loss: 0.35082406771988267
Epoch: 24, step: 762, loss: 0.3469858765602112, mean loss: 0.3508239593545658
Epoch: 24, step: 763, loss: 0.31135499477386475, mean loss: 0.35082284504161887
Epoch: 24, step: 764, loss: 0.34326571226119995, mean loss: 0.35082263168985633
Epoch: 24, step: 765, loss: 0.3646753430366516, mean loss: 0.35082302276634403
Epoch: 24, step: 766, loss: 0.3314562439918518, mean loss: 0.35082247603741723
Epoch: 24, step: 767, loss: 0.3300183117389679, mean loss: 0.350821888747323
Epoch: 24, step: 768, loss: 0.313571959733963, mean loss: 0.35082083723203683
Epoch: 24, step: 769, loss: 0.3326272666454315, mean loss: 0.35082032366655985
Epoch: 24, step: 770, loss: 0.34685370326042175, mean loss: 0.3508202117005338
Epoch: 24, step: 771, loss: 0.3325003683567047, mean loss: 0.350819694599841
Epoch: 24, step: 772, loss: 0.31650105118751526, mean loss: 0.35081872594017205
Epoch: 24, step: 773, loss: 0.33987921476364136, mean loss: 0.3508184171760971
Epoch: 24, step: 774, loss: 0.3417624533176422, mean loss: 0.35081816158173457
Epoch: 24, step: 775, loss: 0.3383808135986328, mean loss: 0.35081781056152733
Epoch: 24, step: 776, loss: 0.32020753622055054, mean loss: 0.3508169466698348
Epoch: 24, step: 777, loss: 0.3305180072784424, mean loss: 0.35081637380367825
Epoch: 24, step: 778, loss: 0.3219183683395386, mean loss: 0.3508155582821469
Epoch: 24, step: 779, loss: 0.35934922099113464, mean loss: 0.3508157991011645
Epoch: 24, step: 780, loss: 0.3470799922943115, mean loss: 0.35081569368008464
Epoch: 24, step: 781, loss: 0.3590030074119568, mean loss: 0.3508159247121331
Epoch: 24, step: 782, loss: 0.3489019572734833, mean loss: 0.35081587070475595
Epoch: 24, step: 783, loss: 0.3442176282405853, mean loss: 0.3508156845240995
Epoch: 24, step: 784, loss: 0.32814735174179077, mean loss: 0.3508150449165043
Epoch: 24, step: 785, loss: 0.30660951137542725, mean loss: 0.35081379765242376
Epoch: 24, step: 786, loss: 0.38011303544044495, mean loss: 0.35081462431037563
Epoch: 24, step: 787, loss: 0.3115975260734558, mean loss: 0.35081351785799336
Epoch: 24, step: 788, loss: 0.30181100964546204, mean loss: 0.3508121353637569
Epoch: 24, step: 789, loss: 0.3187819719314575, mean loss: 0.3508112317310922
Epoch: 24, step: 790, loss: 0.31810176372528076, mean loss: 0.35081030895996895
Epoch: 24, step: 791, loss: 0.33041760325431824, mean loss: 0.3508097336748836
Epoch: 24, step: 792, loss: 0.32513803243637085, mean loss: 0.35080900948798865
Epoch: 24, step: 793, loss: 0.3332156836986542, mean loss: 0.35080851320235285
Epoch: 24, step: 794, loss: 0.3311072885990143, mean loss: 0.350807957471214
Epoch: 24, step: 795, loss: 0.35758736729621887, mean loss: 0.35080814869906646
Epoch: 24, step: 796, loss: 0.2933085858821869, mean loss: 0.3508065268458293
Epoch: 24, step: 797, loss: 0.3235670030117035, mean loss: 0.3508057585397472
Epoch: 24, step: 798, loss: 0.3454296886920929, mean loss: 0.3508056069089519
Epoch: 24, step: 799, loss: 0.2983616292476654, mean loss: 0.35080412778052056
Epoch: 24, step: 800, loss: 0.3333421051502228, mean loss: 0.35080363529602865
Epoch: 24, step: 801, loss: 0.3692778944969177, mean loss: 0.35080415631411205
Epoch: 24, step: 802, loss: 0.32829058170318604, mean loss: 0.3508035213956256
Epoch: 24, step: 803, loss: 0.3280416429042816, mean loss: 0.35080287949267885
Epoch: 24, step: 804, loss: 0.31735360622406006, mean loss: 0.3508019362233613
Epoch: 24, step: 805, loss: 0.34587883949279785, mean loss: 0.3508017973959762
Epoch: 24, step: 806, loss: 0.35156962275505066, mean loss: 0.35080181904742586
Epoch: 24, step: 807, loss: 0.34771445393562317, mean loss: 0.3508017319911121
Epoch: 24, step: 808, loss: 0.2977159321308136, mean loss: 0.35080023514070013
Epoch: 24, step: 809, loss: 0.3248238265514374, mean loss: 0.3507995027093972
Epoch: 24, step: 810, loss: 0.3673635423183441, mean loss: 0.3507999697361998
Epoch: 24, step: 811, loss: 0.31391990184783936, mean loss: 0.3507989299237523
Epoch: 24, step: 812, loss: 0.2986222505569458, mean loss: 0.3507974588735573
Epoch: 24, step: 813, loss: 0.290533185005188, mean loss: 0.35079575985258554
Epoch: 24, step: 814, loss: 0.3439818024635315, mean loss: 0.35079556775319765
Epoch: 24, step: 815, loss: 0.331385999917984, mean loss: 0.35079502057322937
Epoch: 24, step: 816, loss: 0.37395015358924866, mean loss: 0.350795673326958
Epoch: 24, step: 817, loss: 0.33688294887542725, mean loss: 0.35079528113198555
Epoch: 24, step: 818, loss: 0.2945917248725891, mean loss: 0.3507936968175033
Epoch: 24, step: 819, loss: 0.3358060121536255, mean loss: 0.3507932743435867
Epoch: 24, step: 820, loss: 0.32109832763671875, mean loss: 0.35079243732392024
Epoch: 24, step: 821, loss: 0.3593025803565979, mean loss: 0.35079267719491164
Epoch: 24, step: 822, loss: 0.34448257088661194, mean loss: 0.3507924993402284
Epoch: 24, step: 823, loss: 0.3738730549812317, mean loss: 0.35079314986321714
Epoch: 24, step: 824, loss: 0.3312060534954071, mean loss: 0.35079259781856315
Epoch: 24, step: 825, loss: 0.36167970299720764, mean loss: 0.3507929046531604
Epoch: 24, step: 826, loss: 0.32552194595336914, mean loss: 0.35079219245411575
Epoch: 24, step: 827, loss: 0.30576035380363464, mean loss: 0.35079092337964135
Epoch: 24, step: 828, loss: 0.301676481962204, mean loss: 0.35078953928942247
Epoch: 24, step: 829, loss: 0.33063292503356934, mean loss: 0.3507889712734653
Epoch: 24, step: 830, loss: 0.39049386978149414, mean loss: 0.35079009013103307
Epoch: 24, step: 831, loss: 0.31282517313957214, mean loss: 0.3507890203351305
Epoch: 24, step: 832, loss: 0.34158214926719666, mean loss: 0.35078876090626326
Epoch: 24, step: 833, loss: 0.2967921197414398, mean loss: 0.3507872394455373
Epoch: 24, step: 834, loss: 0.31053540110588074, mean loss: 0.3507861053034072
Epoch: 24, step: 835, loss: 0.3472541868686676, mean loss: 0.3507860057903216
Epoch: 24, step: 836, loss: 0.30105704069137573, mean loss: 0.3507846046981316
Epoch: 24, step: 837, loss: 0.3406403362751007, mean loss: 0.35078431889578693
Epoch: 24, step: 838, loss: 0.3548676669597626, mean loss: 0.3507844339358789
Epoch: 24, step: 839, loss: 0.3059358298778534, mean loss: 0.3507831704525552
Epoch: 24, step: 840, loss: 0.34937605261802673, mean loss: 0.3507831308120832
Epoch: 24, step: 841, loss: 0.30076348781585693, mean loss: 0.3507817217286701
Epoch: 24, step: 842, loss: 0.3337143659591675, mean loss: 0.35078124094454183
Epoch: 24, step: 843, loss: 0.35671475529670715, mean loss: 0.35078140808579117
Epoch: 24, step: 844, loss: 0.31850141286849976, mean loss: 0.3507804988157645
Epoch: 24, step: 845, loss: 0.30718889832496643, mean loss: 0.3507792709525317
Epoch: 24, step: 846, loss: 0.30949658155441284, mean loss: 0.3507781081581369
Epoch: 24, step: 847, loss: 0.3528822660446167, mean loss: 0.35077816742351225
Epoch: 24, step: 848, loss: 0.34690603613853455, mean loss: 0.35077805836475195
Epoch: 24, step: 849, loss: 0.32307183742523193, mean loss: 0.35077727803971
Epoch: 24, step: 850, loss: 0.3578402101993561, mean loss: 0.3507774769563225
Epoch: 24, step: 851, loss: 0.30366361141204834, mean loss: 0.35077615010418933
Epoch: 24, step: 852, loss: 0.3530708849430084, mean loss: 0.3507762147282238
Epoch: 24, step: 853, loss: 0.33125507831573486, mean loss: 0.35077566499191254
Epoch: 24, step: 854, loss: 0.35076406598091125, mean loss: 0.35077566466528104
Epoch: 24, step: 855, loss: 0.3245472013950348, mean loss: 0.3507749260849907
Epoch: 24, step: 856, loss: 0.3057126998901367, mean loss: 0.3507736571911717
Epoch: 24, step: 857, loss: 0.34777146577835083, mean loss: 0.35077357265573744
Epoch: 24, step: 858, loss: 0.32786825299263, mean loss: 0.35077292770797835
Epoch: 24, step: 859, loss: 0.31811121106147766, mean loss: 0.35077200807410497
Epoch: 24, step: 860, loss: 0.3158052861690521, mean loss: 0.350771023567477
Epoch: 24, step: 861, loss: 0.31126365065574646, mean loss: 0.35076991124772616
Epoch: 24, step: 862, loss: 0.36578166484832764, mean loss: 0.350770333887823
Epoch: 24, step: 863, loss: 0.30678945779800415, mean loss: 0.35076909568748266
Epoch: 24, step: 864, loss: 0.3363661468029022, mean loss: 0.3507686902104723
Epoch: 24, step: 865, loss: 0.3571569323539734, mean loss: 0.3507688700495057
Epoch: 24, step: 866, loss: 0.35802215337753296, mean loss: 0.3507690742350567
Epoch: 24, step: 867, loss: 0.32831698656082153, mean loss: 0.3507684422091679
Epoch: 24, step: 868, loss: 0.3282155692577362, mean loss: 0.3507678073640461
Epoch: 24, step: 869, loss: 0.31379860639572144, mean loss: 0.35076676674025037
Epoch: 24, step: 870, loss: 0.36559218168258667, mean loss: 0.35076718404018964
Epoch: 24, step: 871, loss: 0.36036983132362366, mean loss: 0.35076745432411455
Epoch: 24, step: 872, loss: 0.33395108580589294, mean loss: 0.3507669810102437
Epoch: 24, step: 873, loss: 0.3431801497936249, mean loss: 0.3507667674771388
Epoch: 24, step: 874, loss: 0.3250492513179779, mean loss: 0.350766043672119
Epoch: 24, step: 875, loss: 0.34867197275161743, mean loss: 0.35076598473733006
Epoch: 24, step: 876, loss: 0.3648489713668823, mean loss: 0.3507663810727543
Epoch: 24, step: 877, loss: 0.32411879301071167, mean loss: 0.3507656311547023
Epoch: 24, step: 878, loss: 0.33368363976478577, mean loss: 0.3507651504457846
Epoch: 24, step: 879, loss: 0.327168345451355, mean loss: 0.3507644864204302
Epoch: 24, step: 880, loss: 0.35451510548591614, mean loss: 0.3507645919616707
Epoch: 24, step: 881, loss: 0.34900805354118347, mean loss: 0.350764542534623
Epoch: 24, step: 882, loss: 0.3130951523780823, mean loss: 0.3507634825894879
Epoch: 24, step: 883, loss: 0.32177096605300903, mean loss: 0.35076266681806034
Epoch: 24, step: 884, loss: 0.38065671920776367, mean loss: 0.35076350793261507
Epoch: 24, step: 885, loss: 0.312832772731781, mean loss: 0.3507624407238142
Epoch: 24, step: 886, loss: 0.3182113468647003, mean loss: 0.3507615249008994
Epoch: 24, step: 887, loss: 0.34211498498916626, mean loss: 0.35076128163790393
Epoch: 24, step: 888, loss: 0.30503159761428833, mean loss: 0.3507599951086024
Epoch: 24, step: 889, loss: 0.31396785378456116, mean loss: 0.35075896005145607
Epoch: 24, step: 890, loss: 0.31098586320877075, mean loss: 0.35075784116387504
Epoch: 24, step: 891, loss: 0.31098100543022156, mean loss: 0.35075672220259074
Epoch: 24, step: 892, loss: 0.30569905042648315, mean loss: 0.3507554547218803
Epoch: 24, step: 893, loss: 0.3254911005496979, mean loss: 0.35075474405087687
Epoch: 24, step: 894, loss: 0.2923740744590759, mean loss: 0.350753101884142
Epoch: 24, step: 895, loss: 0.31023702025413513, mean loss: 0.3507519622553833
Epoch: 24, step: 896, loss: 0.3243680000305176, mean loss: 0.3507512201531071
Epoch: 24, step: 897, loss: 0.31215956807136536, mean loss: 0.3507501347154044
Epoch: 24, step: 898, loss: 0.34553614258766174, mean loss: 0.35074998806958446
Epoch: 24, step: 899, loss: 0.37657058238983154, mean loss: 0.35075071426472226
Epoch: 24, step: 900, loss: 0.35602569580078125, mean loss: 0.3507508626175511
Epoch: 24, step: 901, loss: 0.340450257062912, mean loss: 0.3507505729329357
Epoch: 24, step: 902, loss: 0.32622256875038147, mean loss: 0.35074988314964084
Epoch: 24, step: 903, loss: 0.3356829583644867, mean loss: 0.3507494594453443
Epoch: 24, step: 904, loss: 0.29395371675491333, mean loss: 0.35074786230964256
Epoch: 24, step: 905, loss: 0.35528889298439026, mean loss: 0.35074799000298584
Epoch: 24, step: 906, loss: 0.32927405834198, mean loss: 0.35074738617508433
Epoch: 24, step: 907, loss: 0.35648494958877563, mean loss: 0.35074754750573933
Epoch: 24, step: 908, loss: 0.3517991900444031, mean loss: 0.35074757707533133
Epoch: 24, step: 909, loss: 0.33662062883377075, mean loss: 0.35074717987159065
Epoch: 24, step: 910, loss: 0.35134825110435486, mean loss: 0.35074719677127947
Epoch: 24, step: 911, loss: 0.3228304088115692, mean loss: 0.3507464118863278
Epoch: 24, step: 912, loss: 0.3378066420555115, mean loss: 0.35074604809286075
Epoch: 24, step: 913, loss: 0.3795752227306366, mean loss: 0.35074685858413535
Epoch: 24, step: 914, loss: 0.33200541138648987, mean loss: 0.35074633170979397
Epoch: 24, step: 915, loss: 0.31470799446105957, mean loss: 0.3507453186001221
Epoch: 24, step: 916, loss: 0.33233290910720825, mean loss: 0.3507448010050502
Epoch: 24, step: 917, loss: 0.3438601493835449, mean loss: 0.3507446074746172
Epoch: 24, step: 918, loss: 0.3492268919944763, mean loss: 0.35074456481220034
Epoch: 24, step: 919, loss: 0.31088918447494507, mean loss: 0.3507434445237942
Epoch: 24, step: 920, loss: 0.45070919394493103, mean loss: 0.3507462543658107
Epoch: 24, step: 921, loss: 0.32543689012527466, mean loss: 0.350745542988998
Epoch: 24, step: 922, loss: 0.35321059823036194, mean loss: 0.35074561227299256
Epoch: 24, step: 923, loss: 0.30694735050201416, mean loss: 0.35074438129317886
Epoch: 24, step: 924, loss: 0.298740953207016, mean loss: 0.350742919742686
Epoch: 24, step: 925, loss: 0.3295413851737976, mean loss: 0.3507423238926897
Epoch: 24, step: 926, loss: 0.37250471115112305, mean loss: 0.3507429354877564
Epoch: 24, step: 927, loss: 0.3058004379272461, mean loss: 0.35074167249041044
Epoch: 24, step: 928, loss: 0.3072982430458069, mean loss: 0.35074045165496165
Epoch: 24, step: 929, loss: 0.32599371671676636, mean loss: 0.3507397562484833
Epoch: 24, step: 930, loss: 0.3379964232444763, mean loss: 0.350739398158928
Epoch: 24, step: 931, loss: 0.32850325107574463, mean loss: 0.3507387733374409
Epoch: 24, step: 932, loss: 0.32276663184165955, mean loss: 0.3507379873602711
Epoch: 24, step: 933, loss: 0.3265077769756317, mean loss: 0.3507373065451437
Epoch: 24, step: 934, loss: 0.34585508704185486, mean loss: 0.35073716936946714
Epoch: 24, step: 935, loss: 0.3381732702255249, mean loss: 0.3507368163716265
Epoch: 24, step: 936, loss: 0.36135780811309814, mean loss: 0.35073711477276553
Epoch: 24, step: 937, loss: 0.3589107394218445, mean loss: 0.3507373444076661
Epoch: 24, step: 938, loss: 0.32262760400772095, mean loss: 0.35073655469730225
Epoch: 24, step: 939, loss: 0.31736746430397034, mean loss: 0.3507356172579722
Epoch: 24, step: 940, loss: 0.3669622838497162, mean loss: 0.35073607310162735
Epoch: 24, step: 941, loss: 0.34652888774871826, mean loss: 0.35073595491562387
Epoch: 24, step: 942, loss: 0.4280051589012146, mean loss: 0.3507381254598522
Epoch: 24, step: 943, loss: 0.34499359130859375, mean loss: 0.35073796409653335
Epoch: 24, step: 944, loss: 0.3290206491947174, mean loss: 0.3507373540767333
Epoch: 24, step: 945, loss: 0.32964012026786804, mean loss: 0.3507367614910974
Epoch: 24, step: 946, loss: 0.2896001935005188, mean loss: 0.35073504431647756
Epoch: 24, step: 947, loss: 0.3143521547317505, mean loss: 0.35073402244001467
Epoch: 24, step: 948, loss: 0.3269646465778351, mean loss: 0.3507333548546794
Epoch: 24, step: 949, loss: 0.3125949800014496, mean loss: 0.3507322837325412
Epoch: 24, step: 950, loss: 0.34485021233558655, mean loss: 0.35073211853829855
Epoch: 24, step: 951, loss: 0.3351670503616333, mean loss: 0.3507316814155122
Epoch: 24, step: 952, loss: 0.30397680401802063, mean loss: 0.3507303684081995
Epoch: 24, step: 953, loss: 0.34133654832839966, mean loss: 0.3507301046109493
Epoch: 24, step: 954, loss: 0.33382558822631836, mean loss: 0.3507296299116602
Epoch: 24, step: 955, loss: 0.3689717948436737, mean loss: 0.35073014215935566
Epoch: 24, step: 956, loss: 0.34220319986343384, mean loss: 0.3507299027259382
Epoch: 24, step: 957, loss: 0.33764371275901794, mean loss: 0.3507295352808332
Epoch: 24, step: 958, loss: 0.31687483191490173, mean loss: 0.35072858470654245
Epoch: 24, step: 959, loss: 0.31756019592285156, mean loss: 0.3507276534287801
Epoch: 24, step: 960, loss: 0.37042227387428284, mean loss: 0.35072820638440366
Epoch: 24, step: 961, loss: 0.3221660852432251, mean loss: 0.35072740448308576
Epoch: 24, step: 962, loss: 0.3634295165538788, mean loss: 0.3507277610936608
Epoch: 24, step: 963, loss: 0.3521278202533722, mean loss: 0.3507278003990836
Epoch: 24, step: 964, loss: 0.3181845545768738, mean loss: 0.3507268868018847
Epoch: 24, step: 965, loss: 0.34552669525146484, mean loss: 0.3507267408193023
Epoch: 24, step: 966, loss: 0.3211894631385803, mean loss: 0.3507259116561863
Epoch: 24, step: 967, loss: 0.36857688426971436, mean loss: 0.35072641275018507
Epoch: 24, step: 968, loss: 0.3152516782283783, mean loss: 0.3507254169681634
Epoch: 24, step: 969, loss: 0.3866904377937317, mean loss: 0.3507264264842703
Epoch: 24, step: 970, loss: 0.3165968656539917, mean loss: 0.3507254685152909
Epoch: 24, step: 971, loss: 0.3448079526424408, mean loss: 0.35072530242356886
Epoch: 24, step: 972, loss: 0.32711145281791687, mean loss: 0.350724639653084
Epoch: 24, step: 973, loss: 0.34278765320777893, mean loss: 0.35072441689174677
Epoch: 24, step: 974, loss: 0.3301537334918976, mean loss: 0.3507238395662886
Epoch: 24, step: 975, loss: 0.325329452753067, mean loss: 0.3507231268814319
Epoch: 24, step: 976, loss: 0.33301815390586853, mean loss: 0.3507226300113122
Epoch: 24, step: 977, loss: 0.341338187456131, mean loss: 0.3507223666548954
Epoch: 24, step: 978, loss: 0.34351396560668945, mean loss: 0.35072216437059495
Epoch: 24, step: 979, loss: 0.3387555181980133, mean loss: 0.35072182856842377
Epoch: 24, step: 980, loss: 0.3546011745929718, mean loss: 0.35072193742567953
Epoch: 24, step: 981, loss: 0.32720550894737244, mean loss: 0.3507212775562009
Epoch: 24, step: 982, loss: 0.30289721488952637, mean loss: 0.3507199356537158
Epoch: 24, step: 983, loss: 0.30142924189567566, mean loss: 0.3507185526376171
Epoch: 24, step: 984, loss: 0.3227343261241913, mean loss: 0.3507177674681069
Epoch: 24, step: 985, loss: 0.32416513562202454, mean loss: 0.3507170224865726
Epoch: 24, step: 986, loss: 0.3502962589263916, mean loss: 0.35071701068163025
Epoch: 24, step: 987, loss: 0.3027207553386688, mean loss: 0.3507156641364798
Epoch: 24, step: 988, loss: 0.33419665694236755, mean loss: 0.3507152007052217
Epoch: 24, step: 989, loss: 0.2998032569885254, mean loss: 0.35071377243995444
Epoch: 24, step: 990, loss: 0.32345372438430786, mean loss: 0.3507130077178725
Epoch: 24, step: 991, loss: 0.3654775619506836, mean loss: 0.3507134218941021
Epoch: 24, step: 992, loss: 0.3316020667552948, mean loss: 0.3507128857961712
Epoch: 24, step: 993, loss: 0.3572927415370941, mean loss: 0.3507130703643547
Epoch: 24, step: 994, loss: 0.3361797034740448, mean loss: 0.3507126627077142
Epoch: 24, step: 995, loss: 0.34395086765289307, mean loss: 0.3507124730466838
Epoch: 24, step: 996, loss: 0.3007238507270813, mean loss: 0.35071107095927684
Epoch: 24, step: 997, loss: 0.3073281943798065, mean loss: 0.3507098541848173
Epoch: 24, step: 998, loss: 0.3686493933200836, mean loss: 0.35071035732712935
Epoch: 24, step: 999, loss: 0.3530727028846741, mean loss: 0.3507104235809312
Epoch: 24, step: 1000, loss: 0.37437108159065247, mean loss: 0.35071108714371013
Epoch: 24, step: 1001, loss: 0.38078415393829346, mean loss: 0.35071193051873945
Epoch: 24, step: 1002, loss: 0.32269275188446045, mean loss: 0.3507111447653915
Epoch: 24, step: 1003, loss: 0.31345459818840027, mean loss: 0.3507100999940349
Epoch: 24, step: 1004, loss: 0.3522094190120697, mean loss: 0.35071014203769657
Epoch: 24, step: 1005, loss: 0.35561761260032654, mean loss: 0.3507102796483343
Epoch: 24, step: 1006, loss: 0.3134329915046692, mean loss: 0.3507092343832656
Epoch: 24, step: 1007, loss: 0.3857138156890869, mean loss: 0.3507102158935086
Epoch: 24, step: 1008, loss: 0.34711065888404846, mean loss: 0.35071011496663324
Epoch: 24, step: 1009, loss: 0.3248152732849121, mean loss: 0.3507093889294639
Epoch: 24, step: 1010, loss: 0.3210548162460327, mean loss: 0.35070855750061697
Epoch: 24, step: 1011, loss: 0.3565204441547394, mean loss: 0.3507087204446187
Epoch: 24, step: 1012, loss: 0.33382275700569153, mean loss: 0.35070824703736203
Epoch: 24, step: 1013, loss: 0.31717440485954285, mean loss: 0.3507073069240405
Epoch: 24, step: 1014, loss: 0.31354179978370667, mean loss: 0.3507062650270614
Epoch: 24, step: 1015, loss: 0.37573081254959106, mean loss: 0.3507069665449893
Epoch: 24, step: 1016, loss: 0.32795774936676025, mean loss: 0.3507063288297094
Epoch: 24, step: 1017, loss: 0.31219783425331116, mean loss: 0.35070524937423553
Epoch: 24, step: 1018, loss: 0.3278135061264038, mean loss: 0.35070460769958245
Epoch: 24, step: 1019, loss: 0.30690306425094604, mean loss: 0.35070337994020784
Epoch: 24, step: 1020, loss: 0.3323780298233032, mean loss: 0.3507028662941581
Epoch: 24, step: 1021, loss: 0.3126745820045471, mean loss: 0.35070180041926907
Epoch: 24, step: 1022, loss: 0.3664620816707611, mean loss: 0.3507022421435677
Epoch: 24, step: 1023, loss: 0.3666207492351532, mean loss: 0.3507026882900669
Epoch: 24, step: 1024, loss: 0.30604854226112366, mean loss: 0.3507014368075964
Epoch: 24, step: 1025, loss: 0.31638503074645996, mean loss: 0.3507004750788239
Epoch: 24, step: 1026, loss: 0.37050265073776245, mean loss: 0.350701030025876
Epoch: 24, step: 1027, loss: 0.2982407808303833, mean loss: 0.3506995598922252
Epoch: 24, step: 1028, loss: 0.3486183285713196, mean loss: 0.3506995015699239
Epoch: 24, step: 1029, loss: 0.33569613099098206, mean loss: 0.35069908114256926
Epoch: 24, step: 1030, loss: 0.33248329162597656, mean loss: 0.3506985707104927
Epoch: 24, step: 1031, loss: 0.3242872357368469, mean loss: 0.35069783064842774
Epoch: 24, step: 1032, loss: 0.32395270466804504, mean loss: 0.35069708125432925
Epoch: 24, step: 1033, loss: 0.3408941626548767, mean loss: 0.3506968065858339
Epoch: 24, step: 1034, loss: 0.32183799147605896, mean loss: 0.35069599801182055
Epoch: 24, step: 1035, loss: 0.3494197428226471, mean loss: 0.3506959622543626
Epoch: 24, step: 1036, loss: 0.3499920964241028, mean loss: 0.35069594253436626
Epoch: 24, step: 1037, loss: 0.3676225543022156, mean loss: 0.3506964167488496
Epoch: 24, step: 1038, loss: 0.31261277198791504, mean loss: 0.3506953498306605
Epoch: 24, step: 1039, loss: 0.35494473576545715, mean loss: 0.35069546887441705
Epoch: 24, step: 1040, loss: 0.3313271999359131, mean loss: 0.3506949263002809
Epoch: 24, step: 1041, loss: 0.3245590031147003, mean loss: 0.35069419416057596
Epoch: 24, step: 1042, loss: 0.38384735584259033, mean loss: 0.35069512284658066
Epoch: 24, step: 1043, loss: 0.3329413831233978, mean loss: 0.35069462554294695
Epoch: 24, step: 1044, loss: 0.3572256565093994, mean loss: 0.35069480847986656
Epoch: 24, step: 1045, loss: 0.3670174479484558, mean loss: 0.3506952656710454
Epoch: 24, step: 1046, loss: 0.3498539328575134, mean loss: 0.35069524210628017
Epoch: 24, step: 1047, loss: 0.310482919216156, mean loss: 0.35069411583687365
Epoch: 24, step: 1048, loss: 0.3051305413246155, mean loss: 0.3506928397249982
Epoch: 24, step: 1049, loss: 0.3282187283039093, mean loss: 0.3506922103038527
Epoch: 24, step: 1050, loss: 0.3592452108860016, mean loss: 0.35069244983673376
Epoch: 24, step: 1051, loss: 0.3319712281227112, mean loss: 0.35069192555025136
Epoch: 24, step: 1052, loss: 0.32538041472435, mean loss: 0.3506912167230418
Epoch: 24, step: 1053, loss: 0.3127037584781647, mean loss: 0.3506901529465578
Epoch: 24, step: 1054, loss: 0.34548279643058777, mean loss: 0.35069000712716
Epoch: 24, step: 1055, loss: 0.3240950107574463, mean loss: 0.35068926241960036
Epoch: 24, step: 1056, loss: 0.3033476173877716, mean loss: 0.3506879368058174
Epoch: 24, step: 1057, loss: 0.31490761041641235, mean loss: 0.35068693494866365
Epoch: 24, step: 1058, loss: 0.33231526613235474, mean loss: 0.3506864205522247
Epoch: 24, step: 1059, loss: 0.32371217012405396, mean loss: 0.3506856653094644
Epoch: 24, step: 1060, loss: 0.2948014736175537, mean loss: 0.3506841006710095
Epoch: 24, step: 1061, loss: 0.30971360206604004, mean loss: 0.3506829536163423
Epoch: 24, step: 1062, loss: 0.3112315237522125, mean loss: 0.3506818491220993
Epoch: 24, step: 1063, loss: 0.33012983202934265, mean loss: 0.35068127375767905
Epoch: 24, step: 1064, loss: 0.3090265691280365, mean loss: 0.35068010764517854
Epoch: 24, step: 1065, loss: 0.3483295440673828, mean loss: 0.3506800418436115
Epoch: 24, step: 1066, loss: 0.3671792149543762, mean loss: 0.35068050370776377
Epoch: 24, step: 1067, loss: 0.34362953901290894, mean loss: 0.35068030633443786
Epoch: 24, step: 1068, loss: 0.3186727464199066, mean loss: 0.3506794103915431
Epoch: 24, step: 1069, loss: 0.31203800439834595, mean loss: 0.3506783287869416
Epoch: 24, step: 1070, loss: 0.3124372065067291, mean loss: 0.3506772584165696
Epoch: 24, step: 1071, loss: 0.3445644974708557, mean loss: 0.3506770873249623
Epoch: 24, step: 1072, loss: 0.32160505652427673, mean loss: 0.3506762736433367
Epoch: 24, step: 1073, loss: 0.37293151021003723, mean loss: 0.3506768965158966
Epoch: 24, step: 1074, loss: 0.3689126670360565, mean loss: 0.3506774068786214
Epoch: 24, step: 1075, loss: 0.3207855224609375, mean loss: 0.3506765703207904
Epoch: 24, step: 1076, loss: 0.34832823276519775, mean loss: 0.35067650460177563
Epoch: 24, step: 1077, loss: 0.3770711421966553, mean loss: 0.3506772432438978
Epoch: 24, step: 1078, loss: 0.3378796875476837, mean loss: 0.35067688512005013
Epoch: 24, step: 1079, loss: 0.35353291034698486, mean loss: 0.35067696504016505
Epoch: 24, step: 1080, loss: 0.29782557487487793, mean loss: 0.35067548614181976
Epoch: 24, step: 1081, loss: 0.3057512044906616, mean loss: 0.35067422909661156
Epoch: 24, step: 1082, loss: 0.33710604906082153, mean loss: 0.3506738494502858
Epoch: 24, step: 1083, loss: 0.36184248328208923, mean loss: 0.35067416194703543
Epoch: 24, step: 1084, loss: 0.3266085982322693, mean loss: 0.3506734886149038
Epoch: 24, step: 1085, loss: 0.3143255114555359, mean loss: 0.3506724716606998
Epoch: 24, step: 1086, loss: 0.3182542026042938, mean loss: 0.35067156467838
Epoch: 24, step: 1087, loss: 0.36598727107048035, mean loss: 0.3506719931616609
Epoch: 24, step: 1088, loss: 0.30087488889694214, mean loss: 0.35067060004082545
Epoch: 24, step: 1089, loss: 0.4044976830482483, mean loss: 0.3506721058619805
Epoch: 24, step: 1090, loss: 0.30813834071159363, mean loss: 0.35067091600646394
Epoch: 24, step: 1091, loss: 0.28623294830322266, mean loss: 0.3506691134449863
Epoch: 24, step: 1092, loss: 0.3543996512889862, mean loss: 0.3506692177986142
Epoch: 24, step: 1093, loss: 0.3373565673828125, mean loss: 0.3506688454167844
Epoch: 24, step: 1094, loss: 0.35050109028816223, mean loss: 0.35066884072446447
Epoch: 24, step: 1095, loss: 0.3222792446613312, mean loss: 0.3506680466543128
Epoch: 24, step: 1096, loss: 0.32422465085983276, mean loss: 0.3506673070409714
Epoch: 24, step: 1097, loss: 0.33589407801628113, mean loss: 0.35066689385002703
Epoch: 24, step: 1098, loss: 0.32006269693374634, mean loss: 0.35066603790828693
Epoch: 24, step: 1099, loss: 0.34484899044036865, mean loss: 0.3506658752209766
Epoch: 24, step: 1100, loss: 0.31690824031829834, mean loss: 0.3506649311363246
Epoch: 24, step: 1101, loss: 0.2953994572162628, mean loss: 0.35066338559479765
Epoch: 24, step: 1102, loss: 0.34209445118904114, mean loss: 0.35066314596465126
Epoch: 24, step: 1103, loss: 0.3242586553096771, mean loss: 0.3506624075840401
Epoch: 24, step: 1104, loss: 0.34714627265930176, mean loss: 0.35066230926086894
Epoch: 24, step: 1105, loss: 0.31712135672569275, mean loss: 0.35066137136722386
Epoch: 24, step: 1106, loss: 0.3239920139312744, mean loss: 0.3506606256423843
Epoch: 24, step: 1107, loss: 0.33926206827163696, mean loss: 0.3506603069264305
Epoch: 24, step: 1108, loss: 0.3377310037612915, mean loss: 0.350659945419282
Epoch: 24, step: 1109, loss: 0.3330138921737671, mean loss: 0.3506594520441983
Epoch: 24, step: 1110, loss: 0.30044451355934143, mean loss: 0.3506580480981451
Epoch: 24, step: 1111, loss: 0.3619339168071747, mean loss: 0.35065836334833267
Epoch: 24, step: 1112, loss: 0.30622097849845886, mean loss: 0.3506571210048271
Epoch: 24, step: 1113, loss: 0.3422732651233673, mean loss: 0.35065688662249883
Epoch: 24, step: 1114, loss: 0.310038685798645, mean loss: 0.35065575111606
Epoch: 24, step: 1115, loss: 0.3161608874797821, mean loss: 0.3506547868181836
Epoch: 24, step: 1116, loss: 0.331429123878479, mean loss: 0.3506542493831644
Epoch: 24, step: 1117, loss: 0.32928934693336487, mean loss: 0.3506536521644455
Epoch: 24, step: 1118, loss: 0.308331161737442, mean loss: 0.35065246914584514
Epoch: 24, step: 1119, loss: 0.3446792662143707, mean loss: 0.35065230218467197
Epoch: 24, step: 1120, loss: 0.33705970644950867, mean loss: 0.3506519222591406
Epoch: 24, step: 1121, loss: 0.36083585023880005, mean loss: 0.35065220690132237
Epoch: 24, step: 1122, loss: 0.3153909742832184, mean loss: 0.35065122137258714
Epoch: 24, step: 1123, loss: 0.30600130558013916, mean loss: 0.35064997347108373
Epoch: 24, step: 1124, loss: 0.33124297857284546, mean loss: 0.3506494310883974
Epoch: 24, step: 1125, loss: 0.371048241853714, mean loss: 0.35065000117421613
Epoch: 24, step: 1126, loss: 0.3292662501335144, mean loss: 0.35064940357896024
Epoch: 24, step: 1127, loss: 0.33807870745658875, mean loss: 0.3506490522851942
Epoch: 24, step: 1128, loss: 0.3150383234024048, mean loss: 0.350648057155143
Epoch: 24, step: 1129, loss: 0.329830527305603, mean loss: 0.3506474754324065
Epoch: 24, step: 1130, loss: 0.3069199323654175, mean loss: 0.3506462535489553
Epoch: 24, step: 1131, loss: 0.3268263339996338, mean loss: 0.35064558796497325
Epoch: 24, step: 1132, loss: 0.32089605927467346, mean loss: 0.3506447567171404
Epoch: 24, step: 1133, loss: 0.3485215902328491, mean loss: 0.35064469739424337
Epoch: 24, step: 1134, loss: 0.33730050921440125, mean loss: 0.35064432455782696
Epoch: 24, step: 1135, loss: 0.3539574146270752, mean loss: 0.35064441712292727
Epoch: 24, step: 1136, loss: 0.3498351573944092, mean loss: 0.35064439451348606
Epoch: 24, step: 1137, loss: 0.38079169392585754, mean loss: 0.3506452367579799
Epoch: 24, step: 1138, loss: 0.3447626531124115, mean loss: 0.3506450724170483
Epoch: 24, step: 1139, loss: 0.33067119121551514, mean loss: 0.35064451442506034
Epoch: 24, step: 1140, loss: 0.3258395791053772, mean loss: 0.35064382149170503
Epoch: 24, step: 1141, loss: 0.3717087507247925, mean loss: 0.35064440993042323
Epoch: 24, step: 1142, loss: 0.3362729847431183, mean loss: 0.35064400848275185
Epoch: 24, step: 1143, loss: 0.31525492668151855, mean loss: 0.35064301996091385
Epoch: 24, step: 1144, loss: 0.3271356523036957, mean loss: 0.3506423633488735
Epoch: 24, step: 1145, loss: 0.34938135743141174, mean loss: 0.3506423281272122
Epoch: 24, step: 1146, loss: 0.33910423517227173, mean loss: 0.35064200586111843
Epoch: 24, step: 1147, loss: 0.3577346205711365, mean loss: 0.3506422039567142
Epoch: 24, step: 1148, loss: 0.3183019161224365, mean loss: 0.3506413007228688
Epoch: 24, step: 1149, loss: 0.3101125657558441, mean loss: 0.35064016882500343
Epoch: 24, step: 1150, loss: 0.3861725926399231, mean loss: 0.35064116115677696
Epoch: 24, step: 1151, loss: 0.3060418963432312, mean loss: 0.35063991564558356
Epoch: 24, step: 1152, loss: 0.30370375514030457, mean loss: 0.3506386049091624
Epoch: 24, step: 1153, loss: 0.3212425708770752, mean loss: 0.3506377840201919
Epoch: 24, step: 1154, loss: 0.2849372327327728, mean loss: 0.35063594937298054
Epoch: 24, step: 1155, loss: 0.30609092116355896, mean loss: 0.35063470551538506
Epoch: 24, step: 1156, loss: 0.31029078364372253, mean loss: 0.35063357899926323
Epoch: 24, step: 1157, loss: 0.310892790555954, mean loss: 0.3506324693553127
Epoch: 24, step: 1158, loss: 0.2908945679664612, mean loss: 0.35063080139771424
Epoch: 24, step: 1159, loss: 0.3086923360824585, mean loss: 0.35062963045552875
Epoch: 24, step: 1160, loss: 0.3188324570655823, mean loss: 0.35062874268789357
Epoch: 24, step: 1161, loss: 0.33697694540023804, mean loss: 0.3506283615444102
Epoch: 24, step: 1162, loss: 0.3376467227935791, mean loss: 0.35062799912115017
Epoch: 24, step: 1163, loss: 0.31467732787132263, mean loss: 0.35062699547315324
Epoch: 24, step: 1164, loss: 0.3109363913536072, mean loss: 0.35062588744702
Epoch: 24, step: 1165, loss: 0.3584209084510803, mean loss: 0.3506261050513136
Epoch: 24, step: 1166, loss: 0.3085207939147949, mean loss: 0.35062492968043074
Epoch: 24, step: 1167, loss: 0.344376802444458, mean loss: 0.3506247552686611
Epoch: 24, step: 1168, loss: 0.3207271099090576, mean loss: 0.35062392072168663
Epoch: 24, step: 1169, loss: 0.3100303113460541, mean loss: 0.35062278764488836
Epoch: 24, step: 1170, loss: 0.3163841962814331, mean loss: 0.3506218319804073
Epoch: 24, step: 1171, loss: 0.3571491241455078, mean loss: 0.3506220141645137
Epoch: 24, step: 1172, loss: 0.32675427198410034, mean loss: 0.3506213480074292
Epoch: 24, step: 1173, loss: 0.36047324538230896, mean loss: 0.350621622969678
Epoch: 24, step: 1174, loss: 0.4040565490722656, mean loss: 0.3506231142740263
Epoch: 24, step: 1175, loss: 0.3137122690677643, mean loss: 0.3506220841655979
Epoch: 24, step: 1176, loss: 0.360973596572876, mean loss: 0.3506223730477012
Epoch: 24, step: 1177, loss: 0.3363926410675049, mean loss: 0.3506219759462897
Epoch: 24, step: 1178, loss: 0.35432639718055725, mean loss: 0.3506220793206788
Epoch: 24, step: 1179, loss: 0.3320731222629547, mean loss: 0.35062156171388514
Epoch: 24, step: 1180, loss: 0.32554295659065247, mean loss: 0.3506208619174423
Epoch: 24, step: 1181, loss: 0.31721702218055725, mean loss: 0.3506199298386506
Epoch: 24, step: 1182, loss: 0.372422993183136, mean loss: 0.3506205382000263
Epoch: 24, step: 1183, loss: 0.3711431622505188, mean loss: 0.3506211108178849
Epoch: 24, step: 1184, loss: 0.3178364336490631, mean loss: 0.3506201960923703
Epoch: 24, step: 1185, loss: 0.321367472410202, mean loss: 0.35061937993468706
Epoch: 24, step: 1186, loss: 0.3273179233074188, mean loss: 0.3506187298368541
Epoch: 24, step: 1187, loss: 0.3503188192844391, mean loss: 0.350618721469748
Epoch: 24, step: 1188, loss: 0.3736089766025543, mean loss: 0.350619362849442
Epoch: 24, step: 1189, loss: 0.3401709496974945, mean loss: 0.3506190713688542
Epoch: 24, step: 1190, loss: 0.2945029139518738, mean loss: 0.3506175059336039
Epoch: 24, step: 1191, loss: 0.3099639415740967, mean loss: 0.3506163718796997
Epoch: 24, step: 1192, loss: 0.31592676043510437, mean loss: 0.3506154042205894
Epoch: 24, step: 1193, loss: 0.36858853697776794, mean loss: 0.35061590556320466
Epoch: 24, step: 1194, loss: 0.31912514567375183, mean loss: 0.35061502718436194
Epoch: 24, step: 1195, loss: 0.3603811264038086, mean loss: 0.3506152995847641
Epoch: 24, step: 1196, loss: 0.3356340229511261, mean loss: 0.35061488173195865
Epoch: 24, step: 1197, loss: 0.3193613588809967, mean loss: 0.3506140100433646
Epoch: 24, step: 1198, loss: 0.30450519919395447, mean loss: 0.3506127240634218
Epoch: 24, step: 1199, loss: 0.3422287702560425, mean loss: 0.35061249024052443
Epoch: 24, step: 1200, loss: 0.32427528500556946, mean loss: 0.35061175573386644
Epoch: 24, step: 1201, loss: 0.30839937925338745, mean loss: 0.3506105785244158
Epoch: 24, step: 1202, loss: 0.3295963406562805, mean loss: 0.3506099925003251
Epoch: 24, step: 1203, loss: 0.35239893198013306, mean loss: 0.35061004238709254
Epoch: 24, step: 1204, loss: 0.33709558844566345, mean loss: 0.35060966553050904
Epoch: 24, step: 1205, loss: 0.3313983976840973, mean loss: 0.3506091298306639
Epoch: 24, step: 1206, loss: 0.3217170536518097, mean loss: 0.3506083242071472
Epoch: 24, step: 1207, loss: 0.37824293971061707, mean loss: 0.35060909474628127
Epoch: 24, step: 1208, loss: 0.35462135076522827, mean loss: 0.3506092066173539
Epoch: 24, step: 1209, loss: 0.3087169826030731, mean loss: 0.35060803859683265
Epoch: 24, step: 1210, loss: 0.30631181597709656, mean loss: 0.35060680358351626
Epoch: 24, step: 1211, loss: 0.2769828140735626, mean loss: 0.3506047509463603
Epoch: 24, step: 1212, loss: 0.3207021653652191, mean loss: 0.35060391728538337
Epoch: 24, step: 1213, loss: 0.37890419363975525, mean loss: 0.35060470625322154
Epoch: 24, step: 1214, loss: 0.29777127504348755, mean loss: 0.35060323338011484
Epoch: 24, step: 1215, loss: 0.365204781293869, mean loss: 0.35060364042594205
Epoch: 24, step: 1216, loss: 0.2897842526435852, mean loss: 0.3506019450174794
Epoch: 24, step: 1217, loss: 0.33336493372917175, mean loss: 0.35060146452990376
Epoch: 24, step: 1218, loss: 0.34631842374801636, mean loss: 0.3506013451420074
Epoch: 24, step: 1219, loss: 0.3780142366886139, mean loss: 0.35060210924312085
Epoch: 24, step: 1220, loss: 0.32695022225379944, mean loss: 0.3506014499938249
Epoch: 24, step: 1221, loss: 0.33435550332069397, mean loss: 0.35060099718300286
Epoch: 24, step: 1222, loss: 0.3245745897293091, mean loss: 0.3506002717891108
Epoch: 24, step: 1223, loss: 0.32728782296180725, mean loss: 0.3505996220553085
Epoch: 24, step: 1224, loss: 0.34245407581329346, mean loss: 0.3505993950397225
Epoch: 24, step: 1225, loss: 0.3221161663532257, mean loss: 0.35059860123701675
Epoch: 24, step: 1226, loss: 0.3028948903083801, mean loss: 0.35059727181330835
Epoch: 24, step: 1227, loss: 0.3607805073261261, mean loss: 0.35059755559537037
Epoch: 24, step: 1228, loss: 0.3035906255245209, mean loss: 0.35059624566280606
Epoch: 24, step: 1229, loss: 0.3718988597393036, mean loss: 0.3505968392818797
Epoch: 24, step: 1230, loss: 0.3306344449520111, mean loss: 0.3505962830248972
Epoch: 24, step: 1231, loss: 0.3318175673484802, mean loss: 0.3505957597659896
Epoch: 24, step: 1232, loss: 0.3361245393753052, mean loss: 0.3505953565443788
Epoch: 24, step: 1233, loss: 0.3392348885536194, mean loss: 0.35059504000863095
Epoch: 24, step: 1234, loss: 0.32412850856781006, mean loss: 0.3505943025944758
Epoch: 24, step: 1235, loss: 0.2873416244983673, mean loss: 0.35059254028872255
Epoch: 24, step: 1236, loss: 0.3261604607105255, mean loss: 0.3505918595966774
Epoch: 24, step: 1237, loss: 0.351774126291275, mean loss: 0.3505918925344022
Epoch: 24, step: 1238, loss: 0.31435343623161316, mean loss: 0.35059088296604163
Epoch: 24, step: 1239, loss: 0.37405848503112793, mean loss: 0.3505915367325355
Epoch: 24, step: 1240, loss: 0.2891499996185303, mean loss: 0.35058982512607495
Epoch: 24, step: 1241, loss: 0.32145655155181885, mean loss: 0.35058901356906413
Epoch: 24, step: 1242, loss: 0.3463169038295746, mean loss: 0.350588894565478
Epoch: 24, step: 1243, loss: 0.3432684540748596, mean loss: 0.3505886906534866
Epoch: 24, step: 1244, loss: 0.32208502292633057, mean loss: 0.3505878967015708
Epoch: 24, step: 1245, loss: 0.38079485297203064, mean loss: 0.3505887380740924
Epoch: 24, step: 1246, loss: 0.31338027119636536, mean loss: 0.35058770171315107
Epoch: 24, step: 1247, loss: 0.3532756268978119, mean loss: 0.35058777657737744
Epoch: 24, step: 1248, loss: 0.37381771206855774, mean loss: 0.3505884235606804
Epoch: 24, step: 1249, loss: 0.30002349615097046, mean loss: 0.3505870153022442
Epoch: 24, step: 1250, loss: 0.35263562202453613, mean loss: 0.35058707235537373
Epoch: 24, step: 1251, loss: 0.31429770588874817, mean loss: 0.35058606173471907
Epoch: 24, step: 1252, loss: 0.334023654460907, mean loss: 0.3505856005019564
Epoch: 24, step: 1253, loss: 0.332063764333725, mean loss: 0.350585084717045
Epoch: 24, step: 1254, loss: 0.27954381704330444, mean loss: 0.35058310645780205
Epoch: 24, step: 1255, loss: 0.32749292254447937, mean loss: 0.35058246349211053
Epoch: 24, step: 1256, loss: 0.32741492986679077, mean loss: 0.3505818183905143
Epoch: 24, step: 1257, loss: 0.3322068750858307, mean loss: 0.3505813067531777
Epoch: 24, step: 1258, loss: 0.31080299615859985, mean loss: 0.35058019918501415
Epoch: 24, step: 1259, loss: 0.3398299217224121, mean loss: 0.35057989986778887
Epoch: 24, step: 1260, loss: 0.3823748528957367, mean loss: 0.3505807851018849
Epoch: 24, step: 1261, loss: 0.3074532449245453, mean loss: 0.3505795843796794
Epoch: 24, step: 1262, loss: 0.42656978964805603, mean loss: 0.35058169997881267
Epoch: 24, step: 1263, loss: 0.31294551491737366, mean loss: 0.3505806522008321
Epoch: 24, step: 1264, loss: 0.3354802429676056, mean loss: 0.35058023182252324
Epoch: 24, step: 1265, loss: 0.32700732350349426, mean loss: 0.3505795755976939
Epoch: 24, step: 1266, loss: 0.2929985523223877, mean loss: 0.3505779726963974
Epoch: 24, step: 1267, loss: 0.31216180324554443, mean loss: 0.3505769033230133
Epoch: 24, step: 1268, loss: 0.33975932002067566, mean loss: 0.3505766022072637
Epoch: 24, step: 1269, loss: 0.30894336104393005, mean loss: 0.3505754433462393
Epoch: 24, step: 1270, loss: 0.34090539813041687, mean loss: 0.35057517418807926
Epoch: 24, step: 1271, loss: 0.35807546973228455, mean loss: 0.3505753829471403
Epoch: 24, step: 1272, loss: 0.3460474908351898, mean loss: 0.3505752569238134
Epoch: 24, step: 1273, loss: 0.3737512230873108, mean loss: 0.35057590195487837
Epoch: 24, step: 1274, loss: 0.3159746527671814, mean loss: 0.3505749389633338
Epoch: 24, step: 1275, loss: 0.314444363117218, mean loss: 0.35057393343689924
Epoch: 24, step: 1276, loss: 0.33917054533958435, mean loss: 0.35057361608549253
Epoch: 24, step: 1277, loss: 0.30544352531433105, mean loss: 0.35057236016934706
Epoch: 24, step: 1278, loss: 0.3174777925014496, mean loss: 0.3505714392129628
Epoch: 24, step: 1279, loss: 0.3473704159259796, mean loss: 0.3505713501372925
Epoch: 24, step: 1280, loss: 0.3223618268966675, mean loss: 0.3505705651657245
Epoch: 24, step: 1281, loss: 0.3277786374092102, mean loss: 0.3505699309643845
Epoch: 24, step: 1282, loss: 0.35669466853141785, mean loss: 0.3505701013847514
Epoch: 24, step: 1283, loss: 0.32870757579803467, mean loss: 0.3505694930785303
Epoch: 24, step: 1284, loss: 0.3413967192173004, mean loss: 0.35056923786098315
Epoch: 24, step: 1285, loss: 0.34542304277420044, mean loss: 0.35056909468043984
Epoch: 24, step: 1286, loss: 0.3262462615966797, mean loss: 0.3505684179747368
Epoch: 24, step: 1287, loss: 0.3283669948577881, mean loss: 0.3505678003077238
Epoch: 24, step: 1288, loss: 0.32726752758026123, mean loss: 0.3505671520875895
Epoch: 24, step: 1289, loss: 0.3406847417354584, mean loss: 0.35056687716380514
Epoch: 24, step: 1290, loss: 0.31258195638656616, mean loss: 0.35056582047143087
Epoch: 24, step: 1291, loss: 0.32944533228874207, mean loss: 0.35056523294255076
Epoch: 24, step: 1292, loss: 0.31705233454704285, mean loss: 0.3505643007080409
Epoch: 24, step: 1293, loss: 0.3247835636138916, mean loss: 0.3505635835804444
Epoch: 24, step: 1294, loss: 0.33217719197273254, mean loss: 0.3505630721512322
Epoch: 24, step: 1295, loss: 0.3073294162750244, mean loss: 0.35056186961296243
Epoch: 24, step: 1296, loss: 0.31886717677116394, mean loss: 0.3505609880539036
Epoch: 24, step: 1297, loss: 0.3122733235359192, mean loss: 0.35055992314695256
Epoch: 24, step: 1298, loss: 0.33425605297088623, mean loss: 0.35055946969485474
Epoch: 24, step: 1299, loss: 0.33295243978500366, mean loss: 0.35055898001218955
Epoch: 24, step: 1300, loss: 0.3627106249332428, mean loss: 0.35055931796154355
Epoch: 24, step: 1301, loss: 0.3285854458808899, mean loss: 0.35055870686325996
Epoch: 24, step: 1302, loss: 0.33711689710617065, mean loss: 0.3505583330539283
Epoch: 24, step: 1303, loss: 0.32736682891845703, mean loss: 0.3505576881288967
Epoch: 24, step: 1304, loss: 0.3161050081253052, mean loss: 0.35055673007211285
Epoch: 24, step: 1305, loss: 0.34577232599258423, mean loss: 0.35055659703156783
Epoch: 24, step: 1306, loss: 0.3656628429889679, mean loss: 0.3505570170812288
Epoch: 24, step: 1307, loss: 0.33113059401512146, mean loss: 0.3505564769182028
Epoch: 24, step: 1308, loss: 0.3522723615169525, mean loss: 0.3505565246280484
Epoch: 24, step: 1309, loss: 0.3406326472759247, mean loss: 0.3505562487041939
Epoch: 24, step: 1310, loss: 0.3427578806877136, mean loss: 0.35055603188410833
Epoch: 24, step: 1311, loss: 0.41951340436935425, mean loss: 0.35055794907084337
Epoch: 24, step: 1312, loss: 0.317051500082016, mean loss: 0.3505570175339925
Epoch: 24, step: 1313, loss: 0.31538254022598267, mean loss: 0.35055603965027526
Epoch: 24, step: 1314, loss: 0.3297765851020813, mean loss: 0.35055546197785725
Epoch: 24, step: 1315, loss: 0.339389830827713, mean loss: 0.3505551515800159
Epoch: 24, step: 1316, loss: 0.3334169089794159, mean loss: 0.3505546751604067
Epoch: 24, step: 1317, loss: 0.33820778131484985, mean loss: 0.3505543319432542
Epoch: 24, step: 1318, loss: 0.3545399606227875, mean loss: 0.3505544427320987
Epoch: 24, step: 1319, loss: 0.33327817916870117, mean loss: 0.35055396251574433
Epoch: 24, step: 1320, loss: 0.353270947933197, mean loss: 0.3505540380358104
Epoch: 24, step: 1321, loss: 0.3692845106124878, mean loss: 0.3505545586448653
Epoch: 24, step: 1322, loss: 0.29824718832969666, mean loss: 0.3505531048142887
Epoch: 24, step: 1323, loss: 0.3336924612522125, mean loss: 0.3505526362027389
Epoch: 24, step: 1324, loss: 0.45423638820648193, mean loss: 0.3505555178278189
Epoch: 24, step: 1325, loss: 0.36433109641075134, mean loss: 0.3505559006742027
Epoch: 24, step: 1326, loss: 0.3679848611354828, mean loss: 0.35055638504072195
Epoch: 24, step: 1327, loss: 0.3289972245693207, mean loss: 0.3505557859088725
Epoch: 24, step: 1328, loss: 0.3110198974609375, mean loss: 0.35055468723196687
Epoch: 24, step: 1329, loss: 0.379259318113327, mean loss: 0.3505554848930262
Epoch: 24, step: 1330, loss: 0.30919259786605835, mean loss: 0.3505543355088867
Epoch: 24, step: 1331, loss: 0.30446094274520874, mean loss: 0.35055305470993253
Epoch: 24, step: 1332, loss: 0.40720999240875244, mean loss: 0.350554628994789
Epoch: 24, step: 1333, loss: 0.35000544786453247, mean loss: 0.35055461373551894
Epoch: 24, step: 1334, loss: 0.3448358476161957, mean loss: 0.3505544548411809
Epoch: 24, step: 1335, loss: 0.33163338899612427, mean loss: 0.3505539291391959
Epoch: 24, step: 1336, loss: 0.31279799342155457, mean loss: 0.3505528801592354
Epoch: 24, step: 1337, loss: 0.3541141450405121, mean loss: 0.35055297909975
Epoch: 24, step: 1338, loss: 0.34674546122550964, mean loss: 0.35055287332067303
Epoch: 24, step: 1339, loss: 0.32477715611457825, mean loss: 0.3505521572489649
Epoch: 24, step: 1340, loss: 0.3150195777416229, mean loss: 0.35055117015060927
Epoch: 24, step: 1341, loss: 0.3284396231174469, mean loss: 0.3505505559068448
Epoch: 24, step: 1342, loss: 0.29236048460006714, mean loss: 0.3505489394710742
Epoch: 24, step: 1343, loss: 0.38102981448173523, mean loss: 0.3505497861620467
Epoch: 24, step: 1344, loss: 0.3085397779941559, mean loss: 0.3505486192497896
Epoch: 24, step: 1345, loss: 0.31496116518974304, mean loss: 0.3505476307643149
Epoch: 24, step: 1346, loss: 0.342036634683609, mean loss: 0.35054739436745685
Epoch: 24, step: 1347, loss: 0.3061111271381378, mean loss: 0.3505461601638342
Epoch: 24, step: 1348, loss: 0.32650357484817505, mean loss: 0.3505454924069861
Epoch: 24, step: 1349, loss: 0.4117155373096466, mean loss: 0.3505471912917526
Epoch: 24, step: 1350, loss: 0.3151153028011322, mean loss: 0.3505462072639666
Epoch: 24, step: 1351, loss: 0.35641995072364807, mean loss: 0.35054637038725756
Epoch: 24, step: 1352, loss: 0.34069621562957764, mean loss: 0.35054609684023436
Epoch: 24, step: 1353, loss: 0.3228492736816406, mean loss: 0.3505453276976862
Epoch: 24, step: 1354, loss: 0.37923502922058105, mean loss: 0.3505461243904057
Epoch: 24, step: 1355, loss: 0.31415945291519165, mean loss: 0.35054511398633276
Epoch: 24, step: 1356, loss: 0.357605516910553, mean loss: 0.35054531003783984
Epoch: 24, step: 1357, loss: 0.3092590272426605, mean loss: 0.3505441636424715
Epoch: 24, step: 1358, loss: 0.29702311754226685, mean loss: 0.35054267756594504
Epoch: 24, step: 1359, loss: 0.3258478045463562, mean loss: 0.3505419919019896
Epoch: 24, step: 1360, loss: 0.3399304151535034, mean loss: 0.35054169727509815
Epoch: 24, step: 1361, loss: 0.2883681654930115, mean loss: 0.3505399710956384
Epoch: 24, step: 1362, loss: 0.3099232017993927, mean loss: 0.3505388434471946
Epoch: 24, step: 1363, loss: 0.36621060967445374, mean loss: 0.3505392785323203
Epoch: 24, step: 1364, loss: 0.3214278519153595, mean loss: 0.3505384703530189
Epoch: 24, step: 1365, loss: 0.38410717248916626, mean loss: 0.35053940224747604
Epoch: 24, step: 1366, loss: 0.3200775980949402, mean loss: 0.3505385566265074
Epoch: 24, step: 1367, loss: 0.31569191813468933, mean loss: 0.35053758930920526
Epoch: 24, step: 1368, loss: 0.3147461712360382, mean loss: 0.35053659579308943
Epoch: 24, step: 1369, loss: 0.372454434633255, mean loss: 0.35053720418255374
Epoch: 24, step: 1370, loss: 0.3451554775238037, mean loss: 0.35053705480218184
Epoch: 24, step: 1371, loss: 0.3363434374332428, mean loss: 0.3505366608414466
Epoch: 24, step: 1372, loss: 0.31472331285476685, mean loss: 0.35053566682695864
Epoch: 24, step: 1373, loss: 0.331743448972702, mean loss: 0.35053514525554996
Epoch: 24, step: 1374, loss: 0.30173686146736145, mean loss: 0.3505337909139056
Epoch: 24, step: 1375, loss: 0.3207504451274872, mean loss: 0.35053296433348297
Epoch: 24, step: 1376, loss: 0.333526074886322, mean loss: 0.3505324923525364
Epoch: 24, step: 1377, loss: 0.4004335403442383, mean loss: 0.35053387718486123
Epoch: 24, step: 1378, loss: 0.33953654766082764, mean loss: 0.35053357200019286
Epoch: 24, step: 1379, loss: 0.32484427094459534, mean loss: 0.3505328591213757
Epoch: 24, step: 1380, loss: 0.3007795214653015, mean loss: 0.3505314785031873
Epoch: 24, step: 1381, loss: 0.3702046275138855, mean loss: 0.35053202440332076
Epoch: 24, step: 1382, loss: 0.3174344599246979, mean loss: 0.3505311060214434
Epoch: 24, step: 1383, loss: 0.3160746693611145, mean loss: 0.35053014996049275
Epoch: 24, step: 1384, loss: 0.2995816469192505, mean loss: 0.35052873633426035
Epoch: 24, step: 1385, loss: 0.3234756290912628, mean loss: 0.3505279857347586
Epoch: 24, step: 1386, loss: 0.32425352931022644, mean loss: 0.3505272567594673
Epoch: 24, step: 1387, loss: 0.3179040849208832, mean loss: 0.35052635166647433
Epoch: 24, step: 1388, loss: 0.3141733407974243, mean loss: 0.35052534312129835
Epoch: 24, step: 1389, loss: 0.316087543964386, mean loss: 0.35052438773653566
Epoch: 24, step: 1390, loss: 0.3085342347621918, mean loss: 0.350523222864203
Epoch: 24, step: 1391, loss: 0.33457309007644653, mean loss: 0.35052278039491797
Epoch: 24, step: 1392, loss: 0.36473140120506287, mean loss: 0.35052317454235093
Epoch: 24, step: 1393, loss: 0.2996327877044678, mean loss: 0.3505217628811349
Epoch: 24, step: 1394, loss: 0.40732496976852417, mean loss: 0.3505233385158437
Epoch: 24, step: 1395, loss: 0.34866487979888916, mean loss: 0.3505232869664507
Epoch: 24, step: 1396, loss: 0.3452872931957245, mean loss: 0.3505231417359908
Epoch: 24, step: 1397, loss: 0.3383825719356537, mean loss: 0.3505228050030402
Epoch: 24, step: 1398, loss: 0.3274167776107788, mean loss: 0.35052216414803006
Epoch: 24, step: 1399, loss: 0.3022407293319702, mean loss: 0.35052082508005755
Epoch: 24, step: 1400, loss: 0.33704686164855957, mean loss: 0.35052045139496363
Epoch: 24, step: 1401, loss: 0.28813934326171875, mean loss: 0.3505187213736609
Epoch: 24, step: 1402, loss: 0.3166194260120392, mean loss: 0.35051778126729743
Epoch: 24, step: 1403, loss: 0.2907205820083618, mean loss: 0.35051612299776724
Epoch: 24, step: 1404, loss: 0.3202019929885864, mean loss: 0.3505152823630092
Epoch: 24, step: 1405, loss: 0.3307168781757355, mean loss: 0.3505147333528548
Epoch: 24, step: 1406, loss: 0.33443883061408997, mean loss: 0.3505142875801033
Epoch: 24, step: 1407, loss: 0.3355085253715515, mean loss: 0.3505138714930855
Epoch: 24, step: 1408, loss: 0.3407225012779236, mean loss: 0.350513600000774
Epoch: 24, step: 1409, loss: 0.3000968396663666, mean loss: 0.3505122020980308
Epoch: 24, step: 1410, loss: 0.34313541650772095, mean loss: 0.35051199756797313
Epoch: 24, step: 1411, loss: 0.3625180721282959, mean loss: 0.35051233044128355
Epoch: 24, step: 1412, loss: 0.3570834994316101, mean loss: 0.3505125126245709
Epoch: 24, step: 1413, loss: 0.3357016444206238, mean loss: 0.3505121020099825
Epoch: 24, step: 1414, loss: 0.35393157601356506, mean loss: 0.35051219680840795
Epoch: 24, step: 1415, loss: 0.3627273440361023, mean loss: 0.3505125354407884
Epoch: 24, step: 1416, loss: 0.3047843277454376, mean loss: 0.35051126778332453
Epoch: 24, step: 1417, loss: 0.38576632738113403, mean loss: 0.3505122450816446
Epoch: 24, step: 1418, loss: 0.31341639161109924, mean loss: 0.35051121678355807
Epoch: 24, step: 1419, loss: 0.33209019899368286, mean loss: 0.35051070616658864
Epoch: 24, step: 1420, loss: 0.360907644033432, mean loss: 0.3505109943540174
Epoch: 24, step: 1421, loss: 0.3169303238391876, mean loss: 0.3505100635743036
Epoch: 24, step: 1422, loss: 0.3590266704559326, mean loss: 0.35051029962870867
Epoch: 24, step: 1423, loss: 0.3248467445373535, mean loss: 0.35050958833283585
Epoch: 24, step: 1424, loss: 0.37139540910720825, mean loss: 0.3505101671920907
Epoch: 24, step: 1425, loss: 0.31370678544044495, mean loss: 0.350509147199248
Epoch: 24, step: 1426, loss: 0.36405304074287415, mean loss: 0.3505095225531139
Epoch: 24, step: 1427, loss: 0.36182984709739685, mean loss: 0.3505098362745568
Epoch: 24, step: 1428, loss: 0.36434558033943176, mean loss: 0.3505102196954814
Epoch: 24, step: 1429, loss: 0.3144848942756653, mean loss: 0.35050922137686974
Epoch: 24, step: 1430, loss: 0.29514244198799133, mean loss: 0.3505076871185665
Epoch: 24, step: 1431, loss: 0.32406771183013916, mean loss: 0.35050695446573765
Epoch: 24, step: 1432, loss: 0.34237319231033325, mean loss: 0.35050672908509106
Epoch: 24, step: 1433, loss: 0.3464970886707306, mean loss: 0.35050661798394356
Epoch: 24, step: 1434, loss: 0.3521009385585785, mean loss: 0.35050666215896153
Epoch: 24, step: 1435, loss: 0.3083418309688568, mean loss: 0.35050549389920344
Epoch: 24, step: 1436, loss: 0.366180956363678, mean loss: 0.35050592820675514
Epoch: 24, step: 1437, loss: 0.3234705626964569, mean loss: 0.3505051791801715
Epoch: 24, step: 1438, loss: 0.3555193543434143, mean loss: 0.35050531809623087
Epoch: 24, step: 1439, loss: 0.31566041707992554, mean loss: 0.3505043527565529
Epoch: 24, step: 1440, loss: 0.3247053623199463, mean loss: 0.3505036380436838
Epoch: 24, step: 1441, loss: 0.3560808002948761, mean loss: 0.3505037925442725
Epoch: 24, step: 1442, loss: 0.3372921943664551, mean loss: 0.35050342656188577
Epoch: 24, step: 1443, loss: 0.30218905210494995, mean loss: 0.3505020882135629
Valid: 24, mean loss: 0.18693167716264725
Epoch: 25, step: 0, loss: 0.3145553469657898, mean loss: 0.35050109248654016
Epoch: 25, step: 1, loss: 0.3201124668121338, mean loss: 0.35050025074298924
Epoch: 25, step: 2, loss: 0.361085444688797, mean loss: 0.3505005439372929
Epoch: 25, step: 3, loss: 0.31555628776550293, mean loss: 0.35049957605960147
Epoch: 25, step: 4, loss: 0.34000393748283386, mean loss: 0.35049928536195357
Epoch: 25, step: 5, loss: 0.33966854214668274, mean loss: 0.35049898539122254
Epoch: 25, step: 6, loss: 0.30956965684890747, mean loss: 0.35049785183461185
Epoch: 25, step: 7, loss: 0.31052008271217346, mean loss: 0.3504967446625413
Epoch: 25, step: 8, loss: 0.3625185489654541, mean loss: 0.35049707759350873
Epoch: 25, step: 9, loss: 0.33247408270835876, mean loss: 0.3504965784798315
Epoch: 25, step: 10, loss: 0.312813401222229, mean loss: 0.3504955349424812
Epoch: 25, step: 11, loss: 0.3250073790550232, mean loss: 0.3504948291339996
Epoch: 25, step: 12, loss: 0.3889112174510956, mean loss: 0.3504958929168013
Epoch: 25, step: 13, loss: 0.3497334122657776, mean loss: 0.35049587180364156
Epoch: 25, step: 14, loss: 0.34766942262649536, mean loss: 0.35049579354116955
Epoch: 25, step: 15, loss: 0.33009931445121765, mean loss: 0.3504952287920531
Epoch: 25, step: 16, loss: 0.3040037751197815, mean loss: 0.350493941546333
Epoch: 25, step: 17, loss: 0.3402304947376251, mean loss: 0.3504936573820158
Epoch: 25, step: 18, loss: 0.3340819478034973, mean loss: 0.3504932030031687
Epoch: 25, step: 19, loss: 0.3280530273914337, mean loss: 0.35049258173584835
Epoch: 25, step: 20, loss: 0.31489190459251404, mean loss: 0.35049159614084424
Epoch: 25, step: 21, loss: 0.2970680296421051, mean loss: 0.35049011716497086
Epoch: 25, step: 22, loss: 0.39743366837501526, mean loss: 0.35049141671238415
Epoch: 25, step: 23, loss: 0.3073725700378418, mean loss: 0.35049022307805033
Epoch: 25, step: 24, loss: 0.3113466799259186, mean loss: 0.3504891395197624
Epoch: 25, step: 25, loss: 0.3621942400932312, mean loss: 0.3504894635274182
Epoch: 25, step: 26, loss: 0.33067435026168823, mean loss: 0.35048891504253804
Epoch: 25, step: 27, loss: 0.3094387352466583, mean loss: 0.3504877787997403
Epoch: 25, step: 28, loss: 0.3546050190925598, mean loss: 0.3504878927591716
Epoch: 25, step: 29, loss: 0.31902164220809937, mean loss: 0.35048702184163627
Epoch: 25, step: 30, loss: 0.33901891112327576, mean loss: 0.3504867044380018
Epoch: 25, step: 31, loss: 0.34006306529045105, mean loss: 0.3504864159502583
Epoch: 25, step: 32, loss: 0.33632445335388184, mean loss: 0.3504860240104084
Epoch: 25, step: 33, loss: 0.33571451902389526, mean loss: 0.35048561521246224
Epoch: 25, step: 34, loss: 0.33460626006126404, mean loss: 0.3504851757671834
Epoch: 25, step: 35, loss: 0.3288581371307373, mean loss: 0.35048457727707283
Epoch: 25, step: 36, loss: 0.353010892868042, mean loss: 0.35048464718646183
Epoch: 25, step: 37, loss: 0.3581634759902954, mean loss: 0.35048485967273124
Epoch: 25, step: 38, loss: 0.31747692823410034, mean loss: 0.3504839463123328
Epoch: 25, step: 39, loss: 0.2957906126976013, mean loss: 0.3504824329384088
Epoch: 25, step: 40, loss: 0.32908716797828674, mean loss: 0.3504818409441375
Epoch: 25, step: 41, loss: 0.3294951021671295, mean loss: 0.35048126026960985
Epoch: 25, step: 42, loss: 0.3675777018070221, mean loss: 0.35048173329181437
Epoch: 25, step: 43, loss: 0.33890077471733093, mean loss: 0.3504814128801672
Epoch: 25, step: 44, loss: 0.316987007856369, mean loss: 0.3504804862124393
Epoch: 25, step: 45, loss: 0.3496323227882385, mean loss: 0.35048046274750755
Epoch: 25, step: 46, loss: 0.368437796831131, mean loss: 0.3504809595337992
Epoch: 25, step: 47, loss: 0.3226548731327057, mean loss: 0.3504801897516148
Epoch: 25, step: 48, loss: 0.3239451050758362, mean loss: 0.35047945570407063
Epoch: 25, step: 49, loss: 0.3334280550479889, mean loss: 0.3504789840194052
Epoch: 25, step: 50, loss: 0.30935096740722656, mean loss: 0.3504778463464055
Epoch: 25, step: 51, loss: 0.3532525897026062, mean loss: 0.35047792309854525
Epoch: 25, step: 52, loss: 0.314683735370636, mean loss: 0.3504769330233723
Epoch: 25, step: 53, loss: 0.3567044734954834, mean loss: 0.35047710527375875
Epoch: 25, step: 54, loss: 0.3512327969074249, mean loss: 0.3504771261752007
Epoch: 25, step: 55, loss: 0.3060041069984436, mean loss: 0.35047589614369346
Epoch: 25, step: 56, loss: 0.3132629692554474, mean loss: 0.35047486693975266
Epoch: 25, step: 57, loss: 0.3213137984275818, mean loss: 0.35047406044966717
Epoch: 25, step: 58, loss: 0.34862005710601807, mean loss: 0.35047400917603283
Epoch: 25, step: 59, loss: 0.3649604916572571, mean loss: 0.3504744097977829
Epoch: 25, step: 60, loss: 0.3373326361179352, mean loss: 0.3504740463738267
Epoch: 25, step: 61, loss: 0.3616735339164734, mean loss: 0.3504743560770384
Epoch: 25, step: 62, loss: 0.3248879015445709, mean loss: 0.3504736485457348
Epoch: 25, step: 63, loss: 0.3502741754055023, mean loss: 0.3504736430299418
Epoch: 25, step: 64, loss: 0.35220181941986084, mean loss: 0.35047369081582286
Epoch: 25, step: 65, loss: 0.330683171749115, mean loss: 0.3504731436024438
Epoch: 25, step: 66, loss: 0.3468124568462372, mean loss: 0.35047304238623134
Epoch: 25, step: 67, loss: 0.3204798698425293, mean loss: 0.35047221311249366
Epoch: 25, step: 68, loss: 0.4254312813282013, mean loss: 0.3504742855797506
Epoch: 25, step: 69, loss: 0.3351438045501709, mean loss: 0.35047386173454653
Epoch: 25, step: 70, loss: 0.3972523510456085, mean loss: 0.3504751549940448
Epoch: 25, step: 71, loss: 0.3619672358036041, mean loss: 0.3504754727005805
Epoch: 25, step: 72, loss: 0.34051185846328735, mean loss: 0.3504751972571769
Epoch: 25, step: 73, loss: 0.3406776785850525, mean loss: 0.35047492641296085
Epoch: 25, step: 74, loss: 0.33305853605270386, mean loss: 0.35047444496471314
Epoch: 25, step: 75, loss: 0.367001473903656, mean loss: 0.3504749018153583
Epoch: 25, step: 76, loss: 0.3751027286052704, mean loss: 0.35047558257459177
Epoch: 25, step: 77, loss: 0.32508155703544617, mean loss: 0.35047488065559296
Epoch: 25, step: 78, loss: 0.32621440291404724, mean loss: 0.35047421008764634
Epoch: 25, step: 79, loss: 0.3252743184566498, mean loss: 0.3504735135732287
Epoch: 25, step: 80, loss: 0.33783939480781555, mean loss: 0.3504731643811454
Epoch: 25, step: 81, loss: 0.32658594846725464, mean loss: 0.3504725041850282
Epoch: 25, step: 82, loss: 0.3050003945827484, mean loss: 0.3504712474592287
Epoch: 25, step: 83, loss: 0.2950231730937958, mean loss: 0.35046971506716684
Epoch: 25, step: 84, loss: 0.3234347403049469, mean loss: 0.3504689679350745
Epoch: 25, step: 85, loss: 0.336887925863266, mean loss: 0.3504685926230181
Epoch: 25, step: 86, loss: 0.3046746551990509, mean loss: 0.35046732714266815
Epoch: 25, step: 87, loss: 0.3387019634246826, mean loss: 0.3504670020248468
Epoch: 25, step: 88, loss: 0.30277878046035767, mean loss: 0.3504656842702373
Epoch: 25, step: 89, loss: 0.3882695138454437, mean loss: 0.35046672886348335
Epoch: 25, step: 90, loss: 0.39084097743034363, mean loss: 0.3504678444515734
Epoch: 25, step: 91, loss: 0.3155868947505951, mean loss: 0.350466880676438
Epoch: 25, step: 92, loss: 0.29159870743751526, mean loss: 0.35046525416928914
Epoch: 25, step: 93, loss: 0.35807478427886963, mean loss: 0.3504654644121501
Epoch: 25, step: 94, loss: 0.3364032804965973, mean loss: 0.350465075900369
Epoch: 25, step: 95, loss: 0.35967448353767395, mean loss: 0.3504653303320089
Epoch: 25, step: 96, loss: 0.306415319442749, mean loss: 0.350464113380027
Epoch: 25, step: 97, loss: 0.35433095693588257, mean loss: 0.35046422020481166
Epoch: 25, step: 98, loss: 0.3502165675163269, mean loss: 0.3504642133633882
Epoch: 25, step: 99, loss: 0.3009371757507324, mean loss: 0.3504628452131779
Epoch: 25, step: 100, loss: 0.3465674817562103, mean loss: 0.35046273760942503
Epoch: 25, step: 101, loss: 0.34658464789390564, mean loss: 0.3504626304857933
Epoch: 25, step: 102, loss: 0.3668343424797058, mean loss: 0.35046308270555393
Epoch: 25, step: 103, loss: 0.3123571276664734, mean loss: 0.3504620301711644
Epoch: 25, step: 104, loss: 0.3153359293937683, mean loss: 0.35046105997089433
Epoch: 25, step: 105, loss: 0.3467468023300171, mean loss: 0.35046095738409544
Epoch: 25, step: 106, loss: 0.3156159222126007, mean loss: 0.3504599950001594
Epoch: 25, step: 107, loss: 0.3316009044647217, mean loss: 0.3504594741459135
Epoch: 25, step: 108, loss: 0.33865073323249817, mean loss: 0.35045914801868233
Epoch: 25, step: 109, loss: 0.33150237798690796, mean loss: 0.35045862449562154
Epoch: 25, step: 110, loss: 0.308887243270874, mean loss: 0.3504574764637742
Epoch: 25, step: 111, loss: 0.3758190870285034, mean loss: 0.350458176828586
Epoch: 25, step: 112, loss: 0.3759300410747528, mean loss: 0.3504588802186461
Epoch: 25, step: 113, loss: 0.3056875765323639, mean loss: 0.35045764392042755
Epoch: 25, step: 114, loss: 0.31965166330337524, mean loss: 0.3504567932789636
Epoch: 25, step: 115, loss: 0.34897610545158386, mean loss: 0.35045675239405566
Epoch: 25, step: 116, loss: 0.3983016014099121, mean loss: 0.3504580734545802
Epoch: 25, step: 117, loss: 0.3063555657863617, mean loss: 0.3504568557587475
Epoch: 25, step: 118, loss: 0.326551228761673, mean loss: 0.3504561957287357
Epoch: 25, step: 119, loss: 0.33844077587127686, mean loss: 0.35045586399433876
Epoch: 25, step: 120, loss: 0.3858250081539154, mean loss: 0.3504568404760527
Epoch: 25, step: 121, loss: 0.313384473323822, mean loss: 0.3504558169995149
Epoch: 25, step: 122, loss: 0.3284062445163727, mean loss: 0.35045520828205684
Epoch: 25, step: 123, loss: 0.31302863359451294, mean loss: 0.3504541750837715
Epoch: 25, step: 124, loss: 0.329887717962265, mean loss: 0.35045360734168396
Epoch: 25, step: 125, loss: 0.34149935841560364, mean loss: 0.350453360164272
Epoch: 25, step: 126, loss: 0.36541324853897095, mean loss: 0.3504537731128566
Epoch: 25, step: 127, loss: 0.27174514532089233, mean loss: 0.3504516005218278
Epoch: 25, step: 128, loss: 0.2960543930530548, mean loss: 0.3504500990393836
Epoch: 25, step: 129, loss: 0.37265023589134216, mean loss: 0.350450711795024
Epoch: 25, step: 130, loss: 0.38552188873291016, mean loss: 0.3504516797831264
Epoch: 25, step: 131, loss: 0.2968432605266571, mean loss: 0.3504502001954896
Epoch: 25, step: 132, loss: 0.36456024646759033, mean loss: 0.3504505896207724
Epoch: 25, step: 133, loss: 0.3356553912162781, mean loss: 0.35045018129714256
Epoch: 25, step: 134, loss: 0.34722259640693665, mean loss: 0.3504500922234599
Epoch: 25, step: 135, loss: 0.3495911657810211, mean loss: 0.35045006851978283
Epoch: 25, step: 136, loss: 0.3482503294944763, mean loss: 0.3504500078155572
Epoch: 25, step: 137, loss: 0.31135842204093933, mean loss: 0.35044892906988206
Epoch: 25, step: 138, loss: 0.31615808606147766, mean loss: 0.35044798282845685
Epoch: 25, step: 139, loss: 0.3245263993740082, mean loss: 0.35044726755297523
Epoch: 25, step: 140, loss: 0.3523291349411011, mean loss: 0.35044731947945046
Epoch: 25, step: 141, loss: 0.32236507534980774, mean loss: 0.3504465446258516
Epoch: 25, step: 142, loss: 0.30439475178718567, mean loss: 0.3504452739862015
Epoch: 25, step: 143, loss: 0.34037908911705017, mean loss: 0.3504449962523733
Epoch: 25, step: 144, loss: 0.3229007422924042, mean loss: 0.3504442363060646
Epoch: 25, step: 145, loss: 0.37657174468040466, mean loss: 0.35044495714445706
Epoch: 25, step: 146, loss: 0.3227631151676178, mean loss: 0.3504441934442342
Epoch: 25, step: 147, loss: 0.3168092966079712, mean loss: 0.3504432655338161
Epoch: 25, step: 148, loss: 0.30882057547569275, mean loss: 0.35044211729000085
Epoch: 25, step: 149, loss: 0.36091235280036926, mean loss: 0.3504424061240839
Epoch: 25, step: 150, loss: 0.34067773818969727, mean loss: 0.35044213676136465
Epoch: 25, step: 151, loss: 0.3114144802093506, mean loss: 0.35044106019575305
Epoch: 25, step: 152, loss: 0.32664310932159424, mean loss: 0.35044040375488267
Epoch: 25, step: 153, loss: 0.3182441294193268, mean loss: 0.35043951567979204
Epoch: 25, step: 154, loss: 0.3400075137615204, mean loss: 0.350439227940117
Epoch: 25, step: 155, loss: 0.3319176435470581, mean loss: 0.3504387170844133
Epoch: 25, step: 156, loss: 0.3444124460220337, mean loss: 0.35043855087454867
Epoch: 25, step: 157, loss: 0.2945183217525482, mean loss: 0.3504370085879051
Epoch: 25, step: 158, loss: 0.3577413260936737, mean loss: 0.3504372100363043
Epoch: 25, step: 159, loss: 0.3112196922302246, mean loss: 0.35043612847210664
Epoch: 25, step: 160, loss: 0.2986409068107605, mean loss: 0.35043470007185124
Epoch: 25, step: 161, loss: 0.33022022247314453, mean loss: 0.3504341426156271
Epoch: 25, step: 162, loss: 0.3789549767971039, mean loss: 0.3504349291152047
Epoch: 25, step: 163, loss: 0.3099408745765686, mean loss: 0.35043381246909455
Epoch: 25, step: 164, loss: 0.3090793490409851, mean loss: 0.3504326721281755
Epoch: 25, step: 165, loss: 0.32121869921684265, mean loss: 0.3504318665810264
Epoch: 25, step: 166, loss: 0.3405058979988098, mean loss: 0.3504315928895553
Epoch: 25, step: 167, loss: 0.34631121158599854, mean loss: 0.350431479280277
Epoch: 25, step: 168, loss: 0.3348456621170044, mean loss: 0.35043104955193705
Epoch: 25, step: 169, loss: 0.35286879539489746, mean loss: 0.35043111676301625
Epoch: 25, step: 170, loss: 0.30181580781936646, mean loss: 0.3504297764275156
Epoch: 25, step: 171, loss: 0.326246976852417, mean loss: 0.3504291097204254
Epoch: 25, step: 172, loss: 0.3244088888168335, mean loss: 0.3504283923763705
Epoch: 25, step: 173, loss: 0.31695666909217834, mean loss: 0.35042746962940896
Epoch: 25, step: 174, loss: 0.3271501660346985, mean loss: 0.3504268279394408
Epoch: 25, step: 175, loss: 0.29686984419822693, mean loss: 0.35042535156432386
Epoch: 25, step: 176, loss: 0.36971527338027954, mean loss: 0.3504258833040437
Epoch: 25, step: 177, loss: 0.3179633617401123, mean loss: 0.3504249884773839
Epoch: 25, step: 178, loss: 0.32633814215660095, mean loss: 0.3504243245438047
Epoch: 25, step: 179, loss: 0.32457321882247925, mean loss: 0.3504236119995455
Epoch: 25, step: 180, loss: 0.39838722348213196, mean loss: 0.3504249340031144
Epoch: 25, step: 181, loss: 0.31596484780311584, mean loss: 0.3504239842184774
Epoch: 25, step: 182, loss: 0.31535446643829346, mean loss: 0.3504230176634026
Epoch: 25, step: 183, loss: 0.3510065972805023, mean loss: 0.3504230337470653
Epoch: 25, step: 184, loss: 0.3589072525501251, mean loss: 0.3504232675687217
Epoch: 25, step: 185, loss: 0.3495650589466095, mean loss: 0.35042324391748925
Epoch: 25, step: 186, loss: 0.31493642926216125, mean loss: 0.3504222659690599
Epoch: 25, step: 187, loss: 0.3237268328666687, mean loss: 0.3504215303144881
Epoch: 25, step: 188, loss: 0.30987417697906494, mean loss: 0.35042041296891957
Epoch: 25, step: 189, loss: 0.34241461753845215, mean loss: 0.35042019236281785
Epoch: 25, step: 190, loss: 0.3652121424674988, mean loss: 0.3504205999556123
Epoch: 25, step: 191, loss: 0.3254822790622711, mean loss: 0.35041991279808743
Epoch: 25, step: 192, loss: 0.3112857937812805, mean loss: 0.3504188345152501
Epoch: 25, step: 193, loss: 0.3412858545780182, mean loss: 0.3504185828764134
Epoch: 25, step: 194, loss: 0.35467493534088135, mean loss: 0.3504187001474553
Epoch: 25, step: 195, loss: 0.3606100380420685, mean loss: 0.35041898093150575
Epoch: 25, step: 196, loss: 0.341017484664917, mean loss: 0.350418721915712
Epoch: 25, step: 197, loss: 0.29971858859062195, mean loss: 0.350417325140867
Epoch: 25, step: 198, loss: 0.3683800995349884, mean loss: 0.3504178199967692
Epoch: 25, step: 199, loss: 0.3384752869606018, mean loss: 0.35041749100136876
Epoch: 25, step: 200, loss: 0.3406917154788971, mean loss: 0.35041722308104917
Epoch: 25, step: 201, loss: 0.3609275817871094, mean loss: 0.3504175126066595
Epoch: 25, step: 202, loss: 0.34115585684776306, mean loss: 0.35041725748571195
Epoch: 25, step: 203, loss: 0.32747286558151245, mean loss: 0.35041662547844266
Epoch: 25, step: 204, loss: 0.37801799178123474, mean loss: 0.35041738574194087
Epoch: 25, step: 205, loss: 0.32955437898635864, mean loss: 0.35041681109844514
Epoch: 25, step: 206, loss: 0.3119761645793915, mean loss: 0.3504157523316366
Epoch: 25, step: 207, loss: 0.31978610157966614, mean loss: 0.35041490872552356
Epoch: 25, step: 208, loss: 0.3698769509792328, mean loss: 0.35041544473704284
Epoch: 25, step: 209, loss: 0.318378746509552, mean loss: 0.35041456242643343
Epoch: 25, step: 210, loss: 0.3707752525806427, mean loss: 0.35041512315707024
Epoch: 25, step: 211, loss: 0.3172747790813446, mean loss: 0.35041421050163746
Epoch: 25, step: 212, loss: 0.311624675989151, mean loss: 0.35041314230197035
Epoch: 25, step: 213, loss: 0.29779282212257385, mean loss: 0.35041169326523025
Epoch: 25, step: 214, loss: 0.34290051460266113, mean loss: 0.3504114864311765
Epoch: 25, step: 215, loss: 0.31705376505851746, mean loss: 0.35041056789055053
Epoch: 25, step: 216, loss: 0.3191319406032562, mean loss: 0.35040970662372545
Epoch: 25, step: 217, loss: 0.3361544907093048, mean loss: 0.35040931411268644
Epoch: 25, step: 218, loss: 0.35817936062812805, mean loss: 0.3504095280515756
Epoch: 25, step: 219, loss: 0.3214264512062073, mean loss: 0.35040873005937173
Epoch: 25, step: 220, loss: 0.31244367361068726, mean loss: 0.3504076847947466
Epoch: 25, step: 221, loss: 0.31761813163757324, mean loss: 0.3504067820483902
Epoch: 25, step: 222, loss: 0.41536569595336914, mean loss: 0.35040857041702456
Epoch: 25, step: 223, loss: 0.3184201121330261, mean loss: 0.3504076897745214
Epoch: 25, step: 224, loss: 0.3380827307701111, mean loss: 0.3504073504776459
Epoch: 25, step: 225, loss: 0.35967549681663513, mean loss: 0.35040760561573814
Epoch: 25, step: 226, loss: 0.3093721866607666, mean loss: 0.35040647600363267
Epoch: 25, step: 227, loss: 0.30131059885025024, mean loss: 0.3504051245425791
Epoch: 25, step: 228, loss: 0.3050646185874939, mean loss: 0.3504038764898952
Epoch: 25, step: 229, loss: 0.30493515729904175, mean loss: 0.350402624942436
Epoch: 25, step: 230, loss: 0.3647860586643219, mean loss: 0.3504030208421834
Epoch: 25, step: 231, loss: 0.3235175907611847, mean loss: 0.35040228084906216
Epoch: 25, step: 232, loss: 0.310837984085083, mean loss: 0.3504011919134729
Epoch: 25, step: 233, loss: 0.3386119604110718, mean loss: 0.3504008674451649
Epoch: 25, step: 234, loss: 0.34421324729919434, mean loss: 0.3504006971515046
Epoch: 25, step: 235, loss: 0.36778178811073303, mean loss: 0.3504011754950471
Epoch: 25, step: 236, loss: 0.3254193961620331, mean loss: 0.3504004879925199
Epoch: 25, step: 237, loss: 0.338507741689682, mean loss: 0.3504001607112633
Epoch: 25, step: 238, loss: 0.3426656424999237, mean loss: 0.35039994786781103
Epoch: 25, step: 239, loss: 0.33338990807533264, mean loss: 0.3503994797874645
Epoch: 25, step: 240, loss: 0.37513384222984314, mean loss: 0.35040016040611677
Epoch: 25, step: 241, loss: 0.3492021858692169, mean loss: 0.3504001274422035
Epoch: 25, step: 242, loss: 0.35939592123031616, mean loss: 0.350400374967003
Epoch: 25, step: 243, loss: 0.31782373785972595, mean loss: 0.3503994786254581
Epoch: 25, step: 244, loss: 0.33672037720680237, mean loss: 0.35039910225728044
Epoch: 25, step: 245, loss: 0.37332648038864136, mean loss: 0.3503997330661213
Epoch: 25, step: 246, loss: 0.3297356367111206, mean loss: 0.3503991645433724
Epoch: 25, step: 247, loss: 0.37785008549690247, mean loss: 0.35039991976844537
Epoch: 25, step: 248, loss: 0.32011038064956665, mean loss: 0.35039908647071727
Epoch: 25, step: 249, loss: 0.28899523615837097, mean loss: 0.3503973972313689
Epoch: 25, step: 250, loss: 0.30762025713920593, mean loss: 0.35039622045108526
Epoch: 25, step: 251, loss: 0.34668099880218506, mean loss: 0.3503961182497855
Epoch: 25, step: 252, loss: 0.33744263648986816, mean loss: 0.35039576192481203
Epoch: 25, step: 253, loss: 0.32658958435058594, mean loss: 0.35039510708139526
Epoch: 25, step: 254, loss: 0.3514827489852905, mean loss: 0.350395136998653
Epoch: 25, step: 255, loss: 0.2864643931388855, mean loss: 0.3503933785339193
Epoch: 25, step: 256, loss: 0.3007507920265198, mean loss: 0.35039201311360113
Epoch: 25, step: 257, loss: 0.30726540088653564, mean loss: 0.3503908269479092
Epoch: 25, step: 258, loss: 0.35363146662712097, mean loss: 0.3503909160768643
Epoch: 25, step: 259, loss: 0.32544344663619995, mean loss: 0.35039022995284225
Epoch: 25, step: 260, loss: 0.3387664258480072, mean loss: 0.35038991027505273
Epoch: 25, step: 261, loss: 0.3509847819805145, mean loss: 0.3503899266347608
Epoch: 25, step: 262, loss: 0.3367471694946289, mean loss: 0.35038955145237377
Epoch: 25, step: 263, loss: 0.33931803703308105, mean loss: 0.3503892469887719
Epoch: 25, step: 264, loss: 0.34562334418296814, mean loss: 0.35038911593135935
Epoch: 25, step: 265, loss: 0.3267756998538971, mean loss: 0.35038846660462347
Epoch: 25, step: 266, loss: 0.33289769291877747, mean loss: 0.35038798565283513
Epoch: 25, step: 267, loss: 0.3470728099346161, mean loss: 0.35038789449644164
Epoch: 25, step: 268, loss: 0.3299039304256439, mean loss: 0.35038733127050553
Epoch: 25, step: 269, loss: 0.30035078525543213, mean loss: 0.35038595550624885
Epoch: 25, step: 270, loss: 0.2880620062351227, mean loss: 0.35038424194464013
Epoch: 25, step: 271, loss: 0.37072890996932983, mean loss: 0.3503848012943604
Epoch: 25, step: 272, loss: 0.34937918186187744, mean loss: 0.3503847736469452
Epoch: 25, step: 273, loss: 0.3695141673088074, mean loss: 0.350385299555387
Epoch: 25, step: 274, loss: 0.3236500322818756, mean loss: 0.3503845645652214
Epoch: 25, step: 275, loss: 0.30146464705467224, mean loss: 0.35038321972473563
Epoch: 25, step: 276, loss: 0.3440777361392975, mean loss: 0.3503830463876384
Epoch: 25, step: 277, loss: 0.3496483862400055, mean loss: 0.3503830261924614
Epoch: 25, step: 278, loss: 0.3369564116001129, mean loss: 0.35038265711649474
Epoch: 25, step: 279, loss: 0.3635300397872925, mean loss: 0.3503830185068925
Epoch: 25, step: 280, loss: 0.3310645818710327, mean loss: 0.3503824875034392
Epoch: 25, step: 281, loss: 0.33751553297042847, mean loss: 0.3503821338407892
Epoch: 25, step: 282, loss: 0.33601272106170654, mean loss: 0.3503817388922479
Epoch: 25, step: 283, loss: 0.3393419682979584, mean loss: 0.35038143546847383
Epoch: 25, step: 284, loss: 0.3398105800151825, mean loss: 0.350381144940634
Epoch: 25, step: 285, loss: 0.40074092149734497, mean loss: 0.3503825289833031
Epoch: 25, step: 286, loss: 0.33961978554725647, mean loss: 0.3503822331979007
Epoch: 25, step: 287, loss: 0.3020268678665161, mean loss: 0.3503809043157051
Epoch: 25, step: 288, loss: 0.357594758272171, mean loss: 0.35038110255841465
Epoch: 25, step: 289, loss: 0.32339179515838623, mean loss: 0.3503803608901706
Epoch: 25, step: 290, loss: 0.36775222420692444, mean loss: 0.35038083825719313
Epoch: 25, step: 291, loss: 0.36377817392349243, mean loss: 0.35038120639677506
Epoch: 25, step: 292, loss: 0.3794102966785431, mean loss: 0.3503820040526507
Epoch: 25, step: 293, loss: 0.30123546719551086, mean loss: 0.35038065365047294
Epoch: 25, step: 294, loss: 0.33919811248779297, mean loss: 0.3503803463955983
Epoch: 25, step: 295, loss: 0.33320537209510803, mean loss: 0.3503798745037887
Epoch: 25, step: 296, loss: 0.2852849066257477, mean loss: 0.35037808603309395
Epoch: 25, step: 297, loss: 0.34934377670288086, mean loss: 0.3503780576164411
Epoch: 25, step: 298, loss: 0.35421159863471985, mean loss: 0.35037816293639545
Epoch: 25, step: 299, loss: 0.3333226442337036, mean loss: 0.35037769437818933
Epoch: 25, step: 300, loss: 0.3014960289001465, mean loss: 0.3503763515121835
Epoch: 25, step: 301, loss: 0.3146778345108032, mean loss: 0.35037537083757764
Epoch: 25, step: 302, loss: 0.2854999601840973, mean loss: 0.3503735886929562
Epoch: 25, step: 303, loss: 0.3677152991294861, mean loss: 0.3503740650612244
Epoch: 25, step: 304, loss: 0.32198116183280945, mean loss: 0.350373285143542
Epoch: 25, step: 305, loss: 0.30213871598243713, mean loss: 0.3503719602364069
Epoch: 25, step: 306, loss: 0.3338998258113861, mean loss: 0.35037150779224985
Epoch: 25, step: 307, loss: 0.3538772463798523, mean loss: 0.3503716040825868
Epoch: 25, step: 308, loss: 0.3177872598171234, mean loss: 0.35037070912957335
Epoch: 25, step: 309, loss: 0.32965537905693054, mean loss: 0.35037014018340273
Epoch: 25, step: 310, loss: 0.36120492219924927, mean loss: 0.3503704377523246
Epoch: 25, step: 311, loss: 0.33490464091300964, mean loss: 0.3503700130078217
Epoch: 25, step: 312, loss: 0.3289717137813568, mean loss: 0.35036942535233534
Epoch: 25, step: 313, loss: 0.3318996727466583, mean loss: 0.35036891813663246
Epoch: 25, step: 314, loss: 0.3180469572544098, mean loss: 0.35036803053644344
Epoch: 25, step: 315, loss: 0.31657350063323975, mean loss: 0.3503671025232102
Epoch: 25, step: 316, loss: 0.37816569209098816, mean loss: 0.35036786586422036
Epoch: 25, step: 317, loss: 0.3630213737487793, mean loss: 0.3503682133162464
Epoch: 25, step: 318, loss: 0.3270268738269806, mean loss: 0.3503675724051975
Epoch: 25, step: 319, loss: 0.3446562588214874, mean loss: 0.35036741558714196
Epoch: 25, step: 320, loss: 0.3745826780796051, mean loss: 0.3503680804580267
Epoch: 25, step: 321, loss: 0.32280421257019043, mean loss: 0.3503673236663105
Epoch: 25, step: 322, loss: 0.3448881208896637, mean loss: 0.3503671732338152
Epoch: 25, step: 323, loss: 0.3550088107585907, mean loss: 0.35036730066730754
Epoch: 25, step: 324, loss: 0.304206520318985, mean loss: 0.3503660333843879
Epoch: 25, step: 325, loss: 0.34904375672340393, mean loss: 0.3503659970840348
Epoch: 25, step: 326, loss: 0.3382152318954468, mean loss: 0.3503656635192288
Epoch: 25, step: 327, loss: 0.3262227475643158, mean loss: 0.3503650007621201
Epoch: 25, step: 328, loss: 0.363163024187088, mean loss: 0.3503653520762771
Epoch: 25, step: 329, loss: 0.32410547137260437, mean loss: 0.3503646312450747
Epoch: 25, step: 330, loss: 0.3629254102706909, mean loss: 0.35036497602778793
Epoch: 25, step: 331, loss: 0.3232743442058563, mean loss: 0.35036423243337034
Epoch: 25, step: 332, loss: 0.30729520320892334, mean loss: 0.35036305029000514
Epoch: 25, step: 333, loss: 0.36180657148361206, mean loss: 0.3503633643790756
Epoch: 25, step: 334, loss: 0.3588000535964966, mean loss: 0.35036359593360333
Epoch: 25, step: 335, loss: 0.32272401452064514, mean loss: 0.35036283735468654
Epoch: 25, step: 336, loss: 0.3487904965877533, mean loss: 0.35036279420237526
Epoch: 25, step: 337, loss: 0.3022315800189972, mean loss: 0.3503614732952403
Epoch: 25, step: 338, loss: 0.31841418147087097, mean loss: 0.3503605965617453
Epoch: 25, step: 339, loss: 0.3971461355686188, mean loss: 0.35036188046786515
Epoch: 25, step: 340, loss: 0.34197476506233215, mean loss: 0.3503616503118484
Epoch: 25, step: 341, loss: 0.34104421734809875, mean loss: 0.3503613946334289
Epoch: 25, step: 342, loss: 0.2888765335083008, mean loss: 0.35035970748195605
Epoch: 25, step: 343, loss: 0.32115960121154785, mean loss: 0.3503589062497568
Epoch: 25, step: 344, loss: 0.33861979842185974, mean loss: 0.35035858414500093
Epoch: 25, step: 345, loss: 0.3358318507671356, mean loss: 0.3503581855626221
Epoch: 25, step: 346, loss: 0.33261600136756897, mean loss: 0.3503576987685322
Epoch: 25, step: 347, loss: 0.3404461145401001, mean loss: 0.3503574268308613
Epoch: 25, step: 348, loss: 0.375838965177536, mean loss: 0.35035812593202587
Epoch: 25, step: 349, loss: 0.3628801107406616, mean loss: 0.35035846947070376
Epoch: 25, step: 350, loss: 0.30678847432136536, mean loss: 0.35035727416755297
Epoch: 25, step: 351, loss: 0.36838680505752563, mean loss: 0.35035776877774966
Epoch: 25, step: 352, loss: 0.3233555257320404, mean loss: 0.3503570280364377
Epoch: 25, step: 353, loss: 0.3761453330516815, mean loss: 0.3503577354568858
Epoch: 25, step: 354, loss: 0.3436534106731415, mean loss: 0.35035755155002024
Epoch: 25, step: 355, loss: 0.32765838503837585, mean loss: 0.3503569289044609
Epoch: 25, step: 356, loss: 0.29376670718193054, mean loss: 0.3503553766587544
Epoch: 25, step: 357, loss: 0.3517675995826721, mean loss: 0.3503554153943659
Epoch: 25, step: 358, loss: 0.33940139412879944, mean loss: 0.35035511494670507
Epoch: 25, step: 359, loss: 0.36485403776168823, mean loss: 0.3503555126132661
Epoch: 25, step: 360, loss: 0.3518773019313812, mean loss: 0.3503555543507203
Epoch: 25, step: 361, loss: 0.3479178547859192, mean loss: 0.3503554874948275
Epoch: 25, step: 362, loss: 0.3354932367801666, mean loss: 0.35035507989669473
Epoch: 25, step: 363, loss: 0.3129073977470398, mean loss: 0.3503540529198916
Epoch: 25, step: 364, loss: 0.3427239656448364, mean loss: 0.35035384367575956
Epoch: 25, step: 365, loss: 0.3185226321220398, mean loss: 0.35035297077465843
Epoch: 25, step: 366, loss: 0.30391040444374084, mean loss: 0.35035169722415166
Epoch: 25, step: 367, loss: 0.334553062915802, mean loss: 0.350351264005047
Epoch: 25, step: 368, loss: 0.3000617027282715, mean loss: 0.3503498850376699
Epoch: 25, step: 369, loss: 0.3098415732383728, mean loss: 0.3503487743079798
Epoch: 25, step: 370, loss: 0.3253185451030731, mean loss: 0.3503480880029921
Epoch: 25, step: 371, loss: 0.34194469451904297, mean loss: 0.3503478575962833
Epoch: 25, step: 372, loss: 0.3372640311717987, mean loss: 0.3503474988699261
Epoch: 25, step: 373, loss: 0.3570704460144043, mean loss: 0.35034768319155646
Epoch: 25, step: 374, loss: 0.30116257071495056, mean loss: 0.35034633473062493
Epoch: 25, step: 375, loss: 0.34781068563461304, mean loss: 0.35034626521507783
Epoch: 25, step: 376, loss: 0.3316000998020172, mean loss: 0.3503457512976665
Epoch: 25, step: 377, loss: 0.333245187997818, mean loss: 0.35034528250652386
Epoch: 25, step: 378, loss: 0.3219437301158905, mean loss: 0.3503445039338549
Epoch: 25, step: 379, loss: 0.3007546663284302, mean loss: 0.3503431445633065
Epoch: 25, step: 380, loss: 0.3879309892654419, mean loss: 0.35034417490361247
Epoch: 25, step: 381, loss: 0.32027193903923035, mean loss: 0.3503433506002337
Epoch: 25, step: 382, loss: 0.3397805690765381, mean loss: 0.3503430610741113
Epoch: 25, step: 383, loss: 0.32869720458984375, mean loss: 0.35034246777687184
Epoch: 25, step: 384, loss: 0.3416549861431122, mean loss: 0.3503422296658225
Epoch: 25, step: 385, loss: 0.31470048427581787, mean loss: 0.3503412528049611
Epoch: 25, step: 386, loss: 0.32080066204071045, mean loss: 0.3503404431853496
Epoch: 25, step: 387, loss: 0.3168007731437683, mean loss: 0.35033952398807816
Epoch: 25, step: 388, loss: 0.365742564201355, mean loss: 0.3503399461163966
Epoch: 25, step: 389, loss: 0.3014991283416748, mean loss: 0.3503386076450956
Epoch: 25, step: 390, loss: 0.29800915718078613, mean loss: 0.35033717360792305
Epoch: 25, step: 391, loss: 0.345506876707077, mean loss: 0.35033704124200993
Epoch: 25, step: 392, loss: 0.3404565751552582, mean loss: 0.3503367704923843
Epoch: 25, step: 393, loss: 0.3220883309841156, mean loss: 0.3503359964352925
Epoch: 25, step: 394, loss: 0.3377034366130829, mean loss: 0.350335650290346
Epoch: 25, step: 395, loss: 0.3699885606765747, mean loss: 0.3503361887852602
Epoch: 25, step: 396, loss: 0.3222366273403168, mean loss: 0.3503354188709811
Epoch: 25, step: 397, loss: 0.3255327641963959, mean loss: 0.3503347393089592
Epoch: 25, step: 398, loss: 0.320310115814209, mean loss: 0.35033391669399727
Epoch: 25, step: 399, loss: 0.3678835928440094, mean loss: 0.3503343975070425
Epoch: 25, step: 400, loss: 0.3537328541278839, mean loss: 0.35033449061289224
Epoch: 25, step: 401, loss: 0.3202418386936188, mean loss: 0.35033366620184847
Epoch: 25, step: 402, loss: 0.33472564816474915, mean loss: 0.35033323862005966
Epoch: 25, step: 403, loss: 0.32715219259262085, mean loss: 0.3503326035925003
Epoch: 25, step: 404, loss: 0.3022594451904297, mean loss: 0.3503312867000636
Epoch: 25, step: 405, loss: 0.30935001373291016, mean loss: 0.3503301641099971
Epoch: 25, step: 406, loss: 0.3151656985282898, mean loss: 0.3503292008847093
Epoch: 25, step: 407, loss: 0.3417088985443115, mean loss: 0.350328964763795
Epoch: 25, step: 408, loss: 0.36510786414146423, mean loss: 0.3503293695653337
Epoch: 25, step: 409, loss: 0.3657110631465912, mean loss: 0.35032979086617133
Epoch: 25, step: 410, loss: 0.32724109292030334, mean loss: 0.35032915848968355
Epoch: 25, step: 411, loss: 0.38019102811813354, mean loss: 0.35032997635421104
Epoch: 25, step: 412, loss: 0.32513371109962463, mean loss: 0.35032928629134974
Epoch: 25, step: 413, loss: 0.3279692530632019, mean loss: 0.3503286739225808
Epoch: 25, step: 414, loss: 0.31367918848991394, mean loss: 0.350327670239562
Epoch: 25, step: 415, loss: 0.3425234854221344, mean loss: 0.35032745651996466
Epoch: 25, step: 416, loss: 0.30607062578201294, mean loss: 0.35032624456852457
Epoch: 25, step: 417, loss: 0.32966291904449463, mean loss: 0.3503256787290612
Epoch: 25, step: 418, loss: 0.3627944588661194, mean loss: 0.3503260201617438
Epoch: 25, step: 419, loss: 0.319435715675354, mean loss: 0.35032517431550925
Epoch: 25, step: 420, loss: 0.3122536242008209, mean loss: 0.35032413185911115
Epoch: 25, step: 421, loss: 0.3110883831977844, mean loss: 0.350323057554619
Epoch: 25, step: 422, loss: 0.32617154717445374, mean loss: 0.35032239628609285
Epoch: 25, step: 423, loss: 0.37211430072784424, mean loss: 0.35032299293225544
Epoch: 25, step: 424, loss: 0.35363757610321045, mean loss: 0.3503230836805969
Epoch: 25, step: 425, loss: 0.34170281887054443, mean loss: 0.35032284767707034
Epoch: 25, step: 426, loss: 0.3331572711467743, mean loss: 0.3503223777349308
Epoch: 25, step: 427, loss: 0.34705978631973267, mean loss: 0.3503222884173822
Epoch: 25, step: 428, loss: 0.30467042326927185, mean loss: 0.3503210386742973
Epoch: 25, step: 429, loss: 0.3552151322364807, mean loss: 0.3503211726489363
Epoch: 25, step: 430, loss: 0.32027336955070496, mean loss: 0.35032035012004037
Epoch: 25, step: 431, loss: 0.3173050582408905, mean loss: 0.3503194463838124
Epoch: 25, step: 432, loss: 0.3228827714920044, mean loss: 0.35031869537308535
Epoch: 25, step: 433, loss: 0.327134907245636, mean loss: 0.35031806079192457
Epoch: 25, step: 434, loss: 0.35043421387672424, mean loss: 0.3503180639711523
Epoch: 25, step: 435, loss: 0.32020118832588196, mean loss: 0.3503172396642866
Epoch: 25, step: 436, loss: 0.34417787194252014, mean loss: 0.3503170716327645
Epoch: 25, step: 437, loss: 0.3311540186405182, mean loss: 0.3503165471636367
Epoch: 25, step: 438, loss: 0.31036484241485596, mean loss: 0.3503154537646726
Epoch: 25, step: 439, loss: 0.3537282347679138, mean loss: 0.3503155471631675
Epoch: 25, step: 440, loss: 0.3341206908226013, mean loss: 0.35031510396631077
Epoch: 25, step: 441, loss: 0.298799991607666, mean loss: 0.3503136942155484
Epoch: 25, step: 442, loss: 0.31315502524375916, mean loss: 0.35031267736775346
Epoch: 25, step: 443, loss: 0.2939108610153198, mean loss: 0.35031113397304153
Epoch: 25, step: 444, loss: 0.3283871114253998, mean loss: 0.3503105340545151
Epoch: 25, step: 445, loss: 0.3349311649799347, mean loss: 0.35031011323228906
Epoch: 25, step: 446, loss: 0.3150964081287384, mean loss: 0.35030914971394
Epoch: 25, step: 447, loss: 0.35017120838165283, mean loss: 0.3503091459396888
Epoch: 25, step: 448, loss: 0.3663322925567627, mean loss: 0.3503095843414677
Epoch: 25, step: 449, loss: 0.3208664357662201, mean loss: 0.35030877878336714
Epoch: 25, step: 450, loss: 0.3537082374095917, mean loss: 0.35030887178926645
Epoch: 25, step: 451, loss: 0.32640573382377625, mean loss: 0.35030821784042737
Epoch: 25, step: 452, loss: 0.3227527141571045, mean loss: 0.3503074639897535
Epoch: 25, step: 453, loss: 0.3529782295227051, mean loss: 0.3503075370533179
Epoch: 25, step: 454, loss: 0.3292314410209656, mean loss: 0.35030696049481613
Epoch: 25, step: 455, loss: 0.3504883050918579, mean loss: 0.3503069654555503
Epoch: 25, step: 456, loss: 0.3598436117172241, mean loss: 0.3503072263261431
Epoch: 25, step: 457, loss: 0.35651305317878723, mean loss: 0.35030739607905226
Epoch: 25, step: 458, loss: 0.31058672070503235, mean loss: 0.35030630959760106
Epoch: 25, step: 459, loss: 0.3758912682533264, mean loss: 0.35030700940500414
Epoch: 25, step: 460, loss: 0.34464630484580994, mean loss: 0.3503068545759634
Epoch: 25, step: 461, loss: 0.3378586769104004, mean loss: 0.3503065141083285
Epoch: 25, step: 462, loss: 0.41791802644729614, mean loss: 0.3503083632867969
Epoch: 25, step: 463, loss: 0.35457906126976013, mean loss: 0.35030848008742
Epoch: 25, step: 464, loss: 0.3012210726737976, mean loss: 0.35030713761764254
Epoch: 25, step: 465, loss: 0.34350094199180603, mean loss: 0.35030695148310154
Epoch: 25, step: 466, loss: 0.346285879611969, mean loss: 0.35030684151860153
Epoch: 25, step: 467, loss: 0.34861859679222107, mean loss: 0.35030679535133163
Epoch: 25, step: 468, loss: 0.3529042601585388, mean loss: 0.35030686638047676
Epoch: 25, step: 469, loss: 0.34404006600379944, mean loss: 0.35030669501596
Epoch: 25, step: 470, loss: 0.3159489929676056, mean loss: 0.3503057555365351
Epoch: 25, step: 471, loss: 0.362797349691391, mean loss: 0.35030609709822585
Epoch: 25, step: 472, loss: 0.37842753529548645, mean loss: 0.35030686601076233
Epoch: 25, step: 473, loss: 0.3211694359779358, mean loss: 0.3503060693401758
Epoch: 25, step: 474, loss: 0.400817334651947, mean loss: 0.3503074503727202
Epoch: 25, step: 475, loss: 0.29812943935394287, mean loss: 0.3503060238085519
Epoch: 25, step: 476, loss: 0.32853439450263977, mean loss: 0.35030542858124225
Epoch: 25, step: 477, loss: 0.2979540228843689, mean loss: 0.3503039973546663
Epoch: 25, step: 478, loss: 0.3672768473625183, mean loss: 0.35030446135997007
Epoch: 25, step: 479, loss: 0.3234151303768158, mean loss: 0.35030372627711104
Epoch: 25, step: 480, loss: 0.3301331698894501, mean loss: 0.3503031748827701
Epoch: 25, step: 481, loss: 0.30588752031326294, mean loss: 0.35030196074317765
Epoch: 25, step: 482, loss: 0.3026970624923706, mean loss: 0.3503006594584757
Epoch: 25, step: 483, loss: 0.3122861087322235, mean loss: 0.350299620355296
Epoch: 25, step: 484, loss: 0.3699439764022827, mean loss: 0.35030015730639746
Epoch: 25, step: 485, loss: 0.2936583459377289, mean loss: 0.3502986091237219
Epoch: 25, step: 486, loss: 0.3360249400138855, mean loss: 0.350298218994192
Epoch: 25, step: 487, loss: 0.3068026900291443, mean loss: 0.3502970302019933
Epoch: 25, step: 488, loss: 0.29865092039108276, mean loss: 0.3502956186818695
Epoch: 25, step: 489, loss: 0.3542894721031189, mean loss: 0.3502957278333705
Epoch: 25, step: 490, loss: 0.3054593801498413, mean loss: 0.35029450249523586
Epoch: 25, step: 491, loss: 0.349675714969635, mean loss: 0.3502944855847766
Epoch: 25, step: 492, loss: 0.34061065316200256, mean loss: 0.3502942209485778
Epoch: 25, step: 493, loss: 0.3042062222957611, mean loss: 0.35029296150717615
Epoch: 25, step: 494, loss: 0.32239237427711487, mean loss: 0.3502921990918946
Epoch: 25, step: 495, loss: 0.30330079793930054, mean loss: 0.350290915033496
Epoch: 25, step: 496, loss: 0.3210134506225586, mean loss: 0.3502901150372009
Epoch: 25, step: 497, loss: 0.3395101726055145, mean loss: 0.35028982048715906
Epoch: 25, step: 498, loss: 0.3108227550983429, mean loss: 0.35028874212257566
Epoch: 25, step: 499, loss: 0.3417111039161682, mean loss: 0.35028850776087606
Epoch: 25, step: 500, loss: 0.3522515594959259, mean loss: 0.35028856139470393
Epoch: 25, step: 501, loss: 0.31449058651924133, mean loss: 0.35028758336140314
Epoch: 25, step: 502, loss: 0.3674681484699249, mean loss: 0.3502880527372769
Epoch: 25, step: 503, loss: 0.3086402118206024, mean loss: 0.3502869149424753
Epoch: 25, step: 504, loss: 0.38522499799728394, mean loss: 0.3502878694045175
Epoch: 25, step: 505, loss: 0.3233890235424042, mean loss: 0.35028713458383615
Epoch: 25, step: 506, loss: 0.3106149435043335, mean loss: 0.35028605085146036
Epoch: 25, step: 507, loss: 0.3500250279903412, mean loss: 0.3502860437212467
Epoch: 25, step: 508, loss: 0.33481189608573914, mean loss: 0.35028562103426714
Epoch: 25, step: 509, loss: 0.3747664988040924, mean loss: 0.35028628972800574
Epoch: 25, step: 510, loss: 0.3650333881378174, mean loss: 0.35028669253313016
Epoch: 25, step: 511, loss: 0.35162830352783203, mean loss: 0.3502867291771538
Epoch: 25, step: 512, loss: 0.33305221796035767, mean loss: 0.3502862584560652
Epoch: 25, step: 513, loss: 0.30877289175987244, mean loss: 0.3502851246447718
Epoch: 25, step: 514, loss: 0.3306216895580292, mean loss: 0.3502845876125422
Epoch: 25, step: 515, loss: 0.3412300646305084, mean loss: 0.3502843403293059
Epoch: 25, step: 516, loss: 0.3204345405101776, mean loss: 0.35028352513964484
Epoch: 25, step: 517, loss: 0.3160272538661957, mean loss: 0.3502825896360326
Epoch: 25, step: 518, loss: 0.28725990653038025, mean loss: 0.3502808685982351
Epoch: 25, step: 519, loss: 0.3207543194293976, mean loss: 0.35028006230251774
Epoch: 25, step: 520, loss: 0.29129573702812195, mean loss: 0.3502784516330856
Epoch: 25, step: 521, loss: 0.34944385290145874, mean loss: 0.35027842884354016
Epoch: 25, step: 522, loss: 0.3360139727592468, mean loss: 0.35027803934906715
Epoch: 25, step: 523, loss: 0.37688443064689636, mean loss: 0.35027876582327255
Epoch: 25, step: 524, loss: 0.33165067434310913, mean loss: 0.35027825720644035
Epoch: 25, step: 525, loss: 0.3236522376537323, mean loss: 0.3502775302359944
Epoch: 25, step: 526, loss: 0.3358197808265686, mean loss: 0.35027713550671247
Epoch: 25, step: 527, loss: 0.3470976650714874, mean loss: 0.3502770487023433
Epoch: 25, step: 528, loss: 0.37053194642066956, mean loss: 0.35027760167670013
Epoch: 25, step: 529, loss: 0.3651956617832184, mean loss: 0.3502780089401483
Epoch: 25, step: 530, loss: 0.3492594063282013, mean loss: 0.3502779811330283
Epoch: 25, step: 531, loss: 0.3020560145378113, mean loss: 0.35027666474389874
Epoch: 25, step: 532, loss: 0.2922256290912628, mean loss: 0.3502750800788248
Epoch: 25, step: 533, loss: 0.2891429662704468, mean loss: 0.350273411352674
Epoch: 25, step: 534, loss: 0.34306663274765015, mean loss: 0.3502732146342734
Epoch: 25, step: 535, loss: 0.30487534403800964, mean loss: 0.3502719754741414
Epoch: 25, step: 536, loss: 0.3120883107185364, mean loss: 0.35027093325821884
Epoch: 25, step: 537, loss: 0.31350773572921753, mean loss: 0.3502699298410692
Epoch: 25, step: 538, loss: 0.30538830161094666, mean loss: 0.35026870487236833
Epoch: 25, step: 539, loss: 0.36232098937034607, mean loss: 0.35026903381026403
Epoch: 25, step: 540, loss: 0.3402630090713501, mean loss: 0.35026876072752233
Epoch: 25, step: 541, loss: 0.31243541836738586, mean loss: 0.35026772821449464
Epoch: 25, step: 542, loss: 0.2962963581085205, mean loss: 0.35026625531734906
Epoch: 25, step: 543, loss: 0.32623326778411865, mean loss: 0.35026559946679964
Epoch: 25, step: 544, loss: 0.3290139138698578, mean loss: 0.3502650195326859
Epoch: 25, step: 545, loss: 0.32566115260124207, mean loss: 0.35026434813971175
Epoch: 25, step: 546, loss: 0.349630206823349, mean loss: 0.3502643308356673
Epoch: 25, step: 547, loss: 0.33411160111427307, mean loss: 0.35026389008229136
Epoch: 25, step: 548, loss: 0.3308417797088623, mean loss: 0.3502633601330329
Epoch: 25, step: 549, loss: 0.33611059188842773, mean loss: 0.35026297397291706
Epoch: 25, step: 550, loss: 0.3255762755870819, mean loss: 0.3502623004115303
Epoch: 25, step: 551, loss: 0.32948610186576843, mean loss: 0.35026173356119344
Epoch: 25, step: 552, loss: 0.2951681613922119, mean loss: 0.3502602304489743
Epoch: 25, step: 553, loss: 0.3898699879646301, mean loss: 0.3502613110884002
Epoch: 25, step: 554, loss: 0.36306139826774597, mean loss: 0.35026166029279737
Epoch: 25, step: 555, loss: 0.3109751045703888, mean loss: 0.350260588529492
Epoch: 25, step: 556, loss: 0.3322584331035614, mean loss: 0.35026009743214565
Epoch: 25, step: 557, loss: 0.37987399101257324, mean loss: 0.35026090527473336
Epoch: 25, step: 558, loss: 0.32732677459716797, mean loss: 0.3502602796676334
Epoch: 25, step: 559, loss: 0.32031407952308655, mean loss: 0.35025946280456344
Epoch: 25, step: 560, loss: 0.33135947585105896, mean loss: 0.3502589472707004
Epoch: 25, step: 561, loss: 0.38501885533332825, mean loss: 0.3502598953888626
Epoch: 25, step: 562, loss: 0.3222217857837677, mean loss: 0.35025913063667086
Epoch: 25, step: 563, loss: 0.3044595718383789, mean loss: 0.3502578814669458
Epoch: 25, step: 564, loss: 0.30287498235702515, mean loss: 0.35025658914731916
Epoch: 25, step: 565, loss: 0.3094082474708557, mean loss: 0.35025547508138133
Epoch: 25, step: 566, loss: 0.33710214495658875, mean loss: 0.3502551163574572
Epoch: 25, step: 567, loss: 0.35125815868377686, mean loss: 0.3502551437121623
Epoch: 25, step: 568, loss: 0.3558080494403839, mean loss: 0.35025529514540915
Epoch: 25, step: 569, loss: 0.31416308879852295, mean loss: 0.35025431090198544
Epoch: 25, step: 570, loss: 0.31770291924476624, mean loss: 0.35025342324166375
Epoch: 25, step: 571, loss: 0.3355047106742859, mean loss: 0.3502530210625471
Epoch: 25, step: 572, loss: 0.3771094083786011, mean loss: 0.35025375338298215
Epoch: 25, step: 573, loss: 0.3152509927749634, mean loss: 0.3502527989531243
Epoch: 25, step: 574, loss: 0.3216025233268738, mean loss: 0.3502520177595148
Epoch: 25, step: 575, loss: 0.31754669547080994, mean loss: 0.3502511260231671
Epoch: 25, step: 576, loss: 0.3215876519680023, mean loss: 0.35025034451230047
Epoch: 25, step: 577, loss: 0.3148729205131531, mean loss: 0.3502493799715949
Epoch: 25, step: 578, loss: 0.3474314510822296, mean loss: 0.35024930314483055
Epoch: 25, step: 579, loss: 0.3273479640483856, mean loss: 0.35024867878989335
Epoch: 25, step: 580, loss: 0.3472801446914673, mean loss: 0.35024859786150814
Epoch: 25, step: 581, loss: 0.33966460824012756, mean loss: 0.35024830932790524
Epoch: 25, step: 582, loss: 0.34036171436309814, mean loss: 0.3502480398135535
Epoch: 25, step: 583, loss: 0.36210212111473083, mean loss: 0.35024836295392264
Epoch: 25, step: 584, loss: 0.32050999999046326, mean loss: 0.3502475523129805
Epoch: 25, step: 585, loss: 0.3514463007450104, mean loss: 0.3502475849888904
Epoch: 25, step: 586, loss: 0.3274584412574768, mean loss: 0.35024696381125986
Epoch: 25, step: 587, loss: 0.29741981625556946, mean loss: 0.3502455239086335
Epoch: 25, step: 588, loss: 0.3350122272968292, mean loss: 0.3502451087079845
Epoch: 25, step: 589, loss: 0.3711545467376709, mean loss: 0.350245678602725
Epoch: 25, step: 590, loss: 0.3051440715789795, mean loss: 0.3502444493746575
Epoch: 25, step: 591, loss: 0.34959280490875244, mean loss: 0.3502444316148061
Epoch: 25, step: 592, loss: 0.32046276330947876, mean loss: 0.35024361997039694
Epoch: 25, step: 593, loss: 0.36485597491264343, mean loss: 0.35024401819231177
Epoch: 25, step: 594, loss: 0.32280054688453674, mean loss: 0.35024327031191094
Epoch: 25, step: 595, loss: 0.32289040088653564, mean loss: 0.3502425249208758
Epoch: 25, step: 596, loss: 0.37863656878471375, mean loss: 0.3502432986637939
Epoch: 25, step: 597, loss: 0.338469922542572, mean loss: 0.35024297784587133
Epoch: 25, step: 598, loss: 0.3363233208656311, mean loss: 0.35024259855332984
Epoch: 25, step: 599, loss: 0.31869786977767944, mean loss: 0.3502417390239354
Epoch: 25, step: 600, loss: 0.35129016637802124, mean loss: 0.35024176759065984
Epoch: 25, step: 601, loss: 0.32437384128570557, mean loss: 0.35024106278094086
Epoch: 25, step: 602, loss: 0.33283814787864685, mean loss: 0.35024058862583357
Epoch: 25, step: 603, loss: 0.32606789469718933, mean loss: 0.3502399300411036
Epoch: 25, step: 604, loss: 0.35357895493507385, mean loss: 0.3502400210103147
Epoch: 25, step: 605, loss: 0.33741796016693115, mean loss: 0.35023967169246906
Epoch: 25, step: 606, loss: 0.3275831341743469, mean loss: 0.3502390544658497
Epoch: 25, step: 607, loss: 0.379569411277771, mean loss: 0.35023985348396053
Epoch: 25, step: 608, loss: 0.3545249402523041, mean loss: 0.35023997021519176
Epoch: 25, step: 609, loss: 0.32483944296836853, mean loss: 0.35023927829126783
Epoch: 25, step: 610, loss: 0.31995195150375366, mean loss: 0.3502384532707893
Epoch: 25, step: 611, loss: 0.3033682107925415, mean loss: 0.3502371765699155
Epoch: 25, step: 612, loss: 0.3556239902973175, mean loss: 0.3502373232976067
Epoch: 25, step: 613, loss: 0.3366325795650482, mean loss: 0.35023695273750066
Epoch: 25, step: 614, loss: 0.33606886863708496, mean loss: 0.350236566843885
Epoch: 25, step: 615, loss: 0.31579187512397766, mean loss: 0.35023562870542435
Epoch: 25, step: 616, loss: 0.2876940071582794, mean loss: 0.3502339253630612
Epoch: 25, step: 617, loss: 0.33930251002311707, mean loss: 0.3502336276503497
Epoch: 25, step: 618, loss: 0.33584028482437134, mean loss: 0.3502332356641075
Epoch: 25, step: 619, loss: 0.3198508024215698, mean loss: 0.3502324082557948
Epoch: 25, step: 620, loss: 0.3381088078022003, mean loss: 0.3502320781013749
Epoch: 25, step: 621, loss: 0.3322826027870178, mean loss: 0.3502315893078638
Epoch: 25, step: 622, loss: 0.36243847012519836, mean loss: 0.3502319217121014
Epoch: 25, step: 623, loss: 0.3533673584461212, mean loss: 0.3502320070905115
Epoch: 25, step: 624, loss: 0.34807926416397095, mean loss: 0.35023194847259653
Epoch: 25, step: 625, loss: 0.3447800278663635, mean loss: 0.35023180002406945
Epoch: 25, step: 626, loss: 0.32596060633659363, mean loss: 0.35023113916982906
Epoch: 25, step: 627, loss: 0.34330251812934875, mean loss: 0.35023095052299175
Epoch: 25, step: 628, loss: 0.3341243267059326, mean loss: 0.3502305119969274
Epoch: 25, step: 629, loss: 0.31646832823753357, mean loss: 0.3502295927978052
Epoch: 25, step: 630, loss: 0.3398403823375702, mean loss: 0.3502293099519676
Epoch: 25, step: 631, loss: 0.3573181927204132, mean loss: 0.3502295029412622
Epoch: 25, step: 632, loss: 0.30514729022979736, mean loss: 0.3502282756466576
Epoch: 25, step: 633, loss: 0.33690956234931946, mean loss: 0.3502279130748359
Epoch: 25, step: 634, loss: 0.3045335114002228, mean loss: 0.350226669182045
Epoch: 25, step: 635, loss: 0.30770835280418396, mean loss: 0.3502255117801401
Epoch: 25, step: 636, loss: 0.3109821379184723, mean loss: 0.35022444355535687
Epoch: 25, step: 637, loss: 0.35973528027534485, mean loss: 0.3502247024381681
Epoch: 25, step: 638, loss: 0.31440430879592896, mean loss: 0.3502237274417435
Epoch: 25, step: 639, loss: 0.33880946040153503, mean loss: 0.3502234167649052
Epoch: 25, step: 640, loss: 0.3318665623664856, mean loss: 0.35022291713630505
Epoch: 25, step: 641, loss: 0.3662726581096649, mean loss: 0.35022335395904125
Epoch: 25, step: 642, loss: 0.36138275265693665, mean loss: 0.35022365767399916
Epoch: 25, step: 643, loss: 0.3371571898460388, mean loss: 0.3502233020657957
Epoch: 25, step: 644, loss: 0.3213266432285309, mean loss: 0.3502225156551592
Epoch: 25, step: 645, loss: 0.32296615839004517, mean loss: 0.35022177390483905
Epoch: 25, step: 646, loss: 0.29352670907974243, mean loss: 0.35022023105603983
Epoch: 25, step: 647, loss: 0.39849022030830383, mean loss: 0.35022154459662036
Epoch: 25, step: 648, loss: 0.36210867762565613, mean loss: 0.35022186806482436
Epoch: 25, step: 649, loss: 0.33756086230278015, mean loss: 0.3502215235476608
Epoch: 25, step: 650, loss: 0.4040037989616394, mean loss: 0.3502229869711163
Epoch: 25, step: 651, loss: 0.34550708532333374, mean loss: 0.3502228586542452
Epoch: 25, step: 652, loss: 0.33858272433280945, mean loss: 0.3502225419417504
Epoch: 25, step: 653, loss: 0.2873188257217407, mean loss: 0.3502208304622864
Epoch: 25, step: 654, loss: 0.30931833386421204, mean loss: 0.35021971762058873
Epoch: 25, step: 655, loss: 0.32428112626075745, mean loss: 0.35021901192379473
Epoch: 25, step: 656, loss: 0.32498395442962646, mean loss: 0.35021832538633263
Epoch: 25, step: 657, loss: 0.3443695306777954, mean loss: 0.3502181662700938
Epoch: 25, step: 658, loss: 0.3552320897579193, mean loss: 0.3502183026699819
Epoch: 25, step: 659, loss: 0.35905641317367554, mean loss: 0.3502185430973623
Epoch: 25, step: 660, loss: 0.3561709225177765, mean loss: 0.35021870501840413
Epoch: 25, step: 661, loss: 0.3461143374443054, mean loss: 0.3502185933713889
Epoch: 25, step: 662, loss: 0.33104926347732544, mean loss: 0.3502180719414214
Epoch: 25, step: 663, loss: 0.3607422113418579, mean loss: 0.35021835820350933
Epoch: 25, step: 664, loss: 0.30659037828445435, mean loss: 0.3502171715319489
Epoch: 25, step: 665, loss: 0.3400459587574005, mean loss: 0.3502168948846994
Epoch: 25, step: 666, loss: 0.357897013425827, mean loss: 0.35021710377088927
Epoch: 25, step: 667, loss: 0.3238939642906189, mean loss: 0.3502163878456423
Epoch: 25, step: 668, loss: 0.30989715456962585, mean loss: 0.3502152912905748
Epoch: 25, step: 669, loss: 0.3447558581829071, mean loss: 0.35021514281537475
Epoch: 25, step: 670, loss: 0.321012407541275, mean loss: 0.3502143486369386
Epoch: 25, step: 671, loss: 0.3479084372520447, mean loss: 0.3502142859285903
Epoch: 25, step: 672, loss: 0.3570546805858612, mean loss: 0.3502144719453596
Epoch: 25, step: 673, loss: 0.3369009494781494, mean loss: 0.35021410990907126
Epoch: 25, step: 674, loss: 0.33339381217956543, mean loss: 0.35021365252504055
Epoch: 25, step: 675, loss: 0.35500583052635193, mean loss: 0.3502137828322518
Epoch: 25, step: 676, loss: 0.38979145884513855, mean loss: 0.3502148589851738
Epoch: 25, step: 677, loss: 0.36106064915657043, mean loss: 0.350215153884031
Epoch: 25, step: 678, loss: 0.3378894329071045, mean loss: 0.3502148187547187
Epoch: 25, step: 679, loss: 0.29058000445365906, mean loss: 0.35021319736226897
Epoch: 25, step: 680, loss: 0.29392561316490173, mean loss: 0.35021166701822726
Epoch: 25, step: 681, loss: 0.3387032151222229, mean loss: 0.35021135413551574
Epoch: 25, step: 682, loss: 0.3966643512248993, mean loss: 0.35021261702862094
Epoch: 25, step: 683, loss: 0.38139811158180237, mean loss: 0.35021346482914706
Epoch: 25, step: 684, loss: 0.3711314797401428, mean loss: 0.3502140334852545
Epoch: 25, step: 685, loss: 0.31073319911956787, mean loss: 0.3502129602281902
Epoch: 25, step: 686, loss: 0.3747933506965637, mean loss: 0.3502136284096257
Epoch: 25, step: 687, loss: 0.35395824909210205, mean loss: 0.35021373019881463
Epoch: 25, step: 688, loss: 0.3169277310371399, mean loss: 0.3502128254175169
Epoch: 25, step: 689, loss: 0.3320738673210144, mean loss: 0.3502123323770685
Epoch: 25, step: 690, loss: 0.32089754939079285, mean loss: 0.3502115355848371
Epoch: 25, step: 691, loss: 0.3171425461769104, mean loss: 0.35021063677560116
Epoch: 25, step: 692, loss: 0.331310898065567, mean loss: 0.3502101230980345
Epoch: 25, step: 693, loss: 0.31392720341682434, mean loss: 0.3502091369883514
Epoch: 25, step: 694, loss: 0.36732518672943115, mean loss: 0.3502096021616016
Epoch: 25, step: 695, loss: 0.32389333844184875, mean loss: 0.3502088869680012
Epoch: 25, step: 696, loss: 0.3201775848865509, mean loss: 0.3502080708334771
Epoch: 25, step: 697, loss: 0.33756136894226074, mean loss: 0.3502077271544214
Epoch: 25, step: 698, loss: 0.33927690982818604, mean loss: 0.3502074301132701
Epoch: 25, step: 699, loss: 0.34269818663597107, mean loss: 0.35020722605774085
Epoch: 25, step: 700, loss: 0.3416976034641266, mean loss: 0.35020699482427997
Epoch: 25, step: 701, loss: 0.2929796278476715, mean loss: 0.3502054398172973
Epoch: 25, step: 702, loss: 0.3578394949436188, mean loss: 0.3502056472475374
Epoch: 25, step: 703, loss: 0.3611467182636261, mean loss: 0.3502059445269368
Epoch: 25, step: 704, loss: 0.35767292976379395, mean loss: 0.3502061474065792
Epoch: 25, step: 705, loss: 0.28153568506240845, mean loss: 0.3502042816656037
Epoch: 25, step: 706, loss: 0.34630927443504333, mean loss: 0.35020417584314517
Epoch: 25, step: 707, loss: 0.30756035447120667, mean loss: 0.35020301729550957
Epoch: 25, step: 708, loss: 0.3162105977535248, mean loss: 0.35020209381430817
Epoch: 25, step: 709, loss: 0.31887173652648926, mean loss: 0.3502012426771909
Epoch: 25, step: 710, loss: 0.30062010884284973, mean loss: 0.35019989576638066
Epoch: 25, step: 711, loss: 0.32978004217147827, mean loss: 0.3501993410599373
Epoch: 25, step: 712, loss: 0.3422101140022278, mean loss: 0.35019912403804127
Epoch: 25, step: 713, loss: 0.2985249161720276, mean loss: 0.35019772038160984
Epoch: 25, step: 714, loss: 0.29913654923439026, mean loss: 0.3501963334151248
Epoch: 25, step: 715, loss: 0.3250639736652374, mean loss: 0.35019565076736975
Epoch: 25, step: 716, loss: 0.30319276452064514, mean loss: 0.3501943741047887
Epoch: 25, step: 717, loss: 0.29716071486473083, mean loss: 0.3501929336773011
Epoch: 25, step: 718, loss: 0.3427962362766266, mean loss: 0.3501927327838113
Epoch: 25, step: 719, loss: 0.3453495502471924, mean loss: 0.3501926012470776
Epoch: 25, step: 720, loss: 0.35330936312675476, mean loss: 0.35019268589339025
Epoch: 25, step: 721, loss: 0.4078609049320221, mean loss: 0.35019425202828347
Epoch: 25, step: 722, loss: 0.4107398986816406, mean loss: 0.35019589626277425
Epoch: 25, step: 723, loss: 0.333609402179718, mean loss: 0.3501954458365826
Epoch: 25, step: 724, loss: 0.3374461233615875, mean loss: 0.3501950996228019
Epoch: 25, step: 725, loss: 0.2897590696811676, mean loss: 0.3501934584988693
Epoch: 25, step: 726, loss: 0.3617590665817261, mean loss: 0.35019377255127876
Epoch: 25, step: 727, loss: 0.3312689960002899, mean loss: 0.3501932586820339
Epoch: 25, step: 728, loss: 0.3751370310783386, mean loss: 0.35019393596820503
Epoch: 25, step: 729, loss: 0.29404324293136597, mean loss: 0.35019241137702833
Epoch: 25, step: 730, loss: 0.3729013502597809, mean loss: 0.3501930279483645
Epoch: 25, step: 731, loss: 0.326057493686676, mean loss: 0.35019237266127007
Epoch: 25, step: 732, loss: 0.32994696497917175, mean loss: 0.35019182300721846
Epoch: 25, step: 733, loss: 0.3480202257633209, mean loss: 0.3501917640508943
Epoch: 25, step: 734, loss: 0.3328745663166046, mean loss: 0.3501912939220024
Epoch: 25, step: 735, loss: 0.32979461550712585, mean loss: 0.35019074020611535
Epoch: 25, step: 736, loss: 0.3022586703300476, mean loss: 0.3501894390124819
Epoch: 25, step: 737, loss: 0.2954697906970978, mean loss: 0.35018795359936733
Epoch: 25, step: 738, loss: 0.3462725877761841, mean loss: 0.35018784731619396
Epoch: 25, step: 739, loss: 0.32746484875679016, mean loss: 0.35018723051384437
Epoch: 25, step: 740, loss: 0.3251427710056305, mean loss: 0.3501865507152638
Epoch: 25, step: 741, loss: 0.3444335460662842, mean loss: 0.3501863945618343
Epoch: 25, step: 742, loss: 0.3271517753601074, mean loss: 0.35018576935163964
Epoch: 25, step: 743, loss: 0.3112297058105469, mean loss: 0.3501847120271488
Epoch: 25, step: 744, loss: 0.33429691195487976, mean loss: 0.3501842808207416
Epoch: 25, step: 745, loss: 0.3190937936306, mean loss: 0.35018343702529053
Epoch: 25, step: 746, loss: 0.3239423334598541, mean loss: 0.35018272486138124
Epoch: 25, step: 747, loss: 0.3638792335987091, mean loss: 0.3501830965642888
Epoch: 25, step: 748, loss: 0.3239133656024933, mean loss: 0.35018238366214866
Epoch: 25, step: 749, loss: 0.3553013801574707, mean loss: 0.35018252257657184
Epoch: 25, step: 750, loss: 0.3309631049633026, mean loss: 0.3501820010325808
Epoch: 25, step: 751, loss: 0.3683846592903137, mean loss: 0.3501824949720755
Epoch: 25, step: 752, loss: 0.35823288559913635, mean loss: 0.3501827134180806
Epoch: 25, step: 753, loss: 0.3551429808139801, mean loss: 0.3501828480104558
Epoch: 25, step: 754, loss: 0.3443017899990082, mean loss: 0.3501826884375888
Epoch: 25, step: 755, loss: 0.3518180251121521, mean loss: 0.3501827328085644
Epoch: 25, step: 756, loss: 0.32406970858573914, mean loss: 0.350182024312913
Epoch: 25, step: 757, loss: 0.33350855112075806, mean loss: 0.35018157194237765
Epoch: 25, step: 758, loss: 0.3464777171611786, mean loss: 0.35018147145525697
Epoch: 25, step: 759, loss: 0.3285761773586273, mean loss: 0.35018088531054464
Epoch: 25, step: 760, loss: 0.3460676372051239, mean loss: 0.35018077372246764
Epoch: 25, step: 761, loss: 0.31783610582351685, mean loss: 0.35017989626959206
Epoch: 25, step: 762, loss: 0.34749817848205566, mean loss: 0.3501798235213679
Epoch: 25, step: 763, loss: 0.3357217311859131, mean loss: 0.35017943132051244
Epoch: 25, step: 764, loss: 0.3087254464626312, mean loss: 0.3501783068397079
Epoch: 25, step: 765, loss: 0.3457081913948059, mean loss: 0.35017818558664426
Epoch: 25, step: 766, loss: 0.318627268075943, mean loss: 0.35017732978287636
Epoch: 25, step: 767, loss: 0.3653779625892639, mean loss: 0.35017774208169394
Epoch: 25, step: 768, loss: 0.3233988881111145, mean loss: 0.350177015757303
Epoch: 25, step: 769, loss: 0.3510987460613251, mean loss: 0.35017704075676875
Epoch: 25, step: 770, loss: 0.3278496265411377, mean loss: 0.35017643520188235
Epoch: 25, step: 771, loss: 0.328792929649353, mean loss: 0.35017585526302486
Epoch: 25, step: 772, loss: 0.31326451897621155, mean loss: 0.3501748542233403
Epoch: 25, step: 773, loss: 0.37673237919807434, mean loss: 0.3501755744469389
Epoch: 25, step: 774, loss: 0.341539204120636, mean loss: 0.350175340240286
Epoch: 25, step: 775, loss: 0.318136990070343, mean loss: 0.3501744714272323
Epoch: 25, step: 776, loss: 0.30611464381217957, mean loss: 0.350173276649251
Epoch: 25, step: 777, loss: 0.344078004360199, mean loss: 0.350173111367178
Epoch: 25, step: 778, loss: 0.31353121995925903, mean loss: 0.35017211779654406
Epoch: 25, step: 779, loss: 0.3347265124320984, mean loss: 0.35017169898945716
Epoch: 25, step: 780, loss: 0.3388962149620056, mean loss: 0.3501713932633644
Epoch: 25, step: 781, loss: 0.3730166554450989, mean loss: 0.35017201267831427
Epoch: 25, step: 782, loss: 0.3276308476924896, mean loss: 0.3501714015250733
Epoch: 25, step: 783, loss: 0.3166290819644928, mean loss: 0.3501704921248033
Epoch: 25, step: 784, loss: 0.3218860328197479, mean loss: 0.35016972529657214
Epoch: 25, step: 785, loss: 0.3345651924610138, mean loss: 0.35016930224899756
Epoch: 25, step: 786, loss: 0.3128270208835602, mean loss: 0.3501682899064008
Epoch: 25, step: 787, loss: 0.33023130893707275, mean loss: 0.35016774943304985
Epoch: 25, step: 788, loss: 0.3230457007884979, mean loss: 0.350167014199006
Epoch: 25, step: 789, loss: 0.3124503791332245, mean loss: 0.350165991790899
Epoch: 25, step: 790, loss: 0.3129153847694397, mean loss: 0.3501649820430738
Epoch: 25, step: 791, loss: 0.3005914092063904, mean loss: 0.3501636382944877
Epoch: 25, step: 792, loss: 0.29427146911621094, mean loss: 0.3501621233141614
Epoch: 25, step: 793, loss: 0.3740553855895996, mean loss: 0.35016277093334813
Epoch: 25, step: 794, loss: 0.3876444697380066, mean loss: 0.35016378683519944
Epoch: 25, step: 795, loss: 0.34800004959106445, mean loss: 0.35016372819097663
Epoch: 25, step: 796, loss: 0.3832012414932251, mean loss: 0.350164623589337
Epoch: 25, step: 797, loss: 0.35974377393722534, mean loss: 0.3501648832009785
Epoch: 25, step: 798, loss: 0.33441275358200073, mean loss: 0.3501644563024279
Epoch: 25, step: 799, loss: 0.35395485162734985, mean loss: 0.3501645590231684
Epoch: 25, step: 800, loss: 0.34848836064338684, mean loss: 0.35016451359896905
Epoch: 25, step: 801, loss: 0.351669579744339, mean loss: 0.35016455438445887
Epoch: 25, step: 802, loss: 0.31242597103118896, mean loss: 0.3501635317417644
Epoch: 25, step: 803, loss: 0.3605159521102905, mean loss: 0.3501638122647529
Epoch: 25, step: 804, loss: 0.3569450080394745, mean loss: 0.35016399601209813
Epoch: 25, step: 805, loss: 0.33217453956604004, mean loss: 0.3501635085722118
Epoch: 25, step: 806, loss: 0.3483628034591675, mean loss: 0.35016345978187086
Epoch: 25, step: 807, loss: 0.34688282012939453, mean loss: 0.3501633708949181
Epoch: 25, step: 808, loss: 0.3647448718547821, mean loss: 0.35016376596118814
Epoch: 25, step: 809, loss: 0.3173055648803711, mean loss: 0.35016287573628757
Epoch: 25, step: 810, loss: 0.3364326059818268, mean loss: 0.35016250375314556
Epoch: 25, step: 811, loss: 0.37713634967803955, mean loss: 0.3501632345140343
Epoch: 25, step: 812, loss: 0.3352017104625702, mean loss: 0.35016282919547304
Epoch: 25, step: 813, loss: 0.32324039936065674, mean loss: 0.35016209986703845
Epoch: 25, step: 814, loss: 0.35750070214271545, mean loss: 0.350162298664337
Epoch: 25, step: 815, loss: 0.3455269932746887, mean loss: 0.3501621731007497
Epoch: 25, step: 816, loss: 0.3451261818408966, mean loss: 0.3501620366868683
Epoch: 25, step: 817, loss: 0.270938515663147, mean loss: 0.3501598907547749
Epoch: 25, step: 818, loss: 0.30233055353164673, mean loss: 0.3501585952338446
Epoch: 25, step: 819, loss: 0.381686806678772, mean loss: 0.35015944919406794
Epoch: 25, step: 820, loss: 0.31808364391326904, mean loss: 0.3501585804254734
Epoch: 25, step: 821, loss: 0.32677197456359863, mean loss: 0.35015794701975694
Epoch: 25, step: 822, loss: 0.32957980036735535, mean loss: 0.3501573896937907
Epoch: 25, step: 823, loss: 0.45037156343460083, mean loss: 0.35016010375981116
Epoch: 25, step: 824, loss: 0.44011589884757996, mean loss: 0.3501625399357106
Epoch: 25, step: 825, loss: 0.29264122247695923, mean loss: 0.3501609821900176
Epoch: 25, step: 826, loss: 0.3523332476615906, mean loss: 0.35016104101595724
Epoch: 25, step: 827, loss: 0.34485557675361633, mean loss: 0.3501608973454562
Epoch: 25, step: 828, loss: 0.3515814244747162, mean loss: 0.3501609358118953
Epoch: 25, step: 829, loss: 0.3514009118080139, mean loss: 0.35016096938828295
Epoch: 25, step: 830, loss: 0.3248484432697296, mean loss: 0.3501602839877761
Epoch: 25, step: 831, loss: 0.3403773307800293, mean loss: 0.3501600190968087
Epoch: 25, step: 832, loss: 0.324972003698349, mean loss: 0.35015933710467706
Epoch: 25, step: 833, loss: 0.3826848864555359, mean loss: 0.3501602177444494
Epoch: 25, step: 834, loss: 0.3253170847892761, mean loss: 0.350159545126798
Epoch: 25, step: 835, loss: 0.3305373191833496, mean loss: 0.3501590138774493
Epoch: 25, step: 836, loss: 0.2995202839374542, mean loss: 0.35015764292880863
Epoch: 25, step: 837, loss: 0.33465373516082764, mean loss: 0.3501572232009466
Epoch: 25, step: 838, loss: 0.3717317581176758, mean loss: 0.35015780725939205
Epoch: 25, step: 839, loss: 0.3096236288547516, mean loss: 0.35015670996165504
Epoch: 25, step: 840, loss: 0.3113582730293274, mean loss: 0.3501556596804788
Epoch: 25, step: 841, loss: 0.3723590672016144, mean loss: 0.35015626071473577
Epoch: 25, step: 842, loss: 0.3138786852359772, mean loss: 0.3501552787269308
Epoch: 25, step: 843, loss: 0.3247700035572052, mean loss: 0.35015459159843443
Epoch: 25, step: 844, loss: 0.3181983530521393, mean loss: 0.3501537266305485
Epoch: 25, step: 845, loss: 0.3445712924003601, mean loss: 0.3501535755334276
Epoch: 25, step: 846, loss: 0.3526371121406555, mean loss: 0.35015364275232513
Epoch: 25, step: 847, loss: 0.3111690878868103, mean loss: 0.3501525876328365
Epoch: 25, step: 848, loss: 0.38203397393226624, mean loss: 0.3501534504812573
Epoch: 25, step: 849, loss: 0.32958927750587463, mean loss: 0.3501528939407167
Epoch: 25, step: 850, loss: 0.31404659152030945, mean loss: 0.350151916800655
Epoch: 25, step: 851, loss: 0.3483128249645233, mean loss: 0.35015186703090406
Epoch: 25, step: 852, loss: 0.3271682560443878, mean loss: 0.35015124506216033
Epoch: 25, step: 853, loss: 0.3296282887458801, mean loss: 0.3501506896972116
Epoch: 25, step: 854, loss: 0.316580206155777, mean loss: 0.3501497812820163
Epoch: 25, step: 855, loss: 0.31215208768844604, mean loss: 0.35014875309461524
Epoch: 25, step: 856, loss: 0.3472232222557068, mean loss: 0.35014867393421695
Epoch: 25, step: 857, loss: 0.34813395142555237, mean loss: 0.35014861942037667
Epoch: 25, step: 858, loss: 0.36622464656829834, mean loss: 0.3501490543895898
Epoch: 25, step: 859, loss: 0.34346944093704224, mean loss: 0.3501488736641176
Epoch: 25, step: 860, loss: 0.38180679082870483, mean loss: 0.3501497301863212
Epoch: 25, step: 861, loss: 0.3411964774131775, mean loss: 0.3501494879577412
Epoch: 25, step: 862, loss: 0.35030168294906616, mean loss: 0.3501494920752368
Epoch: 25, step: 863, loss: 0.3104783594608307, mean loss: 0.3501484188382329
Epoch: 25, step: 864, loss: 0.3058445155620575, mean loss: 0.3501472203016909
Epoch: 25, step: 865, loss: 0.30355194211006165, mean loss: 0.3501459598115596
Epoch: 25, step: 866, loss: 0.3339284658432007, mean loss: 0.35014552110963715
Epoch: 25, step: 867, loss: 0.31059530377388, mean loss: 0.35014445125956856
Epoch: 25, step: 868, loss: 0.288921058177948, mean loss: 0.35014279518574776
Epoch: 25, step: 869, loss: 0.32322055101394653, mean loss: 0.35014206696707934
Epoch: 25, step: 870, loss: 0.3378494381904602, mean loss: 0.3501417344732659
Epoch: 25, step: 871, loss: 0.33184099197387695, mean loss: 0.3501412394840173
Epoch: 25, step: 872, loss: 0.3192148208618164, mean loss: 0.35014040302447597
Epoch: 25, step: 873, loss: 0.31172192096710205, mean loss: 0.35013936395696754
Epoch: 25, step: 874, loss: 0.34308379888534546, mean loss: 0.3501391731370873
Epoch: 25, step: 875, loss: 0.3161242604255676, mean loss: 0.3501382532184181
Epoch: 25, step: 876, loss: 0.35824477672576904, mean loss: 0.35013847244992713
Epoch: 25, step: 877, loss: 0.3350059390068054, mean loss: 0.3501380632192104
Epoch: 25, step: 878, loss: 0.3337600827217102, mean loss: 0.35013762031971346
Epoch: 25, step: 879, loss: 0.2892396152019501, mean loss: 0.35013597353753073
Epoch: 25, step: 880, loss: 0.3489495813846588, mean loss: 0.35013594145640387
Epoch: 25, step: 881, loss: 0.3316414952278137, mean loss: 0.3501354413632172
Epoch: 25, step: 882, loss: 0.3332010805606842, mean loss: 0.35013498346740557
Epoch: 25, step: 883, loss: 0.3454456627368927, mean loss: 0.35013485667417793
Epoch: 25, step: 884, loss: 0.3099137842655182, mean loss: 0.3501337691772898
Epoch: 25, step: 885, loss: 0.3474808633327484, mean loss: 0.35013369744999173
Epoch: 25, step: 886, loss: 0.354950487613678, mean loss: 0.3501338276792659
Epoch: 25, step: 887, loss: 0.3653140366077423, mean loss: 0.3501342380882885
Epoch: 25, step: 888, loss: 0.32011649012565613, mean loss: 0.3501334265565368
Epoch: 25, step: 889, loss: 0.33407291769981384, mean loss: 0.3501329923713825
Epoch: 25, step: 890, loss: 0.35891786217689514, mean loss: 0.3501332298580632
Epoch: 25, step: 891, loss: 0.3130625784397125, mean loss: 0.3501322277318895
Epoch: 25, step: 892, loss: 0.3358812928199768, mean loss: 0.3501318424986045
Epoch: 25, step: 893, loss: 0.3098953068256378, mean loss: 0.3501307548482917
Epoch: 25, step: 894, loss: 0.34946995973587036, mean loss: 0.3501307369865506
Epoch: 25, step: 895, loss: 0.3117602467536926, mean loss: 0.3501296998341495
Epoch: 25, step: 896, loss: 0.3307674527168274, mean loss: 0.35012917648773983
Epoch: 25, step: 897, loss: 0.30439576506614685, mean loss: 0.35012794038277684
Epoch: 25, step: 898, loss: 0.3996487259864807, mean loss: 0.3501292788185617
Epoch: 25, step: 899, loss: 0.325549453496933, mean loss: 0.35012861449895843
Epoch: 25, step: 900, loss: 0.3160126209259033, mean loss: 0.3501276924699978
Epoch: 25, step: 901, loss: 0.31948322057724, mean loss: 0.3501268642857944
Epoch: 25, step: 902, loss: 0.3109520375728607, mean loss: 0.3501258055925341
Epoch: 25, step: 903, loss: 0.2978367507457733, mean loss: 0.3501243925275993
Epoch: 25, step: 904, loss: 0.33903035521507263, mean loss: 0.3501240927292663
Epoch: 25, step: 905, loss: 0.3648584485054016, mean loss: 0.3501244908905314
Epoch: 25, step: 906, loss: 0.3252670168876648, mean loss: 0.3501238191939874
Epoch: 25, step: 907, loss: 0.33170443773269653, mean loss: 0.35012332148048053
Epoch: 25, step: 908, loss: 0.33471396565437317, mean loss: 0.3501229051126828
Epoch: 25, step: 909, loss: 0.34717845916748047, mean loss: 0.35012282555456486
Epoch: 25, step: 910, loss: 0.337982714176178, mean loss: 0.3501224975409641
Epoch: 25, step: 911, loss: 0.3086918890476227, mean loss: 0.3501213781578318
Epoch: 25, step: 912, loss: 0.3320249617099762, mean loss: 0.35012088923727824
Epoch: 25, step: 913, loss: 0.30434831976890564, mean loss: 0.35011965260871963
Epoch: 25, step: 914, loss: 0.3547627627849579, mean loss: 0.35011977804733035
Epoch: 25, step: 915, loss: 0.38848042488098145, mean loss: 0.35012081437342807
Epoch: 25, step: 916, loss: 0.3136730194091797, mean loss: 0.3501198297502829
Epoch: 25, step: 917, loss: 0.33653685450553894, mean loss: 0.3501194628213498
Epoch: 25, step: 918, loss: 0.291136234998703, mean loss: 0.35011786949825024
Epoch: 25, step: 919, loss: 0.38556262850761414, mean loss: 0.35011882694717
Epoch: 25, step: 920, loss: 0.31777340173721313, mean loss: 0.35011795324237516
Epoch: 25, step: 921, loss: 0.3516235053539276, mean loss: 0.3501179939087927
Epoch: 25, step: 922, loss: 0.309516966342926, mean loss: 0.3501168972654206
Epoch: 25, step: 923, loss: 0.32453376054763794, mean loss: 0.3501162062775015
Epoch: 25, step: 924, loss: 0.3178959786891937, mean loss: 0.35011533604853223
Epoch: 25, step: 925, loss: 0.2931867241859436, mean loss: 0.3501137985178278
Epoch: 25, step: 926, loss: 0.3015364110469818, mean loss: 0.350112486572829
Epoch: 25, step: 927, loss: 0.34483152627944946, mean loss: 0.3501123439521016
Epoch: 25, step: 928, loss: 0.34012725949287415, mean loss: 0.3501120742963059
Epoch: 25, step: 929, loss: 0.3075698912143707, mean loss: 0.35011092543907985
Epoch: 25, step: 930, loss: 0.3148985505104065, mean loss: 0.35010997454996184
Epoch: 25, step: 931, loss: 0.35541048645973206, mean loss: 0.3501101176832495
Epoch: 25, step: 932, loss: 0.32628631591796875, mean loss: 0.35010947437048073
Epoch: 25, step: 933, loss: 0.32307401299476624, mean loss: 0.3501087443531622
Epoch: 25, step: 934, loss: 0.324632853269577, mean loss: 0.35010805646626914
Epoch: 25, step: 935, loss: 0.32653892040252686, mean loss: 0.35010742008177664
Epoch: 25, step: 936, loss: 0.3567119538784027, mean loss: 0.35010759840436745
Epoch: 25, step: 937, loss: 0.3320941925048828, mean loss: 0.35010711205505324
Epoch: 25, step: 938, loss: 0.3463577628135681, mean loss: 0.35010701082798873
Epoch: 25, step: 939, loss: 0.28818926215171814, mean loss: 0.3501053391825061
Epoch: 25, step: 940, loss: 0.32837337255477905, mean loss: 0.3501047524821841
Epoch: 25, step: 941, loss: 0.33873113989830017, mean loss: 0.35010444543578856
Epoch: 25, step: 942, loss: 0.3684268295764923, mean loss: 0.3501049400605258
Epoch: 25, step: 943, loss: 0.35050690174102783, mean loss: 0.35010495091145116
Epoch: 25, step: 944, loss: 0.3578459918498993, mean loss: 0.3501051598746294
Epoch: 25, step: 945, loss: 0.3290870487689972, mean loss: 0.3501045925229287
Epoch: 25, step: 946, loss: 0.32158493995666504, mean loss: 0.35010382269939194
Epoch: 25, step: 947, loss: 0.3530527949333191, mean loss: 0.350103902298081
Epoch: 25, step: 948, loss: 0.32675278186798096, mean loss: 0.3501032720214088
Epoch: 25, step: 949, loss: 0.3512134850025177, mean loss: 0.35010330198667144
Epoch: 25, step: 950, loss: 0.33097130060195923, mean loss: 0.3501027856173053
Epoch: 25, step: 951, loss: 0.3217739760875702, mean loss: 0.3501020210483339
Epoch: 25, step: 952, loss: 0.3604538142681122, mean loss: 0.3501023004263389
Epoch: 25, step: 953, loss: 0.3509623408317566, mean loss: 0.35010232363679944
Epoch: 25, step: 954, loss: 0.4099905490875244, mean loss: 0.35010393983503046
Epoch: 25, step: 955, loss: 0.34892159700393677, mean loss: 0.35010390792811036
Epoch: 25, step: 956, loss: 0.30856165289878845, mean loss: 0.35010278689146335
Epoch: 25, step: 957, loss: 0.3597974479198456, mean loss: 0.3501030484992411
Epoch: 25, step: 958, loss: 0.34880781173706055, mean loss: 0.35010301354857426
Epoch: 25, step: 959, loss: 0.36453863978385925, mean loss: 0.35010340306897997
Epoch: 25, step: 960, loss: 0.29178738594055176, mean loss: 0.3501018295545813
Epoch: 25, step: 961, loss: 0.3462901711463928, mean loss: 0.3501017267091221
Epoch: 25, step: 962, loss: 0.3418593406677246, mean loss: 0.35010150432059334
Epoch: 25, step: 963, loss: 0.3233568072319031, mean loss: 0.3501007827390833
Epoch: 25, step: 964, loss: 0.2884795069694519, mean loss: 0.3500991202198395
Epoch: 25, step: 965, loss: 0.3111627399921417, mean loss: 0.35009806975903374
Epoch: 25, step: 966, loss: 0.3504905104637146, mean loss: 0.35009808034636763
Epoch: 25, step: 967, loss: 0.2854251265525818, mean loss: 0.35009633563519377
Epoch: 25, step: 968, loss: 0.32032087445259094, mean loss: 0.3500955323909416
Epoch: 25, step: 969, loss: 0.3324250876903534, mean loss: 0.3500950557131779
Epoch: 25, step: 970, loss: 0.3601209223270416, mean loss: 0.3500953261635735
Epoch: 25, step: 971, loss: 0.2943914234638214, mean loss: 0.35009382357664265
Epoch: 25, step: 972, loss: 0.33759748935699463, mean loss: 0.35009348650291733
Epoch: 25, step: 973, loss: 0.3356046676635742, mean loss: 0.35009309569483515
Epoch: 25, step: 974, loss: 0.34207484126091003, mean loss: 0.3500928794236434
Epoch: 25, step: 975, loss: 0.335983544588089, mean loss: 0.35009249887194327
Epoch: 25, step: 976, loss: 0.3218880295753479, mean loss: 0.3500917381720674
Epoch: 25, step: 977, loss: 0.30987924337387085, mean loss: 0.3500906536342067
Epoch: 25, step: 978, loss: 0.3145683705806732, mean loss: 0.35008969561799663
Epoch: 25, step: 979, loss: 0.31996050477027893, mean loss: 0.35008888307239666
Epoch: 25, step: 980, loss: 0.3679351806640625, mean loss: 0.35008936435115373
Epoch: 25, step: 981, loss: 0.34399306774139404, mean loss: 0.3500891999507274
Epoch: 25, step: 982, loss: 0.3086692690849304, mean loss: 0.35008808299873145
Epoch: 25, step: 983, loss: 0.315334677696228, mean loss: 0.3500871458450991
Epoch: 25, step: 984, loss: 0.29948511719703674, mean loss: 0.35008578135733726
Epoch: 25, step: 985, loss: 0.33680248260498047, mean loss: 0.35008542318177904
Epoch: 25, step: 986, loss: 0.32108479738235474, mean loss: 0.35008464121974925
Epoch: 25, step: 987, loss: 0.3513771593570709, mean loss: 0.3500846760697853
Epoch: 25, step: 988, loss: 0.31149402260780334, mean loss: 0.3500836355819463
Epoch: 25, step: 989, loss: 0.3362520933151245, mean loss: 0.3500832626635783
Epoch: 25, step: 990, loss: 0.3150331676006317, mean loss: 0.35008231768784126
Epoch: 25, step: 991, loss: 0.32212895154953003, mean loss: 0.3500815640653313
Epoch: 25, step: 992, loss: 0.3652289807796478, mean loss: 0.3500819724285458
Epoch: 25, step: 993, loss: 0.39791807532310486, mean loss: 0.3500832620199324
Epoch: 25, step: 994, loss: 0.3028523623943329, mean loss: 0.3500819887782657
Epoch: 25, step: 995, loss: 0.32337450981140137, mean loss: 0.3500812688225032
Epoch: 25, step: 996, loss: 0.38860559463500977, mean loss: 0.35008230729800827
Epoch: 25, step: 997, loss: 0.33371078968048096, mean loss: 0.35008186599341995
Epoch: 25, step: 998, loss: 0.32526519894599915, mean loss: 0.35008119706253105
Epoch: 25, step: 999, loss: 0.313058465719223, mean loss: 0.3500801991452442
Epoch: 25, step: 1000, loss: 0.3071615993976593, mean loss: 0.3500790423408522
Epoch: 25, step: 1001, loss: 0.33793580532073975, mean loss: 0.35007871504752514
Epoch: 25, step: 1002, loss: 0.3350125253200531, mean loss: 0.3500783089836023
Epoch: 25, step: 1003, loss: 0.34441864490509033, mean loss: 0.35007815644845575
Epoch: 25, step: 1004, loss: 0.3465656042098999, mean loss: 0.35007806178325596
Epoch: 25, step: 1005, loss: 0.31008240580558777, mean loss: 0.3500769839075491
Epoch: 25, step: 1006, loss: 0.33050915598869324, mean loss: 0.3500764565723315
Epoch: 25, step: 1007, loss: 0.2965621054172516, mean loss: 0.35007501444796063
Epoch: 25, step: 1008, loss: 0.33555591106414795, mean loss: 0.35007462319237886
Epoch: 25, step: 1009, loss: 0.3296266794204712, mean loss: 0.35007407218338477
Epoch: 25, step: 1010, loss: 0.3483937084674835, mean loss: 0.35007402690398737
Epoch: 25, step: 1011, loss: 0.3481348156929016, mean loss: 0.3500739746510446
Epoch: 25, step: 1012, loss: 0.3438093662261963, mean loss: 0.3500738058528223
Epoch: 25, step: 1013, loss: 0.3365304172039032, mean loss: 0.3500734409396184
Epoch: 25, step: 1014, loss: 0.35834771394729614, mean loss: 0.35007366387570915
Epoch: 25, step: 1015, loss: 0.32573774456977844, mean loss: 0.35007300820378046
Epoch: 25, step: 1016, loss: 0.3544374108314514, mean loss: 0.35007312578878536
Epoch: 25, step: 1017, loss: 0.31576111912727356, mean loss: 0.3500722013853514
Epoch: 25, step: 1018, loss: 0.37081050872802734, mean loss: 0.35007276008325117
Epoch: 25, step: 1019, loss: 0.32979264855384827, mean loss: 0.3500722137440397
Epoch: 25, step: 1020, loss: 0.36054113507270813, mean loss: 0.35007249576557276
Epoch: 25, step: 1021, loss: 0.3112725019454956, mean loss: 0.3500714505634333
Epoch: 25, step: 1022, loss: 0.39136356115341187, mean loss: 0.3500725628687586
Epoch: 25, step: 1023, loss: 0.33486443758010864, mean loss: 0.3500721532112516
Epoch: 25, step: 1024, loss: 0.3153935968875885, mean loss: 0.3500712191087244
Epoch: 25, step: 1025, loss: 0.312019944190979, mean loss: 0.35007019418616564
Epoch: 25, step: 1026, loss: 0.3108042776584625, mean loss: 0.35006913657535604
Epoch: 25, step: 1027, loss: 0.3056444525718689, mean loss: 0.3500679400475602
Epoch: 25, step: 1028, loss: 0.3481099009513855, mean loss: 0.3500678873114484
Epoch: 25, step: 1029, loss: 0.40728652477264404, mean loss: 0.35006942834666144
Epoch: 25, step: 1030, loss: 0.3687642216682434, mean loss: 0.35006993182874707
Epoch: 25, step: 1031, loss: 0.3179413378238678, mean loss: 0.35006906657521897
Epoch: 25, step: 1032, loss: 0.34581005573272705, mean loss: 0.35006895187910386
Epoch: 25, step: 1033, loss: 0.30784496665000916, mean loss: 0.3500678148083539
Epoch: 25, step: 1034, loss: 0.3636051416397095, mean loss: 0.35006817935196055
Epoch: 25, step: 1035, loss: 0.3129408061504364, mean loss: 0.3500671795842634
Epoch: 25, step: 1036, loss: 0.32276439666748047, mean loss: 0.3500664443934048
Epoch: 25, step: 1037, loss: 0.3546750247478485, mean loss: 0.3500665684867958
Epoch: 25, step: 1038, loss: 0.3236965835094452, mean loss: 0.3500658584519274
Epoch: 25, step: 1039, loss: 0.343464732170105, mean loss: 0.3500656807156247
Epoch: 25, step: 1040, loss: 0.32059943675994873, mean loss: 0.350064887354004
Epoch: 25, step: 1041, loss: 0.3210262954235077, mean loss: 0.35006410552771755
Epoch: 25, step: 1042, loss: 0.3021019995212555, mean loss: 0.3500628142452146
Epoch: 25, step: 1043, loss: 0.3302696645259857, mean loss: 0.3500622813691184
Epoch: 25, step: 1044, loss: 0.30438968539237976, mean loss: 0.3500610517932407
Epoch: 25, step: 1045, loss: 0.3519649803638458, mean loss: 0.35006110304851906
Epoch: 25, step: 1046, loss: 0.346184104681015, mean loss: 0.35006099867943496
Epoch: 25, step: 1047, loss: 0.32560545206069946, mean loss: 0.35006034035202516
Epoch: 25, step: 1048, loss: 0.3207034468650818, mean loss: 0.3500595501048183
Epoch: 25, step: 1049, loss: 0.35543936491012573, mean loss: 0.35005969491813743
Epoch: 25, step: 1050, loss: 0.33527812361717224, mean loss: 0.3500592970399834
Epoch: 25, step: 1051, loss: 0.32081568241119385, mean loss: 0.3500585099056534
Epoch: 25, step: 1052, loss: 0.36483484506607056, mean loss: 0.3500589076214546
Epoch: 25, step: 1053, loss: 0.40197283029556274, mean loss: 0.3500603048848091
Epoch: 25, step: 1054, loss: 0.3477759063243866, mean loss: 0.35006024340187114
Epoch: 25, step: 1055, loss: 0.3195823132991791, mean loss: 0.3500594231324637
Epoch: 25, step: 1056, loss: 0.3330886662006378, mean loss: 0.3500589664013785
Epoch: 25, step: 1057, loss: 0.32224270701408386, mean loss: 0.35005821780728336
Epoch: 25, step: 1058, loss: 0.3485250473022461, mean loss: 0.350058176547548
Epoch: 25, step: 1059, loss: 0.3501460552215576, mean loss: 0.3500581789124208
Epoch: 25, step: 1060, loss: 0.3316950500011444, mean loss: 0.3500576847618621
Epoch: 25, step: 1061, loss: 0.327932208776474, mean loss: 0.3500570893828194
Epoch: 25, step: 1062, loss: 0.3278639018535614, mean loss: 0.3500564921977824
Epoch: 25, step: 1063, loss: 0.3105356991291046, mean loss: 0.35005542878175966
Epoch: 25, step: 1064, loss: 0.33786725997924805, mean loss: 0.3500551008342606
Epoch: 25, step: 1065, loss: 0.30235451459884644, mean loss: 0.3500538173873943
Epoch: 25, step: 1066, loss: 0.3613432049751282, mean loss: 0.3500541211350088
Epoch: 25, step: 1067, loss: 0.340768039226532, mean loss: 0.3500538712942342
Epoch: 25, step: 1068, loss: 0.31965845823287964, mean loss: 0.35005305353176924
Epoch: 25, step: 1069, loss: 0.3157162070274353, mean loss: 0.35005212975327843
Epoch: 25, step: 1070, loss: 0.3484782874584198, mean loss: 0.3500520874126824
Epoch: 25, step: 1071, loss: 0.35413238406181335, mean loss: 0.3500521971806973
Epoch: 25, step: 1072, loss: 0.3443133234977722, mean loss: 0.3500520427978473
Epoch: 25, step: 1073, loss: 0.32413923740386963, mean loss: 0.3500513457298591
Epoch: 25, step: 1074, loss: 0.3272896111011505, mean loss: 0.35005073344378973
Epoch: 25, step: 1075, loss: 0.34583917260169983, mean loss: 0.35005062015670013
Epoch: 25, step: 1076, loss: 0.3514229357242584, mean loss: 0.35005065706972616
Epoch: 25, step: 1077, loss: 0.338662326335907, mean loss: 0.3500503507506468
Epoch: 25, step: 1078, loss: 0.32633471488952637, mean loss: 0.35004971287346176
Epoch: 25, step: 1079, loss: 0.2996219992637634, mean loss: 0.3500483565605621
Epoch: 25, step: 1080, loss: 0.33082231879234314, mean loss: 0.35004783946748314
Epoch: 25, step: 1081, loss: 0.33280932903289795, mean loss: 0.35004737584233026
Epoch: 25, step: 1082, loss: 0.3411226272583008, mean loss: 0.3500471358200463
Epoch: 25, step: 1083, loss: 0.3236808478832245, mean loss: 0.35004642674388625
Epoch: 25, step: 1084, loss: 0.3331853449344635, mean loss: 0.3500459733061611
Epoch: 25, step: 1085, loss: 0.3012572228908539, mean loss: 0.3500446612868416
Epoch: 25, step: 1086, loss: 0.3086603283882141, mean loss: 0.3500435484158679
Epoch: 25, step: 1087, loss: 0.309506356716156, mean loss: 0.350042458354781
Epoch: 25, step: 1088, loss: 0.3143496513366699, mean loss: 0.350041498586919
Epoch: 25, step: 1089, loss: 0.3041861057281494, mean loss: 0.35004026558361545
Epoch: 25, step: 1090, loss: 0.3128577172756195, mean loss: 0.3500392658108665
Epoch: 25, step: 1091, loss: 0.38335949182510376, mean loss: 0.350040161708533
Epoch: 25, step: 1092, loss: 0.3359970152378082, mean loss: 0.3500397841335466
Epoch: 25, step: 1093, loss: 0.3490295112133026, mean loss: 0.35003975697129136
Epoch: 25, step: 1094, loss: 0.36638692021369934, mean loss: 0.35004019647023593
Epoch: 25, step: 1095, loss: 0.31027692556381226, mean loss: 0.35003912745015564
Epoch: 25, step: 1096, loss: 0.29056316614151, mean loss: 0.35003752850504427
Epoch: 25, step: 1097, loss: 0.32341623306274414, mean loss: 0.3500368128403461
Epoch: 25, step: 1098, loss: 0.31396207213401794, mean loss: 0.3500358430631826
Epoch: 25, step: 1099, loss: 0.30036666989326477, mean loss: 0.35003450787035545
Epoch: 25, step: 1100, loss: 0.32301825284957886, mean loss: 0.35003378164646304
Epoch: 25, step: 1101, loss: 0.31578537821769714, mean loss: 0.35003286103995185
Epoch: 25, step: 1102, loss: 0.3020675778388977, mean loss: 0.3500315717545931
Epoch: 25, step: 1103, loss: 0.3212936818599701, mean loss: 0.3500307993137294
Epoch: 25, step: 1104, loss: 0.32052189111709595, mean loss: 0.35003000617011437
Epoch: 25, step: 1105, loss: 0.3155052661895752, mean loss: 0.35002907823537316
Epoch: 25, step: 1106, loss: 0.2831597328186035, mean loss: 0.3500272810105118
Epoch: 25, step: 1107, loss: 0.339463472366333, mean loss: 0.35002699709821755
Epoch: 25, step: 1108, loss: 0.3881901502609253, mean loss: 0.35002802274129213
Epoch: 25, step: 1109, loss: 0.367369681596756, mean loss: 0.3500284887896355
Epoch: 25, step: 1110, loss: 0.2978024184703827, mean loss: 0.3500270852780309
Epoch: 25, step: 1111, loss: 0.33388715982437134, mean loss: 0.35002665154897966
Epoch: 25, step: 1112, loss: 0.3097529113292694, mean loss: 0.35002556929975975
Epoch: 25, step: 1113, loss: 0.3336726129055023, mean loss: 0.3500251298695347
Epoch: 25, step: 1114, loss: 0.3941091001033783, mean loss: 0.35002631444484666
Epoch: 25, step: 1115, loss: 0.33182674646377563, mean loss: 0.35002582541948174
Epoch: 25, step: 1116, loss: 0.32335466146469116, mean loss: 0.3500251087802052
Epoch: 25, step: 1117, loss: 0.34575027227401733, mean loss: 0.3500249939208225
Epoch: 25, step: 1118, loss: 0.3452903926372528, mean loss: 0.3500248667115669
Epoch: 25, step: 1119, loss: 0.30902209877967834, mean loss: 0.35002376507889815
Epoch: 25, step: 1120, loss: 0.29945579171180725, mean loss: 0.35002240649171973
Epoch: 25, step: 1121, loss: 0.3535284698009491, mean loss: 0.3500225006850277
Epoch: 25, step: 1122, loss: 0.3027379512786865, mean loss: 0.3500212303803933
Epoch: 25, step: 1123, loss: 0.2929283678531647, mean loss: 0.35001969661555
Epoch: 25, step: 1124, loss: 0.3655039668083191, mean loss: 0.3500201125798265
Epoch: 25, step: 1125, loss: 0.3389335870742798, mean loss: 0.3500198147630988
Epoch: 25, step: 1126, loss: 0.31501665711402893, mean loss: 0.3500188745004494
Epoch: 25, step: 1127, loss: 0.32890525460243225, mean loss: 0.35001830735690426
Epoch: 25, step: 1128, loss: 0.3183400332927704, mean loss: 0.35001745645373566
Epoch: 25, step: 1129, loss: 0.32263055443763733, mean loss: 0.3500167208399292
Epoch: 25, step: 1130, loss: 0.3087332248687744, mean loss: 0.3500156119925716
Epoch: 25, step: 1131, loss: 0.34555986523628235, mean loss: 0.3500154923173794
Epoch: 25, step: 1132, loss: 0.3736739456653595, mean loss: 0.3500161277336324
Epoch: 25, step: 1133, loss: 0.29642871022224426, mean loss: 0.35001468852706014
Epoch: 25, step: 1134, loss: 0.31947338581085205, mean loss: 0.3500138682960217
Epoch: 25, step: 1135, loss: 0.30979254841804504, mean loss: 0.35001278812307407
Epoch: 25, step: 1136, loss: 0.34232497215270996, mean loss: 0.35001258166670085
Epoch: 25, step: 1137, loss: 0.3001164197921753, mean loss: 0.35001124174076836
Epoch: 25, step: 1138, loss: 0.3174223005771637, mean loss: 0.3500103666114372
Epoch: 25, step: 1139, loss: 0.38543689250946045, mean loss: 0.3500113179144957
Epoch: 25, step: 1140, loss: 0.3307890295982361, mean loss: 0.3500108017552004
Epoch: 25, step: 1141, loss: 0.3394569456577301, mean loss: 0.3500105183693431
Epoch: 25, step: 1142, loss: 0.30104655027389526, mean loss: 0.3500092036533402
Epoch: 25, step: 1143, loss: 0.33736950159072876, mean loss: 0.35000886427781497
Epoch: 25, step: 1144, loss: 0.3044266104698181, mean loss: 0.35000764042887395
Epoch: 25, step: 1145, loss: 0.2824743688106537, mean loss: 0.35000582726043655
Epoch: 25, step: 1146, loss: 0.3304671049118042, mean loss: 0.35000530268873015
Epoch: 25, step: 1147, loss: 0.3057461082935333, mean loss: 0.35000411445864005
Epoch: 25, step: 1148, loss: 0.30672144889831543, mean loss: 0.3500029524766926
Epoch: 25, step: 1149, loss: 0.32713010907173157, mean loss: 0.35000233844062806
Epoch: 25, step: 1150, loss: 0.3514479100704193, mean loss: 0.3500023772468783
Epoch: 25, step: 1151, loss: 0.3244803845882416, mean loss: 0.35000169212949783
Epoch: 25, step: 1152, loss: 0.3372584581375122, mean loss: 0.35000135005680594
Epoch: 25, step: 1153, loss: 0.36704063415527344, mean loss: 0.35000180743813675
Epoch: 25, step: 1154, loss: 0.332937628030777, mean loss: 0.3500013494008422
Epoch: 25, step: 1155, loss: 0.3140639364719391, mean loss: 0.350000384793452
Epoch: 25, step: 1156, loss: 0.3653239905834198, mean loss: 0.3500007960881293
Epoch: 25, step: 1157, loss: 0.3247333765029907, mean loss: 0.3500001179137886
Epoch: 25, step: 1158, loss: 0.3354150354862213, mean loss: 0.34999972646253047
Epoch: 25, step: 1159, loss: 0.35782289505004883, mean loss: 0.3499999364241136
Epoch: 25, step: 1160, loss: 0.3330160081386566, mean loss: 0.3499994806143316
Epoch: 25, step: 1161, loss: 0.3340756297111511, mean loss: 0.34999905326607056
Epoch: 25, step: 1162, loss: 0.33989202976226807, mean loss: 0.3499987820312397
Epoch: 25, step: 1163, loss: 0.3069198429584503, mean loss: 0.34999762598414136
Epoch: 25, step: 1164, loss: 0.30664902925491333, mean loss: 0.34999646273184754
Epoch: 25, step: 1165, loss: 0.4188567101955414, mean loss: 0.3499983105354075
Epoch: 25, step: 1166, loss: 0.37218591570854187, mean loss: 0.34999890590410293
Epoch: 25, step: 1167, loss: 0.34499552845954895, mean loss: 0.3499987716501198
Epoch: 25, step: 1168, loss: 0.29259592294692993, mean loss: 0.3499972314196681
Epoch: 25, step: 1169, loss: 0.3239319622516632, mean loss: 0.3499965320563955
Epoch: 25, step: 1170, loss: 0.31426912546157837, mean loss: 0.3499955734717964
Epoch: 25, step: 1171, loss: 0.39220130443573, mean loss: 0.3499967058427709
Epoch: 25, step: 1172, loss: 0.3206178843975067, mean loss: 0.3499959176362556
Epoch: 25, step: 1173, loss: 0.31897634267807007, mean loss: 0.34999508543217345
Epoch: 25, step: 1174, loss: 0.327300101518631, mean loss: 0.3499944765794863
Epoch: 25, step: 1175, loss: 0.3215704560279846, mean loss: 0.3499937140507667
Epoch: 25, step: 1176, loss: 0.3715382218360901, mean loss: 0.34999429200789267
Epoch: 25, step: 1177, loss: 0.33797547221183777, mean loss: 0.3499939695973611
Epoch: 25, step: 1178, loss: 0.34537652134895325, mean loss: 0.3499938457354483
Epoch: 25, step: 1179, loss: 0.333118736743927, mean loss: 0.34999339307694527
Epoch: 25, step: 1180, loss: 0.2835077941417694, mean loss: 0.3499916097127937
Epoch: 25, step: 1181, loss: 0.3254110515117645, mean loss: 0.3499909503984275
Epoch: 25, step: 1182, loss: 0.38369932770729065, mean loss: 0.3499918545203412
Epoch: 25, step: 1183, loss: 0.3405153155326843, mean loss: 0.34999160034860566
Epoch: 25, step: 1184, loss: 0.3769439458847046, mean loss: 0.3499923232222958
Epoch: 25, step: 1185, loss: 0.3312862515449524, mean loss: 0.3499918215307312
Epoch: 25, step: 1186, loss: 0.3141772449016571, mean loss: 0.3499908610196515
Epoch: 25, step: 1187, loss: 0.36222851276397705, mean loss: 0.3499911892124144
Epoch: 25, step: 1188, loss: 0.3838180899620056, mean loss: 0.34999209636735956
Epoch: 25, step: 1189, loss: 0.31162118911743164, mean loss: 0.34999106738084174
Epoch: 25, step: 1190, loss: 0.33889302611351013, mean loss: 0.3499907697744148
Epoch: 25, step: 1191, loss: 0.29397010803222656, mean loss: 0.3499892675578069
Epoch: 25, step: 1192, loss: 0.3098381757736206, mean loss: 0.34998819091897965
Epoch: 25, step: 1193, loss: 0.30980807542800903, mean loss: 0.3499871135307807
Epoch: 25, step: 1194, loss: 0.3214704096317291, mean loss: 0.34998634890539126
Epoch: 25, step: 1195, loss: 0.3036579489707947, mean loss: 0.34998510672392585
Epoch: 25, step: 1196, loss: 0.3492809236049652, mean loss: 0.34998508784350335
Epoch: 25, step: 1197, loss: 0.3638782203197479, mean loss: 0.3499854603335156
Epoch: 25, step: 1198, loss: 0.35868313908576965, mean loss: 0.34998569352150327
Epoch: 25, step: 1199, loss: 0.3056272864341736, mean loss: 0.3499845042880693
Epoch: 25, step: 1200, loss: 0.32019054889678955, mean loss: 0.3499837055439233
Epoch: 25, step: 1201, loss: 0.311322420835495, mean loss: 0.3499826691039279
Epoch: 25, step: 1202, loss: 0.32484886050224304, mean loss: 0.34998199532947005
Epoch: 25, step: 1203, loss: 0.3098418712615967, mean loss: 0.3499809193021253
Epoch: 25, step: 1204, loss: 0.32425007224082947, mean loss: 0.3499802295595423
Epoch: 25, step: 1205, loss: 0.3123869299888611, mean loss: 0.3499792218583797
Epoch: 25, step: 1206, loss: 0.30901986360549927, mean loss: 0.3499781239583006
Epoch: 25, step: 1207, loss: 0.2985868752002716, mean loss: 0.3499767464722719
Epoch: 25, step: 1208, loss: 0.34128329157829285, mean loss: 0.34997651345999886
Epoch: 25, step: 1209, loss: 0.33103013038635254, mean loss: 0.349976005650214
Epoch: 25, step: 1210, loss: 0.36457377672195435, mean loss: 0.3499763968959879
Epoch: 25, step: 1211, loss: 0.3148272633552551, mean loss: 0.34997545486303494
Epoch: 25, step: 1212, loss: 0.32423272728919983, mean loss: 0.34997476494993296
Epoch: 25, step: 1213, loss: 0.35232019424438477, mean loss: 0.34997482780648265
Epoch: 25, step: 1214, loss: 0.3536235988140106, mean loss: 0.34997492558943877
Epoch: 25, step: 1215, loss: 0.29200732707977295, mean loss: 0.34997337216467433
Epoch: 25, step: 1216, loss: 0.34727492928504944, mean loss: 0.34997329985331815
Epoch: 25, step: 1217, loss: 0.3251666724681854, mean loss: 0.34997263511706794
Epoch: 25, step: 1218, loss: 0.30035465955734253, mean loss: 0.3499713055536938
Epoch: 25, step: 1219, loss: 0.3443185091018677, mean loss: 0.34997115408540735
Epoch: 25, step: 1220, loss: 0.30568814277648926, mean loss: 0.3499699675413354
Epoch: 25, step: 1221, loss: 0.37738218903541565, mean loss: 0.3499707020202351
Epoch: 25, step: 1222, loss: 0.3423100709915161, mean loss: 0.3499704967679502
Epoch: 25, step: 1223, loss: 0.32271745800971985, mean loss: 0.349969766593297
Epoch: 25, step: 1224, loss: 0.35873115062713623, mean loss: 0.34997000132562206
Epoch: 25, step: 1225, loss: 0.3540397882461548, mean loss: 0.349970110359189
Epoch: 25, step: 1226, loss: 0.3757161498069763, mean loss: 0.3499708001022556
Epoch: 25, step: 1227, loss: 0.31135252118110657, mean loss: 0.34996976553627507
Epoch: 25, step: 1228, loss: 0.3218673765659332, mean loss: 0.3499690127063313
Epoch: 25, step: 1229, loss: 0.32458099722862244, mean loss: 0.3499683326094795
Epoch: 25, step: 1230, loss: 0.3814984858036041, mean loss: 0.34996917721994253
Epoch: 25, step: 1231, loss: 0.3144698143005371, mean loss: 0.349968226310189
Epoch: 25, step: 1232, loss: 0.32356560230255127, mean loss: 0.3499675190907315
Epoch: 25, step: 1233, loss: 0.320178359746933, mean loss: 0.34996672118106886
Epoch: 25, step: 1234, loss: 0.37219467759132385, mean loss: 0.34996731654617963
Epoch: 25, step: 1235, loss: 0.30529195070266724, mean loss: 0.34996611997006427
Epoch: 25, step: 1236, loss: 0.35731345415115356, mean loss: 0.3499663167543314
Epoch: 25, step: 1237, loss: 0.32052284479141235, mean loss: 0.34996552818847454
Epoch: 25, step: 1238, loss: 0.3549846410751343, mean loss: 0.34996566260859524
Epoch: 25, step: 1239, loss: 0.3395799696445465, mean loss: 0.3499653844700584
Epoch: 25, step: 1240, loss: 0.3709148168563843, mean loss: 0.3499659455003572
Epoch: 25, step: 1241, loss: 0.31298384070396423, mean loss: 0.34996495513816994
Epoch: 25, step: 1242, loss: 0.3094666302204132, mean loss: 0.3499638706424166
Epoch: 25, step: 1243, loss: 0.28336581587791443, mean loss: 0.34996208727548306
Epoch: 25, step: 1244, loss: 0.31523555517196655, mean loss: 0.3499611573911049
Epoch: 25, step: 1245, loss: 0.32660111784935, mean loss: 0.3499605318879843
Epoch: 25, step: 1246, loss: 0.3180343210697174, mean loss: 0.34995967703456055
Epoch: 25, step: 1247, loss: 0.35095900297164917, mean loss: 0.3499597037917078
Epoch: 25, step: 1248, loss: 0.34525078535079956, mean loss: 0.34995957771287195
Epoch: 25, step: 1249, loss: 0.3471784293651581, mean loss: 0.3499595032510688
Epoch: 25, step: 1250, loss: 0.3532615303993225, mean loss: 0.3499595916563899
Epoch: 25, step: 1251, loss: 0.3269151449203491, mean loss: 0.3499589747029005
Epoch: 25, step: 1252, loss: 0.34334248304367065, mean loss: 0.3499587975687571
Epoch: 25, step: 1253, loss: 0.317443311214447, mean loss: 0.3499579271000963
Epoch: 25, step: 1254, loss: 0.29943564534187317, mean loss: 0.3499565746096196
Epoch: 25, step: 1255, loss: 0.3373841345310211, mean loss: 0.34995623805217024
Epoch: 25, step: 1256, loss: 0.29337018728256226, mean loss: 0.3499547233146172
Epoch: 25, step: 1257, loss: 0.33877259492874146, mean loss: 0.34995442399108845
Epoch: 25, step: 1258, loss: 0.3421700894832611, mean loss: 0.3499542156253798
Epoch: 25, step: 1259, loss: 0.31353068351745605, mean loss: 0.3499532406914369
Epoch: 25, step: 1260, loss: 0.37687763571739197, mean loss: 0.3499539613465325
Epoch: 25, step: 1261, loss: 0.32350024580955505, mean loss: 0.3499532533085384
Epoch: 25, step: 1262, loss: 0.37352457642555237, mean loss: 0.3499538841819457
Epoch: 25, step: 1263, loss: 0.365720272064209, mean loss: 0.3499543061492908
Epoch: 25, step: 1264, loss: 0.30904489755630493, mean loss: 0.3499532112902357
Epoch: 25, step: 1265, loss: 0.3341952860355377, mean loss: 0.3499527895719556
Epoch: 25, step: 1266, loss: 0.3325801491737366, mean loss: 0.3499523246526311
Epoch: 25, step: 1267, loss: 0.3421002924442291, mean loss: 0.3499521145254579
Epoch: 25, step: 1268, loss: 0.30286210775375366, mean loss: 0.34995085438987034
Epoch: 25, step: 1269, loss: 0.32411864399909973, mean loss: 0.3499501631345749
Epoch: 25, step: 1270, loss: 0.2960720658302307, mean loss: 0.3499487214258354
Epoch: 25, step: 1271, loss: 0.35501646995544434, mean loss: 0.3499488570286538
Epoch: 25, step: 1272, loss: 0.3539022207260132, mean loss: 0.34994896280993165
Epoch: 25, step: 1273, loss: 0.43433254957199097, mean loss: 0.3499512206251712
Epoch: 25, step: 1274, loss: 0.3220237195491791, mean loss: 0.34995047340106217
Epoch: 25, step: 1275, loss: 0.30354467034339905, mean loss: 0.3499492318074444
Epoch: 25, step: 1276, loss: 0.3142126500606537, mean loss: 0.34994827569588527
Epoch: 25, step: 1277, loss: 0.3575895428657532, mean loss: 0.34994848012809593
Epoch: 25, step: 1278, loss: 0.32880762219429016, mean loss: 0.3499479145469425
Epoch: 25, step: 1279, loss: 0.34897908568382263, mean loss: 0.34994788862856735
Epoch: 25, step: 1280, loss: 0.32412299513816833, mean loss: 0.3499471977724241
Epoch: 25, step: 1281, loss: 0.3245564103126526, mean loss: 0.349946518547464
Epoch: 25, step: 1282, loss: 0.3725167512893677, mean loss: 0.34994712230405767
Epoch: 25, step: 1283, loss: 0.32395440340042114, mean loss: 0.3499464270141234
Epoch: 25, step: 1284, loss: 0.33441007137298584, mean loss: 0.3499460114368694
Epoch: 25, step: 1285, loss: 0.39503803849220276, mean loss: 0.349947217557531
Epoch: 25, step: 1286, loss: 0.31085309386253357, mean loss: 0.34994617189664096
Epoch: 25, step: 1287, loss: 0.3220285177230835, mean loss: 0.34994542519571625
Epoch: 25, step: 1288, loss: 0.3345752954483032, mean loss: 0.3499450141087723
Epoch: 25, step: 1289, loss: 0.32830971479415894, mean loss: 0.3499444354701172
Epoch: 25, step: 1290, loss: 0.3270694613456726, mean loss: 0.3499438236925738
Epoch: 25, step: 1291, loss: 0.35030460357666016, mean loss: 0.34994383334115864
Epoch: 25, step: 1292, loss: 0.3518100082874298, mean loss: 0.3499438832482254
Epoch: 25, step: 1293, loss: 0.32663729786872864, mean loss: 0.34994325997750336
Epoch: 25, step: 1294, loss: 0.3229105770587921, mean loss: 0.349942537081851
Epoch: 25, step: 1295, loss: 0.3685700297355652, mean loss: 0.3499430351964262
Epoch: 25, step: 1296, loss: 0.3363009989261627, mean loss: 0.34994267040683696
Epoch: 25, step: 1297, loss: 0.33411139249801636, mean loss: 0.3499422470879988
Epoch: 25, step: 1298, loss: 0.3550397455692291, mean loss: 0.34994238338839406
Epoch: 25, step: 1299, loss: 0.2807818353176117, mean loss: 0.3499405341758788
Epoch: 25, step: 1300, loss: 0.3696040213108063, mean loss: 0.34994105992350943
Epoch: 25, step: 1301, loss: 0.3224417567253113, mean loss: 0.3499403246873403
Epoch: 25, step: 1302, loss: 0.31608453392982483, mean loss: 0.34993941952489993
Epoch: 25, step: 1303, loss: 0.3182573616504669, mean loss: 0.34993857250164373
Epoch: 25, step: 1304, loss: 0.3430149257183075, mean loss: 0.3499383874021441
Epoch: 25, step: 1305, loss: 0.32300376892089844, mean loss: 0.34993766734069726
Epoch: 25, step: 1306, loss: 0.32886528968811035, mean loss: 0.34993710401357525
Epoch: 25, step: 1307, loss: 0.3536575734615326, mean loss: 0.3499372034700939
Epoch: 25, step: 1308, loss: 0.3252463936805725, mean loss: 0.34993654344684305
Epoch: 25, step: 1309, loss: 0.3303363025188446, mean loss: 0.34993601951631836
Epoch: 25, step: 1310, loss: 0.31828466057777405, mean loss: 0.34993517347213515
Epoch: 25, step: 1311, loss: 0.3035064935684204, mean loss: 0.34993393246176674
Epoch: 25, step: 1312, loss: 0.3060090243816376, mean loss: 0.3499327584070777
Epoch: 25, step: 1313, loss: 0.3117557466030121, mean loss: 0.3499317380133266
Epoch: 25, step: 1314, loss: 0.30231747031211853, mean loss: 0.349930465414965
Epoch: 25, step: 1315, loss: 0.34598368406295776, mean loss: 0.34993035993117855
Epoch: 25, step: 1316, loss: 0.3043847680091858, mean loss: 0.3499291426878955
Epoch: 25, step: 1317, loss: 0.3583459258079529, mean loss: 0.34992936762731286
Epoch: 25, step: 1318, loss: 0.32429206371307373, mean loss: 0.34992868248596987
Epoch: 25, step: 1319, loss: 0.3411734104156494, mean loss: 0.34992844851290544
Epoch: 25, step: 1320, loss: 0.352856308221817, mean loss: 0.3499285267539922
Epoch: 25, step: 1321, loss: 0.31808626651763916, mean loss: 0.3499276758571872
Epoch: 25, step: 1322, loss: 0.3166441023349762, mean loss: 0.34992678646901626
Epoch: 25, step: 1323, loss: 0.36038026213645935, mean loss: 0.349927065794467
Epoch: 25, step: 1324, loss: 0.31007248163223267, mean loss: 0.34992600087571846
Epoch: 25, step: 1325, loss: 0.36080554127693176, mean loss: 0.34992629157043337
Epoch: 25, step: 1326, loss: 0.28836268186569214, mean loss: 0.3499246466721058
Epoch: 25, step: 1327, loss: 0.3221188485622406, mean loss: 0.34992390375776067
Epoch: 25, step: 1328, loss: 0.39382004737854004, mean loss: 0.3499250765420622
Epoch: 25, step: 1329, loss: 0.31571483612060547, mean loss: 0.34992416256288983
Epoch: 25, step: 1330, loss: 0.3404124975204468, mean loss: 0.3499239084509227
Epoch: 25, step: 1331, loss: 0.37928134202957153, mean loss: 0.349924692737992
Epoch: 25, step: 1332, loss: 0.34511637687683105, mean loss: 0.34992456428673613
Epoch: 25, step: 1333, loss: 0.3173793852329254, mean loss: 0.3499236948851479
Epoch: 25, step: 1334, loss: 0.34687697887420654, mean loss: 0.34992361349831713
Epoch: 25, step: 1335, loss: 0.3715693950653076, mean loss: 0.3499241917059666
Epoch: 25, step: 1336, loss: 0.2948527932167053, mean loss: 0.3499227206639897
Epoch: 25, step: 1337, loss: 0.32254764437675476, mean loss: 0.34992198945301994
Epoch: 25, step: 1338, loss: 0.3181414306163788, mean loss: 0.34992114059063484
Epoch: 25, step: 1339, loss: 0.32965341210365295, mean loss: 0.34992059925173297
Epoch: 25, step: 1340, loss: 0.3728609085083008, mean loss: 0.34992121195730325
Epoch: 25, step: 1341, loss: 0.3227216303348541, mean loss: 0.34992048551155724
Epoch: 25, step: 1342, loss: 0.31108444929122925, mean loss: 0.34991944830737437
Epoch: 25, step: 1343, loss: 0.33409982919692993, mean loss: 0.3499190258199502
Epoch: 25, step: 1344, loss: 0.32931187748908997, mean loss: 0.3499184754888424
Epoch: 25, step: 1345, loss: 0.3081533908843994, mean loss: 0.34991736014716096
Epoch: 25, step: 1346, loss: 0.34294188022613525, mean loss: 0.3499171738710929
Epoch: 25, step: 1347, loss: 0.3696688115596771, mean loss: 0.34991770131281713
Epoch: 25, step: 1348, loss: 0.3408644199371338, mean loss: 0.34991745956320097
Epoch: 25, step: 1349, loss: 0.31530117988586426, mean loss: 0.34991653522996524
Epoch: 25, step: 1350, loss: 0.3651772439479828, mean loss: 0.34991694271464435
Epoch: 25, step: 1351, loss: 0.30091848969459534, mean loss: 0.34991563441460644
Epoch: 25, step: 1352, loss: 0.343416690826416, mean loss: 0.34991546089196235
Epoch: 25, step: 1353, loss: 0.3633948564529419, mean loss: 0.3499158207839782
Epoch: 25, step: 1354, loss: 0.3664116859436035, mean loss: 0.3499162612022177
Epoch: 25, step: 1355, loss: 0.295937180519104, mean loss: 0.34991482006913666
Epoch: 25, step: 1356, loss: 0.3056066334247589, mean loss: 0.3499136371610916
Epoch: 25, step: 1357, loss: 0.34403032064437866, mean loss: 0.34991348009673906
Epoch: 25, step: 1358, loss: 0.32405951619148254, mean loss: 0.3499127899030899
Epoch: 25, step: 1359, loss: 0.3183963894844055, mean loss: 0.34991194856832164
Epoch: 25, step: 1360, loss: 0.3508625626564026, mean loss: 0.3499119739444218
Epoch: 25, step: 1361, loss: 0.2984130382537842, mean loss: 0.34991059924644274
Epoch: 25, step: 1362, loss: 0.3460019528865814, mean loss: 0.34991049491293075
Epoch: 25, step: 1363, loss: 0.3391750752925873, mean loss: 0.3499102083599834
Epoch: 25, step: 1364, loss: 0.36110806465148926, mean loss: 0.349910507248447
Epoch: 25, step: 1365, loss: 0.3109798729419708, mean loss: 0.3499094681560884
Epoch: 25, step: 1366, loss: 0.3375912308692932, mean loss: 0.3499091393804382
Epoch: 25, step: 1367, loss: 0.3194126486778259, mean loss: 0.3499083254461289
Epoch: 25, step: 1368, loss: 0.3459952175617218, mean loss: 0.34990822101025165
Epoch: 25, step: 1369, loss: 0.338809072971344, mean loss: 0.3499079247959992
Epoch: 25, step: 1370, loss: 0.343279629945755, mean loss: 0.3499077479046739
Epoch: 25, step: 1371, loss: 0.375482439994812, mean loss: 0.349908430406064
Epoch: 25, step: 1372, loss: 0.3558013141155243, mean loss: 0.3499085876628545
Epoch: 25, step: 1373, loss: 0.33440902829170227, mean loss: 0.3499081740545028
Epoch: 25, step: 1374, loss: 0.3686100244522095, mean loss: 0.34990867310321255
Epoch: 25, step: 1375, loss: 0.31394901871681213, mean loss: 0.3499077135649911
Epoch: 25, step: 1376, loss: 0.3364087641239166, mean loss: 0.3499073533720877
Epoch: 25, step: 1377, loss: 0.3441031873226166, mean loss: 0.34990719850347013
Epoch: 25, step: 1378, loss: 0.3160657286643982, mean loss: 0.3499062955586253
Epoch: 25, step: 1379, loss: 0.3015669286251068, mean loss: 0.34990500582098033
Epoch: 25, step: 1380, loss: 0.3564656376838684, mean loss: 0.3499051808598497
Epoch: 25, step: 1381, loss: 0.3202723562717438, mean loss: 0.34990439027171166
Epoch: 25, step: 1382, loss: 0.3102256953716278, mean loss: 0.34990333169329213
Epoch: 25, step: 1383, loss: 0.3426625728607178, mean loss: 0.34990313852397104
Epoch: 25, step: 1384, loss: 0.36803632974624634, mean loss: 0.34990362226923505
Epoch: 25, step: 1385, loss: 0.3563788831233978, mean loss: 0.3499037950073467
Epoch: 25, step: 1386, loss: 0.34524768590927124, mean loss: 0.34990367080137935
Epoch: 25, step: 1387, loss: 0.32943785190582275, mean loss: 0.34990312487151126
Epoch: 25, step: 1388, loss: 0.29477113485336304, mean loss: 0.34990165425372954
Epoch: 25, step: 1389, loss: 0.32406434416770935, mean loss: 0.34990096507501295
Epoch: 25, step: 1390, loss: 0.34150031208992004, mean loss: 0.3499007410038229
Epoch: 25, step: 1391, loss: 0.29900607466697693, mean loss: 0.3498993835231247
Epoch: 25, step: 1392, loss: 0.31118565797805786, mean loss: 0.3498983509643659
Epoch: 25, step: 1393, loss: 0.31919345259666443, mean loss: 0.34989753203604756
Epoch: 25, step: 1394, loss: 0.3166821300983429, mean loss: 0.34989664617388094
Epoch: 25, step: 1395, loss: 0.3105839490890503, mean loss: 0.3498955977234573
Epoch: 25, step: 1396, loss: 0.38169223070144653, mean loss: 0.3498964457015083
Epoch: 25, step: 1397, loss: 0.320626825094223, mean loss: 0.349895665136662
Epoch: 25, step: 1398, loss: 0.2982773780822754, mean loss: 0.3498942886122999
Epoch: 25, step: 1399, loss: 0.31013065576553345, mean loss: 0.3498932282487573
Epoch: 25, step: 1400, loss: 0.3518688678741455, mean loss: 0.3498932809310758
Epoch: 25, step: 1401, loss: 0.3223501145839691, mean loss: 0.3498925464858103
Epoch: 25, step: 1402, loss: 0.3517208993434906, mean loss: 0.3498925952379863
Epoch: 25, step: 1403, loss: 0.3569856286048889, mean loss: 0.3498927843653692
Epoch: 25, step: 1404, loss: 0.34043675661087036, mean loss: 0.349892532238246
Epoch: 25, step: 1405, loss: 0.32991352677345276, mean loss: 0.34989199954999706
Epoch: 25, step: 1406, loss: 0.3226429522037506, mean loss: 0.34989127304434886
Epoch: 25, step: 1407, loss: 0.31875091791152954, mean loss: 0.3498904428119949
Epoch: 25, step: 1408, loss: 0.33027711510658264, mean loss: 0.3498899199154179
Epoch: 25, step: 1409, loss: 0.3445976674556732, mean loss: 0.3498897788263094
Epoch: 25, step: 1410, loss: 0.29240497946739197, mean loss: 0.3498882463478535
Epoch: 25, step: 1411, loss: 0.3424298167228699, mean loss: 0.3498880475200217
Epoch: 25, step: 1412, loss: 0.33536165952682495, mean loss: 0.3498876602839171
Epoch: 25, step: 1413, loss: 0.33871889114379883, mean loss: 0.34988736256122316
Epoch: 25, step: 1414, loss: 0.3322985768318176, mean loss: 0.34988689371447573
Epoch: 25, step: 1415, loss: 0.3608089089393616, mean loss: 0.3498871848439998
Epoch: 25, step: 1416, loss: 0.3054393231868744, mean loss: 0.3498860001047707
Epoch: 25, step: 1417, loss: 0.37112849950790405, mean loss: 0.3498865662996479
Epoch: 25, step: 1418, loss: 0.34155240654945374, mean loss: 0.3498863441679347
Epoch: 25, step: 1419, loss: 0.33174654841423035, mean loss: 0.3498858606978986
Epoch: 25, step: 1420, loss: 0.31943178176879883, mean loss: 0.34988504904365353
Epoch: 25, step: 1421, loss: 0.3422193229198456, mean loss: 0.34988484474414594
Epoch: 25, step: 1422, loss: 0.30548936128616333, mean loss: 0.3498836615902548
Epoch: 25, step: 1423, loss: 0.32814866304397583, mean loss: 0.3498830823610003
Epoch: 25, step: 1424, loss: 0.3444235920906067, mean loss: 0.349882936871586
Epoch: 25, step: 1425, loss: 0.332380473613739, mean loss: 0.34988247046260934
Epoch: 25, step: 1426, loss: 0.32049351930618286, mean loss: 0.349881687321107
Epoch: 25, step: 1427, loss: 0.30644741654396057, mean loss: 0.3498805299380656
Epoch: 25, step: 1428, loss: 0.34036704897880554, mean loss: 0.34988027644127756
Epoch: 25, step: 1429, loss: 0.34154239296913147, mean loss: 0.349880054275451
Epoch: 25, step: 1430, loss: 0.3058857023715973, mean loss: 0.34987888206176354
Epoch: 25, step: 1431, loss: 0.3438222110271454, mean loss: 0.34987872068824133
Epoch: 25, step: 1432, loss: 0.29476016759872437, mean loss: 0.3498772521524704
Epoch: 25, step: 1433, loss: 0.3183532655239105, mean loss: 0.3498764122743165
Epoch: 25, step: 1434, loss: 0.327944815158844, mean loss: 0.34987582797707084
Epoch: 25, step: 1435, loss: 0.3737397789955139, mean loss: 0.3498764637387668
Epoch: 25, step: 1436, loss: 0.31053707003593445, mean loss: 0.34987541572231096
Epoch: 25, step: 1437, loss: 0.3498605191707611, mean loss: 0.34987541532547173
Epoch: 25, step: 1438, loss: 0.3299923241138458, mean loss: 0.3498748856605576
Epoch: 25, step: 1439, loss: 0.3043568730354309, mean loss: 0.3498736731402426
Epoch: 25, step: 1440, loss: 0.3536962568759918, mean loss: 0.349873774964481
Epoch: 25, step: 1441, loss: 0.3316783905029297, mean loss: 0.3498732902970562
Epoch: 25, step: 1442, loss: 0.3399270176887512, mean loss: 0.34987302536690656
Epoch: 25, step: 1443, loss: 0.29083451628685, mean loss: 0.34987145285174887
Valid: 25, mean loss: 0.18690243363380432
Epoch: 26, step: 0, loss: 0.31485435366630554, mean loss: 0.3498705201816414
Epoch: 26, step: 1, loss: 0.3072688579559326, mean loss: 0.34986938552915575
Epoch: 26, step: 2, loss: 0.318581759929657, mean loss: 0.3498685522368661
Epoch: 26, step: 3, loss: 0.35378843545913696, mean loss: 0.34986865663345773
Epoch: 26, step: 4, loss: 0.3110911548137665, mean loss: 0.34986762391615983
Epoch: 26, step: 5, loss: 0.3388742506504059, mean loss: 0.34986733114989443
Epoch: 26, step: 6, loss: 0.33346518874168396, mean loss: 0.34986689435347335
Epoch: 26, step: 7, loss: 0.36161887645721436, mean loss: 0.34986720730570237
Epoch: 26, step: 8, loss: 0.35492172837257385, mean loss: 0.3498673419027004
Epoch: 26, step: 9, loss: 0.3124012351036072, mean loss: 0.34986634424314883
Epoch: 26, step: 10, loss: 0.32741132378578186, mean loss: 0.3498657463195579
Epoch: 26, step: 11, loss: 0.36317500472068787, mean loss: 0.34986610070390134
Epoch: 26, step: 12, loss: 0.36417052149772644, mean loss: 0.3498664815761966
Epoch: 26, step: 13, loss: 0.38255971670150757, mean loss: 0.34986735204946795
Epoch: 26, step: 14, loss: 0.3121121823787689, mean loss: 0.3498663468264942
Epoch: 26, step: 15, loss: 0.3372366726398468, mean loss: 0.34986601057318784
Epoch: 26, step: 16, loss: 0.40619173645973206, mean loss: 0.3498675101532279
Epoch: 26, step: 17, loss: 0.318363755941391, mean loss: 0.3498666714397885
Epoch: 26, step: 18, loss: 0.3037884533405304, mean loss: 0.3498654447481478
Epoch: 26, step: 19, loss: 0.36607158184051514, mean loss: 0.3498658761755009
Epoch: 26, step: 20, loss: 0.317822128534317, mean loss: 0.3498650231541342
Epoch: 26, step: 21, loss: 0.3366406261920929, mean loss: 0.34986467112312314
Epoch: 26, step: 22, loss: 0.2992664575576782, mean loss: 0.34986332424385236
Epoch: 26, step: 23, loss: 0.3282327950000763, mean loss: 0.3498627484738022
Epoch: 26, step: 24, loss: 0.32294538617134094, mean loss: 0.3498620319957937
Epoch: 26, step: 25, loss: 0.32278570532798767, mean loss: 0.349861311305704
Epoch: 26, step: 26, loss: 0.3663889467716217, mean loss: 0.34986175120976476
Epoch: 26, step: 27, loss: 0.33953598141670227, mean loss: 0.3498614763835699
Epoch: 26, step: 28, loss: 0.3373333513736725, mean loss: 0.34986114294932164
Epoch: 26, step: 29, loss: 0.3583453893661499, mean loss: 0.34986136875031215
Epoch: 26, step: 30, loss: 0.3452242612838745, mean loss: 0.3498612453409318
Epoch: 26, step: 31, loss: 0.3111365735530853, mean loss: 0.3498602147716379
Epoch: 26, step: 32, loss: 0.3883778750896454, mean loss: 0.3498612398045122
Epoch: 26, step: 33, loss: 0.34530124068260193, mean loss: 0.34986111845693857
Epoch: 26, step: 34, loss: 0.3308963477611542, mean loss: 0.34986061379287897
Epoch: 26, step: 35, loss: 0.3611380159854889, mean loss: 0.34986091388341095
Epoch: 26, step: 36, loss: 0.37165093421936035, mean loss: 0.34986149369821995
Epoch: 26, step: 37, loss: 0.3253561854362488, mean loss: 0.34986084164914694
Epoch: 26, step: 38, loss: 0.2948414087295532, mean loss: 0.3498593777044666
Epoch: 26, step: 39, loss: 0.2956632673740387, mean loss: 0.3498579357049368
Epoch: 26, step: 40, loss: 0.3453560769557953, mean loss: 0.3498578159268671
Epoch: 26, step: 41, loss: 0.3326711654663086, mean loss: 0.3498573586648424
Epoch: 26, step: 42, loss: 0.35198163986206055, mean loss: 0.349857415181223
Epoch: 26, step: 43, loss: 0.35487890243530273, mean loss: 0.3498575487740519
Epoch: 26, step: 44, loss: 0.3385903537273407, mean loss: 0.34985724902691717
Epoch: 26, step: 45, loss: 0.3585832118988037, mean loss: 0.3498574811621359
Epoch: 26, step: 46, loss: 0.37517645955085754, mean loss: 0.34985815470043996
Epoch: 26, step: 47, loss: 0.3194062113761902, mean loss: 0.3498573446359761
Epoch: 26, step: 48, loss: 0.34566089510917664, mean loss: 0.34985723300749405
Epoch: 26, step: 49, loss: 0.3430427014827728, mean loss: 0.349857051741028
Epoch: 26, step: 50, loss: 0.31914135813713074, mean loss: 0.34985623472563754
Epoch: 26, step: 51, loss: 0.3299033045768738, mean loss: 0.34985570400614213
Epoch: 26, step: 52, loss: 0.3246193528175354, mean loss: 0.3498550327730334
Epoch: 26, step: 53, loss: 0.34549975395202637, mean loss: 0.34985491693498827
Epoch: 26, step: 54, loss: 0.34078624844551086, mean loss: 0.34985467574058177
Epoch: 26, step: 55, loss: 0.3906708061695099, mean loss: 0.3498557612759655
Epoch: 26, step: 56, loss: 0.32786574959754944, mean loss: 0.34985517645078323
Epoch: 26, step: 57, loss: 0.3288425803184509, mean loss: 0.3498546176348657
Epoch: 26, step: 58, loss: 0.3583987057209015, mean loss: 0.34985484485312185
Epoch: 26, step: 59, loss: 0.3239166736602783, mean loss: 0.3498541550815233
Epoch: 26, step: 60, loss: 0.3202689588069916, mean loss: 0.34985336834581593
Epoch: 26, step: 61, loss: 0.35718849301338196, mean loss: 0.3498535633977935
Epoch: 26, step: 62, loss: 0.3014734983444214, mean loss: 0.349852276933437
Epoch: 26, step: 63, loss: 0.32045993208885193, mean loss: 0.34985149538842414
Epoch: 26, step: 64, loss: 0.31303685903549194, mean loss: 0.34985051651006116
Epoch: 26, step: 65, loss: 0.36815470457077026, mean loss: 0.34985100319413615
Epoch: 26, step: 66, loss: 0.34265610575675964, mean loss: 0.3498508118964456
Epoch: 26, step: 67, loss: 0.3902778625488281, mean loss: 0.3498518867409275
Epoch: 26, step: 68, loss: 0.3235706686973572, mean loss: 0.34985118801394366
Epoch: 26, step: 69, loss: 0.3300347626209259, mean loss: 0.3498506611775159
Epoch: 26, step: 70, loss: 0.36510607600212097, mean loss: 0.3498510667448381
Epoch: 26, step: 71, loss: 0.3411656320095062, mean loss: 0.34985083584748766
Epoch: 26, step: 72, loss: 0.3271721601486206, mean loss: 0.34985023296379947
Epoch: 26, step: 73, loss: 0.31681302189826965, mean loss: 0.3498493547349977
Epoch: 26, step: 74, loss: 0.3153603971004486, mean loss: 0.3498484379387608
Epoch: 26, step: 75, loss: 0.3196454644203186, mean loss: 0.3498476350952329
Epoch: 26, step: 76, loss: 0.33816397190093994, mean loss: 0.349847324532962
Epoch: 26, step: 77, loss: 0.32751238346099854, mean loss: 0.34984673086593016
Epoch: 26, step: 78, loss: 0.3487151563167572, mean loss: 0.34984670078926033
Epoch: 26, step: 79, loss: 0.3429965376853943, mean loss: 0.34984651872028566
Epoch: 26, step: 80, loss: 0.3254678249359131, mean loss: 0.3498458707815804
Epoch: 26, step: 81, loss: 0.3415014147758484, mean loss: 0.3498456490079131
Epoch: 26, step: 82, loss: 0.3423383831977844, mean loss: 0.3498454494898593
Epoch: 26, step: 83, loss: 0.3269587755203247, mean loss: 0.3498448412546629
Epoch: 26, step: 84, loss: 0.3268304765224457, mean loss: 0.3498442296422169
Epoch: 26, step: 85, loss: 0.355754554271698, mean loss: 0.34984438670638457
Epoch: 26, step: 86, loss: 0.3629648983478546, mean loss: 0.3498447353687013
Epoch: 26, step: 87, loss: 0.33141082525253296, mean loss: 0.3498442455220252
Epoch: 26, step: 88, loss: 0.35588863492012024, mean loss: 0.3498444061360979
Epoch: 26, step: 89, loss: 0.3081551492214203, mean loss: 0.34984329838095857
Epoch: 26, step: 90, loss: 0.3206979036331177, mean loss: 0.34984252395835336
Epoch: 26, step: 91, loss: 0.3044987916946411, mean loss: 0.34984131916155603
Epoch: 26, step: 92, loss: 0.29794245958328247, mean loss: 0.34983994022966514
Epoch: 26, step: 93, loss: 0.35427746176719666, mean loss: 0.34984005812970065
Epoch: 26, step: 94, loss: 0.35087618231773376, mean loss: 0.3498400856576421
Epoch: 26, step: 95, loss: 0.38326653838157654, mean loss: 0.34984097371430317
Epoch: 26, step: 96, loss: 0.337578147649765, mean loss: 0.349840647930555
Epoch: 26, step: 97, loss: 0.35042804479599, mean loss: 0.3498406635353812
Epoch: 26, step: 98, loss: 0.34212827682495117, mean loss: 0.3498404586530203
Epoch: 26, step: 99, loss: 0.31027480959892273, mean loss: 0.34983940760506965
Epoch: 26, step: 100, loss: 0.3339363634586334, mean loss: 0.3498389851573569
Epoch: 26, step: 101, loss: 0.32972222566604614, mean loss: 0.34983845079090387
Epoch: 26, step: 102, loss: 0.2913874387741089, mean loss: 0.34983689818347125
Epoch: 26, step: 103, loss: 0.3090629577636719, mean loss: 0.34983581515275464
Epoch: 26, step: 104, loss: 0.3192163109779358, mean loss: 0.3498350018641102
Epoch: 26, step: 105, loss: 0.31554362177848816, mean loss: 0.3498340910704824
Epoch: 26, step: 106, loss: 0.4128850996494293, mean loss: 0.3498357656875863
Epoch: 26, step: 107, loss: 0.32565072178840637, mean loss: 0.34983512335666367
Epoch: 26, step: 108, loss: 0.3382127583026886, mean loss: 0.34983481468630395
Epoch: 26, step: 109, loss: 0.3150136172771454, mean loss: 0.3498338899187518
Epoch: 26, step: 110, loss: 0.3000279664993286, mean loss: 0.34983256722791606
Epoch: 26, step: 111, loss: 0.31519272923469543, mean loss: 0.34983164732569616
Epoch: 26, step: 112, loss: 0.32816168665885925, mean loss: 0.3498310718693224
Epoch: 26, step: 113, loss: 0.33703234791755676, mean loss: 0.3498307320019914
Epoch: 26, step: 114, loss: 0.33569931983947754, mean loss: 0.3498303567553794
Epoch: 26, step: 115, loss: 0.3594741225242615, mean loss: 0.349830612829882
Epoch: 26, step: 116, loss: 0.32150739431381226, mean loss: 0.34982986077288625
Epoch: 26, step: 117, loss: 0.31339073181152344, mean loss: 0.3498288932425118
Epoch: 26, step: 118, loss: 0.3395366072654724, mean loss: 0.34982861996937964
Epoch: 26, step: 119, loss: 0.3202689290046692, mean loss: 0.34982783514326016
Epoch: 26, step: 120, loss: 0.30296605825424194, mean loss: 0.34982659097023777
Epoch: 26, step: 121, loss: 0.3175646960735321, mean loss: 0.349825734444594
Epoch: 26, step: 122, loss: 0.301902174949646, mean loss: 0.349824462148964
Epoch: 26, step: 123, loss: 0.3188295364379883, mean loss: 0.3498236393039573
Epoch: 26, step: 124, loss: 0.36581146717071533, mean loss: 0.34982406373327235
Epoch: 26, step: 125, loss: 0.37624579668045044, mean loss: 0.3498247651331382
Epoch: 26, step: 126, loss: 0.3212403655052185, mean loss: 0.34982400634256644
Epoch: 26, step: 127, loss: 0.33214810490608215, mean loss: 0.34982353713728304
Epoch: 26, step: 128, loss: 0.31100568175315857, mean loss: 0.349822506748002
Epoch: 26, step: 129, loss: 0.33407360315322876, mean loss: 0.3498220887169038
Epoch: 26, step: 130, loss: 0.3285283148288727, mean loss: 0.3498215235205166
Epoch: 26, step: 131, loss: 0.3175170123577118, mean loss: 0.3498206660910877
Epoch: 26, step: 132, loss: 0.3102775812149048, mean loss: 0.3498196165625988
Epoch: 26, step: 133, loss: 0.3175627291202545, mean loss: 0.3498187604426497
Epoch: 26, step: 134, loss: 0.40499770641326904, mean loss: 0.34982022489090925
Epoch: 26, step: 135, loss: 0.3302646279335022, mean loss: 0.3498197058994826
Epoch: 26, step: 136, loss: 0.4022766947746277, mean loss: 0.3498210980331541
Epoch: 26, step: 137, loss: 0.3230932950973511, mean loss: 0.3498203887342067
Epoch: 26, step: 138, loss: 0.31555747985839844, mean loss: 0.34981947949373016
Epoch: 26, step: 139, loss: 0.3495802879333496, mean loss: 0.34981947314643264
Epoch: 26, step: 140, loss: 0.3237649202346802, mean loss: 0.3498187817691496
Epoch: 26, step: 141, loss: 0.3149319887161255, mean loss: 0.34981785604625376
Epoch: 26, step: 142, loss: 0.3100823163986206, mean loss: 0.3498168016895884
Epoch: 26, step: 143, loss: 0.3348868191242218, mean loss: 0.3498164055427362
Epoch: 26, step: 144, loss: 0.36904245615005493, mean loss: 0.3498169156663958
Epoch: 26, step: 145, loss: 0.3428897559642792, mean loss: 0.3498167318733551
Epoch: 26, step: 146, loss: 0.311359703540802, mean loss: 0.34981571154944935
Epoch: 26, step: 147, loss: 0.3226155638694763, mean loss: 0.3498149899069873
Epoch: 26, step: 148, loss: 0.3150300681591034, mean loss: 0.3498140670586667
Epoch: 26, step: 149, loss: 0.29987195134162903, mean loss: 0.3498127421232468
Epoch: 26, step: 150, loss: 0.31428730487823486, mean loss: 0.34981179967896386
Epoch: 26, step: 151, loss: 0.3952939212322235, mean loss: 0.34981300622930217
Epoch: 26, step: 152, loss: 0.34289729595184326, mean loss: 0.3498128227741127
Epoch: 26, step: 153, loss: 0.36853981018066406, mean loss: 0.3498133195375327
Epoch: 26, step: 154, loss: 0.3549097180366516, mean loss: 0.34981345472410263
Epoch: 26, step: 155, loss: 0.3569850027561188, mean loss: 0.3498136449508409
Epoch: 26, step: 156, loss: 0.3319510519504547, mean loss: 0.3498131711545755
Epoch: 26, step: 157, loss: 0.3223129212856293, mean loss: 0.3498124417436724
Epoch: 26, step: 158, loss: 0.3348459303379059, mean loss: 0.3498120447855681
Epoch: 26, step: 159, loss: 0.38639599084854126, mean loss: 0.3498130150790665
Epoch: 26, step: 160, loss: 0.32319116592407227, mean loss: 0.3498123090228629
Epoch: 26, step: 161, loss: 0.3244948983192444, mean loss: 0.34981163758036826
Epoch: 26, step: 162, loss: 0.28427040576934814, mean loss: 0.3498098994088932
Epoch: 26, step: 163, loss: 0.3180840313434601, mean loss: 0.3498090580524684
Epoch: 26, step: 164, loss: 0.3307010531425476, mean loss: 0.34980855132980515
Epoch: 26, step: 165, loss: 0.3411381244659424, mean loss: 0.34980832140599544
Epoch: 26, step: 166, loss: 0.3141699731349945, mean loss: 0.3498073763674584
Epoch: 26, step: 167, loss: 0.3345634937286377, mean loss: 0.34980697214910245
Epoch: 26, step: 168, loss: 0.33806291222572327, mean loss: 0.3498066607429581
Epoch: 26, step: 169, loss: 0.338727205991745, mean loss: 0.34980636696731104
Epoch: 26, step: 170, loss: 0.33048325777053833, mean loss: 0.34980585462184643
Epoch: 26, step: 171, loss: 0.3033566474914551, mean loss: 0.3498046230700612
Epoch: 26, step: 172, loss: 0.31033840775489807, mean loss: 0.34980357669268985
Epoch: 26, step: 173, loss: 0.34503722190856934, mean loss: 0.34980345032451593
Epoch: 26, step: 174, loss: 0.30583274364471436, mean loss: 0.3498022845802841
Epoch: 26, step: 175, loss: 0.31994208693504333, mean loss: 0.34980149295256285
Epoch: 26, step: 176, loss: 0.31933271884918213, mean loss: 0.34980068521220326
Epoch: 26, step: 177, loss: 0.31638580560684204, mean loss: 0.349799799392798
Epoch: 26, step: 178, loss: 0.3877749443054199, mean loss: 0.3498008060769141
Epoch: 26, step: 179, loss: 0.33394038677215576, mean loss: 0.3498003856437865
Epoch: 26, step: 180, loss: 0.30229708552360535, mean loss: 0.3497991264443135
Epoch: 26, step: 181, loss: 0.2979464828968048, mean loss: 0.34979775199052704
Epoch: 26, step: 182, loss: 0.32697242498397827, mean loss: 0.3497971469774858
Epoch: 26, step: 183, loss: 0.2835826575756073, mean loss: 0.3497953919284665
Epoch: 26, step: 184, loss: 0.31679850816726685, mean loss: 0.34979451735231126
Epoch: 26, step: 185, loss: 0.32909491658210754, mean loss: 0.34979396872785407
Epoch: 26, step: 186, loss: 0.28636279702186584, mean loss: 0.3497922875857771
Epoch: 26, step: 187, loss: 0.36699995398521423, mean loss: 0.3497927436354537
Epoch: 26, step: 188, loss: 0.3388897180557251, mean loss: 0.34979245468346
Epoch: 26, step: 189, loss: 0.33910703659057617, mean loss: 0.34979217150600483
Epoch: 26, step: 190, loss: 0.40387895703315735, mean loss: 0.34979360483807126
Epoch: 26, step: 191, loss: 0.3203830122947693, mean loss: 0.34979282546048635
Epoch: 26, step: 192, loss: 0.31738919019699097, mean loss: 0.3497919667903413
Epoch: 26, step: 193, loss: 0.3609258532524109, mean loss: 0.3497922618215158
Epoch: 26, step: 194, loss: 0.35853898525238037, mean loss: 0.34979249359033404
Epoch: 26, step: 195, loss: 0.37331217527389526, mean loss: 0.34979311679334635
Epoch: 26, step: 196, loss: 0.36315205693244934, mean loss: 0.349793470756944
Epoch: 26, step: 197, loss: 0.34142065048217773, mean loss: 0.3497932489133672
Epoch: 26, step: 198, loss: 0.3458207845687866, mean loss: 0.349793143663007
Epoch: 26, step: 199, loss: 0.296379417181015, mean loss: 0.3497917285049294
Epoch: 26, step: 200, loss: 0.30039021372795105, mean loss: 0.34979041968217733
Epoch: 26, step: 201, loss: 0.3679804801940918, mean loss: 0.34979090158914794
Epoch: 26, step: 202, loss: 0.30505940318107605, mean loss: 0.3497897165546178
Epoch: 26, step: 203, loss: 0.3283824920654297, mean loss: 0.3497891494457779
Epoch: 26, step: 204, loss: 0.3314996659755707, mean loss: 0.349788664943315
Epoch: 26, step: 205, loss: 0.3870840072631836, mean loss: 0.34978965289940295
Epoch: 26, step: 206, loss: 0.31627383828163147, mean loss: 0.34978876508677237
Epoch: 26, step: 207, loss: 0.37335169315338135, mean loss: 0.34978938923722974
Epoch: 26, step: 208, loss: 0.3292296826839447, mean loss: 0.3497888446525198
Epoch: 26, step: 209, loss: 0.3502020239830017, mean loss: 0.349788855596508
Epoch: 26, step: 210, loss: 0.35519513487815857, mean loss: 0.34978899879023817
Epoch: 26, step: 211, loss: 0.29929694533348083, mean loss: 0.34978766146495327
Epoch: 26, step: 212, loss: 0.3559481203556061, mean loss: 0.34978782462566227
Epoch: 26, step: 213, loss: 0.31539005041122437, mean loss: 0.3497869136194063
Epoch: 26, step: 214, loss: 0.37415561079978943, mean loss: 0.34978755899394426
Epoch: 26, step: 215, loss: 0.2967994511127472, mean loss: 0.3497861557071889
Epoch: 26, step: 216, loss: 0.3166272044181824, mean loss: 0.34978527758025135
Epoch: 26, step: 217, loss: 0.33285489678382874, mean loss: 0.3497848292358629
Epoch: 26, step: 218, loss: 0.32812777161598206, mean loss: 0.3497842557364688
Epoch: 26, step: 219, loss: 0.3420758843421936, mean loss: 0.34978405161690007
Epoch: 26, step: 220, loss: 0.34567150473594666, mean loss: 0.3497839427185317
Epoch: 26, step: 221, loss: 0.3241807520389557, mean loss: 0.349783264775655
Epoch: 26, step: 222, loss: 0.3471040427684784, mean loss: 0.3497831938348335
Epoch: 26, step: 223, loss: 0.3138921558856964, mean loss: 0.34978224353198584
Epoch: 26, step: 224, loss: 0.3332023322582245, mean loss: 0.34978180454998276
Epoch: 26, step: 225, loss: 0.3221832811832428, mean loss: 0.34978107385039664
Epoch: 26, step: 226, loss: 0.3654288351535797, mean loss: 0.34978148813016957
Epoch: 26, step: 227, loss: 0.3372402489185333, mean loss: 0.34978115610541016
Epoch: 26, step: 228, loss: 0.3253231942653656, mean loss: 0.3497805086068837
Epoch: 26, step: 229, loss: 0.35575249791145325, mean loss: 0.3497806667047633
Epoch: 26, step: 230, loss: 0.3573682904243469, mean loss: 0.3497808675683959
Epoch: 26, step: 231, loss: 0.3413473963737488, mean loss: 0.3497806443189466
Epoch: 26, step: 232, loss: 0.3370053768157959, mean loss: 0.3497803061431385
Epoch: 26, step: 233, loss: 0.28988951444625854, mean loss: 0.3497787208079779
Epoch: 26, step: 234, loss: 0.36210423707962036, mean loss: 0.34977904706108864
Epoch: 26, step: 235, loss: 0.3276785612106323, mean loss: 0.3497784620826384
Epoch: 26, step: 236, loss: 0.34480810165405273, mean loss: 0.3497783305254952
Epoch: 26, step: 237, loss: 0.33329835534095764, mean loss: 0.3497778943396081
Epoch: 26, step: 238, loss: 0.34800809621810913, mean loss: 0.34977784749848584
Epoch: 26, step: 239, loss: 0.3907988965511322, mean loss: 0.34977893317096764
Epoch: 26, step: 240, loss: 0.36569374799728394, mean loss: 0.3497793543649554
Epoch: 26, step: 241, loss: 0.30628982186317444, mean loss: 0.3497782034219473
Epoch: 26, step: 242, loss: 0.2900393009185791, mean loss: 0.3497766224839924
Epoch: 26, step: 243, loss: 0.3182653784751892, mean loss: 0.34977578858846975
Epoch: 26, step: 244, loss: 0.3196711540222168, mean loss: 0.3497749919377363
Epoch: 26, step: 245, loss: 0.33219850063323975, mean loss: 0.349774526828149
Epoch: 26, step: 246, loss: 0.3414262533187866, mean loss: 0.34977430592175573
Epoch: 26, step: 247, loss: 0.2952599823474884, mean loss: 0.349772863438596
Epoch: 26, step: 248, loss: 0.3072490394115448, mean loss: 0.3497717382613402
Epoch: 26, step: 249, loss: 0.3196937143802643, mean loss: 0.3497709424200987
Epoch: 26, step: 250, loss: 0.30626964569091797, mean loss: 0.34976979143989684
Epoch: 26, step: 251, loss: 0.31181809306144714, mean loss: 0.3497687873204562
Epoch: 26, step: 252, loss: 0.30433517694473267, mean loss: 0.34976758527769153
Epoch: 26, step: 253, loss: 0.3414686322212219, mean loss: 0.3497673657170519
Epoch: 26, step: 254, loss: 0.27257391810417175, mean loss: 0.34976532350832645
Epoch: 26, step: 255, loss: 0.346116304397583, mean loss: 0.3497652269734293
Epoch: 26, step: 256, loss: 0.2989041209220886, mean loss: 0.34976388147711834
Epoch: 26, step: 257, loss: 0.3190920352935791, mean loss: 0.34976307009554636
Epoch: 26, step: 258, loss: 0.35332944989204407, mean loss: 0.34976316443673083
Epoch: 26, step: 259, loss: 0.30272895097732544, mean loss: 0.3497619202770266
Epoch: 26, step: 260, loss: 0.3211774230003357, mean loss: 0.34976116417340863
Epoch: 26, step: 261, loss: 0.31016814708709717, mean loss: 0.3497601169053272
Epoch: 26, step: 262, loss: 0.3358120024204254, mean loss: 0.34975974797590975
Epoch: 26, step: 263, loss: 0.34046074748039246, mean loss: 0.3497595020226592
Epoch: 26, step: 264, loss: 0.3715379238128662, mean loss: 0.3497600780342382
Epoch: 26, step: 265, loss: 0.33019179105758667, mean loss: 0.3497595604916046
Epoch: 26, step: 266, loss: 0.38320374488830566, mean loss: 0.3497604450009907
Epoch: 26, step: 267, loss: 0.3327140510082245, mean loss: 0.349759994181304
Epoch: 26, step: 268, loss: 0.3152300715446472, mean loss: 0.34975908100534236
Epoch: 26, step: 269, loss: 0.3206968903541565, mean loss: 0.3497583124489704
Epoch: 26, step: 270, loss: 0.39588436484336853, mean loss: 0.3497595322308663
Epoch: 26, step: 271, loss: 0.31469568610191345, mean loss: 0.3497586050083645
Epoch: 26, step: 272, loss: 0.3328830897808075, mean loss: 0.3497581587668533
Epoch: 26, step: 273, loss: 0.352187842130661, mean loss: 0.34975822301359727
Epoch: 26, step: 274, loss: 0.35262972116470337, mean loss: 0.34975829894099225
Epoch: 26, step: 275, loss: 0.3154948055744171, mean loss: 0.34975739297871394
Epoch: 26, step: 276, loss: 0.33467093110084534, mean loss: 0.34975699408757205
Epoch: 26, step: 277, loss: 0.3558671176433563, mean loss: 0.34975715563702886
Epoch: 26, step: 278, loss: 0.3385741114616394, mean loss: 0.3497568599692031
Epoch: 26, step: 279, loss: 0.36014407873153687, mean loss: 0.34975713458898844
Epoch: 26, step: 280, loss: 0.3260398805141449, mean loss: 0.3497565075631041
Epoch: 26, step: 281, loss: 0.32940664887428284, mean loss: 0.3497559695770974
Epoch: 26, step: 282, loss: 0.3151135742664337, mean loss: 0.349755053765764
Epoch: 26, step: 283, loss: 0.3063098192214966, mean loss: 0.34975390527167116
Epoch: 26, step: 284, loss: 0.38214728236198425, mean loss: 0.34975476158236113
Epoch: 26, step: 285, loss: 0.32171010971069336, mean loss: 0.349754020248714
Epoch: 26, step: 286, loss: 0.3555910885334015, mean loss: 0.3497541745419731
Epoch: 26, step: 287, loss: 0.33246085047721863, mean loss: 0.3497537174335975
Epoch: 26, step: 288, loss: 0.2979191839694977, mean loss: 0.3497523473457519
Epoch: 26, step: 289, loss: 0.3283980190753937, mean loss: 0.3497517829241134
Epoch: 26, step: 290, loss: 0.33744117617607117, mean loss: 0.34975145754796044
Epoch: 26, step: 291, loss: 0.3286895155906677, mean loss: 0.34975090088388505
Epoch: 26, step: 292, loss: 0.3179730176925659, mean loss: 0.34975006102123235
Epoch: 26, step: 293, loss: 0.37361764907836914, mean loss: 0.3497506918047848
Epoch: 26, step: 294, loss: 0.31078678369522095, mean loss: 0.34974966207598357
Epoch: 26, step: 295, loss: 0.37141865491867065, mean loss: 0.34975023472378597
Epoch: 26, step: 296, loss: 0.3225402534008026, mean loss: 0.34974951566294393
Epoch: 26, step: 297, loss: 0.3442142903804779, mean loss: 0.3497493693909371
Epoch: 26, step: 298, loss: 0.3020813763141632, mean loss: 0.34974810976582604
Epoch: 26, step: 299, loss: 0.32319551706314087, mean loss: 0.3497474081329991
Epoch: 26, step: 300, loss: 0.4196711480617523, mean loss: 0.34974925576782345
Epoch: 26, step: 301, loss: 0.3271680474281311, mean loss: 0.34974865910745406
Epoch: 26, step: 302, loss: 0.3559703230857849, mean loss: 0.3497488234973391
Epoch: 26, step: 303, loss: 0.35391926765441895, mean loss: 0.3497489336866267
Epoch: 26, step: 304, loss: 0.32118746638298035, mean loss: 0.34974817907045974
Epoch: 26, step: 305, loss: 0.3151884078979492, mean loss: 0.34974726599856615
Epoch: 26, step: 306, loss: 0.3249925971031189, mean loss: 0.3497466119955307
Epoch: 26, step: 307, loss: 0.3261328935623169, mean loss: 0.34974598815218205
Epoch: 26, step: 308, loss: 0.37364324927330017, mean loss: 0.3497466194696766
Epoch: 26, step: 309, loss: 0.3188859224319458, mean loss: 0.3497458042137713
Epoch: 26, step: 310, loss: 0.3076823055744171, mean loss: 0.3497446930395899
Epoch: 26, step: 311, loss: 0.3134206235408783, mean loss: 0.34974373350690025
Epoch: 26, step: 312, loss: 0.3498283624649048, mean loss: 0.3497437357423906
Epoch: 26, step: 313, loss: 0.32546746730804443, mean loss: 0.3497430944969884
Epoch: 26, step: 314, loss: 0.3767505884170532, mean loss: 0.34974380786749265
Epoch: 26, step: 315, loss: 0.3396346867084503, mean loss: 0.34974354085425546
Epoch: 26, step: 316, loss: 0.3352222442626953, mean loss: 0.34974315731191397
Epoch: 26, step: 317, loss: 0.33517515659332275, mean loss: 0.3497427725461668
Epoch: 26, step: 318, loss: 0.30550459027290344, mean loss: 0.3497416041711761
Epoch: 26, step: 319, loss: 0.3153487741947174, mean loss: 0.34974069584585454
Epoch: 26, step: 320, loss: 0.31768080592155457, mean loss: 0.34973984915656564
Epoch: 26, step: 321, loss: 0.3424496650695801, mean loss: 0.349739656630709
Epoch: 26, step: 322, loss: 0.3098095953464508, mean loss: 0.3497386021489364
Epoch: 26, step: 323, loss: 0.32318225502967834, mean loss: 0.3497379008616458
Epoch: 26, step: 324, loss: 0.2904629707336426, mean loss: 0.34973633559902656
Epoch: 26, step: 325, loss: 0.3470763564109802, mean loss: 0.3497362653592804
Epoch: 26, step: 326, loss: 0.3443114757537842, mean loss: 0.34973612211538385
Epoch: 26, step: 327, loss: 0.3153409957885742, mean loss: 0.34973521392130047
Epoch: 26, step: 328, loss: 0.30519506335258484, mean loss: 0.3497340378816266
Epoch: 26, step: 329, loss: 0.3442595899105072, mean loss: 0.34973389333792987
Epoch: 26, step: 330, loss: 0.3213481605052948, mean loss: 0.3497331438796373
Epoch: 26, step: 331, loss: 0.3414044976234436, mean loss: 0.349732923987192
Epoch: 26, step: 332, loss: 0.3419419229030609, mean loss: 0.34973271829505476
Epoch: 26, step: 333, loss: 0.3182560205459595, mean loss: 0.34973188729294935
Epoch: 26, step: 334, loss: 0.3664262592792511, mean loss: 0.3497323280219017
Epoch: 26, step: 335, loss: 0.3413631319999695, mean loss: 0.34973210708219676
Epoch: 26, step: 336, loss: 0.28308799862861633, mean loss: 0.3497303477804768
Epoch: 26, step: 337, loss: 0.34400081634521484, mean loss: 0.34973019653367265
Epoch: 26, step: 338, loss: 0.30532893538475037, mean loss: 0.34972902447071175
Epoch: 26, step: 339, loss: 0.3195638060569763, mean loss: 0.3497282282185099
Epoch: 26, step: 340, loss: 0.3373117446899414, mean loss: 0.34972790047709434
Epoch: 26, step: 341, loss: 0.34232640266418457, mean loss: 0.3497277051147491
Epoch: 26, step: 342, loss: 0.3240513801574707, mean loss: 0.3497270274066973
Epoch: 26, step: 343, loss: 0.3486004173755646, mean loss: 0.3497269976714241
Epoch: 26, step: 344, loss: 0.32756662368774414, mean loss: 0.3497264127952336
Epoch: 26, step: 345, loss: 0.31245115399360657, mean loss: 0.3497254290195988
Epoch: 26, step: 346, loss: 0.35383766889572144, mean loss: 0.34972553754774205
Epoch: 26, step: 347, loss: 0.3233088552951813, mean loss: 0.349724840390499
Epoch: 26, step: 348, loss: 0.3053204119205475, mean loss: 0.3497236685532607
Epoch: 26, step: 349, loss: 0.3211810886859894, mean loss: 0.349722915331646
Epoch: 26, step: 350, loss: 0.3523077368736267, mean loss: 0.3497229835417408
Epoch: 26, step: 351, loss: 0.30376216769218445, mean loss: 0.34972177072730526
Epoch: 26, step: 352, loss: 0.33099812269210815, mean loss: 0.3497212766605444
Epoch: 26, step: 353, loss: 0.3288154602050781, mean loss: 0.34972072502677864
Epoch: 26, step: 354, loss: 0.345289021730423, mean loss: 0.3497206080922079
Epoch: 26, step: 355, loss: 0.3129415810108185, mean loss: 0.3497196376693298
Epoch: 26, step: 356, loss: 0.30741891264915466, mean loss: 0.3497185215846613
Epoch: 26, step: 357, loss: 0.35434690117836, mean loss: 0.3497186436990509
Epoch: 26, step: 358, loss: 0.3355378210544586, mean loss: 0.34971826956447993
Epoch: 26, step: 359, loss: 0.3761084973812103, mean loss: 0.3497189658030779
Epoch: 26, step: 360, loss: 0.33708325028419495, mean loss: 0.34971863245086793
Epoch: 26, step: 361, loss: 0.3231178820133209, mean loss: 0.34971793069519763
Epoch: 26, step: 362, loss: 0.32563072443008423, mean loss: 0.34971729526621975
Epoch: 26, step: 363, loss: 0.33368322253227234, mean loss: 0.3497168722928966
Epoch: 26, step: 364, loss: 0.29817309975624084, mean loss: 0.3497155126217753
Epoch: 26, step: 365, loss: 0.33144885301589966, mean loss: 0.3497150307790002
Epoch: 26, step: 366, loss: 0.3438105881214142, mean loss: 0.34971487503415943
Epoch: 26, step: 367, loss: 0.31105202436447144, mean loss: 0.34971385522906684
Epoch: 26, step: 368, loss: 0.3532201051712036, mean loss: 0.34971394771053604
Epoch: 26, step: 369, loss: 0.31929418444633484, mean loss: 0.3497131453746373
Epoch: 26, step: 370, loss: 0.3560299575328827, mean loss: 0.34971331197920436
Epoch: 26, step: 371, loss: 0.31833019852638245, mean loss: 0.3497124842781427
Epoch: 26, step: 372, loss: 0.3523333668708801, mean loss: 0.34971255339971336
Epoch: 26, step: 373, loss: 0.34323620796203613, mean loss: 0.3497123826010046
Epoch: 26, step: 374, loss: 0.32533302903175354, mean loss: 0.3497117396686074
Epoch: 26, step: 375, loss: 0.33084776997566223, mean loss: 0.3497112422010522
Epoch: 26, step: 376, loss: 0.3748661279678345, mean loss: 0.3497119055507995
Epoch: 26, step: 377, loss: 0.3492797017097473, mean loss: 0.34971189415362003
Epoch: 26, step: 378, loss: 0.31285059452056885, mean loss: 0.3497109221498325
Epoch: 26, step: 379, loss: 0.3777695298194885, mean loss: 0.34971166201397313
Epoch: 26, step: 380, loss: 0.3455807566642761, mean loss: 0.34971155309095797
Epoch: 26, step: 381, loss: 0.36531364917755127, mean loss: 0.3497119644735474
Epoch: 26, step: 382, loss: 0.3347950577735901, mean loss: 0.3497115711678101
Epoch: 26, step: 383, loss: 0.33696743845939636, mean loss: 0.3497112351592489
Epoch: 26, step: 384, loss: 0.3165571689605713, mean loss: 0.34971036105061964
Epoch: 26, step: 385, loss: 0.3325619697570801, mean loss: 0.3497099089443372
Epoch: 26, step: 386, loss: 0.35229283571243286, mean loss: 0.34970997703974116
Epoch: 26, step: 387, loss: 0.32580679655075073, mean loss: 0.34970934688102323
Epoch: 26, step: 388, loss: 0.33303555846214294, mean loss: 0.3497089073221057
Epoch: 26, step: 389, loss: 0.3187641501426697, mean loss: 0.34970809156955707
Epoch: 26, step: 390, loss: 0.33606886863708496, mean loss: 0.3497077320276319
Epoch: 26, step: 391, loss: 0.35073938965797424, mean loss: 0.3497077592223185
Epoch: 26, step: 392, loss: 0.30302080512046814, mean loss: 0.34970652857798445
Epoch: 26, step: 393, loss: 0.3614572584629059, mean loss: 0.34970683831307553
Epoch: 26, step: 394, loss: 0.3427903652191162, mean loss: 0.349706656007978
Epoch: 26, step: 395, loss: 0.3474072515964508, mean loss: 0.3497065954016414
Epoch: 26, step: 396, loss: 0.3006206750869751, mean loss: 0.34970530165818936
Epoch: 26, step: 397, loss: 0.37705498933792114, mean loss: 0.3497060224870249
Epoch: 26, step: 398, loss: 0.31687062978744507, mean loss: 0.3497051570996623
Epoch: 26, step: 399, loss: 0.366669237613678, mean loss: 0.3497056041816915
Epoch: 26, step: 400, loss: 0.3404596745967865, mean loss: 0.3497053605150797
Epoch: 26, step: 401, loss: 0.3112630248069763, mean loss: 0.34970434743502626
Epoch: 26, step: 402, loss: 0.3371848165988922, mean loss: 0.3497040175135348
Epoch: 26, step: 403, loss: 0.36832576990127563, mean loss: 0.3497045082311586
Epoch: 26, step: 404, loss: 0.32474878430366516, mean loss: 0.34970385061899684
Epoch: 26, step: 405, loss: 0.3730419874191284, mean loss: 0.3497044655896635
Epoch: 26, step: 406, loss: 0.3104269504547119, mean loss: 0.34970343063629905
Epoch: 26, step: 407, loss: 0.3691922128200531, mean loss: 0.349703944147634
Epoch: 26, step: 408, loss: 0.35133782029151917, mean loss: 0.3497039871976207
Epoch: 26, step: 409, loss: 0.35927432775497437, mean loss: 0.34970423935392986
Epoch: 26, step: 410, loss: 0.3097752034664154, mean loss: 0.34970318734402633
Epoch: 26, step: 411, loss: 0.3074742555618286, mean loss: 0.34970207476810206
Epoch: 26, step: 412, loss: 0.338021457195282, mean loss: 0.349701767035205
Epoch: 26, step: 413, loss: 0.2943512201309204, mean loss: 0.3497003088301651
Epoch: 26, step: 414, loss: 0.3760921359062195, mean loss: 0.3497010041020921
Epoch: 26, step: 415, loss: 0.3399835228919983, mean loss: 0.3497007481094364
Epoch: 26, step: 416, loss: 0.3463457524776459, mean loss: 0.3497006597293718
Epoch: 26, step: 417, loss: 0.2905714511871338, mean loss: 0.3496991021399787
Epoch: 26, step: 418, loss: 0.3605194687843323, mean loss: 0.3496993871639927
Epoch: 26, step: 419, loss: 0.3474901020526886, mean loss: 0.34969932896977945
Epoch: 26, step: 420, loss: 0.32416218519210815, mean loss: 0.3496986563201343
Epoch: 26, step: 421, loss: 0.3809804916381836, mean loss: 0.3496994802635394
Epoch: 26, step: 422, loss: 0.3789859712123871, mean loss: 0.34970025163054097
Epoch: 26, step: 423, loss: 0.32219478487968445, mean loss: 0.3496995271924154
Epoch: 26, step: 424, loss: 0.32456836104393005, mean loss: 0.3496988653059778
Epoch: 26, step: 425, loss: 0.3197997212409973, mean loss: 0.349698077864733
Epoch: 26, step: 426, loss: 0.2963689863681793, mean loss: 0.3496966733957568
Epoch: 26, step: 427, loss: 0.388535737991333, mean loss: 0.3496976962300714
Epoch: 26, step: 428, loss: 0.34679630398750305, mean loss: 0.349697619823355
Epoch: 26, step: 429, loss: 0.36671745777130127, mean loss: 0.34969806802048853
Epoch: 26, step: 430, loss: 0.3355962336063385, mean loss: 0.34969769667527684
Epoch: 26, step: 431, loss: 0.3383452892303467, mean loss: 0.34969739773891056
Epoch: 26, step: 432, loss: 0.3467598557472229, mean loss: 0.3496973203883565
Epoch: 26, step: 433, loss: 0.3819161653518677, mean loss: 0.3496981687438508
Epoch: 26, step: 434, loss: 0.3584919273853302, mean loss: 0.34969840028650967
Epoch: 26, step: 435, loss: 0.31401896476745605, mean loss: 0.34969746085956077
Epoch: 26, step: 436, loss: 0.3086952567100525, mean loss: 0.3496963813144158
Epoch: 26, step: 437, loss: 0.32870298624038696, mean loss: 0.34969582859483617
Epoch: 26, step: 438, loss: 0.30991655588150024, mean loss: 0.34969478130334486
Epoch: 26, step: 439, loss: 0.3722541928291321, mean loss: 0.3496953752221403
Epoch: 26, step: 440, loss: 0.3327189087867737, mean loss: 0.3496949282966056
Epoch: 26, step: 441, loss: 0.33503809571266174, mean loss: 0.3496945424483303
Epoch: 26, step: 442, loss: 0.30700698494911194, mean loss: 0.34969341870711623
Epoch: 26, step: 443, loss: 0.39537835121154785, mean loss: 0.3496946213219552
Epoch: 26, step: 444, loss: 0.3154503405094147, mean loss: 0.3496937198957315
Epoch: 26, step: 445, loss: 0.32557812333106995, mean loss: 0.3496930851077198
Epoch: 26, step: 446, loss: 0.30408376455307007, mean loss: 0.34969188457810607
Epoch: 26, step: 447, loss: 0.34377625584602356, mean loss: 0.3496917288708853
Epoch: 26, step: 448, loss: 0.2867657542228699, mean loss: 0.349690072619085
Epoch: 26, step: 449, loss: 0.3379598557949066, mean loss: 0.3496897638804204
Epoch: 26, step: 450, loss: 0.32467710971832275, mean loss: 0.349689105566059
Epoch: 26, step: 451, loss: 0.3462395966053009, mean loss: 0.34968901477995096
Epoch: 26, step: 452, loss: 0.2996646761894226, mean loss: 0.34968769824605117
Epoch: 26, step: 453, loss: 0.34583017230033875, mean loss: 0.3496875967268674
Epoch: 26, step: 454, loss: 0.28748124837875366, mean loss: 0.34968595967462
Epoch: 26, step: 455, loss: 0.3424507677555084, mean loss: 0.3496857692748327
Epoch: 26, step: 456, loss: 0.2995796203613281, mean loss: 0.3496844507266652
Epoch: 26, step: 457, loss: 0.31298550963401794, mean loss: 0.34968348501588437
Epoch: 26, step: 458, loss: 0.3094998896121979, mean loss: 0.34968242763632473
Epoch: 26, step: 459, loss: 0.32553085684776306, mean loss: 0.3496817921355672
Epoch: 26, step: 460, loss: 0.3256027400493622, mean loss: 0.349681158559667
Epoch: 26, step: 461, loss: 0.3114839494228363, mean loss: 0.349680153528642
Epoch: 26, step: 462, loss: 0.32430794835090637, mean loss: 0.3496794859620049
Epoch: 26, step: 463, loss: 0.3515518605709076, mean loss: 0.34967953522464984
Epoch: 26, step: 464, loss: 0.2915574908256531, mean loss: 0.3496780060593364
Epoch: 26, step: 465, loss: 0.3182085454463959, mean loss: 0.3496771781335113
Epoch: 26, step: 466, loss: 0.3096778094768524, mean loss: 0.3496761258231628
Epoch: 26, step: 467, loss: 0.3048911988735199, mean loss: 0.34967494764451
Epoch: 26, step: 468, loss: 0.30994874238967896, mean loss: 0.3496739025755795
Epoch: 26, step: 469, loss: 0.3235534727573395, mean loss: 0.3496732154489994
Epoch: 26, step: 470, loss: 0.2860373854637146, mean loss: 0.34967154148267066
Epoch: 26, step: 471, loss: 0.3075045645236969, mean loss: 0.34967043229240974
Epoch: 26, step: 472, loss: 0.2931724190711975, mean loss: 0.3496689461674335
Epoch: 26, step: 473, loss: 0.30554118752479553, mean loss: 0.3496677854604357
Epoch: 26, step: 474, loss: 0.3153606653213501, mean loss: 0.3496668830926686
Epoch: 26, step: 475, loss: 0.3820819854736328, mean loss: 0.3496677356729521
Epoch: 26, step: 476, loss: 0.349524587392807, mean loss: 0.34966773190797273
Epoch: 26, step: 477, loss: 0.34590837359428406, mean loss: 0.3496676330347332
Epoch: 26, step: 478, loss: 0.37234994769096375, mean loss: 0.3496682295766856
Epoch: 26, step: 479, loss: 0.3384125530719757, mean loss: 0.3496679335616292
Epoch: 26, step: 480, loss: 0.34535032510757446, mean loss: 0.34966782001505575
Epoch: 26, step: 481, loss: 0.33181482553482056, mean loss: 0.34966735052064457
Epoch: 26, step: 482, loss: 0.31468161940574646, mean loss: 0.34966643049721086
Epoch: 26, step: 483, loss: 0.33320152759552, mean loss: 0.34966599752932137
Epoch: 26, step: 484, loss: 0.35640937089920044, mean loss: 0.3496661748511907
Epoch: 26, step: 485, loss: 0.32533493638038635, mean loss: 0.3496655350605394
Epoch: 26, step: 486, loss: 0.3090246617794037, mean loss: 0.349664466435647
Epoch: 26, step: 487, loss: 0.33388909697532654, mean loss: 0.34966405164364395
Epoch: 26, step: 488, loss: 0.30883148312568665, mean loss: 0.34966297803471175
Epoch: 26, step: 489, loss: 0.32363754510879517, mean loss: 0.3496622937671373
Epoch: 26, step: 490, loss: 0.35370388627052307, mean loss: 0.34966240002696386
Epoch: 26, step: 491, loss: 0.2987712621688843, mean loss: 0.3496610620540472
Epoch: 26, step: 492, loss: 0.3087041974067688, mean loss: 0.34965998529024755
Epoch: 26, step: 493, loss: 0.32158714532852173, mean loss: 0.3496592472693221
Epoch: 26, step: 494, loss: 0.35515648126602173, mean loss: 0.3496593917850559
Epoch: 26, step: 495, loss: 0.3654116690158844, mean loss: 0.3496598058827749
Epoch: 26, step: 496, loss: 0.3213565945625305, mean loss: 0.3496590618641813
Epoch: 26, step: 497, loss: 0.3344123065471649, mean loss: 0.34965866107675375
Epoch: 26, step: 498, loss: 0.3416005074977875, mean loss: 0.34965844925976824
Epoch: 26, step: 499, loss: 0.30581697821617126, mean loss: 0.34965729687119074
Epoch: 26, step: 500, loss: 0.37223073840141296, mean loss: 0.34965789020649185
Epoch: 26, step: 501, loss: 0.300461083650589, mean loss: 0.34965659711900415
Epoch: 26, step: 502, loss: 0.30984923243522644, mean loss: 0.34965555085084415
Epoch: 26, step: 503, loss: 0.3143625855445862, mean loss: 0.34965462326029256
Epoch: 26, step: 504, loss: 0.3498370349407196, mean loss: 0.34965462805441805
Epoch: 26, step: 505, loss: 0.3435524106025696, mean loss: 0.34965446768076625
Epoch: 26, step: 506, loss: 0.30896636843681335, mean loss: 0.34965339837643145
Epoch: 26, step: 507, loss: 0.38964882493019104, mean loss: 0.34965444944934626
Epoch: 26, step: 508, loss: 0.35335537791252136, mean loss: 0.3496545467065523
Epoch: 26, step: 509, loss: 0.31310856342315674, mean loss: 0.3496535863348888
Epoch: 26, step: 510, loss: 0.3034502863883972, mean loss: 0.349652372215852
Epoch: 26, step: 511, loss: 0.37895023822784424, mean loss: 0.3496531420777926
Epoch: 26, step: 512, loss: 0.34106993675231934, mean loss: 0.3496529165422715
Epoch: 26, step: 513, loss: 0.3075258731842041, mean loss: 0.34965180962537207
Epoch: 26, step: 514, loss: 0.39715632796287537, mean loss: 0.34965305780631056
Epoch: 26, step: 515, loss: 0.3551679253578186, mean loss: 0.3496532027056157
Epoch: 26, step: 516, loss: 0.33078157901763916, mean loss: 0.3496527068798705
Epoch: 26, step: 517, loss: 0.35547971725463867, mean loss: 0.3496528599724661
Epoch: 26, step: 518, loss: 0.33594682812690735, mean loss: 0.3496524998844056
Epoch: 26, step: 519, loss: 0.33278369903564453, mean loss: 0.3496520567149844
Epoch: 26, step: 520, loss: 0.3128962218761444, mean loss: 0.34965109110786924
Epoch: 26, step: 521, loss: 0.31386280059814453, mean loss: 0.34965015094366736
Epoch: 26, step: 522, loss: 0.3223864734172821, mean loss: 0.34964943474124727
Epoch: 26, step: 523, loss: 0.33673912286758423, mean loss: 0.3496490956030768
Epoch: 26, step: 524, loss: 0.3304200768470764, mean loss: 0.34964859049344016
Epoch: 26, step: 525, loss: 0.3479559123516083, mean loss: 0.34964854603118267
Epoch: 26, step: 526, loss: 0.31072530150413513, mean loss: 0.349647523645521
Epoch: 26, step: 527, loss: 0.31125548481941223, mean loss: 0.34964651523937407
Epoch: 26, step: 528, loss: 0.314368337392807, mean loss: 0.3496455886463069
Epoch: 26, step: 529, loss: 0.3683837950229645, mean loss: 0.3496460807985992
Epoch: 26, step: 530, loss: 0.29660606384277344, mean loss: 0.34964468775810137
Epoch: 26, step: 531, loss: 0.3203464448451996, mean loss: 0.34964391829064384
Epoch: 26, step: 532, loss: 0.2997050881385803, mean loss: 0.3496426067684611
Epoch: 26, step: 533, loss: 0.33045724034309387, mean loss: 0.34964210292460307
Epoch: 26, step: 534, loss: 0.37389975786209106, mean loss: 0.34964273995958134
Epoch: 26, step: 535, loss: 0.32601478695869446, mean loss: 0.3496421194776223
Epoch: 26, step: 536, loss: 0.3374963104724884, mean loss: 0.3496418005309296
Epoch: 26, step: 537, loss: 0.3163657784461975, mean loss: 0.3496409267317046
Epoch: 26, step: 538, loss: 0.3209960460662842, mean loss: 0.3496401745619526
Epoch: 26, step: 539, loss: 0.3051491975784302, mean loss: 0.34963900632917816
Epoch: 26, step: 540, loss: 0.30264467000961304, mean loss: 0.3496377723962303
Epoch: 26, step: 541, loss: 0.34654706716537476, mean loss: 0.34963769124553895
Epoch: 26, step: 542, loss: 0.35213419795036316, mean loss: 0.3496377567930146
Epoch: 26, step: 543, loss: 0.3281639814376831, mean loss: 0.34963719299929075
Epoch: 26, step: 544, loss: 0.3656354546546936, mean loss: 0.349637613022438
Epoch: 26, step: 545, loss: 0.3095458149909973, mean loss: 0.34963656046801345
Epoch: 26, step: 546, loss: 0.30411961674690247, mean loss: 0.3496353655153023
Epoch: 26, step: 547, loss: 0.33801186084747314, mean loss: 0.3496350603723676
Epoch: 26, step: 548, loss: 0.2887378931045532, mean loss: 0.3496334617278064
Epoch: 26, step: 549, loss: 0.295978844165802, mean loss: 0.3496320532483198
Epoch: 26, step: 550, loss: 0.38899293541908264, mean loss: 0.34963308647793445
Epoch: 26, step: 551, loss: 0.32332995533943176, mean loss: 0.34963239603455093
Epoch: 26, step: 552, loss: 0.29034602642059326, mean loss: 0.3496308398393226
Epoch: 26, step: 553, loss: 0.3313339054584503, mean loss: 0.3496303595796139
Epoch: 26, step: 554, loss: 0.324148952960968, mean loss: 0.34962969075873623
Epoch: 26, step: 555, loss: 0.32002121210098267, mean loss: 0.34962891363331217
Epoch: 26, step: 556, loss: 0.33042407035827637, mean loss: 0.34962840958241387
Epoch: 26, step: 557, loss: 0.3110998868942261, mean loss: 0.3496273983881803
Epoch: 26, step: 558, loss: 0.3660699129104614, mean loss: 0.3496278299162627
Epoch: 26, step: 559, loss: 0.34951382875442505, mean loss: 0.3496278269244203
Epoch: 26, step: 560, loss: 0.31257864832878113, mean loss: 0.34962685463263193
Epoch: 26, step: 561, loss: 0.3457866311073303, mean loss: 0.349626753855234
Epoch: 26, step: 562, loss: 0.3521708846092224, mean loss: 0.3496268206180533
Epoch: 26, step: 563, loss: 0.3212842047214508, mean loss: 0.3496260768735404
Epoch: 26, step: 564, loss: 0.30935654044151306, mean loss: 0.3496250201799396
Epoch: 26, step: 565, loss: 0.3111887574195862, mean loss: 0.3496240116188596
Epoch: 26, step: 566, loss: 0.3503812551498413, mean loss: 0.3496240314882813
Epoch: 26, step: 567, loss: 0.3223072290420532, mean loss: 0.3496233147375874
Epoch: 26, step: 568, loss: 0.3440086841583252, mean loss: 0.3496231674222205
Epoch: 26, step: 569, loss: 0.35886460542678833, mean loss: 0.34962340989055246
Epoch: 26, step: 570, loss: 0.3389883041381836, mean loss: 0.3496231308637716
Epoch: 26, step: 571, loss: 0.343854159116745, mean loss: 0.34962297951075066
Epoch: 26, step: 572, loss: 0.3065970838069916, mean loss: 0.3496218507258068
Epoch: 26, step: 573, loss: 0.329183965921402, mean loss: 0.3496213145516947
Epoch: 26, step: 574, loss: 0.3052414059638977, mean loss: 0.349620150305293
Epoch: 26, step: 575, loss: 0.3555731475353241, mean loss: 0.3496203064699632
Epoch: 26, step: 576, loss: 0.3135751187801361, mean loss: 0.3496193609232124
Epoch: 26, step: 577, loss: 0.3269784152507782, mean loss: 0.34961876701560857
Epoch: 26, step: 578, loss: 0.3082972466945648, mean loss: 0.34961768311559227
Epoch: 26, step: 579, loss: 0.2968294024467468, mean loss: 0.3496162984686332
Epoch: 26, step: 580, loss: 0.34428587555885315, mean loss: 0.34961615865426177
Epoch: 26, step: 581, loss: 0.3406417965888977, mean loss: 0.3496159232673325
Epoch: 26, step: 582, loss: 0.3351365327835083, mean loss: 0.3496155434999633
Epoch: 26, step: 583, loss: 0.3234981596469879, mean loss: 0.3496148585077305
Epoch: 26, step: 584, loss: 0.3015584349632263, mean loss: 0.34961359814361015
Epoch: 26, step: 585, loss: 0.38733598589897156, mean loss: 0.3496145874535434
Epoch: 26, step: 586, loss: 0.29741644859313965, mean loss: 0.3496132185374683
Epoch: 26, step: 587, loss: 0.35158026218414307, mean loss: 0.34961327012258436
Epoch: 26, step: 588, loss: 0.29441678524017334, mean loss: 0.34961182264966373
Epoch: 26, step: 589, loss: 0.3458155393600464, mean loss: 0.3496117230985207
Epoch: 26, step: 590, loss: 0.35163065791130066, mean loss: 0.3496117760403015
Epoch: 26, step: 591, loss: 0.3456101715564728, mean loss: 0.34961167111045877
Epoch: 26, step: 592, loss: 0.3356248736381531, mean loss: 0.34961130435907634
Epoch: 26, step: 593, loss: 0.33342134952545166, mean loss: 0.3496108798492742
Epoch: 26, step: 594, loss: 0.3396281898021698, mean loss: 0.34961061810433997
Epoch: 26, step: 595, loss: 0.3423563241958618, mean loss: 0.3496104279026119
Epoch: 26, step: 596, loss: 0.36983606219291687, mean loss: 0.34961095818850607
Epoch: 26, step: 597, loss: 0.3546822965145111, mean loss: 0.34961109114792943
Epoch: 26, step: 598, loss: 0.3463766276836395, mean loss: 0.3496110063495794
Epoch: 26, step: 599, loss: 0.32517769932746887, mean loss: 0.34961036579517973
Epoch: 26, step: 600, loss: 0.3146263360977173, mean loss: 0.34960944866240484
Epoch: 26, step: 601, loss: 0.3168000280857086, mean loss: 0.3496085885611996
Epoch: 26, step: 602, loss: 0.3018917143344879, mean loss: 0.3496073376928685
Epoch: 26, step: 603, loss: 0.3273899257183075, mean loss: 0.3496067552924288
Epoch: 26, step: 604, loss: 0.34711888432502747, mean loss: 0.34960669007785
Epoch: 26, step: 605, loss: 0.31898462772369385, mean loss: 0.34960588740255893
Epoch: 26, step: 606, loss: 0.31662410497665405, mean loss: 0.34960502289619144
Epoch: 26, step: 607, loss: 0.33203181624412537, mean loss: 0.34960456228582626
Epoch: 26, step: 608, loss: 0.3034023344516754, mean loss: 0.3496033513134824
Epoch: 26, step: 609, loss: 0.3386307656764984, mean loss: 0.349603063726712
Epoch: 26, step: 610, loss: 0.3314358592033386, mean loss: 0.3496025875845413
Epoch: 26, step: 611, loss: 0.3524942100048065, mean loss: 0.34960266336875406
Epoch: 26, step: 612, loss: 0.3845491409301758, mean loss: 0.3496035792289517
Epoch: 26, step: 613, loss: 0.311984121799469, mean loss: 0.3496025933424422
Epoch: 26, step: 614, loss: 0.33733677864074707, mean loss: 0.34960227190281584
Epoch: 26, step: 615, loss: 0.33052927255630493, mean loss: 0.34960177208627113
Epoch: 26, step: 616, loss: 0.34832751750946045, mean loss: 0.34960173869473066
Epoch: 26, step: 617, loss: 0.2986414134502411, mean loss: 0.34960040332642595
Epoch: 26, step: 618, loss: 0.3205292224884033, mean loss: 0.3495996415629158
Epoch: 26, step: 619, loss: 0.3557654619216919, mean loss: 0.3495998031240823
Epoch: 26, step: 620, loss: 0.3250579237937927, mean loss: 0.3495991600773292
Epoch: 26, step: 621, loss: 0.33815115690231323, mean loss: 0.34959886012440844
Epoch: 26, step: 622, loss: 0.3565247058868408, mean loss: 0.3495990415860314
Epoch: 26, step: 623, loss: 0.33968567848205566, mean loss: 0.34959878185633364
Epoch: 26, step: 624, loss: 0.32828205823898315, mean loss: 0.34959822337370067
Epoch: 26, step: 625, loss: 0.36827126145362854, mean loss: 0.34959871258088115
Epoch: 26, step: 626, loss: 0.3235935568809509, mean loss: 0.3495980313004405
Epoch: 26, step: 627, loss: 0.3156990110874176, mean loss: 0.3495971432406005
Epoch: 26, step: 628, loss: 0.3138459026813507, mean loss: 0.34959620668228547
Epoch: 26, step: 629, loss: 0.3251612186431885, mean loss: 0.34959556658724594
Epoch: 26, step: 630, loss: 0.34233978390693665, mean loss: 0.349595376520902
Epoch: 26, step: 631, loss: 0.29849398136138916, mean loss: 0.3495940379470556
Epoch: 26, step: 632, loss: 0.31813058257102966, mean loss: 0.3495932138001772
Epoch: 26, step: 633, loss: 0.30640438199043274, mean loss: 0.34959208255098106
Epoch: 26, step: 634, loss: 0.31592264771461487, mean loss: 0.3495912006673582
Epoch: 26, step: 635, loss: 0.3011435270309448, mean loss: 0.3495899317392902
Epoch: 26, step: 636, loss: 0.306307852268219, mean loss: 0.3495887981367269
Epoch: 26, step: 637, loss: 0.33235085010528564, mean loss: 0.3495883466688092
Epoch: 26, step: 638, loss: 0.3209022581577301, mean loss: 0.34958759538974493
Epoch: 26, step: 639, loss: 0.33764907717704773, mean loss: 0.3495872827321341
Epoch: 26, step: 640, loss: 0.3030553460121155, mean loss: 0.3495860641401026
Epoch: 26, step: 641, loss: 0.31447654962539673, mean loss: 0.34958514470589863
Epoch: 26, step: 642, loss: 0.31241634488105774, mean loss: 0.34958417136942743
Epoch: 26, step: 643, loss: 0.35260212421417236, mean loss: 0.3495842503982544
Epoch: 26, step: 644, loss: 0.30811357498168945, mean loss: 0.34958316446577603
Epoch: 26, step: 645, loss: 0.34439817070961, mean loss: 0.34958302869741376
Epoch: 26, step: 646, loss: 0.34969449043273926, mean loss: 0.34958303161594784
Epoch: 26, step: 647, loss: 0.3453904986381531, mean loss: 0.3495829218407861
Epoch: 26, step: 648, loss: 0.3380074203014374, mean loss: 0.34958261876164753
Epoch: 26, step: 649, loss: 0.41858017444610596, mean loss: 0.3495844252641266
Epoch: 26, step: 650, loss: 0.33532634377479553, mean loss: 0.34958405196705916
Epoch: 26, step: 651, loss: 0.31253117322921753, mean loss: 0.34958308189483334
Epoch: 26, step: 652, loss: 0.3312262296676636, mean loss: 0.3495826013112213
Epoch: 26, step: 653, loss: 0.33710166811943054, mean loss: 0.3495822745681146
Epoch: 26, step: 654, loss: 0.3410170078277588, mean loss: 0.34958205034060236
Epoch: 26, step: 655, loss: 0.3195764720439911, mean loss: 0.3495812648542595
Epoch: 26, step: 656, loss: 0.3649142384529114, mean loss: 0.3495816662304957
Epoch: 26, step: 657, loss: 0.3373505771160126, mean loss: 0.34958134606167957
Epoch: 26, step: 658, loss: 0.29720836877822876, mean loss: 0.34957997514899514
Epoch: 26, step: 659, loss: 0.33110132813453674, mean loss: 0.3495794914654276
Epoch: 26, step: 660, loss: 0.32186123728752136, mean loss: 0.34957876595164206
Epoch: 26, step: 661, loss: 0.3688187301158905, mean loss: 0.3495792695365283
Epoch: 26, step: 662, loss: 0.35061436891555786, mean loss: 0.3495792966284062
Epoch: 26, step: 663, loss: 0.347546249628067, mean loss: 0.349579243418424
Epoch: 26, step: 664, loss: 0.3089902400970459, mean loss: 0.3495781811293476
Epoch: 26, step: 665, loss: 0.35725897550582886, mean loss: 0.3495783821446414
Epoch: 26, step: 666, loss: 0.3444318175315857, mean loss: 0.34957824745660354
Epoch: 26, step: 667, loss: 0.3485075831413269, mean loss: 0.3495782194375437
Epoch: 26, step: 668, loss: 0.3370579183101654, mean loss: 0.34957789179247195
Epoch: 26, step: 669, loss: 0.3195512294769287, mean loss: 0.34957710604216274
Epoch: 26, step: 670, loss: 0.3182910978794098, mean loss: 0.34957628735818624
Epoch: 26, step: 671, loss: 0.35111042857170105, mean loss: 0.3495763275021368
Epoch: 26, step: 672, loss: 0.330147385597229, mean loss: 0.3495758191173367
Epoch: 26, step: 673, loss: 0.37433022260665894, mean loss: 0.34957646683316407
Epoch: 26, step: 674, loss: 0.3179723918437958, mean loss: 0.3495756399126536
Epoch: 26, step: 675, loss: 0.30320098996162415, mean loss: 0.34957442655184906
Epoch: 26, step: 676, loss: 0.3180352747440338, mean loss: 0.349573601373235
Epoch: 26, step: 677, loss: 0.30437272787094116, mean loss: 0.3495724187853667
Epoch: 26, step: 678, loss: 0.3431658446788788, mean loss: 0.34957225117491997
Epoch: 26, step: 679, loss: 0.31426629424095154, mean loss: 0.3495713275155192
Epoch: 26, step: 680, loss: 0.33667612075805664, mean loss: 0.3495709901654405
Epoch: 26, step: 681, loss: 0.34298303723335266, mean loss: 0.3495708178232407
Epoch: 26, step: 682, loss: 0.2912428081035614, mean loss: 0.34956929199045966
Epoch: 26, step: 683, loss: 0.3693327307701111, mean loss: 0.3495698089790225
Epoch: 26, step: 684, loss: 0.31954729557037354, mean loss: 0.3495690236455477
Epoch: 26, step: 685, loss: 0.3174523711204529, mean loss: 0.3495681835552384
Epoch: 26, step: 686, loss: 0.3733198642730713, mean loss: 0.3495688048228149
Epoch: 26, step: 687, loss: 0.35256829857826233, mean loss: 0.34956888327787233
Epoch: 26, step: 688, loss: 0.3345523774623871, mean loss: 0.34956849051492367
Epoch: 26, step: 689, loss: 0.32463985681533813, mean loss: 0.34956783851320533
Epoch: 26, step: 690, loss: 0.32193487882614136, mean loss: 0.3495671157994696
Epoch: 26, step: 691, loss: 0.3052562475204468, mean loss: 0.3495659569212323
Epoch: 26, step: 692, loss: 0.3117058277130127, mean loss: 0.3495649667774133
Epoch: 26, step: 693, loss: 0.3319368064403534, mean loss: 0.3495645057658453
Epoch: 26, step: 694, loss: 0.31857171654701233, mean loss: 0.3495636952637606
Epoch: 26, step: 695, loss: 0.3084651529788971, mean loss: 0.3495626205110858
Epoch: 26, step: 696, loss: 0.3126011788845062, mean loss: 0.3495616539714653
Epoch: 26, step: 697, loss: 0.3234816789627075, mean loss: 0.34956097199941866
Epoch: 26, step: 698, loss: 0.3094671666622162, mean loss: 0.34955992360349425
Epoch: 26, step: 699, loss: 0.3167259097099304, mean loss: 0.34955906506322926
Epoch: 26, step: 700, loss: 0.37443000078201294, mean loss: 0.34955971536877817
Epoch: 26, step: 701, loss: 0.30603963136672974, mean loss: 0.3495585774698083
Epoch: 26, step: 702, loss: 0.3162485659122467, mean loss: 0.3495577065515256
Epoch: 26, step: 703, loss: 0.3354856073856354, mean loss: 0.3495573386342707
Epoch: 26, step: 704, loss: 0.33887916803359985, mean loss: 0.34955705945911314
Epoch: 26, step: 705, loss: 0.3392381966114044, mean loss: 0.34955678968492104
Epoch: 26, step: 706, loss: 0.34112516045570374, mean loss: 0.3495565692559328
Epoch: 26, step: 707, loss: 0.29880398511886597, mean loss: 0.349555242460363
Epoch: 26, step: 708, loss: 0.3010352551937103, mean loss: 0.349553974063446
Epoch: 26, step: 709, loss: 0.3572036325931549, mean loss: 0.3495541740336068
Epoch: 26, step: 710, loss: 0.36681032180786133, mean loss: 0.3495546251157601
Epoch: 26, step: 711, loss: 0.3316130042076111, mean loss: 0.34955415612734236
Epoch: 26, step: 712, loss: 0.29780352115631104, mean loss: 0.34955280341712014
Epoch: 26, step: 713, loss: 0.418376088142395, mean loss: 0.3495546023424358
Epoch: 26, step: 714, loss: 0.3174494504928589, mean loss: 0.34955376318950837
Epoch: 26, step: 715, loss: 0.36614790558815, mean loss: 0.34955419690990563
Epoch: 26, step: 716, loss: 0.30852967500686646, mean loss: 0.3495531246817385
Epoch: 26, step: 717, loss: 0.3164008557796478, mean loss: 0.3495522582275829
Epoch: 26, step: 718, loss: 0.31628304719924927, mean loss: 0.34955138873980024
Epoch: 26, step: 719, loss: 0.3531450033187866, mean loss: 0.34955148265613356
Epoch: 26, step: 720, loss: 0.3106921315193176, mean loss: 0.3495504671236329
Epoch: 26, step: 721, loss: 0.30259639024734497, mean loss: 0.34954924007934096
Epoch: 26, step: 722, loss: 0.327719509601593, mean loss: 0.3495486696209701
Epoch: 26, step: 723, loss: 0.3422681391239166, mean loss: 0.34954847936983346
Epoch: 26, step: 724, loss: 0.35556694865226746, mean loss: 0.34954863663731583
Epoch: 26, step: 725, loss: 0.3497612476348877, mean loss: 0.3495486421928684
Epoch: 26, step: 726, loss: 0.32301065325737, mean loss: 0.3495479487699389
Epoch: 26, step: 727, loss: 0.345488965511322, mean loss: 0.3495478427137292
Epoch: 26, step: 728, loss: 0.32430973649024963, mean loss: 0.3495471832904746
Epoch: 26, step: 729, loss: 0.3648347854614258, mean loss: 0.34954758271572856
Epoch: 26, step: 730, loss: 0.33458155393600464, mean loss: 0.34954719170256643
Epoch: 26, step: 731, loss: 0.3094291388988495, mean loss: 0.34954614357703595
Epoch: 26, step: 732, loss: 0.326156884431839, mean loss: 0.34954553252446796
Epoch: 26, step: 733, loss: 0.3104715049266815, mean loss: 0.34954451172851214
Epoch: 26, step: 734, loss: 0.3393920361995697, mean loss: 0.3495442465053995
Epoch: 26, step: 735, loss: 0.3234158158302307, mean loss: 0.3495435639445146
Epoch: 26, step: 736, loss: 0.3072269856929779, mean loss: 0.34954245852463917
Epoch: 26, step: 737, loss: 0.3333113491535187, mean loss: 0.3495420345366194
Epoch: 26, step: 738, loss: 0.3699820041656494, mean loss: 0.3495425684542755
Epoch: 26, step: 739, loss: 0.32352975010871887, mean loss: 0.34954188898456634
Epoch: 26, step: 740, loss: 0.31768500804901123, mean loss: 0.34954105688633114
Epoch: 26, step: 741, loss: 0.32816222310066223, mean loss: 0.3495404984881233
Epoch: 26, step: 742, loss: 0.2888738214969635, mean loss: 0.3495389139639508
Epoch: 26, step: 743, loss: 0.3289504945278168, mean loss: 0.3495383762388297
Epoch: 26, step: 744, loss: 0.3568814694881439, mean loss: 0.34953856801958266
Epoch: 26, step: 745, loss: 0.37306466698646545, mean loss: 0.349539182438464
Epoch: 26, step: 746, loss: 0.343413382768631, mean loss: 0.34953902245832064
Epoch: 26, step: 747, loss: 0.3083501160144806, mean loss: 0.34953794680527445
Epoch: 26, step: 748, loss: 0.3237151503562927, mean loss: 0.34953727245757515
Epoch: 26, step: 749, loss: 0.32136252522468567, mean loss: 0.3495365367092273
Epoch: 26, step: 750, loss: 0.35344183444976807, mean loss: 0.34953663868853896
Epoch: 26, step: 751, loss: 0.3398715555667877, mean loss: 0.34953638631014117
Epoch: 26, step: 752, loss: 0.3038523197174072, mean loss: 0.349535193421231
Epoch: 26, step: 753, loss: 0.3193562626838684, mean loss: 0.349534405418444
Epoch: 26, step: 754, loss: 0.3020864725112915, mean loss: 0.34953316653667404
Epoch: 26, step: 755, loss: 0.29004812240600586, mean loss: 0.34953161340236255
Epoch: 26, step: 756, loss: 0.391476035118103, mean loss: 0.3495327085283832
Epoch: 26, step: 757, loss: 0.34064820408821106, mean loss: 0.34953247656910064
Epoch: 26, step: 758, loss: 0.3460288345813751, mean loss: 0.34953238509736245
Epoch: 26, step: 759, loss: 0.35734161734580994, mean loss: 0.34953258897247336
Epoch: 26, step: 760, loss: 0.3044324815273285, mean loss: 0.34953141157768297
Epoch: 26, step: 761, loss: 0.29142141342163086, mean loss: 0.34952989458300443
Epoch: 26, step: 762, loss: 0.3132684826850891, mean loss: 0.34952894798285566
Epoch: 26, step: 763, loss: 0.3353573679924011, mean loss: 0.34952857804498394
Epoch: 26, step: 764, loss: 0.3554229140281677, mean loss: 0.34952873190794
Epoch: 26, step: 765, loss: 0.3156874477863312, mean loss: 0.3495278485541388
Epoch: 26, step: 766, loss: 0.317813903093338, mean loss: 0.34952702075153746
Epoch: 26, step: 767, loss: 0.3333745300769806, mean loss: 0.34952659914758377
Epoch: 26, step: 768, loss: 0.3145148754119873, mean loss: 0.34952568531353956
Epoch: 26, step: 769, loss: 0.368160218000412, mean loss: 0.34952617167707994
Epoch: 26, step: 770, loss: 0.3517604172229767, mean loss: 0.34952622998963495
Epoch: 26, step: 771, loss: 0.3228470981121063, mean loss: 0.34952553369743644
Epoch: 26, step: 772, loss: 0.2867620885372162, mean loss: 0.34952389569223874
Epoch: 26, step: 773, loss: 0.3080909252166748, mean loss: 0.34952281439962235
Epoch: 26, step: 774, loss: 0.3138694167137146, mean loss: 0.3495218839630847
Epoch: 26, step: 775, loss: 0.3309163451194763, mean loss: 0.34952139843232155
Epoch: 26, step: 776, loss: 0.3083288073539734, mean loss: 0.34952032349714035
Epoch: 26, step: 777, loss: 0.3095635175704956, mean loss: 0.3495192808374168
Epoch: 26, step: 778, loss: 0.33824098110198975, mean loss: 0.34951898654157004
Epoch: 26, step: 779, loss: 0.36403730511665344, mean loss: 0.34951936537255257
Epoch: 26, step: 780, loss: 0.30589956045150757, mean loss: 0.349518227217173
Epoch: 26, step: 781, loss: 0.2999167740345001, mean loss: 0.3495169330186346
Epoch: 26, step: 782, loss: 0.3062071204185486, mean loss: 0.3495158030107394
Epoch: 26, step: 783, loss: 0.32179877161979675, mean loss: 0.3495150798571339
Epoch: 26, step: 784, loss: 0.3404206931591034, mean loss: 0.3495148425854415
Epoch: 26, step: 785, loss: 0.3348187208175659, mean loss: 0.3495144591750119
Epoch: 26, step: 786, loss: 0.3079662322998047, mean loss: 0.34951337524224535
Epoch: 26, step: 787, loss: 0.31357342004776, mean loss: 0.34951243764558476
Epoch: 26, step: 788, loss: 0.34107041358947754, mean loss: 0.3495122174169552
Epoch: 26, step: 789, loss: 0.3294314444065094, mean loss: 0.349511693579813
Epoch: 26, step: 790, loss: 0.34022700786590576, mean loss: 0.3495114513811508
Epoch: 26, step: 791, loss: 0.3387127220630646, mean loss: 0.34951116969476415
Epoch: 26, step: 792, loss: 0.3625151515007019, mean loss: 0.34951150889662674
Epoch: 26, step: 793, loss: 0.3322692811489105, mean loss: 0.3495110591541324
Epoch: 26, step: 794, loss: 0.3159436583518982, mean loss: 0.34951018361223507
Epoch: 26, step: 795, loss: 0.34305739402770996, mean loss: 0.3495100153078641
Epoch: 26, step: 796, loss: 0.35013845562934875, mean loss: 0.3495100316986813
Epoch: 26, step: 797, loss: 0.3419468402862549, mean loss: 0.3495098344426328
Epoch: 26, step: 798, loss: 0.3725902736186981, mean loss: 0.34951043638925083
Epoch: 26, step: 799, loss: 0.3064989447593689, mean loss: 0.3495093146624714
Epoch: 26, step: 800, loss: 0.2970941960811615, mean loss: 0.3495079477275756
Epoch: 26, step: 801, loss: 0.3272271752357483, mean loss: 0.34950736668203
Epoch: 26, step: 802, loss: 0.32170140743255615, mean loss: 0.349506641567699
Epoch: 26, step: 803, loss: 0.3139796853065491, mean loss: 0.349505715131998
Epoch: 26, step: 804, loss: 0.34324949979782104, mean loss: 0.3495055519930548
Epoch: 26, step: 805, loss: 0.33215421438217163, mean loss: 0.349505099546181
Epoch: 26, step: 806, loss: 0.34738773107528687, mean loss: 0.34950504433592644
Epoch: 26, step: 807, loss: 0.350519061088562, mean loss: 0.3495050707756624
Epoch: 26, step: 808, loss: 0.3743688762187958, mean loss: 0.3495057190640738
Epoch: 26, step: 809, loss: 0.343311071395874, mean loss: 0.3495055575516457
Epoch: 26, step: 810, loss: 0.30562180280685425, mean loss: 0.34950441340473537
Epoch: 26, step: 811, loss: 0.3520466983318329, mean loss: 0.34950447968601933
Epoch: 26, step: 812, loss: 0.3178144097328186, mean loss: 0.3495036534986232
Epoch: 26, step: 813, loss: 0.3098624348640442, mean loss: 0.34950262004488125
Epoch: 26, step: 814, loss: 0.3457331359386444, mean loss: 0.34950252177631047
Epoch: 26, step: 815, loss: 0.2954757809638977, mean loss: 0.3495011133628378
Epoch: 26, step: 816, loss: 0.3447260856628418, mean loss: 0.3495009888867371
Epoch: 26, step: 817, loss: 0.3842892646789551, mean loss: 0.34950189572881496
Epoch: 26, step: 818, loss: 0.31909117102622986, mean loss: 0.3495011030190503
Epoch: 26, step: 819, loss: 0.3464890122413635, mean loss: 0.3495010245055799
Epoch: 26, step: 820, loss: 0.3076364994049072, mean loss: 0.3494999332889736
Epoch: 26, step: 821, loss: 0.3286156952381134, mean loss: 0.3494993889466379
Epoch: 26, step: 822, loss: 0.33024081587791443, mean loss: 0.34949888698992854
Epoch: 26, step: 823, loss: 0.3266533315181732, mean loss: 0.34949829155739437
Epoch: 26, step: 824, loss: 0.35132312774658203, mean loss: 0.34949833911756506
Epoch: 26, step: 825, loss: 0.358591228723526, mean loss: 0.34949857609670515
Epoch: 26, step: 826, loss: 0.36698395013809204, mean loss: 0.3494990317891302
Epoch: 26, step: 827, loss: 0.3757835626602173, mean loss: 0.3494997167815953
Epoch: 26, step: 828, loss: 0.36378923058509827, mean loss: 0.3495000891661835
Epoch: 26, step: 829, loss: 0.3145359754562378, mean loss: 0.3494991780254708
Epoch: 26, step: 830, loss: 0.32604196667671204, mean loss: 0.34949856676263436
Epoch: 26, step: 831, loss: 0.33743345737457275, mean loss: 0.34949825237058235
Epoch: 26, step: 832, loss: 0.35550951957702637, mean loss: 0.34949840900781837
Epoch: 26, step: 833, loss: 0.4032250642776489, mean loss: 0.34949980894151134
Epoch: 26, step: 834, loss: 0.3576350808143616, mean loss: 0.3495000209134719
Epoch: 26, step: 835, loss: 0.41233015060424805, mean loss: 0.3495016579673982
Epoch: 26, step: 836, loss: 0.3497752845287323, mean loss: 0.34950166509661734
Epoch: 26, step: 837, loss: 0.31686490774154663, mean loss: 0.34950081478247647
Epoch: 26, step: 838, loss: 0.3233495056629181, mean loss: 0.34950013345717307
Epoch: 26, step: 839, loss: 0.30060189962387085, mean loss: 0.34949885953486604
Epoch: 26, step: 840, loss: 0.3297486901283264, mean loss: 0.34949834500655014
Epoch: 26, step: 841, loss: 0.3702472746372223, mean loss: 0.3494988855403289
Epoch: 26, step: 842, loss: 0.35936394333839417, mean loss: 0.34949914252987735
Epoch: 26, step: 843, loss: 0.39465197920799255, mean loss: 0.34950031875256876
Epoch: 26, step: 844, loss: 0.35595399141311646, mean loss: 0.3495004868651182
Epoch: 26, step: 845, loss: 0.3520171642303467, mean loss: 0.349500552420663
Epoch: 26, step: 846, loss: 0.3310298025608063, mean loss: 0.34950007129878913
Epoch: 26, step: 847, loss: 0.3261079490184784, mean loss: 0.34949946200200127
Epoch: 26, step: 848, loss: 0.3198336362838745, mean loss: 0.3494986893136019
Epoch: 26, step: 849, loss: 0.34002143144607544, mean loss: 0.3494984424714425
Epoch: 26, step: 850, loss: 0.35986918210983276, mean loss: 0.3494987125779574
Epoch: 26, step: 851, loss: 0.3662886917591095, mean loss: 0.34949914986254904
Epoch: 26, step: 852, loss: 0.34394195675849915, mean loss: 0.3494990051326716
Epoch: 26, step: 853, loss: 0.29874518513679504, mean loss: 0.3494976833497664
Epoch: 26, step: 854, loss: 0.35735228657722473, mean loss: 0.34949788790205233
Epoch: 26, step: 855, loss: 0.3551923632621765, mean loss: 0.3494980361956815
Epoch: 26, step: 856, loss: 0.3049006760120392, mean loss: 0.3494968748363371
Epoch: 26, step: 857, loss: 0.3488478660583496, mean loss: 0.3494968579359471
Epoch: 26, step: 858, loss: 0.32400503754615784, mean loss: 0.34949619413831695
Epoch: 26, step: 859, loss: 0.3189994692802429, mean loss: 0.34949540003549284
Epoch: 26, step: 860, loss: 0.296652615070343, mean loss: 0.34949402410045927
Epoch: 26, step: 861, loss: 0.36155980825424194, mean loss: 0.34949433826450016
Epoch: 26, step: 862, loss: 0.35439369082450867, mean loss: 0.34949446582855254
Epoch: 26, step: 863, loss: 0.3682684004306793, mean loss: 0.34949495463126556
Epoch: 26, step: 864, loss: 0.32173269987106323, mean loss: 0.3494942318252888
Epoch: 26, step: 865, loss: 0.30443528294563293, mean loss: 0.3494930587206577
Epoch: 26, step: 866, loss: 0.33612602949142456, mean loss: 0.3494927107206257
Epoch: 26, step: 867, loss: 0.3626919388771057, mean loss: 0.3494930543431436
Epoch: 26, step: 868, loss: 0.3777662217617035, mean loss: 0.3494937903743679
Epoch: 26, step: 869, loss: 0.3335406184196472, mean loss: 0.3494933750785915
Epoch: 26, step: 870, loss: 0.34121859073638916, mean loss: 0.34949315967355854
Epoch: 26, step: 871, loss: 0.32703500986099243, mean loss: 0.3494925750694922
Epoch: 26, step: 872, loss: 0.3273174464702606, mean loss: 0.34949199784772583
Epoch: 26, step: 873, loss: 0.3438453674316406, mean loss: 0.34949185086895507
Epoch: 26, step: 874, loss: 0.3439934253692627, mean loss: 0.34949170775160426
Epoch: 26, step: 875, loss: 0.3281778395175934, mean loss: 0.3494911529918897
Epoch: 26, step: 876, loss: 0.3345503509044647, mean loss: 0.3494907641211657
Epoch: 26, step: 877, loss: 0.34554705023765564, mean loss: 0.3494906614790887
Epoch: 26, step: 878, loss: 0.3167596459388733, mean loss: 0.34948980961912096
Epoch: 26, step: 879, loss: 0.34659722447395325, mean loss: 0.3494897343384332
Epoch: 26, step: 880, loss: 0.3407357633113861, mean loss: 0.3494895065187578
Epoch: 26, step: 881, loss: 0.33697161078453064, mean loss: 0.34948918075246066
Epoch: 26, step: 882, loss: 0.3098336458206177, mean loss: 0.3494881487818428
Epoch: 26, step: 883, loss: 0.3713074326515198, mean loss: 0.34948871657834196
Epoch: 26, step: 884, loss: 0.3095228672027588, mean loss: 0.34948767658642504
Epoch: 26, step: 885, loss: 0.33094513416290283, mean loss: 0.3494871940846706
Epoch: 26, step: 886, loss: 0.31349411606788635, mean loss: 0.34948625752101065
Epoch: 26, step: 887, loss: 0.2973530888557434, mean loss: 0.34948490101683016
Epoch: 26, step: 888, loss: 0.3474360406398773, mean loss: 0.3494848477069044
Epoch: 26, step: 889, loss: 0.32613030076026917, mean loss: 0.349484240053604
Epoch: 26, step: 890, loss: 0.3754568099975586, mean loss: 0.34948491580669216
Epoch: 26, step: 891, loss: 0.3158217966556549, mean loss: 0.349484039984048
Epoch: 26, step: 892, loss: 0.31590569019317627, mean loss: 0.34948316638960014
Epoch: 26, step: 893, loss: 0.31758615374565125, mean loss: 0.34948233655941535
Epoch: 26, step: 894, loss: 0.3317999243736267, mean loss: 0.3494818765471313
Epoch: 26, step: 895, loss: 0.3121814727783203, mean loss: 0.34948090619323513
Epoch: 26, step: 896, loss: 0.40007391571998596, mean loss: 0.3494822223142915
Epoch: 26, step: 897, loss: 0.30688586831092834, mean loss: 0.34948111424618883
Epoch: 26, step: 898, loss: 0.3309392035007477, mean loss: 0.34948063192403017
Epoch: 26, step: 899, loss: 0.34639933705329895, mean loss: 0.34948055177381504
Epoch: 26, step: 900, loss: 0.33286741375923157, mean loss: 0.3494801196464119
Epoch: 26, step: 901, loss: 0.3349018096923828, mean loss: 0.3494797404571606
Epoch: 26, step: 902, loss: 0.2997989356517792, mean loss: 0.3494784482677881
Epoch: 26, step: 903, loss: 0.32243892550468445, mean loss: 0.34947774499264345
Epoch: 26, step: 904, loss: 0.2916902005672455, mean loss: 0.34947624202652144
Epoch: 26, step: 905, loss: 0.2975933849811554, mean loss: 0.34947489266743054
Epoch: 26, step: 906, loss: 0.32703888416290283, mean loss: 0.3494743091713315
Epoch: 26, step: 907, loss: 0.42263221740722656, mean loss: 0.34947621174878485
Epoch: 26, step: 908, loss: 0.30858346819877625, mean loss: 0.3494751483013672
Epoch: 26, step: 909, loss: 0.32263943552970886, mean loss: 0.3494744504360536
Epoch: 26, step: 910, loss: 0.3143543601036072, mean loss: 0.34947353715844776
Epoch: 26, step: 911, loss: 0.3210000693798065, mean loss: 0.3494727967416655
Epoch: 26, step: 912, loss: 0.31818267703056335, mean loss: 0.34947198310254357
Epoch: 26, step: 913, loss: 0.32791173458099365, mean loss: 0.34947142248450513
Epoch: 26, step: 914, loss: 0.34797754883766174, mean loss: 0.34947138364122665
Epoch: 26, step: 915, loss: 0.35795989632606506, mean loss: 0.34947160435138486
Epoch: 26, step: 916, loss: 0.36910563707351685, mean loss: 0.34947211484338253
Epoch: 26, step: 917, loss: 0.3726111948490143, mean loss: 0.34947271645224337
Epoch: 26, step: 918, loss: 0.3242066204547882, mean loss: 0.3494720595587094
Epoch: 26, step: 919, loss: 0.3669399321079254, mean loss: 0.349472513694331
Epoch: 26, step: 920, loss: 0.3392069339752197, mean loss: 0.3494722468132776
Epoch: 26, step: 921, loss: 0.32153916358947754, mean loss: 0.3494715206373502
Epoch: 26, step: 922, loss: 0.3497679829597473, mean loss: 0.3494715283442762
Epoch: 26, step: 923, loss: 0.34936562180519104, mean loss: 0.3494715255911687
Epoch: 26, step: 924, loss: 0.35958996415138245, mean loss: 0.34947178861954376
Epoch: 26, step: 925, loss: 0.2889976501464844, mean loss: 0.34947021663777944
Epoch: 26, step: 926, loss: 0.33638960123062134, mean loss: 0.3494698766254219
Epoch: 26, step: 927, loss: 0.33259615302085876, mean loss: 0.3494694380279067
Epoch: 26, step: 928, loss: 0.3053426444530487, mean loss: 0.3494682910730663
Epoch: 26, step: 929, loss: 0.3424511253833771, mean loss: 0.3494681086858518
Epoch: 26, step: 930, loss: 0.36046066880226135, mean loss: 0.34946839439241756
Epoch: 26, step: 931, loss: 0.36362168192863464, mean loss: 0.34946876223958295
Epoch: 26, step: 932, loss: 0.3156697154045105, mean loss: 0.34946788381749094
Epoch: 26, step: 933, loss: 0.32610493898391724, mean loss: 0.3494672766407969
Epoch: 26, step: 934, loss: 0.34110793471336365, mean loss: 0.3494670593965357
Epoch: 26, step: 935, loss: 0.3445998728275299, mean loss: 0.34946693291039826
Epoch: 26, step: 936, loss: 0.28875043988227844, mean loss: 0.34946535507996174
Epoch: 26, step: 937, loss: 0.3454888164997101, mean loss: 0.34946525174493287
Epoch: 26, step: 938, loss: 0.34550750255584717, mean loss: 0.34946514890084096
Epoch: 26, step: 939, loss: 0.316864550113678, mean loss: 0.34946430177999105
Epoch: 26, step: 940, loss: 0.3065585792064667, mean loss: 0.34946318691127404
Epoch: 26, step: 941, loss: 0.357830673456192, mean loss: 0.3494634043276474
Epoch: 26, step: 942, loss: 0.3531469702720642, mean loss: 0.34946350003700233
Epoch: 26, step: 943, loss: 0.3462214171886444, mean loss: 0.34946341580080276
Epoch: 26, step: 944, loss: 0.3211459219455719, mean loss: 0.3494626800712734
Epoch: 26, step: 945, loss: 0.3134791851043701, mean loss: 0.3494617451922148
Epoch: 26, step: 946, loss: 0.330917090177536, mean loss: 0.3494612634002371
Epoch: 26, step: 947, loss: 0.3137889802455902, mean loss: 0.34946033665485743
Epoch: 26, step: 948, loss: 0.29353052377700806, mean loss: 0.34945888366826566
Epoch: 26, step: 949, loss: 0.3098478317260742, mean loss: 0.3494578546494071
Epoch: 26, step: 950, loss: 0.312531054019928, mean loss: 0.3494568953871489
Epoch: 26, step: 951, loss: 0.3240898847579956, mean loss: 0.34945623643529344
Epoch: 26, step: 952, loss: 0.3084881603717804, mean loss: 0.34945517224649786
Epoch: 26, step: 953, loss: 0.32429713010787964, mean loss: 0.34945451875691036
Epoch: 26, step: 954, loss: 0.3526131808757782, mean loss: 0.3494546008022133
Epoch: 26, step: 955, loss: 0.35383185744285583, mean loss: 0.34945471449719095
Epoch: 26, step: 956, loss: 0.28944268822669983, mean loss: 0.3494531557837479
Epoch: 26, step: 957, loss: 0.3461805284023285, mean loss: 0.3494530707848548
Epoch: 26, step: 958, loss: 0.28833717107772827, mean loss: 0.3494514834825743
Epoch: 26, step: 959, loss: 0.3172961473464966, mean loss: 0.3494506483658037
Epoch: 26, step: 960, loss: 0.3271574079990387, mean loss: 0.34945006939579026
Epoch: 26, step: 961, loss: 0.3440411686897278, mean loss: 0.34944992892675414
Epoch: 26, step: 962, loss: 0.29139554500579834, mean loss: 0.3494484212947932
Epoch: 26, step: 963, loss: 0.3272058963775635, mean loss: 0.3494478436868957
Epoch: 26, step: 964, loss: 0.2910524904727936, mean loss: 0.3494463272789595
Epoch: 26, step: 965, loss: 0.35471928119659424, mean loss: 0.3494464642032368
Epoch: 26, step: 966, loss: 0.35212594270706177, mean loss: 0.3494465337802019
Epoch: 26, step: 967, loss: 0.3231697380542755, mean loss: 0.3494458514786926
Epoch: 26, step: 968, loss: 0.3374289870262146, mean loss: 0.34944553945770096
Epoch: 26, step: 969, loss: 0.39211952686309814, mean loss: 0.34944664747004467
Epoch: 26, step: 970, loss: 0.3283867835998535, mean loss: 0.3494461006736311
Epoch: 26, step: 971, loss: 0.3585107624530792, mean loss: 0.34944633602158465
Epoch: 26, step: 972, loss: 0.2901763617992401, mean loss: 0.34944479722120503
Epoch: 26, step: 973, loss: 0.31084704399108887, mean loss: 0.3494437951506606
Epoch: 26, step: 974, loss: 0.3272991180419922, mean loss: 0.34944322024796043
Epoch: 26, step: 975, loss: 0.3008754551410675, mean loss: 0.3494419594025527
Epoch: 26, step: 976, loss: 0.3142402470111847, mean loss: 0.3494410455708144
Epoch: 26, step: 977, loss: 0.3599023222923279, mean loss: 0.34944131713710697
Epoch: 26, step: 978, loss: 0.3292924761772156, mean loss: 0.34944079410305046
Epoch: 26, step: 979, loss: 0.29905572533607483, mean loss: 0.34943948621527227
Epoch: 26, step: 980, loss: 0.328124076128006, mean loss: 0.34943893292753475
Epoch: 26, step: 981, loss: 0.3264486789703369, mean loss: 0.34943833618107895
Epoch: 26, step: 982, loss: 0.3507259488105774, mean loss: 0.3494383696021247
Epoch: 26, step: 983, loss: 0.3448330760002136, mean loss: 0.3494382500710408
Epoch: 26, step: 984, loss: 0.302234947681427, mean loss: 0.3494370249340689
Epoch: 26, step: 985, loss: 0.33246761560440063, mean loss: 0.34943658451337517
Epoch: 26, step: 986, loss: 0.37070390582084656, mean loss: 0.3494371364669011
Epoch: 26, step: 987, loss: 0.34080177545547485, mean loss: 0.34943691235808216
Epoch: 26, step: 988, loss: 0.405366986989975, mean loss: 0.3494383638431633
Epoch: 26, step: 989, loss: 0.3541782796382904, mean loss: 0.3494384868492305
Epoch: 26, step: 990, loss: 0.3479929566383362, mean loss: 0.3494384493370932
Epoch: 26, step: 991, loss: 0.3604440987110138, mean loss: 0.34943873493106703
Epoch: 26, step: 992, loss: 0.28910520672798157, mean loss: 0.349437169331041
Epoch: 26, step: 993, loss: 0.3412030339241028, mean loss: 0.349436955668282
Epoch: 26, step: 994, loss: 0.30432263016700745, mean loss: 0.34943578505343725
Epoch: 26, step: 995, loss: 0.35778144001960754, mean loss: 0.349436001598714
Epoch: 26, step: 996, loss: 0.33368778228759766, mean loss: 0.3494355929891992
Epoch: 26, step: 997, loss: 0.31356608867645264, mean loss: 0.34943466232902815
Epoch: 26, step: 998, loss: 0.33853045105934143, mean loss: 0.3494343794187391
Epoch: 26, step: 999, loss: 0.333717405796051, mean loss: 0.3494339716516775
Epoch: 26, step: 1000, loss: 0.3420593738555908, mean loss: 0.3494337803273087
Epoch: 26, step: 1001, loss: 0.34756121039390564, mean loss: 0.3494337317471724
Epoch: 26, step: 1002, loss: 0.3527442216873169, mean loss: 0.34943381762908127
Epoch: 26, step: 1003, loss: 0.33047255873680115, mean loss: 0.349433325742112
Epoch: 26, step: 1004, loss: 0.3536459505558014, mean loss: 0.34943343502185503
Epoch: 26, step: 1005, loss: 0.360734760761261, mean loss: 0.3494337281820558
Epoch: 26, step: 1006, loss: 0.33921778202056885, mean loss: 0.34943346318384144
Epoch: 26, step: 1007, loss: 0.35352203249931335, mean loss: 0.34943356923720614
Epoch: 26, step: 1008, loss: 0.320837140083313, mean loss: 0.3494328274939137
Epoch: 26, step: 1009, loss: 0.3261200487613678, mean loss: 0.349432222815314
Epoch: 26, step: 1010, loss: 0.3529632091522217, mean loss: 0.3494323143984118
Epoch: 26, step: 1011, loss: 0.3584449589252472, mean loss: 0.34943254815306807
Epoch: 26, step: 1012, loss: 0.31826356053352356, mean loss: 0.34943173976580716
Epoch: 26, step: 1013, loss: 0.3597991168498993, mean loss: 0.3494320086432667
Epoch: 26, step: 1014, loss: 0.3482915759086609, mean loss: 0.34943197906696194
Epoch: 26, step: 1015, loss: 0.32287532091140747, mean loss: 0.34943129035694753
Epoch: 26, step: 1016, loss: 0.33256542682647705, mean loss: 0.349430852975564
Epoch: 26, step: 1017, loss: 0.3318808078765869, mean loss: 0.34943039786314506
Epoch: 26, step: 1018, loss: 0.3837345838546753, mean loss: 0.3494312874253158
Epoch: 26, step: 1019, loss: 0.31760528683662415, mean loss: 0.3494304621478397
Epoch: 26, step: 1020, loss: 0.32025444507598877, mean loss: 0.34942970560649206
Epoch: 26, step: 1021, loss: 0.35527703166007996, mean loss: 0.3494298572251731
Epoch: 26, step: 1022, loss: 0.3321473002433777, mean loss: 0.3494294091074304
Epoch: 26, step: 1023, loss: 0.32946163415908813, mean loss: 0.34942889137835587
Epoch: 26, step: 1024, loss: 0.35139214992523193, mean loss: 0.3494289422808565
Epoch: 26, step: 1025, loss: 0.3011651635169983, mean loss: 0.34942769095135784
Epoch: 26, step: 1026, loss: 0.34559035301208496, mean loss: 0.34942759146371327
Epoch: 26, step: 1027, loss: 0.3172348737716675, mean loss: 0.3494267568500637
Epoch: 26, step: 1028, loss: 0.33680862188339233, mean loss: 0.34942642972655846
Epoch: 26, step: 1029, loss: 0.36087527871131897, mean loss: 0.34942672652878237
Epoch: 26, step: 1030, loss: 0.3522729277610779, mean loss: 0.3494268003123529
Epoch: 26, step: 1031, loss: 0.3393477201461792, mean loss: 0.34942653903383347
Epoch: 26, step: 1032, loss: 0.34382906556129456, mean loss: 0.34942639393510955
Epoch: 26, step: 1033, loss: 0.35870057344436646, mean loss: 0.34942663433584337
Epoch: 26, step: 1034, loss: 0.2928047478199005, mean loss: 0.3494251666491092
Epoch: 26, step: 1035, loss: 0.3557155728340149, mean loss: 0.349425329697481
Epoch: 26, step: 1036, loss: 0.31833040714263916, mean loss: 0.34942452373282085
Epoch: 26, step: 1037, loss: 0.30911338329315186, mean loss: 0.34942347891553716
Epoch: 26, step: 1038, loss: 0.3487784266471863, mean loss: 0.3494234621969754
Epoch: 26, step: 1039, loss: 0.2948337495326996, mean loss: 0.3494220473692576
Epoch: 26, step: 1040, loss: 0.30928099155426025, mean loss: 0.3494210070412593
Epoch: 26, step: 1041, loss: 0.3868757486343384, mean loss: 0.34942197772341327
Epoch: 26, step: 1042, loss: 0.3797445297241211, mean loss: 0.34942276354641066
Epoch: 26, step: 1043, loss: 0.3136153221130371, mean loss: 0.349421835604008
Epoch: 26, step: 1044, loss: 0.32302746176719666, mean loss: 0.34942115161702114
Epoch: 26, step: 1045, loss: 0.320230096578598, mean loss: 0.3494203951761028
Epoch: 26, step: 1046, loss: 0.3587771952152252, mean loss: 0.34942063763678116
Epoch: 26, step: 1047, loss: 0.35428503155708313, mean loss: 0.3494207636834727
Epoch: 26, step: 1048, loss: 0.31379231810569763, mean loss: 0.34941984049933106
Epoch: 26, step: 1049, loss: 0.3324397802352905, mean loss: 0.3494194005330082
Epoch: 26, step: 1050, loss: 0.3138369917869568, mean loss: 0.3494184785895247
Epoch: 26, step: 1051, loss: 0.344661682844162, mean loss: 0.3494183553437027
Epoch: 26, step: 1052, loss: 0.28374841809272766, mean loss: 0.34941665391775634
Epoch: 26, step: 1053, loss: 0.335689902305603, mean loss: 0.349416298284003
Epoch: 26, step: 1054, loss: 0.32921943068504333, mean loss: 0.34941577503553545
Epoch: 26, step: 1055, loss: 0.3050995469093323, mean loss: 0.34941462694672387
Epoch: 26, step: 1056, loss: 0.355483740568161, mean loss: 0.34941478417357347
Epoch: 26, step: 1057, loss: 0.3468724191188812, mean loss: 0.3494147183126063
Epoch: 26, step: 1058, loss: 0.2893736660480499, mean loss: 0.34941316296581293
Epoch: 26, step: 1059, loss: 0.3384547829627991, mean loss: 0.34941287909937413
Epoch: 26, step: 1060, loss: 0.329000324010849, mean loss: 0.3494123503451949
Epoch: 26, step: 1061, loss: 0.31551676988601685, mean loss: 0.34941147235782355
Epoch: 26, step: 1062, loss: 0.31644314527511597, mean loss: 0.3494106184109465
Epoch: 26, step: 1063, loss: 0.32799434661865234, mean loss: 0.3494100637002184
Epoch: 26, step: 1064, loss: 0.3068884611129761, mean loss: 0.3494089623610853
Epoch: 26, step: 1065, loss: 0.37926292419433594, mean loss: 0.34940973557947
Epoch: 26, step: 1066, loss: 0.33226093649864197, mean loss: 0.34940929143663296
Epoch: 26, step: 1067, loss: 0.32264193892478943, mean loss: 0.3494085981974195
Epoch: 26, step: 1068, loss: 0.3295072019100189, mean loss: 0.34940808279078733
Epoch: 26, step: 1069, loss: 0.3269871175289154, mean loss: 0.34940750214736105
Epoch: 26, step: 1070, loss: 0.33991754055023193, mean loss: 0.34940725638893566
Epoch: 26, step: 1071, loss: 0.3101283609867096, mean loss: 0.3494062392225952
Epoch: 26, step: 1072, loss: 0.3414200246334076, mean loss: 0.3494060324169244
Epoch: 26, step: 1073, loss: 0.32914093136787415, mean loss: 0.34940550765901235
Epoch: 26, step: 1074, loss: 0.3324107527732849, mean loss: 0.3494050675969992
Epoch: 26, step: 1075, loss: 0.3370196521282196, mean loss: 0.349404746897479
Epoch: 26, step: 1076, loss: 0.3184640407562256, mean loss: 0.3494039457606327
Epoch: 26, step: 1077, loss: 0.30791711807250977, mean loss: 0.34940287158457534
Epoch: 26, step: 1078, loss: 0.32256242632865906, mean loss: 0.34940217665033263
Epoch: 26, step: 1079, loss: 0.32687196135520935, mean loss: 0.3494015933286856
Epoch: 26, step: 1080, loss: 0.3230300545692444, mean loss: 0.34940091057040057
Epoch: 26, step: 1081, loss: 0.3587934374809265, mean loss: 0.34940115373632274
Epoch: 26, step: 1082, loss: 0.32138973474502563, mean loss: 0.3494004285591412
Epoch: 26, step: 1083, loss: 0.2946746051311493, mean loss: 0.34939901181938177
Epoch: 26, step: 1084, loss: 0.32845598459243774, mean loss: 0.34939846966123045
Epoch: 26, step: 1085, loss: 0.3455073833465576, mean loss: 0.3493983689341708
Epoch: 26, step: 1086, loss: 0.3249945640563965, mean loss: 0.34939773721858286
Epoch: 26, step: 1087, loss: 0.32555505633354187, mean loss: 0.3493971200441967
Epoch: 26, step: 1088, loss: 0.327557772397995, mean loss: 0.34939655474127834
Epoch: 26, step: 1089, loss: 0.3209817707538605, mean loss: 0.34939581925481594
Epoch: 26, step: 1090, loss: 0.3270450830459595, mean loss: 0.34939524074475486
Epoch: 26, step: 1091, loss: 0.33296722173690796, mean loss: 0.3493948155449669
Epoch: 26, step: 1092, loss: 0.33179211616516113, mean loss: 0.3493943599531927
Epoch: 26, step: 1093, loss: 0.33369308710098267, mean loss: 0.349393953584518
Epoch: 26, step: 1094, loss: 0.3052475154399872, mean loss: 0.3493928110487861
Epoch: 26, step: 1095, loss: 0.3007398843765259, mean loss: 0.34939155191507304
Epoch: 26, step: 1096, loss: 0.3435705900192261, mean loss: 0.34939140127295987
Epoch: 26, step: 1097, loss: 0.3204694092273712, mean loss: 0.34939065281294107
Epoch: 26, step: 1098, loss: 0.3230416178703308, mean loss: 0.34938997095503815
Epoch: 26, step: 1099, loss: 0.3542526662349701, mean loss: 0.3493900967881631
Epoch: 26, step: 1100, loss: 0.3045540153980255, mean loss: 0.34938893658421977
Epoch: 26, step: 1101, loss: 0.37579816579818726, mean loss: 0.34938961994677253
Epoch: 26, step: 1102, loss: 0.32477468252182007, mean loss: 0.349388983029614
Epoch: 26, step: 1103, loss: 0.3179067373275757, mean loss: 0.3493881684403545
Epoch: 26, step: 1104, loss: 0.285272479057312, mean loss: 0.349386509518018
Epoch: 26, step: 1105, loss: 0.38850706815719604, mean loss: 0.3493875216928857
Epoch: 26, step: 1106, loss: 0.31323060393333435, mean loss: 0.3493865862211577
Epoch: 26, step: 1107, loss: 0.315985769033432, mean loss: 0.3493857220791421
Epoch: 26, step: 1108, loss: 0.29074525833129883, mean loss: 0.34938420497920814
Epoch: 26, step: 1109, loss: 0.32669350504875183, mean loss: 0.34938361795846173
Epoch: 26, step: 1110, loss: 0.32303449511528015, mean loss: 0.34938293630995976
Epoch: 26, step: 1111, loss: 0.3450410068035126, mean loss: 0.349382823987694
Epoch: 26, step: 1112, loss: 0.2972528040409088, mean loss: 0.3493814754603911
Epoch: 26, step: 1113, loss: 0.3148024082183838, mean loss: 0.3493805809736809
Epoch: 26, step: 1114, loss: 0.33516180515289307, mean loss: 0.3493802131737942
Epoch: 26, step: 1115, loss: 0.2954385578632355, mean loss: 0.34937881789041836
Epoch: 26, step: 1116, loss: 0.3424874544143677, mean loss: 0.3493786396393779
Epoch: 26, step: 1117, loss: 0.34087058901786804, mean loss: 0.3493784195770267
Epoch: 26, step: 1118, loss: 0.32001811265945435, mean loss: 0.3493776601867332
Epoch: 26, step: 1119, loss: 0.33657291531562805, mean loss: 0.34937732900669827
Epoch: 26, step: 1120, loss: 0.3174375891685486, mean loss: 0.34937650294333766
Epoch: 26, step: 1121, loss: 0.3202095627784729, mean loss: 0.34937574861291393
Epoch: 26, step: 1122, loss: 0.3041144013404846, mean loss: 0.34937457807092015
Epoch: 26, step: 1123, loss: 0.3970937430858612, mean loss: 0.3493758121447025
Epoch: 26, step: 1124, loss: 0.3493487238883972, mean loss: 0.3493758114441864
Epoch: 26, step: 1125, loss: 0.3357906937599182, mean loss: 0.3493754601352212
Epoch: 26, step: 1126, loss: 0.32536402344703674, mean loss: 0.349374839219375
Epoch: 26, step: 1127, loss: 0.34800249338150024, mean loss: 0.349374803732567
Epoch: 26, step: 1128, loss: 0.34118151664733887, mean loss: 0.34937459187191267
Epoch: 26, step: 1129, loss: 0.33054211735725403, mean loss: 0.3493741049175114
Epoch: 26, step: 1130, loss: 0.37575143575668335, mean loss: 0.3493747869428725
Epoch: 26, step: 1131, loss: 0.3112905025482178, mean loss: 0.34937380224216935
Epoch: 26, step: 1132, loss: 0.3218303620815277, mean loss: 0.34937309010213363
Epoch: 26, step: 1133, loss: 0.3429243862628937, mean loss: 0.34937292337417875
Epoch: 26, step: 1134, loss: 0.3325532376766205, mean loss: 0.34937248852101044
Epoch: 26, step: 1135, loss: 0.3209335505962372, mean loss: 0.3493717532847663
Epoch: 26, step: 1136, loss: 0.32610568404197693, mean loss: 0.3493711517990435
Epoch: 26, step: 1137, loss: 0.31218013167381287, mean loss: 0.3493701903435829
Epoch: 26, step: 1138, loss: 0.3388620913028717, mean loss: 0.349369918697148
Epoch: 26, step: 1139, loss: 0.31668317317962646, mean loss: 0.34936907372905995
Epoch: 26, step: 1140, loss: 0.3130570650100708, mean loss: 0.34936813507043984
Epoch: 26, step: 1141, loss: 0.31491315364837646, mean loss: 0.34936724443864997
Epoch: 26, step: 1142, loss: 0.33026668429374695, mean loss: 0.34936675071827505
Epoch: 26, step: 1143, loss: 0.3457045257091522, mean loss: 0.3493666560577858
Epoch: 26, step: 1144, loss: 0.34025368094444275, mean loss: 0.3493664205134421
Epoch: 26, step: 1145, loss: 0.36390089988708496, mean loss: 0.3493667961784556
Epoch: 26, step: 1146, loss: 0.3183452785015106, mean loss: 0.349365994402392
Epoch: 26, step: 1147, loss: 0.3339536488056183, mean loss: 0.3493655960682248
Epoch: 26, step: 1148, loss: 0.32727962732315063, mean loss: 0.34936502526811253
Epoch: 26, step: 1149, loss: 0.32389312982559204, mean loss: 0.34936436697753925
Epoch: 26, step: 1150, loss: 0.3455269932746887, mean loss: 0.3493642678077834
Epoch: 26, step: 1151, loss: 0.3380066156387329, mean loss: 0.34936397429806226
Epoch: 26, step: 1152, loss: 0.3377259373664856, mean loss: 0.34936367355028
Epoch: 26, step: 1153, loss: 0.3744736909866333, mean loss: 0.34936432242147325
Epoch: 26, step: 1154, loss: 0.37399381399154663, mean loss: 0.34936495885888946
Epoch: 26, step: 1155, loss: 0.32071173191070557, mean loss: 0.34936421846542826
Epoch: 26, step: 1156, loss: 0.34924155473709106, mean loss: 0.3493642152959048
Epoch: 26, step: 1157, loss: 0.34383007884025574, mean loss: 0.3493640723023526
Epoch: 26, step: 1158, loss: 0.32915645837783813, mean loss: 0.3493635501822605
Epoch: 26, step: 1159, loss: 0.30754783749580383, mean loss: 0.34936246978455776
Epoch: 26, step: 1160, loss: 0.3355097472667694, mean loss: 0.3493621118793125
Epoch: 26, step: 1161, loss: 0.31778955459594727, mean loss: 0.34936129617742434
Epoch: 26, step: 1162, loss: 0.31717708706855774, mean loss: 0.3493604646945115
Epoch: 26, step: 1163, loss: 0.3357425928115845, mean loss: 0.34936011288424274
Epoch: 26, step: 1164, loss: 0.36633923649787903, mean loss: 0.34936055151927886
Epoch: 26, step: 1165, loss: 0.32921260595321655, mean loss: 0.34936003103502244
Epoch: 26, step: 1166, loss: 0.3941955864429474, mean loss: 0.34936118924729825
Epoch: 26, step: 1167, loss: 0.3638053238391876, mean loss: 0.34936156236505483
Epoch: 26, step: 1168, loss: 0.35757583379745483, mean loss: 0.3493617745488544
Epoch: 26, step: 1169, loss: 0.33075278997421265, mean loss: 0.3493612938704287
Epoch: 26, step: 1170, loss: 0.3389502763748169, mean loss: 0.3493610249561191
Epoch: 26, step: 1171, loss: 0.3163696527481079, mean loss: 0.34936017281818627
Epoch: 26, step: 1172, loss: 0.39689433574676514, mean loss: 0.34936140055181564
Epoch: 26, step: 1173, loss: 0.3588743209838867, mean loss: 0.34936164624943516
Epoch: 26, step: 1174, loss: 0.34418797492980957, mean loss: 0.3493615126284398
Epoch: 26, step: 1175, loss: 0.31791388988494873, mean loss: 0.34936070044810036
Epoch: 26, step: 1176, loss: 0.3297743797302246, mean loss: 0.34936019461610435
Epoch: 26, step: 1177, loss: 0.39266037940979004, mean loss: 0.34936131284824096
Epoch: 26, step: 1178, loss: 0.3207539916038513, mean loss: 0.34936057408003485
Epoch: 26, step: 1179, loss: 0.30277562141418457, mean loss: 0.3493593710805341
Epoch: 26, step: 1180, loss: 0.32366469502449036, mean loss: 0.3493587075640446
Epoch: 26, step: 1181, loss: 0.3114682734012604, mean loss: 0.34935772914039737
Epoch: 26, step: 1182, loss: 0.3340003490447998, mean loss: 0.34935733258553653
Epoch: 26, step: 1183, loss: 0.3449079394340515, mean loss: 0.3493572176972606
Epoch: 26, step: 1184, loss: 0.3088735342025757, mean loss: 0.34935617239055256
Epoch: 26, step: 1185, loss: 0.3555067479610443, mean loss: 0.34935633119704806
Epoch: 26, step: 1186, loss: 0.33688071370124817, mean loss: 0.3493560090876913
Epoch: 26, step: 1187, loss: 0.34868675470352173, mean loss: 0.349355991808584
Epoch: 26, step: 1188, loss: 0.34678271412849426, mean loss: 0.34935592537227184
Epoch: 26, step: 1189, loss: 0.3384857177734375, mean loss: 0.3493556447349093
Epoch: 26, step: 1190, loss: 0.3769252896308899, mean loss: 0.3493563564851325
Epoch: 26, step: 1191, loss: 0.3322126567363739, mean loss: 0.34935591390717535
Epoch: 26, step: 1192, loss: 0.33737385272979736, mean loss: 0.34935560458892206
Epoch: 26, step: 1193, loss: 0.3110677897930145, mean loss: 0.3493546162102036
Epoch: 26, step: 1194, loss: 0.31754592061042786, mean loss: 0.3493537951075525
Epoch: 26, step: 1195, loss: 0.32661718130111694, mean loss: 0.34935320820476967
Epoch: 26, step: 1196, loss: 0.333737850189209, mean loss: 0.3493528051341722
Epoch: 26, step: 1197, loss: 0.3599779009819031, mean loss: 0.349353079386814
Epoch: 26, step: 1198, loss: 0.3376673758029938, mean loss: 0.3493527777657835
Epoch: 26, step: 1199, loss: 0.36286187171936035, mean loss: 0.3493531264415515
Epoch: 26, step: 1200, loss: 0.39530491828918457, mean loss: 0.3493543124472773
Epoch: 26, step: 1201, loss: 0.34366148710250854, mean loss: 0.34935416552048887
Epoch: 26, step: 1202, loss: 0.31075313687324524, mean loss: 0.3493531692877832
Epoch: 26, step: 1203, loss: 0.34653955698013306, mean loss: 0.34935309667468556
Epoch: 26, step: 1204, loss: 0.3299190402030945, mean loss: 0.34935259513770467
Epoch: 26, step: 1205, loss: 0.37573859095573425, mean loss: 0.349353276066629
Epoch: 26, step: 1206, loss: 0.3610473573207855, mean loss: 0.34935357784158333
Epoch: 26, step: 1207, loss: 0.33413201570510864, mean loss: 0.34935318504734986
Epoch: 26, step: 1208, loss: 0.34970343112945557, mean loss: 0.3493531940852587
Epoch: 26, step: 1209, loss: 0.3246285915374756, mean loss: 0.3493525560968563
Epoch: 26, step: 1210, loss: 0.33652326464653015, mean loss: 0.34935222506108154
Epoch: 26, step: 1211, loss: 0.35221195220947266, mean loss: 0.3493522988490666
Epoch: 26, step: 1212, loss: 0.340224027633667, mean loss: 0.34935206332332375
Epoch: 26, step: 1213, loss: 0.35764503479003906, mean loss: 0.34935227729131657
Epoch: 26, step: 1214, loss: 0.3220144510269165, mean loss: 0.3493515719628441
Epoch: 26, step: 1215, loss: 0.31108322739601135, mean loss: 0.34935058464745283
Epoch: 26, step: 1216, loss: 0.4067325294017792, mean loss: 0.34935206505158983
Epoch: 26, step: 1217, loss: 0.311514675617218, mean loss: 0.34935108890512073
Epoch: 26, step: 1218, loss: 0.365098774433136, mean loss: 0.3493514951607131
Epoch: 26, step: 1219, loss: 0.34116223454475403, mean loss: 0.3493512839012813
Epoch: 26, step: 1220, loss: 0.3006942868232727, mean loss: 0.34935002872271614
Epoch: 26, step: 1221, loss: 0.35890278220176697, mean loss: 0.3493502751436386
Epoch: 26, step: 1222, loss: 0.32155898213386536, mean loss: 0.3493495582634825
Epoch: 26, step: 1223, loss: 0.2989789545536041, mean loss: 0.34934825898047306
Epoch: 26, step: 1224, loss: 0.3617013692855835, mean loss: 0.3493485776141831
Epoch: 26, step: 1225, loss: 0.3577701449394226, mean loss: 0.3493487948328399
Epoch: 26, step: 1226, loss: 0.37726539373397827, mean loss: 0.3493495148709844
Epoch: 26, step: 1227, loss: 0.31406286358833313, mean loss: 0.3493486047644312
Epoch: 26, step: 1228, loss: 0.3269791305065155, mean loss: 0.3493480278301146
Epoch: 26, step: 1229, loss: 0.39116764068603516, mean loss: 0.34934910637792643
Epoch: 26, step: 1230, loss: 0.35086551308631897, mean loss: 0.3493491454857719
Epoch: 26, step: 1231, loss: 0.33871719241142273, mean loss: 0.3493488712967613
Epoch: 26, step: 1232, loss: 0.36320385336875916, mean loss: 0.34934922859572903
Epoch: 26, step: 1233, loss: 0.3096679151058197, mean loss: 0.34934820530124533
Epoch: 26, step: 1234, loss: 0.3096606433391571, mean loss: 0.34934718187201913
Epoch: 26, step: 1235, loss: 0.37233206629753113, mean loss: 0.3493477745714628
Epoch: 26, step: 1236, loss: 0.34728750586509705, mean loss: 0.3493477214457387
Epoch: 26, step: 1237, loss: 0.37433338165283203, mean loss: 0.3493483657049365
Epoch: 26, step: 1238, loss: 0.3258921504020691, mean loss: 0.3493477608983124
Epoch: 26, step: 1239, loss: 0.3293013870716095, mean loss: 0.34934724402604994
Epoch: 26, step: 1240, loss: 0.31598398089408875, mean loss: 0.3493463838155786
Epoch: 26, step: 1241, loss: 0.2825687527656555, mean loss: 0.34934466212138354
Epoch: 26, step: 1242, loss: 0.31245532631874084, mean loss: 0.3493437110466471
Epoch: 26, step: 1243, loss: 0.3214116096496582, mean loss: 0.3493429909244083
Epoch: 26, step: 1244, loss: 0.3876282274723053, mean loss: 0.34934397793713223
Epoch: 26, step: 1245, loss: 0.38737207651138306, mean loss: 0.34934495829543527
Epoch: 26, step: 1246, loss: 0.32934966683387756, mean loss: 0.34934444283330585
Epoch: 26, step: 1247, loss: 0.31546902656555176, mean loss: 0.3493435695755138
Epoch: 26, step: 1248, loss: 0.3376023471355438, mean loss: 0.34934326691208384
Epoch: 26, step: 1249, loss: 0.3062988519668579, mean loss: 0.34934215734836405
Epoch: 26, step: 1250, loss: 0.32708868384361267, mean loss: 0.34934158373131274
Epoch: 26, step: 1251, loss: 0.3039150536060333, mean loss: 0.34934041282374173
Epoch: 26, step: 1252, loss: 0.30148375034332275, mean loss: 0.3493391793092308
Epoch: 26, step: 1253, loss: 0.2992156744003296, mean loss: 0.3493378873997275
Epoch: 26, step: 1254, loss: 0.37306901812553406, mean loss: 0.349338499042572
Epoch: 26, step: 1255, loss: 0.3273415267467499, mean loss: 0.34933793211029635
Epoch: 26, step: 1256, loss: 0.29745742678642273, mean loss: 0.3493365950183316
Epoch: 26, step: 1257, loss: 0.3409985303878784, mean loss: 0.3493363801308353
Epoch: 26, step: 1258, loss: 0.3300122022628784, mean loss: 0.3493358821235197
Epoch: 26, step: 1259, loss: 0.37179332971572876, mean loss: 0.3493364608640514
Epoch: 26, step: 1260, loss: 0.2968215346336365, mean loss: 0.349335107560966
Epoch: 26, step: 1261, loss: 0.31676897406578064, mean loss: 0.3493342683574022
Epoch: 26, step: 1262, loss: 0.31178346276283264, mean loss: 0.3493333007277067
Epoch: 26, step: 1263, loss: 0.35123997926712036, mean loss: 0.34933334985877607
Epoch: 26, step: 1264, loss: 0.3177710771560669, mean loss: 0.349332536586785
Epoch: 26, step: 1265, loss: 0.3228679597377777, mean loss: 0.34933185468580974
Epoch: 26, step: 1266, loss: 0.3259524405002594, mean loss: 0.34933125229436957
Epoch: 26, step: 1267, loss: 0.3597679138183594, mean loss: 0.34933152119732547
Epoch: 26, step: 1268, loss: 0.29113465547561646, mean loss: 0.3493300217804878
Epoch: 26, step: 1269, loss: 0.325229674577713, mean loss: 0.34932940086156156
Epoch: 26, step: 1270, loss: 0.3363886773586273, mean loss: 0.3493290674666497
Epoch: 26, step: 1271, loss: 0.3769857883453369, mean loss: 0.3493297799749164
Epoch: 26, step: 1272, loss: 0.3086877465248108, mean loss: 0.34932873295857175
Epoch: 26, step: 1273, loss: 0.30060654878616333, mean loss: 0.3493274778144589
Epoch: 26, step: 1274, loss: 0.3330337405204773, mean loss: 0.34932705807831693
Epoch: 26, step: 1275, loss: 0.31766965985298157, mean loss: 0.3493262425863482
Epoch: 26, step: 1276, loss: 0.3331022262573242, mean loss: 0.3493258246677905
Epoch: 26, step: 1277, loss: 0.35589873790740967, mean loss: 0.34932599397677094
Epoch: 26, step: 1278, loss: 0.34495747089385986, mean loss: 0.3493258814526723
Epoch: 26, step: 1279, loss: 0.3210947811603546, mean loss: 0.3493251542967818
Epoch: 26, step: 1280, loss: 0.35169923305511475, mean loss: 0.349325215444979
Epoch: 26, step: 1281, loss: 0.3371947407722473, mean loss: 0.3493249030132407
Epoch: 26, step: 1282, loss: 0.340194433927536, mean loss: 0.3493246678555132
Epoch: 26, step: 1283, loss: 0.30554237961769104, mean loss: 0.34932354025975143
Epoch: 26, step: 1284, loss: 0.32128721475601196, mean loss: 0.34932281821371614
Epoch: 26, step: 1285, loss: 0.3328688144683838, mean loss: 0.34932239446909225
Epoch: 26, step: 1286, loss: 0.3270975649356842, mean loss: 0.3493218221214954
Epoch: 26, step: 1287, loss: 0.34198087453842163, mean loss: 0.3493216330777278
Epoch: 26, step: 1288, loss: 0.3079755902290344, mean loss: 0.3493205683636226
Epoch: 26, step: 1289, loss: 0.33815014362335205, mean loss: 0.3493202807181382
Epoch: 26, step: 1290, loss: 0.3216891586780548, mean loss: 0.349319569217635
Epoch: 26, step: 1291, loss: 0.3186090588569641, mean loss: 0.34931877844334414
Epoch: 26, step: 1292, loss: 0.3310064375400543, mean loss: 0.34931830692543847
Epoch: 26, step: 1293, loss: 0.3194015622138977, mean loss: 0.34931753662973036
Epoch: 26, step: 1294, loss: 0.31069841980934143, mean loss: 0.349316542291132
Epoch: 26, step: 1295, loss: 0.34550148248672485, mean loss: 0.3493164440661113
Epoch: 26, step: 1296, loss: 0.3359888792037964, mean loss: 0.3493161009347588
Epoch: 26, step: 1297, loss: 0.3476124703884125, mean loss: 0.3493160570742329
Epoch: 26, step: 1298, loss: 0.34162381291389465, mean loss: 0.34931585903998835
Epoch: 26, step: 1299, loss: 0.3208766579627991, mean loss: 0.34931512690114896
Epoch: 26, step: 1300, loss: 0.30492499470710754, mean loss: 0.34931398415093157
Epoch: 26, step: 1301, loss: 0.34782469272613525, mean loss: 0.3493139458125846
Epoch: 26, step: 1302, loss: 0.33330193161964417, mean loss: 0.34931353363109846
Epoch: 26, step: 1303, loss: 0.3212079107761383, mean loss: 0.34931281015439813
Epoch: 26, step: 1304, loss: 0.3265843689441681, mean loss: 0.34931222510867727
Epoch: 26, step: 1305, loss: 0.319347083568573, mean loss: 0.3493114538051627
Epoch: 26, step: 1306, loss: 0.31962957978248596, mean loss: 0.34931068981262653
Epoch: 26, step: 1307, loss: 0.3143451511859894, mean loss: 0.34930978984509264
Epoch: 26, step: 1308, loss: 0.32457607984542847, mean loss: 0.34930915324791867
Epoch: 26, step: 1309, loss: 0.32343339920043945, mean loss: 0.34930848727391217
Epoch: 26, step: 1310, loss: 0.33193400502204895, mean loss: 0.3493080401118416
Epoch: 26, step: 1311, loss: 0.3138684928417206, mean loss: 0.3493071280378435
Epoch: 26, step: 1312, loss: 0.3564026653766632, mean loss: 0.34930731064425513
Epoch: 26, step: 1313, loss: 0.32798832654953003, mean loss: 0.3493067620060315
Epoch: 26, step: 1314, loss: 0.41236230731010437, mean loss: 0.3493083846814813
Epoch: 26, step: 1315, loss: 0.31518056988716125, mean loss: 0.34930750645670533
Epoch: 26, step: 1316, loss: 0.33674412965774536, mean loss: 0.3493071831665996
Epoch: 26, step: 1317, loss: 0.32382211089134216, mean loss: 0.349306527382742
Epoch: 26, step: 1318, loss: 0.3763769567012787, mean loss: 0.3493072239432061
Epoch: 26, step: 1319, loss: 0.3001053035259247, mean loss: 0.3493059579407252
Epoch: 26, step: 1320, loss: 0.3256051242351532, mean loss: 0.3493053481161091
Epoch: 26, step: 1321, loss: 0.3584139049053192, mean loss: 0.3493055824740772
Epoch: 26, step: 1322, loss: 0.40098515152931213, mean loss: 0.34930691212568543
Epoch: 26, step: 1323, loss: 0.3694312274456024, mean loss: 0.34930742988619073
Epoch: 26, step: 1324, loss: 0.34360983967781067, mean loss: 0.34930728330176075
Epoch: 26, step: 1325, loss: 0.3172357380390167, mean loss: 0.3493064582041209
Epoch: 26, step: 1326, loss: 0.34241658449172974, mean loss: 0.3493062809544048
Epoch: 26, step: 1327, loss: 0.34061071276664734, mean loss: 0.34930605725693137
Epoch: 26, step: 1328, loss: 0.31941360235214233, mean loss: 0.3493052882796231
Epoch: 26, step: 1329, loss: 0.3246711194515228, mean loss: 0.34930465458695376
Epoch: 26, step: 1330, loss: 0.3138785660266876, mean loss: 0.3493037433049329
Epoch: 26, step: 1331, loss: 0.34581315517425537, mean loss: 0.34930365351719417
Epoch: 26, step: 1332, loss: 0.31796616315841675, mean loss: 0.3493028474495871
Epoch: 26, step: 1333, loss: 0.30108922719955444, mean loss: 0.34930160732354537
Epoch: 26, step: 1334, loss: 0.32486164569854736, mean loss: 0.34930097870754123
Epoch: 26, step: 1335, loss: 0.33453965187072754, mean loss: 0.34930059904378513
Epoch: 26, step: 1336, loss: 0.3274783790111542, mean loss: 0.34930003778712937
Epoch: 26, step: 1337, loss: 0.3185172975063324, mean loss: 0.34929924609070734
Epoch: 26, step: 1338, loss: 0.3206779658794403, mean loss: 0.34929851000346585
Epoch: 26, step: 1339, loss: 0.3490191102027893, mean loss: 0.34929850281799624
Epoch: 26, step: 1340, loss: 0.31224676966667175, mean loss: 0.34929754996385837
Epoch: 26, step: 1341, loss: 0.3426663875579834, mean loss: 0.3492973794355858
Epoch: 26, step: 1342, loss: 0.3388602137565613, mean loss: 0.34929711103828903
Epoch: 26, step: 1343, loss: 0.3152739703655243, mean loss: 0.34929623613753114
Epoch: 26, step: 1344, loss: 0.35526618361473083, mean loss: 0.3492963896500277
Epoch: 26, step: 1345, loss: 0.3224869668483734, mean loss: 0.3492957002845661
Epoch: 26, step: 1346, loss: 0.3208651840686798, mean loss: 0.34929496925383363
Epoch: 26, step: 1347, loss: 0.4166683554649353, mean loss: 0.3492967015737506
Epoch: 26, step: 1348, loss: 0.30696427822113037, mean loss: 0.34929561314078444
Epoch: 26, step: 1349, loss: 0.32540133595466614, mean loss: 0.34929499879725623
Epoch: 26, step: 1350, loss: 0.3183192014694214, mean loss: 0.34929420240190134
Epoch: 26, step: 1351, loss: 0.37350764870643616, mean loss: 0.34929482491954594
Epoch: 26, step: 1352, loss: 0.3640137016773224, mean loss: 0.3492952033260235
Epoch: 26, step: 1353, loss: 0.30985790491104126, mean loss: 0.3492941894615982
Epoch: 26, step: 1354, loss: 0.3507605493068695, mean loss: 0.3492942271581931
Epoch: 26, step: 1355, loss: 0.3262067139148712, mean loss: 0.3492936336488552
Epoch: 26, step: 1356, loss: 0.3417809307575226, mean loss: 0.3492934405252108
Epoch: 26, step: 1357, loss: 0.3308597207069397, mean loss: 0.3492929666750278
Epoch: 26, step: 1358, loss: 0.40918654203414917, mean loss: 0.349294506236896
Epoch: 26, step: 1359, loss: 0.3484412133693695, mean loss: 0.34929448430360205
Epoch: 26, step: 1360, loss: 0.3511451184749603, mean loss: 0.3492945318716311
Epoch: 26, step: 1361, loss: 0.3521423935890198, mean loss: 0.34929460507015364
Epoch: 26, step: 1362, loss: 0.34221869707107544, mean loss: 0.3492944232029318
Epoch: 26, step: 1363, loss: 0.3299464285373688, mean loss: 0.34929392592744435
Epoch: 26, step: 1364, loss: 0.3199109137058258, mean loss: 0.3492931707548051
Epoch: 26, step: 1365, loss: 0.3042529225349426, mean loss: 0.3492920132053777
Epoch: 26, step: 1366, loss: 0.3751794993877411, mean loss: 0.3492926785053233
Epoch: 26, step: 1367, loss: 0.32429957389831543, mean loss: 0.3492920362071992
Epoch: 26, step: 1368, loss: 0.30587998032569885, mean loss: 0.3492909205888742
Epoch: 26, step: 1369, loss: 0.3356205224990845, mean loss: 0.3492905692911898
Epoch: 26, step: 1370, loss: 0.3630489110946655, mean loss: 0.3492909228397393
Epoch: 26, step: 1371, loss: 0.33388105034828186, mean loss: 0.3492905268619283
Epoch: 26, step: 1372, loss: 0.3318910598754883, mean loss: 0.34929007977024634
Epoch: 26, step: 1373, loss: 0.3444395661354065, mean loss: 0.3492899551360505
Epoch: 26, step: 1374, loss: 0.29155871272087097, mean loss: 0.3492884717669399
Epoch: 26, step: 1375, loss: 0.32136890292167664, mean loss: 0.3492877544090559
Epoch: 26, step: 1376, loss: 0.34906628727912903, mean loss: 0.3492877487188853
Epoch: 26, step: 1377, loss: 0.3371909558773041, mean loss: 0.34928743792311834
Epoch: 26, step: 1378, loss: 0.3453163206577301, mean loss: 0.34928733589816485
Epoch: 26, step: 1379, loss: 0.31442537903785706, mean loss: 0.3492864402564821
Epoch: 26, step: 1380, loss: 0.3328836262226105, mean loss: 0.3492860188611312
Epoch: 26, step: 1381, loss: 0.3351866900920868, mean loss: 0.34928565665261324
Epoch: 26, step: 1382, loss: 0.39509788155555725, mean loss: 0.3492868335279158
Epoch: 26, step: 1383, loss: 0.2926543951034546, mean loss: 0.34928537872832616
Epoch: 26, step: 1384, loss: 0.3274136185646057, mean loss: 0.34928481689113117
Epoch: 26, step: 1385, loss: 0.34583204984664917, mean loss: 0.34928472819945267
Epoch: 26, step: 1386, loss: 0.354073166847229, mean loss: 0.3492848511975428
Epoch: 26, step: 1387, loss: 0.30027392506599426, mean loss: 0.34928359231214956
Epoch: 26, step: 1388, loss: 0.3215794563293457, mean loss: 0.349282880727222
Epoch: 26, step: 1389, loss: 0.33288708329200745, mean loss: 0.34928245960949883
Epoch: 26, step: 1390, loss: 0.3171755075454712, mean loss: 0.3492816349799351
Epoch: 26, step: 1391, loss: 0.38034409284591675, mean loss: 0.3492824327623952
Epoch: 26, step: 1392, loss: 0.35240092873573303, mean loss: 0.3492825128532079
Epoch: 26, step: 1393, loss: 0.3387346565723419, mean loss: 0.34928224196471125
Epoch: 26, step: 1394, loss: 0.3247809410095215, mean loss: 0.34928161274205644
Epoch: 26, step: 1395, loss: 0.29456326365470886, mean loss: 0.3492802075456238
Epoch: 26, step: 1396, loss: 0.3389236330986023, mean loss: 0.34927994159008985
Epoch: 26, step: 1397, loss: 0.2993546426296234, mean loss: 0.34927865954759174
Epoch: 26, step: 1398, loss: 0.3506506681442261, mean loss: 0.3492786947787911
Epoch: 26, step: 1399, loss: 0.3170635998249054, mean loss: 0.3492778675629182
Epoch: 26, step: 1400, loss: 0.3260060250759125, mean loss: 0.3492772700063002
Epoch: 26, step: 1401, loss: 0.31123337149620056, mean loss: 0.3492762931691793
Epoch: 26, step: 1402, loss: 0.38791754841804504, mean loss: 0.34927728531890195
Epoch: 26, step: 1403, loss: 0.323623925447464, mean loss: 0.3492766266622348
Epoch: 26, step: 1404, loss: 0.31627845764160156, mean loss: 0.3492757794474406
Epoch: 26, step: 1405, loss: 0.33130162954330444, mean loss: 0.3492753179801773
Epoch: 26, step: 1406, loss: 0.32843324542045593, mean loss: 0.34927478289577485
Epoch: 26, step: 1407, loss: 0.31922903656959534, mean loss: 0.34927401154266524
Epoch: 26, step: 1408, loss: 0.3159705102443695, mean loss: 0.3492731565763905
Epoch: 26, step: 1409, loss: 0.32640424370765686, mean loss: 0.34927256950156205
Epoch: 26, step: 1410, loss: 0.3418126106262207, mean loss: 0.3492723779996014
Epoch: 26, step: 1411, loss: 0.31201958656311035, mean loss: 0.3492714217209425
Epoch: 26, step: 1412, loss: 0.3570687174797058, mean loss: 0.34927162187228267
Epoch: 26, step: 1413, loss: 0.3373863399028778, mean loss: 0.34927131679291595
Epoch: 26, step: 1414, loss: 0.34921497106552124, mean loss: 0.34927131534663325
Epoch: 26, step: 1415, loss: 0.32746991515159607, mean loss: 0.3492707557624393
Epoch: 26, step: 1416, loss: 0.30358046293258667, mean loss: 0.34926958304375066
Epoch: 26, step: 1417, loss: 0.33857735991477966, mean loss: 0.3492693086167929
Epoch: 26, step: 1418, loss: 0.3629304766654968, mean loss: 0.3492696592357917
Epoch: 26, step: 1419, loss: 0.39215338230133057, mean loss: 0.34927075983437156
Epoch: 26, step: 1420, loss: 0.3339746296405792, mean loss: 0.34927036727360694
Epoch: 26, step: 1421, loss: 0.4077022671699524, mean loss: 0.34927186683476014
Epoch: 26, step: 1422, loss: 0.3133465051651001, mean loss: 0.3492709448915346
Epoch: 26, step: 1423, loss: 0.31638103723526, mean loss: 0.34927010086803695
Epoch: 26, step: 1424, loss: 0.3200191557407379, mean loss: 0.34926935024715555
Epoch: 26, step: 1425, loss: 0.3185204565525055, mean loss: 0.3492685612070299
Epoch: 26, step: 1426, loss: 0.33316564559936523, mean loss: 0.3492681480045048
Epoch: 26, step: 1427, loss: 0.3362213671207428, mean loss: 0.3492678132313116
Epoch: 26, step: 1428, loss: 0.3419909179210663, mean loss: 0.3492676265149872
Epoch: 26, step: 1429, loss: 0.346475213766098, mean loss: 0.3492675548668949
Epoch: 26, step: 1430, loss: 0.3343821167945862, mean loss: 0.34926717294417337
Epoch: 26, step: 1431, loss: 0.3011602759361267, mean loss: 0.34926593867444305
Epoch: 26, step: 1432, loss: 0.3310362994670868, mean loss: 0.3492654709719722
Epoch: 26, step: 1433, loss: 0.3534107208251953, mean loss: 0.3492655773204214
Epoch: 26, step: 1434, loss: 0.32124951481819153, mean loss: 0.34926485857282646
Epoch: 26, step: 1435, loss: 0.3258450925350189, mean loss: 0.34926425775789477
Epoch: 26, step: 1436, loss: 0.3251793384552002, mean loss: 0.34926363989485115
Epoch: 26, step: 1437, loss: 0.30842268466949463, mean loss: 0.3492625922073229
Epoch: 26, step: 1438, loss: 0.3181766867637634, mean loss: 0.3492617947852301
Epoch: 26, step: 1439, loss: 0.2977728843688965, mean loss: 0.3492604740149034
Epoch: 26, step: 1440, loss: 0.3517515957355499, mean loss: 0.34926053791439604
Epoch: 26, step: 1441, loss: 0.3248763084411621, mean loss: 0.34925991245321836
Epoch: 26, step: 1442, loss: 0.35030749440193176, mean loss: 0.34925993932325067
Epoch: 26, step: 1443, loss: 0.3633559048175812, mean loss: 0.3492603008695083
Valid: 26, mean loss: 0.18651171525319415
Epoch: 27, step: 0, loss: 0.3647027015686035, mean loss: 0.34926069694021283
Epoch: 27, step: 1, loss: 0.3055919110774994, mean loss: 0.3492595769405754
Epoch: 27, step: 2, loss: 0.3029062747955322, mean loss: 0.34925838812002336
Epoch: 27, step: 3, loss: 0.31952816247940063, mean loss: 0.3492576256501413
Epoch: 27, step: 4, loss: 0.33002835512161255, mean loss: 0.3492571325034091
Epoch: 27, step: 5, loss: 0.32135993242263794, mean loss: 0.34925641708052146
Epoch: 27, step: 6, loss: 0.3462074100971222, mean loss: 0.3492563388908309
Epoch: 27, step: 7, loss: 0.30677860975265503, mean loss: 0.34925524960656745
Epoch: 27, step: 8, loss: 0.3376237452030182, mean loss: 0.3492549513399212
Epoch: 27, step: 9, loss: 0.3442290723323822, mean loss: 0.3492548224646197
Epoch: 27, step: 10, loss: 0.31023040413856506, mean loss: 0.34925382181285103
Epoch: 27, step: 11, loss: 0.3452844023704529, mean loss: 0.3492537200328653
Epoch: 27, step: 12, loss: 0.37195339798927307, mean loss: 0.349254302060966
Epoch: 27, step: 13, loss: 0.34230780601501465, mean loss: 0.3492541239548164
Epoch: 27, step: 14, loss: 0.3233618438243866, mean loss: 0.34925346010126335
Epoch: 27, step: 15, loss: 0.31164640188217163, mean loss: 0.34925249591661
Epoch: 27, step: 16, loss: 0.3308127522468567, mean loss: 0.34925202316327913
Epoch: 27, step: 17, loss: 0.36193275451660156, mean loss: 0.349252348260222
Epoch: 27, step: 18, loss: 0.322405070066452, mean loss: 0.34925165999200875
Epoch: 27, step: 19, loss: 0.2941262722015381, mean loss: 0.34925024681041034
Epoch: 27, step: 20, loss: 0.35071396827697754, mean loss: 0.3492502843330709
Epoch: 27, step: 21, loss: 0.33076807856559753, mean loss: 0.3492498105518413
Epoch: 27, step: 22, loss: 0.33529916405677795, mean loss: 0.3492494529438206
Epoch: 27, step: 23, loss: 0.3140217661857605, mean loss: 0.34924854994764615
Epoch: 27, step: 24, loss: 0.31696754693984985, mean loss: 0.3492477225054344
Epoch: 27, step: 25, loss: 0.32147982716560364, mean loss: 0.34924701076361503
Epoch: 27, step: 26, loss: 0.3257187604904175, mean loss: 0.3492464077070913
Epoch: 27, step: 27, loss: 0.35021770000457764, mean loss: 0.3492464326018088
Epoch: 27, step: 28, loss: 0.33643341064453125, mean loss: 0.3492461042059312
Epoch: 27, step: 29, loss: 0.32868584990501404, mean loss: 0.3492455772631279
Epoch: 27, step: 30, loss: 0.3333527743816376, mean loss: 0.34924516995379445
Epoch: 27, step: 31, loss: 0.33854520320892334, mean loss: 0.34924489573629713
Epoch: 27, step: 32, loss: 0.29182571172714233, mean loss: 0.3492434242418708
Epoch: 27, step: 33, loss: 0.34587299823760986, mean loss: 0.34924333786941414
Epoch: 27, step: 34, loss: 0.32161930203437805, mean loss: 0.34924262997827726
Epoch: 27, step: 35, loss: 0.3532082140445709, mean loss: 0.34924273159738517
Epoch: 27, step: 36, loss: 0.3796445429325104, mean loss: 0.34924351063162823
Epoch: 27, step: 37, loss: 0.3647943139076233, mean loss: 0.3492439091045252
Epoch: 27, step: 38, loss: 0.3367692828178406, mean loss: 0.34924358946360257
Epoch: 27, step: 39, loss: 0.3453356623649597, mean loss: 0.3492434893322328
Epoch: 27, step: 40, loss: 0.39578497409820557, mean loss: 0.3492446818169177
Epoch: 27, step: 41, loss: 0.3586169481277466, mean loss: 0.34924492194672324
Epoch: 27, step: 42, loss: 0.33240818977355957, mean loss: 0.3492444905785243
Epoch: 27, step: 43, loss: 0.3236047923564911, mean loss: 0.34924383368935075
Epoch: 27, step: 44, loss: 0.292206346988678, mean loss: 0.34924237242614525
Epoch: 27, step: 45, loss: 0.33205148577690125, mean loss: 0.34924193201812537
Epoch: 27, step: 46, loss: 0.333102285861969, mean loss: 0.34924151855210367
Epoch: 27, step: 47, loss: 0.3242228031158447, mean loss: 0.3492408776381925
Epoch: 27, step: 48, loss: 0.3720610439777374, mean loss: 0.3492414622160632
Epoch: 27, step: 49, loss: 0.4111047089099884, mean loss: 0.3492430469090981
Epoch: 27, step: 50, loss: 0.38543346524238586, mean loss: 0.34924397394151013
Epoch: 27, step: 51, loss: 0.3734894096851349, mean loss: 0.3492445949823847
Epoch: 27, step: 52, loss: 0.31833910942077637, mean loss: 0.3492438033662488
Epoch: 27, step: 53, loss: 0.34732386469841003, mean loss: 0.3492437541900112
Epoch: 27, step: 54, loss: 0.3024667799472809, mean loss: 0.3492425561013847
Epoch: 27, step: 55, loss: 0.3576146960258484, mean loss: 0.34924277052972
Epoch: 27, step: 56, loss: 0.3158176839351654, mean loss: 0.3492419144639858
Epoch: 27, step: 57, loss: 0.36948004364967346, mean loss: 0.3492424327790292
Epoch: 27, step: 58, loss: 0.32621029019355774, mean loss: 0.3492418429221238
Epoch: 27, step: 59, loss: 0.33814114332199097, mean loss: 0.349241558638688
Epoch: 27, step: 60, loss: 0.3097955882549286, mean loss: 0.34924054847273284
Epoch: 27, step: 61, loss: 0.31083980202674866, mean loss: 0.3492395650989442
Epoch: 27, step: 62, loss: 0.3809202313423157, mean loss: 0.3492403763628361
Epoch: 27, step: 63, loss: 0.3116641044616699, mean loss: 0.34923941415163307
Epoch: 27, step: 64, loss: 0.36122190952301025, mean loss: 0.34923972097813477
Epoch: 27, step: 65, loss: 0.31942400336265564, mean loss: 0.3492389575296374
Epoch: 27, step: 66, loss: 0.38162586092948914, mean loss: 0.34923978679358314
Epoch: 27, step: 67, loss: 0.34295904636383057, mean loss: 0.34923962597986874
Epoch: 27, step: 68, loss: 0.3109324276447296, mean loss: 0.34923864517749437
Epoch: 27, step: 69, loss: 0.3280836045742035, mean loss: 0.349238103546059
Epoch: 27, step: 70, loss: 0.3105933964252472, mean loss: 0.3492371141529071
Epoch: 27, step: 71, loss: 0.3527347147464752, mean loss: 0.3492372036972131
Epoch: 27, step: 72, loss: 0.31696024537086487, mean loss: 0.3492363773753492
Epoch: 27, step: 73, loss: 0.31277379393577576, mean loss: 0.34923544392126493
Epoch: 27, step: 74, loss: 0.3484976887702942, mean loss: 0.3492354250349748
Epoch: 27, step: 75, loss: 0.3408414423465729, mean loss: 0.34923521015726927
Epoch: 27, step: 76, loss: 0.3196188509464264, mean loss: 0.3492344520269938
Epoch: 27, step: 77, loss: 0.3480585217475891, mean loss: 0.3492344219258757
Epoch: 27, step: 78, loss: 0.31372562050819397, mean loss: 0.3492335130052671
Epoch: 27, step: 79, loss: 0.37768736481666565, mean loss: 0.3492342413213266
Epoch: 27, step: 80, loss: 0.3523339629173279, mean loss: 0.3492343206609973
Epoch: 27, step: 81, loss: 0.33382052183151245, mean loss: 0.34923392614349463
Epoch: 27, step: 82, loss: 0.3413243591785431, mean loss: 0.34923372370263145
Epoch: 27, step: 83, loss: 0.37754204869270325, mean loss: 0.3492344482195487
Epoch: 27, step: 84, loss: 0.30037054419517517, mean loss: 0.3492331976397615
Epoch: 27, step: 85, loss: 0.314301997423172, mean loss: 0.34923230366422237
Epoch: 27, step: 86, loss: 0.3671503961086273, mean loss: 0.34923276222065086
Epoch: 27, step: 87, loss: 0.35473039746284485, mean loss: 0.3492329029114903
Epoch: 27, step: 88, loss: 0.36018696427345276, mean loss: 0.3492331832314064
Epoch: 27, step: 89, loss: 0.36609482765197754, mean loss: 0.34923361471828956
Epoch: 27, step: 90, loss: 0.35166794061660767, mean loss: 0.3492336770107202
Epoch: 27, step: 91, loss: 0.3144381046295166, mean loss: 0.34923278664295204
Epoch: 27, step: 92, loss: 0.3070495128631592, mean loss: 0.34923170726233793
Epoch: 27, step: 93, loss: 0.2971283793449402, mean loss: 0.34923037408266655
Epoch: 27, step: 94, loss: 0.3505951166152954, mean loss: 0.34923040900174984
Epoch: 27, step: 95, loss: 0.3212846517562866, mean loss: 0.3492296939839102
Epoch: 27, step: 96, loss: 0.3177592158317566, mean loss: 0.34922888880345343
Epoch: 27, step: 97, loss: 0.3817763924598694, mean loss: 0.3492297215185856
Epoch: 27, step: 98, loss: 0.34618282318115234, mean loss: 0.34922964356687947
Epoch: 27, step: 99, loss: 0.36759188771247864, mean loss: 0.3492301133336658
Epoch: 27, step: 100, loss: 0.3063814640045166, mean loss: 0.3492290171518927
Epoch: 27, step: 101, loss: 0.3261546194553375, mean loss: 0.34922842686287514
Epoch: 27, step: 102, loss: 0.35973912477493286, mean loss: 0.34922869574056853
Epoch: 27, step: 103, loss: 0.3016243875026703, mean loss: 0.34922747798992293
Epoch: 27, step: 104, loss: 0.3607483506202698, mean loss: 0.3492277726941572
Epoch: 27, step: 105, loss: 0.3506091237068176, mean loss: 0.3492278080282497
Epoch: 27, step: 106, loss: 0.3729860484600067, mean loss: 0.3492284157335939
Epoch: 27, step: 107, loss: 0.3159962296485901, mean loss: 0.34922756571860303
Epoch: 27, step: 108, loss: 0.36345866322517395, mean loss: 0.34922792971321914
Epoch: 27, step: 109, loss: 0.31741297245025635, mean loss: 0.34922711598982503
Epoch: 27, step: 110, loss: 0.3481493294239044, mean loss: 0.3492270884242462
Epoch: 27, step: 111, loss: 0.3104152977466583, mean loss: 0.34922609579532865
Epoch: 27, step: 112, loss: 0.32823705673217773, mean loss: 0.3492255590049892
Epoch: 27, step: 113, loss: 0.3348030149936676, mean loss: 0.3492251901608377
Epoch: 27, step: 114, loss: 0.32513755559921265, mean loss: 0.34922457415606667
Epoch: 27, step: 115, loss: 0.334532767534256, mean loss: 0.3492241984449726
Epoch: 27, step: 116, loss: 0.34918496012687683, mean loss: 0.34922419744156336
Epoch: 27, step: 117, loss: 0.33430156111717224, mean loss: 0.3492238158470171
Epoch: 27, step: 118, loss: 0.31573447585105896, mean loss: 0.3492229594954689
Epoch: 27, step: 119, loss: 0.34816664457321167, mean loss: 0.34922293248526837
Epoch: 27, step: 120, loss: 0.3841559588909149, mean loss: 0.34922382570745264
Epoch: 27, step: 121, loss: 0.3196321129798889, mean loss: 0.3492230690796662
Epoch: 27, step: 122, loss: 0.31186389923095703, mean loss: 0.3492221138709053
Epoch: 27, step: 123, loss: 0.3337332308292389, mean loss: 0.3492217178573278
Epoch: 27, step: 124, loss: 0.3492184281349182, mean loss: 0.34922171777321964
Epoch: 27, step: 125, loss: 0.3255610466003418, mean loss: 0.3492211128575584
Epoch: 27, step: 126, loss: 0.31278693675994873, mean loss: 0.3492201813945366
Epoch: 27, step: 127, loss: 0.30822888016700745, mean loss: 0.3492191334524866
Epoch: 27, step: 128, loss: 0.3194887042045593, mean loss: 0.3492183734139037
Epoch: 27, step: 129, loss: 0.2834409475326538, mean loss: 0.3492166919008948
Epoch: 27, step: 130, loss: 0.34655484557151794, mean loss: 0.34921662385604885
Epoch: 27, step: 131, loss: 0.2904319763183594, mean loss: 0.34921512118100956
Epoch: 27, step: 132, loss: 0.3787301778793335, mean loss: 0.34921587563658835
Epoch: 27, step: 133, loss: 0.30450642108917236, mean loss: 0.3492147328152973
Epoch: 27, step: 134, loss: 0.32466593384742737, mean loss: 0.3492141053378807
Epoch: 27, step: 135, loss: 0.3021923005580902, mean loss: 0.34921290347189615
Epoch: 27, step: 136, loss: 0.2978610098361969, mean loss: 0.3492115909634326
Epoch: 27, step: 137, loss: 0.2982819676399231, mean loss: 0.3492102892810904
Epoch: 27, step: 138, loss: 0.3155357539653778, mean loss: 0.3492094286340866
Epoch: 27, step: 139, loss: 0.32370829582214355, mean loss: 0.34920877689791785
Epoch: 27, step: 140, loss: 0.30710336565971375, mean loss: 0.349207700831286
Epoch: 27, step: 141, loss: 0.3315953016281128, mean loss: 0.3492072507316386
Epoch: 27, step: 142, loss: 0.3264519274234772, mean loss: 0.3492066692151093
Epoch: 27, step: 143, loss: 0.32464900612831116, mean loss: 0.34920604165548835
Epoch: 27, step: 144, loss: 0.34240323305130005, mean loss: 0.3492058678173312
Epoch: 27, step: 145, loss: 0.32731595635414124, mean loss: 0.3492053084594464
Epoch: 27, step: 146, loss: 0.33993998169898987, mean loss: 0.34920507170649484
Epoch: 27, step: 147, loss: 0.3606966733932495, mean loss: 0.3492053653389991
Epoch: 27, step: 148, loss: 0.3264349102973938, mean loss: 0.34920478352498574
Epoch: 27, step: 149, loss: 0.3393031060695648, mean loss: 0.3492045305310296
Epoch: 27, step: 150, loss: 0.3432893455028534, mean loss: 0.3492043793982713
Epoch: 27, step: 151, loss: 0.3055098056793213, mean loss: 0.3492032630320547
Epoch: 27, step: 152, loss: 0.3461352586746216, mean loss: 0.3492031846486624
Epoch: 27, step: 153, loss: 0.3624710440635681, mean loss: 0.3492035236159971
Epoch: 27, step: 154, loss: 0.30819272994995117, mean loss: 0.3492024758988148
Epoch: 27, step: 155, loss: 0.3104025423526764, mean loss: 0.3492014846885771
Epoch: 27, step: 156, loss: 0.34981048107147217, mean loss: 0.34920150024602714
Epoch: 27, step: 157, loss: 0.33497703075408936, mean loss: 0.3492011368763472
Epoch: 27, step: 158, loss: 0.3329644501209259, mean loss: 0.34920072211437936
Epoch: 27, step: 159, loss: 0.3352121412754059, mean loss: 0.34920036478882405
Epoch: 27, step: 160, loss: 0.3124653697013855, mean loss: 0.34919942645080554
Epoch: 27, step: 161, loss: 0.32584425806999207, mean loss: 0.34919882989478046
Epoch: 27, step: 162, loss: 0.34231889247894287, mean loss: 0.3491986541665126
Epoch: 27, step: 163, loss: 0.3190934360027313, mean loss: 0.34919788523470413
Epoch: 27, step: 164, loss: 0.35922491550445557, mean loss: 0.3491981413333497
Epoch: 27, step: 165, loss: 0.3288547992706299, mean loss: 0.3491976217608395
Epoch: 27, step: 166, loss: 0.3098473846912384, mean loss: 0.34919661677457803
Epoch: 27, step: 167, loss: 0.3617834150791168, mean loss: 0.34919693822718567
Epoch: 27, step: 168, loss: 0.36195430159568787, mean loss: 0.3491972640275118
Epoch: 27, step: 169, loss: 0.3074386715888977, mean loss: 0.3491961976147114
Epoch: 27, step: 170, loss: 0.3172951340675354, mean loss: 0.34919538296000757
Epoch: 27, step: 171, loss: 0.3322427272796631, mean loss: 0.3491949500525591
Epoch: 27, step: 172, loss: 0.34048372507095337, mean loss: 0.3491947276061205
Epoch: 27, step: 173, loss: 0.3258611261844635, mean loss: 0.34919413178360326
Epoch: 27, step: 174, loss: 0.30802038311958313, mean loss: 0.34919308044053293
Epoch: 27, step: 175, loss: 0.34885549545288086, mean loss: 0.3491930718207549
Epoch: 27, step: 176, loss: 0.38041940331459045, mean loss: 0.34919386912272077
Epoch: 27, step: 177, loss: 0.33882224559783936, mean loss: 0.3491936043108042
Epoch: 27, step: 178, loss: 0.2903771698474884, mean loss: 0.3491921026273854
Epoch: 27, step: 179, loss: 0.341935396194458, mean loss: 0.34919191735608146
Epoch: 27, step: 180, loss: 0.3394313454627991, mean loss: 0.349191668164836
Epoch: 27, step: 181, loss: 0.3088383972644806, mean loss: 0.349190637956235
Epoch: 27, step: 182, loss: 0.31052958965301514, mean loss: 0.34918965097483795
Epoch: 27, step: 183, loss: 0.3446008563041687, mean loss: 0.34918953383007456
Epoch: 27, step: 184, loss: 0.33661240339279175, mean loss: 0.34918921276376774
Epoch: 27, step: 185, loss: 0.3280380964279175, mean loss: 0.34918867283635835
Epoch: 27, step: 186, loss: 0.33560195565223694, mean loss: 0.34918832601524324
Epoch: 27, step: 187, loss: 0.32705333828926086, mean loss: 0.3491877610012621
Epoch: 27, step: 188, loss: 0.30705681443214417, mean loss: 0.34918668560124244
Epoch: 27, step: 189, loss: 0.3163665533065796, mean loss: 0.34918584788282153
Epoch: 27, step: 190, loss: 0.350355863571167, mean loss: 0.3491858777461587
Epoch: 27, step: 191, loss: 0.3012089729309082, mean loss: 0.3491846532207678
Epoch: 27, step: 192, loss: 0.33113938570022583, mean loss: 0.34918419265907924
Epoch: 27, step: 193, loss: 0.3577459752559662, mean loss: 0.34918441117223825
Epoch: 27, step: 194, loss: 0.3142058551311493, mean loss: 0.34918351847499607
Epoch: 27, step: 195, loss: 0.3567954897880554, mean loss: 0.3491837127372284
Epoch: 27, step: 196, loss: 0.34086379408836365, mean loss: 0.3491835004131593
Epoch: 27, step: 197, loss: 0.32196980714797974, mean loss: 0.34918280593826356
Epoch: 27, step: 198, loss: 0.325382798910141, mean loss: 0.3491821985938119
Epoch: 27, step: 199, loss: 0.3107694387435913, mean loss: 0.3491812183764022
Epoch: 27, step: 200, loss: 0.36093223094940186, mean loss: 0.3491815182312741
Epoch: 27, step: 201, loss: 0.3041346073150635, mean loss: 0.3491803687821565
Epoch: 27, step: 202, loss: 0.3372180461883545, mean loss: 0.34918006355078723
Epoch: 27, step: 203, loss: 0.3280043303966522, mean loss: 0.349179523243246
Epoch: 27, step: 204, loss: 0.30106455087661743, mean loss: 0.3491782956012598
Epoch: 27, step: 205, loss: 0.31577983498573303, mean loss: 0.3491774434692851
Epoch: 27, step: 206, loss: 0.36004891991615295, mean loss: 0.3491777208382466
Epoch: 27, step: 207, loss: 0.3101634979248047, mean loss: 0.3491767254758904
Epoch: 27, step: 208, loss: 0.3381500542163849, mean loss: 0.3491764441617271
Epoch: 27, step: 209, loss: 0.31068095564842224, mean loss: 0.3491754620838529
Epoch: 27, step: 210, loss: 0.3786429166793823, mean loss: 0.3491762138238105
Epoch: 27, step: 211, loss: 0.35283154249191284, mean loss: 0.34917630707199077
Epoch: 27, step: 212, loss: 0.35528430342674255, mean loss: 0.3491764628842495
Epoch: 27, step: 213, loss: 0.34450966119766235, mean loss: 0.34917634383925983
Epoch: 27, step: 214, loss: 0.3443472683429718, mean loss: 0.34917622065798554
Epoch: 27, step: 215, loss: 0.32247138023376465, mean loss: 0.34917553948156416
Epoch: 27, step: 216, loss: 0.2984321117401123, mean loss: 0.34917424517145723
Epoch: 27, step: 217, loss: 0.30726057291030884, mean loss: 0.3491731761087561
Epoch: 27, step: 218, loss: 0.3083675503730774, mean loss: 0.3491721353347684
Epoch: 27, step: 219, loss: 0.3300873041152954, mean loss: 0.3491716485761676
Epoch: 27, step: 220, loss: 0.3397611081600189, mean loss: 0.34917140856646534
Epoch: 27, step: 221, loss: 0.3397657871246338, mean loss: 0.34917116868833625
Epoch: 27, step: 222, loss: 0.29581594467163086, mean loss: 0.3491698079675177
Epoch: 27, step: 223, loss: 0.31284818053245544, mean loss: 0.34916888167894694
Epoch: 27, step: 224, loss: 0.32096391916275024, mean loss: 0.34916816240313236
Epoch: 27, step: 225, loss: 0.3506357669830322, mean loss: 0.34916819982865843
Epoch: 27, step: 226, loss: 0.3332677185535431, mean loss: 0.3491677943592902
Epoch: 27, step: 227, loss: 0.35010263323783875, mean loss: 0.3491678181974909
Epoch: 27, step: 228, loss: 0.3422192931175232, mean loss: 0.3491676410160369
Epoch: 27, step: 229, loss: 0.3299882113933563, mean loss: 0.3491671519694353
Epoch: 27, step: 230, loss: 0.3358237147331238, mean loss: 0.34916681174053515
Epoch: 27, step: 231, loss: 0.3458619713783264, mean loss: 0.34916672747637495
Epoch: 27, step: 232, loss: 0.3486432433128357, mean loss: 0.3491667141293373
Epoch: 27, step: 233, loss: 0.32540032267570496, mean loss: 0.34916610818391247
Epoch: 27, step: 234, loss: 0.329815149307251, mean loss: 0.3491656148264723
Epoch: 27, step: 235, loss: 0.3332892060279846, mean loss: 0.3491652100638576
Epoch: 27, step: 236, loss: 0.31762340664863586, mean loss: 0.3491644059388502
Epoch: 27, step: 237, loss: 0.3457445204257965, mean loss: 0.349164318754699
Epoch: 27, step: 238, loss: 0.3140137493610382, mean loss: 0.3491634226736988
Epoch: 27, step: 239, loss: 0.29491135478019714, mean loss: 0.34916203968022747
Epoch: 27, step: 240, loss: 0.3356950879096985, mean loss: 0.3491616963895045
Epoch: 27, step: 241, loss: 0.3241479694843292, mean loss: 0.3491610587721987
Epoch: 27, step: 242, loss: 0.3082525134086609, mean loss: 0.34916001601149
Epoch: 27, step: 243, loss: 0.33094799518585205, mean loss: 0.34915955179807173
Epoch: 27, step: 244, loss: 0.3133183717727661, mean loss: 0.349158638251312
Epoch: 27, step: 245, loss: 0.3052940368652344, mean loss: 0.3491575202260944
Epoch: 27, step: 246, loss: 0.3495123088359833, mean loss: 0.3491575292687505
Epoch: 27, step: 247, loss: 0.34432825446128845, mean loss: 0.3491574061859998
Epoch: 27, step: 248, loss: 0.36680176854133606, mean loss: 0.34915785587283504
Epoch: 27, step: 249, loss: 0.3454035222530365, mean loss: 0.34915776019177025
Epoch: 27, step: 250, loss: 0.32901448011398315, mean loss: 0.34915724684331395
Epoch: 27, step: 251, loss: 0.354430615901947, mean loss: 0.3491573812309046
Epoch: 27, step: 252, loss: 0.3360772430896759, mean loss: 0.3491570479025455
Epoch: 27, step: 253, loss: 0.3140486180782318, mean loss: 0.34915615323790494
Epoch: 27, step: 254, loss: 0.3299105167388916, mean loss: 0.3491556628157532
Epoch: 27, step: 255, loss: 0.28875964879989624, mean loss: 0.3491541238285446
Epoch: 27, step: 256, loss: 0.33803170919418335, mean loss: 0.3491538404188202
Epoch: 27, step: 257, loss: 0.32969143986701965, mean loss: 0.34915334451094293
Epoch: 27, step: 258, loss: 0.3426322042942047, mean loss: 0.3491531783545433
Epoch: 27, step: 259, loss: 0.38202571868896484, mean loss: 0.34915401591417267
Epoch: 27, step: 260, loss: 0.3315448760986328, mean loss: 0.3491535672622372
Epoch: 27, step: 261, loss: 0.31621161103248596, mean loss: 0.34915272797672814
Epoch: 27, step: 262, loss: 0.3371022045612335, mean loss: 0.3491524209648452
Epoch: 27, step: 263, loss: 0.33046436309814453, mean loss: 0.3491519448602425
Epoch: 27, step: 264, loss: 0.33530184626579285, mean loss: 0.3491515920184573
Epoch: 27, step: 265, loss: 0.31819435954093933, mean loss: 0.34915080337952936
Epoch: 27, step: 266, loss: 0.3844318091869354, mean loss: 0.3491517021441659
Epoch: 27, step: 267, loss: 0.30800971388816833, mean loss: 0.3491506541008539
Epoch: 27, step: 268, loss: 0.35207825899124146, mean loss: 0.34915072867621344
Epoch: 27, step: 269, loss: 0.29268819093704224, mean loss: 0.3491492904333651
Epoch: 27, step: 270, loss: 0.33008310198783875, mean loss: 0.34914880478196175
Epoch: 27, step: 271, loss: 0.3508363962173462, mean loss: 0.3491488477669703
Epoch: 27, step: 272, loss: 0.3148741126060486, mean loss: 0.3491479747699717
Epoch: 27, step: 273, loss: 0.3407377004623413, mean loss: 0.3491477605609577
Epoch: 27, step: 274, loss: 0.36794450879096985, mean loss: 0.34914823930043837
Epoch: 27, step: 275, loss: 0.3193906843662262, mean loss: 0.34914748141650054
Epoch: 27, step: 276, loss: 0.32661378383636475, mean loss: 0.34914690752887595
Epoch: 27, step: 277, loss: 0.2948729395866394, mean loss: 0.34914552531607246
Epoch: 27, step: 278, loss: 0.3347679376602173, mean loss: 0.3491451591666937
Epoch: 27, step: 279, loss: 0.3055610656738281, mean loss: 0.3491440492529346
Epoch: 27, step: 280, loss: 0.33467766642570496, mean loss: 0.34914368086100134
Epoch: 27, step: 281, loss: 0.29843541979789734, mean loss: 0.34914238958875626
Epoch: 27, step: 282, loss: 0.3260330557823181, mean loss: 0.3491418011307642
Epoch: 27, step: 283, loss: 0.31529322266578674, mean loss: 0.3491409392297033
Epoch: 27, step: 284, loss: 0.3446699380874634, mean loss: 0.3491408253855574
Epoch: 27, step: 285, loss: 0.33112776279449463, mean loss: 0.3491403667344755
Epoch: 27, step: 286, loss: 0.3333679437637329, mean loss: 0.3491399651450937
Epoch: 27, step: 287, loss: 0.3202923536300659, mean loss: 0.3491392306606372
Epoch: 27, step: 288, loss: 0.31250980496406555, mean loss: 0.3491382980683899
Epoch: 27, step: 289, loss: 0.34778234362602234, mean loss: 0.3491382635464071
Epoch: 27, step: 290, loss: 0.3274223208427429, mean loss: 0.34913771068246696
Epoch: 27, step: 291, loss: 0.31468653678894043, mean loss: 0.3491368336159218
Epoch: 27, step: 292, loss: 0.3497367799282074, mean loss: 0.3491368488891152
Epoch: 27, step: 293, loss: 0.3473811745643616, mean loss: 0.3491368041949977
Epoch: 27, step: 294, loss: 0.312340646982193, mean loss: 0.3491358675008243
Epoch: 27, step: 295, loss: 0.3181428909301758, mean loss: 0.3491350785542667
Epoch: 27, step: 296, loss: 0.3667657673358917, mean loss: 0.3491355273435955
Epoch: 27, step: 297, loss: 0.30702584981918335, mean loss: 0.3491344554686903
Epoch: 27, step: 298, loss: 0.3506006896495819, mean loss: 0.3491344927897935
Epoch: 27, step: 299, loss: 0.3715388774871826, mean loss: 0.34913506305004344
Epoch: 27, step: 300, loss: 0.36086714267730713, mean loss: 0.34913536165982295
Epoch: 27, step: 301, loss: 0.3521374464035034, mean loss: 0.3491354380681901
Epoch: 27, step: 302, loss: 0.3263058066368103, mean loss: 0.34913485702847535
Epoch: 27, step: 303, loss: 0.33488672971725464, mean loss: 0.34913449440689054
Epoch: 27, step: 304, loss: 0.3714223802089691, mean loss: 0.3491350616296987
Epoch: 27, step: 305, loss: 0.38043567538261414, mean loss: 0.34913585820458937
Epoch: 27, step: 306, loss: 0.4159526228904724, mean loss: 0.3491375585930532
Epoch: 27, step: 307, loss: 0.3492935299873352, mean loss: 0.3491375625621949
Epoch: 27, step: 308, loss: 0.3338533341884613, mean loss: 0.3491371736208413
Epoch: 27, step: 309, loss: 0.3416304886341095, mean loss: 0.3491369826013241
Epoch: 27, step: 310, loss: 0.3495922386646271, mean loss: 0.3491369941857426
Epoch: 27, step: 311, loss: 0.33715811371803284, mean loss: 0.34913668937962383
Epoch: 27, step: 312, loss: 0.3183039426803589, mean loss: 0.34913590485132434
Epoch: 27, step: 313, loss: 0.3117229640483856, mean loss: 0.34913495291654234
Epoch: 27, step: 314, loss: 0.32533392310142517, mean loss: 0.3491343473386013
Epoch: 27, step: 315, loss: 0.36546212434768677, mean loss: 0.34913476276138294
Epoch: 27, step: 316, loss: 0.33875134587287903, mean loss: 0.34913449858591195
Epoch: 27, step: 317, loss: 0.31308111548423767, mean loss: 0.34913358133706696
Epoch: 27, step: 318, loss: 0.31705936789512634, mean loss: 0.3491327653446625
Epoch: 27, step: 319, loss: 0.3422106206417084, mean loss: 0.3491325892445123
Epoch: 27, step: 320, loss: 0.31875595450401306, mean loss: 0.34913181647912167
Epoch: 27, step: 321, loss: 0.3340418040752411, mean loss: 0.3491314326070178
Epoch: 27, step: 322, loss: 0.33126088976860046, mean loss: 0.34913097801306603
Epoch: 27, step: 323, loss: 0.32304608821868896, mean loss: 0.34913031447801834
Epoch: 27, step: 324, loss: 0.36532479524612427, mean loss: 0.34913072641505616
Epoch: 27, step: 325, loss: 0.30559462308883667, mean loss: 0.3491296190206591
Epoch: 27, step: 326, loss: 0.3410538136959076, mean loss: 0.3491294136078313
Epoch: 27, step: 327, loss: 0.2992148697376251, mean loss: 0.3491281440345311
Epoch: 27, step: 328, loss: 0.3494212031364441, mean loss: 0.3491281514882814
Epoch: 27, step: 329, loss: 0.31306540966033936, mean loss: 0.34912723428135767
Epoch: 27, step: 330, loss: 0.37130850553512573, mean loss: 0.3491277984175578
Epoch: 27, step: 331, loss: 0.32310113310813904, mean loss: 0.34912713649829763
Epoch: 27, step: 332, loss: 0.3152194023132324, mean loss: 0.349126274166867
Epoch: 27, step: 333, loss: 0.35552820563316345, mean loss: 0.3491264369747472
Epoch: 27, step: 334, loss: 0.31219083070755005, mean loss: 0.3491254976871479
Epoch: 27, step: 335, loss: 0.3231845200061798, mean loss: 0.3491248380142336
Epoch: 27, step: 336, loss: 0.3412244915962219, mean loss: 0.3491246371154054
Epoch: 27, step: 337, loss: 0.3326106667518616, mean loss: 0.34912421719041015
Epoch: 27, step: 338, loss: 0.3513742685317993, mean loss: 0.3491242744043177
Epoch: 27, step: 339, loss: 0.2977559268474579, mean loss: 0.34912296825227446
Epoch: 27, step: 340, loss: 0.3291946053504944, mean loss: 0.34912246154315646
Epoch: 27, step: 341, loss: 0.3473281264305115, mean loss: 0.34912241592060084
Epoch: 27, step: 342, loss: 0.34192758798599243, mean loss: 0.3491222329903948
Epoch: 27, step: 343, loss: 0.3247227668762207, mean loss: 0.3491216126439564
Epoch: 27, step: 344, loss: 0.3502265214920044, mean loss: 0.3491216407350974
Epoch: 27, step: 345, loss: 0.3332633078098297, mean loss: 0.34912123756397506
Epoch: 27, step: 346, loss: 0.35198813676834106, mean loss: 0.34912131044815464
Epoch: 27, step: 347, loss: 0.34507060050964355, mean loss: 0.3491212074709852
Epoch: 27, step: 348, loss: 0.3335649073123932, mean loss: 0.3491208120086937
Epoch: 27, step: 349, loss: 0.3407977819442749, mean loss: 0.34912060043133686
Epoch: 27, step: 350, loss: 0.2948617935180664, mean loss: 0.34911922116885147
Epoch: 27, step: 351, loss: 0.32453909516334534, mean loss: 0.3491185963562941
Epoch: 27, step: 352, loss: 0.34466561675071716, mean loss: 0.3491184831670105
Epoch: 27, step: 353, loss: 0.33057835698127747, mean loss: 0.3491180119117061
Epoch: 27, step: 354, loss: 0.3419615924358368, mean loss: 0.34911783001354185
Epoch: 27, step: 355, loss: 0.2969072461128235, mean loss: 0.3491165029856875
Epoch: 27, step: 356, loss: 0.3059235215187073, mean loss: 0.349115405184659
Epoch: 27, step: 357, loss: 0.2991560101509094, mean loss: 0.34911413543944897
Epoch: 27, step: 358, loss: 0.3743179738521576, mean loss: 0.3491147759924368
Epoch: 27, step: 359, loss: 0.3865293562412262, mean loss: 0.3491157268560194
Epoch: 27, step: 360, loss: 0.33825892210006714, mean loss: 0.34911545094545604
Epoch: 27, step: 361, loss: 0.3100125193595886, mean loss: 0.34911445722419593
Epoch: 27, step: 362, loss: 0.36102670431137085, mean loss: 0.349114759941969
Epoch: 27, step: 363, loss: 0.3204346001148224, mean loss: 0.3491140311312395
Epoch: 27, step: 364, loss: 0.35866984724998474, mean loss: 0.34911427395430555
Epoch: 27, step: 365, loss: 0.33195409178733826, mean loss: 0.34911383790759704
Epoch: 27, step: 366, loss: 0.35534578561782837, mean loss: 0.34911399625971773
Epoch: 27, step: 367, loss: 0.3225060999393463, mean loss: 0.34911332017738417
Epoch: 27, step: 368, loss: 0.33100318908691406, mean loss: 0.34911286002719255
Epoch: 27, step: 369, loss: 0.33695074915885925, mean loss: 0.3491125510147715
Epoch: 27, step: 370, loss: 0.3433893024921417, mean loss: 0.3491124056033403
Epoch: 27, step: 371, loss: 0.3535902798175812, mean loss: 0.3491125193704697
Epoch: 27, step: 372, loss: 0.3104330003261566, mean loss: 0.3491115366840785
Epoch: 27, step: 373, loss: 0.35599052906036377, mean loss: 0.3491117114463461
Epoch: 27, step: 374, loss: 0.33139023184776306, mean loss: 0.34911126123981717
Epoch: 27, step: 375, loss: 0.3176155686378479, mean loss: 0.34911046112568744
Epoch: 27, step: 376, loss: 0.3095967769622803, mean loss: 0.3491094573486225
Epoch: 27, step: 377, loss: 0.30518487095832825, mean loss: 0.34910834154853126
Epoch: 27, step: 378, loss: 0.33113253116607666, mean loss: 0.34910788492723976
Epoch: 27, step: 379, loss: 0.4131351113319397, mean loss: 0.34910951130466317
Epoch: 27, step: 380, loss: 0.3469550311565399, mean loss: 0.3491094565793679
Epoch: 27, step: 381, loss: 0.3501288592815399, mean loss: 0.3491094824722483
Epoch: 27, step: 382, loss: 0.350980281829834, mean loss: 0.3491095299894401
Epoch: 27, step: 383, loss: 0.3297967314720154, mean loss: 0.3491090394682952
Epoch: 27, step: 384, loss: 0.3183897137641907, mean loss: 0.34910825925531414
Epoch: 27, step: 385, loss: 0.32056528329849243, mean loss: 0.3491075343359268
Epoch: 27, step: 386, loss: 0.35587742924690247, mean loss: 0.3491077062697658
Epoch: 27, step: 387, loss: 0.3378911018371582, mean loss: 0.349107421410856
Epoch: 27, step: 388, loss: 0.3641226291656494, mean loss: 0.34910780273009706
Epoch: 27, step: 389, loss: 0.3901960253715515, mean loss: 0.34910884616101384
Epoch: 27, step: 390, loss: 0.3086394965648651, mean loss: 0.34910781847240835
Epoch: 27, step: 391, loss: 0.3335968852043152, mean loss: 0.3491074245939607
Epoch: 27, step: 392, loss: 0.3328164219856262, mean loss: 0.3491070109172484
Epoch: 27, step: 393, loss: 0.30510959029197693, mean loss: 0.3491058937210515
Epoch: 27, step: 394, loss: 0.3280520439147949, mean loss: 0.3491053591287196
Epoch: 27, step: 395, loss: 0.3151874542236328, mean loss: 0.34910449791845893
Epoch: 27, step: 396, loss: 0.324431836605072, mean loss: 0.34910387147028543
Epoch: 27, step: 397, loss: 0.3181309401988983, mean loss: 0.34910308507584903
Epoch: 27, step: 398, loss: 0.30651402473449707, mean loss: 0.34910200377845796
Epoch: 27, step: 399, loss: 0.2948421835899353, mean loss: 0.3491006262060961
Epoch: 27, step: 400, loss: 0.35696980357170105, mean loss: 0.3491008259871864
Epoch: 27, step: 401, loss: 0.30311766266822815, mean loss: 0.3490996586055332
Epoch: 27, step: 402, loss: 0.33741870522499084, mean loss: 0.34909936206689796
Epoch: 27, step: 403, loss: 0.34060871601104736, mean loss: 0.34909914652450214
Epoch: 27, step: 404, loss: 0.34005650877952576, mean loss: 0.34909891697514706
Epoch: 27, step: 405, loss: 0.32333967089653015, mean loss: 0.3490982630875987
Epoch: 27, step: 406, loss: 0.36421501636505127, mean loss: 0.34909864681023556
Epoch: 27, step: 407, loss: 0.3459540605545044, mean loss: 0.3490985669902981
Epoch: 27, step: 408, loss: 0.3410491347312927, mean loss: 0.34909836267442995
Epoch: 27, step: 409, loss: 0.3462795317173004, mean loss: 0.3490982911268652
Epoch: 27, step: 410, loss: 0.3804664611816406, mean loss: 0.34909908729352057
Epoch: 27, step: 411, loss: 0.35579460859298706, mean loss: 0.3490992572306094
Epoch: 27, step: 412, loss: 0.33031409978866577, mean loss: 0.3490987804620644
Epoch: 27, step: 413, loss: 0.32186853885650635, mean loss: 0.34909808937426157
Epoch: 27, step: 414, loss: 0.3785611689090729, mean loss: 0.3490988371112241
Epoch: 27, step: 415, loss: 0.32364705204963684, mean loss: 0.34909819119240715
Epoch: 27, step: 416, loss: 0.34953534603118896, mean loss: 0.3490982022862998
Epoch: 27, step: 417, loss: 0.35026028752326965, mean loss: 0.34909823177635807
Epoch: 27, step: 418, loss: 0.368225634098053, mean loss: 0.3490987171571869
Epoch: 27, step: 419, loss: 0.32029998302459717, mean loss: 0.34909798637323103
Epoch: 27, step: 420, loss: 0.31153297424316406, mean loss: 0.3490970331642653
Epoch: 27, step: 421, loss: 0.32966941595077515, mean loss: 0.3490965402026512
Epoch: 27, step: 422, loss: 0.3251924514770508, mean loss: 0.3490959336692284
Epoch: 27, step: 423, loss: 0.31279587745666504, mean loss: 0.34909501262852477
Epoch: 27, step: 424, loss: 0.31868577003479004, mean loss: 0.34909424107491066
Epoch: 27, step: 425, loss: 0.30668896436691284, mean loss: 0.34909316518114936
Epoch: 27, step: 426, loss: 0.3126925826072693, mean loss: 0.3490922416600895
Epoch: 27, step: 427, loss: 0.33430132269859314, mean loss: 0.3490918664084414
Epoch: 27, step: 428, loss: 0.36244142055511475, mean loss: 0.3490922050834838
Epoch: 27, step: 429, loss: 0.378887414932251, mean loss: 0.34909296096175896
Epoch: 27, step: 430, loss: 0.31472650170326233, mean loss: 0.3490920891370232
Epoch: 27, step: 431, loss: 0.306607186794281, mean loss: 0.34909101138709064
Epoch: 27, step: 432, loss: 0.3681253492832184, mean loss: 0.34909149423475805
Epoch: 27, step: 433, loss: 0.31825727224349976, mean loss: 0.3490907120770291
Epoch: 27, step: 434, loss: 0.3585650324821472, mean loss: 0.3490909524017229
Epoch: 27, step: 435, loss: 0.32143649458885193, mean loss: 0.3490902509392175
Epoch: 27, step: 436, loss: 0.34723174571990967, mean loss: 0.34909020379894556
Epoch: 27, step: 437, loss: 0.33963802456855774, mean loss: 0.3490899640541267
Epoch: 27, step: 438, loss: 0.3496166467666626, mean loss: 0.349089977412554
Epoch: 27, step: 439, loss: 0.34031742811203003, mean loss: 0.349089754917137
Epoch: 27, step: 440, loss: 0.3344648480415344, mean loss: 0.34908938399961753
Epoch: 27, step: 441, loss: 0.33134719729423523, mean loss: 0.3490889340329245
Epoch: 27, step: 442, loss: 0.38036325573921204, mean loss: 0.3490897271733903
Epoch: 27, step: 443, loss: 0.36899375915527344, mean loss: 0.34909023194190275
Epoch: 27, step: 444, loss: 0.328497052192688, mean loss: 0.3490897097097685
Epoch: 27, step: 445, loss: 0.31207525730133057, mean loss: 0.34908877106665825
Epoch: 27, step: 446, loss: 0.3058629631996155, mean loss: 0.3490876749386535
Epoch: 27, step: 447, loss: 0.3247714936733246, mean loss: 0.349087058340082
Epoch: 27, step: 448, loss: 0.3170434832572937, mean loss: 0.34908624581440606
Epoch: 27, step: 449, loss: 0.31976139545440674, mean loss: 0.3490855022460111
Epoch: 27, step: 450, loss: 0.3236635625362396, mean loss: 0.3490848576571597
Epoch: 27, step: 451, loss: 0.36174726486206055, mean loss: 0.3490851787121091
Epoch: 27, step: 452, loss: 0.30973824858665466, mean loss: 0.3490841810971874
Epoch: 27, step: 453, loss: 0.2784510850906372, mean loss: 0.3490823902879991
Epoch: 27, step: 454, loss: 0.3470411002635956, mean loss: 0.3490823385350892
Epoch: 27, step: 455, loss: 0.3864208459854126, mean loss: 0.3490832851558034
Epoch: 27, step: 456, loss: 0.3083173930644989, mean loss: 0.3490822516688699
Epoch: 27, step: 457, loss: 0.30738937854766846, mean loss: 0.3490811947081357
Epoch: 27, step: 458, loss: 0.3654075264930725, mean loss: 0.34908160858832393
Epoch: 27, step: 459, loss: 0.3195688724517822, mean loss: 0.34908086044555026
Epoch: 27, step: 460, loss: 0.3203313946723938, mean loss: 0.34908013167002305
Epoch: 27, step: 461, loss: 0.34933793544769287, mean loss: 0.3490801382049731
Epoch: 27, step: 462, loss: 0.36332187056541443, mean loss: 0.34908049920297973
Epoch: 27, step: 463, loss: 0.3191312849521637, mean loss: 0.3490797400725364
Epoch: 27, step: 464, loss: 0.35170626640319824, mean loss: 0.34907980664608795
Epoch: 27, step: 465, loss: 0.40499430894851685, mean loss: 0.3490812238535271
Epoch: 27, step: 466, loss: 0.3379696309566498, mean loss: 0.3490809422265369
Epoch: 27, step: 467, loss: 0.3036718964576721, mean loss: 0.3490797913484507
Epoch: 27, step: 468, loss: 0.363475501537323, mean loss: 0.3490801561939835
Epoch: 27, step: 469, loss: 0.3257046937942505, mean loss: 0.349079563780217
Epoch: 27, step: 470, loss: 0.31304606795310974, mean loss: 0.34907865059195
Epoch: 27, step: 471, loss: 0.33775025606155396, mean loss: 0.34907836350643223
Epoch: 27, step: 472, loss: 0.3514215350151062, mean loss: 0.3490784228858577
Epoch: 27, step: 473, loss: 0.34505903720855713, mean loss: 0.3490783210312716
Epoch: 27, step: 474, loss: 0.36617812514305115, mean loss: 0.3490787543435923
Epoch: 27, step: 475, loss: 0.34918513894081116, mean loss: 0.3490787570393301
Epoch: 27, step: 476, loss: 0.3255797326564789, mean loss: 0.3490781615997157
Epoch: 27, step: 477, loss: 0.3099406957626343, mean loss: 0.3490771699242017
Epoch: 27, step: 478, loss: 0.33874642848968506, mean loss: 0.34907690816776127
Epoch: 27, step: 479, loss: 0.32522162795066833, mean loss: 0.3490763037469592
Epoch: 27, step: 480, loss: 0.3136463463306427, mean loss: 0.349075406081515
Epoch: 27, step: 481, loss: 0.33361926674842834, mean loss: 0.3490750144894366
Epoch: 27, step: 482, loss: 0.41447192430496216, mean loss: 0.3490766713238167
Epoch: 27, step: 483, loss: 0.36727461218833923, mean loss: 0.3490771323579894
Epoch: 27, step: 484, loss: 0.3193381130695343, mean loss: 0.3490763789564418
Epoch: 27, step: 485, loss: 0.3498753011226654, mean loss: 0.34907639919564143
Epoch: 27, step: 486, loss: 0.313924640417099, mean loss: 0.34907550871410176
Epoch: 27, step: 487, loss: 0.3336948752403259, mean loss: 0.34907511909424477
Epoch: 27, step: 488, loss: 0.3334087133407593, mean loss: 0.349074722245301
Epoch: 27, step: 489, loss: 0.32087409496307373, mean loss: 0.3490740079075108
Epoch: 27, step: 490, loss: 0.30324262380599976, mean loss: 0.3490728470021155
Epoch: 27, step: 491, loss: 0.3249611258506775, mean loss: 0.3490722362695635
Epoch: 27, step: 492, loss: 0.31665706634521484, mean loss: 0.3490714152374234
Epoch: 27, step: 493, loss: 0.3282269239425659, mean loss: 0.3490708872881986
Epoch: 27, step: 494, loss: 0.31669628620147705, mean loss: 0.349070067325149
Epoch: 27, step: 495, loss: 0.3466683626174927, mean loss: 0.3490700064978593
Epoch: 27, step: 496, loss: 0.29929018020629883, mean loss: 0.34906874577033514
Epoch: 27, step: 497, loss: 0.31717878580093384, mean loss: 0.34906793814332887
Epoch: 27, step: 498, loss: 0.3328907787799835, mean loss: 0.34906752846015815
Epoch: 27, step: 499, loss: 0.3173043429851532, mean loss: 0.349066724084513
Epoch: 27, step: 500, loss: 0.35411205887794495, mean loss: 0.34906685185008807
Epoch: 27, step: 501, loss: 0.3169203996658325, mean loss: 0.3490660378097694
Epoch: 27, step: 502, loss: 0.3427019417285919, mean loss: 0.34906587665669453
Epoch: 27, step: 503, loss: 0.3021865487098694, mean loss: 0.34906468959784853
Epoch: 27, step: 504, loss: 0.3084661364555359, mean loss: 0.3490636616042005
Epoch: 27, step: 505, loss: 0.32060542702674866, mean loss: 0.3490629410331118
Epoch: 27, step: 506, loss: 0.33367618918418884, mean loss: 0.34906255144577547
Epoch: 27, step: 507, loss: 0.3312118649482727, mean loss: 0.34906209948389333
Epoch: 27, step: 508, loss: 0.35469427704811096, mean loss: 0.34906224208149733
Epoch: 27, step: 509, loss: 0.35672521591186523, mean loss: 0.34906243609065807
Epoch: 27, step: 510, loss: 0.3180396556854248, mean loss: 0.34906165068392864
Epoch: 27, step: 511, loss: 0.3324788808822632, mean loss: 0.3490612308669716
Epoch: 27, step: 512, loss: 0.30184468626976013, mean loss: 0.3490600355416736
Epoch: 27, step: 513, loss: 0.3227326571941376, mean loss: 0.34905936905951196
Epoch: 27, step: 514, loss: 0.29649150371551514, mean loss: 0.3490580383285461
Epoch: 27, step: 515, loss: 0.33194923400878906, mean loss: 0.3490576052381168
Epoch: 27, step: 516, loss: 0.29066339135169983, mean loss: 0.3490561270906953
Epoch: 27, step: 517, loss: 0.3425731956958771, mean loss: 0.3490559629907764
Epoch: 27, step: 518, loss: 0.34204724431037903, mean loss: 0.34905578558629924
Epoch: 27, step: 519, loss: 0.3452775478363037, mean loss: 0.3490556899540792
Epoch: 27, step: 520, loss: 0.33451423048973083, mean loss: 0.3490553218997254
Epoch: 27, step: 521, loss: 0.3247685432434082, mean loss: 0.34905470720018966
Epoch: 27, step: 522, loss: 0.3080768287181854, mean loss: 0.3490536700743644
Epoch: 27, step: 523, loss: 0.33960583806037903, mean loss: 0.3490534309613857
Epoch: 27, step: 524, loss: 0.3161117434501648, mean loss: 0.349052597268993
Epoch: 27, step: 525, loss: 0.37632864713668823, mean loss: 0.3490532875572419
Epoch: 27, step: 526, loss: 0.34467658400535583, mean loss: 0.3490531767966813
Epoch: 27, step: 527, loss: 0.37569525837898254, mean loss: 0.34905385100666164
Epoch: 27, step: 528, loss: 0.3364753723144531, mean loss: 0.34905353270115536
Epoch: 27, step: 529, loss: 0.3075307309627533, mean loss: 0.34905248196979904
Epoch: 27, step: 530, loss: 0.30051717162132263, mean loss: 0.3490512538185212
Epoch: 27, step: 531, loss: 0.29004591703414917, mean loss: 0.34904976076850136
Epoch: 27, step: 532, loss: 0.31746751070022583, mean loss: 0.3490489616427184
Epoch: 27, step: 533, loss: 0.3375735878944397, mean loss: 0.34904867128864353
Epoch: 27, step: 534, loss: 0.33605054020881653, mean loss: 0.34904834241353083
Epoch: 27, step: 535, loss: 0.3335000276565552, mean loss: 0.34904794902433045
Epoch: 27, step: 536, loss: 0.3810066878795624, mean loss: 0.3490487575945735
Epoch: 27, step: 537, loss: 0.3287864625453949, mean loss: 0.34904824496250725
Epoch: 27, step: 538, loss: 0.3682396411895752, mean loss: 0.3490487304887609
Epoch: 27, step: 539, loss: 0.3143647015094757, mean loss: 0.3490478530340711
Epoch: 27, step: 540, loss: 0.3406188189983368, mean loss: 0.3490476397973579
Epoch: 27, step: 541, loss: 0.3831741213798523, mean loss: 0.3490485031032416
Epoch: 27, step: 542, loss: 0.3349870443344116, mean loss: 0.34904814739610623
Epoch: 27, step: 543, loss: 0.3160285949707031, mean loss: 0.3490473121347376
Epoch: 27, step: 544, loss: 0.3349080979824066, mean loss: 0.34904695447875017
Epoch: 27, step: 545, loss: 0.2982776165008545, mean loss: 0.34904567028443695
Epoch: 27, step: 546, loss: 0.3677755892276764, mean loss: 0.3490461440398168
Epoch: 27, step: 547, loss: 0.34676840901374817, mean loss: 0.3490460864281458
Epoch: 27, step: 548, loss: 0.30677470564842224, mean loss: 0.3490450172680987
Epoch: 27, step: 549, loss: 0.3357582986354828, mean loss: 0.3490446812187631
Epoch: 27, step: 550, loss: 0.365055114030838, mean loss: 0.3490450861463741
Epoch: 27, step: 551, loss: 0.3376340866088867, mean loss: 0.34904479755255674
Epoch: 27, step: 552, loss: 0.33204782009124756, mean loss: 0.3490443676955106
Epoch: 27, step: 553, loss: 0.34062665700912476, mean loss: 0.34904415481526463
Epoch: 27, step: 554, loss: 0.38015565276145935, mean loss: 0.3490449415916333
Epoch: 27, step: 555, loss: 0.3511207103729248, mean loss: 0.34904499408426887
Epoch: 27, step: 556, loss: 0.3253796696662903, mean loss: 0.3490443956438992
Epoch: 27, step: 557, loss: 0.2804352045059204, mean loss: 0.3490426607227659
Epoch: 27, step: 558, loss: 0.39106714725494385, mean loss: 0.34904372336940237
Epoch: 27, step: 559, loss: 0.33442941308021545, mean loss: 0.3490433538359167
Epoch: 27, step: 560, loss: 0.30493029952049255, mean loss: 0.34904223843339544
Epoch: 27, step: 561, loss: 0.34874966740608215, mean loss: 0.34904223103589793
Epoch: 27, step: 562, loss: 0.35314542055130005, mean loss: 0.3490423347801652
Epoch: 27, step: 563, loss: 0.30647626519203186, mean loss: 0.34904125857492685
Epoch: 27, step: 564, loss: 0.316822350025177, mean loss: 0.3490404439993308
Epoch: 27, step: 565, loss: 0.32711225748062134, mean loss: 0.3490398896132632
Epoch: 27, step: 566, loss: 0.33152279257774353, mean loss: 0.3490394467590846
Epoch: 27, step: 567, loss: 0.33715441823005676, mean loss: 0.34903914629825616
Epoch: 27, step: 568, loss: 0.325702041387558, mean loss: 0.34903855633681036
Epoch: 27, step: 569, loss: 0.34357964992523193, mean loss: 0.34903841833927735
Epoch: 27, step: 570, loss: 0.3331931531429291, mean loss: 0.3490380177916094
Epoch: 27, step: 571, loss: 0.35028475522994995, mean loss: 0.3490380493067115
Epoch: 27, step: 572, loss: 0.3883594870567322, mean loss: 0.349039043251196
Epoch: 27, step: 573, loss: 0.358627587556839, mean loss: 0.3490392856187281
Epoch: 27, step: 574, loss: 0.3335503339767456, mean loss: 0.3490388941177893
Epoch: 27, step: 575, loss: 0.3344305157661438, mean loss: 0.3490385248836787
Epoch: 27, step: 576, loss: 0.3140210211277008, mean loss: 0.3490376398210285
Epoch: 27, step: 577, loss: 0.29885733127593994, mean loss: 0.3490363715526024
Epoch: 27, step: 578, loss: 0.3319201171398163, mean loss: 0.3490359389634647
Epoch: 27, step: 579, loss: 0.3394266963005066, mean loss: 0.34903569610957613
Epoch: 27, step: 580, loss: 0.30592548847198486, mean loss: 0.349034606615082
Epoch: 27, step: 581, loss: 0.33591437339782715, mean loss: 0.34903427504487183
Epoch: 27, step: 582, loss: 0.3639306426048279, mean loss: 0.3490346514914504
Epoch: 27, step: 583, loss: 0.3280014991760254, mean loss: 0.349034119975421
Epoch: 27, step: 584, loss: 0.32768720388412476, mean loss: 0.34903358054408923
Epoch: 27, step: 585, loss: 0.3395593762397766, mean loss: 0.34903334113932083
Epoch: 27, step: 586, loss: 0.33262863755226135, mean loss: 0.3490329266174361
Epoch: 27, step: 587, loss: 0.34890541434288025, mean loss: 0.3490329233954765
Epoch: 27, step: 588, loss: 0.3257308602333069, mean loss: 0.34903233461757105
Epoch: 27, step: 589, loss: 0.32408031821250916, mean loss: 0.34903170416589574
Epoch: 27, step: 590, loss: 0.3594229817390442, mean loss: 0.3490319667111236
Epoch: 27, step: 591, loss: 0.31710442900657654, mean loss: 0.34903116005276824
Epoch: 27, step: 592, loss: 0.35782045125961304, mean loss: 0.3490313821111095
Epoch: 27, step: 593, loss: 0.31399089097976685, mean loss: 0.34903049684782994
Epoch: 27, step: 594, loss: 0.3091917335987091, mean loss: 0.3490294903863882
Epoch: 27, step: 595, loss: 0.3385322093963623, mean loss: 0.34902922519638746
Epoch: 27, step: 596, loss: 0.3096504509449005, mean loss: 0.3490282304060818
Epoch: 27, step: 597, loss: 0.3366418480873108, mean loss: 0.349027917508029
Epoch: 27, step: 598, loss: 0.3390018045902252, mean loss: 0.34902766424021586
Epoch: 27, step: 599, loss: 0.3720036447048187, mean loss: 0.34902824461761467
Epoch: 27, step: 600, loss: 0.31156274676322937, mean loss: 0.34902729825630585
Epoch: 27, step: 601, loss: 0.3497081398963928, mean loss: 0.3490273154536193
Epoch: 27, step: 602, loss: 0.28770798444747925, mean loss: 0.3490257666336601
Epoch: 27, step: 603, loss: 0.32250863313674927, mean loss: 0.3490250968737718
Epoch: 27, step: 604, loss: 0.3643333911895752, mean loss: 0.3490254835152063
Epoch: 27, step: 605, loss: 0.32492268085479736, mean loss: 0.34902487476633876
Epoch: 27, step: 606, loss: 0.39914554357528687, mean loss: 0.34902614059962095
Epoch: 27, step: 607, loss: 0.3494906425476074, mean loss: 0.3490261523306531
Epoch: 27, step: 608, loss: 0.3198551535606384, mean loss: 0.3490254156334596
Epoch: 27, step: 609, loss: 0.310929536819458, mean loss: 0.34902445356772865
Epoch: 27, step: 610, loss: 0.31109774112701416, mean loss: 0.3490234957982789
Epoch: 27, step: 611, loss: 0.32518482208251953, mean loss: 0.3490228938115689
Epoch: 27, step: 612, loss: 0.33041661977767944, mean loss: 0.34902242396802874
Epoch: 27, step: 613, loss: 0.3381192684173584, mean loss: 0.3490221486497228
Epoch: 27, step: 614, loss: 0.37057122588157654, mean loss: 0.349022692777118
Epoch: 27, step: 615, loss: 0.38797733187675476, mean loss: 0.34902367638077164
Epoch: 27, step: 616, loss: 0.3447625935077667, mean loss: 0.34902356879125335
Epoch: 27, step: 617, loss: 0.3218534290790558, mean loss: 0.34902288278055515
Epoch: 27, step: 618, loss: 0.3285985589027405, mean loss: 0.34902236710595524
Epoch: 27, step: 619, loss: 0.32200637459754944, mean loss: 0.349021685021717
Epoch: 27, step: 620, loss: 0.3023386001586914, mean loss: 0.3490205064238008
Epoch: 27, step: 621, loss: 0.31732726097106934, mean loss: 0.3490197062913733
Epoch: 27, step: 622, loss: 0.3782730996608734, mean loss: 0.3490204448082845
Epoch: 27, step: 623, loss: 0.35110199451446533, mean loss: 0.34902049735674723
Epoch: 27, step: 624, loss: 0.2945348918437958, mean loss: 0.34901912190915396
Epoch: 27, step: 625, loss: 0.3350496292114258, mean loss: 0.34901876926885766
Epoch: 27, step: 626, loss: 0.2983607351779938, mean loss: 0.3490174905099509
Epoch: 27, step: 627, loss: 0.33473071455955505, mean loss: 0.3490171298784901
Epoch: 27, step: 628, loss: 0.3658526539802551, mean loss: 0.3490175548355566
Epoch: 27, step: 629, loss: 0.3679835796356201, mean loss: 0.34901803355797567
Epoch: 27, step: 630, loss: 0.33484628796577454, mean loss: 0.3490176758572363
Epoch: 27, step: 631, loss: 0.306142121553421, mean loss: 0.3490165936877688
Epoch: 27, step: 632, loss: 0.3417521119117737, mean loss: 0.34901641033848996
Epoch: 27, step: 633, loss: 0.33574149012565613, mean loss: 0.3490160752993649
Epoch: 27, step: 634, loss: 0.33714523911476135, mean loss: 0.3490157757047813
Epoch: 27, step: 635, loss: 0.3248614966869354, mean loss: 0.3490151661176872
Epoch: 27, step: 636, loss: 0.35561829805374146, mean loss: 0.34901533275824076
Epoch: 27, step: 637, loss: 0.3227413296699524, mean loss: 0.34901466970864986
Epoch: 27, step: 638, loss: 0.28665539622306824, mean loss: 0.34901309605246883
Epoch: 27, step: 639, loss: 0.3174896836280823, mean loss: 0.3490123005691635
Epoch: 27, step: 640, loss: 0.34413427114486694, mean loss: 0.34901217747674573
Epoch: 27, step: 641, loss: 0.37137261033058167, mean loss: 0.3490127417066941
Epoch: 27, step: 642, loss: 0.2980763614177704, mean loss: 0.3490114564406072
Epoch: 27, step: 643, loss: 0.30546003580093384, mean loss: 0.34901035754525395
Epoch: 27, step: 644, loss: 0.3088662922382355, mean loss: 0.34900934465031014
Epoch: 27, step: 645, loss: 0.32496321201324463, mean loss: 0.3490087379456465
Epoch: 27, step: 646, loss: 0.3563101589679718, mean loss: 0.34900892216214763
Epoch: 27, step: 647, loss: 0.3216715157032013, mean loss: 0.3490082324506112
Epoch: 27, step: 648, loss: 0.34830963611602783, mean loss: 0.3490082148257573
Epoch: 27, step: 649, loss: 0.3040764629840851, mean loss: 0.3490070812733116
Epoch: 27, step: 650, loss: 0.3640784025192261, mean loss: 0.3490074614877783
Epoch: 27, step: 651, loss: 0.3607160449028015, mean loss: 0.3490077568607201
Epoch: 27, step: 652, loss: 0.3050582706928253, mean loss: 0.34900664817309446
Epoch: 27, step: 653, loss: 0.33212965726852417, mean loss: 0.3490062224379927
Epoch: 27, step: 654, loss: 0.3172849714756012, mean loss: 0.3490054222651762
Epoch: 27, step: 655, loss: 0.3145195245742798, mean loss: 0.34900455237571776
Epoch: 27, step: 656, loss: 0.30098700523376465, mean loss: 0.34900334118774595
Epoch: 27, step: 657, loss: 0.3723263144493103, mean loss: 0.34900392946836095
Epoch: 27, step: 658, loss: 0.35591211915016174, mean loss: 0.34900410371079243
Epoch: 27, step: 659, loss: 0.31217190623283386, mean loss: 0.3490031747308318
Epoch: 27, step: 660, loss: 0.2974633574485779, mean loss: 0.34900187482875905
Epoch: 27, step: 661, loss: 0.35045963525772095, mean loss: 0.34900191159446975
Epoch: 27, step: 662, loss: 0.32766836881637573, mean loss: 0.3490013735615632
Epoch: 27, step: 663, loss: 0.3600544333457947, mean loss: 0.349001652313197
Epoch: 27, step: 664, loss: 0.32963675260543823, mean loss: 0.34900116395418995
Epoch: 27, step: 665, loss: 0.33402732014656067, mean loss: 0.34900078634174714
Epoch: 27, step: 666, loss: 0.33003830909729004, mean loss: 0.3490003081554593
Epoch: 27, step: 667, loss: 0.29697680473327637, mean loss: 0.3489989962857946
Epoch: 27, step: 668, loss: 0.3009471297264099, mean loss: 0.3489977845989156
Epoch: 27, step: 669, loss: 0.3305997848510742, mean loss: 0.348997320682436
Epoch: 27, step: 670, loss: 0.35543057322502136, mean loss: 0.3489974828966255
Epoch: 27, step: 671, loss: 0.3657451570034027, mean loss: 0.3489979051778688
Epoch: 27, step: 672, loss: 0.34754806756973267, mean loss: 0.34899786862211857
Epoch: 27, step: 673, loss: 0.3166548013687134, mean loss: 0.3489970531547379
Epoch: 27, step: 674, loss: 0.3621552288532257, mean loss: 0.3489973849041189
Epoch: 27, step: 675, loss: 0.35514965653419495, mean loss: 0.34899754001383126
Epoch: 27, step: 676, loss: 0.30767661333084106, mean loss: 0.3489964982660263
Epoch: 27, step: 677, loss: 0.3128560185432434, mean loss: 0.34899558714618256
Epoch: 27, step: 678, loss: 0.31549501419067383, mean loss: 0.3489947426010202
Epoch: 27, step: 679, loss: 0.33734700083732605, mean loss: 0.3489944489703415
Epoch: 27, step: 680, loss: 0.34037306904792786, mean loss: 0.34899423163741344
Epoch: 27, step: 681, loss: 0.3048066794872284, mean loss: 0.34899311775911374
Epoch: 27, step: 682, loss: 0.3075726628303528, mean loss: 0.3489920736600255
Epoch: 27, step: 683, loss: 0.3632661700248718, mean loss: 0.3489924334628175
Epoch: 27, step: 684, loss: 0.31906548142433167, mean loss: 0.3489916791222827
Epoch: 27, step: 685, loss: 0.3114103376865387, mean loss: 0.3489907318686295
Epoch: 27, step: 686, loss: 0.32091718912124634, mean loss: 0.3489900242809106
Epoch: 27, step: 687, loss: 0.3156536817550659, mean loss: 0.3489891840666116
Epoch: 27, step: 688, loss: 0.2998107671737671, mean loss: 0.348987944597476
Epoch: 27, step: 689, loss: 0.33589881658554077, mean loss: 0.3489876147137114
Epoch: 27, step: 690, loss: 0.3181040287017822, mean loss: 0.3489868363779164
Epoch: 27, step: 691, loss: 0.3148372769355774, mean loss: 0.3489859757539385
Epoch: 27, step: 692, loss: 0.3356219232082367, mean loss: 0.34898563896674706
Epoch: 27, step: 693, loss: 0.32778695225715637, mean loss: 0.34898510475257666
Epoch: 27, step: 694, loss: 0.38620761036872864, mean loss: 0.34898604274883743
Epoch: 27, step: 695, loss: 0.30333271622657776, mean loss: 0.3489848923273446
Epoch: 27, step: 696, loss: 0.33787140250205994, mean loss: 0.34898461228476363
Epoch: 27, step: 697, loss: 0.3264666795730591, mean loss: 0.3489840448823368
Epoch: 27, step: 698, loss: 0.30524542927742004, mean loss: 0.3489829427930984
Epoch: 27, step: 699, loss: 0.3619321584701538, mean loss: 0.34898326906843796
Epoch: 27, step: 700, loss: 0.34064504504203796, mean loss: 0.34898305897939497
Epoch: 27, step: 701, loss: 0.33814138174057007, mean loss: 0.3489827858204824
Epoch: 27, step: 702, loss: 0.33256790041923523, mean loss: 0.3489823722535428
Epoch: 27, step: 703, loss: 0.3192962408065796, mean loss: 0.34898162434133256
Epoch: 27, step: 704, loss: 0.33163926005363464, mean loss: 0.34898118742892265
Epoch: 27, step: 705, loss: 0.344347208738327, mean loss: 0.3489810706863749
Epoch: 27, step: 706, loss: 0.3735075891017914, mean loss: 0.34898168856062645
Epoch: 27, step: 707, loss: 0.3381158411502838, mean loss: 0.34898141483411976
Epoch: 27, step: 708, loss: 0.3127734363079071, mean loss: 0.3489805027254333
Epoch: 27, step: 709, loss: 0.38723650574684143, mean loss: 0.3489814664012613
Epoch: 27, step: 710, loss: 0.3202923536300659, mean loss: 0.3489807437353813
Epoch: 27, step: 711, loss: 0.34237080812454224, mean loss: 0.34898057723826265
Epoch: 27, step: 712, loss: 0.3268801271915436, mean loss: 0.34898002056588545
Epoch: 27, step: 713, loss: 0.34069162607192993, mean loss: 0.34897981180072263
Epoch: 27, step: 714, loss: 0.36461150646209717, mean loss: 0.3489802055164283
Epoch: 27, step: 715, loss: 0.3665778338909149, mean loss: 0.34898064873696966
Epoch: 27, step: 716, loss: 0.3155980408191681, mean loss: 0.3489798079711236
Epoch: 27, step: 717, loss: 0.3393765687942505, mean loss: 0.34897956611248315
Epoch: 27, step: 718, loss: 0.3044227063655853, mean loss: 0.34897844397130534
Epoch: 27, step: 719, loss: 0.3218432366847992, mean loss: 0.3489777606025311
Epoch: 27, step: 720, loss: 0.33049896359443665, mean loss: 0.3489772952471455
Epoch: 27, step: 721, loss: 0.31788894534111023, mean loss: 0.34897651236248406
Epoch: 27, step: 722, loss: 0.32982486486434937, mean loss: 0.3489760300868552
Epoch: 27, step: 723, loss: 0.33622097969055176, mean loss: 0.34897570889803575
Epoch: 27, step: 724, loss: 0.3255402743816376, mean loss: 0.34897511877806203
Epoch: 27, step: 725, loss: 0.31677794456481934, mean loss: 0.34897430805201546
Epoch: 27, step: 726, loss: 0.31756317615509033, mean loss: 0.3489735171384589
Epoch: 27, step: 727, loss: 0.3565784692764282, mean loss: 0.34897370862179405
Epoch: 27, step: 728, loss: 0.3793827295303345, mean loss: 0.34897447426423706
Epoch: 27, step: 729, loss: 0.31806185841560364, mean loss: 0.3489736959618087
Epoch: 27, step: 730, loss: 0.3288313150405884, mean loss: 0.34897318883975326
Epoch: 27, step: 731, loss: 0.3327410817146301, mean loss: 0.34897278017643185
Epoch: 27, step: 732, loss: 0.3061210513114929, mean loss: 0.34897170135845484
Epoch: 27, step: 733, loss: 0.34672683477401733, mean loss: 0.3489716448440149
Epoch: 27, step: 734, loss: 0.29260754585266113, mean loss: 0.34897022591545984
Epoch: 27, step: 735, loss: 0.2952747046947479, mean loss: 0.34896887420059675
Epoch: 27, step: 736, loss: 0.2999967038631439, mean loss: 0.3489676414209784
Epoch: 27, step: 737, loss: 0.32549849152565, mean loss: 0.34896705064541844
Epoch: 27, step: 738, loss: 0.3050574064254761, mean loss: 0.34896594536074504
Epoch: 27, step: 739, loss: 0.3363402187824249, mean loss: 0.3489656275565118
Epoch: 27, step: 740, loss: 0.3048681616783142, mean loss: 0.3489645175999088
Epoch: 27, step: 741, loss: 0.301271915435791, mean loss: 0.34896331718203405
Epoch: 27, step: 742, loss: 0.339557021856308, mean loss: 0.34896308043251034
Epoch: 27, step: 743, loss: 0.33065128326416016, mean loss: 0.34896261954966606
Epoch: 27, step: 744, loss: 0.3218521475791931, mean loss: 0.34896193723340574
Epoch: 27, step: 745, loss: 0.334547758102417, mean loss: 0.3489615744665277
Epoch: 27, step: 746, loss: 0.33677417039871216, mean loss: 0.3489612677494252
Epoch: 27, step: 747, loss: 0.3449760377407074, mean loss: 0.34896116745674327
Epoch: 27, step: 748, loss: 0.3310873806476593, mean loss: 0.3489607176546241
Epoch: 27, step: 749, loss: 0.3996983468532562, mean loss: 0.3489619944584189
Epoch: 27, step: 750, loss: 0.32804030179977417, mean loss: 0.3489614679808362
Epoch: 27, step: 751, loss: 0.3295259475708008, mean loss: 0.34896097891389083
Epoch: 27, step: 752, loss: 0.37014541029930115, mean loss: 0.34896151197625425
Epoch: 27, step: 753, loss: 0.33184558153152466, mean loss: 0.34896108130013215
Epoch: 27, step: 754, loss: 0.35360026359558105, mean loss: 0.34896119802967684
Epoch: 27, step: 755, loss: 0.33664900064468384, mean loss: 0.34896088824210175
Epoch: 27, step: 756, loss: 0.3463817536830902, mean loss: 0.34896082335005096
Epoch: 27, step: 757, loss: 0.37375733256340027, mean loss: 0.3489614472243833
Epoch: 27, step: 758, loss: 0.3161499798297882, mean loss: 0.3489606217163602
Epoch: 27, step: 759, loss: 0.31947532296180725, mean loss: 0.3489598799105145
Epoch: 27, step: 760, loss: 0.32437846064567566, mean loss: 0.34895926149447226
Epoch: 27, step: 761, loss: 0.31766581535339355, mean loss: 0.34895847423796555
Epoch: 27, step: 762, loss: 0.3057887554168701, mean loss: 0.34895738823462424
Epoch: 27, step: 763, loss: 0.3740714192390442, mean loss: 0.3489580200023593
Epoch: 27, step: 764, loss: 0.3288270831108093, mean loss: 0.3489575136019143
Epoch: 27, step: 765, loss: 0.3838236629962921, mean loss: 0.34895839064949175
Epoch: 27, step: 766, loss: 0.3293291926383972, mean loss: 0.34895789689529705
Epoch: 27, step: 767, loss: 0.3284248411655426, mean loss: 0.3489573804183947
Epoch: 27, step: 768, loss: 0.3240680992603302, mean loss: 0.34895675438320195
Epoch: 27, step: 769, loss: 0.3292454779148102, mean loss: 0.34895625860181284
Epoch: 27, step: 770, loss: 0.34932342171669006, mean loss: 0.3489562678365299
Epoch: 27, step: 771, loss: 0.31238505244255066, mean loss: 0.34895534803734995
Epoch: 27, step: 772, loss: 0.3620610535144806, mean loss: 0.348955677649419
Epoch: 27, step: 773, loss: 0.3280006945133209, mean loss: 0.34895515063912935
Epoch: 27, step: 774, loss: 0.3428651988506317, mean loss: 0.3489549974828839
Epoch: 27, step: 775, loss: 0.31519168615341187, mean loss: 0.3489541483904553
Epoch: 27, step: 776, loss: 0.30345794558525085, mean loss: 0.3489530042636401
Epoch: 27, step: 777, loss: 0.3262466490268707, mean loss: 0.3489524332644137
Epoch: 27, step: 778, loss: 0.3438863754272461, mean loss: 0.3489523058709006
Epoch: 27, step: 779, loss: 0.30320993065834045, mean loss: 0.3489511556401821
Epoch: 27, step: 780, loss: 0.34757786989212036, mean loss: 0.3489511211086186
Epoch: 27, step: 781, loss: 0.2953234612941742, mean loss: 0.34894977266356414
Epoch: 27, step: 782, loss: 0.3372502028942108, mean loss: 0.34894947849017727
Epoch: 27, step: 783, loss: 0.310737282037735, mean loss: 0.3489485177088122
Epoch: 27, step: 784, loss: 0.3259941637516022, mean loss: 0.34894794057472733
Epoch: 27, step: 785, loss: 0.3204309642314911, mean loss: 0.3489472235994082
Epoch: 27, step: 786, loss: 0.35970768332481384, mean loss: 0.34894749413265086
Epoch: 27, step: 787, loss: 0.3229729235172272, mean loss: 0.34894684111146684
Epoch: 27, step: 788, loss: 0.36277395486831665, mean loss: 0.3489471887272689
Epoch: 27, step: 789, loss: 0.3700210154056549, mean loss: 0.348947718513248
Epoch: 27, step: 790, loss: 0.4135841429233551, mean loss: 0.34894934340136513
Epoch: 27, step: 791, loss: 0.3496701419353485, mean loss: 0.3489493615209864
Epoch: 27, step: 792, loss: 0.34107503294944763, mean loss: 0.34894916357903993
Epoch: 27, step: 793, loss: 0.28837448358535767, mean loss: 0.348947640913513
Epoch: 27, step: 794, loss: 0.35232511162757874, mean loss: 0.3489477258108489
Epoch: 27, step: 795, loss: 0.35611069202423096, mean loss: 0.3489479058572548
Epoch: 27, step: 796, loss: 0.3554832339286804, mean loss: 0.3489480701233871
Epoch: 27, step: 797, loss: 0.3022783696651459, mean loss: 0.34894689710522847
Epoch: 27, step: 798, loss: 0.3424651324748993, mean loss: 0.34894673419360833
Epoch: 27, step: 799, loss: 0.3440973460674286, mean loss: 0.3489466123129376
Epoch: 27, step: 800, loss: 0.4236980676651001, mean loss: 0.34894849100944547
Epoch: 27, step: 801, loss: 0.3669390082359314, mean loss: 0.34894894314609354
Epoch: 27, step: 802, loss: 0.3013668656349182, mean loss: 0.3489477473461008
Epoch: 27, step: 803, loss: 0.33261895179748535, mean loss: 0.3489473369923727
Epoch: 27, step: 804, loss: 0.33824214339256287, mean loss: 0.3489470679703437
Epoch: 27, step: 805, loss: 0.30231353640556335, mean loss: 0.34894589609690635
Epoch: 27, step: 806, loss: 0.33632662892341614, mean loss: 0.3489455789900544
Epoch: 27, step: 807, loss: 0.30101701617240906, mean loss: 0.3489443746337669
Epoch: 27, step: 808, loss: 0.30993402004241943, mean loss: 0.3489433944002168
Epoch: 27, step: 809, loss: 0.2912273406982422, mean loss: 0.3489419441752381
Epoch: 27, step: 810, loss: 0.31395992636680603, mean loss: 0.34894106520798246
Epoch: 27, step: 811, loss: 0.3176051676273346, mean loss: 0.3489402778738724
Epoch: 27, step: 812, loss: 0.3398001194000244, mean loss: 0.3489400482274194
Epoch: 27, step: 813, loss: 0.3647806644439697, mean loss: 0.34894044621285275
Epoch: 27, step: 814, loss: 0.33600106835365295, mean loss: 0.3489401211273602
Epoch: 27, step: 815, loss: 0.3411511480808258, mean loss: 0.3489399254441865
Epoch: 27, step: 816, loss: 0.29906222224235535, mean loss: 0.3489386723929818
Epoch: 27, step: 817, loss: 0.3178321421146393, mean loss: 0.3489378909396763
Epoch: 27, step: 818, loss: 0.3369480073451996, mean loss: 0.3489375897392946
Epoch: 27, step: 819, loss: 0.3325442969799042, mean loss: 0.34893717793029244
Epoch: 27, step: 820, loss: 0.30058038234710693, mean loss: 0.348935963210114
Epoch: 27, step: 821, loss: 0.3123009502887726, mean loss: 0.3489350429636201
Epoch: 27, step: 822, loss: 0.3447991609573364, mean loss: 0.3489349390756995
Epoch: 27, step: 823, loss: 0.29105865955352783, mean loss: 0.3489334853361355
Epoch: 27, step: 824, loss: 0.3090687394142151, mean loss: 0.34893248403641125
Epoch: 27, step: 825, loss: 0.383808434009552, mean loss: 0.34893336000843045
Epoch: 27, step: 826, loss: 0.39056065678596497, mean loss: 0.34893440552637034
Epoch: 27, step: 827, loss: 0.34446555376052856, mean loss: 0.3489342932887833
Epoch: 27, step: 828, loss: 0.3518526256084442, mean loss: 0.3489343665824096
Epoch: 27, step: 829, loss: 0.3641531765460968, mean loss: 0.34893474879171105
Epoch: 27, step: 830, loss: 0.35255753993988037, mean loss: 0.3489348397731809
Epoch: 27, step: 831, loss: 0.31143707036972046, mean loss: 0.3489338980913777
Epoch: 27, step: 832, loss: 0.3644382357597351, mean loss: 0.3489342874421642
Epoch: 27, step: 833, loss: 0.34651559591293335, mean loss: 0.3489342267045938
Epoch: 27, step: 834, loss: 0.3283561170101166, mean loss: 0.34893370996527995
Epoch: 27, step: 835, loss: 0.37039661407470703, mean loss: 0.3489342489092361
Epoch: 27, step: 836, loss: 0.35923439264297485, mean loss: 0.34893450754435806
Epoch: 27, step: 837, loss: 0.3496866524219513, mean loss: 0.3489345264301331
Epoch: 27, step: 838, loss: 0.3116236627101898, mean loss: 0.3489335896067791
Epoch: 27, step: 839, loss: 0.34459567070007324, mean loss: 0.3489334806904663
Epoch: 27, step: 840, loss: 0.3405841588973999, mean loss: 0.3489332710612566
Epoch: 27, step: 841, loss: 0.38852208852767944, mean loss: 0.34893426500595826
Epoch: 27, step: 842, loss: 0.3442847430706024, mean loss: 0.3489341482747204
Epoch: 27, step: 843, loss: 0.33441126346588135, mean loss: 0.3489337836712657
Epoch: 27, step: 844, loss: 0.33017295598983765, mean loss: 0.3489333126842027
Epoch: 27, step: 845, loss: 0.32010918855667114, mean loss: 0.3489325890781343
Epoch: 27, step: 846, loss: 0.3603825569152832, mean loss: 0.34893287651299904
Epoch: 27, step: 847, loss: 0.2885972261428833, mean loss: 0.3489313619118752
Epoch: 27, step: 848, loss: 0.3546135723590851, mean loss: 0.3489315045483801
Epoch: 27, step: 849, loss: 0.35437801480293274, mean loss: 0.34893164126483817
Epoch: 27, step: 850, loss: 0.3815324902534485, mean loss: 0.34893245957978053
Epoch: 27, step: 851, loss: 0.3419319689273834, mean loss: 0.3489322838646537
Epoch: 27, step: 852, loss: 0.36009156703948975, mean loss: 0.3489325639601125
Epoch: 27, step: 853, loss: 0.37385135889053345, mean loss: 0.3489331894004752
Epoch: 27, step: 854, loss: 0.31658563017845154, mean loss: 0.34893237752488293
Epoch: 27, step: 855, loss: 0.3575027883052826, mean loss: 0.34893259262403914
Epoch: 27, step: 856, loss: 0.3685334026813507, mean loss: 0.34893308455050565
Epoch: 27, step: 857, loss: 0.33218052983283997, mean loss: 0.34893266411797247
Epoch: 27, step: 858, loss: 0.30917927622795105, mean loss: 0.34893166646726126
Epoch: 27, step: 859, loss: 0.33912673592567444, mean loss: 0.34893142040897623
Epoch: 27, step: 860, loss: 0.3017228841781616, mean loss: 0.34893023572338233
Epoch: 27, step: 861, loss: 0.298268586397171, mean loss: 0.34892896441474175
Epoch: 27, step: 862, loss: 0.36621493101119995, mean loss: 0.34892939817968105
Epoch: 27, step: 863, loss: 0.333045095205307, mean loss: 0.3489289995973521
Epoch: 27, step: 864, loss: 0.30984383821487427, mean loss: 0.3489280188641229
Epoch: 27, step: 865, loss: 0.3380044996738434, mean loss: 0.34892774477572047
Epoch: 27, step: 866, loss: 0.30029261112213135, mean loss: 0.34892652447378464
Epoch: 27, step: 867, loss: 0.30371659994125366, mean loss: 0.3489253901420772
Epoch: 27, step: 868, loss: 0.31424474716186523, mean loss: 0.34892452001529944
Epoch: 27, step: 869, loss: 0.3901965022087097, mean loss: 0.3489255554907923
Epoch: 27, step: 870, loss: 0.3445223271846771, mean loss: 0.34892544502067746
Epoch: 27, step: 871, loss: 0.34370487928390503, mean loss: 0.34892531404813015
Epoch: 27, step: 872, loss: 0.32914847135543823, mean loss: 0.3489248179029584
Epoch: 27, step: 873, loss: 0.3216356635093689, mean loss: 0.34892413331226063
Epoch: 27, step: 874, loss: 0.33025866746902466, mean loss: 0.34892366507189126
Epoch: 27, step: 875, loss: 0.35351622104644775, mean loss: 0.34892378027748966
Epoch: 27, step: 876, loss: 0.35726508498191833, mean loss: 0.3489239895162882
Epoch: 27, step: 877, loss: 0.32905229926109314, mean loss: 0.3489234910541838
Epoch: 27, step: 878, loss: 0.3137742280960083, mean loss: 0.34892260939108005
Epoch: 27, step: 879, loss: 0.33450037240982056, mean loss: 0.3489222476413815
Epoch: 27, step: 880, loss: 0.31954464316368103, mean loss: 0.348921510788075
Epoch: 27, step: 881, loss: 0.34408658742904663, mean loss: 0.3489213895208726
Epoch: 27, step: 882, loss: 0.29782843589782715, mean loss: 0.34892010806433466
Epoch: 27, step: 883, loss: 0.3485566973686218, mean loss: 0.34892009894990106
Epoch: 27, step: 884, loss: 0.33615005016326904, mean loss: 0.3489197786818303
Epoch: 27, step: 885, loss: 0.32296350598335266, mean loss: 0.34891912772449724
Epoch: 27, step: 886, loss: 0.3740446865558624, mean loss: 0.3489197578325557
Epoch: 27, step: 887, loss: 0.3269101679325104, mean loss: 0.34891920588176073
Epoch: 27, step: 888, loss: 0.33600765466690063, mean loss: 0.3489188820973433
Epoch: 27, step: 889, loss: 0.32241010665893555, mean loss: 0.3489182173504794
Epoch: 27, step: 890, loss: 0.3076539635658264, mean loss: 0.34891718261405713
Epoch: 27, step: 891, loss: 0.33359095454216003, mean loss: 0.34891679830542943
Epoch: 27, step: 892, loss: 0.3113069236278534, mean loss: 0.34891585525298147
Epoch: 27, step: 893, loss: 0.3241785764694214, mean loss: 0.3489152349912397
Epoch: 27, step: 894, loss: 0.3072417676448822, mean loss: 0.34891419009824404
Epoch: 27, step: 895, loss: 0.35672879219055176, mean loss: 0.3489143860315028
Epoch: 27, step: 896, loss: 0.3345077931880951, mean loss: 0.3489140248282223
Epoch: 27, step: 897, loss: 0.316540390253067, mean loss: 0.3489132131741438
Epoch: 27, step: 898, loss: 0.3402636647224426, mean loss: 0.3489129963228276
Epoch: 27, step: 899, loss: 0.3397411108016968, mean loss: 0.3489127663818548
Epoch: 27, step: 900, loss: 0.3727058470249176, mean loss: 0.3489133628641091
Epoch: 27, step: 901, loss: 0.29180529713630676, mean loss: 0.34891193122545966
Epoch: 27, step: 902, loss: 0.34924450516700745, mean loss: 0.3489119395625267
Epoch: 27, step: 903, loss: 0.3531251549720764, mean loss: 0.3489120451780739
Epoch: 27, step: 904, loss: 0.30163174867630005, mean loss: 0.34891086000031085
Epoch: 27, step: 905, loss: 0.32294273376464844, mean loss: 0.34891020907219544
Epoch: 27, step: 906, loss: 0.33275410532951355, mean loss: 0.3489098041065671
Epoch: 27, step: 907, loss: 0.32964450120925903, mean loss: 0.3489093212184856
Epoch: 27, step: 908, loss: 0.4049454629421234, mean loss: 0.34891072573866816
Epoch: 27, step: 909, loss: 0.30166080594062805, mean loss: 0.3489095414707901
Epoch: 27, step: 910, loss: 0.32095029950141907, mean loss: 0.348908840720346
Epoch: 27, step: 911, loss: 0.3329988420009613, mean loss: 0.34890844197351095
Epoch: 27, step: 912, loss: 0.3454904556274414, mean loss: 0.34890835631183964
Epoch: 27, step: 913, loss: 0.3594038784503937, mean loss: 0.3489086193443227
Epoch: 27, step: 914, loss: 0.3095867931842804, mean loss: 0.34890763390898805
Epoch: 27, step: 915, loss: 0.33916401863098145, mean loss: 0.34890738973258273
Epoch: 27, step: 916, loss: 0.31833380460739136, mean loss: 0.34890662357332636
Epoch: 27, step: 917, loss: 0.31755486130714417, mean loss: 0.348905837933015
Epoch: 27, step: 918, loss: 0.2940542697906494, mean loss: 0.3489044634481341
Epoch: 27, step: 919, loss: 0.30046358704566956, mean loss: 0.3489032496344526
Epoch: 27, step: 920, loss: 0.3394525647163391, mean loss: 0.3489030128285963
Epoch: 27, step: 921, loss: 0.3040742874145508, mean loss: 0.3489018895831587
Epoch: 27, step: 922, loss: 0.3418225646018982, mean loss: 0.3489017122053686
Epoch: 27, step: 923, loss: 0.29252591729164124, mean loss: 0.3489002997029905
Epoch: 27, step: 924, loss: 0.3083420395851135, mean loss: 0.3488992835363251
Epoch: 27, step: 925, loss: 0.3488282561302185, mean loss: 0.348899281756814
Epoch: 27, step: 926, loss: 0.30915889143943787, mean loss: 0.348898286131352
Epoch: 27, step: 927, loss: 0.32819864153862, mean loss: 0.3488977675512189
Epoch: 27, step: 928, loss: 0.32084667682647705, mean loss: 0.3488970648157747
Epoch: 27, step: 929, loss: 0.31717580556869507, mean loss: 0.34889627015523944
Epoch: 27, step: 930, loss: 0.3375796675682068, mean loss: 0.34889598666610927
Epoch: 27, step: 931, loss: 0.3511863052845001, mean loss: 0.34889604403882013
Epoch: 27, step: 932, loss: 0.30893197655677795, mean loss: 0.3488950429600024
Epoch: 27, step: 933, loss: 0.3622915744781494, mean loss: 0.34889537852764724
Epoch: 27, step: 934, loss: 0.330220490694046, mean loss: 0.348894910754989
Epoch: 27, step: 935, loss: 0.3312675654888153, mean loss: 0.3488944692324646
Epoch: 27, step: 936, loss: 0.30700162053108215, mean loss: 0.3488934199438309
Epoch: 27, step: 937, loss: 0.3403538763523102, mean loss: 0.3488932060595552
Epoch: 27, step: 938, loss: 0.3221456706523895, mean loss: 0.3488925361485825
Epoch: 27, step: 939, loss: 0.3097791373729706, mean loss: 0.34889155655033627
Epoch: 27, step: 940, loss: 0.3404158055782318, mean loss: 0.34889134427978175
Epoch: 27, step: 941, loss: 0.36047008633613586, mean loss: 0.34889163425579117
Epoch: 27, step: 942, loss: 0.3457096517086029, mean loss: 0.34889155456876736
Epoch: 27, step: 943, loss: 0.3466053903102875, mean loss: 0.34889149731733343
Epoch: 27, step: 944, loss: 0.32725846767425537, mean loss: 0.34889095558418937
Epoch: 27, step: 945, loss: 0.3228674530982971, mean loss: 0.3488903039213836
Epoch: 27, step: 946, loss: 0.3354627788066864, mean loss: 0.34888996768687464
Epoch: 27, step: 947, loss: 0.3174579441547394, mean loss: 0.34888918062699054
Epoch: 27, step: 948, loss: 0.3656952977180481, mean loss: 0.34888960144270253
Epoch: 27, step: 949, loss: 0.3109733462333679, mean loss: 0.34888865206478653
Epoch: 27, step: 950, loss: 0.31407734751701355, mean loss: 0.3488877804529648
Epoch: 27, step: 951, loss: 0.28662553429603577, mean loss: 0.34888622155846916
Epoch: 27, step: 952, loss: 0.31483352184295654, mean loss: 0.3488853689834281
Epoch: 27, step: 953, loss: 0.3441625237464905, mean loss: 0.3488852507408454
Epoch: 27, step: 954, loss: 0.3271254003047943, mean loss: 0.34888470596828364
Epoch: 27, step: 955, loss: 0.33333534002304077, mean loss: 0.3488843166891442
Epoch: 27, step: 956, loss: 0.37284213304519653, mean loss: 0.34888491645923697
Epoch: 27, step: 957, loss: 0.3773987591266632, mean loss: 0.34888563026894676
Epoch: 27, step: 958, loss: 0.30090436339378357, mean loss: 0.3488844291457867
Epoch: 27, step: 959, loss: 0.2982683777809143, mean loss: 0.3488831620973396
Epoch: 27, step: 960, loss: 0.3376084268093109, mean loss: 0.3488828798691164
Epoch: 27, step: 961, loss: 0.3415523171424866, mean loss: 0.3488826963756815
Epoch: 27, step: 962, loss: 0.3391821086406708, mean loss: 0.34888245356354325
Epoch: 27, step: 963, loss: 0.3614442050457001, mean loss: 0.34888276798463563
Epoch: 27, step: 964, loss: 0.37281331419944763, mean loss: 0.3488833669520777
Epoch: 27, step: 965, loss: 0.3166225254535675, mean loss: 0.3488825595024732
Epoch: 27, step: 966, loss: 0.3344656825065613, mean loss: 0.34888219867461695
Epoch: 27, step: 967, loss: 0.3855387568473816, mean loss: 0.3488831160977367
Epoch: 27, step: 968, loss: 0.323831170797348, mean loss: 0.3488824891251086
Epoch: 27, step: 969, loss: 0.32796186208724976, mean loss: 0.348881965559689
Epoch: 27, step: 970, loss: 0.3439702093601227, mean loss: 0.3488818426397911
Epoch: 27, step: 971, loss: 0.3012852072715759, mean loss: 0.3488806515327999
Epoch: 27, step: 972, loss: 0.33973196148872375, mean loss: 0.3488804225923318
Epoch: 27, step: 973, loss: 0.3828945457935333, mean loss: 0.34888127375401545
Epoch: 27, step: 974, loss: 0.32140693068504333, mean loss: 0.3488805862595063
Epoch: 27, step: 975, loss: 0.37528687715530396, mean loss: 0.34888124701145545
Epoch: 27, step: 976, loss: 0.3016875088214874, mean loss: 0.34888006613473355
Epoch: 27, step: 977, loss: 0.3189278542995453, mean loss: 0.3488793166924117
Epoch: 27, step: 978, loss: 0.31104347109794617, mean loss: 0.3488783700152632
Epoch: 27, step: 979, loss: 0.35632023215293884, mean loss: 0.348878556210773
Epoch: 27, step: 980, loss: 0.3134508728981018, mean loss: 0.34887766983174645
Epoch: 27, step: 981, loss: 0.3995687961578369, mean loss: 0.3488789380610766
Epoch: 27, step: 982, loss: 0.3294845223426819, mean loss: 0.34887845284890484
Epoch: 27, step: 983, loss: 0.3157110810279846, mean loss: 0.34887762308377374
Epoch: 27, step: 984, loss: 0.3131558299064636, mean loss: 0.3488767294357319
Epoch: 27, step: 985, loss: 0.3500967025756836, mean loss: 0.34887675995489786
Epoch: 27, step: 986, loss: 0.2891486883163452, mean loss: 0.34887526581927214
Epoch: 27, step: 987, loss: 0.29342544078826904, mean loss: 0.34887387874139963
Epoch: 27, step: 988, loss: 0.34840890765190125, mean loss: 0.3488738671104346
Epoch: 27, step: 989, loss: 0.3223731517791748, mean loss: 0.34887320422796597
Epoch: 27, step: 990, loss: 0.3517688810825348, mean loss: 0.34887327665791307
Epoch: 27, step: 991, loss: 0.33882030844688416, mean loss: 0.3488730252079828
Epoch: 27, step: 992, loss: 0.30028170347213745, mean loss: 0.34887180984764327
Epoch: 27, step: 993, loss: 0.3019266128540039, mean loss: 0.3488706356893472
Epoch: 27, step: 994, loss: 0.3272334039211273, mean loss: 0.34887009452855966
Epoch: 27, step: 995, loss: 0.33303964138031006, mean loss: 0.3488696986088631
Epoch: 27, step: 996, loss: 0.3505670428276062, mean loss: 0.34886974105838714
Epoch: 27, step: 997, loss: 0.3430103361606598, mean loss: 0.34886959452197697
Epoch: 27, step: 998, loss: 0.31448256969451904, mean loss: 0.3488687345668709
Epoch: 27, step: 999, loss: 0.37560927867889404, mean loss: 0.34886940328108795
Epoch: 27, step: 1000, loss: 0.34785857796669006, mean loss: 0.34886937800350376
Epoch: 27, step: 1001, loss: 0.3354024291038513, mean loss: 0.3488690412455918
Epoch: 27, step: 1002, loss: 0.34411486983299255, mean loss: 0.34886892236455824
Epoch: 27, step: 1003, loss: 0.3484949767589569, mean loss: 0.348868913014048
Epoch: 27, step: 1004, loss: 0.3147181570529938, mean loss: 0.3488680590957133
Epoch: 27, step: 1005, loss: 0.32691267132759094, mean loss: 0.348867510128674
Epoch: 27, step: 1006, loss: 0.3128598630428314, mean loss: 0.3488666098249589
Epoch: 27, step: 1007, loss: 0.332163542509079, mean loss: 0.34886619220651416
Epoch: 27, step: 1008, loss: 0.3398803770542145, mean loss: 0.34886596754428567
Epoch: 27, step: 1009, loss: 0.31003689765930176, mean loss: 0.3488649967689998
Epoch: 27, step: 1010, loss: 0.33367809653282166, mean loss: 0.34886461708700184
Epoch: 27, step: 1011, loss: 0.3504921495914459, mean loss: 0.34886465777531445
Epoch: 27, step: 1012, loss: 0.3270781636238098, mean loss: 0.3488641131265769
Epoch: 27, step: 1013, loss: 0.34429192543029785, mean loss: 0.34886399882759944
Epoch: 27, step: 1014, loss: 0.3882559537887573, mean loss: 0.3488649835526191
Epoch: 27, step: 1015, loss: 0.3280336856842041, mean loss: 0.3488644628222454
Epoch: 27, step: 1016, loss: 0.33540937304496765, mean loss: 0.3488641264870429
Epoch: 27, step: 1017, loss: 0.3331882953643799, mean loss: 0.3488637346500404
Epoch: 27, step: 1018, loss: 0.3187529444694519, mean loss: 0.34886298201199756
Epoch: 27, step: 1019, loss: 0.36873701214790344, mean loss: 0.3488634787634007
Epoch: 27, step: 1020, loss: 0.3082064986228943, mean loss: 0.3488624625675412
Epoch: 27, step: 1021, loss: 0.36476263403892517, mean loss: 0.3488628599724768
Epoch: 27, step: 1022, loss: 0.3188123404979706, mean loss: 0.3488621089160305
Epoch: 27, step: 1023, loss: 0.30081605911254883, mean loss: 0.3488609081250227
Epoch: 27, step: 1024, loss: 0.34372085332870483, mean loss: 0.34886077966540213
Epoch: 27, step: 1025, loss: 0.3519245684146881, mean loss: 0.3488608562333221
Epoch: 27, step: 1026, loss: 0.35551661252975464, mean loss: 0.3488610225648552
Epoch: 27, step: 1027, loss: 0.3872023820877075, mean loss: 0.34886198071558294
Epoch: 27, step: 1028, loss: 0.3410172164440155, mean loss: 0.34886178467979134
Epoch: 27, step: 1029, loss: 0.35033321380615234, mean loss: 0.3488618214489734
Epoch: 27, step: 1030, loss: 0.3088855743408203, mean loss: 0.3488608225172882
Epoch: 27, step: 1031, loss: 0.31259459257125854, mean loss: 0.3488599163146409
Epoch: 27, step: 1032, loss: 0.31930485367774963, mean loss: 0.34885917782578163
Epoch: 27, step: 1033, loss: 0.3975432217121124, mean loss: 0.34886039425784116
Epoch: 27, step: 1034, loss: 0.35545778274536133, mean loss: 0.34886055909777036
Epoch: 27, step: 1035, loss: 0.35421404242515564, mean loss: 0.3488606928545995
Epoch: 27, step: 1036, loss: 0.3327040374279022, mean loss: 0.3488602891905039
Epoch: 27, step: 1037, loss: 0.3124251365661621, mean loss: 0.34885937890337493
Epoch: 27, step: 1038, loss: 0.32591450214385986, mean loss: 0.34885880566838956
Epoch: 27, step: 1039, loss: 0.3226909637451172, mean loss: 0.3488581519299584
Epoch: 27, step: 1040, loss: 0.31869253516197205, mean loss: 0.3488573983358949
Epoch: 27, step: 1041, loss: 0.3610002100467682, mean loss: 0.3488577016786806
Epoch: 27, step: 1042, loss: 0.30232787132263184, mean loss: 0.348856539333739
Epoch: 27, step: 1043, loss: 0.3475700616836548, mean loss: 0.3488565071975067
Epoch: 27, step: 1044, loss: 0.34930723905563354, mean loss: 0.3488565184565145
Epoch: 27, step: 1045, loss: 0.3469953238964081, mean loss: 0.3488564719661673
Epoch: 27, step: 1046, loss: 0.3597957193851471, mean loss: 0.34885674520826593
Epoch: 27, step: 1047, loss: 0.34821370244026184, mean loss: 0.34885672914665217
Epoch: 27, step: 1048, loss: 0.33092257380485535, mean loss: 0.3488562812071127
Epoch: 27, step: 1049, loss: 0.3120015859603882, mean loss: 0.3488553607141998
Epoch: 27, step: 1050, loss: 0.2992638051509857, mean loss: 0.3488541221329275
Epoch: 27, step: 1051, loss: 0.33999377489089966, mean loss: 0.34885390084553386
Epoch: 27, step: 1052, loss: 0.32628893852233887, mean loss: 0.3488533372991109
Epoch: 27, step: 1053, loss: 0.32104620337486267, mean loss: 0.3488526428499344
Epoch: 27, step: 1054, loss: 0.33760911226272583, mean loss: 0.3488523620635151
Epoch: 27, step: 1055, loss: 0.3313959836959839, mean loss: 0.34885192613357885
Epoch: 27, step: 1056, loss: 0.2962949872016907, mean loss: 0.3488506136866084
Epoch: 27, step: 1057, loss: 0.3479454219341278, mean loss: 0.34885059108280897
Epoch: 27, step: 1058, loss: 0.3490998446941376, mean loss: 0.34885059730683604
Epoch: 27, step: 1059, loss: 0.36625516414642334, mean loss: 0.34885103189949584
Epoch: 27, step: 1060, loss: 0.3206776976585388, mean loss: 0.34885032842789254
Epoch: 27, step: 1061, loss: 0.3159363865852356, mean loss: 0.34884950660662306
Epoch: 27, step: 1062, loss: 0.3361855745315552, mean loss: 0.34884919041147
Epoch: 27, step: 1063, loss: 0.3171997666358948, mean loss: 0.34884840020314645
Epoch: 27, step: 1064, loss: 0.3436623513698578, mean loss: 0.3488482707234862
Epoch: 27, step: 1065, loss: 0.30288687348365784, mean loss: 0.34884712323766104
Epoch: 27, step: 1066, loss: 0.2968761920928955, mean loss: 0.3488458257484301
Epoch: 27, step: 1067, loss: 0.338113933801651, mean loss: 0.3488455578262225
Epoch: 27, step: 1068, loss: 0.3314610421657562, mean loss: 0.3488451238317731
Epoch: 27, step: 1069, loss: 0.3383640944957733, mean loss: 0.3488448621854269
Epoch: 27, step: 1070, loss: 0.3224138915538788, mean loss: 0.34884420238436764
Epoch: 27, step: 1071, loss: 0.3167770206928253, mean loss: 0.3488434019055436
Epoch: 27, step: 1072, loss: 0.3546565771102905, mean loss: 0.34884354701363385
Epoch: 27, step: 1073, loss: 0.3109149634838104, mean loss: 0.34884260026650366
Epoch: 27, step: 1074, loss: 0.34553468227386475, mean loss: 0.3488425176985983
Epoch: 27, step: 1075, loss: 0.3568281829357147, mean loss: 0.3488427170213129
Epoch: 27, step: 1076, loss: 0.34724149107933044, mean loss: 0.3488426770556086
Epoch: 27, step: 1077, loss: 0.3108825981616974, mean loss: 0.3488417296169101
Epoch: 27, step: 1078, loss: 0.3144364356994629, mean loss: 0.3488408709228747
Epoch: 27, step: 1079, loss: 0.3495017886161804, mean loss: 0.3488408874177757
Epoch: 27, step: 1080, loss: 0.3537946045398712, mean loss: 0.3488410110474426
Epoch: 27, step: 1081, loss: 0.3436880111694336, mean loss: 0.34884088244749556
Epoch: 27, step: 1082, loss: 0.3198595345020294, mean loss: 0.34884015919756556
Epoch: 27, step: 1083, loss: 0.35562196373939514, mean loss: 0.34884032843804624
Epoch: 27, step: 1084, loss: 0.291071355342865, mean loss: 0.3488388868446268
Epoch: 27, step: 1085, loss: 0.3478190302848816, mean loss: 0.3488388613952941
Epoch: 27, step: 1086, loss: 0.4034843444824219, mean loss: 0.3488402249756581
Epoch: 27, step: 1087, loss: 0.3309739828109741, mean loss: 0.3488397791666411
Epoch: 27, step: 1088, loss: 0.31567367911338806, mean loss: 0.3488389516071917
Epoch: 27, step: 1089, loss: 0.319021612405777, mean loss: 0.3488382076244779
Epoch: 27, step: 1090, loss: 0.3313991129398346, mean loss: 0.34883777250646886
Epoch: 27, step: 1091, loss: 0.31069833040237427, mean loss: 0.34883682092358204
Epoch: 27, step: 1092, loss: 0.31258657574653625, mean loss: 0.34883591649891255
Epoch: 27, step: 1093, loss: 0.3249887526035309, mean loss: 0.348835321539482
Epoch: 27, step: 1094, loss: 0.34858742356300354, mean loss: 0.34883531535486567
Epoch: 27, step: 1095, loss: 0.3794111907482147, mean loss: 0.348836078149881
Epoch: 27, step: 1096, loss: 0.3728671967983246, mean loss: 0.34883667765390114
Epoch: 27, step: 1097, loss: 0.33718204498291016, mean loss: 0.3488363869131769
Epoch: 27, step: 1098, loss: 0.37608250975608826, mean loss: 0.3488370665879553
Epoch: 27, step: 1099, loss: 0.3559044301509857, mean loss: 0.34883724288419266
Epoch: 27, step: 1100, loss: 0.32888782024383545, mean loss: 0.34883674525584973
Epoch: 27, step: 1101, loss: 0.32026055455207825, mean loss: 0.3488360324548843
Epoch: 27, step: 1102, loss: 0.34398025274276733, mean loss: 0.3488359113359371
Epoch: 27, step: 1103, loss: 0.33242928981781006, mean loss: 0.34883550211161507
Epoch: 27, step: 1104, loss: 0.3313443958759308, mean loss: 0.34883506584827145
Epoch: 27, step: 1105, loss: 0.31911584734916687, mean loss: 0.3488343246097196
Epoch: 27, step: 1106, loss: 0.29203641414642334, mean loss: 0.34883290802634354
Epoch: 27, step: 1107, loss: 0.3128538727760315, mean loss: 0.3488320107040358
Epoch: 27, step: 1108, loss: 0.30797648429870605, mean loss: 0.3488309917867501
Epoch: 27, step: 1109, loss: 0.34131547808647156, mean loss: 0.34883080435810776
Epoch: 27, step: 1110, loss: 0.32735970616340637, mean loss: 0.34883026890589713
Epoch: 27, step: 1111, loss: 0.3730781078338623, mean loss: 0.3488308735901597
Epoch: 27, step: 1112, loss: 0.3079238831996918, mean loss: 0.3488298534911499
Epoch: 27, step: 1113, loss: 0.32907164096832275, mean loss: 0.3488293607922191
Epoch: 27, step: 1114, loss: 0.3568696975708008, mean loss: 0.34882956128437126
Epoch: 27, step: 1115, loss: 0.34945622086524963, mean loss: 0.34882957691023353
Epoch: 27, step: 1116, loss: 0.3275459408760071, mean loss: 0.34882904621241445
Epoch: 27, step: 1117, loss: 0.39650753140449524, mean loss: 0.348830235024193
Epoch: 27, step: 1118, loss: 0.34501174092292786, mean loss: 0.348830139816521
Epoch: 27, step: 1119, loss: 0.35599228739738464, mean loss: 0.34883031838806733
Epoch: 27, step: 1120, loss: 0.34509310126304626, mean loss: 0.3488302252115452
Epoch: 27, step: 1121, loss: 0.343797504901886, mean loss: 0.3488300997385881
Epoch: 27, step: 1122, loss: 0.3920309841632843, mean loss: 0.34883117677193115
Epoch: 27, step: 1123, loss: 0.31613293290138245, mean loss: 0.3488303615983205
Epoch: 27, step: 1124, loss: 0.3595349192619324, mean loss: 0.3488306284583824
Epoch: 27, step: 1125, loss: 0.3394913971424103, mean loss: 0.34883039564112867
Epoch: 27, step: 1126, loss: 0.3562265634536743, mean loss: 0.34883058001524836
Epoch: 27, step: 1127, loss: 0.34050044417381287, mean loss: 0.34883037236404085
Epoch: 27, step: 1128, loss: 0.34318578243255615, mean loss: 0.3488302316608494
Epoch: 27, step: 1129, loss: 0.3430792987346649, mean loss: 0.34883008831041007
Epoch: 27, step: 1130, loss: 0.3622468113899231, mean loss: 0.3488304227335781
Epoch: 27, step: 1131, loss: 0.3166538178920746, mean loss: 0.34882962072448437
Epoch: 27, step: 1132, loss: 0.3418184816837311, mean loss: 0.3488294459746267
Epoch: 27, step: 1133, loss: 0.3051494359970093, mean loss: 0.34882835729485057
Epoch: 27, step: 1134, loss: 0.3409948945045471, mean loss: 0.3488281620586322
Epoch: 27, step: 1135, loss: 0.32874763011932373, mean loss: 0.34882766159676554
Epoch: 27, step: 1136, loss: 0.3199966847896576, mean loss: 0.34882694306774853
Epoch: 27, step: 1137, loss: 0.31336575746536255, mean loss: 0.34882605932190786
Epoch: 27, step: 1138, loss: 0.3340376615524292, mean loss: 0.3488256907820776
Epoch: 27, step: 1139, loss: 0.34869804978370667, mean loss: 0.34882568760123134
Epoch: 27, step: 1140, loss: 0.33464786410331726, mean loss: 0.3488253342950563
Epoch: 27, step: 1141, loss: 0.33266356587409973, mean loss: 0.34882493155973554
Epoch: 27, step: 1142, loss: 0.3281441628932953, mean loss: 0.3488244162282296
Epoch: 27, step: 1143, loss: 0.3175949156284332, mean loss: 0.3488236380586741
Epoch: 27, step: 1144, loss: 0.30693483352661133, mean loss: 0.3488225943090284
Epoch: 27, step: 1145, loss: 0.39634618163108826, mean loss: 0.3488237784318998
Epoch: 27, step: 1146, loss: 0.34896320104599, mean loss: 0.348823781905741
Epoch: 27, step: 1147, loss: 0.3196161091327667, mean loss: 0.34882305418816145
Epoch: 27, step: 1148, loss: 0.341730535030365, mean loss: 0.3488228774804066
Epoch: 27, step: 1149, loss: 0.32703420519828796, mean loss: 0.3488223346364113
Epoch: 27, step: 1150, loss: 0.3759515881538391, mean loss: 0.34882301051905706
Epoch: 27, step: 1151, loss: 0.349651038646698, mean loss: 0.34882303114756047
Epoch: 27, step: 1152, loss: 0.3246893286705017, mean loss: 0.3488224299243105
Epoch: 27, step: 1153, loss: 0.3080514669418335, mean loss: 0.34882141425585894
Epoch: 27, step: 1154, loss: 0.3386855125427246, mean loss: 0.34882116176098527
Epoch: 27, step: 1155, loss: 0.31525561213493347, mean loss: 0.34882032563230786
Epoch: 27, step: 1156, loss: 0.330819696187973, mean loss: 0.34881987724198665
Epoch: 27, step: 1157, loss: 0.3370732069015503, mean loss: 0.34881958464321366
Epoch: 27, step: 1158, loss: 0.3457229733467102, mean loss: 0.3488195075113907
Epoch: 27, step: 1159, loss: 0.3452245593070984, mean loss: 0.34881941796899246
Epoch: 27, step: 1160, loss: 0.31021398305892944, mean loss: 0.34881845641490866
Epoch: 27, step: 1161, loss: 0.3272137939929962, mean loss: 0.3488179183162182
Epoch: 27, step: 1162, loss: 0.31791460514068604, mean loss: 0.34881714863892066
Epoch: 27, step: 1163, loss: 0.32593822479248047, mean loss: 0.34881657883109424
Epoch: 27, step: 1164, loss: 0.3203052282333374, mean loss: 0.3488158687633385
Epoch: 27, step: 1165, loss: 0.312975138425827, mean loss: 0.34881497618152
Epoch: 27, step: 1166, loss: 0.36637377738952637, mean loss: 0.3488154134571073
Epoch: 27, step: 1167, loss: 0.3292124271392822, mean loss: 0.34881492528631547
Epoch: 27, step: 1168, loss: 0.34585604071617126, mean loss: 0.34881485160340664
Epoch: 27, step: 1169, loss: 0.3324015736579895, mean loss: 0.3488144428858922
Epoch: 27, step: 1170, loss: 0.338800847530365, mean loss: 0.34881419353716947
Epoch: 27, step: 1171, loss: 0.3317999541759491, mean loss: 0.3488137698758308
Epoch: 27, step: 1172, loss: 0.3140626549720764, mean loss: 0.3488129045807708
Epoch: 27, step: 1173, loss: 0.3373914361000061, mean loss: 0.3488126201958178
Epoch: 27, step: 1174, loss: 0.31439879536628723, mean loss: 0.3488117633418769
Epoch: 27, step: 1175, loss: 0.3273337781429291, mean loss: 0.34881122858475117
Epoch: 27, step: 1176, loss: 0.29340752959251404, mean loss: 0.34880984918231145
Epoch: 27, step: 1177, loss: 0.36630526185035706, mean loss: 0.3488102847599808
Epoch: 27, step: 1178, loss: 0.3119610548019409, mean loss: 0.3488093673593794
Epoch: 27, step: 1179, loss: 0.36718612909317017, mean loss: 0.348809824856933
Epoch: 27, step: 1180, loss: 0.3095560669898987, mean loss: 0.3488088476417206
Epoch: 27, step: 1181, loss: 0.3250572979450226, mean loss: 0.3488082563659004
Epoch: 27, step: 1182, loss: 0.31444743275642395, mean loss: 0.34880740100199087
Epoch: 27, step: 1183, loss: 0.3222273588180542, mean loss: 0.34880673934605677
Epoch: 27, step: 1184, loss: 0.3617006540298462, mean loss: 0.3488070603057731
Epoch: 27, step: 1185, loss: 0.3347388803958893, mean loss: 0.3488067101245636
Epoch: 27, step: 1186, loss: 0.33525434136390686, mean loss: 0.34880637279117815
Epoch: 27, step: 1187, loss: 0.31938934326171875, mean loss: 0.3488056405871377
Epoch: 27, step: 1188, loss: 0.31369367241859436, mean loss: 0.3488047666550828
Epoch: 27, step: 1189, loss: 0.3568263649940491, mean loss: 0.3488049663065921
Epoch: 27, step: 1190, loss: 0.3260452151298523, mean loss: 0.3488043998477161
Epoch: 27, step: 1191, loss: 0.3338588774204254, mean loss: 0.3488040278834944
Epoch: 27, step: 1192, loss: 0.3595762848854065, mean loss: 0.34880429597679724
Epoch: 27, step: 1193, loss: 0.3130837678909302, mean loss: 0.3488034070084013
Epoch: 27, step: 1194, loss: 0.30834344029426575, mean loss: 0.34880240011576724
Epoch: 27, step: 1195, loss: 0.3533899188041687, mean loss: 0.3488025142785855
Epoch: 27, step: 1196, loss: 0.33016571402549744, mean loss: 0.34880205050353874
Epoch: 27, step: 1197, loss: 0.32434192299842834, mean loss: 0.3488014418306799
Epoch: 27, step: 1198, loss: 0.32382941246032715, mean loss: 0.34880082043497057
Epoch: 27, step: 1199, loss: 0.33737021684646606, mean loss: 0.34880053600669375
Epoch: 27, step: 1200, loss: 0.36623817682266235, mean loss: 0.3488009698975797
Epoch: 27, step: 1201, loss: 0.3162628412246704, mean loss: 0.3488001602899989
Epoch: 27, step: 1202, loss: 0.3329415023326874, mean loss: 0.3487997657076805
Epoch: 27, step: 1203, loss: 0.3505941331386566, mean loss: 0.3487998103525708
Epoch: 27, step: 1204, loss: 0.35299941897392273, mean loss: 0.34879991483864103
Epoch: 27, step: 1205, loss: 0.3499821722507477, mean loss: 0.3487999442524195
Epoch: 27, step: 1206, loss: 0.3144429922103882, mean loss: 0.34879908949555816
Epoch: 27, step: 1207, loss: 0.34194880723953247, mean loss: 0.3487989190735695
Epoch: 27, step: 1208, loss: 0.2843500077724457, mean loss: 0.3487973157471695
Epoch: 27, step: 1209, loss: 0.366714745759964, mean loss: 0.34879776147655933
Epoch: 27, step: 1210, loss: 0.3312094211578369, mean loss: 0.34879732394477203
Epoch: 27, step: 1211, loss: 0.3554600477218628, mean loss: 0.34879748968416946
Epoch: 27, step: 1212, loss: 0.3235916495323181, mean loss: 0.3487968626888173
Epoch: 27, step: 1213, loss: 0.30674856901168823, mean loss: 0.34879581676339877
Epoch: 27, step: 1214, loss: 0.3602707087993622, mean loss: 0.348796102187174
Epoch: 27, step: 1215, loss: 0.32311177253723145, mean loss: 0.3487954633370683
Epoch: 27, step: 1216, loss: 0.3176755905151367, mean loss: 0.3487946893071511
Epoch: 27, step: 1217, loss: 0.35636088252067566, mean loss: 0.3487948774928252
Epoch: 27, step: 1218, loss: 0.32776498794555664, mean loss: 0.3487943544523211
Epoch: 27, step: 1219, loss: 0.33072927594184875, mean loss: 0.34879390516166975
Epoch: 27, step: 1220, loss: 0.33564257621765137, mean loss: 0.3487935780874092
Epoch: 27, step: 1221, loss: 0.3304569721221924, mean loss: 0.34879312206637053
Epoch: 27, step: 1222, loss: 0.3335673213005066, mean loss: 0.34879274341871774
Epoch: 27, step: 1223, loss: 0.3467099368572235, mean loss: 0.34879269162307064
Epoch: 27, step: 1224, loss: 0.33763790130615234, mean loss: 0.34879241423042856
Epoch: 27, step: 1225, loss: 0.3653995990753174, mean loss: 0.34879282720065896
Epoch: 27, step: 1226, loss: 0.36646756529808044, mean loss: 0.3487932667067661
Epoch: 27, step: 1227, loss: 0.3500235378742218, mean loss: 0.34879329729835074
Epoch: 27, step: 1228, loss: 0.31417223811149597, mean loss: 0.3487924364420167
Epoch: 27, step: 1229, loss: 0.3224354386329651, mean loss: 0.34879178108874676
Epoch: 27, step: 1230, loss: 0.3221045732498169, mean loss: 0.34879111754147213
Epoch: 27, step: 1231, loss: 0.3426492512226105, mean loss: 0.3487909648347014
Epoch: 27, step: 1232, loss: 0.3336728811264038, mean loss: 0.3487905889593202
Epoch: 27, step: 1233, loss: 0.3302801847457886, mean loss: 0.34879012875335796
Epoch: 27, step: 1234, loss: 0.36764606833457947, mean loss: 0.34879059753837105
Epoch: 27, step: 1235, loss: 0.2994634509086609, mean loss: 0.34878937122704873
Epoch: 27, step: 1236, loss: 0.29584285616874695, mean loss: 0.3487880549681287
Epoch: 27, step: 1237, loss: 0.2997475862503052, mean loss: 0.34878683584445946
Epoch: 27, step: 1238, loss: 0.3410514295101166, mean loss: 0.34878664355056893
Epoch: 27, step: 1239, loss: 0.3299969434738159, mean loss: 0.3487861764704238
Epoch: 27, step: 1240, loss: 0.31389203667640686, mean loss: 0.34878530908272354
Epoch: 27, step: 1241, loss: 0.34575504064559937, mean loss: 0.3487852337591233
Epoch: 27, step: 1242, loss: 0.3293953239917755, mean loss: 0.3487847517947235
Epoch: 27, step: 1243, loss: 0.32507166266441345, mean loss: 0.34878416238606547
Epoch: 27, step: 1244, loss: 0.32713836431503296, mean loss: 0.34878362437502797
Epoch: 27, step: 1245, loss: 0.32431381940841675, mean loss: 0.3487830161877991
Epoch: 27, step: 1246, loss: 0.2787274420261383, mean loss: 0.3487812750277603
Epoch: 27, step: 1247, loss: 0.32220688462257385, mean loss: 0.348780614564732
Epoch: 27, step: 1248, loss: 0.33615997433662415, mean loss: 0.3487803009071475
Epoch: 27, step: 1249, loss: 0.32562994956970215, mean loss: 0.3487797255716105
Epoch: 27, step: 1250, loss: 0.3731660544872284, mean loss: 0.34878033160876143
Epoch: 27, step: 1251, loss: 0.3218039274215698, mean loss: 0.3487796612209834
Epoch: 27, step: 1252, loss: 0.35661780834198, mean loss: 0.34877985600111117
Epoch: 27, step: 1253, loss: 0.3398876190185547, mean loss: 0.34877963503204945
Epoch: 27, step: 1254, loss: 0.3118703067302704, mean loss: 0.3487787178705977
Epoch: 27, step: 1255, loss: 0.30391234159469604, mean loss: 0.3487776030118293
Epoch: 27, step: 1256, loss: 0.4030133783817291, mean loss: 0.348778950651918
Epoch: 27, step: 1257, loss: 0.2989512085914612, mean loss: 0.3487777125725546
Epoch: 27, step: 1258, loss: 0.32769298553466797, mean loss: 0.34877718868935736
Epoch: 27, step: 1259, loss: 0.33489182591438293, mean loss: 0.3487768436942576
Epoch: 27, step: 1260, loss: 0.31223419308662415, mean loss: 0.3487759357797602
Epoch: 27, step: 1261, loss: 0.3394815921783447, mean loss: 0.3487757048643912
Epoch: 27, step: 1262, loss: 0.2901221811771393, mean loss: 0.3487742476701926
Epoch: 27, step: 1263, loss: 0.3184339702129364, mean loss: 0.3487734939119332
Epoch: 27, step: 1264, loss: 0.31502094864845276, mean loss: 0.3487726554018777
Epoch: 27, step: 1265, loss: 0.34643396735191345, mean loss: 0.3487725973036005
Epoch: 27, step: 1266, loss: 0.3389096260070801, mean loss: 0.3487723522912717
Epoch: 27, step: 1267, loss: 0.32360976934432983, mean loss: 0.34877172722710864
Epoch: 27, step: 1268, loss: 0.32702675461769104, mean loss: 0.34877118707328175
Epoch: 27, step: 1269, loss: 0.3436138927936554, mean loss: 0.34877105896720895
Epoch: 27, step: 1270, loss: 0.31991711258888245, mean loss: 0.34877034225923365
Epoch: 27, step: 1271, loss: 0.34335681796073914, mean loss: 0.3487702077951428
Epoch: 27, step: 1272, loss: 0.32185912132263184, mean loss: 0.34876953937939376
Epoch: 27, step: 1273, loss: 0.34254682064056396, mean loss: 0.3487693848237647
Epoch: 27, step: 1274, loss: 0.35529690980911255, mean loss: 0.34876954694593604
Epoch: 27, step: 1275, loss: 0.31226494908332825, mean loss: 0.34876864031475524
Epoch: 27, step: 1276, loss: 0.35065314173698425, mean loss: 0.3487686871172244
Epoch: 27, step: 1277, loss: 0.3211074471473694, mean loss: 0.34876800015452714
Epoch: 27, step: 1278, loss: 0.3227982223033905, mean loss: 0.34876735521505187
Epoch: 27, step: 1279, loss: 0.38091254234313965, mean loss: 0.34876815349624607
Epoch: 27, step: 1280, loss: 0.3486599922180176, mean loss: 0.34876815081027723
Epoch: 27, step: 1281, loss: 0.33348363637924194, mean loss: 0.34876777125938496
Epoch: 27, step: 1282, loss: 0.29531383514404297, mean loss: 0.34876644390381606
Epoch: 27, step: 1283, loss: 0.31984710693359375, mean loss: 0.34876572580347415
Epoch: 27, step: 1284, loss: 0.3202669620513916, mean loss: 0.3487650181640196
Epoch: 27, step: 1285, loss: 0.3631886839866638, mean loss: 0.34876537630241716
Epoch: 27, step: 1286, loss: 0.3156937062740326, mean loss: 0.34876455515604776
Epoch: 27, step: 1287, loss: 0.3301723599433899, mean loss: 0.3487640935363434
Epoch: 27, step: 1288, loss: 0.3169604241847992, mean loss: 0.348763303912753
Epoch: 27, step: 1289, loss: 0.30826684832572937, mean loss: 0.348762298489058
Epoch: 27, step: 1290, loss: 0.3149375915527344, mean loss: 0.348761458728713
Epoch: 27, step: 1291, loss: 0.3181268274784088, mean loss: 0.34876069818672567
Epoch: 27, step: 1292, loss: 0.3415665924549103, mean loss: 0.3487605195887333
Epoch: 27, step: 1293, loss: 0.3425453305244446, mean loss: 0.348760365296765
Epoch: 27, step: 1294, loss: 0.3226720690727234, mean loss: 0.34875971767130953
Epoch: 27, step: 1295, loss: 0.3315191864967346, mean loss: 0.34875928969665027
Epoch: 27, step: 1296, loss: 0.3273315727710724, mean loss: 0.3487587577935368
Epoch: 27, step: 1297, loss: 0.34895387291908264, mean loss: 0.34875876263678574
Epoch: 27, step: 1298, loss: 0.34166401624679565, mean loss: 0.3487585865316801
Epoch: 27, step: 1299, loss: 0.36709722876548767, mean loss: 0.34875904172037736
Epoch: 27, step: 1300, loss: 0.3242618143558502, mean loss: 0.348758433682765
Epoch: 27, step: 1301, loss: 0.35312163829803467, mean loss: 0.3487585419777418
Epoch: 27, step: 1302, loss: 0.3331599533557892, mean loss: 0.3487581548295295
Epoch: 27, step: 1303, loss: 0.3266325891017914, mean loss: 0.34875760569903885
Epoch: 27, step: 1304, loss: 0.3212888240814209, mean loss: 0.3487569239731406
Epoch: 27, step: 1305, loss: 0.3144151568412781, mean loss: 0.34875607169321976
Epoch: 27, step: 1306, loss: 0.35792192816734314, mean loss: 0.348756299162049
Epoch: 27, step: 1307, loss: 0.32065415382385254, mean loss: 0.3487556017691232
Epoch: 27, step: 1308, loss: 0.34096914529800415, mean loss: 0.34875540854241965
Epoch: 27, step: 1309, loss: 0.3337869346141815, mean loss: 0.3487550370978336
Epoch: 27, step: 1310, loss: 0.3116667866706848, mean loss: 0.3487541167710159
Epoch: 27, step: 1311, loss: 0.37213054299354553, mean loss: 0.34875469683121996
Epoch: 27, step: 1312, loss: 0.32328033447265625, mean loss: 0.3487540647287322
Epoch: 27, step: 1313, loss: 0.3657115399837494, mean loss: 0.3487544854888745
Epoch: 27, step: 1314, loss: 0.3386760354042053, mean loss: 0.3487542354218799
Epoch: 27, step: 1315, loss: 0.31338363885879517, mean loss: 0.34875335782668926
Epoch: 27, step: 1316, loss: 0.32126545906066895, mean loss: 0.3487526758294491
Epoch: 27, step: 1317, loss: 0.3540419340133667, mean loss: 0.34875280705701284
Epoch: 27, step: 1318, loss: 0.31059810519218445, mean loss: 0.3487518604546394
Epoch: 27, step: 1319, loss: 0.297619104385376, mean loss: 0.3487505919035808
Epoch: 27, step: 1320, loss: 0.38131123781204224, mean loss: 0.34875139967965835
Epoch: 27, step: 1321, loss: 0.34692317247390747, mean loss: 0.34875135432547316
Epoch: 27, step: 1322, loss: 0.3210066258907318, mean loss: 0.3487506660585377
Epoch: 27, step: 1323, loss: 0.33540648221969604, mean loss: 0.3487503350359182
Epoch: 27, step: 1324, loss: 0.37089040875434875, mean loss: 0.34875088424023737
Epoch: 27, step: 1325, loss: 0.3309005796909332, mean loss: 0.34875044145846057
Epoch: 27, step: 1326, loss: 0.3437890410423279, mean loss: 0.34875031839259385
Epoch: 27, step: 1327, loss: 0.35309410095214844, mean loss: 0.34875042613598506
Epoch: 27, step: 1328, loss: 0.34805646538734436, mean loss: 0.3487504089233763
Epoch: 27, step: 1329, loss: 0.3533755838871002, mean loss: 0.34875052364074727
Epoch: 27, step: 1330, loss: 0.36953994631767273, mean loss: 0.348751039264217
Epoch: 27, step: 1331, loss: 0.31374213099479675, mean loss: 0.34875017098772226
Epoch: 27, step: 1332, loss: 0.3347955644130707, mean loss: 0.3487498248999126
Epoch: 27, step: 1333, loss: 0.37623655796051025, mean loss: 0.34875050658070866
Epoch: 27, step: 1334, loss: 0.3303351104259491, mean loss: 0.3487500498836337
Epoch: 27, step: 1335, loss: 0.3589968979358673, mean loss: 0.34875030399652057
Epoch: 27, step: 1336, loss: 0.3027394115924835, mean loss: 0.34874916299484904
Epoch: 27, step: 1337, loss: 0.3080970346927643, mean loss: 0.34874815490755295
Epoch: 27, step: 1338, loss: 0.3165261149406433, mean loss: 0.3487473558885343
Epoch: 27, step: 1339, loss: 0.2849756181240082, mean loss: 0.34874577456196804
Epoch: 27, step: 1340, loss: 0.36764660477638245, mean loss: 0.34874624322794573
Epoch: 27, step: 1341, loss: 0.3018869161605835, mean loss: 0.3487450813304236
Epoch: 27, step: 1342, loss: 0.3097010850906372, mean loss: 0.3487441132414538
Epoch: 27, step: 1343, loss: 0.31458374857902527, mean loss: 0.34874326626226454
Epoch: 27, step: 1344, loss: 0.3339449465274811, mean loss: 0.348742899358743
Epoch: 27, step: 1345, loss: 0.3424171507358551, mean loss: 0.3487427425245926
Epoch: 27, step: 1346, loss: 0.3763516843318939, mean loss: 0.3487434270155262
Epoch: 27, step: 1347, loss: 0.35416439175605774, mean loss: 0.34874356141072504
Epoch: 27, step: 1348, loss: 0.3593917787075043, mean loss: 0.34874382539211424
Epoch: 27, step: 1349, loss: 0.29950982332229614, mean loss: 0.34874260485559605
Epoch: 27, step: 1350, loss: 0.35531091690063477, mean loss: 0.34874276768343127
Epoch: 27, step: 1351, loss: 0.294992059469223, mean loss: 0.3487414352414825
Epoch: 27, step: 1352, loss: 0.324550598859787, mean loss: 0.3487408355826644
Epoch: 27, step: 1353, loss: 0.34413865208625793, mean loss: 0.3487407215034542
Epoch: 27, step: 1354, loss: 0.34531107544898987, mean loss: 0.34874063649128223
Epoch: 27, step: 1355, loss: 0.35373398661613464, mean loss: 0.34874076026061906
Epoch: 27, step: 1356, loss: 0.3103553354740143, mean loss: 0.3487398088310792
Epoch: 27, step: 1357, loss: 0.35403770208358765, mean loss: 0.34873994014256615
Epoch: 27, step: 1358, loss: 0.31044065952301025, mean loss: 0.34873899089527094
Epoch: 27, step: 1359, loss: 0.36809834837913513, mean loss: 0.34873947070486455
Epoch: 27, step: 1360, loss: 0.32357174158096313, mean loss: 0.3487388469538639
Epoch: 27, step: 1361, loss: 0.3521444499492645, mean loss: 0.34873893135542516
Epoch: 27, step: 1362, loss: 0.3144604563713074, mean loss: 0.3487380818479784
Epoch: 27, step: 1363, loss: 0.3150489926338196, mean loss: 0.34873724696769454
Epoch: 27, step: 1364, loss: 0.3377603590488434, mean loss: 0.34873697494608724
Epoch: 27, step: 1365, loss: 0.2833746671676636, mean loss: 0.34873535522294263
Epoch: 27, step: 1366, loss: 0.34732839465141296, mean loss: 0.3487353203583516
Epoch: 27, step: 1367, loss: 0.3440988063812256, mean loss: 0.34873520546802605
Epoch: 27, step: 1368, loss: 0.2884702980518341, mean loss: 0.34873371217299876
Epoch: 27, step: 1369, loss: 0.35101884603500366, mean loss: 0.3487337687945821
Epoch: 27, step: 1370, loss: 0.29123836755752563, mean loss: 0.3487323441953295
Epoch: 27, step: 1371, loss: 0.38753968477249146, mean loss: 0.3487333057250762
Epoch: 27, step: 1372, loss: 0.32334619760513306, mean loss: 0.34873267672410696
Epoch: 27, step: 1373, loss: 0.30707770586013794, mean loss: 0.3487316446897463
Epoch: 27, step: 1374, loss: 0.3520147204399109, mean loss: 0.34873172602849095
Epoch: 27, step: 1375, loss: 0.37754905223846436, mean loss: 0.34873243996482556
Epoch: 27, step: 1376, loss: 0.3433031141757965, mean loss: 0.34873230545904604
Epoch: 27, step: 1377, loss: 0.3276912569999695, mean loss: 0.3487317842023335
Epoch: 27, step: 1378, loss: 0.3106137216091156, mean loss: 0.3487308399146085
Epoch: 27, step: 1379, loss: 0.321071594953537, mean loss: 0.3487301547371174
Epoch: 27, step: 1380, loss: 0.33689963817596436, mean loss: 0.34872986167767667
Epoch: 27, step: 1381, loss: 0.29997023940086365, mean loss: 0.34872865385943846
Epoch: 27, step: 1382, loss: 0.34104421734809875, mean loss: 0.3487284635139798
Epoch: 27, step: 1383, loss: 0.3371087908744812, mean loss: 0.34872817569884457
Epoch: 27, step: 1384, loss: 0.36456426978111267, mean loss: 0.3487285679435151
Epoch: 27, step: 1385, loss: 0.33540964126586914, mean loss: 0.34872823805480757
Epoch: 27, step: 1386, loss: 0.30683326721191406, mean loss: 0.3487272004084709
Epoch: 27, step: 1387, loss: 0.2960367202758789, mean loss: 0.348725895413421
Epoch: 27, step: 1388, loss: 0.3143801987171173, mean loss: 0.3487250447881468
Epoch: 27, step: 1389, loss: 0.33325108885765076, mean loss: 0.3487246615607475
Epoch: 27, step: 1390, loss: 0.36272937059402466, mean loss: 0.3487250083922449
Epoch: 27, step: 1391, loss: 0.3246881663799286, mean loss: 0.3487244131262218
Epoch: 27, step: 1392, loss: 0.3515990376472473, mean loss: 0.3487244843137734
Epoch: 27, step: 1393, loss: 0.2971348762512207, mean loss: 0.3487232067740759
Epoch: 27, step: 1394, loss: 0.32589998841285706, mean loss: 0.34872264160510974
Epoch: 27, step: 1395, loss: 0.3124971389770508, mean loss: 0.34872174457899474
Epoch: 27, step: 1396, loss: 0.34536147117614746, mean loss: 0.3487216613730172
Epoch: 27, step: 1397, loss: 0.4014429748058319, mean loss: 0.34872296680840154
Epoch: 27, step: 1398, loss: 0.3343520164489746, mean loss: 0.3487226109773084
Epoch: 27, step: 1399, loss: 0.3682571053504944, mean loss: 0.3487230946480614
Epoch: 27, step: 1400, loss: 0.33788397908210754, mean loss: 0.34872282628005113
Epoch: 27, step: 1401, loss: 0.32979294657707214, mean loss: 0.34872235760266307
Epoch: 27, step: 1402, loss: 0.36037972569465637, mean loss: 0.34872264621567317
Epoch: 27, step: 1403, loss: 0.3383558392524719, mean loss: 0.34872238956071766
Epoch: 27, step: 1404, loss: 0.332194983959198, mean loss: 0.3487219803956247
Epoch: 27, step: 1405, loss: 0.295504093170166, mean loss: 0.34872066292552456
Epoch: 27, step: 1406, loss: 0.34285739064216614, mean loss: 0.3487205177770586
Epoch: 27, step: 1407, loss: 0.32386350631713867, mean loss: 0.3487199024435736
Epoch: 27, step: 1408, loss: 0.3398731052875519, mean loss: 0.34871968344718385
Epoch: 27, step: 1409, loss: 0.3333076536655426, mean loss: 0.3487193019424118
Epoch: 27, step: 1410, loss: 0.33688417077064514, mean loss: 0.34871900898636904
Epoch: 27, step: 1411, loss: 0.32713574171066284, mean loss: 0.34871847474708
Epoch: 27, step: 1412, loss: 0.321249783039093, mean loss: 0.3487177948457977
Epoch: 27, step: 1413, loss: 0.34480157494544983, mean loss: 0.3487176979144601
Epoch: 27, step: 1414, loss: 0.31291794776916504, mean loss: 0.3487168118478278
Epoch: 27, step: 1415, loss: 0.31587180495262146, mean loss: 0.34871599893309424
Epoch: 27, step: 1416, loss: 0.3093549907207489, mean loss: 0.3487150247712773
Epoch: 27, step: 1417, loss: 0.32032668590545654, mean loss: 0.34871432219396536
Epoch: 27, step: 1418, loss: 0.33988526463508606, mean loss: 0.34871410369079614
Epoch: 27, step: 1419, loss: 0.33591893315315247, mean loss: 0.34871378704135697
Epoch: 27, step: 1420, loss: 0.3434271812438965, mean loss: 0.34871365621392253
Epoch: 27, step: 1421, loss: 0.3522856533527374, mean loss: 0.3487137446078136
Epoch: 27, step: 1422, loss: 0.3137914538383484, mean loss: 0.3487128804299717
Epoch: 27, step: 1423, loss: 0.33584263920783997, mean loss: 0.3487125619542412
Epoch: 27, step: 1424, loss: 0.32655128836631775, mean loss: 0.34871201358432097
Epoch: 27, step: 1425, loss: 0.3539552390575409, mean loss: 0.34871214332217104
Epoch: 27, step: 1426, loss: 0.3241064250469208, mean loss: 0.3487115344957879
Epoch: 27, step: 1427, loss: 0.32577693462371826, mean loss: 0.3487109670324102
Epoch: 27, step: 1428, loss: 0.3397951126098633, mean loss: 0.34871074643576966
Epoch: 27, step: 1429, loss: 0.29108408093452454, mean loss: 0.3487093206684011
Epoch: 27, step: 1430, loss: 0.3409874439239502, mean loss: 0.34870912962268635
Epoch: 27, step: 1431, loss: 0.3188365697860718, mean loss: 0.3487083905687567
Epoch: 27, step: 1432, loss: 0.31672579050064087, mean loss: 0.34870759933152684
Epoch: 27, step: 1433, loss: 0.3474736511707306, mean loss: 0.34870756880487896
Epoch: 27, step: 1434, loss: 0.3397156000137329, mean loss: 0.3487073463580346
Epoch: 27, step: 1435, loss: 0.36518576741218567, mean loss: 0.34870775399758175
Epoch: 27, step: 1436, loss: 0.3680441975593567, mean loss: 0.34870823232642684
Epoch: 27, step: 1437, loss: 0.3384743630886078, mean loss: 0.3487079791757506
Epoch: 27, step: 1438, loss: 0.3223903775215149, mean loss: 0.34870732818503514
Epoch: 27, step: 1439, loss: 0.3411126732826233, mean loss: 0.3487071403287251
Epoch: 27, step: 1440, loss: 0.34240928292274475, mean loss: 0.34870698455298477
Epoch: 27, step: 1441, loss: 0.34320053458213806, mean loss: 0.34870684835585464
Epoch: 27, step: 1442, loss: 0.3721264600753784, mean loss: 0.3487074276047409
Epoch: 27, step: 1443, loss: 0.3753066062927246, mean loss: 0.3487080854791643
Valid: 27, mean loss: 0.1865196501215299
Epoch: 28, step: 0, loss: 0.3111100196838379, mean loss: 0.34870715559353144
Epoch: 28, step: 1, loss: 0.2811338007450104, mean loss: 0.34870548439219473
Epoch: 28, step: 2, loss: 0.35079196095466614, mean loss: 0.34870553599295057
Epoch: 28, step: 3, loss: 0.3575453758239746, mean loss: 0.3487057546060634
Epoch: 28, step: 4, loss: 0.3141583800315857, mean loss: 0.3487049002554792
Epoch: 28, step: 5, loss: 0.32404932379722595, mean loss: 0.34870429054242563
Epoch: 28, step: 6, loss: 0.4121617376804352, mean loss: 0.34870585975647983
Epoch: 28, step: 7, loss: 0.33479583263397217, mean loss: 0.3487055157894392
Epoch: 28, step: 8, loss: 0.3234574496746063, mean loss: 0.3487048914708982
Epoch: 28, step: 9, loss: 0.3552912473678589, mean loss: 0.3487050543302004
Epoch: 28, step: 10, loss: 0.3423166871070862, mean loss: 0.34870489637042434
Epoch: 28, step: 11, loss: 0.35953769087791443, mean loss: 0.34870516421718795
Epoch: 28, step: 12, loss: 0.3654177784919739, mean loss: 0.3487055774354912
Epoch: 28, step: 13, loss: 0.3664349615573883, mean loss: 0.3487060157825248
Epoch: 28, step: 14, loss: 0.29573068022727966, mean loss: 0.34870470603555825
Epoch: 28, step: 15, loss: 0.3289649486541748, mean loss: 0.34870421800753754
Epoch: 28, step: 16, loss: 0.31449776887893677, mean loss: 0.34870337233893933
Epoch: 28, step: 17, loss: 0.3220856785774231, mean loss: 0.34870271429953853
Epoch: 28, step: 18, loss: 0.3306276202201843, mean loss: 0.348702267460299
Epoch: 28, step: 19, loss: 0.3272398114204407, mean loss: 0.34870173689429385
Epoch: 28, step: 20, loss: 0.3114657998085022, mean loss: 0.3487008164202354
Epoch: 28, step: 21, loss: 0.31663793325424194, mean loss: 0.3487000238438977
Epoch: 28, step: 22, loss: 0.3555520474910736, mean loss: 0.34870019321786005
Epoch: 28, step: 23, loss: 0.32126718759536743, mean loss: 0.3486995151230009
Epoch: 28, step: 24, loss: 0.31901249289512634, mean loss: 0.3486987813310186
Epoch: 28, step: 25, loss: 0.2972850799560547, mean loss: 0.34869751053905224
Epoch: 28, step: 26, loss: 0.31309202313423157, mean loss: 0.3486966305003117
Epoch: 28, step: 27, loss: 0.37834692001342773, mean loss: 0.348697363330008
Epoch: 28, step: 28, loss: 0.350793719291687, mean loss: 0.34869741514177643
Epoch: 28, step: 29, loss: 0.3226613998413086, mean loss: 0.34869677167345303
Epoch: 28, step: 30, loss: 0.3315819203853607, mean loss: 0.34869634869811045
Epoch: 28, step: 31, loss: 0.30950668454170227, mean loss: 0.34869538019118684
Epoch: 28, step: 32, loss: 0.30294474959373474, mean loss: 0.34869424956890593
Epoch: 28, step: 33, loss: 0.3234128952026367, mean loss: 0.34869362481344784
Epoch: 28, step: 34, loss: 0.3275444507598877, mean loss: 0.3486931021857746
Epoch: 28, step: 35, loss: 0.3198385238647461, mean loss: 0.3486923891636751
Epoch: 28, step: 36, loss: 0.30980199575424194, mean loss: 0.34869142817147347
Epoch: 28, step: 37, loss: 0.31580373644828796, mean loss: 0.3486906155277442
Epoch: 28, step: 38, loss: 0.293352872133255, mean loss: 0.3486892481846246
Epoch: 28, step: 39, loss: 0.309066504240036, mean loss: 0.3486882691684172
Epoch: 28, step: 40, loss: 0.3102196455001831, mean loss: 0.3486873186922067
Epoch: 28, step: 41, loss: 0.3118726313114166, mean loss: 0.3486864091036466
Epoch: 28, step: 42, loss: 0.3070547878742218, mean loss: 0.3486853805274581
Epoch: 28, step: 43, loss: 0.315009206533432, mean loss: 0.34868454852395003
Epoch: 28, step: 44, loss: 0.32934653759002686, mean loss: 0.34868407077088204
Epoch: 28, step: 45, loss: 0.2984480559825897, mean loss: 0.3486828297012939
Epoch: 28, step: 46, loss: 0.3238092362880707, mean loss: 0.3486822152198736
Epoch: 28, step: 47, loss: 0.35199761390686035, mean loss: 0.34868229712201504
Epoch: 28, step: 48, loss: 0.3891335427761078, mean loss: 0.348683296386995
Epoch: 28, step: 49, loss: 0.40040305256843567, mean loss: 0.3486845739858336
Epoch: 28, step: 50, loss: 0.32356974482536316, mean loss: 0.34868395360618876
Epoch: 28, step: 51, loss: 0.38206467032432556, mean loss: 0.3486847781471609
Epoch: 28, step: 52, loss: 0.3570115864276886, mean loss: 0.3486849838235418
Epoch: 28, step: 53, loss: 0.32679665088653564, mean loss: 0.34868444318398895
Epoch: 28, step: 54, loss: 0.32597967982292175, mean loss: 0.3486838823925408
Epoch: 28, step: 55, loss: 0.32586535811424255, mean loss: 0.34868331880519937
Epoch: 28, step: 56, loss: 0.36562496423721313, mean loss: 0.3486837372310788
Epoch: 28, step: 57, loss: 0.3190097510814667, mean loss: 0.3486830043591067
Epoch: 28, step: 58, loss: 0.3387536406517029, mean loss: 0.34868275913513824
Epoch: 28, step: 59, loss: 0.3185555934906006, mean loss: 0.3486820151075366
Epoch: 28, step: 60, loss: 0.3111058175563812, mean loss: 0.34868108713980017
Epoch: 28, step: 61, loss: 0.32250791788101196, mean loss: 0.3486804407929523
Epoch: 28, step: 62, loss: 0.30484655499458313, mean loss: 0.3486793583411484
Epoch: 28, step: 63, loss: 0.33134910464286804, mean loss: 0.34867893039138304
Epoch: 28, step: 64, loss: 0.346597820520401, mean loss: 0.3486788790021475
Epoch: 28, step: 65, loss: 0.3500264585018158, mean loss: 0.3486789122773586
Epoch: 28, step: 66, loss: 0.38784900307655334, mean loss: 0.3486798794639755
Epoch: 28, step: 67, loss: 0.37626636028289795, mean loss: 0.34868056061165004
Epoch: 28, step: 68, loss: 0.3433419466018677, mean loss: 0.34868042879727484
Epoch: 28, step: 69, loss: 0.37261447310447693, mean loss: 0.3486810197321498
Epoch: 28, step: 70, loss: 0.3425999879837036, mean loss: 0.3486808695943391
Epoch: 28, step: 71, loss: 0.3061297833919525, mean loss: 0.34867981905399237
Epoch: 28, step: 72, loss: 0.29040804505348206, mean loss: 0.34867838042236665
Epoch: 28, step: 73, loss: 0.3639269471168518, mean loss: 0.3486787568744156
Epoch: 28, step: 74, loss: 0.37595781683921814, mean loss: 0.3486794303150546
Epoch: 28, step: 75, loss: 0.3438241183757782, mean loss: 0.34867931045448536
Epoch: 28, step: 76, loss: 0.3260255753993988, mean loss: 0.3486787512272752
Epoch: 28, step: 77, loss: 0.3740331828594208, mean loss: 0.34867937710808566
Epoch: 28, step: 78, loss: 0.32800304889678955, mean loss: 0.3486788667200871
Epoch: 28, step: 79, loss: 0.3314484655857086, mean loss: 0.3486784414041033
Epoch: 28, step: 80, loss: 0.3311624228954315, mean loss: 0.3486780090485999
Epoch: 28, step: 81, loss: 0.3582329750061035, mean loss: 0.3486782448921591
Epoch: 28, step: 82, loss: 0.31204721331596375, mean loss: 0.3486773407571085
Epoch: 28, step: 83, loss: 0.32157769799232483, mean loss: 0.34867667189436874
Epoch: 28, step: 84, loss: 0.3390950560569763, mean loss: 0.34867643541052645
Epoch: 28, step: 85, loss: 0.38717010617256165, mean loss: 0.3486773854492935
Epoch: 28, step: 86, loss: 0.37613242864608765, mean loss: 0.34867806303371557
Epoch: 28, step: 87, loss: 0.29388540983200073, mean loss: 0.3486767107964697
Epoch: 28, step: 88, loss: 0.3123495578765869, mean loss: 0.3486758142945838
Epoch: 28, step: 89, loss: 0.3357878029346466, mean loss: 0.34867549624484884
Epoch: 28, step: 90, loss: 0.32893356680870056, mean loss: 0.34867500906647025
Epoch: 28, step: 91, loss: 0.33877286314964294, mean loss: 0.3486747647138418
Epoch: 28, step: 92, loss: 0.33884406089782715, mean loss: 0.34867452213015726
Epoch: 28, step: 93, loss: 0.3776223063468933, mean loss: 0.3486752364316974
Epoch: 28, step: 94, loss: 0.31565120816230774, mean loss: 0.3486744215668352
Epoch: 28, step: 95, loss: 0.32985368371009827, mean loss: 0.34867395717831723
Epoch: 28, step: 96, loss: 0.32737472653388977, mean loss: 0.3486734316476936
Epoch: 28, step: 97, loss: 0.31769847869873047, mean loss: 0.34867266740014985
Epoch: 28, step: 98, loss: 0.32005974650382996, mean loss: 0.3486719614486338
Epoch: 28, step: 99, loss: 0.2966143488883972, mean loss: 0.3486706770902859
Epoch: 28, step: 100, loss: 0.3480543792247772, mean loss: 0.34867066188544377
Epoch: 28, step: 101, loss: 0.3734843134880066, mean loss: 0.3486712740542799
Epoch: 28, step: 102, loss: 0.3193586766719818, mean loss: 0.3486705509113816
Epoch: 28, step: 103, loss: 0.37489771842956543, mean loss: 0.34867119792064544
Epoch: 28, step: 104, loss: 0.3230668008327484, mean loss: 0.34867056629035487
Epoch: 28, step: 105, loss: 0.29781219363212585, mean loss: 0.34866931170520865
Epoch: 28, step: 106, loss: 0.32043981552124023, mean loss: 0.34866861535117466
Epoch: 28, step: 107, loss: 0.3160969316959381, mean loss: 0.34866781190559853
Epoch: 28, step: 108, loss: 0.29529932141304016, mean loss: 0.34866649549775236
Epoch: 28, step: 109, loss: 0.31316331028938293, mean loss: 0.3486656197840429
Epoch: 28, step: 110, loss: 0.34127306938171387, mean loss: 0.3486654374455282
Epoch: 28, step: 111, loss: 0.36488276720046997, mean loss: 0.3486658374388627
Epoch: 28, step: 112, loss: 0.35789915919303894, mean loss: 0.34866606516908233
Epoch: 28, step: 113, loss: 0.36957138776779175, mean loss: 0.3486665807642729
Epoch: 28, step: 114, loss: 0.3214246332645416, mean loss: 0.34866590890328447
Epoch: 28, step: 115, loss: 0.3310210108757019, mean loss: 0.34866547374253604
Epoch: 28, step: 116, loss: 0.2964548170566559, mean loss: 0.3486641861483491
Epoch: 28, step: 117, loss: 0.33222344517707825, mean loss: 0.34866378070467535
Epoch: 28, step: 118, loss: 0.35174325108528137, mean loss: 0.34866385664535204
Epoch: 28, step: 119, loss: 0.3157797157764435, mean loss: 0.3486630457324287
Epoch: 28, step: 120, loss: 0.35045143961906433, mean loss: 0.3486630898325911
Epoch: 28, step: 121, loss: 0.33963146805763245, mean loss: 0.3486628671265257
Epoch: 28, step: 122, loss: 0.32188940048217773, mean loss: 0.34866220694981154
Epoch: 28, step: 123, loss: 0.31447353959083557, mean loss: 0.34866136395081365
Epoch: 28, step: 124, loss: 0.2949316203594208, mean loss: 0.3486600391550055
Epoch: 28, step: 125, loss: 0.313530832529068, mean loss: 0.3486591730075962
Epoch: 28, step: 126, loss: 0.35325342416763306, mean loss: 0.34865928628088105
Epoch: 28, step: 127, loss: 0.2951754033565521, mean loss: 0.3486579676447143
Epoch: 28, step: 128, loss: 0.3643674850463867, mean loss: 0.34865835495068315
Epoch: 28, step: 129, loss: 0.3344202935695648, mean loss: 0.3486580039309755
Epoch: 28, step: 130, loss: 0.35993966460227966, mean loss: 0.34865828205785643
Epoch: 28, step: 131, loss: 0.30664777755737305, mean loss: 0.34865724639804724
Epoch: 28, step: 132, loss: 0.3153246343135834, mean loss: 0.3486564246893801
Epoch: 28, step: 133, loss: 0.35301247239112854, mean loss: 0.34865653207112096
Epoch: 28, step: 134, loss: 0.34410491585731506, mean loss: 0.3486564198711502
Epoch: 28, step: 135, loss: 0.32570764422416687, mean loss: 0.34865585418450934
Epoch: 28, step: 136, loss: 0.3366522490978241, mean loss: 0.3486555583032925
Epoch: 28, step: 137, loss: 0.3256957530975342, mean loss: 0.34865499237267367
Epoch: 28, step: 138, loss: 0.28766146302223206, mean loss: 0.348653488995154
Epoch: 28, step: 139, loss: 0.32171905040740967, mean loss: 0.34865282512749685
Epoch: 28, step: 140, loss: 0.33792608976364136, mean loss: 0.34865256074637235
Epoch: 28, step: 141, loss: 0.3146827220916748, mean loss: 0.34865172351468077
Epoch: 28, step: 142, loss: 0.318043053150177, mean loss: 0.34865096914202853
Epoch: 28, step: 143, loss: 0.35078370571136475, mean loss: 0.3486510217035568
Epoch: 28, step: 144, loss: 0.3345348834991455, mean loss: 0.34865067381834586
Epoch: 28, step: 145, loss: 0.31189101934432983, mean loss: 0.34864976791725477
Epoch: 28, step: 146, loss: 0.37963321805000305, mean loss: 0.34865053145135205
Epoch: 28, step: 147, loss: 0.32957109808921814, mean loss: 0.34865006128295967
Epoch: 28, step: 148, loss: 0.3229430615901947, mean loss: 0.3486494278091741
Epoch: 28, step: 149, loss: 0.2963162660598755, mean loss: 0.3486481382433136
Epoch: 28, step: 150, loss: 0.3154783248901367, mean loss: 0.348647320910604
Epoch: 28, step: 151, loss: 0.31205663084983826, mean loss: 0.3486464193067685
Epoch: 28, step: 152, loss: 0.31130680441856384, mean loss: 0.34864549927190613
Epoch: 28, step: 153, loss: 0.33827275037765503, mean loss: 0.348645243697351
Epoch: 28, step: 154, loss: 0.3194606602191925, mean loss: 0.348644524635004
Epoch: 28, step: 155, loss: 0.32360389828681946, mean loss: 0.3486439076884595
Epoch: 28, step: 156, loss: 0.3424353003501892, mean loss: 0.34864375472565334
Epoch: 28, step: 157, loss: 0.3600810766220093, mean loss: 0.34864403650249237
Epoch: 28, step: 158, loss: 0.3212672770023346, mean loss: 0.34864336204856167
Epoch: 28, step: 159, loss: 0.3288765251636505, mean loss: 0.34864287508470465
Epoch: 28, step: 160, loss: 0.3625105917453766, mean loss: 0.34864321671298193
Epoch: 28, step: 161, loss: 0.35567429661750793, mean loss: 0.3486433899178867
Epoch: 28, step: 162, loss: 0.3368176221847534, mean loss: 0.34864309860694365
Epoch: 28, step: 163, loss: 0.36596012115478516, mean loss: 0.3486435251766192
Epoch: 28, step: 164, loss: 0.3035268485546112, mean loss: 0.3486424138463085
Epoch: 28, step: 165, loss: 0.3668457269668579, mean loss: 0.3486428622258622
Epoch: 28, step: 166, loss: 0.32807761430740356, mean loss: 0.34864235568018576
Epoch: 28, step: 167, loss: 0.3481825292110443, mean loss: 0.34864234435441066
Epoch: 28, step: 168, loss: 0.3360813558101654, mean loss: 0.3486420349780765
Epoch: 28, step: 169, loss: 0.31352365016937256, mean loss: 0.348641170035837
Epoch: 28, step: 170, loss: 0.33725666999816895, mean loss: 0.3486408896501503
Epoch: 28, step: 171, loss: 0.3147433400154114, mean loss: 0.3486400548173842
Epoch: 28, step: 172, loss: 0.30401119589805603, mean loss: 0.3486389557197627
Epoch: 28, step: 173, loss: 0.30581554770469666, mean loss: 0.3486379011118719
Epoch: 28, step: 174, loss: 0.31792905926704407, mean loss: 0.34863714486684405
Epoch: 28, step: 175, loss: 0.34551358222961426, mean loss: 0.34863706794696037
Epoch: 28, step: 176, loss: 0.32732251286506653, mean loss: 0.34863654307427006
Epoch: 28, step: 177, loss: 0.35565197467803955, mean loss: 0.34863671582560235
Epoch: 28, step: 178, loss: 0.334441602230072, mean loss: 0.34863636628696515
Epoch: 28, step: 179, loss: 0.3524430990219116, mean loss: 0.3486364600211505
Epoch: 28, step: 180, loss: 0.3382221460342407, mean loss: 0.3486362035930613
Epoch: 28, step: 181, loss: 0.31124147772789, mean loss: 0.3486352828581949
Epoch: 28, step: 182, loss: 0.32825547456741333, mean loss: 0.3486347810778603
Epoch: 28, step: 183, loss: 0.32397130131721497, mean loss: 0.348634173842294
Epoch: 28, step: 184, loss: 0.33617132902145386, mean loss: 0.34863386700415183
Epoch: 28, step: 185, loss: 0.30157628655433655, mean loss: 0.3486327084640846
Epoch: 28, step: 186, loss: 0.3724104166030884, mean loss: 0.3486332938479724
Epoch: 28, step: 187, loss: 0.3665544390678406, mean loss: 0.3486337350381551
Epoch: 28, step: 188, loss: 0.33965450525283813, mean loss: 0.34863351398919556
Epoch: 28, step: 189, loss: 0.31951451301574707, mean loss: 0.348632797160852
Epoch: 28, step: 190, loss: 0.3422751724720001, mean loss: 0.3486326406577703
Epoch: 28, step: 191, loss: 0.3200923502445221, mean loss: 0.3486319381102512
Epoch: 28, step: 192, loss: 0.31665605306625366, mean loss: 0.34863115101154246
Epoch: 28, step: 193, loss: 0.3063025176525116, mean loss: 0.3486301091015991
Epoch: 28, step: 194, loss: 0.34906840324401855, mean loss: 0.3486301198898469
Epoch: 28, step: 195, loss: 0.3615415394306183, mean loss: 0.34863043768593677
Epoch: 28, step: 196, loss: 0.33982741832733154, mean loss: 0.34863022101756297
Epoch: 28, step: 197, loss: 0.3097103536128998, mean loss: 0.34862926310795417
Epoch: 28, step: 198, loss: 0.3366605043411255, mean loss: 0.3486289685358598
Epoch: 28, step: 199, loss: 0.35197940468788147, mean loss: 0.34862905099392616
Epoch: 28, step: 200, loss: 0.2999861538410187, mean loss: 0.34862785386604606
Epoch: 28, step: 201, loss: 0.35430818796157837, mean loss: 0.34862799365868513
Epoch: 28, step: 202, loss: 0.32550960779190063, mean loss: 0.34862742473076913
Epoch: 28, step: 203, loss: 0.34259963035583496, mean loss: 0.3486272763944571
Epoch: 28, step: 204, loss: 0.3090033531188965, mean loss: 0.34862630132436645
Epoch: 28, step: 205, loss: 0.3291165232658386, mean loss: 0.3486258212373036
Epoch: 28, step: 206, loss: 0.3433224856853485, mean loss: 0.34862569073863114
Epoch: 28, step: 207, loss: 0.3257862627506256, mean loss: 0.3486251287448322
Epoch: 28, step: 208, loss: 0.3326702415943146, mean loss: 0.34862473616376505
Epoch: 28, step: 209, loss: 0.3224673867225647, mean loss: 0.34862409255987153
Epoch: 28, step: 210, loss: 0.3465994596481323, mean loss: 0.3486240427448256
Epoch: 28, step: 211, loss: 0.36481964588165283, mean loss: 0.3486244412194624
Epoch: 28, step: 212, loss: 0.36730533838272095, mean loss: 0.3486249008306609
Epoch: 28, step: 213, loss: 0.3440041244029999, mean loss: 0.3486247871472375
Epoch: 28, step: 214, loss: 0.3280285596847534, mean loss: 0.34862428043757965
Epoch: 28, step: 215, loss: 0.28680893778800964, mean loss: 0.34862275969012224
Epoch: 28, step: 216, loss: 0.3561941683292389, mean loss: 0.34862294595321947
Epoch: 28, step: 217, loss: 0.3417699635028839, mean loss: 0.3486227773681653
Epoch: 28, step: 218, loss: 0.33101025223731995, mean loss: 0.3486223441063727
Epoch: 28, step: 219, loss: 0.2911883592605591, mean loss: 0.3486209312857281
Epoch: 28, step: 220, loss: 0.3320198357105255, mean loss: 0.34862052292483037
Epoch: 28, step: 221, loss: 0.3239627480506897, mean loss: 0.3486199163971855
Epoch: 28, step: 222, loss: 0.3331246078014374, mean loss: 0.348619535255663
Epoch: 28, step: 223, loss: 0.29722994565963745, mean loss: 0.34861827124568673
Epoch: 28, step: 224, loss: 0.3292934000492096, mean loss: 0.3486177959309513
Epoch: 28, step: 225, loss: 0.3597448170185089, mean loss: 0.34861806960454783
Epoch: 28, step: 226, loss: 0.330832839012146, mean loss: 0.34861763218034675
Epoch: 28, step: 227, loss: 0.34198087453842163, mean loss: 0.34861746895463
Epoch: 28, step: 228, loss: 0.34749656915664673, mean loss: 0.348617441387679
Epoch: 28, step: 229, loss: 0.3269440531730652, mean loss: 0.3486169083743443
Epoch: 28, step: 230, loss: 0.3791212737560272, mean loss: 0.34861765854932847
Epoch: 28, step: 231, loss: 0.36236098408699036, mean loss: 0.3486179965221186
Epoch: 28, step: 232, loss: 0.3133911192417145, mean loss: 0.34861713025192853
Epoch: 28, step: 233, loss: 0.2984922528266907, mean loss: 0.3486158976527689
Epoch: 28, step: 234, loss: 0.34921276569366455, mean loss: 0.34861591232973155
Epoch: 28, step: 235, loss: 0.325264036655426, mean loss: 0.34861533812210704
Epoch: 28, step: 236, loss: 0.3432885706424713, mean loss: 0.34861520714353667
Epoch: 28, step: 237, loss: 0.33122357726097107, mean loss: 0.34861477951555825
Epoch: 28, step: 238, loss: 0.3054332435131073, mean loss: 0.34861371778764394
Epoch: 28, step: 239, loss: 0.3373538553714752, mean loss: 0.34861344094208885
Epoch: 28, step: 240, loss: 0.37941914796829224, mean loss: 0.3486141983415191
Epoch: 28, step: 241, loss: 0.31098473072052, mean loss: 0.3486132731935715
Epoch: 28, step: 242, loss: 0.3167967200279236, mean loss: 0.34861249097960306
Epoch: 28, step: 243, loss: 0.35133811831474304, mean loss: 0.3486125579878471
Epoch: 28, step: 244, loss: 0.3291454017162323, mean loss: 0.3486120794088892
Epoch: 28, step: 245, loss: 0.32733237743377686, mean loss: 0.34861155628331825
Epoch: 28, step: 246, loss: 0.346813440322876, mean loss: 0.3486115120807577
Epoch: 28, step: 247, loss: 0.3302686810493469, mean loss: 0.34861106117537344
Epoch: 28, step: 248, loss: 0.30166658759117126, mean loss: 0.34860990720979773
Epoch: 28, step: 249, loss: 0.33872804045677185, mean loss: 0.3486096643046615
Epoch: 28, step: 250, loss: 0.30348142981529236, mean loss: 0.3486085550395019
Epoch: 28, step: 251, loss: 0.30202895402908325, mean loss: 0.3486074101274723
Epoch: 28, step: 252, loss: 0.3500674366950989, mean loss: 0.3486074460135868
Epoch: 28, step: 253, loss: 0.3499836027622223, mean loss: 0.3486074798374266
Epoch: 28, step: 254, loss: 0.31683799624443054, mean loss: 0.34860669901103014
Epoch: 28, step: 255, loss: 0.31269511580467224, mean loss: 0.3486058164023198
Epoch: 28, step: 256, loss: 0.3110339939594269, mean loss: 0.3486048930121543
Epoch: 28, step: 257, loss: 0.3725610673427582, mean loss: 0.34860548176060185
Epoch: 28, step: 258, loss: 0.38145244121551514, mean loss: 0.34860628898970547
Epoch: 28, step: 259, loss: 0.3539191484451294, mean loss: 0.34860641955245625
Epoch: 28, step: 260, loss: 0.30351927876472473, mean loss: 0.3486053115697372
Epoch: 28, step: 261, loss: 0.33422064781188965, mean loss: 0.3486049580860846
Epoch: 28, step: 262, loss: 0.35399097204208374, mean loss: 0.3486050904368391
Epoch: 28, step: 263, loss: 0.3317575752735138, mean loss: 0.34860467645229115
Epoch: 28, step: 264, loss: 0.34858468174934387, mean loss: 0.3486046759609846
Epoch: 28, step: 265, loss: 0.3378753960132599, mean loss: 0.3486044123293578
Epoch: 28, step: 266, loss: 0.3303415775299072, mean loss: 0.34860396360003276
Epoch: 28, step: 267, loss: 0.30748364329338074, mean loss: 0.3486029532727525
Epoch: 28, step: 268, loss: 0.36496683955192566, mean loss: 0.348603355323962
Epoch: 28, step: 269, loss: 0.28244853019714355, mean loss: 0.3486017299781528
Epoch: 28, step: 270, loss: 0.34539470076560974, mean loss: 0.34860165118717396
Epoch: 28, step: 271, loss: 0.3518763780593872, mean loss: 0.3486017316393868
Epoch: 28, step: 272, loss: 0.33301764726638794, mean loss: 0.34860134878508453
Epoch: 28, step: 273, loss: 0.32265421748161316, mean loss: 0.34860071135740056
Epoch: 28, step: 274, loss: 0.31489500403404236, mean loss: 0.34859988334975267
Epoch: 28, step: 275, loss: 0.3093259930610657, mean loss: 0.3485989185789389
Epoch: 28, step: 276, loss: 0.3109019100666046, mean loss: 0.3485979925672827
Epoch: 28, step: 277, loss: 0.29910388588905334, mean loss: 0.3485967767945812
Epoch: 28, step: 278, loss: 0.3328796625137329, mean loss: 0.34859639072903914
Epoch: 28, step: 279, loss: 0.42864301800727844, mean loss: 0.3485983568969326
Epoch: 28, step: 280, loss: 0.33130428194999695, mean loss: 0.3485979321167654
Epoch: 28, step: 281, loss: 0.29893243312835693, mean loss: 0.3485967122538438
Epoch: 28, step: 282, loss: 0.3145825266838074, mean loss: 0.34859587683236354
Epoch: 28, step: 283, loss: 0.3532749116420746, mean loss: 0.34859599175118683
Epoch: 28, step: 284, loss: 0.3134694993495941, mean loss: 0.3485951290527463
Epoch: 28, step: 285, loss: 0.3399266302585602, mean loss: 0.34859491616167126
Epoch: 28, step: 286, loss: 0.34217673540115356, mean loss: 0.3485947585403947
Epoch: 28, step: 287, loss: 0.3625144362449646, mean loss: 0.34859510037923813
Epoch: 28, step: 288, loss: 0.3001316487789154, mean loss: 0.34859391024511566
Epoch: 28, step: 289, loss: 0.3413524031639099, mean loss: 0.3485937324172319
Epoch: 28, step: 290, loss: 0.3336140513420105, mean loss: 0.34859336457397194
Epoch: 28, step: 291, loss: 0.31800389289855957, mean loss: 0.34859261343283465
Epoch: 28, step: 292, loss: 0.35079777240753174, mean loss: 0.34859266758038465
Epoch: 28, step: 293, loss: 0.33268043398857117, mean loss: 0.34859227686601074
Epoch: 28, step: 294, loss: 0.3268870711326599, mean loss: 0.34859174392212255
Epoch: 28, step: 295, loss: 0.3288125693798065, mean loss: 0.3485912582814198
Epoch: 28, step: 296, loss: 0.337228924036026, mean loss: 0.34859097930736577
Epoch: 28, step: 297, loss: 0.34423431754112244, mean loss: 0.3485908723429227
Epoch: 28, step: 298, loss: 0.2919899821281433, mean loss: 0.3485894827160975
Epoch: 28, step: 299, loss: 0.3436899781227112, mean loss: 0.3485893624297233
Epoch: 28, step: 300, loss: 0.3629656732082367, mean loss: 0.3485897153698647
Epoch: 28, step: 301, loss: 0.3340449035167694, mean loss: 0.34858935830176796
Epoch: 28, step: 302, loss: 0.3316040337085724, mean loss: 0.34858894133050017
Epoch: 28, step: 303, loss: 0.3125227391719818, mean loss: 0.3485880559661502
Epoch: 28, step: 304, loss: 0.34621044993400574, mean loss: 0.3485879976013705
Epoch: 28, step: 305, loss: 0.34273818135261536, mean loss: 0.34858785400531156
Epoch: 28, step: 306, loss: 0.3395754396915436, mean loss: 0.3485876327820534
Epoch: 28, step: 307, loss: 0.32266417145729065, mean loss: 0.3485869964673424
Epoch: 28, step: 308, loss: 0.3577919900417328, mean loss: 0.348587222406656
Epoch: 28, step: 309, loss: 0.3258945643901825, mean loss: 0.348586665422266
Epoch: 28, step: 310, loss: 0.30316561460494995, mean loss: 0.3485855506037495
Epoch: 28, step: 311, loss: 0.3600466549396515, mean loss: 0.3485858318992614
Epoch: 28, step: 312, loss: 0.3350137174129486, mean loss: 0.34858549880036616
Epoch: 28, step: 313, loss: 0.28021326661109924, mean loss: 0.34858382078946476
Epoch: 28, step: 314, loss: 0.31627175211906433, mean loss: 0.34858302779688444
Epoch: 28, step: 315, loss: 0.31616583466529846, mean loss: 0.348582232243897
Epoch: 28, step: 316, loss: 0.31562095880508423, mean loss: 0.3485814233584412
Epoch: 28, step: 317, loss: 0.3514845371246338, mean loss: 0.3485814946004968
Epoch: 28, step: 318, loss: 0.3323058784008026, mean loss: 0.3485810952086733
Epoch: 28, step: 319, loss: 0.3482418656349182, mean loss: 0.34858108688442974
Epoch: 28, step: 320, loss: 0.3429092764854431, mean loss: 0.3485809477091445
Epoch: 28, step: 321, loss: 0.420465886592865, mean loss: 0.3485827115835834
Epoch: 28, step: 322, loss: 0.36292651295661926, mean loss: 0.3485830635355248
Epoch: 28, step: 323, loss: 0.33189865946769714, mean loss: 0.34858265416257195
Epoch: 28, step: 324, loss: 0.37945544719696045, mean loss: 0.3485834116470049
Epoch: 28, step: 325, loss: 0.34567487239837646, mean loss: 0.34858334028581817
Epoch: 28, step: 326, loss: 0.350197970867157, mean loss: 0.3485833798999054
Epoch: 28, step: 327, loss: 0.32721272110939026, mean loss: 0.34858285559522456
Epoch: 28, step: 328, loss: 0.3551751971244812, mean loss: 0.3485830173268192
Epoch: 28, step: 329, loss: 0.3712667226791382, mean loss: 0.34858357381829047
Epoch: 28, step: 330, loss: 0.34931042790412903, mean loss: 0.3485835916495121
Epoch: 28, step: 331, loss: 0.3540683388710022, mean loss: 0.3485837261983106
Epoch: 28, step: 332, loss: 0.31251922249794006, mean loss: 0.34858284150546864
Epoch: 28, step: 333, loss: 0.2775927186012268, mean loss: 0.3485811001003049
Epoch: 28, step: 334, loss: 0.33040452003479004, mean loss: 0.3485806542352654
Epoch: 28, step: 335, loss: 0.31977394223213196, mean loss: 0.3485799476342057
Epoch: 28, step: 336, loss: 0.3154055178165436, mean loss: 0.34857913391717027
Epoch: 28, step: 337, loss: 0.3354497253894806, mean loss: 0.3485788118811505
Epoch: 28, step: 338, loss: 0.29652777314186096, mean loss: 0.34857753521296136
Epoch: 28, step: 339, loss: 0.35073891282081604, mean loss: 0.34857758822428303
Epoch: 28, step: 340, loss: 0.2964613139629364, mean loss: 0.34857631001874845
Epoch: 28, step: 341, loss: 0.35407546162605286, mean loss: 0.3485764448878221
Epoch: 28, step: 342, loss: 0.3365743160247803, mean loss: 0.34857615053763535
Epoch: 28, step: 343, loss: 0.31280797719955444, mean loss: 0.3485752733507279
Epoch: 28, step: 344, loss: 0.32673180103302, mean loss: 0.3485747376695273
Epoch: 28, step: 345, loss: 0.31455984711647034, mean loss: 0.3485739035214437
Epoch: 28, step: 346, loss: 0.3262852132320404, mean loss: 0.3485733569486908
Epoch: 28, step: 347, loss: 0.33863499760627747, mean loss: 0.3485731132419879
Epoch: 28, step: 348, loss: 0.3346971273422241, mean loss: 0.34857277298584166
Epoch: 28, step: 349, loss: 0.34280452132225037, mean loss: 0.3485726315447239
Epoch: 28, step: 350, loss: 0.3219081461429596, mean loss: 0.34857197773099263
Epoch: 28, step: 351, loss: 0.34351542592048645, mean loss: 0.34857185374727817
Epoch: 28, step: 352, loss: 0.34108954668045044, mean loss: 0.34857167028995156
Epoch: 28, step: 353, loss: 0.34542757272720337, mean loss: 0.34857159320228515
Epoch: 28, step: 354, loss: 0.3306266665458679, mean loss: 0.3485711532354659
Epoch: 28, step: 355, loss: 0.34176385402679443, mean loss: 0.3485709863408104
Epoch: 28, step: 356, loss: 0.35582804679870605, mean loss: 0.34857116425790713
Epoch: 28, step: 357, loss: 0.38509228825569153, mean loss: 0.34857205960294263
Epoch: 28, step: 358, loss: 0.3278375267982483, mean loss: 0.34857155129148165
Epoch: 28, step: 359, loss: 0.3338705897331238, mean loss: 0.348571190903132
Epoch: 28, step: 360, loss: 0.35669174790382385, mean loss: 0.34857138997054554
Epoch: 28, step: 361, loss: 0.3101496398448944, mean loss: 0.34857044812247656
Epoch: 28, step: 362, loss: 0.3230785131454468, mean loss: 0.3485698232435704
Epoch: 28, step: 363, loss: 0.295297771692276, mean loss: 0.3485685174280112
Epoch: 28, step: 364, loss: 0.30781275033950806, mean loss: 0.3485675184386961
Epoch: 28, step: 365, loss: 0.3372805416584015, mean loss: 0.3485672417835468
Epoch: 28, step: 366, loss: 0.32416027784347534, mean loss: 0.348566643558984
Epoch: 28, step: 367, loss: 0.33955442905426025, mean loss: 0.34856642267137355
Epoch: 28, step: 368, loss: 0.37144187092781067, mean loss: 0.3485669833303833
Epoch: 28, step: 369, loss: 0.2977330982685089, mean loss: 0.34856573746289976
Epoch: 28, step: 370, loss: 0.3829323649406433, mean loss: 0.34856657972027
Epoch: 28, step: 371, loss: 0.35456910729408264, mean loss: 0.34856672682662165
Epoch: 28, step: 372, loss: 0.3082817792892456, mean loss: 0.34856573957144366
Epoch: 28, step: 373, loss: 0.3524611294269562, mean loss: 0.3485658350326468
Epoch: 28, step: 374, loss: 0.330776184797287, mean loss: 0.3485653990866024
Epoch: 28, step: 375, loss: 0.2933941185474396, mean loss: 0.34856404711442684
Epoch: 28, step: 376, loss: 0.3421073257923126, mean loss: 0.3485638888963543
Epoch: 28, step: 377, loss: 0.32265183329582214, mean loss: 0.3485632539525758
Epoch: 28, step: 378, loss: 0.37311863899230957, mean loss: 0.3485638556380292
Epoch: 28, step: 379, loss: 0.3592546582221985, mean loss: 0.34856411759045947
Epoch: 28, step: 380, loss: 0.3187144100666046, mean loss: 0.34856338621301786
Epoch: 28, step: 381, loss: 0.3516794741153717, mean loss: 0.3485634625615233
Epoch: 28, step: 382, loss: 0.3186306357383728, mean loss: 0.34856272918343134
Epoch: 28, step: 383, loss: 0.3360444903373718, mean loss: 0.348562422484126
Epoch: 28, step: 384, loss: 0.3107888102531433, mean loss: 0.34856149704589606
Epoch: 28, step: 385, loss: 0.3194896876811981, mean loss: 0.3485607848157681
Epoch: 28, step: 386, loss: 0.3155900835990906, mean loss: 0.34855997708649455
Epoch: 28, step: 387, loss: 0.30778148770332336, mean loss: 0.34855897810341313
Epoch: 28, step: 388, loss: 0.331747829914093, mean loss: 0.3485585662774366
Epoch: 28, step: 389, loss: 0.31510215997695923, mean loss: 0.3485577467094022
Epoch: 28, step: 390, loss: 0.29016536474227905, mean loss: 0.3485563163299111
Epoch: 28, step: 391, loss: 0.3359546363353729, mean loss: 0.3485560076467836
Epoch: 28, step: 392, loss: 0.3328765630722046, mean loss: 0.3485556235820053
Epoch: 28, step: 393, loss: 0.33058667182922363, mean loss: 0.3485551834469994
Epoch: 28, step: 394, loss: 0.30632659792900085, mean loss: 0.34855414911713145
Epoch: 28, step: 395, loss: 0.36950093507766724, mean loss: 0.3485546621666553
Epoch: 28, step: 396, loss: 0.31887272000312805, mean loss: 0.34855393518480016
Epoch: 28, step: 397, loss: 0.3245673179626465, mean loss: 0.34855334770948243
Epoch: 28, step: 398, loss: 0.32420769333839417, mean loss: 0.34855275145530373
Epoch: 28, step: 399, loss: 0.3129365146160126, mean loss: 0.3485518791924501
Epoch: 28, step: 400, loss: 0.29219093918800354, mean loss: 0.34855049891326406
Epoch: 28, step: 401, loss: 0.37548109889030457, mean loss: 0.34855115842739387
Epoch: 28, step: 402, loss: 0.34457141160964966, mean loss: 0.34855106096818445
Epoch: 28, step: 403, loss: 0.3247779905796051, mean loss: 0.3485504788085609
Epoch: 28, step: 404, loss: 0.3362826108932495, mean loss: 0.34855017839795494
Epoch: 28, step: 405, loss: 0.32135024666786194, mean loss: 0.3485495123532973
Epoch: 28, step: 406, loss: 0.34258925914764404, mean loss: 0.34854936640816625
Epoch: 28, step: 407, loss: 0.34307417273521423, mean loss: 0.3485492323436787
Epoch: 28, step: 408, loss: 0.3426355719566345, mean loss: 0.3485490875465291
Epoch: 28, step: 409, loss: 0.3448737859725952, mean loss: 0.34854899755824315
Epoch: 28, step: 410, loss: 0.29815468192100525, mean loss: 0.3485477637038339
Epoch: 28, step: 411, loss: 0.31866586208343506, mean loss: 0.34854703209327614
Epoch: 28, step: 412, loss: 0.3505859076976776, mean loss: 0.3485470820106615
Epoch: 28, step: 413, loss: 0.34031927585601807, mean loss: 0.3485468805758538
Epoch: 28, step: 414, loss: 0.3172386586666107, mean loss: 0.3485461141004233
Epoch: 28, step: 415, loss: 0.3456971347332001, mean loss: 0.3485460443545516
Epoch: 28, step: 416, loss: 0.3475140333175659, mean loss: 0.3485460190905051
Epoch: 28, step: 417, loss: 0.3303673565387726, mean loss: 0.34854557408040593
Epoch: 28, step: 418, loss: 0.3285873234272003, mean loss: 0.34854508551829844
Epoch: 28, step: 419, loss: 0.30406466126441956, mean loss: 0.34854399669953184
Epoch: 28, step: 420, loss: 0.2974751591682434, mean loss: 0.3485427466361942
Epoch: 28, step: 421, loss: 0.33921337127685547, mean loss: 0.34854251827727323
Epoch: 28, step: 422, loss: 0.32000958919525146, mean loss: 0.34854181988224003
Epoch: 28, step: 423, loss: 0.3470420241355896, mean loss: 0.34854178317292567
Epoch: 28, step: 424, loss: 0.3434985876083374, mean loss: 0.3485416597376376
Epoch: 28, step: 425, loss: 0.3146184980869293, mean loss: 0.3485408294678826
Epoch: 28, step: 426, loss: 0.3383760154247284, mean loss: 0.3485405806900358
Epoch: 28, step: 427, loss: 0.2816384434700012, mean loss: 0.3485389433396388
Epoch: 28, step: 428, loss: 0.3337799906730652, mean loss: 0.34853858214063077
Epoch: 28, step: 429, loss: 0.3575134575366974, mean loss: 0.3485388017793023
Epoch: 28, step: 430, loss: 0.3012552559375763, mean loss: 0.3485376446556001
Epoch: 28, step: 431, loss: 0.3045131266117096, mean loss: 0.3485365673132439
Epoch: 28, step: 432, loss: 0.3374965786933899, mean loss: 0.34853629715568557
Epoch: 28, step: 433, loss: 0.3303033411502838, mean loss: 0.34853585099124557
Epoch: 28, step: 434, loss: 0.30930572748184204, mean loss: 0.34853489104499286
Epoch: 28, step: 435, loss: 0.3372180461883545, mean loss: 0.34853461413286463
Epoch: 28, step: 436, loss: 0.34839102625846863, mean loss: 0.3485346106194957
Epoch: 28, step: 437, loss: 0.2879504859447479, mean loss: 0.34853312825774685
Epoch: 28, step: 438, loss: 0.3504944145679474, mean loss: 0.34853317624498253
Epoch: 28, step: 439, loss: 0.33501386642456055, mean loss: 0.34853284547306485
Epoch: 28, step: 440, loss: 0.3211674392223358, mean loss: 0.34853217595024416
Epoch: 28, step: 441, loss: 0.3284876048564911, mean loss: 0.34853168555118624
Epoch: 28, step: 442, loss: 0.3215552568435669, mean loss: 0.34853102557739524
Epoch: 28, step: 443, loss: 0.32263144850730896, mean loss: 0.3485303919640997
Epoch: 28, step: 444, loss: 0.3293451964855194, mean loss: 0.3485299226244838
Epoch: 28, step: 445, loss: 0.3626739978790283, mean loss: 0.34853026863151093
Epoch: 28, step: 446, loss: 0.3107945919036865, mean loss: 0.34852934552486137
Epoch: 28, step: 447, loss: 0.3416009545326233, mean loss: 0.34852917604367273
Epoch: 28, step: 448, loss: 0.3796905279159546, mean loss: 0.34852993828901585
Epoch: 28, step: 449, loss: 0.36706048250198364, mean loss: 0.3485303915580392
Epoch: 28, step: 450, loss: 0.33761584758758545, mean loss: 0.3485301245878078
Epoch: 28, step: 451, loss: 0.309025377035141, mean loss: 0.3485291583235589
Epoch: 28, step: 452, loss: 0.3470929265022278, mean loss: 0.34852912319498314
Epoch: 28, step: 453, loss: 0.3158932626247406, mean loss: 0.3485283249789539
Epoch: 28, step: 454, loss: 0.33395376801490784, mean loss: 0.34852796851951784
Epoch: 28, step: 455, loss: 0.3213352859020233, mean loss: 0.3485273034666266
Epoch: 28, step: 456, loss: 0.3172644078731537, mean loss: 0.3485265388870185
Epoch: 28, step: 457, loss: 0.3279608488082886, mean loss: 0.3485260359354392
Epoch: 28, step: 458, loss: 0.3895271420478821, mean loss: 0.3485270386281127
Epoch: 28, step: 459, loss: 0.3497377038002014, mean loss: 0.3485270682345191
Epoch: 28, step: 460, loss: 0.319673091173172, mean loss: 0.34852636263754505
Epoch: 28, step: 461, loss: 0.340106725692749, mean loss: 0.3485261567482472
Epoch: 28, step: 462, loss: 0.38649219274520874, mean loss: 0.34852708512667974
Epoch: 28, step: 463, loss: 0.33076873421669006, mean loss: 0.34852665089470325
Epoch: 28, step: 464, loss: 0.3428788185119629, mean loss: 0.3485265127957624
Epoch: 28, step: 465, loss: 0.37784138321876526, mean loss: 0.3485272295758109
Epoch: 28, step: 466, loss: 0.34882694482803345, mean loss: 0.34852723690399134
Epoch: 28, step: 467, loss: 0.30410099029541016, mean loss: 0.3485261506876928
Epoch: 28, step: 468, loss: 0.4010147750377655, mean loss: 0.3485274339967647
Epoch: 28, step: 469, loss: 0.34292808175086975, mean loss: 0.34852729709998104
Epoch: 28, step: 470, loss: 0.39588844776153564, mean loss: 0.34852845498939405
Epoch: 28, step: 471, loss: 0.3401029109954834, mean loss: 0.3485282490060185
Epoch: 28, step: 472, loss: 0.3034839332103729, mean loss: 0.3485271478126241
Epoch: 28, step: 473, loss: 0.32585278153419495, mean loss: 0.34852659350845655
Epoch: 28, step: 474, loss: 0.3397655785083771, mean loss: 0.3485263793393657
Epoch: 28, step: 475, loss: 0.36547353863716125, mean loss: 0.348526793614307
Epoch: 28, step: 476, loss: 0.3126707971096039, mean loss: 0.3485259171324447
Epoch: 28, step: 477, loss: 0.3346891701221466, mean loss: 0.3485255789083672
Epoch: 28, step: 478, loss: 0.3122272193431854, mean loss: 0.3485246916565385
Epoch: 28, step: 479, loss: 0.38230252265930176, mean loss: 0.348525517278141
Epoch: 28, step: 480, loss: 0.35351648926734924, mean loss: 0.3485256392680217
Epoch: 28, step: 481, loss: 0.3378348648548126, mean loss: 0.34852537796933636
Epoch: 28, step: 482, loss: 0.3284388482570648, mean loss: 0.3485248870361893
Epoch: 28, step: 483, loss: 0.30864208936691284, mean loss: 0.3485239122879815
Epoch: 28, step: 484, loss: 0.3548733592033386, mean loss: 0.3485240674666827
Epoch: 28, step: 485, loss: 0.431155800819397, mean loss: 0.3485260869137073
Epoch: 28, step: 486, loss: 0.34821754693984985, mean loss: 0.3485260793734455
Epoch: 28, step: 487, loss: 0.3139198422431946, mean loss: 0.3485252336687258
Epoch: 28, step: 488, loss: 0.2875082194805145, mean loss: 0.348523742575786
Epoch: 28, step: 489, loss: 0.31250613927841187, mean loss: 0.3485228624232202
Epoch: 28, step: 490, loss: 0.36069783568382263, mean loss: 0.34852315993252453
Epoch: 28, step: 491, loss: 0.28948864340782166, mean loss: 0.3485217173922908
Epoch: 28, step: 492, loss: 0.3239993751049042, mean loss: 0.34852111819028014
Epoch: 28, step: 493, loss: 0.3220486044883728, mean loss: 0.3485204713517496
Epoch: 28, step: 494, loss: 0.32682234048843384, mean loss: 0.34851994118509033
Epoch: 28, step: 495, loss: 0.3333630859851837, mean loss: 0.34851957085536006
Epoch: 28, step: 496, loss: 0.3150077760219574, mean loss: 0.34851875207662536
Epoch: 28, step: 497, loss: 0.36742353439331055, mean loss: 0.348519213957454
Epoch: 28, step: 498, loss: 0.386264830827713, mean loss: 0.34852013613421173
Epoch: 28, step: 499, loss: 0.3372170031070709, mean loss: 0.34851985999004514
Epoch: 28, step: 500, loss: 0.33315443992614746, mean loss: 0.34851948461027665
Epoch: 28, step: 501, loss: 0.3236502408981323, mean loss: 0.3485188770653577
Epoch: 28, step: 502, loss: 0.3309771716594696, mean loss: 0.3485184485395142
Epoch: 28, step: 503, loss: 0.3452472388744354, mean loss: 0.3485183686291745
Epoch: 28, step: 504, loss: 0.3353153169155121, mean loss: 0.34851804610794157
Epoch: 28, step: 505, loss: 0.34518370032310486, mean loss: 0.3485179646592683
Epoch: 28, step: 506, loss: 0.32402217388153076, mean loss: 0.34851736631073077
Epoch: 28, step: 507, loss: 0.33811283111572266, mean loss: 0.3485171121696659
Epoch: 28, step: 508, loss: 0.31843605637550354, mean loss: 0.3485163774280672
Epoch: 28, step: 509, loss: 0.2877196967601776, mean loss: 0.34851489248154116
Epoch: 28, step: 510, loss: 0.31027868390083313, mean loss: 0.3485139585927548
Epoch: 28, step: 511, loss: 0.3903357982635498, mean loss: 0.3485149800327624
Epoch: 28, step: 512, loss: 0.3305932581424713, mean loss: 0.34851454233043266
Epoch: 28, step: 513, loss: 0.3224579691886902, mean loss: 0.3485139059661201
Epoch: 28, step: 514, loss: 0.33318671584129333, mean loss: 0.3485135316483404
Epoch: 28, step: 515, loss: 0.35348597168922424, mean loss: 0.34851365308137844
Epoch: 28, step: 516, loss: 0.30730485916137695, mean loss: 0.3485126467370496
Epoch: 28, step: 517, loss: 0.31483936309814453, mean loss: 0.34851182443464085
Epoch: 28, step: 518, loss: 0.3083608150482178, mean loss: 0.34851084396995413
Epoch: 28, step: 519, loss: 0.32695847749710083, mean loss: 0.3485103176863423
Epoch: 28, step: 520, loss: 0.3510913848876953, mean loss: 0.34851038071144913
Epoch: 28, step: 521, loss: 0.31175318360328674, mean loss: 0.3485094831874684
Epoch: 28, step: 522, loss: 0.3496229648590088, mean loss: 0.34850951037539835
Epoch: 28, step: 523, loss: 0.3526028096675873, mean loss: 0.34850961031922323
Epoch: 28, step: 524, loss: 0.3123009204864502, mean loss: 0.3485087262532557
Epoch: 28, step: 525, loss: 0.3691978454589844, mean loss: 0.3485092313833696
Epoch: 28, step: 526, loss: 0.2922683358192444, mean loss: 0.34850785828110725
Epoch: 28, step: 527, loss: 0.3095296621322632, mean loss: 0.34850690666499035
Epoch: 28, step: 528, loss: 0.3321390450000763, mean loss: 0.3485065070687484
Epoch: 28, step: 529, loss: 0.3565636873245239, mean loss: 0.3485067037676463
Epoch: 28, step: 530, loss: 0.32724833488464355, mean loss: 0.3485061848025099
Epoch: 28, step: 531, loss: 0.3493026793003082, mean loss: 0.34850620424627754
Epoch: 28, step: 532, loss: 0.33163982629776, mean loss: 0.34850579251973174
Epoch: 28, step: 533, loss: 0.3300492465496063, mean loss: 0.348505341986461
Epoch: 28, step: 534, loss: 0.33526501059532166, mean loss: 0.34850501879141643
Epoch: 28, step: 535, loss: 0.32465696334838867, mean loss: 0.34850443667719455
Epoch: 28, step: 536, loss: 0.30294665694236755, mean loss: 0.34850332467105005
Epoch: 28, step: 537, loss: 0.3343029320240021, mean loss: 0.34850297806639674
Epoch: 28, step: 538, loss: 0.34019482135772705, mean loss: 0.3485027752849975
Epoch: 28, step: 539, loss: 0.3168187737464905, mean loss: 0.34850200197635894
Epoch: 28, step: 540, loss: 0.3136235773563385, mean loss: 0.3485011507224937
Epoch: 28, step: 541, loss: 0.37053173780441284, mean loss: 0.3485016883948489
Epoch: 28, step: 542, loss: 0.3868850767612457, mean loss: 0.34850262514624286
Epoch: 28, step: 543, loss: 0.3395223915576935, mean loss: 0.3485024059878675
Epoch: 28, step: 544, loss: 0.3344821333885193, mean loss: 0.34850206383806154
Epoch: 28, step: 545, loss: 0.34879446029663086, mean loss: 0.34850207097351127
Epoch: 28, step: 546, loss: 0.44539088010787964, mean loss: 0.3485044353262074
Epoch: 28, step: 547, loss: 0.317115843296051, mean loss: 0.3485036693771583
Epoch: 28, step: 548, loss: 0.3863293528556824, mean loss: 0.34850459238253834
Epoch: 28, step: 549, loss: 0.33007916808128357, mean loss: 0.34850414278456116
Epoch: 28, step: 550, loss: 0.34300705790519714, mean loss: 0.34850400865370496
Epoch: 28, step: 551, loss: 0.34120815992355347, mean loss: 0.3485038306367049
Epoch: 28, step: 552, loss: 0.35086971521377563, mean loss: 0.34850388836232593
Epoch: 28, step: 553, loss: 0.2998850345611572, mean loss: 0.34850270213156903
Epoch: 28, step: 554, loss: 0.344385027885437, mean loss: 0.3485026016686358
Epoch: 28, step: 555, loss: 0.3440311849117279, mean loss: 0.34850249257776145
Epoch: 28, step: 556, loss: 0.32090848684310913, mean loss: 0.3485018193726153
Epoch: 28, step: 557, loss: 0.31889304518699646, mean loss: 0.34850109703121046
Epoch: 28, step: 558, loss: 0.34161293506622314, mean loss: 0.3485009289903731
Epoch: 28, step: 559, loss: 0.34140825271606445, mean loss: 0.3485007559645077
Epoch: 28, step: 560, loss: 0.3378571569919586, mean loss: 0.34850049632020325
Epoch: 28, step: 561, loss: 0.3174450397491455, mean loss: 0.3484997387591804
Epoch: 28, step: 562, loss: 0.295724481344223, mean loss: 0.3484984514007851
Epoch: 28, step: 563, loss: 0.3213537931442261, mean loss: 0.3484977892713516
Epoch: 28, step: 564, loss: 0.305534690618515, mean loss: 0.3484967413142169
Epoch: 28, step: 565, loss: 0.29367268085479736, mean loss: 0.3484954040767794
Epoch: 28, step: 566, loss: 0.33446455001831055, mean loss: 0.34849506185247986
Epoch: 28, step: 567, loss: 0.3550625145435333, mean loss: 0.3484952220342528
Epoch: 28, step: 568, loss: 0.3331994116306305, mean loss: 0.34849484897480537
Epoch: 28, step: 569, loss: 0.3048595190048218, mean loss: 0.348493784750378
Epoch: 28, step: 570, loss: 0.31486162543296814, mean loss: 0.3484929645138266
Epoch: 28, step: 571, loss: 0.34616819024086, mean loss: 0.34849290781754644
Epoch: 28, step: 572, loss: 0.34056422114372253, mean loss: 0.34849271445852503
Epoch: 28, step: 573, loss: 0.3423035442829132, mean loss: 0.3484925635252427
Epoch: 28, step: 574, loss: 0.3190109431743622, mean loss: 0.3484918445840778
Epoch: 28, step: 575, loss: 0.3108980357646942, mean loss: 0.34849092784078817
Epoch: 28, step: 576, loss: 0.2951105535030365, mean loss: 0.3484896261661719
Epoch: 28, step: 577, loss: 0.29554516077041626, mean loss: 0.34848833515262895
Epoch: 28, step: 578, loss: 0.3087763488292694, mean loss: 0.34848736682739123
Epoch: 28, step: 579, loss: 0.3600727617740631, mean loss: 0.3484876493153203
Epoch: 28, step: 580, loss: 0.3254226744174957, mean loss: 0.3484870869332732
Epoch: 28, step: 581, loss: 0.3903215229511261, mean loss: 0.3484881069370772
Epoch: 28, step: 582, loss: 0.30189311504364014, mean loss: 0.3484869708894875
Epoch: 28, step: 583, loss: 0.3164229989051819, mean loss: 0.3484861891464608
Epoch: 28, step: 584, loss: 0.32755225896835327, mean loss: 0.3484856787744156
Epoch: 28, step: 585, loss: 0.3247705399990082, mean loss: 0.34848510061022486
Epoch: 28, step: 586, loss: 0.3431158661842346, mean loss: 0.3484849697139469
Epoch: 28, step: 587, loss: 0.30968332290649414, mean loss: 0.34848402379374194
Epoch: 28, step: 588, loss: 0.35443350672721863, mean loss: 0.3484841688287955
Epoch: 28, step: 589, loss: 0.30304670333862305, mean loss: 0.34848306119227146
Epoch: 28, step: 590, loss: 0.30072498321533203, mean loss: 0.3484818970141768
Epoch: 28, step: 591, loss: 0.33423781394958496, mean loss: 0.34848154980076357
Epoch: 28, step: 592, loss: 0.3368098735809326, mean loss: 0.34848126529921036
Epoch: 28, step: 593, loss: 0.3145860433578491, mean loss: 0.3484804391104047
Epoch: 28, step: 594, loss: 0.34198006987571716, mean loss: 0.348480280669153
Epoch: 28, step: 595, loss: 0.2927473783493042, mean loss: 0.3484789222577676
Epoch: 28, step: 596, loss: 0.351975679397583, mean loss: 0.348479007484245
Epoch: 28, step: 597, loss: 0.3428623676300049, mean loss: 0.3484788705931932
Epoch: 28, step: 598, loss: 0.3788730800151825, mean loss: 0.3484796113552858
Epoch: 28, step: 599, loss: 0.3316399157047272, mean loss: 0.34847920095131696
Epoch: 28, step: 600, loss: 0.307310551404953, mean loss: 0.34847819764545224
Epoch: 28, step: 601, loss: 0.2874959111213684, mean loss: 0.3484767115050193
Epoch: 28, step: 602, loss: 0.32776015996932983, mean loss: 0.3484762066542447
Epoch: 28, step: 603, loss: 0.3398233652114868, mean loss: 0.34847599579447663
Epoch: 28, step: 604, loss: 0.35532474517822266, mean loss: 0.34847616268653464
Epoch: 28, step: 605, loss: 0.35219502449035645, mean loss: 0.34847625330649185
Epoch: 28, step: 606, loss: 0.3811262547969818, mean loss: 0.3484770488912159
Epoch: 28, step: 607, loss: 0.4123695492744446, mean loss: 0.3484786057260206
Epoch: 28, step: 608, loss: 0.314260333776474, mean loss: 0.34847777196778007
Epoch: 28, step: 609, loss: 0.3421434760093689, mean loss: 0.34847761763085794
Epoch: 28, step: 610, loss: 0.353657066822052, mean loss: 0.3484777438265354
Epoch: 28, step: 611, loss: 0.30344516038894653, mean loss: 0.34847664664830136
Epoch: 28, step: 612, loss: 0.3186526596546173, mean loss: 0.3484759200314907
Epoch: 28, step: 613, loss: 0.3153117001056671, mean loss: 0.34847511205458853
Epoch: 28, step: 614, loss: 0.3501788377761841, mean loss: 0.34847515356129355
Epoch: 28, step: 615, loss: 0.3638339638710022, mean loss: 0.3484755277283738
Epoch: 28, step: 616, loss: 0.30775660276412964, mean loss: 0.3484745357693745
Epoch: 28, step: 617, loss: 0.315420538187027, mean loss: 0.34847373055627867
Epoch: 28, step: 618, loss: 0.3346641957759857, mean loss: 0.34847339415680534
Epoch: 28, step: 619, loss: 0.31589242815971375, mean loss: 0.34847260050568
Epoch: 28, step: 620, loss: 0.34940722584724426, mean loss: 0.3484726232719904
Epoch: 28, step: 621, loss: 0.32080644369125366, mean loss: 0.3484719493746946
Epoch: 28, step: 622, loss: 0.3410267233848572, mean loss: 0.348471768027088
Epoch: 28, step: 623, loss: 0.38669106364250183, mean loss: 0.3484726989335479
Epoch: 28, step: 624, loss: 0.36198708415031433, mean loss: 0.3484730280950847
Epoch: 28, step: 625, loss: 0.3033880591392517, mean loss: 0.348471930015077
Epoch: 28, step: 626, loss: 0.353513240814209, mean loss: 0.3484720527971905
Epoch: 28, step: 627, loss: 0.3038296699523926, mean loss: 0.34847096554967844
Epoch: 28, step: 628, loss: 0.2962600588798523, mean loss: 0.34846969400474115
Epoch: 28, step: 629, loss: 0.3070152699947357, mean loss: 0.34846868444787565
Epoch: 28, step: 630, loss: 0.35806000232696533, mean loss: 0.3484689180235491
Epoch: 28, step: 631, loss: 0.35722148418426514, mean loss: 0.34846913116805917
Epoch: 28, step: 632, loss: 0.3256131112575531, mean loss: 0.34846857458654423
Epoch: 28, step: 633, loss: 0.32583701610565186, mean loss: 0.34846802348445294
Epoch: 28, step: 634, loss: 0.30251941084861755, mean loss: 0.3484669046149802
Epoch: 28, step: 635, loss: 0.306596040725708, mean loss: 0.34846588506535786
Epoch: 28, step: 636, loss: 0.34903833270072937, mean loss: 0.3484658990040375
Epoch: 28, step: 637, loss: 0.3262098729610443, mean loss: 0.3484653570993372
Epoch: 28, step: 638, loss: 0.35091620683670044, mean loss: 0.34846541677282306
Epoch: 28, step: 639, loss: 0.3403322696685791, mean loss: 0.3484652187511269
Epoch: 28, step: 640, loss: 0.3035871386528015, mean loss: 0.348464126109243
Epoch: 28, step: 641, loss: 0.33440259099006653, mean loss: 0.34846378376286524
Epoch: 28, step: 642, loss: 0.33425775170326233, mean loss: 0.3484634379069417
Epoch: 28, step: 643, loss: 0.3226868510246277, mean loss: 0.3484628103729344
Epoch: 28, step: 644, loss: 0.3195478320121765, mean loss: 0.34846210645155845
Epoch: 28, step: 645, loss: 0.3626765310764313, mean loss: 0.34846245248653157
Epoch: 28, step: 646, loss: 0.39197078347206116, mean loss: 0.34846351162455796
Epoch: 28, step: 647, loss: 0.3137775659561157, mean loss: 0.3484626672733976
Epoch: 28, step: 648, loss: 0.357218474149704, mean loss: 0.3484628804085909
Epoch: 28, step: 649, loss: 0.3237384259700775, mean loss: 0.3484622785767804
Epoch: 28, step: 650, loss: 0.3496500253677368, mean loss: 0.34846230748768736
Epoch: 28, step: 651, loss: 0.33825528621673584, mean loss: 0.3484620590449537
Epoch: 28, step: 652, loss: 0.32712021470069885, mean loss: 0.3484615395890855
Epoch: 28, step: 653, loss: 0.3506990373134613, mean loss: 0.3484615940479699
Epoch: 28, step: 654, loss: 0.3596007823944092, mean loss: 0.3484618651602036
Epoch: 28, step: 655, loss: 0.32664546370506287, mean loss: 0.3484613341924891
Epoch: 28, step: 656, loss: 0.32640212774276733, mean loss: 0.34846079732845125
Epoch: 28, step: 657, loss: 0.3208824694156647, mean loss: 0.34846012615960453
Epoch: 28, step: 658, loss: 0.3154488801956177, mean loss: 0.3484593227903518
Epoch: 28, step: 659, loss: 0.31346017122268677, mean loss: 0.3484584710637002
Epoch: 28, step: 660, loss: 0.3304770886898041, mean loss: 0.3484580334859528
Epoch: 28, step: 661, loss: 0.2821444571018219, mean loss: 0.3484564197813637
Epoch: 28, step: 662, loss: 0.3527511954307556, mean loss: 0.34845652428983553
Epoch: 28, step: 663, loss: 0.3194849193096161, mean loss: 0.3484558193159943
Epoch: 28, step: 664, loss: 0.3337562084197998, mean loss: 0.34845546163511987
Epoch: 28, step: 665, loss: 0.3244730830192566, mean loss: 0.348454878093862
Epoch: 28, step: 666, loss: 0.3252969980239868, mean loss: 0.3484543146280825
Epoch: 28, step: 667, loss: 0.3202405869960785, mean loss: 0.34845362816269
Epoch: 28, step: 668, loss: 0.3881981074810028, mean loss: 0.34845459515812366
Epoch: 28, step: 669, loss: 0.3425670862197876, mean loss: 0.3484544519167014
Epoch: 28, step: 670, loss: 0.36683958768844604, mean loss: 0.34845489921095657
Epoch: 28, step: 671, loss: 0.3363643288612366, mean loss: 0.3484546050651228
Epoch: 28, step: 672, loss: 0.3125799298286438, mean loss: 0.3484537323081532
Epoch: 28, step: 673, loss: 0.34123486280441284, mean loss: 0.3484535566921968
Epoch: 28, step: 674, loss: 0.32523858547210693, mean loss: 0.34845299194723317
Epoch: 28, step: 675, loss: 0.30249643325805664, mean loss: 0.3484518740003934
Epoch: 28, step: 676, loss: 0.3405798375606537, mean loss: 0.3484516825085926
Epoch: 28, step: 677, loss: 0.2948451042175293, mean loss: 0.34845037852955363
Epoch: 28, step: 678, loss: 0.3043682277202606, mean loss: 0.34844930625812237
Epoch: 28, step: 679, loss: 0.3435613811016083, mean loss: 0.34844918736521624
Epoch: 28, step: 680, loss: 0.3094055652618408, mean loss: 0.3484482376991227
Epoch: 28, step: 681, loss: 0.29500025510787964, mean loss: 0.34844693770441065
Epoch: 28, step: 682, loss: 0.31603696942329407, mean loss: 0.34844614942839747
Epoch: 28, step: 683, loss: 0.32032158970832825, mean loss: 0.3484454653988294
Epoch: 28, step: 684, loss: 0.3069417178630829, mean loss: 0.34844445599280427
Epoch: 28, step: 685, loss: 0.3119438588619232, mean loss: 0.348443568289192
Epoch: 28, step: 686, loss: 0.31581780314445496, mean loss: 0.3484427748417554
Epoch: 28, step: 687, loss: 0.33315029740333557, mean loss: 0.348442402942985
Epoch: 28, step: 688, loss: 0.3078025281429291, mean loss: 0.34844141464321604
Epoch: 28, step: 689, loss: 0.3179333806037903, mean loss: 0.34844067275240237
Epoch: 28, step: 690, loss: 0.3474930226802826, mean loss: 0.34844064970811883
Epoch: 28, step: 691, loss: 0.35323283076286316, mean loss: 0.3484407662381513
Epoch: 28, step: 692, loss: 0.30267831683158875, mean loss: 0.3484396534734241
Epoch: 28, step: 693, loss: 0.32784774899482727, mean loss: 0.3484391527705967
Epoch: 28, step: 694, loss: 0.3441826403141022, mean loss: 0.34843904927380737
Epoch: 28, step: 695, loss: 0.32778316736221313, mean loss: 0.34843854703975974
Epoch: 28, step: 696, loss: 0.34569022059440613, mean loss: 0.34843848021765256
Epoch: 28, step: 697, loss: 0.3325447738170624, mean loss: 0.3484380937915305
Epoch: 28, step: 698, loss: 0.3247613310813904, mean loss: 0.34843751814876206
Epoch: 28, step: 699, loss: 0.33056360483169556, mean loss: 0.348437083598696
Epoch: 28, step: 700, loss: 0.32994866371154785, mean loss: 0.3484366341196916
Epoch: 28, step: 701, loss: 0.33109796047210693, mean loss: 0.3484362126028528
Epoch: 28, step: 702, loss: 0.3279048502445221, mean loss: 0.34843571348136604
Epoch: 28, step: 703, loss: 0.3322189748287201, mean loss: 0.34843531925882004
Epoch: 28, step: 704, loss: 0.37016531825065613, mean loss: 0.34843584749371787
Epoch: 28, step: 705, loss: 0.35597965121269226, mean loss: 0.34843603087170705
Epoch: 28, step: 706, loss: 0.34022533893585205, mean loss: 0.34843583128756705
Epoch: 28, step: 707, loss: 0.31196144223213196, mean loss: 0.3484349446957086
Epoch: 28, step: 708, loss: 0.3516048789024353, mean loss: 0.34843502174619856
Epoch: 28, step: 709, loss: 0.32243454456329346, mean loss: 0.3484343897769899
Epoch: 28, step: 710, loss: 0.33170756697654724, mean loss: 0.3484339832236807
Epoch: 28, step: 711, loss: 0.36367249488830566, mean loss: 0.34843435359388447
Epoch: 28, step: 712, loss: 0.3606289327144623, mean loss: 0.34843464997446827
Epoch: 28, step: 713, loss: 0.3189014494419098, mean loss: 0.3484339322084513
Epoch: 28, step: 714, loss: 0.3747481405735016, mean loss: 0.3484345717255088
Epoch: 28, step: 715, loss: 0.3347710371017456, mean loss: 0.3484342396672162
Epoch: 28, step: 716, loss: 0.29560232162475586, mean loss: 0.3484329557497931
Epoch: 28, step: 717, loss: 0.3192770183086395, mean loss: 0.34843224722154426
Epoch: 28, step: 718, loss: 0.365896612405777, mean loss: 0.3484326716186472
Epoch: 28, step: 719, loss: 0.3669392466545105, mean loss: 0.3484331213312987
Epoch: 28, step: 720, loss: 0.30275580286979675, mean loss: 0.348432011392328
Epoch: 28, step: 721, loss: 0.3207184076309204, mean loss: 0.34843133798017456
Epoch: 28, step: 722, loss: 0.3599693775177002, mean loss: 0.34843161833589165
Epoch: 28, step: 723, loss: 0.3222085237503052, mean loss: 0.34843098117254767
Epoch: 28, step: 724, loss: 0.3347736597061157, mean loss: 0.3484306493378302
Epoch: 28, step: 725, loss: 0.3136238753795624, mean loss: 0.34842980365111176
Epoch: 28, step: 726, loss: 0.3224034309387207, mean loss: 0.3484291713137685
Epoch: 28, step: 727, loss: 0.3424372971057892, mean loss: 0.34842902573859336
Epoch: 28, step: 728, loss: 0.34571877121925354, mean loss: 0.34842895989338746
Epoch: 28, step: 729, loss: 0.35448864102363586, mean loss: 0.34842910710880776
Epoch: 28, step: 730, loss: 0.3154416084289551, mean loss: 0.3484283057216717
Epoch: 28, step: 731, loss: 0.3386427164077759, mean loss: 0.3484280679996497
Epoch: 28, step: 732, loss: 0.32426854968070984, mean loss: 0.34842748110499844
Epoch: 28, step: 733, loss: 0.3332464396953583, mean loss: 0.3484271123287897
Epoch: 28, step: 734, loss: 0.37555643916130066, mean loss: 0.34842777133544145
Epoch: 28, step: 735, loss: 0.3378596901893616, mean loss: 0.34842751462923405
Epoch: 28, step: 736, loss: 0.3412027060985565, mean loss: 0.34842733913775914
Epoch: 28, step: 737, loss: 0.34233343601226807, mean loss: 0.348427191119709
Epoch: 28, step: 738, loss: 0.3484661877155304, mean loss: 0.34842719206689504
Epoch: 28, step: 739, loss: 0.3181605339050293, mean loss: 0.3484264569396687
Epoch: 28, step: 740, loss: 0.3557136058807373, mean loss: 0.3484266339282035
Epoch: 28, step: 741, loss: 0.3252502977848053, mean loss: 0.34842607104055245
Epoch: 28, step: 742, loss: 0.3253915011882782, mean loss: 0.3484255116095907
Epoch: 28, step: 743, loss: 0.316810667514801, mean loss: 0.348424743811745
Epoch: 28, step: 744, loss: 0.3569771647453308, mean loss: 0.34842495151072583
Epoch: 28, step: 745, loss: 0.3481596112251282, mean loss: 0.3484249450669868
Epoch: 28, step: 746, loss: 0.32159423828125, mean loss: 0.3484242935041323
Epoch: 28, step: 747, loss: 0.33639857172966003, mean loss: 0.3484240014759202
Epoch: 28, step: 748, loss: 0.33026236295700073, mean loss: 0.3484235604560683
Epoch: 28, step: 749, loss: 0.3943103849887848, mean loss: 0.3484246747007513
Epoch: 28, step: 750, loss: 0.30433374643325806, mean loss: 0.34842360409083295
Epoch: 28, step: 751, loss: 0.30685028433799744, mean loss: 0.34842259463765324
Epoch: 28, step: 752, loss: 0.3526042103767395, mean loss: 0.3484226961701466
Epoch: 28, step: 753, loss: 0.3585874140262604, mean loss: 0.3484229429704636
Epoch: 28, step: 754, loss: 0.3693123757839203, mean loss: 0.34842345015556603
Epoch: 28, step: 755, loss: 0.3215896487236023, mean loss: 0.34842279865995
Epoch: 28, step: 756, loss: 0.3519077003002167, mean loss: 0.3484228832675307
Epoch: 28, step: 757, loss: 0.3307727575302124, mean loss: 0.34842245476241446
Epoch: 28, step: 758, loss: 0.35511156916618347, mean loss: 0.3484226171550343
Epoch: 28, step: 759, loss: 0.3199259340763092, mean loss: 0.3484219253536389
Epoch: 28, step: 760, loss: 0.28186845779418945, mean loss: 0.3484203097037091
Epoch: 28, step: 761, loss: 0.3181728422641754, mean loss: 0.34841957543494567
Epoch: 28, step: 762, loss: 0.31068918108940125, mean loss: 0.34841865953752255
Epoch: 28, step: 763, loss: 0.34876683354377747, mean loss: 0.3484186679891685
Epoch: 28, step: 764, loss: 0.3517688512802124, mean loss: 0.3484187493102183
Epoch: 28, step: 765, loss: 0.3295248746871948, mean loss: 0.34841829069876573
Epoch: 28, step: 766, loss: 0.32725217938423157, mean loss: 0.3484177769457301
Epoch: 28, step: 767, loss: 0.29813647270202637, mean loss: 0.34841655652572423
Epoch: 28, step: 768, loss: 0.3372504711151123, mean loss: 0.3484162855108117
Epoch: 28, step: 769, loss: 0.368471622467041, mean loss: 0.34841677226720597
Epoch: 28, step: 770, loss: 0.31931087374687195, mean loss: 0.34841606586479545
Epoch: 28, step: 771, loss: 0.3695366382598877, mean loss: 0.3484165784502822
Epoch: 28, step: 772, loss: 0.3152863681316376, mean loss: 0.34841577441654065
Epoch: 28, step: 773, loss: 0.3234829306602478, mean loss: 0.3484151693385482
Epoch: 28, step: 774, loss: 0.34857186675071716, mean loss: 0.3484151731412374
Epoch: 28, step: 775, loss: 0.3013794422149658, mean loss: 0.34841403171891827
Epoch: 28, step: 776, loss: 0.327210932970047, mean loss: 0.34841351719299557
Epoch: 28, step: 777, loss: 0.3124505579471588, mean loss: 0.3484126445174497
Epoch: 28, step: 778, loss: 0.3337048590183258, mean loss: 0.34841228762765086
Epoch: 28, step: 779, loss: 0.33354318141937256, mean loss: 0.3484119268321008
Epoch: 28, step: 780, loss: 0.31464067101478577, mean loss: 0.3484111073999843
Epoch: 28, step: 781, loss: 0.33859556913375854, mean loss: 0.3484108692396925
Epoch: 28, step: 782, loss: 0.3379143178462982, mean loss: 0.34841061456175015
Epoch: 28, step: 783, loss: 0.3235067129135132, mean loss: 0.34841001033276997
Epoch: 28, step: 784, loss: 0.3035183846950531, mean loss: 0.3484089211796138
Epoch: 28, step: 785, loss: 0.3464811444282532, mean loss: 0.3484088744093496
Epoch: 28, step: 786, loss: 0.33413445949554443, mean loss: 0.3484085281026727
Epoch: 28, step: 787, loss: 0.31528881192207336, mean loss: 0.3484077246161084
Epoch: 28, step: 788, loss: 0.36977729201316833, mean loss: 0.3484082430306883
Epoch: 28, step: 789, loss: 0.3161412179470062, mean loss: 0.34840746026844766
Epoch: 28, step: 790, loss: 0.33219850063323975, mean loss: 0.3484070670666032
Epoch: 28, step: 791, loss: 0.34796133637428284, mean loss: 0.34840705625419555
Epoch: 28, step: 792, loss: 0.391429603099823, mean loss: 0.34840809985751503
Epoch: 28, step: 793, loss: 0.3319130837917328, mean loss: 0.34840769974554525
Epoch: 28, step: 794, loss: 0.343061625957489, mean loss: 0.34840757007145334
Epoch: 28, step: 795, loss: 0.31612685322761536, mean loss: 0.34840678709103123
Epoch: 28, step: 796, loss: 0.33872029185295105, mean loss: 0.34840655214729654
Epoch: 28, step: 797, loss: 0.38198745250701904, mean loss: 0.3484073666246276
Epoch: 28, step: 798, loss: 0.35440483689308167, mean loss: 0.3484075120848461
Epoch: 28, step: 799, loss: 0.3123050332069397, mean loss: 0.3484066364911597
Epoch: 28, step: 800, loss: 0.37345296144485474, mean loss: 0.3484072439251314
Epoch: 28, step: 801, loss: 0.3418477475643158, mean loss: 0.3484070848453341
Epoch: 28, step: 802, loss: 0.34151193499565125, mean loss: 0.3484069176293804
Epoch: 28, step: 803, loss: 0.34485360980033875, mean loss: 0.348406831459339
Epoch: 28, step: 804, loss: 0.32822751998901367, mean loss: 0.3484063421096901
Epoch: 28, step: 805, loss: 0.3311142325401306, mean loss: 0.34840592278504856
Epoch: 28, step: 806, loss: 0.32096606492996216, mean loss: 0.34840525739893696
Epoch: 28, step: 807, loss: 0.34448954463005066, mean loss: 0.3484051624495488
Epoch: 28, step: 808, loss: 0.31370803713798523, mean loss: 0.34840432112355496
Epoch: 28, step: 809, loss: 0.3436095416545868, mean loss: 0.3484042048639296
Epoch: 28, step: 810, loss: 0.3618709146976471, mean loss: 0.3484045313850322
Epoch: 28, step: 811, loss: 0.3449515998363495, mean loss: 0.34840444766542333
Epoch: 28, step: 812, loss: 0.3143496513366699, mean loss: 0.3484036219945219
Epoch: 28, step: 813, loss: 0.3735872805118561, mean loss: 0.34840423256666264
Epoch: 28, step: 814, loss: 0.3169066905975342, mean loss: 0.34840346893435076
Epoch: 28, step: 815, loss: 0.39236098527908325, mean loss: 0.34840453462278037
Epoch: 28, step: 816, loss: 0.32866552472114563, mean loss: 0.3484040560897274
Epoch: 28, step: 817, loss: 0.3489725589752197, mean loss: 0.34840406987161554
Epoch: 28, step: 818, loss: 0.37060683965682983, mean loss: 0.3484046081075319
Epoch: 28, step: 819, loss: 0.2958016097545624, mean loss: 0.3484033329451554
Epoch: 28, step: 820, loss: 0.3412432074546814, mean loss: 0.34840315937897864
Epoch: 28, step: 821, loss: 0.33313125371932983, mean loss: 0.3484027891868601
Epoch: 28, step: 822, loss: 0.3473704755306244, mean loss: 0.34840276416410754
Epoch: 28, step: 823, loss: 0.3634302318096161, mean loss: 0.3484031284133718
Epoch: 28, step: 824, loss: 0.3280712366104126, mean loss: 0.34840263560265355
Epoch: 28, step: 825, loss: 0.3034699559211731, mean loss: 0.3484015465367831
Epoch: 28, step: 826, loss: 0.33107489347457886, mean loss: 0.348401126588334
Epoch: 28, step: 827, loss: 0.3309815526008606, mean loss: 0.34840070439798043
Epoch: 28, step: 828, loss: 0.3306393325328827, mean loss: 0.3484002739340589
Epoch: 28, step: 829, loss: 0.32544681429862976, mean loss: 0.3483997176483812
Epoch: 28, step: 830, loss: 0.3112998306751251, mean loss: 0.348398818540537
Epoch: 28, step: 831, loss: 0.3710157871246338, mean loss: 0.34839936664466126
Epoch: 28, step: 832, loss: 0.296676367521286, mean loss: 0.348398113209568
Epoch: 28, step: 833, loss: 0.3841099143028259, mean loss: 0.34839897861452834
Epoch: 28, step: 834, loss: 0.33582204580307007, mean loss: 0.3483986738447895
Epoch: 28, step: 835, loss: 0.3437312841415405, mean loss: 0.34839856074530073
Epoch: 28, step: 836, loss: 0.34481102228164673, mean loss: 0.34839847381471206
Epoch: 28, step: 837, loss: 0.34835338592529297, mean loss: 0.34839847272220204
Epoch: 28, step: 838, loss: 0.3403574228286743, mean loss: 0.3483982778868481
Epoch: 28, step: 839, loss: 0.339540958404541, mean loss: 0.3483980632784094
Epoch: 28, step: 840, loss: 0.307997465133667, mean loss: 0.3483970844157596
Epoch: 28, step: 841, loss: 0.3312024772167206, mean loss: 0.34839666781918066
Epoch: 28, step: 842, loss: 0.34093955159187317, mean loss: 0.34839648715010185
Epoch: 28, step: 843, loss: 0.32597294449806213, mean loss: 0.3483959438914854
Epoch: 28, step: 844, loss: 0.36847835779190063, mean loss: 0.34839643041942836
Epoch: 28, step: 845, loss: 0.33629462122917175, mean loss: 0.3483961372412417
Epoch: 28, step: 846, loss: 0.3254004120826721, mean loss: 0.3483955801607611
Epoch: 28, step: 847, loss: 0.3051290810108185, mean loss: 0.3483945320382042
Epoch: 28, step: 848, loss: 0.41019752621650696, mean loss: 0.3483960291674932
Epoch: 28, step: 849, loss: 0.3096808195114136, mean loss: 0.3483950913444794
Epoch: 28, step: 850, loss: 0.33603236079216003, mean loss: 0.3483947918814909
Epoch: 28, step: 851, loss: 0.2930384874343872, mean loss: 0.3483934510156725
Epoch: 28, step: 852, loss: 0.3570324778556824, mean loss: 0.34839366026907786
Epoch: 28, step: 853, loss: 0.3011600971221924, mean loss: 0.34839251621145184
Epoch: 28, step: 854, loss: 0.34839627146720886, mean loss: 0.34839251630240675
Epoch: 28, step: 855, loss: 0.3229799270629883, mean loss: 0.34839190080663945
Epoch: 28, step: 856, loss: 0.35936203598976135, mean loss: 0.34839216649811133
Epoch: 28, step: 857, loss: 0.3972877562046051, mean loss: 0.3483933506974261
Epoch: 28, step: 858, loss: 0.295906662940979, mean loss: 0.3483920795563117
Epoch: 28, step: 859, loss: 0.3358522653579712, mean loss: 0.34839177587002385
Epoch: 28, step: 860, loss: 0.3427048921585083, mean loss: 0.3483916381497393
Epoch: 28, step: 861, loss: 0.3191341459751129, mean loss: 0.34839092963295293
Epoch: 28, step: 862, loss: 0.35848507285118103, mean loss: 0.3483911740727935
Epoch: 28, step: 863, loss: 0.30773866176605225, mean loss: 0.34839018965511853
Epoch: 28, step: 864, loss: 0.33308082818984985, mean loss: 0.3483898189414719
Epoch: 28, step: 865, loss: 0.29105931520462036, mean loss: 0.34838843072645576
Epoch: 28, step: 866, loss: 0.3438364565372467, mean loss: 0.34838832050649426
Epoch: 28, step: 867, loss: 0.34581735730171204, mean loss: 0.3483882582555692
Epoch: 28, step: 868, loss: 0.3902395963668823, mean loss: 0.34838927158062455
Epoch: 28, step: 869, loss: 0.331150084733963, mean loss: 0.3483888541871122
Epoch: 28, step: 870, loss: 0.34344154596328735, mean loss: 0.3483887344062676
Epoch: 28, step: 871, loss: 0.32464972138404846, mean loss: 0.3483881596674282
Epoch: 28, step: 872, loss: 0.3060520887374878, mean loss: 0.34838713470505245
Epoch: 28, step: 873, loss: 0.3259459435939789, mean loss: 0.3483865914137361
Epoch: 28, step: 874, loss: 0.3111876845359802, mean loss: 0.3483856908664469
Epoch: 28, step: 875, loss: 0.31936389207839966, mean loss: 0.34838498829554565
Epoch: 28, step: 876, loss: 0.3165254592895508, mean loss: 0.34838421704644723
Epoch: 28, step: 877, loss: 0.32286277413368225, mean loss: 0.34838359924342344
Epoch: 28, step: 878, loss: 0.3235073387622833, mean loss: 0.34838299707304554
Epoch: 28, step: 879, loss: 0.32291141152381897, mean loss: 0.34838238050678033
Epoch: 28, step: 880, loss: 0.3415246307849884, mean loss: 0.3483822145118218
Epoch: 28, step: 881, loss: 0.40222030878067017, mean loss: 0.34838351765589565
Epoch: 28, step: 882, loss: 0.3295951187610626, mean loss: 0.3483830628961499
Epoch: 28, step: 883, loss: 0.29423537850379944, mean loss: 0.34838175232193186
Epoch: 28, step: 884, loss: 0.39382779598236084, mean loss: 0.34838285225764015
Epoch: 28, step: 885, loss: 0.3718574047088623, mean loss: 0.34838342040112363
Epoch: 28, step: 886, loss: 0.3322492241859436, mean loss: 0.34838302992225884
Epoch: 28, step: 887, loss: 0.37071657180786133, mean loss: 0.34838357042424056
Epoch: 28, step: 888, loss: 0.32460761070251465, mean loss: 0.3483829950277177
Epoch: 28, step: 889, loss: 0.29829463362693787, mean loss: 0.3483817828801595
Epoch: 28, step: 890, loss: 0.3209974467754364, mean loss: 0.3483811201902264
Epoch: 28, step: 891, loss: 0.33744221925735474, mean loss: 0.348380855479624
Epoch: 28, step: 892, loss: 0.3073122501373291, mean loss: 0.34837986168397145
Epoch: 28, step: 893, loss: 0.3029583990573883, mean loss: 0.34837876258261574
Epoch: 28, step: 894, loss: 0.3347242772579193, mean loss: 0.34837843218153836
Epoch: 28, step: 895, loss: 0.27085235714912415, mean loss: 0.34837655630864267
Epoch: 28, step: 896, loss: 0.3331402540206909, mean loss: 0.3483761876497763
Epoch: 28, step: 897, loss: 0.3268466591835022, mean loss: 0.3483756667320781
Epoch: 28, step: 898, loss: 0.3409017026424408, mean loss: 0.348375485900158
Epoch: 28, step: 899, loss: 0.3295193016529083, mean loss: 0.34837502968743544
Epoch: 28, step: 900, loss: 0.4085037410259247, mean loss: 0.34837648442605446
Epoch: 28, step: 901, loss: 0.31122496724128723, mean loss: 0.3483755856135228
Epoch: 28, step: 902, loss: 0.3322119414806366, mean loss: 0.34837519457338406
Epoch: 28, step: 903, loss: 0.3158973157405853, mean loss: 0.3483744088689416
Epoch: 28, step: 904, loss: 0.30502402782440186, mean loss: 0.34837336016243065
Epoch: 28, step: 905, loss: 0.3427688479423523, mean loss: 0.3483732245847002
Epoch: 28, step: 906, loss: 0.29621151089668274, mean loss: 0.3483719627807454
Epoch: 28, step: 907, loss: 0.33719924092292786, mean loss: 0.34837169251654954
Epoch: 28, step: 908, loss: 0.30929768085479736, mean loss: 0.3483707473528703
Epoch: 28, step: 909, loss: 0.3422260880470276, mean loss: 0.3483705987229224
Epoch: 28, step: 910, loss: 0.3434384763240814, mean loss: 0.34837047942528077
Epoch: 28, step: 911, loss: 0.36192333698272705, mean loss: 0.3483708072324005
Epoch: 28, step: 912, loss: 0.31466779112815857, mean loss: 0.3483699920669366
Epoch: 28, step: 913, loss: 0.33110907673835754, mean loss: 0.34836957459208223
Epoch: 28, step: 914, loss: 0.3170725107192993, mean loss: 0.3483688176553305
Epoch: 28, step: 915, loss: 0.3533555865287781, mean loss: 0.3483689382601693
Epoch: 28, step: 916, loss: 0.35819947719573975, mean loss: 0.34836917600567546
Epoch: 28, step: 917, loss: 0.3214605450630188, mean loss: 0.3483685252528111
Epoch: 28, step: 918, loss: 0.35201311111450195, mean loss: 0.3483686133906037
Epoch: 28, step: 919, loss: 0.31538504362106323, mean loss: 0.3483678157612322
Epoch: 28, step: 920, loss: 0.34310752153396606, mean loss: 0.3483676885565741
Epoch: 28, step: 921, loss: 0.3202717900276184, mean loss: 0.3483670091567934
Epoch: 28, step: 922, loss: 0.3101454973220825, mean loss: 0.34836608492727256
Epoch: 28, step: 923, loss: 0.3387722969055176, mean loss: 0.34836585294671296
Epoch: 28, step: 924, loss: 0.3263843059539795, mean loss: 0.34836532143942295
Epoch: 28, step: 925, loss: 0.3477862775325775, mean loss: 0.34836530743865146
Epoch: 28, step: 926, loss: 0.3217962980270386, mean loss: 0.34836466503894614
Epoch: 28, step: 927, loss: 0.3746919631958008, mean loss: 0.348365301579037
Epoch: 28, step: 928, loss: 0.3240380585193634, mean loss: 0.34836471341039843
Epoch: 28, step: 929, loss: 0.3313618302345276, mean loss: 0.348364302335422
Epoch: 28, step: 930, loss: 0.34261399507522583, mean loss: 0.3483641633148659
Epoch: 28, step: 931, loss: 0.3280201852321625, mean loss: 0.3483636714867525
Epoch: 28, step: 932, loss: 0.3691718876361847, mean loss: 0.34836417452594387
Epoch: 28, step: 933, loss: 0.3263932466506958, mean loss: 0.3483636433910052
Epoch: 28, step: 934, loss: 0.32603007555007935, mean loss: 0.3483631035024988
Epoch: 28, step: 935, loss: 0.3687320053577423, mean loss: 0.34836359588554505
Epoch: 28, step: 936, loss: 0.33268240094184875, mean loss: 0.3483632168288856
Epoch: 28, step: 937, loss: 0.3592049479484558, mean loss: 0.34836347889635283
Epoch: 28, step: 938, loss: 0.36375463008880615, mean loss: 0.34836385092388883
Epoch: 28, step: 939, loss: 0.32819318771362305, mean loss: 0.34836336338006185
Epoch: 28, step: 940, loss: 0.32874226570129395, mean loss: 0.34836288913121166
Epoch: 28, step: 941, loss: 0.35628336668014526, mean loss: 0.34836308056732007
Epoch: 28, step: 942, loss: 0.41494816541671753, mean loss: 0.34836468987450675
Epoch: 28, step: 943, loss: 0.3190842270851135, mean loss: 0.3483639822067092
Epoch: 28, step: 944, loss: 0.3305917978286743, mean loss: 0.34836355268827196
Epoch: 28, step: 945, loss: 0.3360636830329895, mean loss: 0.34836325543200886
Epoch: 28, step: 946, loss: 0.2950728237628937, mean loss: 0.34836196757025123
Epoch: 28, step: 947, loss: 0.34413301944732666, mean loss: 0.3483618653723749
Epoch: 28, step: 948, loss: 0.3455253839492798, mean loss: 0.3483617968268728
Epoch: 28, step: 949, loss: 0.35679808259010315, mean loss: 0.3483620006905276
Epoch: 28, step: 950, loss: 0.3263551890850067, mean loss: 0.34836146890666453
Epoch: 28, step: 951, loss: 0.33723631501197815, mean loss: 0.34836120007924587
Epoch: 28, step: 952, loss: 0.3465856909751892, mean loss: 0.3483611571770082
Epoch: 28, step: 953, loss: 0.3448212742805481, mean loss: 0.3483610716436661
Epoch: 28, step: 954, loss: 0.30820727348327637, mean loss: 0.3483601014405066
Epoch: 28, step: 955, loss: 0.39436933398246765, mean loss: 0.3483612130968452
Epoch: 28, step: 956, loss: 0.3436480760574341, mean loss: 0.3483610992226989
Epoch: 28, step: 957, loss: 0.35429397225379944, mean loss: 0.34836124256343415
Epoch: 28, step: 958, loss: 0.31843283772468567, mean loss: 0.3483605194979166
Epoch: 28, step: 959, loss: 0.3412507176399231, mean loss: 0.3483603477303804
Epoch: 28, step: 960, loss: 0.3160453140735626, mean loss: 0.34835956704201143
Epoch: 28, step: 961, loss: 0.38907378911972046, mean loss: 0.3483605506198748
Epoch: 28, step: 962, loss: 0.30381399393081665, mean loss: 0.3483594744861222
Epoch: 28, step: 963, loss: 0.31314873695373535, mean loss: 0.3483586239030337
Epoch: 28, step: 964, loss: 0.327714741230011, mean loss: 0.3483581252223884
Epoch: 28, step: 965, loss: 0.3461768925189972, mean loss: 0.3483580725330627
Epoch: 28, step: 966, loss: 0.3351650834083557, mean loss: 0.34835775385413026
Epoch: 28, step: 967, loss: 0.38045844435691833, mean loss: 0.34835852923312793
Epoch: 28, step: 968, loss: 0.3279905915260315, mean loss: 0.3483580372658395
Epoch: 28, step: 969, loss: 0.3284071981906891, mean loss: 0.3483575553847933
Epoch: 28, step: 970, loss: 0.36181965470314026, mean loss: 0.348357880532713
Epoch: 28, step: 971, loss: 0.3512861132621765, mean loss: 0.348357951256139
Epoch: 28, step: 972, loss: 0.3487510681152344, mean loss: 0.34835796075056863
Epoch: 28, step: 973, loss: 0.3494446277618408, mean loss: 0.34835798699476056
Epoch: 28, step: 974, loss: 0.3745865225791931, mean loss: 0.3483586204271653
Epoch: 28, step: 975, loss: 0.3003661036491394, mean loss: 0.34835746141159396
Epoch: 28, step: 976, loss: 0.34487658739089966, mean loss: 0.3483573773507854
Epoch: 28, step: 977, loss: 0.31565752625465393, mean loss: 0.34835658769004896
Epoch: 28, step: 978, loss: 0.3257289230823517, mean loss: 0.3483560412732851
Epoch: 28, step: 979, loss: 0.30230745673179626, mean loss: 0.3483549293109423
Epoch: 28, step: 980, loss: 0.3260807693004608, mean loss: 0.3483543914566451
Epoch: 28, step: 981, loss: 0.3741777241230011, mean loss: 0.34835501499778254
Epoch: 28, step: 982, loss: 0.31807664036750793, mean loss: 0.3483542839009666
Epoch: 28, step: 983, loss: 0.362720787525177, mean loss: 0.34835463078390133
Epoch: 28, step: 984, loss: 0.3584909439086914, mean loss: 0.3483548755218863
Epoch: 28, step: 985, loss: 0.3107280433177948, mean loss: 0.34835396705619015
Epoch: 28, step: 986, loss: 0.3231390118598938, mean loss: 0.348353358278692
Epoch: 28, step: 987, loss: 0.30439281463623047, mean loss: 0.34835229694253456
Epoch: 28, step: 988, loss: 0.34095299243927, mean loss: 0.3483521183059854
Epoch: 28, step: 989, loss: 0.36269521713256836, mean loss: 0.3483524645736409
Epoch: 28, step: 990, loss: 0.33026647567749023, mean loss: 0.3483520279565708
Epoch: 28, step: 991, loss: 0.31489476561546326, mean loss: 0.3483512202783567
Epoch: 28, step: 992, loss: 0.31078052520751953, mean loss: 0.3483503133213242
Epoch: 28, step: 993, loss: 0.2985074520111084, mean loss: 0.34834911014309533
Epoch: 28, step: 994, loss: 0.36633482575416565, mean loss: 0.3483495442975263
Epoch: 28, step: 995, loss: 0.3379647135734558, mean loss: 0.3483492936257409
Epoch: 28, step: 996, loss: 0.3735218942165375, mean loss: 0.3483499012339523
Epoch: 28, step: 997, loss: 0.3000021278858185, mean loss: 0.3483487342589741
Epoch: 28, step: 998, loss: 0.31748446822166443, mean loss: 0.3483479893031189
Epoch: 28, step: 999, loss: 0.37889111042022705, mean loss: 0.3483487264898614
Epoch: 28, step: 1000, loss: 0.3584676682949066, mean loss: 0.3483489707140741
Epoch: 28, step: 1001, loss: 0.3337102234363556, mean loss: 0.34834861741129675
Epoch: 28, step: 1002, loss: 0.3237389028072357, mean loss: 0.34834802347586524
Epoch: 28, step: 1003, loss: 0.3524459898471832, mean loss: 0.3483481223745613
Epoch: 28, step: 1004, loss: 0.354192852973938, mean loss: 0.34834826342556885
Epoch: 28, step: 1005, loss: 0.308403342962265, mean loss: 0.34834729945721943
Epoch: 28, step: 1006, loss: 0.3400338888168335, mean loss: 0.34834709883918713
Epoch: 28, step: 1007, loss: 0.3613165318965912, mean loss: 0.34834741180813156
Epoch: 28, step: 1008, loss: 0.33695662021636963, mean loss: 0.34834713694045
Epoch: 28, step: 1009, loss: 0.351594477891922, mean loss: 0.3483472152991429
Epoch: 28, step: 1010, loss: 0.29490017890930176, mean loss: 0.3483459256474191
Epoch: 28, step: 1011, loss: 0.33318108320236206, mean loss: 0.3483455597357686
Epoch: 28, step: 1012, loss: 0.3822987675666809, mean loss: 0.34834637897108844
Epoch: 28, step: 1013, loss: 0.3504650890827179, mean loss: 0.3483464300908614
Epoch: 28, step: 1014, loss: 0.29428061842918396, mean loss: 0.3483451256342865
Epoch: 28, step: 1015, loss: 0.31471794843673706, mean loss: 0.3483443143242788
Epoch: 28, step: 1016, loss: 0.33167800307273865, mean loss: 0.3483439122322802
Epoch: 28, step: 1017, loss: 0.37201574444770813, mean loss: 0.34834448332594037
Epoch: 28, step: 1018, loss: 0.3231334090232849, mean loss: 0.34834387511204196
Epoch: 28, step: 1019, loss: 0.35649043321609497, mean loss: 0.3483440716419586
Epoch: 28, step: 1020, loss: 0.31844937801361084, mean loss: 0.34834335047114756
Epoch: 28, step: 1021, loss: 0.32793551683425903, mean loss: 0.3483428581704375
Epoch: 28, step: 1022, loss: 0.3288240432739258, mean loss: 0.3483423873269953
Epoch: 28, step: 1023, loss: 0.3604891896247864, mean loss: 0.34834268033168214
Epoch: 28, step: 1024, loss: 0.3309685289859772, mean loss: 0.34834226124319656
Epoch: 28, step: 1025, loss: 0.3453415632247925, mean loss: 0.34834218886396895
Epoch: 28, step: 1026, loss: 0.2968684136867523, mean loss: 0.34834094730543697
Epoch: 28, step: 1027, loss: 0.295015424489975, mean loss: 0.3483396611133768
Epoch: 28, step: 1028, loss: 0.3128686547279358, mean loss: 0.34833880558634206
Epoch: 28, step: 1029, loss: 0.34114769101142883, mean loss: 0.3483386321476615
Epoch: 28, step: 1030, loss: 0.293831467628479, mean loss: 0.34833731754995945
Epoch: 28, step: 1031, loss: 0.2889634072780609, mean loss: 0.34833588561116263
Epoch: 28, step: 1032, loss: 0.3154694736003876, mean loss: 0.3483350929809441
Epoch: 28, step: 1033, loss: 0.3406279981136322, mean loss: 0.3483349071155395
Epoch: 28, step: 1034, loss: 0.32378917932510376, mean loss: 0.34833431518152475
Epoch: 28, step: 1035, loss: 0.37301358580589294, mean loss: 0.3483349103216478
Epoch: 28, step: 1036, loss: 0.31704452633857727, mean loss: 0.34833415577285276
Epoch: 28, step: 1037, loss: 0.33081528544425964, mean loss: 0.3483337333260158
Epoch: 28, step: 1038, loss: 0.29951170086860657, mean loss: 0.3483325560688371
Epoch: 28, step: 1039, loss: 0.35141539573669434, mean loss: 0.34833263040428436
Epoch: 28, step: 1040, loss: 0.3419800400733948, mean loss: 0.3483324772301631
Epoch: 28, step: 1041, loss: 0.3244442939758301, mean loss: 0.34833190125043473
Epoch: 28, step: 1042, loss: 0.29766350984573364, mean loss: 0.3483306795894003
Epoch: 28, step: 1043, loss: 0.30544814467430115, mean loss: 0.3483296456773809
Epoch: 28, step: 1044, loss: 0.34935688972473145, mean loss: 0.34832967044397556
Epoch: 28, step: 1045, loss: 0.3198632001876831, mean loss: 0.34832898414111
Epoch: 28, step: 1046, loss: 0.3468951880931854, mean loss: 0.34832894957431604
Epoch: 28, step: 1047, loss: 0.38913068175315857, mean loss: 0.3483299332226328
Epoch: 28, step: 1048, loss: 0.33566412329673767, mean loss: 0.34832962788259936
Epoch: 28, step: 1049, loss: 0.3353085517883301, mean loss: 0.34832931398558153
Epoch: 28, step: 1050, loss: 0.30513715744018555, mean loss: 0.3483282727842088
Epoch: 28, step: 1051, loss: 0.37720581889152527, mean loss: 0.34832896889707415
Epoch: 28, step: 1052, loss: 0.35406023263931274, mean loss: 0.3483291070497496
Epoch: 28, step: 1053, loss: 0.2887943685054779, mean loss: 0.3483276719936212
Epoch: 28, step: 1054, loss: 0.32705873250961304, mean loss: 0.3483271593284614
Epoch: 28, step: 1055, loss: 0.4833649694919586, mean loss: 0.34833041419276345
Epoch: 28, step: 1056, loss: 0.31533634662628174, mean loss: 0.348329618944202
Epoch: 28, step: 1057, loss: 0.3313915729522705, mean loss: 0.3483292107001434
Epoch: 28, step: 1058, loss: 0.30357101559638977, mean loss: 0.34832813195547335
Epoch: 28, step: 1059, loss: 0.33448338508605957, mean loss: 0.3483277982827926
Epoch: 28, step: 1060, loss: 0.32320019602775574, mean loss: 0.3483271926962538
Epoch: 28, step: 1061, loss: 0.32216310501098633, mean loss: 0.34832656214514557
Epoch: 28, step: 1062, loss: 0.3212651312351227, mean loss: 0.3483259099838994
Epoch: 28, step: 1063, loss: 0.31874778866767883, mean loss: 0.3483251971893815
Epoch: 28, step: 1064, loss: 0.2983916103839874, mean loss: 0.3483239938834363
Epoch: 28, step: 1065, loss: 0.32052797079086304, mean loss: 0.3483233240674671
Epoch: 28, step: 1066, loss: 0.31239843368530273, mean loss: 0.3483224583865981
Epoch: 28, step: 1067, loss: 0.348409503698349, mean loss: 0.3483224604840755
Epoch: 28, step: 1068, loss: 0.31487396359443665, mean loss: 0.3483216545156196
Epoch: 28, step: 1069, loss: 0.3266502022743225, mean loss: 0.34832113233711637
Epoch: 28, step: 1070, loss: 0.3206479847431183, mean loss: 0.34832046556248336
Epoch: 28, step: 1071, loss: 0.30695435404777527, mean loss: 0.3483194688847772
Epoch: 28, step: 1072, loss: 0.32393860816955566, mean loss: 0.34831888146493106
Epoch: 28, step: 1073, loss: 0.2939464747905731, mean loss: 0.348317571475853
Epoch: 28, step: 1074, loss: 0.31002870202064514, mean loss: 0.3483166490080896
Epoch: 28, step: 1075, loss: 0.3237052261829376, mean loss: 0.34831605607605665
Epoch: 28, step: 1076, loss: 0.312633216381073, mean loss: 0.3483151964350223
Epoch: 28, step: 1077, loss: 0.32805371284484863, mean loss: 0.34831470832411915
Epoch: 28, step: 1078, loss: 0.34703758358955383, mean loss: 0.34831467755818396
Epoch: 28, step: 1079, loss: 0.36385074257850647, mean loss: 0.3483150518129782
Epoch: 28, step: 1080, loss: 0.37505367398262024, mean loss: 0.3483156959153599
Epoch: 28, step: 1081, loss: 0.30939576029777527, mean loss: 0.34831475840185555
Epoch: 28, step: 1082, loss: 0.34496381878852844, mean loss: 0.3483146776854973
Epoch: 28, step: 1083, loss: 0.31130295991897583, mean loss: 0.34831378618058917
Epoch: 28, step: 1084, loss: 0.32643193006515503, mean loss: 0.348313259122851
Epoch: 28, step: 1085, loss: 0.3219849467277527, mean loss: 0.34831262498073445
Epoch: 28, step: 1086, loss: 0.28677114844322205, mean loss: 0.34831114273220876
Epoch: 28, step: 1087, loss: 0.3304925858974457, mean loss: 0.3483107135762156
Epoch: 28, step: 1088, loss: 0.33540505170822144, mean loss: 0.34831040275369524
Epoch: 28, step: 1089, loss: 0.33535096049308777, mean loss: 0.34831009064343416
Epoch: 28, step: 1090, loss: 0.32361307740211487, mean loss: 0.348309495864318
Epoch: 28, step: 1091, loss: 0.31034424901008606, mean loss: 0.34830858156784233
Epoch: 28, step: 1092, loss: 0.317889928817749, mean loss: 0.34830784902954615
Epoch: 28, step: 1093, loss: 0.31763598322868347, mean loss: 0.34830711041119133
Epoch: 28, step: 1094, loss: 0.33108770847320557, mean loss: 0.34830669575561934
Epoch: 28, step: 1095, loss: 0.3211980164051056, mean loss: 0.34830604297486056
Epoch: 28, step: 1096, loss: 0.3013114333152771, mean loss: 0.34830491136539105
Epoch: 28, step: 1097, loss: 0.31950804591178894, mean loss: 0.34830421796627103
Epoch: 28, step: 1098, loss: 0.37530988454818726, mean loss: 0.34830486821949347
Epoch: 28, step: 1099, loss: 0.36121445894241333, mean loss: 0.34830517905428887
Epoch: 28, step: 1100, loss: 0.31687214970588684, mean loss: 0.34830442223370406
Epoch: 28, step: 1101, loss: 0.3039506673812866, mean loss: 0.34830335434342496
Epoch: 28, step: 1102, loss: 0.3072690963745117, mean loss: 0.3483023663993304
Epoch: 28, step: 1103, loss: 0.3698333203792572, mean loss: 0.3483028847678295
Epoch: 28, step: 1104, loss: 0.33534082770347595, mean loss: 0.3483025727073277
Epoch: 28, step: 1105, loss: 0.29906725883483887, mean loss: 0.34830138739956434
Epoch: 28, step: 1106, loss: 0.35028019547462463, mean loss: 0.348301435036919
Epoch: 28, step: 1107, loss: 0.32813435792922974, mean loss: 0.34830094955119184
Epoch: 28, step: 1108, loss: 0.3441500961780548, mean loss: 0.3483008496293466
Epoch: 28, step: 1109, loss: 0.32994019985198975, mean loss: 0.3483004076513538
Epoch: 28, step: 1110, loss: 0.3001144528388977, mean loss: 0.3482992477458387
Epoch: 28, step: 1111, loss: 0.35730797052383423, mean loss: 0.34829946459358513
Epoch: 28, step: 1112, loss: 0.29800504446029663, mean loss: 0.3482982539925469
Epoch: 28, step: 1113, loss: 0.35944411158561707, mean loss: 0.3482985222700608
Epoch: 28, step: 1114, loss: 0.35605576634407043, mean loss: 0.34829870898015
Epoch: 28, step: 1115, loss: 0.36286336183547974, mean loss: 0.34829905953018503
Epoch: 28, step: 1116, loss: 0.3355606198310852, mean loss: 0.3482987529418267
Epoch: 28, step: 1117, loss: 0.3299877941608429, mean loss: 0.34829831224486446
Epoch: 28, step: 1118, loss: 0.3456501364707947, mean loss: 0.3482982485117227
Epoch: 28, step: 1119, loss: 0.34073546528816223, mean loss: 0.3482980665040402
Epoch: 28, step: 1120, loss: 0.3427388072013855, mean loss: 0.3482979327168455
Epoch: 28, step: 1121, loss: 0.3104937970638275, mean loss: 0.34829702295760084
Epoch: 28, step: 1122, loss: 0.32466304302215576, mean loss: 0.3482964542178599
Epoch: 28, step: 1123, loss: 0.3121221959590912, mean loss: 0.348295583723629
Epoch: 28, step: 1124, loss: 0.2956131100654602, mean loss: 0.3482943160076327
Epoch: 28, step: 1125, loss: 0.30913954973220825, mean loss: 0.34829337383605863
Epoch: 28, step: 1126, loss: 0.37029534578323364, mean loss: 0.3482939032513946
Epoch: 28, step: 1127, loss: 0.3138117790222168, mean loss: 0.3482930735563939
Epoch: 28, step: 1128, loss: 0.29791316390037537, mean loss: 0.34829186136444334
Epoch: 28, step: 1129, loss: 0.3639966547489166, mean loss: 0.3482922392286795
Epoch: 28, step: 1130, loss: 0.35459691286087036, mean loss: 0.34829239091825037
Epoch: 28, step: 1131, loss: 0.31132835149765015, mean loss: 0.34829150158999944
Epoch: 28, step: 1132, loss: 0.3587457239627838, mean loss: 0.3482917531050331
Epoch: 28, step: 1133, loss: 0.35267019271850586, mean loss: 0.3482918584420781
Epoch: 28, step: 1134, loss: 0.31200411915779114, mean loss: 0.34829098544813375
Epoch: 28, step: 1135, loss: 0.35404008626937866, mean loss: 0.3482911237540619
Epoch: 28, step: 1136, loss: 0.3277166187763214, mean loss: 0.34829062880578365
Epoch: 28, step: 1137, loss: 0.3059706389904022, mean loss: 0.34828961076417153
Epoch: 28, step: 1138, loss: 0.33977338671684265, mean loss: 0.34828940590443647
Epoch: 28, step: 1139, loss: 0.33286362886428833, mean loss: 0.3482890348427353
Epoch: 28, step: 1140, loss: 0.39752545952796936, mean loss: 0.3482902191793164
Epoch: 28, step: 1141, loss: 0.34748905897140503, mean loss: 0.3482901999086134
Epoch: 28, step: 1142, loss: 0.32525599002838135, mean loss: 0.34828964586868844
Epoch: 28, step: 1143, loss: 0.327165424823761, mean loss: 0.3482891377817863
Epoch: 28, step: 1144, loss: 0.3194427490234375, mean loss: 0.3482884439753847
Epoch: 28, step: 1145, loss: 0.3251934349536896, mean loss: 0.3482878885131446
Epoch: 28, step: 1146, loss: 0.33068135380744934, mean loss: 0.34828746506537756
Epoch: 28, step: 1147, loss: 0.32560455799102783, mean loss: 0.3482869195409169
Epoch: 28, step: 1148, loss: 0.3259800374507904, mean loss: 0.3482863830727682
Epoch: 28, step: 1149, loss: 0.3130123019218445, mean loss: 0.34828553477107155
Epoch: 28, step: 1150, loss: 0.3846004605293274, mean loss: 0.3482864080828999
Epoch: 28, step: 1151, loss: 0.37311670184135437, mean loss: 0.34828700519461975
Epoch: 28, step: 1152, loss: 0.343520849943161, mean loss: 0.3482868905822535
Epoch: 28, step: 1153, loss: 0.33557644486427307, mean loss: 0.3482865849398325
Epoch: 28, step: 1154, loss: 0.3506730794906616, mean loss: 0.34828664232542295
Epoch: 28, step: 1155, loss: 0.3448389768600464, mean loss: 0.34828655942493564
Epoch: 28, step: 1156, loss: 0.3158237338066101, mean loss: 0.3482857788621518
Epoch: 28, step: 1157, loss: 0.3191367983818054, mean loss: 0.3482850779970284
Epoch: 28, step: 1158, loss: 0.2852054834365845, mean loss: 0.34828356133249616
Epoch: 28, step: 1159, loss: 0.3340775668621063, mean loss: 0.3482832197765606
Epoch: 28, step: 1160, loss: 0.34970420598983765, mean loss: 0.3482832539406318
Epoch: 28, step: 1161, loss: 0.3382905423641205, mean loss: 0.34828301369656833
Epoch: 28, step: 1162, loss: 0.3780762255191803, mean loss: 0.3482837299656349
Epoch: 28, step: 1163, loss: 0.365697979927063, mean loss: 0.3482841486176678
Epoch: 28, step: 1164, loss: 0.3142288327217102, mean loss: 0.34828332992122585
Epoch: 28, step: 1165, loss: 0.2959003448486328, mean loss: 0.3482820706543122
Epoch: 28, step: 1166, loss: 0.34559816122055054, mean loss: 0.3482820061357076
Epoch: 28, step: 1167, loss: 0.3048996031284332, mean loss: 0.34828096328948144
Epoch: 28, step: 1168, loss: 0.342903196811676, mean loss: 0.3482808340193563
Epoch: 28, step: 1169, loss: 0.3455357849597931, mean loss: 0.34828076803577235
Epoch: 28, step: 1170, loss: 0.3516281843185425, mean loss: 0.34828084849670743
Epoch: 28, step: 1171, loss: 0.33992689847946167, mean loss: 0.34828064769990863
Epoch: 28, step: 1172, loss: 0.32063227891921997, mean loss: 0.3482799831555322
Epoch: 28, step: 1173, loss: 0.32839545607566833, mean loss: 0.3482795052310242
Epoch: 28, step: 1174, loss: 0.33330339193344116, mean loss: 0.3482791452888679
Epoch: 28, step: 1175, loss: 0.3227529227733612, mean loss: 0.34827853179572915
Epoch: 28, step: 1176, loss: 0.34222379326820374, mean loss: 0.3482783862806116
Epoch: 28, step: 1177, loss: 0.3144035041332245, mean loss: 0.34827757217625815
Epoch: 28, step: 1178, loss: 0.374533474445343, mean loss: 0.34827820316090813
Epoch: 28, step: 1179, loss: 0.31903237104415894, mean loss: 0.34827750033883476
Epoch: 28, step: 1180, loss: 0.3469267785549164, mean loss: 0.3482774678797046
Epoch: 28, step: 1181, loss: 0.36307501792907715, mean loss: 0.3482778234703724
Epoch: 28, step: 1182, loss: 0.3728587031364441, mean loss: 0.3482784141439196
Epoch: 28, step: 1183, loss: 0.3639238476753235, mean loss: 0.34827879009147655
Epoch: 28, step: 1184, loss: 0.32500171661376953, mean loss: 0.34827823077500786
Epoch: 28, step: 1185, loss: 0.31405243277549744, mean loss: 0.3482774083953164
Epoch: 28, step: 1186, loss: 0.3236505091190338, mean loss: 0.3482768166728032
Epoch: 28, step: 1187, loss: 0.3068600594997406, mean loss: 0.3482758215561003
Epoch: 28, step: 1188, loss: 0.3730960190296173, mean loss: 0.3482764178944265
Epoch: 28, step: 1189, loss: 0.31447839736938477, mean loss: 0.34827560587144524
Epoch: 28, step: 1190, loss: 0.3041478395462036, mean loss: 0.34827454569398747
Epoch: 28, step: 1191, loss: 0.333089143037796, mean loss: 0.34827418087074474
Epoch: 28, step: 1192, loss: 0.40201395750045776, mean loss: 0.34827547191642955
Epoch: 28, step: 1193, loss: 0.3044964671134949, mean loss: 0.34827442019383303
Epoch: 28, step: 1194, loss: 0.3104127049446106, mean loss: 0.34827351064677825
Epoch: 28, step: 1195, loss: 0.3088824450969696, mean loss: 0.34827256438307236
Epoch: 28, step: 1196, loss: 0.3453315496444702, mean loss: 0.34827249373485264
Epoch: 28, step: 1197, loss: 0.3081631064414978, mean loss: 0.3482715302617012
Epoch: 28, step: 1198, loss: 0.4184127449989319, mean loss: 0.3482732150930706
Epoch: 28, step: 1199, loss: 0.33292222023010254, mean loss: 0.34827284636240996
Epoch: 28, step: 1200, loss: 0.3123226761817932, mean loss: 0.34827198286061617
Epoch: 28, step: 1201, loss: 0.3591924011707306, mean loss: 0.3482722451562954
Epoch: 28, step: 1202, loss: 0.34909501671791077, mean loss: 0.34827226491783164
Epoch: 28, step: 1203, loss: 0.30699726939201355, mean loss: 0.3482712735883205
Epoch: 28, step: 1204, loss: 0.3010508418083191, mean loss: 0.34827013949048014
Epoch: 28, step: 1205, loss: 0.3334985673427582, mean loss: 0.3482697847286725
Epoch: 28, step: 1206, loss: 0.3290458619594574, mean loss: 0.34826932304797004
Epoch: 28, step: 1207, loss: 0.33651819825172424, mean loss: 0.34826904084036203
Epoch: 28, step: 1208, loss: 0.3157256543636322, mean loss: 0.34826825931766864
Epoch: 28, step: 1209, loss: 0.33764326572418213, mean loss: 0.34826800416677306
Epoch: 28, step: 1210, loss: 0.33823341131210327, mean loss: 0.34826776319967523
Epoch: 28, step: 1211, loss: 0.30600282549858093, mean loss: 0.348266748289059
Epoch: 28, step: 1212, loss: 0.3316722810268402, mean loss: 0.348266349814638
Epoch: 28, step: 1213, loss: 0.32423874735832214, mean loss: 0.3482657728660125
Epoch: 28, step: 1214, loss: 0.30660444498062134, mean loss: 0.3482647725219809
Epoch: 28, step: 1215, loss: 0.33792904019355774, mean loss: 0.3482645243532254
Epoch: 28, step: 1216, loss: 0.31609705090522766, mean loss: 0.3482637520063876
Epoch: 28, step: 1217, loss: 0.3504756987094879, mean loss: 0.3482638051143517
Epoch: 28, step: 1218, loss: 0.31967514753341675, mean loss: 0.34826311872848864
Epoch: 28, step: 1219, loss: 0.3158499002456665, mean loss: 0.34826234053732175
Epoch: 28, step: 1220, loss: 0.34303686022758484, mean loss: 0.34826221508464583
Epoch: 28, step: 1221, loss: 0.3336561322212219, mean loss: 0.3482618644320587
Epoch: 28, step: 1222, loss: 0.33771219849586487, mean loss: 0.3482616111691626
Epoch: 28, step: 1223, loss: 0.3229357600212097, mean loss: 0.34826100319309317
Epoch: 28, step: 1224, loss: 0.36441996693611145, mean loss: 0.34826139109821697
Epoch: 28, step: 1225, loss: 0.2882962226867676, mean loss: 0.3482599516347667
Epoch: 28, step: 1226, loss: 0.36155062913894653, mean loss: 0.34826027066972925
Epoch: 28, step: 1227, loss: 0.3322831094264984, mean loss: 0.3482598871564973
Epoch: 28, step: 1228, loss: 0.31308457255363464, mean loss: 0.348259042834119
Epoch: 28, step: 1229, loss: 0.3114432096481323, mean loss: 0.3482581591551505
Epoch: 28, step: 1230, loss: 0.34819495677948, mean loss: 0.34825815763816
Epoch: 28, step: 1231, loss: 0.338157057762146, mean loss: 0.34825791519624666
Epoch: 28, step: 1232, loss: 0.3478740155696869, mean loss: 0.34825790598228706
Epoch: 28, step: 1233, loss: 0.37470412254333496, mean loss: 0.34825854070164003
Epoch: 28, step: 1234, loss: 0.33270323276519775, mean loss: 0.34825816737723614
Epoch: 28, step: 1235, loss: 0.3136516213417053, mean loss: 0.3482573368467083
Epoch: 28, step: 1236, loss: 0.3558359444141388, mean loss: 0.34825751872310484
Epoch: 28, step: 1237, loss: 0.36666610836982727, mean loss: 0.3482579604939147
Epoch: 28, step: 1238, loss: 0.28059670329093933, mean loss: 0.34825633679260676
Epoch: 28, step: 1239, loss: 0.31767138838768005, mean loss: 0.34825560284779
Epoch: 28, step: 1240, loss: 0.3517763316631317, mean loss: 0.3482556873324399
Epoch: 28, step: 1241, loss: 0.32754430174827576, mean loss: 0.34825519034665536
Epoch: 28, step: 1242, loss: 0.37477007508277893, mean loss: 0.34825582657664306
Epoch: 28, step: 1243, loss: 0.3357466161251068, mean loss: 0.3482555264228267
Epoch: 28, step: 1244, loss: 0.32217657566070557, mean loss: 0.3482549006831918
Epoch: 28, step: 1245, loss: 0.33193424344062805, mean loss: 0.3482545090939303
Epoch: 28, step: 1246, loss: 0.31311503052711487, mean loss: 0.34825366599600166
Epoch: 28, step: 1247, loss: 0.34755632281303406, mean loss: 0.34825364926511915
Epoch: 28, step: 1248, loss: 0.32846561074256897, mean loss: 0.34825317451550847
Epoch: 28, step: 1249, loss: 0.3616079092025757, mean loss: 0.3482534949112353
Epoch: 28, step: 1250, loss: 0.30108124017715454, mean loss: 0.3482523632207444
Epoch: 28, step: 1251, loss: 0.32794615626335144, mean loss: 0.34825187607443026
Epoch: 28, step: 1252, loss: 0.33405250310897827, mean loss: 0.3482515354393585
Epoch: 28, step: 1253, loss: 0.3327760398387909, mean loss: 0.3482511641997193
Epoch: 28, step: 1254, loss: 0.41151830554008484, mean loss: 0.34825268187048813
Epoch: 28, step: 1255, loss: 0.3313283324241638, mean loss: 0.3482522758939614
Epoch: 28, step: 1256, loss: 0.3234754204750061, mean loss: 0.3482516815679901
Epoch: 28, step: 1257, loss: 0.3389977514743805, mean loss: 0.34825145959797105
Epoch: 28, step: 1258, loss: 0.33732137084007263, mean loss: 0.34825119742894756
Epoch: 28, step: 1259, loss: 0.36538106203079224, mean loss: 0.3482516082958909
Epoch: 28, step: 1260, loss: 0.3300592601299286, mean loss: 0.3482511719553022
Epoch: 28, step: 1261, loss: 0.3165481388568878, mean loss: 0.34825041158131315
Epoch: 28, step: 1262, loss: 0.3214798867702484, mean loss: 0.3482497695253158
Epoch: 28, step: 1263, loss: 0.3101973831653595, mean loss: 0.34824885691052393
Epoch: 28, step: 1264, loss: 0.3369132876396179, mean loss: 0.3482485850547724
Epoch: 28, step: 1265, loss: 0.34001874923706055, mean loss: 0.34824838768713323
Epoch: 28, step: 1266, loss: 0.3296073377132416, mean loss: 0.3482479406488356
Epoch: 28, step: 1267, loss: 0.3146877586841583, mean loss: 0.34824713584830885
Epoch: 28, step: 1268, loss: 0.32541424036026, mean loss: 0.3482465883099887
Epoch: 28, step: 1269, loss: 0.3343445360660553, mean loss: 0.3482462549434297
Epoch: 28, step: 1270, loss: 0.3198767304420471, mean loss: 0.3482455746680418
Epoch: 28, step: 1271, loss: 0.34445706009864807, mean loss: 0.3482454838250874
Epoch: 28, step: 1272, loss: 0.3200480043888092, mean loss: 0.348244807707609
Epoch: 28, step: 1273, loss: 0.32324427366256714, mean loss: 0.3482442082606698
Epoch: 28, step: 1274, loss: 0.36677610874176025, mean loss: 0.3482446525961646
Epoch: 28, step: 1275, loss: 0.3002411723136902, mean loss: 0.34824350165437207
Epoch: 28, step: 1276, loss: 0.3156565725803375, mean loss: 0.3482427203618675
Epoch: 28, step: 1277, loss: 0.321760356426239, mean loss: 0.3482420854454461
Epoch: 28, step: 1278, loss: 0.3559894561767578, mean loss: 0.34824227118471707
Epoch: 28, step: 1279, loss: 0.34882912039756775, mean loss: 0.34824228525379103
Epoch: 28, step: 1280, loss: 0.3485817015171051, mean loss: 0.3482422933907331
Epoch: 28, step: 1281, loss: 0.33659911155700684, mean loss: 0.3482420142714486
Epoch: 28, step: 1282, loss: 0.30664634704589844, mean loss: 0.3482410171321168
Epoch: 28, step: 1283, loss: 0.3474334180355072, mean loss: 0.3482409977726601
Epoch: 28, step: 1284, loss: 0.35712921619415283, mean loss: 0.3482412108325259
Epoch: 28, step: 1285, loss: 0.32198238372802734, mean loss: 0.348240581396141
Epoch: 28, step: 1286, loss: 0.2957373857498169, mean loss: 0.3482393229001165
Epoch: 28, step: 1287, loss: 0.399396151304245, mean loss: 0.34824054909446944
Epoch: 28, step: 1288, loss: 0.32648035883903503, mean loss: 0.34824002753002337
Epoch: 28, step: 1289, loss: 0.3311159312725067, mean loss: 0.34823961709676854
Epoch: 28, step: 1290, loss: 0.3257664442062378, mean loss: 0.3482390784688441
Epoch: 28, step: 1291, loss: 0.35094743967056274, mean loss: 0.34823914338019496
Epoch: 28, step: 1292, loss: 0.351389616727829, mean loss: 0.3482392188858474
Epoch: 28, step: 1293, loss: 0.3307133913040161, mean loss: 0.3482387988640964
Epoch: 28, step: 1294, loss: 0.31506291031837463, mean loss: 0.3482380037940328
Epoch: 28, step: 1295, loss: 0.33606141805648804, mean loss: 0.34823771198551723
Epoch: 28, step: 1296, loss: 0.3401277959346771, mean loss: 0.3482375176382755
Epoch: 28, step: 1297, loss: 0.34695249795913696, mean loss: 0.34823748684460953
Epoch: 28, step: 1298, loss: 0.3191864490509033, mean loss: 0.34823679069455815
Epoch: 28, step: 1299, loss: 0.34318187832832336, mean loss: 0.34823666956659
Epoch: 28, step: 1300, loss: 0.323691189289093, mean loss: 0.3482360814114064
Epoch: 28, step: 1301, loss: 0.3053615391254425, mean loss: 0.34823505408255495
Epoch: 28, step: 1302, loss: 0.374541312456131, mean loss: 0.3482356843990369
Epoch: 28, step: 1303, loss: 0.29948386549949646, mean loss: 0.3482345162991016
Epoch: 28, step: 1304, loss: 0.32657864689826965, mean loss: 0.3482339974340802
Epoch: 28, step: 1305, loss: 0.3266541063785553, mean loss: 0.34823348040185403
Epoch: 28, step: 1306, loss: 0.3185163140296936, mean loss: 0.34823276842585144
Epoch: 28, step: 1307, loss: 0.3172377645969391, mean loss: 0.3482320258526883
Epoch: 28, step: 1308, loss: 0.30704692006111145, mean loss: 0.34823103917039055
Epoch: 28, step: 1309, loss: 0.3531356751918793, mean loss: 0.34823115666921717
Epoch: 28, step: 1310, loss: 0.3135986030101776, mean loss: 0.34823032700786893
Epoch: 28, step: 1311, loss: 0.3740605413913727, mean loss: 0.3482309457845646
Epoch: 28, step: 1312, loss: 0.33602309226989746, mean loss: 0.348230653345865
Epoch: 28, step: 1313, loss: 0.31506356596946716, mean loss: 0.34822985884849095
Epoch: 28, step: 1314, loss: 0.3300818204879761, mean loss: 0.3482294241337004
Epoch: 28, step: 1315, loss: 0.32962632179260254, mean loss: 0.3482289785290645
Epoch: 28, step: 1316, loss: 0.34051579236984253, mean loss: 0.3482287937776654
Epoch: 28, step: 1317, loss: 0.29586416482925415, mean loss: 0.34822753953505586
Epoch: 28, step: 1318, loss: 0.3235412836074829, mean loss: 0.34822694826165096
Epoch: 28, step: 1319, loss: 0.33735930919647217, mean loss: 0.34822668797138784
Epoch: 28, step: 1320, loss: 0.3167240619659424, mean loss: 0.34822593347168707
Epoch: 28, step: 1321, loss: 0.308335542678833, mean loss: 0.3482249781047571
Epoch: 28, step: 1322, loss: 0.37841853499412537, mean loss: 0.34822570121712426
Epoch: 28, step: 1323, loss: 0.3543858230113983, mean loss: 0.34822584874375023
Epoch: 28, step: 1324, loss: 0.3503396809101105, mean loss: 0.34822589936597326
Epoch: 28, step: 1325, loss: 0.3141822814941406, mean loss: 0.3482250841061938
Epoch: 28, step: 1326, loss: 0.3931673467159271, mean loss: 0.34822616033557213
Epoch: 28, step: 1327, loss: 0.33617788553237915, mean loss: 0.3482258718232445
Epoch: 28, step: 1328, loss: 0.3335057497024536, mean loss: 0.3482255193383394
Epoch: 28, step: 1329, loss: 0.3177621066570282, mean loss: 0.3482247898854233
Epoch: 28, step: 1330, loss: 0.3155326545238495, mean loss: 0.3482240070840115
Epoch: 28, step: 1331, loss: 0.3199006915092468, mean loss: 0.34822332890865537
Epoch: 28, step: 1332, loss: 0.32724717259407043, mean loss: 0.34822282666619603
Epoch: 28, step: 1333, loss: 0.3106060326099396, mean loss: 0.34822192601030233
Epoch: 28, step: 1334, loss: 0.3404295742511749, mean loss: 0.3482217394431139
Epoch: 28, step: 1335, loss: 0.331058531999588, mean loss: 0.34822132852548693
Epoch: 28, step: 1336, loss: 0.34207668900489807, mean loss: 0.34822118141544073
Epoch: 28, step: 1337, loss: 0.3506801128387451, mean loss: 0.34822124028380136
Epoch: 28, step: 1338, loss: 0.31106650829315186, mean loss: 0.34822035079750724
Epoch: 28, step: 1339, loss: 0.33041661977767944, mean loss: 0.3482199245854269
Epoch: 28, step: 1340, loss: 0.33992433547973633, mean loss: 0.34821972599808326
Epoch: 28, step: 1341, loss: 0.3345867097377777, mean loss: 0.348219399646375
Epoch: 28, step: 1342, loss: 0.31847044825553894, mean loss: 0.34821868752306223
Epoch: 28, step: 1343, loss: 0.35752958059310913, mean loss: 0.3482189103996677
Epoch: 28, step: 1344, loss: 0.2898241877555847, mean loss: 0.34821751262762457
Epoch: 28, step: 1345, loss: 0.3492470383644104, mean loss: 0.3482175372703968
Epoch: 28, step: 1346, loss: 0.37046757340431213, mean loss: 0.34821806983546855
Epoch: 28, step: 1347, loss: 0.3362599313259125, mean loss: 0.3482177836186541
Epoch: 28, step: 1348, loss: 0.3203609585762024, mean loss: 0.3482171168843719
Epoch: 28, step: 1349, loss: 0.33082908391952515, mean loss: 0.348216700723514
Epoch: 28, step: 1350, loss: 0.35370758175849915, mean loss: 0.3482168321377503
Epoch: 28, step: 1351, loss: 0.3359919488430023, mean loss: 0.34821653956443765
Epoch: 28, step: 1352, loss: 0.30714017152786255, mean loss: 0.3482155565234412
Epoch: 28, step: 1353, loss: 0.3642124533653259, mean loss: 0.34821593935254286
Epoch: 28, step: 1354, loss: 0.3241107761859894, mean loss: 0.3482153624945926
Epoch: 28, step: 1355, loss: 0.36054566502571106, mean loss: 0.3482156575626153
Epoch: 28, step: 1356, loss: 0.34526166319847107, mean loss: 0.3482155868742915
Epoch: 28, step: 1357, loss: 0.33443763852119446, mean loss: 0.3482152571794278
Epoch: 28, step: 1358, loss: 0.34616562724113464, mean loss: 0.3482152081346589
Epoch: 28, step: 1359, loss: 0.29685065150260925, mean loss: 0.34821397908228924
Epoch: 28, step: 1360, loss: 0.33006247878074646, mean loss: 0.34821354476313765
Epoch: 28, step: 1361, loss: 0.3202660381793976, mean loss: 0.3482128760665165
Epoch: 28, step: 1362, loss: 0.3399423062801361, mean loss: 0.34821267818232493
Epoch: 28, step: 1363, loss: 0.3052631616592407, mean loss: 0.3482116505835948
Epoch: 28, step: 1364, loss: 0.32490259408950806, mean loss: 0.34821109291063995
Epoch: 28, step: 1365, loss: 0.33645981550216675, mean loss: 0.3482108117661496
Epoch: 28, step: 1366, loss: 0.3557233512401581, mean loss: 0.3482109914962741
Epoch: 28, step: 1367, loss: 0.3409353196620941, mean loss: 0.34821081743713933
Epoch: 28, step: 1368, loss: 0.34867995977401733, mean loss: 0.34821082866037173
Epoch: 28, step: 1369, loss: 0.3379386067390442, mean loss: 0.34821058292519347
Epoch: 28, step: 1370, loss: 0.3179543614387512, mean loss: 0.3482098591440896
Epoch: 28, step: 1371, loss: 0.35933154821395874, mean loss: 0.34821012518774735
Epoch: 28, step: 1372, loss: 0.3115202784538269, mean loss: 0.348209247545199
Epoch: 28, step: 1373, loss: 0.33288753032684326, mean loss: 0.3482088810495472
Epoch: 28, step: 1374, loss: 0.3003527820110321, mean loss: 0.3482077363584898
Epoch: 28, step: 1375, loss: 0.33980444073677063, mean loss: 0.34820753536117777
Epoch: 28, step: 1376, loss: 0.31997624039649963, mean loss: 0.34820686011673363
Epoch: 28, step: 1377, loss: 0.36957257986068726, mean loss: 0.34820737113610084
Epoch: 28, step: 1378, loss: 0.3152995705604553, mean loss: 0.3482065840752658
Epoch: 28, step: 1379, loss: 0.3399171531200409, mean loss: 0.3482063858204357
Epoch: 28, step: 1380, loss: 0.3380604684352875, mean loss: 0.34820614317060467
Epoch: 28, step: 1381, loss: 0.31172648072242737, mean loss: 0.34820527074360774
Epoch: 28, step: 1382, loss: 0.3176722228527069, mean loss: 0.3482045405499478
Epoch: 28, step: 1383, loss: 0.29100850224494934, mean loss: 0.34820317274723345
Epoch: 28, step: 1384, loss: 0.3176118731498718, mean loss: 0.3482024411954818
Epoch: 28, step: 1385, loss: 0.3429889380931854, mean loss: 0.3482023165242134
Epoch: 28, step: 1386, loss: 0.3656834363937378, mean loss: 0.34820273454281425
Epoch: 28, step: 1387, loss: 0.34120380878448486, mean loss: 0.34820256718447473
Epoch: 28, step: 1388, loss: 0.34201428294181824, mean loss: 0.3482024192137365
Epoch: 28, step: 1389, loss: 0.3584161102771759, mean loss: 0.34820266343187684
Epoch: 28, step: 1390, loss: 0.30641746520996094, mean loss: 0.34820166433572824
Epoch: 28, step: 1391, loss: 0.34704482555389404, mean loss: 0.3482016366760405
Epoch: 28, step: 1392, loss: 0.3444439172744751, mean loss: 0.3482015468321815
Epoch: 28, step: 1393, loss: 0.33388546109199524, mean loss: 0.3482012045549917
Epoch: 28, step: 1394, loss: 0.3063296377658844, mean loss: 0.3482002034894888
Epoch: 28, step: 1395, loss: 0.3318790793418884, mean loss: 0.34819981329334876
Epoch: 28, step: 1396, loss: 0.3249827027320862, mean loss: 0.348199258245163
Epoch: 28, step: 1397, loss: 0.3245934545993805, mean loss: 0.34819869391803787
Epoch: 28, step: 1398, loss: 0.3396759629249573, mean loss: 0.3481984901760524
Epoch: 28, step: 1399, loss: 0.31841447949409485, mean loss: 0.34819777818497666
Epoch: 28, step: 1400, loss: 0.33674558997154236, mean loss: 0.3481975044253081
Epoch: 28, step: 1401, loss: 0.317851722240448, mean loss: 0.3481967790396843
Epoch: 28, step: 1402, loss: 0.3290805518627167, mean loss: 0.34819632209628343
Epoch: 28, step: 1403, loss: 0.36554646492004395, mean loss: 0.3481967368142972
Epoch: 28, step: 1404, loss: 0.29648882150650024, mean loss: 0.34819550087684215
Epoch: 28, step: 1405, loss: 0.3346208333969116, mean loss: 0.3481951764189933
Epoch: 28, step: 1406, loss: 0.3198288083076477, mean loss: 0.34819449843031974
Epoch: 28, step: 1407, loss: 0.3473770022392273, mean loss: 0.34819447889169186
Epoch: 28, step: 1408, loss: 0.3487853705883026, mean loss: 0.34819449301400485
Epoch: 28, step: 1409, loss: 0.3327890634536743, mean loss: 0.34819412483300105
Epoch: 28, step: 1410, loss: 0.4027993977069855, mean loss: 0.34819542983677404
Epoch: 28, step: 1411, loss: 0.3122880160808563, mean loss: 0.3481945717110271
Epoch: 28, step: 1412, loss: 0.3594416379928589, mean loss: 0.3481948404902428
Epoch: 28, step: 1413, loss: 0.4376172721385956, mean loss: 0.3481969774312084
Epoch: 28, step: 1414, loss: 0.32905063033103943, mean loss: 0.3481965198990771
Epoch: 28, step: 1415, loss: 0.2966209650039673, mean loss: 0.34819528744938066
Epoch: 28, step: 1416, loss: 0.30596718192100525, mean loss: 0.34819427839048966
Epoch: 28, step: 1417, loss: 0.3218535780906677, mean loss: 0.3481936489830751
Epoch: 28, step: 1418, loss: 0.29702672362327576, mean loss: 0.3481924263856375
Epoch: 28, step: 1419, loss: 0.29339680075645447, mean loss: 0.3481911171142615
Epoch: 28, step: 1420, loss: 0.33760198950767517, mean loss: 0.34819086410664896
Epoch: 28, step: 1421, loss: 0.3356906473636627, mean loss: 0.3481905654442333
Epoch: 28, step: 1422, loss: 0.32919660210609436, mean loss: 0.34819011164030694
Epoch: 28, step: 1423, loss: 0.308716356754303, mean loss: 0.34818916855556675
Epoch: 28, step: 1424, loss: 0.34872645139694214, mean loss: 0.3481891813917194
Epoch: 28, step: 1425, loss: 0.3115213215351105, mean loss: 0.34818830538570245
Epoch: 28, step: 1426, loss: 0.3030603229999542, mean loss: 0.34818722729061213
Epoch: 28, step: 1427, loss: 0.3540600836277008, mean loss: 0.34818736758818347
Epoch: 28, step: 1428, loss: 0.3446184992790222, mean loss: 0.34818728233297436
Epoch: 28, step: 1429, loss: 0.3668980598449707, mean loss: 0.34818772929627073
Epoch: 28, step: 1430, loss: 0.28446707129478455, mean loss: 0.34818620717272486
Epoch: 28, step: 1431, loss: 0.3326684534549713, mean loss: 0.3481858365021316
Epoch: 28, step: 1432, loss: 0.34124189615249634, mean loss: 0.34818567063708084
Epoch: 28, step: 1433, loss: 0.3343941271305084, mean loss: 0.3481853412159872
Epoch: 28, step: 1434, loss: 0.31769251823425293, mean loss: 0.3481846128900269
Epoch: 28, step: 1435, loss: 0.3277736008167267, mean loss: 0.34818412538137894
Epoch: 28, step: 1436, loss: 0.32293060421943665, mean loss: 0.3481835222257946
Epoch: 28, step: 1437, loss: 0.3144681453704834, mean loss: 0.3481827169863187
Epoch: 28, step: 1438, loss: 0.352760910987854, mean loss: 0.34818282632676917
Epoch: 28, step: 1439, loss: 0.3386436700820923, mean loss: 0.3481825985097018
Epoch: 28, step: 1440, loss: 0.35126325488090515, mean loss: 0.348182672081129
Epoch: 28, step: 1441, loss: 0.33481815457344055, mean loss: 0.34818235292085037
Epoch: 28, step: 1442, loss: 0.2908138632774353, mean loss: 0.34818098292706784
Epoch: 28, step: 1443, loss: 0.3339092433452606, mean loss: 0.3481806421175449
Valid: 28, mean loss: 0.18641765664021173
Epoch: 29, step: 0, loss: 0.3386586308479309, mean loss: 0.34818041473709094
Epoch: 29, step: 1, loss: 0.3075547516345978, mean loss: 0.3481794446415013
Epoch: 29, step: 2, loss: 0.3416973352432251, mean loss: 0.3481792898596441
Epoch: 29, step: 3, loss: 0.33913320302963257, mean loss: 0.348179073859481
Epoch: 29, step: 4, loss: 0.36259469389915466, mean loss: 0.34817941806377506
Epoch: 29, step: 5, loss: 0.3191394507884979, mean loss: 0.3481787246879268
Epoch: 29, step: 6, loss: 0.3350387215614319, mean loss: 0.34817841095674407
Epoch: 29, step: 7, loss: 0.30871063470840454, mean loss: 0.34817746864521104
Epoch: 29, step: 8, loss: 0.30688193440437317, mean loss: 0.3481764827186445
Epoch: 29, step: 9, loss: 0.3572884500026703, mean loss: 0.34817670026071784
Epoch: 29, step: 10, loss: 0.31107497215270996, mean loss: 0.3481758145031294
Epoch: 29, step: 11, loss: 0.369771808385849, mean loss: 0.3481763300683004
Epoch: 29, step: 12, loss: 0.3247123956680298, mean loss: 0.34817576992281113
Epoch: 29, step: 13, loss: 0.36641019582748413, mean loss: 0.34817620521586207
Epoch: 29, step: 14, loss: 0.34665200114250183, mean loss: 0.34817616883086117
Epoch: 29, step: 15, loss: 0.33033499121665955, mean loss: 0.3481757429457849
Epoch: 29, step: 16, loss: 0.34170088171958923, mean loss: 0.34817558838866974
Epoch: 29, step: 17, loss: 0.3529256582260132, mean loss: 0.34817570177172785
Epoch: 29, step: 18, loss: 0.36127153038978577, mean loss: 0.34817601435863843
Epoch: 29, step: 19, loss: 0.34277400374412537, mean loss: 0.3481758854200616
Epoch: 29, step: 20, loss: 0.31625571846961975, mean loss: 0.3481751235476853
Epoch: 29, step: 21, loss: 0.34953227639198303, mean loss: 0.34817515593951415
Epoch: 29, step: 22, loss: 0.3474613428115845, mean loss: 0.34817513890299473
Epoch: 29, step: 23, loss: 0.3396819531917572, mean loss: 0.3481749362016651
Epoch: 29, step: 24, loss: 0.3285527527332306, mean loss: 0.34817446790297374
Epoch: 29, step: 25, loss: 0.3325920104980469, mean loss: 0.3481740960243664
Epoch: 29, step: 26, loss: 0.31508299708366394, mean loss: 0.3481733063172108
Epoch: 29, step: 27, loss: 0.3007434010505676, mean loss: 0.34817217444661924
Epoch: 29, step: 28, loss: 0.3266911804676056, mean loss: 0.3481716618349028
Epoch: 29, step: 29, loss: 0.3226242959499359, mean loss: 0.3481710521998652
Epoch: 29, step: 30, loss: 0.3257676959037781, mean loss: 0.3481705176028696
Epoch: 29, step: 31, loss: 0.37142065167427063, mean loss: 0.34817107239274436
Epoch: 29, step: 32, loss: 0.37959739565849304, mean loss: 0.3481718222632558
Epoch: 29, step: 33, loss: 0.3648889660835266, mean loss: 0.34817222114523677
Epoch: 29, step: 34, loss: 0.28980690240859985, mean loss: 0.3481708285438019
Epoch: 29, step: 35, loss: 0.322834849357605, mean loss: 0.348170224039622
Epoch: 29, step: 36, loss: 0.3363359570503235, mean loss: 0.348169941686486
Epoch: 29, step: 37, loss: 0.3296012580394745, mean loss: 0.3481694986678372
Epoch: 29, step: 38, loss: 0.29930004477500916, mean loss: 0.3481683327498152
Epoch: 29, step: 39, loss: 0.3025057911872864, mean loss: 0.34816724336768035
Epoch: 29, step: 40, loss: 0.34415993094444275, mean loss: 0.3481671477665538
Epoch: 29, step: 41, loss: 0.299892395734787, mean loss: 0.3481659961192416
Epoch: 29, step: 42, loss: 0.30872929096221924, mean loss: 0.3481650553357029
Epoch: 29, step: 43, loss: 0.3863338530063629, mean loss: 0.3481659658509145
Epoch: 29, step: 44, loss: 0.34780651330947876, mean loss: 0.34816595727639243
Epoch: 29, step: 45, loss: 0.2974962890148163, mean loss: 0.34816474861105534
Epoch: 29, step: 46, loss: 0.3221755027770996, mean loss: 0.348164128682953
Epoch: 29, step: 47, loss: 0.333355575799942, mean loss: 0.34816377545919375
Epoch: 29, step: 48, loss: 0.3404679000377655, mean loss: 0.3481635918962737
Epoch: 29, step: 49, loss: 0.3720654845237732, mean loss: 0.3481641619934122
Epoch: 29, step: 50, loss: 0.3330715000629425, mean loss: 0.3481638020186482
Epoch: 29, step: 51, loss: 0.3885617256164551, mean loss: 0.34816476552569836
Epoch: 29, step: 52, loss: 0.3678610920906067, mean loss: 0.34816523527996307
Epoch: 29, step: 53, loss: 0.3676004409790039, mean loss: 0.34816569879548176
Epoch: 29, step: 54, loss: 0.34800124168395996, mean loss: 0.34816569487339283
Epoch: 29, step: 55, loss: 0.3385944664478302, mean loss: 0.3481654666174445
Epoch: 29, step: 56, loss: 0.3396831750869751, mean loss: 0.3481652643354344
Epoch: 29, step: 57, loss: 0.33430418372154236, mean loss: 0.34816493379027735
Epoch: 29, step: 58, loss: 0.3515763282775879, mean loss: 0.34816501513985376
Epoch: 29, step: 59, loss: 0.32327738404273987, mean loss: 0.348164421672878
Epoch: 29, step: 60, loss: 0.2965314984321594, mean loss: 0.34816319047075955
Epoch: 29, step: 61, loss: 0.3367728292942047, mean loss: 0.34816291887075057
Epoch: 29, step: 62, loss: 0.31037911772727966, mean loss: 0.34816201794795454
Epoch: 29, step: 63, loss: 0.3349774181842804, mean loss: 0.3481617035798152
Epoch: 29, step: 64, loss: 0.3449943959712982, mean loss: 0.3481616280616442
Epoch: 29, step: 65, loss: 0.3417325019836426, mean loss: 0.34816147477553294
Epoch: 29, step: 66, loss: 0.35638704895973206, mean loss: 0.3481616708886909
Epoch: 29, step: 67, loss: 0.31491807103157043, mean loss: 0.3481608783176472
Epoch: 29, step: 68, loss: 0.3378795385360718, mean loss: 0.3481606332028592
Epoch: 29, step: 69, loss: 0.337956041097641, mean loss: 0.3481603899235929
Epoch: 29, step: 70, loss: 0.3035019636154175, mean loss: 0.348159325284255
Epoch: 29, step: 71, loss: 0.35289856791496277, mean loss: 0.34815943826324397
Epoch: 29, step: 72, loss: 0.34200677275657654, mean loss: 0.34815929159310866
Epoch: 29, step: 73, loss: 0.3321109116077423, mean loss: 0.3481589090333951
Epoch: 29, step: 74, loss: 0.3471442461013794, mean loss: 0.34815888484653584
Epoch: 29, step: 75, loss: 0.34522444009780884, mean loss: 0.3481588148988635
Epoch: 29, step: 76, loss: 0.3195768892765045, mean loss: 0.34815813361443515
Epoch: 29, step: 77, loss: 0.3126658499240875, mean loss: 0.34815728763351106
Epoch: 29, step: 78, loss: 0.34894508123397827, mean loss: 0.34815730641061987
Epoch: 29, step: 79, loss: 0.3424496054649353, mean loss: 0.34815717037046007
Epoch: 29, step: 80, loss: 0.30034416913986206, mean loss: 0.34815603079896473
Epoch: 29, step: 81, loss: 0.32880112528800964, mean loss: 0.34815556950658877
Epoch: 29, step: 82, loss: 0.3393886685371399, mean loss: 0.34815536056688645
Epoch: 29, step: 83, loss: 0.346979022026062, mean loss: 0.34815533253212616
Epoch: 29, step: 84, loss: 0.289885550737381, mean loss: 0.3481539438668943
Epoch: 29, step: 85, loss: 0.2976967692375183, mean loss: 0.34815274141766334
Epoch: 29, step: 86, loss: 0.3028949499130249, mean loss: 0.3481516629010772
Epoch: 29, step: 87, loss: 0.3292110860347748, mean loss: 0.3481512115480873
Epoch: 29, step: 88, loss: 0.32767239212989807, mean loss: 0.3481507235504841
Epoch: 29, step: 89, loss: 0.32724031805992126, mean loss: 0.34815022528032513
Epoch: 29, step: 90, loss: 0.36166587471961975, mean loss: 0.34815054733454487
Epoch: 29, step: 91, loss: 0.3058409094810486, mean loss: 0.348149539194108
Epoch: 29, step: 92, loss: 0.3474249243736267, mean loss: 0.34814952192863063
Epoch: 29, step: 93, loss: 0.3851759731769562, mean loss: 0.3481504041409549
Epoch: 29, step: 94, loss: 0.4239843189716339, mean loss: 0.3481522109579197
Epoch: 29, step: 95, loss: 0.3505949079990387, mean loss: 0.3481522691561719
Epoch: 29, step: 96, loss: 0.36072176694869995, mean loss: 0.3481525686224429
Epoch: 29, step: 97, loss: 0.3056173622608185, mean loss: 0.34815155525210983
Epoch: 29, step: 98, loss: 0.3713828921318054, mean loss: 0.3481521087086168
Epoch: 29, step: 99, loss: 0.4038686156272888, mean loss: 0.348153436050596
Epoch: 29, step: 100, loss: 0.35632631182670593, mean loss: 0.34815363074949723
Epoch: 29, step: 101, loss: 0.31947946548461914, mean loss: 0.34815294767347493
Epoch: 29, step: 102, loss: 0.31287628412246704, mean loss: 0.3481521073327438
Epoch: 29, step: 103, loss: 0.32908421754837036, mean loss: 0.34815165311907575
Epoch: 29, step: 104, loss: 0.33536428213119507, mean loss: 0.34815134852006696
Epoch: 29, step: 105, loss: 0.3390985429286957, mean loss: 0.34815113288466154
Epoch: 29, step: 106, loss: 0.3174284100532532, mean loss: 0.34815040109506024
Epoch: 29, step: 107, loss: 0.31188568472862244, mean loss: 0.34814953732037546
Epoch: 29, step: 108, loss: 0.3140018880367279, mean loss: 0.3481487239906319
Epoch: 29, step: 109, loss: 0.3313579559326172, mean loss: 0.34814832407713553
Epoch: 29, step: 110, loss: 0.33700093626976013, mean loss: 0.3481480585809627
Epoch: 29, step: 111, loss: 0.3156442940235138, mean loss: 0.3481472844606293
Epoch: 29, step: 112, loss: 0.29950663447380066, mean loss: 0.3481461260465212
Epoch: 29, step: 113, loss: 0.37618979811668396, mean loss: 0.34814679391201464
Epoch: 29, step: 114, loss: 0.34874433279037476, mean loss: 0.34814680814218013
Epoch: 29, step: 115, loss: 0.32950475811958313, mean loss: 0.3481463641992857
Epoch: 29, step: 116, loss: 0.2914299964904785, mean loss: 0.34814501358447586
Epoch: 29, step: 117, loss: 0.32166463136672974, mean loss: 0.3481443830091028
Epoch: 29, step: 118, loss: 0.32876214385032654, mean loss: 0.3481439214722732
Epoch: 29, step: 119, loss: 0.3517429828643799, mean loss: 0.348144007172373
Epoch: 29, step: 120, loss: 0.3318786025047302, mean loss: 0.34814361987316905
Epoch: 29, step: 121, loss: 0.3323878049850464, mean loss: 0.34814324471685476
Epoch: 29, step: 122, loss: 0.3120788037776947, mean loss: 0.34814238601924435
Epoch: 29, step: 123, loss: 0.3311249315738678, mean loss: 0.34814198084175757
Epoch: 29, step: 124, loss: 0.30553582310676575, mean loss: 0.3481409664335831
Epoch: 29, step: 125, loss: 0.3297077715396881, mean loss: 0.3481405275688887
Epoch: 29, step: 126, loss: 0.3071657419204712, mean loss: 0.3481395520484342
Epoch: 29, step: 127, loss: 0.34389039874076843, mean loss: 0.3481394508877517
Epoch: 29, step: 128, loss: 0.33601340651512146, mean loss: 0.3481391622067763
Epoch: 29, step: 129, loss: 0.31392496824264526, mean loss: 0.3481383476994687
Epoch: 29, step: 130, loss: 0.34319013357162476, mean loss: 0.3481382299044791
Epoch: 29, step: 131, loss: 0.3420774042606354, mean loss: 0.34813808562658816
Epoch: 29, step: 132, loss: 0.33092227578163147, mean loss: 0.3481376758141707
Epoch: 29, step: 133, loss: 0.33895912766456604, mean loss: 0.3481374573293302
Epoch: 29, step: 134, loss: 0.34856611490249634, mean loss: 0.34813746753279057
Epoch: 29, step: 135, loss: 0.33137187361717224, mean loss: 0.3481370684660021
Epoch: 29, step: 136, loss: 0.3076806366443634, mean loss: 0.34813610551568147
Epoch: 29, step: 137, loss: 0.3178185522556305, mean loss: 0.3481353839097106
Epoch: 29, step: 138, loss: 0.34754616022109985, mean loss: 0.3481353698855838
Epoch: 29, step: 139, loss: 0.31756114959716797, mean loss: 0.3481346422051695
Epoch: 29, step: 140, loss: 0.3516441881656647, mean loss: 0.3481347257319791
Epoch: 29, step: 141, loss: 0.32356899976730347, mean loss: 0.3481341410843052
Epoch: 29, step: 142, loss: 0.31777867674827576, mean loss: 0.34813341866196446
Epoch: 29, step: 143, loss: 0.32679295539855957, mean loss: 0.3481329107975365
Epoch: 29, step: 144, loss: 0.3318871259689331, mean loss: 0.34813252418644136
Epoch: 29, step: 145, loss: 0.30772897601127625, mean loss: 0.3481315627008344
Epoch: 29, step: 146, loss: 0.3087846040725708, mean loss: 0.34813062638123254
Epoch: 29, step: 147, loss: 0.3337216079235077, mean loss: 0.3481302835052936
Epoch: 29, step: 148, loss: 0.3646855354309082, mean loss: 0.34813067744347154
Epoch: 29, step: 149, loss: 0.3161132037639618, mean loss: 0.3481299155942906
Epoch: 29, step: 150, loss: 0.3210623562335968, mean loss: 0.34812927154262474
Epoch: 29, step: 151, loss: 0.34877249598503113, mean loss: 0.34812928684728933
Epoch: 29, step: 152, loss: 0.33616435527801514, mean loss: 0.3481290021645329
Epoch: 29, step: 153, loss: 0.35149869322776794, mean loss: 0.34812908233800577
Epoch: 29, step: 154, loss: 0.3642626106739044, mean loss: 0.3481294661863162
Epoch: 29, step: 155, loss: 0.37917211651802063, mean loss: 0.3481302047343351
Epoch: 29, step: 156, loss: 0.3323858678340912, mean loss: 0.3481298301634765
Epoch: 29, step: 157, loss: 0.33920997381210327, mean loss: 0.3481296179577299
Epoch: 29, step: 158, loss: 0.3335428833961487, mean loss: 0.3481292709437044
Epoch: 29, step: 159, loss: 0.3407585024833679, mean loss: 0.3481290955995123
Epoch: 29, step: 160, loss: 0.28842291235923767, mean loss: 0.34812767527495914
Epoch: 29, step: 161, loss: 0.35912880301475525, mean loss: 0.3481279369698005
Epoch: 29, step: 162, loss: 0.33646318316459656, mean loss: 0.348127659495222
Epoch: 29, step: 163, loss: 0.31083551049232483, mean loss: 0.3481267724317348
Epoch: 29, step: 164, loss: 0.3269665837287903, mean loss: 0.34812626910905686
Epoch: 29, step: 165, loss: 0.33581116795539856, mean loss: 0.3481259761852865
Epoch: 29, step: 166, loss: 0.35763290524482727, mean loss: 0.34812620230923247
Epoch: 29, step: 167, loss: 0.28332579135894775, mean loss: 0.34812466105695034
Epoch: 29, step: 168, loss: 0.3461730182170868, mean loss: 0.3481246146389972
Epoch: 29, step: 169, loss: 0.3553488850593567, mean loss: 0.34812478645725387
Epoch: 29, step: 170, loss: 0.3083655536174774, mean loss: 0.3481238408670134
Epoch: 29, step: 171, loss: 0.32943376898765564, mean loss: 0.3481233963732948
Epoch: 29, step: 172, loss: 0.34427839517593384, mean loss: 0.3481233049323284
Epoch: 29, step: 173, loss: 0.3497956097126007, mean loss: 0.3481233447017643
Epoch: 29, step: 174, loss: 0.36138612031936646, mean loss: 0.34812366009915363
Epoch: 29, step: 175, loss: 0.31089669466018677, mean loss: 0.3481227748388702
Epoch: 29, step: 176, loss: 0.3262656331062317, mean loss: 0.3481222550866116
Epoch: 29, step: 177, loss: 0.3065667748451233, mean loss: 0.34812126694088846
Epoch: 29, step: 178, loss: 0.3513256907463074, mean loss: 0.34812134313691284
Epoch: 29, step: 179, loss: 0.3289836049079895, mean loss: 0.34812088808321706
Epoch: 29, step: 180, loss: 0.318904310464859, mean loss: 0.3481201933932102
Epoch: 29, step: 181, loss: 0.310016006231308, mean loss: 0.34811928740178977
Epoch: 29, step: 182, loss: 0.3369741141796112, mean loss: 0.34811902241276904
Epoch: 29, step: 183, loss: 0.367186576128006, mean loss: 0.34811947575451213
Epoch: 29, step: 184, loss: 0.3288525938987732, mean loss: 0.34811901768452197
Epoch: 29, step: 185, loss: 0.31673702597618103, mean loss: 0.34811827159561254
Epoch: 29, step: 186, loss: 0.30116137862205505, mean loss: 0.3481171552488714
Epoch: 29, step: 187, loss: 0.3341789245605469, mean loss: 0.348116823891162
Epoch: 29, step: 188, loss: 0.32081276178359985, mean loss: 0.34811617479899254
Epoch: 29, step: 189, loss: 0.35435548424720764, mean loss: 0.3481163231209021
Epoch: 29, step: 190, loss: 0.3101873993873596, mean loss: 0.348115421489606
Epoch: 29, step: 191, loss: 0.33856314420700073, mean loss: 0.3481151944220658
Epoch: 29, step: 192, loss: 0.3323083221912384, mean loss: 0.34811481868524696
Epoch: 29, step: 193, loss: 0.3546351194381714, mean loss: 0.3481149736721914
Epoch: 29, step: 194, loss: 0.34545934200286865, mean loss: 0.3481149105495732
Epoch: 29, step: 195, loss: 0.34464144706726074, mean loss: 0.34811482798959315
Epoch: 29, step: 196, loss: 0.3521776497364044, mean loss: 0.34811492455560333
Epoch: 29, step: 197, loss: 0.298373818397522, mean loss: 0.348113742326527
Epoch: 29, step: 198, loss: 0.3643393814563751, mean loss: 0.34811412796263225
Epoch: 29, step: 199, loss: 0.31662195920944214, mean loss: 0.34811337950344523
Epoch: 29, step: 200, loss: 0.32708269357681274, mean loss: 0.3481128796891541
Epoch: 29, step: 201, loss: 0.3248320519924164, mean loss: 0.34811232641124884
Epoch: 29, step: 202, loss: 0.3188905417919159, mean loss: 0.3481116319607006
Epoch: 29, step: 203, loss: 0.34012916684150696, mean loss: 0.3481114422633356
Epoch: 29, step: 204, loss: 0.31065940856933594, mean loss: 0.3481105522646737
Epoch: 29, step: 205, loss: 0.30808770656585693, mean loss: 0.34810960119662326
Epoch: 29, step: 206, loss: 0.35042059421539307, mean loss: 0.3481096561117438
Epoch: 29, step: 207, loss: 0.3428196609020233, mean loss: 0.34810953041087866
Epoch: 29, step: 208, loss: 0.35380131006240845, mean loss: 0.348109665655732
Epoch: 29, step: 209, loss: 0.32623714208602905, mean loss: 0.3481091459455298
Epoch: 29, step: 210, loss: 0.3535369336605072, mean loss: 0.34810927491142696
Epoch: 29, step: 211, loss: 0.334242045879364, mean loss: 0.34810894542964993
Epoch: 29, step: 212, loss: 0.3155243694782257, mean loss: 0.348108171246943
Epoch: 29, step: 213, loss: 0.3363860547542572, mean loss: 0.34810789274571957
Epoch: 29, step: 214, loss: 0.3466135561466217, mean loss: 0.34810785724319887
Epoch: 29, step: 215, loss: 0.326264888048172, mean loss: 0.3481073383092163
Epoch: 29, step: 216, loss: 0.3292129933834076, mean loss: 0.3481068894377905
Epoch: 29, step: 217, loss: 0.314220666885376, mean loss: 0.3481060844246639
Epoch: 29, step: 218, loss: 0.37698832154273987, mean loss: 0.3481067705450373
Epoch: 29, step: 219, loss: 0.36116698384284973, mean loss: 0.3481070807933578
Epoch: 29, step: 220, loss: 0.31675705313682556, mean loss: 0.3481063360840517
Epoch: 29, step: 221, loss: 0.30712705850601196, mean loss: 0.3481053626582933
Epoch: 29, step: 222, loss: 0.34388861060142517, mean loss: 0.3481052624955327
Epoch: 29, step: 223, loss: 0.31603455543518066, mean loss: 0.3481045007210182
Epoch: 29, step: 224, loss: 0.30043116211891174, mean loss: 0.3481033683645753
Epoch: 29, step: 225, loss: 0.3354376554489136, mean loss: 0.3481030675305789
Epoch: 29, step: 226, loss: 0.37703177332878113, mean loss: 0.3481037546242729
Epoch: 29, step: 227, loss: 0.33992576599121094, mean loss: 0.34810356039121587
Epoch: 29, step: 228, loss: 0.3856394290924072, mean loss: 0.3481044518736693
Epoch: 29, step: 229, loss: 0.3160408139228821, mean loss: 0.3481036903755942
Epoch: 29, step: 230, loss: 0.3049274981021881, mean loss: 0.34810266498332515
Epoch: 29, step: 231, loss: 0.3371203541755676, mean loss: 0.3481024041703963
Epoch: 29, step: 232, loss: 0.3288946747779846, mean loss: 0.34810194802730593
Epoch: 29, step: 233, loss: 0.3079215884208679, mean loss: 0.3481009938511101
Epoch: 29, step: 234, loss: 0.33799153566360474, mean loss: 0.34810075378418726
Epoch: 29, step: 235, loss: 0.34118083119392395, mean loss: 0.34810058946231726
Epoch: 29, step: 236, loss: 0.3193223476409912, mean loss: 0.348099906104641
Epoch: 29, step: 237, loss: 0.3504476845264435, mean loss: 0.3480999618528107
Epoch: 29, step: 238, loss: 0.31123945116996765, mean loss: 0.34809908661808003
Epoch: 29, step: 239, loss: 0.39066067337989807, mean loss: 0.3481000971980677
Epoch: 29, step: 240, loss: 0.3454582393169403, mean loss: 0.3481000344714281
Epoch: 29, step: 241, loss: 0.296783447265625, mean loss: 0.3480988160710481
Epoch: 29, step: 242, loss: 0.3294306993484497, mean loss: 0.3480983728478775
Epoch: 29, step: 243, loss: 0.32199254631996155, mean loss: 0.3480977530514262
Epoch: 29, step: 244, loss: 0.3532958924770355, mean loss: 0.3480978764611132
Epoch: 29, step: 245, loss: 0.3735329508781433, mean loss: 0.348098480304103
Epoch: 29, step: 246, loss: 0.3498636484146118, mean loss: 0.34809852220919313
Epoch: 29, step: 247, loss: 0.3219950199127197, mean loss: 0.34809790252677225
Epoch: 29, step: 248, loss: 0.3436025083065033, mean loss: 0.34809779581118244
Epoch: 29, step: 249, loss: 0.3262079656124115, mean loss: 0.3480972761836318
Epoch: 29, step: 250, loss: 0.32333892583847046, mean loss: 0.34809668847621505
Epoch: 29, step: 251, loss: 0.3062610328197479, mean loss: 0.34809569541564594
Epoch: 29, step: 252, loss: 0.3438085615634918, mean loss: 0.34809559365358533
Epoch: 29, step: 253, loss: 0.35131534934043884, mean loss: 0.3480956700778836
Epoch: 29, step: 254, loss: 0.33546483516693115, mean loss: 0.34809537027880666
Epoch: 29, step: 255, loss: 0.30853724479675293, mean loss: 0.34809443136953383
Epoch: 29, step: 256, loss: 0.3057522773742676, mean loss: 0.3480934264053966
Epoch: 29, step: 257, loss: 0.31876903772354126, mean loss: 0.3480927304261712
Epoch: 29, step: 258, loss: 0.38320350646972656, mean loss: 0.3480935637185895
Epoch: 29, step: 259, loss: 0.3288979232311249, mean loss: 0.3480931081546896
Epoch: 29, step: 260, loss: 0.28851139545440674, mean loss: 0.34809169415481533
Epoch: 29, step: 261, loss: 0.2916283905506134, mean loss: 0.3480903541931749
Epoch: 29, step: 262, loss: 0.33345744013786316, mean loss: 0.34809000693970293
Epoch: 29, step: 263, loss: 0.3522258698940277, mean loss: 0.34809010508547783
Epoch: 29, step: 264, loss: 0.33127444982528687, mean loss: 0.3480897060523448
Epoch: 29, step: 265, loss: 0.32736217975616455, mean loss: 0.34808921420273403
Epoch: 29, step: 266, loss: 0.3210870027542114, mean loss: 0.3480885734744648
Epoch: 29, step: 267, loss: 0.3536466658115387, mean loss: 0.3480887053578251
Epoch: 29, step: 268, loss: 0.31462785601615906, mean loss: 0.3480879114119397
Epoch: 29, step: 269, loss: 0.3083122968673706, mean loss: 0.3480869676541799
Epoch: 29, step: 270, loss: 0.3452284038066864, mean loss: 0.3480868998305187
Epoch: 29, step: 271, loss: 0.3144263029098511, mean loss: 0.3480861012019498
Epoch: 29, step: 272, loss: 0.36120542883872986, mean loss: 0.34808641246265914
Epoch: 29, step: 273, loss: 0.31335681676864624, mean loss: 0.3480855885102109
Epoch: 29, step: 274, loss: 0.3234138786792755, mean loss: 0.3480850031929033
Epoch: 29, step: 275, loss: 0.3848975896835327, mean loss: 0.34808587652243667
Epoch: 29, step: 276, loss: 0.3336271643638611, mean loss: 0.3480855335169054
Epoch: 29, step: 277, loss: 0.30519118905067444, mean loss: 0.3480845159540533
Epoch: 29, step: 278, loss: 0.31987524032592773, mean loss: 0.3480838467742258
Epoch: 29, step: 279, loss: 0.30520495772361755, mean loss: 0.3480828296262742
Epoch: 29, step: 280, loss: 0.36029306054115295, mean loss: 0.3480831192633668
Epoch: 29, step: 281, loss: 0.3166793882846832, mean loss: 0.34808237435775036
Epoch: 29, step: 282, loss: 0.36790546774864197, mean loss: 0.3480828445561277
Epoch: 29, step: 283, loss: 0.3295459747314453, mean loss: 0.34808240487705217
Epoch: 29, step: 284, loss: 0.3776107132434845, mean loss: 0.3480831052472608
Epoch: 29, step: 285, loss: 0.30774369835853577, mean loss: 0.34808214847559704
Epoch: 29, step: 286, loss: 0.34726542234420776, mean loss: 0.3480821291049135
Epoch: 29, step: 287, loss: 0.3481220304965973, mean loss: 0.3480821300512514
Epoch: 29, step: 288, loss: 0.3400411009788513, mean loss: 0.348081939347372
Epoch: 29, step: 289, loss: 0.34896448254585266, mean loss: 0.34808196027758115
Epoch: 29, step: 290, loss: 0.3348767161369324, mean loss: 0.3480816471122115
Epoch: 29, step: 291, loss: 0.37893566489219666, mean loss: 0.34808237880491166
Epoch: 29, step: 292, loss: 0.37154653668403625, mean loss: 0.3480829352363632
Epoch: 29, step: 293, loss: 0.3548237979412079, mean loss: 0.3480830950860835
Epoch: 29, step: 294, loss: 0.34526193141937256, mean loss: 0.3480830281878912
Epoch: 29, step: 295, loss: 0.3457270562648773, mean loss: 0.34808297232210533
Epoch: 29, step: 296, loss: 0.3640668988227844, mean loss: 0.3480833513306298
Epoch: 29, step: 297, loss: 0.3058306872844696, mean loss: 0.3480823494654037
Epoch: 29, step: 298, loss: 0.30966246128082275, mean loss: 0.3480814385018427
Epoch: 29, step: 299, loss: 0.35060515999794006, mean loss: 0.34808149833970065
Epoch: 29, step: 300, loss: 0.3261220157146454, mean loss: 0.34808097768904683
Epoch: 29, step: 301, loss: 0.32947203516960144, mean loss: 0.34808053648883536
Epoch: 29, step: 302, loss: 0.30642595887184143, mean loss: 0.3480795489220932
Epoch: 29, step: 303, loss: 0.3728281259536743, mean loss: 0.3480801356593391
Epoch: 29, step: 304, loss: 0.31366270780563354, mean loss: 0.34807931971311085
Epoch: 29, step: 305, loss: 0.33675163984298706, mean loss: 0.3480790511701335
Epoch: 29, step: 306, loss: 0.3289549946784973, mean loss: 0.34807859781080647
Epoch: 29, step: 307, loss: 0.3544176518917084, mean loss: 0.34807874808233313
Epoch: 29, step: 308, loss: 0.3152080774307251, mean loss: 0.34807796887952047
Epoch: 29, step: 309, loss: 0.34000861644744873, mean loss: 0.34807777759918024
Epoch: 29, step: 310, loss: 0.3482595682144165, mean loss: 0.3480777819083422
Epoch: 29, step: 311, loss: 0.3403918147087097, mean loss: 0.3480775997246123
Epoch: 29, step: 312, loss: 0.3508372902870178, mean loss: 0.3480776651371739
Epoch: 29, step: 313, loss: 0.33461904525756836, mean loss: 0.34807734613693975
Epoch: 29, step: 314, loss: 0.3476879298686981, mean loss: 0.34807733690709763
Epoch: 29, step: 315, loss: 0.3372017741203308, mean loss: 0.3480770791434745
Epoch: 29, step: 316, loss: 0.31384003162384033, mean loss: 0.348076267704432
Epoch: 29, step: 317, loss: 0.3207494914531708, mean loss: 0.34807562005841003
Epoch: 29, step: 318, loss: 0.34024477005004883, mean loss: 0.34807543447125494
Epoch: 29, step: 319, loss: 0.3757961392402649, mean loss: 0.34807609142226376
Epoch: 29, step: 320, loss: 0.35518208146095276, mean loss: 0.3480762598226249
Epoch: 29, step: 321, loss: 0.3170986473560333, mean loss: 0.3480755257211873
Epoch: 29, step: 322, loss: 0.334940105676651, mean loss: 0.3480752144479333
Epoch: 29, step: 323, loss: 0.36307457089424133, mean loss: 0.3480755698829202
Epoch: 29, step: 324, loss: 0.3336169123649597, mean loss: 0.34807522726882295
Epoch: 29, step: 325, loss: 0.34018442034721375, mean loss: 0.3480750402917384
Epoch: 29, step: 326, loss: 0.3112000823020935, mean loss: 0.3480741665396831
Epoch: 29, step: 327, loss: 0.3851025700569153, mean loss: 0.34807504390684063
Epoch: 29, step: 328, loss: 0.32349643111228943, mean loss: 0.34807446154425814
Epoch: 29, step: 329, loss: 0.32859471440315247, mean loss: 0.3480740000044974
Epoch: 29, step: 330, loss: 0.37793225049972534, mean loss: 0.3480747074286331
Epoch: 29, step: 331, loss: 0.3072967529296875, mean loss: 0.3480737413095443
Epoch: 29, step: 332, loss: 0.3264758288860321, mean loss: 0.34807322961979986
Epoch: 29, step: 333, loss: 0.3347134292125702, mean loss: 0.34807291311185373
Epoch: 29, step: 334, loss: 0.3866545259952545, mean loss: 0.3480738271298321
Epoch: 29, step: 335, loss: 0.3355049192905426, mean loss: 0.3480735293730843
Epoch: 29, step: 336, loss: 0.3488824963569641, mean loss: 0.34807354853701444
Epoch: 29, step: 337, loss: 0.3421342968940735, mean loss: 0.3480734078431299
Epoch: 29, step: 338, loss: 0.35477766394615173, mean loss: 0.3480735666553081
Epoch: 29, step: 339, loss: 0.2880248725414276, mean loss: 0.3480721442397757
Epoch: 29, step: 340, loss: 0.3067534267902374, mean loss: 0.3480711655175205
Epoch: 29, step: 341, loss: 0.35092222690582275, mean loss: 0.34807123304941184
Epoch: 29, step: 342, loss: 0.31575748324394226, mean loss: 0.34807046766534766
Epoch: 29, step: 343, loss: 0.3053027093410492, mean loss: 0.34806945469144135
Epoch: 29, step: 344, loss: 0.3411237299442291, mean loss: 0.3480692901826721
Epoch: 29, step: 345, loss: 0.32951951026916504, mean loss: 0.34806885084346706
Epoch: 29, step: 346, loss: 0.34234189987182617, mean loss: 0.34806871520765315
Epoch: 29, step: 347, loss: 0.3349996507167816, mean loss: 0.3480684056902107
Epoch: 29, step: 348, loss: 0.31649190187454224, mean loss: 0.348067657874845
Epoch: 29, step: 349, loss: 0.3632189631462097, mean loss: 0.3480680166894443
Epoch: 29, step: 350, loss: 0.36777785420417786, mean loss: 0.348068483448568
Epoch: 29, step: 351, loss: 0.3072569668292999, mean loss: 0.3480675169922684
Epoch: 29, step: 352, loss: 0.31241515278816223, mean loss: 0.3480666727296952
Epoch: 29, step: 353, loss: 0.33051106333732605, mean loss: 0.34806625701552535
Epoch: 29, step: 354, loss: 0.3271581828594208, mean loss: 0.3480657619272216
Epoch: 29, step: 355, loss: 0.30555060505867004, mean loss: 0.3480647552224274
Epoch: 29, step: 356, loss: 0.31948795914649963, mean loss: 0.3480640785762958
Epoch: 29, step: 357, loss: 0.3602270781993866, mean loss: 0.34806436656700523
Epoch: 29, step: 358, loss: 0.3158692419528961, mean loss: 0.3480636042815876
Epoch: 29, step: 359, loss: 0.31421807408332825, mean loss: 0.34806280293841596
Epoch: 29, step: 360, loss: 0.35286176204681396, mean loss: 0.34806291655820687
Epoch: 29, step: 361, loss: 0.3349063992500305, mean loss: 0.3480626050728783
Epoch: 29, step: 362, loss: 0.3368607759475708, mean loss: 0.34806233987178153
Epoch: 29, step: 363, loss: 0.3753221929073334, mean loss: 0.34806298522815077
Epoch: 29, step: 364, loss: 0.35501885414123535, mean loss: 0.34806314989917925
Epoch: 29, step: 365, loss: 0.3348236382007599, mean loss: 0.3480628364786097
Epoch: 29, step: 366, loss: 0.3581264019012451, mean loss: 0.3480630747089774
Epoch: 29, step: 367, loss: 0.3090638816356659, mean loss: 0.34806215152004943
Epoch: 29, step: 368, loss: 0.36276406049728394, mean loss: 0.3480624995354117
Epoch: 29, step: 369, loss: 0.38252225518226624, mean loss: 0.3480633152281553
Epoch: 29, step: 370, loss: 0.3705116808414459, mean loss: 0.34806384658814804
Epoch: 29, step: 371, loss: 0.3166865110397339, mean loss: 0.3480631038941614
Epoch: 29, step: 372, loss: 0.34806257486343384, mean loss: 0.34806310388163963
Epoch: 29, step: 373, loss: 0.36756640672683716, mean loss: 0.34806356549827505
Epoch: 29, step: 374, loss: 0.34086692333221436, mean loss: 0.3480633951675807
Epoch: 29, step: 375, loss: 0.3466714918613434, mean loss: 0.3480633622246832
Epoch: 29, step: 376, loss: 0.30954188108444214, mean loss: 0.3480624505383854
Epoch: 29, step: 377, loss: 0.3302064836025238, mean loss: 0.34806202795195723
Epoch: 29, step: 378, loss: 0.34746506810188293, mean loss: 0.3480620138244019
Epoch: 29, step: 379, loss: 0.3215273320674896, mean loss: 0.3480613858737734
Epoch: 29, step: 380, loss: 0.3566160500049591, mean loss: 0.34806158831748996
Epoch: 29, step: 381, loss: 0.34222450852394104, mean loss: 0.3480614501879099
Epoch: 29, step: 382, loss: 0.3416668176651001, mean loss: 0.3480612988678947
Epoch: 29, step: 383, loss: 0.30949175357818604, mean loss: 0.348060386195266
Epoch: 29, step: 384, loss: 0.3471394181251526, mean loss: 0.34806036440287896
Epoch: 29, step: 385, loss: 0.30296027660369873, mean loss: 0.3480592972482767
Epoch: 29, step: 386, loss: 0.35795995593070984, mean loss: 0.3480595315113125
Epoch: 29, step: 387, loss: 0.31891366839408875, mean loss: 0.3480588418969098
Epoch: 29, step: 388, loss: 0.3569825291633606, mean loss: 0.348059053033483
Epoch: 29, step: 389, loss: 0.33910346031188965, mean loss: 0.3480588411470324
Epoch: 29, step: 390, loss: 0.3522495925426483, mean loss: 0.34805894029652007
Epoch: 29, step: 391, loss: 0.31058984994888306, mean loss: 0.34805805383181043
Epoch: 29, step: 392, loss: 0.29113471508026123, mean loss: 0.34805670713946496
Epoch: 29, step: 393, loss: 0.37452226877212524, mean loss: 0.34805733324690835
Epoch: 29, step: 394, loss: 0.34004104137420654, mean loss: 0.3480571436064486
Epoch: 29, step: 395, loss: 0.3623194992542267, mean loss: 0.3480574810013116
Epoch: 29, step: 396, loss: 0.331846684217453, mean loss: 0.3480570975225714
Epoch: 29, step: 397, loss: 0.3321724236011505, mean loss: 0.3480567217674046
Epoch: 29, step: 398, loss: 0.334371954202652, mean loss: 0.3480563980591239
Epoch: 29, step: 399, loss: 0.3133722245693207, mean loss: 0.348055577636816
Epoch: 29, step: 400, loss: 0.3026195466518402, mean loss: 0.3480545029146033
Epoch: 29, step: 401, loss: 0.3373434245586395, mean loss: 0.3480542495658556
Epoch: 29, step: 402, loss: 0.3248157501220703, mean loss: 0.3480536999194722
Epoch: 29, step: 403, loss: 0.3694905936717987, mean loss: 0.3480542069415572
Epoch: 29, step: 404, loss: 0.31043508648872375, mean loss: 0.3480533172010011
Epoch: 29, step: 405, loss: 0.31517767906188965, mean loss: 0.3480525396682888
Epoch: 29, step: 406, loss: 0.34395530819892883, mean loss: 0.3480524427680814
Epoch: 29, step: 407, loss: 0.3088374435901642, mean loss: 0.348051515348746
Epoch: 29, step: 408, loss: 0.3666958510875702, mean loss: 0.34805195626953916
Epoch: 29, step: 409, loss: 0.3308519124984741, mean loss: 0.34805154951449563
Epoch: 29, step: 410, loss: 0.32898715138435364, mean loss: 0.34805109868095035
Epoch: 29, step: 411, loss: 0.34542062878608704, mean loss: 0.3480510364772544
Epoch: 29, step: 412, loss: 0.3232352137565613, mean loss: 0.3480504496621791
Epoch: 29, step: 413, loss: 0.32975685596466064, mean loss: 0.34805001708725125
Epoch: 29, step: 414, loss: 0.33076006174087524, mean loss: 0.3480496082542762
Epoch: 29, step: 415, loss: 0.3395078480243683, mean loss: 0.3480494062832124
Epoch: 29, step: 416, loss: 0.35238727927207947, mean loss: 0.34804950885037456
Epoch: 29, step: 417, loss: 0.38613519072532654, mean loss: 0.34805040934883474
Epoch: 29, step: 418, loss: 0.31217506527900696, mean loss: 0.3480495611316916
Epoch: 29, step: 419, loss: 0.3684592545032501, mean loss: 0.3480500436759835
Epoch: 29, step: 420, loss: 0.3327154219150543, mean loss: 0.348049681129662
Epoch: 29, step: 421, loss: 0.31726357340812683, mean loss: 0.34804895329128377
Epoch: 29, step: 422, loss: 0.3611568510532379, mean loss: 0.3480492631779894
Epoch: 29, step: 423, loss: 0.3293495774269104, mean loss: 0.3480488211050402
Epoch: 29, step: 424, loss: 0.32283705472946167, mean loss: 0.34804822509628447
Epoch: 29, step: 425, loss: 0.32749515771865845, mean loss: 0.34804773923113913
Epoch: 29, step: 426, loss: 0.3255898952484131, mean loss: 0.3480472083504928
Epoch: 29, step: 427, loss: 0.338309645652771, mean loss: 0.34804697816983143
Epoch: 29, step: 428, loss: 0.32826536893844604, mean loss: 0.34804651057476627
Epoch: 29, step: 429, loss: 0.3163711130619049, mean loss: 0.3480457618536035
Epoch: 29, step: 430, loss: 0.31584757566452026, mean loss: 0.34804500079311257
Epoch: 29, step: 431, loss: 0.3133244812488556, mean loss: 0.3480441801322554
Epoch: 29, step: 432, loss: 0.3182569444179535, mean loss: 0.3480434760920816
Epoch: 29, step: 433, loss: 0.3491044342517853, mean loss: 0.34804350116790667
Epoch: 29, step: 434, loss: 0.36090201139450073, mean loss: 0.3480438050725704
Epoch: 29, step: 435, loss: 0.3501409888267517, mean loss: 0.3480438546373216
Epoch: 29, step: 436, loss: 0.3592117428779602, mean loss: 0.34804411857247725
Epoch: 29, step: 437, loss: 0.31549498438835144, mean loss: 0.3480433493439906
Epoch: 29, step: 438, loss: 0.30055588483810425, mean loss: 0.34804222710685234
Epoch: 29, step: 439, loss: 0.3095030188560486, mean loss: 0.34804131635894964
Epoch: 29, step: 440, loss: 0.32499611377716064, mean loss: 0.34804077177397
Epoch: 29, step: 441, loss: 0.30364152789115906, mean loss: 0.3480397225929151
Epoch: 29, step: 442, loss: 0.31059205532073975, mean loss: 0.34803883770274113
Epoch: 29, step: 443, loss: 0.25834619998931885, mean loss: 0.3480367183114908
Epoch: 29, step: 444, loss: 0.3017948269844055, mean loss: 0.34803562566501917
Epoch: 29, step: 445, loss: 0.32069042325019836, mean loss: 0.3480349795423781
Epoch: 29, step: 446, loss: 0.35205787420272827, mean loss: 0.34803507459458755
Epoch: 29, step: 447, loss: 0.3324887156486511, mean loss: 0.3480347072767786
Epoch: 29, step: 448, loss: 0.343994677066803, mean loss: 0.34803461182420425
Epoch: 29, step: 449, loss: 0.32490870356559753, mean loss: 0.348034065448259
Epoch: 29, step: 450, loss: 0.3557332456111908, mean loss: 0.3480342473458696
Epoch: 29, step: 451, loss: 0.3333284556865692, mean loss: 0.3480338999211942
Epoch: 29, step: 452, loss: 0.3371860980987549, mean loss: 0.34803364364767436
Epoch: 29, step: 453, loss: 0.31094077229499817, mean loss: 0.34803276736911654
Epoch: 29, step: 454, loss: 0.3146441578865051, mean loss: 0.34803197861833146
Epoch: 29, step: 455, loss: 0.319623738527298, mean loss: 0.3480313075364055
Epoch: 29, step: 456, loss: 0.3461001217365265, mean loss: 0.34803126191748407
Epoch: 29, step: 457, loss: 0.3329103887081146, mean loss: 0.3480309047371276
Epoch: 29, step: 458, loss: 0.3759152591228485, mean loss: 0.3480315633967328
Epoch: 29, step: 459, loss: 0.3394499123096466, mean loss: 0.3480313606933341
Epoch: 29, step: 460, loss: 0.36499378085136414, mean loss: 0.3480317613457223
Epoch: 29, step: 461, loss: 0.3165034055709839, mean loss: 0.3480310166635036
Epoch: 29, step: 462, loss: 0.37444397807121277, mean loss: 0.34803164050821905
Epoch: 29, step: 463, loss: 0.34084147214889526, mean loss: 0.3480314706884656
Epoch: 29, step: 464, loss: 0.3064667284488678, mean loss: 0.3480304890219429
Epoch: 29, step: 465, loss: 0.32743504643440247, mean loss: 0.34803000261500444
Epoch: 29, step: 466, loss: 0.3047385513782501, mean loss: 0.3480289802157593
Epoch: 29, step: 467, loss: 0.3079717457294464, mean loss: 0.34802803422023487
Epoch: 29, step: 468, loss: 0.29101818799972534, mean loss: 0.34802668790198665
Epoch: 29, step: 469, loss: 0.34441208839416504, mean loss: 0.3480266025432867
Epoch: 29, step: 470, loss: 0.32338765263557434, mean loss: 0.3480260207086843
Epoch: 29, step: 471, loss: 0.3871029317378998, mean loss: 0.3480269434656275
Epoch: 29, step: 472, loss: 0.34819912910461426, mean loss: 0.3480269475315001
Epoch: 29, step: 473, loss: 0.32919660210609436, mean loss: 0.3480265028952445
Epoch: 29, step: 474, loss: 0.33426743745803833, mean loss: 0.34802617801353125
Epoch: 29, step: 475, loss: 0.37920063734054565, mean loss: 0.3480269140935116
Epoch: 29, step: 476, loss: 0.3055697977542877, mean loss: 0.34802591163521257
Epoch: 29, step: 477, loss: 0.370412141084671, mean loss: 0.3480264401857497
Epoch: 29, step: 478, loss: 0.32638177275657654, mean loss: 0.34802592915594377
Epoch: 29, step: 479, loss: 0.31793099641799927, mean loss: 0.3480252186324586
Epoch: 29, step: 480, loss: 0.3405285179615021, mean loss: 0.3480250416439875
Epoch: 29, step: 481, loss: 0.3381752371788025, mean loss: 0.3480248091069351
Epoch: 29, step: 482, loss: 0.3218589127063751, mean loss: 0.3480241913894158
Epoch: 29, step: 483, loss: 0.3376356363296509, mean loss: 0.34802394614496207
Epoch: 29, step: 484, loss: 0.33549970388412476, mean loss: 0.34802365048994305
Epoch: 29, step: 485, loss: 0.3527836203575134, mean loss: 0.34802376285408704
Epoch: 29, step: 486, loss: 0.3528161346912384, mean loss: 0.3480238759804435
Epoch: 29, step: 487, loss: 0.3443598747253418, mean loss: 0.34802378949188584
Epoch: 29, step: 488, loss: 0.32703620195388794, mean loss: 0.3480232940926757
Epoch: 29, step: 489, loss: 0.30800196528434753, mean loss: 0.34802234943590354
Epoch: 29, step: 490, loss: 0.33774909377098083, mean loss: 0.3480221069534133
Epoch: 29, step: 491, loss: 0.31052207946777344, mean loss: 0.3480212218508008
Epoch: 29, step: 492, loss: 0.3319479823112488, mean loss: 0.348020842487598
Epoch: 29, step: 493, loss: 0.3079085052013397, mean loss: 0.3480198957720614
Epoch: 29, step: 494, loss: 0.37632322311401367, mean loss: 0.3480205637602453
Epoch: 29, step: 495, loss: 0.2791532874107361, mean loss: 0.3480189384587172
Epoch: 29, step: 496, loss: 0.29516518115997314, mean loss: 0.3480176911135375
Epoch: 29, step: 497, loss: 0.3745276927947998, mean loss: 0.3480183167330608
Epoch: 29, step: 498, loss: 0.34505170583724976, mean loss: 0.34801824672454407
Epoch: 29, step: 499, loss: 0.3420795202255249, mean loss: 0.34801810658091326
Epoch: 29, step: 500, loss: 0.3584566116333008, mean loss: 0.3480183529056897
Epoch: 29, step: 501, loss: 0.35010045766830444, mean loss: 0.348018402037427
Epoch: 29, step: 502, loss: 0.31005358695983887, mean loss: 0.3480175061971505
Epoch: 29, step: 503, loss: 0.32709601521492004, mean loss: 0.3480170125328989
Epoch: 29, step: 504, loss: 0.33487313985824585, mean loss: 0.34801670239692584
Epoch: 29, step: 505, loss: 0.3351294994354248, mean loss: 0.34801639832437237
Epoch: 29, step: 506, loss: 0.35489505529403687, mean loss: 0.3480165606219202
Epoch: 29, step: 507, loss: 0.335025817155838, mean loss: 0.3480162541208003
Epoch: 29, step: 508, loss: 0.3500683903694153, mean loss: 0.3480163025373686
Epoch: 29, step: 509, loss: 0.3457944989204407, mean loss: 0.348016250119032
Epoch: 29, step: 510, loss: 0.37640443444252014, mean loss: 0.3480169198570253
Epoch: 29, step: 511, loss: 0.3104168772697449, mean loss: 0.34801603281251775
Epoch: 29, step: 512, loss: 0.31982895731925964, mean loss: 0.34801536785048764
Epoch: 29, step: 513, loss: 0.324342280626297, mean loss: 0.3480148093912467
Epoch: 29, step: 514, loss: 0.3857097327709198, mean loss: 0.348015698611208
Epoch: 29, step: 515, loss: 0.33658069372177124, mean loss: 0.3480154288668013
Epoch: 29, step: 516, loss: 0.3052210807800293, mean loss: 0.3480144193994815
Epoch: 29, step: 517, loss: 0.3199361562728882, mean loss: 0.3480137570825705
Epoch: 29, step: 518, loss: 0.32552334666252136, mean loss: 0.34801322658580386
Epoch: 29, step: 519, loss: 0.3254605531692505, mean loss: 0.3480126946329447
Epoch: 29, step: 520, loss: 0.3369467258453369, mean loss: 0.34801243362464723
Epoch: 29, step: 521, loss: 0.31484508514404297, mean loss: 0.34801165133896206
Epoch: 29, step: 522, loss: 0.3115522265434265, mean loss: 0.34801079142658686
Epoch: 29, step: 523, loss: 0.30522963404655457, mean loss: 0.348009782437026
Epoch: 29, step: 524, loss: 0.3410777449607849, mean loss: 0.34800961894943194
Epoch: 29, step: 525, loss: 0.32297804951667786, mean loss: 0.34800902861007454
Epoch: 29, step: 526, loss: 0.31814923882484436, mean loss: 0.34800832441957424
Epoch: 29, step: 527, loss: 0.37288081645965576, mean loss: 0.34800891097961667
Epoch: 29, step: 528, loss: 0.34122738242149353, mean loss: 0.3480087510567642
Epoch: 29, step: 529, loss: 0.3561502695083618, mean loss: 0.34800894304654045
Epoch: 29, step: 530, loss: 0.30154454708099365, mean loss: 0.3480078473690352
Epoch: 29, step: 531, loss: 0.2989756166934967, mean loss: 0.3480066911666518
Epoch: 29, step: 532, loss: 0.33747828006744385, mean loss: 0.3480064429077657
Epoch: 29, step: 533, loss: 0.3305130898952484, mean loss: 0.34800603042596867
Epoch: 29, step: 534, loss: 0.3407260477542877, mean loss: 0.34800585877279683
Epoch: 29, step: 535, loss: 0.37809526920318604, mean loss: 0.34800656822791404
Epoch: 29, step: 536, loss: 0.32633399963378906, mean loss: 0.34800605723909944
Epoch: 29, step: 537, loss: 0.3509100377559662, mean loss: 0.3480061257065988
Epoch: 29, step: 538, loss: 0.34697914123535156, mean loss: 0.34800610149383276
Epoch: 29, step: 539, loss: 0.30686154961586, mean loss: 0.3480051314695052
Epoch: 29, step: 540, loss: 0.324139267206192, mean loss: 0.3480045688209383
Epoch: 29, step: 541, loss: 0.34210205078125, mean loss: 0.3480044296696808
Epoch: 29, step: 542, loss: 0.32220253348350525, mean loss: 0.34800382140696395
Epoch: 29, step: 543, loss: 0.33510780334472656, mean loss: 0.34800351739899454
Epoch: 29, step: 544, loss: 0.33323755860328674, mean loss: 0.34800316931764813
Epoch: 29, step: 545, loss: 0.3198433816432953, mean loss: 0.3480025055161377
Epoch: 29, step: 546, loss: 0.3263247311115265, mean loss: 0.348001994525062
Epoch: 29, step: 547, loss: 0.3230676054954529, mean loss: 0.34800140678253344
Epoch: 29, step: 548, loss: 0.30314600467681885, mean loss: 0.3480003494955068
Epoch: 29, step: 549, loss: 0.3077124059200287, mean loss: 0.3479993998904633
Epoch: 29, step: 550, loss: 0.33230307698249817, mean loss: 0.3479990299297565
Epoch: 29, step: 551, loss: 0.28375929594039917, mean loss: 0.3479975158415603
Epoch: 29, step: 552, loss: 0.42262551188468933, mean loss: 0.34799927473279135
Epoch: 29, step: 553, loss: 0.30391639471054077, mean loss: 0.3479982357773348
Epoch: 29, step: 554, loss: 0.3254351317882538, mean loss: 0.3479977040174425
Epoch: 29, step: 555, loss: 0.31812146306037903, mean loss: 0.347996999920512
Epoch: 29, step: 556, loss: 0.31543809175491333, mean loss: 0.34799623261892676
Epoch: 29, step: 557, loss: 0.31327563524246216, mean loss: 0.3479954143930377
Epoch: 29, step: 558, loss: 0.3348446190357208, mean loss: 0.3479951044885872
Epoch: 29, step: 559, loss: 0.3644769787788391, mean loss: 0.3479954928822692
Epoch: 29, step: 560, loss: 0.34938475489616394, mean loss: 0.34799552561931507
Epoch: 29, step: 561, loss: 0.34640073776245117, mean loss: 0.3479954880400734
Epoch: 29, step: 562, loss: 0.3540617823600769, mean loss: 0.34799563098157343
Epoch: 29, step: 563, loss: 0.32067522406578064, mean loss: 0.34799498723965744
Epoch: 29, step: 564, loss: 0.3182310163974762, mean loss: 0.34799428593735915
Epoch: 29, step: 565, loss: 0.2938433885574341, mean loss: 0.34799301005739636
Epoch: 29, step: 566, loss: 0.3721067011356354, mean loss: 0.3479935782003429
Epoch: 29, step: 567, loss: 0.3204033374786377, mean loss: 0.34799292816168675
Epoch: 29, step: 568, loss: 0.2990054786205292, mean loss: 0.347991774022223
Epoch: 29, step: 569, loss: 0.3117239773273468, mean loss: 0.34799091957665224
Epoch: 29, step: 570, loss: 0.32692596316337585, mean loss: 0.34799042331174745
Epoch: 29, step: 571, loss: 0.31496521830558777, mean loss: 0.3479896452961753
Epoch: 29, step: 572, loss: 0.34296250343322754, mean loss: 0.34798952686837104
Epoch: 29, step: 573, loss: 0.3185635507106781, mean loss: 0.3479888336769421
Epoch: 29, step: 574, loss: 0.3121132254600525, mean loss: 0.3479879885706262
Epoch: 29, step: 575, loss: 0.30968984961509705, mean loss: 0.34798708641904424
Epoch: 29, step: 576, loss: 0.34413132071495056, mean loss: 0.3479869955947043
Epoch: 29, step: 577, loss: 0.34874922037124634, mean loss: 0.34798701354883765
Epoch: 29, step: 578, loss: 0.36929312348365784, mean loss: 0.3479875154004437
Epoch: 29, step: 579, loss: 0.3440071940422058, mean loss: 0.34798742164876295
Epoch: 29, step: 580, loss: 0.31757503747940063, mean loss: 0.34798670533851567
Epoch: 29, step: 581, loss: 0.3836338520050049, mean loss: 0.3479875449246164
Epoch: 29, step: 582, loss: 0.3154279887676239, mean loss: 0.34798677807763095
Epoch: 29, step: 583, loss: 0.3341228663921356, mean loss: 0.3479864515606341
Epoch: 29, step: 584, loss: 0.3633410334587097, mean loss: 0.34798681317675006
Epoch: 29, step: 585, loss: 0.33608436584472656, mean loss: 0.34798653286853726
Epoch: 29, step: 586, loss: 0.3214855492115021, mean loss: 0.34798590877265007
Epoch: 29, step: 587, loss: 0.3899191915988922, mean loss: 0.34798689627460055
Epoch: 29, step: 588, loss: 0.3218078017234802, mean loss: 0.34798627978821056
Epoch: 29, step: 589, loss: 0.2974940538406372, mean loss: 0.34798509078463247
Epoch: 29, step: 590, loss: 0.32377782464027405, mean loss: 0.34798452075929176
Epoch: 29, step: 591, loss: 0.3480631411075592, mean loss: 0.3479845226105762
Epoch: 29, step: 592, loss: 0.34485283493995667, mean loss: 0.3479844488700203
Epoch: 29, step: 593, loss: 0.3374069333076477, mean loss: 0.34798419981149514
Epoch: 29, step: 594, loss: 0.38857704401016235, mean loss: 0.3479851555894189
Epoch: 29, step: 595, loss: 0.32042545080184937, mean loss: 0.3479845066982721
Epoch: 29, step: 596, loss: 0.34360384941101074, mean loss: 0.34798440355845883
Epoch: 29, step: 597, loss: 0.33776775002479553, mean loss: 0.3479841630194577
Epoch: 29, step: 598, loss: 0.30908212065696716, mean loss: 0.347983247138531
Epoch: 29, step: 599, loss: 0.3193027079105377, mean loss: 0.34798257192101456
Epoch: 29, step: 600, loss: 0.3320195972919464, mean loss: 0.3479821961182359
Epoch: 29, step: 601, loss: 0.3016091287136078, mean loss: 0.3479811044221249
Epoch: 29, step: 602, loss: 0.3312203884124756, mean loss: 0.347980709857375
Epoch: 29, step: 603, loss: 0.33636969327926636, mean loss: 0.3479804365283595
Epoch: 29, step: 604, loss: 0.34343183040618896, mean loss: 0.3479803294544648
Epoch: 29, step: 605, loss: 0.32567837834358215, mean loss: 0.34797980448033194
Epoch: 29, step: 606, loss: 0.2993322014808655, mean loss: 0.3479786593728066
Epoch: 29, step: 607, loss: 0.3081355690956116, mean loss: 0.34797772153526124
Epoch: 29, step: 608, loss: 0.30852752923965454, mean loss: 0.3479767929677128
Epoch: 29, step: 609, loss: 0.32397913932800293, mean loss: 0.34797622813097506
Epoch: 29, step: 610, loss: 0.32979679107666016, mean loss: 0.3479758002486333
Epoch: 29, step: 611, loss: 0.3097553253173828, mean loss: 0.34797490068934755
Epoch: 29, step: 612, loss: 0.3036755919456482, mean loss: 0.3479738580828201
Epoch: 29, step: 613, loss: 0.3388502895832062, mean loss: 0.3479736433600971
Epoch: 29, step: 614, loss: 0.3617827892303467, mean loss: 0.34797396834999783
Epoch: 29, step: 615, loss: 0.3187659978866577, mean loss: 0.3479732809742456
Epoch: 29, step: 616, loss: 0.3560703992843628, mean loss: 0.34797347152606145
Epoch: 29, step: 617, loss: 0.3182183504104614, mean loss: 0.3479727713067101
Epoch: 29, step: 618, loss: 0.3243632912635803, mean loss: 0.34797221572417
Epoch: 29, step: 619, loss: 0.33109578490257263, mean loss: 0.34797181859430315
Epoch: 29, step: 620, loss: 0.3087078034877777, mean loss: 0.347970894669906
Epoch: 29, step: 621, loss: 0.3797913193702698, mean loss: 0.34797164342101666
Epoch: 29, step: 622, loss: 0.30796974897384644, mean loss: 0.34797070217782394
Epoch: 29, step: 623, loss: 0.3443794250488281, mean loss: 0.3479706176771856
Epoch: 29, step: 624, loss: 0.31302765011787415, mean loss: 0.34796979550905877
Epoch: 29, step: 625, loss: 0.32110586762428284, mean loss: 0.34796916344638207
Epoch: 29, step: 626, loss: 0.3250957727432251, mean loss: 0.3479686252869415
Epoch: 29, step: 627, loss: 0.3104165494441986, mean loss: 0.34796774179183887
Epoch: 29, step: 628, loss: 0.4226709306240082, mean loss: 0.34796949930716253
Epoch: 29, step: 629, loss: 0.32481735944747925, mean loss: 0.34796895462782645
Epoch: 29, step: 630, loss: 0.33293256163597107, mean loss: 0.3479686008886072
Epoch: 29, step: 631, loss: 0.3281823396682739, mean loss: 0.34796813541713784
Epoch: 29, step: 632, loss: 0.35600265860557556, mean loss: 0.34796832442471715
Epoch: 29, step: 633, loss: 0.3021414577960968, mean loss: 0.34796724639915544
Epoch: 29, step: 634, loss: 0.3283296823501587, mean loss: 0.347966784458386
Epoch: 29, step: 635, loss: 0.3374458849430084, mean loss: 0.3479665369776861
Epoch: 29, step: 636, loss: 0.2964951694011688, mean loss: 0.34796532625702237
Epoch: 29, step: 637, loss: 0.31282275915145874, mean loss: 0.34796449964538606
Epoch: 29, step: 638, loss: 0.33537745475769043, mean loss: 0.3479642035841162
Epoch: 29, step: 639, loss: 0.33949828147888184, mean loss: 0.3479640044609131
Epoch: 29, step: 640, loss: 0.3064277172088623, mean loss: 0.3479630275272806
Epoch: 29, step: 641, loss: 0.32530027627944946, mean loss: 0.3479624945118225
Epoch: 29, step: 642, loss: 0.37039437890052795, mean loss: 0.3479630220850107
Epoch: 29, step: 643, loss: 0.2963608205318451, mean loss: 0.34796180848666747
Epoch: 29, step: 644, loss: 0.3188810348510742, mean loss: 0.3479611245711049
Epoch: 29, step: 645, loss: 0.3548924922943115, mean loss: 0.34796128757773026
Epoch: 29, step: 646, loss: 0.36171239614486694, mean loss: 0.34796161095822004
Epoch: 29, step: 647, loss: 0.33346378803253174, mean loss: 0.3479612700255014
Epoch: 29, step: 648, loss: 0.3324844539165497, mean loss: 0.34796090607920843
Epoch: 29, step: 649, loss: 0.3174888789653778, mean loss: 0.34796018952869545
Epoch: 29, step: 650, loss: 0.31464001536369324, mean loss: 0.3479594060223544
Epoch: 29, step: 651, loss: 0.327624648809433, mean loss: 0.3479589278724952
Epoch: 29, step: 652, loss: 0.3229182958602905, mean loss: 0.34795833908291607
Epoch: 29, step: 653, loss: 0.3544427156448364, mean loss: 0.3479584915488592
Epoch: 29, step: 654, loss: 0.3698772192001343, mean loss: 0.3479590069077187
Epoch: 29, step: 655, loss: 0.331247478723526, mean loss: 0.3479586139911339
Epoch: 29, step: 656, loss: 0.3522997796535492, mean loss: 0.3479587160569572
Epoch: 29, step: 657, loss: 0.33698371052742004, mean loss: 0.3479584580279562
Epoch: 29, step: 658, loss: 0.31527042388916016, mean loss: 0.34795768953062134
Epoch: 29, step: 659, loss: 0.31888413429260254, mean loss: 0.3479570060259374
Epoch: 29, step: 660, loss: 0.3269270956516266, mean loss: 0.3479565116349278
Epoch: 29, step: 661, loss: 0.31875935196876526, mean loss: 0.3479558252566386
Epoch: 29, step: 662, loss: 0.3250623941421509, mean loss: 0.347955287081526
Epoch: 29, step: 663, loss: 0.3202517628669739, mean loss: 0.34795463584682423
Epoch: 29, step: 664, loss: 0.3381361961364746, mean loss: 0.347954405047367
Epoch: 29, step: 665, loss: 0.283927321434021, mean loss: 0.3479529000150786
Epoch: 29, step: 666, loss: 0.340239942073822, mean loss: 0.3479527187171461
Epoch: 29, step: 667, loss: 0.38015878200531006, mean loss: 0.34795347572314667
Epoch: 29, step: 668, loss: 0.3480716645717621, mean loss: 0.34795347850111935
Epoch: 29, step: 669, loss: 0.32802706956863403, mean loss: 0.3479530101513583
Epoch: 29, step: 670, loss: 0.31100142002105713, mean loss: 0.34795214166262517
Epoch: 29, step: 671, loss: 0.33552247285842896, mean loss: 0.34795184952976804
Epoch: 29, step: 672, loss: 0.33346864581108093, mean loss: 0.34795150914095235
Epoch: 29, step: 673, loss: 0.3628242015838623, mean loss: 0.3479518586754399
Epoch: 29, step: 674, loss: 0.35515138506889343, mean loss: 0.3479520278730238
Epoch: 29, step: 675, loss: 0.3426676392555237, mean loss: 0.3479519036864141
Epoch: 29, step: 676, loss: 0.3168254792690277, mean loss: 0.34795117221214866
Epoch: 29, step: 677, loss: 0.3092803359031677, mean loss: 0.3479502634647616
Epoch: 29, step: 678, loss: 0.30782005190849304, mean loss: 0.34794932044486837
Epoch: 29, step: 679, loss: 0.35439664125442505, mean loss: 0.3479494719469083
Epoch: 29, step: 680, loss: 0.31980612874031067, mean loss: 0.34794881063753014
Epoch: 29, step: 681, loss: 0.3539905548095703, mean loss: 0.34794895260247616
Epoch: 29, step: 682, loss: 0.339786171913147, mean loss: 0.34794876080331055
Epoch: 29, step: 683, loss: 0.30205410718917847, mean loss: 0.34794768245148694
Epoch: 29, step: 684, loss: 0.3154826760292053, mean loss: 0.34794691966380753
Epoch: 29, step: 685, loss: 0.3537546992301941, mean loss: 0.3479470561183812
Epoch: 29, step: 686, loss: 0.35755881667137146, mean loss: 0.3479472819427017
Epoch: 29, step: 687, loss: 0.3640480935573578, mean loss: 0.3479476602156933
Epoch: 29, step: 688, loss: 0.31539639830589294, mean loss: 0.3479468954732544
Epoch: 29, step: 689, loss: 0.3489437401294708, mean loss: 0.34794691889205476
Epoch: 29, step: 690, loss: 0.333784818649292, mean loss: 0.34794658619066066
Epoch: 29, step: 691, loss: 0.346609503030777, mean loss: 0.34794655478013725
Epoch: 29, step: 692, loss: 0.3615470826625824, mean loss: 0.34794687427385057
Epoch: 29, step: 693, loss: 0.37430498003959656, mean loss: 0.34794749344476356
Epoch: 29, step: 694, loss: 0.3278953433036804, mean loss: 0.3479470224163606
Epoch: 29, step: 695, loss: 0.3421860635280609, mean loss: 0.34794688709363936
Epoch: 29, step: 696, loss: 0.40444812178611755, mean loss: 0.34794821425486105
Epoch: 29, step: 697, loss: 0.30882441997528076, mean loss: 0.34794729529506685
Epoch: 29, step: 698, loss: 0.3736031949520111, mean loss: 0.34794789789987385
Epoch: 29, step: 699, loss: 0.35853004455566406, mean loss: 0.3479481464470989
Epoch: 29, step: 700, loss: 0.3472176492214203, mean loss: 0.3479481292900135
Epoch: 29, step: 701, loss: 0.3115746080875397, mean loss: 0.3479472750103103
Epoch: 29, step: 702, loss: 0.3457087278366089, mean loss: 0.34794722243633786
Epoch: 29, step: 703, loss: 0.35143372416496277, mean loss: 0.34794730431754334
Epoch: 29, step: 704, loss: 0.3569982647895813, mean loss: 0.34794751687620734
Epoch: 29, step: 705, loss: 0.3095034062862396, mean loss: 0.3479466140508213
Epoch: 29, step: 706, loss: 0.2903214693069458, mean loss: 0.3479452608078665
Epoch: 29, step: 707, loss: 0.29823485016822815, mean loss: 0.34794409345837746
Epoch: 29, step: 708, loss: 0.32671403884887695, mean loss: 0.347943594924748
Epoch: 29, step: 709, loss: 0.37171801924705505, mean loss: 0.3479441531932945
Epoch: 29, step: 710, loss: 0.35398027300834656, mean loss: 0.34794429492950074
Epoch: 29, step: 711, loss: 0.33680248260498047, mean loss: 0.3479440333109151
Epoch: 29, step: 712, loss: 0.32714200019836426, mean loss: 0.3479435448741565
Epoch: 29, step: 713, loss: 0.3416779935359955, mean loss: 0.347943397760953
Epoch: 29, step: 714, loss: 0.30810901522636414, mean loss: 0.34794246248395705
Epoch: 29, step: 715, loss: 0.3199937343597412, mean loss: 0.3479418062872975
Epoch: 29, step: 716, loss: 0.3115720748901367, mean loss: 0.3479409523974236
Epoch: 29, step: 717, loss: 0.33867982029914856, mean loss: 0.34794073496933287
Epoch: 29, step: 718, loss: 0.3676760494709015, mean loss: 0.34794119829400716
Epoch: 29, step: 719, loss: 0.32686206698417664, mean loss: 0.3479407034322523
Epoch: 29, step: 720, loss: 0.31371620297431946, mean loss: 0.3479398999836419
Epoch: 29, step: 721, loss: 0.36393603682518005, mean loss: 0.3479402754974416
Epoch: 29, step: 722, loss: 0.3485715985298157, mean loss: 0.347940290317579
Epoch: 29, step: 723, loss: 0.316836416721344, mean loss: 0.3479395601797012
Epoch: 29, step: 724, loss: 0.3357507586479187, mean loss: 0.3479392740643158
Epoch: 29, step: 725, loss: 0.3430253267288208, mean loss: 0.34793915871885467
Epoch: 29, step: 726, loss: 0.35997509956359863, mean loss: 0.347939441232782
Epoch: 29, step: 727, loss: 0.3081721365451813, mean loss: 0.3479385078156219
Epoch: 29, step: 728, loss: 0.31847840547561646, mean loss: 0.3479378163450823
Epoch: 29, step: 729, loss: 0.3296584486961365, mean loss: 0.34793738731237217
Epoch: 29, step: 730, loss: 0.32628193497657776, mean loss: 0.3479368790519376
Epoch: 29, step: 731, loss: 0.3581047058105469, mean loss: 0.34793711768850255
Epoch: 29, step: 732, loss: 0.3377804756164551, mean loss: 0.3479368793200341
Epoch: 29, step: 733, loss: 0.28176289796829224, mean loss: 0.3479353263047477
Epoch: 29, step: 734, loss: 0.3841157853603363, mean loss: 0.3479361753920504
Epoch: 29, step: 735, loss: 0.30380168557167053, mean loss: 0.3479351396629173
Epoch: 29, step: 736, loss: 0.3832799792289734, mean loss: 0.34793596910087204
Epoch: 29, step: 737, loss: 0.3142395317554474, mean loss: 0.3479351783645566
Epoch: 29, step: 738, loss: 0.322878360748291, mean loss: 0.3479345903833853
Epoch: 29, step: 739, loss: 0.2825400233268738, mean loss: 0.3479330558759924
Epoch: 29, step: 740, loss: 0.34222060441970825, mean loss: 0.3479329218343786
Epoch: 29, step: 741, loss: 0.3409397602081299, mean loss: 0.3479327577449885
Epoch: 29, step: 742, loss: 0.3521326780319214, mean loss: 0.3479328562907143
Epoch: 29, step: 743, loss: 0.3505055904388428, mean loss: 0.34793291665519455
Epoch: 29, step: 744, loss: 0.33690980076789856, mean loss: 0.34793265802409984
Epoch: 29, step: 745, loss: 0.34321433305740356, mean loss: 0.34793254732246764
Epoch: 29, step: 746, loss: 0.3297176957130432, mean loss: 0.3479321199745191
Epoch: 29, step: 747, loss: 0.3209553062915802, mean loss: 0.34793148707254645
Epoch: 29, step: 748, loss: 0.3287743628025055, mean loss: 0.347931037638546
Epoch: 29, step: 749, loss: 0.3124461770057678, mean loss: 0.34793020516867706
Epoch: 29, step: 750, loss: 0.32587382197380066, mean loss: 0.34792968774115
Epoch: 29, step: 751, loss: 0.3077602684497833, mean loss: 0.34792874541640356
Epoch: 29, step: 752, loss: 0.311579167842865, mean loss: 0.34792789272040847
Epoch: 29, step: 753, loss: 0.33195021748542786, mean loss: 0.3479275179215524
Epoch: 29, step: 754, loss: 0.38061970472335815, mean loss: 0.3479282847857311
Epoch: 29, step: 755, loss: 0.32218751311302185, mean loss: 0.3479276809958157
Epoch: 29, step: 756, loss: 0.32074159383773804, mean loss: 0.34792704331873087
Epoch: 29, step: 757, loss: 0.32722267508506775, mean loss: 0.34792655768828956
Epoch: 29, step: 758, loss: 0.34524598717689514, mean loss: 0.347926494815755
Epoch: 29, step: 759, loss: 0.31238847970962524, mean loss: 0.3479256612944325
Epoch: 29, step: 760, loss: 0.30465424060821533, mean loss: 0.34792464641485166
Epoch: 29, step: 761, loss: 0.2931627035140991, mean loss: 0.34792336206889496
Epoch: 29, step: 762, loss: 0.3295520842075348, mean loss: 0.34792293121268675
Epoch: 29, step: 763, loss: 0.3202761113643646, mean loss: 0.34792228283511056
Epoch: 29, step: 764, loss: 0.3554403781890869, mean loss: 0.34792245914653275
Epoch: 29, step: 765, loss: 0.32810041308403015, mean loss: 0.34792199429858794
Epoch: 29, step: 766, loss: 0.3114236295223236, mean loss: 0.3479211383934036
Epoch: 29, step: 767, loss: 0.31787675619125366, mean loss: 0.34792043385390914
Epoch: 29, step: 768, loss: 0.32884901762008667, mean loss: 0.3479199866404906
Epoch: 29, step: 769, loss: 0.2871589660644531, mean loss: 0.3479185618639447
Epoch: 29, step: 770, loss: 0.30355697870254517, mean loss: 0.3479175216598703
Epoch: 29, step: 771, loss: 0.34489354491233826, mean loss: 0.3479174507543941
Epoch: 29, step: 772, loss: 0.3370170295238495, mean loss: 0.34791719516994357
Epoch: 29, step: 773, loss: 0.3327946364879608, mean loss: 0.3479168405964692
Epoch: 29, step: 774, loss: 0.311953067779541, mean loss: 0.34791599738592743
Epoch: 29, step: 775, loss: 0.3196342885494232, mean loss: 0.34791533430544264
Epoch: 29, step: 776, loss: 0.33043450117111206, mean loss: 0.34791492446713973
Epoch: 29, step: 777, loss: 0.3065613806247711, mean loss: 0.3479139549556322
Epoch: 29, step: 778, loss: 0.30686283111572266, mean loss: 0.3479129925567613
Epoch: 29, step: 779, loss: 0.36772769689559937, mean loss: 0.347913457080025
Epoch: 29, step: 780, loss: 0.3077729642391205, mean loss: 0.3479125160740274
Epoch: 29, step: 781, loss: 0.3066328465938568, mean loss: 0.34791154838521215
Epoch: 29, step: 782, loss: 0.34353330731391907, mean loss: 0.3479114457517451
Epoch: 29, step: 783, loss: 0.36806318163871765, mean loss: 0.34791191813186434
Epoch: 29, step: 784, loss: 0.36381199955940247, mean loss: 0.347912290839523
Epoch: 29, step: 785, loss: 0.31539031863212585, mean loss: 0.34791152852242097
Epoch: 29, step: 786, loss: 0.3423202335834503, mean loss: 0.3479113974651831
Epoch: 29, step: 787, loss: 0.31031322479248047, mean loss: 0.34791051620293223
Epoch: 29, step: 788, loss: 0.37377357482910156, mean loss: 0.347911122392048
Epoch: 29, step: 789, loss: 0.3558764159679413, mean loss: 0.3479113090815332
Epoch: 29, step: 790, loss: 0.30106067657470703, mean loss: 0.3479102110284124
Epoch: 29, step: 791, loss: 0.33761072158813477, mean loss: 0.347909969641672
Epoch: 29, step: 792, loss: 0.3222352862358093, mean loss: 0.3479093679241861
Epoch: 29, step: 793, loss: 0.3450424373149872, mean loss: 0.34790930073574905
Epoch: 29, step: 794, loss: 0.3463745415210724, mean loss: 0.3479092647684829
Epoch: 29, step: 795, loss: 0.3016667068004608, mean loss: 0.3479081810939898
Epoch: 29, step: 796, loss: 0.31926730275154114, mean loss: 0.3479075099230306
Epoch: 29, step: 797, loss: 0.3701527416706085, mean loss: 0.3479080312060542
Epoch: 29, step: 798, loss: 0.3229057192802429, mean loss: 0.3479074453287976
Epoch: 29, step: 799, loss: 0.30867186188697815, mean loss: 0.3479065259459257
Epoch: 29, step: 800, loss: 0.36736440658569336, mean loss: 0.34790698187958174
Epoch: 29, step: 801, loss: 0.3212127387523651, mean loss: 0.34790635639940165
Epoch: 29, step: 802, loss: 0.3424100875854492, mean loss: 0.34790622761782725
Epoch: 29, step: 803, loss: 0.3040088713169098, mean loss: 0.3479051990949523
Epoch: 29, step: 804, loss: 0.32762259244918823, mean loss: 0.34790472388100124
Epoch: 29, step: 805, loss: 0.34943389892578125, mean loss: 0.347904759708166
Epoch: 29, step: 806, loss: 0.3475346267223358, mean loss: 0.34790475103649376
Epoch: 29, step: 807, loss: 0.34632790088653564, mean loss: 0.34790471409407625
Epoch: 29, step: 808, loss: 0.2935229241847992, mean loss: 0.3479034400683082
Epoch: 29, step: 809, loss: 0.34872967004776, mean loss: 0.3479034594243027
Epoch: 29, step: 810, loss: 0.34860095381736755, mean loss: 0.3479034757640406
Epoch: 29, step: 811, loss: 0.36884695291519165, mean loss: 0.34790396638147764
Epoch: 29, step: 812, loss: 0.33483248949050903, mean loss: 0.34790366017901586
Epoch: 29, step: 813, loss: 0.3181515038013458, mean loss: 0.3479029632439871
Epoch: 29, step: 814, loss: 0.30040740966796875, mean loss: 0.3479018507014471
Epoch: 29, step: 815, loss: 0.2939286231994629, mean loss: 0.34790058645457406
Epoch: 29, step: 816, loss: 0.31408563256263733, mean loss: 0.34789979440543506
Epoch: 29, step: 817, loss: 0.31832966208457947, mean loss: 0.34789910179915967
Epoch: 29, step: 818, loss: 0.3728944659233093, mean loss: 0.34789968723923753
Epoch: 29, step: 819, loss: 0.3382607698440552, mean loss: 0.347899461482319
Epoch: 29, step: 820, loss: 0.30764299631118774, mean loss: 0.3478985186417173
Epoch: 29, step: 821, loss: 0.3582167327404022, mean loss: 0.3478987602973943
Epoch: 29, step: 822, loss: 0.34091535210609436, mean loss: 0.34789859674770485
Epoch: 29, step: 823, loss: 0.33231469988822937, mean loss: 0.34789823178524915
Epoch: 29, step: 824, loss: 0.30899497866630554, mean loss: 0.34789732072337426
Epoch: 29, step: 825, loss: 0.3149874806404114, mean loss: 0.3478965500372218
Epoch: 29, step: 826, loss: 0.351080983877182, mean loss: 0.3478966246088875
Epoch: 29, step: 827, loss: 0.29931744933128357, mean loss: 0.34789548702984857
Epoch: 29, step: 828, loss: 0.2722938358783722, mean loss: 0.34789371670667446
Epoch: 29, step: 829, loss: 0.32162997126579285, mean loss: 0.3478931017170842
Epoch: 29, step: 830, loss: 0.3042232096195221, mean loss: 0.34789207917061415
Epoch: 29, step: 831, loss: 0.4278406798839569, mean loss: 0.34789395115246097
Epoch: 29, step: 832, loss: 0.3497115671634674, mean loss: 0.3478939937106106
Epoch: 29, step: 833, loss: 0.32328954339027405, mean loss: 0.3478934176288892
Epoch: 29, step: 834, loss: 0.3202327489852905, mean loss: 0.34789277000488966
Epoch: 29, step: 835, loss: 0.35081779956817627, mean loss: 0.3478928384875073
Epoch: 29, step: 836, loss: 0.3231808841228485, mean loss: 0.34789225992935485
Epoch: 29, step: 837, loss: 0.30524665117263794, mean loss: 0.3478912615304984
Epoch: 29, step: 838, loss: 0.3634065091609955, mean loss: 0.34789162475764646
Epoch: 29, step: 839, loss: 0.34326842427253723, mean loss: 0.34789151652652733
Epoch: 29, step: 840, loss: 0.32381322979927063, mean loss: 0.3478909528566365
Epoch: 29, step: 841, loss: 0.3184320628643036, mean loss: 0.347890263243593
Epoch: 29, step: 842, loss: 0.3426693081855774, mean loss: 0.3478901410273647
Epoch: 29, step: 843, loss: 0.31421324610710144, mean loss: 0.34788935271053606
Epoch: 29, step: 844, loss: 0.31629320979118347, mean loss: 0.34788861311776154
Epoch: 29, step: 845, loss: 0.32599228620529175, mean loss: 0.3478881005872875
Epoch: 29, step: 846, loss: 0.3174719512462616, mean loss: 0.3478873886487686
Epoch: 29, step: 847, loss: 0.30562472343444824, mean loss: 0.3478863994467928
Epoch: 29, step: 848, loss: 0.3064422905445099, mean loss: 0.34788542942668976
Epoch: 29, step: 849, loss: 0.3452643156051636, mean loss: 0.3478853680796453
Epoch: 29, step: 850, loss: 0.36553868651390076, mean loss: 0.3478857812450544
Epoch: 29, step: 851, loss: 0.32388269901275635, mean loss: 0.3478852194803514
Epoch: 29, step: 852, loss: 0.3229422867298126, mean loss: 0.3478846357331832
Epoch: 29, step: 853, loss: 0.35765305161476135, mean loss: 0.34788486434109056
Epoch: 29, step: 854, loss: 0.31294748187065125, mean loss: 0.34788404672899464
Epoch: 29, step: 855, loss: 0.31989243626594543, mean loss: 0.3478833916786702
Epoch: 29, step: 856, loss: 0.3695928454399109, mean loss: 0.34788389970417183
Epoch: 29, step: 857, loss: 0.30232933163642883, mean loss: 0.34788283370126855
Epoch: 29, step: 858, loss: 0.3141230046749115, mean loss: 0.3478820437204794
Epoch: 29, step: 859, loss: 0.31348586082458496, mean loss: 0.3478812388678283
Epoch: 29, step: 860, loss: 0.3699885606765747, mean loss: 0.34788175615546685
Epoch: 29, step: 861, loss: 0.3564313054084778, mean loss: 0.3478819562010762
Epoch: 29, step: 862, loss: 0.33073756098747253, mean loss: 0.3478815550593739
Epoch: 29, step: 863, loss: 0.3688608407974243, mean loss: 0.3478820459177206
Epoch: 29, step: 864, loss: 0.33168575167655945, mean loss: 0.34788166697725964
Epoch: 29, step: 865, loss: 0.3109367787837982, mean loss: 0.3478808026075953
Epoch: 29, step: 866, loss: 0.31607669591903687, mean loss: 0.347880058530046
Epoch: 29, step: 867, loss: 0.3568190932273865, mean loss: 0.3478802676596244
Epoch: 29, step: 868, loss: 0.3296171724796295, mean loss: 0.347879840402748
Epoch: 29, step: 869, loss: 0.35111480951309204, mean loss: 0.3478799160816211
Epoch: 29, step: 870, loss: 0.311682790517807, mean loss: 0.3478790693058108
Epoch: 29, step: 871, loss: 0.3607684075832367, mean loss: 0.3478793708249059
Epoch: 29, step: 872, loss: 0.37244459986686707, mean loss: 0.34787994546358847
Epoch: 29, step: 873, loss: 0.35617464780807495, mean loss: 0.3478801394917135
Epoch: 29, step: 874, loss: 0.30252957344055176, mean loss: 0.3478790786845733
Epoch: 29, step: 875, loss: 0.3270999491214752, mean loss: 0.3478785926458017
Epoch: 29, step: 876, loss: 0.2955766022205353, mean loss: 0.34787736929327845
Epoch: 29, step: 877, loss: 0.3341591954231262, mean loss: 0.34787704843034467
Epoch: 29, step: 878, loss: 0.3368323743343353, mean loss: 0.34787679010560846
Epoch: 29, step: 879, loss: 0.3354252278804779, mean loss: 0.3478764988818685
Epoch: 29, step: 880, loss: 0.3218827545642853, mean loss: 0.34787589094061167
Epoch: 29, step: 881, loss: 0.3365169167518616, mean loss: 0.3478756252833267
Epoch: 29, step: 882, loss: 0.33170992136001587, mean loss: 0.34787524721779844
Epoch: 29, step: 883, loss: 0.28283989429473877, mean loss: 0.34787372627876845
Epoch: 29, step: 884, loss: 0.30755484104156494, mean loss: 0.3478727833895648
Epoch: 29, step: 885, loss: 0.38105860352516174, mean loss: 0.3478735594482182
Epoch: 29, step: 886, loss: 0.3089212477207184, mean loss: 0.3478726485600268
Epoch: 29, step: 887, loss: 0.3436570167541504, mean loss: 0.34787254998103967
Epoch: 29, step: 888, loss: 0.3275569975376129, mean loss: 0.3478720749301232
Epoch: 29, step: 889, loss: 0.3142809271812439, mean loss: 0.3478712894662559
Epoch: 29, step: 890, loss: 0.3096672594547272, mean loss: 0.34787039615996806
Epoch: 29, step: 891, loss: 0.29899075627326965, mean loss: 0.3478692532578009
Epoch: 29, step: 892, loss: 0.33029904961586, mean loss: 0.3478688424414703
Epoch: 29, step: 893, loss: 0.32705673575401306, mean loss: 0.34786835583621695
Epoch: 29, step: 894, loss: 0.34273508191108704, mean loss: 0.34786823581858994
Epoch: 29, step: 895, loss: 0.3409692049026489, mean loss: 0.34786807452075685
Epoch: 29, step: 896, loss: 0.30494239926338196, mean loss: 0.3478670709513262
Epoch: 29, step: 897, loss: 0.3764534890651703, mean loss: 0.34786773926427594
Epoch: 29, step: 898, loss: 0.3874269127845764, mean loss: 0.3478686640842297
Epoch: 29, step: 899, loss: 0.3356776535511017, mean loss: 0.34786837908772383
Epoch: 29, step: 900, loss: 0.3118712902069092, mean loss: 0.3478675375820343
Epoch: 29, step: 901, loss: 0.33278897404670715, mean loss: 0.34786718509796455
Epoch: 29, step: 902, loss: 0.31337466835975647, mean loss: 0.3478663788024285
Epoch: 29, step: 903, loss: 0.2910747230052948, mean loss: 0.3478650512742425
Epoch: 29, step: 904, loss: 0.3590361475944519, mean loss: 0.3478653123970849
Epoch: 29, step: 905, loss: 0.3002381920814514, mean loss: 0.34786419914571015
Epoch: 29, step: 906, loss: 0.32033368945121765, mean loss: 0.3478635556539098
Epoch: 29, step: 907, loss: 0.35496529936790466, mean loss: 0.3478637216445538
Epoch: 29, step: 908, loss: 0.36109983921051025, mean loss: 0.3478640310080589
Epoch: 29, step: 909, loss: 0.3042924404144287, mean loss: 0.3478630126471326
Epoch: 29, step: 910, loss: 0.35107898712158203, mean loss: 0.34786308780955283
Epoch: 29, step: 911, loss: 0.31400737166404724, mean loss: 0.3478622965663037
Epoch: 29, step: 912, loss: 0.3238980770111084, mean loss: 0.3478617365106923
Epoch: 29, step: 913, loss: 0.3455204665660858, mean loss: 0.34786168179533955
Epoch: 29, step: 914, loss: 0.3415496349334717, mean loss: 0.34786153428659095
Epoch: 29, step: 915, loss: 0.3295978605747223, mean loss: 0.3478611074854666
Epoch: 29, step: 916, loss: 0.35125240683555603, mean loss: 0.34786118673439403
Epoch: 29, step: 917, loss: 0.3436736464500427, mean loss: 0.34786108888094996
Epoch: 29, step: 918, loss: 0.34645795822143555, mean loss: 0.34786105609369306
Epoch: 29, step: 919, loss: 0.3597586452960968, mean loss: 0.34786133410073117
Epoch: 29, step: 920, loss: 0.31095656752586365, mean loss: 0.3478604717793868
Epoch: 29, step: 921, loss: 0.32766422629356384, mean loss: 0.347859999882441
Epoch: 29, step: 922, loss: 0.32933509349823, mean loss: 0.3478595670474125
Epoch: 29, step: 923, loss: 0.29349255561828613, mean loss: 0.34785829679013613
Epoch: 29, step: 924, loss: 0.3211140036582947, mean loss: 0.34785767193807354
Epoch: 29, step: 925, loss: 0.3479548692703247, mean loss: 0.34785767420893315
Epoch: 29, step: 926, loss: 0.34468546509742737, mean loss: 0.3478576000970926
Epoch: 29, step: 927, loss: 0.32782095670700073, mean loss: 0.3478571319949669
Epoch: 29, step: 928, loss: 0.38420161604881287, mean loss: 0.3478579810659645
Epoch: 29, step: 929, loss: 0.3512958288192749, mean loss: 0.3478580613782514
Epoch: 29, step: 930, loss: 0.3477077782154083, mean loss: 0.34785805786753676
Epoch: 29, step: 931, loss: 0.33964893221855164, mean loss: 0.34785786610137975
Epoch: 29, step: 932, loss: 0.39397111535072327, mean loss: 0.3478589432872343
Epoch: 29, step: 933, loss: 0.3203921318054199, mean loss: 0.34785830168920856
Epoch: 29, step: 934, loss: 0.39336085319519043, mean loss: 0.3478593645597677
Epoch: 29, step: 935, loss: 0.33524882793426514, mean loss: 0.3478590700036473
Epoch: 29, step: 936, loss: 0.3372288942337036, mean loss: 0.34785882171047067
Epoch: 29, step: 937, loss: 0.32168975472450256, mean loss: 0.34785821048360593
Epoch: 29, step: 938, loss: 0.3195689618587494, mean loss: 0.347857549751418
Epoch: 29, step: 939, loss: 0.3239425718784332, mean loss: 0.3478569911990574
Epoch: 29, step: 940, loss: 0.3232797682285309, mean loss: 0.3478564171928689
Epoch: 29, step: 941, loss: 0.32710856199264526, mean loss: 0.34785593263368353
Epoch: 29, step: 942, loss: 0.3305092751979828, mean loss: 0.3478555275177902
Epoch: 29, step: 943, loss: 0.3190707266330719, mean loss: 0.34785485528983867
Epoch: 29, step: 944, loss: 0.3146694004535675, mean loss: 0.34785408030899195
Epoch: 29, step: 945, loss: 0.3761889934539795, mean loss: 0.3478547419995516
Epoch: 29, step: 946, loss: 0.32441750168800354, mean loss: 0.34785419469459133
Epoch: 29, step: 947, loss: 0.3466127812862396, mean loss: 0.34785416570586053
Epoch: 29, step: 948, loss: 0.3528643548488617, mean loss: 0.347854282698018
Epoch: 29, step: 949, loss: 0.35608839988708496, mean loss: 0.3478544749671346
Epoch: 29, step: 950, loss: 0.35496073961257935, mean loss: 0.3478546408966801
Epoch: 29, step: 951, loss: 0.34076276421546936, mean loss: 0.3478544753069565
Epoch: 29, step: 952, loss: 0.3468286395072937, mean loss: 0.34785445135505944
Epoch: 29, step: 953, loss: 0.33077695965766907, mean loss: 0.34785405262772584
Epoch: 29, step: 954, loss: 0.37745237350463867, mean loss: 0.3478547436767529
Epoch: 29, step: 955, loss: 0.3229959309101105, mean loss: 0.34785416329729907
Epoch: 29, step: 956, loss: 0.31369754672050476, mean loss: 0.34785336586035615
Epoch: 29, step: 957, loss: 0.31058672070503235, mean loss: 0.3478524958354891
Epoch: 29, step: 958, loss: 0.3236923813819885, mean loss: 0.347851931808071
Epoch: 29, step: 959, loss: 0.31848621368408203, mean loss: 0.34785124626978253
Epoch: 29, step: 960, loss: 0.3068021237850189, mean loss: 0.34785028800654083
Epoch: 29, step: 961, loss: 0.336607962846756, mean loss: 0.34785002556839806
Epoch: 29, step: 962, loss: 0.3175835609436035, mean loss: 0.3478493190517981
Epoch: 29, step: 963, loss: 0.33293992280960083, mean loss: 0.3478489710266757
Epoch: 29, step: 964, loss: 0.3580096662044525, mean loss: 0.3478492081988981
Epoch: 29, step: 965, loss: 0.34773755073547363, mean loss: 0.3478492055926364
Epoch: 29, step: 966, loss: 0.33977505564689636, mean loss: 0.3478490171336128
Epoch: 29, step: 967, loss: 0.3165110647678375, mean loss: 0.34784828569041504
Epoch: 29, step: 968, loss: 0.3269553780555725, mean loss: 0.3478477980510724
Epoch: 29, step: 969, loss: 0.3493782579898834, mean loss: 0.3478478337710915
Epoch: 29, step: 970, loss: 0.3318237066268921, mean loss: 0.34784745978628173
Epoch: 29, step: 971, loss: 0.2916335165500641, mean loss: 0.347846147847726
Epoch: 29, step: 972, loss: 0.33255651593208313, mean loss: 0.34784579102185104
Epoch: 29, step: 973, loss: 0.32660001516342163, mean loss: 0.3478452952044448
Epoch: 29, step: 974, loss: 0.33251622319221497, mean loss: 0.34784493747482326
Epoch: 29, step: 975, loss: 0.352321982383728, mean loss: 0.3478450419517417
Epoch: 29, step: 976, loss: 0.32153403759002686, mean loss: 0.34784442796895493
Epoch: 29, step: 977, loss: 0.3320111930370331, mean loss: 0.3478440584997121
Epoch: 29, step: 978, loss: 0.32850900292396545, mean loss: 0.3478436073258567
Epoch: 29, step: 979, loss: 0.3255854845046997, mean loss: 0.34784308795580765
Epoch: 29, step: 980, loss: 0.29796263575553894, mean loss: 0.34784192407471004
Epoch: 29, step: 981, loss: 0.34992197155952454, mean loss: 0.34784197260818067
Epoch: 29, step: 982, loss: 0.30505284667015076, mean loss: 0.3478409742385048
Epoch: 29, step: 983, loss: 0.3101467192173004, mean loss: 0.3478400947645192
Epoch: 29, step: 984, loss: 0.3089398443698883, mean loss: 0.34783918717369317
Epoch: 29, step: 985, loss: 0.30518779158592224, mean loss: 0.34783819208723926
Epoch: 29, step: 986, loss: 0.35024431347846985, mean loss: 0.3478382482223999
Epoch: 29, step: 987, loss: 0.3236561417579651, mean loss: 0.34783768406351445
Epoch: 29, step: 988, loss: 0.3617427349090576, mean loss: 0.34783800845522905
Epoch: 29, step: 989, loss: 0.3384762406349182, mean loss: 0.3478377900591151
Epoch: 29, step: 990, loss: 0.33172813057899475, mean loss: 0.34783741425349585
Epoch: 29, step: 991, loss: 0.33563515543937683, mean loss: 0.34783712960623414
Epoch: 29, step: 992, loss: 0.3360764980316162, mean loss: 0.3478368552673978
Epoch: 29, step: 993, loss: 0.33987754583358765, mean loss: 0.34783666960587617
Epoch: 29, step: 994, loss: 0.31151115894317627, mean loss: 0.3478358222845946
Epoch: 29, step: 995, loss: 0.32585763931274414, mean loss: 0.3478353096380427
Epoch: 29, step: 996, loss: 0.3091363310813904, mean loss: 0.347834406995854
Epoch: 29, step: 997, loss: 0.30478963255882263, mean loss: 0.34783340301268384
Epoch: 29, step: 998, loss: 0.32429832220077515, mean loss: 0.3478328540895162
Epoch: 29, step: 999, loss: 0.37711480259895325, mean loss: 0.3478335370344856
Epoch: 29, step: 1000, loss: 0.35559576749801636, mean loss: 0.34783371806931696
Epoch: 29, step: 1001, loss: 0.303732693195343, mean loss: 0.34783268954595126
Epoch: 29, step: 1002, loss: 0.3451155424118042, mean loss: 0.347832626178169
Epoch: 29, step: 1003, loss: 0.30245769023895264, mean loss: 0.34783156799402865
Epoch: 29, step: 1004, loss: 0.3437318801879883, mean loss: 0.34783147238786727
Epoch: 29, step: 1005, loss: 0.3183036148548126, mean loss: 0.34783078380390353
Epoch: 29, step: 1006, loss: 0.34026944637298584, mean loss: 0.34783060747907946
Epoch: 29, step: 1007, loss: 0.372667521238327, mean loss: 0.34783118664412377
Epoch: 29, step: 1008, loss: 0.31002146005630493, mean loss: 0.3478303049902451
Epoch: 29, step: 1009, loss: 0.2841627895832062, mean loss: 0.3478288204144999
Epoch: 29, step: 1010, loss: 0.35906127095222473, mean loss: 0.34782908232254983
Epoch: 29, step: 1011, loss: 0.3224913477897644, mean loss: 0.3478284915341117
Epoch: 29, step: 1012, loss: 0.35542839765548706, mean loss: 0.3478286687335363
Epoch: 29, step: 1013, loss: 0.3469303250312805, mean loss: 0.3478286477882413
Epoch: 29, step: 1014, loss: 0.39165398478507996, mean loss: 0.34782966957222855
Epoch: 29, step: 1015, loss: 0.3426465690135956, mean loss: 0.3478295487314993
Epoch: 29, step: 1016, loss: 0.32747623324394226, mean loss: 0.3478290742178144
Epoch: 29, step: 1017, loss: 0.3078158497810364, mean loss: 0.347828141378153
Epoch: 29, step: 1018, loss: 0.36664077639579773, mean loss: 0.34782857995222966
Epoch: 29, step: 1019, loss: 0.34996920824050903, mean loss: 0.34782862985497787
Epoch: 29, step: 1020, loss: 0.35116732120513916, mean loss: 0.34782870768539376
Epoch: 29, step: 1021, loss: 0.33683034777641296, mean loss: 0.34782845130141526
Epoch: 29, step: 1022, loss: 0.3085053265094757, mean loss: 0.34782753465709276
Epoch: 29, step: 1023, loss: 0.35249796509742737, mean loss: 0.34782764352493517
Epoch: 29, step: 1024, loss: 0.3204086720943451, mean loss: 0.34782700440296993
Epoch: 29, step: 1025, loss: 0.3292204737663269, mean loss: 0.3478265707045261
Epoch: 29, step: 1026, loss: 0.31006407737731934, mean loss: 0.34782569052147766
Epoch: 29, step: 1027, loss: 0.313586950302124, mean loss: 0.34782489249005355
Epoch: 29, step: 1028, loss: 0.3450201153755188, mean loss: 0.34782482711825274
Epoch: 29, step: 1029, loss: 0.30624762177467346, mean loss: 0.3478238580881557
Epoch: 29, step: 1030, loss: 0.30023127794265747, mean loss: 0.347822748884992
Epoch: 29, step: 1031, loss: 0.33022141456604004, mean loss: 0.34782233867397494
Epoch: 29, step: 1032, loss: 0.32026252150535583, mean loss: 0.3478216963887395
Epoch: 29, step: 1033, loss: 0.3093200623989105, mean loss: 0.34782079912390634
Epoch: 29, step: 1034, loss: 0.3518492579460144, mean loss: 0.34782089300330377
Epoch: 29, step: 1035, loss: 0.33216914534568787, mean loss: 0.34782052826272636
Epoch: 29, step: 1036, loss: 0.340501993894577, mean loss: 0.3478203577191995
Epoch: 29, step: 1037, loss: 0.349062979221344, mean loss: 0.34782038667528614
Epoch: 29, step: 1038, loss: 0.3280327022075653, mean loss: 0.34781992558512026
Epoch: 29, step: 1039, loss: 0.3278738558292389, mean loss: 0.3478194608151101
Epoch: 29, step: 1040, loss: 0.3164809048175812, mean loss: 0.34781873060200114
Epoch: 29, step: 1041, loss: 0.28903234004974365, mean loss: 0.34781736086458204
Epoch: 29, step: 1042, loss: 0.34324780106544495, mean loss: 0.3478172543951909
Epoch: 29, step: 1043, loss: 0.29893365502357483, mean loss: 0.34781611544832763
Epoch: 29, step: 1044, loss: 0.35219237208366394, mean loss: 0.347816217409061
Epoch: 29, step: 1045, loss: 0.3682354688644409, mean loss: 0.34781669313832464
Epoch: 29, step: 1046, loss: 0.33139514923095703, mean loss: 0.34781631055686696
Epoch: 29, step: 1047, loss: 0.3460182845592499, mean loss: 0.3478162686682732
Epoch: 29, step: 1048, loss: 0.3757399022579193, mean loss: 0.3478169191897313
Epoch: 29, step: 1049, loss: 0.3103450536727905, mean loss: 0.34781604624872775
Epoch: 29, step: 1050, loss: 0.30964720249176025, mean loss: 0.34781515709169936
Epoch: 29, step: 1051, loss: 0.30789312720298767, mean loss: 0.3478142271152297
Epoch: 29, step: 1052, loss: 0.33248984813690186, mean loss: 0.3478138701449071
Epoch: 29, step: 1053, loss: 0.3325132131576538, mean loss: 0.3478135137354734
Epoch: 29, step: 1054, loss: 0.34682178497314453, mean loss: 0.34781349063494554
Epoch: 29, step: 1055, loss: 0.3538481295108795, mean loss: 0.3478136311976698
Epoch: 29, step: 1056, loss: 0.2986231744289398, mean loss: 0.34781248544832155
Epoch: 29, step: 1057, loss: 0.3084106147289276, mean loss: 0.347811567717136
Epoch: 29, step: 1058, loss: 0.31659117341041565, mean loss: 0.34781084056226685
Epoch: 29, step: 1059, loss: 0.33200395107269287, mean loss: 0.3478104724122415
Epoch: 29, step: 1060, loss: 0.2975510060787201, mean loss: 0.34780930187246617
Epoch: 29, step: 1061, loss: 0.32802262902259827, mean loss: 0.34780884105284604
Epoch: 29, step: 1062, loss: 0.3417421281337738, mean loss: 0.347808699766069
Epoch: 29, step: 1063, loss: 0.3249737620353699, mean loss: 0.34780816797897696
Epoch: 29, step: 1064, loss: 0.3407739996910095, mean loss: 0.3478080041689053
Epoch: 29, step: 1065, loss: 0.32792335748672485, mean loss: 0.34780754111067136
Epoch: 29, step: 1066, loss: 0.34002578258514404, mean loss: 0.3478073598993325
Epoch: 29, step: 1067, loss: 0.3639448285102844, mean loss: 0.3478077356786872
Epoch: 29, step: 1068, loss: 0.31479451060295105, mean loss: 0.3478069669460041
Epoch: 29, step: 1069, loss: 0.3376687169075012, mean loss: 0.3478067308762878
Epoch: 29, step: 1070, loss: 0.37057632207870483, mean loss: 0.3478072610551408
Epoch: 29, step: 1071, loss: 0.32082512974739075, mean loss: 0.34780663280396945
Epoch: 29, step: 1072, loss: 0.30505117774009705, mean loss: 0.34780563731035924
Epoch: 29, step: 1073, loss: 0.30840933322906494, mean loss: 0.34780472005066004
Epoch: 29, step: 1074, loss: 0.3183031380176544, mean loss: 0.3478040331846492
Epoch: 29, step: 1075, loss: 0.3576827943325043, mean loss: 0.34780426318001956
Epoch: 29, step: 1076, loss: 0.31713855266571045, mean loss: 0.347803549243612
Epoch: 29, step: 1077, loss: 0.3443595767021179, mean loss: 0.34780346906545534
Epoch: 29, step: 1078, loss: 0.3154467046260834, mean loss: 0.3478027157942543
Epoch: 29, step: 1079, loss: 0.3257681131362915, mean loss: 0.3478022028367476
Epoch: 29, step: 1080, loss: 0.3371301591396332, mean loss: 0.3478019544012494
Epoch: 29, step: 1081, loss: 0.3997802138328552, mean loss: 0.3478031643798199
Epoch: 29, step: 1082, loss: 0.3162789046764374, mean loss: 0.34780243055781046
Epoch: 29, step: 1083, loss: 0.34246936440467834, mean loss: 0.3478023064175369
Epoch: 29, step: 1084, loss: 0.32452109456062317, mean loss: 0.347801764502501
Epoch: 29, step: 1085, loss: 0.3318355679512024, mean loss: 0.34780139286718253
Epoch: 29, step: 1086, loss: 0.3250863552093506, mean loss: 0.3478008641555549
Epoch: 29, step: 1087, loss: 0.38272836804389954, mean loss: 0.3478016771036949
Epoch: 29, step: 1088, loss: 0.30880701541900635, mean loss: 0.34780076951236044
Epoch: 29, step: 1089, loss: 0.33963242173194885, mean loss: 0.3478005794004631
Epoch: 29, step: 1090, loss: 0.35352304577827454, mean loss: 0.3478007125832866
Epoch: 29, step: 1091, loss: 0.35086479783058167, mean loss: 0.3478007838941516
Epoch: 29, step: 1092, loss: 0.37583357095718384, mean loss: 0.34780143628976384
Epoch: 29, step: 1093, loss: 0.3152180016040802, mean loss: 0.34780067800643394
Epoch: 29, step: 1094, loss: 0.35341334342956543, mean loss: 0.3478008086216261
Epoch: 29, step: 1095, loss: 0.3177792429924011, mean loss: 0.34780010999075883
Epoch: 29, step: 1096, loss: 0.3090481460094452, mean loss: 0.3477992082160635
Epoch: 29, step: 1097, loss: 0.3520611822605133, mean loss: 0.34779930739170567
Epoch: 29, step: 1098, loss: 0.35032230615615845, mean loss: 0.3477993661002284
Epoch: 29, step: 1099, loss: 0.362949401140213, mean loss: 0.34779971862338177
Epoch: 29, step: 1100, loss: 0.3785965144634247, mean loss: 0.3478004352112274
Epoch: 29, step: 1101, loss: 0.3387756645679474, mean loss: 0.3478002252254057
Epoch: 29, step: 1102, loss: 0.2818756401538849, mean loss: 0.3477986913464166
Epoch: 29, step: 1103, loss: 0.2999831736087799, mean loss: 0.34779757884018725
Epoch: 29, step: 1104, loss: 0.3598478138446808, mean loss: 0.34779785920209144
Epoch: 29, step: 1105, loss: 0.32130667567253113, mean loss: 0.3477972428700564
Epoch: 29, step: 1106, loss: 0.3338630199432373, mean loss: 0.3477969186901963
Epoch: 29, step: 1107, loss: 0.2916678488254547, mean loss: 0.3477956128771062
Epoch: 29, step: 1108, loss: 0.3441380560398102, mean loss: 0.34779552778796263
Epoch: 29, step: 1109, loss: 0.38215890526771545, mean loss: 0.3477963271965487
Epoch: 29, step: 1110, loss: 0.3383884131908417, mean loss: 0.34779610834168545
Epoch: 29, step: 1111, loss: 0.29884031414985657, mean loss: 0.34779496951703226
Epoch: 29, step: 1112, loss: 0.3337218761444092, mean loss: 0.34779464215204653
Epoch: 29, step: 1113, loss: 0.34535297751426697, mean loss: 0.3477945853559396
Epoch: 29, step: 1114, loss: 0.29890966415405273, mean loss: 0.34779344825931
Epoch: 29, step: 1115, loss: 0.35040271282196045, mean loss: 0.3477935089511728
Epoch: 29, step: 1116, loss: 0.31806257367134094, mean loss: 0.34779281742149865
Epoch: 29, step: 1117, loss: 0.3540152311325073, mean loss: 0.3477929621489888
Epoch: 29, step: 1118, loss: 0.3209456503391266, mean loss: 0.3477923377202922
Epoch: 29, step: 1119, loss: 0.2922213673591614, mean loss: 0.3477910452519147
Epoch: 29, step: 1120, loss: 0.3084789514541626, mean loss: 0.3477901309533869
Epoch: 29, step: 1121, loss: 0.33529239892959595, mean loss: 0.3477898402949371
Epoch: 29, step: 1122, loss: 0.3213007152080536, mean loss: 0.34778922425444575
Epoch: 29, step: 1123, loss: 0.33391112089157104, mean loss: 0.3477889015078559
Epoch: 29, step: 1124, loss: 0.31607377529144287, mean loss: 0.3477881639639333
Epoch: 29, step: 1125, loss: 0.3126470148563385, mean loss: 0.34778734676591677
Epoch: 29, step: 1126, loss: 0.3081148862838745, mean loss: 0.34778642421492073
Epoch: 29, step: 1127, loss: 0.3080790340900421, mean loss: 0.34778550087313564
Epoch: 29, step: 1128, loss: 0.3129110634326935, mean loss: 0.347784689934002
Epoch: 29, step: 1129, loss: 0.3068614900112152, mean loss: 0.34778373836445536
Epoch: 29, step: 1130, loss: 0.3802686333656311, mean loss: 0.34778449370416753
Epoch: 29, step: 1131, loss: 0.3022922873497009, mean loss: 0.3477834359426731
Epoch: 29, step: 1132, loss: 0.376273512840271, mean loss: 0.34778409836395463
Epoch: 29, step: 1133, loss: 0.30897343158721924, mean loss: 0.3477831960001607
Epoch: 29, step: 1134, loss: 0.31178438663482666, mean loss: 0.34778235903265553
Epoch: 29, step: 1135, loss: 0.3904814124107361, mean loss: 0.3477833517568576
Epoch: 29, step: 1136, loss: 0.31296098232269287, mean loss: 0.3477825421790687
Epoch: 29, step: 1137, loss: 0.314889520406723, mean loss: 0.3477817774740477
Epoch: 29, step: 1138, loss: 0.34148073196411133, mean loss: 0.347781630989205
Epoch: 29, step: 1139, loss: 0.36718741059303284, mean loss: 0.347782082118543
Epoch: 29, step: 1140, loss: 0.35943686962127686, mean loss: 0.3477823530529992
Epoch: 29, step: 1141, loss: 0.32591426372528076, mean loss: 0.3477818447055789
Epoch: 29, step: 1142, loss: 0.2933351695537567, mean loss: 0.34778057906306853
Epoch: 29, step: 1143, loss: 0.3903374969959259, mean loss: 0.3477815682987248
Epoch: 29, step: 1144, loss: 0.3209473788738251, mean loss: 0.34778094455242825
Epoch: 29, step: 1145, loss: 0.3412173092365265, mean loss: 0.3477807919878028
Epoch: 29, step: 1146, loss: 0.29793936014175415, mean loss: 0.34777963350439056
Epoch: 29, step: 1147, loss: 0.3898700475692749, mean loss: 0.3477806118052009
Epoch: 29, step: 1148, loss: 0.38361209630966187, mean loss: 0.34778144461134863
Epoch: 29, step: 1149, loss: 0.3046148121356964, mean loss: 0.3477804413428023
Epoch: 29, step: 1150, loss: 0.3221336603164673, mean loss: 0.34777984528030603
Epoch: 29, step: 1151, loss: 0.3218933641910553, mean loss: 0.3477792436608701
Epoch: 29, step: 1152, loss: 0.3456627130508423, mean loss: 0.34777919447240163
Epoch: 29, step: 1153, loss: 0.3231608271598816, mean loss: 0.3477786223513858
Epoch: 29, step: 1154, loss: 0.32463642954826355, mean loss: 0.3477780845485738
Epoch: 29, step: 1155, loss: 0.3286668062210083, mean loss: 0.3477776404307469
Epoch: 29, step: 1156, loss: 0.32682520151138306, mean loss: 0.34777715353838706
Epoch: 29, step: 1157, loss: 0.3052673935890198, mean loss: 0.3477761657203839
Epoch: 29, step: 1158, loss: 0.33705058693885803, mean loss: 0.34777591649118017
Epoch: 29, step: 1159, loss: 0.3069865107536316, mean loss: 0.3477749686938538
Epoch: 29, step: 1160, loss: 0.41146016120910645, mean loss: 0.3477764484715455
Epoch: 29, step: 1161, loss: 0.3262841999530792, mean loss: 0.34777594909312365
Epoch: 29, step: 1162, loss: 0.29393282532691956, mean loss: 0.3477746980621107
Epoch: 29, step: 1163, loss: 0.34503623843193054, mean loss: 0.34777463443618994
Epoch: 29, step: 1164, loss: 0.3219517767429352, mean loss: 0.3477740344766701
Epoch: 29, step: 1165, loss: 0.4212556481361389, mean loss: 0.34777574168390163
Epoch: 29, step: 1166, loss: 0.31222325563430786, mean loss: 0.3477749157078765
Epoch: 29, step: 1167, loss: 0.31185856461524963, mean loss: 0.34777408129771265
Epoch: 29, step: 1168, loss: 0.29850730299949646, mean loss: 0.3477729367564582
Epoch: 29, step: 1169, loss: 0.333257794380188, mean loss: 0.347772599555734
Epoch: 29, step: 1170, loss: 0.37053611874580383, mean loss: 0.34777312836190377
Epoch: 29, step: 1171, loss: 0.34457412362098694, mean loss: 0.3477730540493982
Epoch: 29, step: 1172, loss: 0.40727877616882324, mean loss: 0.347774436328246
Epoch: 29, step: 1173, loss: 0.3684171438217163, mean loss: 0.34777491583364656
Epoch: 29, step: 1174, loss: 0.3230748474597931, mean loss: 0.3477743420939338
Epoch: 29, step: 1175, loss: 0.32411879301071167, mean loss: 0.34777379262935415
Epoch: 29, step: 1176, loss: 0.33001741766929626, mean loss: 0.3477733801987463
Epoch: 29, step: 1177, loss: 0.3472587466239929, mean loss: 0.3477733682455347
Epoch: 29, step: 1178, loss: 0.35904771089553833, mean loss: 0.34777363010461376
Epoch: 29, step: 1179, loss: 0.3140256702899933, mean loss: 0.347772846289122
Epoch: 29, step: 1180, loss: 0.32101014256477356, mean loss: 0.3477722247245976
Epoch: 29, step: 1181, loss: 0.33298274874687195, mean loss: 0.34777188124659175
Epoch: 29, step: 1182, loss: 0.33086201548576355, mean loss: 0.3477714885327396
Epoch: 29, step: 1183, loss: 0.32355156540870667, mean loss: 0.3477709260635542
Epoch: 29, step: 1184, loss: 0.327189177274704, mean loss: 0.3477704480962801
Epoch: 29, step: 1185, loss: 0.3395513892173767, mean loss: 0.34777025723057764
Epoch: 29, step: 1186, loss: 0.34595128893852234, mean loss: 0.3477702149908755
Epoch: 29, step: 1187, loss: 0.34326493740081787, mean loss: 0.34777011037268885
Epoch: 29, step: 1188, loss: 0.3730113208293915, mean loss: 0.3477706964915895
Epoch: 29, step: 1189, loss: 0.3027050197124481, mean loss: 0.3477696500587473
Epoch: 29, step: 1190, loss: 0.33254551887512207, mean loss: 0.3477692965599853
Epoch: 29, step: 1191, loss: 0.28741389513015747, mean loss: 0.34776789516216255
Epoch: 29, step: 1192, loss: 0.33642035722732544, mean loss: 0.3477676316887145
Epoch: 29, step: 1193, loss: 0.36684858798980713, mean loss: 0.3477680747106857
Epoch: 29, step: 1194, loss: 0.3973405957221985, mean loss: 0.34776922565960755
Epoch: 29, step: 1195, loss: 0.3351598083972931, mean loss: 0.34776893290753513
Epoch: 29, step: 1196, loss: 0.31523430347442627, mean loss: 0.3477681775705622
Epoch: 29, step: 1197, loss: 0.3164401948451996, mean loss: 0.3477674502644675
Epoch: 29, step: 1198, loss: 0.4077679514884949, mean loss: 0.34776884319543033
Epoch: 29, step: 1199, loss: 0.3273029625415802, mean loss: 0.3477683680844485
Epoch: 29, step: 1200, loss: 0.32824984192848206, mean loss: 0.3477679149766147
Epoch: 29, step: 1201, loss: 0.34122395515441895, mean loss: 0.3477677630670594
Epoch: 29, step: 1202, loss: 0.35134223103523254, mean loss: 0.34776784604177957
Epoch: 29, step: 1203, loss: 0.3526255786418915, mean loss: 0.34776795880251776
Epoch: 29, step: 1204, loss: 0.3157849609851837, mean loss: 0.34776721641033054
Epoch: 29, step: 1205, loss: 0.3165891468524933, mean loss: 0.347766492719008
Epoch: 29, step: 1206, loss: 0.3621419072151184, mean loss: 0.34776682638691636
Epoch: 29, step: 1207, loss: 0.3501964509487152, mean loss: 0.3477668827796506
Epoch: 29, step: 1208, loss: 0.33431562781333923, mean loss: 0.3477665705769126
Epoch: 29, step: 1209, loss: 0.3003278374671936, mean loss: 0.34776546955260984
Epoch: 29, step: 1210, loss: 0.32425934076309204, mean loss: 0.3477649240022399
Epoch: 29, step: 1211, loss: 0.3626863658428192, mean loss: 0.3477652703038051
Epoch: 29, step: 1212, loss: 0.3088584244251251, mean loss: 0.34776436736231475
Epoch: 29, step: 1213, loss: 0.32363995909690857, mean loss: 0.3477638075013664
Epoch: 29, step: 1214, loss: 0.29284629225730896, mean loss: 0.34776253304695026
Epoch: 29, step: 1215, loss: 0.31116318702697754, mean loss: 0.3477616837165404
Epoch: 29, step: 1216, loss: 0.3554067015647888, mean loss: 0.34776186112395807
Epoch: 29, step: 1217, loss: 0.2980858385562897, mean loss: 0.3477607083875547
Epoch: 29, step: 1218, loss: 0.34150949120521545, mean loss: 0.34776056333088495
Epoch: 29, step: 1219, loss: 0.30995267629623413, mean loss: 0.34775968603630925
Epoch: 29, step: 1220, loss: 0.3381754755973816, mean loss: 0.34775946364935795
Epoch: 29, step: 1221, loss: 0.36145445704460144, mean loss: 0.3477597814133701
Epoch: 29, step: 1222, loss: 0.3570467531681061, mean loss: 0.34775999689335235
Epoch: 29, step: 1223, loss: 0.40615129470825195, mean loss: 0.34776135167984457
Epoch: 29, step: 1224, loss: 0.3456342816352844, mean loss: 0.3477613023290164
Epoch: 29, step: 1225, loss: 0.3410200774669647, mean loss: 0.34776114592734453
Epoch: 29, step: 1226, loss: 0.3414621949195862, mean loss: 0.34776099979016134
Epoch: 29, step: 1227, loss: 0.3050680458545685, mean loss: 0.34776000932630796
Epoch: 29, step: 1228, loss: 0.3048017919063568, mean loss: 0.34775901273154125
Epoch: 29, step: 1229, loss: 0.32128220796585083, mean loss: 0.34775839850603285
Epoch: 29, step: 1230, loss: 0.3183787167072296, mean loss: 0.34775771695357505
Epoch: 29, step: 1231, loss: 0.29526394605636597, mean loss: 0.34775649922668217
Epoch: 29, step: 1232, loss: 0.33506110310554504, mean loss: 0.34775620473142316
Epoch: 29, step: 1233, loss: 0.32164329290390015, mean loss: 0.3477555990039393
Epoch: 29, step: 1234, loss: 0.30350738763809204, mean loss: 0.34775457262525716
Epoch: 29, step: 1235, loss: 0.3068326413631439, mean loss: 0.3477536234247733
Epoch: 29, step: 1236, loss: 0.29924410581588745, mean loss: 0.34775249825330273
Epoch: 29, step: 1237, loss: 0.306380957365036, mean loss: 0.3477515386684605
Epoch: 29, step: 1238, loss: 0.343088299036026, mean loss: 0.3477514305102874
Epoch: 29, step: 1239, loss: 0.35640865564346313, mean loss: 0.3477516312994407
Epoch: 29, step: 1240, loss: 0.3247793912887573, mean loss: 0.3477510985109811
Epoch: 29, step: 1241, loss: 0.3320070803165436, mean loss: 0.3477507333730296
Epoch: 29, step: 1242, loss: 0.3085976541042328, mean loss: 0.34774982534920557
Epoch: 29, step: 1243, loss: 0.31558963656425476, mean loss: 0.34774907951922446
Epoch: 29, step: 1244, loss: 0.34830641746520996, mean loss: 0.34774909244420177
Epoch: 29, step: 1245, loss: 0.29263976216316223, mean loss: 0.3477478144577846
Epoch: 29, step: 1246, loss: 0.3426869809627533, mean loss: 0.3477476970996811
Epoch: 29, step: 1247, loss: 0.31921881437301636, mean loss: 0.3477470355450311
Epoch: 29, step: 1248, loss: 0.31914132833480835, mean loss: 0.34774637222428423
Epoch: 29, step: 1249, loss: 0.3416469991207123, mean loss: 0.3477462307928252
Epoch: 29, step: 1250, loss: 0.3267858326435089, mean loss: 0.3477457447771471
Epoch: 29, step: 1251, loss: 0.31483209133148193, mean loss: 0.34774498161508427
Epoch: 29, step: 1252, loss: 0.3636937737464905, mean loss: 0.34774535140784857
Epoch: 29, step: 1253, loss: 0.2906981110572815, mean loss: 0.34774402872664406
Epoch: 29, step: 1254, loss: 0.3617057204246521, mean loss: 0.3477443524309796
Epoch: 29, step: 1255, loss: 0.3352355360984802, mean loss: 0.34774406241854494
Epoch: 29, step: 1256, loss: 0.38307297229766846, mean loss: 0.34774488148770033
Epoch: 29, step: 1257, loss: 0.3287569582462311, mean loss: 0.3477444412799004
Epoch: 29, step: 1258, loss: 0.3249755799770355, mean loss: 0.34774391342870525
Epoch: 29, step: 1259, loss: 0.33689624071121216, mean loss: 0.34774366195261297
Epoch: 29, step: 1260, loss: 0.324974924325943, mean loss: 0.3477431341287581
Epoch: 29, step: 1261, loss: 0.3253760039806366, mean loss: 0.34774261562696973
Epoch: 29, step: 1262, loss: 0.3606266379356384, mean loss: 0.3477429142899501
Epoch: 29, step: 1263, loss: 0.33593252301216125, mean loss: 0.3477426405210285
Epoch: 29, step: 1264, loss: 0.3393799662590027, mean loss: 0.3477424466758635
Epoch: 29, step: 1265, loss: 0.3232974112033844, mean loss: 0.34774188005782375
Epoch: 29, step: 1266, loss: 0.34328874945640564, mean loss: 0.34774177683990654
Epoch: 29, step: 1267, loss: 0.3541089594364166, mean loss: 0.3477419244196997
Epoch: 29, step: 1268, loss: 0.3288774788379669, mean loss: 0.3477414871860554
Epoch: 29, step: 1269, loss: 0.3377906084060669, mean loss: 0.3477412565533483
Epoch: 29, step: 1270, loss: 0.3280879557132721, mean loss: 0.34774080105700234
Epoch: 29, step: 1271, loss: 0.39343732595443726, mean loss: 0.34774186012173064
Epoch: 29, step: 1272, loss: 0.3416207432746887, mean loss: 0.34774171826173744
Epoch: 29, step: 1273, loss: 0.33258795738220215, mean loss: 0.34774136707376807
Epoch: 29, step: 1274, loss: 0.3159255087375641, mean loss: 0.34774062975926
Epoch: 29, step: 1275, loss: 0.2945910394191742, mean loss: 0.347739398076132
Epoch: 29, step: 1276, loss: 0.33759576082229614, mean loss: 0.34773916301397517
Epoch: 29, step: 1277, loss: 0.3577929437160492, mean loss: 0.347739395988455
Epoch: 29, step: 1278, loss: 0.3585484027862549, mean loss: 0.3477396464578513
Epoch: 29, step: 1279, loss: 0.29272544384002686, mean loss: 0.3477383716825566
Epoch: 29, step: 1280, loss: 0.3115946054458618, mean loss: 0.34773753418768355
Epoch: 29, step: 1281, loss: 0.32210013270378113, mean loss: 0.34773694015178097
Epoch: 29, step: 1282, loss: 0.3172377645969391, mean loss: 0.34773623348166455
Epoch: 29, step: 1283, loss: 0.31450605392456055, mean loss: 0.34773546355164703
Epoch: 29, step: 1284, loss: 0.3125516176223755, mean loss: 0.3477346483748455
Epoch: 29, step: 1285, loss: 0.30960318446159363, mean loss: 0.34773376492496105
Epoch: 29, step: 1286, loss: 0.3134446442127228, mean loss: 0.34773297051491747
Epoch: 29, step: 1287, loss: 0.3355913460254669, mean loss: 0.34773268922438627
Epoch: 29, step: 1288, loss: 0.3615807592868805, mean loss: 0.3477330100414849
Epoch: 29, step: 1289, loss: 0.3709147572517395, mean loss: 0.34773354707867177
Epoch: 29, step: 1290, loss: 0.41857999563217163, mean loss: 0.3477351882964667
Epoch: 29, step: 1291, loss: 0.35576802492141724, mean loss: 0.34773537437959834
Epoch: 29, step: 1292, loss: 0.2941524386405945, mean loss: 0.3477341331431616
Epoch: 29, step: 1293, loss: 0.34704098105430603, mean loss: 0.3477341170868241
Epoch: 29, step: 1294, loss: 0.34786662459373474, mean loss: 0.347734120156188
Epoch: 29, step: 1295, loss: 0.3378438949584961, mean loss: 0.34773389106730634
Epoch: 29, step: 1296, loss: 0.3304215371608734, mean loss: 0.3477334900677486
Epoch: 29, step: 1297, loss: 0.333360880613327, mean loss: 0.34773315716809944
Epoch: 29, step: 1298, loss: 0.3631329834461212, mean loss: 0.3477335138519739
Epoch: 29, step: 1299, loss: 0.3109872341156006, mean loss: 0.34773266277082376
Epoch: 29, step: 1300, loss: 0.33217594027519226, mean loss: 0.34773230246967973
Epoch: 29, step: 1301, loss: 0.3548250198364258, mean loss: 0.34773246673660657
Epoch: 29, step: 1302, loss: 0.30056533217430115, mean loss: 0.34773137437377827
Epoch: 29, step: 1303, loss: 0.3160548806190491, mean loss: 0.3477306407819822
Epoch: 29, step: 1304, loss: 0.28626254200935364, mean loss: 0.34772921728324957
Epoch: 29, step: 1305, loss: 0.3421972692012787, mean loss: 0.3477290891755176
Epoch: 29, step: 1306, loss: 0.3208635747432709, mean loss: 0.34772846704378907
Epoch: 29, step: 1307, loss: 0.3370119035243988, mean loss: 0.34772821888327776
Epoch: 29, step: 1308, loss: 0.32867419719696045, mean loss: 0.3477277776647601
Epoch: 29, step: 1309, loss: 0.3206073045730591, mean loss: 0.3477271496725151
Epoch: 29, step: 1310, loss: 0.37607821822166443, mean loss: 0.3477278061447996
Epoch: 29, step: 1311, loss: 0.3175968825817108, mean loss: 0.3477271084759202
Epoch: 29, step: 1312, loss: 0.36701908707618713, mean loss: 0.3477275551632387
Epoch: 29, step: 1313, loss: 0.3798525333404541, mean loss: 0.3477282989691701
Epoch: 29, step: 1314, loss: 0.3391064703464508, mean loss: 0.34772809934821614
Epoch: 29, step: 1315, loss: 0.3142039477825165, mean loss: 0.34772732318245475
Epoch: 29, step: 1316, loss: 0.376822292804718, mean loss: 0.3477279967862707
Epoch: 29, step: 1317, loss: 0.36566027998924255, mean loss: 0.3477284119430796
Epoch: 29, step: 1318, loss: 0.32633888721466064, mean loss: 0.34772791675787923
Epoch: 29, step: 1319, loss: 0.30381888151168823, mean loss: 0.3477269002509053
Epoch: 29, step: 1320, loss: 0.3635697662830353, mean loss: 0.34772726700938467
Epoch: 29, step: 1321, loss: 0.34579455852508545, mean loss: 0.347727222268691
Epoch: 29, step: 1322, loss: 0.2906684875488281, mean loss: 0.3477259014340717
Epoch: 29, step: 1323, loss: 0.34181830286979675, mean loss: 0.347725764684105
Epoch: 29, step: 1324, loss: 0.3194729685783386, mean loss: 0.34772511069933365
Epoch: 29, step: 1325, loss: 0.2922009229660034, mean loss: 0.34772382547671127
Epoch: 29, step: 1326, loss: 0.28777286410331726, mean loss: 0.34772243781934087
Epoch: 29, step: 1327, loss: 0.34296178817749023, mean loss: 0.3477223276293205
Epoch: 29, step: 1328, loss: 0.3693107068538666, mean loss: 0.3477228273024885
Epoch: 29, step: 1329, loss: 0.389847069978714, mean loss: 0.3477238022652871
Epoch: 29, step: 1330, loss: 0.32395949959754944, mean loss: 0.3477232522548104
Epoch: 29, step: 1331, loss: 0.31923437118530273, mean loss: 0.3477225929120713
Epoch: 29, step: 1332, loss: 0.31803905963897705, mean loss: 0.3477219059363655
Epoch: 29, step: 1333, loss: 0.29948288202285767, mean loss: 0.347720789550716
Epoch: 29, step: 1334, loss: 0.369576632976532, mean loss: 0.3477212953442275
Epoch: 29, step: 1335, loss: 0.3233046233654022, mean loss: 0.34772073030044387
Epoch: 29, step: 1336, loss: 0.35229361057281494, mean loss: 0.34772083612230936
Epoch: 29, step: 1337, loss: 0.32786738872528076, mean loss: 0.3477203767006544
Epoch: 29, step: 1338, loss: 0.36433494091033936, mean loss: 0.3477207611635541
Epoch: 29, step: 1339, loss: 0.33162763714790344, mean loss: 0.34772038877545675
Epoch: 29, step: 1340, loss: 0.33186230063438416, mean loss: 0.3477200218344812
Epoch: 29, step: 1341, loss: 0.40533605217933655, mean loss: 0.3477213549834086
Epoch: 29, step: 1342, loss: 0.31695666909217834, mean loss: 0.34772064315097634
Epoch: 29, step: 1343, loss: 0.3183134198188782, mean loss: 0.3477199627432176
Epoch: 29, step: 1344, loss: 0.35727909207344055, mean loss: 0.34772018391184695
Epoch: 29, step: 1345, loss: 0.3085111677646637, mean loss: 0.3477192767577091
Epoch: 29, step: 1346, loss: 0.3561832010746002, mean loss: 0.3477194725776271
Epoch: 29, step: 1347, loss: 0.343406617641449, mean loss: 0.34771937279845494
Epoch: 29, step: 1348, loss: 0.33393892645835876, mean loss: 0.3477190539911365
Epoch: 29, step: 1349, loss: 0.3564307987689972, mean loss: 0.34771925553059835
Epoch: 29, step: 1350, loss: 0.3267596364021301, mean loss: 0.34771877065727547
Epoch: 29, step: 1351, loss: 0.39820733666419983, mean loss: 0.3477199386170702
Epoch: 29, step: 1352, loss: 0.2903898060321808, mean loss: 0.3477186124209383
Epoch: 29, step: 1353, loss: 0.370577335357666, mean loss: 0.347719141190842
Epoch: 29, step: 1354, loss: 0.3477981686592102, mean loss: 0.3477191430188698
Epoch: 29, step: 1355, loss: 0.31906044483184814, mean loss: 0.347718480114119
Epoch: 29, step: 1356, loss: 0.33030059933662415, mean loss: 0.3477180772301929
Epoch: 29, step: 1357, loss: 0.3414926528930664, mean loss: 0.34771793323647643
Epoch: 29, step: 1358, loss: 0.3448633849620819, mean loss: 0.34771786721246173
Epoch: 29, step: 1359, loss: 0.33976617455482483, mean loss: 0.34771768329876346
Epoch: 29, step: 1360, loss: 0.3292425870895386, mean loss: 0.34771725600047243
Epoch: 29, step: 1361, loss: 0.33678680658340454, mean loss: 0.347717003203178
Epoch: 29, step: 1362, loss: 0.3402523398399353, mean loss: 0.3477168305658977
Epoch: 29, step: 1363, loss: 0.3517284393310547, mean loss: 0.34771692334130855
Epoch: 29, step: 1364, loss: 0.3244459927082062, mean loss: 0.3477163851731202
Epoch: 29, step: 1365, loss: 0.34128913283348083, mean loss: 0.3477162365386366
Epoch: 29, step: 1366, loss: 0.3107285797595978, mean loss: 0.34771538119426226
Epoch: 29, step: 1367, loss: 0.3186108469963074, mean loss: 0.347714708163687
Epoch: 29, step: 1368, loss: 0.3797706365585327, mean loss: 0.3477154494269173
Epoch: 29, step: 1369, loss: 0.35998448729515076, mean loss: 0.3477157331303319
Epoch: 29, step: 1370, loss: 0.30105337500572205, mean loss: 0.34771465415703606
Epoch: 29, step: 1371, loss: 0.375179648399353, mean loss: 0.34771528921517153
Epoch: 29, step: 1372, loss: 0.31591612100601196, mean loss: 0.3477145539572879
Epoch: 29, step: 1373, loss: 0.3675520122051239, mean loss: 0.34771501262684273
Epoch: 29, step: 1374, loss: 0.3722611367702484, mean loss: 0.3477155801541633
Epoch: 29, step: 1375, loss: 0.3523833453655243, mean loss: 0.34771568807437997
Epoch: 29, step: 1376, loss: 0.3317374587059021, mean loss: 0.34771531866117467
Epoch: 29, step: 1377, loss: 0.30896613001823425, mean loss: 0.34771442280903053
Epoch: 29, step: 1378, loss: 0.3579462468624115, mean loss: 0.34771465935565066
Epoch: 29, step: 1379, loss: 0.3304853141307831, mean loss: 0.3477142610445441
Epoch: 29, step: 1380, loss: 0.3337332010269165, mean loss: 0.34771393783535215
Epoch: 29, step: 1381, loss: 0.31700795888900757, mean loss: 0.3477132280018197
Epoch: 29, step: 1382, loss: 0.3386763036251068, mean loss: 0.34771301909906244
Epoch: 29, step: 1383, loss: 0.336611270904541, mean loss: 0.347712762470579
Epoch: 29, step: 1384, loss: 0.330632746219635, mean loss: 0.3477123676573234
Epoch: 29, step: 1385, loss: 0.3309490382671356, mean loss: 0.3477119801734024
Epoch: 29, step: 1386, loss: 0.34825578331947327, mean loss: 0.3477119927431073
Epoch: 29, step: 1387, loss: 0.30791690945625305, mean loss: 0.3477110729233198
Epoch: 29, step: 1388, loss: 0.3373998701572418, mean loss: 0.34771083459666396
Epoch: 29, step: 1389, loss: 0.3103947937488556, mean loss: 0.34770997211709925
Epoch: 29, step: 1390, loss: 0.31509292125701904, mean loss: 0.3477092182619473
Epoch: 29, step: 1391, loss: 0.3600101172924042, mean loss: 0.3477095025574782
Epoch: 29, step: 1392, loss: 0.3803936541080475, mean loss: 0.34771025792856486
Epoch: 29, step: 1393, loss: 0.3177588880062103, mean loss: 0.34770956573143236
Epoch: 29, step: 1394, loss: 0.3173721134662628, mean loss: 0.3477088646278696
Epoch: 29, step: 1395, loss: 0.3453706204891205, mean loss: 0.3477088105919078
Epoch: 29, step: 1396, loss: 0.3129371404647827, mean loss: 0.3477080070499734
Epoch: 29, step: 1397, loss: 0.2968430519104004, mean loss: 0.3477068316339005
Epoch: 29, step: 1398, loss: 0.332502156496048, mean loss: 0.3477064802838106
Epoch: 29, step: 1399, loss: 0.32745978236198425, mean loss: 0.34770601243331795
Epoch: 29, step: 1400, loss: 0.35785192251205444, mean loss: 0.3477062468744779
Epoch: 29, step: 1401, loss: 0.32043763995170593, mean loss: 0.3477056167943697
Epoch: 29, step: 1402, loss: 0.35421115159988403, mean loss: 0.34770576711056933
Epoch: 29, step: 1403, loss: 0.3315674364566803, mean loss: 0.3477053942286226
Epoch: 29, step: 1404, loss: 0.30308955907821655, mean loss: 0.34770436338748795
Epoch: 29, step: 1405, loss: 0.3811435401439667, mean loss: 0.347705135976018
Epoch: 29, step: 1406, loss: 0.33637720346450806, mean loss: 0.34770487425819546
Epoch: 29, step: 1407, loss: 0.34305092692375183, mean loss: 0.34770476673700207
Epoch: 29, step: 1408, loss: 0.3039981424808502, mean loss: 0.347703756996347
Epoch: 29, step: 1409, loss: 0.29787689447402954, mean loss: 0.3477026058883092
Epoch: 29, step: 1410, loss: 0.35260942578315735, mean loss: 0.3477027192438177
Epoch: 29, step: 1411, loss: 0.34356385469436646, mean loss: 0.3477026236315337
Epoch: 29, step: 1412, loss: 0.3304367959499359, mean loss: 0.34770222478130197
Epoch: 29, step: 1413, loss: 0.33180415630340576, mean loss: 0.3477018575355529
Epoch: 29, step: 1414, loss: 0.32959869503974915, mean loss: 0.34770143936174086
Epoch: 29, step: 1415, loss: 0.37240809202194214, mean loss: 0.34770201005962176
Epoch: 29, step: 1416, loss: 0.31389787793159485, mean loss: 0.34770122923749974
Epoch: 29, step: 1417, loss: 0.31896859407424927, mean loss: 0.3477005655742863
Epoch: 29, step: 1418, loss: 0.31198424100875854, mean loss: 0.34769974062164594
Epoch: 29, step: 1419, loss: 0.3377932608127594, mean loss: 0.3476995118134464
Epoch: 29, step: 1420, loss: 0.30712512135505676, mean loss: 0.34769857469562165
Epoch: 29, step: 1421, loss: 0.35066717863082886, mean loss: 0.34769864325777083
Epoch: 29, step: 1422, loss: 0.3552248477935791, mean loss: 0.3476988170771324
Epoch: 29, step: 1423, loss: 0.34730565547943115, mean loss: 0.3476988079971879
Epoch: 29, step: 1424, loss: 0.30790069699287415, mean loss: 0.3476978888934488
Epoch: 29, step: 1425, loss: 0.32043135166168213, mean loss: 0.34769725921035727
Epoch: 29, step: 1426, loss: 0.3586786389350891, mean loss: 0.34769751280432826
Epoch: 29, step: 1427, loss: 0.28748422861099243, mean loss: 0.3476961223257537
Epoch: 29, step: 1428, loss: 0.39443764090538025, mean loss: 0.3476972016819153
Epoch: 29, step: 1429, loss: 0.3364693224430084, mean loss: 0.34769694241347127
Epoch: 29, step: 1430, loss: 0.3169967532157898, mean loss: 0.34769623351677564
Epoch: 29, step: 1431, loss: 0.3077620267868042, mean loss: 0.34769531141908633
Epoch: 29, step: 1432, loss: 0.3134098947048187, mean loss: 0.3476945197726222
Epoch: 29, step: 1433, loss: 0.3064497709274292, mean loss: 0.34769356745794094
Epoch: 29, step: 1434, loss: 0.329486608505249, mean loss: 0.34769314708069377
Epoch: 29, step: 1435, loss: 0.2965199649333954, mean loss: 0.3476919655794436
Epoch: 29, step: 1436, loss: 0.346547931432724, mean loss: 0.34769193916626173
Epoch: 29, step: 1437, loss: 0.3075684905052185, mean loss: 0.3476910128272337
Epoch: 29, step: 1438, loss: 0.31872689723968506, mean loss: 0.34769034414166083
Epoch: 29, step: 1439, loss: 0.35508638620376587, mean loss: 0.3476905148878531
Epoch: 29, step: 1440, loss: 0.31723159551620483, mean loss: 0.3476898117246753
Epoch: 29, step: 1441, loss: 0.3143814504146576, mean loss: 0.3476890427981018
Epoch: 29, step: 1442, loss: 0.31422337889671326, mean loss: 0.34768827025801774
Epoch: 29, step: 1443, loss: 0.30283573269844055, mean loss: 0.3476872348808811
Valid: 29, mean loss: 0.1856296534339587
Epoch: 30, step: 0, loss: 0.3240320384502411, mean loss: 0.34768668883632003
Epoch: 30, step: 1, loss: 0.3268318176269531, mean loss: 0.3476862074441588
Epoch: 30, step: 2, loss: 0.350478857755661, mean loss: 0.3476862719053067
Epoch: 30, step: 3, loss: 0.31694498658180237, mean loss: 0.3476855623382002
Epoch: 30, step: 4, loss: 0.3346669375896454, mean loss: 0.3476852618506122
Epoch: 30, step: 5, loss: 0.3178444802761078, mean loss: 0.34768457310063355
Epoch: 30, step: 6, loss: 0.3179687559604645, mean loss: 0.34768388725076765
Epoch: 30, step: 7, loss: 0.35692378878593445, mean loss: 0.34768410050551135
Epoch: 30, step: 8, loss: 0.31899407505989075, mean loss: 0.34768343836178667
Epoch: 30, step: 9, loss: 0.37218427658081055, mean loss: 0.3476840038092415
Epoch: 30, step: 10, loss: 0.30396658182144165, mean loss: 0.34768299489133087
Epoch: 30, step: 11, loss: 0.33824658393859863, mean loss: 0.3476827771213006
Epoch: 30, step: 12, loss: 0.32793283462524414, mean loss: 0.3476823213498909
Epoch: 30, step: 13, loss: 0.39247241616249084, mean loss: 0.34768335495156194
Epoch: 30, step: 14, loss: 0.3086763322353363, mean loss: 0.3476824548241195
Epoch: 30, step: 15, loss: 0.34185636043548584, mean loss: 0.3476823203840607
Epoch: 30, step: 16, loss: 0.32977327704429626, mean loss: 0.34768190713341257
Epoch: 30, step: 17, loss: 0.33192580938339233, mean loss: 0.3476815435703097
Epoch: 30, step: 18, loss: 0.356021523475647, mean loss: 0.34768173600621977
Epoch: 30, step: 19, loss: 0.32735589146614075, mean loss: 0.3476812670204205
Epoch: 30, step: 20, loss: 0.3336983323097229, mean loss: 0.3476809443943918
Epoch: 30, step: 21, loss: 0.33533069491386414, mean loss: 0.3476806594456243
Epoch: 30, step: 22, loss: 0.31676962971687317, mean loss: 0.3476799462732613
Epoch: 30, step: 23, loss: 0.29917341470718384, mean loss: 0.3476788271672359
Epoch: 30, step: 24, loss: 0.3277148902416229, mean loss: 0.34767836658500206
Epoch: 30, step: 25, loss: 0.32297587394714355, mean loss: 0.3476777966940632
Epoch: 30, step: 26, loss: 0.33528223633766174, mean loss: 0.34767751073285813
Epoch: 30, step: 27, loss: 0.3444896340370178, mean loss: 0.3476774371913638
Epoch: 30, step: 28, loss: 0.3293874263763428, mean loss: 0.3476770152667331
Epoch: 30, step: 29, loss: 0.3232119083404541, mean loss: 0.34767645090440497
Epoch: 30, step: 30, loss: 0.38096901774406433, mean loss: 0.3476772188813107
Epoch: 30, step: 31, loss: 0.3495652973651886, mean loss: 0.34767726243359165
Epoch: 30, step: 32, loss: 0.3030589818954468, mean loss: 0.34767623324805574
Epoch: 30, step: 33, loss: 0.35616937279701233, mean loss: 0.34767642915015357
Epoch: 30, step: 34, loss: 0.3351730704307556, mean loss: 0.3476761407553036
Epoch: 30, step: 35, loss: 0.34116631746292114, mean loss: 0.34767599060715126
Epoch: 30, step: 36, loss: 0.32160139083862305, mean loss: 0.34767538921407126
Epoch: 30, step: 37, loss: 0.3590192496776581, mean loss: 0.34767565084653734
Epoch: 30, step: 38, loss: 0.3378187119960785, mean loss: 0.3476754235133689
Epoch: 30, step: 39, loss: 0.32282739877700806, mean loss: 0.3476748504500678
Epoch: 30, step: 40, loss: 0.33038535714149475, mean loss: 0.3476744517163368
Epoch: 30, step: 41, loss: 0.3148949444293976, mean loss: 0.34767369576625873
Epoch: 30, step: 42, loss: 0.3418697714805603, mean loss: 0.3476735619211768
Epoch: 30, step: 43, loss: 0.3514956831932068, mean loss: 0.3476736500615991
Epoch: 30, step: 44, loss: 0.3717769980430603, mean loss: 0.34767420588652664
Epoch: 30, step: 45, loss: 0.3182678520679474, mean loss: 0.3476735277895424
Epoch: 30, step: 46, loss: 0.34859946370124817, mean loss: 0.34767354914070603
Epoch: 30, step: 47, loss: 0.3074559271335602, mean loss: 0.3476726217836223
Epoch: 30, step: 48, loss: 0.39111676812171936, mean loss: 0.3476736235163424
Epoch: 30, step: 49, loss: 0.3810272514820099, mean loss: 0.34767439256471605
Epoch: 30, step: 50, loss: 0.3169974684715271, mean loss: 0.3476736852505178
Epoch: 30, step: 51, loss: 0.34517958760261536, mean loss: 0.3476736277457302
Epoch: 30, step: 52, loss: 0.2931334674358368, mean loss: 0.34767237027771297
Epoch: 30, step: 53, loss: 0.3627376854419708, mean loss: 0.34767271761287144
Epoch: 30, step: 54, loss: 0.30798202753067017, mean loss: 0.3476718025537341
Epoch: 30, step: 55, loss: 0.3560978174209595, mean loss: 0.3476719968089643
Epoch: 30, step: 56, loss: 0.3584064543247223, mean loss: 0.3476722442778422
Epoch: 30, step: 57, loss: 0.3552384078502655, mean loss: 0.3476724187018261
Epoch: 30, step: 58, loss: 0.34630075097084045, mean loss: 0.34767238708127857
Epoch: 30, step: 59, loss: 0.3371107876300812, mean loss: 0.3476721436142557
Epoch: 30, step: 60, loss: 0.30294695496559143, mean loss: 0.34767111262860184
Epoch: 30, step: 61, loss: 0.3289167284965515, mean loss: 0.34767068032063697
Epoch: 30, step: 62, loss: 0.3162069320678711, mean loss: 0.34766995506539294
Epoch: 30, step: 63, loss: 0.33412832021713257, mean loss: 0.34766964293108427
Epoch: 30, step: 64, loss: 0.35978275537490845, mean loss: 0.3476699221315555
Epoch: 30, step: 65, loss: 0.3003227114677429, mean loss: 0.3476688308299683
Epoch: 30, step: 66, loss: 0.3092557489871979, mean loss: 0.34766794547071683
Epoch: 30, step: 67, loss: 0.31253477931022644, mean loss: 0.3476671357268669
Epoch: 30, step: 68, loss: 0.338386207818985, mean loss: 0.34766692182638737
Epoch: 30, step: 69, loss: 0.36412274837493896, mean loss: 0.3476673010802834
Epoch: 30, step: 70, loss: 0.31497064232826233, mean loss: 0.3476665475447863
Epoch: 30, step: 71, loss: 0.36632150411605835, mean loss: 0.3476669774617427
Epoch: 30, step: 72, loss: 0.37821340560913086, mean loss: 0.3476676814100327
Epoch: 30, step: 73, loss: 0.318401038646698, mean loss: 0.3476670069701847
Epoch: 30, step: 74, loss: 0.33290669322013855, mean loss: 0.3476666668316031
Epoch: 30, step: 75, loss: 0.3414718806743622, mean loss: 0.34766652408143817
Epoch: 30, step: 76, loss: 0.31957826018333435, mean loss: 0.3476658768416774
Epoch: 30, step: 77, loss: 0.3034592270851135, mean loss: 0.3476648582083358
Epoch: 30, step: 78, loss: 0.3564538359642029, mean loss: 0.34766506072401027
Epoch: 30, step: 79, loss: 0.30925610661506653, mean loss: 0.34766417572506764
Epoch: 30, step: 80, loss: 0.3200225532054901, mean loss: 0.3476635388359978
Epoch: 30, step: 81, loss: 0.3149368464946747, mean loss: 0.3476627847994939
Epoch: 30, step: 82, loss: 0.3286797106266022, mean loss: 0.3476623474317043
Epoch: 30, step: 83, loss: 0.29464730620384216, mean loss: 0.34766112599954996
Epoch: 30, step: 84, loss: 0.3268297016620636, mean loss: 0.3476606460681057
Epoch: 30, step: 85, loss: 0.32602211833000183, mean loss: 0.3476601475534363
Epoch: 30, step: 86, loss: 0.3245243728160858, mean loss: 0.34765961455703626
Epoch: 30, step: 87, loss: 0.31234756112098694, mean loss: 0.3476588010652044
Epoch: 30, step: 88, loss: 0.3238305449485779, mean loss: 0.34765825214087726
Epoch: 30, step: 89, loss: 0.31018128991127014, mean loss: 0.3476573888153249
Epoch: 30, step: 90, loss: 0.33585289120674133, mean loss: 0.34765711689121326
Epoch: 30, step: 91, loss: 0.3384917676448822, mean loss: 0.34765690576642644
Epoch: 30, step: 92, loss: 0.3186546862125397, mean loss: 0.34765623771262794
Epoch: 30, step: 93, loss: 0.37107253074645996, mean loss: 0.34765677708455944
Epoch: 30, step: 94, loss: 0.357906699180603, mean loss: 0.3476570131762811
Epoch: 30, step: 95, loss: 0.33831217885017395, mean loss: 0.34765679793686877
Epoch: 30, step: 96, loss: 0.37024644017219543, mean loss: 0.3476573182317356
Epoch: 30, step: 97, loss: 0.32398292422294617, mean loss: 0.34765677296493364
Epoch: 30, step: 98, loss: 0.37363484501838684, mean loss: 0.347657371276089
Epoch: 30, step: 99, loss: 0.31628096103668213, mean loss: 0.34765664865033497
Epoch: 30, step: 100, loss: 0.33197495341300964, mean loss: 0.3476562874957039
Epoch: 30, step: 101, loss: 0.32882198691368103, mean loss: 0.3476558537455178
Epoch: 30, step: 102, loss: 0.35928264260292053, mean loss: 0.34765612150197994
Epoch: 30, step: 103, loss: 0.3138892352581024, mean loss: 0.3476553438931405
Epoch: 30, step: 104, loss: 0.3075254261493683, mean loss: 0.3476544197729852
Epoch: 30, step: 105, loss: 0.3158480226993561, mean loss: 0.34765368734547464
Epoch: 30, step: 106, loss: 0.3424544930458069, mean loss: 0.34765356762285277
Epoch: 30, step: 107, loss: 0.31196144223213196, mean loss: 0.34765274575388827
Epoch: 30, step: 108, loss: 0.33881479501724243, mean loss: 0.34765254225045195
Epoch: 30, step: 109, loss: 0.30732637643814087, mean loss: 0.3476516137179672
Epoch: 30, step: 110, loss: 0.33843958377838135, mean loss: 0.347651401610718
Epoch: 30, step: 111, loss: 0.32741984724998474, mean loss: 0.34765093578933376
Epoch: 30, step: 112, loss: 0.341997891664505, mean loss: 0.347650805633827
Epoch: 30, step: 113, loss: 0.344259649515152, mean loss: 0.34765072755775484
Epoch: 30, step: 114, loss: 0.33368751406669617, mean loss: 0.3476504060839781
Epoch: 30, step: 115, loss: 0.3318621516227722, mean loss: 0.3476500426008199
Epoch: 30, step: 116, loss: 0.34182870388031006, mean loss: 0.3476499085828463
Epoch: 30, step: 117, loss: 0.31694331765174866, mean loss: 0.34764920167665975
Epoch: 30, step: 118, loss: 0.34218481183052063, mean loss: 0.3476490758821008
Epoch: 30, step: 119, loss: 0.3675168752670288, mean loss: 0.3476495332439651
Epoch: 30, step: 120, loss: 0.38760921359062195, mean loss: 0.3476504531049339
Epoch: 30, step: 121, loss: 0.30923327803611755, mean loss: 0.34764956877237396
Epoch: 30, step: 122, loss: 0.3369552195072174, mean loss: 0.34764932260269726
Epoch: 30, step: 123, loss: 0.35395005345344543, mean loss: 0.34764946763379134
Epoch: 30, step: 124, loss: 0.32754459977149963, mean loss: 0.3476490048678145
Epoch: 30, step: 125, loss: 0.3149944543838501, mean loss: 0.347648253255457
Epoch: 30, step: 126, loss: 0.3183170557022095, mean loss: 0.3476475781525143
Epoch: 30, step: 127, loss: 0.35739070177078247, mean loss: 0.3476478024004341
Epoch: 30, step: 128, loss: 0.32982248067855835, mean loss: 0.3476473921419305
Epoch: 30, step: 129, loss: 0.32922276854515076, mean loss: 0.34764696809996054
Epoch: 30, step: 130, loss: 0.35715925693511963, mean loss: 0.3476471870198665
Epoch: 30, step: 131, loss: 0.3472937047481537, mean loss: 0.34764717888486074
Epoch: 30, step: 132, loss: 0.3690052032470703, mean loss: 0.3476476704049943
Epoch: 30, step: 133, loss: 0.31922000646591187, mean loss: 0.3476470162036793
Epoch: 30, step: 134, loss: 0.33954083919525146, mean loss: 0.3476468296618082
Epoch: 30, step: 135, loss: 0.3616812527179718, mean loss: 0.3476471526188925
Epoch: 30, step: 136, loss: 0.3686484396457672, mean loss: 0.3476476358848112
Epoch: 30, step: 137, loss: 0.33905306458473206, mean loss: 0.3476474381175117
Epoch: 30, step: 138, loss: 0.2915023863315582, mean loss: 0.34764614620900514
Epoch: 30, step: 139, loss: 0.3319253921508789, mean loss: 0.3476457844797355
Epoch: 30, step: 140, loss: 0.3588367998600006, mean loss: 0.34764604197531496
Epoch: 30, step: 141, loss: 0.32765641808509827, mean loss: 0.3476455820419504
Epoch: 30, step: 142, loss: 0.327852338552475, mean loss: 0.3476451266375032
Epoch: 30, step: 143, loss: 0.3755176067352295, mean loss: 0.34764576791488444
Epoch: 30, step: 144, loss: 0.34992340207099915, mean loss: 0.3476458203164525
Epoch: 30, step: 145, loss: 0.3463630676269531, mean loss: 0.3476457908048184
Epoch: 30, step: 146, loss: 0.3761814534664154, mean loss: 0.3476464472950906
Epoch: 30, step: 147, loss: 0.33360326290130615, mean loss: 0.34764612422560515
Epoch: 30, step: 148, loss: 0.34425482153892517, mean loss: 0.34764604620902584
Epoch: 30, step: 149, loss: 0.32546037435531616, mean loss: 0.3476455358416034
Epoch: 30, step: 150, loss: 0.3434121906757355, mean loss: 0.34764543845840157
Epoch: 30, step: 151, loss: 0.30792272090911865, mean loss: 0.34764452470431734
Epoch: 30, step: 152, loss: 0.3398374319076538, mean loss: 0.34764434511945325
Epoch: 30, step: 153, loss: 0.3289679288864136, mean loss: 0.34764391551977913
Epoch: 30, step: 154, loss: 0.34503093361854553, mean loss: 0.3476438554166877
Epoch: 30, step: 155, loss: 0.3097858130931854, mean loss: 0.34764298463643367
Epoch: 30, step: 156, loss: 0.3311196267604828, mean loss: 0.34764260458818114
Epoch: 30, step: 157, loss: 0.2892190217971802, mean loss: 0.34764126083771446
Epoch: 30, step: 158, loss: 0.355087548494339, mean loss: 0.3476414320994191
Epoch: 30, step: 159, loss: 0.31254875659942627, mean loss: 0.34764062500016657
Epoch: 30, step: 160, loss: 0.33058610558509827, mean loss: 0.3476402327709305
Epoch: 30, step: 161, loss: 0.3767242133617401, mean loss: 0.3476409016449609
Epoch: 30, step: 162, loss: 0.32294002175331116, mean loss: 0.34764033358664176
Epoch: 30, step: 163, loss: 0.34486719965934753, mean loss: 0.3476402698129796
Epoch: 30, step: 164, loss: 0.33951014280319214, mean loss: 0.34764008284903775
Epoch: 30, step: 165, loss: 0.32626593112945557, mean loss: 0.3476395913310384
Epoch: 30, step: 166, loss: 0.3479515314102173, mean loss: 0.3476395985042184
Epoch: 30, step: 167, loss: 0.3308720886707306, mean loss: 0.3476392129378591
Epoch: 30, step: 168, loss: 0.34712323546409607, mean loss: 0.34763920107330776
Epoch: 30, step: 169, loss: 0.30932459235191345, mean loss: 0.34763832007517664
Epoch: 30, step: 170, loss: 0.32809993624687195, mean loss: 0.3476378708239792
Epoch: 30, step: 171, loss: 0.33496877551078796, mean loss: 0.3476375795268369
Epoch: 30, step: 172, loss: 0.3032631576061249, mean loss: 0.34763655926100284
Epoch: 30, step: 173, loss: 0.3626106083393097, mean loss: 0.34763690353950283
Epoch: 30, step: 174, loss: 0.33915528655052185, mean loss: 0.3476367085373879
Epoch: 30, step: 175, loss: 0.31434786319732666, mean loss: 0.34763594320620017
Epoch: 30, step: 176, loss: 0.3053686022758484, mean loss: 0.3476349714761744
Epoch: 30, step: 177, loss: 0.360426127910614, mean loss: 0.3476352655392677
Epoch: 30, step: 178, loss: 0.3097339868545532, mean loss: 0.34763439422547465
Epoch: 30, step: 179, loss: 0.3330831527709961, mean loss: 0.3476340597141768
Epoch: 30, step: 180, loss: 0.3062286078929901, mean loss: 0.34763310788659074
Epoch: 30, step: 181, loss: 0.32342788577079773, mean loss: 0.3476325514702854
Epoch: 30, step: 182, loss: 0.34805914759635925, mean loss: 0.34763256127641656
Epoch: 30, step: 183, loss: 0.32641610503196716, mean loss: 0.3476320735866353
Epoch: 30, step: 184, loss: 0.31768596172332764, mean loss: 0.34763138524938986
Epoch: 30, step: 185, loss: 0.3176243305206299, mean loss: 0.34763069552717385
Epoch: 30, step: 186, loss: 0.33127671480178833, mean loss: 0.3476303196340825
Epoch: 30, step: 187, loss: 0.3254241943359375, mean loss: 0.3476298092423086
Epoch: 30, step: 188, loss: 0.3351580500602722, mean loss: 0.34762952259450736
Epoch: 30, step: 189, loss: 0.32014068961143494, mean loss: 0.34762889081254955
Epoch: 30, step: 190, loss: 0.41097864508628845, mean loss: 0.347630346760569
Epoch: 30, step: 191, loss: 0.36237308382987976, mean loss: 0.34763068558059723
Epoch: 30, step: 192, loss: 0.34283506870269775, mean loss: 0.34763057536946773
Epoch: 30, step: 193, loss: 0.33024096488952637, mean loss: 0.3476301757369246
Epoch: 30, step: 194, loss: 0.36502140760421753, mean loss: 0.34763057539754433
Epoch: 30, step: 195, loss: 0.33983102440834045, mean loss: 0.34763039616344676
Epoch: 30, step: 196, loss: 0.34104445576667786, mean loss: 0.34763024482166316
Epoch: 30, step: 197, loss: 0.3109002709388733, mean loss: 0.34762940080369625
Epoch: 30, step: 198, loss: 0.31734010577201843, mean loss: 0.34762870480206404
Epoch: 30, step: 199, loss: 0.33553317189216614, mean loss: 0.3476284268716203
Epoch: 30, step: 200, loss: 0.3768627345561981, mean loss: 0.3476290986003877
Epoch: 30, step: 201, loss: 0.3239210546016693, mean loss: 0.34762855386338115
Epoch: 30, step: 202, loss: 0.3118687570095062, mean loss: 0.3476277322335106
Epoch: 30, step: 203, loss: 0.32358646392822266, mean loss: 0.34762717986543085
Epoch: 30, step: 204, loss: 0.32622238993644714, mean loss: 0.3476266880839276
Epoch: 30, step: 205, loss: 0.3245098292827606, mean loss: 0.347626156979328
Epoch: 30, step: 206, loss: 0.36252307891845703, mean loss: 0.3476264992248754
Epoch: 30, step: 207, loss: 0.3063766062259674, mean loss: 0.34762555156146335
Epoch: 30, step: 208, loss: 0.32518360018730164, mean loss: 0.347625035998244
Epoch: 30, step: 209, loss: 0.3180719017982483, mean loss: 0.3476243570840653
Epoch: 30, step: 210, loss: 0.34537065029144287, mean loss: 0.34762430531160904
Epoch: 30, step: 211, loss: 0.3304908275604248, mean loss: 0.34762391172809
Epoch: 30, step: 212, loss: 0.336078941822052, mean loss: 0.34762364652766947
Epoch: 30, step: 213, loss: 0.3281223177909851, mean loss: 0.34762319857138846
Epoch: 30, step: 214, loss: 0.3150881230831146, mean loss: 0.3476224512399198
Epoch: 30, step: 215, loss: 0.3023099899291992, mean loss: 0.34762141043549794
Epoch: 30, step: 216, loss: 0.31126701831817627, mean loss: 0.34762057541259517
Epoch: 30, step: 217, loss: 0.38411080837249756, mean loss: 0.34762141353637116
Epoch: 30, step: 218, loss: 0.30080515146255493, mean loss: 0.3476203382644983
Epoch: 30, step: 219, loss: 0.3918379843235016, mean loss: 0.3476213538282571
Epoch: 30, step: 220, loss: 0.33279168605804443, mean loss: 0.34762101323737105
Epoch: 30, step: 221, loss: 0.34685829281806946, mean loss: 0.34762099572048116
Epoch: 30, step: 222, loss: 0.31525948643684387, mean loss: 0.34762025251240447
Epoch: 30, step: 223, loss: 0.36016109585762024, mean loss: 0.34762054051633945
Epoch: 30, step: 224, loss: 0.32936331629753113, mean loss: 0.3476201212437658
Epoch: 30, step: 225, loss: 0.33693963289260864, mean loss: 0.347619875974663
Epoch: 30, step: 226, loss: 0.29738298058509827, mean loss: 0.34761872234994967
Epoch: 30, step: 227, loss: 0.338153600692749, mean loss: 0.3476185050007796
Epoch: 30, step: 228, loss: 0.3052915334701538, mean loss: 0.34761753306177917
Epoch: 30, step: 229, loss: 0.3283824026584625, mean loss: 0.34761709138255065
Epoch: 30, step: 230, loss: 0.3767630159854889, mean loss: 0.34761776061918365
Epoch: 30, step: 231, loss: 0.3158162832260132, mean loss: 0.3476170304236153
Epoch: 30, step: 232, loss: 0.33790066838264465, mean loss: 0.3476168073307849
Epoch: 30, step: 233, loss: 0.3077787160873413, mean loss: 0.34761589264806364
Epoch: 30, step: 234, loss: 0.34022611379623413, mean loss: 0.34761572298260957
Epoch: 30, step: 235, loss: 0.3531363010406494, mean loss: 0.34761584972928183
Epoch: 30, step: 236, loss: 0.36801832914352417, mean loss: 0.34761631813802013
Epoch: 30, step: 237, loss: 0.32427820563316345, mean loss: 0.3476157823440786
Epoch: 30, step: 238, loss: 0.352013498544693, mean loss: 0.3476158833040685
Epoch: 30, step: 239, loss: 0.34391656517982483, mean loss: 0.34761579837941003
Epoch: 30, step: 240, loss: 0.4654809534549713, mean loss: 0.3476185041289354
Epoch: 30, step: 241, loss: 0.2988927662372589, mean loss: 0.3476173855912675
Epoch: 30, step: 242, loss: 0.30333003401756287, mean loss: 0.3476163689635886
Epoch: 30, step: 243, loss: 0.32345050573349, mean loss: 0.34761581424264404
Epoch: 30, step: 244, loss: 0.34330376982688904, mean loss: 0.3476157152630867
Epoch: 30, step: 245, loss: 0.3070976138114929, mean loss: 0.3476147852235731
Epoch: 30, step: 246, loss: 0.3334035277366638, mean loss: 0.3476144590304111
Epoch: 30, step: 247, loss: 0.3280130922794342, mean loss: 0.3476140091275753
Epoch: 30, step: 248, loss: 0.3434523642063141, mean loss: 0.34761391360908916
Epoch: 30, step: 249, loss: 0.3151709735393524, mean loss: 0.34761316899260836
Epoch: 30, step: 250, loss: 0.365831583738327, mean loss: 0.34761358712427265
Epoch: 30, step: 251, loss: 0.33776694536209106, mean loss: 0.3476133611387369
Epoch: 30, step: 252, loss: 0.33441463112831116, mean loss: 0.3476130582279892
Epoch: 30, step: 253, loss: 0.318135142326355, mean loss: 0.3476123817255818
Epoch: 30, step: 254, loss: 0.3562788963317871, mean loss: 0.34761258061289346
Epoch: 30, step: 255, loss: 0.31376025080680847, mean loss: 0.34761180375568296
Epoch: 30, step: 256, loss: 0.3266600966453552, mean loss: 0.34761132295831026
Epoch: 30, step: 257, loss: 0.32130682468414307, mean loss: 0.3476107193395514
Epoch: 30, step: 258, loss: 0.31369128823280334, mean loss: 0.3476099409960578
Epoch: 30, step: 259, loss: 0.2947264611721039, mean loss: 0.3476087275155662
Epoch: 30, step: 260, loss: 0.3215675950050354, mean loss: 0.3476081299814915
Epoch: 30, step: 261, loss: 0.3560467064380646, mean loss: 0.3476083236067601
Epoch: 30, step: 262, loss: 0.32661959528923035, mean loss: 0.3476078420261365
Epoch: 30, step: 263, loss: 0.32998237013816833, mean loss: 0.34760743762378954
Epoch: 30, step: 264, loss: 0.34612229466438293, mean loss: 0.3476074035491547
Epoch: 30, step: 265, loss: 0.30613821744918823, mean loss: 0.34760645211552693
Epoch: 30, step: 266, loss: 0.3353033661842346, mean loss: 0.34760616985049536
Epoch: 30, step: 267, loss: 0.3071960508823395, mean loss: 0.3476052427577412
Epoch: 30, step: 268, loss: 0.3261023461818695, mean loss: 0.3476047494475809
Epoch: 30, step: 269, loss: 0.33139699697494507, mean loss: 0.3476043776248584
Epoch: 30, step: 270, loss: 0.31400159001350403, mean loss: 0.34760360675959695
Epoch: 30, step: 271, loss: 0.36288440227508545, mean loss: 0.34760395730087784
Epoch: 30, step: 272, loss: 0.33894965052604675, mean loss: 0.3476037587757299
Epoch: 30, step: 273, loss: 0.3393048048019409, mean loss: 0.34760356840655127
Epoch: 30, step: 274, loss: 0.32677751779556274, mean loss: 0.347603090690056
Epoch: 30, step: 275, loss: 0.3519531786441803, mean loss: 0.3476031904718698
Epoch: 30, step: 276, loss: 0.3479684591293335, mean loss: 0.3476031988501678
Epoch: 30, step: 277, loss: 0.3293921649456024, mean loss: 0.34760278114674326
Epoch: 30, step: 278, loss: 0.3609083592891693, mean loss: 0.34760308632755343
Epoch: 30, step: 279, loss: 0.33457496762275696, mean loss: 0.3476027875174914
Epoch: 30, step: 280, loss: 0.3162723183631897, mean loss: 0.3476020689452303
Epoch: 30, step: 281, loss: 0.3342708349227905, mean loss: 0.34760176319700725
Epoch: 30, step: 282, loss: 0.2918432056903839, mean loss: 0.3476004844189987
Epoch: 30, step: 283, loss: 0.3229161500930786, mean loss: 0.3475999183164777
Epoch: 30, step: 284, loss: 0.31910791993141174, mean loss: 0.3475992649052087
Epoch: 30, step: 285, loss: 0.33044081926345825, mean loss: 0.3475988714170272
Epoch: 30, step: 286, loss: 0.3362726867198944, mean loss: 0.34759861168384915
Epoch: 30, step: 287, loss: 0.37842079997062683, mean loss: 0.34759931848508485
Epoch: 30, step: 288, loss: 0.35435643792152405, mean loss: 0.3475994734329038
Epoch: 30, step: 289, loss: 0.2992178797721863, mean loss: 0.34759836401777744
Epoch: 30, step: 290, loss: 0.3346388638019562, mean loss: 0.34759806685650585
Epoch: 30, step: 291, loss: 0.34259048104286194, mean loss: 0.3475979520352224
Epoch: 30, step: 292, loss: 0.3277066946029663, mean loss: 0.3475974959497105
Epoch: 30, step: 293, loss: 0.41984111070632935, mean loss: 0.34759915238146993
Epoch: 30, step: 294, loss: 0.31332701444625854, mean loss: 0.34759836659360027
Epoch: 30, step: 295, loss: 0.3263164162635803, mean loss: 0.3475978786545336
Epoch: 30, step: 296, loss: 0.3582959473133087, mean loss: 0.34759812392744693
Epoch: 30, step: 297, loss: 0.3497299551963806, mean loss: 0.34759817280248173
Epoch: 30, step: 298, loss: 0.30903545022010803, mean loss: 0.34759728872163204
Epoch: 30, step: 299, loss: 0.34899598360061646, mean loss: 0.3475973207870809
Epoch: 30, step: 300, loss: 0.36564671993255615, mean loss: 0.3475977345648289
Epoch: 30, step: 301, loss: 0.3210130035877228, mean loss: 0.3475971251308053
Epoch: 30, step: 302, loss: 0.3472428619861603, mean loss: 0.34759711700978785
Epoch: 30, step: 303, loss: 0.3389890789985657, mean loss: 0.34759691968634177
Epoch: 30, step: 304, loss: 0.2929043769836426, mean loss: 0.3475956659890878
Epoch: 30, step: 305, loss: 0.3354881703853607, mean loss: 0.34759538845973365
Epoch: 30, step: 306, loss: 0.29897794127464294, mean loss: 0.34759427407077303
Epoch: 30, step: 307, loss: 0.3482975661754608, mean loss: 0.3475942901909735
Epoch: 30, step: 308, loss: 0.30256155133247375, mean loss: 0.3475932580165285
Epoch: 30, step: 309, loss: 0.31595367193222046, mean loss: 0.34759253283692537
Epoch: 30, step: 310, loss: 0.332709938287735, mean loss: 0.3475921917355399
Epoch: 30, step: 311, loss: 0.33189937472343445, mean loss: 0.3475918320725171
Epoch: 30, step: 312, loss: 0.3317042589187622, mean loss: 0.3475914679542315
Epoch: 30, step: 313, loss: 0.31786543130874634, mean loss: 0.3475907866956569
Epoch: 30, step: 314, loss: 0.3224121034145355, mean loss: 0.34759020966613285
Epoch: 30, step: 315, loss: 0.3228531777858734, mean loss: 0.34758964277109483
Epoch: 30, step: 316, loss: 0.37077784538269043, mean loss: 0.34759017415965526
Epoch: 30, step: 317, loss: 0.3396776020526886, mean loss: 0.3475899928366774
Epoch: 30, step: 318, loss: 0.3651806116104126, mean loss: 0.3475903959306707
Epoch: 30, step: 319, loss: 0.34277966618537903, mean loss: 0.3475902856939671
Epoch: 30, step: 320, loss: 0.34429433941841125, mean loss: 0.3475902101698894
Epoch: 30, step: 321, loss: 0.40917956829071045, mean loss: 0.3475916214103944
Epoch: 30, step: 322, loss: 0.31411394476890564, mean loss: 0.3475908543302981
Epoch: 30, step: 323, loss: 0.34165942668914795, mean loss: 0.34759071842553135
Epoch: 30, step: 324, loss: 0.3654381334781647, mean loss: 0.3475911273478604
Epoch: 30, step: 325, loss: 0.3216657340526581, mean loss: 0.3475905333554374
Epoch: 30, step: 326, loss: 0.3334084153175354, mean loss: 0.3475902084277668
Epoch: 30, step: 327, loss: 0.3460882604122162, mean loss: 0.34759017401730086
Epoch: 30, step: 328, loss: 0.34820112586021423, mean loss: 0.3475901880142273
Epoch: 30, step: 329, loss: 0.3160875141620636, mean loss: 0.34758946630348614
Epoch: 30, step: 330, loss: 0.37087392807006836, mean loss: 0.34758999972681587
Epoch: 30, step: 331, loss: 0.3084602355957031, mean loss: 0.34758910332426546
Epoch: 30, step: 332, loss: 0.361511766910553, mean loss: 0.3475894222637103
Epoch: 30, step: 333, loss: 0.3092244267463684, mean loss: 0.34758854342109524
Epoch: 30, step: 334, loss: 0.32909736037254333, mean loss: 0.347588119845719
Epoch: 30, step: 335, loss: 0.3087412416934967, mean loss: 0.3475872300051896
Epoch: 30, step: 336, loss: 0.32866138219833374, mean loss: 0.34758679649285923
Epoch: 30, step: 337, loss: 0.3121321201324463, mean loss: 0.3475859843925257
Epoch: 30, step: 338, loss: 0.35787513852119446, mean loss: 0.3475862200633869
Epoch: 30, step: 339, loss: 0.34591391682624817, mean loss: 0.3475861817605184
Epoch: 30, step: 340, loss: 0.30526140332221985, mean loss: 0.3475852123649838
Epoch: 30, step: 341, loss: 0.32437431812286377, mean loss: 0.34758468076097476
Epoch: 30, step: 342, loss: 0.35135263204574585, mean loss: 0.3475847670571817
Epoch: 30, step: 343, loss: 0.3705735504627228, mean loss: 0.34758529355002266
Epoch: 30, step: 344, loss: 0.3337702751159668, mean loss: 0.34758497716347886
Epoch: 30, step: 345, loss: 0.3386716842651367, mean loss: 0.34758477303915103
Epoch: 30, step: 346, loss: 0.3124891221523285, mean loss: 0.3475839693280903
Epoch: 30, step: 347, loss: 0.3161413073539734, mean loss: 0.347583249289115
Epoch: 30, step: 348, loss: 0.31537926197052, mean loss: 0.3475825118326283
Epoch: 30, step: 349, loss: 0.31918084621429443, mean loss: 0.3475818614624515
Epoch: 30, step: 350, loss: 0.3632197976112366, mean loss: 0.3475822195475915
Epoch: 30, step: 351, loss: 0.34167173504829407, mean loss: 0.3475820842095145
Epoch: 30, step: 352, loss: 0.3360883891582489, mean loss: 0.3475818210332946
Epoch: 30, step: 353, loss: 0.36162883043289185, mean loss: 0.34758214266651805
Epoch: 30, step: 354, loss: 0.3458893299102783, mean loss: 0.3475821039072105
Epoch: 30, step: 355, loss: 0.3741949796676636, mean loss: 0.3475827132321432
Epoch: 30, step: 356, loss: 0.3016479015350342, mean loss: 0.3475816615387646
Epoch: 30, step: 357, loss: 0.31669288873672485, mean loss: 0.34758095434583447
Epoch: 30, step: 358, loss: 0.3264220356941223, mean loss: 0.347580469927266
Epoch: 30, step: 359, loss: 0.29802197217941284, mean loss: 0.3475793353462736
Epoch: 30, step: 360, loss: 0.35314735770225525, mean loss: 0.3475794628163946
Epoch: 30, step: 361, loss: 0.31924816966056824, mean loss: 0.34757881423590026
Epoch: 30, step: 362, loss: 0.32175636291503906, mean loss: 0.34757822310316394
Epoch: 30, step: 363, loss: 0.31090518832206726, mean loss: 0.3475773835959123
Epoch: 30, step: 364, loss: 0.3161609172821045, mean loss: 0.3475766644367887
Epoch: 30, step: 365, loss: 0.3294387459754944, mean loss: 0.34757624924843405
Epoch: 30, step: 366, loss: 0.3353312313556671, mean loss: 0.3475759689586936
Epoch: 30, step: 367, loss: 0.38026270270347595, mean loss: 0.34757671714432226
Epoch: 30, step: 368, loss: 0.33448415994644165, mean loss: 0.34757641746803764
Epoch: 30, step: 369, loss: 0.32085850834846497, mean loss: 0.3475758059342972
Epoch: 30, step: 370, loss: 0.326794296503067, mean loss: 0.3475753302869229
Epoch: 30, step: 371, loss: 0.336397647857666, mean loss: 0.3475750744578826
Epoch: 30, step: 372, loss: 0.3813205063343048, mean loss: 0.34757584678827597
Epoch: 30, step: 373, loss: 0.35105931758880615, mean loss: 0.34757592651251273
Epoch: 30, step: 374, loss: 0.36582836508750916, mean loss: 0.34757634423624717
Epoch: 30, step: 375, loss: 0.3203432559967041, mean loss: 0.3475757209964028
Epoch: 30, step: 376, loss: 0.3099801540374756, mean loss: 0.3475748606268818
Epoch: 30, step: 377, loss: 0.3916151821613312, mean loss: 0.34757586846068506
Epoch: 30, step: 378, loss: 0.3323981463909149, mean loss: 0.34757552113644263
Epoch: 30, step: 379, loss: 0.3189330995082855, mean loss: 0.3475748657034534
Epoch: 30, step: 380, loss: 0.3058195412158966, mean loss: 0.3475739102259017
Epoch: 30, step: 381, loss: 0.36701878905296326, mean loss: 0.34757435516844043
Epoch: 30, step: 382, loss: 0.31059062480926514, mean loss: 0.3475735089169163
Epoch: 30, step: 383, loss: 0.36987847089767456, mean loss: 0.34757401928123033
Epoch: 30, step: 384, loss: 0.329232394695282, mean loss: 0.3475735996124376
Epoch: 30, step: 385, loss: 0.35157716274261475, mean loss: 0.3475736912145776
Epoch: 30, step: 386, loss: 0.31740444898605347, mean loss: 0.34757300095347005
Epoch: 30, step: 387, loss: 0.3309348523616791, mean loss: 0.3475726202874915
Epoch: 30, step: 388, loss: 0.37517815828323364, mean loss: 0.3475732518630937
Epoch: 30, step: 389, loss: 0.33047202229499817, mean loss: 0.3475728606201386
Epoch: 30, step: 390, loss: 0.3159219026565552, mean loss: 0.34757213652419106
Epoch: 30, step: 391, loss: 0.3420691192150116, mean loss: 0.34757201063159154
Epoch: 30, step: 392, loss: 0.33757370710372925, mean loss: 0.34757178190550253
Epoch: 30, step: 393, loss: 0.35196617245674133, mean loss: 0.3475718824314336
Epoch: 30, step: 394, loss: 0.33868464827537537, mean loss: 0.34757167913201337
Epoch: 30, step: 395, loss: 0.3287034034729004, mean loss: 0.3475712475217183
Epoch: 30, step: 396, loss: 0.33819305896759033, mean loss: 0.3475710330013131
Epoch: 30, step: 397, loss: 0.3480643033981323, mean loss: 0.34757104428431773
Epoch: 30, step: 398, loss: 0.31842225790023804, mean loss: 0.3475703775539171
Epoch: 30, step: 399, loss: 0.3303200900554657, mean loss: 0.34756998299107406
Epoch: 30, step: 400, loss: 0.2991560399532318, mean loss: 0.3475688756526546
Epoch: 30, step: 401, loss: 0.34742772579193115, mean loss: 0.3475688724243059
Epoch: 30, step: 402, loss: 0.3781123459339142, mean loss: 0.3475695709919593
Epoch: 30, step: 403, loss: 0.3064485490322113, mean loss: 0.34756863052397924
Epoch: 30, step: 404, loss: 0.30520862340927124, mean loss: 0.34756766174165526
Epoch: 30, step: 405, loss: 0.3414519727230072, mean loss: 0.34756752187775236
Epoch: 30, step: 406, loss: 0.36737051606178284, mean loss: 0.34756797475570383
Epoch: 30, step: 407, loss: 0.3420686423778534, mean loss: 0.3475678489934376
Epoch: 30, step: 408, loss: 0.32495808601379395, mean loss: 0.3475673319506747
Epoch: 30, step: 409, loss: 0.3278350234031677, mean loss: 0.34756688072020253
Epoch: 30, step: 410, loss: 0.3182806074619293, mean loss: 0.3475662110288335
Epoch: 30, step: 411, loss: 0.3323158025741577, mean loss: 0.3475658623045937
Epoch: 30, step: 412, loss: 0.33590009808540344, mean loss: 0.3475655955549031
Epoch: 30, step: 413, loss: 0.3221112787723541, mean loss: 0.3475650135290929
Epoch: 30, step: 414, loss: 0.3306695818901062, mean loss: 0.34756462721534787
Epoch: 30, step: 415, loss: 0.3716828525066376, mean loss: 0.3475651786655329
Epoch: 30, step: 416, loss: 0.3213956952095032, mean loss: 0.3475645803281193
Epoch: 30, step: 417, loss: 0.35134395956993103, mean loss: 0.3475646667376315
Epoch: 30, step: 418, loss: 0.3122756779193878, mean loss: 0.3475638599293181
Epoch: 30, step: 419, loss: 0.31505632400512695, mean loss: 0.3475631167300514
Epoch: 30, step: 420, loss: 0.3194553852081299, mean loss: 0.34756247413542574
Epoch: 30, step: 421, loss: 0.3783387541770935, mean loss: 0.3475631777219111
Epoch: 30, step: 422, loss: 0.30106523633003235, mean loss: 0.3475621147417453
Epoch: 30, step: 423, loss: 0.2833307981491089, mean loss: 0.34756064639599293
Epoch: 30, step: 424, loss: 0.3192519247531891, mean loss: 0.3475599992655405
Epoch: 30, step: 425, loss: 0.3958253264427185, mean loss: 0.3475611025738927
Epoch: 30, step: 426, loss: 0.34565332531929016, mean loss: 0.34756105896456513
Epoch: 30, step: 427, loss: 0.3044423460960388, mean loss: 0.3475600733489286
Epoch: 30, step: 428, loss: 0.3541613519191742, mean loss: 0.34756022423874483
Epoch: 30, step: 429, loss: 0.32080551981925964, mean loss: 0.3475596127026438
Epoch: 30, step: 430, loss: 0.3476448357105255, mean loss: 0.34755961465055374
Epoch: 30, step: 431, loss: 0.3238011300563812, mean loss: 0.34755907162430133
Epoch: 30, step: 432, loss: 0.3159794211387634, mean loss: 0.34755834985321166
Epoch: 30, step: 433, loss: 0.332516074180603, mean loss: 0.34755800606120013
Epoch: 30, step: 434, loss: 0.35129624605178833, mean loss: 0.3475580914969216
Epoch: 30, step: 435, loss: 0.3377678394317627, mean loss: 0.34755786775041675
Epoch: 30, step: 436, loss: 0.38851723074913025, mean loss: 0.34755880381465787
Epoch: 30, step: 437, loss: 0.315985769033432, mean loss: 0.34755808227722973
Epoch: 30, step: 438, loss: 0.3606197237968445, mean loss: 0.3475583807676321
Epoch: 30, step: 439, loss: 0.3486317992210388, mean loss: 0.34755840529730425
Epoch: 30, step: 440, loss: 0.28198179602622986, mean loss: 0.34755690678014806
Epoch: 30, step: 441, loss: 0.3257594108581543, mean loss: 0.3475564086882893
Epoch: 30, step: 442, loss: 0.31143367290496826, mean loss: 0.3475555832710239
Epoch: 30, step: 443, loss: 0.3269388973712921, mean loss: 0.34755511218323715
Epoch: 30, step: 444, loss: 0.3422223627567291, mean loss: 0.3475549903335987
Epoch: 30, step: 445, loss: 0.31424716114997864, mean loss: 0.34755422929011326
Epoch: 30, step: 446, loss: 0.2913155257701874, mean loss: 0.3475529443333303
Epoch: 30, step: 447, loss: 0.31922879815101624, mean loss: 0.3475522971905277
Epoch: 30, step: 448, loss: 0.3331069350242615, mean loss: 0.34755196715415115
Epoch: 30, step: 449, loss: 0.343526154756546, mean loss: 0.3475518751776285
Epoch: 30, step: 450, loss: 0.3545053005218506, mean loss: 0.3475520340368125
Epoch: 30, step: 451, loss: 0.36589911580085754, mean loss: 0.3475524531879083
Epoch: 30, step: 452, loss: 0.3567020297050476, mean loss: 0.3475526622111993
Epoch: 30, step: 453, loss: 0.3012230098247528, mean loss: 0.3475516038283148
Epoch: 30, step: 454, loss: 0.3131181001663208, mean loss: 0.3475508172262894
Epoch: 30, step: 455, loss: 0.31898051500320435, mean loss: 0.34755016457866916
Epoch: 30, step: 456, loss: 0.35200345516204834, mean loss: 0.34755026630538827
Epoch: 30, step: 457, loss: 0.32687097787857056, mean loss: 0.34754979393825347
Epoch: 30, step: 458, loss: 0.3911169469356537, mean loss: 0.34755078909924386
Epoch: 30, step: 459, loss: 0.3247859477996826, mean loss: 0.3475502691165737
Epoch: 30, step: 460, loss: 0.3096194267272949, mean loss: 0.34754940273978036
Epoch: 30, step: 461, loss: 0.29542076587677, mean loss: 0.34754821209894937
Epoch: 30, step: 462, loss: 0.3089835047721863, mean loss: 0.34754733128431065
Epoch: 30, step: 463, loss: 0.32518133521080017, mean loss: 0.34754682045852786
Epoch: 30, step: 464, loss: 0.3795081675052643, mean loss: 0.3475475504196343
Epoch: 30, step: 465, loss: 0.2928541600704193, mean loss: 0.3475463013128342
Epoch: 30, step: 466, loss: 0.32710564136505127, mean loss: 0.3475458344925463
Epoch: 30, step: 467, loss: 0.34181398153305054, mean loss: 0.3475457035924604
Epoch: 30, step: 468, loss: 0.3200894296169281, mean loss: 0.34754507657942113
Epoch: 30, step: 469, loss: 0.3287218511104584, mean loss: 0.34754464672727525
Epoch: 30, step: 470, loss: 0.33166778087615967, mean loss: 0.3475442841672549
Epoch: 30, step: 471, loss: 0.3318147659301758, mean loss: 0.347543924980229
Epoch: 30, step: 472, loss: 0.31086280941963196, mean loss: 0.34754308737797385
Epoch: 30, step: 473, loss: 0.31840065121650696, mean loss: 0.34754242193439344
Epoch: 30, step: 474, loss: 0.3985248804092407, mean loss: 0.34754358605035357
Epoch: 30, step: 475, loss: 0.32982203364372253, mean loss: 0.34754318141174717
Epoch: 30, step: 476, loss: 0.3623736500740051, mean loss: 0.3475435200301151
Epoch: 30, step: 477, loss: 0.37985771894454956, mean loss: 0.34754425783090315
Epoch: 30, step: 478, loss: 0.33873826265335083, mean loss: 0.34754405677619465
Epoch: 30, step: 479, loss: 0.35423269867897034, mean loss: 0.3475442094849139
Epoch: 30, step: 480, loss: 0.30902090668678284, mean loss: 0.3475433299775328
Epoch: 30, step: 481, loss: 0.3039523661136627, mean loss: 0.3475423347954894
Epoch: 30, step: 482, loss: 0.32081541419029236, mean loss: 0.34754172463361455
Epoch: 30, step: 483, loss: 0.2999892830848694, mean loss: 0.34754063906057214
Epoch: 30, step: 484, loss: 0.29205867648124695, mean loss: 0.347539372493683
Epoch: 30, step: 485, loss: 0.33280444145202637, mean loss: 0.34753903612581005
Epoch: 30, step: 486, loss: 0.2991552948951721, mean loss: 0.3475379316506981
Epoch: 30, step: 487, loss: 0.35334670543670654, mean loss: 0.34753806424688566
Epoch: 30, step: 488, loss: 0.34087324142456055, mean loss: 0.34753791211324137
Epoch: 30, step: 489, loss: 0.3374495804309845, mean loss: 0.3475376818386081
Epoch: 30, step: 490, loss: 0.3158125877380371, mean loss: 0.34753695770325166
Epoch: 30, step: 491, loss: 0.3203814625740051, mean loss: 0.3475363378845917
Epoch: 30, step: 492, loss: 0.31350788474082947, mean loss: 0.34753556120978873
Epoch: 30, step: 493, loss: 0.3360196053981781, mean loss: 0.34753529837243513
Epoch: 30, step: 494, loss: 0.35139185190200806, mean loss: 0.347535386391459
Epoch: 30, step: 495, loss: 0.3259943425655365, mean loss: 0.3475348947663945
Epoch: 30, step: 496, loss: 0.36062994599342346, mean loss: 0.3475351936241718
Epoch: 30, step: 497, loss: 0.3699464201927185, mean loss: 0.34753570508582154
Epoch: 30, step: 498, loss: 0.3453023135662079, mean loss: 0.34753565411725723
Epoch: 30, step: 499, loss: 0.29842689633369446, mean loss: 0.3475345334244735
Epoch: 30, step: 500, loss: 0.323137104511261, mean loss: 0.3475339766724844
Epoch: 30, step: 501, loss: 0.3923436105251312, mean loss: 0.34753499920988234
Epoch: 30, step: 502, loss: 0.32391780614852905, mean loss: 0.347534460287557
Epoch: 30, step: 503, loss: 0.324664831161499, mean loss: 0.3475339384358519
Epoch: 30, step: 504, loss: 0.3358205258846283, mean loss: 0.34753367115889694
Epoch: 30, step: 505, loss: 0.3329002857208252, mean loss: 0.3475333372615429
Epoch: 30, step: 506, loss: 0.35792985558509827, mean loss: 0.34753357447874517
Epoch: 30, step: 507, loss: 0.32708096504211426, mean loss: 0.34753310782251084
Epoch: 30, step: 508, loss: 0.32388246059417725, mean loss: 0.3475325682106733
Epoch: 30, step: 509, loss: 0.32647207379341125, mean loss: 0.34753208770657984
Epoch: 30, step: 510, loss: 0.3547080159187317, mean loss: 0.34753225142468375
Epoch: 30, step: 511, loss: 0.3439798355102539, mean loss: 0.34753217037850936
Epoch: 30, step: 512, loss: 0.3072752058506012, mean loss: 0.34753125196168805
Epoch: 30, step: 513, loss: 0.3199315369129181, mean loss: 0.34753062231997045
Epoch: 30, step: 514, loss: 0.375294953584671, mean loss: 0.3475312557026844
Epoch: 30, step: 515, loss: 0.33865290880203247, mean loss: 0.3475310531671679
Epoch: 30, step: 516, loss: 0.35451561212539673, mean loss: 0.3475312124973903
Epoch: 30, step: 517, loss: 0.3418884575366974, mean loss: 0.3475310837790418
Epoch: 30, step: 518, loss: 0.31973111629486084, mean loss: 0.3475304496412311
Epoch: 30, step: 519, loss: 0.3380964994430542, mean loss: 0.34753023445076126
Epoch: 30, step: 520, loss: 0.32118332386016846, mean loss: 0.34752963348566945
Epoch: 30, step: 521, loss: 0.3807936906814575, mean loss: 0.3475303922114848
Epoch: 30, step: 522, loss: 0.3345206379890442, mean loss: 0.3475300954764479
Epoch: 30, step: 523, loss: 0.32114794850349426, mean loss: 0.3475294937488005
Epoch: 30, step: 524, loss: 0.37292370200157166, mean loss: 0.3475300729301952
Epoch: 30, step: 525, loss: 0.347476065158844, mean loss: 0.3475300716984347
Epoch: 30, step: 526, loss: 0.3553300201892853, mean loss: 0.3475302495885638
Epoch: 30, step: 527, loss: 0.3634094297885895, mean loss: 0.34753061173005717
Epoch: 30, step: 528, loss: 0.3692695200443268, mean loss: 0.34753110749753907
Epoch: 30, step: 529, loss: 0.3255176246166229, mean loss: 0.34753060547968545
Epoch: 30, step: 530, loss: 0.30623579025268555, mean loss: 0.3475296637721936
Epoch: 30, step: 531, loss: 0.3699171543121338, mean loss: 0.34753017429601324
Epoch: 30, step: 532, loss: 0.30905115604400635, mean loss: 0.34752929684137496
Epoch: 30, step: 533, loss: 0.3533117175102234, mean loss: 0.34752942869754927
Epoch: 30, step: 534, loss: 0.31480300426483154, mean loss: 0.3475286824559706
Epoch: 30, step: 535, loss: 0.30937913060188293, mean loss: 0.3475278125738141
Epoch: 30, step: 536, loss: 0.31893473863601685, mean loss: 0.34752716061234984
Epoch: 30, step: 537, loss: 0.31237703561782837, mean loss: 0.3475263591593653
Epoch: 30, step: 538, loss: 0.3348056375980377, mean loss: 0.3475260691226212
Epoch: 30, step: 539, loss: 0.3891814351081848, mean loss: 0.34752701885736775
Epoch: 30, step: 540, loss: 0.37154892086982727, mean loss: 0.347527566539865
Epoch: 30, step: 541, loss: 0.3548886179924011, mean loss: 0.3475277343628428
Epoch: 30, step: 542, loss: 0.3840530216693878, mean loss: 0.3475285670757741
Epoch: 30, step: 543, loss: 0.30305296182632446, mean loss: 0.3475275531325576
Epoch: 30, step: 544, loss: 0.352183073759079, mean loss: 0.3475276592654797
Epoch: 30, step: 545, loss: 0.2944432497024536, mean loss: 0.34752644911617125
Epoch: 30, step: 546, loss: 0.33155858516693115, mean loss: 0.34752608510988064
Epoch: 30, step: 547, loss: 0.3014746606349945, mean loss: 0.3475250353372793
Epoch: 30, step: 548, loss: 0.32143113017082214, mean loss: 0.3475244405230559
Epoch: 30, step: 549, loss: 0.3357836604118347, mean loss: 0.3475241728964293
Epoch: 30, step: 550, loss: 0.3366343677043915, mean loss: 0.3475239246731111
Epoch: 30, step: 551, loss: 0.3160666525363922, mean loss: 0.3475232076492203
Epoch: 30, step: 552, loss: 0.40254950523376465, mean loss: 0.3475244618670213
Epoch: 30, step: 553, loss: 0.3462776243686676, mean loss: 0.3475244334484249
Epoch: 30, step: 554, loss: 0.34987136721611023, mean loss: 0.3475244869397928
Epoch: 30, step: 555, loss: 0.3691805303096771, mean loss: 0.34752498051357733
Epoch: 30, step: 556, loss: 0.328093945980072, mean loss: 0.34752453766118235
Epoch: 30, step: 557, loss: 0.3436557352542877, mean loss: 0.34752444948937855
Epoch: 30, step: 558, loss: 0.35972487926483154, mean loss: 0.34752472753650304
Epoch: 30, step: 559, loss: 0.34319791197776794, mean loss: 0.34752462893086133
Epoch: 30, step: 560, loss: 0.3324638307094574, mean loss: 0.34752428571174093
Epoch: 30, step: 561, loss: 0.31130680441856384, mean loss: 0.3475234603737597
Epoch: 30, step: 562, loss: 0.3137759864330292, mean loss: 0.347522691340787
Epoch: 30, step: 563, loss: 0.31152480840682983, mean loss: 0.3475218710444846
Epoch: 30, step: 564, loss: 0.3174643814563751, mean loss: 0.3475211861296028
Epoch: 30, step: 565, loss: 0.3121936619281769, mean loss: 0.34752038114568534
Epoch: 30, step: 566, loss: 0.3463600277900696, mean loss: 0.34752035470611653
Epoch: 30, step: 567, loss: 0.36403101682662964, mean loss: 0.34752073090603725
Epoch: 30, step: 568, loss: 0.3094150125980377, mean loss: 0.3475198626766789
Epoch: 30, step: 569, loss: 0.3752107322216034, mean loss: 0.3475204935919112
Epoch: 30, step: 570, loss: 0.33143100142478943, mean loss: 0.34752012701352
Epoch: 30, step: 571, loss: 0.3299081325531006, mean loss: 0.3475197257560138
Epoch: 30, step: 572, loss: 0.3072277009487152, mean loss: 0.3475188077958651
Epoch: 30, step: 573, loss: 0.30351758003234863, mean loss: 0.3475178053529853
Epoch: 30, step: 574, loss: 0.3264974057674408, mean loss: 0.34751732647385136
Epoch: 30, step: 575, loss: 0.3227151036262512, mean loss: 0.347516761451461
Epoch: 30, step: 576, loss: 0.31920453906059265, mean loss: 0.34751611648204644
Epoch: 30, step: 577, loss: 0.3206225335597992, mean loss: 0.3475155038440465
Epoch: 30, step: 578, loss: 0.3358447849750519, mean loss: 0.34751523799018036
Epoch: 30, step: 579, loss: 0.3381440341472626, mean loss: 0.34751502452312244
Epoch: 30, step: 580, loss: 0.32362332940101624, mean loss: 0.347514480305562
Epoch: 30, step: 581, loss: 0.32350778579711914, mean loss: 0.34751393348094106
Epoch: 30, step: 582, loss: 0.34810760617256165, mean loss: 0.3475139470033129
Epoch: 30, step: 583, loss: 0.3103816509246826, mean loss: 0.3475131012421959
Epoch: 30, step: 584, loss: 0.3293359875679016, mean loss: 0.3475126872320906
Epoch: 30, step: 585, loss: 0.2983657121658325, mean loss: 0.3475115678640073
Epoch: 30, step: 586, loss: 0.37052634358406067, mean loss: 0.34751209203499867
Epoch: 30, step: 587, loss: 0.2989599406719208, mean loss: 0.3475109862649485
Epoch: 30, step: 588, loss: 0.30353233218193054, mean loss: 0.3475099846786203
Epoch: 30, step: 589, loss: 0.3174133002758026, mean loss: 0.34750929926107527
Epoch: 30, step: 590, loss: 0.30971330404281616, mean loss: 0.3475084385201398
Epoch: 30, step: 591, loss: 0.3424086570739746, mean loss: 0.34750832238374324
Epoch: 30, step: 592, loss: 0.3543896973133087, mean loss: 0.347508479088476
Epoch: 30, step: 593, loss: 0.3562837541103363, mean loss: 0.34750867891711884
Epoch: 30, step: 594, loss: 0.3169853091239929, mean loss: 0.3475079838614478
Epoch: 30, step: 595, loss: 0.2924373745918274, mean loss: 0.3475067298626941
Epoch: 30, step: 596, loss: 0.3150686025619507, mean loss: 0.3475059912392157
Epoch: 30, step: 597, loss: 0.30449336767196655, mean loss: 0.347505011854372
Epoch: 30, step: 598, loss: 0.364213764667511, mean loss: 0.3475053922991183
Epoch: 30, step: 599, loss: 0.33155566453933716, mean loss: 0.3475050291450254
Epoch: 30, step: 600, loss: 0.2830120921134949, mean loss: 0.347503560760038
Epoch: 30, step: 601, loss: 0.31994375586509705, mean loss: 0.34750293328849996
Epoch: 30, step: 602, loss: 0.37313199043273926, mean loss: 0.3475035167881959
Epoch: 30, step: 603, loss: 0.32337456941604614, mean loss: 0.3475029674541787
Epoch: 30, step: 604, loss: 0.33210742473602295, mean loss: 0.34750261695804396
Epoch: 30, step: 605, loss: 0.3030129373073578, mean loss: 0.3475016041255609
Epoch: 30, step: 606, loss: 0.35323065519332886, mean loss: 0.3475017345476491
Epoch: 30, step: 607, loss: 0.3267202377319336, mean loss: 0.34750126146677096
Epoch: 30, step: 608, loss: 0.3375656306743622, mean loss: 0.3475010352920164
Epoch: 30, step: 609, loss: 0.3370632529258728, mean loss: 0.3475007976916894
Epoch: 30, step: 610, loss: 0.33859848976135254, mean loss: 0.34750059504872816
Epoch: 30, step: 611, loss: 0.3437339961528778, mean loss: 0.3475005093117051
Epoch: 30, step: 612, loss: 0.3180919885635376, mean loss: 0.3474998399169279
Epoch: 30, step: 613, loss: 0.3055991232395172, mean loss: 0.3474988861973331
Epoch: 30, step: 614, loss: 0.3376358449459076, mean loss: 0.34749866170566923
Epoch: 30, step: 615, loss: 0.2959226667881012, mean loss: 0.34749748781649137
Epoch: 30, step: 616, loss: 0.32454127073287964, mean loss: 0.3474969653361881
Epoch: 30, step: 617, loss: 0.38649988174438477, mean loss: 0.34749785301692937
Epoch: 30, step: 618, loss: 0.3080404996871948, mean loss: 0.34749695501394046
Epoch: 30, step: 619, loss: 0.33418071269989014, mean loss: 0.3474966519588127
Epoch: 30, step: 620, loss: 0.3398321568965912, mean loss: 0.34749647753185237
Epoch: 30, step: 621, loss: 0.3105567693710327, mean loss: 0.34749563688490503
Epoch: 30, step: 622, loss: 0.3660210371017456, mean loss: 0.34749605846286324
Epoch: 30, step: 623, loss: 0.33710959553718567, mean loss: 0.34749582210606994
Epoch: 30, step: 624, loss: 0.3413937985897064, mean loss: 0.3474956832501474
Epoch: 30, step: 625, loss: 0.34370529651641846, mean loss: 0.34749559699914084
Epoch: 30, step: 626, loss: 0.3707817792892456, mean loss: 0.34749612686880865
Epoch: 30, step: 627, loss: 0.298249751329422, mean loss: 0.3474950063087026
Epoch: 30, step: 628, loss: 0.2916821241378784, mean loss: 0.3474937363621243
Epoch: 30, step: 629, loss: 0.33667513728141785, mean loss: 0.3474934902051486
Epoch: 30, step: 630, loss: 0.31860318779945374, mean loss: 0.3474928328753403
Epoch: 30, step: 631, loss: 0.30441999435424805, mean loss: 0.3474918528781042
Epoch: 30, step: 632, loss: 0.3006880581378937, mean loss: 0.3474907880180323
Epoch: 30, step: 633, loss: 0.35704097151756287, mean loss: 0.34749100529481025
Epoch: 30, step: 634, loss: 0.32762476801872253, mean loss: 0.347490553327178
Epoch: 30, step: 635, loss: 0.38389745354652405, mean loss: 0.3474913815849862
Epoch: 30, step: 636, loss: 0.3440164029598236, mean loss: 0.3474913025309419
Epoch: 30, step: 637, loss: 0.31056010723114014, mean loss: 0.3474904623836354
Epoch: 30, step: 638, loss: 0.329111784696579, mean loss: 0.34749004429683433
Epoch: 30, step: 639, loss: 0.30140554904937744, mean loss: 0.34748899596891697
Epoch: 30, step: 640, loss: 0.3515763282775879, mean loss: 0.3474890889452439
Epoch: 30, step: 641, loss: 0.3488139808177948, mean loss: 0.3474891190824504
Epoch: 30, step: 642, loss: 0.3115623891353607, mean loss: 0.3474883018786666
Epoch: 30, step: 643, loss: 0.2909339964389801, mean loss: 0.34748701550105215
Epoch: 30, step: 644, loss: 0.2973082959651947, mean loss: 0.34748587416772936
Epoch: 30, step: 645, loss: 0.33867356181144714, mean loss: 0.3474856737330217
Epoch: 30, step: 646, loss: 0.34502068161964417, mean loss: 0.34748561766842523
Epoch: 30, step: 647, loss: 0.32997411489486694, mean loss: 0.3474852193900688
Epoch: 30, step: 648, loss: 0.3100108504295349, mean loss: 0.3474843670993876
Epoch: 30, step: 649, loss: 0.3417624831199646, mean loss: 0.34748423696784386
Epoch: 30, step: 650, loss: 0.35433974862098694, mean loss: 0.3474843928776856
Epoch: 30, step: 651, loss: 0.36190065741539, mean loss: 0.34748472072869396
Epoch: 30, step: 652, loss: 0.32814598083496094, mean loss: 0.3474842809420091
Epoch: 30, step: 653, loss: 0.3418593406677246, mean loss: 0.3474841530268712
Epoch: 30, step: 654, loss: 0.3931436836719513, mean loss: 0.34748519133342365
Epoch: 30, step: 655, loss: 0.3121274709701538, mean loss: 0.3474843873103119
Epoch: 30, step: 656, loss: 0.32640933990478516, mean loss: 0.3474839080814558
Epoch: 30, step: 657, loss: 0.34747663140296936, mean loss: 0.347483907915994
Epoch: 30, step: 658, loss: 0.2978256046772003, mean loss: 0.34748277877928696
Epoch: 30, step: 659, loss: 0.294838011264801, mean loss: 0.34748158176319976
Epoch: 30, step: 660, loss: 0.34482333064079285, mean loss: 0.34748152132230203
Epoch: 30, step: 661, loss: 0.3170357048511505, mean loss: 0.3474808290887412
Epoch: 30, step: 662, loss: 0.33893895149230957, mean loss: 0.3474806348801243
Epoch: 30, step: 663, loss: 0.3143001198768616, mean loss: 0.34747988050319173
Epoch: 30, step: 664, loss: 0.34641897678375244, mean loss: 0.34747985638352097
Epoch: 30, step: 665, loss: 0.3895670473575592, mean loss: 0.34748081321503493
Epoch: 30, step: 666, loss: 0.33527347445487976, mean loss: 0.34748053569352266
Epoch: 30, step: 667, loss: 0.302530974149704, mean loss: 0.3474795138338895
Epoch: 30, step: 668, loss: 0.38503551483154297, mean loss: 0.3474803675928064
Epoch: 30, step: 669, loss: 0.3389168679714203, mean loss: 0.34748017292357203
Epoch: 30, step: 670, loss: 0.34872281551361084, mean loss: 0.347480201171227
Epoch: 30, step: 671, loss: 0.315606027841568, mean loss: 0.3474794766264614
Epoch: 30, step: 672, loss: 0.30563321709632874, mean loss: 0.3474785254237807
Epoch: 30, step: 673, loss: 0.3589443862438202, mean loss: 0.34747878604706617
Epoch: 30, step: 674, loss: 0.3087880313396454, mean loss: 0.34747790661179606
Epoch: 30, step: 675, loss: 0.31174251437187195, mean loss: 0.34747709436995045
Epoch: 30, step: 676, loss: 0.31581413745880127, mean loss: 0.3474763747082255
Epoch: 30, step: 677, loss: 0.35417240858078003, mean loss: 0.34747652689773123
Epoch: 30, step: 678, loss: 0.3179605305194855, mean loss: 0.3474758560643855
Epoch: 30, step: 679, loss: 0.3639608919620514, mean loss: 0.3474762307242923
Epoch: 30, step: 680, loss: 0.337755411863327, mean loss: 0.34747600980161186
Epoch: 30, step: 681, loss: 0.2985767424106598, mean loss: 0.3474748985051392
Epoch: 30, step: 682, loss: 0.2971828281879425, mean loss: 0.3474737555814677
Epoch: 30, step: 683, loss: 0.37225577235221863, mean loss: 0.34747431875792373
Epoch: 30, step: 684, loss: 0.3858361840248108, mean loss: 0.34747519051943415
Epoch: 30, step: 685, loss: 0.3619401752948761, mean loss: 0.34747551922426473
Epoch: 30, step: 686, loss: 0.3215784728527069, mean loss: 0.34747493074865016
Epoch: 30, step: 687, loss: 0.3198069930076599, mean loss: 0.34747430204619284
Epoch: 30, step: 688, loss: 0.3179815411567688, mean loss: 0.34747363189324937
Epoch: 30, step: 689, loss: 0.3082737922668457, mean loss: 0.3474727411902358
Epoch: 30, step: 690, loss: 0.30484214425086975, mean loss: 0.3474717725551914
Epoch: 30, step: 691, loss: 0.35095691680908203, mean loss: 0.3474718517414191
Epoch: 30, step: 692, loss: 0.32174116373062134, mean loss: 0.3474712671257826
Epoch: 30, step: 693, loss: 0.3132242262363434, mean loss: 0.3474704890315196
Epoch: 30, step: 694, loss: 0.3476546108722687, mean loss: 0.3474704932146808
Epoch: 30, step: 695, loss: 0.3591301143169403, mean loss: 0.34747075810974404
Epoch: 30, step: 696, loss: 0.34524330496788025, mean loss: 0.3474707075053607
Epoch: 30, step: 697, loss: 0.3055897653102875, mean loss: 0.347469756054995
Epoch: 30, step: 698, loss: 0.3673035502433777, mean loss: 0.34747020662847894
Epoch: 30, step: 699, loss: 0.3347720801830292, mean loss: 0.34746991816581546
Epoch: 30, step: 700, loss: 0.32860803604125977, mean loss: 0.3474694896911755
Epoch: 30, step: 701, loss: 0.3110373020172119, mean loss: 0.3474686621007054
Epoch: 30, step: 702, loss: 0.4038957953453064, mean loss: 0.3474699438655385
Epoch: 30, step: 703, loss: 0.3051638603210449, mean loss: 0.3474689828878094
Epoch: 30, step: 704, loss: 0.32115787267684937, mean loss: 0.3474683852476002
Epoch: 30, step: 705, loss: 0.3243427574634552, mean loss: 0.3474678599755386
Epoch: 30, step: 706, loss: 0.30729079246520996, mean loss: 0.34746694742034495
Epoch: 30, step: 707, loss: 0.3015432059764862, mean loss: 0.34746590436271246
Epoch: 30, step: 708, loss: 0.3364452123641968, mean loss: 0.3474656540574137
Epoch: 30, step: 709, loss: 0.33123672008514404, mean loss: 0.3474652854693153
Epoch: 30, step: 710, loss: 0.3294195532798767, mean loss: 0.34746487562779027
Epoch: 30, step: 711, loss: 0.3055543601512909, mean loss: 0.34746392380830726
Epoch: 30, step: 712, loss: 0.3286312222480774, mean loss: 0.3474634961131341
Epoch: 30, step: 713, loss: 0.31075942516326904, mean loss: 0.347462662573802
Epoch: 30, step: 714, loss: 0.31018418073654175, mean loss: 0.34746181600898224
Epoch: 30, step: 715, loss: 0.3340078890323639, mean loss: 0.34746151048788637
Epoch: 30, step: 716, loss: 0.32579731941223145, mean loss: 0.34746101853359623
Epoch: 30, step: 717, loss: 0.3421947658061981, mean loss: 0.3474608989493116
Epoch: 30, step: 718, loss: 0.3650745749473572, mean loss: 0.347461298905623
Epoch: 30, step: 719, loss: 0.37362655997276306, mean loss: 0.3474618930305337
Epoch: 30, step: 720, loss: 0.3449455201625824, mean loss: 0.3474618358934826
Epoch: 30, step: 721, loss: 0.3045913279056549, mean loss: 0.3474608624929107
Epoch: 30, step: 722, loss: 0.3089691400527954, mean loss: 0.34745998853513216
Epoch: 30, step: 723, loss: 0.319139689207077, mean loss: 0.34745934553496577
Epoch: 30, step: 724, loss: 0.3397308886051178, mean loss: 0.3474591700676726
Epoch: 30, step: 725, loss: 0.4033638834953308, mean loss: 0.34746043930241416
Epoch: 30, step: 726, loss: 0.3593637943267822, mean loss: 0.34746070954454245
Epoch: 30, step: 727, loss: 0.3360961973667145, mean loss: 0.34746045154163246
Epoch: 30, step: 728, loss: 0.3462882339954376, mean loss: 0.3474604249299603
Epoch: 30, step: 729, loss: 0.334421306848526, mean loss: 0.3474601289227394
Epoch: 30, step: 730, loss: 0.4030071198940277, mean loss: 0.3474613898927735
Epoch: 30, step: 731, loss: 0.3014378547668457, mean loss: 0.3474603451380489
Epoch: 30, step: 732, loss: 0.3510107100009918, mean loss: 0.34746042573108143
Epoch: 30, step: 733, loss: 0.2928750216960907, mean loss: 0.34745918667437753
Epoch: 30, step: 734, loss: 0.33153030276298523, mean loss: 0.3474588251062488
Epoch: 30, step: 735, loss: 0.3521077334880829, mean loss: 0.3474589306289559
Epoch: 30, step: 736, loss: 0.3432845175266266, mean loss: 0.34745883587867554
Epoch: 30, step: 737, loss: 0.33152496814727783, mean loss: 0.3474584742220472
Epoch: 30, step: 738, loss: 0.2854299545288086, mean loss: 0.34745706637076385
Epoch: 30, step: 739, loss: 0.3143717348575592, mean loss: 0.3474563154553868
Epoch: 30, step: 740, loss: 0.3376213610172272, mean loss: 0.34745609224314833
Epoch: 30, step: 741, loss: 0.32245826721191406, mean loss: 0.347455524910185
Epoch: 30, step: 742, loss: 0.3569132387638092, mean loss: 0.34745573955090064
Epoch: 30, step: 743, loss: 0.3570024073123932, mean loss: 0.3474559562054885
Epoch: 30, step: 744, loss: 0.3324452340602875, mean loss: 0.3474556155559448
Epoch: 30, step: 745, loss: 0.3485507071018219, mean loss: 0.34745564040711224
Epoch: 30, step: 746, loss: 0.3505089282989502, mean loss: 0.34745570969451306
Epoch: 30, step: 747, loss: 0.3339941203594208, mean loss: 0.3474554042213957
Epoch: 30, step: 748, loss: 0.3531337082386017, mean loss: 0.347455533071699
Epoch: 30, step: 749, loss: 0.3083927631378174, mean loss: 0.34745464669162335
Epoch: 30, step: 750, loss: 0.31222060322761536, mean loss: 0.3474538472079841
Epoch: 30, step: 751, loss: 0.30492591857910156, mean loss: 0.34745288224318494
Epoch: 30, step: 752, loss: 0.32838600873947144, mean loss: 0.3474524496229071
Epoch: 30, step: 753, loss: 0.3451162278652191, mean loss: 0.3474523966161059
Epoch: 30, step: 754, loss: 0.35945940017700195, mean loss: 0.3474526690381946
Epoch: 30, step: 755, loss: 0.3020872175693512, mean loss: 0.3474516397830111
Epoch: 30, step: 756, loss: 0.3134974241256714, mean loss: 0.3474508694443842
Epoch: 30, step: 757, loss: 0.3105211555957794, mean loss: 0.3474500316179436
Epoch: 30, step: 758, loss: 0.3104197382926941, mean loss: 0.34744919152871
Epoch: 30, step: 759, loss: 0.3155009150505066, mean loss: 0.3474484667492981
Epoch: 30, step: 760, loss: 0.3192438781261444, mean loss: 0.3474478269137993
Epoch: 30, step: 761, loss: 0.3352539539337158, mean loss: 0.34744755029583774
Epoch: 30, step: 762, loss: 0.3432599902153015, mean loss: 0.34744745530320836
Epoch: 30, step: 763, loss: 0.3718351423740387, mean loss: 0.3474480085126964
Epoch: 30, step: 764, loss: 0.35227254033088684, mean loss: 0.34744811794973435
Epoch: 30, step: 765, loss: 0.3203839957714081, mean loss: 0.34744750405593183
Epoch: 30, step: 766, loss: 0.30384713411331177, mean loss: 0.3474465150938808
Epoch: 30, step: 767, loss: 0.30681517720222473, mean loss: 0.34744559349757587
Epoch: 30, step: 768, loss: 0.303850919008255, mean loss: 0.3474446047095678
Epoch: 30, step: 769, loss: 0.3273228704929352, mean loss: 0.34744414833092824
Epoch: 30, step: 770, loss: 0.36049404740333557, mean loss: 0.34744444430741034
Epoch: 30, step: 771, loss: 0.33944976329803467, mean loss: 0.3474442629892345
Epoch: 30, step: 772, loss: 0.3485240042209625, mean loss: 0.3474442874770496
Epoch: 30, step: 773, loss: 0.3303530514240265, mean loss: 0.34744389986794055
Epoch: 30, step: 774, loss: 0.3440109193325043, mean loss: 0.34744382201374996
Epoch: 30, step: 775, loss: 0.3088635504245758, mean loss: 0.3474429470983021
Epoch: 30, step: 776, loss: 0.3327104151248932, mean loss: 0.3474426130045548
Epoch: 30, step: 777, loss: 0.30209261178970337, mean loss: 0.347441584613217
Epoch: 30, step: 778, loss: 0.30012115836143494, mean loss: 0.3474405115633462
Epoch: 30, step: 779, loss: 0.326564759016037, mean loss: 0.3474400381902726
Epoch: 30, step: 780, loss: 0.3414666950702667, mean loss: 0.3474399027433866
Epoch: 30, step: 781, loss: 0.31075772643089294, mean loss: 0.3474390709857268
Epoch: 30, step: 782, loss: 0.32550621032714844, mean loss: 0.3474385736757783
Epoch: 30, step: 783, loss: 0.34414517879486084, mean loss: 0.3474384990023954
Epoch: 30, step: 784, loss: 0.3580593168735504, mean loss: 0.3474387398099653
Epoch: 30, step: 785, loss: 0.30683010816574097, mean loss: 0.3474378191045818
Epoch: 30, step: 786, loss: 0.30233797430992126, mean loss: 0.3474367965946674
Epoch: 30, step: 787, loss: 0.344194620847702, mean loss: 0.3474367230892773
Epoch: 30, step: 788, loss: 0.3130803108215332, mean loss: 0.34743594419126855
Epoch: 30, step: 789, loss: 0.3544965088367462, mean loss: 0.3474361042584788
Epoch: 30, step: 790, loss: 0.3348679542541504, mean loss: 0.34743581933748396
Epoch: 30, step: 791, loss: 0.3172873258590698, mean loss: 0.34743513588414976
Epoch: 30, step: 792, loss: 0.3280333876609802, mean loss: 0.3474346960648624
Epoch: 30, step: 793, loss: 0.35350942611694336, mean loss: 0.3474348337701272
Epoch: 30, step: 794, loss: 0.3782370984554291, mean loss: 0.347435531996687
Epoch: 30, step: 795, loss: 0.38531914353370667, mean loss: 0.34743639072394095
Epoch: 30, step: 796, loss: 0.33286747336387634, mean loss: 0.347436060490304
Epoch: 30, step: 797, loss: 0.29828640818595886, mean loss: 0.3474349464404308
Epoch: 30, step: 798, loss: 0.3498546779155731, mean loss: 0.34743500128599564
Epoch: 30, step: 799, loss: 0.3339325189590454, mean loss: 0.3474346952460517
Epoch: 30, step: 800, loss: 0.32011303305625916, mean loss: 0.3474340760021046
Epoch: 30, step: 801, loss: 0.3750082850456238, mean loss: 0.34743470095584744
Epoch: 30, step: 802, loss: 0.3573451340198517, mean loss: 0.34743492556507766
Epoch: 30, step: 803, loss: 0.3024100065231323, mean loss: 0.3474339051471862
Epoch: 30, step: 804, loss: 0.3627447187900543, mean loss: 0.3474342521344642
Epoch: 30, step: 805, loss: 0.37592217326164246, mean loss: 0.3474348977384421
Epoch: 30, step: 806, loss: 0.3445291519165039, mean loss: 0.3474348318888303
Epoch: 30, step: 807, loss: 0.3263133466243744, mean loss: 0.34743435324748545
Epoch: 30, step: 808, loss: 0.3043387234210968, mean loss: 0.34743337666451674
Epoch: 30, step: 809, loss: 0.31798839569091797, mean loss: 0.3474327094317732
Epoch: 30, step: 810, loss: 0.33565497398376465, mean loss: 0.34743244255054573
Epoch: 30, step: 811, loss: 0.3441609740257263, mean loss: 0.34743236842137587
Epoch: 30, step: 812, loss: 0.3215253949165344, mean loss: 0.34743178140092623
Epoch: 30, step: 813, loss: 0.35800331830978394, mean loss: 0.3474320209336427
Epoch: 30, step: 814, loss: 0.31233668327331543, mean loss: 0.34743122575209384
Epoch: 30, step: 815, loss: 0.3117370009422302, mean loss: 0.34743041701943095
Epoch: 30, step: 816, loss: 0.3626194894313812, mean loss: 0.34743076115411187
Epoch: 30, step: 817, loss: 0.29987579584121704, mean loss: 0.34742968373861244
Epoch: 30, step: 818, loss: 0.35729432106018066, mean loss: 0.3474299072288891
Epoch: 30, step: 819, loss: 0.33323097229003906, mean loss: 0.3474295855493481
Epoch: 30, step: 820, loss: 0.3488379716873169, mean loss: 0.347429617455878
Epoch: 30, step: 821, loss: 0.3263190686702728, mean loss: 0.347429139214095
Epoch: 30, step: 822, loss: 0.3110217750072479, mean loss: 0.3474283144544682
Epoch: 30, step: 823, loss: 0.33577314019203186, mean loss: 0.34742805042822994
Epoch: 30, step: 824, loss: 0.3471018075942993, mean loss: 0.3474280430379743
Epoch: 30, step: 825, loss: 0.3386918306350708, mean loss: 0.3474278451443395
Epoch: 30, step: 826, loss: 0.35007238388061523, mean loss: 0.34742790504736204
Epoch: 30, step: 827, loss: 0.32606732845306396, mean loss: 0.3474274212071746
Epoch: 30, step: 828, loss: 0.2901284694671631, mean loss: 0.34742612335327666
Epoch: 30, step: 829, loss: 0.3257010281085968, mean loss: 0.3474256312786392
Epoch: 30, step: 830, loss: 0.2980494797229767, mean loss: 0.34742451293134113
Epoch: 30, step: 831, loss: 0.30167973041534424, mean loss: 0.34742347685636116
Epoch: 30, step: 832, loss: 0.3085764944553375, mean loss: 0.34742259702979444
Epoch: 30, step: 833, loss: 0.33016642928123474, mean loss: 0.34742220621202596
Epoch: 30, step: 834, loss: 0.32665058970451355, mean loss: 0.34742173578701163
Epoch: 30, step: 835, loss: 0.35277312994003296, mean loss: 0.34742185697992206
Epoch: 30, step: 836, loss: 0.2979579269886017, mean loss: 0.34742073679671237
Epoch: 30, step: 837, loss: 0.3132854700088501, mean loss: 0.3474199637710593
Epoch: 30, step: 838, loss: 0.30840447545051575, mean loss: 0.3474190802481462
Epoch: 30, step: 839, loss: 0.34011271595954895, mean loss: 0.34741891479605636
Epoch: 30, step: 840, loss: 0.29969051480293274, mean loss: 0.3474178340143713
Epoch: 30, step: 841, loss: 0.4154268205165863, mean loss: 0.3474193740031966
Epoch: 30, step: 842, loss: 0.3601032793521881, mean loss: 0.3474196612098028
Epoch: 30, step: 843, loss: 0.3168923258781433, mean loss: 0.34741896998311744
Epoch: 30, step: 844, loss: 0.42217591404914856, mean loss: 0.34742066265704624
Epoch: 30, step: 845, loss: 0.35127586126327515, mean loss: 0.3474207499458794
Epoch: 30, step: 846, loss: 0.38588273525238037, mean loss: 0.34742162077671024
Epoch: 30, step: 847, loss: 0.3662688136100769, mean loss: 0.3474220474927226
Epoch: 30, step: 848, loss: 0.2973702847957611, mean loss: 0.34742091430513183
Epoch: 30, step: 849, loss: 0.3147006332874298, mean loss: 0.34742017352448845
Epoch: 30, step: 850, loss: 0.34389743208885193, mean loss: 0.3474200937721298
Epoch: 30, step: 851, loss: 0.3303678631782532, mean loss: 0.3474197077305063
Epoch: 30, step: 852, loss: 0.2991963028907776, mean loss: 0.34741861603637547
Epoch: 30, step: 853, loss: 0.37735462188720703, mean loss: 0.3474192937202133
Epoch: 30, step: 854, loss: 0.31793978810310364, mean loss: 0.34741862638562093
Epoch: 30, step: 855, loss: 0.3340379595756531, mean loss: 0.347418323491135
Epoch: 30, step: 856, loss: 0.3364226818084717, mean loss: 0.34741807459144325
Epoch: 30, step: 857, loss: 0.36743247509002686, mean loss: 0.34741852763142916
Epoch: 30, step: 858, loss: 0.3252949118614197, mean loss: 0.34741802685921225
Epoch: 30, step: 859, loss: 0.33161666989326477, mean loss: 0.34741766920061184
Epoch: 30, step: 860, loss: 0.323175847530365, mean loss: 0.3474171205072443
Epoch: 30, step: 861, loss: 0.35892102122306824, mean loss: 0.3474173808825265
Epoch: 30, step: 862, loss: 0.3336167335510254, mean loss: 0.34741706853055104
Epoch: 30, step: 863, loss: 0.33021271228790283, mean loss: 0.34741667915077007
Epoch: 30, step: 864, loss: 0.3681706488132477, mean loss: 0.3474171488569976
Epoch: 30, step: 865, loss: 0.321961373090744, mean loss: 0.3474165727519922
Epoch: 30, step: 866, loss: 0.3372688293457031, mean loss: 0.34741634309749186
Epoch: 30, step: 867, loss: 0.30353108048439026, mean loss: 0.34741534994861406
Epoch: 30, step: 868, loss: 0.39926186203956604, mean loss: 0.34741652323862043
Epoch: 30, step: 869, loss: 0.3718792200088501, mean loss: 0.34741707681854284
Epoch: 30, step: 870, loss: 0.3240087926387787, mean loss: 0.34741654711149433
Epoch: 30, step: 871, loss: 0.29581984877586365, mean loss: 0.34741537955405555
Epoch: 30, step: 872, loss: 0.31145986914634705, mean loss: 0.3474145659521184
Epoch: 30, step: 873, loss: 0.37046003341674805, mean loss: 0.34741508741357163
Epoch: 30, step: 874, loss: 0.3442511558532715, mean loss: 0.3474150158233112
Epoch: 30, step: 875, loss: 0.3343857228755951, mean loss: 0.3474147210162484
Epoch: 30, step: 876, loss: 0.33296433091163635, mean loss: 0.3474143940621541
Epoch: 30, step: 877, loss: 0.30162546038627625, mean loss: 0.34741335806655077
Epoch: 30, step: 878, loss: 0.336261510848999, mean loss: 0.3474131057566067
Epoch: 30, step: 879, loss: 0.3269619643688202, mean loss: 0.3474126430611002
Epoch: 30, step: 880, loss: 0.34828218817710876, mean loss: 0.34741266273362154
Epoch: 30, step: 881, loss: 0.34382036328315735, mean loss: 0.3474125814635557
Epoch: 30, step: 882, loss: 0.36488988995552063, mean loss: 0.3474129768509387
Epoch: 30, step: 883, loss: 0.38547563552856445, mean loss: 0.3474138379191379
Epoch: 30, step: 884, loss: 0.3613635003566742, mean loss: 0.34741415348666277
Epoch: 30, step: 885, loss: 0.33477920293807983, mean loss: 0.3474138676668521
Epoch: 30, step: 886, loss: 0.314492404460907, mean loss: 0.3474131229553086
Epoch: 30, step: 887, loss: 0.3294159471988678, mean loss: 0.34741271585307015
Epoch: 30, step: 888, loss: 0.3160659372806549, mean loss: 0.3474120067943135
Epoch: 30, step: 889, loss: 0.2995017170906067, mean loss: 0.34741092309628807
Epoch: 30, step: 890, loss: 0.30946627259254456, mean loss: 0.34741006483362713
Epoch: 30, step: 891, loss: 0.3120972812175751, mean loss: 0.3474092661187168
Epoch: 30, step: 892, loss: 0.3342669904232025, mean loss: 0.34740896886958883
Epoch: 30, step: 893, loss: 0.32825738191604614, mean loss: 0.34740853571296526
Epoch: 30, step: 894, loss: 0.3091229498386383, mean loss: 0.34740766981709564
Epoch: 30, step: 895, loss: 0.3427678346633911, mean loss: 0.34740756488143537
Epoch: 30, step: 896, loss: 0.31362664699554443, mean loss: 0.34740680090111364
Epoch: 30, step: 897, loss: 0.34022098779678345, mean loss: 0.3474066383923366
Epoch: 30, step: 898, loss: 0.3067191243171692, mean loss: 0.34740571825587774
Epoch: 30, step: 899, loss: 0.3192974328994751, mean loss: 0.3474050826094427
Epoch: 30, step: 900, loss: 0.3502027094364166, mean loss: 0.3474051458741094
Epoch: 30, step: 901, loss: 0.3660775423049927, mean loss: 0.34740556811635154
Epoch: 30, step: 902, loss: 0.3555522561073303, mean loss: 0.3474057523346992
Epoch: 30, step: 903, loss: 0.3019028902053833, mean loss: 0.3474047234168689
Epoch: 30, step: 904, loss: 0.3524813950061798, mean loss: 0.34740483820876467
Epoch: 30, step: 905, loss: 0.328372597694397, mean loss: 0.34740440786822935
Epoch: 30, step: 906, loss: 0.3285438120365143, mean loss: 0.34740398141841744
Epoch: 30, step: 907, loss: 0.3398172855377197, mean loss: 0.3474038098823796
Epoch: 30, step: 908, loss: 0.30830109119415283, mean loss: 0.34740292578554977
Epoch: 30, step: 909, loss: 0.3442210555076599, mean loss: 0.34740285384636194
Epoch: 30, step: 910, loss: 0.37238800525665283, mean loss: 0.3474034187250988
Epoch: 30, step: 911, loss: 0.3432864844799042, mean loss: 0.34740332564917537
Epoch: 30, step: 912, loss: 0.36967822909355164, mean loss: 0.34740382923029
Epoch: 30, step: 913, loss: 0.33219021558761597, mean loss: 0.34740348529545156
Epoch: 30, step: 914, loss: 0.3105878233909607, mean loss: 0.3474026530209652
Epoch: 30, step: 915, loss: 0.33972761034965515, mean loss: 0.34740247951877984
Epoch: 30, step: 916, loss: 0.32962679862976074, mean loss: 0.34740207769042597
Epoch: 30, step: 917, loss: 0.3288619816303253, mean loss: 0.34740165859155037
Epoch: 30, step: 918, loss: 0.3275035321712494, mean loss: 0.3474012088045656
Epoch: 30, step: 919, loss: 0.2995988130569458, mean loss: 0.3474001282802494
Epoch: 30, step: 920, loss: 0.354830265045166, mean loss: 0.34740029622710333
Epoch: 30, step: 921, loss: 0.3241613805294037, mean loss: 0.3473997709589035
Epoch: 30, step: 922, loss: 0.2971484363079071, mean loss: 0.3473986351558465
Epoch: 30, step: 923, loss: 0.3297276496887207, mean loss: 0.34739823575738643
Epoch: 30, step: 924, loss: 0.32633742690086365, mean loss: 0.347397759753118
Epoch: 30, step: 925, loss: 0.35824552178382874, mean loss: 0.3473980049224447
Epoch: 30, step: 926, loss: 0.32487231492996216, mean loss: 0.34739749583278906
Epoch: 30, step: 927, loss: 0.32525405287742615, mean loss: 0.34739699539338037
Epoch: 30, step: 928, loss: 0.3368453085422516, mean loss: 0.3473967569317914
Epoch: 30, step: 929, loss: 0.36871734261512756, mean loss: 0.34739723875293677
Epoch: 30, step: 930, loss: 0.3214673697948456, mean loss: 0.3473966527804399
Epoch: 30, step: 931, loss: 0.3376161754131317, mean loss: 0.3473964317626923
Epoch: 30, step: 932, loss: 0.32057440280914307, mean loss: 0.3473958256562373
Epoch: 30, step: 933, loss: 0.3050630986690521, mean loss: 0.34739486907091194
Epoch: 30, step: 934, loss: 0.332899808883667, mean loss: 0.3473945415359399
Epoch: 30, step: 935, loss: 0.29888349771499634, mean loss: 0.3473934453897943
Epoch: 30, step: 936, loss: 0.39208605885505676, mean loss: 0.3473944552326093
Epoch: 30, step: 937, loss: 0.3055741488933563, mean loss: 0.3473935103117738
Epoch: 30, step: 938, loss: 0.3403926193714142, mean loss: 0.34739335213172134
Epoch: 30, step: 939, loss: 0.3248867988586426, mean loss: 0.3473928436239655
Epoch: 30, step: 940, loss: 0.3163565993309021, mean loss: 0.3473921424142257
Epoch: 30, step: 941, loss: 0.3289842903614044, mean loss: 0.3473917265303512
Epoch: 30, step: 942, loss: 0.3738664388656616, mean loss: 0.34739232465321535
Epoch: 30, step: 943, loss: 0.32059234380722046, mean loss: 0.34739171919548795
Epoch: 30, step: 944, loss: 0.3328661620616913, mean loss: 0.34739139104554706
Epoch: 30, step: 945, loss: 0.3215705156326294, mean loss: 0.34739080773385383
Epoch: 30, step: 946, loss: 0.38199180364608765, mean loss: 0.347391589376972
Epoch: 30, step: 947, loss: 0.3332613706588745, mean loss: 0.34739127017983823
Epoch: 30, step: 948, loss: 0.3581104874610901, mean loss: 0.3473915123180677
Epoch: 30, step: 949, loss: 0.33382102847099304, mean loss: 0.34739120577901533
Epoch: 30, step: 950, loss: 0.2969329357147217, mean loss: 0.3473900660200294
Epoch: 30, step: 951, loss: 0.323618084192276, mean loss: 0.3473895290670608
Epoch: 30, step: 952, loss: 0.30861902236938477, mean loss: 0.3473886533525915
Epoch: 30, step: 953, loss: 0.30563294887542725, mean loss: 0.34738771023237475
Epoch: 30, step: 954, loss: 0.36689358949661255, mean loss: 0.3473881507943005
Epoch: 30, step: 955, loss: 0.30514225363731384, mean loss: 0.34738719664539014
Epoch: 30, step: 956, loss: 0.3798655569553375, mean loss: 0.3473879301720588
Epoch: 30, step: 957, loss: 0.30948492884635925, mean loss: 0.3473870741487216
Epoch: 30, step: 958, loss: 0.33775126934051514, mean loss: 0.347386856533039
Epoch: 30, step: 959, loss: 0.33825549483299255, mean loss: 0.34738665031439175
Epoch: 30, step: 960, loss: 0.3649842441082001, mean loss: 0.3473870477217176
Epoch: 30, step: 961, loss: 0.3008979260921478, mean loss: 0.3473859978793069
Epoch: 30, step: 962, loss: 0.3427017331123352, mean loss: 0.34738589209910303
Epoch: 30, step: 963, loss: 0.3494924008846283, mean loss: 0.34738593966727177
Epoch: 30, step: 964, loss: 0.2990606427192688, mean loss: 0.34738484843328854
Epoch: 30, step: 965, loss: 0.33418068289756775, mean loss: 0.3473845502766355
Epoch: 30, step: 966, loss: 0.3356117904186249, mean loss: 0.3473842844478402
Epoch: 30, step: 967, loss: 0.33620741963386536, mean loss: 0.34738403208004726
Epoch: 30, step: 968, loss: 0.3245459794998169, mean loss: 0.3473835164203444
Epoch: 30, step: 969, loss: 0.34453079104423523, mean loss: 0.34738345201019816
Epoch: 30, step: 970, loss: 0.32336169481277466, mean loss: 0.34738290964815627
Epoch: 30, step: 971, loss: 0.3148755729198456, mean loss: 0.3473821757156915
Epoch: 30, step: 972, loss: 0.3331082761287689, mean loss: 0.347381853454847
Epoch: 30, step: 973, loss: 0.3418021500110626, mean loss: 0.347381727485112
Epoch: 30, step: 974, loss: 0.3542284369468689, mean loss: 0.3473818820558189
Epoch: 30, step: 975, loss: 0.31945544481277466, mean loss: 0.3473812516052761
Epoch: 30, step: 976, loss: 0.3718070089817047, mean loss: 0.3473818030141159
Epoch: 30, step: 977, loss: 0.3387663960456848, mean loss: 0.34738160852662286
Epoch: 30, step: 978, loss: 0.31372904777526855, mean loss: 0.34738084885799037
Epoch: 30, step: 979, loss: 0.3252520263195038, mean loss: 0.3473803493360369
Epoch: 30, step: 980, loss: 0.34088990092277527, mean loss: 0.34738020282809323
Epoch: 30, step: 981, loss: 0.3142697811126709, mean loss: 0.3473794554482523
Epoch: 30, step: 982, loss: 0.31107017397880554, mean loss: 0.3473786358811469
Epoch: 30, step: 983, loss: 0.29473304748535156, mean loss: 0.347377447600441
Epoch: 30, step: 984, loss: 0.35751402378082275, mean loss: 0.3473776763912362
Epoch: 30, step: 985, loss: 0.3549010455608368, mean loss: 0.3473778461959843
Epoch: 30, step: 986, loss: 0.3500034809112549, mean loss: 0.34737790545602704
Epoch: 30, step: 987, loss: 0.31473949551582336, mean loss: 0.34737716883036257
Epoch: 30, step: 988, loss: 0.33892735838890076, mean loss: 0.3473769781284636
Epoch: 30, step: 989, loss: 0.3856901228427887, mean loss: 0.34737784278982026
Epoch: 30, step: 990, loss: 0.31796368956565857, mean loss: 0.3473771789782786
Epoch: 30, step: 991, loss: 0.3500395715236664, mean loss: 0.3473772390611578
Epoch: 30, step: 992, loss: 0.3342280685901642, mean loss: 0.3473769423272316
Epoch: 30, step: 993, loss: 0.34661567211151123, mean loss: 0.3473769251482314
Epoch: 30, step: 994, loss: 0.3469209372997284, mean loss: 0.34737691485853606
Epoch: 30, step: 995, loss: 0.34273573756217957, mean loss: 0.34737681012937965
Epoch: 30, step: 996, loss: 0.31700101494789124, mean loss: 0.34737612470854384
Epoch: 30, step: 997, loss: 0.31281229853630066, mean loss: 0.3473753448036255
Epoch: 30, step: 998, loss: 0.3303014934062958, mean loss: 0.3473749595546037
Epoch: 30, step: 999, loss: 0.3415175974369049, mean loss: 0.34737482739390607
Epoch: 30, step: 1000, loss: 0.33872631192207336, mean loss: 0.34737463226032445
Epoch: 30, step: 1001, loss: 0.36316898465156555, mean loss: 0.3473749886150104
Epoch: 30, step: 1002, loss: 0.3215906322002411, mean loss: 0.34737440687739307
Epoch: 30, step: 1003, loss: 0.3670291602611542, mean loss: 0.3473748503110494
Epoch: 30, step: 1004, loss: 0.34029585123062134, mean loss: 0.3473746906043584
Epoch: 30, step: 1005, loss: 0.32712048292160034, mean loss: 0.3473742336669473
Epoch: 30, step: 1006, loss: 0.3805537819862366, mean loss: 0.3473749821847428
Epoch: 30, step: 1007, loss: 0.34666284918785095, mean loss: 0.34737496611965984
Epoch: 30, step: 1008, loss: 0.32101142406463623, mean loss: 0.34737437139516675
Epoch: 30, step: 1009, loss: 0.34087738394737244, mean loss: 0.3473742248355582
Epoch: 30, step: 1010, loss: 0.32771316170692444, mean loss: 0.3473737813295888
Epoch: 30, step: 1011, loss: 0.3204544186592102, mean loss: 0.3473731741076572
Epoch: 30, step: 1012, loss: 0.2982404828071594, mean loss: 0.3473720658431297
Epoch: 30, step: 1013, loss: 0.3702163100242615, mean loss: 0.34737258111908453
Epoch: 30, step: 1014, loss: 0.3270823657512665, mean loss: 0.3473721234622588
Epoch: 30, step: 1015, loss: 0.3810224235057831, mean loss: 0.34737288244592995
Epoch: 30, step: 1016, loss: 0.337544709444046, mean loss: 0.3473726607761507
Epoch: 30, step: 1017, loss: 0.3364580571651459, mean loss: 0.3473724146079967
Epoch: 30, step: 1018, loss: 0.32778555154800415, mean loss: 0.34737197285552013
Epoch: 30, step: 1019, loss: 0.3211364150047302, mean loss: 0.3473713811649958
Epoch: 30, step: 1020, loss: 0.3165470361709595, mean loss: 0.3473706859992351
Epoch: 30, step: 1021, loss: 0.31869378685951233, mean loss: 0.3473700392783127
Epoch: 30, step: 1022, loss: 0.3147410452365875, mean loss: 0.3473693034464105
Epoch: 30, step: 1023, loss: 0.3516554832458496, mean loss: 0.3473694001039019
Epoch: 30, step: 1024, loss: 0.3337627053260803, mean loss: 0.34736909326672116
Epoch: 30, step: 1025, loss: 0.32766905426979065, mean loss: 0.34736864903186354
Epoch: 30, step: 1026, loss: 0.3364340662956238, mean loss: 0.3473684024631501
Epoch: 30, step: 1027, loss: 0.2977753281593323, mean loss: 0.3473672841923306
Epoch: 30, step: 1028, loss: 0.3408902883529663, mean loss: 0.34736713814629033
Epoch: 30, step: 1029, loss: 0.33336594700813293, mean loss: 0.3473668224486322
Epoch: 30, step: 1030, loss: 0.3388061225414276, mean loss: 0.34736662942705643
Epoch: 30, step: 1031, loss: 0.29293832182884216, mean loss: 0.34736540223758133
Epoch: 30, step: 1032, loss: 0.36517882347106934, mean loss: 0.3473658038659094
Epoch: 30, step: 1033, loss: 0.3190813958644867, mean loss: 0.34736516616901614
Epoch: 30, step: 1034, loss: 0.32846957445144653, mean loss: 0.3473647401608611
Epoch: 30, step: 1035, loss: 0.3321765661239624, mean loss: 0.3473643977455388
Epoch: 30, step: 1036, loss: 0.3223099708557129, mean loss: 0.3473638329096191
Epoch: 30, step: 1037, loss: 0.3048228919506073, mean loss: 0.34736287387312154
Epoch: 30, step: 1038, loss: 0.3310016095638275, mean loss: 0.3473625050355844
Epoch: 30, step: 1039, loss: 0.32836151123046875, mean loss: 0.347362076699385
Epoch: 30, step: 1040, loss: 0.31895455718040466, mean loss: 0.34736143632789834
Epoch: 30, step: 1041, loss: 0.33076906204223633, mean loss: 0.34736106230566566
Epoch: 30, step: 1042, loss: 0.305968314409256, mean loss: 0.34736012925903004
Epoch: 30, step: 1043, loss: 0.3059922456741333, mean loss: 0.3473591967938875
Epoch: 30, step: 1044, loss: 0.33952072262763977, mean loss: 0.3473590201124006
Epoch: 30, step: 1045, loss: 0.32633742690086365, mean loss: 0.34735854629025725
Epoch: 30, step: 1046, loss: 0.319513738155365, mean loss: 0.3473579186884781
Epoch: 30, step: 1047, loss: 0.31496763229370117, mean loss: 0.3473571886513704
Epoch: 30, step: 1048, loss: 0.37424251437187195, mean loss: 0.34735779459979654
Epoch: 30, step: 1049, loss: 0.33821675181388855, mean loss: 0.3473575885812528
Epoch: 30, step: 1050, loss: 0.33292338252067566, mean loss: 0.3473572632740463
Epoch: 30, step: 1051, loss: 0.3079008460044861, mean loss: 0.34735637405523107
Epoch: 30, step: 1052, loss: 0.33598166704177856, mean loss: 0.34735611771225194
Epoch: 30, step: 1053, loss: 0.34583690762519836, mean loss: 0.34735608347576014
Epoch: 30, step: 1054, loss: 0.33971428871154785, mean loss: 0.34735591126630067
Epoch: 30, step: 1055, loss: 0.3204062283039093, mean loss: 0.3473553039631872
Epoch: 30, step: 1056, loss: 0.3369300663471222, mean loss: 0.34735506903884317
Epoch: 30, step: 1057, loss: 0.35730770230293274, mean loss: 0.34735529330837456
Epoch: 30, step: 1058, loss: 0.324878066778183, mean loss: 0.34735478682498083
Epoch: 30, step: 1059, loss: 0.3352665901184082, mean loss: 0.34735451444560483
Epoch: 30, step: 1060, loss: 0.3190559446811676, mean loss: 0.34735387681757113
Epoch: 30, step: 1061, loss: 0.3097677528858185, mean loss: 0.34735302993991957
Epoch: 30, step: 1062, loss: 0.29959020018577576, mean loss: 0.3473519537884707
Epoch: 30, step: 1063, loss: 0.36243152618408203, mean loss: 0.34735229354091296
Epoch: 30, step: 1064, loss: 0.3551308810710907, mean loss: 0.34735246879353276
Epoch: 30, step: 1065, loss: 0.3024069368839264, mean loss: 0.34735145618748786
Epoch: 30, step: 1066, loss: 0.31001225113868713, mean loss: 0.3473506149680982
Epoch: 30, step: 1067, loss: 0.29625675082206726, mean loss: 0.3473494638942912
Epoch: 30, step: 1068, loss: 0.3433164954185486, mean loss: 0.34734937303915875
Epoch: 30, step: 1069, loss: 0.33350932598114014, mean loss: 0.34734906125616577
Epoch: 30, step: 1070, loss: 0.30065181851387024, mean loss: 0.3473480093032307
Epoch: 30, step: 1071, loss: 0.32924795150756836, mean loss: 0.347347601570806
Epoch: 30, step: 1072, loss: 0.3357203006744385, mean loss: 0.3473473396533664
Epoch: 30, step: 1073, loss: 0.34924402832984924, mean loss: 0.34734738237735335
Epoch: 30, step: 1074, loss: 0.3127574026584625, mean loss: 0.34734660323601496
Epoch: 30, step: 1075, loss: 0.33679869771003723, mean loss: 0.347346365649171
Epoch: 30, step: 1076, loss: 0.3706195652484894, mean loss: 0.3473468898557525
Epoch: 30, step: 1077, loss: 0.34370237588882446, mean loss: 0.347346807768407
Epoch: 30, step: 1078, loss: 0.3086211383342743, mean loss: 0.3473459355490004
Epoch: 30, step: 1079, loss: 0.34771931171417236, mean loss: 0.3473459439583735
Epoch: 30, step: 1080, loss: 0.2924051582813263, mean loss: 0.3473447065811595
Epoch: 30, step: 1081, loss: 0.3788450062274933, mean loss: 0.34734541601541125
Epoch: 30, step: 1082, loss: 0.30613216757774353, mean loss: 0.3473444878518088
Epoch: 30, step: 1083, loss: 0.356010764837265, mean loss: 0.34734468302064464
Epoch: 30, step: 1084, loss: 0.32001641392707825, mean loss: 0.3473440675883939
Epoch: 30, step: 1085, loss: 0.3237989842891693, mean loss: 0.34734353736537676
Epoch: 30, step: 1086, loss: 0.36313489079475403, mean loss: 0.34734389297042617
Epoch: 30, step: 1087, loss: 0.3410800099372864, mean loss: 0.3473437519173944
Epoch: 30, step: 1088, loss: 0.34228086471557617, mean loss: 0.3473436379115127
Epoch: 30, step: 1089, loss: 0.35532909631729126, mean loss: 0.3473438177236812
Epoch: 30, step: 1090, loss: 0.3011060357093811, mean loss: 0.3473427765901329
Epoch: 30, step: 1091, loss: 0.35016995668411255, mean loss: 0.34734284024815537
Epoch: 30, step: 1092, loss: 0.32767799496650696, mean loss: 0.34734239747587514
Epoch: 30, step: 1093, loss: 0.34351518750190735, mean loss: 0.3473423113046234
Epoch: 30, step: 1094, loss: 0.3263309597969055, mean loss: 0.3473418382358064
Epoch: 30, step: 1095, loss: 0.3423663377761841, mean loss: 0.347341726215353
Epoch: 30, step: 1096, loss: 0.3265364170074463, mean loss: 0.3473412578066534
Epoch: 30, step: 1097, loss: 0.32977667450904846, mean loss: 0.34734086236824335
Epoch: 30, step: 1098, loss: 0.3367733359336853, mean loss: 0.34734062446269764
Epoch: 30, step: 1099, loss: 0.3521907329559326, mean loss: 0.34734073365019186
Epoch: 30, step: 1100, loss: 0.2995753884315491, mean loss: 0.3473396583627103
Epoch: 30, step: 1101, loss: 0.33393892645835876, mean loss: 0.3473393566938997
Epoch: 30, step: 1102, loss: 0.3230476677417755, mean loss: 0.34733880986705434
Epoch: 30, step: 1103, loss: 0.33791446685791016, mean loss: 0.3473385977217498
Epoch: 30, step: 1104, loss: 0.3348783254623413, mean loss: 0.3473383172429145
Epoch: 30, step: 1105, loss: 0.36484426259994507, mean loss: 0.34733871129021465
Epoch: 30, step: 1106, loss: 0.3043932318687439, mean loss: 0.3473377446375165
Epoch: 30, step: 1107, loss: 0.33453866839408875, mean loss: 0.3473374565517093
Epoch: 30, step: 1108, loss: 0.2870495021343231, mean loss: 0.3473360996011946
Epoch: 30, step: 1109, loss: 0.30428022146224976, mean loss: 0.347335130528988
Epoch: 30, step: 1110, loss: 0.3154667615890503, mean loss: 0.34733441327371717
Epoch: 30, step: 1111, loss: 0.3098229467868805, mean loss: 0.34733356902933277
Epoch: 30, step: 1112, loss: 0.30606794357299805, mean loss: 0.3473326403136157
Epoch: 30, step: 1113, loss: 0.29980745911598206, mean loss: 0.3473315707456903
Epoch: 30, step: 1114, loss: 0.3518025577068329, mean loss: 0.3473316713642784
Epoch: 30, step: 1115, loss: 0.338595986366272, mean loss: 0.34733147477401377
Epoch: 30, step: 1116, loss: 0.31854331493377686, mean loss: 0.3473308269319038
Epoch: 30, step: 1117, loss: 0.36158981919288635, mean loss: 0.3473311478057564
Epoch: 30, step: 1118, loss: 0.34598302841186523, mean loss: 0.34733111746935386
Epoch: 30, step: 1119, loss: 0.36206385493278503, mean loss: 0.34733144898909873
Epoch: 30, step: 1120, loss: 0.36397233605384827, mean loss: 0.3473318234380775
Epoch: 30, step: 1121, loss: 0.3394126892089844, mean loss: 0.3473316452477569
Epoch: 30, step: 1122, loss: 0.34515801072120667, mean loss: 0.34733159633939054
Epoch: 30, step: 1123, loss: 0.35772189497947693, mean loss: 0.34733183012344776
Epoch: 30, step: 1124, loss: 0.3430083990097046, mean loss: 0.34733173284746366
Epoch: 30, step: 1125, loss: 0.3271388113498688, mean loss: 0.34733127852263135
Epoch: 30, step: 1126, loss: 0.2882590591907501, mean loss: 0.34732994947411666
Epoch: 30, step: 1127, loss: 0.33186379075050354, mean loss: 0.3473296015133822
Epoch: 30, step: 1128, loss: 0.3104797601699829, mean loss: 0.3473287724769282
Epoch: 30, step: 1129, loss: 0.31550946831703186, mean loss: 0.34732805663206523
Epoch: 30, step: 1130, loss: 0.3256802260875702, mean loss: 0.3473275696277111
Epoch: 30, step: 1131, loss: 0.3575461208820343, mean loss: 0.34732779950603504
Epoch: 30, step: 1132, loss: 0.32784485816955566, mean loss: 0.3473273612242242
Epoch: 30, step: 1133, loss: 0.3387558162212372, mean loss: 0.34732716840591754
Epoch: 30, step: 1134, loss: 0.3861323297023773, mean loss: 0.3473280413147309
Epoch: 30, step: 1135, loss: 0.39157092571258545, mean loss: 0.3473290365208762
Epoch: 30, step: 1136, loss: 0.33014482259750366, mean loss: 0.34732864998525925
Epoch: 30, step: 1137, loss: 0.32632964849472046, mean loss: 0.3473281776517874
Epoch: 30, step: 1138, loss: 0.3251610994338989, mean loss: 0.3473276790558177
Epoch: 30, step: 1139, loss: 0.32910221815109253, mean loss: 0.3473272691264226
Epoch: 30, step: 1140, loss: 0.3185817003250122, mean loss: 0.3473266225919586
Epoch: 30, step: 1141, loss: 0.3364812731742859, mean loss: 0.3473263786679467
Epoch: 30, step: 1142, loss: 0.3214484453201294, mean loss: 0.34732579665743574
Epoch: 30, step: 1143, loss: 0.3195669949054718, mean loss: 0.3473251723590876
Epoch: 30, step: 1144, loss: 0.35408470034599304, mean loss: 0.3473253243781585
Epoch: 30, step: 1145, loss: 0.34748053550720215, mean loss: 0.347325327868716
Epoch: 30, step: 1146, loss: 0.37212005257606506, mean loss: 0.3473258854670408
Epoch: 30, step: 1147, loss: 0.3173648416996002, mean loss: 0.3473252117006522
Epoch: 30, step: 1148, loss: 0.3417976200580597, mean loss: 0.3473250873985172
Epoch: 30, step: 1149, loss: 0.30465564131736755, mean loss: 0.34732412788769906
Epoch: 30, step: 1150, loss: 0.331946462392807, mean loss: 0.34732378209683545
Epoch: 30, step: 1151, loss: 0.35865479707717896, mean loss: 0.34732403688670277
Epoch: 30, step: 1152, loss: 0.3088151216506958, mean loss: 0.34732317099244703
Epoch: 30, step: 1153, loss: 0.2943311035633087, mean loss: 0.34732197946329674
Epoch: 30, step: 1154, loss: 0.37130460143089294, mean loss: 0.3473225187015647
Epoch: 30, step: 1155, loss: 0.3501584827899933, mean loss: 0.3473225824654843
Epoch: 30, step: 1156, loss: 0.31255534291267395, mean loss: 0.34732180077518254
Epoch: 30, step: 1157, loss: 0.34360790252685547, mean loss: 0.3473217172755142
Epoch: 30, step: 1158, loss: 0.36044976115226746, mean loss: 0.34732201242702115
Epoch: 30, step: 1159, loss: 0.32733359932899475, mean loss: 0.3473215630472303
Epoch: 30, step: 1160, loss: 0.36662644147872925, mean loss: 0.3473219970500277
Epoch: 30, step: 1161, loss: 0.3107130825519562, mean loss: 0.3473211740448908
Epoch: 30, step: 1162, loss: 0.319873571395874, mean loss: 0.34732055700910974
Epoch: 30, step: 1163, loss: 0.3417948782444, mean loss: 0.34732043279189084
Epoch: 30, step: 1164, loss: 0.32714274525642395, mean loss: 0.34731997920781676
Epoch: 30, step: 1165, loss: 0.3445777893066406, mean loss: 0.3473199175661789
Epoch: 30, step: 1166, loss: 0.33651718497276306, mean loss: 0.3473196747372043
Epoch: 30, step: 1167, loss: 0.2914726138114929, mean loss: 0.34731841940855557
Epoch: 30, step: 1168, loss: 0.3708310127258301, mean loss: 0.3473189479120804
Epoch: 30, step: 1169, loss: 0.323419451713562, mean loss: 0.3473184107240337
Epoch: 30, step: 1170, loss: 0.29870089888572693, mean loss: 0.3473173179746723
Epoch: 30, step: 1171, loss: 0.3199084997177124, mean loss: 0.3473167019354235
Epoch: 30, step: 1172, loss: 0.3204117715358734, mean loss: 0.34731609723512463
Epoch: 30, step: 1173, loss: 0.33626607060432434, mean loss: 0.34731584888643424
Epoch: 30, step: 1174, loss: 0.31613996624946594, mean loss: 0.34731514822607606
Epoch: 30, step: 1175, loss: 0.3463228940963745, mean loss: 0.347315125926226
Epoch: 30, step: 1176, loss: 0.3113267123699188, mean loss: 0.3473143171433068
Epoch: 30, step: 1177, loss: 0.3270680904388428, mean loss: 0.3473138621514711
Epoch: 30, step: 1178, loss: 0.3436184525489807, mean loss: 0.3473137791066925
Epoch: 30, step: 1179, loss: 0.3054417073726654, mean loss: 0.34731283816126024
Epoch: 30, step: 1180, loss: 0.37325748801231384, mean loss: 0.34731342117399816
Epoch: 30, step: 1181, loss: 0.32934868335723877, mean loss: 0.34731301749016785
Epoch: 30, step: 1182, loss: 0.31272509694099426, mean loss: 0.3473122402859221
Epoch: 30, step: 1183, loss: 0.3795188367366791, mean loss: 0.3473129639646128
Epoch: 30, step: 1184, loss: 0.31634294986724854, mean loss: 0.34731226808742827
Epoch: 30, step: 1185, loss: 0.3177264332771301, mean loss: 0.34731160332683847
Epoch: 30, step: 1186, loss: 0.31395071744918823, mean loss: 0.34731085376191884
Epoch: 30, step: 1187, loss: 0.3400917947292328, mean loss: 0.34731069156503214
Epoch: 30, step: 1188, loss: 0.3169173300266266, mean loss: 0.3473100087062499
Epoch: 30, step: 1189, loss: 0.3774469792842865, mean loss: 0.3473106857893903
Epoch: 30, step: 1190, loss: 0.35954970121383667, mean loss: 0.34731096075547563
Epoch: 30, step: 1191, loss: 0.30857226252555847, mean loss: 0.3473100904576182
Epoch: 30, step: 1192, loss: 0.31253671646118164, mean loss: 0.34730930926169795
Epoch: 30, step: 1193, loss: 0.31967929005622864, mean loss: 0.3473086885576676
Epoch: 30, step: 1194, loss: 0.35025733709335327, mean loss: 0.34730875479710455
Epoch: 30, step: 1195, loss: 0.35719388723373413, mean loss: 0.34730897685507106
Epoch: 30, step: 1196, loss: 0.37726107239723206, mean loss: 0.347309649678836
Epoch: 30, step: 1197, loss: 0.29785698652267456, mean loss: 0.3473085388323659
Epoch: 30, step: 1198, loss: 0.3074215352535248, mean loss: 0.34730764287774923
Epoch: 30, step: 1199, loss: 0.34207481145858765, mean loss: 0.3473075253388584
Epoch: 30, step: 1200, loss: 0.3083055317401886, mean loss: 0.3473066493029742
Epoch: 30, step: 1201, loss: 0.3313014507293701, mean loss: 0.3473062898133158
Epoch: 30, step: 1202, loss: 0.35356321930885315, mean loss: 0.3473064303458382
Epoch: 30, step: 1203, loss: 0.35672837495803833, mean loss: 0.3473066419608012
Epoch: 30, step: 1204, loss: 0.3390660285949707, mean loss: 0.347306456882455
Epoch: 30, step: 1205, loss: 0.3058822453022003, mean loss: 0.3473055265448639
Epoch: 30, step: 1206, loss: 0.3482097089290619, mean loss: 0.3473055468512484
Epoch: 30, step: 1207, loss: 0.3123224675655365, mean loss: 0.34730476120897197
Epoch: 30, step: 1208, loss: 0.3155685365200043, mean loss: 0.3473040484998456
Epoch: 30, step: 1209, loss: 0.3488270044326782, mean loss: 0.34730408270051777
Epoch: 30, step: 1210, loss: 0.29335394501686096, mean loss: 0.3473028711818525
Epoch: 30, step: 1211, loss: 0.3088013827800751, mean loss: 0.34730200660158655
Epoch: 30, step: 1212, loss: 0.33446288108825684, mean loss: 0.34730171829571194
Epoch: 30, step: 1213, loss: 0.32996666431427, mean loss: 0.3473013290413449
Epoch: 30, step: 1214, loss: 0.336232453584671, mean loss: 0.3473010804980541
Epoch: 30, step: 1215, loss: 0.3093472123146057, mean loss: 0.3473002282915653
Epoch: 30, step: 1216, loss: 0.3184957504272461, mean loss: 0.3472995815376783
Epoch: 30, step: 1217, loss: 0.3371753394603729, mean loss: 0.34729935422073377
Epoch: 30, step: 1218, loss: 0.3175439238548279, mean loss: 0.3472986861448819
Epoch: 30, step: 1219, loss: 0.3100905120372772, mean loss: 0.34729785075704833
Epoch: 30, step: 1220, loss: 0.30204352736473083, mean loss: 0.3472968347420646
Epoch: 30, step: 1221, loss: 0.3249594569206238, mean loss: 0.3472963332518346
Epoch: 30, step: 1222, loss: 0.3370688855648041, mean loss: 0.34729610364341834
Epoch: 30, step: 1223, loss: 0.3137032687664032, mean loss: 0.3472953494939285
Epoch: 30, step: 1224, loss: 0.33573225140571594, mean loss: 0.3472950899115267
Epoch: 30, step: 1225, loss: 0.3516945242881775, mean loss: 0.3472951886731299
Epoch: 30, step: 1226, loss: 0.3255796432495117, mean loss: 0.34729470119820627
Epoch: 30, step: 1227, loss: 0.3233999013900757, mean loss: 0.3472941648149835
Epoch: 30, step: 1228, loss: 0.31827157735824585, mean loss: 0.3472935133393621
Epoch: 30, step: 1229, loss: 0.332309752702713, mean loss: 0.34729317700354534
Epoch: 30, step: 1230, loss: 0.3607225716114044, mean loss: 0.3472934784422248
Epoch: 30, step: 1231, loss: 0.3931958079338074, mean loss: 0.3472945087512904
Epoch: 30, step: 1232, loss: 0.34207937121391296, mean loss: 0.3472943916966019
Epoch: 30, step: 1233, loss: 0.3628867268562317, mean loss: 0.3472947416614796
Epoch: 30, step: 1234, loss: 0.3307839334011078, mean loss: 0.3472943710900901
Epoch: 30, step: 1235, loss: 0.3449724316596985, mean loss: 0.3472943189772561
Epoch: 30, step: 1236, loss: 0.32922640442848206, mean loss: 0.3472939134761104
Epoch: 30, step: 1237, loss: 0.3788174092769623, mean loss: 0.34729462094717733
Epoch: 30, step: 1238, loss: 0.30960825085639954, mean loss: 0.3472937751838054
Epoch: 30, step: 1239, loss: 0.3177093267440796, mean loss: 0.3472931112599176
Epoch: 30, step: 1240, loss: 0.32799968123435974, mean loss: 0.3472926782931972
Epoch: 30, step: 1241, loss: 0.33074814081192017, mean loss: 0.34729230702311326
Epoch: 30, step: 1242, loss: 0.30361759662628174, mean loss: 0.34729132695645715
Epoch: 30, step: 1243, loss: 0.32775893807411194, mean loss: 0.3472908886567336
Epoch: 30, step: 1244, loss: 0.35238921642303467, mean loss: 0.34729100305879274
Epoch: 30, step: 1245, loss: 0.3237115740776062, mean loss: 0.34729047396870205
Epoch: 30, step: 1246, loss: 0.3364821672439575, mean loss: 0.34729023145054455
Epoch: 30, step: 1247, loss: 0.3520326316356659, mean loss: 0.347290337858734
Epoch: 30, step: 1248, loss: 0.35707730054855347, mean loss: 0.34729055744999
Epoch: 30, step: 1249, loss: 0.31047049164772034, mean loss: 0.34728973133229196
Epoch: 30, step: 1250, loss: 0.30817458033561707, mean loss: 0.34728885374033763
Epoch: 30, step: 1251, loss: 0.35288310050964355, mean loss: 0.34728897925067526
Epoch: 30, step: 1252, loss: 0.3204302191734314, mean loss: 0.34728837667153367
Epoch: 30, step: 1253, loss: 0.3160693347454071, mean loss: 0.3472876762847179
Epoch: 30, step: 1254, loss: 0.33651936054229736, mean loss: 0.34728743470724754
Epoch: 30, step: 1255, loss: 0.33729347586631775, mean loss: 0.34728721050680694
Epoch: 30, step: 1256, loss: 0.3447570502758026, mean loss: 0.3472871537474864
Epoch: 30, step: 1257, loss: 0.3286605775356293, mean loss: 0.3472867359051379
Epoch: 30, step: 1258, loss: 0.33389022946357727, mean loss: 0.34728643539354187
Epoch: 30, step: 1259, loss: 0.4179280698299408, mean loss: 0.3472880199972753
Epoch: 30, step: 1260, loss: 0.28003713488578796, mean loss: 0.34728651148725737
Epoch: 30, step: 1261, loss: 0.30183014273643494, mean loss: 0.34728549187466146
Epoch: 30, step: 1262, loss: 0.32418447732925415, mean loss: 0.3472849737171901
Epoch: 30, step: 1263, loss: 0.33280980587005615, mean loss: 0.347284649045383
Epoch: 30, step: 1264, loss: 0.3535456955432892, mean loss: 0.34728478947482105
Epoch: 30, step: 1265, loss: 0.32962971925735474, mean loss: 0.34728439349693074
Epoch: 30, step: 1266, loss: 0.39254283905029297, mean loss: 0.34728540855615325
Epoch: 30, step: 1267, loss: 0.3291354477405548, mean loss: 0.3472850014968365
Epoch: 30, step: 1268, loss: 0.37205037474632263, mean loss: 0.34728555691124924
Epoch: 30, step: 1269, loss: 0.366245836019516, mean loss: 0.34728598212495426
Epoch: 30, step: 1270, loss: 0.3434121608734131, mean loss: 0.3472858952504448
Epoch: 30, step: 1271, loss: 0.31106123328208923, mean loss: 0.3472850828925786
Epoch: 30, step: 1272, loss: 0.3236941993236542, mean loss: 0.34728455386596974
Epoch: 30, step: 1273, loss: 0.37509992718696594, mean loss: 0.34728517761296085
Epoch: 30, step: 1274, loss: 0.31188443303108215, mean loss: 0.34728438378529897
Epoch: 30, step: 1275, loss: 0.3166680335998535, mean loss: 0.34728369725847624
Epoch: 30, step: 1276, loss: 0.31684795022010803, mean loss: 0.34728301479671786
Epoch: 30, step: 1277, loss: 0.34132814407348633, mean loss: 0.3472828812734495
Epoch: 30, step: 1278, loss: 0.3490053713321686, mean loss: 0.34728291989516874
Epoch: 30, step: 1279, loss: 0.3389143943786621, mean loss: 0.34728273226006745
Epoch: 30, step: 1280, loss: 0.31182044744491577, mean loss: 0.3472819371594012
Epoch: 30, step: 1281, loss: 0.30999279022216797, mean loss: 0.34728110111736415
Epoch: 30, step: 1282, loss: 0.34367698431015015, mean loss: 0.34728102031300556
Epoch: 30, step: 1283, loss: 0.30785125494003296, mean loss: 0.3472801363168309
Epoch: 30, step: 1284, loss: 0.35973259806632996, mean loss: 0.34728041548871186
Epoch: 30, step: 1285, loss: 0.3677939176559448, mean loss: 0.34728087537083907
Epoch: 30, step: 1286, loss: 0.31447088718414307, mean loss: 0.3472801398363224
Epoch: 30, step: 1287, loss: 0.31513112783432007, mean loss: 0.3472794191357305
Epoch: 30, step: 1288, loss: 0.30477091670036316, mean loss: 0.3472784662225866
Epoch: 30, step: 1289, loss: 0.31181490421295166, mean loss: 0.3472776712537005
Epoch: 30, step: 1290, loss: 0.362653523683548, mean loss: 0.3472780159187479
Epoch: 30, step: 1291, loss: 0.30478745698928833, mean loss: 0.34727706347189663
Epoch: 30, step: 1292, loss: 0.3575662672519684, mean loss: 0.34727729410430824
Epoch: 30, step: 1293, loss: 0.32595565915107727, mean loss: 0.34727681619076195
Epoch: 30, step: 1294, loss: 0.4097227454185486, mean loss: 0.34727821585296587
Epoch: 30, step: 1295, loss: 0.3578779399394989, mean loss: 0.3472784534297116
Epoch: 30, step: 1296, loss: 0.3109948933124542, mean loss: 0.34727764020694635
Epoch: 30, step: 1297, loss: 0.32599177956581116, mean loss: 0.347277163138036
Epoch: 30, step: 1298, loss: 0.3207092881202698, mean loss: 0.3472765676994332
Epoch: 30, step: 1299, loss: 0.34475013613700867, mean loss: 0.34727651107837626
Epoch: 30, step: 1300, loss: 0.355072557926178, mean loss: 0.3472766857953671
Epoch: 30, step: 1301, loss: 0.33238211274147034, mean loss: 0.34727635200098195
Epoch: 30, step: 1302, loss: 0.33145928382873535, mean loss: 0.3472759975409911
Epoch: 30, step: 1303, loss: 0.29286620020866394, mean loss: 0.3472747782465008
Epoch: 30, step: 1304, loss: 0.3154662549495697, mean loss: 0.3472740654504606
Epoch: 30, step: 1305, loss: 0.3284004032611847, mean loss: 0.3472736425207293
Epoch: 30, step: 1306, loss: 0.3227851390838623, mean loss: 0.34727309378334076
Epoch: 30, step: 1307, loss: 0.3810328245162964, mean loss: 0.3472738502530623
Epoch: 30, step: 1308, loss: 0.3037310540676117, mean loss: 0.3472728745915824
Epoch: 30, step: 1309, loss: 0.30569279193878174, mean loss: 0.34727194292941227
Epoch: 30, step: 1310, loss: 0.34466785192489624, mean loss: 0.34727188458227676
Epoch: 30, step: 1311, loss: 0.30411815643310547, mean loss: 0.34727091770362134
Epoch: 30, step: 1312, loss: 0.33946242928504944, mean loss: 0.3472707427548521
Epoch: 30, step: 1313, loss: 0.3423645496368408, mean loss: 0.347270632834318
Epoch: 30, step: 1314, loss: 0.31742024421691895, mean loss: 0.3472699640679101
Epoch: 30, step: 1315, loss: 0.31528377532958984, mean loss: 0.3472692474672125
Epoch: 30, step: 1316, loss: 0.3196907341480255, mean loss: 0.3472686296274536
Epoch: 30, step: 1317, loss: 0.29780974984169006, mean loss: 0.34726752162799607
Epoch: 30, step: 1318, loss: 0.33835387229919434, mean loss: 0.3472673219449985
Epoch: 30, step: 1319, loss: 0.3302982449531555, mean loss: 0.34726694181334544
Epoch: 30, step: 1320, loss: 0.3137178421020508, mean loss: 0.3472661902822482
Epoch: 30, step: 1321, loss: 0.35013529658317566, mean loss: 0.3472662545514633
Epoch: 30, step: 1322, loss: 0.36226171255111694, mean loss: 0.34726659044864766
Epoch: 30, step: 1323, loss: 0.32686352729797363, mean loss: 0.34726613343173274
Epoch: 30, step: 1324, loss: 0.35248053073883057, mean loss: 0.34726625022862617
Epoch: 30, step: 1325, loss: 0.3147030174732208, mean loss: 0.3472655208635598
Epoch: 30, step: 1326, loss: 0.3441959023475647, mean loss: 0.3472654521104853
Epoch: 30, step: 1327, loss: 0.30659589171409607, mean loss: 0.34726454121726735
Epoch: 30, step: 1328, loss: 0.35504597425460815, mean loss: 0.34726471549738647
Epoch: 30, step: 1329, loss: 0.30475226044654846, mean loss: 0.3472637633707336
Epoch: 30, step: 1330, loss: 0.3317064642906189, mean loss: 0.347263414950786
Epoch: 30, step: 1331, loss: 0.34236302971839905, mean loss: 0.3472633052046328
Epoch: 30, step: 1332, loss: 0.3183927536010742, mean loss: 0.3472626586511738
Epoch: 30, step: 1333, loss: 0.36016425490379333, mean loss: 0.3472629475748145
Epoch: 30, step: 1334, loss: 0.3034641742706299, mean loss: 0.3472619667490771
Epoch: 30, step: 1335, loss: 0.3344462513923645, mean loss: 0.34726167976154226
Epoch: 30, step: 1336, loss: 0.3226284384727478, mean loss: 0.3472611281516874
Epoch: 30, step: 1337, loss: 0.32154008746147156, mean loss: 0.3472605521957402
Epoch: 30, step: 1338, loss: 0.347665011882782, mean loss: 0.3472605612523623
Epoch: 30, step: 1339, loss: 0.32921844720840454, mean loss: 0.3472601572641392
Epoch: 30, step: 1340, loss: 0.28889337182044983, mean loss: 0.3472588503792633
Epoch: 30, step: 1341, loss: 0.34390988945961, mean loss: 0.3472587753946921
Epoch: 30, step: 1342, loss: 0.3337787389755249, mean loss: 0.34725847357805595
Epoch: 30, step: 1343, loss: 0.3571561276912689, mean loss: 0.34725869518055713
Epoch: 30, step: 1344, loss: 0.3249742090702057, mean loss: 0.34725819625553506
Epoch: 30, step: 1345, loss: 0.3423601984977722, mean loss: 0.3472580865972322
Epoch: 30, step: 1346, loss: 0.33229297399520874, mean loss: 0.3472577515598981
Epoch: 30, step: 1347, loss: 0.34597888588905334, mean loss: 0.34725772292943174
Epoch: 30, step: 1348, loss: 0.3316527307033539, mean loss: 0.3472573735821836
Epoch: 30, step: 1349, loss: 0.3408648669719696, mean loss: 0.3472572304770435
Epoch: 30, step: 1350, loss: 0.33478274941444397, mean loss: 0.34725695122470834
Epoch: 30, step: 1351, loss: 0.3031645119190216, mean loss: 0.34725596419839866
Epoch: 30, step: 1352, loss: 0.3101900815963745, mean loss: 0.34725513448285233
Epoch: 30, step: 1353, loss: 0.32418766617774963, mean loss: 0.34725461813176883
Epoch: 30, step: 1354, loss: 0.3541000485420227, mean loss: 0.34725477135908633
Epoch: 30, step: 1355, loss: 0.309003084897995, mean loss: 0.3472539151569541
Epoch: 30, step: 1356, loss: 0.3166593611240387, mean loss: 0.3472532303626744
Epoch: 30, step: 1357, loss: 0.3503471910953522, mean loss: 0.34725329961288104
Epoch: 30, step: 1358, loss: 0.3325989246368408, mean loss: 0.3472529716204243
Epoch: 30, step: 1359, loss: 0.33820849657058716, mean loss: 0.3472527691926031
Epoch: 30, step: 1360, loss: 0.3195635974407196, mean loss: 0.34725214948463434
Epoch: 30, step: 1361, loss: 0.4076089560985565, mean loss: 0.34725350029271396
Epoch: 30, step: 1362, loss: 0.33889898657798767, mean loss: 0.34725331331973286
Epoch: 30, step: 1363, loss: 0.4285125732421875, mean loss: 0.34725513185119655
Epoch: 30, step: 1364, loss: 0.3396032750606537, mean loss: 0.34725496061125494
Epoch: 30, step: 1365, loss: 0.30260810256004333, mean loss: 0.34725396148718807
Epoch: 30, step: 1366, loss: 0.3266197443008423, mean loss: 0.3472534997373014
Epoch: 30, step: 1367, loss: 0.30680710077285767, mean loss: 0.34725259465318564
Epoch: 30, step: 1368, loss: 0.32641085982322693, mean loss: 0.3472521282803684
Epoch: 30, step: 1369, loss: 0.36613404750823975, mean loss: 0.34725255078918976
Epoch: 30, step: 1370, loss: 0.34514424204826355, mean loss: 0.34725250361394777
Epoch: 30, step: 1371, loss: 0.35507649183273315, mean loss: 0.34725267867857273
Epoch: 30, step: 1372, loss: 0.3805623948574066, mean loss: 0.3472534239790936
Epoch: 30, step: 1373, loss: 0.3361217677593231, mean loss: 0.3472531749153217
Epoch: 30, step: 1374, loss: 0.32635489106178284, mean loss: 0.3472527073398915
Epoch: 30, step: 1375, loss: 0.3407297432422638, mean loss: 0.3472525613992235
Epoch: 30, step: 1376, loss: 0.4043160080909729, mean loss: 0.34725383807208055
Epoch: 30, step: 1377, loss: 0.35592544078826904, mean loss: 0.3472540320763473
Epoch: 30, step: 1378, loss: 0.3246631324291229, mean loss: 0.34725352667578696
Epoch: 30, step: 1379, loss: 0.3641034960746765, mean loss: 0.3472539036325968
Epoch: 30, step: 1380, loss: 0.32184189558029175, mean loss: 0.34725333514401596
Epoch: 30, step: 1381, loss: 0.29216137528419495, mean loss: 0.34725210271683465
Epoch: 30, step: 1382, loss: 0.3063593804836273, mean loss: 0.34725118795222754
Epoch: 30, step: 1383, loss: 0.29529061913490295, mean loss: 0.3472500256274061
Epoch: 30, step: 1384, loss: 0.30139580368995667, mean loss: 0.34724899992061853
Epoch: 30, step: 1385, loss: 0.332456111907959, mean loss: 0.34724866902794166
Epoch: 30, step: 1386, loss: 0.34276241064071655, mean loss: 0.3472485686799338
Epoch: 30, step: 1387, loss: 0.34493523836135864, mean loss: 0.3472485169368382
Epoch: 30, step: 1388, loss: 0.3392990827560425, mean loss: 0.34724833913294684
Epoch: 30, step: 1389, loss: 0.3496493101119995, mean loss: 0.3472483928339305
Epoch: 30, step: 1390, loss: 0.31188687682151794, mean loss: 0.34724760194318743
Epoch: 30, step: 1391, loss: 0.3254704177379608, mean loss: 0.3472471148886114
Epoch: 30, step: 1392, loss: 0.29563963413238525, mean loss: 0.3472459606945122
Epoch: 30, step: 1393, loss: 0.3245280385017395, mean loss: 0.3472454526227183
Epoch: 30, step: 1394, loss: 0.34048956632614136, mean loss: 0.3472453015350229
Epoch: 30, step: 1395, loss: 0.3076840043067932, mean loss: 0.34724441681149604
Epoch: 30, step: 1396, loss: 0.3643537759780884, mean loss: 0.3472447994256957
Epoch: 30, step: 1397, loss: 0.3734739124774933, mean loss: 0.34724538597055576
Epoch: 30, step: 1398, loss: 0.38728564977645874, mean loss: 0.3472462813453138
Epoch: 30, step: 1399, loss: 0.3228147327899933, mean loss: 0.3472457350226717
Epoch: 30, step: 1400, loss: 0.3691680431365967, mean loss: 0.34724622522432447
Epoch: 30, step: 1401, loss: 0.3263494074344635, mean loss: 0.3472457579639651
Epoch: 30, step: 1402, loss: 0.3448796272277832, mean loss: 0.3472457050576141
Epoch: 30, step: 1403, loss: 0.30836939811706543, mean loss: 0.3472448358082862
Epoch: 30, step: 1404, loss: 0.323415607213974, mean loss: 0.34724430301390735
Epoch: 30, step: 1405, loss: 0.33206355571746826, mean loss: 0.3472439635972974
Epoch: 30, step: 1406, loss: 0.31084588170051575, mean loss: 0.34724314981408155
Epoch: 30, step: 1407, loss: 0.35316377878189087, mean loss: 0.3472432821837151
Epoch: 30, step: 1408, loss: 0.3988524079322815, mean loss: 0.3472444360017246
Epoch: 30, step: 1409, loss: 0.3365863263607025, mean loss: 0.34724419772518444
Epoch: 30, step: 1410, loss: 0.304350882768631, mean loss: 0.34724323880821506
Epoch: 30, step: 1411, loss: 0.3517966866493225, mean loss: 0.3472433406021845
Epoch: 30, step: 1412, loss: 0.310407429933548, mean loss: 0.3472425171405193
Epoch: 30, step: 1413, loss: 0.32866135239601135, mean loss: 0.34724210177044856
Epoch: 30, step: 1414, loss: 0.3370742201805115, mean loss: 0.34724187447903043
Epoch: 30, step: 1415, loss: 0.32649335265159607, mean loss: 0.3472414106798122
Epoch: 30, step: 1416, loss: 0.34988731145858765, mean loss: 0.3472414698232679
Epoch: 30, step: 1417, loss: 0.30348023772239685, mean loss: 0.34724049165633825
Epoch: 30, step: 1418, loss: 0.3537968099117279, mean loss: 0.34724063820226586
Epoch: 30, step: 1419, loss: 0.3027847111225128, mean loss: 0.34723964455168294
Epoch: 30, step: 1420, loss: 0.3284059166908264, mean loss: 0.34723922360159554
Epoch: 30, step: 1421, loss: 0.31362825632095337, mean loss: 0.34723847238423194
Epoch: 30, step: 1422, loss: 0.338844895362854, mean loss: 0.3472382847889205
Epoch: 30, step: 1423, loss: 0.3625182807445526, mean loss: 0.34723862628713154
Epoch: 30, step: 1424, loss: 0.3358175456523895, mean loss: 0.3472383710389332
Epoch: 30, step: 1425, loss: 0.3167770504951477, mean loss: 0.34723769027818263
Epoch: 30, step: 1426, loss: 0.3554718494415283, mean loss: 0.3472378742940756
Epoch: 30, step: 1427, loss: 0.32999080419540405, mean loss: 0.34723748886746214
Epoch: 30, step: 1428, loss: 0.31144773960113525, mean loss: 0.34723668907865646
Epoch: 30, step: 1429, loss: 0.33864492177963257, mean loss: 0.34723649708385645
Epoch: 30, step: 1430, loss: 0.3426434397697449, mean loss: 0.3472363944479977
Epoch: 30, step: 1431, loss: 0.3452151417732239, mean loss: 0.34723634928235875
Epoch: 30, step: 1432, loss: 0.3629056513309479, mean loss: 0.34723669941088753
Epoch: 30, step: 1433, loss: 0.3285151720046997, mean loss: 0.347236281090125
Epoch: 30, step: 1434, loss: 0.31458768248558044, mean loss: 0.3472355515940105
Epoch: 30, step: 1435, loss: 0.3644990622997284, mean loss: 0.3472359373190687
Epoch: 30, step: 1436, loss: 0.30153366923332214, mean loss: 0.3472349161990632
Epoch: 30, step: 1437, loss: 0.32648807764053345, mean loss: 0.34723445266542546
Epoch: 30, step: 1438, loss: 0.3656126856803894, mean loss: 0.3472348632696171
Epoch: 30, step: 1439, loss: 0.31056344509124756, mean loss: 0.34723404397966673
Epoch: 30, step: 1440, loss: 0.35999563336372375, mean loss: 0.3472343290847668
Epoch: 30, step: 1441, loss: 0.34050366282463074, mean loss: 0.34723417871913836
Epoch: 30, step: 1442, loss: 0.34025707840919495, mean loss: 0.34723402285156224
Epoch: 30, step: 1443, loss: 0.3546711206436157, mean loss: 0.3472341889917149
Valid: 30, mean loss: 0.18540334701538086
Epoch: 31, step: 0, loss: 0.3422512710094452, mean loss: 0.3472340776789039
Epoch: 31, step: 1, loss: 0.3121578097343445, mean loss: 0.3472332941318382
Epoch: 31, step: 2, loss: 0.31896382570266724, mean loss: 0.34723266265176517
Epoch: 31, step: 3, loss: 0.30785566568374634, mean loss: 0.3472317830726692
Epoch: 31, step: 4, loss: 0.2924058437347412, mean loss: 0.3472305584319728
Epoch: 31, step: 5, loss: 0.3103135824203491, mean loss: 0.34722973384014766
Epoch: 31, step: 6, loss: 0.3422320485115051, mean loss: 0.34722962221241255
Epoch: 31, step: 7, loss: 0.36486250162124634, mean loss: 0.34723001604961906
Epoch: 31, step: 8, loss: 0.34321579337120056, mean loss: 0.3472299263923998
Epoch: 31, step: 9, loss: 0.348699688911438, mean loss: 0.34722995921864985
Epoch: 31, step: 10, loss: 0.34528881311416626, mean loss: 0.347229915865303
Epoch: 31, step: 11, loss: 0.35576677322387695, mean loss: 0.3472301065222924
Epoch: 31, step: 12, loss: 0.31363868713378906, mean loss: 0.3472293563286799
Epoch: 31, step: 13, loss: 0.3304141163825989, mean loss: 0.34722898080409315
Epoch: 31, step: 14, loss: 0.3568829596042633, mean loss: 0.34722919639574995
Epoch: 31, step: 15, loss: 0.36670899391174316, mean loss: 0.3472296314068602
Epoch: 31, step: 16, loss: 0.30800867080688477, mean loss: 0.34722875556753996
Epoch: 31, step: 17, loss: 0.3114868998527527, mean loss: 0.3472279574375834
Epoch: 31, step: 18, loss: 0.314767062664032, mean loss: 0.3472272325889852
Epoch: 31, step: 19, loss: 0.3109578490257263, mean loss: 0.34722642271529003
Epoch: 31, step: 20, loss: 0.32695046067237854, mean loss: 0.3472259699752645
Epoch: 31, step: 21, loss: 0.33716943860054016, mean loss: 0.347225745428947
Epoch: 31, step: 22, loss: 0.2920239567756653, mean loss: 0.34722451288850775
Epoch: 31, step: 23, loss: 0.32570502161979675, mean loss: 0.347224032414022
Epoch: 31, step: 24, loss: 0.31348928809165955, mean loss: 0.34722327922140056
Epoch: 31, step: 25, loss: 0.37244805693626404, mean loss: 0.3472238424001841
Epoch: 31, step: 26, loss: 0.3249547481536865, mean loss: 0.3472233452223081
Epoch: 31, step: 27, loss: 0.30788809061050415, mean loss: 0.3472224670464148
Epoch: 31, step: 28, loss: 0.3646473288536072, mean loss: 0.3472228560550056
Epoch: 31, step: 29, loss: 0.3426571488380432, mean loss: 0.34722275412824716
Epoch: 31, step: 30, loss: 0.36405235528945923, mean loss: 0.34722312983091846
Epoch: 31, step: 31, loss: 0.32179421186447144, mean loss: 0.34722256217045844
Epoch: 31, step: 32, loss: 0.32219168543815613, mean loss: 0.34722200340811427
Epoch: 31, step: 33, loss: 0.35081416368484497, mean loss: 0.34722208359384304
Epoch: 31, step: 34, loss: 0.3326103389263153, mean loss: 0.34722175743154776
Epoch: 31, step: 35, loss: 0.34933558106422424, mean loss: 0.347221804615111
Epoch: 31, step: 36, loss: 0.2943381071090698, mean loss: 0.347220624201783
Epoch: 31, step: 37, loss: 0.30805179476737976, mean loss: 0.3472197499365843
Epoch: 31, step: 38, loss: 0.29175466299057007, mean loss: 0.34721851195950804
Epoch: 31, step: 39, loss: 0.34414735436439514, mean loss: 0.34721844341300334
Epoch: 31, step: 40, loss: 0.3189307153224945, mean loss: 0.3472178120609647
Epoch: 31, step: 41, loss: 0.34147360920906067, mean loss: 0.3472176838593209
Epoch: 31, step: 42, loss: 0.35229408740997314, mean loss: 0.3472177971541978
Epoch: 31, step: 43, loss: 0.33035802841186523, mean loss: 0.34721742088726465
Epoch: 31, step: 44, loss: 0.3201921880245209, mean loss: 0.34721681776662233
Epoch: 31, step: 45, loss: 0.34611204266548157, mean loss: 0.34721679311196707
Epoch: 31, step: 46, loss: 0.34778285026550293, mean loss: 0.34721680574406977
Epoch: 31, step: 47, loss: 0.3107879161834717, mean loss: 0.34721599281696186
Epoch: 31, step: 48, loss: 0.36856135725975037, mean loss: 0.3472164691377715
Epoch: 31, step: 49, loss: 0.30600184202194214, mean loss: 0.34721554945581684
Epoch: 31, step: 50, loss: 0.34399738907814026, mean loss: 0.3472154776459233
Epoch: 31, step: 51, loss: 0.33735477924346924, mean loss: 0.34721525761962907
Epoch: 31, step: 52, loss: 0.3480202853679657, mean loss: 0.3472152755821823
Epoch: 31, step: 53, loss: 0.297007292509079, mean loss: 0.3472141553183804
Epoch: 31, step: 54, loss: 0.34629255533218384, mean loss: 0.3472141347556729
Epoch: 31, step: 55, loss: 0.3722516894340515, mean loss: 0.3472146933802753
Epoch: 31, step: 56, loss: 0.3608265519142151, mean loss: 0.3472149970740468
Epoch: 31, step: 57, loss: 0.3363160490989685, mean loss: 0.3472147539133673
Epoch: 31, step: 58, loss: 0.3461492955684662, mean loss: 0.3472147301430185
Epoch: 31, step: 59, loss: 0.3049657344818115, mean loss: 0.34721378759001875
Epoch: 31, step: 60, loss: 0.3353706896305084, mean loss: 0.34721352338259076
Epoch: 31, step: 61, loss: 0.3334779143333435, mean loss: 0.34721321696200785
Epoch: 31, step: 62, loss: 0.3262828588485718, mean loss: 0.34721275004791335
Epoch: 31, step: 63, loss: 0.34108832478523254, mean loss: 0.34721261342738013
Epoch: 31, step: 64, loss: 0.3138898015022278, mean loss: 0.3472118700957884
Epoch: 31, step: 65, loss: 0.3523772358894348, mean loss: 0.34721198531697495
Epoch: 31, step: 66, loss: 0.34436458349227905, mean loss: 0.347211921802848
Epoch: 31, step: 67, loss: 0.39335134625434875, mean loss: 0.34721295096559895
Epoch: 31, step: 68, loss: 0.30298924446105957, mean loss: 0.3472119645558895
Epoch: 31, step: 69, loss: 0.33213281631469727, mean loss: 0.3472116282230117
Epoch: 31, step: 70, loss: 0.326494425535202, mean loss: 0.34721116614644904
Epoch: 31, step: 71, loss: 0.35910332202911377, mean loss: 0.3472114313832204
Epoch: 31, step: 72, loss: 0.33088526129722595, mean loss: 0.3472110672605073
Epoch: 31, step: 73, loss: 0.347867488861084, mean loss: 0.3472110819003575
Epoch: 31, step: 74, loss: 0.33866772055625916, mean loss: 0.34721089136619426
Epoch: 31, step: 75, loss: 0.3537687659263611, mean loss: 0.347211037616742
Epoch: 31, step: 76, loss: 0.30127206444740295, mean loss: 0.3472100131308213
Epoch: 31, step: 77, loss: 0.3397197127342224, mean loss: 0.34720984609321376
Epoch: 31, step: 78, loss: 0.3411152958869934, mean loss: 0.3472097101845947
Epoch: 31, step: 79, loss: 0.34252995252609253, mean loss: 0.34720960582821125
Epoch: 31, step: 80, loss: 0.34262815117836, mean loss: 0.3472095036662166
Epoch: 31, step: 81, loss: 0.3577024042606354, mean loss: 0.34720973764250423
Epoch: 31, step: 82, loss: 0.35052913427352905, mean loss: 0.3472098116585283
Epoch: 31, step: 83, loss: 0.31967249512672424, mean loss: 0.34720919764415686
Epoch: 31, step: 84, loss: 0.35742321610450745, mean loss: 0.3472094253865471
Epoch: 31, step: 85, loss: 0.36765193939208984, mean loss: 0.3472098811839608
Epoch: 31, step: 86, loss: 0.34118780493736267, mean loss: 0.3472097469154663
Epoch: 31, step: 87, loss: 0.30478647351264954, mean loss: 0.34720880106526114
Epoch: 31, step: 88, loss: 0.3438139259815216, mean loss: 0.3472087253763421
Epoch: 31, step: 89, loss: 0.31725722551345825, mean loss: 0.347208057620961
Epoch: 31, step: 90, loss: 0.3509375751018524, mean loss: 0.34720814076704243
Epoch: 31, step: 91, loss: 0.32829388976097107, mean loss: 0.34720771910102216
Epoch: 31, step: 92, loss: 0.34009259939193726, mean loss: 0.3472075604831987
Epoch: 31, step: 93, loss: 0.39133206009864807, mean loss: 0.34720854413159175
Epoch: 31, step: 94, loss: 0.3322314918041229, mean loss: 0.3472082102620822
Epoch: 31, step: 95, loss: 0.3389427661895752, mean loss: 0.3472080260123258
Epoch: 31, step: 96, loss: 0.3065856099128723, mean loss: 0.3472071204949254
Epoch: 31, step: 97, loss: 0.3197776973247528, mean loss: 0.3472065090771739
Epoch: 31, step: 98, loss: 0.3504108786582947, mean loss: 0.34720658050283826
Epoch: 31, step: 99, loss: 0.29512232542037964, mean loss: 0.34720541956633943
Epoch: 31, step: 100, loss: 0.3129413425922394, mean loss: 0.3472046558512614
Epoch: 31, step: 101, loss: 0.32985907793045044, mean loss: 0.34720426924274
Epoch: 31, step: 102, loss: 0.317162424325943, mean loss: 0.34720359966721864
Epoch: 31, step: 103, loss: 0.299508661031723, mean loss: 0.34720253666154344
Epoch: 31, step: 104, loss: 0.3120366930961609, mean loss: 0.347201752916785
Epoch: 31, step: 105, loss: 0.32446223497390747, mean loss: 0.34720124613011366
Epoch: 31, step: 106, loss: 0.35500606894493103, mean loss: 0.34720142006924615
Epoch: 31, step: 107, loss: 0.35827991366386414, mean loss: 0.34720166696026045
Epoch: 31, step: 108, loss: 0.3129711151123047, mean loss: 0.3472009041284496
Epoch: 31, step: 109, loss: 0.3385315537452698, mean loss: 0.347200710935278
Epoch: 31, step: 110, loss: 0.3126986026763916, mean loss: 0.34719994208606886
Epoch: 31, step: 111, loss: 0.3119998574256897, mean loss: 0.34719915770054743
Epoch: 31, step: 112, loss: 0.35986313223838806, mean loss: 0.3471994398935313
Epoch: 31, step: 113, loss: 0.3288748264312744, mean loss: 0.3471990315728962
Epoch: 31, step: 114, loss: 0.299195259809494, mean loss: 0.34719796194630553
Epoch: 31, step: 115, loss: 0.30589303374290466, mean loss: 0.347197041604768
Epoch: 31, step: 116, loss: 0.3456402122974396, mean loss: 0.34719700691683086
Epoch: 31, step: 117, loss: 0.2956814467906952, mean loss: 0.34719585911681916
Epoch: 31, step: 118, loss: 0.32848212122917175, mean loss: 0.3471954421719205
Epoch: 31, step: 119, loss: 0.3619626462459564, mean loss: 0.34719577118012107
Epoch: 31, step: 120, loss: 0.3958853483200073, mean loss: 0.34719685594289573
Epoch: 31, step: 121, loss: 0.33768269419670105, mean loss: 0.34719664398010674
Epoch: 31, step: 122, loss: 0.32050594687461853, mean loss: 0.3471960493603481
Epoch: 31, step: 123, loss: 0.31690481305122375, mean loss: 0.3471953745422161
Epoch: 31, step: 124, loss: 0.3699107766151428, mean loss: 0.34719588057714834
Epoch: 31, step: 125, loss: 0.34924232959747314, mean loss: 0.34719592616523076
Epoch: 31, step: 126, loss: 0.3468262851238251, mean loss: 0.3471959179310404
Epoch: 31, step: 127, loss: 0.3263514041900635, mean loss: 0.347195453605242
Epoch: 31, step: 128, loss: 0.33733904361724854, mean loss: 0.3471952340518598
Epoch: 31, step: 129, loss: 0.3014317750930786, mean loss: 0.3471942146849297
Epoch: 31, step: 130, loss: 0.3234548568725586, mean loss: 0.34719368590983646
Epoch: 31, step: 131, loss: 0.32625269889831543, mean loss: 0.3471932194765905
Epoch: 31, step: 132, loss: 0.29873114824295044, mean loss: 0.3471921400710348
Epoch: 31, step: 133, loss: 0.3453109562397003, mean loss: 0.3471920981719785
Epoch: 31, step: 134, loss: 0.33996087312698364, mean loss: 0.3471919371166088
Epoch: 31, step: 135, loss: 0.3414897620677948, mean loss: 0.34719181011939165
Epoch: 31, step: 136, loss: 0.3555895686149597, mean loss: 0.34719199714770943
Epoch: 31, step: 137, loss: 0.41446995735168457, mean loss: 0.3471934954765189
Epoch: 31, step: 138, loss: 0.3252929151058197, mean loss: 0.34719300774562406
Epoch: 31, step: 139, loss: 0.30605649948120117, mean loss: 0.3471920916466515
Epoch: 31, step: 140, loss: 0.3488214313983917, mean loss: 0.3471921279308014
Epoch: 31, step: 141, loss: 0.32390716671943665, mean loss: 0.34719160940407423
Epoch: 31, step: 142, loss: 0.3377566933631897, mean loss: 0.3471913993050687
Epoch: 31, step: 143, loss: 0.34074440598487854, mean loss: 0.34719125574505
Epoch: 31, step: 144, loss: 0.3077068030834198, mean loss: 0.34719037653481016
Epoch: 31, step: 145, loss: 0.34962165355682373, mean loss: 0.3471904306714617
Epoch: 31, step: 146, loss: 0.3409792482852936, mean loss: 0.3471902923716602
Epoch: 31, step: 147, loss: 0.3873354494571686, mean loss: 0.3471911862342601
Epoch: 31, step: 148, loss: 0.29895615577697754, mean loss: 0.34719011226836033
Epoch: 31, step: 149, loss: 0.3250895142555237, mean loss: 0.3471896202035696
Epoch: 31, step: 150, loss: 0.30773431062698364, mean loss: 0.3471887417596293
Epoch: 31, step: 151, loss: 0.33291393518447876, mean loss: 0.3471884239484579
Epoch: 31, step: 152, loss: 0.35153713822364807, mean loss: 0.34718852076512585
Epoch: 31, step: 153, loss: 0.37436050176620483, mean loss: 0.34718912568923205
Epoch: 31, step: 154, loss: 0.35039955377578735, mean loss: 0.3471891971607271
Epoch: 31, step: 155, loss: 0.3347669541835785, mean loss: 0.3471889206192539
Epoch: 31, step: 156, loss: 0.3232971727848053, mean loss: 0.34718838875781194
Epoch: 31, step: 157, loss: 0.3256847560405731, mean loss: 0.34718791006958083
Epoch: 31, step: 158, loss: 0.34131255745887756, mean loss: 0.3471877792823981
Epoch: 31, step: 159, loss: 0.32699206471443176, mean loss: 0.3471873297294961
Epoch: 31, step: 160, loss: 0.3368472754955292, mean loss: 0.34718709956690885
Epoch: 31, step: 161, loss: 0.3437838554382324, mean loss: 0.34718702381469124
Epoch: 31, step: 162, loss: 0.34034034609794617, mean loss: 0.347186871419078
Epoch: 31, step: 163, loss: 0.3768625259399414, mean loss: 0.34718753193489266
Epoch: 31, step: 164, loss: 0.3335098624229431, mean loss: 0.3471872275063607
Epoch: 31, step: 165, loss: 0.31145280599594116, mean loss: 0.34718643217091644
Epoch: 31, step: 166, loss: 0.3551000952720642, mean loss: 0.3471866083001613
Epoch: 31, step: 167, loss: 0.34940680861473083, mean loss: 0.34718665771261376
Epoch: 31, step: 168, loss: 0.3481496572494507, mean loss: 0.3471866791445132
Epoch: 31, step: 169, loss: 0.336483359336853, mean loss: 0.34718644094360057
Epoch: 31, step: 170, loss: 0.32700416445732117, mean loss: 0.3471859917998043
Epoch: 31, step: 171, loss: 0.33083054423332214, mean loss: 0.3471856278277648
Epoch: 31, step: 172, loss: 0.30397656559944153, mean loss: 0.3471846662802154
Epoch: 31, step: 173, loss: 0.3110273778438568, mean loss: 0.34718386167635146
Epoch: 31, step: 174, loss: 0.3373449742794037, mean loss: 0.3471836427376257
Epoch: 31, step: 175, loss: 0.3204740285873413, mean loss: 0.34718304839819203
Epoch: 31, step: 176, loss: 0.31430894136428833, mean loss: 0.3471823169034092
Epoch: 31, step: 177, loss: 0.296935498714447, mean loss: 0.347181198866424
Epoch: 31, step: 178, loss: 0.3150818645954132, mean loss: 0.3471804846432019
Epoch: 31, step: 179, loss: 0.3439233899116516, mean loss: 0.347180412173134
Epoch: 31, step: 180, loss: 0.336591511964798, mean loss: 0.3471801765762888
Epoch: 31, step: 181, loss: 0.33134663105010986, mean loss: 0.3471798242969864
Epoch: 31, step: 182, loss: 0.34377139806747437, mean loss: 0.34717974846486793
Epoch: 31, step: 183, loss: 0.32220184803009033, mean loss: 0.347179192758264
Epoch: 31, step: 184, loss: 0.34099486470222473, mean loss: 0.34717905517282144
Epoch: 31, step: 185, loss: 0.39876487851142883, mean loss: 0.34718020279959205
Epoch: 31, step: 186, loss: 0.30090799927711487, mean loss: 0.3471791734075091
Epoch: 31, step: 187, loss: 0.3474186658859253, mean loss: 0.34717917873524706
Epoch: 31, step: 188, loss: 0.3079468011856079, mean loss: 0.3471783059931042
Epoch: 31, step: 189, loss: 0.3437086045742035, mean loss: 0.34717822880972965
Epoch: 31, step: 190, loss: 0.3408059775829315, mean loss: 0.3471780870623995
Epoch: 31, step: 191, loss: 0.30393409729003906, mean loss: 0.3471771251443069
Epoch: 31, step: 192, loss: 0.3192060589790344, mean loss: 0.34717650297053715
Epoch: 31, step: 193, loss: 0.3022688925266266, mean loss: 0.3471755040913512
Epoch: 31, step: 194, loss: 0.3288581967353821, mean loss: 0.3471750966688694
Epoch: 31, step: 195, loss: 0.3299408257007599, mean loss: 0.3471747133443372
Epoch: 31, step: 196, loss: 0.319036602973938, mean loss: 0.3471740875106064
Epoch: 31, step: 197, loss: 0.39156726002693176, mean loss: 0.34717507485931237
Epoch: 31, step: 198, loss: 0.3606199324131012, mean loss: 0.347175373879786
Epoch: 31, step: 199, loss: 0.3570708930492401, mean loss: 0.3471755939562732
Epoch: 31, step: 200, loss: 0.3121030926704407, mean loss: 0.3471748139606925
Epoch: 31, step: 201, loss: 0.3097873032093048, mean loss: 0.3471739824989047
Epoch: 31, step: 202, loss: 0.35334330797195435, mean loss: 0.3471741196956373
Epoch: 31, step: 203, loss: 0.3202155530452728, mean loss: 0.3471735201900633
Epoch: 31, step: 204, loss: 0.31261879205703735, mean loss: 0.3471727517778653
Epoch: 31, step: 205, loss: 0.3822639286518097, mean loss: 0.3471735321020119
Epoch: 31, step: 206, loss: 0.3418540060520172, mean loss: 0.3471734138140919
Epoch: 31, step: 207, loss: 0.325615793466568, mean loss: 0.34717293445759567
Epoch: 31, step: 208, loss: 0.3620053827762604, mean loss: 0.34717326426544304
Epoch: 31, step: 209, loss: 0.3210790157318115, mean loss: 0.34717268405802243
Epoch: 31, step: 210, loss: 0.3652787506580353, mean loss: 0.34717308663871393
Epoch: 31, step: 211, loss: 0.3063089847564697, mean loss: 0.3471721780629873
Epoch: 31, step: 212, loss: 0.3162112832069397, mean loss: 0.34717148969126715
Epoch: 31, step: 213, loss: 0.317070335149765, mean loss: 0.34717082044953695
Epoch: 31, step: 214, loss: 0.3019360601902008, mean loss: 0.3471698147633221
Epoch: 31, step: 215, loss: 0.34551823139190674, mean loss: 0.3471697780451502
Epoch: 31, step: 216, loss: 0.3620237708091736, mean loss: 0.34717010827330796
Epoch: 31, step: 217, loss: 0.31051722168922424, mean loss: 0.3471692934387834
Epoch: 31, step: 218, loss: 0.35072776675224304, mean loss: 0.347169372545853
Epoch: 31, step: 219, loss: 0.3117378056049347, mean loss: 0.34716858489764607
Epoch: 31, step: 220, loss: 0.36489561200141907, mean loss: 0.3471689789629368
Epoch: 31, step: 221, loss: 0.3394494950771332, mean loss: 0.34716880736546457
Epoch: 31, step: 222, loss: 0.31587788462638855, mean loss: 0.34716811181068785
Epoch: 31, step: 223, loss: 0.35906335711479187, mean loss: 0.34716837621998153
Epoch: 31, step: 224, loss: 0.33189132809638977, mean loss: 0.3471680366470165
Epoch: 31, step: 225, loss: 0.3358861207962036, mean loss: 0.34716778588204983
Epoch: 31, step: 226, loss: 0.32289692759513855, mean loss: 0.3471672464217514
Epoch: 31, step: 227, loss: 0.31962814927101135, mean loss: 0.34716663433299894
Epoch: 31, step: 228, loss: 0.33157894015312195, mean loss: 0.34716628788590315
Epoch: 31, step: 229, loss: 0.31819063425064087, mean loss: 0.3471656438966238
Epoch: 31, step: 230, loss: 0.33729997277259827, mean loss: 0.34716542463512534
Epoch: 31, step: 231, loss: 0.33071252703666687, mean loss: 0.34716505898267624
Epoch: 31, step: 232, loss: 0.35054582357406616, mean loss: 0.34716513411578714
Epoch: 31, step: 233, loss: 0.36895042657852173, mean loss: 0.3471656182549147
Epoch: 31, step: 234, loss: 0.3185930550098419, mean loss: 0.3471649832949546
Epoch: 31, step: 235, loss: 0.3885709345340729, mean loss: 0.3471659034272044
Epoch: 31, step: 236, loss: 0.3153616189956665, mean loss: 0.34716519668103357
Epoch: 31, step: 237, loss: 0.35616737604141235, mean loss: 0.34716539672057317
Epoch: 31, step: 238, loss: 0.35556384921073914, mean loss: 0.3471655833404094
Epoch: 31, step: 239, loss: 0.34502190351486206, mean loss: 0.347165535707314
Epoch: 31, step: 240, loss: 0.3064929246902466, mean loss: 0.34716463197192865
Epoch: 31, step: 241, loss: 0.35809198021888733, mean loss: 0.3471648747695167
Epoch: 31, step: 242, loss: 0.33707258105278015, mean loss: 0.3471646505312045
Epoch: 31, step: 243, loss: 0.3649508059024811, mean loss: 0.3471650457088478
Epoch: 31, step: 244, loss: 0.3220781683921814, mean loss: 0.34716448833416014
Epoch: 31, step: 245, loss: 0.3208276331424713, mean loss: 0.3471639032007411
Epoch: 31, step: 246, loss: 0.3156059682369232, mean loss: 0.3471632020846814
Epoch: 31, step: 247, loss: 0.35855844616889954, mean loss: 0.34716345524481834
Epoch: 31, step: 248, loss: 0.3511531949043274, mean loss: 0.3471635438800939
Epoch: 31, step: 249, loss: 0.29806432127952576, mean loss: 0.3471624531256042
Epoch: 31, step: 250, loss: 0.3420601487159729, mean loss: 0.347162339778844
Epoch: 31, step: 251, loss: 0.3533063530921936, mean loss: 0.34716247626394514
Epoch: 31, step: 252, loss: 0.32262280583381653, mean loss: 0.34716193114386984
Epoch: 31, step: 253, loss: 0.2936864495277405, mean loss: 0.3471607432749815
Epoch: 31, step: 254, loss: 0.34264451265335083, mean loss: 0.3471606429566576
Epoch: 31, step: 255, loss: 0.3373817503452301, mean loss: 0.34716042574447165
Epoch: 31, step: 256, loss: 0.32741278409957886, mean loss: 0.3471599871126855
Epoch: 31, step: 257, loss: 0.31156590580940247, mean loss: 0.34715919651961313
Epoch: 31, step: 258, loss: 0.34800007939338684, mean loss: 0.34715921519635334
Epoch: 31, step: 259, loss: 0.30723366141319275, mean loss: 0.34715832843476435
Epoch: 31, step: 260, loss: 0.3399445116519928, mean loss: 0.34715816821673473
Epoch: 31, step: 261, loss: 0.2943617105484009, mean loss: 0.3471569956396089
Epoch: 31, step: 262, loss: 0.3488045930862427, mean loss: 0.3471570322309307
Epoch: 31, step: 263, loss: 0.30778875946998596, mean loss: 0.3471561579244378
Epoch: 31, step: 264, loss: 0.3396155536174774, mean loss: 0.3471559904633726
Epoch: 31, step: 265, loss: 0.3599741458892822, mean loss: 0.3471562751214989
Epoch: 31, step: 266, loss: 0.3332260549068451, mean loss: 0.34715596577415564
Epoch: 31, step: 267, loss: 0.363951176404953, mean loss: 0.34715633873584134
Epoch: 31, step: 268, loss: 0.3222750723361969, mean loss: 0.3471557862239856
Epoch: 31, step: 269, loss: 0.30668097734451294, mean loss: 0.3471548874628522
Epoch: 31, step: 270, loss: 0.31980326771736145, mean loss: 0.3471542801214567
Epoch: 31, step: 271, loss: 0.3337096869945526, mean loss: 0.3471539815915445
Epoch: 31, step: 272, loss: 0.38009846210479736, mean loss: 0.34715471308965745
Epoch: 31, step: 273, loss: 0.3193880021572113, mean loss: 0.34715409657225144
Epoch: 31, step: 274, loss: 0.33443886041641235, mean loss: 0.34715381425612196
Epoch: 31, step: 275, loss: 0.3507339656352997, mean loss: 0.34715389374438527
Epoch: 31, step: 276, loss: 0.3199640214443207, mean loss: 0.3471532900750107
Epoch: 31, step: 277, loss: 0.31895551085472107, mean loss: 0.3471526640419922
Epoch: 31, step: 278, loss: 0.31049174070358276, mean loss: 0.34715185013254257
Epoch: 31, step: 279, loss: 0.35483330488204956, mean loss: 0.34715202066479434
Epoch: 31, step: 280, loss: 0.32924652099609375, mean loss: 0.3471516231623042
Epoch: 31, step: 281, loss: 0.3771824538707733, mean loss: 0.3471522898326125
Epoch: 31, step: 282, loss: 0.32740065455436707, mean loss: 0.34715185136533877
Epoch: 31, step: 283, loss: 0.3494685888290405, mean loss: 0.34715190279353675
Epoch: 31, step: 284, loss: 0.34927991032600403, mean loss: 0.3471519500311565
Epoch: 31, step: 285, loss: 0.29084718227386475, mean loss: 0.3471507002027934
Epoch: 31, step: 286, loss: 0.31292587518692017, mean loss: 0.3471499405121092
Epoch: 31, step: 287, loss: 0.3453230559825897, mean loss: 0.3471498999615336
Epoch: 31, step: 288, loss: 0.3300391733646393, mean loss: 0.3471495201704743
Epoch: 31, step: 289, loss: 0.33985161781311035, mean loss: 0.3471493581892438
Epoch: 31, step: 290, loss: 0.28612178564071655, mean loss: 0.3471480036764806
Epoch: 31, step: 291, loss: 0.3177706003189087, mean loss: 0.34714735165669725
Epoch: 31, step: 292, loss: 0.3277166783809662, mean loss: 0.34714692041020334
Epoch: 31, step: 293, loss: 0.3358396589756012, mean loss: 0.34714666946117245
Epoch: 31, step: 294, loss: 0.32385069131851196, mean loss: 0.3471461524506276
Epoch: 31, step: 295, loss: 0.32840850949287415, mean loss: 0.347145736613012
Epoch: 31, step: 296, loss: 0.3297075033187866, mean loss: 0.34714534962130533
Epoch: 31, step: 297, loss: 0.381555438041687, mean loss: 0.347146113237843
Epoch: 31, step: 298, loss: 0.30277493596076965, mean loss: 0.347145128590188
Epoch: 31, step: 299, loss: 0.3592572808265686, mean loss: 0.3471453973668664
Epoch: 31, step: 300, loss: 0.31662678718566895, mean loss: 0.34714472015372577
Epoch: 31, step: 301, loss: 0.3163498640060425, mean loss: 0.34714403682580347
Epoch: 31, step: 302, loss: 0.32416871190071106, mean loss: 0.34714352702206847
Epoch: 31, step: 303, loss: 0.33964598178863525, mean loss: 0.3471433606613417
Epoch: 31, step: 304, loss: 0.35339927673339844, mean loss: 0.3471434994688607
Epoch: 31, step: 305, loss: 0.3113269805908203, mean loss: 0.3471427047823979
Epoch: 31, step: 306, loss: 0.2954719066619873, mean loss: 0.34714155835125327
Epoch: 31, step: 307, loss: 0.31293371319770813, mean loss: 0.34714079939125253
Epoch: 31, step: 308, loss: 0.3452393114566803, mean loss: 0.3471407572044015
Epoch: 31, step: 309, loss: 0.3052084743976593, mean loss: 0.3471398269057192
Epoch: 31, step: 310, loss: 0.3403252065181732, mean loss: 0.34713967572168397
Epoch: 31, step: 311, loss: 0.35507556796073914, mean loss: 0.3471398517775061
Epoch: 31, step: 312, loss: 0.3580380082130432, mean loss: 0.3471400935450691
Epoch: 31, step: 313, loss: 0.31816017627716064, mean loss: 0.3471394506612395
Epoch: 31, step: 314, loss: 0.34696248173713684, mean loss: 0.34713944673548863
Epoch: 31, step: 315, loss: 0.3413355350494385, mean loss: 0.3471393179885568
Epoch: 31, step: 316, loss: 0.3507768511772156, mean loss: 0.34713939867738774
Epoch: 31, step: 317, loss: 0.33295938372612, mean loss: 0.34713908413910305
Epoch: 31, step: 318, loss: 0.3405679762363434, mean loss: 0.34713893838332144
Epoch: 31, step: 319, loss: 0.29644837975502014, mean loss: 0.3471378140252647
Epoch: 31, step: 320, loss: 0.3508094847202301, mean loss: 0.3471378954641179
Epoch: 31, step: 321, loss: 0.31899964809417725, mean loss: 0.3471372713624595
Epoch: 31, step: 322, loss: 0.3367665708065033, mean loss: 0.3471370413471434
Epoch: 31, step: 323, loss: 0.3385154604911804, mean loss: 0.3471368501303927
Epoch: 31, step: 324, loss: 0.33090049028396606, mean loss: 0.3471364900345856
Epoch: 31, step: 325, loss: 0.3357273042201996, mean loss: 0.34713623700318585
Epoch: 31, step: 326, loss: 0.33278802037239075, mean loss: 0.3471359187974102
Epoch: 31, step: 327, loss: 0.34803804755210876, mean loss: 0.3471359388038139
Epoch: 31, step: 328, loss: 0.3413395285606384, mean loss: 0.34713581026035384
Epoch: 31, step: 329, loss: 0.3896954655647278, mean loss: 0.34713675405898126
Epoch: 31, step: 330, loss: 0.29090747237205505, mean loss: 0.3471355071517479
Epoch: 31, step: 331, loss: 0.34403297305107117, mean loss: 0.3471354383533157
Epoch: 31, step: 332, loss: 0.3514939844608307, mean loss: 0.3471355350015652
Epoch: 31, step: 333, loss: 0.33380404114723206, mean loss: 0.3471352393899227
Epoch: 31, step: 334, loss: 0.3699744939804077, mean loss: 0.3471357458147789
Epoch: 31, step: 335, loss: 0.316042959690094, mean loss: 0.3471350563960178
Epoch: 31, step: 336, loss: 0.3213752806186676, mean loss: 0.34713448523848744
Epoch: 31, step: 337, loss: 0.36563166975975037, mean loss: 0.3471348953574294
Epoch: 31, step: 338, loss: 0.3468363285064697, mean loss: 0.3471348887377622
Epoch: 31, step: 339, loss: 0.31530338525772095, mean loss: 0.34713418300205184
Epoch: 31, step: 340, loss: 0.32687777280807495, mean loss: 0.3471337339074904
Epoch: 31, step: 341, loss: 0.310147762298584, mean loss: 0.34713291392851625
Epoch: 31, step: 342, loss: 0.33341774344444275, mean loss: 0.34713260986993366
Epoch: 31, step: 343, loss: 0.2981429100036621, mean loss: 0.34713152381646495
Epoch: 31, step: 344, loss: 0.31450507044792175, mean loss: 0.3471308005361136
Epoch: 31, step: 345, loss: 0.3071955144405365, mean loss: 0.34712991524934583
Epoch: 31, step: 346, loss: 0.34910693764686584, mean loss: 0.34712995907507344
Epoch: 31, step: 347, loss: 0.31737062335014343, mean loss: 0.3471292993983638
Epoch: 31, step: 348, loss: 0.3473389148712158, mean loss: 0.3471293040448176
Epoch: 31, step: 349, loss: 0.32390260696411133, mean loss: 0.34712878920026646
Epoch: 31, step: 350, loss: 0.32738375663757324, mean loss: 0.3471283515402296
Epoch: 31, step: 351, loss: 0.37522321939468384, mean loss: 0.3471289742653793
Epoch: 31, step: 352, loss: 0.3593791127204895, mean loss: 0.347129245784728
Epoch: 31, step: 353, loss: 0.3371245563030243, mean loss: 0.34712902403975965
Epoch: 31, step: 354, loss: 0.3091350495815277, mean loss: 0.3471281819560597
Epoch: 31, step: 355, loss: 0.3255593478679657, mean loss: 0.3471277039233893
Epoch: 31, step: 356, loss: 0.33933591842651367, mean loss: 0.3471275312369352
Epoch: 31, step: 357, loss: 0.34372764825820923, mean loss: 0.3471274558882587
Epoch: 31, step: 358, loss: 0.3560541272163391, mean loss: 0.34712765371799803
Epoch: 31, step: 359, loss: 0.3459070324897766, mean loss: 0.34712762666762065
Epoch: 31, step: 360, loss: 0.3423347473144531, mean loss: 0.3471275204542278
Epoch: 31, step: 361, loss: 0.2989659309387207, mean loss: 0.3471264531850367
Epoch: 31, step: 362, loss: 0.32039880752563477, mean loss: 0.3471258609088903
Epoch: 31, step: 363, loss: 0.38547295331954956, mean loss: 0.3471267106494596
Epoch: 31, step: 364, loss: 0.2939421236515045, mean loss: 0.34712553214811903
Epoch: 31, step: 365, loss: 0.3359495997428894, mean loss: 0.3471252845094661
Epoch: 31, step: 366, loss: 0.2899472713470459, mean loss: 0.347124017575138
Epoch: 31, step: 367, loss: 0.28469526767730713, mean loss: 0.34712263432711227
Epoch: 31, step: 368, loss: 0.3503583073616028, mean loss: 0.3471227060190679
Epoch: 31, step: 369, loss: 0.3646291494369507, mean loss: 0.34712309389613216
Epoch: 31, step: 370, loss: 0.3355303108692169, mean loss: 0.34712283704927216
Epoch: 31, step: 371, loss: 0.307991087436676, mean loss: 0.34712197007502515
Epoch: 31, step: 372, loss: 0.33875513076782227, mean loss: 0.34712178470959754
Epoch: 31, step: 373, loss: 0.3580883741378784, mean loss: 0.34712202766651695
Epoch: 31, step: 374, loss: 0.347447007894516, mean loss: 0.3471220348660612
Epoch: 31, step: 375, loss: 0.32291921973228455, mean loss: 0.3471214986938163
Epoch: 31, step: 376, loss: 0.31410878896713257, mean loss: 0.3471207673695274
Epoch: 31, step: 377, loss: 0.34962528944015503, mean loss: 0.3471208228505001
Epoch: 31, step: 378, loss: 0.3122216761112213, mean loss: 0.3471200497705821
Epoch: 31, step: 379, loss: 0.3534379303455353, mean loss: 0.3471201897200898
Epoch: 31, step: 380, loss: 0.3290186822414398, mean loss: 0.3471197887563623
Epoch: 31, step: 381, loss: 0.37427854537963867, mean loss: 0.34712039033250686
Epoch: 31, step: 382, loss: 0.33023834228515625, mean loss: 0.3471200163974049
Epoch: 31, step: 383, loss: 0.35555440187454224, mean loss: 0.347120203213775
Epoch: 31, step: 384, loss: 0.3353126049041748, mean loss: 0.34711994168864024
Epoch: 31, step: 385, loss: 0.34686726331710815, mean loss: 0.34711993609222
Epoch: 31, step: 386, loss: 0.3524262309074402, mean loss: 0.3471200536155266
Epoch: 31, step: 387, loss: 0.3284561336040497, mean loss: 0.34711964025797853
Epoch: 31, step: 388, loss: 0.3489550054073334, mean loss: 0.3471196809056686
Epoch: 31, step: 389, loss: 0.32669398188591003, mean loss: 0.3471192285493099
Epoch: 31, step: 390, loss: 0.3146461546421051, mean loss: 0.3471185094025065
Epoch: 31, step: 391, loss: 0.337179958820343, mean loss: 0.34711828930881833
Epoch: 31, step: 392, loss: 0.3089694380760193, mean loss: 0.34711744450399884
Epoch: 31, step: 393, loss: 0.3181946873664856, mean loss: 0.3471168040248559
Epoch: 31, step: 394, loss: 0.31195271015167236, mean loss: 0.34711602535185887
Epoch: 31, step: 395, loss: 0.3281117081642151, mean loss: 0.3471156045299548
Epoch: 31, step: 396, loss: 0.3279365003108978, mean loss: 0.34711517984705986
Epoch: 31, step: 397, loss: 0.3498404324054718, mean loss: 0.34711524019098966
Epoch: 31, step: 398, loss: 0.3513493239879608, mean loss: 0.34711533394215316
Epoch: 31, step: 399, loss: 0.30756616592407227, mean loss: 0.3471144582631164
Epoch: 31, step: 400, loss: 0.3124493360519409, mean loss: 0.3471136907413139
Epoch: 31, step: 401, loss: 0.31769871711730957, mean loss: 0.3471130394776725
Epoch: 31, step: 402, loss: 0.31806764006614685, mean loss: 0.34711239641084474
Epoch: 31, step: 403, loss: 0.3272005021572113, mean loss: 0.34711195557011115
Epoch: 31, step: 404, loss: 0.334441602230072, mean loss: 0.34711167506017426
Epoch: 31, step: 405, loss: 0.34148988127708435, mean loss: 0.34711155060160037
Epoch: 31, step: 406, loss: 0.3109325170516968, mean loss: 0.3471107496666299
Epoch: 31, step: 407, loss: 0.30397117137908936, mean loss: 0.3471097946595838
Epoch: 31, step: 408, loss: 0.30572035908699036, mean loss: 0.3471088784167934
Epoch: 31, step: 409, loss: 0.33197692036628723, mean loss: 0.3471085434462783
Epoch: 31, step: 410, loss: 0.33947044610977173, mean loss: 0.3471083743683074
Epoch: 31, step: 411, loss: 0.334896057844162, mean loss: 0.34710810404077674
Epoch: 31, step: 412, loss: 0.32846587896347046, mean loss: 0.3471076913921928
Epoch: 31, step: 413, loss: 0.3231540322303772, mean loss: 0.3471071611859162
Epoch: 31, step: 414, loss: 0.3257666230201721, mean loss: 0.347106688830659
Epoch: 31, step: 415, loss: 0.31329643726348877, mean loss: 0.34710594048511745
Epoch: 31, step: 416, loss: 0.3256945013999939, mean loss: 0.34710546658150565
Epoch: 31, step: 417, loss: 0.3575582504272461, mean loss: 0.3471056979299153
Epoch: 31, step: 418, loss: 0.30381160974502563, mean loss: 0.34710473973572314
Epoch: 31, step: 419, loss: 0.3328462839126587, mean loss: 0.34710442417145654
Epoch: 31, step: 420, loss: 0.31604376435279846, mean loss: 0.34710373676059414
Epoch: 31, step: 421, loss: 0.3132894039154053, mean loss: 0.34710298842409953
Epoch: 31, step: 422, loss: 0.34724661707878113, mean loss: 0.3471029916026388
Epoch: 31, step: 423, loss: 0.33123719692230225, mean loss: 0.3471026404962681
Epoch: 31, step: 424, loss: 0.3068315386772156, mean loss: 0.3471017493258103
Epoch: 31, step: 425, loss: 0.34176790714263916, mean loss: 0.3471016312943391
Epoch: 31, step: 426, loss: 0.3347509205341339, mean loss: 0.34710135799410763
Epoch: 31, step: 427, loss: 0.3391379714012146, mean loss: 0.34710118178180027
Epoch: 31, step: 428, loss: 0.31957119703292847, mean loss: 0.34710057261700156
Epoch: 31, step: 429, loss: 0.328779399394989, mean loss: 0.34710016722749804
Epoch: 31, step: 430, loss: 0.3669498562812805, mean loss: 0.3471006064284949
Epoch: 31, step: 431, loss: 0.31310948729515076, mean loss: 0.34709985434602886
Epoch: 31, step: 432, loss: 0.322737455368042, mean loss: 0.3470993153191249
Epoch: 31, step: 433, loss: 0.313679963350296, mean loss: 0.34709857592021415
Epoch: 31, step: 434, loss: 0.35401880741119385, mean loss: 0.3470987290260681
Epoch: 31, step: 435, loss: 0.3457145392894745, mean loss: 0.3470986984024014
Epoch: 31, step: 436, loss: 0.3212227523326874, mean loss: 0.3470981259383836
Epoch: 31, step: 437, loss: 0.303689181804657, mean loss: 0.34709716560600595
Epoch: 31, step: 438, loss: 0.36058536171913147, mean loss: 0.34709746399761965
Epoch: 31, step: 439, loss: 0.3006433844566345, mean loss: 0.3470964363434399
Epoch: 31, step: 440, loss: 0.33125901222229004, mean loss: 0.34709608599670566
Epoch: 31, step: 441, loss: 0.3557790517807007, mean loss: 0.3470962780722218
Epoch: 31, step: 442, loss: 0.3725765347480774, mean loss: 0.347096841707426
Epoch: 31, step: 443, loss: 0.36969009041786194, mean loss: 0.3470973414696077
Epoch: 31, step: 444, loss: 0.37618497014045715, mean loss: 0.3470979848731041
Epoch: 31, step: 445, loss: 0.31196728348731995, mean loss: 0.3470972078171124
Epoch: 31, step: 446, loss: 0.36019352078437805, mean loss: 0.3470974974880546
Epoch: 31, step: 447, loss: 0.36188870668411255, mean loss: 0.3470978246403415
Epoch: 31, step: 448, loss: 0.30961036682128906, mean loss: 0.3470969955102723
Epoch: 31, step: 449, loss: 0.36090192198753357, mean loss: 0.34709730083443024
Epoch: 31, step: 450, loss: 0.34752732515335083, mean loss: 0.3470973103450864
Epoch: 31, step: 451, loss: 0.32913273572921753, mean loss: 0.3470969130393845
Epoch: 31, step: 452, loss: 0.3084672689437866, mean loss: 0.34709605872255467
Epoch: 31, step: 453, loss: 0.3281766474246979, mean loss: 0.3470956403181295
Epoch: 31, step: 454, loss: 0.30660223960876465, mean loss: 0.3470947448228574
Epoch: 31, step: 455, loss: 0.34323036670684814, mean loss: 0.3470946593655793
Epoch: 31, step: 456, loss: 0.3145282566547394, mean loss: 0.34709393920453224
Epoch: 31, step: 457, loss: 0.3836933374404907, mean loss: 0.34709474853181177
Epoch: 31, step: 458, loss: 0.2987876236438751, mean loss: 0.3470936803336629
Epoch: 31, step: 459, loss: 0.40312230587005615, mean loss: 0.3470949192471941
Epoch: 31, step: 460, loss: 0.30272185802459717, mean loss: 0.347093938084978
Epoch: 31, step: 461, loss: 0.3246303200721741, mean loss: 0.34709344138798925
Epoch: 31, step: 462, loss: 0.34652334451675415, mean loss: 0.3470934287827563
Epoch: 31, step: 463, loss: 0.335115522146225, mean loss: 0.34709316394887824
Epoch: 31, step: 464, loss: 0.3238027095794678, mean loss: 0.3470926490037243
Epoch: 31, step: 465, loss: 0.33199164271354675, mean loss: 0.34709231513226085
Epoch: 31, step: 466, loss: 0.32002803683280945, mean loss: 0.34709171677541933
Epoch: 31, step: 467, loss: 0.34155339002609253, mean loss: 0.34709159433275155
Epoch: 31, step: 468, loss: 0.313690721988678, mean loss: 0.34709085591450944
Epoch: 31, step: 469, loss: 0.3403886556625366, mean loss: 0.3470907077471961
Epoch: 31, step: 470, loss: 0.3390060365200043, mean loss: 0.3470905290211824
Epoch: 31, step: 471, loss: 0.3193069100379944, mean loss: 0.3470899148285265
Epoch: 31, step: 472, loss: 0.3416537940502167, mean loss: 0.3470897946587368
Epoch: 31, step: 473, loss: 0.3181503415107727, mean loss: 0.34708915494316256
Epoch: 31, step: 474, loss: 0.3576008081436157, mean loss: 0.3470893873013756
Epoch: 31, step: 475, loss: 0.35603129863739014, mean loss: 0.3470895849563565
Epoch: 31, step: 476, loss: 0.33001014590263367, mean loss: 0.34708920743510246
Epoch: 31, step: 477, loss: 0.33081772923469543, mean loss: 0.3470888477808387
Epoch: 31, step: 478, loss: 0.3460857570171356, mean loss: 0.3470888256096572
Epoch: 31, step: 479, loss: 0.31936317682266235, mean loss: 0.34708821280688146
Epoch: 31, step: 480, loss: 0.3151109516620636, mean loss: 0.34708750604898236
Epoch: 31, step: 481, loss: 0.31905612349510193, mean loss: 0.34708688651614955
Epoch: 31, step: 482, loss: 0.30371472239494324, mean loss: 0.34708592795173376
Epoch: 31, step: 483, loss: 0.3364943563938141, mean loss: 0.347085693873508
Epoch: 31, step: 484, loss: 0.3138909935951233, mean loss: 0.3470849602727593
Epoch: 31, step: 485, loss: 0.334428995847702, mean loss: 0.3470846805829378
Epoch: 31, step: 486, loss: 0.34117528796195984, mean loss: 0.3470845499915117
Epoch: 31, step: 487, loss: 0.30390942096710205, mean loss: 0.3470835958871843
Epoch: 31, step: 488, loss: 0.3730084300041199, mean loss: 0.34708416877371373
Epoch: 31, step: 489, loss: 0.37441542744636536, mean loss: 0.3470847727260422
Epoch: 31, step: 490, loss: 0.33288031816482544, mean loss: 0.3470844588501266
Epoch: 31, step: 491, loss: 0.313925176858902, mean loss: 0.3470837261454689
Epoch: 31, step: 492, loss: 0.36250001192092896, mean loss: 0.34708406678417175
Epoch: 31, step: 493, loss: 0.33029621839523315, mean loss: 0.34708369584757737
Epoch: 31, step: 494, loss: 0.3074378967285156, mean loss: 0.3470828198715479
Epoch: 31, step: 495, loss: 0.3112361431121826, mean loss: 0.3470820278548276
Epoch: 31, step: 496, loss: 0.35548165440559387, mean loss: 0.34708221343681983
Epoch: 31, step: 497, loss: 0.34627729654312134, mean loss: 0.34708219565331727
Epoch: 31, step: 498, loss: 0.32893210649490356, mean loss: 0.34708179466157657
Epoch: 31, step: 499, loss: 0.2827363908290863, mean loss: 0.3470803731035209
Epoch: 31, step: 500, loss: 0.3415188491344452, mean loss: 0.3470802502376429
Epoch: 31, step: 501, loss: 0.3043273687362671, mean loss: 0.3470793057565422
Epoch: 31, step: 502, loss: 0.3288249373435974, mean loss: 0.34707890249658657
Epoch: 31, step: 503, loss: 0.321440190076828, mean loss: 0.3470783361205059
Epoch: 31, step: 504, loss: 0.29384201765060425, mean loss: 0.34707716012106987
Epoch: 31, step: 505, loss: 0.34170085191726685, mean loss: 0.3470770413601199
Epoch: 31, step: 506, loss: 0.3304152488708496, mean loss: 0.347076673314517
Epoch: 31, step: 507, loss: 0.34885576367378235, mean loss: 0.3470767126123249
Epoch: 31, step: 508, loss: 0.3276051878929138, mean loss: 0.3470762825209963
Epoch: 31, step: 509, loss: 0.2984822392463684, mean loss: 0.34707520918876866
Epoch: 31, step: 510, loss: 0.3279253840446472, mean loss: 0.34707478622189636
Epoch: 31, step: 511, loss: 0.32375219464302063, mean loss: 0.34707427110148864
Epoch: 31, step: 512, loss: 0.3049311935901642, mean loss: 0.34707334031814363
Epoch: 31, step: 513, loss: 0.37921661138534546, mean loss: 0.3470740502273946
Epoch: 31, step: 514, loss: 0.3471923768520355, mean loss: 0.34707405284067283
Epoch: 31, step: 515, loss: 0.3189789056777954, mean loss: 0.3470734323648079
Epoch: 31, step: 516, loss: 0.30126509070396423, mean loss: 0.34707242071882705
Epoch: 31, step: 517, loss: 0.3349396884441376, mean loss: 0.3470721527816274
Epoch: 31, step: 518, loss: 0.354200541973114, mean loss: 0.3470723102002876
Epoch: 31, step: 519, loss: 0.3271915912628174, mean loss: 0.3470718711772566
Epoch: 31, step: 520, loss: 0.3207346498966217, mean loss: 0.34707128958906447
Epoch: 31, step: 521, loss: 0.3317159414291382, mean loss: 0.347070950514115
Epoch: 31, step: 522, loss: 0.33686137199401855, mean loss: 0.34707072507240944
Epoch: 31, step: 523, loss: 0.3323443830013275, mean loss: 0.3470703999014575
Epoch: 31, step: 524, loss: 0.3223802149295807, mean loss: 0.3470698547318805
Epoch: 31, step: 525, loss: 0.3543442189693451, mean loss: 0.3470700153493289
Epoch: 31, step: 526, loss: 0.3184587061405182, mean loss: 0.3470693836275915
Epoch: 31, step: 527, loss: 0.294225811958313, mean loss: 0.3470682168967854
Epoch: 31, step: 528, loss: 0.3123120665550232, mean loss: 0.3470674495342715
Epoch: 31, step: 529, loss: 0.30048301815986633, mean loss: 0.34706642104415414
Epoch: 31, step: 530, loss: 0.317581444978714, mean loss: 0.347065770089831
Epoch: 31, step: 531, loss: 0.32954877614974976, mean loss: 0.3470653833670754
Epoch: 31, step: 532, loss: 0.31227999925613403, mean loss: 0.34706461542694444
Epoch: 31, step: 533, loss: 0.31228044629096985, mean loss: 0.3470638475305884
Epoch: 31, step: 534, loss: 0.31198790669441223, mean loss: 0.3470630732101655
Epoch: 31, step: 535, loss: 0.38685542345046997, mean loss: 0.3470639516284931
Epoch: 31, step: 536, loss: 0.3569672107696533, mean loss: 0.3470641702386593
Epoch: 31, step: 537, loss: 0.32941532135009766, mean loss: 0.3470637806565462
Epoch: 31, step: 538, loss: 0.31890395283699036, mean loss: 0.3470631590679578
Epoch: 31, step: 539, loss: 0.3336961269378662, mean loss: 0.347062864016039
Epoch: 31, step: 540, loss: 0.3431539535522461, mean loss: 0.3470627777361479
Epoch: 31, step: 541, loss: 0.3119955062866211, mean loss: 0.3470620037267132
Epoch: 31, step: 542, loss: 0.3086036741733551, mean loss: 0.347061154888133
Epoch: 31, step: 543, loss: 0.34344568848609924, mean loss: 0.3470610750906049
Epoch: 31, step: 544, loss: 0.30666273832321167, mean loss: 0.347060183472234
Epoch: 31, step: 545, loss: 0.3103555142879486, mean loss: 0.34705937339346143
Epoch: 31, step: 546, loss: 0.30735769867897034, mean loss: 0.34705849718956583
Epoch: 31, step: 547, loss: 0.3454693555831909, mean loss: 0.3470584621184675
Epoch: 31, step: 548, loss: 0.3394780457019806, mean loss: 0.347058294828365
Epoch: 31, step: 549, loss: 0.34888598322868347, mean loss: 0.34705833516222206
Epoch: 31, step: 550, loss: 0.3524478077888489, mean loss: 0.34705845409574576
Epoch: 31, step: 551, loss: 0.3348912298679352, mean loss: 0.34705818559843293
Epoch: 31, step: 552, loss: 0.3668006956577301, mean loss: 0.34705862125194176
Epoch: 31, step: 553, loss: 0.36362892389297485, mean loss: 0.3470589868969976
Epoch: 31, step: 554, loss: 0.36647582054138184, mean loss: 0.34705941534496965
Epoch: 31, step: 555, loss: 0.2832709848880768, mean loss: 0.34705800783326496
Epoch: 31, step: 556, loss: 0.3649197220802307, mean loss: 0.3470584019488901
Epoch: 31, step: 557, loss: 0.3302471339702606, mean loss: 0.34705803101936405
Epoch: 31, step: 558, loss: 0.3464204967021942, mean loss: 0.3470580169529007
Epoch: 31, step: 559, loss: 0.3672373294830322, mean loss: 0.34705846217645847
Epoch: 31, step: 560, loss: 0.296017050743103, mean loss: 0.3470573360559635
Epoch: 31, step: 561, loss: 0.3604632318019867, mean loss: 0.34705763182209654
Epoch: 31, step: 562, loss: 0.37146055698394775, mean loss: 0.3470581701971304
Epoch: 31, step: 563, loss: 0.3298124670982361, mean loss: 0.34705778973244855
Epoch: 31, step: 564, loss: 0.3377809524536133, mean loss: 0.3470575850767694
Epoch: 31, step: 565, loss: 0.3542010486125946, mean loss: 0.3470577426647583
Epoch: 31, step: 566, loss: 0.35559701919555664, mean loss: 0.3470579310408482
Epoch: 31, step: 567, loss: 0.3515857458114624, mean loss: 0.3470580309220529
Epoch: 31, step: 568, loss: 0.35404399037361145, mean loss: 0.3470581850252327
Epoch: 31, step: 569, loss: 0.3727920651435852, mean loss: 0.34705875267600517
Epoch: 31, step: 570, loss: 0.3165941834449768, mean loss: 0.347058080688154
Epoch: 31, step: 571, loss: 0.3341398239135742, mean loss: 0.347057795743369
Epoch: 31, step: 572, loss: 0.359510213136673, mean loss: 0.34705807040683134
Epoch: 31, step: 573, loss: 0.3215121328830719, mean loss: 0.3470575069515064
Epoch: 31, step: 574, loss: 0.3110538721084595, mean loss: 0.34705671285294126
Epoch: 31, step: 575, loss: 0.31831714510917664, mean loss: 0.34705607898510393
Epoch: 31, step: 576, loss: 0.3407607972621918, mean loss: 0.34705594014207614
Epoch: 31, step: 577, loss: 0.3125843405723572, mean loss: 0.3470551798844878
Epoch: 31, step: 578, loss: 0.37415653467178345, mean loss: 0.34705577758104045
Epoch: 31, step: 579, loss: 0.3224189281463623, mean loss: 0.3470552342489693
Epoch: 31, step: 580, loss: 0.3078335225582123, mean loss: 0.34705436928675315
Epoch: 31, step: 581, loss: 0.3638509213924408, mean loss: 0.34705473969543543
Epoch: 31, step: 582, loss: 0.33324167132377625, mean loss: 0.3470544350872282
Epoch: 31, step: 583, loss: 0.32901814579963684, mean loss: 0.34705403735658324
Epoch: 31, step: 584, loss: 0.3253949284553528, mean loss: 0.3470535597471784
Epoch: 31, step: 585, loss: 0.31639721989631653, mean loss: 0.3470528837529149
Epoch: 31, step: 586, loss: 0.3436335325241089, mean loss: 0.3470528083554324
Epoch: 31, step: 587, loss: 0.3353571891784668, mean loss: 0.34705255047002104
Epoch: 31, step: 588, loss: 0.3022692799568176, mean loss: 0.3470515630321335
Epoch: 31, step: 589, loss: 0.3771229684352875, mean loss: 0.3470522260696915
Epoch: 31, step: 590, loss: 0.281329870223999, mean loss: 0.34705077700440995
Epoch: 31, step: 591, loss: 0.32022687792778015, mean loss: 0.34705018559645784
Epoch: 31, step: 592, loss: 0.36654365062713623, mean loss: 0.34705061537499327
Epoch: 31, step: 593, loss: 0.30954742431640625, mean loss: 0.34704978854861074
Epoch: 31, step: 594, loss: 0.3169044554233551, mean loss: 0.34704912395430476
Epoch: 31, step: 595, loss: 0.31753644347190857, mean loss: 0.347048473322019
Epoch: 31, step: 596, loss: 0.31389081478118896, mean loss: 0.347047742349189
Epoch: 31, step: 597, loss: 0.3615697920322418, mean loss: 0.3470480624860807
Epoch: 31, step: 598, loss: 0.3352789580821991, mean loss: 0.347047803043266
Epoch: 31, step: 599, loss: 0.319381445646286, mean loss: 0.3470471931685328
Epoch: 31, step: 600, loss: 0.3392849564552307, mean loss: 0.3470470220622457
Epoch: 31, step: 601, loss: 0.35434335470199585, mean loss: 0.3470471828948657
Epoch: 31, step: 602, loss: 0.2955624759197235, mean loss: 0.3470460480455925
Epoch: 31, step: 603, loss: 0.4005090594291687, mean loss: 0.3470472264755736
Epoch: 31, step: 604, loss: 0.3360684812068939, mean loss: 0.3470469844877566
Epoch: 31, step: 605, loss: 0.3216468393802643, mean loss: 0.34704642464325347
Epoch: 31, step: 606, loss: 0.34123045206069946, mean loss: 0.34704629645624896
Epoch: 31, step: 607, loss: 0.3349018096923828, mean loss: 0.3470460287914609
Epoch: 31, step: 608, loss: 0.35968002676963806, mean loss: 0.34704630723895125
Epoch: 31, step: 609, loss: 0.3527195453643799, mean loss: 0.34704643227174814
Epoch: 31, step: 610, loss: 0.3626718819141388, mean loss: 0.3470467766342747
Epoch: 31, step: 611, loss: 0.3137846887111664, mean loss: 0.34704604360166
Epoch: 31, step: 612, loss: 0.35697656869888306, mean loss: 0.34704626244656156
Epoch: 31, step: 613, loss: 0.328809529542923, mean loss: 0.34704586056166353
Epoch: 31, step: 614, loss: 0.3406262695789337, mean loss: 0.3470457190955452
Epoch: 31, step: 615, loss: 0.34473222494125366, mean loss: 0.3470456681150658
Epoch: 31, step: 616, loss: 0.3074777126312256, mean loss: 0.3470447962093017
Epoch: 31, step: 617, loss: 0.3428923785686493, mean loss: 0.3470447047100808
Epoch: 31, step: 618, loss: 0.34063583612442017, mean loss: 0.34704456349269575
Epoch: 31, step: 619, loss: 0.3073462247848511, mean loss: 0.34704368877167713
Epoch: 31, step: 620, loss: 0.34853699803352356, mean loss: 0.3470437216748227
Epoch: 31, step: 621, loss: 0.31419533491134644, mean loss: 0.34704299791889
Epoch: 31, step: 622, loss: 0.3606439530849457, mean loss: 0.3470432975852078
Epoch: 31, step: 623, loss: 0.3384227156639099, mean loss: 0.34704310765434676
Epoch: 31, step: 624, loss: 0.316301167011261, mean loss: 0.34704243035498694
Epoch: 31, step: 625, loss: 0.3718477785587311, mean loss: 0.34704297684866847
Epoch: 31, step: 626, loss: 0.3136579692363739, mean loss: 0.3470422413502742
Epoch: 31, step: 627, loss: 0.3131941854953766, mean loss: 0.3470414956669852
Epoch: 31, step: 628, loss: 0.3041863441467285, mean loss: 0.3470405515753517
Epoch: 31, step: 629, loss: 0.3215130865573883, mean loss: 0.3470399892220667
Epoch: 31, step: 630, loss: 0.3464492857456207, mean loss: 0.3470399762095438
Epoch: 31, step: 631, loss: 0.3389948904514313, mean loss: 0.3470397989893976
Epoch: 31, step: 632, loss: 0.33673930168151855, mean loss: 0.3470395720912037
Epoch: 31, step: 633, loss: 0.32033196091651917, mean loss: 0.3470389837919135
Epoch: 31, step: 634, loss: 0.3380069136619568, mean loss: 0.3470387848432554
Epoch: 31, step: 635, loss: 0.35749518871307373, mean loss: 0.34703901516052127
Epoch: 31, step: 636, loss: 0.38036301732063293, mean loss: 0.3470397491532122
Epoch: 31, step: 637, loss: 0.2909560203552246, mean loss: 0.3470385138832065
Epoch: 31, step: 638, loss: 0.32189372181892395, mean loss: 0.3470379600697566
Epoch: 31, step: 639, loss: 0.3343523442745209, mean loss: 0.34703768067552276
Epoch: 31, step: 640, loss: 0.33629679679870605, mean loss: 0.34703744411823
Epoch: 31, step: 641, loss: 0.3316381871700287, mean loss: 0.3470371049723694
Epoch: 31, step: 642, loss: 0.3204677700996399, mean loss: 0.34703651983494843
Epoch: 31, step: 643, loss: 0.37627482414245605, mean loss: 0.3470371637369989
Epoch: 31, step: 644, loss: 0.37662822008132935, mean loss: 0.347037815393198
Epoch: 31, step: 645, loss: 0.334384560585022, mean loss: 0.34703753674852045
Epoch: 31, step: 646, loss: 0.33660411834716797, mean loss: 0.34703730699321
Epoch: 31, step: 647, loss: 0.3743084967136383, mean loss: 0.34703790752147834
Epoch: 31, step: 648, loss: 0.3219400644302368, mean loss: 0.3470373548638012
Epoch: 31, step: 649, loss: 0.3979335427284241, mean loss: 0.34703847557961276
Epoch: 31, step: 650, loss: 0.375980019569397, mean loss: 0.34703911284800404
Epoch: 31, step: 651, loss: 0.3734630048274994, mean loss: 0.3470396946670101
Epoch: 31, step: 652, loss: 0.31270474195480347, mean loss: 0.3470389386735999
Epoch: 31, step: 653, loss: 0.32527387142181396, mean loss: 0.3470384594568301
Epoch: 31, step: 654, loss: 0.35736775398254395, mean loss: 0.3470386868791539
Epoch: 31, step: 655, loss: 0.3651820123195648, mean loss: 0.3470390863359007
Epoch: 31, step: 656, loss: 0.3036801815032959, mean loss: 0.3470381317354993
Epoch: 31, step: 657, loss: 0.3122481405735016, mean loss: 0.3470373658072891
Epoch: 31, step: 658, loss: 0.3571087718009949, mean loss: 0.347037587532098
Epoch: 31, step: 659, loss: 0.3510455787181854, mean loss: 0.3470376757671981
Epoch: 31, step: 660, loss: 0.29701516032218933, mean loss: 0.34703657455607106
Epoch: 31, step: 661, loss: 0.3563608229160309, mean loss: 0.3470367798184398
Epoch: 31, step: 662, loss: 0.33647847175598145, mean loss: 0.3470365473948137
Epoch: 31, step: 663, loss: 0.31643831729888916, mean loss: 0.3470358738403958
Epoch: 31, step: 664, loss: 0.33608490228652954, mean loss: 0.34703563278354765
Epoch: 31, step: 665, loss: 0.3671487867832184, mean loss: 0.347036075512009
Epoch: 31, step: 666, loss: 0.3794434666633606, mean loss: 0.34703678884412037
Epoch: 31, step: 667, loss: 0.3279876112937927, mean loss: 0.3470363695542465
Epoch: 31, step: 668, loss: 0.3752250075340271, mean loss: 0.34703698999837257
Epoch: 31, step: 669, loss: 0.3192335367202759, mean loss: 0.3470363780457979
Epoch: 31, step: 670, loss: 0.3228926956653595, mean loss: 0.34703584665628806
Epoch: 31, step: 671, loss: 0.29996272921562195, mean loss: 0.3470348106250036
Epoch: 31, step: 672, loss: 0.31229734420776367, mean loss: 0.34703404610563793
Epoch: 31, step: 673, loss: 0.34394440054893494, mean loss: 0.3470339781086848
Epoch: 31, step: 674, loss: 0.3327852189540863, mean loss: 0.34703366452873907
Epoch: 31, step: 675, loss: 0.321293443441391, mean loss: 0.34703309806260596
Epoch: 31, step: 676, loss: 0.29244667291641235, mean loss: 0.34703189680327745
Epoch: 31, step: 677, loss: 0.31047356128692627, mean loss: 0.3470310922978526
Epoch: 31, step: 678, loss: 0.3245113492012024, mean loss: 0.3470305967376322
Epoch: 31, step: 679, loss: 0.32313817739486694, mean loss: 0.34703007098243144
Epoch: 31, step: 680, loss: 0.32459867000579834, mean loss: 0.3470295773879551
Epoch: 31, step: 681, loss: 0.29377609491348267, mean loss: 0.3470284055910428
Epoch: 31, step: 682, loss: 0.33536919951438904, mean loss: 0.3470281490459226
Epoch: 31, step: 683, loss: 0.38713449239730835, mean loss: 0.34702903151255154
Epoch: 31, step: 684, loss: 0.4096764028072357, mean loss: 0.3470304099228861
Epoch: 31, step: 685, loss: 0.33169233798980713, mean loss: 0.3470300724515564
Epoch: 31, step: 686, loss: 0.33839839696884155, mean loss: 0.3470298825398827
Epoch: 31, step: 687, loss: 0.32753050327301025, mean loss: 0.34702945352951425
Epoch: 31, step: 688, loss: 0.3545341491699219, mean loss: 0.34702961863843207
Epoch: 31, step: 689, loss: 0.30843931436538696, mean loss: 0.3470287696415501
Epoch: 31, step: 690, loss: 0.3248535692691803, mean loss: 0.3470282817920204
Epoch: 31, step: 691, loss: 0.32530996203422546, mean loss: 0.3470278040042749
Epoch: 31, step: 692, loss: 0.3927924335002899, mean loss: 0.3470288107717584
Epoch: 31, step: 693, loss: 0.3934919238090515, mean loss: 0.3470298328825648
Epoch: 31, step: 694, loss: 0.3093353509902954, mean loss: 0.3470290036852245
Epoch: 31, step: 695, loss: 0.3497839570045471, mean loss: 0.3470290642869253
Epoch: 31, step: 696, loss: 0.31924545764923096, mean loss: 0.3470284531343629
Epoch: 31, step: 697, loss: 0.3360297679901123, mean loss: 0.3470282112029665
Epoch: 31, step: 698, loss: 0.31877636909484863, mean loss: 0.34702758977802517
Epoch: 31, step: 699, loss: 0.35709330439567566, mean loss: 0.3470278111776956
Epoch: 31, step: 700, loss: 0.3495276868343353, mean loss: 0.34702786616231357
Epoch: 31, step: 701, loss: 0.3119194507598877, mean loss: 0.34702709397176673
Epoch: 31, step: 702, loss: 0.33586385846138, mean loss: 0.347026848447859
Epoch: 31, step: 703, loss: 0.3105948865413666, mean loss: 0.3470260471818718
Epoch: 31, step: 704, loss: 0.3415411710739136, mean loss: 0.34702592655295744
Epoch: 31, step: 705, loss: 0.2963865399360657, mean loss: 0.3470248128651057
Epoch: 31, step: 706, loss: 0.31942999362945557, mean loss: 0.34702420599876815
Epoch: 31, step: 707, loss: 0.29131510853767395, mean loss: 0.3470229808690738
Epoch: 31, step: 708, loss: 0.32087236642837524, mean loss: 0.3470224057890386
Epoch: 31, step: 709, loss: 0.30879294872283936, mean loss: 0.3470215651007977
Epoch: 31, step: 710, loss: 0.34586894512176514, mean loss: 0.34702153975456396
Epoch: 31, step: 711, loss: 0.28747299313545227, mean loss: 0.3470202303045987
Epoch: 31, step: 712, loss: 0.30852746963500977, mean loss: 0.34701938388199677
Epoch: 31, step: 713, loss: 0.3037585914134979, mean loss: 0.3470184326354057
Epoch: 31, step: 714, loss: 0.3441287577152252, mean loss: 0.3470183690967413
Epoch: 31, step: 715, loss: 0.3794557452201843, mean loss: 0.3470190823196112
Epoch: 31, step: 716, loss: 0.31549447774887085, mean loss: 0.3470183891817169
Epoch: 31, step: 717, loss: 0.2924095094203949, mean loss: 0.34701718851156693
Epoch: 31, step: 718, loss: 0.3120366036891937, mean loss: 0.34701641942015204
Epoch: 31, step: 719, loss: 0.30180346965789795, mean loss: 0.34701542537939567
Epoch: 31, step: 720, loss: 0.36561450362205505, mean loss: 0.34701583428515015
Epoch: 31, step: 721, loss: 0.3291267454624176, mean loss: 0.3470154409973512
Epoch: 31, step: 722, loss: 0.35253432393074036, mean loss: 0.347015562326147
Epoch: 31, step: 723, loss: 0.3188723921775818, mean loss: 0.3470149436317628
Epoch: 31, step: 724, loss: 0.3000434935092926, mean loss: 0.3470139110425627
Epoch: 31, step: 725, loss: 0.33460086584091187, mean loss: 0.3470136381684101
Epoch: 31, step: 726, loss: 0.4118593633174896, mean loss: 0.34701506363114226
Epoch: 31, step: 727, loss: 0.3390977382659912, mean loss: 0.34701488959339133
Epoch: 31, step: 728, loss: 0.31226179003715515, mean loss: 0.34701412567147905
Epoch: 31, step: 729, loss: 0.3278608024120331, mean loss: 0.347013704663802
Epoch: 31, step: 730, loss: 0.3211873769760132, mean loss: 0.3470131369898227
Epoch: 31, step: 731, loss: 0.3502644896507263, mean loss: 0.3470132084544056
Epoch: 31, step: 732, loss: 0.3631126284599304, mean loss: 0.3470135623111435
Epoch: 31, step: 733, loss: 0.3444923162460327, mean loss: 0.3470135068967063
Epoch: 31, step: 734, loss: 0.3118150234222412, mean loss: 0.3470127332866605
Epoch: 31, step: 735, loss: 0.33169469237327576, mean loss: 0.34701239662642064
Epoch: 31, step: 736, loss: 0.35995346307754517, mean loss: 0.3470126810392127
Epoch: 31, step: 737, loss: 0.3197121322154999, mean loss: 0.3470120810535236
Epoch: 31, step: 738, loss: 0.3301665484905243, mean loss: 0.34701171084644794
Epoch: 31, step: 739, loss: 0.3195902705192566, mean loss: 0.347011108230407
Epoch: 31, step: 740, loss: 0.3268464207649231, mean loss: 0.34701066509915846
Epoch: 31, step: 741, loss: 0.30662867426872253, mean loss: 0.34700977769989616
Epoch: 31, step: 742, loss: 0.3747082054615021, mean loss: 0.3470103863629098
Epoch: 31, step: 743, loss: 0.30870676040649414, mean loss: 0.34700954467296613
Epoch: 31, step: 744, loss: 0.3476943373680115, mean loss: 0.3470095597203786
Epoch: 31, step: 745, loss: 0.3169357478618622, mean loss: 0.3470088989027153
Epoch: 31, step: 746, loss: 0.32995226979255676, mean loss: 0.3470085241223521
Epoch: 31, step: 747, loss: 0.31971290707588196, mean loss: 0.3470079243768554
Epoch: 31, step: 748, loss: 0.33704453706741333, mean loss: 0.34700770546385673
Epoch: 31, step: 749, loss: 0.30952537059783936, mean loss: 0.3470068819296724
Epoch: 31, step: 750, loss: 0.3665573000907898, mean loss: 0.3470073114675865
Epoch: 31, step: 751, loss: 0.3510685861110687, mean loss: 0.3470074006949932
Epoch: 31, step: 752, loss: 0.33248311281204224, mean loss: 0.34700708159909754
Epoch: 31, step: 753, loss: 0.3101707696914673, mean loss: 0.3470062723299753
Epoch: 31, step: 754, loss: 0.32387280464172363, mean loss: 0.3470057641143359
Epoch: 31, step: 755, loss: 0.3596249222755432, mean loss: 0.3470060413366154
Epoch: 31, step: 756, loss: 0.3377703130245209, mean loss: 0.34700583844721683
Epoch: 31, step: 757, loss: 0.3026190400123596, mean loss: 0.34700486338464415
Epoch: 31, step: 758, loss: 0.3437884747982025, mean loss: 0.3470047927305004
Epoch: 31, step: 759, loss: 0.36958450078964233, mean loss: 0.3470052887261963
Epoch: 31, step: 760, loss: 0.33723002672195435, mean loss: 0.34700507400325276
Epoch: 31, step: 761, loss: 0.3565182685852051, mean loss: 0.3470052829650456
Epoch: 31, step: 762, loss: 0.29897037148475647, mean loss: 0.34700422787880053
Epoch: 31, step: 763, loss: 0.32371577620506287, mean loss: 0.3470037163594789
Epoch: 31, step: 764, loss: 0.34768790006637573, mean loss: 0.34700373138690555
Epoch: 31, step: 765, loss: 0.3249753415584564, mean loss: 0.3470032475654729
Epoch: 31, step: 766, loss: 0.34233859181404114, mean loss: 0.34700314511536745
Epoch: 31, step: 767, loss: 0.3418720066547394, mean loss: 0.3470030324223502
Epoch: 31, step: 768, loss: 0.315010130405426, mean loss: 0.3470023297912471
Epoch: 31, step: 769, loss: 0.32929670810699463, mean loss: 0.3470019409472693
Epoch: 31, step: 770, loss: 0.3321477174758911, mean loss: 0.3470016147317544
Epoch: 31, step: 771, loss: 0.3247468173503876, mean loss: 0.3470011260020157
Epoch: 31, step: 772, loss: 0.34225699305534363, mean loss: 0.3470010218200769
Epoch: 31, step: 773, loss: 0.31997549533843994, mean loss: 0.34700042834810885
Epoch: 31, step: 774, loss: 0.3293033540248871, mean loss: 0.34700003973451776
Epoch: 31, step: 775, loss: 0.3592834770679474, mean loss: 0.34700030946304944
Epoch: 31, step: 776, loss: 0.3562358617782593, mean loss: 0.3470005122594816
Epoch: 31, step: 777, loss: 0.3197648227214813, mean loss: 0.3469999142249302
Epoch: 31, step: 778, loss: 0.31664201617240906, mean loss: 0.3469992476483311
Epoch: 31, step: 779, loss: 0.35709965229034424, mean loss: 0.3469994694207851
Epoch: 31, step: 780, loss: 0.29978126287460327, mean loss: 0.34699843268334857
Epoch: 31, step: 781, loss: 0.30818769335746765, mean loss: 0.34699758056155244
Epoch: 31, step: 782, loss: 0.3301268517971039, mean loss: 0.3469972101589186
Epoch: 31, step: 783, loss: 0.3070477545261383, mean loss: 0.3469963330741809
Epoch: 31, step: 784, loss: 0.2999708354473114, mean loss: 0.3469953006585927
Epoch: 31, step: 785, loss: 0.31399214267730713, mean loss: 0.34699457611066775
Epoch: 31, step: 786, loss: 0.30167508125305176, mean loss: 0.34699358119299617
Epoch: 31, step: 787, loss: 0.3243400752544403, mean loss: 0.3469930838821001
Epoch: 31, step: 788, loss: 0.3449411392211914, mean loss: 0.3469930388368855
Epoch: 31, step: 789, loss: 0.35771530866622925, mean loss: 0.34699327421182136
Epoch: 31, step: 790, loss: 0.35690441727638245, mean loss: 0.34699349177615163
Epoch: 31, step: 791, loss: 0.33291998505592346, mean loss: 0.34699318284853026
Epoch: 31, step: 792, loss: 0.34686335921287537, mean loss: 0.3469931799988335
Epoch: 31, step: 793, loss: 0.30882754921913147, mean loss: 0.34699234226164616
Epoch: 31, step: 794, loss: 0.32989954948425293, mean loss: 0.346991967082367
Epoch: 31, step: 795, loss: 0.3481310307979584, mean loss: 0.3469919920837655
Epoch: 31, step: 796, loss: 0.32651519775390625, mean loss: 0.3469915426468715
Epoch: 31, step: 797, loss: 0.31629785895347595, mean loss: 0.34699086897838255
Epoch: 31, step: 798, loss: 0.3466806709766388, mean loss: 0.34699086217027064
Epoch: 31, step: 799, loss: 0.374742716550827, mean loss: 0.3469914712444165
Epoch: 31, step: 800, loss: 0.34606048464775085, mean loss: 0.34699145081236127
Epoch: 31, step: 801, loss: 0.3384249210357666, mean loss: 0.3469912628096887
Epoch: 31, step: 802, loss: 0.34650999307632446, mean loss: 0.3469912522478845
Epoch: 31, step: 803, loss: 0.3280659019947052, mean loss: 0.3469908369268203
Epoch: 31, step: 804, loss: 0.3126528561115265, mean loss: 0.3469900833886515
Epoch: 31, step: 805, loss: 0.2925484776496887, mean loss: 0.3469888887078146
Epoch: 31, step: 806, loss: 0.30918556451797485, mean loss: 0.34698805915998393
Epoch: 31, step: 807, loss: 0.30975764989852905, mean loss: 0.3469872422019996
Epoch: 31, step: 808, loss: 0.32732096314430237, mean loss: 0.3469868106684368
Epoch: 31, step: 809, loss: 0.3257671296596527, mean loss: 0.346986345059076
Epoch: 31, step: 810, loss: 0.3679567873477936, mean loss: 0.34698680518946085
Epoch: 31, step: 811, loss: 0.3235526382923126, mean loss: 0.34698629101167217
Epoch: 31, step: 812, loss: 0.3684737980365753, mean loss: 0.3469867624667268
Epoch: 31, step: 813, loss: 0.333503782749176, mean loss: 0.3469864666446258
Epoch: 31, step: 814, loss: 0.3354804813861847, mean loss: 0.34698621420413217
Epoch: 31, step: 815, loss: 0.3572113513946533, mean loss: 0.34698643853798894
Epoch: 31, step: 816, loss: 0.32237446308135986, mean loss: 0.3469858985767012
Epoch: 31, step: 817, loss: 0.34202146530151367, mean loss: 0.3469857896645588
Epoch: 31, step: 818, loss: 0.3360079526901245, mean loss: 0.3469855488327361
Epoch: 31, step: 819, loss: 0.3418571650981903, mean loss: 0.3469854363287054
Epoch: 31, step: 820, loss: 0.33317428827285767, mean loss: 0.3469851333529885
Epoch: 31, step: 821, loss: 0.3412987291812897, mean loss: 0.3469850086128452
Epoch: 31, step: 822, loss: 0.3351750373840332, mean loss: 0.346984749548392
Epoch: 31, step: 823, loss: 0.28926512598991394, mean loss: 0.3469834834339856
Epoch: 31, step: 824, loss: 0.302846223115921, mean loss: 0.34698251527806384
Epoch: 31, step: 825, loss: 0.34461936354637146, mean loss: 0.34698246344319367
Epoch: 31, step: 826, loss: 0.35360047221183777, mean loss: 0.346982608603615
Epoch: 31, step: 827, loss: 0.3770710527896881, mean loss: 0.34698326855369804
Epoch: 31, step: 828, loss: 0.32752907276153564, mean loss: 0.3469828418610963
Epoch: 31, step: 829, loss: 0.3541545867919922, mean loss: 0.34698299915690123
Epoch: 31, step: 830, loss: 0.3103249669075012, mean loss: 0.34698219516452816
Epoch: 31, step: 831, loss: 0.3045821189880371, mean loss: 0.34698126525672535
Epoch: 31, step: 832, loss: 0.3232496678829193, mean loss: 0.34698074479271734
Epoch: 31, step: 833, loss: 0.2936786115169525, mean loss: 0.34697957583501576
Epoch: 31, step: 834, loss: 0.3033874034881592, mean loss: 0.34697861984535927
Epoch: 31, step: 835, loss: 0.3334209620952606, mean loss: 0.34697832252830335
Epoch: 31, step: 836, loss: 0.3534987270832062, mean loss: 0.3469784655164956
Epoch: 31, step: 837, loss: 0.35040849447250366, mean loss: 0.34697854073312984
Epoch: 31, step: 838, loss: 0.30034783482551575, mean loss: 0.3469775181972022
Epoch: 31, step: 839, loss: 0.2947273850440979, mean loss: 0.34697637246145197
Epoch: 31, step: 840, loss: 0.32423704862594604, mean loss: 0.3469758738467423
Epoch: 31, step: 841, loss: 0.328563928604126, mean loss: 0.346975470129134
Epoch: 31, step: 842, loss: 0.3358248770236969, mean loss: 0.34697522563611527
Epoch: 31, step: 843, loss: 0.315311074256897, mean loss: 0.34697453136863193
Epoch: 31, step: 844, loss: 0.39727863669395447, mean loss: 0.3469756343111504
Epoch: 31, step: 845, loss: 0.3804274797439575, mean loss: 0.3469763677434116
Epoch: 31, step: 846, loss: 0.31838515400886536, mean loss: 0.34697574089432404
Epoch: 31, step: 847, loss: 0.3574582040309906, mean loss: 0.34697597071242314
Epoch: 31, step: 848, loss: 0.3730609714984894, mean loss: 0.3469765425888791
Epoch: 31, step: 849, loss: 0.3149939179420471, mean loss: 0.3469758414307994
Epoch: 31, step: 850, loss: 0.30196109414100647, mean loss: 0.3469748545899074
Epoch: 31, step: 851, loss: 0.3220468759536743, mean loss: 0.34697430811545465
Epoch: 31, step: 852, loss: 0.3780803680419922, mean loss: 0.3469749900116759
Epoch: 31, step: 853, loss: 0.29661962389945984, mean loss: 0.3469738861630611
Epoch: 31, step: 854, loss: 0.3340948820114136, mean loss: 0.3469736038463914
Epoch: 31, step: 855, loss: 0.3359690308570862, mean loss: 0.34697336262383577
Epoch: 31, step: 856, loss: 0.3408103883266449, mean loss: 0.3469732275331035
Epoch: 31, step: 857, loss: 0.32622459530830383, mean loss: 0.3469727727386573
Epoch: 31, step: 858, loss: 0.30303487181663513, mean loss: 0.3469718096739548
Epoch: 31, step: 859, loss: 0.3654269576072693, mean loss: 0.34697221417921376
Epoch: 31, step: 860, loss: 0.33494919538497925, mean loss: 0.3469719506609936
Epoch: 31, step: 861, loss: 0.3264204263687134, mean loss: 0.3469715002264981
Epoch: 31, step: 862, loss: 0.29784923791885376, mean loss: 0.3469704236213672
Epoch: 31, step: 863, loss: 0.33390501141548157, mean loss: 0.3469701372749964
Epoch: 31, step: 864, loss: 0.34079810976982117, mean loss: 0.34697000200954015
Epoch: 31, step: 865, loss: 0.3565236032009125, mean loss: 0.3469702113805941
Epoch: 31, step: 866, loss: 0.3392118811607361, mean loss: 0.3469700413573594
Epoch: 31, step: 867, loss: 0.3152613639831543, mean loss: 0.3469693464792613
Epoch: 31, step: 868, loss: 0.33453452587127686, mean loss: 0.3469690739830281
Epoch: 31, step: 869, loss: 0.31706106662750244, mean loss: 0.34696841859434085
Epoch: 31, step: 870, loss: 0.3227629065513611, mean loss: 0.3469678881788255
Epoch: 31, step: 871, loss: 0.3245455324649811, mean loss: 0.3469673968483909
Epoch: 31, step: 872, loss: 0.30043452978134155, mean loss: 0.34696637721811135
Epoch: 31, step: 873, loss: 0.31542059779167175, mean loss: 0.34696568600071737
Epoch: 31, step: 874, loss: 0.32007771730422974, mean loss: 0.3469650968561547
Epoch: 31, step: 875, loss: 0.3052598536014557, mean loss: 0.34696418306905447
Epoch: 31, step: 876, loss: 0.38058918714523315, mean loss: 0.34696491979708577
Epoch: 31, step: 877, loss: 0.30173179507255554, mean loss: 0.3469639287553978
Epoch: 31, step: 878, loss: 0.32946887612342834, mean loss: 0.3469635454534099
Epoch: 31, step: 879, loss: 0.3477935194969177, mean loss: 0.34696356363704944
Epoch: 31, step: 880, loss: 0.31473830342292786, mean loss: 0.34696285763945467
Epoch: 31, step: 881, loss: 0.3145883083343506, mean loss: 0.3469621483867424
Epoch: 31, step: 882, loss: 0.33178192377090454, mean loss: 0.34696181582984675
Epoch: 31, step: 883, loss: 0.3376353085041046, mean loss: 0.3469616115162443
Epoch: 31, step: 884, loss: 0.3172297477722168, mean loss: 0.3469609602015661
Epoch: 31, step: 885, loss: 0.329190194606781, mean loss: 0.3469605709186396
Epoch: 31, step: 886, loss: 0.35429567098617554, mean loss: 0.3469607315963918
Epoch: 31, step: 887, loss: 0.3020325303077698, mean loss: 0.34695974745109065
Epoch: 31, step: 888, loss: 0.31519991159439087, mean loss: 0.34695905177203656
Epoch: 31, step: 889, loss: 0.3152490258216858, mean loss: 0.34695835719925106
Epoch: 31, step: 890, loss: 0.33256128430366516, mean loss: 0.3469580418543185
Epoch: 31, step: 891, loss: 0.32623836398124695, mean loss: 0.3469575880327425
Epoch: 31, step: 892, loss: 0.3818378746509552, mean loss: 0.34695835199635416
Epoch: 31, step: 893, loss: 0.3380982577800751, mean loss: 0.34695815794286483
Epoch: 31, step: 894, loss: 0.33055251836776733, mean loss: 0.3469577986349611
Epoch: 31, step: 895, loss: 0.31836235523223877, mean loss: 0.3469571723659422
Epoch: 31, step: 896, loss: 0.34040215611457825, mean loss: 0.3469570288076265
Epoch: 31, step: 897, loss: 0.35497450828552246, mean loss: 0.34695720439081335
Epoch: 31, step: 898, loss: 0.35608598589897156, mean loss: 0.34695740430719
Epoch: 31, step: 899, loss: 0.3209281861782074, mean loss: 0.3469568342910257
Epoch: 31, step: 900, loss: 0.30665677785873413, mean loss: 0.34695595177582955
Epoch: 31, step: 901, loss: 0.3351854979991913, mean loss: 0.3469556940249038
Epoch: 31, step: 902, loss: 0.3639189898967743, mean loss: 0.3469560654812261
Epoch: 31, step: 903, loss: 0.3391382694244385, mean loss: 0.3469558942936099
Epoch: 31, step: 904, loss: 0.3060721158981323, mean loss: 0.3469549990741307
Epoch: 31, step: 905, loss: 0.32875877618789673, mean loss: 0.3469546006457776
Epoch: 31, step: 906, loss: 0.41600266098976135, mean loss: 0.34695611250363806
Epoch: 31, step: 907, loss: 0.3201512098312378, mean loss: 0.3469555256035095
Epoch: 31, step: 908, loss: 0.3275151252746582, mean loss: 0.34695509996034335
Epoch: 31, step: 909, loss: 0.3274249732494354, mean loss: 0.3469546723620005
Epoch: 31, step: 910, loss: 0.32523515820503235, mean loss: 0.3469541968389757
Epoch: 31, step: 911, loss: 0.30637067556381226, mean loss: 0.34695330833032184
Epoch: 31, step: 912, loss: 0.3242228925228119, mean loss: 0.34695281069659356
Epoch: 31, step: 913, loss: 0.3602158725261688, mean loss: 0.3469531010565443
Epoch: 31, step: 914, loss: 0.34291180968284607, mean loss: 0.34695301258500655
Epoch: 31, step: 915, loss: 0.34082821011543274, mean loss: 0.34695287850439205
Epoch: 31, step: 916, loss: 0.327205628156662, mean loss: 0.34695244621853255
Epoch: 31, step: 917, loss: 0.3374357521533966, mean loss: 0.3469522378937205
Epoch: 31, step: 918, loss: 0.36691024899482727, mean loss: 0.3469526747742034
Epoch: 31, step: 919, loss: 0.3370823860168457, mean loss: 0.3469524587184999
Epoch: 31, step: 920, loss: 0.3333503305912018, mean loss: 0.3469521609812092
Epoch: 31, step: 921, loss: 0.3227072060108185, mean loss: 0.34695163029445675
Epoch: 31, step: 922, loss: 0.3398662805557251, mean loss: 0.3469514752098651
Epoch: 31, step: 923, loss: 0.34938040375709534, mean loss: 0.346951528373246
Epoch: 31, step: 924, loss: 0.3295126259326935, mean loss: 0.3469511466861344
Epoch: 31, step: 925, loss: 0.30997535586357117, mean loss: 0.3469503374107826
Epoch: 31, step: 926, loss: 0.30532318353652954, mean loss: 0.3469494263527214
Epoch: 31, step: 927, loss: 0.38313108682632446, mean loss: 0.34695021821257593
Epoch: 31, step: 928, loss: 0.34373408555984497, mean loss: 0.3469501478269008
Epoch: 31, step: 929, loss: 0.3256573975086212, mean loss: 0.34694968184120645
Epoch: 31, step: 930, loss: 0.3350956439971924, mean loss: 0.3469494224246873
Epoch: 31, step: 931, loss: 0.3080127239227295, mean loss: 0.3469485703435751
Epoch: 31, step: 932, loss: 0.3780885338783264, mean loss: 0.3469492517879486
Epoch: 31, step: 933, loss: 0.30732616782188416, mean loss: 0.34694838472409534
Epoch: 31, step: 934, loss: 0.33298298716545105, mean loss: 0.34694807912884035
Epoch: 31, step: 935, loss: 0.348206490278244, mean loss: 0.3469481066651893
Epoch: 31, step: 936, loss: 0.3266950249671936, mean loss: 0.3469476635002324
Epoch: 31, step: 937, loss: 0.2969472408294678, mean loss: 0.3469465694469596
Epoch: 31, step: 938, loss: 0.38020768761634827, mean loss: 0.34694729721358697
Epoch: 31, step: 939, loss: 0.32368868589401245, mean loss: 0.34694678831696263
Epoch: 31, step: 940, loss: 0.2944939434528351, mean loss: 0.34694564067786704
Epoch: 31, step: 941, loss: 0.3524811863899231, mean loss: 0.34694576178988107
Epoch: 31, step: 942, loss: 0.3178194463253021, mean loss: 0.3469451245501702
Epoch: 31, step: 943, loss: 0.3249569237232208, mean loss: 0.3469446434921316
Epoch: 31, step: 944, loss: 0.31791508197784424, mean loss: 0.3469440083970406
Epoch: 31, step: 945, loss: 0.33770492672920227, mean loss: 0.34694380627318
Epoch: 31, step: 946, loss: 0.34032493829727173, mean loss: 0.34694366147503564
Epoch: 31, step: 947, loss: 0.3508216142654419, mean loss: 0.34694374630949465
Epoch: 31, step: 948, loss: 0.30901458859443665, mean loss: 0.34694291658583365
Epoch: 31, step: 949, loss: 0.3268272876739502, mean loss: 0.346942476553701
Epoch: 31, step: 950, loss: 0.34975090622901917, mean loss: 0.3469425379871402
Epoch: 31, step: 951, loss: 0.318445086479187, mean loss: 0.3469419146287644
Epoch: 31, step: 952, loss: 0.3294326066970825, mean loss: 0.3469415316353936
Epoch: 31, step: 953, loss: 0.3086462616920471, mean loss: 0.3469406939944219
Epoch: 31, step: 954, loss: 0.3256092071533203, mean loss: 0.3469402274162631
Epoch: 31, step: 955, loss: 0.3297875225543976, mean loss: 0.3469398522477403
Epoch: 31, step: 956, loss: 0.31030136346817017, mean loss: 0.3469390508984964
Epoch: 31, step: 957, loss: 0.32126015424728394, mean loss: 0.3469384892674074
Epoch: 31, step: 958, loss: 0.29839250445365906, mean loss: 0.34693742752638396
Epoch: 31, step: 959, loss: 0.3695746064186096, mean loss: 0.34693792260946704
Epoch: 31, step: 960, loss: 0.3171168863773346, mean loss: 0.3469372704271547
Epoch: 31, step: 961, loss: 0.3086617887020111, mean loss: 0.346936433365489
Epoch: 31, step: 962, loss: 0.29793694615364075, mean loss: 0.3469353617997355
Epoch: 31, step: 963, loss: 0.331770658493042, mean loss: 0.3469350301713392
Epoch: 31, step: 964, loss: 0.34855395555496216, mean loss: 0.3469350655739368
Epoch: 31, step: 965, loss: 0.34504491090774536, mean loss: 0.34693502424101164
Epoch: 31, step: 966, loss: 0.36274799704551697, mean loss: 0.34693537002336505
Epoch: 31, step: 967, loss: 0.300199031829834, mean loss: 0.3469343480619771
Epoch: 31, step: 968, loss: 0.32708197832107544, mean loss: 0.3469339139690958
Epoch: 31, step: 969, loss: 0.2949290871620178, mean loss: 0.3469327768538903
Epoch: 31, step: 970, loss: 0.3299485445022583, mean loss: 0.34693240549208093
Epoch: 31, step: 971, loss: 0.33296868205070496, mean loss: 0.34693210018065357
Epoch: 31, step: 972, loss: 0.2805812656879425, mean loss: 0.34693064947696745
Epoch: 31, step: 973, loss: 0.3477686047554016, mean loss: 0.34693066779773524
Epoch: 31, step: 974, loss: 0.30184292793273926, mean loss: 0.34692968203635294
Epoch: 31, step: 975, loss: 0.30017462372779846, mean loss: 0.3469286598444354
Epoch: 31, step: 976, loss: 0.3522625267505646, mean loss: 0.3469287764546299
Epoch: 31, step: 977, loss: 0.31380775570869446, mean loss: 0.3469280523712766
Epoch: 31, step: 978, loss: 0.3090105652809143, mean loss: 0.3469272234469146
Epoch: 31, step: 979, loss: 0.29836878180503845, mean loss: 0.34692616192099557
Epoch: 31, step: 980, loss: 0.3200003206729889, mean loss: 0.3469255733136888
Epoch: 31, step: 981, loss: 0.349936842918396, mean loss: 0.3469256391395447
Epoch: 31, step: 982, loss: 0.36275267601013184, mean loss: 0.3469259851083923
Epoch: 31, step: 983, loss: 0.37575268745422363, mean loss: 0.34692661522779306
Epoch: 31, step: 984, loss: 0.3271588385105133, mean loss: 0.3469261831357972
Epoch: 31, step: 985, loss: 0.29780182242393494, mean loss: 0.3469251093792789
Epoch: 31, step: 986, loss: 0.3528629243373871, mean loss: 0.34692523916474716
Epoch: 31, step: 987, loss: 0.3281080722808838, mean loss: 0.3469248278785327
Epoch: 31, step: 988, loss: 0.289048969745636, mean loss: 0.34692356291540166
Epoch: 31, step: 989, loss: 0.30068740248680115, mean loss: 0.34692255237729724
Epoch: 31, step: 990, loss: 0.3288269639015198, mean loss: 0.3469221568885315
Epoch: 31, step: 991, loss: 0.3413199782371521, mean loss: 0.3469220344525963
Epoch: 31, step: 992, loss: 0.2971716523170471, mean loss: 0.3469209471789084
Epoch: 31, step: 993, loss: 0.31035441160202026, mean loss: 0.34692014805010957
Epoch: 31, step: 994, loss: 0.2956448197364807, mean loss: 0.3469190274983424
Epoch: 31, step: 995, loss: 0.33309322595596313, mean loss: 0.34691872536107093
Epoch: 31, step: 996, loss: 0.34928080439567566, mean loss: 0.34691877697880297
Epoch: 31, step: 997, loss: 0.3153928518295288, mean loss: 0.3469180880682407
Epoch: 31, step: 998, loss: 0.34726983308792114, mean loss: 0.34691809575447236
Epoch: 31, step: 999, loss: 0.35353073477745056, mean loss: 0.3469182402488134
Epoch: 31, step: 1000, loss: 0.37958526611328125, mean loss: 0.34691895404813305
Epoch: 31, step: 1001, loss: 0.3202767074108124, mean loss: 0.34691837190753444
Epoch: 31, step: 1002, loss: 0.3320273756980896, mean loss: 0.3469180465421793
Epoch: 31, step: 1003, loss: 0.3269190788269043, mean loss: 0.3469176095781932
Epoch: 31, step: 1004, loss: 0.32397666573524475, mean loss: 0.34691710834496015
Epoch: 31, step: 1005, loss: 0.29911914467811584, mean loss: 0.34691606403725495
Epoch: 31, step: 1006, loss: 0.3140084445476532, mean loss: 0.3469153450750411
Epoch: 31, step: 1007, loss: 0.36989328265190125, mean loss: 0.34691584708363976
Epoch: 31, step: 1008, loss: 0.300582617521286, mean loss: 0.34691483484433794
Epoch: 31, step: 1009, loss: 0.29224836826324463, mean loss: 0.3469136405753953
Epoch: 31, step: 1010, loss: 0.33336228132247925, mean loss: 0.3469133445325935
Epoch: 31, step: 1011, loss: 0.3040068745613098, mean loss: 0.3469124072189363
Epoch: 31, step: 1012, loss: 0.37748369574546814, mean loss: 0.3469130750496925
Epoch: 31, step: 1013, loss: 0.356538861989975, mean loss: 0.3469132853207166
Epoch: 31, step: 1014, loss: 0.3050899803638458, mean loss: 0.3469123717292236
Epoch: 31, step: 1015, loss: 0.34757503867149353, mean loss: 0.34691238620425513
Epoch: 31, step: 1016, loss: 0.32845520973205566, mean loss: 0.34691198304188486
Epoch: 31, step: 1017, loss: 0.337502121925354, mean loss: 0.3469117775056235
Epoch: 31, step: 1018, loss: 0.3577878773212433, mean loss: 0.3469120150632282
Epoch: 31, step: 1019, loss: 0.31655246019363403, mean loss: 0.3469113519591991
Epoch: 31, step: 1020, loss: 0.32818803191185, mean loss: 0.3469109430191522
Epoch: 31, step: 1021, loss: 0.394530326128006, mean loss: 0.34691198306159116
Epoch: 31, step: 1022, loss: 0.29546090960502625, mean loss: 0.3469108593567523
Epoch: 31, step: 1023, loss: 0.3419708013534546, mean loss: 0.34691075146695577
Epoch: 31, step: 1024, loss: 0.3312339186668396, mean loss: 0.3469104090958011
Epoch: 31, step: 1025, loss: 0.2916252315044403, mean loss: 0.3469092017322372
Epoch: 31, step: 1026, loss: 0.34985384345054626, mean loss: 0.3469092660383611
Epoch: 31, step: 1027, loss: 0.3325195014476776, mean loss: 0.34690895179647185
Epoch: 31, step: 1028, loss: 0.3215424716472626, mean loss: 0.3469083978585305
Epoch: 31, step: 1029, loss: 0.34566766023635864, mean loss: 0.34690837076464
Epoch: 31, step: 1030, loss: 0.34979939460754395, mean loss: 0.3469084338943232
Epoch: 31, step: 1031, loss: 0.3424570560455322, mean loss: 0.346908336694178
Epoch: 31, step: 1032, loss: 0.3185657262802124, mean loss: 0.3469077178193518
Epoch: 31, step: 1033, loss: 0.34344610571861267, mean loss: 0.346907642235001
Epoch: 31, step: 1034, loss: 0.33901461958885193, mean loss: 0.3469074698944991
Epoch: 31, step: 1035, loss: 0.3231765329837799, mean loss: 0.3469069517517718
Epoch: 31, step: 1036, loss: 0.3330554664134979, mean loss: 0.3469066493241973
Epoch: 31, step: 1037, loss: 0.3362593650817871, mean loss: 0.34690641686089346
Epoch: 31, step: 1038, loss: 0.3002520799636841, mean loss: 0.3469053982739691
Epoch: 31, step: 1039, loss: 0.32916706800460815, mean loss: 0.3469050110080039
Epoch: 31, step: 1040, loss: 0.33368808031082153, mean loss: 0.3469047224602319
Epoch: 31, step: 1041, loss: 0.38276049494743347, mean loss: 0.34690550523481356
Epoch: 31, step: 1042, loss: 0.3184865415096283, mean loss: 0.34690488482824416
Epoch: 31, step: 1043, loss: 0.34699440002441406, mean loss: 0.34690488678238307
Epoch: 31, step: 1044, loss: 0.31189486384391785, mean loss: 0.34690412252158415
Epoch: 31, step: 1045, loss: 0.35068443417549133, mean loss: 0.3469042050431221
Epoch: 31, step: 1046, loss: 0.3087841868400574, mean loss: 0.3469033729281671
Epoch: 31, step: 1047, loss: 0.33229169249534607, mean loss: 0.34690305397941057
Epoch: 31, step: 1048, loss: 0.32344672083854675, mean loss: 0.34690254197772674
Epoch: 31, step: 1049, loss: 0.3442634344100952, mean loss: 0.3469024843728992
Epoch: 31, step: 1050, loss: 0.3865717351436615, mean loss: 0.34690335023016805
Epoch: 31, step: 1051, loss: 0.35111844539642334, mean loss: 0.3469034422306737
Epoch: 31, step: 1052, loss: 0.3294210731983185, mean loss: 0.34690306066119003
Epoch: 31, step: 1053, loss: 0.33231523633003235, mean loss: 0.3469027422748717
Epoch: 31, step: 1054, loss: 0.28483641147613525, mean loss: 0.3469013876767618
Epoch: 31, step: 1055, loss: 0.34200456738471985, mean loss: 0.34690128080595667
Epoch: 31, step: 1056, loss: 0.346203476190567, mean loss: 0.3469012655770307
Epoch: 31, step: 1057, loss: 0.3232613503932953, mean loss: 0.3469007496694932
Epoch: 31, step: 1058, loss: 0.33905312418937683, mean loss: 0.3469005784099624
Epoch: 31, step: 1059, loss: 0.30574852228164673, mean loss: 0.3468996803640448
Epoch: 31, step: 1060, loss: 0.31596115231513977, mean loss: 0.34689900521886097
Epoch: 31, step: 1061, loss: 0.33693307638168335, mean loss: 0.3468987877456179
Epoch: 31, step: 1062, loss: 0.32698285579681396, mean loss: 0.3468983531561412
Epoch: 31, step: 1063, loss: 0.3140822947025299, mean loss: 0.3468976370860868
Epoch: 31, step: 1064, loss: 0.32779359817504883, mean loss: 0.3468972202312806
Epoch: 31, step: 1065, loss: 0.3380184769630432, mean loss: 0.34689702649915605
Epoch: 31, step: 1066, loss: 0.3029669225215912, mean loss: 0.3468960679753626
Epoch: 31, step: 1067, loss: 0.33197975158691406, mean loss: 0.34689574251899175
Epoch: 31, step: 1068, loss: 0.3465541899204254, mean loss: 0.3468957350668809
Epoch: 31, step: 1069, loss: 0.3276061415672302, mean loss: 0.34689531420914427
Epoch: 31, step: 1070, loss: 0.33722028136253357, mean loss: 0.3468951031251943
Epoch: 31, step: 1071, loss: 0.3676576316356659, mean loss: 0.3468955560994615
Epoch: 31, step: 1072, loss: 0.2997059226036072, mean loss: 0.34689452658981873
Epoch: 31, step: 1073, loss: 0.32030752301216125, mean loss: 0.34689394656879735
Epoch: 31, step: 1074, loss: 0.35112082958221436, mean loss: 0.3468940387802988
Epoch: 31, step: 1075, loss: 0.34663382172584534, mean loss: 0.34689403310366146
Epoch: 31, step: 1076, loss: 0.35327473282814026, mean loss: 0.3468941722956452
Epoch: 31, step: 1077, loss: 0.31961098313331604, mean loss: 0.34689357713860225
Epoch: 31, step: 1078, loss: 0.3034573793411255, mean loss: 0.3468926296395774
Epoch: 31, step: 1079, loss: 0.34721943736076355, mean loss: 0.34689263676826865
Epoch: 31, step: 1080, loss: 0.31766432523727417, mean loss: 0.3468919992219379
Epoch: 31, step: 1081, loss: 0.3608787953853607, mean loss: 0.3468923043040861
Epoch: 31, step: 1082, loss: 0.3462246358394623, mean loss: 0.3468922897411165
Epoch: 31, step: 1083, loss: 0.3317725658416748, mean loss: 0.3468919599617608
Epoch: 31, step: 1084, loss: 0.3293819725513458, mean loss: 0.3468915780562141
Epoch: 31, step: 1085, loss: 0.30063068866729736, mean loss: 0.34689056909461347
Epoch: 31, step: 1086, loss: 0.333273321390152, mean loss: 0.346890272105503
Epoch: 31, step: 1087, loss: 0.3107108175754547, mean loss: 0.34688948305694395
Epoch: 31, step: 1088, loss: 0.325101375579834, mean loss: 0.34688900788394594
Epoch: 31, step: 1089, loss: 0.37300488352775574, mean loss: 0.3468895774280565
Epoch: 31, step: 1090, loss: 0.36509525775909424, mean loss: 0.3468899744552145
Epoch: 31, step: 1091, loss: 0.3272853493690491, mean loss: 0.34688954692937085
Epoch: 31, step: 1092, loss: 0.3341658413410187, mean loss: 0.3468892694645217
Epoch: 31, step: 1093, loss: 0.33015552163124084, mean loss: 0.34688890456095345
Epoch: 31, step: 1094, loss: 0.3066087067127228, mean loss: 0.3468880262121485
Epoch: 31, step: 1095, loss: 0.3327208161354065, mean loss: 0.3468877172891202
Epoch: 31, step: 1096, loss: 0.4032686650753021, mean loss: 0.346888946676787
Epoch: 31, step: 1097, loss: 0.33257266879081726, mean loss: 0.34688863451687496
Epoch: 31, step: 1098, loss: 0.35595688223838806, mean loss: 0.34688883224157074
Epoch: 31, step: 1099, loss: 0.32764261960983276, mean loss: 0.34688841260497927
Epoch: 31, step: 1100, loss: 0.3700263202190399, mean loss: 0.34688891708350567
Epoch: 31, step: 1101, loss: 0.3337705731391907, mean loss: 0.3468886310689427
Epoch: 31, step: 1102, loss: 0.32894179224967957, mean loss: 0.3468882397889632
Epoch: 31, step: 1103, loss: 0.33910223841667175, mean loss: 0.34688807004096084
Epoch: 31, step: 1104, loss: 0.29625675082206726, mean loss: 0.34688696621660847
Epoch: 31, step: 1105, loss: 0.325019896030426, mean loss: 0.34688648949827
Epoch: 31, step: 1106, loss: 0.3531394302845001, mean loss: 0.34688662581404217
Epoch: 31, step: 1107, loss: 0.3272372782230377, mean loss: 0.34688619746237687
Epoch: 31, step: 1108, loss: 0.3142639696598053, mean loss: 0.34688548632014066
Epoch: 31, step: 1109, loss: 0.3112894296646118, mean loss: 0.3468847103673863
Epoch: 31, step: 1110, loss: 0.3398650586605072, mean loss: 0.3468845573504553
Epoch: 31, step: 1111, loss: 0.3083173632621765, mean loss: 0.34688371666700235
Epoch: 31, step: 1112, loss: 0.2966324985027313, mean loss: 0.34688262132035447
Epoch: 31, step: 1113, loss: 0.3777354657649994, mean loss: 0.3468832938179447
Epoch: 31, step: 1114, loss: 0.34514328837394714, mean loss: 0.3468832558919776
Epoch: 31, step: 1115, loss: 0.32622772455215454, mean loss: 0.34688280568423263
Epoch: 31, step: 1116, loss: 0.3077962398529053, mean loss: 0.346881953772421
Epoch: 31, step: 1117, loss: 0.33603745698928833, mean loss: 0.3468817174161858
Epoch: 31, step: 1118, loss: 0.3681364059448242, mean loss: 0.34688218065286447
Epoch: 31, step: 1119, loss: 0.35973355174064636, mean loss: 0.3468824607367954
Epoch: 31, step: 1120, loss: 0.33156687021255493, mean loss: 0.34688212695472015
Epoch: 31, step: 1121, loss: 0.3416011929512024, mean loss: 0.3468820118665886
Epoch: 31, step: 1122, loss: 0.32556039094924927, mean loss: 0.3468815472116555
Epoch: 31, step: 1123, loss: 0.3138580024242401, mean loss: 0.3468808275563036
Epoch: 31, step: 1124, loss: 0.328878790140152, mean loss: 0.3468804352610386
Epoch: 31, step: 1125, loss: 0.3011236786842346, mean loss: 0.346879438164578
Epoch: 31, step: 1126, loss: 0.3256624937057495, mean loss: 0.3468789758311257
Epoch: 31, step: 1127, loss: 0.34830242395401, mean loss: 0.34687900684847345
Epoch: 31, step: 1128, loss: 0.327082097530365, mean loss: 0.34687857547747314
Epoch: 31, step: 1129, loss: 0.3697167932987213, mean loss: 0.3468790731071812
Epoch: 31, step: 1130, loss: 0.33048102259635925, mean loss: 0.34687871581225777
Epoch: 31, step: 1131, loss: 0.35289424657821655, mean loss: 0.346878846880995
Epoch: 31, step: 1132, loss: 0.34557247161865234, mean loss: 0.3468788184178
Epoch: 31, step: 1133, loss: 0.3110625147819519, mean loss: 0.34687803807217193
Epoch: 31, step: 1134, loss: 0.35640573501586914, mean loss: 0.3468782456517912
Epoch: 31, step: 1135, loss: 0.3048553466796875, mean loss: 0.3468773301202232
Epoch: 31, step: 1136, loss: 0.33865201473236084, mean loss: 0.3468771509233563
Epoch: 31, step: 1137, loss: 0.3526136875152588, mean loss: 0.3468772758969215
Epoch: 31, step: 1138, loss: 0.31786835193634033, mean loss: 0.34687664393552553
Epoch: 31, step: 1139, loss: 0.3226553201675415, mean loss: 0.3468761162838227
Epoch: 31, step: 1140, loss: 0.3503945767879486, mean loss: 0.34687619293038635
Epoch: 31, step: 1141, loss: 0.3608279824256897, mean loss: 0.3468764968512136
Epoch: 31, step: 1142, loss: 0.33340126276016235, mean loss: 0.34687620331789426
Epoch: 31, step: 1143, loss: 0.33993491530418396, mean loss: 0.3468760521179288
Epoch: 31, step: 1144, loss: 0.37093618512153625, mean loss: 0.34687657620107165
Epoch: 31, step: 1145, loss: 0.32643234729766846, mean loss: 0.3468761308900522
Epoch: 31, step: 1146, loss: 0.30400609970092773, mean loss: 0.34687519712622245
Epoch: 31, step: 1147, loss: 0.2708120048046112, mean loss: 0.34687354040919155
Epoch: 31, step: 1148, loss: 0.3352566957473755, mean loss: 0.34687328739055495
Epoch: 31, step: 1149, loss: 0.2974393963813782, mean loss: 0.3468722107278593
Epoch: 31, step: 1150, loss: 0.33739686012268066, mean loss: 0.34687200436064586
Epoch: 31, step: 1151, loss: 0.35405805706977844, mean loss: 0.3468721608649735
Epoch: 31, step: 1152, loss: 0.3234432339668274, mean loss: 0.346871650619816
Epoch: 31, step: 1153, loss: 0.3181155323982239, mean loss: 0.34687102437045364
Epoch: 31, step: 1154, loss: 0.35254988074302673, mean loss: 0.34687114804162184
Epoch: 31, step: 1155, loss: 0.30607882142066956, mean loss: 0.3468702597069829
Epoch: 31, step: 1156, loss: 0.34158140420913696, mean loss: 0.3468701445340664
Epoch: 31, step: 1157, loss: 0.3224271535873413, mean loss: 0.34686961226214996
Epoch: 31, step: 1158, loss: 0.36513587832450867, mean loss: 0.34687001002070367
Epoch: 31, step: 1159, loss: 0.3484196364879608, mean loss: 0.34687004376398534
Epoch: 31, step: 1160, loss: 0.35122784972190857, mean loss: 0.34687013865360883
Epoch: 31, step: 1161, loss: 0.34170886874198914, mean loss: 0.3468700262713001
Epoch: 31, step: 1162, loss: 0.3438207805156708, mean loss: 0.3468699598779856
Epoch: 31, step: 1163, loss: 0.33432337641716003, mean loss: 0.3468696866985861
Epoch: 31, step: 1164, loss: 0.32912445068359375, mean loss: 0.3468693003362439
Epoch: 31, step: 1165, loss: 0.33026430010795593, mean loss: 0.34686893880782615
Epoch: 31, step: 1166, loss: 0.3577975928783417, mean loss: 0.346869176744167
Epoch: 31, step: 1167, loss: 0.37385982275009155, mean loss: 0.3468697643659994
Epoch: 31, step: 1168, loss: 0.32032033801078796, mean loss: 0.34686918636268255
Epoch: 31, step: 1169, loss: 0.3672594726085663, mean loss: 0.3468696302666806
Epoch: 31, step: 1170, loss: 0.3074740767478943, mean loss: 0.3468687726297258
Epoch: 31, step: 1171, loss: 0.3328213393688202, mean loss: 0.34686846682527483
Epoch: 31, step: 1172, loss: 0.3512537479400635, mean loss: 0.3468685622882157
Epoch: 31, step: 1173, loss: 0.3022337257862091, mean loss: 0.34686759065609196
Epoch: 31, step: 1174, loss: 0.36100536584854126, mean loss: 0.34686789840713556
Epoch: 31, step: 1175, loss: 0.330112099647522, mean loss: 0.3468675336749031
Epoch: 31, step: 1176, loss: 0.33393335342407227, mean loss: 0.34686725213596725
Epoch: 31, step: 1177, loss: 0.34785839915275574, mean loss: 0.3468672737098434
Epoch: 31, step: 1178, loss: 0.3358093500137329, mean loss: 0.34686703302195415
Epoch: 31, step: 1179, loss: 0.31137529015541077, mean loss: 0.34686626052189173
Epoch: 31, step: 1180, loss: 0.31116247177124023, mean loss: 0.3468654834234316
Epoch: 31, step: 1181, loss: 0.3285568058490753, mean loss: 0.3468650849409179
Epoch: 31, step: 1182, loss: 0.32247424125671387, mean loss: 0.34686455409355715
Epoch: 31, step: 1183, loss: 0.35695531964302063, mean loss: 0.3468647737062835
Epoch: 31, step: 1184, loss: 0.3445873558521271, mean loss: 0.3468647241422483
Epoch: 31, step: 1185, loss: 0.3580648899078369, mean loss: 0.3468649678890549
Epoch: 31, step: 1186, loss: 0.3586274981498718, mean loss: 0.34686522386890867
Epoch: 31, step: 1187, loss: 0.3432828485965729, mean loss: 0.34686514590983675
Epoch: 31, step: 1188, loss: 0.3064609169960022, mean loss: 0.34686426665866893
Epoch: 31, step: 1189, loss: 0.3324829936027527, mean loss: 0.3468639537093488
Epoch: 31, step: 1190, loss: 0.3246895372867584, mean loss: 0.346863471184783
Epoch: 31, step: 1191, loss: 0.29422199726104736, mean loss: 0.34686232570924286
Epoch: 31, step: 1192, loss: 0.38487517833709717, mean loss: 0.3468631528488
Epoch: 31, step: 1193, loss: 0.34500956535339355, mean loss: 0.3468631125165946
Epoch: 31, step: 1194, loss: 0.3068518340587616, mean loss: 0.3468622419302359
Epoch: 31, step: 1195, loss: 0.29820939898490906, mean loss: 0.34686118333922317
Epoch: 31, step: 1196, loss: 0.31458136439323425, mean loss: 0.3468604810085744
Epoch: 31, step: 1197, loss: 0.3408227264881134, mean loss: 0.3468603496445232
Epoch: 31, step: 1198, loss: 0.34838926792144775, mean loss: 0.34686038290863297
Epoch: 31, step: 1199, loss: 0.33027926087379456, mean loss: 0.34686002216713885
Epoch: 31, step: 1200, loss: 0.301584392786026, mean loss: 0.346859037164868
Epoch: 31, step: 1201, loss: 0.31829071044921875, mean loss: 0.34685841565491027
Epoch: 31, step: 1202, loss: 0.3114684224128723, mean loss: 0.3468576457549115
Epoch: 31, step: 1203, loss: 0.2979934513568878, mean loss: 0.3468565827503345
Epoch: 31, step: 1204, loss: 0.35284125804901123, mean loss: 0.3468567129397077
Epoch: 31, step: 1205, loss: 0.3412996828556061, mean loss: 0.3468565920558686
Epoch: 31, step: 1206, loss: 0.39911141991615295, mean loss: 0.34685772874699694
Epoch: 31, step: 1207, loss: 0.308013916015625, mean loss: 0.34685688380197105
Epoch: 31, step: 1208, loss: 0.33806687593460083, mean loss: 0.3468566926026178
Epoch: 31, step: 1209, loss: 0.3421159088611603, mean loss: 0.34685658948381715
Epoch: 31, step: 1210, loss: 0.32435956597328186, mean loss: 0.3468561001521475
Epoch: 31, step: 1211, loss: 0.3607516288757324, mean loss: 0.3468564023865464
Epoch: 31, step: 1212, loss: 0.326704740524292, mean loss: 0.34685596408779135
Epoch: 31, step: 1213, loss: 0.31926408410072327, mean loss: 0.346855363977304
Epoch: 31, step: 1214, loss: 0.33520933985710144, mean loss: 0.3468551106872342
Epoch: 31, step: 1215, loss: 0.32274073362350464, mean loss: 0.34685458623362253
Epoch: 31, step: 1216, loss: 0.32515063881874084, mean loss: 0.346854114213714
Epoch: 31, step: 1217, loss: 0.3500387668609619, mean loss: 0.3468541834723945
Epoch: 31, step: 1218, loss: 0.3599395751953125, mean loss: 0.3468544680425992
Epoch: 31, step: 1219, loss: 0.33409929275512695, mean loss: 0.34685419065969886
Epoch: 31, step: 1220, loss: 0.30018752813339233, mean loss: 0.3468531758361145
Epoch: 31, step: 1221, loss: 0.31778186559677124, mean loss: 0.3468525436587075
Epoch: 31, step: 1222, loss: 0.33501288294792175, mean loss: 0.3468522862020195
Epoch: 31, step: 1223, loss: 0.3154291808605194, mean loss: 0.3468516029127845
Epoch: 31, step: 1224, loss: 0.33288508653640747, mean loss: 0.34685129922024116
Epoch: 31, step: 1225, loss: 0.3320106863975525, mean loss: 0.3468509765280728
Epoch: 31, step: 1226, loss: 0.3501015305519104, mean loss: 0.34685104720611903
Epoch: 31, step: 1227, loss: 0.36162737011909485, mean loss: 0.346851368486405
Epoch: 31, step: 1228, loss: 0.31364545226097107, mean loss: 0.3468506465087948
Epoch: 31, step: 1229, loss: 0.3569260835647583, mean loss: 0.34685086556860817
Epoch: 31, step: 1230, loss: 0.3448251783847809, mean loss: 0.34685082152714314
Epoch: 31, step: 1231, loss: 0.3405768871307373, mean loss: 0.34685068512540396
Epoch: 31, step: 1232, loss: 0.3082486391067505, mean loss: 0.3468498458957581
Epoch: 31, step: 1233, loss: 0.36244523525238037, mean loss: 0.34685018494070263
Epoch: 31, step: 1234, loss: 0.2986485958099365, mean loss: 0.34684913705728926
Epoch: 31, step: 1235, loss: 0.30885961651802063, mean loss: 0.3468483111981471
Epoch: 31, step: 1236, loss: 0.3578212857246399, mean loss: 0.34684854973588597
Epoch: 31, step: 1237, loss: 0.38206130266189575, mean loss: 0.3468493151972339
Epoch: 31, step: 1238, loss: 0.35261088609695435, mean loss: 0.3468494404406071
Epoch: 31, step: 1239, loss: 0.3088873326778412, mean loss: 0.34684861524915067
Epoch: 31, step: 1240, loss: 0.3386877775192261, mean loss: 0.34684843785891634
Epoch: 31, step: 1241, loss: 0.342171847820282, mean loss: 0.3468483362071744
Epoch: 31, step: 1242, loss: 0.3557843565940857, mean loss: 0.34684853043893016
Epoch: 31, step: 1243, loss: 0.30272844433784485, mean loss: 0.34684757147340023
Epoch: 31, step: 1244, loss: 0.3084688186645508, mean loss: 0.3468467373158917
Epoch: 31, step: 1245, loss: 0.3504234552383423, mean loss: 0.3468468150537296
Epoch: 31, step: 1246, loss: 0.3598780333995819, mean loss: 0.3468470982733585
Epoch: 31, step: 1247, loss: 0.3357433080673218, mean loss: 0.34684685694956896
Epoch: 31, step: 1248, loss: 0.3564140498638153, mean loss: 0.34684706487326256
Epoch: 31, step: 1249, loss: 0.3119971454143524, mean loss: 0.34684630749682366
Epoch: 31, step: 1250, loss: 0.3194761574268341, mean loss: 0.34684571268752085
Epoch: 31, step: 1251, loss: 0.34688329696655273, mean loss: 0.3468457135042863
Epoch: 31, step: 1252, loss: 0.35144343972206116, mean loss: 0.34684581341793164
Epoch: 31, step: 1253, loss: 0.29890912771224976, mean loss: 0.34684477172368794
Epoch: 31, step: 1254, loss: 0.3339066803455353, mean loss: 0.3468444905769577
Epoch: 31, step: 1255, loss: 0.3361627161502838, mean loss: 0.34684425846538824
Epoch: 31, step: 1256, loss: 0.3384573757648468, mean loss: 0.3468440762250479
Epoch: 31, step: 1257, loss: 0.3348270058631897, mean loss: 0.34684381510926937
Epoch: 31, step: 1258, loss: 0.3254431188106537, mean loss: 0.34684335010924117
Epoch: 31, step: 1259, loss: 0.3308047354221344, mean loss: 0.34684300162552206
Epoch: 31, step: 1260, loss: 0.36802801489830017, mean loss: 0.3468434619191293
Epoch: 31, step: 1261, loss: 0.36953961849212646, mean loss: 0.34684395503511967
Epoch: 31, step: 1262, loss: 0.3233166038990021, mean loss: 0.34684344387099564
Epoch: 31, step: 1263, loss: 0.29440951347351074, mean loss: 0.3468423046963542
Epoch: 31, step: 1264, loss: 0.33534085750579834, mean loss: 0.34684205482242275
Epoch: 31, step: 1265, loss: 0.31171566247940063, mean loss: 0.3468412917028846
Epoch: 31, step: 1266, loss: 0.3320066034793854, mean loss: 0.34684096942684833
Epoch: 31, step: 1267, loss: 0.3612118661403656, mean loss: 0.3468412816204683
Epoch: 31, step: 1268, loss: 0.3055865168571472, mean loss: 0.34684038542068196
Epoch: 31, step: 1269, loss: 0.31533196568489075, mean loss: 0.3468397009609406
Epoch: 31, step: 1270, loss: 0.38338327407836914, mean loss: 0.3468404947824485
Epoch: 31, step: 1271, loss: 0.3222973644733429, mean loss: 0.3468399616533689
Epoch: 31, step: 1272, loss: 0.31994763016700745, mean loss: 0.34683937750732363
Epoch: 31, step: 1273, loss: 0.3396982252597809, mean loss: 0.3468392223930214
Epoch: 31, step: 1274, loss: 0.3362445831298828, mean loss: 0.34683899226988096
Epoch: 31, step: 1275, loss: 0.3570486605167389, mean loss: 0.346839214026359
Epoch: 31, step: 1276, loss: 0.31047409772872925, mean loss: 0.34683842418434213
Epoch: 31, step: 1277, loss: 0.312623530626297, mean loss: 0.34683768106081236
Epoch: 31, step: 1278, loss: 0.33070024847984314, mean loss: 0.34683733057468896
Epoch: 31, step: 1279, loss: 0.3953147530555725, mean loss: 0.3468383834246256
Epoch: 31, step: 1280, loss: 0.31690600514411926, mean loss: 0.34683773335668594
Epoch: 31, step: 1281, loss: 0.3419385254383087, mean loss: 0.34683762695856407
Epoch: 31, step: 1282, loss: 0.33183708786964417, mean loss: 0.3468373011927359
Epoch: 31, step: 1283, loss: 0.2903613746166229, mean loss: 0.3468360747349837
Epoch: 31, step: 1284, loss: 0.3127109408378601, mean loss: 0.3468353336736382
Epoch: 31, step: 1285, loss: 0.2810189723968506, mean loss: 0.3468339044366941
Epoch: 31, step: 1286, loss: 0.33758458495140076, mean loss: 0.3468337035872123
Epoch: 31, step: 1287, loss: 0.34271296858787537, mean loss: 0.34683361410716806
Epoch: 31, step: 1288, loss: 0.2988176941871643, mean loss: 0.34683257148410507
Epoch: 31, step: 1289, loss: 0.3339266777038574, mean loss: 0.34683229125016707
Epoch: 31, step: 1290, loss: 0.33182457089424133, mean loss: 0.3468319653849981
Epoch: 31, step: 1291, loss: 0.3281109631061554, mean loss: 0.3468315589015371
Epoch: 31, step: 1292, loss: 0.3955115079879761, mean loss: 0.34683261585160086
Epoch: 31, step: 1293, loss: 0.34430423378944397, mean loss: 0.34683256095598963
Epoch: 31, step: 1294, loss: 0.3547615110874176, mean loss: 0.34683273310367263
Epoch: 31, step: 1295, loss: 0.31356605887413025, mean loss: 0.3468320108571631
Epoch: 31, step: 1296, loss: 0.32864823937416077, mean loss: 0.34683161608129015
Epoch: 31, step: 1297, loss: 0.32528167963027954, mean loss: 0.34683114823498623
Epoch: 31, step: 1298, loss: 0.31495165824890137, mean loss: 0.34683045615045016
Epoch: 31, step: 1299, loss: 0.38441362977027893, mean loss: 0.3468312720408118
Epoch: 31, step: 1300, loss: 0.34625187516212463, mean loss: 0.3468312594630005
Epoch: 31, step: 1301, loss: 0.3287656605243683, mean loss: 0.3468308672952642
Epoch: 31, step: 1302, loss: 0.3271315097808838, mean loss: 0.3468304396712054
Epoch: 31, step: 1303, loss: 0.3199843764305115, mean loss: 0.34682985692258944
Epoch: 31, step: 1304, loss: 0.3329618275165558, mean loss: 0.34682955589523035
Epoch: 31, step: 1305, loss: 0.32203409075737, mean loss: 0.34682901768239904
Epoch: 31, step: 1306, loss: 0.34518519043922424, mean loss: 0.34682898200209594
Epoch: 31, step: 1307, loss: 0.3427370488643646, mean loss: 0.34682889318604415
Epoch: 31, step: 1308, loss: 0.3322592079639435, mean loss: 0.34682857695560065
Epoch: 31, step: 1309, loss: 0.3312602937221527, mean loss: 0.34682823905823484
Epoch: 31, step: 1310, loss: 0.3242062032222748, mean loss: 0.34682774807536265
Epoch: 31, step: 1311, loss: 0.40063923597335815, mean loss: 0.34682891596076715
Epoch: 31, step: 1312, loss: 0.29257631301879883, mean loss: 0.34682773852727666
Epoch: 31, step: 1313, loss: 0.3654088079929352, mean loss: 0.3468281417797934
Epoch: 31, step: 1314, loss: 0.3366192877292633, mean loss: 0.34682792022867354
Epoch: 31, step: 1315, loss: 0.3144195079803467, mean loss: 0.34682721692111607
Epoch: 31, step: 1316, loss: 0.3208800256252289, mean loss: 0.34682665384324673
Epoch: 31, step: 1317, loss: 0.31496870517730713, mean loss: 0.34682596251151926
Epoch: 31, step: 1318, loss: 0.3106759488582611, mean loss: 0.3468251780570859
Epoch: 31, step: 1319, loss: 0.3260332942008972, mean loss: 0.346824726883493
Epoch: 31, step: 1320, loss: 0.30771470069885254, mean loss: 0.3468238782336897
Epoch: 31, step: 1321, loss: 0.3298148810863495, mean loss: 0.3468235091628841
Epoch: 31, step: 1322, loss: 0.33200588822364807, mean loss: 0.34682318764877085
Epoch: 31, step: 1323, loss: 0.344387024641037, mean loss: 0.3468231347898269
Epoch: 31, step: 1324, loss: 0.33295127749443054, mean loss: 0.34682283381004225
Epoch: 31, step: 1325, loss: 0.29402151703834534, mean loss: 0.34682168819674714
Epoch: 31, step: 1326, loss: 0.3101627230644226, mean loss: 0.34682089283615325
Epoch: 31, step: 1327, loss: 0.3529057204723358, mean loss: 0.34682102485098526
Epoch: 31, step: 1328, loss: 0.36643555760383606, mean loss: 0.3468214503935352
Epoch: 31, step: 1329, loss: 0.28646525740623474, mean loss: 0.3468201409781452
Epoch: 31, step: 1330, loss: 0.3224831521511078, mean loss: 0.34681961300355296
Epoch: 31, step: 1331, loss: 0.30169814825057983, mean loss: 0.3468186341449806
Epoch: 31, step: 1332, loss: 0.3789639472961426, mean loss: 0.3468193314856568
Epoch: 31, step: 1333, loss: 0.3298185169696808, mean loss: 0.346818962688431
Epoch: 31, step: 1334, loss: 0.3234151005744934, mean loss: 0.3468184550014505
Epoch: 31, step: 1335, loss: 0.3314571678638458, mean loss: 0.34681812178480975
Epoch: 31, step: 1336, loss: 0.3227722644805908, mean loss: 0.34681760019401336
Epoch: 31, step: 1337, loss: 0.374863862991333, mean loss: 0.3468182085464232
Epoch: 31, step: 1338, loss: 0.33460181951522827, mean loss: 0.34681794356607415
Epoch: 31, step: 1339, loss: 0.34158244729042053, mean loss: 0.34681783000767846
Epoch: 31, step: 1340, loss: 0.3269321024417877, mean loss: 0.346817398693774
Epoch: 31, step: 1341, loss: 0.31041663885116577, mean loss: 0.3468166091921941
Epoch: 31, step: 1342, loss: 0.32018524408340454, mean loss: 0.3468160315930202
Epoch: 31, step: 1343, loss: 0.3379381000995636, mean loss: 0.34681583904657504
Epoch: 31, step: 1344, loss: 0.3144930601119995, mean loss: 0.346815138038552
Epoch: 31, step: 1345, loss: 0.3382658064365387, mean loss: 0.3468149526268929
Epoch: 31, step: 1346, loss: 0.3214113116264343, mean loss: 0.3468144017032304
Epoch: 31, step: 1347, loss: 0.3158521354198456, mean loss: 0.3468137302453391
Epoch: 31, step: 1348, loss: 0.35229867696762085, mean loss: 0.34681384919111846
Epoch: 31, step: 1349, loss: 0.35829439759254456, mean loss: 0.3468140981512694
Epoch: 31, step: 1350, loss: 0.318762868642807, mean loss: 0.3468134898626538
Epoch: 31, step: 1351, loss: 0.3598030209541321, mean loss: 0.3468137715334642
Epoch: 31, step: 1352, loss: 0.3073122501373291, mean loss: 0.3468129149833548
Epoch: 31, step: 1353, loss: 0.3326101303100586, mean loss: 0.3468126070171665
Epoch: 31, step: 1354, loss: 0.33717963099479675, mean loss: 0.3468123981449875
Epoch: 31, step: 1355, loss: 0.3199719786643982, mean loss: 0.346811816175788
Epoch: 31, step: 1356, loss: 0.3520348072052002, mean loss: 0.3468119294211866
Epoch: 31, step: 1357, loss: 0.34352973103523254, mean loss: 0.3468118582577855
Epoch: 31, step: 1358, loss: 0.3442237973213196, mean loss: 0.34681180214563023
Epoch: 31, step: 1359, loss: 0.3231769800186157, mean loss: 0.3468112897264531
Epoch: 31, step: 1360, loss: 0.39674195647239685, mean loss: 0.3468123722341332
Epoch: 31, step: 1361, loss: 0.30198290944099426, mean loss: 0.3468114003427315
Epoch: 31, step: 1362, loss: 0.311506986618042, mean loss: 0.34681063496857484
Epoch: 31, step: 1363, loss: 0.3266877233982086, mean loss: 0.3468101987278627
Epoch: 31, step: 1364, loss: 0.3335977792739868, mean loss: 0.3468099123045833
Epoch: 31, step: 1365, loss: 0.3065769076347351, mean loss: 0.34680904013886316
Epoch: 31, step: 1366, loss: 0.3468852937221527, mean loss: 0.34680904179184235
Epoch: 31, step: 1367, loss: 0.3777298033237457, mean loss: 0.3468097120589353
Epoch: 31, step: 1368, loss: 0.3396890163421631, mean loss: 0.34680955770747934
Epoch: 31, step: 1369, loss: 0.36567625403404236, mean loss: 0.34680996666175007
Epoch: 31, step: 1370, loss: 0.322268009185791, mean loss: 0.3468094347021212
Epoch: 31, step: 1371, loss: 0.29802894592285156, mean loss: 0.3468083773827008
Epoch: 31, step: 1372, loss: 0.28747642040252686, mean loss: 0.34680709138757804
Epoch: 31, step: 1373, loss: 0.36559394001960754, mean loss: 0.3468074985757663
Epoch: 31, step: 1374, loss: 0.37686726450920105, mean loss: 0.34680815008026217
Epoch: 31, step: 1375, loss: 0.31654518842697144, mean loss: 0.3468074941859914
Epoch: 31, step: 1376, loss: 0.3026042580604553, mean loss: 0.34680653618256435
Epoch: 31, step: 1377, loss: 0.36683550477027893, mean loss: 0.3468069702549623
Epoch: 31, step: 1378, loss: 0.3368363082408905, mean loss: 0.3468067541731728
Epoch: 31, step: 1379, loss: 0.33708974719047546, mean loss: 0.34680654359309776
Epoch: 31, step: 1380, loss: 0.3402916491031647, mean loss: 0.3468064024099904
Epoch: 31, step: 1381, loss: 0.3494473695755005, mean loss: 0.34680645964067486
Epoch: 31, step: 1382, loss: 0.37030288577079773, mean loss: 0.34680696880543377
Epoch: 31, step: 1383, loss: 0.30191928148269653, mean loss: 0.34680599611566776
Epoch: 31, step: 1384, loss: 0.3207032084465027, mean loss: 0.3468054304958782
Epoch: 31, step: 1385, loss: 0.3402380347251892, mean loss: 0.34680528819044437
Epoch: 31, step: 1386, loss: 0.33489614725112915, mean loss: 0.34680503014314445
Epoch: 31, step: 1387, loss: 0.30474916100502014, mean loss: 0.3468041188961966
Epoch: 31, step: 1388, loss: 0.34521350264549255, mean loss: 0.34680408443221267
Epoch: 31, step: 1389, loss: 0.37537533044815063, mean loss: 0.34680470347381287
Epoch: 31, step: 1390, loss: 0.32211461663246155, mean loss: 0.34680416853530477
Epoch: 31, step: 1391, loss: 0.293710321187973, mean loss: 0.34680301822229354
Epoch: 31, step: 1392, loss: 0.336988627910614, mean loss: 0.34680280559169985
Epoch: 31, step: 1393, loss: 0.34350666403770447, mean loss: 0.3468027341817264
Epoch: 31, step: 1394, loss: 0.432835191488266, mean loss: 0.3468045980101739
Epoch: 31, step: 1395, loss: 0.34161069989204407, mean loss: 0.34680448549071724
Epoch: 31, step: 1396, loss: 0.34073829650878906, mean loss: 0.3468043540769918
Epoch: 31, step: 1397, loss: 0.32916098833084106, mean loss: 0.34680397187159023
Epoch: 31, step: 1398, loss: 0.3669716417789459, mean loss: 0.3468044087511238
Epoch: 31, step: 1399, loss: 0.323610782623291, mean loss: 0.34680390633308966
Epoch: 31, step: 1400, loss: 0.3226169943809509, mean loss: 0.34680338240994546
Epoch: 31, step: 1401, loss: 0.334598183631897, mean loss: 0.34680311803359104
Epoch: 31, step: 1402, loss: 0.31403419375419617, mean loss: 0.3468024082425221
Epoch: 31, step: 1403, loss: 0.3187359571456909, mean loss: 0.3468018003225105
Epoch: 31, step: 1404, loss: 0.34197375178337097, mean loss: 0.3468016957491271
Epoch: 31, step: 1405, loss: 0.39942291378974915, mean loss: 0.3468028354766134
Epoch: 31, step: 1406, loss: 0.3309657573699951, mean loss: 0.3468024924674062
Epoch: 31, step: 1407, loss: 0.2990972697734833, mean loss: 0.3468014592606425
Epoch: 31, step: 1408, loss: 0.3235107660293579, mean loss: 0.3468009548382911
Epoch: 31, step: 1409, loss: 0.32328858971595764, mean loss: 0.34680044562606943
Epoch: 31, step: 1410, loss: 0.34755608439445496, mean loss: 0.34680046199074227
Epoch: 31, step: 1411, loss: 0.3389987349510193, mean loss: 0.3468002930344221
Epoch: 31, step: 1412, loss: 0.3796091675758362, mean loss: 0.3468010035369351
Epoch: 31, step: 1413, loss: 0.32167330384254456, mean loss: 0.3468004593882129
Epoch: 31, step: 1414, loss: 0.3249770700931549, mean loss: 0.346799986805669
Epoch: 31, step: 1415, loss: 0.3155548870563507, mean loss: 0.34679931021191085
Epoch: 31, step: 1416, loss: 0.32707369327545166, mean loss: 0.34679888307484286
Epoch: 31, step: 1417, loss: 0.33545976877212524, mean loss: 0.3467986375438069
Epoch: 31, step: 1418, loss: 0.34532630443573, mean loss: 0.34679860566339404
Epoch: 31, step: 1419, loss: 0.3365214169025421, mean loss: 0.34679838313635525
Epoch: 31, step: 1420, loss: 0.33930137753486633, mean loss: 0.34679822081080364
Epoch: 31, step: 1421, loss: 0.3281169533729553, mean loss: 0.3467978163317962
Epoch: 31, step: 1422, loss: 0.33426082134246826, mean loss: 0.3467975448918891
Epoch: 31, step: 1423, loss: 0.3091796338558197, mean loss: 0.3467967304398445
Epoch: 31, step: 1424, loss: 0.2986438572406769, mean loss: 0.3467956879216432
Epoch: 31, step: 1425, loss: 0.30999740958213806, mean loss: 0.3467948912496722
Epoch: 31, step: 1426, loss: 0.30443450808525085, mean loss: 0.3467939741796117
Epoch: 31, step: 1427, loss: 0.3480628728866577, mean loss: 0.3467940016497084
Epoch: 31, step: 1428, loss: 0.32793179154396057, mean loss: 0.3467935933148935
Epoch: 31, step: 1429, loss: 0.29736772179603577, mean loss: 0.34679252335187843
Epoch: 31, step: 1430, loss: 0.2952738106250763, mean loss: 0.3467914081075289
Epoch: 31, step: 1431, loss: 0.30809125304222107, mean loss: 0.3467905703693034
Epoch: 31, step: 1432, loss: 0.31386494636535645, mean loss: 0.3467898576471785
Epoch: 31, step: 1433, loss: 0.35640472173690796, mean loss: 0.3467900657701295
Epoch: 31, step: 1434, loss: 0.33929991722106934, mean loss: 0.34678990364219275
Epoch: 31, step: 1435, loss: 0.3339131772518158, mean loss: 0.3467896249251713
Epoch: 31, step: 1436, loss: 0.3388662338256836, mean loss: 0.34678945342691153
Epoch: 31, step: 1437, loss: 0.390397846698761, mean loss: 0.3467903972906679
Epoch: 31, step: 1438, loss: 0.2990005314350128, mean loss: 0.34678936294515234
Epoch: 31, step: 1439, loss: 0.34058916568756104, mean loss: 0.3467892287533668
Epoch: 31, step: 1440, loss: 0.3134208619594574, mean loss: 0.34678850657250343
Epoch: 31, step: 1441, loss: 0.31911009550094604, mean loss: 0.34678790755049177
Epoch: 31, step: 1442, loss: 0.3155289590358734, mean loss: 0.3467872310523743
Epoch: 31, step: 1443, loss: 0.3204663097858429, mean loss: 0.346786661434099
Valid: 31, mean loss: 0.1862523009379705
Epoch: 32, step: 0, loss: 0.3443656265735626, mean loss: 0.3467866090409535
Epoch: 32, step: 1, loss: 0.30839595198631287, mean loss: 0.34678577825417456
Epoch: 32, step: 2, loss: 0.34035778045654297, mean loss: 0.34678563915314237
Epoch: 32, step: 3, loss: 0.3459855318069458, mean loss: 0.3467856218392986
Epoch: 32, step: 4, loss: 0.33333316445350647, mean loss: 0.3467853307424777
Epoch: 32, step: 5, loss: 0.3559873104095459, mean loss: 0.34678552985918837
Epoch: 32, step: 6, loss: 0.3554061949253082, mean loss: 0.34678571639310735
Epoch: 32, step: 7, loss: 0.32165589928627014, mean loss: 0.34678517264598285
Epoch: 32, step: 8, loss: 0.3139618933200836, mean loss: 0.3467844624467201
Epoch: 32, step: 9, loss: 0.3077833354473114, mean loss: 0.34678361859525536
Epoch: 32, step: 10, loss: 0.35173630714416504, mean loss: 0.3467837257522373
Epoch: 32, step: 11, loss: 0.3340606391429901, mean loss: 0.34678345047991777
Epoch: 32, step: 12, loss: 0.3351611793041229, mean loss: 0.34678319902990207
Epoch: 32, step: 13, loss: 0.3356211483478546, mean loss: 0.34678295754206767
Epoch: 32, step: 14, loss: 0.33073222637176514, mean loss: 0.34678261029651525
Epoch: 32, step: 15, loss: 0.3271596431732178, mean loss: 0.3467821857774965
Epoch: 32, step: 16, loss: 0.28517135977745056, mean loss: 0.34678085293107136
Epoch: 32, step: 17, loss: 0.35310330986976624, mean loss: 0.346780989703817
Epoch: 32, step: 18, loss: 0.30999162793159485, mean loss: 0.34678019386238723
Epoch: 32, step: 19, loss: 0.3924008905887604, mean loss: 0.3467811807252566
Epoch: 32, step: 20, loss: 0.3540082275867462, mean loss: 0.3467813370567122
Epoch: 32, step: 21, loss: 0.3404778242111206, mean loss: 0.34678120070557994
Epoch: 32, step: 22, loss: 0.36847472190856934, mean loss: 0.3467816699474567
Epoch: 32, step: 23, loss: 0.3465135395526886, mean loss: 0.34678166414778555
Epoch: 32, step: 24, loss: 0.3363293409347534, mean loss: 0.3467814380685086
Epoch: 32, step: 25, loss: 0.3470282256603241, mean loss: 0.3467814434063031
Epoch: 32, step: 26, loss: 0.30932673811912537, mean loss: 0.3467806333121042
Epoch: 32, step: 27, loss: 0.3322412073612213, mean loss: 0.34678031885094945
Epoch: 32, step: 28, loss: 0.31240734457969666, mean loss: 0.3467795754425477
Epoch: 32, step: 29, loss: 0.33912697434425354, mean loss: 0.34677940993796064
Epoch: 32, step: 30, loss: 0.31658151745796204, mean loss: 0.34677875685522785
Epoch: 32, step: 31, loss: 0.3889008164405823, mean loss: 0.34677966779942304
Epoch: 32, step: 32, loss: 0.3383546769618988, mean loss: 0.34677948560200433
Epoch: 32, step: 33, loss: 0.35136282444000244, mean loss: 0.3467795847183669
Epoch: 32, step: 34, loss: 0.33453357219696045, mean loss: 0.3467793198996371
Epoch: 32, step: 35, loss: 0.35027065873146057, mean loss: 0.34677939539783864
Epoch: 32, step: 36, loss: 0.36336615681648254, mean loss: 0.34677975406929323
Epoch: 32, step: 37, loss: 0.3416857421398163, mean loss: 0.34677964391896826
Epoch: 32, step: 38, loss: 0.3510810434818268, mean loss: 0.3467797369282351
Epoch: 32, step: 39, loss: 0.3293999433517456, mean loss: 0.3467793611326639
Epoch: 32, step: 40, loss: 0.40911754965782166, mean loss: 0.3467807090145322
Epoch: 32, step: 41, loss: 0.29555177688598633, mean loss: 0.34677960136194563
Epoch: 32, step: 42, loss: 0.314547598361969, mean loss: 0.34677890446884063
Epoch: 32, step: 43, loss: 0.311807781457901, mean loss: 0.3467781483691474
Epoch: 32, step: 44, loss: 0.3125544488430023, mean loss: 0.3467774084452608
Epoch: 32, step: 45, loss: 0.3340972363948822, mean loss: 0.3467771343030882
Epoch: 32, step: 46, loss: 0.33156245946884155, mean loss: 0.3467768053727059
Epoch: 32, step: 47, loss: 0.3544296324253082, mean loss: 0.3467769708177736
Epoch: 32, step: 48, loss: 0.42823925614356995, mean loss: 0.34677873189794145
Epoch: 32, step: 49, loss: 0.35945162177085876, mean loss: 0.3467790058589833
Epoch: 32, step: 50, loss: 0.33196356892585754, mean loss: 0.3467786855875349
Epoch: 32, step: 51, loss: 0.33488762378692627, mean loss: 0.346778428539074
Epoch: 32, step: 52, loss: 0.3335523307323456, mean loss: 0.34677814263738993
Epoch: 32, step: 53, loss: 0.347506046295166, mean loss: 0.34677815837176496
Epoch: 32, step: 54, loss: 0.31024426221847534, mean loss: 0.3467773686716557
Epoch: 32, step: 55, loss: 0.3281317949295044, mean loss: 0.34677696564611227
Epoch: 32, step: 56, loss: 0.3609318137168884, mean loss: 0.3467772715976538
Epoch: 32, step: 57, loss: 0.30959150195121765, mean loss: 0.3467764678590629
Epoch: 32, step: 58, loss: 0.35219866037368774, mean loss: 0.3467765850525813
Epoch: 32, step: 59, loss: 0.3383210599422455, mean loss: 0.3467764023015415
Epoch: 32, step: 60, loss: 0.3061649799346924, mean loss: 0.34677552457731214
Epoch: 32, step: 61, loss: 0.30599039793014526, mean loss: 0.3467746431179076
Epoch: 32, step: 62, loss: 0.3027645945549011, mean loss: 0.34677369198115754
Epoch: 32, step: 63, loss: 0.3829677402973175, mean loss: 0.34677447418310076
Epoch: 32, step: 64, loss: 0.331242173910141, mean loss: 0.34677413851650746
Epoch: 32, step: 65, loss: 0.3391190469264984, mean loss: 0.3467739730868582
Epoch: 32, step: 66, loss: 0.36278608441352844, mean loss: 0.3467743191076324
Epoch: 32, step: 67, loss: 0.33792644739151, mean loss: 0.3467741279097822
Epoch: 32, step: 68, loss: 0.3320988416671753, mean loss: 0.3467738107914244
Epoch: 32, step: 69, loss: 0.29373809695243835, mean loss: 0.34677266476709667
Epoch: 32, step: 70, loss: 0.3286345601081848, mean loss: 0.3467722728376112
Epoch: 32, step: 71, loss: 0.31481581926345825, mean loss: 0.34677158233515715
Epoch: 32, step: 72, loss: 0.3433381915092468, mean loss: 0.34677150814940433
Epoch: 32, step: 73, loss: 0.3630841076374054, mean loss: 0.3467718606103932
Epoch: 32, step: 74, loss: 0.3266039192676544, mean loss: 0.34677142485771206
Epoch: 32, step: 75, loss: 0.33498719334602356, mean loss: 0.34677117025068777
Epoch: 32, step: 76, loss: 0.3326875567436218, mean loss: 0.34677086597039164
Epoch: 32, step: 77, loss: 0.33954688906669617, mean loss: 0.34677070989777997
Epoch: 32, step: 78, loss: 0.3208697736263275, mean loss: 0.3467701503251943
Epoch: 32, step: 79, loss: 0.406412273645401, mean loss: 0.34677143882595735
Epoch: 32, step: 80, loss: 0.3270571529865265, mean loss: 0.3467710129302621
Epoch: 32, step: 81, loss: 0.30589622259140015, mean loss: 0.34677012991470063
Epoch: 32, step: 82, loss: 0.3423544466495514, mean loss: 0.3467700345250295
Epoch: 32, step: 83, loss: 0.30453866720199585, mean loss: 0.34676912224283557
Epoch: 32, step: 84, loss: 0.31134429574012756, mean loss: 0.3467683570120987
Epoch: 32, step: 85, loss: 0.3253573179244995, mean loss: 0.3467678945107143
Epoch: 32, step: 86, loss: 0.32564878463745117, mean loss: 0.3467674383251679
Epoch: 32, step: 87, loss: 0.3280997574329376, mean loss: 0.34676703510067997
Epoch: 32, step: 88, loss: 0.31442156434059143, mean loss: 0.3467663364491311
Epoch: 32, step: 89, loss: 0.3272349238395691, mean loss: 0.34676591458614325
Epoch: 32, step: 90, loss: 0.33754608035087585, mean loss: 0.34676571544935336
Epoch: 32, step: 91, loss: 0.3346477448940277, mean loss: 0.3467654537221275
Epoch: 32, step: 92, loss: 0.32913950085639954, mean loss: 0.3467650730402229
Epoch: 32, step: 93, loss: 0.32165104150772095, mean loss: 0.346764530643965
Epoch: 32, step: 94, loss: 0.3361681401729584, mean loss: 0.3467643017950682
Epoch: 32, step: 95, loss: 0.34296566247940063, mean loss: 0.3467642197581099
Epoch: 32, step: 96, loss: 0.3830125331878662, mean loss: 0.3467650025745105
Epoch: 32, step: 97, loss: 0.34850406646728516, mean loss: 0.34676504013041887
Epoch: 32, step: 98, loss: 0.3706764578819275, mean loss: 0.34676555649765817
Epoch: 32, step: 99, loss: 0.37019219994544983, mean loss: 0.34676606238526825
Epoch: 32, step: 100, loss: 0.2899004817008972, mean loss: 0.34676483442567757
Epoch: 32, step: 101, loss: 0.30788883566856384, mean loss: 0.3467639949525885
Epoch: 32, step: 102, loss: 0.33310452103614807, mean loss: 0.3467637000016283
Epoch: 32, step: 103, loss: 0.3319185674190521, mean loss: 0.3467633794554938
Epoch: 32, step: 104, loss: 0.34140515327453613, mean loss: 0.34676326375955135
Epoch: 32, step: 105, loss: 0.3271428346633911, mean loss: 0.3467628401202825
Epoch: 32, step: 106, loss: 0.36426085233688354, mean loss: 0.34676321792471343
Epoch: 32, step: 107, loss: 0.3256419897079468, mean loss: 0.34676276190026795
Epoch: 32, step: 108, loss: 0.3219773471355438, mean loss: 0.3467622267746172
Epoch: 32, step: 109, loss: 0.2881571352481842, mean loss: 0.346760961497802
Epoch: 32, step: 110, loss: 0.3378557860851288, mean loss: 0.34676076924029614
Epoch: 32, step: 111, loss: 0.3528226613998413, mean loss: 0.3467609001101614
Epoch: 32, step: 112, loss: 0.31603309512138367, mean loss: 0.3467602367435461
Epoch: 32, step: 113, loss: 0.3229251801967621, mean loss: 0.34675972219200374
Epoch: 32, step: 114, loss: 0.3333243727684021, mean loss: 0.3467594321557491
Epoch: 32, step: 115, loss: 0.29600656032562256, mean loss: 0.34675833654932847
Epoch: 32, step: 116, loss: 0.3872886896133423, mean loss: 0.3467592114625085
Epoch: 32, step: 117, loss: 0.33223894238471985, mean loss: 0.3467588980257974
Epoch: 32, step: 118, loss: 0.30133286118507385, mean loss: 0.34675791747370377
Epoch: 32, step: 119, loss: 0.34540849924087524, mean loss: 0.34675788834621646
Epoch: 32, step: 120, loss: 0.31409287452697754, mean loss: 0.34675718327997673
Epoch: 32, step: 121, loss: 0.2987860143184662, mean loss: 0.34675614785651543
Epoch: 32, step: 122, loss: 0.3228650689125061, mean loss: 0.34675563219574956
Epoch: 32, step: 123, loss: 0.38179174065589905, mean loss: 0.3467563883925134
Epoch: 32, step: 124, loss: 0.3038666844367981, mean loss: 0.34675546270879
Epoch: 32, step: 125, loss: 0.3264417350292206, mean loss: 0.3467550242893209
Epoch: 32, step: 126, loss: 0.30937811732292175, mean loss: 0.3467542176225039
Epoch: 32, step: 127, loss: 0.3158562183380127, mean loss: 0.3467535507975884
Epoch: 32, step: 128, loss: 0.32810109853744507, mean loss: 0.34675314825853193
Epoch: 32, step: 129, loss: 0.38845327496528625, mean loss: 0.346754048170628
Epoch: 32, step: 130, loss: 0.3013332188129425, mean loss: 0.34675306798483724
Epoch: 32, step: 131, loss: 0.3288004696369171, mean loss: 0.3467526805744284
Epoch: 32, step: 132, loss: 0.36699098348617554, mean loss: 0.34675311730006897
Epoch: 32, step: 133, loss: 0.387066125869751, mean loss: 0.3467539872022866
Epoch: 32, step: 134, loss: 0.34118348360061646, mean loss: 0.34675386700066824
Epoch: 32, step: 135, loss: 0.3358042240142822, mean loss: 0.34675363073183113
Epoch: 32, step: 136, loss: 0.37326109409332275, mean loss: 0.34675420269133833
Epoch: 32, step: 137, loss: 0.36350780725479126, mean loss: 0.3467545641811015
Epoch: 32, step: 138, loss: 0.30822187662124634, mean loss: 0.34675373278559457
Epoch: 32, step: 139, loss: 0.3595215678215027, mean loss: 0.346754008263178
Epoch: 32, step: 140, loss: 0.35090523958206177, mean loss: 0.3467540978278141
Epoch: 32, step: 141, loss: 0.31943202018737793, mean loss: 0.34675350835472585
Epoch: 32, step: 142, loss: 0.3433470129966736, mean loss: 0.346753434861266
Epoch: 32, step: 143, loss: 0.3449500799179077, mean loss: 0.3467533959556105
Epoch: 32, step: 144, loss: 0.3178428113460541, mean loss: 0.34675277225089646
Epoch: 32, step: 145, loss: 0.335521936416626, mean loss: 0.3467525299668253
Epoch: 32, step: 146, loss: 0.32011863589286804, mean loss: 0.3467519554032599
Epoch: 32, step: 147, loss: 0.3535575270652771, mean loss: 0.3467521022142803
Epoch: 32, step: 148, loss: 0.3118499219417572, mean loss: 0.3467513493143888
Epoch: 32, step: 149, loss: 0.3316945433616638, mean loss: 0.3467510245202658
Epoch: 32, step: 150, loss: 0.3212621510028839, mean loss: 0.34675047470526726
Epoch: 32, step: 151, loss: 0.3243938684463501, mean loss: 0.34674999246613314
Epoch: 32, step: 152, loss: 0.3321433961391449, mean loss: 0.3467496774039833
Epoch: 32, step: 153, loss: 0.3709319829940796, mean loss: 0.3467501990015328
Epoch: 32, step: 154, loss: 0.33364617824554443, mean loss: 0.34674991636191166
Epoch: 32, step: 155, loss: 0.3088432252407074, mean loss: 0.34674909877302545
Epoch: 32, step: 156, loss: 0.33647841215133667, mean loss: 0.34674887725492726
Epoch: 32, step: 157, loss: 0.3262092173099518, mean loss: 0.3467484342652377
Epoch: 32, step: 158, loss: 0.3468843102455139, mean loss: 0.3467484371956835
Epoch: 32, step: 159, loss: 0.3161347806453705, mean loss: 0.34674777696326997
Epoch: 32, step: 160, loss: 0.3685302734375, mean loss: 0.3467482467274761
Epoch: 32, step: 161, loss: 0.40942811965942383, mean loss: 0.346749598460772
Epoch: 32, step: 162, loss: 0.3519241213798523, mean loss: 0.34674971005040606
Epoch: 32, step: 163, loss: 0.3138493001461029, mean loss: 0.34674900056170804
Epoch: 32, step: 164, loss: 0.33496877551078796, mean loss: 0.34674874652972715
Epoch: 32, step: 165, loss: 0.33018258213996887, mean loss: 0.34674838930015045
Epoch: 32, step: 166, loss: 0.34694868326187134, mean loss: 0.3467483936191577
Epoch: 32, step: 167, loss: 0.3225468695163727, mean loss: 0.3467478717646618
Epoch: 32, step: 168, loss: 0.33615681529045105, mean loss: 0.34674764339593434
Epoch: 32, step: 169, loss: 0.3670494854450226, mean loss: 0.3467480811431862
Epoch: 32, step: 170, loss: 0.3365316092967987, mean loss: 0.3467478608609066
Epoch: 32, step: 171, loss: 0.34582826495170593, mean loss: 0.34674784103348294
Epoch: 32, step: 172, loss: 0.32063835859298706, mean loss: 0.3467472780986079
Epoch: 32, step: 173, loss: 0.33543747663497925, mean loss: 0.34674703425829345
Epoch: 32, step: 174, loss: 0.3592992424964905, mean loss: 0.3467473048791726
Epoch: 32, step: 175, loss: 0.31057408452033997, mean loss: 0.34674652501498754
Epoch: 32, step: 176, loss: 0.32955342531204224, mean loss: 0.34674615435421996
Epoch: 32, step: 177, loss: 0.32057854533195496, mean loss: 0.34674559022691814
Epoch: 32, step: 178, loss: 0.3098888695240021, mean loss: 0.34674479567843036
Epoch: 32, step: 179, loss: 0.352561354637146, mean loss: 0.34674492106773275
Epoch: 32, step: 180, loss: 0.3188556730747223, mean loss: 0.3467443198638268
Epoch: 32, step: 181, loss: 0.3469162583351135, mean loss: 0.3467443235701961
Epoch: 32, step: 182, loss: 0.308729350566864, mean loss: 0.3467435041230403
Epoch: 32, step: 183, loss: 0.3289071321487427, mean loss: 0.3467431196521838
Epoch: 32, step: 184, loss: 0.30601179599761963, mean loss: 0.34674224168948137
Epoch: 32, step: 185, loss: 0.3174995183944702, mean loss: 0.34674161137686993
Epoch: 32, step: 186, loss: 0.3577246367931366, mean loss: 0.34674184810551345
Epoch: 32, step: 187, loss: 0.31230518221855164, mean loss: 0.34674110587200435
Epoch: 32, step: 188, loss: 0.3150435984134674, mean loss: 0.34674042269189664
Epoch: 32, step: 189, loss: 0.3196735382080078, mean loss: 0.346739839328724
Epoch: 32, step: 190, loss: 0.31623217463493347, mean loss: 0.34673918182178
Epoch: 32, step: 191, loss: 0.37296411395072937, mean loss: 0.3467397470142828
Epoch: 32, step: 192, loss: 0.3157639801502228, mean loss: 0.3467390794474876
Epoch: 32, step: 193, loss: 0.3018862307071686, mean loss: 0.34673811283292916
Epoch: 32, step: 194, loss: 0.3407595753669739, mean loss: 0.34673798399346906
Epoch: 32, step: 195, loss: 0.30299028754234314, mean loss: 0.3467370412364556
Epoch: 32, step: 196, loss: 0.3372146487236023, mean loss: 0.3467368360345913
Epoch: 32, step: 197, loss: 0.36035025119781494, mean loss: 0.3467371293892257
Epoch: 32, step: 198, loss: 0.36038464307785034, mean loss: 0.3467374234723099
Epoch: 32, step: 199, loss: 0.3231837749481201, mean loss: 0.34673691593808037
Epoch: 32, step: 200, loss: 0.3233430087566376, mean loss: 0.3467364118568207
Epoch: 32, step: 201, loss: 0.316466361284256, mean loss: 0.3467357596256082
Epoch: 32, step: 202, loss: 0.31363967061042786, mean loss: 0.34673504651688364
Epoch: 32, step: 203, loss: 0.34399425983428955, mean loss: 0.3467349874634776
Epoch: 32, step: 204, loss: 0.3048575818538666, mean loss: 0.34673408518597754
Epoch: 32, step: 205, loss: 0.3945366144180298, mean loss: 0.34673511510215005
Epoch: 32, step: 206, loss: 0.3441752791404724, mean loss: 0.34673505995110054
Epoch: 32, step: 207, loss: 0.33329299092292786, mean loss: 0.34673477035119904
Epoch: 32, step: 208, loss: 0.3285113275051117, mean loss: 0.3467343777484275
Epoch: 32, step: 209, loss: 0.33191144466400146, mean loss: 0.34673405841254307
Epoch: 32, step: 210, loss: 0.39819949865341187, mean loss: 0.3467351671275141
Epoch: 32, step: 211, loss: 0.30398622155189514, mean loss: 0.34673424621097865
Epoch: 32, step: 212, loss: 0.3311239778995514, mean loss: 0.34673390993497616
Epoch: 32, step: 213, loss: 0.32136908173561096, mean loss: 0.3467333635382634
Epoch: 32, step: 214, loss: 0.34134894609451294, mean loss: 0.3467332475522771
Epoch: 32, step: 215, loss: 0.3396163582801819, mean loss: 0.3467330942503369
Epoch: 32, step: 216, loss: 0.3144172430038452, mean loss: 0.34673239816307255
Epoch: 32, step: 217, loss: 0.3357941508293152, mean loss: 0.3467321625570041
Epoch: 32, step: 218, loss: 0.2857065498828888, mean loss: 0.34673084811470384
Epoch: 32, step: 219, loss: 0.33828404545783997, mean loss: 0.3467306661813305
Epoch: 32, step: 220, loss: 0.33135831356048584, mean loss: 0.34673033508756107
Epoch: 32, step: 221, loss: 0.3475172519683838, mean loss: 0.34673035203601854
Epoch: 32, step: 222, loss: 0.3287578523159027, mean loss: 0.34672996495627184
Epoch: 32, step: 223, loss: 0.305112361907959, mean loss: 0.34672906864331854
Epoch: 32, step: 224, loss: 0.3601050078868866, mean loss: 0.34672935671299404
Epoch: 32, step: 225, loss: 0.3515661060810089, mean loss: 0.3467294608769551
Epoch: 32, step: 226, loss: 0.3638994097709656, mean loss: 0.34672983064004104
Epoch: 32, step: 227, loss: 0.322331964969635, mean loss: 0.34672930523161505
Epoch: 32, step: 228, loss: 0.35196956992149353, mean loss: 0.3467294180783685
Epoch: 32, step: 229, loss: 0.33935195207595825, mean loss: 0.346729259211363
Epoch: 32, step: 230, loss: 0.3441992402076721, mean loss: 0.34672920473088314
Epoch: 32, step: 231, loss: 0.33767420053482056, mean loss: 0.34672900974801935
Epoch: 32, step: 232, loss: 0.33100253343582153, mean loss: 0.34672867111456374
Epoch: 32, step: 233, loss: 0.356046199798584, mean loss: 0.34672887174176936
Epoch: 32, step: 234, loss: 0.3264521360397339, mean loss: 0.3467284351477573
Epoch: 32, step: 235, loss: 0.30932122468948364, mean loss: 0.3467276297216429
Epoch: 32, step: 236, loss: 0.3630450963973999, mean loss: 0.34672798105045494
Epoch: 32, step: 237, loss: 0.410311222076416, mean loss: 0.3467293500217555
Epoch: 32, step: 238, loss: 0.3302885591983795, mean loss: 0.3467289960529131
Epoch: 32, step: 239, loss: 0.29893723130226135, mean loss: 0.346727967122394
Epoch: 32, step: 240, loss: 0.30463600158691406, mean loss: 0.3467270609249401
Epoch: 32, step: 241, loss: 0.3254855275154114, mean loss: 0.3467266036260508
Epoch: 32, step: 242, loss: 0.3561580181121826, mean loss: 0.346726806666125
Epoch: 32, step: 243, loss: 0.33002969622612, mean loss: 0.3467264472174373
Epoch: 32, step: 244, loss: 0.38749170303344727, mean loss: 0.3467273247766007
Epoch: 32, step: 245, loss: 0.38456135988235474, mean loss: 0.34672813921744766
Epoch: 32, step: 246, loss: 0.31002944707870483, mean loss: 0.34672734923376153
Epoch: 32, step: 247, loss: 0.3753942549228668, mean loss: 0.3467279663102573
Epoch: 32, step: 248, loss: 0.3429984450340271, mean loss: 0.3467278860312622
Epoch: 32, step: 249, loss: 0.3500646650791168, mean loss: 0.3467279578548243
Epoch: 32, step: 250, loss: 0.3391716778278351, mean loss: 0.34672779521077196
Epoch: 32, step: 251, loss: 0.31192922592163086, mean loss: 0.34672704621014155
Epoch: 32, step: 252, loss: 0.3499687612056732, mean loss: 0.3467271159829617
Epoch: 32, step: 253, loss: 0.3266567289829254, mean loss: 0.3467266840087247
Epoch: 32, step: 254, loss: 0.3355611264705658, mean loss: 0.34672644369799277
Epoch: 32, step: 255, loss: 0.3068002760410309, mean loss: 0.34672558440547263
Epoch: 32, step: 256, loss: 0.3217947483062744, mean loss: 0.34672504785460423
Epoch: 32, step: 257, loss: 0.36673739552497864, mean loss: 0.34672547854258406
Epoch: 32, step: 258, loss: 0.34355348348617554, mean loss: 0.3467254102791916
Epoch: 32, step: 259, loss: 0.3582550883293152, mean loss: 0.346725658400007
Epoch: 32, step: 260, loss: 0.31622034311294556, mean loss: 0.34672500193407735
Epoch: 32, step: 261, loss: 0.37427476048469543, mean loss: 0.3467255947844873
Epoch: 32, step: 262, loss: 0.33016449213027954, mean loss: 0.34672523840948666
Epoch: 32, step: 263, loss: 0.32872357964515686, mean loss: 0.34672485104378764
Epoch: 32, step: 264, loss: 0.32942453026771545, mean loss: 0.346724478777724
Epoch: 32, step: 265, loss: 0.326119065284729, mean loss: 0.34672403540264346
Epoch: 32, step: 266, loss: 0.32315269112586975, mean loss: 0.34672352821933466
Epoch: 32, step: 267, loss: 0.3405056595802307, mean loss: 0.34672339443267836
Epoch: 32, step: 268, loss: 0.34065112471580505, mean loss: 0.3467232637816097
Epoch: 32, step: 269, loss: 0.32763904333114624, mean loss: 0.34672285317400076
Epoch: 32, step: 270, loss: 0.32411494851112366, mean loss: 0.3467223667628331
Epoch: 32, step: 271, loss: 0.35392725467681885, mean loss: 0.34672252177333035
Epoch: 32, step: 272, loss: 0.3389156758785248, mean loss: 0.3467223538155434
Epoch: 32, step: 273, loss: 0.304986834526062, mean loss: 0.34672145592992554
Epoch: 32, step: 274, loss: 0.33858931064605713, mean loss: 0.3467212809811209
Epoch: 32, step: 275, loss: 0.3183945119380951, mean loss: 0.3467206715936103
Epoch: 32, step: 276, loss: 0.3234221637248993, mean loss: 0.34672017038875136
Epoch: 32, step: 277, loss: 0.3581833243370056, mean loss: 0.3467204169824344
Epoch: 32, step: 278, loss: 0.33749619126319885, mean loss: 0.3467202185565149
Epoch: 32, step: 279, loss: 0.31475865840911865, mean loss: 0.34671953103371017
Epoch: 32, step: 280, loss: 0.3127523958683014, mean loss: 0.34671880038484343
Epoch: 32, step: 281, loss: 0.37451332807540894, mean loss: 0.3467193982451938
Epoch: 32, step: 282, loss: 0.3597184419631958, mean loss: 0.3467196778486379
Epoch: 32, step: 283, loss: 0.36215659976005554, mean loss: 0.3467200098825773
Epoch: 32, step: 284, loss: 0.3496563732624054, mean loss: 0.3467200730396844
Epoch: 32, step: 285, loss: 0.3774057924747467, mean loss: 0.3467207330327896
Epoch: 32, step: 286, loss: 0.33759137988090515, mean loss: 0.34672053668150127
Epoch: 32, step: 287, loss: 0.3001670241355896, mean loss: 0.3467195354445659
Epoch: 32, step: 288, loss: 0.32538485527038574, mean loss: 0.346719076604637
Epoch: 32, step: 289, loss: 0.33323749899864197, mean loss: 0.3467187866657664
Epoch: 32, step: 290, loss: 0.3573530912399292, mean loss: 0.34671901536540667
Epoch: 32, step: 291, loss: 0.333629310131073, mean loss: 0.34671873386636937
Epoch: 32, step: 292, loss: 0.35936135053634644, mean loss: 0.346719005744752
Epoch: 32, step: 293, loss: 0.3750571310520172, mean loss: 0.3467196151405911
Epoch: 32, step: 294, loss: 0.35199931263923645, mean loss: 0.34671972867514794
Epoch: 32, step: 295, loss: 0.3334818184375763, mean loss: 0.34671944401339333
Epoch: 32, step: 296, loss: 0.3092304766178131, mean loss: 0.3467186378857211
Epoch: 32, step: 297, loss: 0.3249938488006592, mean loss: 0.3467181707462319
Epoch: 32, step: 298, loss: 0.3594752252101898, mean loss: 0.3467184450501961
Epoch: 32, step: 299, loss: 0.3558327853679657, mean loss: 0.3467186410237989
Epoch: 32, step: 300, loss: 0.3353255093097687, mean loss: 0.34671839605762644
Epoch: 32, step: 301, loss: 0.31821152567863464, mean loss: 0.34671778313846113
Epoch: 32, step: 302, loss: 0.32284533977508545, mean loss: 0.34671726987399976
Epoch: 32, step: 303, loss: 0.327791690826416, mean loss: 0.3467168629773054
Epoch: 32, step: 304, loss: 0.3367992639541626, mean loss: 0.3467166497552165
Epoch: 32, step: 305, loss: 0.345147043466568, mean loss: 0.34671661601040227
Epoch: 32, step: 306, loss: 0.29912278056144714, mean loss: 0.3467155928171216
Epoch: 32, step: 307, loss: 0.3475501537322998, mean loss: 0.3467156107584948
Epoch: 32, step: 308, loss: 0.34818318486213684, mean loss: 0.3467156423076941
Epoch: 32, step: 309, loss: 0.29628419876098633, mean loss: 0.3467145581801833
Epoch: 32, step: 310, loss: 0.3621637523174286, mean loss: 0.3467148902852186
Epoch: 32, step: 311, loss: 0.30254241824150085, mean loss: 0.3467139407479864
Epoch: 32, step: 312, loss: 0.31854408979415894, mean loss: 0.34671333521820513
Epoch: 32, step: 313, loss: 0.3614698648452759, mean loss: 0.34671365241285773
Epoch: 32, step: 314, loss: 0.33951643109321594, mean loss: 0.3467134977104241
Epoch: 32, step: 315, loss: 0.29946330189704895, mean loss: 0.3467124821013661
Epoch: 32, step: 316, loss: 0.33642444014549255, mean loss: 0.3467122609720388
Epoch: 32, step: 317, loss: 0.3532233238220215, mean loss: 0.3467124009166472
Epoch: 32, step: 318, loss: 0.3474567234516144, mean loss: 0.34671241691429444
Epoch: 32, step: 319, loss: 0.3932177424430847, mean loss: 0.34671341642696485
Epoch: 32, step: 320, loss: 0.371412068605423, mean loss: 0.3467139472497244
Epoch: 32, step: 321, loss: 0.33952853083610535, mean loss: 0.34671379282426956
Epoch: 32, step: 322, loss: 0.3243405222892761, mean loss: 0.3467133119992167
Epoch: 32, step: 323, loss: 0.3304402530193329, mean loss: 0.3467129622816249
Epoch: 32, step: 324, loss: 0.33996322751045227, mean loss: 0.346712817228979
Epoch: 32, step: 325, loss: 0.3261816203594208, mean loss: 0.3467123760204676
Epoch: 32, step: 326, loss: 0.3136712908744812, mean loss: 0.34671166599392533
Epoch: 32, step: 327, loss: 0.3465341329574585, mean loss: 0.3467116621789641
Epoch: 32, step: 328, loss: 0.32328173518180847, mean loss: 0.3467111587101759
Epoch: 32, step: 329, loss: 0.32962724566459656, mean loss: 0.34671079161418883
Epoch: 32, step: 330, loss: 0.3194865584373474, mean loss: 0.34671020663743435
Epoch: 32, step: 331, loss: 0.301521360874176, mean loss: 0.34670923566954087
Epoch: 32, step: 332, loss: 0.3693474233150482, mean loss: 0.3467097220834049
Epoch: 32, step: 333, loss: 0.3327496647834778, mean loss: 0.3467094221380373
Epoch: 32, step: 334, loss: 0.33675846457481384, mean loss: 0.3467092083366587
Epoch: 32, step: 335, loss: 0.30471208691596985, mean loss: 0.346708306026556
Epoch: 32, step: 336, loss: 0.28862252831459045, mean loss: 0.3467070580777385
Epoch: 32, step: 337, loss: 0.32352694869041443, mean loss: 0.3467065600734119
Epoch: 32, step: 338, loss: 0.3038932681083679, mean loss: 0.3467056402871321
Epoch: 32, step: 339, loss: 0.32361915707588196, mean loss: 0.3467051443155928
Epoch: 32, step: 340, loss: 0.38728490471839905, mean loss: 0.34670601607997875
Epoch: 32, step: 341, loss: 0.3368363082408905, mean loss: 0.34670580405617984
Epoch: 32, step: 342, loss: 0.32354894280433655, mean loss: 0.34670530660475557
Epoch: 32, step: 343, loss: 0.34196266531944275, mean loss: 0.3467052047263984
Epoch: 32, step: 344, loss: 0.2878243327140808, mean loss: 0.3467039399127019
Epoch: 32, step: 345, loss: 0.30564847588539124, mean loss: 0.3467030580236262
Epoch: 32, step: 346, loss: 0.32314229011535645, mean loss: 0.3467025519390401
Epoch: 32, step: 347, loss: 0.3387241065502167, mean loss: 0.34670238056595415
Epoch: 32, step: 348, loss: 0.37127310037612915, mean loss: 0.34670290832160444
Epoch: 32, step: 349, loss: 0.31314393877983093, mean loss: 0.3467021875223961
Epoch: 32, step: 350, loss: 0.33742162585258484, mean loss: 0.34670198819333686
Epoch: 32, step: 351, loss: 0.29559391736984253, mean loss: 0.34670089051140335
Epoch: 32, step: 352, loss: 0.33272403478622437, mean loss: 0.3467005903276503
Epoch: 32, step: 353, loss: 0.33189094066619873, mean loss: 0.34670027226464484
Epoch: 32, step: 354, loss: 0.34759989380836487, mean loss: 0.3467002915851685
Epoch: 32, step: 355, loss: 0.30362558364868164, mean loss: 0.3466993665205706
Epoch: 32, step: 356, loss: 0.31992006301879883, mean loss: 0.34669879142546695
Epoch: 32, step: 357, loss: 0.3348330557346344, mean loss: 0.34669853661002886
Epoch: 32, step: 358, loss: 0.30436909198760986, mean loss: 0.34669762760913503
Epoch: 32, step: 359, loss: 0.3147907853126526, mean loss: 0.3466969424424477
Epoch: 32, step: 360, loss: 0.30691859126091003, mean loss: 0.3466960882615295
Epoch: 32, step: 361, loss: 0.31513696908950806, mean loss: 0.3466954105909439
Epoch: 32, step: 362, loss: 0.3690313696861267, mean loss: 0.3466958902018411
Epoch: 32, step: 363, loss: 0.3289889395236969, mean loss: 0.3466955099959088
Epoch: 32, step: 364, loss: 0.36701226234436035, mean loss: 0.3466959462304728
Epoch: 32, step: 365, loss: 0.3309227526187897, mean loss: 0.34669560756096596
Epoch: 32, step: 366, loss: 0.3876846730709076, mean loss: 0.34669648762678473
Epoch: 32, step: 367, loss: 0.32015877962112427, mean loss: 0.3466959178546273
Epoch: 32, step: 368, loss: 0.34503719210624695, mean loss: 0.34669588224207715
Epoch: 32, step: 369, loss: 0.32600468397140503, mean loss: 0.34669543801522607
Epoch: 32, step: 370, loss: 0.3308141231536865, mean loss: 0.34669509706082896
Epoch: 32, step: 371, loss: 0.3280241787433624, mean loss: 0.34669469622531335
Epoch: 32, step: 372, loss: 0.3436148762702942, mean loss: 0.3466946301077986
Epoch: 32, step: 373, loss: 0.2980042099952698, mean loss: 0.3466935848452484
Epoch: 32, step: 374, loss: 0.36277544498443604, mean loss: 0.3466939300754856
Epoch: 32, step: 375, loss: 0.29412001371383667, mean loss: 0.34669280149235915
Epoch: 32, step: 376, loss: 0.35974130034446716, mean loss: 0.34669308159322537
Epoch: 32, step: 377, loss: 0.3332615792751312, mean loss: 0.34669279327694325
Epoch: 32, step: 378, loss: 0.3257780075073242, mean loss: 0.3466923443365571
Epoch: 32, step: 379, loss: 0.299509733915329, mean loss: 0.34669133157339016
Epoch: 32, step: 380, loss: 0.3297458589076996, mean loss: 0.3466909678507804
Epoch: 32, step: 381, loss: 0.2967376410961151, mean loss: 0.34668989566089514
Epoch: 32, step: 382, loss: 0.2956712543964386, mean loss: 0.34668880062878027
Epoch: 32, step: 383, loss: 0.3399553894996643, mean loss: 0.34668865611016914
Epoch: 32, step: 384, loss: 0.37785038352012634, mean loss: 0.3466893249172305
Epoch: 32, step: 385, loss: 0.3134872019290924, mean loss: 0.3466886123335719
Epoch: 32, step: 386, loss: 0.3353789150714874, mean loss: 0.3466883696101625
Epoch: 32, step: 387, loss: 0.35586702823638916, mean loss: 0.3466885665939943
Epoch: 32, step: 388, loss: 0.2815510332584381, mean loss: 0.34668716870285676
Epoch: 32, step: 389, loss: 0.34103530645370483, mean loss: 0.34668704741305356
Epoch: 32, step: 390, loss: 0.34464403986930847, mean loss: 0.34668700357074916
Epoch: 32, step: 391, loss: 0.3077152967453003, mean loss: 0.3466861672680276
Epoch: 32, step: 392, loss: 0.3340946137905121, mean loss: 0.3466858970688156
Epoch: 32, step: 393, loss: 0.33518368005752563, mean loss: 0.3466856502507174
Epoch: 32, step: 394, loss: 0.3616851270198822, mean loss: 0.34668597210718094
Epoch: 32, step: 395, loss: 0.31838127970695496, mean loss: 0.3466853647624809
Epoch: 32, step: 396, loss: 0.3155404031276703, mean loss: 0.34668469648736805
Epoch: 32, step: 397, loss: 0.3042180836200714, mean loss: 0.3466837853039825
Epoch: 32, step: 398, loss: 0.3111668527126312, mean loss: 0.34668302325251826
Epoch: 32, step: 399, loss: 0.3594379723072052, mean loss: 0.34668329691689037
Epoch: 32, step: 400, loss: 0.33944442868232727, mean loss: 0.34668314160636593
Epoch: 32, step: 401, loss: 0.32540056109428406, mean loss: 0.34668268499661453
Epoch: 32, step: 402, loss: 0.3242379128932953, mean loss: 0.34668220346281126
Epoch: 32, step: 403, loss: 0.34477588534355164, mean loss: 0.34668216256522866
Epoch: 32, step: 404, loss: 0.32128337025642395, mean loss: 0.34668161767877403
Epoch: 32, step: 405, loss: 0.3490433394908905, mean loss: 0.3466816683442782
Epoch: 32, step: 406, loss: 0.33660587668418884, mean loss: 0.34668145219514895
Epoch: 32, step: 407, loss: 0.3182416260242462, mean loss: 0.346680842107922
Epoch: 32, step: 408, loss: 0.31581759452819824, mean loss: 0.3466801800479958
Epoch: 32, step: 409, loss: 0.35817381739616394, mean loss: 0.3466804265973404
Epoch: 32, step: 410, loss: 0.3382793366909027, mean loss: 0.34668024638991624
Epoch: 32, step: 411, loss: 0.32190585136413574, mean loss: 0.3466797149786115
Epoch: 32, step: 412, loss: 0.3001866042613983, mean loss: 0.3466787177217805
Epoch: 32, step: 413, loss: 0.296286016702652, mean loss: 0.34667763684363245
Epoch: 32, step: 414, loss: 0.38095447421073914, mean loss: 0.3466783720352196
Epoch: 32, step: 415, loss: 0.34990179538726807, mean loss: 0.34667844117178775
Epoch: 32, step: 416, loss: 0.32009461522102356, mean loss: 0.34667787100930086
Epoch: 32, step: 417, loss: 0.3522516191005707, mean loss: 0.34667799055093196
Epoch: 32, step: 418, loss: 0.34700846672058105, mean loss: 0.3466779976385887
Epoch: 32, step: 419, loss: 0.3092026114463806, mean loss: 0.3466771939286678
Epoch: 32, step: 420, loss: 0.34163227677345276, mean loss: 0.3466770857359732
Epoch: 32, step: 421, loss: 0.32892224192619324, mean loss: 0.3466767049758658
Epoch: 32, step: 422, loss: 0.3150559365749359, mean loss: 0.3466760268697046
Epoch: 32, step: 423, loss: 0.3374038338661194, mean loss: 0.34667582803214664
Epoch: 32, step: 424, loss: 0.3265111446380615, mean loss: 0.34667539561983357
Epoch: 32, step: 425, loss: 0.3285817801952362, mean loss: 0.3466750076279087
Epoch: 32, step: 426, loss: 0.31621938943862915, mean loss: 0.3466743545643687
Epoch: 32, step: 427, loss: 0.35644274950027466, mean loss: 0.3466745640247627
Epoch: 32, step: 428, loss: 0.31598594784736633, mean loss: 0.3466739059932389
Epoch: 32, step: 429, loss: 0.3045552670955658, mean loss: 0.3466730028962172
Epoch: 32, step: 430, loss: 0.4228670001029968, mean loss: 0.34667463659327774
Epoch: 32, step: 431, loss: 0.32166898250579834, mean loss: 0.34667410045146624
Epoch: 32, step: 432, loss: 0.3520601689815521, mean loss: 0.34667421593073405
Epoch: 32, step: 433, loss: 0.3097776770591736, mean loss: 0.3466734248724846
Epoch: 32, step: 434, loss: 0.335215300321579, mean loss: 0.34667317921666163
Epoch: 32, step: 435, loss: 0.3176550567150116, mean loss: 0.34667255709757877
Epoch: 32, step: 436, loss: 0.30327939987182617, mean loss: 0.34667162681229147
Epoch: 32, step: 437, loss: 0.3380904495716095, mean loss: 0.3466714428484523
Epoch: 32, step: 438, loss: 0.2876860499382019, mean loss: 0.3466701783428483
Epoch: 32, step: 439, loss: 0.32217925786972046, mean loss: 0.3466696533274034
Epoch: 32, step: 440, loss: 0.3349746763706207, mean loss: 0.3466694026258459
Epoch: 32, step: 441, loss: 0.33440515398979187, mean loss: 0.3466691397266254
Epoch: 32, step: 442, loss: 0.3186400532722473, mean loss: 0.3466685389016387
Epoch: 32, step: 443, loss: 0.33827874064445496, mean loss: 0.34666835906372695
Epoch: 32, step: 444, loss: 0.33529865741729736, mean loss: 0.34666811535589154
Epoch: 32, step: 445, loss: 0.32425570487976074, mean loss: 0.3466676349595595
Epoch: 32, step: 446, loss: 0.31449759006500244, mean loss: 0.346666945429072
Epoch: 32, step: 447, loss: 0.327831894159317, mean loss: 0.3466665417285561
Epoch: 32, step: 448, loss: 0.34736016392707825, mean loss: 0.3466665565949684
Epoch: 32, step: 449, loss: 0.33237603306770325, mean loss: 0.34666625031258325
Epoch: 32, step: 450, loss: 0.3452085852622986, mean loss: 0.3466662190717712
Epoch: 32, step: 451, loss: 0.3475324213504791, mean loss: 0.3466662376359006
Epoch: 32, step: 452, loss: 0.37310677766799927, mean loss: 0.346666804287709
Epoch: 32, step: 453, loss: 0.3095008134841919, mean loss: 0.346666007793971
Epoch: 32, step: 454, loss: 0.38458773493766785, mean loss: 0.3466668204662626
Epoch: 32, step: 455, loss: 0.31258201599121094, mean loss: 0.3466660900358564
Epoch: 32, step: 456, loss: 0.36744001507759094, mean loss: 0.346666535207292
Epoch: 32, step: 457, loss: 0.3346891403198242, mean loss: 0.3466662785451635
Epoch: 32, step: 458, loss: 0.36021727323532104, mean loss: 0.34666656892154707
Epoch: 32, step: 459, loss: 0.3665253818035126, mean loss: 0.3466669944553793
Epoch: 32, step: 460, loss: 0.3410009741783142, mean loss: 0.3466668730467295
Epoch: 32, step: 461, loss: 0.3404887318611145, mean loss: 0.34666674066744546
Epoch: 32, step: 462, loss: 0.3497796058654785, mean loss: 0.3466668073655063
Epoch: 32, step: 463, loss: 0.3184153735637665, mean loss: 0.3466662020468184
Epoch: 32, step: 464, loss: 0.34007424116134644, mean loss: 0.3466660608096816
Epoch: 32, step: 465, loss: 0.3843367397785187, mean loss: 0.3466668679116863
Epoch: 32, step: 466, loss: 0.3467271327972412, mean loss: 0.3466668692028462
Epoch: 32, step: 467, loss: 0.33414220809936523, mean loss: 0.3466666008709175
Epoch: 32, step: 468, loss: 0.33211931586265564, mean loss: 0.34666628921239173
Epoch: 32, step: 469, loss: 0.3738119304180145, mean loss: 0.34666687076346947
Epoch: 32, step: 470, loss: 0.3474475145339966, mean loss: 0.3466668874871304
Epoch: 32, step: 471, loss: 0.36090222001075745, mean loss: 0.34666719244284
Epoch: 32, step: 472, loss: 0.3139801025390625, mean loss: 0.3466664922202676
Epoch: 32, step: 473, loss: 0.3316146433353424, mean loss: 0.3466661697865911
Epoch: 32, step: 474, loss: 0.3121488392353058, mean loss: 0.3466654303882973
Epoch: 32, step: 475, loss: 0.3225070834159851, mean loss: 0.3466649129016429
Epoch: 32, step: 476, loss: 0.283738374710083, mean loss: 0.3466635650053552
Epoch: 32, step: 477, loss: 0.34305858612060547, mean loss: 0.3466634877877978
Epoch: 32, step: 478, loss: 0.3096623420715332, mean loss: 0.34666269525142335
Epoch: 32, step: 479, loss: 0.3327009677886963, mean loss: 0.3466623962082546
Epoch: 32, step: 480, loss: 0.30366960167884827, mean loss: 0.3466614753747707
Epoch: 32, step: 481, loss: 0.3643452525138855, mean loss: 0.3466618541234779
Epoch: 32, step: 482, loss: 0.2999071776866913, mean loss: 0.34666085275969394
Epoch: 32, step: 483, loss: 0.3383326232433319, mean loss: 0.3466606743944597
Epoch: 32, step: 484, loss: 0.3479757010936737, mean loss: 0.34666070255771114
Epoch: 32, step: 485, loss: 0.3432212173938751, mean loss: 0.3466606288976014
Epoch: 32, step: 486, loss: 0.3240951597690582, mean loss: 0.3466601456452376
Epoch: 32, step: 487, loss: 0.38069388270378113, mean loss: 0.34666087448147753
Epoch: 32, step: 488, loss: 0.35320350527763367, mean loss: 0.34666101458963855
Epoch: 32, step: 489, loss: 0.37623143196105957, mean loss: 0.3466616478162729
Epoch: 32, step: 490, loss: 0.35411980748176575, mean loss: 0.34666180752332587
Epoch: 32, step: 491, loss: 0.32955271005630493, mean loss: 0.3466614411614957
Epoch: 32, step: 492, loss: 0.33523285388946533, mean loss: 0.3466611964432397
Epoch: 32, step: 493, loss: 0.34756284952163696, mean loss: 0.34666121574975933
Epoch: 32, step: 494, loss: 0.2864653170108795, mean loss: 0.34665992684115093
Epoch: 32, step: 495, loss: 0.351375550031662, mean loss: 0.34666002780944466
Epoch: 32, step: 496, loss: 0.3239116370677948, mean loss: 0.3466595407440182
Epoch: 32, step: 497, loss: 0.330997109413147, mean loss: 0.34665920540313416
Epoch: 32, step: 498, loss: 0.3870551586151123, mean loss: 0.3466600702831995
Epoch: 32, step: 499, loss: 0.32938525080680847, mean loss: 0.3466597004360753
Epoch: 32, step: 500, loss: 0.2963515818119049, mean loss: 0.3466586233820038
Epoch: 32, step: 501, loss: 0.32605934143066406, mean loss: 0.3466581823783226
Epoch: 32, step: 502, loss: 0.3190491199493408, mean loss: 0.3466575913170644
Epoch: 32, step: 503, loss: 0.3055427670478821, mean loss: 0.3466567111401448
Epoch: 32, step: 504, loss: 0.32897767424583435, mean loss: 0.3466563326793974
Epoch: 32, step: 505, loss: 0.32772940397262573, mean loss: 0.3466559275133078
Epoch: 32, step: 506, loss: 0.3860218822956085, mean loss: 0.3466567701967025
Epoch: 32, step: 507, loss: 0.3583533763885498, mean loss: 0.3466570205735796
Epoch: 32, step: 508, loss: 0.3221184015274048, mean loss: 0.34665649531256015
Epoch: 32, step: 509, loss: 0.355991005897522, mean loss: 0.346656695118001
Epoch: 32, step: 510, loss: 0.299133837223053, mean loss: 0.34665567791177027
Epoch: 32, step: 511, loss: 0.35280290246009827, mean loss: 0.3466558094876382
Epoch: 32, step: 512, loss: 0.3377324938774109, mean loss: 0.346655618496101
Epoch: 32, step: 513, loss: 0.3386059105396271, mean loss: 0.3466554462066451
Epoch: 32, step: 514, loss: 0.348891943693161, mean loss: 0.34665549407380875
Epoch: 32, step: 515, loss: 0.31283947825431824, mean loss: 0.3466547703340643
Epoch: 32, step: 516, loss: 0.32901903986930847, mean loss: 0.3466543928973502
Epoch: 32, step: 517, loss: 0.2751240134239197, mean loss: 0.3466528620498676
Epoch: 32, step: 518, loss: 0.3394700884819031, mean loss: 0.3466527083320264
Epoch: 32, step: 519, loss: 0.3295973241329193, mean loss: 0.3466523433392127
Epoch: 32, step: 520, loss: 0.3588002324104309, mean loss: 0.3466526033038828
Epoch: 32, step: 521, loss: 0.28877779841423035, mean loss: 0.346651364810305
Epoch: 32, step: 522, loss: 0.35388171672821045, mean loss: 0.34665151953312107
Epoch: 32, step: 523, loss: 0.3226265609264374, mean loss: 0.34665100543232064
Epoch: 32, step: 524, loss: 0.34694990515708923, mean loss: 0.34665101182822344
Epoch: 32, step: 525, loss: 0.3650694489479065, mean loss: 0.34665140594037136
Epoch: 32, step: 526, loss: 0.3554476499557495, mean loss: 0.3466515941557135
Epoch: 32, step: 527, loss: 0.32887768745422363, mean loss: 0.34665121385130787
Epoch: 32, step: 528, loss: 0.34016096591949463, mean loss: 0.34665107498385955
Epoch: 32, step: 529, loss: 0.3399161100387573, mean loss: 0.34665093088344995
Epoch: 32, step: 530, loss: 0.2907434403896332, mean loss: 0.3466497347198501
Epoch: 32, step: 531, loss: 0.3429303765296936, mean loss: 0.34664965514436463
Epoch: 32, step: 532, loss: 0.3178830146789551, mean loss: 0.34664903969667493
Epoch: 32, step: 533, loss: 0.3396288752555847, mean loss: 0.34664888950702877
Epoch: 32, step: 534, loss: 0.3247830271720886, mean loss: 0.3466484217180051
Epoch: 32, step: 535, loss: 0.3180605471134186, mean loss: 0.3466478101341739
Epoch: 32, step: 536, loss: 0.33341872692108154, mean loss: 0.34664752712886393
Epoch: 32, step: 537, loss: 0.35650503635406494, mean loss: 0.3466477380027189
Epoch: 32, step: 538, loss: 0.31719842553138733, mean loss: 0.3466471080304753
Epoch: 32, step: 539, loss: 0.3668464124202728, mean loss: 0.34664754011964255
Epoch: 32, step: 540, loss: 0.32539045810699463, mean loss: 0.34664708541297473
Epoch: 32, step: 541, loss: 0.3483233153820038, mean loss: 0.3466471212681612
Epoch: 32, step: 542, loss: 0.3556306064128876, mean loss: 0.346647313424161
Epoch: 32, step: 543, loss: 0.3470321595668793, mean loss: 0.3466473216558119
Epoch: 32, step: 544, loss: 0.3247597813606262, mean loss: 0.3466468535031737
Epoch: 32, step: 545, loss: 0.33242061734199524, mean loss: 0.3466465492246914
Epoch: 32, step: 546, loss: 0.3041499853134155, mean loss: 0.34664564030449224
Epoch: 32, step: 547, loss: 0.35356396436691284, mean loss: 0.3466457882710433
Epoch: 32, step: 548, loss: 0.3275197446346283, mean loss: 0.34664537921905886
Epoch: 32, step: 549, loss: 0.3085901141166687, mean loss: 0.34664456534196614
Epoch: 32, step: 550, loss: 0.37340351939201355, mean loss: 0.3466451376158396
Epoch: 32, step: 551, loss: 0.34033307433128357, mean loss: 0.3466450026273177
Epoch: 32, step: 552, loss: 0.36869364976882935, mean loss: 0.34664547414518815
Epoch: 32, step: 553, loss: 0.32383206486701965, mean loss: 0.34664498628305057
Epoch: 32, step: 554, loss: 0.35802513360977173, mean loss: 0.3466452296409901
Epoch: 32, step: 555, loss: 0.34025198221206665, mean loss: 0.3466450929279752
Epoch: 32, step: 556, loss: 0.3525781035423279, mean loss: 0.34664521979658663
Epoch: 32, step: 557, loss: 0.3712339997291565, mean loss: 0.3466457455798465
Epoch: 32, step: 558, loss: 0.3396218419075012, mean loss: 0.34664559539053197
Epoch: 32, step: 559, loss: 0.31602901220321655, mean loss: 0.34664494074241387
Epoch: 32, step: 560, loss: 0.32430627942085266, mean loss: 0.3466444631042065
Epoch: 32, step: 561, loss: 0.31276705861091614, mean loss: 0.3466437387637213
Epoch: 32, step: 562, loss: 0.3209439516067505, mean loss: 0.34664318928247956
Epoch: 32, step: 563, loss: 0.3541871905326843, mean loss: 0.3466433505755876
Epoch: 32, step: 564, loss: 0.30926311016082764, mean loss: 0.346642551391434
Epoch: 32, step: 565, loss: 0.3244267702102661, mean loss: 0.3466420764313882
Epoch: 32, step: 566, loss: 0.3271123170852661, mean loss: 0.3466416589058009
Epoch: 32, step: 567, loss: 0.3105775713920593, mean loss: 0.34664088791025804
Epoch: 32, step: 568, loss: 0.355647474527359, mean loss: 0.3466410804533159
Epoch: 32, step: 569, loss: 0.3503018617630005, mean loss: 0.34664115871192697
Epoch: 32, step: 570, loss: 0.342035710811615, mean loss: 0.34664106026074376
Epoch: 32, step: 571, loss: 0.3037290871143341, mean loss: 0.34664014294622586
Epoch: 32, step: 572, loss: 0.3223940134048462, mean loss: 0.34663962465611786
Epoch: 32, step: 573, loss: 0.3297756314277649, mean loss: 0.34663926417573593
Epoch: 32, step: 574, loss: 0.3579069972038269, mean loss: 0.3466395050267508
Epoch: 32, step: 575, loss: 0.33162108063697815, mean loss: 0.3466391840104976
Epoch: 32, step: 576, loss: 0.37450721859931946, mean loss: 0.34663977967223936
Epoch: 32, step: 577, loss: 0.3176622688770294, mean loss: 0.34663916030937875
Epoch: 32, step: 578, loss: 0.3309744596481323, mean loss: 0.3466388255005502
Epoch: 32, step: 579, loss: 0.34148821234703064, mean loss: 0.3466387154164869
Epoch: 32, step: 580, loss: 0.3201005458831787, mean loss: 0.3466381482282689
Epoch: 32, step: 581, loss: 0.3628740906715393, mean loss: 0.3466384952242604
Epoch: 32, step: 582, loss: 0.29088035225868225, mean loss: 0.3466373035817871
Epoch: 32, step: 583, loss: 0.30563053488731384, mean loss: 0.34663642721897525
Epoch: 32, step: 584, loss: 0.4255719482898712, mean loss: 0.34663811412772383
Epoch: 32, step: 585, loss: 0.34514620900154114, mean loss: 0.34663808224532167
Epoch: 32, step: 586, loss: 0.28994226455688477, mean loss: 0.3466368706667836
Epoch: 32, step: 587, loss: 0.31973448395729065, mean loss: 0.3466362957803252
Epoch: 32, step: 588, loss: 0.3163881301879883, mean loss: 0.34663564941056657
Epoch: 32, step: 589, loss: 0.3829709589481354, mean loss: 0.34663642583925025
Epoch: 32, step: 590, loss: 0.3319261372089386, mean loss: 0.3466361115101272
Epoch: 32, step: 591, loss: 0.3250017464160919, mean loss: 0.3466356492373688
Epoch: 32, step: 592, loss: 0.3763073980808258, mean loss: 0.34663628323554924
Epoch: 32, step: 593, loss: 0.35903164744377136, mean loss: 0.34663654808244054
Epoch: 32, step: 594, loss: 0.3509453237056732, mean loss: 0.3466366401443943
Epoch: 32, step: 595, loss: 0.3061933219432831, mean loss: 0.3466357760447832
Epoch: 32, step: 596, loss: 0.27856627106666565, mean loss: 0.3466343217235573
Epoch: 32, step: 597, loss: 0.3470990061759949, mean loss: 0.3466343316514395
Epoch: 32, step: 598, loss: 0.2829876244068146, mean loss: 0.3466329718824467
Epoch: 32, step: 599, loss: 0.3191796541213989, mean loss: 0.3466323853733508
Epoch: 32, step: 600, loss: 0.34524765610694885, mean loss: 0.34663235579080753
Epoch: 32, step: 601, loss: 0.3235614597797394, mean loss: 0.34663186292825654
Epoch: 32, step: 602, loss: 0.3021886944770813, mean loss: 0.3466309135110586
Epoch: 32, step: 603, loss: 0.3157922625541687, mean loss: 0.3466302547344424
Epoch: 32, step: 604, loss: 0.36661627888679504, mean loss: 0.346630681667648
Epoch: 32, step: 605, loss: 0.3264477550983429, mean loss: 0.3466302505375038
Epoch: 32, step: 606, loss: 0.3253505527973175, mean loss: 0.34662979598879634
Epoch: 32, step: 607, loss: 0.30301398038864136, mean loss: 0.3466288643454351
Epoch: 32, step: 608, loss: 0.3274647891521454, mean loss: 0.34662845500534084
Epoch: 32, step: 609, loss: 0.3226880729198456, mean loss: 0.3466279436553881
Epoch: 32, step: 610, loss: 0.35793182253837585, mean loss: 0.34662818509324206
Epoch: 32, step: 611, loss: 0.37332120537757874, mean loss: 0.3466287552132823
Epoch: 32, step: 612, loss: 0.314754456281662, mean loss: 0.3466280744439922
Epoch: 32, step: 613, loss: 0.3207341730594635, mean loss: 0.3466275214154717
Epoch: 32, step: 614, loss: 0.31816765666007996, mean loss: 0.34662691359741743
Epoch: 32, step: 615, loss: 0.3423914909362793, mean loss: 0.34662682314331994
Epoch: 32, step: 616, loss: 0.33362406492233276, mean loss: 0.34662654545494365
Epoch: 32, step: 617, loss: 0.32563063502311707, mean loss: 0.3466260970734797
Epoch: 32, step: 618, loss: 0.29172709584236145, mean loss: 0.3466249246942705
Epoch: 32, step: 619, loss: 0.32797926664352417, mean loss: 0.346624526520997
Epoch: 32, step: 620, loss: 0.328217476606369, mean loss: 0.3466241334515333
Epoch: 32, step: 621, loss: 0.3143516182899475, mean loss: 0.34662344430963365
Epoch: 32, step: 622, loss: 0.2932596504688263, mean loss: 0.3466223048124237
Epoch: 32, step: 623, loss: 0.31435826420783997, mean loss: 0.34662161588091095
Epoch: 32, step: 624, loss: 0.2950868010520935, mean loss: 0.3466205154855737
Epoch: 32, step: 625, loss: 0.298979789018631, mean loss: 0.3466194982603428
Epoch: 32, step: 626, loss: 0.33719754219055176, mean loss: 0.34661929708694533
Epoch: 32, step: 627, loss: 0.34655484557151794, mean loss: 0.3466192957108348
Epoch: 32, step: 628, loss: 0.29553890228271484, mean loss: 0.3466182051116626
Epoch: 32, step: 629, loss: 0.3217124342918396, mean loss: 0.3466176733688294
Epoch: 32, step: 630, loss: 0.3196602463722229, mean loss: 0.3466170978350436
Epoch: 32, step: 631, loss: 0.34812724590301514, mean loss: 0.3466171300756086
Epoch: 32, step: 632, loss: 0.35638362169265747, mean loss: 0.346617338578664
Epoch: 32, step: 633, loss: 0.3132033944129944, mean loss: 0.3466166252456687
Epoch: 32, step: 634, loss: 0.32298019528388977, mean loss: 0.3466161206573639
Epoch: 32, step: 635, loss: 0.32466989755630493, mean loss: 0.34661565216143914
Epoch: 32, step: 636, loss: 0.3283337652683258, mean loss: 0.34661526189808356
Epoch: 32, step: 637, loss: 0.3185312747955322, mean loss: 0.34661466240213723
Epoch: 32, step: 638, loss: 0.3183089792728424, mean loss: 0.34661405818664576
Epoch: 32, step: 639, loss: 0.3330264091491699, mean loss: 0.3466137681497384
Epoch: 32, step: 640, loss: 0.355881005525589, mean loss: 0.34661396596052146
Epoch: 32, step: 641, loss: 0.35039249062538147, mean loss: 0.3466140466120618
Epoch: 32, step: 642, loss: 0.32665929198265076, mean loss: 0.3466136206925589
Epoch: 32, step: 643, loss: 0.3392448127269745, mean loss: 0.34661346341415106
Epoch: 32, step: 644, loss: 0.33269748091697693, mean loss: 0.34661316640045936
Epoch: 32, step: 645, loss: 0.3024314045906067, mean loss: 0.34661222343375836
Epoch: 32, step: 646, loss: 0.34771668910980225, mean loss: 0.34661224700575016
Epoch: 32, step: 647, loss: 0.330579549074173, mean loss: 0.3466119048361682
Epoch: 32, step: 648, loss: 0.3695034384727478, mean loss: 0.3466123933764853
Epoch: 32, step: 649, loss: 0.3189961016178131, mean loss: 0.3466118040151861
Epoch: 32, step: 650, loss: 0.3277811110019684, mean loss: 0.3466114021565674
Epoch: 32, step: 651, loss: 0.3051590621471405, mean loss: 0.34661051755690864
Epoch: 32, step: 652, loss: 0.3219560980796814, mean loss: 0.34660999143882587
Epoch: 32, step: 653, loss: 0.30596277117729187, mean loss: 0.3466091240575732
Epoch: 32, step: 654, loss: 0.3537450432777405, mean loss: 0.3466092763294982
Epoch: 32, step: 655, loss: 0.329243004322052, mean loss: 0.3466089057620689
Epoch: 32, step: 656, loss: 0.35143131017684937, mean loss: 0.3466090086619817
Epoch: 32, step: 657, loss: 0.33333706855773926, mean loss: 0.3466087254728872
Epoch: 32, step: 658, loss: 0.3327323794364929, mean loss: 0.3466084293936409
Epoch: 32, step: 659, loss: 0.36651694774627686, mean loss: 0.34660885417213266
Epoch: 32, step: 660, loss: 0.2938471734523773, mean loss: 0.3466077284455176
Epoch: 32, step: 661, loss: 0.32890555262565613, mean loss: 0.34660735075881355
Epoch: 32, step: 662, loss: 0.34033966064453125, mean loss: 0.3466072170366802
Epoch: 32, step: 663, loss: 0.32988080382347107, mean loss: 0.346606860183693
Epoch: 32, step: 664, loss: 0.341378778219223, mean loss: 0.34660674864651886
Epoch: 32, step: 665, loss: 0.3441048264503479, mean loss: 0.34660669527104
Epoch: 32, step: 666, loss: 0.32793888449668884, mean loss: 0.34660629702441015
Epoch: 32, step: 667, loss: 0.32538318634033203, mean loss: 0.34660584427437424
Epoch: 32, step: 668, loss: 0.29623734951019287, mean loss: 0.3466047697923305
Epoch: 32, step: 669, loss: 0.33057817816734314, mean loss: 0.3466044279135894
Epoch: 32, step: 670, loss: 0.343722939491272, mean loss: 0.34660436644708154
Epoch: 32, step: 671, loss: 0.3553384244441986, mean loss: 0.34660455275377944
Epoch: 32, step: 672, loss: 0.3723509907722473, mean loss: 0.3466051019408279
Epoch: 32, step: 673, loss: 0.32687103748321533, mean loss: 0.3466046810103117
Epoch: 32, step: 674, loss: 0.2919393479824066, mean loss: 0.3466035150155369
Epoch: 32, step: 675, loss: 0.34789934754371643, mean loss: 0.3466035426546574
Epoch: 32, step: 676, loss: 0.3687845766544342, mean loss: 0.3466040157491226
Epoch: 32, step: 677, loss: 0.31466394662857056, mean loss: 0.3466033345208429
Epoch: 32, step: 678, loss: 0.2993929386138916, mean loss: 0.34660232762349596
Epoch: 32, step: 679, loss: 0.34529200196266174, mean loss: 0.3466022996776322
Epoch: 32, step: 680, loss: 0.3325926661491394, mean loss: 0.34660200089468673
Epoch: 32, step: 681, loss: 0.39818498492240906, mean loss: 0.34660310097965213
Epoch: 32, step: 682, loss: 0.3124772608280182, mean loss: 0.34660237321014087
Epoch: 32, step: 683, loss: 0.3480711281299591, mean loss: 0.3466024045322197
Epoch: 32, step: 684, loss: 0.31549742817878723, mean loss: 0.346601741214105
Epoch: 32, step: 685, loss: 0.3572641909122467, mean loss: 0.3466019685875365
Epoch: 32, step: 686, loss: 0.3195846378803253, mean loss: 0.3466013924636276
Epoch: 32, step: 687, loss: 0.31666794419288635, mean loss: 0.34660075416935365
Epoch: 32, step: 688, loss: 0.3122032880783081, mean loss: 0.3466000207009849
Epoch: 32, step: 689, loss: 0.3204896152019501, mean loss: 0.346599463952179
Epoch: 32, step: 690, loss: 0.34443044662475586, mean loss: 0.3465994177034887
Epoch: 32, step: 691, loss: 0.35939040780067444, mean loss: 0.3465996904324886
Epoch: 32, step: 692, loss: 0.35094982385635376, mean loss: 0.3465997831838889
Epoch: 32, step: 693, loss: 0.33485087752342224, mean loss: 0.3465995326848556
Epoch: 32, step: 694, loss: 0.31883901357650757, mean loss: 0.3465989408139922
Epoch: 32, step: 695, loss: 0.31758958101272583, mean loss: 0.346598322330285
Epoch: 32, step: 696, loss: 0.3345264792442322, mean loss: 0.34659806496234796
Epoch: 32, step: 697, loss: 0.40289148688316345, mean loss: 0.34659926509499456
Epoch: 32, step: 698, loss: 0.32395362854003906, mean loss: 0.3465987823176574
Epoch: 32, step: 699, loss: 0.31096765398979187, mean loss: 0.3465980227216753
Epoch: 32, step: 700, loss: 0.30457937717437744, mean loss: 0.34659712697361955
Epoch: 32, step: 701, loss: 0.3456279933452606, mean loss: 0.3465971063141945
Epoch: 32, step: 702, loss: 0.3096925616264343, mean loss: 0.3465963196214212
Epoch: 32, step: 703, loss: 0.34097835421562195, mean loss: 0.34659619986601947
Epoch: 32, step: 704, loss: 0.3325907588005066, mean loss: 0.3465959013252938
Epoch: 32, step: 705, loss: 0.3053540885448456, mean loss: 0.3465950222313606
Epoch: 32, step: 706, loss: 0.3756128251552582, mean loss: 0.3465956407500204
Epoch: 32, step: 707, loss: 0.33657774329185486, mean loss: 0.3465954272216408
Epoch: 32, step: 708, loss: 0.34680885076522827, mean loss: 0.3465954317706005
Epoch: 32, step: 709, loss: 0.32391440868377686, mean loss: 0.3465949483522304
Epoch: 32, step: 710, loss: 0.3517577350139618, mean loss: 0.34659505838839194
Epoch: 32, step: 711, loss: 0.305350661277771, mean loss: 0.3465941793517954
Epoch: 32, step: 712, loss: 0.3418976068496704, mean loss: 0.34659407925647556
Epoch: 32, step: 713, loss: 0.3291846811771393, mean loss: 0.34659370822800106
Epoch: 32, step: 714, loss: 0.3272579610347748, mean loss: 0.3465932961540247
Epoch: 32, step: 715, loss: 0.3311195969581604, mean loss: 0.34659296639315185
Epoch: 32, step: 716, loss: 0.30038565397262573, mean loss: 0.3465919816875062
Epoch: 32, step: 717, loss: 0.379751980304718, mean loss: 0.34659268833198087
Epoch: 32, step: 718, loss: 0.30080780386924744, mean loss: 0.34659171267011324
Epoch: 32, step: 719, loss: 0.34761160612106323, mean loss: 0.34659173440326724
Epoch: 32, step: 720, loss: 0.3518116772174835, mean loss: 0.3465918456339096
Epoch: 32, step: 721, loss: 0.3402346968650818, mean loss: 0.34659171017367585
Epoch: 32, step: 722, loss: 0.37862685322761536, mean loss: 0.3465923927745804
Epoch: 32, step: 723, loss: 0.3532751202583313, mean loss: 0.3465925351662851
Epoch: 32, step: 724, loss: 0.33503609895706177, mean loss: 0.3465922889336511
Epoch: 32, step: 725, loss: 0.332611620426178, mean loss: 0.3465919910543204
Epoch: 32, step: 726, loss: 0.31613782048225403, mean loss: 0.346591342195887
Epoch: 32, step: 727, loss: 0.3418172597885132, mean loss: 0.3465912404811604
Epoch: 32, step: 728, loss: 0.3400769829750061, mean loss: 0.3465911016939029
Epoch: 32, step: 729, loss: 0.3513849079608917, mean loss: 0.34659120382450637
Epoch: 32, step: 730, loss: 0.3258664906024933, mean loss: 0.3465907623001189
Epoch: 32, step: 731, loss: 0.365556925535202, mean loss: 0.3465911663513169
Epoch: 32, step: 732, loss: 0.30260738730430603, mean loss: 0.3465902293499951
Epoch: 32, step: 733, loss: 0.30321940779685974, mean loss: 0.34658930542639677
Epoch: 32, step: 734, loss: 0.30631616711616516, mean loss: 0.3465884475106626
Epoch: 32, step: 735, loss: 0.3260340988636017, mean loss: 0.3465880096624041
Epoch: 32, step: 736, loss: 0.3032485246658325, mean loss: 0.34658708646536507
Epoch: 32, step: 737, loss: 0.3168046474456787, mean loss: 0.34658645206756716
Epoch: 32, step: 738, loss: 0.369276762008667, mean loss: 0.3465869353851368
Epoch: 32, step: 739, loss: 0.3018641173839569, mean loss: 0.3465859827818736
Epoch: 32, step: 740, loss: 0.31019702553749084, mean loss: 0.3465852077077028
Epoch: 32, step: 741, loss: 0.34811636805534363, mean loss: 0.34658524032027677
Epoch: 32, step: 742, loss: 0.3024415075778961, mean loss: 0.3465843001117031
Epoch: 32, step: 743, loss: 0.3014640510082245, mean loss: 0.34658333912496975
Epoch: 32, step: 744, loss: 0.3483150899410248, mean loss: 0.34658337600761446
Epoch: 32, step: 745, loss: 0.33747148513793945, mean loss: 0.34658318194766496
Epoch: 32, step: 746, loss: 0.308805376291275, mean loss: 0.3465823773942488
Epoch: 32, step: 747, loss: 0.3275611996650696, mean loss: 0.34658197230911103
Epoch: 32, step: 748, loss: 0.34719207882881165, mean loss: 0.3465819853019879
Epoch: 32, step: 749, loss: 0.2993118166923523, mean loss: 0.346580978654162
Epoch: 32, step: 750, loss: 0.3091025650501251, mean loss: 0.3465801805448836
Epoch: 32, step: 751, loss: 0.34641194343566895, mean loss: 0.34658017696232163
Epoch: 32, step: 752, loss: 0.32070693373680115, mean loss: 0.3465796260106122
Epoch: 32, step: 753, loss: 0.2948248088359833, mean loss: 0.3465785239532643
Epoch: 32, step: 754, loss: 0.33536526560783386, mean loss: 0.34657828518533323
Epoch: 32, step: 755, loss: 0.3743743896484375, mean loss: 0.3465788770451506
Epoch: 32, step: 756, loss: 0.3138676881790161, mean loss: 0.3465781805437375
Epoch: 32, step: 757, loss: 0.302621454000473, mean loss: 0.34657724461718337
Epoch: 32, step: 758, loss: 0.3785202205181122, mean loss: 0.34657792473249627
Epoch: 32, step: 759, loss: 0.34118616580963135, mean loss: 0.346577809936062
Epoch: 32, step: 760, loss: 0.3206583559513092, mean loss: 0.3465772580943369
Epoch: 32, step: 761, loss: 0.28966379165649414, mean loss: 0.3465760463960947
Epoch: 32, step: 762, loss: 0.3761463463306427, mean loss: 0.34657667593985436
Epoch: 32, step: 763, loss: 0.3702284097671509, mean loss: 0.346577179468208
Epoch: 32, step: 764, loss: 0.3570045828819275, mean loss: 0.34657740145537963
Epoch: 32, step: 765, loss: 0.3296985626220703, mean loss: 0.3465770421323747
Epoch: 32, step: 766, loss: 0.33523228764533997, mean loss: 0.3465768006261589
Epoch: 32, step: 767, loss: 0.3305858373641968, mean loss: 0.3465764602190731
Epoch: 32, step: 768, loss: 0.2976287603378296, mean loss: 0.34657541826875954
Epoch: 32, step: 769, loss: 0.35004764795303345, mean loss: 0.34657549218058387
Epoch: 32, step: 770, loss: 0.3213913142681122, mean loss: 0.34657495610748923
Epoch: 32, step: 771, loss: 0.3483799397945404, mean loss: 0.3465749945277465
Epoch: 32, step: 772, loss: 0.3393647074699402, mean loss: 0.34657484105534153
Epoch: 32, step: 773, loss: 0.31645235419273376, mean loss: 0.3465741999058191
Epoch: 32, step: 774, loss: 0.32678917050361633, mean loss: 0.3465737787954302
Epoch: 32, step: 775, loss: 0.32530397176742554, mean loss: 0.3465733260922328
Epoch: 32, step: 776, loss: 0.35628700256347656, mean loss: 0.3465735328321811
Epoch: 32, step: 777, loss: 0.3254219889640808, mean loss: 0.34657308266524056
Epoch: 32, step: 778, loss: 0.35255080461502075, mean loss: 0.3465732098860027
Epoch: 32, step: 779, loss: 0.3352377116680145, mean loss: 0.34657296864359577
Epoch: 32, step: 780, loss: 0.3034825026988983, mean loss: 0.34657205161054666
Epoch: 32, step: 781, loss: 0.29265761375427246, mean loss: 0.3465709042507285
Epoch: 32, step: 782, loss: 0.3055236339569092, mean loss: 0.3465700307372835
Epoch: 32, step: 783, loss: 0.3267778158187866, mean loss: 0.3465696095546371
Epoch: 32, step: 784, loss: 0.35462018847465515, mean loss: 0.3465697808690652
Epoch: 32, step: 785, loss: 0.3534576892852783, mean loss: 0.34656992743901915
Epoch: 32, step: 786, loss: 0.3174229860305786, mean loss: 0.34656930722534945
Epoch: 32, step: 787, loss: 0.3319953978061676, mean loss: 0.34656899711577804
Epoch: 32, step: 788, loss: 0.3059379458427429, mean loss: 0.3465681325701417
Epoch: 32, step: 789, loss: 0.31733134388923645, mean loss: 0.3465675104843363
Epoch: 32, step: 790, loss: 0.33320581912994385, mean loss: 0.34656722618698205
Epoch: 32, step: 791, loss: 0.33366984128952026, mean loss: 0.34656695177453745
Epoch: 32, step: 792, loss: 0.3601773977279663, mean loss: 0.3465672413523327
Epoch: 32, step: 793, loss: 0.3310575485229492, mean loss: 0.3465669113729099
Epoch: 32, step: 794, loss: 0.35770148038864136, mean loss: 0.346567148263513
Epoch: 32, step: 795, loss: 0.33097630739212036, mean loss: 0.3465668165717235
Epoch: 32, step: 796, loss: 0.3228845000267029, mean loss: 0.34656631274624655
Epoch: 32, step: 797, loss: 0.31086358428001404, mean loss: 0.346565553210688
Epoch: 32, step: 798, loss: 0.32365256547927856, mean loss: 0.34656506577290785
Epoch: 32, step: 799, loss: 0.36855441331863403, mean loss: 0.34656553355174435
Epoch: 32, step: 800, loss: 0.36837297677993774, mean loss: 0.34656599745106637
Epoch: 32, step: 801, loss: 0.34424299001693726, mean loss: 0.34656594803589014
Epoch: 32, step: 802, loss: 0.3548012971878052, mean loss: 0.34656612321508545
Epoch: 32, step: 803, loss: 0.3433670401573181, mean loss: 0.3465660551668625
Epoch: 32, step: 804, loss: 0.34144389629364014, mean loss: 0.34656594621489445
Epoch: 32, step: 805, loss: 0.308067262172699, mean loss: 0.3465651273378782
Epoch: 32, step: 806, loss: 0.3377331495285034, mean loss: 0.3465649394834103
Epoch: 32, step: 807, loss: 0.3702045679092407, mean loss: 0.346565442283062
Epoch: 32, step: 808, loss: 0.3065095841884613, mean loss: 0.3465645903389121
Epoch: 32, step: 809, loss: 0.3816036581993103, mean loss: 0.34656533556558833
Epoch: 32, step: 810, loss: 0.3298848569393158, mean loss: 0.34656498080520154
Epoch: 32, step: 811, loss: 0.29121413826942444, mean loss: 0.346563803628627
Epoch: 32, step: 812, loss: 0.329109251499176, mean loss: 0.34656343242103615
Epoch: 32, step: 813, loss: 0.3667745590209961, mean loss: 0.34656386224381275
Epoch: 32, step: 814, loss: 0.30918997526168823, mean loss: 0.34656306744367277
Epoch: 32, step: 815, loss: 0.35122206807136536, mean loss: 0.34656316652075314
Epoch: 32, step: 816, loss: 0.30267542600631714, mean loss: 0.3465622332354684
Epoch: 32, step: 817, loss: 0.3084051012992859, mean loss: 0.3465614218304598
Epoch: 32, step: 818, loss: 0.37817564606666565, mean loss: 0.3465620940873385
Epoch: 32, step: 819, loss: 0.3267648220062256, mean loss: 0.3465616731195729
Epoch: 32, step: 820, loss: 0.31812354922294617, mean loss: 0.3465610684262157
Epoch: 32, step: 821, loss: 0.34953197836875916, mean loss: 0.34656113159674395
Epoch: 32, step: 822, loss: 0.35221603512763977, mean loss: 0.34656125183453457
Epoch: 32, step: 823, loss: 0.34376683831214905, mean loss: 0.3465611924193806
Epoch: 32, step: 824, loss: 0.30558788776397705, mean loss: 0.3465603212586072
Epoch: 32, step: 825, loss: 0.31479623913764954, mean loss: 0.3465596459156187
Epoch: 32, step: 826, loss: 0.32363027334213257, mean loss: 0.3465591584196567
Epoch: 32, step: 827, loss: 0.32842206954956055, mean loss: 0.3465587728195021
Epoch: 32, step: 828, loss: 0.2791616916656494, mean loss: 0.34655733996704224
Epoch: 32, step: 829, loss: 0.30906710028648376, mean loss: 0.3465565429467676
Epoch: 32, step: 830, loss: 0.3046944737434387, mean loss: 0.34655565300290814
Epoch: 32, step: 831, loss: 0.32582035660743713, mean loss: 0.3465552122015392
Epoch: 32, step: 832, loss: 0.33975014090538025, mean loss: 0.3465550675389832
Epoch: 32, step: 833, loss: 0.3070248067378998, mean loss: 0.3465542272205273
Epoch: 32, step: 834, loss: 0.36095839738845825, mean loss: 0.3465545334121003
Epoch: 32, step: 835, loss: 0.32531070709228516, mean loss: 0.34655408183854536
Epoch: 32, step: 836, loss: 0.33952751755714417, mean loss: 0.34655393248018035
Epoch: 32, step: 837, loss: 0.32490548491477966, mean loss: 0.3465534723252774
Epoch: 32, step: 838, loss: 0.3393230140209198, mean loss: 0.34655331863942485
Epoch: 32, step: 839, loss: 0.3311821520328522, mean loss: 0.3465529919269906
Epoch: 32, step: 840, loss: 0.3035951256752014, mean loss: 0.3465520788817345
Epoch: 32, step: 841, loss: 0.3383485972881317, mean loss: 0.34655190452505874
Epoch: 32, step: 842, loss: 0.3457581102848053, mean loss: 0.34655188765412637
Epoch: 32, step: 843, loss: 0.3324615955352783, mean loss: 0.34655158819199683
Epoch: 32, step: 844, loss: 0.3137005865573883, mean loss: 0.34655089002181355
Epoch: 32, step: 845, loss: 0.38094907999038696, mean loss: 0.34655162105828163
Epoch: 32, step: 846, loss: 0.3264530897140503, mean loss: 0.3465511939297864
Epoch: 32, step: 847, loss: 0.40545645356178284, mean loss: 0.3465524457416623
Epoch: 32, step: 848, loss: 0.34382662177085876, mean loss: 0.3465523878156583
Epoch: 32, step: 849, loss: 0.30160561203956604, mean loss: 0.34655143267995814
Epoch: 32, step: 850, loss: 0.33299458026885986, mean loss: 0.3465511445979247
Epoch: 32, step: 851, loss: 0.34395790100097656, mean loss: 0.3465510894928759
Epoch: 32, step: 852, loss: 0.29470109939575195, mean loss: 0.3465499877315428
Epoch: 32, step: 853, loss: 0.344269722700119, mean loss: 0.3465499392791814
Epoch: 32, step: 854, loss: 0.36887651681900024, mean loss: 0.3465504136768513
Epoch: 32, step: 855, loss: 0.4022088348865509, mean loss: 0.34655159628821475
Epoch: 32, step: 856, loss: 0.35400110483169556, mean loss: 0.3465517545694969
Epoch: 32, step: 857, loss: 0.34489479660987854, mean loss: 0.346551719364509
Epoch: 32, step: 858, loss: 0.33076587319374084, mean loss: 0.34655138397355206
Epoch: 32, step: 859, loss: 0.3410610854625702, mean loss: 0.34655126732745467
Epoch: 32, step: 860, loss: 0.3511905074119568, mean loss: 0.3465513658899923
Epoch: 32, step: 861, loss: 0.3563043773174286, mean loss: 0.3465515730922746
Epoch: 32, step: 862, loss: 0.3285309076309204, mean loss: 0.3465511902521934
Epoch: 32, step: 863, loss: 0.3147238492965698, mean loss: 0.34655051411051774
Epoch: 32, step: 864, loss: 0.30792200565338135, mean loss: 0.3465496935019214
Epoch: 32, step: 865, loss: 0.30895134806632996, mean loss: 0.34654889479466394
Epoch: 32, step: 866, loss: 0.3368111848831177, mean loss: 0.34654868793943483
Epoch: 32, step: 867, loss: 0.3853350877761841, mean loss: 0.3465495118497041
Epoch: 32, step: 868, loss: 0.2932218611240387, mean loss: 0.3465483790746606
Epoch: 32, step: 869, loss: 0.3049738109111786, mean loss: 0.3465474959749502
Epoch: 32, step: 870, loss: 0.3416060209274292, mean loss: 0.34654739101360765
Epoch: 32, step: 871, loss: 0.3057367205619812, mean loss: 0.34654652417693704
Epoch: 32, step: 872, loss: 0.32923680543899536, mean loss: 0.3465461565186728
Epoch: 32, step: 873, loss: 0.31320860981941223, mean loss: 0.346545448444532
Epoch: 32, step: 874, loss: 0.29419809579849243, mean loss: 0.3465443366344807
Epoch: 32, step: 875, loss: 0.3354094922542572, mean loss: 0.3465441001455592
Epoch: 32, step: 876, loss: 0.30952492356300354, mean loss: 0.3465433139253918
Epoch: 32, step: 877, loss: 0.35024288296699524, mean loss: 0.34654339249585947
Epoch: 32, step: 878, loss: 0.3464856743812561, mean loss: 0.3465433912700835
Epoch: 32, step: 879, loss: 0.41927438974380493, mean loss: 0.34654493584616386
Epoch: 32, step: 880, loss: 0.32252374291419983, mean loss: 0.3465444257229306
Epoch: 32, step: 881, loss: 0.3411538898944855, mean loss: 0.3465443112498826
Epoch: 32, step: 882, loss: 0.33294588327407837, mean loss: 0.346544022480734
Epoch: 32, step: 883, loss: 0.3539605438709259, mean loss: 0.3465441799707831
Epoch: 32, step: 884, loss: 0.3344234228134155, mean loss: 0.3465439225916151
Epoch: 32, step: 885, loss: 0.36439865827560425, mean loss: 0.3465443017213489
Epoch: 32, step: 886, loss: 0.3623636066913605, mean loss: 0.34654463762335486
Epoch: 32, step: 887, loss: 0.2907368242740631, mean loss: 0.3465434526434553
Epoch: 32, step: 888, loss: 0.35189029574394226, mean loss: 0.34654356617177134
Epoch: 32, step: 889, loss: 0.3308747410774231, mean loss: 0.3465432334861988
Epoch: 32, step: 890, loss: 0.33092185854911804, mean loss: 0.3465429018151456
Epoch: 32, step: 891, loss: 0.27955520153045654, mean loss: 0.3465414795709782
Epoch: 32, step: 892, loss: 0.3701936900615692, mean loss: 0.34654198173039075
Epoch: 32, step: 893, loss: 0.34506839513778687, mean loss: 0.34654195044537967
Epoch: 32, step: 894, loss: 0.316127747297287, mean loss: 0.34654130474970957
Epoch: 32, step: 895, loss: 0.33149513602256775, mean loss: 0.34654098532527156
Epoch: 32, step: 896, loss: 0.32623153924942017, mean loss: 0.346540554172611
Epoch: 32, step: 897, loss: 0.34156492352485657, mean loss: 0.34654044854635
Epoch: 32, step: 898, loss: 0.36610206961631775, mean loss: 0.346540863805676
Epoch: 32, step: 899, loss: 0.3567396402359009, mean loss: 0.346541080303435
Epoch: 32, step: 900, loss: 0.3274521827697754, mean loss: 0.3465406750964144
Epoch: 32, step: 901, loss: 0.31872501969337463, mean loss: 0.3465400846558412
Epoch: 32, step: 902, loss: 0.3087766170501709, mean loss: 0.34653928307091186
Epoch: 32, step: 903, loss: 0.3177364766597748, mean loss: 0.3465386717021224
Epoch: 32, step: 904, loss: 0.3147294223308563, mean loss: 0.3465379965328618
Epoch: 32, step: 905, loss: 0.30063432455062866, mean loss: 0.34653702222221144
Epoch: 32, step: 906, loss: 0.3361852467060089, mean loss: 0.34653680250926405
Epoch: 32, step: 907, loss: 0.38041457533836365, mean loss: 0.34653752153831635
Epoch: 32, step: 908, loss: 0.3381800353527069, mean loss: 0.3465373441610176
Epoch: 32, step: 909, loss: 0.36305034160614014, mean loss: 0.34653769462150924
Epoch: 32, step: 910, loss: 0.3784940540790558, mean loss: 0.3465383728268926
Epoch: 32, step: 911, loss: 0.296161413192749, mean loss: 0.34653730370635705
Epoch: 32, step: 912, loss: 0.33194616436958313, mean loss: 0.34653699405377464
Epoch: 32, step: 913, loss: 0.30513614416122437, mean loss: 0.34653611546521956
Epoch: 32, step: 914, loss: 0.33219078183174133, mean loss: 0.34653581104203696
Epoch: 32, step: 915, loss: 0.2914453148841858, mean loss: 0.3465346419881333
Epoch: 32, step: 916, loss: 0.3540647327899933, mean loss: 0.3465348017778585
Epoch: 32, step: 917, loss: 0.3368155360221863, mean loss: 0.3465345955378688
Epoch: 32, step: 918, loss: 0.32560309767723083, mean loss: 0.34653415138700283
Epoch: 32, step: 919, loss: 0.3432212471961975, mean loss: 0.3465340810911237
Epoch: 32, step: 920, loss: 0.33453646302223206, mean loss: 0.3465338265213669
Epoch: 32, step: 921, loss: 0.34740784764289856, mean loss: 0.34653384506626655
Epoch: 32, step: 922, loss: 0.34402531385421753, mean loss: 0.3465337918416116
Epoch: 32, step: 923, loss: 0.30954912304878235, mean loss: 0.3465330071376145
Epoch: 32, step: 924, loss: 0.33244413137435913, mean loss: 0.3465327082201731
Epoch: 32, step: 925, loss: 0.34607988595962524, mean loss: 0.3465326986130475
Epoch: 32, step: 926, loss: 0.3362271189689636, mean loss: 0.346532479973403
Epoch: 32, step: 927, loss: 0.3391081392765045, mean loss: 0.3465323224644778
Epoch: 32, step: 928, loss: 0.3507660925388336, mean loss: 0.34653241228288106
Epoch: 32, step: 929, loss: 0.3122027814388275, mean loss: 0.3465316840035556
Epoch: 32, step: 930, loss: 0.3352968692779541, mean loss: 0.3465314456698038
Epoch: 32, step: 931, loss: 0.3879806697368622, mean loss: 0.3465323249490585
Epoch: 32, step: 932, loss: 0.3067721724510193, mean loss: 0.34653148151865826
Epoch: 32, step: 933, loss: 0.3032340407371521, mean loss: 0.3465305630713972
Epoch: 32, step: 934, loss: 0.32495230436325073, mean loss: 0.34653010535214496
Epoch: 32, step: 935, loss: 0.343401700258255, mean loss: 0.3465300389936456
Epoch: 32, step: 936, loss: 0.34263381361961365, mean loss: 0.34652995635019723
Epoch: 32, step: 937, loss: 0.32678577303886414, mean loss: 0.3465295375621068
Epoch: 32, step: 938, loss: 0.32925543189048767, mean loss: 0.3465291711738812
Epoch: 32, step: 939, loss: 0.31850242614746094, mean loss: 0.34652857673201676
Epoch: 32, step: 940, loss: 0.3488367795944214, mean loss: 0.34652862568751663
Epoch: 32, step: 941, loss: 0.38855770230293274, mean loss: 0.346529517078325
Epoch: 32, step: 942, loss: 0.3294384777545929, mean loss: 0.3465291546037365
Epoch: 32, step: 943, loss: 0.3289966881275177, mean loss: 0.3465287827750447
Epoch: 32, step: 944, loss: 0.34482914209365845, mean loss: 0.3465287467298157
Epoch: 32, step: 945, loss: 0.2973671555519104, mean loss: 0.34652770415461154
Epoch: 32, step: 946, loss: 0.31889280676841736, mean loss: 0.3465271181107692
Epoch: 32, step: 947, loss: 0.3476904630661011, mean loss: 0.3465271427809057
Epoch: 32, step: 948, loss: 0.3863445222377777, mean loss: 0.3465279871386777
Epoch: 32, step: 949, loss: 0.3560926914215088, mean loss: 0.3465281899611953
Epoch: 32, step: 950, loss: 0.3380608856678009, mean loss: 0.34652801041319187
Epoch: 32, step: 951, loss: 0.3226338028907776, mean loss: 0.3465275037506066
Epoch: 32, step: 952, loss: 0.33670496940612793, mean loss: 0.34652729547397243
Epoch: 32, step: 953, loss: 0.3053591251373291, mean loss: 0.34652642256420746
Epoch: 32, step: 954, loss: 0.33585330843925476, mean loss: 0.3465261962615099
Epoch: 32, step: 955, loss: 0.33920931816101074, mean loss: 0.3465260411245813
Epoch: 32, step: 956, loss: 0.3010823428630829, mean loss: 0.3465250776199007
Epoch: 32, step: 957, loss: 0.3834078907966614, mean loss: 0.34652585959872395
Epoch: 32, step: 958, loss: 0.3194575011730194, mean loss: 0.3465252857153219
Epoch: 32, step: 959, loss: 0.300017386674881, mean loss: 0.3465242997099996
Epoch: 32, step: 960, loss: 0.37321680784225464, mean loss: 0.34652486560090534
Epoch: 32, step: 961, loss: 0.287547767162323, mean loss: 0.3465236152914197
Epoch: 32, step: 962, loss: 0.2999444603919983, mean loss: 0.34652262783821963
Epoch: 32, step: 963, loss: 0.41834908723831177, mean loss: 0.34652415048850793
Epoch: 32, step: 964, loss: 0.31934815645217896, mean loss: 0.3465235743963782
Epoch: 32, step: 965, loss: 0.35379689931869507, mean loss: 0.3465237285771753
Epoch: 32, step: 966, loss: 0.3501458168029785, mean loss: 0.3465238053569999
Epoch: 32, step: 967, loss: 0.33615362644195557, mean loss: 0.34652358553804713
Epoch: 32, step: 968, loss: 0.354933500289917, mean loss: 0.3465237638010726
Epoch: 32, step: 969, loss: 0.32569944858551025, mean loss: 0.34652332240221684
Epoch: 32, step: 970, loss: 0.34922587871551514, mean loss: 0.34652337968525193
Epoch: 32, step: 971, loss: 0.3575684726238251, mean loss: 0.34652361379065544
Epoch: 32, step: 972, loss: 0.33401578664779663, mean loss: 0.34652334868760243
Epoch: 32, step: 973, loss: 0.3233185112476349, mean loss: 0.3465228568721338
Epoch: 32, step: 974, loss: 0.2937394976615906, mean loss: 0.3465217381777055
Epoch: 32, step: 975, loss: 0.36675187945365906, mean loss: 0.3465221669277325
Epoch: 32, step: 976, loss: 0.35205429792404175, mean loss: 0.34652228417115727
Epoch: 32, step: 977, loss: 0.3755553066730499, mean loss: 0.34652289946006715
Epoch: 32, step: 978, loss: 0.37160590291023254, mean loss: 0.34652343102603766
Epoch: 32, step: 979, loss: 0.3471181392669678, mean loss: 0.3465234436289927
Epoch: 32, step: 980, loss: 0.3331288695335388, mean loss: 0.34652315977949183
Epoch: 32, step: 981, loss: 0.34418413043022156, mean loss: 0.34652311021328397
Epoch: 32, step: 982, loss: 0.32775506377220154, mean loss: 0.346522712509348
Epoch: 32, step: 983, loss: 0.2967369854450226, mean loss: 0.346521657548188
Epoch: 32, step: 984, loss: 0.35763096809387207, mean loss: 0.3465218929498481
Epoch: 32, step: 985, loss: 0.30507150292396545, mean loss: 0.3465210146519707
Epoch: 32, step: 986, loss: 0.33626416325569153, mean loss: 0.3465207973227749
Epoch: 32, step: 987, loss: 0.350326806306839, mean loss: 0.3465208779653926
Epoch: 32, step: 988, loss: 0.3037528097629547, mean loss: 0.34651997180465777
Epoch: 32, step: 989, loss: 0.33129820227622986, mean loss: 0.34651964929587503
Epoch: 32, step: 990, loss: 0.3454900085926056, mean loss: 0.3465196274809912
Epoch: 32, step: 991, loss: 0.329840749502182, mean loss: 0.34651927411493233
Epoch: 32, step: 992, loss: 0.2980078458786011, mean loss: 0.34651824635221046
Epoch: 32, step: 993, loss: 0.36807048320770264, mean loss: 0.3465187029480508
Epoch: 32, step: 994, loss: 0.33585333824157715, mean loss: 0.3465184770012952
Epoch: 32, step: 995, loss: 0.33283159136772156, mean loss: 0.34651818704947684
Epoch: 32, step: 996, loss: 0.31210678815841675, mean loss: 0.3465174580716378
Epoch: 32, step: 997, loss: 0.2972952127456665, mean loss: 0.34651641536000527
Epoch: 32, step: 998, loss: 0.316830575466156, mean loss: 0.34651578651598014
Epoch: 32, step: 999, loss: 0.3042467534542084, mean loss: 0.34651489113737777
Epoch: 32, step: 1000, loss: 0.33469337224960327, mean loss: 0.34651464072921645
Epoch: 32, step: 1001, loss: 0.37116214632987976, mean loss: 0.34651516281152106
Epoch: 32, step: 1002, loss: 0.34557393193244934, mean loss: 0.34651514287483515
Epoch: 32, step: 1003, loss: 0.35719016194343567, mean loss: 0.3465153689830083
Epoch: 32, step: 1004, loss: 0.3044664263725281, mean loss: 0.34651447836087856
Epoch: 32, step: 1005, loss: 0.3082953989505768, mean loss: 0.3465136688747217
Epoch: 32, step: 1006, loss: 0.301750510931015, mean loss: 0.346512720804025
Epoch: 32, step: 1007, loss: 0.32573455572128296, mean loss: 0.3465122807378381
Epoch: 32, step: 1008, loss: 0.31639364361763, mean loss: 0.3465116428608633
Epoch: 32, step: 1009, loss: 0.38165223598480225, mean loss: 0.34651238708114207
Epoch: 32, step: 1010, loss: 0.30897948145866394, mean loss: 0.34651159221243194
Epoch: 32, step: 1011, loss: 0.3203186094760895, mean loss: 0.34651103751139983
Epoch: 32, step: 1012, loss: 0.2954806983470917, mean loss: 0.3465099568409531
Epoch: 32, step: 1013, loss: 0.3549366593360901, mean loss: 0.3465101352896104
Epoch: 32, step: 1014, loss: 0.3019900619983673, mean loss: 0.3465091925271156
Epoch: 32, step: 1015, loss: 0.3254132866859436, mean loss: 0.3465087458071037
Epoch: 32, step: 1016, loss: 0.3110925257205963, mean loss: 0.3465079958606752
Epoch: 32, step: 1017, loss: 0.3188808262348175, mean loss: 0.34650741086153014
Epoch: 32, step: 1018, loss: 0.29127076268196106, mean loss: 0.3465062412626105
Epoch: 32, step: 1019, loss: 0.34893232583999634, mean loss: 0.346506292632234
Epoch: 32, step: 1020, loss: 0.35972100496292114, mean loss: 0.34650657243304134
Epoch: 32, step: 1021, loss: 0.3234294056892395, mean loss: 0.34650608382057585
Epoch: 32, step: 1022, loss: 0.33848756551742554, mean loss: 0.3465059140482165
Epoch: 32, step: 1023, loss: 0.3211022615432739, mean loss: 0.34650537619988264
Epoch: 32, step: 1024, loss: 0.33374354243278503, mean loss: 0.34650510601095186
Epoch: 32, step: 1025, loss: 0.35768556594848633, mean loss: 0.3465053427145962
Epoch: 32, step: 1026, loss: 0.31656989455223083, mean loss: 0.3465047089589455
Epoch: 32, step: 1027, loss: 0.3420048952102661, mean loss: 0.34650461369656615
Epoch: 32, step: 1028, loss: 0.3196851313114166, mean loss: 0.3465040459322631
Epoch: 32, step: 1029, loss: 0.3155677020549774, mean loss: 0.34650339102850175
Epoch: 32, step: 1030, loss: 0.2990647852420807, mean loss: 0.34650238680305695
Epoch: 32, step: 1031, loss: 0.3269825875759125, mean loss: 0.3465019735981622
Epoch: 32, step: 1032, loss: 0.37416139245033264, mean loss: 0.34650255909421124
Epoch: 32, step: 1033, loss: 0.3227037787437439, mean loss: 0.34650205533102696
Epoch: 32, step: 1034, loss: 0.3554419279098511, mean loss: 0.3465022445627137
Epoch: 32, step: 1035, loss: 0.3362188935279846, mean loss: 0.34650202689801485
Epoch: 32, step: 1036, loss: 0.3540864586830139, mean loss: 0.3465021874320774
Epoch: 32, step: 1037, loss: 0.3625509440898895, mean loss: 0.34650252711705937
Epoch: 32, step: 1038, loss: 0.2990845739841461, mean loss: 0.3465015234987739
Epoch: 32, step: 1039, loss: 0.32309791445732117, mean loss: 0.3465010281633302
Epoch: 32, step: 1040, loss: 0.37903615832328796, mean loss: 0.3465017167520868
Epoch: 32, step: 1041, loss: 0.34216734766960144, mean loss: 0.3465016250194078
Epoch: 32, step: 1042, loss: 0.31156569719314575, mean loss: 0.34650088565033993
Epoch: 32, step: 1043, loss: 0.3232825696468353, mean loss: 0.34650039427820745
Epoch: 32, step: 1044, loss: 0.36541232466697693, mean loss: 0.3465007945052912
Epoch: 32, step: 1045, loss: 0.30915263295173645, mean loss: 0.3465000041349193
Epoch: 32, step: 1046, loss: 0.32169365882873535, mean loss: 0.34649947918845214
Epoch: 32, step: 1047, loss: 0.366610586643219, mean loss: 0.3464999047663143
Epoch: 32, step: 1048, loss: 0.3562808930873871, mean loss: 0.3465001117406953
Epoch: 32, step: 1049, loss: 0.34019917249679565, mean loss: 0.34649997841005825
Epoch: 32, step: 1050, loss: 0.2906385660171509, mean loss: 0.3464987963830921
Epoch: 32, step: 1051, loss: 0.32443535327911377, mean loss: 0.34649832953072
Epoch: 32, step: 1052, loss: 0.36660653352737427, mean loss: 0.3464987550021234
Epoch: 32, step: 1053, loss: 0.3133560121059418, mean loss: 0.346498053746508
Epoch: 32, step: 1054, loss: 0.3910162150859833, mean loss: 0.34649899567066306
Epoch: 32, step: 1055, loss: 0.2922966778278351, mean loss: 0.34649784887145346
Epoch: 32, step: 1056, loss: 0.3166908025741577, mean loss: 0.3464972182346969
Epoch: 32, step: 1057, loss: 0.34612059593200684, mean loss: 0.3464972102665527
Epoch: 32, step: 1058, loss: 0.3357977271080017, mean loss: 0.3464969839039074
Epoch: 32, step: 1059, loss: 0.3526398539543152, mean loss: 0.3464971138622312
Epoch: 32, step: 1060, loss: 0.30296558141708374, mean loss: 0.34649619293027906
Epoch: 32, step: 1061, loss: 0.32505419850349426, mean loss: 0.3464957393234581
Epoch: 32, step: 1062, loss: 0.36252620816230774, mean loss: 0.3464960784419206
Epoch: 32, step: 1063, loss: 0.3376482129096985, mean loss: 0.3464958912726548
Epoch: 32, step: 1064, loss: 0.31608104705810547, mean loss: 0.34649524788543135
Epoch: 32, step: 1065, loss: 0.3362777531147003, mean loss: 0.34649503175193785
Epoch: 32, step: 1066, loss: 0.3089335858821869, mean loss: 0.3464942372210892
Epoch: 32, step: 1067, loss: 0.3602093756198883, mean loss: 0.3464945273289325
Epoch: 32, step: 1068, loss: 0.3345678150653839, mean loss: 0.34649427505589775
Epoch: 32, step: 1069, loss: 0.3079771399497986, mean loss: 0.3464934603612172
Epoch: 32, step: 1070, loss: 0.3497963845729828, mean loss: 0.3464935302214979
Epoch: 32, step: 1071, loss: 0.34590867161750793, mean loss: 0.3464935178513921
Epoch: 32, step: 1072, loss: 0.37207815051078796, mean loss: 0.3464940589700795
Epoch: 32, step: 1073, loss: 0.34841272234916687, mean loss: 0.3464940995492297
Epoch: 32, step: 1074, loss: 0.33434629440307617, mean loss: 0.3464938426322586
Epoch: 32, step: 1075, loss: 0.30180999636650085, mean loss: 0.3464928976223976
Epoch: 32, step: 1076, loss: 0.30161628127098083, mean loss: 0.3464919485557517
Epoch: 32, step: 1077, loss: 0.3066723048686981, mean loss: 0.3464911064535716
Epoch: 32, step: 1078, loss: 0.3056049942970276, mean loss: 0.3464902418160992
Epoch: 32, step: 1079, loss: 0.2856887876987457, mean loss: 0.3464889560468952
Epoch: 32, step: 1080, loss: 0.3305702209472656, mean loss: 0.3464886194202992
Epoch: 32, step: 1081, loss: 0.34227582812309265, mean loss: 0.3464885303361102
Epoch: 32, step: 1082, loss: 0.32150799036026, mean loss: 0.34648800210579206
Epoch: 32, step: 1083, loss: 0.31729528307914734, mean loss: 0.34648738481916797
Epoch: 32, step: 1084, loss: 0.34337881207466125, mean loss: 0.3464873190890865
Epoch: 32, step: 1085, loss: 0.3265461325645447, mean loss: 0.346486897446034
Epoch: 32, step: 1086, loss: 0.36279311776161194, mean loss: 0.346487242222867
Epoch: 32, step: 1087, loss: 0.37304532527923584, mean loss: 0.346487803752025
Epoch: 32, step: 1088, loss: 0.3538711667060852, mean loss: 0.34648795985839437
Epoch: 32, step: 1089, loss: 0.298597127199173, mean loss: 0.3464869473244044
Epoch: 32, step: 1090, loss: 0.34767934679985046, mean loss: 0.3464869725342286
Epoch: 32, step: 1091, loss: 0.3829139471054077, mean loss: 0.3464877426605409
Epoch: 32, step: 1092, loss: 0.2910241186618805, mean loss: 0.3464865700928574
Epoch: 32, step: 1093, loss: 0.3081241250038147, mean loss: 0.3464857590817989
Epoch: 32, step: 1094, loss: 0.34766504168510437, mean loss: 0.34648578401219665
Epoch: 32, step: 1095, loss: 0.31753239035606384, mean loss: 0.34648517194146994
Epoch: 32, step: 1096, loss: 0.3500082790851593, mean loss: 0.34648524641789197
Epoch: 32, step: 1097, loss: 0.33600714802742004, mean loss: 0.34648502492170985
Epoch: 32, step: 1098, loss: 0.30193406343460083, mean loss: 0.34648408318028706
Epoch: 32, step: 1099, loss: 0.35927996039390564, mean loss: 0.3464843536604852
Epoch: 32, step: 1100, loss: 0.35757261514663696, mean loss: 0.3464845880400216
Epoch: 32, step: 1101, loss: 0.3352035880088806, mean loss: 0.34648434959148994
Epoch: 32, step: 1102, loss: 0.34519264101982117, mean loss: 0.34648432228899007
Epoch: 32, step: 1103, loss: 0.30136680603027344, mean loss: 0.34648336867222773
Epoch: 32, step: 1104, loss: 0.3513818085193634, mean loss: 0.3464834722048688
Epoch: 32, step: 1105, loss: 0.3099577724933624, mean loss: 0.34648270021983874
Epoch: 32, step: 1106, loss: 0.3326837420463562, mean loss: 0.3464824085795941
Epoch: 32, step: 1107, loss: 0.33045539259910583, mean loss: 0.34648206985662555
Epoch: 32, step: 1108, loss: 0.31692132353782654, mean loss: 0.34648144511823725
Epoch: 32, step: 1109, loss: 0.3233121931552887, mean loss: 0.34648095546837965
Epoch: 32, step: 1110, loss: 0.340082585811615, mean loss: 0.34648082025060967
Epoch: 32, step: 1111, loss: 0.36139798164367676, mean loss: 0.34648113549070675
Epoch: 32, step: 1112, loss: 0.3611232340335846, mean loss: 0.3464814449114405
Epoch: 32, step: 1113, loss: 0.3453131318092346, mean loss: 0.346481420222858
Epoch: 32, step: 1114, loss: 0.33724814653396606, mean loss: 0.34648122511110074
Epoch: 32, step: 1115, loss: 0.3242512047290802, mean loss: 0.3464807553701578
Epoch: 32, step: 1116, loss: 0.3283909559249878, mean loss: 0.34648037312399943
Epoch: 32, step: 1117, loss: 0.33864569664001465, mean loss: 0.34648020757701714
Epoch: 32, step: 1118, loss: 0.3713952898979187, mean loss: 0.3464807340224356
Epoch: 32, step: 1119, loss: 0.29849350452423096, mean loss: 0.3464797200934824
Epoch: 32, step: 1120, loss: 0.33634647727012634, mean loss: 0.34647950599128663
Epoch: 32, step: 1121, loss: 0.36167412996292114, mean loss: 0.3464798270270773
Epoch: 32, step: 1122, loss: 0.31873753666877747, mean loss: 0.3464792408934575
Epoch: 32, step: 1123, loss: 0.34290462732315063, mean loss: 0.3464791653713251
Epoch: 32, step: 1124, loss: 0.32034051418304443, mean loss: 0.3464786131424111
Epoch: 32, step: 1125, loss: 0.307211309671402, mean loss: 0.3464777835631769
Epoch: 32, step: 1126, loss: 0.3044898509979248, mean loss: 0.34647689652541275
Epoch: 32, step: 1127, loss: 0.379587858915329, mean loss: 0.3464775960133794
Epoch: 32, step: 1128, loss: 0.31984713673591614, mean loss: 0.34647703344162206
Epoch: 32, step: 1129, loss: 0.37100785970687866, mean loss: 0.3464775516474243
Epoch: 32, step: 1130, loss: 0.34359443187713623, mean loss: 0.3464774907437345
Epoch: 32, step: 1131, loss: 0.307957261800766, mean loss: 0.34647667705068547
Epoch: 32, step: 1132, loss: 0.2915303409099579, mean loss: 0.3464755164005906
Epoch: 32, step: 1133, loss: 0.31367582082748413, mean loss: 0.34647482357613085
Epoch: 32, step: 1134, loss: 0.3479573726654053, mean loss: 0.34647485489119517
Epoch: 32, step: 1135, loss: 0.34937584400177, mean loss: 0.3464749161658891
Epoch: 32, step: 1136, loss: 0.3358542323112488, mean loss: 0.34647469184053575
Epoch: 32, step: 1137, loss: 0.2900571823120117, mean loss: 0.34647350024019935
Epoch: 32, step: 1138, loss: 0.3443901538848877, mean loss: 0.3464734562385444
Epoch: 32, step: 1139, loss: 0.31379908323287964, mean loss: 0.34647276614872
Epoch: 32, step: 1140, loss: 0.3493990898132324, mean loss: 0.3464728279520034
Epoch: 32, step: 1141, loss: 0.31488141417503357, mean loss: 0.3464721607626945
Epoch: 32, step: 1142, loss: 0.33038729429244995, mean loss: 0.3464718210683592
Epoch: 32, step: 1143, loss: 0.3625129759311676, mean loss: 0.3464721598324001
Epoch: 32, step: 1144, loss: 0.29361602663993835, mean loss: 0.34647104361730935
Epoch: 32, step: 1145, loss: 0.37257495522499084, mean loss: 0.34647159486771284
Epoch: 32, step: 1146, loss: 0.3241032063961029, mean loss: 0.3464711225123444
Epoch: 32, step: 1147, loss: 0.3466556668281555, mean loss: 0.34647112640930183
Epoch: 32, step: 1148, loss: 0.3016051948070526, mean loss: 0.34647017901120647
Epoch: 32, step: 1149, loss: 0.3136303126811981, mean loss: 0.346469485572583
Epoch: 32, step: 1150, loss: 0.37333157658576965, mean loss: 0.34647005277398113
Epoch: 32, step: 1151, loss: 0.3590421974658966, mean loss: 0.34647031823311736
Epoch: 32, step: 1152, loss: 0.39702215790748596, mean loss: 0.34647138560584334
Epoch: 32, step: 1153, loss: 0.30108383297920227, mean loss: 0.3464704272942723
Epoch: 32, step: 1154, loss: 0.34261244535446167, mean loss: 0.34647034583866476
Epoch: 32, step: 1155, loss: 0.3286735713481903, mean loss: 0.34646997009391156
Epoch: 32, step: 1156, loss: 0.3738994300365448, mean loss: 0.3464705492021126
Epoch: 32, step: 1157, loss: 0.3159657418727875, mean loss: 0.3464699051788189
Epoch: 32, step: 1158, loss: 0.3347313702106476, mean loss: 0.3464696573578683
Epoch: 32, step: 1159, loss: 0.33336034417152405, mean loss: 0.34646938060324095
Epoch: 32, step: 1160, loss: 0.3857842683792114, mean loss: 0.346470210574061
Epoch: 32, step: 1161, loss: 0.3137248456478119, mean loss: 0.34646951930606595
Epoch: 32, step: 1162, loss: 0.31760331988334656, mean loss: 0.3464689099416991
Epoch: 32, step: 1163, loss: 0.32634198665618896, mean loss: 0.34646848507208655
Epoch: 32, step: 1164, loss: 0.3267013728618622, mean loss: 0.34646806780672
Epoch: 32, step: 1165, loss: 0.31513381004333496, mean loss: 0.3464674063836237
Epoch: 32, step: 1166, loss: 0.36449819803237915, mean loss: 0.34646778698080893
Epoch: 32, step: 1167, loss: 0.2914818823337555, mean loss: 0.3464666263529668
Epoch: 32, step: 1168, loss: 0.3426365554332733, mean loss: 0.34646654551055556
Epoch: 32, step: 1169, loss: 0.31424885988235474, mean loss: 0.34646586549692837
Epoch: 32, step: 1170, loss: 0.33825647830963135, mean loss: 0.3464656922263404
Epoch: 32, step: 1171, loss: 0.3178819715976715, mean loss: 0.3464650889397083
Epoch: 32, step: 1172, loss: 0.32439368963241577, mean loss: 0.3464646231116484
Epoch: 32, step: 1173, loss: 0.32005980610847473, mean loss: 0.346464065836375
Epoch: 32, step: 1174, loss: 0.32551243901252747, mean loss: 0.3464636236603451
Epoch: 32, step: 1175, loss: 0.31564104557037354, mean loss: 0.3464629731754116
Epoch: 32, step: 1176, loss: 0.29545292258262634, mean loss: 0.3464618966733415
Epoch: 32, step: 1177, loss: 0.37458541989326477, mean loss: 0.3464624901719111
Epoch: 32, step: 1178, loss: 0.3267110586166382, mean loss: 0.34646207336072754
Epoch: 32, step: 1179, loss: 0.3070429563522339, mean loss: 0.34646124152319463
Epoch: 32, step: 1180, loss: 0.33548200130462646, mean loss: 0.346461009839888
Epoch: 32, step: 1181, loss: 0.33364686369895935, mean loss: 0.3464607394422062
Epoch: 32, step: 1182, loss: 0.3509365916252136, mean loss: 0.34646083388740007
Epoch: 32, step: 1183, loss: 0.29843878746032715, mean loss: 0.3464598205930376
Epoch: 32, step: 1184, loss: 0.41592106223106384, mean loss: 0.3464612862365216
Epoch: 32, step: 1185, loss: 0.3152371346950531, mean loss: 0.3464606274157523
Epoch: 32, step: 1186, loss: 0.3234972059726715, mean loss: 0.34646014290427546
Epoch: 32, step: 1187, loss: 0.2981363832950592, mean loss: 0.3464591233296361
Epoch: 32, step: 1188, loss: 0.3469598591327667, mean loss: 0.34645913389435123
Epoch: 32, step: 1189, loss: 0.34951674938201904, mean loss: 0.346459198403729
Epoch: 32, step: 1190, loss: 0.2987590432167053, mean loss: 0.34645819205011
Epoch: 32, step: 1191, loss: 0.3240070044994354, mean loss: 0.34645771839636424
Epoch: 32, step: 1192, loss: 0.3274642825126648, mean loss: 0.3464573176994194
Epoch: 32, step: 1193, loss: 0.31808149814605713, mean loss: 0.3464567190786955
Epoch: 32, step: 1194, loss: 0.30738022923469543, mean loss: 0.34645589473234945
Epoch: 32, step: 1195, loss: 0.37566059827804565, mean loss: 0.34645651081334566
Epoch: 32, step: 1196, loss: 0.32623618841171265, mean loss: 0.34645608426925956
Epoch: 32, step: 1197, loss: 0.33730772137641907, mean loss: 0.34645589129025073
Epoch: 32, step: 1198, loss: 0.3187331259250641, mean loss: 0.3464553065081433
Epoch: 32, step: 1199, loss: 0.33641985058784485, mean loss: 0.34645509482539105
Epoch: 32, step: 1200, loss: 0.396304726600647, mean loss: 0.3464561463057381
Epoch: 32, step: 1201, loss: 0.33089882135391235, mean loss: 0.34645581816136034
Epoch: 32, step: 1202, loss: 0.3324653208255768, mean loss: 0.34645552307166944
Epoch: 32, step: 1203, loss: 0.32942965626716614, mean loss: 0.34645516396707976
Epoch: 32, step: 1204, loss: 0.31655094027519226, mean loss: 0.3464545332492662
Epoch: 32, step: 1205, loss: 0.3271983563899994, mean loss: 0.34645412712076284
Epoch: 32, step: 1206, loss: 0.3263366222381592, mean loss: 0.34645370283509624
Epoch: 32, step: 1207, loss: 0.31935128569602966, mean loss: 0.34645313124708504
Epoch: 32, step: 1208, loss: 0.3234127461910248, mean loss: 0.3464526453372836
Epoch: 32, step: 1209, loss: 0.3206804692745209, mean loss: 0.34645210182688535
Epoch: 32, step: 1210, loss: 0.34089651703834534, mean loss: 0.3464519846674179
Epoch: 32, step: 1211, loss: 0.3309110999107361, mean loss: 0.34645165693893293
Epoch: 32, step: 1212, loss: 0.30033063888549805, mean loss: 0.3464506843525671
Epoch: 32, step: 1213, loss: 0.34683769941329956, mean loss: 0.34645069251365396
Epoch: 32, step: 1214, loss: 0.30419519543647766, mean loss: 0.34644980147982907
Epoch: 32, step: 1215, loss: 0.3315642774105072, mean loss: 0.3464494875981643
Epoch: 32, step: 1216, loss: 0.3476562798023224, mean loss: 0.3464495130444944
Epoch: 32, step: 1217, loss: 0.31668758392333984, mean loss: 0.34644888549991715
Epoch: 32, step: 1218, loss: 0.32399335503578186, mean loss: 0.34644841202425003
Epoch: 32, step: 1219, loss: 0.3300626575946808, mean loss: 0.3464480665373134
Epoch: 32, step: 1220, loss: 0.3272440433502197, mean loss: 0.3464476616368688
Epoch: 32, step: 1221, loss: 0.3456673324108124, mean loss: 0.3464476451846397
Epoch: 32, step: 1222, loss: 0.3856663107872009, mean loss: 0.3464484720418766
Epoch: 32, step: 1223, loss: 0.3608821630477905, mean loss: 0.3464487763446892
Epoch: 32, step: 1224, loss: 0.33547669649124146, mean loss: 0.34644854502725503
Epoch: 32, step: 1225, loss: 0.32558032870292664, mean loss: 0.346448105085097
Epoch: 32, step: 1226, loss: 0.3343229591846466, mean loss: 0.34644784946907714
Epoch: 32, step: 1227, loss: 0.31411653757095337, mean loss: 0.34644716789154323
Epoch: 32, step: 1228, loss: 0.3184632360935211, mean loss: 0.34644657797371964
Epoch: 32, step: 1229, loss: 0.3296140730381012, mean loss: 0.346446223142046
Epoch: 32, step: 1230, loss: 0.3292340338230133, mean loss: 0.34644586031421826
Epoch: 32, step: 1231, loss: 0.33258768916130066, mean loss: 0.346445568194253
Epoch: 32, step: 1232, loss: 0.32014474272727966, mean loss: 0.34644501380405324
Epoch: 32, step: 1233, loss: 0.3450649082660675, mean loss: 0.3464449847136789
Epoch: 32, step: 1234, loss: 0.3086521625518799, mean loss: 0.3464441881194045
Epoch: 32, step: 1235, loss: 0.33549875020980835, mean loss: 0.3464439574171469
Epoch: 32, step: 1236, loss: 0.34758201241493225, mean loss: 0.3464439814039737
Epoch: 32, step: 1237, loss: 0.3702574372291565, mean loss: 0.3464444833104742
Epoch: 32, step: 1238, loss: 0.30189061164855957, mean loss: 0.3464435442864756
Epoch: 32, step: 1239, loss: 0.3163082003593445, mean loss: 0.3464429091628892
Epoch: 32, step: 1240, loss: 0.35644131898880005, mean loss: 0.3464431198819734
Epoch: 32, step: 1241, loss: 0.3236992359161377, mean loss: 0.3464426405588129
Epoch: 32, step: 1242, loss: 0.3569086790084839, mean loss: 0.34644286112399486
Epoch: 32, step: 1243, loss: 0.34565699100494385, mean loss: 0.3464428445626251
Epoch: 32, step: 1244, loss: 0.3466838598251343, mean loss: 0.34644284964165617
Epoch: 32, step: 1245, loss: 0.31397852301597595, mean loss: 0.3464421655196301
Epoch: 32, step: 1246, loss: 0.3629467487335205, mean loss: 0.34644251331402925
Epoch: 32, step: 1247, loss: 0.3371090888977051, mean loss: 0.3464423166387002
Epoch: 32, step: 1248, loss: 0.31557324528694153, mean loss: 0.3464416661746727
Epoch: 32, step: 1249, loss: 0.3408950865268707, mean loss: 0.3464415493012341
Epoch: 32, step: 1250, loss: 0.29005351662635803, mean loss: 0.34644036115920257
Epoch: 32, step: 1251, loss: 0.3266933560371399, mean loss: 0.3464399450823985
Epoch: 32, step: 1252, loss: 0.30105626583099365, mean loss: 0.34643898885140356
Epoch: 32, step: 1253, loss: 0.3873497545719147, mean loss: 0.34643985082025697
Epoch: 32, step: 1254, loss: 0.32821372151374817, mean loss: 0.34643946681315024
Epoch: 32, step: 1255, loss: 0.3085169196128845, mean loss: 0.3464386678381966
Epoch: 32, step: 1256, loss: 0.32041704654693604, mean loss: 0.3464381196106333
Epoch: 32, step: 1257, loss: 0.3070216476917267, mean loss: 0.34643728919576966
Epoch: 32, step: 1258, loss: 0.33269813656806946, mean loss: 0.3464369997493621
Epoch: 32, step: 1259, loss: 0.3509487509727478, mean loss: 0.3464370947976309
Epoch: 32, step: 1260, loss: 0.31401070952415466, mean loss: 0.3464364116910714
Epoch: 32, step: 1261, loss: 0.33788996934890747, mean loss: 0.3464362316522608
Epoch: 32, step: 1262, loss: 0.34387949109077454, mean loss: 0.34643617779326136
Epoch: 32, step: 1263, loss: 0.3332560360431671, mean loss: 0.34643590015293124
Epoch: 32, step: 1264, loss: 0.3037717342376709, mean loss: 0.3464350014491224
Epoch: 32, step: 1265, loss: 0.3136347830295563, mean loss: 0.3464343105400265
Epoch: 32, step: 1266, loss: 0.35125932097435, mean loss: 0.3464344121726844
Epoch: 32, step: 1267, loss: 0.3613213002681732, mean loss: 0.34643472573928846
Epoch: 32, step: 1268, loss: 0.3461320698261261, mean loss: 0.34643471936449827
Epoch: 32, step: 1269, loss: 0.32121649384498596, mean loss: 0.3464341882084782
Epoch: 32, step: 1270, loss: 0.33768904209136963, mean loss: 0.34643400401870766
Epoch: 32, step: 1271, loss: 0.3148612082004547, mean loss: 0.34643333904828183
Epoch: 32, step: 1272, loss: 0.3425624966621399, mean loss: 0.3464332575242536
Epoch: 32, step: 1273, loss: 0.3015075623989105, mean loss: 0.34643231136159985
Epoch: 32, step: 1274, loss: 0.3314777910709381, mean loss: 0.34643199641687666
Epoch: 32, step: 1275, loss: 0.3236463665962219, mean loss: 0.34643151655777
Epoch: 32, step: 1276, loss: 0.34406930208206177, mean loss: 0.3464314668112295
Epoch: 32, step: 1277, loss: 0.33613136410713196, mean loss: 0.3464312499030312
Epoch: 32, step: 1278, loss: 0.333516389131546, mean loss: 0.3464309779367926
Epoch: 32, step: 1279, loss: 0.3461381196975708, mean loss: 0.34643097176979804
Epoch: 32, step: 1280, loss: 0.34298720955848694, mean loss: 0.34643089925274756
Epoch: 32, step: 1281, loss: 0.3221149146556854, mean loss: 0.346430387229488
Epoch: 32, step: 1282, loss: 0.3185880184173584, mean loss: 0.3464298009632731
Epoch: 32, step: 1283, loss: 0.32038453221321106, mean loss: 0.3464292525494613
Epoch: 32, step: 1284, loss: 0.3464835286140442, mean loss: 0.34642925369228367
Epoch: 32, step: 1285, loss: 0.3132101595401764, mean loss: 0.3464285542545831
Epoch: 32, step: 1286, loss: 0.3211447298526764, mean loss: 0.3464280219075065
Epoch: 32, step: 1287, loss: 0.3139377236366272, mean loss: 0.34642733784362173
Epoch: 32, step: 1288, loss: 0.31141000986099243, mean loss: 0.34642660059015346
Epoch: 32, step: 1289, loss: 0.3331587612628937, mean loss: 0.3464263212554588
Epoch: 32, step: 1290, loss: 0.30591529607772827, mean loss: 0.34642546837381544
Epoch: 32, step: 1291, loss: 0.3730323612689972, mean loss: 0.346426028518929
Epoch: 32, step: 1292, loss: 0.38193991780281067, mean loss: 0.3464267761640161
Epoch: 32, step: 1293, loss: 0.3483794033527374, mean loss: 0.3464268172702262
Epoch: 32, step: 1294, loss: 0.3280566930770874, mean loss: 0.34642643055519357
Epoch: 32, step: 1295, loss: 0.34936273097991943, mean loss: 0.3464264923668394
Epoch: 32, step: 1296, loss: 0.3049596846103668, mean loss: 0.3464256194732965
Epoch: 32, step: 1297, loss: 0.3032691478729248, mean loss: 0.3464247110307503
Epoch: 32, step: 1298, loss: 0.3159758150577545, mean loss: 0.34642407009581494
Epoch: 32, step: 1299, loss: 0.33617785573005676, mean loss: 0.3464238544223628
Epoch: 32, step: 1300, loss: 0.3049832880496979, mean loss: 0.3464229821546583
Epoch: 32, step: 1301, loss: 0.33287203311920166, mean loss: 0.34642269693156763
Epoch: 32, step: 1302, loss: 0.35153770446777344, mean loss: 0.34642280459100516
Epoch: 32, step: 1303, loss: 0.37466108798980713, mean loss: 0.3464233989310329
Epoch: 32, step: 1304, loss: 0.32357779145240784, mean loss: 0.34642291810247067
Epoch: 32, step: 1305, loss: 0.30262643098831177, mean loss: 0.34642199634283954
Epoch: 32, step: 1306, loss: 0.3225151300430298, mean loss: 0.34642149319927856
Epoch: 32, step: 1307, loss: 0.3326060175895691, mean loss: 0.3464212024450987
Epoch: 32, step: 1308, loss: 0.34178030490875244, mean loss: 0.3464211047769476
Epoch: 32, step: 1309, loss: 0.3348449468612671, mean loss: 0.34642086116067766
Epoch: 32, step: 1310, loss: 0.32027512788772583, mean loss: 0.3464203109442743
Epoch: 32, step: 1311, loss: 0.34526577591896057, mean loss: 0.34642028664850355
Epoch: 32, step: 1312, loss: 0.3274793326854706, mean loss: 0.34641988806779267
Epoch: 32, step: 1313, loss: 0.360988587141037, mean loss: 0.3464201946352577
Epoch: 32, step: 1314, loss: 0.36474353075027466, mean loss: 0.34642058020300626
Epoch: 32, step: 1315, loss: 0.34448617696762085, mean loss: 0.3464205394992937
Epoch: 32, step: 1316, loss: 0.349283903837204, mean loss: 0.34642059974893785
Epoch: 32, step: 1317, loss: 0.3211386203765869, mean loss: 0.34642006778791923
Epoch: 32, step: 1318, loss: 0.3646010160446167, mean loss: 0.3464204503272812
Epoch: 32, step: 1319, loss: 0.3639533221721649, mean loss: 0.3464208192229184
Epoch: 32, step: 1320, loss: 0.33384349942207336, mean loss: 0.3464205545987984
Epoch: 32, step: 1321, loss: 0.3382995128631592, mean loss: 0.34642038373741113
Epoch: 32, step: 1322, loss: 0.31000852584838867, mean loss: 0.3464196176719404
Epoch: 32, step: 1323, loss: 0.3304601311683655, mean loss: 0.3464192819089491
Epoch: 32, step: 1324, loss: 0.3697628676891327, mean loss: 0.3464197730116731
Epoch: 32, step: 1325, loss: 0.33675509691238403, mean loss: 0.3464195696903431
Epoch: 32, step: 1326, loss: 0.38891735672950745, mean loss: 0.3464204637218365
Epoch: 32, step: 1327, loss: 0.4140926003456116, mean loss: 0.34642188731945983
Epoch: 32, step: 1328, loss: 0.3253171145915985, mean loss: 0.34642144335428054
Epoch: 32, step: 1329, loss: 0.3113614618778229, mean loss: 0.34642070583941925
Epoch: 32, step: 1330, loss: 0.31281909346580505, mean loss: 0.34641999901739157
Epoch: 32, step: 1331, loss: 0.34141600131988525, mean loss: 0.3464198937587105
Epoch: 32, step: 1332, loss: 0.3631008267402649, mean loss: 0.3464202446333867
Epoch: 32, step: 1333, loss: 0.3298424482345581, mean loss: 0.3464198959354691
Epoch: 32, step: 1334, loss: 0.3431150019168854, mean loss: 0.34641982642168123
Epoch: 32, step: 1335, loss: 0.31397345662117004, mean loss: 0.34641914397237533
Epoch: 32, step: 1336, loss: 0.3599584400653839, mean loss: 0.3464194287404076
Epoch: 32, step: 1337, loss: 0.33657288551330566, mean loss: 0.34641922164531597
Epoch: 32, step: 1338, loss: 0.3056124448776245, mean loss: 0.34641836340448545
Epoch: 32, step: 1339, loss: 0.32377997040748596, mean loss: 0.34641788728786654
Epoch: 32, step: 1340, loss: 0.35326263308525085, mean loss: 0.34641803123928083
Epoch: 32, step: 1341, loss: 0.3406938314437866, mean loss: 0.3464179108565301
Epoch: 32, step: 1342, loss: 0.299821674823761, mean loss: 0.34641693093526593
Epoch: 32, step: 1343, loss: 0.32059022784233093, mean loss: 0.3464163878097803
Epoch: 32, step: 1344, loss: 0.35485076904296875, mean loss: 0.3464165651777956
Epoch: 32, step: 1345, loss: 0.3254524767398834, mean loss: 0.34641612432974
Epoch: 32, step: 1346, loss: 0.31677666306495667, mean loss: 0.34641550106275937
Epoch: 32, step: 1347, loss: 0.3024182617664337, mean loss: 0.3464145758958131
Epoch: 32, step: 1348, loss: 0.31596121191978455, mean loss: 0.346413935540787
Epoch: 32, step: 1349, loss: 0.3673376142978668, mean loss: 0.3464143755020712
Epoch: 32, step: 1350, loss: 0.3316093683242798, mean loss: 0.3464140642043741
Epoch: 32, step: 1351, loss: 0.29455122351646423, mean loss: 0.34641297373253455
Epoch: 32, step: 1352, loss: 0.3213958442211151, mean loss: 0.34641244773161967
Epoch: 32, step: 1353, loss: 0.3092258870601654, mean loss: 0.34641166587718397
Epoch: 32, step: 1354, loss: 0.38199684023857117, mean loss: 0.3464124140464408
Epoch: 32, step: 1355, loss: 0.32830116152763367, mean loss: 0.3464120332699603
Epoch: 32, step: 1356, loss: 0.3567032217979431, mean loss: 0.34641224963048856
Epoch: 32, step: 1357, loss: 0.3194217383861542, mean loss: 0.34641168219763224
Epoch: 32, step: 1358, loss: 0.332952618598938, mean loss: 0.34641139924803277
Epoch: 32, step: 1359, loss: 0.36048218607902527, mean loss: 0.3464116950516577
Epoch: 32, step: 1360, loss: 0.37334078550338745, mean loss: 0.3464122611575345
Epoch: 32, step: 1361, loss: 0.33228448033332825, mean loss: 0.3464119641682382
Epoch: 32, step: 1362, loss: 0.30610525608062744, mean loss: 0.3464111168724469
Epoch: 32, step: 1363, loss: 0.3114910125732422, mean loss: 0.3464103828250178
Epoch: 32, step: 1364, loss: 0.28449341654777527, mean loss: 0.3464090813101611
Epoch: 32, step: 1365, loss: 0.33505332469940186, mean loss: 0.3464088426134652
Epoch: 32, step: 1366, loss: 0.3555958569049835, mean loss: 0.3464090357193883
Epoch: 32, step: 1367, loss: 0.310066819190979, mean loss: 0.34640827184229633
Epoch: 32, step: 1368, loss: 0.3309493660926819, mean loss: 0.34640794691836774
Epoch: 32, step: 1369, loss: 0.32823169231414795, mean loss: 0.34640756488771063
Epoch: 32, step: 1370, loss: 0.333528608083725, mean loss: 0.346407294201971
Epoch: 32, step: 1371, loss: 0.3669060170650482, mean loss: 0.34640772502842887
Epoch: 32, step: 1372, loss: 0.32258182764053345, mean loss: 0.34640722428448933
Epoch: 32, step: 1373, loss: 0.34975308179855347, mean loss: 0.3464072946022043
Epoch: 32, step: 1374, loss: 0.335304319858551, mean loss: 0.346407061263097
Epoch: 32, step: 1375, loss: 0.32654693722724915, mean loss: 0.3464066438933081
Epoch: 32, step: 1376, loss: 0.3375951945781708, mean loss: 0.34640645872047393
Epoch: 32, step: 1377, loss: 0.3502635061740875, mean loss: 0.3464065397747221
Epoch: 32, step: 1378, loss: 0.32438215613365173, mean loss: 0.34640607695118536
Epoch: 32, step: 1379, loss: 0.3339231610298157, mean loss: 0.3464058146389234
Epoch: 32, step: 1380, loss: 0.360370934009552, mean loss: 0.34640610809159883
Epoch: 32, step: 1381, loss: 0.3174748420715332, mean loss: 0.3464055001641767
Epoch: 32, step: 1382, loss: 0.327806293964386, mean loss: 0.3464051093506573
Epoch: 32, step: 1383, loss: 0.3506740927696228, mean loss: 0.3464051990502585
Epoch: 32, step: 1384, loss: 0.29986608028411865, mean loss: 0.346404221193877
Epoch: 32, step: 1385, loss: 0.351314514875412, mean loss: 0.34640432436431196
Epoch: 32, step: 1386, loss: 0.34067875146865845, mean loss: 0.3464042040665308
Epoch: 32, step: 1387, loss: 0.29148122668266296, mean loss: 0.34640305012549827
Epoch: 32, step: 1388, loss: 0.34992220997810364, mean loss: 0.34640312406208784
Epoch: 32, step: 1389, loss: 0.308880478143692, mean loss: 0.3464023357380843
Epoch: 32, step: 1390, loss: 0.3440488278865814, mean loss: 0.3464022862936033
Epoch: 32, step: 1391, loss: 0.36810848116874695, mean loss: 0.3464027423061007
Epoch: 32, step: 1392, loss: 0.38556742668151855, mean loss: 0.3464035650763025
Epoch: 32, step: 1393, loss: 0.3206309974193573, mean loss: 0.34640302365855413
Epoch: 32, step: 1394, loss: 0.3947047293186188, mean loss: 0.3464040383363194
Epoch: 32, step: 1395, loss: 0.39516204595565796, mean loss: 0.3464050625781398
Epoch: 32, step: 1396, loss: 0.3767353892326355, mean loss: 0.3464056997029514
Epoch: 32, step: 1397, loss: 0.320867657661438, mean loss: 0.3464051632570823
Epoch: 32, step: 1398, loss: 0.37904518842697144, mean loss: 0.34640584887107123
Epoch: 32, step: 1399, loss: 0.30943718552589417, mean loss: 0.3464050723489879
Epoch: 32, step: 1400, loss: 0.3461756408214569, mean loss: 0.34640506752990896
Epoch: 32, step: 1401, loss: 0.34707900881767273, mean loss: 0.34640508168536555
Epoch: 32, step: 1402, loss: 0.3492336571216583, mean loss: 0.34640514109549003
Epoch: 32, step: 1403, loss: 0.36115092039108276, mean loss: 0.3464054508026919
Epoch: 32, step: 1404, loss: 0.3371450901031494, mean loss: 0.3464052563104167
Epoch: 32, step: 1405, loss: 0.3147273361682892, mean loss: 0.3464045910035712
Epoch: 32, step: 1406, loss: 0.3173868954181671, mean loss: 0.3464039815801629
Epoch: 32, step: 1407, loss: 0.3119003176689148, mean loss: 0.3464032569568449
Epoch: 32, step: 1408, loss: 0.36188310384750366, mean loss: 0.34640358204760846
Epoch: 32, step: 1409, loss: 0.3251628577709198, mean loss: 0.3464031359825852
Epoch: 32, step: 1410, loss: 0.4024300277233124, mean loss: 0.3464043125484883
Epoch: 32, step: 1411, loss: 0.2723206877708435, mean loss: 0.3464027568234825
Epoch: 32, step: 1412, loss: 0.33697688579559326, mean loss: 0.34640255888830623
Epoch: 32, step: 1413, loss: 0.2896527349948883, mean loss: 0.34640136721588816
Epoch: 32, step: 1414, loss: 0.3387998640537262, mean loss: 0.3464012075975701
Epoch: 32, step: 1415, loss: 0.2881165146827698, mean loss: 0.34639998374629943
Epoch: 32, step: 1416, loss: 0.3474920690059662, mean loss: 0.34640000667722354
Epoch: 32, step: 1417, loss: 0.35192498564720154, mean loss: 0.34640012268484477
Epoch: 32, step: 1418, loss: 0.31712183356285095, mean loss: 0.34639950794343505
Epoch: 32, step: 1419, loss: 0.35542869567871094, mean loss: 0.34639969752073696
Epoch: 32, step: 1420, loss: 0.3178010880947113, mean loss: 0.3463990970754321
Epoch: 32, step: 1421, loss: 0.3545755445957184, mean loss: 0.34639926874134686
Epoch: 32, step: 1422, loss: 0.33976292610168457, mean loss: 0.3463991294131228
Epoch: 32, step: 1423, loss: 0.316764771938324, mean loss: 0.34639850726084126
Epoch: 32, step: 1424, loss: 0.34052330255508423, mean loss: 0.34639838391768196
Epoch: 32, step: 1425, loss: 0.3084191083908081, mean loss: 0.34639758660325265
Epoch: 32, step: 1426, loss: 0.3086853325366974, mean loss: 0.3463967949111341
Epoch: 32, step: 1427, loss: 0.3012368977069855, mean loss: 0.34639584689078806
Epoch: 32, step: 1428, loss: 0.3295019865036011, mean loss: 0.3463954922534182
Epoch: 32, step: 1429, loss: 0.32884085178375244, mean loss: 0.34639512375263165
Epoch: 32, step: 1430, loss: 0.3227675259113312, mean loss: 0.34639462778088914
Epoch: 32, step: 1431, loss: 0.3242337107658386, mean loss: 0.3463941626063086
Epoch: 32, step: 1432, loss: 0.39632701873779297, mean loss: 0.34639521071311014
Epoch: 32, step: 1433, loss: 0.2795114517211914, mean loss: 0.34639380683084253
Epoch: 32, step: 1434, loss: 0.32174769043922424, mean loss: 0.34639328952260434
Epoch: 32, step: 1435, loss: 0.38374555110931396, mean loss: 0.34639407350928864
Epoch: 32, step: 1436, loss: 0.32728636264801025, mean loss: 0.34639367246592917
Epoch: 32, step: 1437, loss: 0.34035801887512207, mean loss: 0.34639354578890297
Epoch: 32, step: 1438, loss: 0.2933565378189087, mean loss: 0.34639243266513925
Epoch: 32, step: 1439, loss: 0.2984536290168762, mean loss: 0.34639142656197336
Epoch: 32, step: 1440, loss: 0.35146915912628174, mean loss: 0.3463915331273276
Epoch: 32, step: 1441, loss: 0.29858511686325073, mean loss: 0.3463905298447198
Epoch: 32, step: 1442, loss: 0.3127759099006653, mean loss: 0.346389824411047
Epoch: 32, step: 1443, loss: 0.38388946652412415, mean loss: 0.34639061135896343
Valid: 32, mean loss: 0.186403493086497
Epoch: 33, step: 0, loss: 0.3113738000392914, mean loss: 0.34638987652985886
Epoch: 33, step: 1, loss: 0.35047978162765503, mean loss: 0.34638996235487035
Epoch: 33, step: 2, loss: 0.309632271528244, mean loss: 0.3463891910257165
Epoch: 33, step: 3, loss: 0.33888569474220276, mean loss: 0.34638903357447676
Epoch: 33, step: 4, loss: 0.3566664159297943, mean loss: 0.34638924922763065
Epoch: 33, step: 5, loss: 0.3226727843284607, mean loss: 0.34638875158893623
Epoch: 33, step: 6, loss: 0.35260462760925293, mean loss: 0.34638888201290696
Epoch: 33, step: 7, loss: 0.32116231322288513, mean loss: 0.3463883527101627
Epoch: 33, step: 8, loss: 0.33714720606803894, mean loss: 0.3463881588169032
Epoch: 33, step: 9, loss: 0.339914470911026, mean loss: 0.3463880229919713
Epoch: 33, step: 10, loss: 0.30645063519477844, mean loss: 0.3463871850802201
Epoch: 33, step: 11, loss: 0.30918729305267334, mean loss: 0.3463864046192427
Epoch: 33, step: 12, loss: 0.316699743270874, mean loss: 0.3463857818003746
Epoch: 33, step: 13, loss: 0.3644333779811859, mean loss: 0.34638616042656895
Epoch: 33, step: 14, loss: 0.3539388179779053, mean loss: 0.3463863188728221
Epoch: 33, step: 15, loss: 0.28903695940971375, mean loss: 0.34638511577305997
Epoch: 33, step: 16, loss: 0.3702497184276581, mean loss: 0.3463856164045533
Epoch: 33, step: 17, loss: 0.3416348397731781, mean loss: 0.3463855167448799
Epoch: 33, step: 18, loss: 0.32000991702079773, mean loss: 0.34638496346091846
Epoch: 33, step: 19, loss: 0.33615702390670776, mean loss: 0.3463847489127654
Epoch: 33, step: 20, loss: 0.35080355405807495, mean loss: 0.3463848416026558
Epoch: 33, step: 21, loss: 0.3435930907726288, mean loss: 0.3463847830434657
Epoch: 33, step: 22, loss: 0.35462430119514465, mean loss: 0.3463849558702754
Epoch: 33, step: 23, loss: 0.3332754969596863, mean loss: 0.3463846809005021
Epoch: 33, step: 24, loss: 0.35069918632507324, mean loss: 0.34638477139498425
Epoch: 33, step: 25, loss: 0.3500712215900421, mean loss: 0.34638484871471653
Epoch: 33, step: 26, loss: 0.29676347970962524, mean loss: 0.3463838079762571
Epoch: 33, step: 27, loss: 0.3259943425655365, mean loss: 0.34638338034485167
Epoch: 33, step: 28, loss: 0.31917592883110046, mean loss: 0.3463828097307388
Epoch: 33, step: 29, loss: 0.37581613659858704, mean loss: 0.3463834270145538
Epoch: 33, step: 30, loss: 0.32033610343933105, mean loss: 0.34638288075438617
Epoch: 33, step: 31, loss: 0.30014991760253906, mean loss: 0.3463819111846531
Epoch: 33, step: 32, loss: 0.3732684552669525, mean loss: 0.34638247502116526
Epoch: 33, step: 33, loss: 0.38120076060295105, mean loss: 0.3463832051785612
Epoch: 33, step: 34, loss: 0.31765738129615784, mean loss: 0.34638260279585975
Epoch: 33, step: 35, loss: 0.34398961067199707, mean loss: 0.34638255261568607
Epoch: 33, step: 36, loss: 0.3143109679222107, mean loss: 0.34638188010033255
Epoch: 33, step: 37, loss: 0.32806211709976196, mean loss: 0.3463814959576821
Epoch: 33, step: 38, loss: 0.2950192391872406, mean loss: 0.3463804189776068
Epoch: 33, step: 39, loss: 0.3235218822956085, mean loss: 0.3463799396826164
Epoch: 33, step: 40, loss: 0.3649723529815674, mean loss: 0.3463803295178815
Epoch: 33, step: 41, loss: 0.30177634954452515, mean loss: 0.34637939430632503
Epoch: 33, step: 42, loss: 0.33141180872917175, mean loss: 0.3463790804875688
Epoch: 33, step: 43, loss: 0.3306310176849365, mean loss: 0.346378750311814
Epoch: 33, step: 44, loss: 0.3167703449726105, mean loss: 0.3463781295514865
Epoch: 33, step: 45, loss: 0.34231510758399963, mean loss: 0.34637804436925734
Epoch: 33, step: 46, loss: 0.3649802803993225, mean loss: 0.34637843436141713
Epoch: 33, step: 47, loss: 0.31035101413726807, mean loss: 0.34637767906958855
Epoch: 33, step: 48, loss: 0.3917383849620819, mean loss: 0.3463786300078476
Epoch: 33, step: 49, loss: 0.3593587875366211, mean loss: 0.3463789021171413
Epoch: 33, step: 50, loss: 0.3444952368736267, mean loss: 0.3463788626297874
Epoch: 33, step: 51, loss: 0.3111523687839508, mean loss: 0.3463781241907918
Epoch: 33, step: 52, loss: 0.3573108911514282, mean loss: 0.3463783533652381
Epoch: 33, step: 53, loss: 0.38494911789894104, mean loss: 0.34637916187495454
Epoch: 33, step: 54, loss: 0.33111295104026794, mean loss: 0.3463788418755659
Epoch: 33, step: 55, loss: 0.3763996958732605, mean loss: 0.3463794711380375
Epoch: 33, step: 56, loss: 0.36892184615135193, mean loss: 0.34637994363536534
Epoch: 33, step: 57, loss: 0.34909456968307495, mean loss: 0.3463800005338363
Epoch: 33, step: 58, loss: 0.3257283866405487, mean loss: 0.3463795676857741
Epoch: 33, step: 59, loss: 0.33476218581199646, mean loss: 0.3463793241960467
Epoch: 33, step: 60, loss: 0.3349090814590454, mean loss: 0.34637908379526
Epoch: 33, step: 61, loss: 0.32378315925598145, mean loss: 0.3463786102251435
Epoch: 33, step: 62, loss: 0.3734061121940613, mean loss: 0.34637917666131596
Epoch: 33, step: 63, loss: 0.3481806516647339, mean loss: 0.3463792144154237
Epoch: 33, step: 64, loss: 0.35300543904304504, mean loss: 0.3463793532804954
Epoch: 33, step: 65, loss: 0.362144410610199, mean loss: 0.34637968366017036
Epoch: 33, step: 66, loss: 0.3543281555175781, mean loss: 0.3463798502284525
Epoch: 33, step: 67, loss: 0.31039944291114807, mean loss: 0.3463790962383579
Epoch: 33, step: 68, loss: 0.32814326882362366, mean loss: 0.34637871410413157
Epoch: 33, step: 69, loss: 0.30437812209129333, mean loss: 0.34637783399449634
Epoch: 33, step: 70, loss: 0.3043404817581177, mean loss: 0.34637695313301997
Epoch: 33, step: 71, loss: 0.3153557777404785, mean loss: 0.3463763031209633
Epoch: 33, step: 72, loss: 0.3295285999774933, mean loss: 0.34637595010465855
Epoch: 33, step: 73, loss: 0.3196781873703003, mean loss: 0.3463753907080459
Epoch: 33, step: 74, loss: 0.3083827495574951, mean loss: 0.3463745946672063
Epoch: 33, step: 75, loss: 0.36383798718452454, mean loss: 0.34637496056128353
Epoch: 33, step: 76, loss: 0.31462064385414124, mean loss: 0.3463742952568207
Epoch: 33, step: 77, loss: 0.3381776511669159, mean loss: 0.3463741235274243
Epoch: 33, step: 78, loss: 0.41151249408721924, mean loss: 0.3463754882248025
Epoch: 33, step: 79, loss: 0.3025747537612915, mean loss: 0.346374570586018
Epoch: 33, step: 80, loss: 0.35962003469467163, mean loss: 0.346374848076729
Epoch: 33, step: 81, loss: 0.3403216302394867, mean loss: 0.3463747212652773
Epoch: 33, step: 82, loss: 0.3291601836681366, mean loss: 0.3463743606381149
Epoch: 33, step: 83, loss: 0.30239591002464294, mean loss: 0.34637343935332743
Epoch: 33, step: 84, loss: 0.32049861550331116, mean loss: 0.34637289732463167
Epoch: 33, step: 85, loss: 0.3520313799381256, mean loss: 0.3463730158566735
Epoch: 33, step: 86, loss: 0.3087696135044098, mean loss: 0.3463722281694083
Epoch: 33, step: 87, loss: 0.324969083070755, mean loss: 0.3463717798421126
Epoch: 33, step: 88, loss: 0.3242432773113251, mean loss: 0.3463713163306124
Epoch: 33, step: 89, loss: 0.34183377027511597, mean loss: 0.34637122128754644
Epoch: 33, step: 90, loss: 0.3183717727661133, mean loss: 0.3463706348256877
Epoch: 33, step: 91, loss: 0.3872153162956238, mean loss: 0.34637149031918363
Epoch: 33, step: 92, loss: 0.35496020317077637, mean loss: 0.34637167020635196
Epoch: 33, step: 93, loss: 0.33262014389038086, mean loss: 0.3463713821921452
Epoch: 33, step: 94, loss: 0.29837244749069214, mean loss: 0.3463703769156943
Epoch: 33, step: 95, loss: 0.38507577776908875, mean loss: 0.34637118753395796
Epoch: 33, step: 96, loss: 0.33968421816825867, mean loss: 0.3463710474897818
Epoch: 33, step: 97, loss: 0.46027278900146484, mean loss: 0.3463734328665674
Epoch: 33, step: 98, loss: 0.313953697681427, mean loss: 0.3463727539334522
Epoch: 33, step: 99, loss: 0.3454829752445221, mean loss: 0.34637273530012397
Epoch: 33, step: 100, loss: 0.3381898105144501, mean loss: 0.3463725639407374
Epoch: 33, step: 101, loss: 0.3474631905555725, mean loss: 0.3463725867791722
Epoch: 33, step: 102, loss: 0.3383370339870453, mean loss: 0.3463724185129636
Epoch: 33, step: 103, loss: 0.3560202121734619, mean loss: 0.3463726205356133
Epoch: 33, step: 104, loss: 0.37210240960121155, mean loss: 0.34637315930038215
Epoch: 33, step: 105, loss: 0.3416052460670471, mean loss: 0.3463730594655224
Epoch: 33, step: 106, loss: 0.3580949008464813, mean loss: 0.34637330490285106
Epoch: 33, step: 107, loss: 0.31791967153549194, mean loss: 0.34637270914000834
Epoch: 33, step: 108, loss: 0.31140780448913574, mean loss: 0.34637197705934314
Epoch: 33, step: 109, loss: 0.34751129150390625, mean loss: 0.3463720009133368
Epoch: 33, step: 110, loss: 0.3683743178844452, mean loss: 0.34637246156942986
Epoch: 33, step: 111, loss: 0.3189595341682434, mean loss: 0.34637188764498045
Epoch: 33, step: 112, loss: 0.32723501324653625, mean loss: 0.34637148699859927
Epoch: 33, step: 113, loss: 0.3253558874130249, mean loss: 0.34637104702875493
Epoch: 33, step: 114, loss: 0.3197128474712372, mean loss: 0.3463704889405443
Epoch: 33, step: 115, loss: 0.3872278034687042, mean loss: 0.34637134426868293
Epoch: 33, step: 116, loss: 0.34462520480155945, mean loss: 0.34637130771486213
Epoch: 33, step: 117, loss: 0.3433111011981964, mean loss: 0.3463712436535995
Epoch: 33, step: 118, loss: 0.3167067766189575, mean loss: 0.34637062268131436
Epoch: 33, step: 119, loss: 0.3644225597381592, mean loss: 0.3463710005582518
Epoch: 33, step: 120, loss: 0.3139107823371887, mean loss: 0.3463703210903888
Epoch: 33, step: 121, loss: 0.3151147663593292, mean loss: 0.3463696668526291
Epoch: 33, step: 122, loss: 0.333412230014801, mean loss: 0.34636939563469427
Epoch: 33, step: 123, loss: 0.33535727858543396, mean loss: 0.3463691651399469
Epoch: 33, step: 124, loss: 0.3388313055038452, mean loss: 0.34636900736822335
Epoch: 33, step: 125, loss: 0.3326053321361542, mean loss: 0.3463687192926398
Epoch: 33, step: 126, loss: 0.3660830557346344, mean loss: 0.346369131907731
Epoch: 33, step: 127, loss: 0.29953089356422424, mean loss: 0.34636815161810475
Epoch: 33, step: 128, loss: 0.29848065972328186, mean loss: 0.3463671493893549
Epoch: 33, step: 129, loss: 0.33990031480789185, mean loss: 0.34636701404896353
Epoch: 33, step: 130, loss: 0.3274572789669037, mean loss: 0.34636661830706617
Epoch: 33, step: 131, loss: 0.3276071846485138, mean loss: 0.3463662257188848
Epoch: 33, step: 132, loss: 0.31397056579589844, mean loss: 0.346365547772669
Epoch: 33, step: 133, loss: 0.32929402589797974, mean loss: 0.3463651905232262
Epoch: 33, step: 134, loss: 0.2886617183685303, mean loss: 0.34636398300921284
Epoch: 33, step: 135, loss: 0.36035534739494324, mean loss: 0.34636427578908197
Epoch: 33, step: 136, loss: 0.4361869990825653, mean loss: 0.34636615535808934
Epoch: 33, step: 137, loss: 0.3295382559299469, mean loss: 0.3463658032363185
Epoch: 33, step: 138, loss: 0.3151722848415375, mean loss: 0.346365150529357
Epoch: 33, step: 139, loss: 0.32189759612083435, mean loss: 0.34636463857015026
Epoch: 33, step: 140, loss: 0.31079772114753723, mean loss: 0.3463638943833986
Epoch: 33, step: 141, loss: 0.3810209333896637, mean loss: 0.3463646195170766
Epoch: 33, step: 142, loss: 0.32832902669906616, mean loss: 0.34636424216394723
Epoch: 33, step: 143, loss: 0.31491270661354065, mean loss: 0.3463635841269661
Epoch: 33, step: 144, loss: 0.333922803401947, mean loss: 0.34636332384325114
Epoch: 33, step: 145, loss: 0.32664954662323, mean loss: 0.3463629114038767
Epoch: 33, step: 146, loss: 0.3288954198360443, mean loss: 0.3463625459675377
Epoch: 33, step: 147, loss: 0.3255515992641449, mean loss: 0.34636211059208366
Epoch: 33, step: 148, loss: 0.3448426127433777, mean loss: 0.34636207880409076
Epoch: 33, step: 149, loss: 0.33627989888191223, mean loss: 0.34636186788864953
Epoch: 33, step: 150, loss: 0.3155819773674011, mean loss: 0.346361223998297
Epoch: 33, step: 151, loss: 0.3213545083999634, mean loss: 0.3463607008890258
Epoch: 33, step: 152, loss: 0.3828135132789612, mean loss: 0.346361463420401
Epoch: 33, step: 153, loss: 0.3355017602443695, mean loss: 0.346361236258472
Epoch: 33, step: 154, loss: 0.3318627178668976, mean loss: 0.3463609329865998
Epoch: 33, step: 155, loss: 0.32789283990859985, mean loss: 0.3463605466894722
Epoch: 33, step: 156, loss: 0.3209785223007202, mean loss: 0.346360015784739
Epoch: 33, step: 157, loss: 0.359401136636734, mean loss: 0.34636028855447026
Epoch: 33, step: 158, loss: 0.3617405295372009, mean loss: 0.34636061024280523
Epoch: 33, step: 159, loss: 0.3105974495410919, mean loss: 0.34635986224730825
Epoch: 33, step: 160, loss: 0.3542439639568329, mean loss: 0.3463600271418288
Epoch: 33, step: 161, loss: 0.35474681854248047, mean loss: 0.34636020254634214
Epoch: 33, step: 162, loss: 0.31688806414604187, mean loss: 0.3463595861678333
Epoch: 33, step: 163, loss: 0.3203659653663635, mean loss: 0.346359042550199
Epoch: 33, step: 164, loss: 0.30652859807014465, mean loss: 0.34635820957354885
Epoch: 33, step: 165, loss: 0.33299893140792847, mean loss: 0.346357930195947
Epoch: 33, step: 166, loss: 0.31675297021865845, mean loss: 0.34635731109140744
Epoch: 33, step: 167, loss: 0.3204408884048462, mean loss: 0.346356769133593
Epoch: 33, step: 168, loss: 0.3667106330394745, mean loss: 0.3463571947596549
Epoch: 33, step: 169, loss: 0.30614835023880005, mean loss: 0.34635635395741904
Epoch: 33, step: 170, loss: 0.32445845007896423, mean loss: 0.3463558960626011
Epoch: 33, step: 171, loss: 0.3152620494365692, mean loss: 0.3463552458901641
Epoch: 33, step: 172, loss: 0.3249548375606537, mean loss: 0.34635479841691097
Epoch: 33, step: 173, loss: 0.3716277480125427, mean loss: 0.3463553268522724
Epoch: 33, step: 174, loss: 0.34978577494621277, mean loss: 0.3463553985784541
Epoch: 33, step: 175, loss: 0.3174341022968292, mean loss: 0.3463547938846287
Epoch: 33, step: 176, loss: 0.3319135904312134, mean loss: 0.3463544919505834
Epoch: 33, step: 177, loss: 0.30585309863090515, mean loss: 0.34635364517255035
Epoch: 33, step: 178, loss: 0.3511604070663452, mean loss: 0.34635374566724825
Epoch: 33, step: 179, loss: 0.37685176730155945, mean loss: 0.3463543832743237
Epoch: 33, step: 180, loss: 0.35765722393989563, mean loss: 0.3463546195722909
Epoch: 33, step: 181, loss: 0.3492752015590668, mean loss: 0.34635468062890307
Epoch: 33, step: 182, loss: 0.31702175736427307, mean loss: 0.346354067418424
Epoch: 33, step: 183, loss: 0.3136570155620575, mean loss: 0.3463533838944702
Epoch: 33, step: 184, loss: 0.32735535502433777, mean loss: 0.3463529867535778
Epoch: 33, step: 185, loss: 0.3196827471256256, mean loss: 0.3463524292419839
Epoch: 33, step: 186, loss: 0.32991302013397217, mean loss: 0.34635208560166725
Epoch: 33, step: 187, loss: 0.34743762016296387, mean loss: 0.3463521082926071
Epoch: 33, step: 188, loss: 0.37493038177490234, mean loss: 0.34635270565205784
Epoch: 33, step: 189, loss: 0.33478274941444397, mean loss: 0.34635246381525675
Epoch: 33, step: 190, loss: 0.31020715832710266, mean loss: 0.34635170831695006
Epoch: 33, step: 191, loss: 0.317150354385376, mean loss: 0.34635109797178804
Epoch: 33, step: 192, loss: 0.4370865523815155, mean loss: 0.3463529944176948
Epoch: 33, step: 193, loss: 0.2977680563926697, mean loss: 0.3463519789736028
Epoch: 33, step: 194, loss: 0.3201107382774353, mean loss: 0.34635143053293366
Epoch: 33, step: 195, loss: 0.3258504867553711, mean loss: 0.34635100207314895
Epoch: 33, step: 196, loss: 0.36431050300598145, mean loss: 0.3463513774101661
Epoch: 33, step: 197, loss: 0.40522676706314087, mean loss: 0.3463526078258328
Epoch: 33, step: 198, loss: 0.3056657910346985, mean loss: 0.34635175754440106
Epoch: 33, step: 199, loss: 0.29727616906166077, mean loss: 0.3463507319741327
Epoch: 33, step: 200, loss: 0.28613337874412537, mean loss: 0.3463494735921456
Epoch: 33, step: 201, loss: 0.34740859270095825, mean loss: 0.34634949572444607
Epoch: 33, step: 202, loss: 0.32456642389297485, mean loss: 0.34634904053539933
Epoch: 33, step: 203, loss: 0.3580811023712158, mean loss: 0.3463492856888145
Epoch: 33, step: 204, loss: 0.3318629562854767, mean loss: 0.34634898298849054
Epoch: 33, step: 205, loss: 0.3779745399951935, mean loss: 0.3463496438091894
Epoch: 33, step: 206, loss: 0.3354085087776184, mean loss: 0.3463494151973289
Epoch: 33, step: 207, loss: 0.30703145265579224, mean loss: 0.3463485936770084
Epoch: 33, step: 208, loss: 0.32509636878967285, mean loss: 0.34634814963645577
Epoch: 33, step: 209, loss: 0.346386194229126, mean loss: 0.3463481504313367
Epoch: 33, step: 210, loss: 0.35207805037498474, mean loss: 0.3463482701459376
Epoch: 33, step: 211, loss: 0.30168411135673523, mean loss: 0.34634733699871234
Epoch: 33, step: 212, loss: 0.3287637233734131, mean loss: 0.34634696964023276
Epoch: 33, step: 213, loss: 0.35793206095695496, mean loss: 0.3463472116719738
Epoch: 33, step: 214, loss: 0.29964226484298706, mean loss: 0.3463462359486816
Epoch: 33, step: 215, loss: 0.3230483829975128, mean loss: 0.34634574923829153
Epoch: 33, step: 216, loss: 0.32086771726608276, mean loss: 0.3463452169933737
Epoch: 33, step: 217, loss: 0.3276223838329315, mean loss: 0.34634482587507076
Epoch: 33, step: 218, loss: 0.34644851088523865, mean loss: 0.3463448280409961
Epoch: 33, step: 219, loss: 0.29228678345680237, mean loss: 0.3463436988204792
Epoch: 33, step: 220, loss: 0.398396760225296, mean loss: 0.3463447861361144
Epoch: 33, step: 221, loss: 0.32612887024879456, mean loss: 0.3463443638627325
Epoch: 33, step: 222, loss: 0.35174497961997986, mean loss: 0.34634447666932794
Epoch: 33, step: 223, loss: 0.3125004470348358, mean loss: 0.3463437697591927
Epoch: 33, step: 224, loss: 0.3360787332057953, mean loss: 0.34634355535485334
Epoch: 33, step: 225, loss: 0.3578164279460907, mean loss: 0.3463437949820849
Epoch: 33, step: 226, loss: 0.3097977042198181, mean loss: 0.3463430316810393
Epoch: 33, step: 227, loss: 0.30254101753234863, mean loss: 0.3463421168520053
Epoch: 33, step: 228, loss: 0.3828006088733673, mean loss: 0.3463428782916582
Epoch: 33, step: 229, loss: 0.3310830891132355, mean loss: 0.3463425595959233
Epoch: 33, step: 230, loss: 0.35231566429138184, mean loss: 0.34634268433966736
Epoch: 33, step: 231, loss: 0.3118888735771179, mean loss: 0.34634196481308727
Epoch: 33, step: 232, loss: 0.30314692854881287, mean loss: 0.34634106275531834
Epoch: 33, step: 233, loss: 0.33732593059539795, mean loss: 0.3463408744929419
Epoch: 33, step: 234, loss: 0.305818647146225, mean loss: 0.3463400282877641
Epoch: 33, step: 235, loss: 0.332123339176178, mean loss: 0.34633973141403557
Epoch: 33, step: 236, loss: 0.35619378089904785, mean loss: 0.3463399371825729
Epoch: 33, step: 237, loss: 0.3651852607727051, mean loss: 0.346340330695281
Epoch: 33, step: 238, loss: 0.336779922246933, mean loss: 0.3463401310667819
Epoch: 33, step: 239, loss: 0.3965390920639038, mean loss: 0.346341179236852
Epoch: 33, step: 240, loss: 0.32354459166526794, mean loss: 0.34634070324688326
Epoch: 33, step: 241, loss: 0.34413015842437744, mean loss: 0.3463406570919406
Epoch: 33, step: 242, loss: 0.34468671679496765, mean loss: 0.346340622559311
Epoch: 33, step: 243, loss: 0.3492615520954132, mean loss: 0.34634068354414344
Epoch: 33, step: 244, loss: 0.3898209035396576, mean loss: 0.3463415913300172
Epoch: 33, step: 245, loss: 0.34375375509262085, mean loss: 0.3463415373019526
Epoch: 33, step: 246, loss: 0.3592287600040436, mean loss: 0.3463418063518848
Epoch: 33, step: 247, loss: 0.35959628224372864, mean loss: 0.34634208306328124
Epoch: 33, step: 248, loss: 0.31889790296554565, mean loss: 0.34634151012784986
Epoch: 33, step: 249, loss: 0.3383854031562805, mean loss: 0.3463413440365182
Epoch: 33, step: 250, loss: 0.3279809057712555, mean loss: 0.3463409607528352
Epoch: 33, step: 251, loss: 0.3017983138561249, mean loss: 0.3463400309213619
Epoch: 33, step: 252, loss: 0.3186367452144623, mean loss: 0.3463394526250315
Epoch: 33, step: 253, loss: 0.3394818902015686, mean loss: 0.3463393094788197
Epoch: 33, step: 254, loss: 0.3375629186630249, mean loss: 0.3463391262824013
Epoch: 33, step: 255, loss: 0.37259677052497864, mean loss: 0.34633967436715213
Epoch: 33, step: 256, loss: 0.3332635760307312, mean loss: 0.34633940143099534
Epoch: 33, step: 257, loss: 0.31608864665031433, mean loss: 0.3463387700230475
Epoch: 33, step: 258, loss: 0.32457202672958374, mean loss: 0.346338315706851
Epoch: 33, step: 259, loss: 0.35323530435562134, mean loss: 0.34633845965802496
Epoch: 33, step: 260, loss: 0.3377462923526764, mean loss: 0.3463382803295065
Epoch: 33, step: 261, loss: 0.3832900822162628, mean loss: 0.3463390515404654
Epoch: 33, step: 262, loss: 0.3314104974269867, mean loss: 0.3463387399771947
Epoch: 33, step: 263, loss: 0.3663957118988037, mean loss: 0.3463391585633021
Epoch: 33, step: 264, loss: 0.3433155119419098, mean loss: 0.34633909546155073
Epoch: 33, step: 265, loss: 0.342507928609848, mean loss: 0.34633901550898905
Epoch: 33, step: 266, loss: 0.33934110403060913, mean loss: 0.3463388694727304
Epoch: 33, step: 267, loss: 0.3406100273132324, mean loss: 0.3463387499226019
Epoch: 33, step: 268, loss: 0.3238913416862488, mean loss: 0.34633828149731366
Epoch: 33, step: 269, loss: 0.2971874177455902, mean loss: 0.34633725585431563
Epoch: 33, step: 270, loss: 0.3094465732574463, mean loss: 0.3463364860635555
Epoch: 33, step: 271, loss: 0.336056649684906, mean loss: 0.34633627156066804
Epoch: 33, step: 272, loss: 0.34858402609825134, mean loss: 0.34633631846217117
Epoch: 33, step: 273, loss: 0.30638208985328674, mean loss: 0.34633548479717496
Epoch: 33, step: 274, loss: 0.3310669958591461, mean loss: 0.34633516621915134
Epoch: 33, step: 275, loss: 0.36744964122772217, mean loss: 0.3463356067648659
Epoch: 33, step: 276, loss: 0.363010048866272, mean loss: 0.34633595466367667
Epoch: 33, step: 277, loss: 0.3061235845088959, mean loss: 0.34633511568245084
Epoch: 33, step: 278, loss: 0.33235928416252136, mean loss: 0.3463348241001446
Epoch: 33, step: 279, loss: 0.2927539050579071, mean loss: 0.34633370624737314
Epoch: 33, step: 280, loss: 0.3238348960876465, mean loss: 0.3463332368669847
Epoch: 33, step: 281, loss: 0.3418315649032593, mean loss: 0.3463331429530204
Epoch: 33, step: 282, loss: 0.37624627351760864, mean loss: 0.34633376698828827
Epoch: 33, step: 283, loss: 0.3136928975582123, mean loss: 0.3463330860622738
Epoch: 33, step: 284, loss: 0.2832910716533661, mean loss: 0.34633177096090306
Epoch: 33, step: 285, loss: 0.34244805574417114, mean loss: 0.3463316899455245
Epoch: 33, step: 286, loss: 0.3191531002521515, mean loss: 0.3463311230044182
Epoch: 33, step: 287, loss: 0.3612220585346222, mean loss: 0.3463314336205119
Epoch: 33, step: 288, loss: 0.30741456151008606, mean loss: 0.34633062185454727
Epoch: 33, step: 289, loss: 0.3555855453014374, mean loss: 0.3463308148987141
Epoch: 33, step: 290, loss: 0.3193291425704956, mean loss: 0.3463302516950696
Epoch: 33, step: 291, loss: 0.34586602449417114, mean loss: 0.3463302420123731
Epoch: 33, step: 292, loss: 0.3161225914955139, mean loss: 0.3463296119643907
Epoch: 33, step: 293, loss: 0.34736523032188416, mean loss: 0.3463296335640728
Epoch: 33, step: 294, loss: 0.3118811845779419, mean loss: 0.3463289150947424
Epoch: 33, step: 295, loss: 0.32764682173728943, mean loss: 0.34632852546236237
Epoch: 33, step: 296, loss: 0.33210742473602295, mean loss: 0.34632822887430575
Epoch: 33, step: 297, loss: 0.31859928369522095, mean loss: 0.34632765058556375
Epoch: 33, step: 298, loss: 0.3331000506877899, mean loss: 0.34632737472896225
Epoch: 33, step: 299, loss: 0.36885204911231995, mean loss: 0.34632784446274567
Epoch: 33, step: 300, loss: 0.3137951195240021, mean loss: 0.34632716603334734
Epoch: 33, step: 301, loss: 0.3303641676902771, mean loss: 0.34632683315187046
Epoch: 33, step: 302, loss: 0.31235867738723755, mean loss: 0.3463261248178956
Epoch: 33, step: 303, loss: 0.3280726671218872, mean loss: 0.3463257441886168
Epoch: 33, step: 304, loss: 0.32797396183013916, mean loss: 0.34632536151700766
Epoch: 33, step: 305, loss: 0.3140827715396881, mean loss: 0.3463246892081128
Epoch: 33, step: 306, loss: 0.33658483624458313, mean loss: 0.3463244861210392
Epoch: 33, step: 307, loss: 0.31008481979370117, mean loss: 0.3463237304983051
Epoch: 33, step: 308, loss: 0.3158777952194214, mean loss: 0.3463230956922069
Epoch: 33, step: 309, loss: 0.3145348131656647, mean loss: 0.3463224329116196
Epoch: 33, step: 310, loss: 0.2893834114074707, mean loss: 0.34632124576691425
Epoch: 33, step: 311, loss: 0.34000343084335327, mean loss: 0.34632111404698007
Epoch: 33, step: 312, loss: 0.3327086567878723, mean loss: 0.34632083024718313
Epoch: 33, step: 313, loss: 0.3367183208465576, mean loss: 0.3463206300530998
Epoch: 33, step: 314, loss: 0.32158324122428894, mean loss: 0.34632011433627724
Epoch: 33, step: 315, loss: 0.3221393823623657, mean loss: 0.3463196102349602
Epoch: 33, step: 316, loss: 0.3528561592102051, mean loss: 0.34631974650106906
Epoch: 33, step: 317, loss: 0.3888629376888275, mean loss: 0.3463206333718464
Epoch: 33, step: 318, loss: 0.30556145310401917, mean loss: 0.34631978370891947
Epoch: 33, step: 319, loss: 0.3741782307624817, mean loss: 0.3463203644319882
Epoch: 33, step: 320, loss: 0.32230469584465027, mean loss: 0.3463198638239673
Epoch: 33, step: 321, loss: 0.3750689923763275, mean loss: 0.3463204630887472
Epoch: 33, step: 322, loss: 0.35352852940559387, mean loss: 0.34632061333504877
Epoch: 33, step: 323, loss: 0.36131614446640015, mean loss: 0.34632092589822894
Epoch: 33, step: 324, loss: 0.3401187062263489, mean loss: 0.3463207966233749
Epoch: 33, step: 325, loss: 0.3407876491546631, mean loss: 0.3463206812966112
Epoch: 33, step: 326, loss: 0.2984344959259033, mean loss: 0.34631968323109563
Epoch: 33, step: 327, loss: 0.330500990152359, mean loss: 0.34631935353761756
Epoch: 33, step: 328, loss: 0.3603626489639282, mean loss: 0.3463196462221266
Epoch: 33, step: 329, loss: 0.3135089576244354, mean loss: 0.34631896240968446
Epoch: 33, step: 330, loss: 0.3547379970550537, mean loss: 0.3463191378683812
Epoch: 33, step: 331, loss: 0.31040024757385254, mean loss: 0.34631838930864683
Epoch: 33, step: 332, loss: 0.30130869150161743, mean loss: 0.3463174513134857
Epoch: 33, step: 333, loss: 0.35422852635383606, mean loss: 0.34631761617563384
Epoch: 33, step: 334, loss: 0.39110809564590454, mean loss: 0.34631854956341535
Epoch: 33, step: 335, loss: 0.3118165135383606, mean loss: 0.3463178305912551
Epoch: 33, step: 336, loss: 0.3020113706588745, mean loss: 0.34631690732842546
Epoch: 33, step: 337, loss: 0.3790866732597351, mean loss: 0.3463175901741419
Epoch: 33, step: 338, loss: 0.35047465562820435, mean loss: 0.34631767679591374
Epoch: 33, step: 339, loss: 0.37153956294059753, mean loss: 0.3463182023394657
Epoch: 33, step: 340, loss: 0.3529042899608612, mean loss: 0.3463183395696372
Epoch: 33, step: 341, loss: 0.30064162611961365, mean loss: 0.3463173878524757
Epoch: 33, step: 342, loss: 0.3557998836040497, mean loss: 0.346317585425051
Epoch: 33, step: 343, loss: 0.2988342344760895, mean loss: 0.34631659610612964
Epoch: 33, step: 344, loss: 0.3105611205101013, mean loss: 0.3463158511538285
Epoch: 33, step: 345, loss: 0.32577982544898987, mean loss: 0.3463154233021325
Epoch: 33, step: 346, loss: 0.3469712734222412, mean loss: 0.34631543696596134
Epoch: 33, step: 347, loss: 0.31302428245544434, mean loss: 0.3463147434002424
Epoch: 33, step: 348, loss: 0.3555256724357605, mean loss: 0.3463149352905996
Epoch: 33, step: 349, loss: 0.36105969548225403, mean loss: 0.3463152424603049
Epoch: 33, step: 350, loss: 0.3544999957084656, mean loss: 0.34631541296534096
Epoch: 33, step: 351, loss: 0.3161841928958893, mean loss: 0.3463147852838963
Epoch: 33, step: 352, loss: 0.32876405119895935, mean loss: 0.3463144196816864
Epoch: 33, step: 353, loss: 0.342801958322525, mean loss: 0.346314346514554
Epoch: 33, step: 354, loss: 0.31439009308815, mean loss: 0.3463136815229189
Epoch: 33, step: 355, loss: 0.3318173289299011, mean loss: 0.3463133795658994
Epoch: 33, step: 356, loss: 0.3152049779891968, mean loss: 0.3463127315956943
Epoch: 33, step: 357, loss: 0.3521192669868469, mean loss: 0.3463128525399849
Epoch: 33, step: 358, loss: 0.36092954874038696, mean loss: 0.3463131569847205
Epoch: 33, step: 359, loss: 0.31342965364456177, mean loss: 0.3463124720829597
Epoch: 33, step: 360, loss: 0.37035050988197327, mean loss: 0.34631297273981926
Epoch: 33, step: 361, loss: 0.3032474219799042, mean loss: 0.3463120758024518
Epoch: 33, step: 362, loss: 0.2944132089614868, mean loss: 0.346310994913837
Epoch: 33, step: 363, loss: 0.3391197621822357, mean loss: 0.3463108451464109
Epoch: 33, step: 364, loss: 0.3496784567832947, mean loss: 0.3463109152801477
Epoch: 33, step: 365, loss: 0.3050543963909149, mean loss: 0.3463100560915332
Epoch: 33, step: 366, loss: 0.35859614610671997, mean loss: 0.34631031195046436
Epoch: 33, step: 367, loss: 0.3493189811706543, mean loss: 0.34631037460496705
Epoch: 33, step: 368, loss: 0.3773514926433563, mean loss: 0.3463110210121231
Epoch: 33, step: 369, loss: 0.35008251667022705, mean loss: 0.3463110995489532
Epoch: 33, step: 370, loss: 0.34358516335487366, mean loss: 0.34631104278581487
Epoch: 33, step: 371, loss: 0.33585020899772644, mean loss: 0.34631082496069016
Epoch: 33, step: 372, loss: 0.3685494661331177, mean loss: 0.3463112880245355
Epoch: 33, step: 373, loss: 0.38604995608329773, mean loss: 0.3463121154652563
Epoch: 33, step: 374, loss: 0.36523523926734924, mean loss: 0.3463125094753715
Epoch: 33, step: 375, loss: 0.3551790714263916, mean loss: 0.34631269408772164
Epoch: 33, step: 376, loss: 0.3351363241672516, mean loss: 0.3463124613872715
Epoch: 33, step: 377, loss: 0.35931187868118286, mean loss: 0.3463127320393076
Epoch: 33, step: 378, loss: 0.277241975069046, mean loss: 0.3463112939939417
Epoch: 33, step: 379, loss: 0.3395130932331085, mean loss: 0.34631115245911576
Epoch: 33, step: 380, loss: 0.3503468930721283, mean loss: 0.3463112364792813
Epoch: 33, step: 381, loss: 0.3442597985267639, mean loss: 0.34631119377124214
Epoch: 33, step: 382, loss: 0.3052201569080353, mean loss: 0.34631033833173214
Epoch: 33, step: 383, loss: 0.33894532918930054, mean loss: 0.3463101850090337
Epoch: 33, step: 384, loss: 0.31816112995147705, mean loss: 0.34630959902208497
Epoch: 33, step: 385, loss: 0.35582876205444336, mean loss: 0.3463097971811056
Epoch: 33, step: 386, loss: 0.35017213225364685, mean loss: 0.3463098775810946
Epoch: 33, step: 387, loss: 0.3299158215522766, mean loss: 0.3463095363226427
Epoch: 33, step: 388, loss: 0.36627867817878723, mean loss: 0.346309951991381
Epoch: 33, step: 389, loss: 0.34955620765686035, mean loss: 0.34631001956258256
Epoch: 33, step: 390, loss: 0.29156094789505005, mean loss: 0.34630887997780085
Epoch: 33, step: 391, loss: 0.3298395574092865, mean loss: 0.3463085371811443
Epoch: 33, step: 392, loss: 0.29647156596183777, mean loss: 0.3463074998833772
Epoch: 33, step: 393, loss: 0.32770732045173645, mean loss: 0.34630711275064124
Epoch: 33, step: 394, loss: 0.3570170998573303, mean loss: 0.34630733565711
Epoch: 33, step: 395, loss: 0.32132211327552795, mean loss: 0.3463068156516492
Epoch: 33, step: 396, loss: 0.2949865162372589, mean loss: 0.34630574756907906
Epoch: 33, step: 397, loss: 0.34915968775749207, mean loss: 0.3463058069642963
Epoch: 33, step: 398, loss: 0.3228053152561188, mean loss: 0.3463053178903601
Epoch: 33, step: 399, loss: 0.3445301353931427, mean loss: 0.346305280947413
Epoch: 33, step: 400, loss: 0.3144245445728302, mean loss: 0.34630461749796393
Epoch: 33, step: 401, loss: 0.3099474310874939, mean loss: 0.3463038609077444
Epoch: 33, step: 402, loss: 0.32728976011276245, mean loss: 0.34630346523402067
Epoch: 33, step: 403, loss: 0.3149643540382385, mean loss: 0.34630281309669764
Epoch: 33, step: 404, loss: 0.3351469039916992, mean loss: 0.3463025809575898
Epoch: 33, step: 405, loss: 0.2984577715396881, mean loss: 0.3463015853937
Epoch: 33, step: 406, loss: 0.34047964215278625, mean loss: 0.346301464252119
Epoch: 33, step: 407, loss: 0.37553468346595764, mean loss: 0.346302072517188
Epoch: 33, step: 408, loss: 0.34043195843696594, mean loss: 0.34630195037836276
Epoch: 33, step: 409, loss: 0.3638114929199219, mean loss: 0.34630231468992995
Epoch: 33, step: 410, loss: 0.2996264100074768, mean loss: 0.3463013435498704
Epoch: 33, step: 411, loss: 0.334303081035614, mean loss: 0.3463010939189093
Epoch: 33, step: 412, loss: 0.31316977739334106, mean loss: 0.34630040461657857
Epoch: 33, step: 413, loss: 0.35838568210601807, mean loss: 0.34630065604747545
Epoch: 33, step: 414, loss: 0.3421782851219177, mean loss: 0.3463005702844587
Epoch: 33, step: 415, loss: 0.34235724806785583, mean loss: 0.34630048824813064
Epoch: 33, step: 416, loss: 0.30148690938949585, mean loss: 0.3462995559720513
Epoch: 33, step: 417, loss: 0.34306129813194275, mean loss: 0.3462994886065876
Epoch: 33, step: 418, loss: 0.3350435197353363, mean loss: 0.34629925445358745
Epoch: 33, step: 419, loss: 0.3156868815422058, mean loss: 0.3462986176510223
Epoch: 33, step: 420, loss: 0.332692950963974, mean loss: 0.3462983346300607
Epoch: 33, step: 421, loss: 0.302062451839447, mean loss: 0.3462974144677528
Epoch: 33, step: 422, loss: 0.33135154843330383, mean loss: 0.34629710358130383
Epoch: 33, step: 423, loss: 0.3382825553417206, mean loss: 0.3462969368754997
Epoch: 33, step: 424, loss: 0.328523725271225, mean loss: 0.3462965671932898
Epoch: 33, step: 425, loss: 0.34037548303604126, mean loss: 0.346296444037498
Epoch: 33, step: 426, loss: 0.3270528316497803, mean loss: 0.3462960437876511
Epoch: 33, step: 427, loss: 0.35596850514411926, mean loss: 0.34629624496197214
Epoch: 33, step: 428, loss: 0.3044147491455078, mean loss: 0.3462953739007252
Epoch: 33, step: 429, loss: 0.3347502648830414, mean loss: 0.3462951337878135
Epoch: 33, step: 430, loss: 0.3135190010070801, mean loss: 0.34629445213041316
Epoch: 33, step: 431, loss: 0.3262959122657776, mean loss: 0.34629403622200566
Epoch: 33, step: 432, loss: 0.31602808833122253, mean loss: 0.3462934067960331
Epoch: 33, step: 433, loss: 0.34313681721687317, mean loss: 0.34629334115136357
Epoch: 33, step: 434, loss: 0.3469810485839844, mean loss: 0.3462933554526806
Epoch: 33, step: 435, loss: 0.3118806481361389, mean loss: 0.3462926398332471
Epoch: 33, step: 436, loss: 0.35321709513664246, mean loss: 0.34629278382574646
Epoch: 33, step: 437, loss: 0.33363470435142517, mean loss: 0.3462925206092883
Epoch: 33, step: 438, loss: 0.29793041944503784, mean loss: 0.34629151497203464
Epoch: 33, step: 439, loss: 0.3381693959236145, mean loss: 0.34629134608492146
Epoch: 33, step: 440, loss: 0.34731781482696533, mean loss: 0.34629136742833405
Epoch: 33, step: 441, loss: 0.37014856934547424, mean loss: 0.3462918634819357
Epoch: 33, step: 442, loss: 0.37896883487701416, mean loss: 0.3462925429074767
Epoch: 33, step: 443, loss: 0.3837427496910095, mean loss: 0.34629332156280734
Epoch: 33, step: 444, loss: 0.35797590017318726, mean loss: 0.346293564459009
Epoch: 33, step: 445, loss: 0.3268946707248688, mean loss: 0.3462931611388349
Epoch: 33, step: 446, loss: 0.3360788822174072, mean loss: 0.3462929487793488
Epoch: 33, step: 447, loss: 0.2986305356025696, mean loss: 0.34629195787678796
Epoch: 33, step: 448, loss: 0.31364578008651733, mean loss: 0.3462912791761832
Epoch: 33, step: 449, loss: 0.35023003816604614, mean loss: 0.34629136105965974
Epoch: 33, step: 450, loss: 0.3101215362548828, mean loss: 0.34629060913514764
Epoch: 33, step: 451, loss: 0.3780366778373718, mean loss: 0.3462912690816948
Epoch: 33, step: 452, loss: 0.31959736347198486, mean loss: 0.34629071417252505
Epoch: 33, step: 453, loss: 0.34700146317481995, mean loss: 0.3462907289471686
Epoch: 33, step: 454, loss: 0.30558061599731445, mean loss: 0.34628988270622757
Epoch: 33, step: 455, loss: 0.3372058570384979, mean loss: 0.3462896938805506
Epoch: 33, step: 456, loss: 0.35621559619903564, mean loss: 0.34628990020166134
Epoch: 33, step: 457, loss: 0.3269011080265045, mean loss: 0.3462894971920547
Epoch: 33, step: 458, loss: 0.31525975465774536, mean loss: 0.3462888522305587
Epoch: 33, step: 459, loss: 0.3225138783454895, mean loss: 0.34628835807164027
Epoch: 33, step: 460, loss: 0.3705255687236786, mean loss: 0.3462888618276034
Epoch: 33, step: 461, loss: 0.3315925896167755, mean loss: 0.34628855638070205
Epoch: 33, step: 462, loss: 0.30253708362579346, mean loss: 0.3462876470702426
Epoch: 33, step: 463, loss: 0.33870962262153625, mean loss: 0.34628748957534594
Epoch: 33, step: 464, loss: 0.3292787969112396, mean loss: 0.3462871360892046
Epoch: 33, step: 465, loss: 0.29798266291618347, mean loss: 0.34628613221387367
Epoch: 33, step: 466, loss: 0.3457430303096771, mean loss: 0.3462861209272321
Epoch: 33, step: 467, loss: 0.3730449974536896, mean loss: 0.34628667701361043
Epoch: 33, step: 468, loss: 0.3285096287727356, mean loss: 0.34628630758969486
Epoch: 33, step: 469, loss: 0.3382309675216675, mean loss: 0.3462861401955702
Epoch: 33, step: 470, loss: 0.31322842836380005, mean loss: 0.34628545325352933
Epoch: 33, step: 471, loss: 0.29988160729408264, mean loss: 0.3462844889977327
Epoch: 33, step: 472, loss: 0.30418598651885986, mean loss: 0.34628361422365517
Epoch: 33, step: 473, loss: 0.35998401045799255, mean loss: 0.3462838989012979
Epoch: 33, step: 474, loss: 0.34341663122177124, mean loss: 0.3462838393241857
Epoch: 33, step: 475, loss: 0.3462819755077362, mean loss: 0.34628383928545947
Epoch: 33, step: 476, loss: 0.3359391689300537, mean loss: 0.3462836243491351
Epoch: 33, step: 477, loss: 0.370022177696228, mean loss: 0.3462841175665327
Epoch: 33, step: 478, loss: 0.3117436170578003, mean loss: 0.34628339993131824
Epoch: 33, step: 479, loss: 0.3107384443283081, mean loss: 0.3462826614422548
Epoch: 33, step: 480, loss: 0.32431507110595703, mean loss: 0.3462822050487132
Epoch: 33, step: 481, loss: 0.2989341914653778, mean loss: 0.34628122137784473
Epoch: 33, step: 482, loss: 0.35431283712387085, mean loss: 0.34628138823389015
Epoch: 33, step: 483, loss: 0.31320643424987793, mean loss: 0.34628070111917386
Epoch: 33, step: 484, loss: 0.3837183713912964, mean loss: 0.346281478850862
Epoch: 33, step: 485, loss: 0.32612067461013794, mean loss: 0.3462810600381934
Epoch: 33, step: 486, loss: 0.337526798248291, mean loss: 0.3462808781843579
Epoch: 33, step: 487, loss: 0.3427043855190277, mean loss: 0.3462808038907836
Epoch: 33, step: 488, loss: 0.40479525923728943, mean loss: 0.34628201937146214
Epoch: 33, step: 489, loss: 0.32367807626724243, mean loss: 0.3462815498449966
Epoch: 33, step: 490, loss: 0.33339157700538635, mean loss: 0.3462812821015481
Epoch: 33, step: 491, loss: 0.33090290427207947, mean loss: 0.34628096267695047
Epoch: 33, step: 492, loss: 0.32625293731689453, mean loss: 0.3462805466830703
Epoch: 33, step: 493, loss: 0.3545784056186676, mean loss: 0.3462807190309068
Epoch: 33, step: 494, loss: 0.32576531171798706, mean loss: 0.34628029293151713
Epoch: 33, step: 495, loss: 0.3522336483001709, mean loss: 0.3462804165785091
Epoch: 33, step: 496, loss: 0.3424570858478546, mean loss: 0.34628033717227574
Epoch: 33, step: 497, loss: 0.32723474502563477, mean loss: 0.34627994162519066
Epoch: 33, step: 498, loss: 0.31733065843582153, mean loss: 0.34627934040645814
Epoch: 33, step: 499, loss: 0.3104111850261688, mean loss: 0.3462785955120533
Epoch: 33, step: 500, loss: 0.37945860624313354, mean loss: 0.34627928456591767
Epoch: 33, step: 501, loss: 0.3425067365169525, mean loss: 0.3462792062225184
Epoch: 33, step: 502, loss: 0.31173455715179443, mean loss: 0.3462784888588164
Epoch: 33, step: 503, loss: 0.34192776679992676, mean loss: 0.3462783985123994
Epoch: 33, step: 504, loss: 0.3305699825286865, mean loss: 0.3462780723206519
Epoch: 33, step: 505, loss: 0.3071644604206085, mean loss: 0.3462772601272074
Epoch: 33, step: 506, loss: 0.31724312901496887, mean loss: 0.3462766572465182
Epoch: 33, step: 507, loss: 0.3206631541252136, mean loss: 0.34627612540467595
Epoch: 33, step: 508, loss: 0.3413033187389374, mean loss: 0.34627602215086756
Epoch: 33, step: 509, loss: 0.338899701833725, mean loss: 0.3462758689944306
Epoch: 33, step: 510, loss: 0.3003012537956238, mean loss: 0.34627491443148395
Epoch: 33, step: 511, loss: 0.3781012296676636, mean loss: 0.3462755752220171
Epoch: 33, step: 512, loss: 0.35010507702827454, mean loss: 0.34627565472999605
Epoch: 33, step: 513, loss: 0.3465239107608795, mean loss: 0.34627565988417186
Epoch: 33, step: 514, loss: 0.3224991261959076, mean loss: 0.3462751662571308
Epoch: 33, step: 515, loss: 0.33131933212280273, mean loss: 0.34627485576397904
Epoch: 33, step: 516, loss: 0.37519749999046326, mean loss: 0.34627545620501426
Epoch: 33, step: 517, loss: 0.3478318452835083, mean loss: 0.3462754885153543
Epoch: 33, step: 518, loss: 0.33354905247688293, mean loss: 0.34627522432245733
Epoch: 33, step: 519, loss: 0.3142824172973633, mean loss: 0.34627456018546854
Epoch: 33, step: 520, loss: 0.3247699737548828, mean loss: 0.34627411378216316
Epoch: 33, step: 521, loss: 0.3368077874183655, mean loss: 0.34627391727935325
Epoch: 33, step: 522, loss: 0.30528220534324646, mean loss: 0.3462730663875642
Epoch: 33, step: 523, loss: 0.31914496421813965, mean loss: 0.34627250328348397
Epoch: 33, step: 524, loss: 0.34043827652931213, mean loss: 0.3462723821836489
Epoch: 33, step: 525, loss: 0.3277111053466797, mean loss: 0.34627199691907096
Epoch: 33, step: 526, loss: 0.3065071105957031, mean loss: 0.3462711715618339
Epoch: 33, step: 527, loss: 0.35408443212509155, mean loss: 0.34627133372996516
Epoch: 33, step: 528, loss: 0.3098974823951721, mean loss: 0.3462705787881554
Epoch: 33, step: 529, loss: 0.2994426488876343, mean loss: 0.3462696068913911
Epoch: 33, step: 530, loss: 0.3440733551979065, mean loss: 0.3462695613099268
Epoch: 33, step: 531, loss: 0.3095090389251709, mean loss: 0.34626879839023594
Epoch: 33, step: 532, loss: 0.3501546382904053, mean loss: 0.3462688790344177
Epoch: 33, step: 533, loss: 0.3726752698421478, mean loss: 0.3462694270440223
Epoch: 33, step: 534, loss: 0.36403217911720276, mean loss: 0.3462697956652702
Epoch: 33, step: 535, loss: 0.316222608089447, mean loss: 0.34626917212439745
Epoch: 33, step: 536, loss: 0.35311460494995117, mean loss: 0.3462693141782443
Epoch: 33, step: 537, loss: 0.33491477370262146, mean loss: 0.3462690785579813
Epoch: 33, step: 538, loss: 0.315918505191803, mean loss: 0.3462684487604389
Epoch: 33, step: 539, loss: 0.3354564607143402, mean loss: 0.3462682244080973
Epoch: 33, step: 540, loss: 0.3977136015892029, mean loss: 0.34626929189460326
Epoch: 33, step: 541, loss: 0.31692418456077576, mean loss: 0.3462686829991529
Epoch: 33, step: 542, loss: 0.3437996804714203, mean loss: 0.34626863176971984
Epoch: 33, step: 543, loss: 0.3672269284725189, mean loss: 0.3462690666252411
Epoch: 33, step: 544, loss: 0.3109374940395355, mean loss: 0.3462683335594365
Epoch: 33, step: 545, loss: 0.3245604336261749, mean loss: 0.3462678831693802
Epoch: 33, step: 546, loss: 0.31747540831565857, mean loss: 0.3462672858027366
Epoch: 33, step: 547, loss: 0.3311404585838318, mean loss: 0.346266971968147
Epoch: 33, step: 548, loss: 0.38625380396842957, mean loss: 0.3462678015532593
Epoch: 33, step: 549, loss: 0.3516501486301422, mean loss: 0.3462679132155778
Epoch: 33, step: 550, loss: 0.35058778524398804, mean loss: 0.3462680028339009
Epoch: 33, step: 551, loss: 0.3005811870098114, mean loss: 0.34626705505330546
Epoch: 33, step: 552, loss: 0.3292735517024994, mean loss: 0.34626670252756436
Epoch: 33, step: 553, loss: 0.37442031502723694, mean loss: 0.3462672865547083
Epoch: 33, step: 554, loss: 0.3198949694633484, mean loss: 0.3462667394906493
Epoch: 33, step: 555, loss: 0.3016972243785858, mean loss: 0.3462658149653607
Epoch: 33, step: 556, loss: 0.3103266656398773, mean loss: 0.3462650694790547
Epoch: 33, step: 557, loss: 0.3213600814342499, mean loss: 0.34626455288523506
Epoch: 33, step: 558, loss: 0.30465343594551086, mean loss: 0.34626368978102773
Epoch: 33, step: 559, loss: 0.3350244164466858, mean loss: 0.34626345665912167
Epoch: 33, step: 560, loss: 0.3339698016643524, mean loss: 0.34626320167281105
Epoch: 33, step: 561, loss: 0.3538651466369629, mean loss: 0.34626335934371505
Epoch: 33, step: 562, loss: 0.35747671127319336, mean loss: 0.34626359191349476
Epoch: 33, step: 563, loss: 0.32270678877830505, mean loss: 0.34626310334531957
Epoch: 33, step: 564, loss: 0.36073997616767883, mean loss: 0.3462634035894829
Epoch: 33, step: 565, loss: 0.3690005838871002, mean loss: 0.3462638751391178
Epoch: 33, step: 566, loss: 0.32952141761779785, mean loss: 0.34626352792209714
Epoch: 33, step: 567, loss: 0.3220466077327728, mean loss: 0.346263025704756
Epoch: 33, step: 568, loss: 0.3058074712753296, mean loss: 0.3462621867434232
Epoch: 33, step: 569, loss: 0.32671400904655457, mean loss: 0.34626178136459823
Epoch: 33, step: 570, loss: 0.2969752252101898, mean loss: 0.346260759309642
Epoch: 33, step: 571, loss: 0.3059893250465393, mean loss: 0.3462599242185201
Epoch: 33, step: 572, loss: 0.3502664864063263, mean loss: 0.3462600072991253
Epoch: 33, step: 573, loss: 0.3919902443885803, mean loss: 0.3462609555477275
Epoch: 33, step: 574, loss: 0.3920634984970093, mean loss: 0.34626190527594924
Epoch: 33, step: 575, loss: 0.28389379382133484, mean loss: 0.34626061208296066
Epoch: 33, step: 576, loss: 0.3477098047733307, mean loss: 0.3462606421311203
Epoch: 33, step: 577, loss: 0.3851524889469147, mean loss: 0.3462614485140109
Epoch: 33, step: 578, loss: 0.36811894178390503, mean loss: 0.3462619016975085
Epoch: 33, step: 579, loss: 0.35821694135665894, mean loss: 0.34626214956281903
Epoch: 33, step: 580, loss: 0.34435248374938965, mean loss: 0.34626210997030327
Epoch: 33, step: 581, loss: 0.3688107430934906, mean loss: 0.34626257745450784
Epoch: 33, step: 582, loss: 0.3364008665084839, mean loss: 0.3462623730031562
Epoch: 33, step: 583, loss: 0.3801380395889282, mean loss: 0.3462630752932836
Epoch: 33, step: 584, loss: 0.3150485157966614, mean loss: 0.3462624281850576
Epoch: 33, step: 585, loss: 0.3165244162082672, mean loss: 0.3462618116998804
Epoch: 33, step: 586, loss: 0.34811803698539734, mean loss: 0.3462618501796434
Epoch: 33, step: 587, loss: 0.32943233847618103, mean loss: 0.3462615013091686
Epoch: 33, step: 588, loss: 0.3296719193458557, mean loss: 0.3462611574194905
Epoch: 33, step: 589, loss: 0.3532143831253052, mean loss: 0.3462613015516928
Epoch: 33, step: 590, loss: 0.34789586067199707, mean loss: 0.34626133543348125
Epoch: 33, step: 591, loss: 0.3233140707015991, mean loss: 0.34626085978335414
Epoch: 33, step: 592, loss: 0.30607134103775024, mean loss: 0.3462600267536361
Epoch: 33, step: 593, loss: 0.36232852935791016, mean loss: 0.3462603598072075
Epoch: 33, step: 594, loss: 0.338760107755661, mean loss: 0.3462602043519035
Epoch: 33, step: 595, loss: 0.34691691398620605, mean loss: 0.3462602179630301
Epoch: 33, step: 596, loss: 0.3184432089328766, mean loss: 0.3462596414327594
Epoch: 33, step: 597, loss: 0.30771446228027344, mean loss: 0.34625884256894274
Epoch: 33, step: 598, loss: 0.30084219574928284, mean loss: 0.34625790131079637
Epoch: 33, step: 599, loss: 0.36474043130874634, mean loss: 0.34625828435253553
Epoch: 33, step: 600, loss: 0.3257128894329071, mean loss: 0.3462578585677155
Epoch: 33, step: 601, loss: 0.32273855805397034, mean loss: 0.3462573711614795
Epoch: 33, step: 602, loss: 0.31715548038482666, mean loss: 0.34625676807598
Epoch: 33, step: 603, loss: 0.34870049357414246, mean loss: 0.3462568187168433
Epoch: 33, step: 604, loss: 0.35052260756492615, mean loss: 0.34625690711415036
Epoch: 33, step: 605, loss: 0.32750028371810913, mean loss: 0.346256518440285
Epoch: 33, step: 606, loss: 0.315868616104126, mean loss: 0.34625588875665425
Epoch: 33, step: 607, loss: 0.3160809576511383, mean loss: 0.34625526349906816
Epoch: 33, step: 608, loss: 0.31117555499076843, mean loss: 0.3462545366241897
Epoch: 33, step: 609, loss: 0.32429569959640503, mean loss: 0.3462540816319178
Epoch: 33, step: 610, loss: 0.3365423381328583, mean loss: 0.346253880406476
Epoch: 33, step: 611, loss: 0.30395233631134033, mean loss: 0.3462530039448463
Epoch: 33, step: 612, loss: 0.352454274892807, mean loss: 0.34625313242865335
Epoch: 33, step: 613, loss: 0.32070866227149963, mean loss: 0.3462526031850832
Epoch: 33, step: 614, loss: 0.31654515862464905, mean loss: 0.34625198770360394
Epoch: 33, step: 615, loss: 0.31250742077827454, mean loss: 0.34625128859514853
Epoch: 33, step: 616, loss: 0.30164748430252075, mean loss: 0.3462503645278529
Epoch: 33, step: 617, loss: 0.3128407299518585, mean loss: 0.34624967238709103
Epoch: 33, step: 618, loss: 0.3340069055557251, mean loss: 0.3462494187613772
Epoch: 33, step: 619, loss: 0.31709522008895874, mean loss: 0.34624881480465963
Epoch: 33, step: 620, loss: 0.3979719877243042, mean loss: 0.3462498862767645
Epoch: 33, step: 621, loss: 0.32249772548675537, mean loss: 0.34624939424874135
Epoch: 33, step: 622, loss: 0.3230447769165039, mean loss: 0.34624891357308457
Epoch: 33, step: 623, loss: 0.34115171432495117, mean loss: 0.3462488079885447
Epoch: 33, step: 624, loss: 0.30876460671424866, mean loss: 0.3462480315483915
Epoch: 33, step: 625, loss: 0.3731050193309784, mean loss: 0.3462485878470738
Epoch: 33, step: 626, loss: 0.37885206937789917, mean loss: 0.3462492631610101
Epoch: 33, step: 627, loss: 0.34452423453330994, mean loss: 0.3462492274313368
Epoch: 33, step: 628, loss: 0.3450202941894531, mean loss: 0.34624920197757153
Epoch: 33, step: 629, loss: 0.34494200348854065, mean loss: 0.34624917490333085
Epoch: 33, step: 630, loss: 0.3322990834712982, mean loss: 0.3462488859798706
Epoch: 33, step: 631, loss: 0.3304007947444916, mean loss: 0.3462485577533103
Epoch: 33, step: 632, loss: 0.35532549023628235, mean loss: 0.3462487457399
Epoch: 33, step: 633, loss: 0.33000314235687256, mean loss: 0.3462484092944835
Epoch: 33, step: 634, loss: 0.36766088008880615, mean loss: 0.34624885273621303
Epoch: 33, step: 635, loss: 0.35706356167793274, mean loss: 0.34624907669887334
Epoch: 33, step: 636, loss: 0.2881021201610565, mean loss: 0.34624787255390166
Epoch: 33, step: 637, loss: 0.3450162410736084, mean loss: 0.3462478470490046
Epoch: 33, step: 638, loss: 0.39228084683418274, mean loss: 0.346248800290805
Epoch: 33, step: 639, loss: 0.36453595757484436, mean loss: 0.346249178969619
Epoch: 33, step: 640, loss: 0.3488644063472748, mean loss: 0.3462492331229617
Epoch: 33, step: 641, loss: 0.38881275057792664, mean loss: 0.34625011446469056
Epoch: 33, step: 642, loss: 0.3430817723274231, mean loss: 0.34625004886075356
Epoch: 33, step: 643, loss: 0.3432883024215698, mean loss: 0.3462499875358728
Epoch: 33, step: 644, loss: 0.32648375630378723, mean loss: 0.3462495782717108
Epoch: 33, step: 645, loss: 0.31287455558776855, mean loss: 0.34624888724883857
Epoch: 33, step: 646, loss: 0.3761802017688751, mean loss: 0.34624950695762174
Epoch: 33, step: 647, loss: 0.2849782407283783, mean loss: 0.34624823840138513
Epoch: 33, step: 648, loss: 0.3299279510974884, mean loss: 0.34624790051423365
Epoch: 33, step: 649, loss: 0.32669299840927124, mean loss: 0.3462474956675999
Epoch: 33, step: 650, loss: 0.33180683851242065, mean loss: 0.34624719670775983
Epoch: 33, step: 651, loss: 0.32092955708503723, mean loss: 0.34624667257643277
Epoch: 33, step: 652, loss: 0.3210026025772095, mean loss: 0.3462461499789791
Epoch: 33, step: 653, loss: 0.3020061254501343, mean loss: 0.34624523415020986
Epoch: 33, step: 654, loss: 0.3245157301425934, mean loss: 0.34624478432919
Epoch: 33, step: 655, loss: 0.3791005313396454, mean loss: 0.3462454644597483
Epoch: 33, step: 656, loss: 0.31710419058799744, mean loss: 0.34624486123314724
Epoch: 33, step: 657, loss: 0.3439495265483856, mean loss: 0.34624481372052696
Epoch: 33, step: 658, loss: 0.3227255940437317, mean loss: 0.3462443268910331
Epoch: 33, step: 659, loss: 0.322268545627594, mean loss: 0.3462438306213431
Epoch: 33, step: 660, loss: 0.3730469048023224, mean loss: 0.3462443854010956
Epoch: 33, step: 661, loss: 0.3737855553627014, mean loss: 0.34624495544642325
Epoch: 33, step: 662, loss: 0.307132363319397, mean loss: 0.346244145913315
Epoch: 33, step: 663, loss: 0.2913127839565277, mean loss: 0.3462430089946554
Epoch: 33, step: 664, loss: 0.3215166926383972, mean loss: 0.34624249724275946
Epoch: 33, step: 665, loss: 0.31450435519218445, mean loss: 0.3462418403831616
Epoch: 33, step: 666, loss: 0.3589962124824524, mean loss: 0.3462421043450006
Epoch: 33, step: 667, loss: 0.3022835850715637, mean loss: 0.34624119460743286
Epoch: 33, step: 668, loss: 0.3582035005092621, mean loss: 0.3462414421665873
Epoch: 33, step: 669, loss: 0.31950321793556213, mean loss: 0.34624088883220067
Epoch: 33, step: 670, loss: 0.3276466727256775, mean loss: 0.34624050404201573
Epoch: 33, step: 671, loss: 0.32597482204437256, mean loss: 0.3462400846710614
Epoch: 33, step: 672, loss: 0.3172209560871124, mean loss: 0.3462394841717632
Epoch: 33, step: 673, loss: 0.30736035108566284, mean loss: 0.3462386796538415
Epoch: 33, step: 674, loss: 0.31184548139572144, mean loss: 0.34623796797717504
Epoch: 33, step: 675, loss: 0.3438553810119629, mean loss: 0.3462379186768323
Epoch: 33, step: 676, loss: 0.3777143359184265, mean loss: 0.34623856997144303
Epoch: 33, step: 677, loss: 0.3453112840652466, mean loss: 0.3462385507848942
Epoch: 33, step: 678, loss: 0.34143686294555664, mean loss: 0.34623845143483234
Epoch: 33, step: 679, loss: 0.36172929406166077, mean loss: 0.34623877194386626
Epoch: 33, step: 680, loss: 0.3019242584705353, mean loss: 0.3462378550855402
Epoch: 33, step: 681, loss: 0.3293689489364624, mean loss: 0.34623750607850273
Epoch: 33, step: 682, loss: 0.29081466794013977, mean loss: 0.3462363594386323
Epoch: 33, step: 683, loss: 0.39861783385276794, mean loss: 0.34623744313348526
Epoch: 33, step: 684, loss: 0.3390078544616699, mean loss: 0.346237293567135
Epoch: 33, step: 685, loss: 0.3309037983417511, mean loss: 0.3462369763530338
Epoch: 33, step: 686, loss: 0.3270304799079895, mean loss: 0.3462365790238287
Epoch: 33, step: 687, loss: 0.33243730664253235, mean loss: 0.3462362935610157
Epoch: 33, step: 688, loss: 0.35213375091552734, mean loss: 0.34623641555802354
Epoch: 33, step: 689, loss: 0.3259235918521881, mean loss: 0.3462359953680499
Epoch: 33, step: 690, loss: 0.34068939089775085, mean loss: 0.3462358806336629
Epoch: 33, step: 691, loss: 0.3378574550151825, mean loss: 0.34623570732517334
Epoch: 33, step: 692, loss: 0.3217903971672058, mean loss: 0.34623520168218735
Epoch: 33, step: 693, loss: 0.3933252692222595, mean loss: 0.34623617570418586
Epoch: 33, step: 694, loss: 0.34960439801216125, mean loss: 0.34623624537184483
Epoch: 33, step: 695, loss: 0.3214191198348999, mean loss: 0.3462357320698357
Epoch: 33, step: 696, loss: 0.3105069398880005, mean loss: 0.3462349930929762
Epoch: 33, step: 697, loss: 0.344685435295105, mean loss: 0.346234961044211
Epoch: 33, step: 698, loss: 0.3164934813976288, mean loss: 0.3462343459280883
Epoch: 33, step: 699, loss: 0.3408796191215515, mean loss: 0.3462342351834075
Epoch: 33, step: 700, loss: 0.34052956104278564, mean loss: 0.3462341172036722
Epoch: 33, step: 701, loss: 0.32539600133895874, mean loss: 0.34623368625450845
Epoch: 33, step: 702, loss: 0.3486454486846924, mean loss: 0.3462337361306832
Epoch: 33, step: 703, loss: 0.3165770173072815, mean loss: 0.3462331228310136
Epoch: 33, step: 704, loss: 0.3079887330532074, mean loss: 0.34623233195503333
Epoch: 33, step: 705, loss: 0.33504945039749146, mean loss: 0.3462321007030883
Epoch: 33, step: 706, loss: 0.33976081013679504, mean loss: 0.34623196688537977
Epoch: 33, step: 707, loss: 0.31867003440856934, mean loss: 0.3462313969529464
Epoch: 33, step: 708, loss: 0.33690202236175537, mean loss: 0.3462312040418281
Epoch: 33, step: 709, loss: 0.3516838252544403, mean loss: 0.3462313167878108
Epoch: 33, step: 710, loss: 0.37471383810043335, mean loss: 0.3462319057198727
Epoch: 33, step: 711, loss: 0.3328545391559601, mean loss: 0.3462316291222678
Epoch: 33, step: 712, loss: 0.40455126762390137, mean loss: 0.3462328349454561
Epoch: 33, step: 713, loss: 0.3344632089138031, mean loss: 0.3462325916004197
Epoch: 33, step: 714, loss: 0.3691789209842682, mean loss: 0.3462330660216032
Epoch: 33, step: 715, loss: 0.30681851506233215, mean loss: 0.3462322511326072
Epoch: 33, step: 716, loss: 0.31075727939605713, mean loss: 0.3462315177088908
Epoch: 33, step: 717, loss: 0.34426841139793396, mean loss: 0.34623147712368696
Epoch: 33, step: 718, loss: 0.3272494673728943, mean loss: 0.3462310846982719
Epoch: 33, step: 719, loss: 0.3300012946128845, mean loss: 0.3462307491779278
Epoch: 33, step: 720, loss: 0.3493850827217102, mean loss: 0.3462308143864851
Epoch: 33, step: 721, loss: 0.3037799000740051, mean loss: 0.34622993683006403
Epoch: 33, step: 722, loss: 0.32599639892578125, mean loss: 0.3462295185657146
Epoch: 33, step: 723, loss: 0.32440879940986633, mean loss: 0.34622906750074117
Epoch: 33, step: 724, loss: 0.3460772931575775, mean loss: 0.34622906436341677
Epoch: 33, step: 725, loss: 0.33980172872543335, mean loss: 0.34622893150683653
Epoch: 33, step: 726, loss: 0.3566586673259735, mean loss: 0.3462291470907845
Epoch: 33, step: 727, loss: 0.31410905718803406, mean loss: 0.34622848317821936
Epoch: 33, step: 728, loss: 0.32722628116607666, mean loss: 0.3462280904165565
Epoch: 33, step: 729, loss: 0.33666810393333435, mean loss: 0.3462278928226893
Epoch: 33, step: 730, loss: 0.3170890510082245, mean loss: 0.3462272905689676
Epoch: 33, step: 731, loss: 0.4016353487968445, mean loss: 0.34622843574212875
Epoch: 33, step: 732, loss: 0.3256806433200836, mean loss: 0.34622801106934953
Epoch: 33, step: 733, loss: 0.3476448953151703, mean loss: 0.3462280403522877
Epoch: 33, step: 734, loss: 0.37050506472587585, mean loss: 0.34622854207846154
Epoch: 33, step: 735, loss: 0.31187519431114197, mean loss: 0.34622783212252684
Epoch: 33, step: 736, loss: 0.31253060698509216, mean loss: 0.3462271357405983
Epoch: 33, step: 737, loss: 0.3582575023174286, mean loss: 0.3462273843532575
Epoch: 33, step: 738, loss: 0.3098450303077698, mean loss: 0.3462266325119224
Epoch: 33, step: 739, loss: 0.34378308057785034, mean loss: 0.34622658201696593
Epoch: 33, step: 740, loss: 0.3329167366027832, mean loss: 0.3462263069803818
Epoch: 33, step: 741, loss: 0.3630308210849762, mean loss: 0.3462266542241332
Epoch: 33, step: 742, loss: 0.32157573103904724, mean loss: 0.34622614485491765
Epoch: 33, step: 743, loss: 0.4117019772529602, mean loss: 0.34622749777318357
Epoch: 33, step: 744, loss: 0.3246506154537201, mean loss: 0.3462270519421957
Epoch: 33, step: 745, loss: 0.33076024055480957, mean loss: 0.3462267323667714
Epoch: 33, step: 746, loss: 0.3144489526748657, mean loss: 0.3462260757875096
Epoch: 33, step: 747, loss: 0.299206018447876, mean loss: 0.34622510429872155
Epoch: 33, step: 748, loss: 0.35072627663612366, mean loss: 0.3462251972962286
Epoch: 33, step: 749, loss: 0.3324591815471649, mean loss: 0.3462249128861681
Epoch: 33, step: 750, loss: 0.33929604291915894, mean loss: 0.34622476973657057
Epoch: 33, step: 751, loss: 0.33014461398124695, mean loss: 0.3462244375294027
Epoch: 33, step: 752, loss: 0.32732632756233215, mean loss: 0.3462240471129175
Epoch: 33, step: 753, loss: 0.32623475790023804, mean loss: 0.3462236341622665
Epoch: 33, step: 754, loss: 0.31439346075057983, mean loss: 0.34622297660915613
Epoch: 33, step: 755, loss: 0.30690011382102966, mean loss: 0.3462221642875814
Epoch: 33, step: 756, loss: 0.3085821866989136, mean loss: 0.3462213867466781
Epoch: 33, step: 757, loss: 0.31661495566368103, mean loss: 0.34622077516991534
Epoch: 33, step: 758, loss: 0.3302805721759796, mean loss: 0.34622044590171197
Epoch: 33, step: 759, loss: 0.31762537360191345, mean loss: 0.3462198552408779
Epoch: 33, step: 760, loss: 0.3119128942489624, mean loss: 0.3462191466097046
Epoch: 33, step: 761, loss: 0.30339929461479187, mean loss: 0.34621826215785195
Epoch: 33, step: 762, loss: 0.3513062000274658, mean loss: 0.34621836724796595
Epoch: 33, step: 763, loss: 0.2996892035007477, mean loss: 0.34621740621930297
Epoch: 33, step: 764, loss: 0.3102801442146301, mean loss: 0.34621666397459544
Epoch: 33, step: 765, loss: 0.33185335993766785, mean loss: 0.34621636732244054
Epoch: 33, step: 766, loss: 0.36718815565109253, mean loss: 0.34621680045382136
Epoch: 33, step: 767, loss: 0.31408029794692993, mean loss: 0.3462161367507543
Epoch: 33, step: 768, loss: 0.40847083926200867, mean loss: 0.34621742244709497
Epoch: 33, step: 769, loss: 0.3537982404232025, mean loss: 0.34621757900440314
Epoch: 33, step: 770, loss: 0.33130311965942383, mean loss: 0.34621727100078203
Epoch: 33, step: 771, loss: 0.35340213775634766, mean loss: 0.34621741937486833
Epoch: 33, step: 772, loss: 0.3275308907032013, mean loss: 0.3462170334888865
Epoch: 33, step: 773, loss: 0.3187487721443176, mean loss: 0.34621646626753133
Epoch: 33, step: 774, loss: 0.3416089117527008, mean loss: 0.34621637112320036
Epoch: 33, step: 775, loss: 0.36618438363075256, mean loss: 0.34621678344690787
Epoch: 33, step: 776, loss: 0.3248308002948761, mean loss: 0.3462163418523436
Epoch: 33, step: 777, loss: 0.3261124789714813, mean loss: 0.3462159267405765
Epoch: 33, step: 778, loss: 0.3110268712043762, mean loss: 0.34621520015934676
Epoch: 33, step: 779, loss: 0.30404460430145264, mean loss: 0.346214329441725
Epoch: 33, step: 780, loss: 0.36503490805625916, mean loss: 0.34621471803170734
Epoch: 33, step: 781, loss: 0.33522897958755493, mean loss: 0.34621449121297576
Epoch: 33, step: 782, loss: 0.36446815729141235, mean loss: 0.3462148680823074
Epoch: 33, step: 783, loss: 0.3361680507659912, mean loss: 0.34621466065772
Epoch: 33, step: 784, loss: 0.30983221530914307, mean loss: 0.34621390952851405
Epoch: 33, step: 785, loss: 0.3257755935192108, mean loss: 0.3462134875805391
Epoch: 33, step: 786, loss: 0.41653233766555786, mean loss: 0.346214939279585
Epoch: 33, step: 787, loss: 0.336261510848999, mean loss: 0.3462147338000551
Epoch: 33, step: 788, loss: 0.3012758493423462, mean loss: 0.3462138060965713
Epoch: 33, step: 789, loss: 0.29544636607170105, mean loss: 0.34621275809194674
Epoch: 33, step: 790, loss: 0.31990715861320496, mean loss: 0.3462122150702619
Epoch: 33, step: 791, loss: 0.3203587532043457, mean loss: 0.3462116813929878
Epoch: 33, step: 792, loss: 0.33965468406677246, mean loss: 0.3462115460436777
Epoch: 33, step: 793, loss: 0.3414183557033539, mean loss: 0.3462114471048522
Epoch: 33, step: 794, loss: 0.34237849712371826, mean loss: 0.3462113679884986
Epoch: 33, step: 795, loss: 0.2925328314304352, mean loss: 0.3462102600266311
Epoch: 33, step: 796, loss: 0.314313143491745, mean loss: 0.3462096016618241
Epoch: 33, step: 797, loss: 0.34612801671028137, mean loss: 0.34620959997792417
Epoch: 33, step: 798, loss: 0.3324093222618103, mean loss: 0.34620931514834963
Epoch: 33, step: 799, loss: 0.28281325101852417, mean loss: 0.34620800671806545
Epoch: 33, step: 800, loss: 0.33305200934410095, mean loss: 0.3462077351972644
Epoch: 33, step: 801, loss: 0.33684584498405457, mean loss: 0.34620754198534764
Epoch: 33, step: 802, loss: 0.30852699279785156, mean loss: 0.34620676434528597
Epoch: 33, step: 803, loss: 0.313581258058548, mean loss: 0.3462060910436043
Epoch: 33, step: 804, loss: 0.3262900114059448, mean loss: 0.34620568003839064
Epoch: 33, step: 805, loss: 0.30900517106056213, mean loss: 0.34620491235278705
Epoch: 33, step: 806, loss: 0.38538020849227905, mean loss: 0.34620572077425965
Epoch: 33, step: 807, loss: 0.33553409576416016, mean loss: 0.34620550055913357
Epoch: 33, step: 808, loss: 0.3092215061187744, mean loss: 0.34620473738886387
Epoch: 33, step: 809, loss: 0.3703005313873291, mean loss: 0.3462052345989253
Epoch: 33, step: 810, loss: 0.3381570279598236, mean loss: 0.3462050685298285
Epoch: 33, step: 811, loss: 0.3366951048374176, mean loss: 0.3462048723024496
Epoch: 33, step: 812, loss: 0.2986437976360321, mean loss: 0.3462038909535449
Epoch: 33, step: 813, loss: 0.34331291913986206, mean loss: 0.3462038313040625
Epoch: 33, step: 814, loss: 0.3242904245853424, mean loss: 0.34620337917360844
Epoch: 33, step: 815, loss: 0.3539453446865082, mean loss: 0.34620353890715455
Epoch: 33, step: 816, loss: 0.33477553725242615, mean loss: 0.34620330312755
Epoch: 33, step: 817, loss: 0.29927629232406616, mean loss: 0.3462023349614513
Epoch: 33, step: 818, loss: 0.3525128662586212, mean loss: 0.34620246515334535
Epoch: 33, step: 819, loss: 0.3678745627403259, mean loss: 0.34620291225884103
Epoch: 33, step: 820, loss: 0.3730943202972412, mean loss: 0.34620346702970395
Epoch: 33, step: 821, loss: 0.30679237842559814, mean loss: 0.3462026539940848
Epoch: 33, step: 822, loss: 0.3797168731689453, mean loss: 0.34620334536529
Epoch: 33, step: 823, loss: 0.32625073194503784, mean loss: 0.34620293376752165
Epoch: 33, step: 824, loss: 0.3962038457393646, mean loss: 0.3462039652032947
Epoch: 33, step: 825, loss: 0.32226496934890747, mean loss: 0.34620347139175434
Epoch: 33, step: 826, loss: 0.4079824984073639, mean loss: 0.34620474573790455
Epoch: 33, step: 827, loss: 0.33600926399230957, mean loss: 0.34620453543506324
Epoch: 33, step: 828, loss: 0.34984090924263, mean loss: 0.34620461044122663
Epoch: 33, step: 829, loss: 0.32494431734085083, mean loss: 0.34620417192191844
Epoch: 33, step: 830, loss: 0.29530346393585205, mean loss: 0.34620312205479004
Epoch: 33, step: 831, loss: 0.301962286233902, mean loss: 0.34620220957158276
Epoch: 33, step: 832, loss: 0.34295451641082764, mean loss: 0.34620214258812065
Epoch: 33, step: 833, loss: 0.3502298593521118, mean loss: 0.346202225657806
Epoch: 33, step: 834, loss: 0.2924104928970337, mean loss: 0.3462011162525477
Epoch: 33, step: 835, loss: 0.3279079496860504, mean loss: 0.3462007389805099
Epoch: 33, step: 836, loss: 0.3186633288860321, mean loss: 0.346200171070054
Epoch: 33, step: 837, loss: 0.3346382677555084, mean loss: 0.3461999326311323
Epoch: 33, step: 838, loss: 0.3236023485660553, mean loss: 0.34619946661508677
Epoch: 33, step: 839, loss: 0.3400217890739441, mean loss: 0.34619933921927837
Epoch: 33, step: 840, loss: 0.2983592450618744, mean loss: 0.34619835268319776
Epoch: 33, step: 841, loss: 0.33597564697265625, mean loss: 0.3461981418796816
Epoch: 33, step: 842, loss: 0.3112829625606537, mean loss: 0.3461974219048529
Epoch: 33, step: 843, loss: 0.3664013147354126, mean loss: 0.3461978385143224
Epoch: 33, step: 844, loss: 0.32047513127326965, mean loss: 0.3461973081164165
Epoch: 33, step: 845, loss: 0.3394871652126312, mean loss: 0.34619716975724907
Epoch: 33, step: 846, loss: 0.3629016876220703, mean loss: 0.34619751418739947
Epoch: 33, step: 847, loss: 0.33364081382751465, mean loss: 0.34619725528636114
Epoch: 33, step: 848, loss: 0.3440565764904022, mean loss: 0.34619721114956403
Epoch: 33, step: 849, loss: 0.2965569794178009, mean loss: 0.3461961876818363
Epoch: 33, step: 850, loss: 0.3882671296596527, mean loss: 0.34619705507028603
Epoch: 33, step: 851, loss: 0.30253371596336365, mean loss: 0.3461961548694963
Epoch: 33, step: 852, loss: 0.29036179184913635, mean loss: 0.34619500376418716
Epoch: 33, step: 853, loss: 0.3405703604221344, mean loss: 0.34619488780650476
Epoch: 33, step: 854, loss: 0.3700544536113739, mean loss: 0.3461953796853223
Epoch: 33, step: 855, loss: 0.39877253770828247, mean loss: 0.34619646357165085
Epoch: 33, step: 856, loss: 0.3705650269985199, mean loss: 0.3461969659230377
Epoch: 33, step: 857, loss: 0.31599652767181396, mean loss: 0.3461963433619524
Epoch: 33, step: 858, loss: 0.32710933685302734, mean loss: 0.3461959499046642
Epoch: 33, step: 859, loss: 0.3202742338180542, mean loss: 0.34619541556849814
Epoch: 33, step: 860, loss: 0.3234597146511078, mean loss: 0.3461949469167776
Epoch: 33, step: 861, loss: 0.32702332735061646, mean loss: 0.34619455173972424
Epoch: 33, step: 862, loss: 0.33409422636032104, mean loss: 0.3461943023256177
Epoch: 33, step: 863, loss: 0.3213033676147461, mean loss: 0.3461937892797213
Epoch: 33, step: 864, loss: 0.35667333006858826, mean loss: 0.3461940052770168
Epoch: 33, step: 865, loss: 0.3237573206424713, mean loss: 0.3461935428365899
Epoch: 33, step: 866, loss: 0.2921571135520935, mean loss: 0.3461924291197102
Epoch: 33, step: 867, loss: 0.3550836145877838, mean loss: 0.3461926123675558
Epoch: 33, step: 868, loss: 0.39082440733909607, mean loss: 0.3461935322124677
Epoch: 33, step: 869, loss: 0.342525839805603, mean loss: 0.3461934566242313
Epoch: 33, step: 870, loss: 0.3389887511730194, mean loss: 0.3461933081440167
Epoch: 33, step: 871, loss: 0.3165372908115387, mean loss: 0.3461926969821724
Epoch: 33, step: 872, loss: 0.31106287240982056, mean loss: 0.3461919730290643
Epoch: 33, step: 873, loss: 0.32138001918792725, mean loss: 0.34619146171649284
Epoch: 33, step: 874, loss: 0.3197822570800781, mean loss: 0.34619091749977565
Epoch: 33, step: 875, loss: 0.2995717525482178, mean loss: 0.3461899568344906
Epoch: 33, step: 876, loss: 0.3416670560836792, mean loss: 0.34618986363453286
Epoch: 33, step: 877, loss: 0.2974693477153778, mean loss: 0.34618885970879787
Epoch: 33, step: 878, loss: 0.32915717363357544, mean loss: 0.34618850876432783
Epoch: 33, step: 879, loss: 0.3207727372646332, mean loss: 0.34618798507333015
Epoch: 33, step: 880, loss: 0.32541319727897644, mean loss: 0.3461875570184439
Epoch: 33, step: 881, loss: 0.3259503245353699, mean loss: 0.3461871400482275
Epoch: 33, step: 882, loss: 0.3501718044281006, mean loss: 0.34618722214700937
Epoch: 33, step: 883, loss: 0.3415737748146057, mean loss: 0.3461871270949381
Epoch: 33, step: 884, loss: 0.32826414704322815, mean loss: 0.34618675783066444
Epoch: 33, step: 885, loss: 0.29992079734802246, mean loss: 0.3461858046401646
Epoch: 33, step: 886, loss: 0.3230409622192383, mean loss: 0.34618532781034894
Epoch: 33, step: 887, loss: 0.2918706238269806, mean loss: 0.3461842088424053
Epoch: 33, step: 888, loss: 0.32858994603157043, mean loss: 0.34618384638051103
Epoch: 33, step: 889, loss: 0.3272211253643036, mean loss: 0.34618345573486364
Epoch: 33, step: 890, loss: 0.32242104411125183, mean loss: 0.3461829662222331
Epoch: 33, step: 891, loss: 0.38715028762817383, mean loss: 0.34618381014365296
Epoch: 33, step: 892, loss: 0.32285037636756897, mean loss: 0.3461833294878949
Epoch: 33, step: 893, loss: 0.3516453504562378, mean loss: 0.34618344200017126
Epoch: 33, step: 894, loss: 0.32311341166496277, mean loss: 0.3461829667899557
Epoch: 33, step: 895, loss: 0.30645790696144104, mean loss: 0.346182148526385
Epoch: 33, step: 896, loss: 0.3306187093257904, mean loss: 0.34618182795460806
Epoch: 33, step: 897, loss: 0.3519895076751709, mean loss: 0.34618194757725934
Epoch: 33, step: 898, loss: 0.3311561346054077, mean loss: 0.3461816380921206
Epoch: 33, step: 899, loss: 0.3299727141857147, mean loss: 0.3461813042454427
Epoch: 33, step: 900, loss: 0.3182006776332855, mean loss: 0.346180727955067
Epoch: 33, step: 901, loss: 0.3109815716743469, mean loss: 0.3461800030064267
Epoch: 33, step: 902, loss: 0.3316796123981476, mean loss: 0.3461797043679629
Epoch: 33, step: 903, loss: 0.308411180973053, mean loss: 0.34617892653363974
Epoch: 33, step: 904, loss: 0.3252841532230377, mean loss: 0.34617849621930175
Epoch: 33, step: 905, loss: 0.31356391310691833, mean loss: 0.3461778245568957
Epoch: 33, step: 906, loss: 0.3385124206542969, mean loss: 0.3461776666993636
Epoch: 33, step: 907, loss: 0.33939385414123535, mean loss: 0.346177526999764
Epoch: 33, step: 908, loss: 0.34397539496421814, mean loss: 0.34617748165201506
Epoch: 33, step: 909, loss: 0.2935234010219574, mean loss: 0.3461763973869389
Epoch: 33, step: 910, loss: 0.32444241642951965, mean loss: 0.34617594984496336
Epoch: 33, step: 911, loss: 0.30011501908302307, mean loss: 0.34617500138662466
Epoch: 33, step: 912, loss: 0.3360937237739563, mean loss: 0.34617479380343485
Epoch: 33, step: 913, loss: 0.3121911883354187, mean loss: 0.346174094062763
Epoch: 33, step: 914, loss: 0.3830685317516327, mean loss: 0.34617485372339035
Epoch: 33, step: 915, loss: 0.35650745034217834, mean loss: 0.346175066468338
Epoch: 33, step: 916, loss: 0.31978118419647217, mean loss: 0.34617452303770796
Epoch: 33, step: 917, loss: 0.36414003372192383, mean loss: 0.3461748929267482
Epoch: 33, step: 918, loss: 0.35066545009613037, mean loss: 0.3461749853802116
Epoch: 33, step: 919, loss: 0.3871212601661682, mean loss: 0.34617582838183364
Epoch: 33, step: 920, loss: 0.3225405216217041, mean loss: 0.34617534178831955
Epoch: 33, step: 921, loss: 0.34278395771980286, mean loss: 0.3461752719694027
Epoch: 33, step: 922, loss: 0.3369993269443512, mean loss: 0.34617508306677736
Epoch: 33, step: 923, loss: 0.32970333099365234, mean loss: 0.3461747439743845
Epoch: 33, step: 924, loss: 0.35293471813201904, mean loss: 0.3461748831343606
Epoch: 33, step: 925, loss: 0.3153965473175049, mean loss: 0.3461742495484613
Epoch: 33, step: 926, loss: 0.34656545519828796, mean loss: 0.34617425760144
Epoch: 33, step: 927, loss: 0.32605645060539246, mean loss: 0.34617384348437547
Epoch: 33, step: 928, loss: 0.31553134322166443, mean loss: 0.346173212733665
Epoch: 33, step: 929, loss: 0.32582008838653564, mean loss: 0.3461727937899339
Epoch: 33, step: 930, loss: 0.3628341555595398, mean loss: 0.34617313673626837
Epoch: 33, step: 931, loss: 0.35823124647140503, mean loss: 0.34617338492723115
Epoch: 33, step: 932, loss: 0.3189184367656708, mean loss: 0.34617282395268834
Epoch: 33, step: 933, loss: 0.3011223375797272, mean loss: 0.3461718967208443
Epoch: 33, step: 934, loss: 0.3396296203136444, mean loss: 0.3461717620700857
Epoch: 33, step: 935, loss: 0.3779343068599701, mean loss: 0.3461724157818003
Epoch: 33, step: 936, loss: 0.3338218927383423, mean loss: 0.3461721615982805
Epoch: 33, step: 937, loss: 0.3232000768184662, mean loss: 0.3461716888243604
Epoch: 33, step: 938, loss: 0.3218204379081726, mean loss: 0.3461711876770097
Epoch: 33, step: 939, loss: 0.3345120847225189, mean loss: 0.3461709477382759
Epoch: 33, step: 940, loss: 0.33691394329071045, mean loss: 0.34617075723749496
Epoch: 33, step: 941, loss: 0.32454702258110046, mean loss: 0.34617031224974637
Epoch: 33, step: 942, loss: 0.34028956294059753, mean loss: 0.346170191234224
Epoch: 33, step: 943, loss: 0.3155953884124756, mean loss: 0.34616956207127186
Epoch: 33, step: 944, loss: 0.33601489663124084, mean loss: 0.34616935311464
Epoch: 33, step: 945, loss: 0.32493695616722107, mean loss: 0.346168916216065
Epoch: 33, step: 946, loss: 0.318866103887558, mean loss: 0.34616835441824345
Epoch: 33, step: 947, loss: 0.34468626976013184, mean loss: 0.3461683239226744
Epoch: 33, step: 948, loss: 0.33318689465522766, mean loss: 0.3461680568205722
Epoch: 33, step: 949, loss: 0.3135662078857422, mean loss: 0.34616738602823993
Epoch: 33, step: 950, loss: 0.3670945167541504, mean loss: 0.346167816601059
Epoch: 33, step: 951, loss: 0.35414060950279236, mean loss: 0.34616798063679477
Epoch: 33, step: 952, loss: 0.3491332232952118, mean loss: 0.34616804164374176
Epoch: 33, step: 953, loss: 0.3496425151824951, mean loss: 0.3461681131261419
Epoch: 33, step: 954, loss: 0.3276044726371765, mean loss: 0.3461677312132386
Epoch: 33, step: 955, loss: 0.33332163095474243, mean loss: 0.3461674669336908
Epoch: 33, step: 956, loss: 0.3358173072338104, mean loss: 0.34616725400687276
Epoch: 33, step: 957, loss: 0.3242909610271454, mean loss: 0.3461668039699878
Epoch: 33, step: 958, loss: 0.3437563478946686, mean loss: 0.3461667543833495
Epoch: 33, step: 959, loss: 0.3332882225513458, mean loss: 0.3461664894583961
Epoch: 33, step: 960, loss: 0.34631696343421936, mean loss: 0.3461664925537405
Epoch: 33, step: 961, loss: 0.34383413195610046, mean loss: 0.3461664445766023
Epoch: 33, step: 962, loss: 0.33723434805870056, mean loss: 0.34616626084531527
Epoch: 33, step: 963, loss: 0.31405898928642273, mean loss: 0.34616560041929173
Epoch: 33, step: 964, loss: 0.3305491805076599, mean loss: 0.34616527920613765
Epoch: 33, step: 965, loss: 0.29954853653907776, mean loss: 0.34616432036902656
Epoch: 33, step: 966, loss: 0.368322491645813, mean loss: 0.34616477612030233
Epoch: 33, step: 967, loss: 0.33489206433296204, mean loss: 0.34616454426691307
Epoch: 33, step: 968, loss: 0.3451039493083954, mean loss: 0.3461645224533971
Epoch: 33, step: 969, loss: 0.3115268349647522, mean loss: 0.3461638100662578
Epoch: 33, step: 970, loss: 0.33036041259765625, mean loss: 0.34616348504728595
Epoch: 33, step: 971, loss: 0.30143794417381287, mean loss: 0.3461625652229014
Epoch: 33, step: 972, loss: 0.3294045329093933, mean loss: 0.3461622205847047
Epoch: 33, step: 973, loss: 0.3377472460269928, mean loss: 0.34616204752966095
Epoch: 33, step: 974, loss: 0.3485032320022583, mean loss: 0.3461620956754333
Epoch: 33, step: 975, loss: 0.30540719628334045, mean loss: 0.3461612575801098
Epoch: 33, step: 976, loss: 0.29736945033073425, mean loss: 0.3461602542321641
Epoch: 33, step: 977, loss: 0.33917826414108276, mean loss: 0.3461601106584423
Epoch: 33, step: 978, loss: 0.42595598101615906, mean loss: 0.3461617515021502
Epoch: 33, step: 979, loss: 0.31629979610443115, mean loss: 0.34616113746292915
Epoch: 33, step: 980, loss: 0.34304526448249817, mean loss: 0.3461610733938201
Epoch: 33, step: 981, loss: 0.3482114374637604, mean loss: 0.3461611155528872
Epoch: 33, step: 982, loss: 0.30975142121315, mean loss: 0.3461603669213597
Epoch: 33, step: 983, loss: 0.32062315940856934, mean loss: 0.34615984185335424
Epoch: 33, step: 984, loss: 0.3312229514122009, mean loss: 0.3461595347437373
Epoch: 33, step: 985, loss: 0.33300670981407166, mean loss: 0.3461592643209212
Epoch: 33, step: 986, loss: 0.33300188183784485, mean loss: 0.3461589938099633
Epoch: 33, step: 987, loss: 0.31949397921562195, mean loss: 0.34615844559831455
Epoch: 33, step: 988, loss: 0.31087639927864075, mean loss: 0.3461577202422092
Epoch: 33, step: 989, loss: 0.3337193429470062, mean loss: 0.3461574645295063
Epoch: 33, step: 990, loss: 0.31019753217697144, mean loss: 0.3461567252672825
Epoch: 33, step: 991, loss: 0.31753218173980713, mean loss: 0.3461561368176581
Epoch: 33, step: 992, loss: 0.3435472548007965, mean loss: 0.34615608318661656
Epoch: 33, step: 993, loss: 0.30253082513809204, mean loss: 0.3461551863963759
Epoch: 33, step: 994, loss: 0.3445771634578705, mean loss: 0.3461551539581384
Epoch: 33, step: 995, loss: 0.2956165373325348, mean loss: 0.34615411509494515
Epoch: 33, step: 996, loss: 0.32311490178108215, mean loss: 0.3461536415145362
Epoch: 33, step: 997, loss: 0.2931853234767914, mean loss: 0.3461525527515755
Epoch: 33, step: 998, loss: 0.3739040791988373, mean loss: 0.3461531231720488
Epoch: 33, step: 999, loss: 0.310078501701355, mean loss: 0.34615238168924295
Epoch: 33, step: 1000, loss: 0.35474368929862976, mean loss: 0.3461525582725494
Epoch: 33, step: 1001, loss: 0.30189186334609985, mean loss: 0.3461516485694433
Epoch: 33, step: 1002, loss: 0.3049626350402832, mean loss: 0.34615080201690956
Epoch: 33, step: 1003, loss: 0.31276461482048035, mean loss: 0.3461501158489715
Epoch: 33, step: 1004, loss: 0.29485809803009033, mean loss: 0.34614906169401294
Epoch: 33, step: 1005, loss: 0.31371331214904785, mean loss: 0.3461483950872978
Epoch: 33, step: 1006, loss: 0.3277711868286133, mean loss: 0.346148017413933
Epoch: 33, step: 1007, loss: 0.3131799101829529, mean loss: 0.34614733989426116
Epoch: 33, step: 1008, loss: 0.30892395973205566, mean loss: 0.34614657494121537
Epoch: 33, step: 1009, loss: 0.3507917523384094, mean loss: 0.3461466703992195
Epoch: 33, step: 1010, loss: 0.32920706272125244, mean loss: 0.3461463222988624
Epoch: 33, step: 1011, loss: 0.34612107276916504, mean loss: 0.346146321780008
Epoch: 33, step: 1012, loss: 0.34064623713493347, mean loss: 0.34614620876069957
Epoch: 33, step: 1013, loss: 0.28754210472106934, mean loss: 0.3461450045502849
Epoch: 33, step: 1014, loss: 0.3093152940273285, mean loss: 0.3461442477805945
Epoch: 33, step: 1015, loss: 0.3107580840587616, mean loss: 0.34614352068756166
Epoch: 33, step: 1016, loss: 0.35557106137275696, mean loss: 0.34614371439486374
Epoch: 33, step: 1017, loss: 0.3427252769470215, mean loss: 0.3461436441578091
Epoch: 33, step: 1018, loss: 0.3076189160346985, mean loss: 0.3461428526242856
Epoch: 33, step: 1019, loss: 0.35342004895210266, mean loss: 0.3461430021393318
Epoch: 33, step: 1020, loss: 0.34829458594322205, mean loss: 0.34614304634420523
Epoch: 33, step: 1021, loss: 0.34419727325439453, mean loss: 0.34614300636859013
Epoch: 33, step: 1022, loss: 0.30484992265701294, mean loss: 0.3461421580258328
Epoch: 33, step: 1023, loss: 0.30623355507850647, mean loss: 0.34614133814328396
Epoch: 33, step: 1024, loss: 0.3019142150878906, mean loss: 0.34614042955970126
Epoch: 33, step: 1025, loss: 0.3320121467113495, mean loss: 0.3461401393201095
Epoch: 33, step: 1026, loss: 0.3467561900615692, mean loss: 0.3461401519754792
Epoch: 33, step: 1027, loss: 0.30304208397865295, mean loss: 0.34613926664129685
Epoch: 33, step: 1028, loss: 0.32754501700401306, mean loss: 0.34613888468016957
Epoch: 33, step: 1029, loss: 0.3066449463367462, mean loss: 0.34613807341649216
Epoch: 33, step: 1030, loss: 0.32569563388824463, mean loss: 0.3461376535072933
Epoch: 33, step: 1031, loss: 0.33556729555130005, mean loss: 0.3461374363854883
Epoch: 33, step: 1032, loss: 0.3317597806453705, mean loss: 0.3461371410654566
Epoch: 33, step: 1033, loss: 0.35696032643318176, mean loss: 0.3461373633713632
Epoch: 33, step: 1034, loss: 0.3291766047477722, mean loss: 0.34613701500817334
Epoch: 33, step: 1035, loss: 0.36198216676712036, mean loss: 0.34613734045082367
Epoch: 33, step: 1036, loss: 0.3147668242454529, mean loss: 0.34613669614684933
Epoch: 33, step: 1037, loss: 0.3411770462989807, mean loss: 0.3461365942850739
Epoch: 33, step: 1038, loss: 0.3038809597492218, mean loss: 0.3461357264525271
Epoch: 33, step: 1039, loss: 0.32626137137413025, mean loss: 0.3461353182878372
Epoch: 33, step: 1040, loss: 0.35086673498153687, mean loss: 0.34613541545615084
Epoch: 33, step: 1041, loss: 0.3421802222728729, mean loss: 0.3461353342306778
Epoch: 33, step: 1042, loss: 0.3444612920284271, mean loss: 0.346135299852565
Epoch: 33, step: 1043, loss: 0.3236595094203949, mean loss: 0.3461348382994512
Epoch: 33, step: 1044, loss: 0.29898253083229065, mean loss: 0.34613387001993773
Epoch: 33, step: 1045, loss: 0.3520081043243408, mean loss: 0.34613399064571915
Epoch: 33, step: 1046, loss: 0.30574455857276917, mean loss: 0.346133161276901
Epoch: 33, step: 1047, loss: 0.34757938981056213, mean loss: 0.34613319097358547
Epoch: 33, step: 1048, loss: 0.35427844524383545, mean loss: 0.3461333582238323
Epoch: 33, step: 1049, loss: 0.3447038233280182, mean loss: 0.34613332887113846
Epoch: 33, step: 1050, loss: 0.2931847870349884, mean loss: 0.346132241699058
Epoch: 33, step: 1051, loss: 0.30776655673980713, mean loss: 0.346131453967353
Epoch: 33, step: 1052, loss: 0.33487606048583984, mean loss: 0.3461312228741699
Epoch: 33, step: 1053, loss: 0.32518860697746277, mean loss: 0.34613079289396426
Epoch: 33, step: 1054, loss: 0.33273354172706604, mean loss: 0.3461305178359404
Epoch: 33, step: 1055, loss: 0.3155970573425293, mean loss: 0.34612989096847524
Epoch: 33, step: 1056, loss: 0.30692729353904724, mean loss: 0.34612908613574556
Epoch: 33, step: 1057, loss: 0.3506278693675995, mean loss: 0.34612917849425984
Epoch: 33, step: 1058, loss: 0.33376485109329224, mean loss: 0.3461289246639669
Epoch: 33, step: 1059, loss: 0.3451491594314575, mean loss: 0.34612890455054035
Epoch: 33, step: 1060, loss: 0.33633315563201904, mean loss: 0.34612870345947805
Epoch: 33, step: 1061, loss: 0.3244137763977051, mean loss: 0.3461282576958975
Epoch: 33, step: 1062, loss: 0.3656599223613739, mean loss: 0.34612865863328157
Epoch: 33, step: 1063, loss: 0.35780882835388184, mean loss: 0.3461288983937241
Epoch: 33, step: 1064, loss: 0.31027209758758545, mean loss: 0.3461281623713745
Epoch: 33, step: 1065, loss: 0.30053451657295227, mean loss: 0.346127226502788
Epoch: 33, step: 1066, loss: 0.34956124424934387, mean loss: 0.3461272969889997
Epoch: 33, step: 1067, loss: 0.3533318042755127, mean loss: 0.346127444864765
Epoch: 33, step: 1068, loss: 0.31239521503448486, mean loss: 0.3461267525097265
Epoch: 33, step: 1069, loss: 0.3474763333797455, mean loss: 0.3461267802093462
Epoch: 33, step: 1070, loss: 0.32425370812416077, mean loss: 0.3461263312823079
Epoch: 33, step: 1071, loss: 0.36317533254623413, mean loss: 0.3461266811920293
Epoch: 33, step: 1072, loss: 0.3556479513645172, mean loss: 0.34612687660034475
Epoch: 33, step: 1073, loss: 0.318236768245697, mean loss: 0.34612630421376767
Epoch: 33, step: 1074, loss: 0.3357506990432739, mean loss: 0.3461260912803802
Epoch: 33, step: 1075, loss: 0.3219640552997589, mean loss: 0.3461255954251023
Epoch: 33, step: 1076, loss: 0.322814404964447, mean loss: 0.3461251170407632
Epoch: 33, step: 1077, loss: 0.3346098065376282, mean loss: 0.3461248807323187
Epoch: 33, step: 1078, loss: 0.29796046018600464, mean loss: 0.3461238923589927
Epoch: 33, step: 1079, loss: 0.2936154305934906, mean loss: 0.346122814864497
Epoch: 33, step: 1080, loss: 0.36512815952301025, mean loss: 0.346123204853717
Epoch: 33, step: 1081, loss: 0.3735365569591522, mean loss: 0.346123767363507
Epoch: 33, step: 1082, loss: 0.32345420122146606, mean loss: 0.34612330220363946
Epoch: 33, step: 1083, loss: 0.3088833689689636, mean loss: 0.3461225380881348
Epoch: 33, step: 1084, loss: 0.3731319010257721, mean loss: 0.34612309227413185
Epoch: 33, step: 1085, loss: 0.336427241563797, mean loss: 0.3461228933359171
Epoch: 33, step: 1086, loss: 0.3330605924129486, mean loss: 0.34612262533080984
Epoch: 33, step: 1087, loss: 0.30953270196914673, mean loss: 0.34612187461428623
Epoch: 33, step: 1088, loss: 0.3465309143066406, mean loss: 0.34612188300639335
Epoch: 33, step: 1089, loss: 0.36524665355682373, mean loss: 0.3461222753737675
Epoch: 33, step: 1090, loss: 0.34869641065597534, mean loss: 0.3461223281841255
Epoch: 33, step: 1091, loss: 0.33046087622642517, mean loss: 0.34612200688402794
Epoch: 33, step: 1092, loss: 0.3935403525829315, mean loss: 0.34612297966781497
Epoch: 33, step: 1093, loss: 0.31981533765792847, mean loss: 0.3461224399795942
Epoch: 33, step: 1094, loss: 0.2924278676509857, mean loss: 0.3461213384846852
Epoch: 33, step: 1095, loss: 0.34289565682411194, mean loss: 0.3461212723141416
Epoch: 33, step: 1096, loss: 0.3262738883495331, mean loss: 0.3461208651799652
Epoch: 33, step: 1097, loss: 0.3155316114425659, mean loss: 0.3461202377080937
Epoch: 33, step: 1098, loss: 0.31945160031318665, mean loss: 0.34611969067034276
Epoch: 33, step: 1099, loss: 0.3331085741519928, mean loss: 0.34611942378659405
Epoch: 33, step: 1100, loss: 0.3519541025161743, mean loss: 0.3461195434649468
Epoch: 33, step: 1101, loss: 0.31164678931236267, mean loss: 0.3461188363895447
Epoch: 33, step: 1102, loss: 0.32379403710365295, mean loss: 0.34611837849190785
Epoch: 33, step: 1103, loss: 0.30598434805870056, mean loss: 0.3461175553310572
Epoch: 33, step: 1104, loss: 0.3334401249885559, mean loss: 0.34611729531853913
Epoch: 33, step: 1105, loss: 0.35550761222839355, mean loss: 0.3461174879088199
Epoch: 33, step: 1106, loss: 0.33526694774627686, mean loss: 0.3461172653747203
Epoch: 33, step: 1107, loss: 0.3511018753051758, mean loss: 0.34611736760215944
Epoch: 33, step: 1108, loss: 0.3204662501811981, mean loss: 0.3461168415440921
Epoch: 33, step: 1109, loss: 0.35981228947639465, mean loss: 0.34611712240722187
Epoch: 33, step: 1110, loss: 0.35410016775131226, mean loss: 0.34611728611834186
Epoch: 33, step: 1111, loss: 0.37581372261047363, mean loss: 0.3461178951011261
Epoch: 33, step: 1112, loss: 0.3165057897567749, mean loss: 0.34611728786016754
Epoch: 33, step: 1113, loss: 0.3011980354785919, mean loss: 0.3461163667419216
Epoch: 33, step: 1114, loss: 0.29103416204452515, mean loss: 0.3461152372444192
Epoch: 33, step: 1115, loss: 0.3364332616329193, mean loss: 0.3461150387130952
Epoch: 33, step: 1116, loss: 0.3025650978088379, mean loss: 0.3461141457290089
Epoch: 33, step: 1117, loss: 0.3541240096092224, mean loss: 0.34611430996652953
Epoch: 33, step: 1118, loss: 0.33239611983299255, mean loss: 0.3461140286889233
Epoch: 33, step: 1119, loss: 0.33064326643943787, mean loss: 0.3461137114831034
Epoch: 33, step: 1120, loss: 0.36388280987739563, mean loss: 0.346114075805544
Epoch: 33, step: 1121, loss: 0.3213330805301666, mean loss: 0.34611356772756646
Epoch: 33, step: 1122, loss: 0.326939195394516, mean loss: 0.3461131746087078
Epoch: 33, step: 1123, loss: 0.31970009207725525, mean loss: 0.34611263309069623
Epoch: 33, step: 1124, loss: 0.373043030500412, mean loss: 0.3461131852033192
Epoch: 33, step: 1125, loss: 0.3274275064468384, mean loss: 0.3461128021273678
Epoch: 33, step: 1126, loss: 0.3503004014492035, mean loss: 0.3461128879757723
Epoch: 33, step: 1127, loss: 0.3414921462535858, mean loss: 0.3461127932496197
Epoch: 33, step: 1128, loss: 0.327085018157959, mean loss: 0.346112403184326
Epoch: 33, step: 1129, loss: 0.28850531578063965, mean loss: 0.3461112222756424
Epoch: 33, step: 1130, loss: 0.3890465497970581, mean loss: 0.34611210240452994
Epoch: 33, step: 1131, loss: 0.31422415375709534, mean loss: 0.3461114487486459
Epoch: 33, step: 1132, loss: 0.3276522755622864, mean loss: 0.3461110703705956
Epoch: 33, step: 1133, loss: 0.3288225531578064, mean loss: 0.34611071599603704
Epoch: 33, step: 1134, loss: 0.3224695324897766, mean loss: 0.3461102314164665
Epoch: 33, step: 1135, loss: 0.33899447321891785, mean loss: 0.34611008556588446
Epoch: 33, step: 1136, loss: 0.29383528232574463, mean loss: 0.34610901411938544
Epoch: 33, step: 1137, loss: 0.3291653096675873, mean loss: 0.3461086668411634
Epoch: 33, step: 1138, loss: 0.30469679832458496, mean loss: 0.3461078180807667
Epoch: 33, step: 1139, loss: 0.35450297594070435, mean loss: 0.3461079901408966
Epoch: 33, step: 1140, loss: 0.3283803462982178, mean loss: 0.3461076268173903
Epoch: 33, step: 1141, loss: 0.31960803270339966, mean loss: 0.34610708372614724
Epoch: 33, step: 1142, loss: 0.38667336106300354, mean loss: 0.34610791508750266
Epoch: 33, step: 1143, loss: 0.3317393362522125, mean loss: 0.3461076206252755
Epoch: 33, step: 1144, loss: 0.3627665042877197, mean loss: 0.34610796201682953
Epoch: 33, step: 1145, loss: 0.30042383074760437, mean loss: 0.3461070258282302
Epoch: 33, step: 1146, loss: 0.3149428367614746, mean loss: 0.346106387204712
Epoch: 33, step: 1147, loss: 0.2934413254261017, mean loss: 0.34610530800262634
Epoch: 33, step: 1148, loss: 0.3275410830974579, mean loss: 0.3461049275959768
Epoch: 33, step: 1149, loss: 0.30318138003349304, mean loss: 0.34610404805113104
Epoch: 33, step: 1150, loss: 0.38343584537506104, mean loss: 0.3461048129999523
Epoch: 33, step: 1151, loss: 0.3228907585144043, mean loss: 0.34610433734110296
Epoch: 33, step: 1152, loss: 0.35256344079971313, mean loss: 0.34610446968622044
Epoch: 33, step: 1153, loss: 0.3138693571090698, mean loss: 0.3461038092118407
Epoch: 33, step: 1154, loss: 0.34429121017456055, mean loss: 0.346103772073745
Epoch: 33, step: 1155, loss: 0.3160250782966614, mean loss: 0.34610315580809636
Epoch: 33, step: 1156, loss: 0.29730746150016785, mean loss: 0.3461021560807037
Epoch: 33, step: 1157, loss: 0.3057847321033478, mean loss: 0.34610133007324667
Epoch: 33, step: 1158, loss: 0.35049358010292053, mean loss: 0.34610142005808675
Epoch: 33, step: 1159, loss: 0.32773539423942566, mean loss: 0.34610104379762174
Epoch: 33, step: 1160, loss: 0.3114177882671356, mean loss: 0.3461003332644537
Epoch: 33, step: 1161, loss: 0.3094581961631775, mean loss: 0.3460995826163384
Epoch: 33, step: 1162, loss: 0.34880268573760986, mean loss: 0.346099637990775
Epoch: 33, step: 1163, loss: 0.30893823504447937, mean loss: 0.3460988767362079
Epoch: 33, step: 1164, loss: 0.3493538796901703, mean loss: 0.34609894341386027
Epoch: 33, step: 1165, loss: 0.30396997928619385, mean loss: 0.34609808043372736
Epoch: 33, step: 1166, loss: 0.34044763445854187, mean loss: 0.34609796469096377
Epoch: 33, step: 1167, loss: 0.36517974734306335, mean loss: 0.34609835555091156
Epoch: 33, step: 1168, loss: 0.3697875738143921, mean loss: 0.3460988407769058
Epoch: 33, step: 1169, loss: 0.3760741353034973, mean loss: 0.3460994547479542
Epoch: 33, step: 1170, loss: 0.3497622311115265, mean loss: 0.34609952976948843
Epoch: 33, step: 1171, loss: 0.3275900185108185, mean loss: 0.34609915066267094
Epoch: 33, step: 1172, loss: 0.3436833918094635, mean loss: 0.34609910118476306
Epoch: 33, step: 1173, loss: 0.2949618995189667, mean loss: 0.34609805384929293
Epoch: 33, step: 1174, loss: 0.33994245529174805, mean loss: 0.3460979277797298
Epoch: 33, step: 1175, loss: 0.33186209201812744, mean loss: 0.34609763622906703
Epoch: 33, step: 1176, loss: 0.3024398982524872, mean loss: 0.34609674213461544
Epoch: 33, step: 1177, loss: 0.3252693712711334, mean loss: 0.34609631560643883
Epoch: 33, step: 1178, loss: 0.3254619538784027, mean loss: 0.3460958930395914
Epoch: 33, step: 1179, loss: 0.3300769329071045, mean loss: 0.3460955649973213
Epoch: 33, step: 1180, loss: 0.4165601432323456, mean loss: 0.3460970079678174
Epoch: 33, step: 1181, loss: 0.3624248206615448, mean loss: 0.34609734232119194
Epoch: 33, step: 1182, loss: 0.34961652755737305, mean loss: 0.34609741438395913
Epoch: 33, step: 1183, loss: 0.35938790440559387, mean loss: 0.3460976865293032
Epoch: 33, step: 1184, loss: 0.3769534230232239, mean loss: 0.34609831833994864
Epoch: 33, step: 1185, loss: 0.3181993365287781, mean loss: 0.3460977470843319
Epoch: 33, step: 1186, loss: 0.36210471391677856, mean loss: 0.3460980748340162
Epoch: 33, step: 1187, loss: 0.3089892864227295, mean loss: 0.3460973150308137
Epoch: 33, step: 1188, loss: 0.31141558289527893, mean loss: 0.34609660493617733
Epoch: 33, step: 1189, loss: 0.33654099702835083, mean loss: 0.34609640929292135
Epoch: 33, step: 1190, loss: 0.35902711749076843, mean loss: 0.3460966740331748
Epoch: 33, step: 1191, loss: 0.33647429943084717, mean loss: 0.3460964770309923
Epoch: 33, step: 1192, loss: 0.3283759355545044, mean loss: 0.3460961142396835
Epoch: 33, step: 1193, loss: 0.39101725816726685, mean loss: 0.34609703388804625
Epoch: 33, step: 1194, loss: 0.3163529932498932, mean loss: 0.3460964249654791
Epoch: 33, step: 1195, loss: 0.3057901859283447, mean loss: 0.34609559982956695
Epoch: 33, step: 1196, loss: 0.3059505820274353, mean loss: 0.34609477801094624
Epoch: 33, step: 1197, loss: 0.3366655707359314, mean loss: 0.34609458498725587
Epoch: 33, step: 1198, loss: 0.2960914969444275, mean loss: 0.34609356140354125
Epoch: 33, step: 1199, loss: 0.2949451804161072, mean loss: 0.3460925143966431
Epoch: 33, step: 1200, loss: 0.33930644392967224, mean loss: 0.3460923754886852
Epoch: 33, step: 1201, loss: 0.3230980634689331, mean loss: 0.3460919048145947
Epoch: 33, step: 1202, loss: 0.3394804000854492, mean loss: 0.346091769485463
Epoch: 33, step: 1203, loss: 0.3365265130996704, mean loss: 0.34609157370078175
Epoch: 33, step: 1204, loss: 0.2901049256324768, mean loss: 0.3460904277718858
Epoch: 33, step: 1205, loss: 0.3297487795352936, mean loss: 0.34609009329957346
Epoch: 33, step: 1206, loss: 0.34755435585975647, mean loss: 0.34609012326872063
Epoch: 33, step: 1207, loss: 0.34494563937187195, mean loss: 0.34609009984498146
Epoch: 33, step: 1208, loss: 0.30122023820877075, mean loss: 0.34608918152849927
Epoch: 33, step: 1209, loss: 0.33216559886932373, mean loss: 0.3460888965712184
Epoch: 33, step: 1210, loss: 0.3888213634490967, mean loss: 0.34608977110751127
Epoch: 33, step: 1211, loss: 0.3364867568016052, mean loss: 0.3460895745821694
Epoch: 33, step: 1212, loss: 0.27161070704460144, mean loss: 0.34608805040602003
Epoch: 33, step: 1213, loss: 0.3098753094673157, mean loss: 0.3460873093439127
Epoch: 33, step: 1214, loss: 0.30266907811164856, mean loss: 0.3460864208459236
Epoch: 33, step: 1215, loss: 0.3206653892993927, mean loss: 0.346085900648012
Epoch: 33, step: 1216, loss: 0.3165590465068817, mean loss: 0.34608529644383057
Epoch: 33, step: 1217, loss: 0.3213803768157959, mean loss: 0.3460847909206133
Epoch: 33, step: 1218, loss: 0.3436676263809204, mean loss: 0.34608474146051343
Epoch: 33, step: 1219, loss: 0.4014149606227875, mean loss: 0.34608587360610116
Epoch: 33, step: 1220, loss: 0.32697877287864685, mean loss: 0.34608548265198075
Epoch: 33, step: 1221, loss: 0.32034364342689514, mean loss: 0.3460849559539567
Epoch: 33, step: 1222, loss: 0.3394468426704407, mean loss: 0.3460848201357821
Epoch: 33, step: 1223, loss: 0.35606849193573, mean loss: 0.3460850244011025
Epoch: 33, step: 1224, loss: 0.36043086647987366, mean loss: 0.34608531791015745
Epoch: 33, step: 1225, loss: 0.3165205419063568, mean loss: 0.34608471304138205
Epoch: 33, step: 1226, loss: 0.32066428661346436, mean loss: 0.34608419297291854
Epoch: 33, step: 1227, loss: 0.35954850912094116, mean loss: 0.3460844684294682
Epoch: 33, step: 1228, loss: 0.3177378475666046, mean loss: 0.3460838885186468
Epoch: 33, step: 1229, loss: 0.34601348638534546, mean loss: 0.3460838870784002
Epoch: 33, step: 1230, loss: 0.33968910574913025, mean loss: 0.3460837562602972
Epoch: 33, step: 1231, loss: 0.3166998028755188, mean loss: 0.3460831551647775
Epoch: 33, step: 1232, loss: 0.31587913632392883, mean loss: 0.34608253730615335
Epoch: 33, step: 1233, loss: 0.3587733507156372, mean loss: 0.3460827969063131
Epoch: 33, step: 1234, loss: 0.3586845099925995, mean loss: 0.34608305467858563
Epoch: 33, step: 1235, loss: 0.3239050507545471, mean loss: 0.3460826010293481
Epoch: 33, step: 1236, loss: 0.3498477339744568, mean loss: 0.34608267804325604
Epoch: 33, step: 1237, loss: 0.36542195081710815, mean loss: 0.3460830736102999
Epoch: 33, step: 1238, loss: 0.31784647703170776, mean loss: 0.346082496068491
Epoch: 33, step: 1239, loss: 0.3166195750236511, mean loss: 0.34608189345618134
Epoch: 33, step: 1240, loss: 0.29804161190986633, mean loss: 0.34608091089668314
Epoch: 33, step: 1241, loss: 0.31758031249046326, mean loss: 0.3460803279908377
Epoch: 33, step: 1242, loss: 0.3624197542667389, mean loss: 0.3460806621646034
Epoch: 33, step: 1243, loss: 0.30865678191185, mean loss: 0.3460798967874713
Epoch: 33, step: 1244, loss: 0.2968956232070923, mean loss: 0.3460788909123955
Epoch: 33, step: 1245, loss: 0.310774564743042, mean loss: 0.3460781689130056
Epoch: 33, step: 1246, loss: 0.34126630425453186, mean loss: 0.346078070508853
Epoch: 33, step: 1247, loss: 0.30353081226348877, mean loss: 0.3460772004217723
Epoch: 33, step: 1248, loss: 0.31358540058135986, mean loss: 0.3460765359813756
Epoch: 33, step: 1249, loss: 0.3611280620098114, mean loss: 0.3460768437709553
Epoch: 33, step: 1250, loss: 0.35194680094718933, mean loss: 0.3460769638036154
Epoch: 33, step: 1251, loss: 0.324746698141098, mean loss: 0.3460765276375418
Epoch: 33, step: 1252, loss: 0.3326602578163147, mean loss: 0.34607625330424624
Epoch: 33, step: 1253, loss: 0.3440280854701996, mean loss: 0.3460762114245621
Epoch: 33, step: 1254, loss: 0.34705886244773865, mean loss: 0.34607623151679884
Epoch: 33, step: 1255, loss: 0.33232128620147705, mean loss: 0.3460759502755844
Epoch: 33, step: 1256, loss: 0.3045825660228729, mean loss: 0.34607510189626256
Epoch: 33, step: 1257, loss: 0.3497783839702606, mean loss: 0.34607517761251844
Epoch: 33, step: 1258, loss: 0.32552289962768555, mean loss: 0.34607475741505805
Epoch: 33, step: 1259, loss: 0.36419159173965454, mean loss: 0.3460751278115727
Epoch: 33, step: 1260, loss: 0.32602718472480774, mean loss: 0.34607471794214967
Epoch: 33, step: 1261, loss: 0.35316234827041626, mean loss: 0.3460748628419806
Epoch: 33, step: 1262, loss: 0.3377467691898346, mean loss: 0.34607469258554285
Epoch: 33, step: 1263, loss: 0.33083540201187134, mean loss: 0.3460743810455442
Epoch: 33, step: 1264, loss: 0.3291236162185669, mean loss: 0.3460740345246041
Epoch: 33, step: 1265, loss: 0.3383195102214813, mean loss: 0.34607387600372624
Epoch: 33, step: 1266, loss: 0.31949061155319214, mean loss: 0.34607333258982875
Epoch: 33, step: 1267, loss: 0.334259957075119, mean loss: 0.34607309110627366
Epoch: 33, step: 1268, loss: 0.3472839891910553, mean loss: 0.34607311585838596
Epoch: 33, step: 1269, loss: 0.35931622982025146, mean loss: 0.3460733865569257
Epoch: 33, step: 1270, loss: 0.3196851313114166, mean loss: 0.34607284717350184
Epoch: 33, step: 1271, loss: 0.33983683586120605, mean loss: 0.34607271971026676
Epoch: 33, step: 1272, loss: 0.3514174818992615, mean loss: 0.34607282895425634
Epoch: 33, step: 1273, loss: 0.32271888852119446, mean loss: 0.3460723516223585
Epoch: 33, step: 1274, loss: 0.3135915696620941, mean loss: 0.34607168776023817
Epoch: 33, step: 1275, loss: 0.3385394215583801, mean loss: 0.3460715338143135
Epoch: 33, step: 1276, loss: 0.3406430184841156, mean loss: 0.34607142286752673
Epoch: 33, step: 1277, loss: 0.36451420187950134, mean loss: 0.34607179978923147
Epoch: 33, step: 1278, loss: 0.35299330949783325, mean loss: 0.34607194124372265
Epoch: 33, step: 1279, loss: 0.31037357449531555, mean loss: 0.3460712116931883
Epoch: 33, step: 1280, loss: 0.3367784321308136, mean loss: 0.34607102178495536
Epoch: 33, step: 1281, loss: 0.32375916838645935, mean loss: 0.3460705658268608
Epoch: 33, step: 1282, loss: 0.3673493564128876, mean loss: 0.3460710006647189
Epoch: 33, step: 1283, loss: 0.34196463227272034, mean loss: 0.3460709167516816
Epoch: 33, step: 1284, loss: 0.3820188641548157, mean loss: 0.34607165132771617
Epoch: 33, step: 1285, loss: 0.31167641282081604, mean loss: 0.3460709484947743
Epoch: 33, step: 1286, loss: 0.30988216400146484, mean loss: 0.34607020902759084
Epoch: 33, step: 1287, loss: 0.3207169473171234, mean loss: 0.3460696909797422
Epoch: 33, step: 1288, loss: 0.3409503996372223, mean loss: 0.3460695863784602
Epoch: 33, step: 1289, loss: 0.3007358908653259, mean loss: 0.3460686601045949
Epoch: 33, step: 1290, loss: 0.311997652053833, mean loss: 0.34606796396810857
Epoch: 33, step: 1291, loss: 0.31104421615600586, mean loss: 0.34606724837993
Epoch: 33, step: 1292, loss: 0.32595548033714294, mean loss: 0.3460668374744638
Epoch: 33, step: 1293, loss: 0.34658098220825195, mean loss: 0.34606684797878967
Epoch: 33, step: 1294, loss: 0.35474276542663574, mean loss: 0.3460670252300502
Epoch: 33, step: 1295, loss: 0.34235072135925293, mean loss: 0.34606694930654214
Epoch: 33, step: 1296, loss: 0.33784109354019165, mean loss: 0.346066781257026
Epoch: 33, step: 1297, loss: 0.35567986965179443, mean loss: 0.3460669776428972
Epoch: 33, step: 1298, loss: 0.30763205885887146, mean loss: 0.3460661924716283
Epoch: 33, step: 1299, loss: 0.35002845525741577, mean loss: 0.34606627341342405
Epoch: 33, step: 1300, loss: 0.3807584345340729, mean loss: 0.3460669820964694
Epoch: 33, step: 1301, loss: 0.32048845291137695, mean loss: 0.3460664595951583
Epoch: 33, step: 1302, loss: 0.3306698501110077, mean loss: 0.34606614508980676
Epoch: 33, step: 1303, loss: 0.3514500856399536, mean loss: 0.3460662550648977
Epoch: 33, step: 1304, loss: 0.322801798582077, mean loss: 0.34606577986305764
Epoch: 33, step: 1305, loss: 0.36830076575279236, mean loss: 0.34606623402756376
Epoch: 33, step: 1306, loss: 0.3849591612815857, mean loss: 0.3460670284254733
Epoch: 33, step: 1307, loss: 0.33266475796699524, mean loss: 0.3460667546862891
Epoch: 33, step: 1308, loss: 0.3158159852027893, mean loss: 0.3460661368318849
Epoch: 33, step: 1309, loss: 0.35510462522506714, mean loss: 0.3460663214339925
Epoch: 33, step: 1310, loss: 0.31793901324272156, mean loss: 0.34606574697351844
Epoch: 33, step: 1311, loss: 0.3432502746582031, mean loss: 0.3460656894726542
Epoch: 33, step: 1312, loss: 0.3569290339946747, mean loss: 0.3460659113320338
Epoch: 33, step: 1313, loss: 0.3595449924468994, mean loss: 0.3460661866063285
Epoch: 33, step: 1314, loss: 0.3398458957672119, mean loss: 0.3460660595760665
Epoch: 33, step: 1315, loss: 0.3071002960205078, mean loss: 0.3460652638367356
Epoch: 33, step: 1316, loss: 0.34803125262260437, mean loss: 0.3460653039843552
Epoch: 33, step: 1317, loss: 0.33998751640319824, mean loss: 0.34606517987188673
Epoch: 33, step: 1318, loss: 0.384876012802124, mean loss: 0.34606597239874815
Epoch: 33, step: 1319, loss: 0.3276427388191223, mean loss: 0.34606559619941835
Epoch: 33, step: 1320, loss: 0.3648688793182373, mean loss: 0.34606598015145557
Epoch: 33, step: 1321, loss: 0.3736180067062378, mean loss: 0.34606654273622617
Epoch: 33, step: 1322, loss: 0.3616831302642822, mean loss: 0.3460668616047821
Epoch: 33, step: 1323, loss: 0.33626872301101685, mean loss: 0.34606666154478144
Epoch: 33, step: 1324, loss: 0.3348134458065033, mean loss: 0.3460664317794684
Epoch: 33, step: 1325, loss: 0.29147249460220337, mean loss: 0.3460653171170245
Epoch: 33, step: 1326, loss: 0.3712764382362366, mean loss: 0.3460658318503004
Epoch: 33, step: 1327, loss: 0.3390199542045593, mean loss: 0.3460656879981639
Epoch: 33, step: 1328, loss: 0.41162967681884766, mean loss: 0.3460670265577854
Epoch: 33, step: 1329, loss: 0.3464832007884979, mean loss: 0.3460670350542582
Epoch: 33, step: 1330, loss: 0.3099246323108673, mean loss: 0.3460662971982113
Epoch: 33, step: 1331, loss: 0.36437103152275085, mean loss: 0.3460666708862385
Epoch: 33, step: 1332, loss: 0.31811657547950745, mean loss: 0.34606610030145935
Epoch: 33, step: 1333, loss: 0.32188880443573, mean loss: 0.3460656067462422
Epoch: 33, step: 1334, loss: 0.33383870124816895, mean loss: 0.3460653571513395
Epoch: 33, step: 1335, loss: 0.37013065814971924, mean loss: 0.3460658484002372
Epoch: 33, step: 1336, loss: 0.29107141494750977, mean loss: 0.3460647258128512
Epoch: 33, step: 1337, loss: 0.2938328981399536, mean loss: 0.346063659639598
Epoch: 33, step: 1338, loss: 0.3037741184234619, mean loss: 0.3460627964291876
Epoch: 33, step: 1339, loss: 0.38794392347335815, mean loss: 0.34606365128563443
Epoch: 33, step: 1340, loss: 0.2879844903945923, mean loss: 0.34606246582728545
Epoch: 33, step: 1341, loss: 0.31621477007865906, mean loss: 0.3460618566160402
Epoch: 33, step: 1342, loss: 0.3562704622745514, mean loss: 0.34606206497619246
Epoch: 33, step: 1343, loss: 0.31596532464027405, mean loss: 0.3460614507068575
Epoch: 33, step: 1344, loss: 0.3374614715576172, mean loss: 0.3460612751863328
Epoch: 33, step: 1345, loss: 0.31509843468666077, mean loss: 0.346060643265836
Epoch: 33, step: 1346, loss: 0.2971213757991791, mean loss: 0.3460596444848922
Epoch: 33, step: 1347, loss: 0.32706964015960693, mean loss: 0.3460592569337835
Epoch: 33, step: 1348, loss: 0.33967164158821106, mean loss: 0.346059126576947
Epoch: 33, step: 1349, loss: 0.3482944667339325, mean loss: 0.34605917219427196
Epoch: 33, step: 1350, loss: 0.32040515542030334, mean loss: 0.34605864867496144
Epoch: 33, step: 1351, loss: 0.3388878107070923, mean loss: 0.3460585023432749
Epoch: 33, step: 1352, loss: 0.36070436239242554, mean loss: 0.3460588012078816
Epoch: 33, step: 1353, loss: 0.34042471647262573, mean loss: 0.34605868624063807
Epoch: 33, step: 1354, loss: 0.3431026041507721, mean loss: 0.34605862592104925
Epoch: 33, step: 1355, loss: 0.33746400475502014, mean loss: 0.34605845054924944
Epoch: 33, step: 1356, loss: 0.33729657530784607, mean loss: 0.34605827176830634
Epoch: 33, step: 1357, loss: 0.30371055006980896, mean loss: 0.34605740770542737
Epoch: 33, step: 1358, loss: 0.3002227544784546, mean loss: 0.34605647251428195
Epoch: 33, step: 1359, loss: 0.3003242015838623, mean loss: 0.3460555394311405
Epoch: 33, step: 1360, loss: 0.33686262369155884, mean loss: 0.3460553518703762
Epoch: 33, step: 1361, loss: 0.36666616797447205, mean loss: 0.34605577237913093
Epoch: 33, step: 1362, loss: 0.3339507281780243, mean loss: 0.34605552541301443
Epoch: 33, step: 1363, loss: 0.31017860770225525, mean loss: 0.3460547934700221
Epoch: 33, step: 1364, loss: 0.2933492362499237, mean loss: 0.34605371821945147
Epoch: 33, step: 1365, loss: 0.3418882489204407, mean loss: 0.34605363324109045
Epoch: 33, step: 1366, loss: 0.3249532878398895, mean loss: 0.34605320278870666
Epoch: 33, step: 1367, loss: 0.3714103698730469, mean loss: 0.34605372007077695
Epoch: 33, step: 1368, loss: 0.35060620307922363, mean loss: 0.3460538129387929
Epoch: 33, step: 1369, loss: 0.30787524580955505, mean loss: 0.3460530341340291
Epoch: 33, step: 1370, loss: 0.31884583830833435, mean loss: 0.34605247914563947
Epoch: 33, step: 1371, loss: 0.33103179931640625, mean loss: 0.3460521727512239
Epoch: 33, step: 1372, loss: 0.3004304766654968, mean loss: 0.3460512421709876
Epoch: 33, step: 1373, loss: 0.31877854466438293, mean loss: 0.34605068588049875
Epoch: 33, step: 1374, loss: 0.326938658952713, mean loss: 0.3460502960539353
Epoch: 33, step: 1375, loss: 0.34674328565597534, mean loss: 0.3460503101885033
Epoch: 33, step: 1376, loss: 0.37261971831321716, mean loss: 0.34605085210059866
Epoch: 33, step: 1377, loss: 0.3044026494026184, mean loss: 0.3460500026573456
Epoch: 33, step: 1378, loss: 0.3628656268119812, mean loss: 0.34605034561637465
Epoch: 33, step: 1379, loss: 0.3874702453613281, mean loss: 0.346051190368776
Epoch: 33, step: 1380, loss: 0.3214781582355499, mean loss: 0.3460506892158355
Epoch: 33, step: 1381, loss: 0.33441081643104553, mean loss: 0.3460504518321265
Epoch: 33, step: 1382, loss: 0.32894691824913025, mean loss: 0.3460501030295654
Epoch: 33, step: 1383, loss: 0.35326457023620605, mean loss: 0.3460502501554975
Epoch: 33, step: 1384, loss: 0.2867186367511749, mean loss: 0.3460490402198692
Epoch: 33, step: 1385, loss: 0.31512242555618286, mean loss: 0.3460484095535561
Epoch: 33, step: 1386, loss: 0.2846255600452423, mean loss: 0.34604715702292727
Epoch: 33, step: 1387, loss: 0.3329519033432007, mean loss: 0.34604688999083755
Epoch: 33, step: 1388, loss: 0.3092622458934784, mean loss: 0.3460461399114326
Epoch: 33, step: 1389, loss: 0.346536248922348, mean loss: 0.34604614990509136
Epoch: 33, step: 1390, loss: 0.3456384837627411, mean loss: 0.3460461415926687
Epoch: 33, step: 1391, loss: 0.367912232875824, mean loss: 0.34604658743907774
Epoch: 33, step: 1392, loss: 0.3228670358657837, mean loss: 0.3460461148210418
Epoch: 33, step: 1393, loss: 0.31073617935180664, mean loss: 0.3460453948859713
Epoch: 33, step: 1394, loss: 0.3109322786331177, mean loss: 0.34604467897844887
Epoch: 33, step: 1395, loss: 0.3411199748516083, mean loss: 0.3460445785726397
Epoch: 33, step: 1396, loss: 0.3335378170013428, mean loss: 0.3460443235875927
Epoch: 33, step: 1397, loss: 0.31952860951423645, mean loss: 0.3460437830021885
Epoch: 33, step: 1398, loss: 0.32947972416877747, mean loss: 0.3460434453116453
Epoch: 33, step: 1399, loss: 0.3399813175201416, mean loss: 0.34604332172590385
Epoch: 33, step: 1400, loss: 0.309765487909317, mean loss: 0.346042582161885
Epoch: 33, step: 1401, loss: 0.3431909680366516, mean loss: 0.34604252402974234
Epoch: 33, step: 1402, loss: 0.32934728264808655, mean loss: 0.34604218369254164
Epoch: 33, step: 1403, loss: 0.3281867802143097, mean loss: 0.34604181971252945
Epoch: 33, step: 1404, loss: 0.30910640954971313, mean loss: 0.3460410668044804
Epoch: 33, step: 1405, loss: 0.2960968613624573, mean loss: 0.3460400487400374
Epoch: 33, step: 1406, loss: 0.343337744474411, mean loss: 0.3460399936572949
Epoch: 33, step: 1407, loss: 0.30951181054115295, mean loss: 0.3460392490958779
Epoch: 33, step: 1408, loss: 0.3015172779560089, mean loss: 0.3460383416139444
Epoch: 33, step: 1409, loss: 0.3228304088115692, mean loss: 0.34603786858119395
Epoch: 33, step: 1410, loss: 0.3122028410434723, mean loss: 0.34603717895708747
Epoch: 33, step: 1411, loss: 0.33130940794944763, mean loss: 0.3460368787823971
Epoch: 33, step: 1412, loss: 0.3176993131637573, mean loss: 0.3460363012308712
Epoch: 33, step: 1413, loss: 0.34707483649253845, mean loss: 0.346036322396959
Epoch: 33, step: 1414, loss: 0.3762456476688385, mean loss: 0.34603693807195995
Epoch: 33, step: 1415, loss: 0.391396701335907, mean loss: 0.34603786249853663
Epoch: 33, step: 1416, loss: 0.3400702178478241, mean loss: 0.34603774088112743
Epoch: 33, step: 1417, loss: 0.3468666970729828, mean loss: 0.3460377577744674
Epoch: 33, step: 1418, loss: 0.35687685012817383, mean loss: 0.3460379786603746
Epoch: 33, step: 1419, loss: 0.3551079034805298, mean loss: 0.3460381634892958
Epoch: 33, step: 1420, loss: 0.31069856882095337, mean loss: 0.34603744334594466
Epoch: 33, step: 1421, loss: 0.3357223570346832, mean loss: 0.34603723315141577
Epoch: 33, step: 1422, loss: 0.3155904710292816, mean loss: 0.34603661273853503
Epoch: 33, step: 1423, loss: 0.32273855805397034, mean loss: 0.3460361380043537
Epoch: 33, step: 1424, loss: 0.3128425180912018, mean loss: 0.3460354616463874
Epoch: 33, step: 1425, loss: 0.33257684111595154, mean loss: 0.34603518741719036
Epoch: 33, step: 1426, loss: 0.3303714096546173, mean loss: 0.34603486826281143
Epoch: 33, step: 1427, loss: 0.34040939807891846, mean loss: 0.34603475364442954
Epoch: 33, step: 1428, loss: 0.3362358510494232, mean loss: 0.34603455399685523
Epoch: 33, step: 1429, loss: 0.3361191749572754, mean loss: 0.34603435198024957
Epoch: 33, step: 1430, loss: 0.34508180618286133, mean loss: 0.3460343325734122
Epoch: 33, step: 1431, loss: 0.3666723370552063, mean loss: 0.3460347530363835
Epoch: 33, step: 1432, loss: 0.34186744689941406, mean loss: 0.3460346681365946
Epoch: 33, step: 1433, loss: 0.32852622866630554, mean loss: 0.3460343114475291
Epoch: 33, step: 1434, loss: 0.33477750420570374, mean loss: 0.34603408212393544
Epoch: 33, step: 1435, loss: 0.3202758729457855, mean loss: 0.346033557388579
Epoch: 33, step: 1436, loss: 0.34292295575141907, mean loss: 0.34603349402200734
Epoch: 33, step: 1437, loss: 0.33955565094947815, mean loss: 0.34603336206350105
Epoch: 33, step: 1438, loss: 0.3620913326740265, mean loss: 0.346033689169704
Epoch: 33, step: 1439, loss: 0.300719290971756, mean loss: 0.34603276611914185
Epoch: 33, step: 1440, loss: 0.3440699577331543, mean loss: 0.34603272613771097
Epoch: 33, step: 1441, loss: 0.3247210383415222, mean loss: 0.34603229203806957
Epoch: 33, step: 1442, loss: 0.3427805006504059, mean loss: 0.3460322258033942
Epoch: 33, step: 1443, loss: 0.334786981344223, mean loss: 0.3460319967573526
Valid: 33, mean loss: 0.18439370642105737
Epoch: 34, step: 0, loss: 0.3127899765968323, mean loss: 0.3460313196890967
Epoch: 34, step: 1, loss: 0.3081304430961609, mean loss: 0.3460305477457061
Epoch: 34, step: 2, loss: 0.3341834247112274, mean loss: 0.3460303064551903
Epoch: 34, step: 3, loss: 0.3213285505771637, mean loss: 0.3460298033644392
Epoch: 34, step: 4, loss: 0.2985265552997589, mean loss: 0.3460288359045491
Epoch: 34, step: 5, loss: 0.32536742091178894, mean loss: 0.34602841511893967
Epoch: 34, step: 6, loss: 0.30587857961654663, mean loss: 0.3460275974533082
Epoch: 34, step: 7, loss: 0.36880558729171753, mean loss: 0.3460280613256982
Epoch: 34, step: 8, loss: 0.34959033131599426, mean loss: 0.34602813386963444
Epoch: 34, step: 9, loss: 0.35192209482192993, mean loss: 0.3460282538949053
Epoch: 34, step: 10, loss: 0.28516826033592224, mean loss: 0.34602701456052204
Epoch: 34, step: 11, loss: 0.3086550831794739, mean loss: 0.34602625354538435
Epoch: 34, step: 12, loss: 0.3116399347782135, mean loss: 0.3460255533413735
Epoch: 34, step: 13, loss: 0.31899815797805786, mean loss: 0.3460250029973425
Epoch: 34, step: 14, loss: 0.318453311920166, mean loss: 0.34602444158154816
Epoch: 34, step: 15, loss: 0.31872016191482544, mean loss: 0.3460238856221153
Epoch: 34, step: 16, loss: 0.32421329617500305, mean loss: 0.34602344153217074
Epoch: 34, step: 17, loss: 0.296026349067688, mean loss: 0.34602242355170765
Epoch: 34, step: 18, loss: 0.3050789535045624, mean loss: 0.3460215899271521
Epoch: 34, step: 19, loss: 0.31913042068481445, mean loss: 0.3460210424239099
Epoch: 34, step: 20, loss: 0.3038412034511566, mean loss: 0.34602018366138426
Epoch: 34, step: 21, loss: 0.3552669584751129, mean loss: 0.34602037191772234
Epoch: 34, step: 22, loss: 0.31774815917015076, mean loss: 0.34601979633164065
Epoch: 34, step: 23, loss: 0.29461225867271423, mean loss: 0.3460187497612486
Epoch: 34, step: 24, loss: 0.3116241693496704, mean loss: 0.34601804956010423
Epoch: 34, step: 25, loss: 0.30539336800575256, mean loss: 0.34601722254407163
Epoch: 34, step: 26, loss: 0.3479437828063965, mean loss: 0.34601726176318004
Epoch: 34, step: 27, loss: 0.37116336822509766, mean loss: 0.34601777365362996
Epoch: 34, step: 28, loss: 0.3084658086299896, mean loss: 0.34601700923703915
Epoch: 34, step: 29, loss: 0.32408037781715393, mean loss: 0.3460165626989245
Epoch: 34, step: 30, loss: 0.35690322518348694, mean loss: 0.3460167843013526
Epoch: 34, step: 31, loss: 0.3530579209327698, mean loss: 0.3460169276236256
Epoch: 34, step: 32, loss: 0.32410767674446106, mean loss: 0.3460164816700976
Epoch: 34, step: 33, loss: 0.3265687823295593, mean loss: 0.3460160858284664
Epoch: 34, step: 34, loss: 0.30257487297058105, mean loss: 0.34601520163696087
Epoch: 34, step: 35, loss: 0.3280813694000244, mean loss: 0.34601483662368565
Epoch: 34, step: 36, loss: 0.32294613122940063, mean loss: 0.3460143671081789
Epoch: 34, step: 37, loss: 0.29811564087867737, mean loss: 0.346013392249095
Epoch: 34, step: 38, loss: 0.3042408525943756, mean loss: 0.34601254209055926
Epoch: 34, step: 39, loss: 0.31217747926712036, mean loss: 0.3460118534902901
Epoch: 34, step: 40, loss: 0.37414389848709106, mean loss: 0.34601242601293086
Epoch: 34, step: 41, loss: 0.32987308502197266, mean loss: 0.34601209756364537
Epoch: 34, step: 42, loss: 0.32568660378456116, mean loss: 0.3460116839310159
Epoch: 34, step: 43, loss: 0.27939045429229736, mean loss: 0.346010328187637
Epoch: 34, step: 44, loss: 0.3156212866306305, mean loss: 0.3460097097826074
Epoch: 34, step: 45, loss: 0.330030620098114, mean loss: 0.34600938462104125
Epoch: 34, step: 46, loss: 0.2913839519023895, mean loss: 0.34600827306023463
Epoch: 34, step: 47, loss: 0.3375425934791565, mean loss: 0.3460081007975051
Epoch: 34, step: 48, loss: 0.33933866024017334, mean loss: 0.3460079650880625
Epoch: 34, step: 49, loss: 0.3244116008281708, mean loss: 0.3460075256552651
Epoch: 34, step: 50, loss: 0.34462568163871765, mean loss: 0.34600749753871646
Epoch: 34, step: 51, loss: 0.33939632773399353, mean loss: 0.34600736302317553
Epoch: 34, step: 52, loss: 0.3010467290878296, mean loss: 0.34600644824090254
Epoch: 34, step: 53, loss: 0.34400132298469543, mean loss: 0.34600640744486477
Epoch: 34, step: 54, loss: 0.3137717843055725, mean loss: 0.34600575161643526
Epoch: 34, step: 55, loss: 0.34616997838020325, mean loss: 0.3460057549576373
Epoch: 34, step: 56, loss: 0.3270066976547241, mean loss: 0.3460053684286909
Epoch: 34, step: 57, loss: 0.33766070008277893, mean loss: 0.3460051986628866
Epoch: 34, step: 58, loss: 0.31151556968688965, mean loss: 0.3460044970124141
Epoch: 34, step: 59, loss: 0.3179894983768463, mean loss: 0.34600392709218797
Epoch: 34, step: 60, loss: 0.3029291331768036, mean loss: 0.34600305082240107
Epoch: 34, step: 61, loss: 0.34822750091552734, mean loss: 0.34600309607343027
Epoch: 34, step: 62, loss: 0.32035353779792786, mean loss: 0.3460025743061389
Epoch: 34, step: 63, loss: 0.39596590399742126, mean loss: 0.3460035906472636
Epoch: 34, step: 64, loss: 0.29243701696395874, mean loss: 0.3460025010320466
Epoch: 34, step: 65, loss: 0.33912193775177, mean loss: 0.3460023610751026
Epoch: 34, step: 66, loss: 0.3502236604690552, mean loss: 0.34600244693844284
Epoch: 34, step: 67, loss: 0.3193758726119995, mean loss: 0.34600190535162473
Epoch: 34, step: 68, loss: 0.327383428812027, mean loss: 0.3460015266579089
Epoch: 34, step: 69, loss: 0.32648560404777527, mean loss: 0.3460011297185075
Epoch: 34, step: 70, loss: 0.3407997488975525, mean loss: 0.34600102392842835
Epoch: 34, step: 71, loss: 0.3538540005683899, mean loss: 0.3460011836456558
Epoch: 34, step: 72, loss: 0.4255511164665222, mean loss: 0.34600280153361
Epoch: 34, step: 73, loss: 0.3059271574020386, mean loss: 0.3460019864910204
Epoch: 34, step: 74, loss: 0.33415111899375916, mean loss: 0.34600174547766904
Epoch: 34, step: 75, loss: 0.34929218888282776, mean loss: 0.3460018123946829
Epoch: 34, step: 76, loss: 0.36104169487953186, mean loss: 0.3460021182511994
Epoch: 34, step: 77, loss: 0.34849706292152405, mean loss: 0.34600216898826924
Epoch: 34, step: 78, loss: 0.32394686341285706, mean loss: 0.346001720481801
Epoch: 34, step: 79, loss: 0.31599369645118713, mean loss: 0.3460011102649466
Epoch: 34, step: 80, loss: 0.35091254115104675, mean loss: 0.346001210137466
Epoch: 34, step: 81, loss: 0.3602253198623657, mean loss: 0.34600149937472097
Epoch: 34, step: 82, loss: 0.31186285614967346, mean loss: 0.3460008052035661
Epoch: 34, step: 83, loss: 0.30583328008651733, mean loss: 0.3459999884584437
Epoch: 34, step: 84, loss: 0.3147878348827362, mean loss: 0.3459993538199944
Epoch: 34, step: 85, loss: 0.33676889538764954, mean loss: 0.3459991661403874
Epoch: 34, step: 86, loss: 0.3139782249927521, mean loss: 0.3459985150832915
Epoch: 34, step: 87, loss: 0.28179222345352173, mean loss: 0.3459972096528338
Epoch: 34, step: 88, loss: 0.379305362701416, mean loss: 0.34599788685427835
Epoch: 34, step: 89, loss: 0.33003902435302734, mean loss: 0.3459975623948285
Epoch: 34, step: 90, loss: 0.3542338013648987, mean loss: 0.3459977298423038
Epoch: 34, step: 91, loss: 0.3349744379520416, mean loss: 0.3459975057369958
Epoch: 34, step: 92, loss: 0.3476615250110626, mean loss: 0.34599753956608914
Epoch: 34, step: 93, loss: 0.34313660860061646, mean loss: 0.3459974814052645
Epoch: 34, step: 94, loss: 0.31947264075279236, mean loss: 0.3459969421838489
Epoch: 34, step: 95, loss: 0.35738784074783325, mean loss: 0.3459971737438295
Epoch: 34, step: 96, loss: 0.33901748061180115, mean loss: 0.3459970318599612
Epoch: 34, step: 97, loss: 0.36746886372566223, mean loss: 0.3459974683325365
Epoch: 34, step: 98, loss: 0.33999666571617126, mean loss: 0.34599734635260726
Epoch: 34, step: 99, loss: 0.3711712062358856, mean loss: 0.3459978580580281
Epoch: 34, step: 100, loss: 0.31891971826553345, mean loss: 0.34599730765577197
Epoch: 34, step: 101, loss: 0.29396286606788635, mean loss: 0.34599625000217654
Epoch: 34, step: 102, loss: 0.3257671296596527, mean loss: 0.34599583883283686
Epoch: 34, step: 103, loss: 0.30178505182266235, mean loss: 0.3459949402396049
Epoch: 34, step: 104, loss: 0.29132965207099915, mean loss: 0.3459938291790946
Epoch: 34, step: 105, loss: 0.3659282624721527, mean loss: 0.3459942343340333
Epoch: 34, step: 106, loss: 0.3403843939304352, mean loss: 0.345994120319839
Epoch: 34, step: 107, loss: 0.30476608872413635, mean loss: 0.34599328241983907
Epoch: 34, step: 108, loss: 0.3533698618412018, mean loss: 0.34599343233507984
Epoch: 34, step: 109, loss: 0.2987198531627655, mean loss: 0.34599247160713664
Epoch: 34, step: 110, loss: 0.3131166100502014, mean loss: 0.34599180349362524
Epoch: 34, step: 111, loss: 0.3463633060455322, mean loss: 0.34599181104326254
Epoch: 34, step: 112, loss: 0.3402981162071228, mean loss: 0.34599169533892316
Epoch: 34, step: 113, loss: 0.29369887709617615, mean loss: 0.34599063269274877
Epoch: 34, step: 114, loss: 0.2910623252391815, mean loss: 0.3459895165132878
Epoch: 34, step: 115, loss: 0.30240559577941895, mean loss: 0.3459886308772491
Epoch: 34, step: 116, loss: 0.3172127306461334, mean loss: 0.34598804615572776
Epoch: 34, step: 117, loss: 0.29770657420158386, mean loss: 0.345987065104158
Epoch: 34, step: 118, loss: 0.3508290946483612, mean loss: 0.3459871634893971
Epoch: 34, step: 119, loss: 0.3197751045227051, mean loss: 0.3459866308971717
Epoch: 34, step: 120, loss: 0.34129655361175537, mean loss: 0.3459865356033243
Epoch: 34, step: 121, loss: 0.30598488450050354, mean loss: 0.3459857228589807
Epoch: 34, step: 122, loss: 0.2950023114681244, mean loss: 0.34598468701080437
Epoch: 34, step: 123, loss: 0.3719348609447479, mean loss: 0.3459852142390436
Epoch: 34, step: 124, loss: 0.3114122748374939, mean loss: 0.34598451183682905
Epoch: 34, step: 125, loss: 0.35821035504341125, mean loss: 0.34598476021851216
Epoch: 34, step: 126, loss: 0.3292904794216156, mean loss: 0.3459844210624104
Epoch: 34, step: 127, loss: 0.3357475697994232, mean loss: 0.345984213097774
Epoch: 34, step: 128, loss: 0.3471604585647583, mean loss: 0.34598423699306025
Epoch: 34, step: 129, loss: 0.3807392716407776, mean loss: 0.3459849430230982
Epoch: 34, step: 130, loss: 0.3168761730194092, mean loss: 0.3459843517059348
Epoch: 34, step: 131, loss: 0.3264215588569641, mean loss: 0.34598395431435175
Epoch: 34, step: 132, loss: 0.32953178882598877, mean loss: 0.3459836201177301
Epoch: 34, step: 133, loss: 0.3294898271560669, mean loss: 0.3459832850823256
Epoch: 34, step: 134, loss: 0.3414870798587799, mean loss: 0.3459831937535851
Epoch: 34, step: 135, loss: 0.35704153776168823, mean loss: 0.34598341837058233
Epoch: 34, step: 136, loss: 0.37406209111213684, mean loss: 0.3459839886927797
Epoch: 34, step: 137, loss: 0.34029391407966614, mean loss: 0.34598387312072354
Epoch: 34, step: 138, loss: 0.33468538522720337, mean loss: 0.3459836436399092
Epoch: 34, step: 139, loss: 0.3124518096446991, mean loss: 0.345982962596892
Epoch: 34, step: 140, loss: 0.30456244945526123, mean loss: 0.3459821213491892
Epoch: 34, step: 141, loss: 0.30141976475715637, mean loss: 0.34598121630924866
Epoch: 34, step: 142, loss: 0.3807840347290039, mean loss: 0.3459819231233273
Epoch: 34, step: 143, loss: 0.3040177822113037, mean loss: 0.3459810708865094
Epoch: 34, step: 144, loss: 0.3417961597442627, mean loss: 0.3459809858981635
Epoch: 34, step: 145, loss: 0.3253941833972931, mean loss: 0.34598056782411085
Epoch: 34, step: 146, loss: 0.4048631489276886, mean loss: 0.345981763579469
Epoch: 34, step: 147, loss: 0.3415246605873108, mean loss: 0.3459816730688892
Epoch: 34, step: 148, loss: 0.3544312119483948, mean loss: 0.3459818446505499
Epoch: 34, step: 149, loss: 0.3323430120944977, mean loss: 0.3459815676974459
Epoch: 34, step: 150, loss: 0.3352973461151123, mean loss: 0.3459813507457213
Epoch: 34, step: 151, loss: 0.31089556217193604, mean loss: 0.34598063831499165
Epoch: 34, step: 152, loss: 0.3365853726863861, mean loss: 0.34598044754430335
Epoch: 34, step: 153, loss: 0.3435652554035187, mean loss: 0.345980398504869
Epoch: 34, step: 154, loss: 0.3197985589504242, mean loss: 0.3459798669047075
Epoch: 34, step: 155, loss: 0.3715769350528717, mean loss: 0.3459803866210266
Epoch: 34, step: 156, loss: 0.317630410194397, mean loss: 0.34597981102204933
Epoch: 34, step: 157, loss: 0.3468863368034363, mean loss: 0.34597982942716937
Epoch: 34, step: 158, loss: 0.3142748475074768, mean loss: 0.34597918573654063
Epoch: 34, step: 159, loss: 0.37358444929122925, mean loss: 0.3459797461812287
Epoch: 34, step: 160, loss: 0.37791961431503296, mean loss: 0.3459803946143069
Epoch: 34, step: 161, loss: 0.3116331100463867, mean loss: 0.3459796973207796
Epoch: 34, step: 162, loss: 0.3063669502735138, mean loss: 0.345978893147998
Epoch: 34, step: 163, loss: 0.3388686180114746, mean loss: 0.34597874880623725
Epoch: 34, step: 164, loss: 0.34334036707878113, mean loss: 0.34597869524699715
Epoch: 34, step: 165, loss: 0.31952887773513794, mean loss: 0.3459781583256884
Epoch: 34, step: 166, loss: 0.3396036624908447, mean loss: 0.3459780289284565
Epoch: 34, step: 167, loss: 0.3075725734233856, mean loss: 0.3459772493438612
Epoch: 34, step: 168, loss: 0.33387309312820435, mean loss: 0.3459770036490228
Epoch: 34, step: 169, loss: 0.3083908259868622, mean loss: 0.345976240725756
Epoch: 34, step: 170, loss: 0.33469337224960327, mean loss: 0.3459760117110306
Epoch: 34, step: 171, loss: 0.3360005021095276, mean loss: 0.3459758092366131
Epoch: 34, step: 172, loss: 0.331742525100708, mean loss: 0.3459755203473696
Epoch: 34, step: 173, loss: 0.34553080797195435, mean loss: 0.3459755113213421
Epoch: 34, step: 174, loss: 0.3332928419113159, mean loss: 0.34597525391496897
Epoch: 34, step: 175, loss: 0.3329947590827942, mean loss: 0.3459749904693034
Epoch: 34, step: 176, loss: 0.3245675563812256, mean loss: 0.3459745560034887
Epoch: 34, step: 177, loss: 0.3126258850097656, mean loss: 0.3459738792029246
Epoch: 34, step: 178, loss: 0.34231624007225037, mean loss: 0.34597380497381997
Epoch: 34, step: 179, loss: 0.33484092354774475, mean loss: 0.34597357904473836
Epoch: 34, step: 180, loss: 0.29248616099357605, mean loss: 0.34597249360085885
Epoch: 34, step: 181, loss: 0.3866638243198395, mean loss: 0.34597331935130976
Epoch: 34, step: 182, loss: 0.32478657364845276, mean loss: 0.3459728894167392
Epoch: 34, step: 183, loss: 0.3353990614414215, mean loss: 0.34597267485042477
Epoch: 34, step: 184, loss: 0.3066297769546509, mean loss: 0.34597187651236555
Epoch: 34, step: 185, loss: 0.3108125329017639, mean loss: 0.3459711630806134
Epoch: 34, step: 186, loss: 0.3401196300983429, mean loss: 0.3459710443473183
Epoch: 34, step: 187, loss: 0.3078014552593231, mean loss: 0.345970269864949
Epoch: 34, step: 188, loss: 0.3009597063064575, mean loss: 0.3459693565939019
Epoch: 34, step: 189, loss: 0.3572925627231598, mean loss: 0.34596958633878133
Epoch: 34, step: 190, loss: 0.31223559379577637, mean loss: 0.34596890189881657
Epoch: 34, step: 191, loss: 0.34955328702926636, mean loss: 0.34596897462209875
Epoch: 34, step: 192, loss: 0.3282310366630554, mean loss: 0.3459686147459
Epoch: 34, step: 193, loss: 0.3651115596294403, mean loss: 0.34596900311970574
Epoch: 34, step: 194, loss: 0.3221660852432251, mean loss: 0.34596852021374164
Epoch: 34, step: 195, loss: 0.34551340341567993, mean loss: 0.34596851098066533
Epoch: 34, step: 196, loss: 0.3390689492225647, mean loss: 0.34596837101024847
Epoch: 34, step: 197, loss: 0.2948216199874878, mean loss: 0.34596733342451746
Epoch: 34, step: 198, loss: 0.33416548371315, mean loss: 0.345967094011804
Epoch: 34, step: 199, loss: 0.3255411982536316, mean loss: 0.34596667965981276
Epoch: 34, step: 200, loss: 0.31638190150260925, mean loss: 0.3459660795263735
Epoch: 34, step: 201, loss: 0.35084792971611023, mean loss: 0.34596617855372125
Epoch: 34, step: 202, loss: 0.3577006757259369, mean loss: 0.3459664165808044
Epoch: 34, step: 203, loss: 0.3459756672382355, mean loss: 0.34596641676844453
Epoch: 34, step: 204, loss: 0.3135392963886261, mean loss: 0.34596575903086557
Epoch: 34, step: 205, loss: 0.3184749484062195, mean loss: 0.3459652014305527
Epoch: 34, step: 206, loss: 0.36626920104026794, mean loss: 0.34596561325132646
Epoch: 34, step: 207, loss: 0.3232370615005493, mean loss: 0.3459651522633387
Epoch: 34, step: 208, loss: 0.35702380537986755, mean loss: 0.3459653765540418
Epoch: 34, step: 209, loss: 0.3300343453884125, mean loss: 0.3459650534487166
Epoch: 34, step: 210, loss: 0.3316881060600281, mean loss: 0.34596476389657616
Epoch: 34, step: 211, loss: 0.31723496317863464, mean loss: 0.345964181236547
Epoch: 34, step: 212, loss: 0.32827746868133545, mean loss: 0.3459638225451812
Epoch: 34, step: 213, loss: 0.32191166281700134, mean loss: 0.3459633347706988
Epoch: 34, step: 214, loss: 0.36289164423942566, mean loss: 0.3459636780675183
Epoch: 34, step: 215, loss: 0.31271183490753174, mean loss: 0.3459630037520746
Epoch: 34, step: 216, loss: 0.323326051235199, mean loss: 0.34596254470572746
Epoch: 34, step: 217, loss: 0.35304558277130127, mean loss: 0.34596268833711136
Epoch: 34, step: 218, loss: 0.384231835603714, mean loss: 0.3459634643514532
Epoch: 34, step: 219, loss: 0.3536570072174072, mean loss: 0.345963620356459
Epoch: 34, step: 220, loss: 0.3142869174480438, mean loss: 0.34596297804847376
Epoch: 34, step: 221, loss: 0.3228507339954376, mean loss: 0.3459625094113828
Epoch: 34, step: 222, loss: 0.3236083388328552, mean loss: 0.345962056154614
Epoch: 34, step: 223, loss: 0.35275527834892273, mean loss: 0.34596219389229027
Epoch: 34, step: 224, loss: 0.328110933303833, mean loss: 0.34596183195192837
Epoch: 34, step: 225, loss: 0.32659026980400085, mean loss: 0.3459614391949001
Epoch: 34, step: 226, loss: 0.334518700838089, mean loss: 0.3459612071989072
Epoch: 34, step: 227, loss: 0.305376261472702, mean loss: 0.34596038437541915
Epoch: 34, step: 228, loss: 0.3384256660938263, mean loss: 0.3459602316188397
Epoch: 34, step: 229, loss: 0.32849881052970886, mean loss: 0.3459598776184933
Epoch: 34, step: 230, loss: 0.36319008469581604, mean loss: 0.34596022692429085
Epoch: 34, step: 231, loss: 0.33636951446533203, mean loss: 0.3459600324969381
Epoch: 34, step: 232, loss: 0.30323466658592224, mean loss: 0.3459591663661446
Epoch: 34, step: 233, loss: 0.3292272090911865, mean loss: 0.3459588271819306
Epoch: 34, step: 234, loss: 0.3434441089630127, mean loss: 0.3459587762055016
Epoch: 34, step: 235, loss: 0.3415956497192383, mean loss: 0.3459586877613581
Epoch: 34, step: 236, loss: 0.338596910238266, mean loss: 0.3459585385351297
Epoch: 34, step: 237, loss: 0.3739781081676483, mean loss: 0.3459591064917039
Epoch: 34, step: 238, loss: 0.3171454966068268, mean loss: 0.34595852245177516
Epoch: 34, step: 239, loss: 0.3229018747806549, mean loss: 0.34595805511255695
Epoch: 34, step: 240, loss: 0.35971158742904663, mean loss: 0.345958333879655
Epoch: 34, step: 241, loss: 0.2971096336841583, mean loss: 0.3459573437969562
Epoch: 34, step: 242, loss: 0.3779454529285431, mean loss: 0.34595799213010303
Epoch: 34, step: 243, loss: 0.3249448835849762, mean loss: 0.34595756624626545
Epoch: 34, step: 244, loss: 0.31839731335639954, mean loss: 0.345957007679295
Epoch: 34, step: 245, loss: 0.32954177260398865, mean loss: 0.34595667499648775
Epoch: 34, step: 246, loss: 0.2911629378795624, mean loss: 0.34595556453021864
Epoch: 34, step: 247, loss: 0.34336599707603455, mean loss: 0.3459555120503335
Epoch: 34, step: 248, loss: 0.3528273403644562, mean loss: 0.34595565131121736
Epoch: 34, step: 249, loss: 0.34759560227394104, mean loss: 0.34595568454493364
Epoch: 34, step: 250, loss: 0.3083301782608032, mean loss: 0.3459549220769764
Epoch: 34, step: 251, loss: 0.32191067934036255, mean loss: 0.3459544348385324
Epoch: 34, step: 252, loss: 0.3531184792518616, mean loss: 0.34595458000954726
Epoch: 34, step: 253, loss: 0.317310094833374, mean loss: 0.345953999574184
Epoch: 34, step: 254, loss: 0.317240834236145, mean loss: 0.345953417758915
Epoch: 34, step: 255, loss: 0.33641600608825684, mean loss: 0.3459532245061255
Epoch: 34, step: 256, loss: 0.3459465205669403, mean loss: 0.34595322437028897
Epoch: 34, step: 257, loss: 0.32031309604644775, mean loss: 0.3459527048555926
Epoch: 34, step: 258, loss: 0.3351192772388458, mean loss: 0.34595248535548895
Epoch: 34, step: 259, loss: 0.33172091841697693, mean loss: 0.3459521970102637
Epoch: 34, step: 260, loss: 0.32072895765304565, mean loss: 0.34595168597354437
Epoch: 34, step: 261, loss: 0.3382965326309204, mean loss: 0.3459515308790644
Epoch: 34, step: 262, loss: 0.30726978182792664, mean loss: 0.3459507471972829
Epoch: 34, step: 263, loss: 0.29272645711898804, mean loss: 0.3459496689093964
Epoch: 34, step: 264, loss: 0.36760053038597107, mean loss: 0.34595010753222566
Epoch: 34, step: 265, loss: 0.31780004501342773, mean loss: 0.34594953725422806
Epoch: 34, step: 266, loss: 0.3406100869178772, mean loss: 0.345949429087173
Epoch: 34, step: 267, loss: 0.36663416028022766, mean loss: 0.34594984811179
Epoch: 34, step: 268, loss: 0.3287369906902313, mean loss: 0.34594949942633635
Epoch: 34, step: 269, loss: 0.3500305116176605, mean loss: 0.3459495820948165
Epoch: 34, step: 270, loss: 0.29473936557769775, mean loss: 0.34594854475779957
Epoch: 34, step: 271, loss: 0.3417641520500183, mean loss: 0.345948459998589
Epoch: 34, step: 272, loss: 0.32668131589889526, mean loss: 0.345948069730524
Epoch: 34, step: 273, loss: 0.29535457491874695, mean loss: 0.34594704494837264
Epoch: 34, step: 274, loss: 0.33608540892601013, mean loss: 0.34594684520285357
Epoch: 34, step: 275, loss: 0.30783167481422424, mean loss: 0.34594607320312926
Epoch: 34, step: 276, loss: 0.3404991924762726, mean loss: 0.3459459628820889
Epoch: 34, step: 277, loss: 0.31372278928756714, mean loss: 0.34594531024763364
Epoch: 34, step: 278, loss: 0.3358629047870636, mean loss: 0.3459451060470167
Epoch: 34, step: 279, loss: 0.41469472646713257, mean loss: 0.34594649841619246
Epoch: 34, step: 280, loss: 0.31782859563827515, mean loss: 0.34594592896274695
Epoch: 34, step: 281, loss: 0.36441439390182495, mean loss: 0.3459463029848811
Epoch: 34, step: 282, loss: 0.41624629497528076, mean loss: 0.345947726666851
Epoch: 34, step: 283, loss: 0.32432031631469727, mean loss: 0.34594728868770247
Epoch: 34, step: 284, loss: 0.319340318441391, mean loss: 0.34594674987783136
Epoch: 34, step: 285, loss: 0.34307464957237244, mean loss: 0.34594669171695686
Epoch: 34, step: 286, loss: 0.3142283260822296, mean loss: 0.34594604942374596
Epoch: 34, step: 287, loss: 0.34084466099739075, mean loss: 0.34594594612331614
Epoch: 34, step: 288, loss: 0.3748222589492798, mean loss: 0.34594653084160765
Epoch: 34, step: 289, loss: 0.3284111022949219, mean loss: 0.34594617577279163
Epoch: 34, step: 290, loss: 0.3755330741405487, mean loss: 0.3459467748555132
Epoch: 34, step: 291, loss: 0.3658415675163269, mean loss: 0.34594717768196215
Epoch: 34, step: 292, loss: 0.32102397084236145, mean loss: 0.3459466730512379
Epoch: 34, step: 293, loss: 0.31208962202072144, mean loss: 0.3459459875470664
Epoch: 34, step: 294, loss: 0.3445162773132324, mean loss: 0.34594595860029
Epoch: 34, step: 295, loss: 0.4067573845386505, mean loss: 0.3459471898001997
Epoch: 34, step: 296, loss: 0.32019326090812683, mean loss: 0.34594666839172294
Epoch: 34, step: 297, loss: 0.4210902452468872, mean loss: 0.34594818970153496
Epoch: 34, step: 298, loss: 0.31851622462272644, mean loss: 0.3459476343423877
Epoch: 34, step: 299, loss: 0.3206949234008789, mean loss: 0.34594712311251197
Epoch: 34, step: 300, loss: 0.3445743918418884, mean loss: 0.3459470953227419
Epoch: 34, step: 301, loss: 0.3245338797569275, mean loss: 0.34594666183928985
Epoch: 34, step: 302, loss: 0.3652961254119873, mean loss: 0.34594705353676497
Epoch: 34, step: 303, loss: 0.3831765055656433, mean loss: 0.34594780716939716
Epoch: 34, step: 304, loss: 0.36599138379096985, mean loss: 0.3459482129016014
Epoch: 34, step: 305, loss: 0.31828898191452026, mean loss: 0.3459476530208073
Epoch: 34, step: 306, loss: 0.3403841257095337, mean loss: 0.34594754040563597
Epoch: 34, step: 307, loss: 0.34417569637298584, mean loss: 0.34594750454125184
Epoch: 34, step: 308, loss: 0.3331294357776642, mean loss: 0.34594724509243563
Epoch: 34, step: 309, loss: 0.3513079285621643, mean loss: 0.34594735359511686
Epoch: 34, step: 310, loss: 0.3128375709056854, mean loss: 0.3459466834515605
Epoch: 34, step: 311, loss: 0.3122923672199249, mean loss: 0.3459460023004062
Epoch: 34, step: 312, loss: 0.2991831302642822, mean loss: 0.3459450558559925
Epoch: 34, step: 313, loss: 0.3483315110206604, mean loss: 0.3459451041550244
Epoch: 34, step: 314, loss: 0.29406988620758057, mean loss: 0.34594405428317504
Epoch: 34, step: 315, loss: 0.33769944310188293, mean loss: 0.3459438874287433
Epoch: 34, step: 316, loss: 0.33979180455207825, mean loss: 0.34594376292541673
Epoch: 34, step: 317, loss: 0.3487173020839691, mean loss: 0.3459438190540272
Epoch: 34, step: 318, loss: 0.37490418553352356, mean loss: 0.3459444051183089
Epoch: 34, step: 319, loss: 0.3094225823879242, mean loss: 0.3459436660495309
Epoch: 34, step: 320, loss: 0.3385017514228821, mean loss: 0.34594351545530977
Epoch: 34, step: 321, loss: 0.320125550031662, mean loss: 0.3459429930147937
Epoch: 34, step: 322, loss: 0.32849618792533875, mean loss: 0.3459426399763856
Epoch: 34, step: 323, loss: 0.3377630114555359, mean loss: 0.34594247446387
Epoch: 34, step: 324, loss: 0.3601180613040924, mean loss: 0.345942761297136
Epoch: 34, step: 325, loss: 0.32596075534820557, mean loss: 0.34594235698314735
Epoch: 34, step: 326, loss: 0.33799365162849426, mean loss: 0.34594219615306104
Epoch: 34, step: 327, loss: 0.3190321624279022, mean loss: 0.3459416516800575
Epoch: 34, step: 328, loss: 0.3497205972671509, mean loss: 0.34594172813823837
Epoch: 34, step: 329, loss: 0.4161039888858795, mean loss: 0.34594314767979034
Epoch: 34, step: 330, loss: 0.34307143092155457, mean loss: 0.3459430895796273
Epoch: 34, step: 331, loss: 0.33102500438690186, mean loss: 0.345942787765166
Epoch: 34, step: 332, loss: 0.36066681146621704, mean loss: 0.3459430856474558
Epoch: 34, step: 333, loss: 0.3856024146080017, mean loss: 0.34594388798063325
Epoch: 34, step: 334, loss: 0.37401044368743896, mean loss: 0.3459444557732271
Epoch: 34, step: 335, loss: 0.3401995003223419, mean loss: 0.3459443395538661
Epoch: 34, step: 336, loss: 0.2917778789997101, mean loss: 0.3459432437987925
Epoch: 34, step: 337, loss: 0.3234628140926361, mean loss: 0.3459427890423555
Epoch: 34, step: 338, loss: 0.32091599702835083, mean loss: 0.3459422827858163
Epoch: 34, step: 339, loss: 0.35005998611450195, mean loss: 0.3459423660794349
Epoch: 34, step: 340, loss: 0.35014089941978455, mean loss: 0.3459424510063791
Epoch: 34, step: 341, loss: 0.31839850544929504, mean loss: 0.34594189386520113
Epoch: 34, step: 342, loss: 0.380164235830307, mean loss: 0.3459425860786756
Epoch: 34, step: 343, loss: 0.35282018780708313, mean loss: 0.3459427251887429
Epoch: 34, step: 344, loss: 0.3643512725830078, mean loss: 0.3459430975223809
Epoch: 34, step: 345, loss: 0.2748273015022278, mean loss: 0.3459416591542724
Epoch: 34, step: 346, loss: 0.33883151412010193, mean loss: 0.3459415153493853
Epoch: 34, step: 347, loss: 0.35117197036743164, mean loss: 0.3459416211348197
Epoch: 34, step: 348, loss: 0.3205314576625824, mean loss: 0.3459411072271754
Epoch: 34, step: 349, loss: 0.3216211497783661, mean loss: 0.34594061537834137
Epoch: 34, step: 350, loss: 0.379920095205307, mean loss: 0.3459413025682584
Epoch: 34, step: 351, loss: 0.3096957206726074, mean loss: 0.3459405695642563
Epoch: 34, step: 352, loss: 0.33822786808013916, mean loss: 0.3459404135914058
Epoch: 34, step: 353, loss: 0.3344449996948242, mean loss: 0.3459401811260085
Epoch: 34, step: 354, loss: 0.3181193768978119, mean loss: 0.3459396185326488
Epoch: 34, step: 355, loss: 0.3639874756336212, mean loss: 0.3459399834897203
Epoch: 34, step: 356, loss: 0.3641207814216614, mean loss: 0.34594035112763777
Epoch: 34, step: 357, loss: 0.34857067465782166, mean loss: 0.3459404043149134
Epoch: 34, step: 358, loss: 0.3419640362262726, mean loss: 0.3459403239111506
Epoch: 34, step: 359, loss: 0.32596075534820557, mean loss: 0.34593991992440354
Epoch: 34, step: 360, loss: 0.3310222327709198, mean loss: 0.3459396182949648
Epoch: 34, step: 361, loss: 0.3143017590045929, mean loss: 0.34593897860352374
Epoch: 34, step: 362, loss: 0.31766653060913086, mean loss: 0.3459384069694835
Epoch: 34, step: 363, loss: 0.33286717534065247, mean loss: 0.34593814269063944
Epoch: 34, step: 364, loss: 0.3080979883670807, mean loss: 0.3459373776403104
Epoch: 34, step: 365, loss: 0.31246480345726013, mean loss: 0.34593670090717826
Epoch: 34, step: 366, loss: 0.37354978919029236, mean loss: 0.3459372591646289
Epoch: 34, step: 367, loss: 0.3611154556274414, mean loss: 0.3459375660180266
Epoch: 34, step: 368, loss: 0.3289817273616791, mean loss: 0.3459372232334586
Epoch: 34, step: 369, loss: 0.3441970646381378, mean loss: 0.34593718805457624
Epoch: 34, step: 370, loss: 0.3406602144241333, mean loss: 0.3459370813779306
Epoch: 34, step: 371, loss: 0.34792011976242065, mean loss: 0.34593712146522715
Epoch: 34, step: 372, loss: 0.2993156313896179, mean loss: 0.3459361790267288
Epoch: 34, step: 373, loss: 0.2982237935066223, mean loss: 0.3459352145556247
Epoch: 34, step: 374, loss: 0.3496842384338379, mean loss: 0.3459352903378785
Epoch: 34, step: 375, loss: 0.3547952473163605, mean loss: 0.345935469428212
Epoch: 34, step: 376, loss: 0.32086119055747986, mean loss: 0.34593496260067236
Epoch: 34, step: 377, loss: 0.30255064368247986, mean loss: 0.34593408568918516
Epoch: 34, step: 378, loss: 0.35154473781585693, mean loss: 0.3459341990929674
Epoch: 34, step: 379, loss: 0.3224177658557892, mean loss: 0.34593372378305476
Epoch: 34, step: 380, loss: 0.34976568818092346, mean loss: 0.34593380123246353
Epoch: 34, step: 381, loss: 0.37986287474632263, mean loss: 0.3459344869730657
Epoch: 34, step: 382, loss: 0.32421350479125977, mean loss: 0.34593404797910504
Epoch: 34, step: 383, loss: 0.2863694727420807, mean loss: 0.34593284416796444
Epoch: 34, step: 384, loss: 0.342805951833725, mean loss: 0.34593278097416613
Epoch: 34, step: 385, loss: 0.32363539934158325, mean loss: 0.3459323303581516
Epoch: 34, step: 386, loss: 0.3318161368370056, mean loss: 0.3459320450845521
Epoch: 34, step: 387, loss: 0.34704580903053284, mean loss: 0.34593206759210904
Epoch: 34, step: 388, loss: 0.32285723090171814, mean loss: 0.3459316012924891
Epoch: 34, step: 389, loss: 0.31341663002967834, mean loss: 0.34593094423854936
Epoch: 34, step: 390, loss: 0.34120723605155945, mean loss: 0.34593084878503255
Epoch: 34, step: 391, loss: 0.32117587327957153, mean loss: 0.3459303485632514
Epoch: 34, step: 392, loss: 0.33286914229393005, mean loss: 0.34593008464184927
Epoch: 34, step: 393, loss: 0.3088636100292206, mean loss: 0.3459293356728735
Epoch: 34, step: 394, loss: 0.36413121223449707, mean loss: 0.34592970345442087
Epoch: 34, step: 395, loss: 0.36022335290908813, mean loss: 0.34592999226169185
Epoch: 34, step: 396, loss: 0.31170928478240967, mean loss: 0.3459293008364907
Epoch: 34, step: 397, loss: 0.31739455461502075, mean loss: 0.3459287243070887
Epoch: 34, step: 398, loss: 0.34629008173942566, mean loss: 0.3459287316079763
Epoch: 34, step: 399, loss: 0.3061921298503876, mean loss: 0.3459279287834702
Epoch: 34, step: 400, loss: 0.3914181888103485, mean loss: 0.34592884783432226
Epoch: 34, step: 401, loss: 0.32038742303848267, mean loss: 0.3459283318250937
Epoch: 34, step: 402, loss: 0.3450830578804016, mean loss: 0.3459283147485074
Epoch: 34, step: 403, loss: 0.31940868496894836, mean loss: 0.3459277789984108
Epoch: 34, step: 404, loss: 0.3224465847015381, mean loss: 0.34592730464043225
Epoch: 34, step: 405, loss: 0.3381001353263855, mean loss: 0.34592714652218826
Epoch: 34, step: 406, loss: 0.3537353277206421, mean loss: 0.3459273042536631
Epoch: 34, step: 407, loss: 0.3341982960700989, mean loss: 0.3459270673231487
Epoch: 34, step: 408, loss: 0.362083375453949, mean loss: 0.3459273936802466
Epoch: 34, step: 409, loss: 0.32558631896972656, mean loss: 0.3459269827992481
Epoch: 34, step: 410, loss: 0.3113657534122467, mean loss: 0.34592628469131614
Epoch: 34, step: 411, loss: 0.34261420369148254, mean loss: 0.345926217791401
Epoch: 34, step: 412, loss: 0.33876028656959534, mean loss: 0.34592607305143
Epoch: 34, step: 413, loss: 0.35941118001937866, mean loss: 0.3459263454228089
Epoch: 34, step: 414, loss: 0.3138263523578644, mean loss: 0.34592569708217624
Epoch: 34, step: 415, loss: 0.3580209016799927, mean loss: 0.34592594137052246
Epoch: 34, step: 416, loss: 0.34132641553878784, mean loss: 0.3459258484752054
Epoch: 34, step: 417, loss: 0.32429298758506775, mean loss: 0.3459254115712815
Epoch: 34, step: 418, loss: 0.32035550475120544, mean loss: 0.3459248951639944
Epoch: 34, step: 419, loss: 0.33928194642066956, mean loss: 0.34592476100637376
Epoch: 34, step: 420, loss: 0.31078749895095825, mean loss: 0.34592405140639687
Epoch: 34, step: 421, loss: 0.2983799874782562, mean loss: 0.34592309126939763
Epoch: 34, step: 422, loss: 0.3855351209640503, mean loss: 0.34592389120537564
Epoch: 34, step: 423, loss: 0.31978997588157654, mean loss: 0.3459233634607205
Epoch: 34, step: 424, loss: 0.32312050461769104, mean loss: 0.34592290299225575
Epoch: 34, step: 425, loss: 0.35490113496780396, mean loss: 0.34592308429010266
Epoch: 34, step: 426, loss: 0.33442583680152893, mean loss: 0.34592285213034885
Epoch: 34, step: 427, loss: 0.3619728088378906, mean loss: 0.34592317621476665
Epoch: 34, step: 428, loss: 0.30366358160972595, mean loss: 0.3459223229165414
Epoch: 34, step: 429, loss: 0.34911441802978516, mean loss: 0.3459223873694573
Epoch: 34, step: 430, loss: 0.3196500539779663, mean loss: 0.3459218569045918
Epoch: 34, step: 431, loss: 0.3452566862106323, mean loss: 0.3459218434743969
Epoch: 34, step: 432, loss: 0.30181649327278137, mean loss: 0.34592095297892556
Epoch: 34, step: 433, loss: 0.289331316947937, mean loss: 0.3459198104463992
Epoch: 34, step: 434, loss: 0.2946080267429352, mean loss: 0.3459187744934868
Epoch: 34, step: 435, loss: 0.2974589467048645, mean loss: 0.34591779613953805
Epoch: 34, step: 436, loss: 0.3315329849720001, mean loss: 0.345917505730898
Epoch: 34, step: 437, loss: 0.33434709906578064, mean loss: 0.34591727214575113
Epoch: 34, step: 438, loss: 0.33084598183631897, mean loss: 0.3459169678903699
Epoch: 34, step: 439, loss: 0.33500927686691284, mean loss: 0.345916747693119
Epoch: 34, step: 440, loss: 0.30496007204055786, mean loss: 0.34591592090353435
Epoch: 34, step: 441, loss: 0.3106175363063812, mean loss: 0.34591520835186496
Epoch: 34, step: 442, loss: 0.34397023916244507, mean loss: 0.3459151690904913
Epoch: 34, step: 443, loss: 0.3146466910839081, mean loss: 0.3459145379141084
Epoch: 34, step: 444, loss: 0.3237399160861969, mean loss: 0.3459140903126908
Epoch: 34, step: 445, loss: 0.30378228425979614, mean loss: 0.3459132398866674
Epoch: 34, step: 446, loss: 0.3607923984527588, mean loss: 0.34591354021483817
Epoch: 34, step: 447, loss: 0.3238879144191742, mean loss: 0.34591309564787154
Epoch: 34, step: 448, loss: 0.33386293053627014, mean loss: 0.3459128524312985
Epoch: 34, step: 449, loss: 0.3181499242782593, mean loss: 0.34591229208478913
Epoch: 34, step: 450, loss: 0.3022473156452179, mean loss: 0.34591141080082766
Epoch: 34, step: 451, loss: 0.3479325771331787, mean loss: 0.34591145159291475
Epoch: 34, step: 452, loss: 0.3459774851799011, mean loss: 0.3459114529256074
Epoch: 34, step: 453, loss: 0.3464735746383667, mean loss: 0.34591146427014247
Epoch: 34, step: 454, loss: 0.3261973559856415, mean loss: 0.3459110664152398
Epoch: 34, step: 455, loss: 0.3283015489578247, mean loss: 0.34591071104073506
Epoch: 34, step: 456, loss: 0.3790755569934845, mean loss: 0.34591138032101987
Epoch: 34, step: 457, loss: 0.3352808654308319, mean loss: 0.3459111657971693
Epoch: 34, step: 458, loss: 0.3255991041660309, mean loss: 0.34591075590792236
Epoch: 34, step: 459, loss: 0.30895692110061646, mean loss: 0.3459100102094235
Epoch: 34, step: 460, loss: 0.34189993143081665, mean loss: 0.3459099292909099
Epoch: 34, step: 461, loss: 0.35139501094818115, mean loss: 0.34591003997095465
Epoch: 34, step: 462, loss: 0.3115174472332001, mean loss: 0.34590934599826073
Epoch: 34, step: 463, loss: 0.3187851309776306, mean loss: 0.3459087986977155
Epoch: 34, step: 464, loss: 0.30967092514038086, mean loss: 0.3459080675205085
Epoch: 34, step: 465, loss: 0.35198062658309937, mean loss: 0.34590819004500434
Epoch: 34, step: 466, loss: 0.3142715096473694, mean loss: 0.3459075517325455
Epoch: 34, step: 467, loss: 0.3349766433238983, mean loss: 0.3459073311912573
Epoch: 34, step: 468, loss: 0.34406349062919617, mean loss: 0.34590729399080206
Epoch: 34, step: 469, loss: 0.33494722843170166, mean loss: 0.34590707287016376
Epoch: 34, step: 470, loss: 0.33697089552879333, mean loss: 0.34590689258535046
Epoch: 34, step: 471, loss: 0.33484968543052673, mean loss: 0.3459066695138698
Epoch: 34, step: 472, loss: 0.3187616467475891, mean loss: 0.34590612189292186
Epoch: 34, step: 473, loss: 0.34317415952682495, mean loss: 0.3459060667797008
Epoch: 34, step: 474, loss: 0.34786126017570496, mean loss: 0.34590610622198353
Epoch: 34, step: 475, loss: 0.3083939552307129, mean loss: 0.3459053495014358
Epoch: 34, step: 476, loss: 0.35367482900619507, mean loss: 0.3459055062294834
Epoch: 34, step: 477, loss: 0.29120856523513794, mean loss: 0.34590440289021296
Epoch: 34, step: 478, loss: 0.3362894356250763, mean loss: 0.3459042089423105
Epoch: 34, step: 479, loss: 0.3113388121128082, mean loss: 0.3459035117219452
Epoch: 34, step: 480, loss: 0.31067192554473877, mean loss: 0.3459028010781754
Epoch: 34, step: 481, loss: 0.3030988574028015, mean loss: 0.34590193771249556
Epoch: 34, step: 482, loss: 0.3477051854133606, mean loss: 0.34590197408369505
Epoch: 34, step: 483, loss: 0.3239712417125702, mean loss: 0.34590153175347377
Epoch: 34, step: 484, loss: 0.3214415907859802, mean loss: 0.3459010384205243
Epoch: 34, step: 485, loss: 0.3137631416320801, mean loss: 0.34590039024383135
Epoch: 34, step: 486, loss: 0.3032074272632599, mean loss: 0.3458995292034953
Epoch: 34, step: 487, loss: 0.3224811851978302, mean loss: 0.34589905690710926
Epoch: 34, step: 488, loss: 0.3542814254760742, mean loss: 0.3458992259575997
Epoch: 34, step: 489, loss: 0.3836461305618286, mean loss: 0.3458999871987687
Epoch: 34, step: 490, loss: 0.36965319514274597, mean loss: 0.34590046621964
Epoch: 34, step: 491, loss: 0.33512672781944275, mean loss: 0.34590024895460814
Epoch: 34, step: 492, loss: 0.3513842523097992, mean loss: 0.34590035954371773
Epoch: 34, step: 493, loss: 0.35836029052734375, mean loss: 0.3459006108026607
Epoch: 34, step: 494, loss: 0.3820798993110657, mean loss: 0.34590134035617864
Epoch: 34, step: 495, loss: 0.30365613102912903, mean loss: 0.34590048850085264
Epoch: 34, step: 496, loss: 0.3144955337047577, mean loss: 0.34589985524707095
Epoch: 34, step: 497, loss: 0.3102702498435974, mean loss: 0.345899136821346
Epoch: 34, step: 498, loss: 0.3456677496433258, mean loss: 0.3458991321558116
Epoch: 34, step: 499, loss: 0.36177200078964233, mean loss: 0.3458994521991343
Epoch: 34, step: 500, loss: 0.33838748931884766, mean loss: 0.3458993007391089
Epoch: 34, step: 501, loss: 0.3391397297382355, mean loss: 0.3458991644519401
Epoch: 34, step: 502, loss: 0.30217793583869934, mean loss: 0.3458982829577847
Epoch: 34, step: 503, loss: 0.35156360268592834, mean loss: 0.3458983971779405
Epoch: 34, step: 504, loss: 0.32119324803352356, mean loss: 0.34589789910029806
Epoch: 34, step: 505, loss: 0.334777295589447, mean loss: 0.3458976749036223
Epoch: 34, step: 506, loss: 0.32429739832878113, mean loss: 0.3458972394405137
Epoch: 34, step: 507, loss: 0.31312549114227295, mean loss: 0.3458965787730615
Epoch: 34, step: 508, loss: 0.36119136214256287, mean loss: 0.34589688710454763
Epoch: 34, step: 509, loss: 0.32891157269477844, mean loss: 0.3458965447001125
Epoch: 34, step: 510, loss: 0.3174467086791992, mean loss: 0.34589597119564697
Epoch: 34, step: 511, loss: 0.29806989431381226, mean loss: 0.34589500711572274
Epoch: 34, step: 512, loss: 0.3201107084751129, mean loss: 0.34589448736530165
Epoch: 34, step: 513, loss: 0.33318933844566345, mean loss: 0.3458942312647389
Epoch: 34, step: 514, loss: 0.3795376420021057, mean loss: 0.3458949094089153
Epoch: 34, step: 515, loss: 0.307371586561203, mean loss: 0.34589413291688015
Epoch: 34, step: 516, loss: 0.317317396402359, mean loss: 0.3458935569239647
Epoch: 34, step: 517, loss: 0.327572762966156, mean loss: 0.3458931876573472
Epoch: 34, step: 518, loss: 0.35897964239120483, mean loss: 0.34589345141739425
Epoch: 34, step: 519, loss: 0.34593847393989563, mean loss: 0.34589345232481367
Epoch: 34, step: 520, loss: 0.3013029992580414, mean loss: 0.3458925536317636
Epoch: 34, step: 521, loss: 0.31337210536003113, mean loss: 0.34589189821541727
Epoch: 34, step: 522, loss: 0.3467007577419281, mean loss: 0.34589191451682455
Epoch: 34, step: 523, loss: 0.33915308117866516, mean loss: 0.3458917787080108
Epoch: 34, step: 524, loss: 0.35215210914611816, mean loss: 0.3458919048709345
Epoch: 34, step: 525, loss: 0.3231058418750763, mean loss: 0.34589144567817737
Epoch: 34, step: 526, loss: 0.31451165676116943, mean loss: 0.345890813314376
Epoch: 34, step: 527, loss: 0.3492295742034912, mean loss: 0.3458908805955482
Epoch: 34, step: 528, loss: 0.3308245539665222, mean loss: 0.3458905769919889
Epoch: 34, step: 529, loss: 0.31865617632865906, mean loss: 0.3458900281990041
Epoch: 34, step: 530, loss: 0.3357766568660736, mean loss: 0.3458898244113213
Epoch: 34, step: 531, loss: 0.30548396706581116, mean loss: 0.34588901023671537
Epoch: 34, step: 532, loss: 0.341119647026062, mean loss: 0.3458889141363867
Epoch: 34, step: 533, loss: 0.35811835527420044, mean loss: 0.3458891605486603
Epoch: 34, step: 534, loss: 0.3439076244831085, mean loss: 0.34588912062328975
Epoch: 34, step: 535, loss: 0.3245055377483368, mean loss: 0.34588868978063025
Epoch: 34, step: 536, loss: 0.3556158244609833, mean loss: 0.34588888576182586
Epoch: 34, step: 537, loss: 0.3265058100223541, mean loss: 0.3458884952417038
Epoch: 34, step: 538, loss: 0.30531829595565796, mean loss: 0.3458876778709113
Epoch: 34, step: 539, loss: 0.32022541761398315, mean loss: 0.3458871608618804
Epoch: 34, step: 540, loss: 0.33264926075935364, mean loss: 0.3458868941676785
Epoch: 34, step: 541, loss: 0.3228060007095337, mean loss: 0.3458864291833226
Epoch: 34, step: 542, loss: 0.28925958275794983, mean loss: 0.34588528841001076
Epoch: 34, step: 543, loss: 0.29593023657798767, mean loss: 0.34588428206327765
Epoch: 34, step: 544, loss: 0.31195640563964844, mean loss: 0.3458835985984719
Epoch: 34, step: 545, loss: 0.30605608224868774, mean loss: 0.34588279630371443
Epoch: 34, step: 546, loss: 0.3625819683074951, mean loss: 0.34588313268894505
Epoch: 34, step: 547, loss: 0.3201334476470947, mean loss: 0.34588261400219455
Epoch: 34, step: 548, loss: 0.3126623034477234, mean loss: 0.34588194484496715
Epoch: 34, step: 549, loss: 0.3439611494541168, mean loss: 0.3458819061551353
Epoch: 34, step: 550, loss: 0.3255656957626343, mean loss: 0.3458814969418819
Epoch: 34, step: 551, loss: 0.3438156545162201, mean loss: 0.3458814553321005
Epoch: 34, step: 552, loss: 0.31975769996643066, mean loss: 0.34588092916328816
Epoch: 34, step: 553, loss: 0.30800434947013855, mean loss: 0.3458801662915924
Epoch: 34, step: 554, loss: 0.3715464472770691, mean loss: 0.34588068322541016
Epoch: 34, step: 555, loss: 0.37408584356307983, mean loss: 0.3458812512822928
Epoch: 34, step: 556, loss: 0.32885581254959106, mean loss: 0.34588090839387253
Epoch: 34, step: 557, loss: 0.3299330770969391, mean loss: 0.3458805872146866
Epoch: 34, step: 558, loss: 0.29796072840690613, mean loss: 0.3458796221586236
Epoch: 34, step: 559, loss: 0.3221975862979889, mean loss: 0.34587914523668345
Epoch: 34, step: 560, loss: 0.32005247473716736, mean loss: 0.3458786251353785
Epoch: 34, step: 561, loss: 0.3045416474342346, mean loss: 0.34587779270198
Epoch: 34, step: 562, loss: 0.3215855658054352, mean loss: 0.34587730352122936
Epoch: 34, step: 563, loss: 0.33625152707099915, mean loss: 0.3458771096876319
Epoch: 34, step: 564, loss: 0.35101455450057983, mean loss: 0.34587721313792114
Epoch: 34, step: 565, loss: 0.36719125509262085, mean loss: 0.3458776423200313
Epoch: 34, step: 566, loss: 0.29715287685394287, mean loss: 0.34587666121205424
Epoch: 34, step: 567, loss: 0.3336605131626129, mean loss: 0.34587641523613505
Epoch: 34, step: 568, loss: 0.3870322108268738, mean loss: 0.3458772439041224
Epoch: 34, step: 569, loss: 0.3349643051624298, mean loss: 0.3458770241775742
Epoch: 34, step: 570, loss: 0.3241099715232849, mean loss: 0.3458765859177104
Epoch: 34, step: 571, loss: 0.33461835980415344, mean loss: 0.34587635924810195
Epoch: 34, step: 572, loss: 0.304584264755249, mean loss: 0.3458755279027056
Epoch: 34, step: 573, loss: 0.33134394884109497, mean loss: 0.3458752353402119
Epoch: 34, step: 574, loss: 0.3330308496952057, mean loss: 0.3458749767509819
Epoch: 34, step: 575, loss: 0.3625097870826721, mean loss: 0.3458753116440873
Epoch: 34, step: 576, loss: 0.36296284198760986, mean loss: 0.3458756556444566
Epoch: 34, step: 577, loss: 0.33188802003860474, mean loss: 0.34587537405578633
Epoch: 34, step: 578, loss: 0.34393030405044556, mean loss: 0.34587533489987277
Epoch: 34, step: 579, loss: 0.34989216923713684, mean loss: 0.3458754157605366
Epoch: 34, step: 580, loss: 0.4173133373260498, mean loss: 0.34587685380875943
Epoch: 34, step: 581, loss: 0.3108607232570648, mean loss: 0.3458761489468376
Epoch: 34, step: 582, loss: 0.30155637860298157, mean loss: 0.3458752568240021
Epoch: 34, step: 583, loss: 0.30668509006500244, mean loss: 0.3458744679720142
Epoch: 34, step: 584, loss: 0.33000698685646057, mean loss: 0.34587414858470084
Epoch: 34, step: 585, loss: 0.2993324100971222, mean loss: 0.34587321179192904
Epoch: 34, step: 586, loss: 0.3469700813293457, mean loss: 0.34587323386929025
Epoch: 34, step: 587, loss: 0.34220778942108154, mean loss: 0.3458731600941424
Epoch: 34, step: 588, loss: 0.3335377871990204, mean loss: 0.34587291182257357
Epoch: 34, step: 589, loss: 0.3197457790374756, mean loss: 0.3458723859776115
Epoch: 34, step: 590, loss: 0.33097267150878906, mean loss: 0.34587208610612663
Epoch: 34, step: 591, loss: 0.3170112669467926, mean loss: 0.34587150526529664
Epoch: 34, step: 592, loss: 0.3338238596916199, mean loss: 0.34587126280427766
Epoch: 34, step: 593, loss: 0.33016136288642883, mean loss: 0.3458709466460986
Epoch: 34, step: 594, loss: 0.3528123199939728, mean loss: 0.3458710863368544
Epoch: 34, step: 595, loss: 0.35234785079956055, mean loss: 0.34587121667502685
Epoch: 34, step: 596, loss: 0.3297213315963745, mean loss: 0.3458708916818673
Epoch: 34, step: 597, loss: 0.3329208493232727, mean loss: 0.3458706310861745
Epoch: 34, step: 598, loss: 0.31277984380722046, mean loss: 0.34586996520857555
Epoch: 34, step: 599, loss: 0.37137266993522644, mean loss: 0.3458704783827692
Epoch: 34, step: 600, loss: 0.34538960456848145, mean loss: 0.34587046870665566
Epoch: 34, step: 601, loss: 0.3448176085948944, mean loss: 0.34587044752149504
Epoch: 34, step: 602, loss: 0.34251558780670166, mean loss: 0.3458703800179293
Epoch: 34, step: 603, loss: 0.3668726086616516, mean loss: 0.3458708025979825
Epoch: 34, step: 604, loss: 0.32874950766563416, mean loss: 0.345870458112058
Epoch: 34, step: 605, loss: 0.3125723600387573, mean loss: 0.3458697881571654
Epoch: 34, step: 606, loss: 0.3635587692260742, mean loss: 0.3458701440507949
Epoch: 34, step: 607, loss: 0.3286832869052887, mean loss: 0.34586979826660963
Epoch: 34, step: 608, loss: 0.34307047724723816, mean loss: 0.3458697419479089
Epoch: 34, step: 609, loss: 0.34744733572006226, mean loss: 0.34586977368640676
Epoch: 34, step: 610, loss: 0.3581360876560211, mean loss: 0.3458700204587722
Epoch: 34, step: 611, loss: 0.38242870569229126, mean loss: 0.3458707559276149
Epoch: 34, step: 612, loss: 0.3630249500274658, mean loss: 0.3458711010199342
Epoch: 34, step: 613, loss: 0.32181304693222046, mean loss: 0.34587061705183747
Epoch: 34, step: 614, loss: 0.35268324613571167, mean loss: 0.3458707540965375
Epoch: 34, step: 615, loss: 0.34530121088027954, mean loss: 0.3458707426396817
Epoch: 34, step: 616, loss: 0.33716559410095215, mean loss: 0.3458705675315905
Epoch: 34, step: 617, loss: 0.3347221612930298, mean loss: 0.34587034328075095
Epoch: 34, step: 618, loss: 0.2980273365974426, mean loss: 0.34586938093524794
Epoch: 34, step: 619, loss: 0.33173081278800964, mean loss: 0.3458690965485687
Epoch: 34, step: 620, loss: 0.3946724832057953, mean loss: 0.3458700781722921
Epoch: 34, step: 621, loss: 0.3373900055885315, mean loss: 0.34586990760886266
Epoch: 34, step: 622, loss: 0.3047696352005005, mean loss: 0.3458690809576346
Epoch: 34, step: 623, loss: 0.3259032368659973, mean loss: 0.3458686793919851
Epoch: 34, step: 624, loss: 0.35108333826065063, mean loss: 0.345868784270384
Epoch: 34, step: 625, loss: 0.3481433689594269, mean loss: 0.34586883001642577
Epoch: 34, step: 626, loss: 0.33280396461486816, mean loss: 0.3458685672634663
Epoch: 34, step: 627, loss: 0.35207730531692505, mean loss: 0.34586869212747673
Epoch: 34, step: 628, loss: 0.36576247215270996, mean loss: 0.3458690922034953
Epoch: 34, step: 629, loss: 0.33923831582069397, mean loss: 0.3458689588572301
Epoch: 34, step: 630, loss: 0.33106935024261475, mean loss: 0.34586866124006815
Epoch: 34, step: 631, loss: 0.3050542175769806, mean loss: 0.3458678404862944
Epoch: 34, step: 632, loss: 0.33162397146224976, mean loss: 0.3458675540564642
Epoch: 34, step: 633, loss: 0.3044546842575073, mean loss: 0.34586672130219515
Epoch: 34, step: 634, loss: 0.3272188603878021, mean loss: 0.3458663463276136
Epoch: 34, step: 635, loss: 0.32592639327049255, mean loss: 0.3458659453794704
Epoch: 34, step: 636, loss: 0.34650561213493347, mean loss: 0.3458659582414887
Epoch: 34, step: 637, loss: 0.3039344251155853, mean loss: 0.3458651151254488
Epoch: 34, step: 638, loss: 0.3124648928642273, mean loss: 0.3458644435617158
Epoch: 34, step: 639, loss: 0.32474085688591003, mean loss: 0.3458640188474912
Epoch: 34, step: 640, loss: 0.31832846999168396, mean loss: 0.34586346522445693
Epoch: 34, step: 641, loss: 0.33255594968795776, mean loss: 0.3458631976721722
Epoch: 34, step: 642, loss: 0.3266438841819763, mean loss: 0.3458628112688772
Epoch: 34, step: 643, loss: 0.31551986932754517, mean loss: 0.34586220123787714
Epoch: 34, step: 644, loss: 0.30675408244132996, mean loss: 0.34586141500280354
Epoch: 34, step: 645, loss: 0.3809312582015991, mean loss: 0.3458621200376473
Epoch: 34, step: 646, loss: 0.3039504885673523, mean loss: 0.345861277474242
Epoch: 34, step: 647, loss: 0.3439294695854187, mean loss: 0.34586123863924906
Epoch: 34, step: 648, loss: 0.34858065843582153, mean loss: 0.3458612933064477
Epoch: 34, step: 649, loss: 0.3604755699634552, mean loss: 0.3458615870843727
Epoch: 34, step: 650, loss: 0.33873358368873596, mean loss: 0.34586144379928224
Epoch: 34, step: 651, loss: 0.35410192608833313, mean loss: 0.34586160944377625
Epoch: 34, step: 652, loss: 0.36888739466667175, mean loss: 0.34586207228293325
Epoch: 34, step: 653, loss: 0.3754061460494995, mean loss: 0.34586266613366223
Epoch: 34, step: 654, loss: 0.33643630146980286, mean loss: 0.34586247666280406
Epoch: 34, step: 655, loss: 0.34442856907844543, mean loss: 0.34586244784169967
Epoch: 34, step: 656, loss: 0.3255726993083954, mean loss: 0.3458620400321498
Epoch: 34, step: 657, loss: 0.33785319328308105, mean loss: 0.34586187906324783
Epoch: 34, step: 658, loss: 0.33429375290870667, mean loss: 0.345861646561466
Epoch: 34, step: 659, loss: 0.3418995141983032, mean loss: 0.34586156693021824
Epoch: 34, step: 660, loss: 0.3026883602142334, mean loss: 0.34586069924915397
Epoch: 34, step: 661, loss: 0.2879224419593811, mean loss: 0.34585953484830806
Epoch: 34, step: 662, loss: 0.33041009306907654, mean loss: 0.345859224362933
Epoch: 34, step: 663, loss: 0.314107209444046, mean loss: 0.34585858625973925
Epoch: 34, step: 664, loss: 0.31272241473197937, mean loss: 0.3458579203532758
Epoch: 34, step: 665, loss: 0.33423012495040894, mean loss: 0.34585768668510725
Epoch: 34, step: 666, loss: 0.32741621136665344, mean loss: 0.3458573160990228
Epoch: 34, step: 667, loss: 0.3186201751232147, mean loss: 0.3458567687728236
Epoch: 34, step: 668, loss: 0.35411104559898376, mean loss: 0.3458569346379261
Epoch: 34, step: 669, loss: 0.3468519449234009, mean loss: 0.3458569546317027
Epoch: 34, step: 670, loss: 0.35184141993522644, mean loss: 0.34585707488137224
Epoch: 34, step: 671, loss: 0.34707021713256836, mean loss: 0.34585709925732167
Epoch: 34, step: 672, loss: 0.3369966447353363, mean loss: 0.34585692122572526
Epoch: 34, step: 673, loss: 0.3514970541000366, mean loss: 0.3458570345496729
Epoch: 34, step: 674, loss: 0.3343539834022522, mean loss: 0.34585680343012243
Epoch: 34, step: 675, loss: 0.3116956055164337, mean loss: 0.34585611707639113
Epoch: 34, step: 676, loss: 0.33515235781669617, mean loss: 0.34585590202487204
Epoch: 34, step: 677, loss: 0.32617682218551636, mean loss: 0.3458555066562089
Epoch: 34, step: 678, loss: 0.35110652446746826, mean loss: 0.345855612151293
Epoch: 34, step: 679, loss: 0.3343844711780548, mean loss: 0.34585538169603397
Epoch: 34, step: 680, loss: 0.33811450004577637, mean loss: 0.34585522618482095
Epoch: 34, step: 681, loss: 0.3354237377643585, mean loss: 0.34585501662460516
Epoch: 34, step: 682, loss: 0.3310030996799469, mean loss: 0.345854718267528
Epoch: 34, step: 683, loss: 0.3622966408729553, mean loss: 0.34585504855926374
Epoch: 34, step: 684, loss: 0.35155606269836426, mean loss: 0.3458551630811524
Epoch: 34, step: 685, loss: 0.31241682171821594, mean loss: 0.3458544913857331
Epoch: 34, step: 686, loss: 0.3220141530036926, mean loss: 0.345854012500604
Epoch: 34, step: 687, loss: 0.34061199426651, mean loss: 0.34585390720536385
Epoch: 34, step: 688, loss: 0.31904512643814087, mean loss: 0.34585336871423666
Epoch: 34, step: 689, loss: 0.3152662217617035, mean loss: 0.34585275434178353
Epoch: 34, step: 690, loss: 0.3394923806190491, mean loss: 0.34585262659008686
Epoch: 34, step: 691, loss: 0.30911076068878174, mean loss: 0.34585188862379174
Epoch: 34, step: 692, loss: 0.2843838632106781, mean loss: 0.34585065405339643
Epoch: 34, step: 693, loss: 0.2956615090370178, mean loss: 0.3458496460368265
Epoch: 34, step: 694, loss: 0.379428505897522, mean loss: 0.34585032043299974
Epoch: 34, step: 695, loss: 0.37266528606414795, mean loss: 0.34585085897263723
Epoch: 34, step: 696, loss: 0.32579565048217773, mean loss: 0.3458504562009928
Epoch: 34, step: 697, loss: 0.3431962728500366, mean loss: 0.3458504028977163
Epoch: 34, step: 698, loss: 0.3482276499271393, mean loss: 0.34585045063839365
Epoch: 34, step: 699, loss: 0.31024685502052307, mean loss: 0.3458497356493259
Epoch: 34, step: 700, loss: 0.3058643639087677, mean loss: 0.34584893268184314
Epoch: 34, step: 701, loss: 0.3640285134315491, mean loss: 0.34584929774832673
Epoch: 34, step: 702, loss: 0.292377233505249, mean loss: 0.34584822399053555
Epoch: 34, step: 703, loss: 0.32419276237487793, mean loss: 0.3458477891419087
Epoch: 34, step: 704, loss: 0.3478533923625946, mean loss: 0.34584782941425707
Epoch: 34, step: 705, loss: 0.3173183798789978, mean loss: 0.34584725655675064
Epoch: 34, step: 706, loss: 0.3046432137489319, mean loss: 0.3458464292161726
Epoch: 34, step: 707, loss: 0.31195971369743347, mean loss: 0.3458457488146884
Epoch: 34, step: 708, loss: 0.3327343761920929, mean loss: 0.3458454855605448
Epoch: 34, step: 709, loss: 0.35196471214294434, mean loss: 0.34584560842177803
Epoch: 34, step: 710, loss: 0.3163205683231354, mean loss: 0.3458450156328106
Epoch: 34, step: 711, loss: 0.3486519455909729, mean loss: 0.345845071987813
Epoch: 34, step: 712, loss: 0.3788759410381317, mean loss: 0.34584573513842937
Epoch: 34, step: 713, loss: 0.31756749749183655, mean loss: 0.3458451674163325
Epoch: 34, step: 714, loss: 0.34345683455467224, mean loss: 0.34584511946843216
Epoch: 34, step: 715, loss: 0.28825390338897705, mean loss: 0.34584396329690564
Epoch: 34, step: 716, loss: 0.3222411274909973, mean loss: 0.3458434894680697
Epoch: 34, step: 717, loss: 0.33080753684043884, mean loss: 0.3458431876261653
Epoch: 34, step: 718, loss: 0.3177992105484009, mean loss: 0.34584262466366245
Epoch: 34, step: 719, loss: 0.33501967787742615, mean loss: 0.34584240740521566
Epoch: 34, step: 720, loss: 0.305147647857666, mean loss: 0.3458415905202256
Epoch: 34, step: 721, loss: 0.31407421827316284, mean loss: 0.3458409528516671
Epoch: 34, step: 722, loss: 0.3618205487728119, mean loss: 0.34584127360471156
Epoch: 34, step: 723, loss: 0.36915674805641174, mean loss: 0.34584174159897996
Epoch: 34, step: 724, loss: 0.32126376032829285, mean loss: 0.3458412482732484
Epoch: 34, step: 725, loss: 0.29540175199508667, mean loss: 0.34584023587920004
Epoch: 34, step: 726, loss: 0.32592129707336426, mean loss: 0.345839836085153
Epoch: 34, step: 727, loss: 0.2839078903198242, mean loss: 0.34583859307082726
Epoch: 34, step: 728, loss: 0.3779797852039337, mean loss: 0.3458392381524556
Epoch: 34, step: 729, loss: 0.3230036199092865, mean loss: 0.3458387798451814
Epoch: 34, step: 730, loss: 0.3261144757270813, mean loss: 0.34583838398943817
Epoch: 34, step: 731, loss: 0.3061493933200836, mean loss: 0.34583758746959653
Epoch: 34, step: 732, loss: 0.344233900308609, mean loss: 0.3458375552857847
Epoch: 34, step: 733, loss: 0.351129949092865, mean loss: 0.3458376614947714
Epoch: 34, step: 734, loss: 0.3601949214935303, mean loss: 0.34583794961381376
Epoch: 34, step: 735, loss: 0.3337049186229706, mean loss: 0.3458377061351055
Epoch: 34, step: 736, loss: 0.30914756655693054, mean loss: 0.3458369698731992
Epoch: 34, step: 737, loss: 0.3113463222980499, mean loss: 0.34583627776243997
Epoch: 34, step: 738, loss: 0.35295867919921875, mean loss: 0.3458364206821036
Epoch: 34, step: 739, loss: 0.3304956555366516, mean loss: 0.3458361128571348
Epoch: 34, step: 740, loss: 0.3415183126926422, mean loss: 0.34583602621869014
Epoch: 34, step: 741, loss: 0.35131457448005676, mean loss: 0.34583613614581926
Epoch: 34, step: 742, loss: 0.2972329258918762, mean loss: 0.3458351609414561
Epoch: 34, step: 743, loss: 0.34832605719566345, mean loss: 0.34583521091931035
Epoch: 34, step: 744, loss: 0.37594133615493774, mean loss: 0.34583581496267296
Epoch: 34, step: 745, loss: 0.33562225103378296, mean loss: 0.3458356100438509
Epoch: 34, step: 746, loss: 0.33343350887298584, mean loss: 0.3458353612205222
Epoch: 34, step: 747, loss: 0.3595212697982788, mean loss: 0.3458356357953673
Epoch: 34, step: 748, loss: 0.3099213242530823, mean loss: 0.34583491527552496
Epoch: 34, step: 749, loss: 0.35246050357818604, mean loss: 0.3458350481966882
Epoch: 34, step: 750, loss: 0.28859108686447144, mean loss: 0.34583389980337803
Epoch: 34, step: 751, loss: 0.33659127354621887, mean loss: 0.3458337143871877
Epoch: 34, step: 752, loss: 0.31225454807281494, mean loss: 0.3458330407695361
Epoch: 34, step: 753, loss: 0.4303544759750366, mean loss: 0.34583473628478595
Epoch: 34, step: 754, loss: 0.3365393280982971, mean loss: 0.34583454982096
Epoch: 34, step: 755, loss: 0.3103221356868744, mean loss: 0.345833837464101
Epoch: 34, step: 756, loss: 0.3710680603981018, mean loss: 0.3458343436367072
Epoch: 34, step: 757, loss: 0.34307408332824707, mean loss: 0.3458342882698297
Epoch: 34, step: 758, loss: 0.29531165957450867, mean loss: 0.3458332748784207
Epoch: 34, step: 759, loss: 0.3108329474925995, mean loss: 0.3458325728500312
Epoch: 34, step: 760, loss: 0.3423548638820648, mean loss: 0.3458325030963563
Epoch: 34, step: 761, loss: 0.3709222674369812, mean loss: 0.34583300632080055
Epoch: 34, step: 762, loss: 0.37656140327453613, mean loss: 0.34583362262672235
Epoch: 34, step: 763, loss: 0.31855419278144836, mean loss: 0.34583307550618797
Epoch: 34, step: 764, loss: 0.32076719403266907, mean loss: 0.3458325727910103
Epoch: 34, step: 765, loss: 0.37859734892845154, mean loss: 0.3458332299001543
Epoch: 34, step: 766, loss: 0.3551083207130432, mean loss: 0.345833415911642
Epoch: 34, step: 767, loss: 0.3203423023223877, mean loss: 0.3458329046988715
Epoch: 34, step: 768, loss: 0.34053897857666016, mean loss: 0.34583279853370313
Epoch: 34, step: 769, loss: 0.32253313064575195, mean loss: 0.34583233128812724
Epoch: 34, step: 770, loss: 0.3456890285015106, mean loss: 0.34583232841442746
Epoch: 34, step: 771, loss: 0.30848976969718933, mean loss: 0.34583157958634697
Epoch: 34, step: 772, loss: 0.3679000437259674, mean loss: 0.345832022115055
Epoch: 34, step: 773, loss: 0.34239858388900757, mean loss: 0.3458319532672863
Epoch: 34, step: 774, loss: 0.3277607560157776, mean loss: 0.34583159090845544
Epoch: 34, step: 775, loss: 0.3241247534751892, mean loss: 0.34583115565746425
Epoch: 34, step: 776, loss: 0.3151674270629883, mean loss: 0.3458305408212083
Epoch: 34, step: 777, loss: 0.3350241780281067, mean loss: 0.3458303241479358
Epoch: 34, step: 778, loss: 0.3493088483810425, mean loss: 0.3458303938927826
Epoch: 34, step: 779, loss: 0.3649163544178009, mean loss: 0.3458307765610103
Epoch: 34, step: 780, loss: 0.3283468186855316, mean loss: 0.34583042601952074
Epoch: 34, step: 781, loss: 0.33324533700942993, mean loss: 0.345830173702086
Epoch: 34, step: 782, loss: 0.3306591510772705, mean loss: 0.34582986954557476
Epoch: 34, step: 783, loss: 0.3128003180027008, mean loss: 0.34582920736531125
Epoch: 34, step: 784, loss: 0.3174479305744171, mean loss: 0.34582863838560374
Epoch: 34, step: 785, loss: 0.3717396855354309, mean loss: 0.3458291578324413
Epoch: 34, step: 786, loss: 0.3416253328323364, mean loss: 0.3458290735587408
Epoch: 34, step: 787, loss: 0.31361067295074463, mean loss: 0.3458284276923186
Epoch: 34, step: 788, loss: 0.33627432584762573, mean loss: 0.34582823616977987
Epoch: 34, step: 789, loss: 0.30780529975891113, mean loss: 0.34582747397324354
Epoch: 34, step: 790, loss: 0.3364560306072235, mean loss: 0.3458272861198275
Epoch: 34, step: 791, loss: 0.3380700349807739, mean loss: 0.34582713062649967
Epoch: 34, step: 792, loss: 0.3573656380176544, mean loss: 0.34582736191009705
Epoch: 34, step: 793, loss: 0.3501295745372772, mean loss: 0.3458274481440643
Epoch: 34, step: 794, loss: 0.3073786795139313, mean loss: 0.3458266774886629
Epoch: 34, step: 795, loss: 0.33089226484298706, mean loss: 0.3458263781538468
Epoch: 34, step: 796, loss: 0.3299507200717926, mean loss: 0.3458260599597498
Epoch: 34, step: 797, loss: 0.33026355504989624, mean loss: 0.34582574804839955
Epoch: 34, step: 798, loss: 0.3263765573501587, mean loss: 0.3458253582460005
Epoch: 34, step: 799, loss: 0.3895677924156189, mean loss: 0.345826234918162
Epoch: 34, step: 800, loss: 0.3424222767353058, mean loss: 0.3458261666984658
Epoch: 34, step: 801, loss: 0.31791165471076965, mean loss: 0.3458256072669858
Epoch: 34, step: 802, loss: 0.3296588659286499, mean loss: 0.3458252832777007
Epoch: 34, step: 803, loss: 0.36985331773757935, mean loss: 0.34582576480143734
Epoch: 34, step: 804, loss: 0.41200658679008484, mean loss: 0.3458270910438371
Epoch: 34, step: 805, loss: 0.34749943017959595, mean loss: 0.3458271245563042
Epoch: 34, step: 806, loss: 0.3221302926540375, mean loss: 0.3458266496984419
Epoch: 34, step: 807, loss: 0.3224647343158722, mean loss: 0.34582618156131095
Epoch: 34, step: 808, loss: 0.33559370040893555, mean loss: 0.34582597652211344
Epoch: 34, step: 809, loss: 0.35411497950553894, mean loss: 0.3458261426144267
Epoch: 34, step: 810, loss: 0.34004515409469604, mean loss: 0.34582602677920277
Epoch: 34, step: 811, loss: 0.34158068895339966, mean loss: 0.34582594171592984
Epoch: 34, step: 812, loss: 0.3029782176017761, mean loss: 0.34582508319894667
Epoch: 34, step: 813, loss: 0.3129747211933136, mean loss: 0.345824425006961
Epoch: 34, step: 814, loss: 0.356711208820343, mean loss: 0.34582464313089784
Epoch: 34, step: 815, loss: 0.3236635625362396, mean loss: 0.34582419912784057
Epoch: 34, step: 816, loss: 0.30096420645713806, mean loss: 0.34582330036413833
Epoch: 34, step: 817, loss: 0.3253333270549774, mean loss: 0.3458228898586026
Epoch: 34, step: 818, loss: 0.3381960988044739, mean loss: 0.345822737063029
Epoch: 34, step: 819, loss: 0.30529212951660156, mean loss: 0.34582192508675796
Epoch: 34, step: 820, loss: 0.3145388066768646, mean loss: 0.3458212983840633
Epoch: 34, step: 821, loss: 0.34487977623939514, mean loss: 0.3458212795226877
Epoch: 34, step: 822, loss: 0.33870306611061096, mean loss: 0.3458211369274151
Epoch: 34, step: 823, loss: 0.3013650178909302, mean loss: 0.3458202463801588
Epoch: 34, step: 824, loss: 0.3070950210094452, mean loss: 0.34581947064999774
Epoch: 34, step: 825, loss: 0.3489193022251129, mean loss: 0.3458195327434951
Epoch: 34, step: 826, loss: 0.3354160189628601, mean loss: 0.345819324352297
Epoch: 34, step: 827, loss: 0.352895051240921, mean loss: 0.3458194660822643
Epoch: 34, step: 828, loss: 0.351848840713501, mean loss: 0.3458195868509099
Epoch: 34, step: 829, loss: 0.2788649797439575, mean loss: 0.3458182457739739
Epoch: 34, step: 830, loss: 0.33019137382507324, mean loss: 0.3458179327795631
Epoch: 34, step: 831, loss: 0.3276533782482147, mean loss: 0.3458175689645789
Epoch: 34, step: 832, loss: 0.34536778926849365, mean loss: 0.34581755995619307
Epoch: 34, step: 833, loss: 0.3780781030654907, mean loss: 0.34581820607161684
Epoch: 34, step: 834, loss: 0.3047095239162445, mean loss: 0.3458173827618062
Epoch: 34, step: 835, loss: 0.35801687836647034, mean loss: 0.34581762708399644
Epoch: 34, step: 836, loss: 0.35084837675094604, mean loss: 0.3458177278339948
Epoch: 34, step: 837, loss: 0.3402004539966583, mean loss: 0.345817615340026
Epoch: 34, step: 838, loss: 0.31315672397613525, mean loss: 0.34581696127191014
Epoch: 34, step: 839, loss: 0.3275272250175476, mean loss: 0.3458165950083677
Epoch: 34, step: 840, loss: 0.4085443913936615, mean loss: 0.3458178511470301
Epoch: 34, step: 841, loss: 0.3374437689781189, mean loss: 0.3458176834574517
Epoch: 34, step: 842, loss: 0.3786722421646118, mean loss: 0.3458183413512563
Epoch: 34, step: 843, loss: 0.31352555751800537, mean loss: 0.34581769471962165
Epoch: 34, step: 844, loss: 0.30760276317596436, mean loss: 0.34581692951805293
Epoch: 34, step: 845, loss: 0.357119083404541, mean loss: 0.34581715582364514
Epoch: 34, step: 846, loss: 0.31408122181892395, mean loss: 0.34581652038055993
Epoch: 34, step: 847, loss: 0.314998596906662, mean loss: 0.34581590333099493
Epoch: 34, step: 848, loss: 0.3474105894565582, mean loss: 0.34581593525983917
Epoch: 34, step: 849, loss: 0.3477333188056946, mean loss: 0.3458159736489703
Epoch: 34, step: 850, loss: 0.31702378392219543, mean loss: 0.3458153971941337
Epoch: 34, step: 851, loss: 0.35808318853378296, mean loss: 0.3458156428053962
Epoch: 34, step: 852, loss: 0.31982484459877014, mean loss: 0.3458151224586784
Epoch: 34, step: 853, loss: 0.37502503395080566, mean loss: 0.34581570724169125
Epoch: 34, step: 854, loss: 0.3412991464138031, mean loss: 0.34581561682186324
Epoch: 34, step: 855, loss: 0.354104608297348, mean loss: 0.34581578276099434
Epoch: 34, step: 856, loss: 0.29444584250450134, mean loss: 0.34581475439552567
Epoch: 34, step: 857, loss: 0.3250497281551361, mean loss: 0.34581433871257256
Epoch: 34, step: 858, loss: 0.3550390601158142, mean loss: 0.3458145233731952
Epoch: 34, step: 859, loss: 0.3188442289829254, mean loss: 0.3458139834922121
Epoch: 34, step: 860, loss: 0.39339005947113037, mean loss: 0.34581493583274453
Epoch: 34, step: 861, loss: 0.38775575160980225, mean loss: 0.34581577535425817
Epoch: 34, step: 862, loss: 0.38982900977134705, mean loss: 0.34581665634135594
Epoch: 34, step: 863, loss: 0.36432695388793945, mean loss: 0.34581702684370874
Epoch: 34, step: 864, loss: 0.30844753980636597, mean loss: 0.34581627887054894
Epoch: 34, step: 865, loss: 0.3332211375236511, mean loss: 0.34581602677613027
Epoch: 34, step: 866, loss: 0.33797499537467957, mean loss: 0.345815869839369
Epoch: 34, step: 867, loss: 0.31216537952423096, mean loss: 0.3458151963446465
Epoch: 34, step: 868, loss: 0.3313659429550171, mean loss: 0.34581490715714747
Epoch: 34, step: 869, loss: 0.35093212127685547, mean loss: 0.3458150095710713
Epoch: 34, step: 870, loss: 0.3272045850753784, mean loss: 0.3458146371167615
Epoch: 34, step: 871, loss: 0.3486144244670868, mean loss: 0.34581469314836877
Epoch: 34, step: 872, loss: 0.3249039351940155, mean loss: 0.3458142746737554
Epoch: 34, step: 873, loss: 0.35482120513916016, mean loss: 0.34581445492051277
Epoch: 34, step: 874, loss: 0.34942302107810974, mean loss: 0.3458145271337196
Epoch: 34, step: 875, loss: 0.3157462775707245, mean loss: 0.34581392543177525
Epoch: 34, step: 876, loss: 0.3056921660900116, mean loss: 0.3458131225630393
Epoch: 34, step: 877, loss: 0.33327940106391907, mean loss: 0.3458128717581908
Epoch: 34, step: 878, loss: 0.3777308464050293, mean loss: 0.3458135104370232
Epoch: 34, step: 879, loss: 0.3156719207763672, mean loss: 0.3458129073157318
Epoch: 34, step: 880, loss: 0.3283507227897644, mean loss: 0.3458125579113152
Epoch: 34, step: 881, loss: 0.36140862107276917, mean loss: 0.3458128699698842
Epoch: 34, step: 882, loss: 0.32289814949035645, mean loss: 0.3458124114829101
Epoch: 34, step: 883, loss: 0.3036758601665497, mean loss: 0.34581156841465643
Epoch: 34, step: 884, loss: 0.33090248703956604, mean loss: 0.34581127011967683
Epoch: 34, step: 885, loss: 0.34209248423576355, mean loss: 0.3458111957171742
Epoch: 34, step: 886, loss: 0.326183021068573, mean loss: 0.34581080302016426
Epoch: 34, step: 887, loss: 0.349717915058136, mean loss: 0.34581088118741854
Epoch: 34, step: 888, loss: 0.3459243178367615, mean loss: 0.34581088345683236
Epoch: 34, step: 889, loss: 0.3588670790195465, mean loss: 0.3458111446538788
Epoch: 34, step: 890, loss: 0.32167840003967285, mean loss: 0.3458106618734636
Epoch: 34, step: 891, loss: 0.3653945028781891, mean loss: 0.3458110536443087
Epoch: 34, step: 892, loss: 0.30828744173049927, mean loss: 0.3458103030069302
Epoch: 34, step: 893, loss: 0.31738168001174927, mean loss: 0.3458097343207331
Epoch: 34, step: 894, loss: 0.3173193335533142, mean loss: 0.3458091644101338
Epoch: 34, step: 895, loss: 0.33418017625808716, mean loss: 0.3458089317931521
Epoch: 34, step: 896, loss: 0.3223741352558136, mean loss: 0.34580846303159474
Epoch: 34, step: 897, loss: 0.341426819562912, mean loss: 0.34580837538820813
Epoch: 34, step: 898, loss: 0.37219250202178955, mean loss: 0.3458089031235143
Epoch: 34, step: 899, loss: 0.33253219723701477, mean loss: 0.34580863756815217
Epoch: 34, step: 900, loss: 0.3622675836086273, mean loss: 0.3458089667668249
Epoch: 34, step: 901, loss: 0.38663771748542786, mean loss: 0.3458097833745036
Epoch: 34, step: 902, loss: 0.3158869445323944, mean loss: 0.34580918490575735
Epoch: 34, step: 903, loss: 0.3077223002910614, mean loss: 0.34580842316806504
Epoch: 34, step: 904, loss: 0.34724321961402893, mean loss: 0.3458084518634201
Epoch: 34, step: 905, loss: 0.3299964964389801, mean loss: 0.34580813563696067
Epoch: 34, step: 906, loss: 0.31881991028785706, mean loss: 0.3458075959048376
Epoch: 34, step: 907, loss: 0.3178694546222687, mean loss: 0.3458070371867094
Epoch: 34, step: 908, loss: 0.3589710295200348, mean loss: 0.3458073004402307
Epoch: 34, step: 909, loss: 0.3424719274044037, mean loss: 0.34580723374077393
Epoch: 34, step: 910, loss: 0.3166886866092682, mean loss: 0.3458066514513518
Epoch: 34, step: 911, loss: 0.3170280158519745, mean loss: 0.3458060759707167
Epoch: 34, step: 912, loss: 0.36040323972702026, mean loss: 0.3458063678614515
Epoch: 34, step: 913, loss: 0.32160434126853943, mean loss: 0.3458058839177084
Epoch: 34, step: 914, loss: 0.3438141942024231, mean loss: 0.3458058440926756
Epoch: 34, step: 915, loss: 0.3702290952205658, mean loss: 0.3458063324404947
Epoch: 34, step: 916, loss: 0.34525787830352783, mean loss: 0.34580632147426316
Epoch: 34, step: 917, loss: 0.3016068637371063, mean loss: 0.34580543773255606
Epoch: 34, step: 918, loss: 0.33137476444244385, mean loss: 0.3458051492056483
Epoch: 34, step: 919, loss: 0.31670108437538147, mean loss: 0.34580456731055814
Epoch: 34, step: 920, loss: 0.3165340721607208, mean loss: 0.34580398209962687
Epoch: 34, step: 921, loss: 0.30477893352508545, mean loss: 0.34580316189392946
Epoch: 34, step: 922, loss: 0.3188871145248413, mean loss: 0.34580262377746634
Epoch: 34, step: 923, loss: 0.3315677046775818, mean loss: 0.34580233919291814
Epoch: 34, step: 924, loss: 0.32160112261772156, mean loss: 0.34580185537179153
Epoch: 34, step: 925, loss: 0.297811359167099, mean loss: 0.34580089598399805
Epoch: 34, step: 926, loss: 0.3173554241657257, mean loss: 0.3458003273361397
Epoch: 34, step: 927, loss: 0.3705439567565918, mean loss: 0.34580082197130324
Epoch: 34, step: 928, loss: 0.31439366936683655, mean loss: 0.34580019414216573
Epoch: 34, step: 929, loss: 0.34248796105384827, mean loss: 0.34580012793193327
Epoch: 34, step: 930, loss: 0.3223857581615448, mean loss: 0.34579965989727657
Epoch: 34, step: 931, loss: 0.3246336877346039, mean loss: 0.34579923681475955
Epoch: 34, step: 932, loss: 0.3445010781288147, mean loss: 0.34579921086663573
Epoch: 34, step: 933, loss: 0.36107999086380005, mean loss: 0.34579951629897626
Epoch: 34, step: 934, loss: 0.3702228367328644, mean loss: 0.3458000044627234
Epoch: 34, step: 935, loss: 0.35543182492256165, mean loss: 0.3458001969759242
Epoch: 34, step: 936, loss: 0.32857170701026917, mean loss: 0.3457998526333909
Epoch: 34, step: 937, loss: 0.3587009608745575, mean loss: 0.3458001104802199
Epoch: 34, step: 938, loss: 0.3125970661640167, mean loss: 0.34579944688385106
Epoch: 34, step: 939, loss: 0.3203563094139099, mean loss: 0.34579893838721926
Epoch: 34, step: 940, loss: 0.34578415751457214, mean loss: 0.3457989380918204
Epoch: 34, step: 941, loss: 0.3311766982078552, mean loss: 0.34579864586911196
Epoch: 34, step: 942, loss: 0.3747556805610657, mean loss: 0.34579922455842815
Epoch: 34, step: 943, loss: 0.2966301441192627, mean loss: 0.34579824196289577
Epoch: 34, step: 944, loss: 0.33780500292778015, mean loss: 0.3457980822290968
Epoch: 34, step: 945, loss: 0.33757665753364563, mean loss: 0.3457979179386069
Epoch: 34, step: 946, loss: 0.33945316076278687, mean loss: 0.3457977911524995
Epoch: 34, step: 947, loss: 0.3490358591079712, mean loss: 0.3457978558569187
Epoch: 34, step: 948, loss: 0.34066930413246155, mean loss: 0.34579775337811514
Epoch: 34, step: 949, loss: 0.32683485746383667, mean loss: 0.34579737446879344
Epoch: 34, step: 950, loss: 0.3152174651622772, mean loss: 0.3457967634449697
Epoch: 34, step: 951, loss: 0.4049156606197357, mean loss: 0.345797944688919
Epoch: 34, step: 952, loss: 0.3306609094142914, mean loss: 0.3457976422446089
Epoch: 34, step: 953, loss: 0.3496244549751282, mean loss: 0.34579771870440373
Epoch: 34, step: 954, loss: 0.3165711760520935, mean loss: 0.3457971347691646
Epoch: 34, step: 955, loss: 0.31611788272857666, mean loss: 0.34579654180081093
Epoch: 34, step: 956, loss: 0.32415804266929626, mean loss: 0.34579610948907874
Epoch: 34, step: 957, loss: 0.3241558372974396, mean loss: 0.34579567715056053
Epoch: 34, step: 958, loss: 0.33454087376594543, mean loss: 0.34579545230182646
Epoch: 34, step: 959, loss: 0.33416852355003357, mean loss: 0.34579522002340324
Epoch: 34, step: 960, loss: 0.3299318253993988, mean loss: 0.3457949031167843
Epoch: 34, step: 961, loss: 0.3371303975582123, mean loss: 0.34579473002745675
Epoch: 34, step: 962, loss: 0.34512707591056824, mean loss: 0.34579471669011247
Epoch: 34, step: 963, loss: 0.34501737356185913, mean loss: 0.34579470116188377
Epoch: 34, step: 964, loss: 0.32992199063301086, mean loss: 0.3457943840944954
Epoch: 34, step: 965, loss: 0.3363209664821625, mean loss: 0.345794194860793
Epoch: 34, step: 966, loss: 0.3293665647506714, mean loss: 0.34579386672164614
Epoch: 34, step: 967, loss: 0.3588269352912903, mean loss: 0.3457941270497975
Epoch: 34, step: 968, loss: 0.3317892849445343, mean loss: 0.34579384731660856
Epoch: 34, step: 969, loss: 0.3184202313423157, mean loss: 0.3457933005659999
Epoch: 34, step: 970, loss: 0.331533282995224, mean loss: 0.34579301574730553
Epoch: 34, step: 971, loss: 0.2802210748195648, mean loss: 0.34579170608962145
Epoch: 34, step: 972, loss: 0.3622841536998749, mean loss: 0.3457920354840094
Epoch: 34, step: 973, loss: 0.4124634563922882, mean loss: 0.34579336704823765
Epoch: 34, step: 974, loss: 0.3328598141670227, mean loss: 0.34579310874397207
Epoch: 34, step: 975, loss: 0.3354945182800293, mean loss: 0.3457929030683357
Epoch: 34, step: 976, loss: 0.3367404639720917, mean loss: 0.34579272228349967
Epoch: 34, step: 977, loss: 0.34136244654655457, mean loss: 0.3457926338089273
Epoch: 34, step: 978, loss: 0.33327409625053406, mean loss: 0.34579238381316973
Epoch: 34, step: 979, loss: 0.3631901144981384, mean loss: 0.3457927312396951
Epoch: 34, step: 980, loss: 0.35957300662994385, mean loss: 0.3457930064214231
Epoch: 34, step: 981, loss: 0.35895204544067383, mean loss: 0.3457932691922809
Epoch: 34, step: 982, loss: 0.37405288219451904, mean loss: 0.3457938334929459
Epoch: 34, step: 983, loss: 0.3328835070133209, mean loss: 0.3457935756988868
Epoch: 34, step: 984, loss: 0.3233841359615326, mean loss: 0.3457931282349836
Epoch: 34, step: 985, loss: 0.33921435475349426, mean loss: 0.3457929968749444
Epoch: 34, step: 986, loss: 0.3244630992412567, mean loss: 0.34579257098397076
Epoch: 34, step: 987, loss: 0.3005911409854889, mean loss: 0.3457916684715916
Epoch: 34, step: 988, loss: 0.31119871139526367, mean loss: 0.34579097778661455
Epoch: 34, step: 989, loss: 0.3044793903827667, mean loss: 0.34579015297354493
Epoch: 34, step: 990, loss: 0.3340454697608948, mean loss: 0.3457899184878857
Epoch: 34, step: 991, loss: 0.32336094975471497, mean loss: 0.3457894706966237
Epoch: 34, step: 992, loss: 0.3390147387981415, mean loss: 0.34578933544273766
Epoch: 34, step: 993, loss: 0.33019596338272095, mean loss: 0.3457890241356492
Epoch: 34, step: 994, loss: 0.30768144130706787, mean loss: 0.3457882633685887
Epoch: 34, step: 995, loss: 0.3249252438545227, mean loss: 0.34578784687454744
Epoch: 34, step: 996, loss: 0.3261014521121979, mean loss: 0.3457874538776265
Epoch: 34, step: 997, loss: 0.30198371410369873, mean loss: 0.34578657944676106
Epoch: 34, step: 998, loss: 0.3394351303577423, mean loss: 0.34578645265867664
Epoch: 34, step: 999, loss: 0.3539946675300598, mean loss: 0.3457866165083826
Epoch: 34, step: 1000, loss: 0.29898905754089355, mean loss: 0.3457856823694328
Epoch: 34, step: 1001, loss: 0.2915900647640228, mean loss: 0.3457846005773931
Epoch: 34, step: 1002, loss: 0.33831050992012024, mean loss: 0.345784451390969
Epoch: 34, step: 1003, loss: 0.2977273762226105, mean loss: 0.34578349216791177
Epoch: 34, step: 1004, loss: 0.30789491534233093, mean loss: 0.345782735923988
Epoch: 34, step: 1005, loss: 0.2966702878475189, mean loss: 0.34578175567473496
Epoch: 34, step: 1006, loss: 0.3616335093975067, mean loss: 0.3457820720580598
Epoch: 34, step: 1007, loss: 0.3571326434612274, mean loss: 0.3457822985982842
Epoch: 34, step: 1008, loss: 0.35132020711898804, mean loss: 0.3457824091243499
Epoch: 34, step: 1009, loss: 0.35555633902549744, mean loss: 0.34578260418941
Epoch: 34, step: 1010, loss: 0.33743172883987427, mean loss: 0.3457824375285572
Epoch: 34, step: 1011, loss: 0.363388329744339, mean loss: 0.3457827888874663
Epoch: 34, step: 1012, loss: 0.2844288945198059, mean loss: 0.3457815644787898
Epoch: 34, step: 1013, loss: 0.3279494643211365, mean loss: 0.3457812086196767
Epoch: 34, step: 1014, loss: 0.31748098134994507, mean loss: 0.3457806438688781
Epoch: 34, step: 1015, loss: 0.31428101658821106, mean loss: 0.3457800152843618
Epoch: 34, step: 1016, loss: 0.305156409740448, mean loss: 0.34577920464429746
Epoch: 34, step: 1017, loss: 0.37168511748313904, mean loss: 0.3457797215839319
Epoch: 34, step: 1018, loss: 0.30643579363822937, mean loss: 0.34577893651104064
Epoch: 34, step: 1019, loss: 0.36757513880729675, mean loss: 0.34577937142608367
Epoch: 34, step: 1020, loss: 0.3351288139820099, mean loss: 0.3457791589122172
Epoch: 34, step: 1021, loss: 0.31597065925598145, mean loss: 0.34577856414587266
Epoch: 34, step: 1022, loss: 0.33752909302711487, mean loss: 0.3457783995481928
Epoch: 34, step: 1023, loss: 0.3593815267086029, mean loss: 0.3457786709593492
Epoch: 34, step: 1024, loss: 0.30731645226478577, mean loss: 0.34577790357205257
Epoch: 34, step: 1025, loss: 0.3250919282436371, mean loss: 0.3457774908595645
Epoch: 34, step: 1026, loss: 0.3205047845840454, mean loss: 0.3457769866458048
Epoch: 34, step: 1027, loss: 0.33955076336860657, mean loss: 0.345776862429396
Epoch: 34, step: 1028, loss: 0.3384781777858734, mean loss: 0.34577671681972727
Epoch: 34, step: 1029, loss: 0.31407037377357483, mean loss: 0.3457760842868492
Epoch: 34, step: 1030, loss: 0.3161822259426117, mean loss: 0.34577549390924145
Epoch: 34, step: 1031, loss: 0.31473666429519653, mean loss: 0.3457748747177793
Epoch: 34, step: 1032, loss: 0.32911908626556396, mean loss: 0.3457745424592373
Epoch: 34, step: 1033, loss: 0.34562304615974426, mean loss: 0.3457745394371687
Epoch: 34, step: 1034, loss: 0.321339875459671, mean loss: 0.3457740520209197
Epoch: 34, step: 1035, loss: 0.32216310501098633, mean loss: 0.345773581045355
Epoch: 34, step: 1036, loss: 0.3715488314628601, mean loss: 0.34577409518275787
Epoch: 34, step: 1037, loss: 0.30963969230651855, mean loss: 0.34577337442632755
Epoch: 34, step: 1038, loss: 0.3086930811405182, mean loss: 0.34577263481740594
Epoch: 34, step: 1039, loss: 0.30282825231552124, mean loss: 0.34577177825959315
Epoch: 34, step: 1040, loss: 0.31837424635887146, mean loss: 0.3457712318062373
Epoch: 34, step: 1041, loss: 0.34825360774993896, mean loss: 0.34577128131710616
Epoch: 34, step: 1042, loss: 0.3342394530773163, mean loss: 0.3457710513199335
Epoch: 34, step: 1043, loss: 0.3152253329753876, mean loss: 0.34577044211135066
Epoch: 34, step: 1044, loss: 0.3699685037136078, mean loss: 0.3457709247116499
Epoch: 34, step: 1045, loss: 0.3262329399585724, mean loss: 0.3457705350585696
Epoch: 34, step: 1046, loss: 0.30923694372177124, mean loss: 0.3457698064705047
Epoch: 34, step: 1047, loss: 0.34053152799606323, mean loss: 0.3457697020057936
Epoch: 34, step: 1048, loss: 0.31707286834716797, mean loss: 0.3457691297287239
Epoch: 34, step: 1049, loss: 0.3327369689941406, mean loss: 0.34576886984437155
Epoch: 34, step: 1050, loss: 0.3322625756263733, mean loss: 0.34576860051032926
Epoch: 34, step: 1051, loss: 0.3722263276576996, mean loss: 0.3457691281031973
Epoch: 34, step: 1052, loss: 0.3449209928512573, mean loss: 0.34576911119089093
Epoch: 34, step: 1053, loss: 0.31402042508125305, mean loss: 0.3457684781163922
Epoch: 34, step: 1054, loss: 0.3332809805870056, mean loss: 0.34576822911841554
Epoch: 34, step: 1055, loss: 0.30067214369773865, mean loss: 0.3457673299302392
Epoch: 34, step: 1056, loss: 0.36090660095214844, mean loss: 0.34576763179196274
Epoch: 34, step: 1057, loss: 0.31784963607788086, mean loss: 0.34576707514651644
Epoch: 34, step: 1058, loss: 0.3183533549308777, mean loss: 0.34576652856651013
Epoch: 34, step: 1059, loss: 0.33666297793388367, mean loss: 0.3457663470617922
Epoch: 34, step: 1060, loss: 0.34691888093948364, mean loss: 0.3457663700403172
Epoch: 34, step: 1061, loss: 0.3002069890499115, mean loss: 0.34576546172298017
Epoch: 34, step: 1062, loss: 0.29351499676704407, mean loss: 0.34576442002627655
Epoch: 34, step: 1063, loss: 0.3380068838596344, mean loss: 0.34576426537045185
Epoch: 34, step: 1064, loss: 0.3099135756492615, mean loss: 0.34576355065803144
Epoch: 34, step: 1065, loss: 0.3667429983615875, mean loss: 0.34576396889190775
Epoch: 34, step: 1066, loss: 0.32412439584732056, mean loss: 0.3457635375067624
Epoch: 34, step: 1067, loss: 0.334340363740921, mean loss: 0.3457633097901974
Epoch: 34, step: 1068, loss: 0.29572921991348267, mean loss: 0.3457623123997882
Epoch: 34, step: 1069, loss: 0.3190051019191742, mean loss: 0.34576177902637834
Epoch: 34, step: 1070, loss: 0.34727901220321655, mean loss: 0.3457618092700281
Epoch: 34, step: 1071, loss: 0.3665464222431183, mean loss: 0.34576222357023884
Epoch: 34, step: 1072, loss: 0.3246464431285858, mean loss: 0.3457618026772483
Epoch: 34, step: 1073, loss: 0.3354196846485138, mean loss: 0.34576159653576877
Epoch: 34, step: 1074, loss: 0.37262123823165894, mean loss: 0.345762131897665
Epoch: 34, step: 1075, loss: 0.34340596199035645, mean loss: 0.3457620849358156
Epoch: 34, step: 1076, loss: 0.3278285264968872, mean loss: 0.34576172750137
Epoch: 34, step: 1077, loss: 0.3636128604412079, mean loss: 0.34576208328589864
Epoch: 34, step: 1078, loss: 0.3723301887512207, mean loss: 0.34576261279472703
Epoch: 34, step: 1079, loss: 0.3261406123638153, mean loss: 0.3457622217312618
Epoch: 34, step: 1080, loss: 0.3061625361442566, mean loss: 0.34576143253131786
Epoch: 34, step: 1081, loss: 0.3463554084300995, mean loss: 0.34576144436869477
Epoch: 34, step: 1082, loss: 0.3298940062522888, mean loss: 0.34576112815198823
Epoch: 34, step: 1083, loss: 0.3254527151584625, mean loss: 0.34576072344068903
Epoch: 34, step: 1084, loss: 0.30412623286247253, mean loss: 0.345759893754342
Epoch: 34, step: 1085, loss: 0.3493214547634125, mean loss: 0.3457599647272209
Epoch: 34, step: 1086, loss: 0.31900832056999207, mean loss: 0.34575943164541717
Epoch: 34, step: 1087, loss: 0.31194719672203064, mean loss: 0.3457587578801748
Epoch: 34, step: 1088, loss: 0.36076074838638306, mean loss: 0.34575905681393004
Epoch: 34, step: 1089, loss: 0.2920723855495453, mean loss: 0.3457579870599894
Epoch: 34, step: 1090, loss: 0.3376227021217346, mean loss: 0.3457578249605426
Epoch: 34, step: 1091, loss: 0.3510330021381378, mean loss: 0.3457579300688788
Epoch: 34, step: 1092, loss: 0.32236194610595703, mean loss: 0.34575746391127526
Epoch: 34, step: 1093, loss: 0.3176506459712982, mean loss: 0.3457569039029481
Epoch: 34, step: 1094, loss: 0.33232739567756653, mean loss: 0.34575663633489356
Epoch: 34, step: 1095, loss: 0.3394377529621124, mean loss: 0.34575651044065997
Epoch: 34, step: 1096, loss: 0.3195415735244751, mean loss: 0.34575598815793296
Epoch: 34, step: 1097, loss: 0.34297555685043335, mean loss: 0.3457559327642344
Epoch: 34, step: 1098, loss: 0.3558253049850464, mean loss: 0.345756133369319
Epoch: 34, step: 1099, loss: 0.3468281030654907, mean loss: 0.34575615472499865
Epoch: 34, step: 1100, loss: 0.3570495843887329, mean loss: 0.3457563797071622
Epoch: 34, step: 1101, loss: 0.3085249662399292, mean loss: 0.3457556380159899
Epoch: 34, step: 1102, loss: 0.3500628173351288, mean loss: 0.34575572381808395
Epoch: 34, step: 1103, loss: 0.3038793206214905, mean loss: 0.3457548896267852
Epoch: 34, step: 1104, loss: 0.3230352997779846, mean loss: 0.3457544370543295
Epoch: 34, step: 1105, loss: 0.29126882553100586, mean loss: 0.3457533517268222
Epoch: 34, step: 1106, loss: 0.3385135531425476, mean loss: 0.34575320751634503
Epoch: 34, step: 1107, loss: 0.3105953633785248, mean loss: 0.3457525072166849
Epoch: 34, step: 1108, loss: 0.3481753468513489, mean loss: 0.34575255547561595
Epoch: 34, step: 1109, loss: 0.31463536620140076, mean loss: 0.3457519356853663
Epoch: 34, step: 1110, loss: 0.3334752023220062, mean loss: 0.3457516911630215
Epoch: 34, step: 1111, loss: 0.32415613532066345, mean loss: 0.3457512610412114
Epoch: 34, step: 1112, loss: 0.32423317432403564, mean loss: 0.34575083247090094
Epoch: 34, step: 1113, loss: 0.3287351727485657, mean loss: 0.34575049358104387
Epoch: 34, step: 1114, loss: 0.3421558439731598, mean loss: 0.3457504219901652
Epoch: 34, step: 1115, loss: 0.3093143105506897, mean loss: 0.3457496963446733
Epoch: 34, step: 1116, loss: 0.35084268450737, mean loss: 0.3457497977723546
Epoch: 34, step: 1117, loss: 0.34356287121772766, mean loss: 0.34574975422022663
Epoch: 34, step: 1118, loss: 0.37912794947624207, mean loss: 0.34575041892589736
Epoch: 34, step: 1119, loss: 0.3431945741176605, mean loss: 0.3457503680288763
Epoch: 34, step: 1120, loss: 0.3827957510948181, mean loss: 0.34575110573489354
Epoch: 34, step: 1121, loss: 0.31843942403793335, mean loss: 0.34575056187249964
Epoch: 34, step: 1122, loss: 0.2892633378505707, mean loss: 0.34574943705472105
Epoch: 34, step: 1123, loss: 0.36289218068122864, mean loss: 0.34574977840764076
Epoch: 34, step: 1124, loss: 0.34066107869148254, mean loss: 0.34574967708150794
Epoch: 34, step: 1125, loss: 0.326631098985672, mean loss: 0.34574929640017116
Epoch: 34, step: 1126, loss: 0.3390744626522064, mean loss: 0.3457491634962477
Epoch: 34, step: 1127, loss: 0.3166414201259613, mean loss: 0.3457485839378021
Epoch: 34, step: 1128, loss: 0.35665223002433777, mean loss: 0.3457488010337919
Epoch: 34, step: 1129, loss: 0.32762467861175537, mean loss: 0.3457484401823918
Epoch: 34, step: 1130, loss: 0.28409358859062195, mean loss: 0.34574721265831926
Epoch: 34, step: 1131, loss: 0.33137404918670654, mean loss: 0.34574692649993205
Epoch: 34, step: 1132, loss: 0.3344859182834625, mean loss: 0.3457467023065733
Epoch: 34, step: 1133, loss: 0.29857200384140015, mean loss: 0.3457457631328033
Epoch: 34, step: 1134, loss: 0.4156613051891327, mean loss: 0.3457471550131572
Epoch: 34, step: 1135, loss: 0.3641887605190277, mean loss: 0.3457475221417905
Epoch: 34, step: 1136, loss: 0.353702574968338, mean loss: 0.34574768050487503
Epoch: 34, step: 1137, loss: 0.3503667712211609, mean loss: 0.3457477724563564
Epoch: 34, step: 1138, loss: 0.2914487421512604, mean loss: 0.3457466915559821
Epoch: 34, step: 1139, loss: 0.3446924090385437, mean loss: 0.34574667056938846
Epoch: 34, step: 1140, loss: 0.32950058579444885, mean loss: 0.345746347180556
Epoch: 34, step: 1141, loss: 0.37088021636009216, mean loss: 0.3457468474765308
Epoch: 34, step: 1142, loss: 0.32099080085754395, mean loss: 0.34574635471101756
Epoch: 34, step: 1143, loss: 0.3106996417045593, mean loss: 0.34574565712516947
Epoch: 34, step: 1144, loss: 0.3365510404109955, mean loss: 0.3457454741149445
Epoch: 34, step: 1145, loss: 0.32787778973579407, mean loss: 0.3457451184825179
Epoch: 34, step: 1146, loss: 0.33586251735687256, mean loss: 0.3457449217864383
Epoch: 34, step: 1147, loss: 0.298629492521286, mean loss: 0.3457439840539873
Epoch: 34, step: 1148, loss: 0.3123129904270172, mean loss: 0.34574331869437686
Epoch: 34, step: 1149, loss: 0.3339998126029968, mean loss: 0.3457430849741585
Epoch: 34, step: 1150, loss: 0.36641713976860046, mean loss: 0.34574349642269864
Epoch: 34, step: 1151, loss: 0.2917427122592926, mean loss: 0.3457424217374542
Epoch: 34, step: 1152, loss: 0.3314082622528076, mean loss: 0.3457421364748721
Epoch: 34, step: 1153, loss: 0.3196151554584503, mean loss: 0.3457416165349514
Epoch: 34, step: 1154, loss: 0.3356359004974365, mean loss: 0.3457414154301766
Epoch: 34, step: 1155, loss: 0.3254321813583374, mean loss: 0.3457410112824
Epoch: 34, step: 1156, loss: 0.3015207350254059, mean loss: 0.3457401313294368
Epoch: 34, step: 1157, loss: 0.3046300709247589, mean loss: 0.34573931328390006
Epoch: 34, step: 1158, loss: 0.31896528601646423, mean loss: 0.3457387805204483
Epoch: 34, step: 1159, loss: 0.3312495946884155, mean loss: 0.3457384922128665
Epoch: 34, step: 1160, loss: 0.3352644145488739, mean loss: 0.3457382838025423
Epoch: 34, step: 1161, loss: 0.33912840485572815, mean loss: 0.3457381522836011
Epoch: 34, step: 1162, loss: 0.2938023805618286, mean loss: 0.345737118920985
Epoch: 34, step: 1163, loss: 0.3430309295654297, mean loss: 0.34573706507718566
Epoch: 34, step: 1164, loss: 0.3452851176261902, mean loss: 0.3457370560851749
Epoch: 34, step: 1165, loss: 0.3157729506492615, mean loss: 0.34573645992693536
Epoch: 34, step: 1166, loss: 0.32778939604759216, mean loss: 0.3457361028638098
Epoch: 34, step: 1167, loss: 0.338340699672699, mean loss: 0.34573595573259874
Epoch: 34, step: 1168, loss: 0.3194352686405182, mean loss: 0.3457354324920319
Epoch: 34, step: 1169, loss: 0.3265429437160492, mean loss: 0.34573505067353083
Epoch: 34, step: 1170, loss: 0.3241642713546753, mean loss: 0.34573462154946694
Epoch: 34, step: 1171, loss: 0.3403633236885071, mean loss: 0.345734514696243
Epoch: 34, step: 1172, loss: 0.37720948457717896, mean loss: 0.34573514082705686
Epoch: 34, step: 1173, loss: 0.33356279134750366, mean loss: 0.34573489868762025
Epoch: 34, step: 1174, loss: 0.2924228012561798, mean loss: 0.34573383819354947
Epoch: 34, step: 1175, loss: 0.339846670627594, mean loss: 0.34573372108725636
Epoch: 34, step: 1176, loss: 0.34758761525154114, mean loss: 0.34573375796379374
Epoch: 34, step: 1177, loss: 0.34551867842674255, mean loss: 0.34573375368564724
Epoch: 34, step: 1178, loss: 0.3555265963077545, mean loss: 0.3457339484711793
Epoch: 34, step: 1179, loss: 0.31188276410102844, mean loss: 0.3457332751641467
Epoch: 34, step: 1180, loss: 0.37339189648628235, mean loss: 0.34573382528888214
Epoch: 34, step: 1181, loss: 0.34946224093437195, mean loss: 0.34573389944488764
Epoch: 34, step: 1182, loss: 0.3132811188697815, mean loss: 0.3457332539909093
Epoch: 34, step: 1183, loss: 0.29788708686828613, mean loss: 0.3457323023964956
Epoch: 34, step: 1184, loss: 0.3440225422382355, mean loss: 0.34573226839239546
Epoch: 34, step: 1185, loss: 0.2834319770336151, mean loss: 0.34573102937462846
Epoch: 34, step: 1186, loss: 0.37342703342437744, mean loss: 0.3457315801771671
Epoch: 34, step: 1187, loss: 0.3540336787700653, mean loss: 0.3457317452813472
Epoch: 34, step: 1188, loss: 0.3239975869655609, mean loss: 0.34573131306183214
Epoch: 34, step: 1189, loss: 0.34907859563827515, mean loss: 0.34573137962673245
Epoch: 34, step: 1190, loss: 0.3151627480983734, mean loss: 0.3457307717433525
Epoch: 34, step: 1191, loss: 0.32949596643447876, mean loss: 0.34573044890678495
Epoch: 34, step: 1192, loss: 0.3024856150150299, mean loss: 0.3457295889804812
Epoch: 34, step: 1193, loss: 0.3328842520713806, mean loss: 0.3457293335552096
Epoch: 34, step: 1194, loss: 0.3072298765182495, mean loss: 0.34572856802147517
Epoch: 34, step: 1195, loss: 0.2862253189086914, mean loss: 0.3457273848661202
Epoch: 34, step: 1196, loss: 0.33199605345726013, mean loss: 0.34572711183942845
Epoch: 34, step: 1197, loss: 0.3261968195438385, mean loss: 0.3457267235169189
Epoch: 34, step: 1198, loss: 0.3458804190158844, mean loss: 0.3457267265727992
Epoch: 34, step: 1199, loss: 0.3455530107021332, mean loss: 0.34572672311892866
Epoch: 34, step: 1200, loss: 0.31762605905532837, mean loss: 0.3457261644242935
Epoch: 34, step: 1201, loss: 0.3888654112815857, mean loss: 0.34572702209749834
Epoch: 34, step: 1202, loss: 0.3645949065685272, mean loss: 0.345727397212003
Epoch: 34, step: 1203, loss: 0.3372468650341034, mean loss: 0.34572722861295374
Epoch: 34, step: 1204, loss: 0.34464341402053833, mean loss: 0.34572720706637233
Epoch: 34, step: 1205, loss: 0.31994861364364624, mean loss: 0.345726694589862
Epoch: 34, step: 1206, loss: 0.3627578914165497, mean loss: 0.34572703316205106
Epoch: 34, step: 1207, loss: 0.3649943172931671, mean loss: 0.34572741617899067
Epoch: 34, step: 1208, loss: 0.31711751222610474, mean loss: 0.34572684745015747
Epoch: 34, step: 1209, loss: 0.322383314371109, mean loss: 0.34572638341936435
Epoch: 34, step: 1210, loss: 0.29750722646713257, mean loss: 0.3457254249214028
Epoch: 34, step: 1211, loss: 0.3777777850627899, mean loss: 0.34572606204393086
Epoch: 34, step: 1212, loss: 0.3319109082221985, mean loss: 0.3457257874379196
Epoch: 34, step: 1213, loss: 0.3110593855381012, mean loss: 0.34572509838202814
Epoch: 34, step: 1214, loss: 0.3473687767982483, mean loss: 0.34572513105238684
Epoch: 34, step: 1215, loss: 0.31965672969818115, mean loss: 0.3457246129175213
Epoch: 34, step: 1216, loss: 0.32573190331459045, mean loss: 0.34572421555084465
Epoch: 34, step: 1217, loss: 0.29161036014556885, mean loss: 0.3457231400280199
Epoch: 34, step: 1218, loss: 0.3244364857673645, mean loss: 0.3457227169602616
Epoch: 34, step: 1219, loss: 0.3183470368385315, mean loss: 0.34572217288521345
Epoch: 34, step: 1220, loss: 0.3057693839073181, mean loss: 0.3457213788635314
Epoch: 34, step: 1221, loss: 0.30960702896118164, mean loss: 0.34572066114124705
Epoch: 34, step: 1222, loss: 0.3015645146369934, mean loss: 0.3457197836169222
Epoch: 34, step: 1223, loss: 0.3291268050670624, mean loss: 0.34571945386774594
Epoch: 34, step: 1224, loss: 0.29122719168663025, mean loss: 0.34571837097467584
Epoch: 34, step: 1225, loss: 0.30219268798828125, mean loss: 0.3457175060312518
Epoch: 34, step: 1226, loss: 0.32733064889907837, mean loss: 0.3457171406544433
Epoch: 34, step: 1227, loss: 0.3151266872882843, mean loss: 0.34571653278437403
Epoch: 34, step: 1228, loss: 0.2980283796787262, mean loss: 0.3457155851807356
Epoch: 34, step: 1229, loss: 0.3033983111381531, mean loss: 0.34571474431768184
Epoch: 34, step: 1230, loss: 0.33930182456970215, mean loss: 0.3457146168926466
Epoch: 34, step: 1231, loss: 0.3230856955051422, mean loss: 0.3457141672637842
Epoch: 34, step: 1232, loss: 0.34596505761146545, mean loss: 0.3457141722487898
Epoch: 34, step: 1233, loss: 0.3220463991165161, mean loss: 0.34571370199698903
Epoch: 34, step: 1234, loss: 0.33823540806770325, mean loss: 0.34571355341472504
Epoch: 34, step: 1235, loss: 0.3687659800052643, mean loss: 0.34571401142208796
Epoch: 34, step: 1236, loss: 0.30493104457855225, mean loss: 0.3457132011591026
Epoch: 34, step: 1237, loss: 0.3147721588611603, mean loss: 0.34571258644454983
Epoch: 34, step: 1238, loss: 0.30649128556251526, mean loss: 0.34571180723920797
Epoch: 34, step: 1239, loss: 0.3438853323459625, mean loss: 0.3457117709535497
Epoch: 34, step: 1240, loss: 0.2970665395259857, mean loss: 0.3457108045623975
Epoch: 34, step: 1241, loss: 0.3142550587654114, mean loss: 0.3457101796717424
Epoch: 34, step: 1242, loss: 0.33923372626304626, mean loss: 0.34571005101496716
Epoch: 34, step: 1243, loss: 0.321445494890213, mean loss: 0.345709569001536
Epoch: 34, step: 1244, loss: 0.34578070044517517, mean loss: 0.34570957041452827
Epoch: 34, step: 1245, loss: 0.3227214813232422, mean loss: 0.34570911377615293
Epoch: 34, step: 1246, loss: 0.332919716835022, mean loss: 0.3457088597309641
Epoch: 34, step: 1247, loss: 0.4002627432346344, mean loss: 0.3457099433533124
Epoch: 34, step: 1248, loss: 0.34093335270881653, mean loss: 0.34570984847615194
Epoch: 34, step: 1249, loss: 0.3391851484775543, mean loss: 0.3457097188789645
Epoch: 34, step: 1250, loss: 0.3681834936141968, mean loss: 0.3457101652565984
Epoch: 34, step: 1251, loss: 0.3630272150039673, mean loss: 0.3457105092037214
Epoch: 34, step: 1252, loss: 0.3679080903530121, mean loss: 0.3457109500780416
Epoch: 34, step: 1253, loss: 0.32719743251800537, mean loss: 0.3457105823815657
Epoch: 34, step: 1254, loss: 0.3177042305469513, mean loss: 0.34571002615921
Epoch: 34, step: 1255, loss: 0.3205929100513458, mean loss: 0.34570952732865495
Epoch: 34, step: 1256, loss: 0.31491076946258545, mean loss: 0.34570891567179507
Epoch: 34, step: 1257, loss: 0.31855443120002747, mean loss: 0.3457083764001489
Epoch: 34, step: 1258, loss: 0.31913262605667114, mean loss: 0.3457078486322938
Epoch: 34, step: 1259, loss: 0.3170509934425354, mean loss: 0.34570727954707675
Epoch: 34, step: 1260, loss: 0.36350151896476746, mean loss: 0.345707632908862
Epoch: 34, step: 1261, loss: 0.307230681180954, mean loss: 0.34570686884055646
Epoch: 34, step: 1262, loss: 0.3111587166786194, mean loss: 0.345706182803261
Epoch: 34, step: 1263, loss: 0.3226340711116791, mean loss: 0.3457057246596611
Epoch: 34, step: 1264, loss: 0.3332446813583374, mean loss: 0.34570547722527134
Epoch: 34, step: 1265, loss: 0.3582986891269684, mean loss: 0.3457057272791195
Epoch: 34, step: 1266, loss: 0.3022642135620117, mean loss: 0.3457048647110891
Epoch: 34, step: 1267, loss: 0.3186420798301697, mean loss: 0.3457043273672546
Epoch: 34, step: 1268, loss: 0.30129918456077576, mean loss: 0.34570344570056527
Epoch: 34, step: 1269, loss: 0.3427158296108246, mean loss: 0.34570338638245207
Epoch: 34, step: 1270, loss: 0.33378738164901733, mean loss: 0.34570314979888084
Epoch: 34, step: 1271, loss: 0.376860648393631, mean loss: 0.3457037683959781
Epoch: 34, step: 1272, loss: 0.3121589124202728, mean loss: 0.34570310241380703
Epoch: 34, step: 1273, loss: 0.3412752151489258, mean loss: 0.34570301450657526
Epoch: 34, step: 1274, loss: 0.3003423810005188, mean loss: 0.34570211397584316
Epoch: 34, step: 1275, loss: 0.4447921812534332, mean loss: 0.3457040811414764
Epoch: 34, step: 1276, loss: 0.3083546757698059, mean loss: 0.34570333968463696
Epoch: 34, step: 1277, loss: 0.322848916053772, mean loss: 0.3457028859898017
Epoch: 34, step: 1278, loss: 0.3198278546333313, mean loss: 0.34570237234153656
Epoch: 34, step: 1279, loss: 0.30852219462394714, mean loss: 0.3457016342881437
Epoch: 34, step: 1280, loss: 0.3080437481403351, mean loss: 0.3457008867667322
Epoch: 34, step: 1281, loss: 0.31165528297424316, mean loss: 0.3457002109637271
Epoch: 34, step: 1282, loss: 0.30872535705566406, mean loss: 0.3456994770298676
Epoch: 34, step: 1283, loss: 0.33795294165611267, mean loss: 0.3456993232677522
Epoch: 34, step: 1284, loss: 0.3753581941127777, mean loss: 0.34569991195933925
Epoch: 34, step: 1285, loss: 0.34229519963264465, mean loss: 0.34569984438138823
Epoch: 34, step: 1286, loss: 0.2901686429977417, mean loss: 0.34569874220006946
Epoch: 34, step: 1287, loss: 0.35223719477653503, mean loss: 0.34569887197246896
Epoch: 34, step: 1288, loss: 0.3046683967113495, mean loss: 0.34569805763337474
Epoch: 34, step: 1289, loss: 0.3504689633846283, mean loss: 0.3456981523205051
Epoch: 34, step: 1290, loss: 0.3366483449935913, mean loss: 0.34569797271450897
Epoch: 34, step: 1291, loss: 0.31663814187049866, mean loss: 0.34569739599324906
Epoch: 34, step: 1292, loss: 0.3299001455307007, mean loss: 0.34569708248731595
Epoch: 34, step: 1293, loss: 0.31816092133522034, mean loss: 0.34569653602648737
Epoch: 34, step: 1294, loss: 0.4068256616592407, mean loss: 0.3456977491225885
Epoch: 34, step: 1295, loss: 0.35909953713417053, mean loss: 0.3456980150732952
Epoch: 34, step: 1296, loss: 0.33066320419311523, mean loss: 0.3456977167221178
Epoch: 34, step: 1297, loss: 0.3711332678794861, mean loss: 0.3456982214558392
Epoch: 34, step: 1298, loss: 0.30448219180107117, mean loss: 0.3456974035963362
Epoch: 34, step: 1299, loss: 0.3443964719772339, mean loss: 0.34569737778215215
Epoch: 34, step: 1300, loss: 0.3388347625732422, mean loss: 0.34569724161104654
Epoch: 34, step: 1301, loss: 0.2992939352989197, mean loss: 0.3456963208739873
Epoch: 34, step: 1302, loss: 0.30846452713012695, mean loss: 0.34569558213326335
Epoch: 34, step: 1303, loss: 0.35944682359695435, mean loss: 0.3456958549753559
Epoch: 34, step: 1304, loss: 0.351777583360672, mean loss: 0.3456959756421757
Epoch: 34, step: 1305, loss: 0.3714205324649811, mean loss: 0.3456964860297957
Epoch: 34, step: 1306, loss: 0.3320751190185547, mean loss: 0.34569621578066345
Epoch: 34, step: 1307, loss: 0.32621222734451294, mean loss: 0.3456958292242704
Epoch: 34, step: 1308, loss: 0.3270550072193146, mean loss: 0.34569545940337953
Epoch: 34, step: 1309, loss: 0.3135931193828583, mean loss: 0.34569482252800715
Epoch: 34, step: 1310, loss: 0.34855902194976807, mean loss: 0.3456948793494689
Epoch: 34, step: 1311, loss: 0.32828831672668457, mean loss: 0.34569453403597455
Epoch: 34, step: 1312, loss: 0.3287737965583801, mean loss: 0.3456941983669972
Epoch: 34, step: 1313, loss: 0.3296453058719635, mean loss: 0.34569387999975865
Epoch: 34, step: 1314, loss: 0.37497660517692566, mean loss: 0.3456944608794313
Epoch: 34, step: 1315, loss: 0.28816643357276917, mean loss: 0.3456933197220222
Epoch: 34, step: 1316, loss: 0.3015201985836029, mean loss: 0.34569244349721634
Epoch: 34, step: 1317, loss: 0.3339557349681854, mean loss: 0.34569221069068384
Epoch: 34, step: 1318, loss: 0.309731662273407, mean loss: 0.3456914974000279
Epoch: 34, step: 1319, loss: 0.3485261797904968, mean loss: 0.34569155362587667
Epoch: 34, step: 1320, loss: 0.38777101039886475, mean loss: 0.34569238825421184
Epoch: 34, step: 1321, loss: 0.354436993598938, mean loss: 0.3456925616963425
Epoch: 34, step: 1322, loss: 0.32331037521362305, mean loss: 0.34569211777269304
Epoch: 34, step: 1323, loss: 0.303175687789917, mean loss: 0.3456912745273542
Epoch: 34, step: 1324, loss: 0.3140970468521118, mean loss: 0.34569064791884435
Epoch: 34, step: 1325, loss: 0.3940662443637848, mean loss: 0.3456916073333151
Epoch: 34, step: 1326, loss: 0.312348335981369, mean loss: 0.3456909460622414
Epoch: 34, step: 1327, loss: 0.3172541558742523, mean loss: 0.34569038210876313
Epoch: 34, step: 1328, loss: 0.3653058707714081, mean loss: 0.3456907711120088
Epoch: 34, step: 1329, loss: 0.38263756036758423, mean loss: 0.3456915038052475
Epoch: 34, step: 1330, loss: 0.2849147617816925, mean loss: 0.34569029856317435
Epoch: 34, step: 1331, loss: 0.37494733929634094, mean loss: 0.3456908787376951
Epoch: 34, step: 1332, loss: 0.32307255268096924, mean loss: 0.34569043021946044
Epoch: 34, step: 1333, loss: 0.32096707820892334, mean loss: 0.34568993996857783
Epoch: 34, step: 1334, loss: 0.3026025593280792, mean loss: 0.345689085585745
Epoch: 34, step: 1335, loss: 0.34019821882247925, mean loss: 0.3456889767091039
Epoch: 34, step: 1336, loss: 0.3660212457180023, mean loss: 0.3456893798631699
Epoch: 34, step: 1337, loss: 0.340122789144516, mean loss: 0.3456892694893998
Epoch: 34, step: 1338, loss: 0.3507058024406433, mean loss: 0.34568936895471064
Epoch: 34, step: 1339, loss: 0.3572171628475189, mean loss: 0.3456895975175208
Epoch: 34, step: 1340, loss: 0.3328895568847656, mean loss: 0.3456893437347694
Epoch: 34, step: 1341, loss: 0.3225362002849579, mean loss: 0.3456888846931054
Epoch: 34, step: 1342, loss: 0.32974910736083984, mean loss: 0.3456885686722221
Epoch: 34, step: 1343, loss: 0.3546815514564514, mean loss: 0.3456887469629196
Epoch: 34, step: 1344, loss: 0.31298089027404785, mean loss: 0.3456880985250082
Epoch: 34, step: 1345, loss: 0.35450467467308044, mean loss: 0.34568827331141927
Epoch: 34, step: 1346, loss: 0.32956212759017944, mean loss: 0.3456879536209623
Epoch: 34, step: 1347, loss: 0.324746698141098, mean loss: 0.3456875384822841
Epoch: 34, step: 1348, loss: 0.3998384177684784, mean loss: 0.3456886119460424
Epoch: 34, step: 1349, loss: 0.32379889488220215, mean loss: 0.3456881780223009
Epoch: 34, step: 1350, loss: 0.3321681320667267, mean loss: 0.34568791001734606
Epoch: 34, step: 1351, loss: 0.33570483326911926, mean loss: 0.34568771212889166
Epoch: 34, step: 1352, loss: 0.2960715889930725, mean loss: 0.34568672863817557
Epoch: 34, step: 1353, loss: 0.3435874581336975, mean loss: 0.3456866870272637
Epoch: 34, step: 1354, loss: 0.369393527507782, mean loss: 0.3456871569255904
Epoch: 34, step: 1355, loss: 0.3244168162345886, mean loss: 0.34568673533000066
Epoch: 34, step: 1356, loss: 0.3666435182094574, mean loss: 0.3456871507023844
Epoch: 34, step: 1357, loss: 0.3521811068058014, mean loss: 0.3456872794128158
Epoch: 34, step: 1358, loss: 0.3579769432544708, mean loss: 0.3456875229895444
Epoch: 34, step: 1359, loss: 0.32300713658332825, mean loss: 0.3456870734813312
Epoch: 34, step: 1360, loss: 0.32905805110931396, mean loss: 0.3456867439131371
Epoch: 34, step: 1361, loss: 0.33651164174079895, mean loss: 0.3456865620767153
Epoch: 34, step: 1362, loss: 0.32415294647216797, mean loss: 0.34568613532201137
Epoch: 34, step: 1363, loss: 0.3609373867511749, mean loss: 0.34568643756639167
Epoch: 34, step: 1364, loss: 0.2842008173465729, mean loss: 0.34568521908835476
Epoch: 34, step: 1365, loss: 0.31093671917915344, mean loss: 0.3456845304810877
Epoch: 34, step: 1366, loss: 0.3260827660560608, mean loss: 0.34568414204273834
Epoch: 34, step: 1367, loss: 0.3410637676715851, mean loss: 0.3456840504849076
Epoch: 34, step: 1368, loss: 0.32212212681770325, mean loss: 0.34568358358857015
Epoch: 34, step: 1369, loss: 0.3274119794368744, mean loss: 0.34568322153086495
Epoch: 34, step: 1370, loss: 0.3439186215400696, mean loss: 0.34568318656544217
Epoch: 34, step: 1371, loss: 0.3031756281852722, mean loss: 0.3456823442978988
Epoch: 34, step: 1372, loss: 0.3492266535758972, mean loss: 0.34568241452535087
Epoch: 34, step: 1373, loss: 0.3130964934825897, mean loss: 0.3456817688760336
Epoch: 34, step: 1374, loss: 0.3842003345489502, mean loss: 0.3456825320581713
Epoch: 34, step: 1375, loss: 0.3163330554962158, mean loss: 0.34568195055800166
Epoch: 34, step: 1376, loss: 0.3368057310581207, mean loss: 0.3456817746972543
Epoch: 34, step: 1377, loss: 0.34032294154167175, mean loss: 0.34568166852708443
Epoch: 34, step: 1378, loss: 0.3504723906517029, mean loss: 0.34568176343985557
Epoch: 34, step: 1379, loss: 0.32133597135543823, mean loss: 0.3456812811157395
Epoch: 34, step: 1380, loss: 0.34915339946746826, mean loss: 0.34568134990188665
Epoch: 34, step: 1381, loss: 0.33074137568473816, mean loss: 0.3456810539318756
Epoch: 34, step: 1382, loss: 0.32658541202545166, mean loss: 0.34568067564304444
Epoch: 34, step: 1383, loss: 0.3233512341976166, mean loss: 0.345680233300702
Epoch: 34, step: 1384, loss: 0.3737863004207611, mean loss: 0.34568079006596264
Epoch: 34, step: 1385, loss: 0.3067430555820465, mean loss: 0.3456800187467898
Epoch: 34, step: 1386, loss: 0.32860010862350464, mean loss: 0.3456796804168545
Epoch: 34, step: 1387, loss: 0.33003315329551697, mean loss: 0.3456793704864385
Epoch: 34, step: 1388, loss: 0.33086729049682617, mean loss: 0.3456790770907766
Epoch: 34, step: 1389, loss: 0.41367778182029724, mean loss: 0.3456804239731743
Epoch: 34, step: 1390, loss: 0.31947773694992065, mean loss: 0.3456799049744811
Epoch: 34, step: 1391, loss: 0.3731452226638794, mean loss: 0.3456804489714247
Epoch: 34, step: 1392, loss: 0.3143654763698578, mean loss: 0.34567982873785696
Epoch: 34, step: 1393, loss: 0.3340342342853546, mean loss: 0.3456795980863527
Epoch: 34, step: 1394, loss: 0.3625362515449524, mean loss: 0.3456799319409695
Epoch: 34, step: 1395, loss: 0.3335103690624237, mean loss: 0.34567969092134504
Epoch: 34, step: 1396, loss: 0.3239419162273407, mean loss: 0.34567926041068625
Epoch: 34, step: 1397, loss: 0.3292507827281952, mean loss: 0.34567893505564046
Epoch: 34, step: 1398, loss: 0.33005979657173157, mean loss: 0.3456786257351437
Epoch: 34, step: 1399, loss: 0.32549920678138733, mean loss: 0.34567822611103577
Epoch: 34, step: 1400, loss: 0.32125747203826904, mean loss: 0.345677742503018
Epoch: 34, step: 1401, loss: 0.34113216400146484, mean loss: 0.3456776524879976
Epoch: 34, step: 1402, loss: 0.3842878043651581, mean loss: 0.34567841706060054
Epoch: 34, step: 1403, loss: 0.30866384506225586, mean loss: 0.3456776840987788
Epoch: 34, step: 1404, loss: 0.31555911898612976, mean loss: 0.34567708770335864
Epoch: 34, step: 1405, loss: 0.33897122740745544, mean loss: 0.3456769549193046
Epoch: 34, step: 1406, loss: 0.3114597499370575, mean loss: 0.3456762773911383
Epoch: 34, step: 1407, loss: 0.31157663464546204, mean loss: 0.34567560220416804
Epoch: 34, step: 1408, loss: 0.3226577341556549, mean loss: 0.3456751464499249
Epoch: 34, step: 1409, loss: 0.31493982672691345, mean loss: 0.3456745379020351
Epoch: 34, step: 1410, loss: 0.34916678071022034, mean loss: 0.3456746070457738
Epoch: 34, step: 1411, loss: 0.33924126625061035, mean loss: 0.34567447967306464
Epoch: 34, step: 1412, loss: 0.3024059236049652, mean loss: 0.34567362302264454
Epoch: 34, step: 1413, loss: 0.33100754022598267, mean loss: 0.3456733326626604
Epoch: 34, step: 1414, loss: 0.3353111147880554, mean loss: 0.3456731275149129
Epoch: 34, step: 1415, loss: 0.33253636956214905, mean loss: 0.3456728674428914
Epoch: 34, step: 1416, loss: 0.3398095369338989, mean loss: 0.34567275136721765
Epoch: 34, step: 1417, loss: 0.3535173833370209, mean loss: 0.34567290666341216
Epoch: 34, step: 1418, loss: 0.32097867131233215, mean loss: 0.34567241781385555
Epoch: 34, step: 1419, loss: 0.4118272662162781, mean loss: 0.34567372739593655
Epoch: 34, step: 1420, loss: 0.33490121364593506, mean loss: 0.34567351415061814
Epoch: 34, step: 1421, loss: 0.3084719777107239, mean loss: 0.34567277774901
Epoch: 34, step: 1422, loss: 0.3029063045978546, mean loss: 0.3456719312066566
Epoch: 34, step: 1423, loss: 0.32302626967430115, mean loss: 0.3456714829552407
Epoch: 34, step: 1424, loss: 0.33265337347984314, mean loss: 0.34567122527804756
Epoch: 34, step: 1425, loss: 0.3846021592617035, mean loss: 0.3456719958519358
Epoch: 34, step: 1426, loss: 0.3110881745815277, mean loss: 0.3456713113355518
Epoch: 34, step: 1427, loss: 0.37851056456565857, mean loss: 0.34567196130889577
Epoch: 34, step: 1428, loss: 0.35984134674072266, mean loss: 0.3456722417519523
Epoch: 34, step: 1429, loss: 0.3528696298599243, mean loss: 0.34567238420114893
Epoch: 34, step: 1430, loss: 0.3196164071559906, mean loss: 0.3456718685169198
Epoch: 34, step: 1431, loss: 0.3239459991455078, mean loss: 0.3456714385400877
Epoch: 34, step: 1432, loss: 0.3294229805469513, mean loss: 0.3456711169731065
Epoch: 34, step: 1433, loss: 0.3357054889202118, mean loss: 0.3456709197510987
Epoch: 34, step: 1434, loss: 0.32941269874572754, mean loss: 0.34567059800363664
Epoch: 34, step: 1435, loss: 0.334701269865036, mean loss: 0.3456703809267717
Epoch: 34, step: 1436, loss: 0.31080278754234314, mean loss: 0.3456696909302668
Epoch: 34, step: 1437, loss: 0.3241969347000122, mean loss: 0.34566926601325587
Epoch: 34, step: 1438, loss: 0.30472931265830994, mean loss: 0.34566845588258693
Epoch: 34, step: 1439, loss: 0.30961093306541443, mean loss: 0.345667742380869
Epoch: 34, step: 1440, loss: 0.38286450505256653, mean loss: 0.34566847841115717
Epoch: 34, step: 1441, loss: 0.28722622990608215, mean loss: 0.34566732200907346
Epoch: 34, step: 1442, loss: 0.29545727372169495, mean loss: 0.3456663285179421
Epoch: 34, step: 1443, loss: 0.3753047585487366, mean loss: 0.34566691495304364
Valid: 34, mean loss: 0.18538438777128854
Epoch: 35, step: 0, loss: 0.28757014870643616, mean loss: 0.34566576545528443
Epoch: 35, step: 1, loss: 0.35580265522003174, mean loss: 0.3456659660189694
Epoch: 35, step: 2, loss: 0.3119085431098938, mean loss: 0.34566529812385216
Epoch: 35, step: 3, loss: 0.34162452816963196, mean loss: 0.3456652181782611
Epoch: 35, step: 4, loss: 0.3560730516910553, mean loss: 0.3456654240904881
Epoch: 35, step: 5, loss: 0.37468084692955017, mean loss: 0.34566599813042875
Epoch: 35, step: 6, loss: 0.31593436002731323, mean loss: 0.34566540993255146
Epoch: 35, step: 7, loss: 0.3073613941669464, mean loss: 0.34566465215745124
Epoch: 35, step: 8, loss: 0.32379403710365295, mean loss: 0.34566421949577536
Epoch: 35, step: 9, loss: 0.3891168236732483, mean loss: 0.34566507909229716
Epoch: 35, step: 10, loss: 0.31678467988967896, mean loss: 0.3456645077801727
Epoch: 35, step: 11, loss: 0.30397310853004456, mean loss: 0.3456636830571301
Epoch: 35, step: 12, loss: 0.31539374589920044, mean loss: 0.3456630842808526
Epoch: 35, step: 13, loss: 0.3253519535064697, mean loss: 0.3456626825098597
Epoch: 35, step: 14, loss: 0.3233701288700104, mean loss: 0.3456622415534036
Epoch: 35, step: 15, loss: 0.3333258628845215, mean loss: 0.3456619975392674
Epoch: 35, step: 16, loss: 0.36564797163009644, mean loss: 0.3456623928549327
Epoch: 35, step: 17, loss: 0.3226894736289978, mean loss: 0.3456619384675118
Epoch: 35, step: 18, loss: 0.31353551149368286, mean loss: 0.3456613030430182
Epoch: 35, step: 19, loss: 0.37027499079704285, mean loss: 0.34566178986437407
Epoch: 35, step: 20, loss: 0.30639466643333435, mean loss: 0.3456610132356794
Epoch: 35, step: 21, loss: 0.34804436564445496, mean loss: 0.3456610603729051
Epoch: 35, step: 22, loss: 0.3560461699962616, mean loss: 0.34566126576241174
Epoch: 35, step: 23, loss: 0.32967305183410645, mean loss: 0.3456609495648418
Epoch: 35, step: 24, loss: 0.2751045227050781, mean loss: 0.3456595542038834
Epoch: 35, step: 25, loss: 0.34208613634109497, mean loss: 0.3456594835354923
Epoch: 35, step: 26, loss: 0.403219997882843, mean loss: 0.34566062183743523
Epoch: 35, step: 27, loss: 0.3245770037174225, mean loss: 0.34566020490146543
Epoch: 35, step: 28, loss: 0.31692296266555786, mean loss: 0.34565963662362253
Epoch: 35, step: 29, loss: 0.33722594380378723, mean loss: 0.34565946985097434
Epoch: 35, step: 30, loss: 0.3619844913482666, mean loss: 0.3456597926648696
Epoch: 35, step: 31, loss: 0.3405667543411255, mean loss: 0.3456596919562102
Epoch: 35, step: 32, loss: 0.33728039264678955, mean loss: 0.3456595262689995
Epoch: 35, step: 33, loss: 0.30688753724098206, mean loss: 0.34565875963023196
Epoch: 35, step: 34, loss: 0.3479035496711731, mean loss: 0.345658804015601
Epoch: 35, step: 35, loss: 0.3521218001842499, mean loss: 0.34565893180340884
Epoch: 35, step: 36, loss: 0.32387983798980713, mean loss: 0.34565850119080205
Epoch: 35, step: 37, loss: 0.33652785420417786, mean loss: 0.34565832066474356
Epoch: 35, step: 38, loss: 0.31899309158325195, mean loss: 0.3456577934651334
Epoch: 35, step: 39, loss: 0.3381688594818115, mean loss: 0.3456576454039633
Epoch: 35, step: 40, loss: 0.3349497318267822, mean loss: 0.34565743370562646
Epoch: 35, step: 41, loss: 0.32132279872894287, mean loss: 0.3456569526128469
Epoch: 35, step: 42, loss: 0.33009806275367737, mean loss: 0.34565664502156407
Epoch: 35, step: 43, loss: 0.32723820209503174, mean loss: 0.3456562809055802
Epoch: 35, step: 44, loss: 0.32701611518859863, mean loss: 0.34565591241362176
Epoch: 35, step: 45, loss: 0.36446455121040344, mean loss: 0.3456562842287247
Epoch: 35, step: 46, loss: 0.3475421369075775, mean loss: 0.3456563215081182
Epoch: 35, step: 47, loss: 0.3194149136543274, mean loss: 0.3456558027802014
Epoch: 35, step: 48, loss: 0.3079070746898651, mean loss: 0.3456550565956931
Epoch: 35, step: 49, loss: 0.3528103232383728, mean loss: 0.34565519803207667
Epoch: 35, step: 50, loss: 0.34821343421936035, mean loss: 0.34565524859909824
Epoch: 35, step: 51, loss: 0.38932907581329346, mean loss: 0.34565611185469625
Epoch: 35, step: 52, loss: 0.31180325150489807, mean loss: 0.34565544273326937
Epoch: 35, step: 53, loss: 0.3214705288410187, mean loss: 0.3456549647138621
Epoch: 35, step: 54, loss: 0.3544733226299286, mean loss: 0.34565513900693284
Epoch: 35, step: 55, loss: 0.31849291920661926, mean loss: 0.34565460216173166
Epoch: 35, step: 56, loss: 0.35141414403915405, mean loss: 0.34565471599341885
Epoch: 35, step: 57, loss: 0.31701746582984924, mean loss: 0.3456541500174877
Epoch: 35, step: 58, loss: 0.3489615321159363, mean loss: 0.3456542153820621
Epoch: 35, step: 59, loss: 0.3480209708213806, mean loss: 0.345654262155885
Epoch: 35, step: 60, loss: 0.3432518243789673, mean loss: 0.3456542146778159
Epoch: 35, step: 61, loss: 0.3175834119319916, mean loss: 0.34565365994079467
Epoch: 35, step: 62, loss: 0.33998605608940125, mean loss: 0.3456535479394538
Epoch: 35, step: 63, loss: 0.3430393636226654, mean loss: 0.3456534962798159
Epoch: 35, step: 64, loss: 0.3070096969604492, mean loss: 0.345652732643825
Epoch: 35, step: 65, loss: 0.32473522424697876, mean loss: 0.3456523193033437
Epoch: 35, step: 66, loss: 0.33774158358573914, mean loss: 0.34565216298631807
Epoch: 35, step: 67, loss: 0.36087119579315186, mean loss: 0.34565246371017216
Epoch: 35, step: 68, loss: 0.3266805410385132, mean loss: 0.34565208883766585
Epoch: 35, step: 69, loss: 0.32762011885643005, mean loss: 0.3456517325450363
Epoch: 35, step: 70, loss: 0.3591414988040924, mean loss: 0.3456519990832643
Epoch: 35, step: 71, loss: 0.33570951223373413, mean loss: 0.34565180263801715
Epoch: 35, step: 72, loss: 0.3377079665660858, mean loss: 0.34565164568553314
Epoch: 35, step: 73, loss: 0.35641124844551086, mean loss: 0.34565185826708683
Epoch: 35, step: 74, loss: 0.36587759852409363, mean loss: 0.3456522578668153
Epoch: 35, step: 75, loss: 0.3295991122722626, mean loss: 0.3456519407112599
Epoch: 35, step: 76, loss: 0.3344272971153259, mean loss: 0.3456517189548619
Epoch: 35, step: 77, loss: 0.3546857535839081, mean loss: 0.34565189742960667
Epoch: 35, step: 78, loss: 0.2964995801448822, mean loss: 0.34565092640455114
Epoch: 35, step: 79, loss: 0.30510303378105164, mean loss: 0.3456501253794104
Epoch: 35, step: 80, loss: 0.3190437853336334, mean loss: 0.3456495997805474
Epoch: 35, step: 81, loss: 0.3483087718486786, mean loss: 0.3456496523105159
Epoch: 35, step: 82, loss: 0.3329944908618927, mean loss: 0.3456494023221421
Epoch: 35, step: 83, loss: 0.31412044167518616, mean loss: 0.34564877951555534
Epoch: 35, step: 84, loss: 0.2956813871860504, mean loss: 0.3456477925053365
Epoch: 35, step: 85, loss: 0.32893481850624084, mean loss: 0.34564746237903776
Epoch: 35, step: 86, loss: 0.3294523060321808, mean loss: 0.34564714248735257
Epoch: 35, step: 87, loss: 0.31955522298812866, mean loss: 0.345646627121952
Epoch: 35, step: 88, loss: 0.29974526166915894, mean loss: 0.34564572049994774
Epoch: 35, step: 89, loss: 0.34519729018211365, mean loss: 0.34564571164293967
Epoch: 35, step: 90, loss: 0.34236645698547363, mean loss: 0.3456456468752152
Epoch: 35, step: 91, loss: 0.3767976760864258, mean loss: 0.3456462621388669
Epoch: 35, step: 92, loss: 0.3569674491882324, mean loss: 0.34564648573191986
Epoch: 35, step: 93, loss: 0.33190587162971497, mean loss: 0.3456462143606258
Epoch: 35, step: 94, loss: 0.34300100803375244, mean loss: 0.3456461621199558
Epoch: 35, step: 95, loss: 0.3303510546684265, mean loss: 0.3456458600600093
Epoch: 35, step: 96, loss: 0.32657963037490845, mean loss: 0.3456454835323776
Epoch: 35, step: 97, loss: 0.33447083830833435, mean loss: 0.3456452628553125
Epoch: 35, step: 98, loss: 0.3114285469055176, mean loss: 0.34564458715642526
Epoch: 35, step: 99, loss: 0.3224351406097412, mean loss: 0.3456441288340211
Epoch: 35, step: 100, loss: 0.3269653618335724, mean loss: 0.34564375998729613
Epoch: 35, step: 101, loss: 0.36537256836891174, mean loss: 0.3456441495613331
Epoch: 35, step: 102, loss: 0.3765251934528351, mean loss: 0.34564475934045147
Epoch: 35, step: 103, loss: 0.35081592202186584, mean loss: 0.3456448614485528
Epoch: 35, step: 104, loss: 0.3601885735988617, mean loss: 0.345645148618306
Epoch: 35, step: 105, loss: 0.3565906882286072, mean loss: 0.34564536473684665
Epoch: 35, step: 106, loss: 0.40173304080963135, mean loss: 0.3456464721603085
Epoch: 35, step: 107, loss: 0.3130897581577301, mean loss: 0.3456458293567624
Epoch: 35, step: 108, loss: 0.3454149663448334, mean loss: 0.34564582479866623
Epoch: 35, step: 109, loss: 0.33432817459106445, mean loss: 0.3456456013504884
Epoch: 35, step: 110, loss: 0.33014053106307983, mean loss: 0.34564529523471005
Epoch: 35, step: 111, loss: 0.3264497220516205, mean loss: 0.34564491626501126
Epoch: 35, step: 112, loss: 0.3532413840293884, mean loss: 0.3456450662357487
Epoch: 35, step: 113, loss: 0.34706616401672363, mean loss: 0.34564509429074497
Epoch: 35, step: 114, loss: 0.34117504954338074, mean loss: 0.345645006045858
Epoch: 35, step: 115, loss: 0.35058078169822693, mean loss: 0.3456451034829958
Epoch: 35, step: 116, loss: 0.3282371461391449, mean loss: 0.34564475983932674
Epoch: 35, step: 117, loss: 0.32336166501045227, mean loss: 0.345644319966161
Epoch: 35, step: 118, loss: 0.2812163829803467, mean loss: 0.34564304816969865
Epoch: 35, step: 119, loss: 0.37703701853752136, mean loss: 0.34564366786907424
Epoch: 35, step: 120, loss: 0.29437455534935, mean loss: 0.34564265586551096
Epoch: 35, step: 121, loss: 0.31457605957984924, mean loss: 0.3456420426525252
Epoch: 35, step: 122, loss: 0.3257003426551819, mean loss: 0.34564164903785577
Epoch: 35, step: 123, loss: 0.399445116519928, mean loss: 0.34564271100429117
Epoch: 35, step: 124, loss: 0.30745795369148254, mean loss: 0.3456419573329734
Epoch: 35, step: 125, loss: 0.3267778158187866, mean loss: 0.34564158500949194
Epoch: 35, step: 126, loss: 0.3771592974662781, mean loss: 0.34564220706551374
Epoch: 35, step: 127, loss: 0.3049454092979431, mean loss: 0.345641403860379
Epoch: 35, step: 128, loss: 0.2676803171634674, mean loss: 0.3456398652255787
Epoch: 35, step: 129, loss: 0.3152712881565094, mean loss: 0.34563926588519844
Epoch: 35, step: 130, loss: 0.36620739102363586, mean loss: 0.3456396718003203
Epoch: 35, step: 131, loss: 0.29151979088783264, mean loss: 0.34563860375720157
Epoch: 35, step: 132, loss: 0.3752139210700989, mean loss: 0.3456391874076133
Epoch: 35, step: 133, loss: 0.3158959746360779, mean loss: 0.34563860045547273
Epoch: 35, step: 134, loss: 0.3289441168308258, mean loss: 0.34563827101327
Epoch: 35, step: 135, loss: 0.2998209297657013, mean loss: 0.3456373668901891
Epoch: 35, step: 136, loss: 0.3937571048736572, mean loss: 0.34563831642820403
Epoch: 35, step: 137, loss: 0.34894129633903503, mean loss: 0.3456383816040182
Epoch: 35, step: 138, loss: 0.33664554357528687, mean loss: 0.3456382041569883
Epoch: 35, step: 139, loss: 0.33688443899154663, mean loss: 0.3456380314307617
Epoch: 35, step: 140, loss: 0.31333863735198975, mean loss: 0.3456373941230117
Epoch: 35, step: 141, loss: 0.30992069840431213, mean loss: 0.3456366894014988
Epoch: 35, step: 142, loss: 0.31842052936553955, mean loss: 0.3456361524135534
Epoch: 35, step: 143, loss: 0.3550161123275757, mean loss: 0.3456363374810286
Epoch: 35, step: 144, loss: 0.38216546177864075, mean loss: 0.34563705818980434
Epoch: 35, step: 145, loss: 0.32432809472084045, mean loss: 0.345636637778577
Epoch: 35, step: 146, loss: 0.3243405222892761, mean loss: 0.3456362176291207
Epoch: 35, step: 147, loss: 0.308120459318161, mean loss: 0.3456354774981566
Epoch: 35, step: 148, loss: 0.34750866889953613, mean loss: 0.3456355144527503
Epoch: 35, step: 149, loss: 0.3458896279335022, mean loss: 0.3456355194658393
Epoch: 35, step: 150, loss: 0.31109654903411865, mean loss: 0.34563483810286694
Epoch: 35, step: 151, loss: 0.3033897280693054, mean loss: 0.3456340047344847
Epoch: 35, step: 152, loss: 0.34698009490966797, mean loss: 0.345634031288253
Epoch: 35, step: 153, loss: 0.355356901884079, mean loss: 0.34563422308354624
Epoch: 35, step: 154, loss: 0.3524678349494934, mean loss: 0.3456343578820839
Epoch: 35, step: 155, loss: 0.33881425857543945, mean loss: 0.3456342233527462
Epoch: 35, step: 156, loss: 0.30078718066215515, mean loss: 0.3456333387433474
Epoch: 35, step: 157, loss: 0.335758239030838, mean loss: 0.3456331439605214
Epoch: 35, step: 158, loss: 0.32231399416923523, mean loss: 0.3456326840076665
Epoch: 35, step: 159, loss: 0.334025114774704, mean loss: 0.3456324550615278
Epoch: 35, step: 160, loss: 0.3167116940021515, mean loss: 0.3456318846435664
Epoch: 35, step: 161, loss: 0.3271642029285431, mean loss: 0.34563152040385764
Epoch: 35, step: 162, loss: 0.2929529547691345, mean loss: 0.34563048144037156
Epoch: 35, step: 163, loss: 0.2891981601715088, mean loss: 0.3456293684646444
Epoch: 35, step: 164, loss: 0.3890519142150879, mean loss: 0.34563022484065764
Epoch: 35, step: 165, loss: 0.3134008049964905, mean loss: 0.34562958922712383
Epoch: 35, step: 166, loss: 0.355211079120636, mean loss: 0.3456297781850565
Epoch: 35, step: 167, loss: 0.30553534626960754, mean loss: 0.34562898749262305
Epoch: 35, step: 168, loss: 0.31278395652770996, mean loss: 0.3456283397766167
Epoch: 35, step: 169, loss: 0.328365296125412, mean loss: 0.3456279993498044
Epoch: 35, step: 170, loss: 0.2931770086288452, mean loss: 0.3456269650379052
Epoch: 35, step: 171, loss: 0.3553640842437744, mean loss: 0.3456271570460927
Epoch: 35, step: 172, loss: 0.32100021839141846, mean loss: 0.34562667143217407
Epoch: 35, step: 173, loss: 0.31557533144950867, mean loss: 0.3456260788672022
Epoch: 35, step: 174, loss: 0.3266480565071106, mean loss: 0.34562570465794734
Epoch: 35, step: 175, loss: 0.30480024218559265, mean loss: 0.3456248996760388
Epoch: 35, step: 176, loss: 0.30006682872772217, mean loss: 0.3456240013959562
Epoch: 35, step: 177, loss: 0.2937370538711548, mean loss: 0.34562297834797473
Epoch: 35, step: 178, loss: 0.3875277042388916, mean loss: 0.34562380456154146
Epoch: 35, step: 179, loss: 0.3159726560115814, mean loss: 0.3456232199568776
Epoch: 35, step: 180, loss: 0.3692258596420288, mean loss: 0.34562368529943166
Epoch: 35, step: 181, loss: 0.36418700218200684, mean loss: 0.34562405128099555
Epoch: 35, step: 182, loss: 0.3147898316383362, mean loss: 0.34562344338675344
Epoch: 35, step: 183, loss: 0.3246934115886688, mean loss: 0.34562303076093925
Epoch: 35, step: 184, loss: 0.32374107837677, mean loss: 0.34562259937695927
Epoch: 35, step: 185, loss: 0.30664145946502686, mean loss: 0.34562183091226834
Epoch: 35, step: 186, loss: 0.36838579177856445, mean loss: 0.3456222796665977
Epoch: 35, step: 187, loss: 0.3333669900894165, mean loss: 0.3456220380783313
Epoch: 35, step: 188, loss: 0.4124939441680908, mean loss: 0.34562335629682744
Epoch: 35, step: 189, loss: 0.3202541768550873, mean loss: 0.34562285621444144
Epoch: 35, step: 190, loss: 0.32304680347442627, mean loss: 0.345622411199505
Epoch: 35, step: 191, loss: 0.3189702033996582, mean loss: 0.34562188584651676
Epoch: 35, step: 192, loss: 0.37036675214767456, mean loss: 0.3456223735934724
Epoch: 35, step: 193, loss: 0.3614102900028229, mean loss: 0.34562268478353053
Epoch: 35, step: 194, loss: 0.306065171957016, mean loss: 0.3456219050946998
Epoch: 35, step: 195, loss: 0.3148255944252014, mean loss: 0.34562129810339837
Epoch: 35, step: 196, loss: 0.344731867313385, mean loss: 0.34562128057317804
Epoch: 35, step: 197, loss: 0.3568078577518463, mean loss: 0.3456215010504767
Epoch: 35, step: 198, loss: 0.35241708159446716, mean loss: 0.3456216349825712
Epoch: 35, step: 199, loss: 0.33565273880958557, mean loss: 0.3456214385124062
Epoch: 35, step: 200, loss: 0.32240286469459534, mean loss: 0.3456209809224135
Epoch: 35, step: 201, loss: 0.3181675672531128, mean loss: 0.3456204398831626
Epoch: 35, step: 202, loss: 0.32710105180740356, mean loss: 0.34562007491877195
Epoch: 35, step: 203, loss: 0.3216989040374756, mean loss: 0.34561960350991805
Epoch: 35, step: 204, loss: 0.31374889612197876, mean loss: 0.3456189754538064
Epoch: 35, step: 205, loss: 0.34897977113723755, mean loss: 0.34561904168160135
Epoch: 35, step: 206, loss: 0.3587498068809509, mean loss: 0.34561930043118655
Epoch: 35, step: 207, loss: 0.3393040597438812, mean loss: 0.34561917598804226
Epoch: 35, step: 208, loss: 0.33622488379478455, mean loss: 0.34561899087518894
Epoch: 35, step: 209, loss: 0.3310684263706207, mean loss: 0.3456187041645583
Epoch: 35, step: 210, loss: 0.3119754195213318, mean loss: 0.3456180412557557
Epoch: 35, step: 211, loss: 0.34543946385383606, mean loss: 0.3456180377371278
Epoch: 35, step: 212, loss: 0.35488060116767883, mean loss: 0.34561822023990457
Epoch: 35, step: 213, loss: 0.31498584151268005, mean loss: 0.3456176166938052
Epoch: 35, step: 214, loss: 0.3305733799934387, mean loss: 0.3456173202848465
Epoch: 35, step: 215, loss: 0.3264961242675781, mean loss: 0.3456169435570504
Epoch: 35, step: 216, loss: 0.3049463629722595, mean loss: 0.3456161422768214
Epoch: 35, step: 217, loss: 0.39290332794189453, mean loss: 0.3456170738971702
Epoch: 35, step: 218, loss: 0.346785306930542, mean loss: 0.3456170969124588
Epoch: 35, step: 219, loss: 0.31471535563468933, mean loss: 0.34561648813110973
Epoch: 35, step: 220, loss: 0.29004180431365967, mean loss: 0.3456153933007514
Epoch: 35, step: 221, loss: 0.3337642550468445, mean loss: 0.34561515983598934
Epoch: 35, step: 222, loss: 0.3392011821269989, mean loss: 0.345615033484558
Epoch: 35, step: 223, loss: 0.35671988129615784, mean loss: 0.3456152522389472
Epoch: 35, step: 224, loss: 0.3628137707710266, mean loss: 0.3456155910258778
Epoch: 35, step: 225, loss: 0.32525983452796936, mean loss: 0.3456151900536425
Epoch: 35, step: 226, loss: 0.34757184982299805, mean loss: 0.3456152285956042
Epoch: 35, step: 227, loss: 0.3062518537044525, mean loss: 0.3456144532376052
Epoch: 35, step: 228, loss: 0.36688676476478577, mean loss: 0.3456148722395853
Epoch: 35, step: 229, loss: 0.31177523732185364, mean loss: 0.3456142057114207
Epoch: 35, step: 230, loss: 0.33099839091300964, mean loss: 0.3456139178341916
Epoch: 35, step: 231, loss: 0.3070094883441925, mean loss: 0.34561315748538735
Epoch: 35, step: 232, loss: 0.35735464096069336, mean loss: 0.34561338873986264
Epoch: 35, step: 233, loss: 0.35354673862457275, mean loss: 0.34561354498813707
Epoch: 35, step: 234, loss: 0.36813631653785706, mean loss: 0.34561398856807896
Epoch: 35, step: 235, loss: 0.30439817905426025, mean loss: 0.345613176849757
Epoch: 35, step: 236, loss: 0.334632009267807, mean loss: 0.34561296058712665
Epoch: 35, step: 237, loss: 0.3327663540840149, mean loss: 0.3456127075916069
Epoch: 35, step: 238, loss: 0.2832130491733551, mean loss: 0.34561147874388604
Epoch: 35, step: 239, loss: 0.31598711013793945, mean loss: 0.34561089535734396
Epoch: 35, step: 240, loss: 0.3116288185119629, mean loss: 0.3456102261685362
Epoch: 35, step: 241, loss: 0.3113950192928314, mean loss: 0.34560955240210567
Epoch: 35, step: 242, loss: 0.30619266629219055, mean loss: 0.34560877621940456
Epoch: 35, step: 243, loss: 0.3181479275226593, mean loss: 0.34560823548120556
Epoch: 35, step: 244, loss: 0.3154429793357849, mean loss: 0.34560764150156303
Epoch: 35, step: 245, loss: 0.34957030415534973, mean loss: 0.3456077195282368
Epoch: 35, step: 246, loss: 0.3767516016960144, mean loss: 0.3456083327537112
Epoch: 35, step: 247, loss: 0.3206803500652313, mean loss: 0.3456078419294478
Epoch: 35, step: 248, loss: 0.34413769841194153, mean loss: 0.3456078129833469
Epoch: 35, step: 249, loss: 0.29750463366508484, mean loss: 0.3456068658839313
Epoch: 35, step: 250, loss: 0.3159288465976715, mean loss: 0.34560628156743256
Epoch: 35, step: 251, loss: 0.3643427789211273, mean loss: 0.345606650454213
Epoch: 35, step: 252, loss: 0.3257238268852234, mean loss: 0.3456062590061086
Epoch: 35, step: 253, loss: 0.3476843237876892, mean loss: 0.3456062999177277
Epoch: 35, step: 254, loss: 0.36933740973472595, mean loss: 0.34560676711154237
Epoch: 35, step: 255, loss: 0.3576565980911255, mean loss: 0.34560700433161834
Epoch: 35, step: 256, loss: 0.32833778858184814, mean loss: 0.34560666436634974
Epoch: 35, step: 257, loss: 0.3463388979434967, mean loss: 0.345606678780964
Epoch: 35, step: 258, loss: 0.3087092638015747, mean loss: 0.34560595243959946
Epoch: 35, step: 259, loss: 0.3182564675807953, mean loss: 0.34560541406391326
Epoch: 35, step: 260, loss: 0.3296733796596527, mean loss: 0.3456051004473623
Epoch: 35, step: 261, loss: 0.32986193895339966, mean loss: 0.34560479055480897
Epoch: 35, step: 262, loss: 0.32740092277526855, mean loss: 0.34560443223211584
Epoch: 35, step: 263, loss: 0.3337666094303131, mean loss: 0.34560419922245517
Epoch: 35, step: 264, loss: 0.3115358054637909, mean loss: 0.3456035286507839
Epoch: 35, step: 265, loss: 0.33284181356430054, mean loss: 0.34560327746558756
Epoch: 35, step: 266, loss: 0.3637889325618744, mean loss: 0.3456036354016022
Epoch: 35, step: 267, loss: 0.33144304156303406, mean loss: 0.345603356693646
Epoch: 35, step: 268, loss: 0.32864394783973694, mean loss: 0.3456030229061506
Epoch: 35, step: 269, loss: 0.3160567879676819, mean loss: 0.34560244140182195
Epoch: 35, step: 270, loss: 0.32246142625808716, mean loss: 0.3456019859686452
Epoch: 35, step: 271, loss: 0.3384120762348175, mean loss: 0.3456018444684143
Epoch: 35, step: 272, loss: 0.3279421925544739, mean loss: 0.345601496926409
Epoch: 35, step: 273, loss: 0.3214482367038727, mean loss: 0.3456010215995262
Epoch: 35, step: 274, loss: 0.3025931715965271, mean loss: 0.3456001752382155
Epoch: 35, step: 275, loss: 0.332625150680542, mean loss: 0.34559991990476624
Epoch: 35, step: 276, loss: 0.330160915851593, mean loss: 0.3455996160890342
Epoch: 35, step: 277, loss: 0.3006119430065155, mean loss: 0.34559873081859693
Epoch: 35, step: 278, loss: 0.32700115442276, mean loss: 0.3455983648614471
Epoch: 35, step: 279, loss: 0.3507591784000397, mean loss: 0.34559846641228414
Epoch: 35, step: 280, loss: 0.3336300253868103, mean loss: 0.3455982309104045
Epoch: 35, step: 281, loss: 0.2980862557888031, mean loss: 0.3455972960401687
Epoch: 35, step: 282, loss: 0.3295005261898041, mean loss: 0.3455969793180183
Epoch: 35, step: 283, loss: 0.31780916452407837, mean loss: 0.3455964325720952
Epoch: 35, step: 284, loss: 0.3538728356361389, mean loss: 0.345596595413277
Epoch: 35, step: 285, loss: 0.3245846629142761, mean loss: 0.3455961820041458
Epoch: 35, step: 286, loss: 0.29583197832107544, mean loss: 0.3455952029142195
Epoch: 35, step: 287, loss: 0.31987857818603516, mean loss: 0.3455946969603215
Epoch: 35, step: 288, loss: 0.3025624454021454, mean loss: 0.3455938503520554
Epoch: 35, step: 289, loss: 0.3044978678226471, mean loss: 0.34559304185348116
Epoch: 35, step: 290, loss: 0.4180113673210144, mean loss: 0.34559446654167275
Epoch: 35, step: 291, loss: 0.31125274300575256, mean loss: 0.34559379094906306
Epoch: 35, step: 292, loss: 0.3341517150402069, mean loss: 0.3455935658575692
Epoch: 35, step: 293, loss: 0.39007440209388733, mean loss: 0.3455944408789375
Epoch: 35, step: 294, loss: 0.3377837836742401, mean loss: 0.3455942872317022
Epoch: 35, step: 295, loss: 0.31113776564598083, mean loss: 0.34559360943404727
Epoch: 35, step: 296, loss: 0.3462142050266266, mean loss: 0.3455936216416046
Epoch: 35, step: 297, loss: 0.3456561267375946, mean loss: 0.3455936228711002
Epoch: 35, step: 298, loss: 0.3242551386356354, mean loss: 0.34559320314442904
Epoch: 35, step: 299, loss: 0.3158431351184845, mean loss: 0.34559261797393287
Epoch: 35, step: 300, loss: 0.33735963702201843, mean loss: 0.345592456038075
Epoch: 35, step: 301, loss: 0.3085598349571228, mean loss: 0.3455917276516802
Epoch: 35, step: 302, loss: 0.31006187200546265, mean loss: 0.3455910288365897
Epoch: 35, step: 303, loss: 0.30543357133865356, mean loss: 0.3455902390195514
Epoch: 35, step: 304, loss: 0.3051804006099701, mean loss: 0.34558944425431565
Epoch: 35, step: 305, loss: 0.3096235692501068, mean loss: 0.34558873690516323
Epoch: 35, step: 306, loss: 0.33950069546699524, mean loss: 0.34558861717260403
Epoch: 35, step: 307, loss: 0.3218259811401367, mean loss: 0.3455881498457469
Epoch: 35, step: 308, loss: 0.37578192353248596, mean loss: 0.34558874363861763
Epoch: 35, step: 309, loss: 0.32351964712142944, mean loss: 0.345588309634753
Epoch: 35, step: 310, loss: 0.35446295142173767, mean loss: 0.34558848415721644
Epoch: 35, step: 311, loss: 0.29319822788238525, mean loss: 0.34558745390754536
Epoch: 35, step: 312, loss: 0.3287602663040161, mean loss: 0.3455871230089238
Epoch: 35, step: 313, loss: 0.32731059193611145, mean loss: 0.3455867636167212
Epoch: 35, step: 314, loss: 0.3283329904079437, mean loss: 0.34558642434284037
Epoch: 35, step: 315, loss: 0.33987754583358765, mean loss: 0.3455863120870887
Epoch: 35, step: 316, loss: 0.33751609921455383, mean loss: 0.34558615340268195
Epoch: 35, step: 317, loss: 0.3025338649749756, mean loss: 0.3455853068831879
Epoch: 35, step: 318, loss: 0.35048118233680725, mean loss: 0.3455854031468866
Epoch: 35, step: 319, loss: 0.348265677690506, mean loss: 0.34558545584595357
Epoch: 35, step: 320, loss: 0.3951053321361542, mean loss: 0.3455864294775434
Epoch: 35, step: 321, loss: 0.31141796708106995, mean loss: 0.34558575768991423
Epoch: 35, step: 322, loss: 0.339016854763031, mean loss: 0.3455856285409665
Epoch: 35, step: 323, loss: 0.3050101101398468, mean loss: 0.34558483081529806
Epoch: 35, step: 324, loss: 0.3189111053943634, mean loss: 0.34558430641295024
Epoch: 35, step: 325, loss: 0.3406938314437866, mean loss: 0.3455842102686698
Epoch: 35, step: 326, loss: 0.2990754246711731, mean loss: 0.3455832959472906
Epoch: 35, step: 327, loss: 0.33495670557022095, mean loss: 0.3455830870420776
Epoch: 35, step: 328, loss: 0.3378189206123352, mean loss: 0.345582934411469
Epoch: 35, step: 329, loss: 0.3021591305732727, mean loss: 0.34558208078843305
Epoch: 35, step: 330, loss: 0.28454649448394775, mean loss: 0.3455808809774149
Epoch: 35, step: 331, loss: 0.3058334290981293, mean loss: 0.3455800996546464
Epoch: 35, step: 332, loss: 0.3576797842979431, mean loss: 0.3455803374956356
Epoch: 35, step: 333, loss: 0.29391610622406006, mean loss: 0.3455793219625289
Epoch: 35, step: 334, loss: 0.3123103082180023, mean loss: 0.3455786680261408
Epoch: 35, step: 335, loss: 0.33042505383491516, mean loss: 0.345578370172257
Epoch: 35, step: 336, loss: 0.3216818869113922, mean loss: 0.34557790048097686
Epoch: 35, step: 337, loss: 0.345539391040802, mean loss: 0.3455778997240792
Epoch: 35, step: 338, loss: 0.30970120429992676, mean loss: 0.34557719458648956
Epoch: 35, step: 339, loss: 0.34164777398109436, mean loss: 0.345577117357311
Epoch: 35, step: 340, loss: 0.3414745032787323, mean loss: 0.3455770367257574
Epoch: 35, step: 341, loss: 0.33509132266044617, mean loss: 0.34557683064671046
Epoch: 35, step: 342, loss: 0.3515610694885254, mean loss: 0.34557694825453317
Epoch: 35, step: 343, loss: 0.32509443163871765, mean loss: 0.34557654572099383
Epoch: 35, step: 344, loss: 0.33045512437820435, mean loss: 0.3455762485524502
Epoch: 35, step: 345, loss: 0.33351925015449524, mean loss: 0.3455760116110833
Epoch: 35, step: 346, loss: 0.32444196939468384, mean loss: 0.34557559629789497
Epoch: 35, step: 347, loss: 0.3601790964603424, mean loss: 0.3455758832712514
Epoch: 35, step: 348, loss: 0.30111706256866455, mean loss: 0.3455750096282106
Epoch: 35, step: 349, loss: 0.32431021332740784, mean loss: 0.3455745917701579
Epoch: 35, step: 350, loss: 0.3178795874118805, mean loss: 0.34557404756775756
Epoch: 35, step: 351, loss: 0.32974666357040405, mean loss: 0.3455737365683078
Epoch: 35, step: 352, loss: 0.4158379137516022, mean loss: 0.3455751171938788
Epoch: 35, step: 353, loss: 0.3245556354522705, mean loss: 0.34557470418877523
Epoch: 35, step: 354, loss: 0.28717565536499023, mean loss: 0.3455735567470064
Epoch: 35, step: 355, loss: 0.34212151169776917, mean loss: 0.34557348892153783
Epoch: 35, step: 356, loss: 0.33170726895332336, mean loss: 0.3455732164846561
Epoch: 35, step: 357, loss: 0.35215699672698975, mean loss: 0.3455733458370912
Epoch: 35, step: 358, loss: 0.337424099445343, mean loss: 0.34557318573087314
Epoch: 35, step: 359, loss: 0.35198670625686646, mean loss: 0.345573311733241
Epoch: 35, step: 360, loss: 0.35248038172721863, mean loss: 0.34557344742939616
Epoch: 35, step: 361, loss: 0.3176933825016022, mean loss: 0.34557289970897404
Epoch: 35, step: 362, loss: 0.303431898355484, mean loss: 0.345572071840256
Epoch: 35, step: 363, loss: 0.3063957393169403, mean loss: 0.34557130222819166
Epoch: 35, step: 364, loss: 0.3494494557380676, mean loss: 0.345571378412329
Epoch: 35, step: 365, loss: 0.33019497990608215, mean loss: 0.3455710763575907
Epoch: 35, step: 366, loss: 0.3189516067504883, mean loss: 0.3455705534536756
Epoch: 35, step: 367, loss: 0.2789386510848999, mean loss: 0.345569244584689
Epoch: 35, step: 368, loss: 0.33482807874679565, mean loss: 0.34556903359712615
Epoch: 35, step: 369, loss: 0.3090816140174866, mean loss: 0.34556831689275413
Epoch: 35, step: 370, loss: 0.31508877873420715, mean loss: 0.34556771820999094
Epoch: 35, step: 371, loss: 0.3573299050331116, mean loss: 0.3455679492397447
Epoch: 35, step: 372, loss: 0.360016793012619, mean loss: 0.34556823303452744
Epoch: 35, step: 373, loss: 0.33250322937965393, mean loss: 0.34556797642527154
Epoch: 35, step: 374, loss: 0.32447630167007446, mean loss: 0.3455675621726003
Epoch: 35, step: 375, loss: 0.4311141073703766, mean loss: 0.3455692423231463
Epoch: 35, step: 376, loss: 0.38103240728378296, mean loss: 0.3455699388128248
Epoch: 35, step: 377, loss: 0.31215783953666687, mean loss: 0.34556928261856584
Epoch: 35, step: 378, loss: 0.3481498658657074, mean loss: 0.34556933329872935
Epoch: 35, step: 379, loss: 0.3596973419189453, mean loss: 0.3455696107537298
Epoch: 35, step: 380, loss: 0.3106333315372467, mean loss: 0.34556892466588357
Epoch: 35, step: 381, loss: 0.33398759365081787, mean loss: 0.3455686972331234
Epoch: 35, step: 382, loss: 0.313926637172699, mean loss: 0.3455680758624253
Epoch: 35, step: 383, loss: 0.31329241394996643, mean loss: 0.34556744206182216
Epoch: 35, step: 384, loss: 0.34284117817878723, mean loss: 0.3455673885269398
Epoch: 35, step: 385, loss: 0.34911778569221497, mean loss: 0.3455674582437282
Epoch: 35, step: 386, loss: 0.32437658309936523, mean loss: 0.3455670421407741
Epoch: 35, step: 387, loss: 0.3776136338710785, mean loss: 0.3455676713936749
Epoch: 35, step: 388, loss: 0.38459309935569763, mean loss: 0.3455684376649145
Epoch: 35, step: 389, loss: 0.3688715696334839, mean loss: 0.34556889521708356
Epoch: 35, step: 390, loss: 0.37741410732269287, mean loss: 0.34556952047894973
Epoch: 35, step: 391, loss: 0.3104710876941681, mean loss: 0.3455688313555541
Epoch: 35, step: 392, loss: 0.30721813440322876, mean loss: 0.34556807839191656
Epoch: 35, step: 393, loss: 0.3110572397708893, mean loss: 0.345567400831964
Epoch: 35, step: 394, loss: 0.35148710012435913, mean loss: 0.34556751705262356
Epoch: 35, step: 395, loss: 0.37656375765800476, mean loss: 0.34556812558569655
Epoch: 35, step: 396, loss: 0.32688507437705994, mean loss: 0.3455677587982688
Epoch: 35, step: 397, loss: 0.32485201954841614, mean loss: 0.3455673521129013
Epoch: 35, step: 398, loss: 0.3331998884677887, mean loss: 0.34556710932321866
Epoch: 35, step: 399, loss: 0.3447309732437134, mean loss: 0.34556709290908283
Epoch: 35, step: 400, loss: 0.35387158393859863, mean loss: 0.34556725593083404
Epoch: 35, step: 401, loss: 0.33522602915763855, mean loss: 0.34556705293081885
Epoch: 35, step: 402, loss: 0.34325870871543884, mean loss: 0.34556700761852444
Epoch: 35, step: 403, loss: 0.35314664244651794, mean loss: 0.3455671564021855
Epoch: 35, step: 404, loss: 0.33884844183921814, mean loss: 0.34556702452045884
Epoch: 35, step: 405, loss: 0.29686594009399414, mean loss: 0.3455660685850679
Epoch: 35, step: 406, loss: 0.30644288659095764, mean loss: 0.3455653006658186
Epoch: 35, step: 407, loss: 0.3482602834701538, mean loss: 0.3455653535625526
Epoch: 35, step: 408, loss: 0.36470627784729004, mean loss: 0.3455657292504814
Epoch: 35, step: 409, loss: 0.3477840721607208, mean loss: 0.3455657727900871
Epoch: 35, step: 410, loss: 0.28284579515457153, mean loss: 0.34556454180389184
Epoch: 35, step: 411, loss: 0.33306798338890076, mean loss: 0.3455642965425004
Epoch: 35, step: 412, loss: 0.34814417362213135, mean loss: 0.34556434717498685
Epoch: 35, step: 413, loss: 0.3149130344390869, mean loss: 0.34556374562628145
Epoch: 35, step: 414, loss: 0.344197154045105, mean loss: 0.3455637188067038
Epoch: 35, step: 415, loss: 0.3366466164588928, mean loss: 0.3455635438105827
Epoch: 35, step: 416, loss: 0.34501975774765015, mean loss: 0.34556353313911337
Epoch: 35, step: 417, loss: 0.3720034062862396, mean loss: 0.34556405199529194
Epoch: 35, step: 418, loss: 0.3719233572483063, mean loss: 0.34556456926025503
Epoch: 35, step: 419, loss: 0.32749053835868835, mean loss: 0.34556421458931896
Epoch: 35, step: 420, loss: 0.3161657452583313, mean loss: 0.345563637707599
Epoch: 35, step: 421, loss: 0.31393811106681824, mean loss: 0.34556301713684745
Epoch: 35, step: 422, loss: 0.3679966628551483, mean loss: 0.3455634573316107
Epoch: 35, step: 423, loss: 0.2881512939929962, mean loss: 0.34556233080772447
Epoch: 35, step: 424, loss: 0.33965441584587097, mean loss: 0.34556221488670097
Epoch: 35, step: 425, loss: 0.32157960534095764, mean loss: 0.34556174432574766
Epoch: 35, step: 426, loss: 0.3307447135448456, mean loss: 0.34556145360762064
Epoch: 35, step: 427, loss: 0.3038601279258728, mean loss: 0.3455606354211962
Epoch: 35, step: 428, loss: 0.2853909432888031, mean loss: 0.345559454905743
Epoch: 35, step: 429, loss: 0.3092546761035919, mean loss: 0.34555874262834846
Epoch: 35, step: 430, loss: 0.35651856660842896, mean loss: 0.3455589576491246
Epoch: 35, step: 431, loss: 0.34368082880973816, mean loss: 0.34555892080283956
Epoch: 35, step: 432, loss: 0.29433149099349976, mean loss: 0.34555791581137724
Epoch: 35, step: 433, loss: 0.345064640045166, mean loss: 0.34555790613437
Epoch: 35, step: 434, loss: 0.33008134365081787, mean loss: 0.3455576025235317
Epoch: 35, step: 435, loss: 0.3305409848690033, mean loss: 0.34555730794142137
Epoch: 35, step: 436, loss: 0.3448156416416168, mean loss: 0.34555729339238356
Epoch: 35, step: 437, loss: 0.3313165605068207, mean loss: 0.3455570140418228
Epoch: 35, step: 438, loss: 0.3150902986526489, mean loss: 0.3455564164091625
Epoch: 35, step: 439, loss: 0.32219964265823364, mean loss: 0.34555595825353774
Epoch: 35, step: 440, loss: 0.33769914507865906, mean loss: 0.345555804140963
Epoch: 35, step: 441, loss: 0.32655784487724304, mean loss: 0.3455554315004376
Epoch: 35, step: 442, loss: 0.3749831020832062, mean loss: 0.3455560087059881
Epoch: 35, step: 443, loss: 0.3493082821369171, mean loss: 0.3455560823030662
Epoch: 35, step: 444, loss: 0.32294008135795593, mean loss: 0.34555563872160217
Epoch: 35, step: 445, loss: 0.3478524088859558, mean loss: 0.3455556837686771
Epoch: 35, step: 446, loss: 0.32650503516197205, mean loss: 0.3455553101313067
Epoch: 35, step: 447, loss: 0.3006851375102997, mean loss: 0.3455544301169382
Epoch: 35, step: 448, loss: 0.3760230839252472, mean loss: 0.34555502767040674
Epoch: 35, step: 449, loss: 0.36730456352233887, mean loss: 0.34555545421553036
Epoch: 35, step: 450, loss: 0.3389696478843689, mean loss: 0.3455553250592806
Epoch: 35, step: 451, loss: 0.32516714930534363, mean loss: 0.34555492522841
Epoch: 35, step: 452, loss: 0.34923452138900757, mean loss: 0.34555499738725853
Epoch: 35, step: 453, loss: 0.3454205393791199, mean loss: 0.3455549947505168
Epoch: 35, step: 454, loss: 0.41346627473831177, mean loss: 0.3455563264748033
Epoch: 35, step: 455, loss: 0.32392561435699463, mean loss: 0.3455559023099253
Epoch: 35, step: 456, loss: 0.34505394101142883, mean loss: 0.3455558924669679
Epoch: 35, step: 457, loss: 0.34689801931381226, mean loss: 0.3455559187842126
Epoch: 35, step: 458, loss: 0.3868635892868042, mean loss: 0.34555672875441795
Epoch: 35, step: 459, loss: 0.3402825891971588, mean loss: 0.3455566253399168
Epoch: 35, step: 460, loss: 0.2970191240310669, mean loss: 0.3455556736428656
Epoch: 35, step: 461, loss: 0.3035711944103241, mean loss: 0.3455548504500647
Epoch: 35, step: 462, loss: 0.37864166498184204, mean loss: 0.34555549917297373
Epoch: 35, step: 463, loss: 0.3408668339252472, mean loss: 0.34555540724557104
Epoch: 35, step: 464, loss: 0.3063165843486786, mean loss: 0.34555463793230967
Epoch: 35, step: 465, loss: 0.31240594387054443, mean loss: 0.34555398803437487
Epoch: 35, step: 466, loss: 0.3240508735179901, mean loss: 0.34555356646254126
Epoch: 35, step: 467, loss: 0.38422802090644836, mean loss: 0.34555432466624353
Epoch: 35, step: 468, loss: 0.34994444251060486, mean loss: 0.34555441073179755
Epoch: 35, step: 469, loss: 0.3042050302028656, mean loss: 0.34555360011857406
Epoch: 35, step: 470, loss: 0.37365585565567017, mean loss: 0.3455541510243696
Epoch: 35, step: 471, loss: 0.3176053762435913, mean loss: 0.34555360313809225
Epoch: 35, step: 472, loss: 0.3514668345451355, mean loss: 0.34555371905425886
Epoch: 35, step: 473, loss: 0.33284899592399597, mean loss: 0.3455534700104056
Epoch: 35, step: 474, loss: 0.3308872580528259, mean loss: 0.3455531825221775
Epoch: 35, step: 475, loss: 0.36665934324264526, mean loss: 0.3455535962386727
Epoch: 35, step: 476, loss: 0.3319726884365082, mean loss: 0.3455533300350974
Epoch: 35, step: 477, loss: 0.31479138135910034, mean loss: 0.34555272707244356
Epoch: 35, step: 478, loss: 0.330832302570343, mean loss: 0.34555243854415996
Epoch: 35, step: 479, loss: 0.34672635793685913, mean loss: 0.3455524615531641
Epoch: 35, step: 480, loss: 0.3060925602912903, mean loss: 0.34555168814807086
Epoch: 35, step: 481, loss: 0.3137003779411316, mean loss: 0.3455510638818679
Epoch: 35, step: 482, loss: 0.29982784390449524, mean loss: 0.34555016775227976
Epoch: 35, step: 483, loss: 0.29834967851638794, mean loss: 0.3455492426878153
Epoch: 35, step: 484, loss: 0.32107001543045044, mean loss: 0.3455487629381385
Epoch: 35, step: 485, loss: 0.3071044981479645, mean loss: 0.34554800951312403
Epoch: 35, step: 486, loss: 0.3647118806838989, mean loss: 0.34554838507647617
Epoch: 35, step: 487, loss: 0.3172193765640259, mean loss: 0.345547829910518
Epoch: 35, step: 488, loss: 0.33531975746154785, mean loss: 0.34554762947405154
Epoch: 35, step: 489, loss: 0.3009130656719208, mean loss: 0.3455467548010395
Epoch: 35, step: 490, loss: 0.3241851031780243, mean loss: 0.34554633619956937
Epoch: 35, step: 491, loss: 0.33182480931282043, mean loss: 0.3455460673187321
Epoch: 35, step: 492, loss: 0.3486241400241852, mean loss: 0.34554612763407133
Epoch: 35, step: 493, loss: 0.3650723993778229, mean loss: 0.3455465102470694
Epoch: 35, step: 494, loss: 0.31019216775894165, mean loss: 0.3455458175000823
Epoch: 35, step: 495, loss: 0.313368022441864, mean loss: 0.34554518700797754
Epoch: 35, step: 496, loss: 0.36676350235939026, mean loss: 0.34554560275175855
Epoch: 35, step: 497, loss: 0.298193097114563, mean loss: 0.34554467496254976
Epoch: 35, step: 498, loss: 0.3247651755809784, mean loss: 0.34554426783271996
Epoch: 35, step: 499, loss: 0.30789315700531006, mean loss: 0.3455435301542163
Epoch: 35, step: 500, loss: 0.3175354599952698, mean loss: 0.34554298141751133
Epoch: 35, step: 501, loss: 0.3381824493408203, mean loss: 0.3455428372121104
Epoch: 35, step: 502, loss: 0.3442797064781189, mean loss: 0.3455428124657057
Epoch: 35, step: 503, loss: 0.41992416977882385, mean loss: 0.34554426966649937
Epoch: 35, step: 504, loss: 0.3732377588748932, mean loss: 0.345544812197388
Epoch: 35, step: 505, loss: 0.3415648639202118, mean loss: 0.34554473422951043
Epoch: 35, step: 506, loss: 0.32481491565704346, mean loss: 0.345544328136722
Epoch: 35, step: 507, loss: 0.3439887464046478, mean loss: 0.3455442976637998
Epoch: 35, step: 508, loss: 0.30466383695602417, mean loss: 0.34554349685554286
Epoch: 35, step: 509, loss: 0.2983417510986328, mean loss: 0.34554257223760443
Epoch: 35, step: 510, loss: 0.31899595260620117, mean loss: 0.3455420522356528
Epoch: 35, step: 511, loss: 0.3629429042339325, mean loss: 0.34554239308130036
Epoch: 35, step: 512, loss: 0.32840052247047424, mean loss: 0.34554205731512383
Epoch: 35, step: 513, loss: 0.3313433825969696, mean loss: 0.3455417792042076
Epoch: 35, step: 514, loss: 0.33070796728134155, mean loss: 0.3455414886584839
Epoch: 35, step: 515, loss: 0.3244806230068207, mean loss: 0.3455410761532807
Epoch: 35, step: 516, loss: 0.3252198100090027, mean loss: 0.345540678141918
Epoch: 35, step: 517, loss: 0.33911165595054626, mean loss: 0.345540552225858
Epoch: 35, step: 518, loss: 0.3106635808944702, mean loss: 0.34553986915389556
Epoch: 35, step: 519, loss: 0.34352993965148926, mean loss: 0.34553982978982384
Epoch: 35, step: 520, loss: 0.3021996319293976, mean loss: 0.34553898099724517
Epoch: 35, step: 521, loss: 0.2952527105808258, mean loss: 0.34553799618916053
Epoch: 35, step: 522, loss: 0.32056137919425964, mean loss: 0.34553750705579594
Epoch: 35, step: 523, loss: 0.30084529519081116, mean loss: 0.345536631836231
Epoch: 35, step: 524, loss: 0.37650829553604126, mean loss: 0.34553723835074585
Epoch: 35, step: 525, loss: 0.34774690866470337, mean loss: 0.3455372816216172
Epoch: 35, step: 526, loss: 0.32489123940467834, mean loss: 0.3455368773283903
Epoch: 35, step: 527, loss: 0.2972410023212433, mean loss: 0.34553593161140495
Epoch: 35, step: 528, loss: 0.31717750430107117, mean loss: 0.34553537631509385
Epoch: 35, step: 529, loss: 0.34025925397872925, mean loss: 0.3455352730035149
Epoch: 35, step: 530, loss: 0.3361798822879791, mean loss: 0.34553508981950215
Epoch: 35, step: 531, loss: 0.31668639183044434, mean loss: 0.34553452495621134
Epoch: 35, step: 532, loss: 0.336210161447525, mean loss: 0.345534342386879
Epoch: 35, step: 533, loss: 0.32239654660224915, mean loss: 0.345533889361939
Epoch: 35, step: 534, loss: 0.33063986897468567, mean loss: 0.34553359775116294
Epoch: 35, step: 535, loss: 0.3561626672744751, mean loss: 0.34553380585417653
Epoch: 35, step: 536, loss: 0.36188846826553345, mean loss: 0.3455341260503981
Epoch: 35, step: 537, loss: 0.32994765043258667, mean loss: 0.34553382089992984
Epoch: 35, step: 538, loss: 0.3017745316028595, mean loss: 0.3455329642016919
Epoch: 35, step: 539, loss: 0.3420582115650177, mean loss: 0.3455328961759942
Epoch: 35, step: 540, loss: 0.3627370595932007, mean loss: 0.34553323297761157
Epoch: 35, step: 541, loss: 0.3569003939628601, mean loss: 0.34553345550533143
Epoch: 35, step: 542, loss: 0.3281177282333374, mean loss: 0.3455331145753298
Epoch: 35, step: 543, loss: 0.34193235635757446, mean loss: 0.34553304408832375
Epoch: 35, step: 544, loss: 0.37842121720314026, mean loss: 0.34553368788147465
Epoch: 35, step: 545, loss: 0.37869584560394287, mean loss: 0.3455343370252268
Epoch: 35, step: 546, loss: 0.3114885985851288, mean loss: 0.34553367059857343
Epoch: 35, step: 547, loss: 0.3549371361732483, mean loss: 0.3455338546626506
Epoch: 35, step: 548, loss: 0.2801628112792969, mean loss: 0.3455325751104303
Epoch: 35, step: 549, loss: 0.3156091272830963, mean loss: 0.3455319894097486
Epoch: 35, step: 550, loss: 0.3516174554824829, mean loss: 0.3455321085200826
Epoch: 35, step: 551, loss: 0.32264721393585205, mean loss: 0.34553166060466367
Epoch: 35, step: 552, loss: 0.31822946667671204, mean loss: 0.3455311262419539
Epoch: 35, step: 553, loss: 0.3473226726055145, mean loss: 0.34553116130568673
Epoch: 35, step: 554, loss: 0.37142422795295715, mean loss: 0.3455316680689052
Epoch: 35, step: 555, loss: 0.35787174105644226, mean loss: 0.345531909576518
Epoch: 35, step: 556, loss: 0.299599289894104, mean loss: 0.34553101064664576
Epoch: 35, step: 557, loss: 0.3194546699523926, mean loss: 0.3455305003264631
Epoch: 35, step: 558, loss: 0.3455629050731659, mean loss: 0.34553050096061927
Epoch: 35, step: 559, loss: 0.3528132438659668, mean loss: 0.3455306434800499
Epoch: 35, step: 560, loss: 0.3435775339603424, mean loss: 0.34553060525947654
Epoch: 35, step: 561, loss: 0.3738781809806824, mean loss: 0.34553115998484385
Epoch: 35, step: 562, loss: 0.32243192195892334, mean loss: 0.34553070797149776
Epoch: 35, step: 563, loss: 0.353763610124588, mean loss: 0.3455308690724322
Epoch: 35, step: 564, loss: 0.35560154914855957, mean loss: 0.3455310661310385
Epoch: 35, step: 565, loss: 0.3138143718242645, mean loss: 0.3455304455249589
Epoch: 35, step: 566, loss: 0.3482942581176758, mean loss: 0.3455304996039029
Epoch: 35, step: 567, loss: 0.3366527259349823, mean loss: 0.34553032589775773
Epoch: 35, step: 568, loss: 0.3619406521320343, mean loss: 0.34553064698262015
Epoch: 35, step: 569, loss: 0.2988418638706207, mean loss: 0.34552973348657023
Epoch: 35, step: 570, loss: 0.3537106513977051, mean loss: 0.34552989354835556
Epoch: 35, step: 571, loss: 0.3280598819255829, mean loss: 0.34552955174972466
Epoch: 35, step: 572, loss: 0.33406180143356323, mean loss: 0.34552932738898834
Epoch: 35, step: 573, loss: 0.31197136640548706, mean loss: 0.34552867085729483
Epoch: 35, step: 574, loss: 0.34363314509391785, mean loss: 0.34552863377374277
Epoch: 35, step: 575, loss: 0.336946964263916, mean loss: 0.3455284658875719
Epoch: 35, step: 576, loss: 0.3062592148780823, mean loss: 0.34552769766465175
Epoch: 35, step: 577, loss: 0.3444744944572449, mean loss: 0.345527677061279
Epoch: 35, step: 578, loss: 0.36683785915374756, mean loss: 0.3455280939352807
Epoch: 35, step: 579, loss: 0.299390584230423, mean loss: 0.3455271914018358
Epoch: 35, step: 580, loss: 0.3231898248195648, mean loss: 0.34552675445094316
Epoch: 35, step: 581, loss: 0.3251434564590454, mean loss: 0.3455263557322312
Epoch: 35, step: 582, loss: 0.34901759028434753, mean loss: 0.3455264240231091
Epoch: 35, step: 583, loss: 0.3602655231952667, mean loss: 0.3455267123240866
Epoch: 35, step: 584, loss: 0.33928927779197693, mean loss: 0.34552659032047717
Epoch: 35, step: 585, loss: 0.3370403051376343, mean loss: 0.34552642433281566
Epoch: 35, step: 586, loss: 0.3311316668987274, mean loss: 0.3455261427837822
Epoch: 35, step: 587, loss: 0.33311015367507935, mean loss: 0.3455258999424993
Epoch: 35, step: 588, loss: 0.30648890137672424, mean loss: 0.34552513644236116
Epoch: 35, step: 589, loss: 0.37371447682380676, mean loss: 0.34552568776918263
Epoch: 35, step: 590, loss: 0.3397643268108368, mean loss: 0.3455255750907496
Epoch: 35, step: 591, loss: 0.33083969354629517, mean loss: 0.34552528787566816
Epoch: 35, step: 592, loss: 0.3532305359840393, mean loss: 0.34552543856598766
Epoch: 35, step: 593, loss: 0.3233930766582489, mean loss: 0.3455250057353484
Epoch: 35, step: 594, loss: 0.32377660274505615, mean loss: 0.34552458042190376
Epoch: 35, step: 595, loss: 0.35891667008399963, mean loss: 0.3455248423135195
Epoch: 35, step: 596, loss: 0.3407653272151947, mean loss: 0.3455247492397158
Epoch: 35, step: 597, loss: 0.34995901584625244, mean loss: 0.34552483595148803
Epoch: 35, step: 598, loss: 0.34860914945602417, mean loss: 0.3455248962638427
Epoch: 35, step: 599, loss: 0.3326686918735504, mean loss: 0.3455246448715003
Epoch: 35, step: 600, loss: 0.3036884665489197, mean loss: 0.3455238268159613
Epoch: 35, step: 601, loss: 0.33790937066078186, mean loss: 0.34552367792745176
Epoch: 35, step: 602, loss: 0.3621700406074524, mean loss: 0.345524003414081
Epoch: 35, step: 603, loss: 0.31277912855148315, mean loss: 0.34552336316547194
Epoch: 35, step: 604, loss: 0.3174312710762024, mean loss: 0.345522813901769
Epoch: 35, step: 605, loss: 0.31652724742889404, mean loss: 0.34552224698419043
Epoch: 35, step: 606, loss: 0.34574997425079346, mean loss: 0.34552225143659754
Epoch: 35, step: 607, loss: 0.32718947529792786, mean loss: 0.3455218930105371
Epoch: 35, step: 608, loss: 0.3253321945667267, mean loss: 0.34552149828730805
Epoch: 35, step: 609, loss: 0.3480650782585144, mean loss: 0.3455215480151667
Epoch: 35, step: 610, loss: 0.31106284260749817, mean loss: 0.34552087434885703
Epoch: 35, step: 611, loss: 0.38735130429267883, mean loss: 0.3455216921160987
Epoch: 35, step: 612, loss: 0.31079578399658203, mean loss: 0.34552101325253015
Epoch: 35, step: 613, loss: 0.3341410160064697, mean loss: 0.34552079078708764
Epoch: 35, step: 614, loss: 0.3132227957248688, mean loss: 0.345520159411952
Epoch: 35, step: 615, loss: 0.34931236505508423, mean loss: 0.34552023354217415
Epoch: 35, step: 616, loss: 0.3431307375431061, mean loss: 0.3455201868331021
Epoch: 35, step: 617, loss: 0.325615257024765, mean loss: 0.3455197977457686
Epoch: 35, step: 618, loss: 0.32881999015808105, mean loss: 0.345519471316253
Epoch: 35, step: 619, loss: 0.3749760091304779, mean loss: 0.3455200470890797
Epoch: 35, step: 620, loss: 0.3654992878437042, mean loss: 0.3455204376060898
Epoch: 35, step: 621, loss: 0.3522235155105591, mean loss: 0.3455205686228191
Epoch: 35, step: 622, loss: 0.3453855514526367, mean loss: 0.34552056598385794
Epoch: 35, step: 623, loss: 0.32674485445022583, mean loss: 0.34552019901271547
Epoch: 35, step: 624, loss: 0.3004167377948761, mean loss: 0.3455193174831304
Epoch: 35, step: 625, loss: 0.30122050642967224, mean loss: 0.34551845169704093
Epoch: 35, step: 626, loss: 0.29985716938972473, mean loss: 0.34551755929994304
Epoch: 35, step: 627, loss: 0.3300311267375946, mean loss: 0.3455172566413955
Epoch: 35, step: 628, loss: 0.2997179329395294, mean loss: 0.34551636158142357
Epoch: 35, step: 629, loss: 0.30862492322921753, mean loss: 0.3455156406230817
Epoch: 35, step: 630, loss: 0.3272766172885895, mean loss: 0.34551528419027144
Epoch: 35, step: 631, loss: 0.35767465829849243, mean loss: 0.34551552180799416
Epoch: 35, step: 632, loss: 0.3398605287075043, mean loss: 0.3455154113006348
Epoch: 35, step: 633, loss: 0.3421456217765808, mean loss: 0.3455153454509939
Epoch: 35, step: 634, loss: 0.31886276602745056, mean loss: 0.34551482463849903
Epoch: 35, step: 635, loss: 0.3645464777946472, mean loss: 0.34551519652479645
Epoch: 35, step: 636, loss: 0.36438116431236267, mean loss: 0.3455155651663305
Epoch: 35, step: 637, loss: 0.33821138739585876, mean loss: 0.34551542244528294
Epoch: 35, step: 638, loss: 0.329619437456131, mean loss: 0.3455151118494333
Epoch: 35, step: 639, loss: 0.34414348006248474, mean loss: 0.34551508504928113
Epoch: 35, step: 640, loss: 0.3397963047027588, mean loss: 0.34551497331288783
Epoch: 35, step: 641, loss: 0.3516239821910858, mean loss: 0.3455150926714295
Epoch: 35, step: 642, loss: 0.29255712032318115, mean loss: 0.3455140579924863
Epoch: 35, step: 643, loss: 0.333087295293808, mean loss: 0.34551381520640667
Epoch: 35, step: 644, loss: 0.3038184940814972, mean loss: 0.3455130006060135
Epoch: 35, step: 645, loss: 0.3683176338672638, mean loss: 0.34551344613083007
Epoch: 35, step: 646, loss: 0.3406401574611664, mean loss: 0.34551335092523744
Epoch: 35, step: 647, loss: 0.3284558355808258, mean loss: 0.34551301769253945
Epoch: 35, step: 648, loss: 0.36490872502326965, mean loss: 0.3455133965963534
Epoch: 35, step: 649, loss: 0.316673219203949, mean loss: 0.34551283320160064
Epoch: 35, step: 650, loss: 0.2978345453739166, mean loss: 0.3455119018213223
Epoch: 35, step: 651, loss: 0.33659419417381287, mean loss: 0.3455117276201259
Epoch: 35, step: 652, loss: 0.31675487756729126, mean loss: 0.3455111658860987
Epoch: 35, step: 653, loss: 0.33026400208473206, mean loss: 0.3455108680550286
Epoch: 35, step: 654, loss: 0.3378072679042816, mean loss: 0.3455107175793933
Epoch: 35, step: 655, loss: 0.3492228090763092, mean loss: 0.345510790086845
Epoch: 35, step: 656, loss: 0.320023775100708, mean loss: 0.34551029226441426
Epoch: 35, step: 657, loss: 0.3632639944553375, mean loss: 0.3455106390299557
Epoch: 35, step: 658, loss: 0.32659292221069336, mean loss: 0.3455102695360824
Epoch: 35, step: 659, loss: 0.31026995182037354, mean loss: 0.345509581248627
Epoch: 35, step: 660, loss: 0.33057743310928345, mean loss: 0.34550928961080474
Epoch: 35, step: 661, loss: 0.32462945580482483, mean loss: 0.34550888181748013
Epoch: 35, step: 662, loss: 0.34715962409973145, mean loss: 0.3455089140566513
Epoch: 35, step: 663, loss: 0.38682031631469727, mean loss: 0.34550972085694537
Epoch: 35, step: 664, loss: 0.3683129549026489, mean loss: 0.34551016618912084
Epoch: 35, step: 665, loss: 0.3500179648399353, mean loss: 0.3455102542217469
Epoch: 35, step: 666, loss: 0.2954884171485901, mean loss: 0.34550927736629605
Epoch: 35, step: 667, loss: 0.33290815353393555, mean loss: 0.34550903128904575
Epoch: 35, step: 668, loss: 0.29839590191841125, mean loss: 0.3455081112724594
Epoch: 35, step: 669, loss: 0.38601016998291016, mean loss: 0.3455089021738207
Epoch: 35, step: 670, loss: 0.35311704874038696, mean loss: 0.3455090507385151
Epoch: 35, step: 671, loss: 0.33862438797950745, mean loss: 0.3455089163039537
Epoch: 35, step: 672, loss: 0.42242270708084106, mean loss: 0.34551041814510297
Epoch: 35, step: 673, loss: 0.3055848479270935, mean loss: 0.3455096385619769
Epoch: 35, step: 674, loss: 0.318074494600296, mean loss: 0.3455091028762606
Epoch: 35, step: 675, loss: 0.39990437030792236, mean loss: 0.34551016495192893
Epoch: 35, step: 676, loss: 0.33354130387306213, mean loss: 0.34550993126270313
Epoch: 35, step: 677, loss: 0.3081090450286865, mean loss: 0.34550920103336513
Epoch: 35, step: 678, loss: 0.3414887487888336, mean loss: 0.34550912253803634
Epoch: 35, step: 679, loss: 0.2902832329273224, mean loss: 0.3455080443285555
Epoch: 35, step: 680, loss: 0.3100518584251404, mean loss: 0.3455073521088428
Epoch: 35, step: 681, loss: 0.33845585584640503, mean loss: 0.34550721444345955
Epoch: 35, step: 682, loss: 0.3112848699092865, mean loss: 0.3455065463384182
Epoch: 35, step: 683, loss: 0.35717901587486267, mean loss: 0.34550677420952425
Epoch: 35, step: 684, loss: 0.32450488209724426, mean loss: 0.3455063642165108
Epoch: 35, step: 685, loss: 0.3226499557495117, mean loss: 0.3455059180288626
Epoch: 35, step: 686, loss: 0.33307206630706787, mean loss: 0.34550567530819337
Epoch: 35, step: 687, loss: 0.3825685977935791, mean loss: 0.3455063987977398
Epoch: 35, step: 688, loss: 0.3437034785747528, mean loss: 0.34550636360438797
Epoch: 35, step: 689, loss: 0.3428262770175934, mean loss: 0.3455063112896
Epoch: 35, step: 690, loss: 0.29344838857650757, mean loss: 0.34550529514853867
Epoch: 35, step: 691, loss: 0.3178066909313202, mean loss: 0.3455047544980816
Epoch: 35, step: 692, loss: 0.34495726227760315, mean loss: 0.3455047438117618
Epoch: 35, step: 693, loss: 0.3584197759628296, mean loss: 0.3455049958910871
Epoch: 35, step: 694, loss: 0.3578079044818878, mean loss: 0.34550523601812116
Epoch: 35, step: 695, loss: 0.33916160464286804, mean loss: 0.3455051122061262
Epoch: 35, step: 696, loss: 0.34500324726104736, mean loss: 0.34550510241115484
Epoch: 35, step: 697, loss: 0.37836629152297974, mean loss: 0.3455057437552571
Epoch: 35, step: 698, loss: 0.3491384983062744, mean loss: 0.3455058146534899
Epoch: 35, step: 699, loss: 0.3192863464355469, mean loss: 0.3455053029542663
Epoch: 35, step: 700, loss: 0.3446393311023712, mean loss: 0.34550528605428676
Epoch: 35, step: 701, loss: 0.36422649025917053, mean loss: 0.3455056514031062
Epoch: 35, step: 702, loss: 0.3406718373298645, mean loss: 0.34550555707189856
Epoch: 35, step: 703, loss: 0.34873414039611816, mean loss: 0.3455056200760224
Epoch: 35, step: 704, loss: 0.37371179461479187, mean loss: 0.345506170494103
Epoch: 35, step: 705, loss: 0.31723102927207947, mean loss: 0.3455056187409667
Epoch: 35, step: 706, loss: 0.2891317903995514, mean loss: 0.34550451869943566
Epoch: 35, step: 707, loss: 0.31048867106437683, mean loss: 0.3455038354367203
Epoch: 35, step: 708, loss: 0.35038065910339355, mean loss: 0.34550393059611206
Epoch: 35, step: 709, loss: 0.3314661383628845, mean loss: 0.34550365668797095
Epoch: 35, step: 710, loss: 0.3268190026283264, mean loss: 0.34550329211646874
Epoch: 35, step: 711, loss: 0.3517107665538788, mean loss: 0.34550341323319467
Epoch: 35, step: 712, loss: 0.3803596496582031, mean loss: 0.3455040933150713
Epoch: 35, step: 713, loss: 0.3115123212337494, mean loss: 0.34550343011274404
Epoch: 35, step: 714, loss: 0.3132723271846771, mean loss: 0.34550280127452476
Epoch: 35, step: 715, loss: 0.3224557936191559, mean loss: 0.3455023516294558
Epoch: 35, step: 716, loss: 0.3842073678970337, mean loss: 0.34550310674614754
Epoch: 35, step: 717, loss: 0.36324992775917053, mean loss: 0.345503452971537
Epoch: 35, step: 718, loss: 0.3155469298362732, mean loss: 0.34550286855664136
Epoch: 35, step: 719, loss: 0.32167237997055054, mean loss: 0.3455024036622093
Epoch: 35, step: 720, loss: 0.31455376744270325, mean loss: 0.3455017999159652
Epoch: 35, step: 721, loss: 0.3234265446662903, mean loss: 0.3455013692801092
Epoch: 35, step: 722, loss: 0.3230192959308624, mean loss: 0.34550093071675264
Epoch: 35, step: 723, loss: 0.3088794946670532, mean loss: 0.3455002163472916
Epoch: 35, step: 724, loss: 0.3374520242214203, mean loss: 0.34550005935534533
Epoch: 35, step: 725, loss: 0.31398385763168335, mean loss: 0.34549944459699233
Epoch: 35, step: 726, loss: 0.37312403321266174, mean loss: 0.3454999834346192
Epoch: 35, step: 727, loss: 0.32528597116470337, mean loss: 0.34549958915334683
Epoch: 35, step: 728, loss: 0.34773218631744385, mean loss: 0.34549963270007417
Epoch: 35, step: 729, loss: 0.3242388963699341, mean loss: 0.3454992180182655
Epoch: 35, step: 730, loss: 0.3383869230747223, mean loss: 0.34549907929862
Epoch: 35, step: 731, loss: 0.31384938955307007, mean loss: 0.3454984620086811
Epoch: 35, step: 732, loss: 0.32570526003837585, mean loss: 0.34549807597310744
Epoch: 35, step: 733, loss: 0.3369026184082031, mean loss: 0.3454979083353658
Epoch: 35, step: 734, loss: 0.32194191217422485, mean loss: 0.34549744893027245
Epoch: 35, step: 735, loss: 0.33750683069229126, mean loss: 0.34549729309482824
Epoch: 35, step: 736, loss: 0.36516073346138, mean loss: 0.34549767656968766
Epoch: 35, step: 737, loss: 0.30500975251197815, mean loss: 0.34549688699279196
Epoch: 35, step: 738, loss: 0.3050881028175354, mean loss: 0.3454960989746135
Epoch: 35, step: 739, loss: 0.2957156300544739, mean loss: 0.3454951282166392
Epoch: 35, step: 740, loss: 0.34573835134506226, mean loss: 0.34549513295958745
Epoch: 35, step: 741, loss: 0.3336959481239319, mean loss: 0.3454949028752531
Epoch: 35, step: 742, loss: 0.3067014813423157, mean loss: 0.3454941464175277
Epoch: 35, step: 743, loss: 0.3841336965560913, mean loss: 0.34549489986012455
Epoch: 35, step: 744, loss: 0.3852443993091583, mean loss: 0.34549567493079725
Epoch: 35, step: 745, loss: 0.32216259837150574, mean loss: 0.34549521997083626
Epoch: 35, step: 746, loss: 0.33331775665283203, mean loss: 0.3454949825332143
Epoch: 35, step: 747, loss: 0.36651015281677246, mean loss: 0.34549539228150405
Epoch: 35, step: 748, loss: 0.3551587164402008, mean loss: 0.34549558069079567
Epoch: 35, step: 749, loss: 0.3300950229167938, mean loss: 0.34549528042646005
Epoch: 35, step: 750, loss: 0.3562438189983368, mean loss: 0.345495489986394
Epoch: 35, step: 751, loss: 0.3483160138130188, mean loss: 0.34549554497594065
Epoch: 35, step: 752, loss: 0.32207927107810974, mean loss: 0.34549508845606663
Epoch: 35, step: 753, loss: 0.35486215353012085, mean loss: 0.34549527107128625
Epoch: 35, step: 754, loss: 0.33175498247146606, mean loss: 0.34549500320329524
Epoch: 35, step: 755, loss: 0.3358604609966278, mean loss: 0.34549481538080995
Epoch: 35, step: 756, loss: 0.3494628667831421, mean loss: 0.34549489273526346
Epoch: 35, step: 757, loss: 0.323602557182312, mean loss: 0.345494465967445
Epoch: 35, step: 758, loss: 0.35715124011039734, mean loss: 0.3454946931994406
Epoch: 35, step: 759, loss: 0.3138708770275116, mean loss: 0.34549407675078225
Epoch: 35, step: 760, loss: 0.32155174016952515, mean loss: 0.3454936100476657
Epoch: 35, step: 761, loss: 0.3263015151023865, mean loss: 0.3454932359473393
Epoch: 35, step: 762, loss: 0.3967911899089813, mean loss: 0.34549423584898176
Epoch: 35, step: 763, loss: 0.35200121998786926, mean loss: 0.3454943626808884
Epoch: 35, step: 764, loss: 0.29700616002082825, mean loss: 0.3454934175838674
Epoch: 35, step: 765, loss: 0.35379210114479065, mean loss: 0.3454935793326602
Epoch: 35, step: 766, loss: 0.33418700098991394, mean loss: 0.345493358961593
Epoch: 35, step: 767, loss: 0.3698458969593048, mean loss: 0.345493833595919
Epoch: 35, step: 768, loss: 0.3478730320930481, mean loss: 0.3454938799659223
Epoch: 35, step: 769, loss: 0.3744528889656067, mean loss: 0.34549444435900356
Epoch: 35, step: 770, loss: 0.3348645567893982, mean loss: 0.3454942371931411
Epoch: 35, step: 771, loss: 0.30365923047065735, mean loss: 0.345493421886649
Epoch: 35, step: 772, loss: 0.32291197776794434, mean loss: 0.3454929818140725
Epoch: 35, step: 773, loss: 0.3390668034553528, mean loss: 0.3454928565816143
Epoch: 35, step: 774, loss: 0.3227269649505615, mean loss: 0.3454924129317725
Epoch: 35, step: 775, loss: 0.3335806131362915, mean loss: 0.3454921808053442
Epoch: 35, step: 776, loss: 0.38608336448669434, mean loss: 0.345492971794367
Epoch: 35, step: 777, loss: 0.3402386009693146, mean loss: 0.34549286940591023
Epoch: 35, step: 778, loss: 0.33900532126426697, mean loss: 0.34549274298980426
Epoch: 35, step: 779, loss: 0.32613232731819153, mean loss: 0.3454923657408629
Epoch: 35, step: 780, loss: 0.30661019682884216, mean loss: 0.3454916081139867
Epoch: 35, step: 781, loss: 0.3060190975666046, mean loss: 0.3454908389991715
Epoch: 35, step: 782, loss: 0.3396575450897217, mean loss: 0.3454907253406965
Epoch: 35, step: 783, loss: 0.3271482586860657, mean loss: 0.3454903679549383
Epoch: 35, step: 784, loss: 0.32095199823379517, mean loss: 0.3454898898571357
Epoch: 35, step: 785, loss: 0.29822486639022827, mean loss: 0.34548896897837117
Epoch: 35, step: 786, loss: 0.3627249598503113, mean loss: 0.34548930478585793
Epoch: 35, step: 787, loss: 0.3229208290576935, mean loss: 0.34548886509454463
Epoch: 35, step: 788, loss: 0.3089980483055115, mean loss: 0.3454881541744646
Epoch: 35, step: 789, loss: 0.3554355502128601, mean loss: 0.3454883479674909
Epoch: 35, step: 790, loss: 0.32289236783981323, mean loss: 0.3454879077660507
Epoch: 35, step: 791, loss: 0.3196764588356018, mean loss: 0.34548740493255636
Epoch: 35, step: 792, loss: 0.32677191495895386, mean loss: 0.3454870403427219
Epoch: 35, step: 793, loss: 0.3677140474319458, mean loss: 0.34548747333074326
Epoch: 35, step: 794, loss: 0.2961999177932739, mean loss: 0.34548651321473006
Epoch: 35, step: 795, loss: 0.31830495595932007, mean loss: 0.34548598373138006
Epoch: 35, step: 796, loss: 0.34895139932632446, mean loss: 0.3454860512346544
Epoch: 35, step: 797, loss: 0.31672316789627075, mean loss: 0.3454854909696784
Epoch: 35, step: 798, loss: 0.3813091218471527, mean loss: 0.34548618875558923
Epoch: 35, step: 799, loss: 0.3496420979499817, mean loss: 0.3454862697043464
Epoch: 35, step: 800, loss: 0.3266734182834625, mean loss: 0.3454859032749543
Epoch: 35, step: 801, loss: 0.31666091084480286, mean loss: 0.34548534184391483
Epoch: 35, step: 802, loss: 0.3857700526714325, mean loss: 0.3454861264632559
Epoch: 35, step: 803, loss: 0.333604097366333, mean loss: 0.34548589504324384
Epoch: 35, step: 804, loss: 0.2984071373939514, mean loss: 0.345484978132977
Epoch: 35, step: 805, loss: 0.31715232133865356, mean loss: 0.3454844263342625
Epoch: 35, step: 806, loss: 0.35044237971305847, mean loss: 0.34548452289206294
Epoch: 35, step: 807, loss: 0.3613870143890381, mean loss: 0.34548483259237256
Epoch: 35, step: 808, loss: 0.3030615746974945, mean loss: 0.345484006417415
Epoch: 35, step: 809, loss: 0.3110480010509491, mean loss: 0.3454833358038733
Epoch: 35, step: 810, loss: 0.34879282116889954, mean loss: 0.34548340025218716
Epoch: 35, step: 811, loss: 0.2905377149581909, mean loss: 0.34548233027077857
Epoch: 35, step: 812, loss: 0.3049447536468506, mean loss: 0.3454815408801563
Epoch: 35, step: 813, loss: 0.3203640282154083, mean loss: 0.34548105177487404
Epoch: 35, step: 814, loss: 0.314814954996109, mean loss: 0.3454804546354177
Epoch: 35, step: 815, loss: 0.32855528593063354, mean loss: 0.3454801250698615
Epoch: 35, step: 816, loss: 0.35325703024864197, mean loss: 0.34548027649819996
Epoch: 35, step: 817, loss: 0.32739466428756714, mean loss: 0.3454799243502929
Epoch: 35, step: 818, loss: 0.3441338539123535, mean loss: 0.345479898141246
Epoch: 35, step: 819, loss: 0.29567837715148926, mean loss: 0.3454789284854635
Epoch: 35, step: 820, loss: 0.3435586392879486, mean loss: 0.3454788910973831
Epoch: 35, step: 821, loss: 0.34127089381217957, mean loss: 0.3454788091691621
Epoch: 35, step: 822, loss: 0.38771265745162964, mean loss: 0.3454796314312629
Epoch: 35, step: 823, loss: 0.36068975925445557, mean loss: 0.34547992755554885
Epoch: 35, step: 824, loss: 0.3115125596523285, mean loss: 0.3454792662615178
Epoch: 35, step: 825, loss: 0.29240310192108154, mean loss: 0.345478232967815
Epoch: 35, step: 826, loss: 0.32661402225494385, mean loss: 0.3454778657240454
Epoch: 35, step: 827, loss: 0.32872897386550903, mean loss: 0.3454775396671255
Epoch: 35, step: 828, loss: 0.31623575091362, mean loss: 0.3454769704174077
Epoch: 35, step: 829, loss: 0.30930474400520325, mean loss: 0.34547626626661126
Epoch: 35, step: 830, loss: 0.3193124532699585, mean loss: 0.3454757569556577
Epoch: 35, step: 831, loss: 0.33204400539398193, mean loss: 0.34547549549510403
Epoch: 35, step: 832, loss: 0.33109065890312195, mean loss: 0.3454752154873842
Epoch: 35, step: 833, loss: 0.3521251082420349, mean loss: 0.34547534492820553
Epoch: 35, step: 834, loss: 0.3572028875350952, mean loss: 0.34547557320154093
Epoch: 35, step: 835, loss: 0.34425419569015503, mean loss: 0.34547554942823216
Epoch: 35, step: 836, loss: 0.35856276750564575, mean loss: 0.3454758041573537
Epoch: 35, step: 837, loss: 0.37650197744369507, mean loss: 0.34547640803787233
Epoch: 35, step: 838, loss: 0.3479316830635071, mean loss: 0.34547645582539305
Epoch: 35, step: 839, loss: 0.32361507415771484, mean loss: 0.3454760303411255
Epoch: 35, step: 840, loss: 0.3087664544582367, mean loss: 0.34547531588294283
Epoch: 35, step: 841, loss: 0.3381209969520569, mean loss: 0.3454751727526846
Epoch: 35, step: 842, loss: 0.3598482310771942, mean loss: 0.3454754524766852
Epoch: 35, step: 843, loss: 0.34508633613586426, mean loss: 0.34547544490397114
Epoch: 35, step: 844, loss: 0.39085784554481506, mean loss: 0.3454763280877921
Epoch: 35, step: 845, loss: 0.33265334367752075, mean loss: 0.3454760785454185
Epoch: 35, step: 846, loss: 0.304523766040802, mean loss: 0.3454752816062607
Epoch: 35, step: 847, loss: 0.31862637400627136, mean loss: 0.3454747591319943
Epoch: 35, step: 848, loss: 0.32604217529296875, mean loss: 0.34547438098523453
Epoch: 35, step: 849, loss: 0.3555135130882263, mean loss: 0.3454745763370949
Epoch: 35, step: 850, loss: 0.4144940972328186, mean loss: 0.3454759193644906
Epoch: 35, step: 851, loss: 0.3317740559577942, mean loss: 0.34547565274977615
Epoch: 35, step: 852, loss: 0.37339547276496887, mean loss: 0.34547619601092094
Epoch: 35, step: 853, loss: 0.34268635511398315, mean loss: 0.3454761417275241
Epoch: 35, step: 854, loss: 0.33461666107177734, mean loss: 0.34547593043302743
Epoch: 35, step: 855, loss: 0.3242284655570984, mean loss: 0.34547551702605267
Epoch: 35, step: 856, loss: 0.33708450198173523, mean loss: 0.345475353767204
Epoch: 35, step: 857, loss: 0.304440438747406, mean loss: 0.34547455539148864
Epoch: 35, step: 858, loss: 0.31516462564468384, mean loss: 0.34547396569266675
Epoch: 35, step: 859, loss: 0.3248075842857361, mean loss: 0.3454735636229896
Epoch: 35, step: 860, loss: 0.3197614550590515, mean loss: 0.34547306339714645
Epoch: 35, step: 861, loss: 0.4011419415473938, mean loss: 0.34547414640711005
Epoch: 35, step: 862, loss: 0.31985971331596375, mean loss: 0.3454736481009199
Epoch: 35, step: 863, loss: 0.39030349254608154, mean loss: 0.34547452020901354
Epoch: 35, step: 864, loss: 0.3288640081882477, mean loss: 0.345474197078734
Epoch: 35, step: 865, loss: 0.3420422673225403, mean loss: 0.34547413031746577
Epoch: 35, step: 866, loss: 0.34261763095855713, mean loss: 0.3454740747511157
Epoch: 35, step: 867, loss: 0.3709813058376312, mean loss: 0.34547457092352246
Epoch: 35, step: 868, loss: 0.319404274225235, mean loss: 0.3454740638081011
Epoch: 35, step: 869, loss: 0.2936501204967499, mean loss: 0.3454730557562958
Epoch: 35, step: 870, loss: 0.336393803358078, mean loss: 0.34547287915493813
Epoch: 35, step: 871, loss: 0.34223735332489014, mean loss: 0.3454728162216574
Epoch: 35, step: 872, loss: 0.31423869729042053, mean loss: 0.3454722087076253
Epoch: 35, step: 873, loss: 0.29929155111312866, mean loss: 0.34547131049590096
Epoch: 35, step: 874, loss: 0.3083381652832031, mean loss: 0.34547058827193494
Epoch: 35, step: 875, loss: 0.36401867866516113, mean loss: 0.34547094901743036
Epoch: 35, step: 876, loss: 0.33017903566360474, mean loss: 0.34547065160775353
Epoch: 35, step: 877, loss: 0.30741602182388306, mean loss: 0.3454699115044865
Epoch: 35, step: 878, loss: 0.35846272110939026, mean loss: 0.34547016418947857
Epoch: 35, step: 879, loss: 0.32306399941444397, mean loss: 0.3454697284414277
Epoch: 35, step: 880, loss: 0.3662274181842804, mean loss: 0.3454701321226035
Epoch: 35, step: 881, loss: 0.32235509157180786, mean loss: 0.3454696826060435
Epoch: 35, step: 882, loss: 0.36875253915786743, mean loss: 0.3454701353773044
Epoch: 35, step: 883, loss: 0.3254396915435791, mean loss: 0.3454697458618285
Epoch: 35, step: 884, loss: 0.2964364290237427, mean loss: 0.3454687923700086
Epoch: 35, step: 885, loss: 0.31463178992271423, mean loss: 0.34546819273164575
Epoch: 35, step: 886, loss: 0.39343124628067017, mean loss: 0.3454691253750733
Epoch: 35, step: 887, loss: 0.33349087834358215, mean loss: 0.3454688924621264
Epoch: 35, step: 888, loss: 0.3191126585006714, mean loss: 0.34546837998407004
Epoch: 35, step: 889, loss: 0.36122041940689087, mean loss: 0.34546868626521765
Epoch: 35, step: 890, loss: 0.3642532229423523, mean loss: 0.3454690515028502
Epoch: 35, step: 891, loss: 0.332614541053772, mean loss: 0.34546880157069804
Epoch: 35, step: 892, loss: 0.3430245518684387, mean loss: 0.34546875404771277
Epoch: 35, step: 893, loss: 0.30158311128616333, mean loss: 0.3454679008058346
Epoch: 35, step: 894, loss: 0.34519830346107483, mean loss: 0.3454678955643192
Epoch: 35, step: 895, loss: 0.3005881607532501, mean loss: 0.3454670230288419
Epoch: 35, step: 896, loss: 0.40595364570617676, mean loss: 0.34546819896489334
Epoch: 35, step: 897, loss: 0.3121008574962616, mean loss: 0.34546755027440246
Epoch: 35, step: 898, loss: 0.32077354192733765, mean loss: 0.34546707021047535
Epoch: 35, step: 899, loss: 0.2970234751701355, mean loss: 0.3454661284609606
Epoch: 35, step: 900, loss: 0.32503366470336914, mean loss: 0.3454657312590447
Epoch: 35, step: 901, loss: 0.35049277544021606, mean loss: 0.34546582898160955
Epoch: 35, step: 902, loss: 0.32416635751724243, mean loss: 0.3454654149413812
Epoch: 35, step: 903, loss: 0.32831448316574097, mean loss: 0.34546508155105826
Epoch: 35, step: 904, loss: 0.32957473397254944, mean loss: 0.34546477267074766
Epoch: 35, step: 905, loss: 0.3320571184158325, mean loss: 0.34546451205467926
Epoch: 35, step: 906, loss: 0.2964259386062622, mean loss: 0.3454635588684206
Epoch: 35, step: 907, loss: 0.33708125352859497, mean loss: 0.3454633959407006
Epoch: 35, step: 908, loss: 0.3089427947998047, mean loss: 0.3454626860998652
Epoch: 35, step: 909, loss: 0.33558472990989685, mean loss: 0.3454624941084912
Epoch: 35, step: 910, loss: 0.3454003930091858, mean loss: 0.3454624929014962
Epoch: 35, step: 911, loss: 0.31161192059516907, mean loss: 0.34546183499563626
Epoch: 35, step: 912, loss: 0.36358147859573364, mean loss: 0.345462187154764
Epoch: 35, step: 913, loss: 0.31241947412490845, mean loss: 0.3454615449750884
Epoch: 35, step: 914, loss: 0.30704569816589355, mean loss: 0.3454607983839542
Epoch: 35, step: 915, loss: 0.33852919936180115, mean loss: 0.34546066367470707
Epoch: 35, step: 916, loss: 0.35179442167282104, mean loss: 0.34546078676307207
Epoch: 35, step: 917, loss: 0.345114141702652, mean loss: 0.3454607800266062
Epoch: 35, step: 918, loss: 0.37664681673049927, mean loss: 0.34546138606319265
Epoch: 35, step: 919, loss: 0.3209244906902313, mean loss: 0.3454609092482806
Epoch: 35, step: 920, loss: 0.3474539518356323, mean loss: 0.34546094797746557
Epoch: 35, step: 921, loss: 0.3122055232524872, mean loss: 0.34546030176424564
Epoch: 35, step: 922, loss: 0.30458828806877136, mean loss: 0.3454595075623201
Epoch: 35, step: 923, loss: 0.3366117477416992, mean loss: 0.34545933564098047
Epoch: 35, step: 924, loss: 0.3269021213054657, mean loss: 0.3454589750616676
Epoch: 35, step: 925, loss: 0.32313400506973267, mean loss: 0.345458541280725
Epoch: 35, step: 926, loss: 0.3427112102508545, mean loss: 0.3454584879002865
Epoch: 35, step: 927, loss: 0.31248947978019714, mean loss: 0.34545784732734564
Epoch: 35, step: 928, loss: 0.34320685267448425, mean loss: 0.3454578035923857
Epoch: 35, step: 929, loss: 0.3462775647640228, mean loss: 0.3454578195193562
Epoch: 35, step: 930, loss: 0.3171338737010956, mean loss: 0.34545726922995407
Epoch: 35, step: 931, loss: 0.3054346442222595, mean loss: 0.3454564916688527
Epoch: 35, step: 932, loss: 0.30005893111228943, mean loss: 0.34545560970043127
Epoch: 35, step: 933, loss: 0.29860565066337585, mean loss: 0.3454546995329868
Epoch: 35, step: 934, loss: 0.33805906772613525, mean loss: 0.3454545558587409
Epoch: 35, step: 935, loss: 0.3047492802143097, mean loss: 0.34545376509652853
Epoch: 35, step: 936, loss: 0.303266704082489, mean loss: 0.34545294556429057
Epoch: 35, step: 937, loss: 0.31434622406959534, mean loss: 0.3454523412921453
Epoch: 35, step: 938, loss: 0.30799946188926697, mean loss: 0.34545161375510297
Epoch: 35, step: 939, loss: 0.2927701473236084, mean loss: 0.3454505904165942
Epoch: 35, step: 940, loss: 0.3458113968372345, mean loss: 0.3454505974251298
Epoch: 35, step: 941, loss: 0.31579166650772095, mean loss: 0.3454500213222022
Epoch: 35, step: 942, loss: 0.3154279291629791, mean loss: 0.3454494381764617
Epoch: 35, step: 943, loss: 0.3232473134994507, mean loss: 0.3454490069332662
Epoch: 35, step: 944, loss: 0.36703503131866455, mean loss: 0.3454494262014877
Epoch: 35, step: 945, loss: 0.31789547204971313, mean loss: 0.34544889102776766
Epoch: 35, step: 946, loss: 0.3864208459854126, mean loss: 0.3454496868005833
Epoch: 35, step: 947, loss: 0.37382665276527405, mean loss: 0.3454502379380515
Epoch: 35, step: 948, loss: 0.3051030933856964, mean loss: 0.34544945433097907
Epoch: 35, step: 949, loss: 0.34536582231521606, mean loss: 0.34544945270674104
Epoch: 35, step: 950, loss: 0.32602056860923767, mean loss: 0.34544907538091524
Epoch: 35, step: 951, loss: 0.3083404004573822, mean loss: 0.34544835471217206
Epoch: 35, step: 952, loss: 0.30548855662345886, mean loss: 0.3454475786882836
Epoch: 35, step: 953, loss: 0.3060406744480133, mean loss: 0.3454468134165191
Epoch: 35, step: 954, loss: 0.3526332378387451, mean loss: 0.34544695297229
Epoch: 35, step: 955, loss: 0.3214554786682129, mean loss: 0.3454464870822344
Epoch: 35, step: 956, loss: 0.331736296415329, mean loss: 0.3454462208494312
Epoch: 35, step: 957, loss: 0.34125837683677673, mean loss: 0.3454461395289137
Epoch: 35, step: 958, loss: 0.3291027843952179, mean loss: 0.34544582217604985
Epoch: 35, step: 959, loss: 0.32063159346580505, mean loss: 0.34544534034636615
Epoch: 35, step: 960, loss: 0.3388667404651642, mean loss: 0.345445212609043
Epoch: 35, step: 961, loss: 0.28177410364151, mean loss: 0.3454439763248411
Epoch: 35, step: 962, loss: 0.3310897648334503, mean loss: 0.34544369761852317
Epoch: 35, step: 963, loss: 0.3395998477935791, mean loss: 0.34544358415452375
Epoch: 35, step: 964, loss: 0.2917759418487549, mean loss: 0.3454425421655459
Epoch: 35, step: 965, loss: 0.30975374579429626, mean loss: 0.34544184925993543
Epoch: 35, step: 966, loss: 0.30922943353652954, mean loss: 0.34544114620179334
Epoch: 35, step: 967, loss: 0.37076905369758606, mean loss: 0.3454416379294375
Epoch: 35, step: 968, loss: 0.3438015878200531, mean loss: 0.3454416060893686
Epoch: 35, step: 969, loss: 0.38340336084365845, mean loss: 0.34544234306771754
Epoch: 35, step: 970, loss: 0.3137056827545166, mean loss: 0.3454417269534834
Epoch: 35, step: 971, loss: 0.3266569972038269, mean loss: 0.3454413622864204
Epoch: 35, step: 972, loss: 0.3241932690143585, mean loss: 0.34544094980620627
Epoch: 35, step: 973, loss: 0.3015460968017578, mean loss: 0.3454400977106011
Epoch: 35, step: 974, loss: 0.33454829454421997, mean loss: 0.3454398862808589
Epoch: 35, step: 975, loss: 0.31261134147644043, mean loss: 0.3454392490313674
Epoch: 35, step: 976, loss: 0.33577969670295715, mean loss: 0.34543906152913845
Epoch: 35, step: 977, loss: 0.3384082317352295, mean loss: 0.345438925055871
Epoch: 35, step: 978, loss: 0.358963280916214, mean loss: 0.34543918756787356
Epoch: 35, step: 979, loss: 0.33794811367988586, mean loss: 0.34543904216659466
Epoch: 35, step: 980, loss: 0.3404351770877838, mean loss: 0.34543894504376943
Epoch: 35, step: 981, loss: 0.3436877429485321, mean loss: 0.34543891105436497
Epoch: 35, step: 982, loss: 0.3106114864349365, mean loss: 0.34543823509557725
Epoch: 35, step: 983, loss: 0.3138132691383362, mean loss: 0.34543762130460687
Epoch: 35, step: 984, loss: 0.3801572918891907, mean loss: 0.34543829514586033
Epoch: 35, step: 985, loss: 0.2975348234176636, mean loss: 0.3454373654507214
Epoch: 35, step: 986, loss: 0.3319327235221863, mean loss: 0.34543710336207023
Epoch: 35, step: 987, loss: 0.3418218791484833, mean loss: 0.3454370332016873
Epoch: 35, step: 988, loss: 0.4022555947303772, mean loss: 0.3454381358538158
Epoch: 35, step: 989, loss: 0.33065682649612427, mean loss: 0.34543784900519636
Epoch: 35, step: 990, loss: 0.3318963348865509, mean loss: 0.34543758622135523
Epoch: 35, step: 991, loss: 0.3452819883823395, mean loss: 0.34543758320191414
Epoch: 35, step: 992, loss: 0.3601292073726654, mean loss: 0.3454378682934898
Epoch: 35, step: 993, loss: 0.3298322260379791, mean loss: 0.3454375654712316
Epoch: 35, step: 994, loss: 0.3468628525733948, mean loss: 0.3454375931279135
Epoch: 35, step: 995, loss: 0.3450649082660675, mean loss: 0.3454375858963693
Epoch: 35, step: 996, loss: 0.32365578413009644, mean loss: 0.3454371632524093
Epoch: 35, step: 997, loss: 0.3119634985923767, mean loss: 0.34543651375757717
Epoch: 35, step: 998, loss: 0.3218075633049011, mean loss: 0.34543605529019417
Epoch: 35, step: 999, loss: 0.34416133165359497, mean loss: 0.3454360305574888
Epoch: 35, step: 1000, loss: 0.33183959126472473, mean loss: 0.3454357667589732
Epoch: 35, step: 1001, loss: 0.32116231322288513, mean loss: 0.3454352958138501
Epoch: 35, step: 1002, loss: 0.33161982893943787, mean loss: 0.3454350277761558
Epoch: 35, step: 1003, loss: 0.3802776038646698, mean loss: 0.3454357037534973
Epoch: 35, step: 1004, loss: 0.3262690603733063, mean loss: 0.34543533191057596
Epoch: 35, step: 1005, loss: 0.3239666223526001, mean loss: 0.34543491541444515
Epoch: 35, step: 1006, loss: 0.30253440141677856, mean loss: 0.34543408315429425
Epoch: 35, step: 1007, loss: 0.38308992981910706, mean loss: 0.3454348136549279
Epoch: 35, step: 1008, loss: 0.3595142662525177, mean loss: 0.345435086782488
Epoch: 35, step: 1009, loss: 0.2971574664115906, mean loss: 0.34543415026220925
Epoch: 35, step: 1010, loss: 0.28803274035453796, mean loss: 0.34543303677440285
Epoch: 35, step: 1011, loss: 0.35050538182258606, mean loss: 0.34543313516719165
Epoch: 35, step: 1012, loss: 0.35550007224082947, mean loss: 0.3454333304407368
Epoch: 35, step: 1013, loss: 0.33317431807518005, mean loss: 0.3454330926509947
Epoch: 35, step: 1014, loss: 0.33329519629478455, mean loss: 0.3454328572151232
Epoch: 35, step: 1015, loss: 0.3212844729423523, mean loss: 0.3454323888237764
Epoch: 35, step: 1016, loss: 0.3515717387199402, mean loss: 0.34543250790265795
Epoch: 35, step: 1017, loss: 0.30440255999565125, mean loss: 0.34543171210088314
Epoch: 35, step: 1018, loss: 0.31122347712516785, mean loss: 0.3454310486234112
Epoch: 35, step: 1019, loss: 0.32068532705307007, mean loss: 0.34543056868311695
Epoch: 35, step: 1020, loss: 0.3150769770145416, mean loss: 0.34542997999027414
Epoch: 35, step: 1021, loss: 0.3163596987724304, mean loss: 0.345429416197535
Epoch: 35, step: 1022, loss: 0.36315691471099854, mean loss: 0.3454297600002329
Epoch: 35, step: 1023, loss: 0.34466445446014404, mean loss: 0.3454297451583754
Epoch: 35, step: 1024, loss: 0.3306197226047516, mean loss: 0.3454294579476209
Epoch: 35, step: 1025, loss: 0.31932491064071655, mean loss: 0.3454289517119752
Epoch: 35, step: 1026, loss: 0.34478577971458435, mean loss: 0.34542893923942497
Epoch: 35, step: 1027, loss: 0.31971094012260437, mean loss: 0.3454284405193056
Epoch: 35, step: 1028, loss: 0.35185009241104126, mean loss: 0.34542856504473546
Epoch: 35, step: 1029, loss: 0.3097529411315918, mean loss: 0.3454278732544715
Epoch: 35, step: 1030, loss: 0.3354374170303345, mean loss: 0.3454276795321038
Epoch: 35, step: 1031, loss: 0.3206217288970947, mean loss: 0.34542719853562054
Epoch: 35, step: 1032, loss: 0.33179977536201477, mean loss: 0.34542693430000937
Epoch: 35, step: 1033, loss: 0.30932167172431946, mean loss: 0.3454262342328714
Epoch: 35, step: 1034, loss: 0.3859652876853943, mean loss: 0.34542702025426647
Epoch: 35, step: 1035, loss: 0.32122254371643066, mean loss: 0.345426550956986
Epoch: 35, step: 1036, loss: 0.32986557483673096, mean loss: 0.345426249253201
Epoch: 35, step: 1037, loss: 0.3339973986148834, mean loss: 0.3454260276693738
Epoch: 35, step: 1038, loss: 0.34174400568008423, mean loss: 0.345425956283306
Epoch: 35, step: 1039, loss: 0.30767592787742615, mean loss: 0.3454252244099364
Epoch: 35, step: 1040, loss: 0.3423589766025543, mean loss: 0.3454251649646405
Epoch: 35, step: 1041, loss: 0.3391309976577759, mean loss: 0.3454250429420879
Epoch: 35, step: 1042, loss: 0.3108603060245514, mean loss: 0.34542437286208255
Epoch: 35, step: 1043, loss: 0.3589283227920532, mean loss: 0.3454246346477124
Epoch: 35, step: 1044, loss: 0.3507753908634186, mean loss: 0.34542473837469145
Epoch: 35, step: 1045, loss: 0.29846563935279846, mean loss: 0.3454238280676504
Epoch: 35, step: 1046, loss: 0.3315391540527344, mean loss: 0.3454235589170114
Epoch: 35, step: 1047, loss: 0.327974796295166, mean loss: 0.3454232206840382
Epoch: 35, step: 1048, loss: 0.35920190811157227, mean loss: 0.3454234877698012
Epoch: 35, step: 1049, loss: 0.34422075748443604, mean loss: 0.34542346445655664
Epoch: 35, step: 1050, loss: 0.30837297439575195, mean loss: 0.3454227462985434
Epoch: 35, step: 1051, loss: 0.3283923864364624, mean loss: 0.34542241620163183
Epoch: 35, step: 1052, loss: 0.31516173481941223, mean loss: 0.3454218296747506
Epoch: 35, step: 1053, loss: 0.34813839197158813, mean loss: 0.34542188232742915
Epoch: 35, step: 1054, loss: 0.3294026553630829, mean loss: 0.3454215718472089
Epoch: 35, step: 1055, loss: 0.4150080978870392, mean loss: 0.34542292052784385
Epoch: 35, step: 1056, loss: 0.3251957297325134, mean loss: 0.3454225285052302
Epoch: 35, step: 1057, loss: 0.33907362818717957, mean loss: 0.34542240545975716
Epoch: 35, step: 1058, loss: 0.3887713849544525, mean loss: 0.3454232455725403
Epoch: 35, step: 1059, loss: 0.3344387114048004, mean loss: 0.3454230326939711
Epoch: 35, step: 1060, loss: 0.3166019320487976, mean loss: 0.34542247415633337
Epoch: 35, step: 1061, loss: 0.306010365486145, mean loss: 0.3454217103853813
Epoch: 35, step: 1062, loss: 0.3773598372936249, mean loss: 0.3454223293053454
Epoch: 35, step: 1063, loss: 0.31001463532447815, mean loss: 0.34542164316291496
Epoch: 35, step: 1064, loss: 0.33176541328430176, mean loss: 0.3454213785329396
Epoch: 35, step: 1065, loss: 0.2741449773311615, mean loss: 0.3454199973679355
Epoch: 35, step: 1066, loss: 0.3332344889640808, mean loss: 0.3454197612467038
Epoch: 35, step: 1067, loss: 0.3083671033382416, mean loss: 0.3454190432832503
Epoch: 35, step: 1068, loss: 0.31801262497901917, mean loss: 0.34541851224373576
Epoch: 35, step: 1069, loss: 0.362972229719162, mean loss: 0.3454188523661437
Epoch: 35, step: 1070, loss: 0.32678312063217163, mean loss: 0.34541849128552654
Epoch: 35, step: 1071, loss: 0.27738097310066223, mean loss: 0.3454171730355423
Epoch: 35, step: 1072, loss: 0.351441890001297, mean loss: 0.34541728976421465
Epoch: 35, step: 1073, loss: 0.30066922307014465, mean loss: 0.34541642278884566
Epoch: 35, step: 1074, loss: 0.3417551517486572, mean loss: 0.34541635185460096
Epoch: 35, step: 1075, loss: 0.3509122133255005, mean loss: 0.3454164583305284
Epoch: 35, step: 1076, loss: 0.355984628200531, mean loss: 0.34541666307256824
Epoch: 35, step: 1077, loss: 0.3124006986618042, mean loss: 0.34541602345142036
Epoch: 35, step: 1078, loss: 0.3195522129535675, mean loss: 0.34541552239927875
Epoch: 35, step: 1079, loss: 0.31764698028564453, mean loss: 0.34541498445774227
Epoch: 35, step: 1080, loss: 0.33598074316978455, mean loss: 0.34541480169798777
Epoch: 35, step: 1081, loss: 0.33754438161849976, mean loss: 0.3454146492354703
Epoch: 35, step: 1082, loss: 0.3166889548301697, mean loss: 0.345414092783997
Epoch: 35, step: 1083, loss: 0.3071558177471161, mean loss: 0.3454133516892535
Epoch: 35, step: 1084, loss: 0.3148198127746582, mean loss: 0.34541275907833024
Epoch: 35, step: 1085, loss: 0.32624125480651855, mean loss: 0.345412387724666
Epoch: 35, step: 1086, loss: 0.30970609188079834, mean loss: 0.3454116961040829
Epoch: 35, step: 1087, loss: 0.360877126455307, mean loss: 0.3454119956591761
Epoch: 35, step: 1088, loss: 0.3352728486061096, mean loss: 0.3454117992744494
Epoch: 35, step: 1089, loss: 0.30243679881095886, mean loss: 0.3454109669095363
Epoch: 35, step: 1090, loss: 0.33493417501449585, mean loss: 0.34541076399284104
Epoch: 35, step: 1091, loss: 0.3131820857524872, mean loss: 0.345410139793154
Epoch: 35, step: 1092, loss: 0.31454354524612427, mean loss: 0.34540954198565593
Epoch: 35, step: 1093, loss: 0.36615246534347534, mean loss: 0.34540994371558886
Epoch: 35, step: 1094, loss: 0.30365505814552307, mean loss: 0.3454091350608862
Epoch: 35, step: 1095, loss: 0.33911067247390747, mean loss: 0.3454090130827588
Epoch: 35, step: 1096, loss: 0.3172341287136078, mean loss: 0.34540846744911685
Epoch: 35, step: 1097, loss: 0.33234426379203796, mean loss: 0.34540821445319025
Epoch: 35, step: 1098, loss: 0.33623868227005005, mean loss: 0.34540803688328797
Epoch: 35, step: 1099, loss: 0.34218618273735046, mean loss: 0.345407974492619
Epoch: 35, step: 1100, loss: 0.3584156632423401, mean loss: 0.3454082263794676
Epoch: 35, step: 1101, loss: 0.3214803636074066, mean loss: 0.345407763038335
Epoch: 35, step: 1102, loss: 0.3556751310825348, mean loss: 0.3454079618526572
Epoch: 35, step: 1103, loss: 0.32973992824554443, mean loss: 0.34540765846729576
Epoch: 35, step: 1104, loss: 0.3367018699645996, mean loss: 0.3454074898974729
Epoch: 35, step: 1105, loss: 0.33589911460876465, mean loss: 0.3454073057907601
Epoch: 35, step: 1106, loss: 0.34072765707969666, mean loss: 0.34540721518242445
Epoch: 35, step: 1107, loss: 0.39983639121055603, mean loss: 0.3454082690310929
Epoch: 35, step: 1108, loss: 0.31419065594673157, mean loss: 0.3454076646125546
Epoch: 35, step: 1109, loss: 0.3504900634288788, mean loss: 0.34540776301330617
Epoch: 35, step: 1110, loss: 0.32293009757995605, mean loss: 0.34540732782975825
Epoch: 35, step: 1111, loss: 0.3109683394432068, mean loss: 0.34540666107942164
Epoch: 35, step: 1112, loss: 0.3523898422718048, mean loss: 0.3454067962735283
Epoch: 35, step: 1113, loss: 0.353485643863678, mean loss: 0.3454069526766644
Epoch: 35, step: 1114, loss: 0.35621005296707153, mean loss: 0.3454071618161531
Epoch: 35, step: 1115, loss: 0.345219224691391, mean loss: 0.34540715817790923
Epoch: 35, step: 1116, loss: 0.310404509305954, mean loss: 0.3454064805805096
Epoch: 35, step: 1117, loss: 0.34698790311813354, mean loss: 0.3454065111938229
Epoch: 35, step: 1118, loss: 0.3595420718193054, mean loss: 0.3454067848259223
Epoch: 35, step: 1119, loss: 0.36549338698387146, mean loss: 0.345407173649038
Epoch: 35, step: 1120, loss: 0.3527796268463135, mean loss: 0.3454073163573324
Epoch: 35, step: 1121, loss: 0.32454752922058105, mean loss: 0.3454069125830469
Epoch: 35, step: 1122, loss: 0.3322119414806366, mean loss: 0.3454066571783839
Epoch: 35, step: 1123, loss: 0.35369518399238586, mean loss: 0.3454068176097639
Epoch: 35, step: 1124, loss: 0.3239438831806183, mean loss: 0.34540640218472896
Epoch: 35, step: 1125, loss: 0.32245147228240967, mean loss: 0.34540595789003026
Epoch: 35, step: 1126, loss: 0.3285849094390869, mean loss: 0.345405632323451
Epoch: 35, step: 1127, loss: 0.33626094460487366, mean loss: 0.34540545533406264
Epoch: 35, step: 1128, loss: 0.3338233232498169, mean loss: 0.3454052311738876
Epoch: 35, step: 1129, loss: 0.32074204087257385, mean loss: 0.34540475385261216
Epoch: 35, step: 1130, loss: 0.3491232693195343, mean loss: 0.3454048258178435
Epoch: 35, step: 1131, loss: 0.3447735011577606, mean loss: 0.3454048135999177
Epoch: 35, step: 1132, loss: 0.32087719440460205, mean loss: 0.3454043389299896
Epoch: 35, step: 1133, loss: 0.32610782980918884, mean loss: 0.34540396550217056
Epoch: 35, step: 1134, loss: 0.30690619349479675, mean loss: 0.34540322050416367
Epoch: 35, step: 1135, loss: 0.3333279490470886, mean loss: 0.3454029868314441
Epoch: 35, step: 1136, loss: 0.32908934354782104, mean loss: 0.3454026711466465
Epoch: 35, step: 1137, loss: 0.33743005990982056, mean loss: 0.34540251687188284
Epoch: 35, step: 1138, loss: 0.3173273503780365, mean loss: 0.3454019736112452
Epoch: 35, step: 1139, loss: 0.33924514055252075, mean loss: 0.34540185447747856
Epoch: 35, step: 1140, loss: 0.35217076539993286, mean loss: 0.34540198545232276
Epoch: 35, step: 1141, loss: 0.3296842575073242, mean loss: 0.3454016813284896
Epoch: 35, step: 1142, loss: 0.2801777720451355, mean loss: 0.3454004193292
Epoch: 35, step: 1143, loss: 0.3343343436717987, mean loss: 0.34540020521892106
Epoch: 35, step: 1144, loss: 0.3265850841999054, mean loss: 0.34539984118446193
Epoch: 35, step: 1145, loss: 0.3079891502857208, mean loss: 0.3453991173774175
Epoch: 35, step: 1146, loss: 0.3163363039493561, mean loss: 0.34539855509263745
Epoch: 35, step: 1147, loss: 0.3208293318748474, mean loss: 0.3453980797555531
Epoch: 35, step: 1148, loss: 0.344396710395813, mean loss: 0.34539806038258475
Epoch: 35, step: 1149, loss: 0.2855257987976074, mean loss: 0.3453969020877195
Epoch: 35, step: 1150, loss: 0.3141975402832031, mean loss: 0.345396298513368
Epoch: 35, step: 1151, loss: 0.33888617157936096, mean loss: 0.3453961725726628
Epoch: 35, step: 1152, loss: 0.31809866428375244, mean loss: 0.3453956445029379
Epoch: 35, step: 1153, loss: 0.3555169701576233, mean loss: 0.34539584029598264
Epoch: 35, step: 1154, loss: 0.33904245495796204, mean loss: 0.34539571739463165
Epoch: 35, step: 1155, loss: 0.32965120673179626, mean loss: 0.34539541283507846
Epoch: 35, step: 1156, loss: 0.3278186023235321, mean loss: 0.34539507283835696
Epoch: 35, step: 1157, loss: 0.31338590383529663, mean loss: 0.3453944536815423
Epoch: 35, step: 1158, loss: 0.3487352430820465, mean loss: 0.3453945183015427
Epoch: 35, step: 1159, loss: 0.30402809381484985, mean loss: 0.345393718177278
Epoch: 35, step: 1160, loss: 0.30761662125587463, mean loss: 0.3453929874932115
Epoch: 35, step: 1161, loss: 0.31704404950141907, mean loss: 0.3453924391790652
Epoch: 35, step: 1162, loss: 0.32675620913505554, mean loss: 0.3453920787313147
Epoch: 35, step: 1163, loss: 0.3315986096858978, mean loss: 0.34539181195371443
Epoch: 35, step: 1164, loss: 0.31514519453048706, mean loss: 0.3453912269693334
Epoch: 35, step: 1165, loss: 0.3241308331489563, mean loss: 0.3453908157908663
Epoch: 35, step: 1166, loss: 0.34930121898651123, mean loss: 0.3453908914170522
Epoch: 35, step: 1167, loss: 0.2990282475948334, mean loss: 0.3453899947928582
Epoch: 35, step: 1168, loss: 0.3148382008075714, mean loss: 0.3453894039519217
Epoch: 35, step: 1169, loss: 0.3128848969936371, mean loss: 0.34538877535963863
Epoch: 35, step: 1170, loss: 0.32034268975257874, mean loss: 0.3453882910122927
Epoch: 35, step: 1171, loss: 0.34505757689476013, mean loss: 0.3453882846169856
Epoch: 35, step: 1172, loss: 0.3261461853981018, mean loss: 0.34538791252294315
Epoch: 35, step: 1173, loss: 0.3119569420814514, mean loss: 0.34538726606414205
Epoch: 35, step: 1174, loss: 0.3794384002685547, mean loss: 0.3453879245023941
Epoch: 35, step: 1175, loss: 0.3291528820991516, mean loss: 0.3453876105755165
Epoch: 35, step: 1176, loss: 0.3401561677455902, mean loss: 0.34538750942032903
Epoch: 35, step: 1177, loss: 0.307685524225235, mean loss: 0.3453867804287749
Epoch: 35, step: 1178, loss: 0.32504644989967346, mean loss: 0.3453863871433183
Epoch: 35, step: 1179, loss: 0.3711516857147217, mean loss: 0.34538688531227757
Epoch: 35, step: 1180, loss: 0.331215500831604, mean loss: 0.34538661131555515
Epoch: 35, step: 1181, loss: 0.32162603735923767, mean loss: 0.3453861519254705
Epoch: 35, step: 1182, loss: 0.2933940291404724, mean loss: 0.3453851467223155
Epoch: 35, step: 1183, loss: 0.3129046857357025, mean loss: 0.3453845187650619
Epoch: 35, step: 1184, loss: 0.3331753611564636, mean loss: 0.3453842827252821
Epoch: 35, step: 1185, loss: 0.32184240221977234, mean loss: 0.34538382759864356
Epoch: 35, step: 1186, loss: 0.3667134940624237, mean loss: 0.34538423994937845
Epoch: 35, step: 1187, loss: 0.32279202342033386, mean loss: 0.34538380319913625
Epoch: 35, step: 1188, loss: 0.3340538740158081, mean loss: 0.34538358417442705
Epoch: 35, step: 1189, loss: 0.3219153881072998, mean loss: 0.34538313050738534
Epoch: 35, step: 1190, loss: 0.32729610800743103, mean loss: 0.3453827808713354
Epoch: 35, step: 1191, loss: 0.3753751814365387, mean loss: 0.3453833606362887
Epoch: 35, step: 1192, loss: 0.3137694001197815, mean loss: 0.3453827495377536
Epoch: 35, step: 1193, loss: 0.35432225465774536, mean loss: 0.3453829223352392
Epoch: 35, step: 1194, loss: 0.30607467889785767, mean loss: 0.34538216253542403
Epoch: 35, step: 1195, loss: 0.34318506717681885, mean loss: 0.3453821200679863
Epoch: 35, step: 1196, loss: 0.3562512695789337, mean loss: 0.3453823301526358
Epoch: 35, step: 1197, loss: 0.36588579416275024, mean loss: 0.3453827264467332
Epoch: 35, step: 1198, loss: 0.35742756724357605, mean loss: 0.34538295924676404
Epoch: 35, step: 1199, loss: 0.33572709560394287, mean loss: 0.3453827726239646
Epoch: 35, step: 1200, loss: 0.3643854260444641, mean loss: 0.34538313988886904
Epoch: 35, step: 1201, loss: 0.33901461958885193, mean loss: 0.3453830168066476
Epoch: 35, step: 1202, loss: 0.3091413974761963, mean loss: 0.3453823163907589
Epoch: 35, step: 1203, loss: 0.33609437942504883, mean loss: 0.34538213689290476
Epoch: 35, step: 1204, loss: 0.34690922498703003, mean loss: 0.3453821664047048
Epoch: 35, step: 1205, loss: 0.33799636363983154, mean loss: 0.34538202367284604
Epoch: 35, step: 1206, loss: 0.32855644822120667, mean loss: 0.34538169852210393
Epoch: 35, step: 1207, loss: 0.31595680117607117, mean loss: 0.3453811299030782
Epoch: 35, step: 1208, loss: 0.3478657603263855, mean loss: 0.34538117791618805
Epoch: 35, step: 1209, loss: 0.363790899515152, mean loss: 0.3453815336596006
Epoch: 35, step: 1210, loss: 0.3323361873626709, mean loss: 0.3453812815804853
Epoch: 35, step: 1211, loss: 0.3162379264831543, mean loss: 0.34538071844562873
Epoch: 35, step: 1212, loss: 0.34228622913360596, mean loss: 0.3453806586522001
Epoch: 35, step: 1213, loss: 0.3307240605354309, mean loss: 0.34538037545480244
Epoch: 35, step: 1214, loss: 0.332547664642334, mean loss: 0.3453801275036709
Epoch: 35, step: 1215, loss: 0.3232576847076416, mean loss: 0.34537970006641155
Epoch: 35, step: 1216, loss: 0.3125167489051819, mean loss: 0.3453790651194254
Epoch: 35, step: 1217, loss: 0.3084591031074524, mean loss: 0.3453783518004793
Epoch: 35, step: 1218, loss: 0.3256540596485138, mean loss: 0.34537797072101195
Epoch: 35, step: 1219, loss: 0.32586538791656494, mean loss: 0.3453775937391185
Epoch: 35, step: 1220, loss: 0.33025214076042175, mean loss: 0.34537730152194773
Epoch: 35, step: 1221, loss: 0.3430701792240143, mean loss: 0.3453772569502098
Epoch: 35, step: 1222, loss: 0.3466097414493561, mean loss: 0.3453772807603541
Epoch: 35, step: 1223, loss: 0.32660600543022156, mean loss: 0.34537691812849936
Epoch: 35, step: 1224, loss: 0.3321138918399811, mean loss: 0.34537666191240185
Epoch: 35, step: 1225, loss: 0.3165886402130127, mean loss: 0.3453761057940674
Epoch: 35, step: 1226, loss: 0.3703951835632324, mean loss: 0.34537658909574165
Epoch: 35, step: 1227, loss: 0.4053533673286438, mean loss: 0.34537774766432133
Epoch: 35, step: 1228, loss: 0.3201817274093628, mean loss: 0.345377260963395
Epoch: 35, step: 1229, loss: 0.33030349016189575, mean loss: 0.3453769697953285
Epoch: 35, step: 1230, loss: 0.28068625926971436, mean loss: 0.3453757202403551
Epoch: 35, step: 1231, loss: 0.34733662009239197, mean loss: 0.345375758116038
Epoch: 35, step: 1232, loss: 0.3016897737979889, mean loss: 0.3453749143174496
Epoch: 35, step: 1233, loss: 0.2988474369049072, mean loss: 0.3453740156525326
Epoch: 35, step: 1234, loss: 0.33886927366256714, mean loss: 0.3453738900177284
Epoch: 35, step: 1235, loss: 0.3089805543422699, mean loss: 0.3453731871180128
Epoch: 35, step: 1236, loss: 0.32231763005256653, mean loss: 0.34537274183232486
Epoch: 35, step: 1237, loss: 0.34186652302742004, mean loss: 0.3453726741159433
Epoch: 35, step: 1238, loss: 0.3513075113296509, mean loss: 0.3453727887345573
Epoch: 35, step: 1239, loss: 0.3317919671535492, mean loss: 0.34537252645526834
Epoch: 35, step: 1240, loss: 0.3229198157787323, mean loss: 0.34537209284620946
Epoch: 35, step: 1241, loss: 0.3316531777381897, mean loss: 0.34537182791022575
Epoch: 35, step: 1242, loss: 0.3233442008495331, mean loss: 0.3453714025268555
Epoch: 35, step: 1243, loss: 0.33644527196884155, mean loss: 0.34537123015449034
Epoch: 35, step: 1244, loss: 0.31917640566825867, mean loss: 0.34537072431641974
Epoch: 35, step: 1245, loss: 0.3066007196903229, mean loss: 0.34536997565839195
Epoch: 35, step: 1246, loss: 0.3420839309692383, mean loss: 0.34536991220531127
Epoch: 35, step: 1247, loss: 0.31175315380096436, mean loss: 0.34536926308276544
Epoch: 35, step: 1248, loss: 0.31188321113586426, mean loss: 0.34536861649658024
Epoch: 35, step: 1249, loss: 0.3186171054840088, mean loss: 0.34536809995842593
Epoch: 35, step: 1250, loss: 0.3216727077960968, mean loss: 0.345367642438931
Epoch: 35, step: 1251, loss: 0.3757205605506897, mean loss: 0.3453682284931114
Epoch: 35, step: 1252, loss: 0.29761630296707153, mean loss: 0.34536730651667585
Epoch: 35, step: 1253, loss: 0.36008626222610474, mean loss: 0.3453675906993169
Epoch: 35, step: 1254, loss: 0.35963740944862366, mean loss: 0.3453678662050365
Epoch: 35, step: 1255, loss: 0.2983556389808655, mean loss: 0.3453669585629942
Epoch: 35, step: 1256, loss: 0.36043766140937805, mean loss: 0.3453672495200544
Epoch: 35, step: 1257, loss: 0.33171623945236206, mean loss: 0.34536698597686605
Epoch: 35, step: 1258, loss: 0.3438897430896759, mean loss: 0.345366957458113
Epoch: 35, step: 1259, loss: 0.34300869703292847, mean loss: 0.34536691193185
Epoch: 35, step: 1260, loss: 0.28016483783721924, mean loss: 0.34536565322885016
Epoch: 35, step: 1261, loss: 0.38188180327415466, mean loss: 0.3453663581466148
Epoch: 35, step: 1262, loss: 0.3217969238758087, mean loss: 0.34536590316458154
Epoch: 35, step: 1263, loss: 0.32405078411102295, mean loss: 0.34536549170756947
Epoch: 35, step: 1264, loss: 0.3132651746273041, mean loss: 0.3453648720701391
Epoch: 35, step: 1265, loss: 0.3286201059818268, mean loss: 0.3453645488495452
Epoch: 35, step: 1266, loss: 0.3063446581363678, mean loss: 0.34536379567158254
Epoch: 35, step: 1267, loss: 0.30073264241218567, mean loss: 0.34536293419935316
Epoch: 35, step: 1268, loss: 0.364690363407135, mean loss: 0.34536330725093123
Epoch: 35, step: 1269, loss: 0.35162174701690674, mean loss: 0.34536342804691206
Epoch: 35, step: 1270, loss: 0.329172819852829, mean loss: 0.345363115553268
Epoch: 35, step: 1271, loss: 0.31416648626327515, mean loss: 0.3453625134412227
Epoch: 35, step: 1272, loss: 0.34530723094940186, mean loss: 0.3453625123742609
Epoch: 35, step: 1273, loss: 0.31492358446121216, mean loss: 0.34536192490894435
Epoch: 35, step: 1274, loss: 0.35186612606048584, mean loss: 0.3453620504363235
Epoch: 35, step: 1275, loss: 0.2977178394794464, mean loss: 0.3453611309479231
Epoch: 35, step: 1276, loss: 0.33735236525535583, mean loss: 0.34536097638927066
Epoch: 35, step: 1277, loss: 0.3895432949066162, mean loss: 0.34536182903349694
Epoch: 35, step: 1278, loss: 0.29936572909355164, mean loss: 0.3453609414034782
Epoch: 35, step: 1279, loss: 0.33452168107032776, mean loss: 0.3453607322321094
Epoch: 35, step: 1280, loss: 0.346048504114151, mean loss: 0.3453607455041783
Epoch: 35, step: 1281, loss: 0.32648536562919617, mean loss: 0.34536038126929974
Epoch: 35, step: 1282, loss: 0.31774991750717163, mean loss: 0.3453598484853281
Epoch: 35, step: 1283, loss: 0.3610312044620514, mean loss: 0.3453601508810516
Epoch: 35, step: 1284, loss: 0.34178677201271057, mean loss: 0.34536008193018103
Epoch: 35, step: 1285, loss: 0.33286958932876587, mean loss: 0.3453598409219496
Epoch: 35, step: 1286, loss: 0.34291642904281616, mean loss: 0.34535979377641
Epoch: 35, step: 1287, loss: 0.37072163820266724, mean loss: 0.3453602831227947
Epoch: 35, step: 1288, loss: 0.3102952539920807, mean loss: 0.3453596065704952
Epoch: 35, step: 1289, loss: 0.33451685309410095, mean loss: 0.3453593973720874
Epoch: 35, step: 1290, loss: 0.32429102063179016, mean loss: 0.3453589908899292
Epoch: 35, step: 1291, loss: 0.29335692524909973, mean loss: 0.3453579876088357
Epoch: 35, step: 1292, loss: 0.3394455313682556, mean loss: 0.3453578735414222
Epoch: 35, step: 1293, loss: 0.3266012966632843, mean loss: 0.34535751168285683
Epoch: 35, step: 1294, loss: 0.35730621218681335, mean loss: 0.34535774219699794
Epoch: 35, step: 1295, loss: 0.29687637090682983, mean loss: 0.3453568069131934
Epoch: 35, step: 1296, loss: 0.33085933327674866, mean loss: 0.3453565272389523
Epoch: 35, step: 1297, loss: 0.309868723154068, mean loss: 0.3453558426484186
Epoch: 35, step: 1298, loss: 0.3121475279331207, mean loss: 0.3453552020435706
Epoch: 35, step: 1299, loss: 0.34215471148490906, mean loss: 0.3453551403057126
Epoch: 35, step: 1300, loss: 0.3654167354106903, mean loss: 0.345355527288894
Epoch: 35, step: 1301, loss: 0.3616674244403839, mean loss: 0.34535584193526475
Epoch: 35, step: 1302, loss: 0.33290499448776245, mean loss: 0.34535560177077873
Epoch: 35, step: 1303, loss: 0.3358231484889984, mean loss: 0.3453554179027654
Epoch: 35, step: 1304, loss: 0.41342324018478394, mean loss: 0.3453567308128297
Epoch: 35, step: 1305, loss: 0.31299087405204773, mean loss: 0.34535610654371035
Epoch: 35, step: 1306, loss: 0.30593276023864746, mean loss: 0.3453553461651676
Epoch: 35, step: 1307, loss: 0.3581046760082245, mean loss: 0.345355592063367
Epoch: 35, step: 1308, loss: 0.31141263246536255, mean loss: 0.34535493741314044
Epoch: 35, step: 1309, loss: 0.31996968388557434, mean loss: 0.3453544478229085
Epoch: 35, step: 1310, loss: 0.3444993793964386, mean loss: 0.3453544313320322
Epoch: 35, step: 1311, loss: 0.3340880274772644, mean loss: 0.3453542140520072
Epoch: 35, step: 1312, loss: 0.33268240094184875, mean loss: 0.34535396967245136
Epoch: 35, step: 1313, loss: 0.31141355633735657, mean loss: 0.3453533151344536
Epoch: 35, step: 1314, loss: 0.3297230303287506, mean loss: 0.3453530137115473
Epoch: 35, step: 1315, loss: 0.36029255390167236, mean loss: 0.34535330180820323
Epoch: 35, step: 1316, loss: 0.3518967628479004, mean loss: 0.3453534279909951
Epoch: 35, step: 1317, loss: 0.33811527490615845, mean loss: 0.3453532884145925
Epoch: 35, step: 1318, loss: 0.3218999207019806, mean loss: 0.34535283616199003
Epoch: 35, step: 1319, loss: 0.30313003063201904, mean loss: 0.3453520219929671
Epoch: 35, step: 1320, loss: 0.32765302062034607, mean loss: 0.34535168071529465
Epoch: 35, step: 1321, loss: 0.3272411823272705, mean loss: 0.3453513315097417
Epoch: 35, step: 1322, loss: 0.34297242760658264, mean loss: 0.3453512856407425
Epoch: 35, step: 1323, loss: 0.3209737539291382, mean loss: 0.34535081561275177
Epoch: 35, step: 1324, loss: 0.30688539147377014, mean loss: 0.34535007396763195
Epoch: 35, step: 1325, loss: 0.3543185293674469, mean loss: 0.34535024688351906
Epoch: 35, step: 1326, loss: 0.3272206485271454, mean loss: 0.34534989734338073
Epoch: 35, step: 1327, loss: 0.29633891582489014, mean loss: 0.3453489524258686
Epoch: 35, step: 1328, loss: 0.29473885893821716, mean loss: 0.3453479766967532
Epoch: 35, step: 1329, loss: 0.3534967005252838, mean loss: 0.3453481337957281
Epoch: 35, step: 1330, loss: 0.3284957706928253, mean loss: 0.34534780890584543
Epoch: 35, step: 1331, loss: 0.35815975069999695, mean loss: 0.3453480558973205
Epoch: 35, step: 1332, loss: 0.3189186155796051, mean loss: 0.34534754639449017
Epoch: 35, step: 1333, loss: 0.34127476811408997, mean loss: 0.34534746788158815
Epoch: 35, step: 1334, loss: 0.35604119300842285, mean loss: 0.345347674025687
Epoch: 35, step: 1335, loss: 0.3270111382007599, mean loss: 0.3453473205571115
Epoch: 35, step: 1336, loss: 0.32313334941864014, mean loss: 0.3453468923524902
Epoch: 35, step: 1337, loss: 0.33563855290412903, mean loss: 0.34534670521460037
Epoch: 35, step: 1338, loss: 0.3223492205142975, mean loss: 0.34534626192377554
Epoch: 35, step: 1339, loss: 0.3236692249774933, mean loss: 0.3453458440934566
Epoch: 35, step: 1340, loss: 0.3159058690071106, mean loss: 0.34534527664149756
Epoch: 35, step: 1341, loss: 0.32995495200157166, mean loss: 0.3453449800005693
Epoch: 35, step: 1342, loss: 0.4008236229419708, mean loss: 0.3453460493034805
Epoch: 35, step: 1343, loss: 0.34141939878463745, mean loss: 0.3453459736221429
Epoch: 35, step: 1344, loss: 0.3151102066040039, mean loss: 0.3453453908763201
Epoch: 35, step: 1345, loss: 0.327220618724823, mean loss: 0.3453450415571945
Epoch: 35, step: 1346, loss: 0.3106525242328644, mean loss: 0.3453443729404441
Epoch: 35, step: 1347, loss: 0.32629042863845825, mean loss: 0.34534400572751817
Epoch: 35, step: 1348, loss: 0.287922739982605, mean loss: 0.3453428991102053
Epoch: 35, step: 1349, loss: 0.29479295015335083, mean loss: 0.3453419249350472
Epoch: 35, step: 1350, loss: 0.29842409491539, mean loss: 0.3453410207738242
Epoch: 35, step: 1351, loss: 0.34253087639808655, mean loss: 0.34534096662011315
Epoch: 35, step: 1352, loss: 0.3523758053779602, mean loss: 0.34534110218442354
Epoch: 35, step: 1353, loss: 0.3264417350292206, mean loss: 0.3453407379926643
Epoch: 35, step: 1354, loss: 0.36289912462234497, mean loss: 0.34534107633714123
Epoch: 35, step: 1355, loss: 0.3399134576320648, mean loss: 0.3453409717506855
Epoch: 35, step: 1356, loss: 0.344323992729187, mean loss: 0.34534095215458127
Epoch: 35, step: 1357, loss: 0.3213753402233124, mean loss: 0.34534049037162373
Epoch: 35, step: 1358, loss: 0.31858205795288086, mean loss: 0.345339974784957
Epoch: 35, step: 1359, loss: 0.3270237445831299, mean loss: 0.34533962187108025
Epoch: 35, step: 1360, loss: 0.3399411737918854, mean loss: 0.3453395178567437
Epoch: 35, step: 1361, loss: 0.35768061876296997, mean loss: 0.34533975563372543
Epoch: 35, step: 1362, loss: 0.3160490393638611, mean loss: 0.3453391912980171
Epoch: 35, step: 1363, loss: 0.35701584815979004, mean loss: 0.3453394162644332
Epoch: 35, step: 1364, loss: 0.3101421296596527, mean loss: 0.34533873815468263
Epoch: 35, step: 1365, loss: 0.322426974773407, mean loss: 0.34533829674591715
Epoch: 35, step: 1366, loss: 0.29280173778533936, mean loss: 0.34533728461732255
Epoch: 35, step: 1367, loss: 0.3486921191215515, mean loss: 0.3453373492477168
Epoch: 35, step: 1368, loss: 0.31397315859794617, mean loss: 0.34533674503282824
Epoch: 35, step: 1369, loss: 0.30034008622169495, mean loss: 0.3453358782122
Epoch: 35, step: 1370, loss: 0.3178621232509613, mean loss: 0.3453353489649314
Epoch: 35, step: 1371, loss: 0.3108217716217041, mean loss: 0.34533468411716317
Epoch: 35, step: 1372, loss: 0.33770641684532166, mean loss: 0.3453345371738682
Epoch: 35, step: 1373, loss: 0.3102725148200989, mean loss: 0.3453338617872219
Epoch: 35, step: 1374, loss: 0.3506056070327759, mean loss: 0.3453339633329264
Epoch: 35, step: 1375, loss: 0.3464675843715668, mean loss: 0.345333985168604
Epoch: 35, step: 1376, loss: 0.30920758843421936, mean loss: 0.34533328931952306
Epoch: 35, step: 1377, loss: 0.34222742915153503, mean loss: 0.34533322949710754
Epoch: 35, step: 1378, loss: 0.3258899748325348, mean loss: 0.34533285500502053
Epoch: 35, step: 1379, loss: 0.2997686266899109, mean loss: 0.34533197741972943
Epoch: 35, step: 1380, loss: 0.3446076214313507, mean loss: 0.3453319634686116
Epoch: 35, step: 1381, loss: 0.42512047290802, mean loss: 0.3453335001680731
Epoch: 35, step: 1382, loss: 0.33350667357444763, mean loss: 0.3453332723918161
Epoch: 35, step: 1383, loss: 0.38821426033973694, mean loss: 0.34533409823319866
Epoch: 35, step: 1384, loss: 0.3469306230545044, mean loss: 0.34533412897994537
Epoch: 35, step: 1385, loss: 0.35384321212768555, mean loss: 0.3453342928493585
Epoch: 35, step: 1386, loss: 0.34338244795799255, mean loss: 0.3453342552611117
Epoch: 35, step: 1387, loss: 0.3525356650352478, mean loss: 0.3453343939417806
Epoch: 35, step: 1388, loss: 0.3492032587528229, mean loss: 0.3453344684447522
Epoch: 35, step: 1389, loss: 0.35372623801231384, mean loss: 0.34533463004247156
Epoch: 35, step: 1390, loss: 0.32682788372039795, mean loss: 0.3453342736706258
Epoch: 35, step: 1391, loss: 0.34985750913619995, mean loss: 0.34533436076982216
Epoch: 35, step: 1392, loss: 0.34631645679473877, mean loss: 0.34533437968065006
Epoch: 35, step: 1393, loss: 0.32941868901252747, mean loss: 0.3453340732207073
Epoch: 35, step: 1394, loss: 0.3356889486312866, mean loss: 0.345333887505398
Epoch: 35, step: 1395, loss: 0.31207090616226196, mean loss: 0.3453332470444202
Epoch: 35, step: 1396, loss: 0.3415592610836029, mean loss: 0.34533317437973104
Epoch: 35, step: 1397, loss: 0.2812815308570862, mean loss: 0.3453319411469627
Epoch: 35, step: 1398, loss: 0.3520786762237549, mean loss: 0.3453320710442475
Epoch: 35, step: 1399, loss: 0.3912665545940399, mean loss: 0.3453329554201341
Epoch: 35, step: 1400, loss: 0.3321923315525055, mean loss: 0.34533270242878106
Epoch: 35, step: 1401, loss: 0.3189536929130554, mean loss: 0.34533219457368275
Epoch: 35, step: 1402, loss: 0.3512437045574188, mean loss: 0.34533230838131773
Epoch: 35, step: 1403, loss: 0.3506839871406555, mean loss: 0.34533241140917004
Epoch: 35, step: 1404, loss: 0.3083694577217102, mean loss: 0.3453316998305063
Epoch: 35, step: 1405, loss: 0.361377090215683, mean loss: 0.34533200871647224
Epoch: 35, step: 1406, loss: 0.33129775524139404, mean loss: 0.345331738551622
Epoch: 35, step: 1407, loss: 0.358364075422287, mean loss: 0.34533198942435767
Epoch: 35, step: 1408, loss: 0.3099120259284973, mean loss: 0.34533130760250363
Epoch: 35, step: 1409, loss: 0.33894604444503784, mean loss: 0.34533118469079704
Epoch: 35, step: 1410, loss: 0.3391571640968323, mean loss: 0.34533106584764495
Epoch: 35, step: 1411, loss: 0.3606148064136505, mean loss: 0.3453313600372924
Epoch: 35, step: 1412, loss: 0.31515681743621826, mean loss: 0.34533077923266897
Epoch: 35, step: 1413, loss: 0.31825149059295654, mean loss: 0.34533025801604195
Epoch: 35, step: 1414, loss: 0.28357189893722534, mean loss: 0.3453290693266169
Epoch: 35, step: 1415, loss: 0.3353048264980316, mean loss: 0.3453288763894618
Epoch: 35, step: 1416, loss: 0.3221385180950165, mean loss: 0.34532843005194624
Epoch: 35, step: 1417, loss: 0.33095043897628784, mean loss: 0.34532815332861055
Epoch: 35, step: 1418, loss: 0.32672783732414246, mean loss: 0.34532779534797187
Epoch: 35, step: 1419, loss: 0.32540827989578247, mean loss: 0.3453274119854728
Epoch: 35, step: 1420, loss: 0.3289308249950409, mean loss: 0.34532709642982545
Epoch: 35, step: 1421, loss: 0.3465614318847656, mean loss: 0.34532712018440487
Epoch: 35, step: 1422, loss: 0.3086320459842682, mean loss: 0.3453264140074289
Epoch: 35, step: 1423, loss: 0.31539374589920044, mean loss: 0.3453258379804081
Epoch: 35, step: 1424, loss: 0.33403950929641724, mean loss: 0.3453256207894395
Epoch: 35, step: 1425, loss: 0.361752450466156, mean loss: 0.3453259368966957
Epoch: 35, step: 1426, loss: 0.32018977403640747, mean loss: 0.3453254532019883
Epoch: 35, step: 1427, loss: 0.3655393123626709, mean loss: 0.34532584216941364
Epoch: 35, step: 1428, loss: 0.3140006959438324, mean loss: 0.3453252394034142
Epoch: 35, step: 1429, loss: 0.35532012581825256, mean loss: 0.3453254317237224
Epoch: 35, step: 1430, loss: 0.32622480392456055, mean loss: 0.3453250641989913
Epoch: 35, step: 1431, loss: 0.32501742243766785, mean loss: 0.34532467345701945
Epoch: 35, step: 1432, loss: 0.3133419454097748, mean loss: 0.3453240580850369
Epoch: 35, step: 1433, loss: 0.3309629559516907, mean loss: 0.3453237817718393
Epoch: 35, step: 1434, loss: 0.33953526616096497, mean loss: 0.34532367040068757
Epoch: 35, step: 1435, loss: 0.35690465569496155, mean loss: 0.3453238932147805
Epoch: 35, step: 1436, loss: 0.3819591701030731, mean loss: 0.34532459805109056
Epoch: 35, step: 1437, loss: 0.30598899722099304, mean loss: 0.3453238412770548
Epoch: 35, step: 1438, loss: 0.3142336308956146, mean loss: 0.34532324314684104
Epoch: 35, step: 1439, loss: 0.33723974227905273, mean loss: 0.34532308763508907
Epoch: 35, step: 1440, loss: 0.316853404045105, mean loss: 0.3453225399410549
Epoch: 35, step: 1441, loss: 0.3564900755882263, mean loss: 0.34532275477572166
Epoch: 35, step: 1442, loss: 0.35355257987976074, mean loss: 0.34532291309334673
Epoch: 35, step: 1443, loss: 0.36403888463974, mean loss: 0.34532327312665595
Valid: 35, mean loss: 0.18672208736340207
Epoch: 36, step: 0, loss: 0.34482505917549133, mean loss: 0.34532326354285386
Epoch: 36, step: 1, loss: 0.2973262369632721, mean loss: 0.34532234027453973
Epoch: 36, step: 2, loss: 0.3360597789287567, mean loss: 0.34532216210381733
Epoch: 36, step: 3, loss: 0.3349955081939697, mean loss: 0.34532196346848015
Epoch: 36, step: 4, loss: 0.37337273359298706, mean loss: 0.34532250302050316
Epoch: 36, step: 5, loss: 0.32019540667533875, mean loss: 0.34532201971416837
Epoch: 36, step: 6, loss: 0.37112459540367126, mean loss: 0.3453225160034432
Epoch: 36, step: 7, loss: 0.30793866515159607, mean loss: 0.3453217969726144
Epoch: 36, step: 8, loss: 0.28822746872901917, mean loss: 0.3453206988569403
Epoch: 36, step: 9, loss: 0.3516092300415039, mean loss: 0.3453208198041877
Epoch: 36, step: 10, loss: 0.3220271170139313, mean loss: 0.345320371805288
Epoch: 36, step: 11, loss: 0.2840435206890106, mean loss: 0.3453191933136518
Epoch: 36, step: 12, loss: 0.31177303194999695, mean loss: 0.3453185481579435
Epoch: 36, step: 13, loss: 0.32380732893943787, mean loss: 0.3453181344647396
Epoch: 36, step: 14, loss: 0.31925544142723083, mean loss: 0.34531763324946546
Epoch: 36, step: 15, loss: 0.3216535151004791, mean loss: 0.3453171781702703
Epoch: 36, step: 16, loss: 0.325128436088562, mean loss: 0.3453167899326964
Epoch: 36, step: 17, loss: 0.31570038199424744, mean loss: 0.3453162204082946
Epoch: 36, step: 18, loss: 0.31505659222602844, mean loss: 0.34531563852593816
Epoch: 36, step: 19, loss: 0.3096352517604828, mean loss: 0.34531495241743176
Epoch: 36, step: 20, loss: 0.35866260528564453, mean loss: 0.3453152090783849
Epoch: 36, step: 21, loss: 0.3292292356491089, mean loss: 0.34531489976843166
Epoch: 36, step: 22, loss: 0.374165415763855, mean loss: 0.34531545451137
Epoch: 36, step: 23, loss: 0.3659210205078125, mean loss: 0.3453158507113007
Epoch: 36, step: 24, loss: 0.34558752179145813, mean loss: 0.3453158559348405
Epoch: 36, step: 25, loss: 0.3174508512020111, mean loss: 0.3453153201723961
Epoch: 36, step: 26, loss: 0.3046640455722809, mean loss: 0.34531453858245165
Epoch: 36, step: 27, loss: 0.3516019880771637, mean loss: 0.3453146594670455
Epoch: 36, step: 28, loss: 0.34537675976753235, mean loss: 0.34531466066098354
Epoch: 36, step: 29, loss: 0.33533039689064026, mean loss: 0.3453144687075908
Epoch: 36, step: 30, loss: 0.35014015436172485, mean loss: 0.345314561482476
Epoch: 36, step: 31, loss: 0.3087814748287201, mean loss: 0.3453138591392229
Epoch: 36, step: 32, loss: 0.2913592457771301, mean loss: 0.34531282188960527
Epoch: 36, step: 33, loss: 0.34291210770606995, mean loss: 0.3453127757380004
Epoch: 36, step: 34, loss: 0.35406365990638733, mean loss: 0.3453129439627677
Epoch: 36, step: 35, loss: 0.3484925627708435, mean loss: 0.3453130050857744
Epoch: 36, step: 36, loss: 0.32963335514068604, mean loss: 0.34531270367576794
Epoch: 36, step: 37, loss: 0.32070958614349365, mean loss: 0.345312230738981
Epoch: 36, step: 38, loss: 0.313182532787323, mean loss: 0.34531161313334596
Epoch: 36, step: 39, loss: 0.349555641412735, mean loss: 0.3453116947116229
Epoch: 36, step: 40, loss: 0.3458094894886017, mean loss: 0.3453117042799992
Epoch: 36, step: 41, loss: 0.3135266602039337, mean loss: 0.3453110933346243
Epoch: 36, step: 42, loss: 0.30730509757995605, mean loss: 0.3453103628293913
Epoch: 36, step: 43, loss: 0.35318368673324585, mean loss: 0.34531051415798175
Epoch: 36, step: 44, loss: 0.3068700432777405, mean loss: 0.3453097753301957
Epoch: 36, step: 45, loss: 0.3432442843914032, mean loss: 0.3453097356321188
Epoch: 36, step: 46, loss: 0.3393939435482025, mean loss: 0.3453096219346676
Epoch: 36, step: 47, loss: 0.33077147603034973, mean loss: 0.3453093425268819
Epoch: 36, step: 48, loss: 0.35324522852897644, mean loss: 0.345309495043285
Epoch: 36, step: 49, loss: 0.31910496950149536, mean loss: 0.345308991439381
Epoch: 36, step: 50, loss: 0.35817036032676697, mean loss: 0.3453092386070352
Epoch: 36, step: 51, loss: 0.37645700573921204, mean loss: 0.34530983718815467
Epoch: 36, step: 52, loss: 0.2935642600059509, mean loss: 0.3453088427884548
Epoch: 36, step: 53, loss: 0.349642813205719, mean loss: 0.3453089260731778
Epoch: 36, step: 54, loss: 0.3422483205795288, mean loss: 0.3453088672594901
Epoch: 36, step: 55, loss: 0.3118771016597748, mean loss: 0.3453082248350935
Epoch: 36, step: 56, loss: 0.34704309701919556, mean loss: 0.34530825817173544
Epoch: 36, step: 57, loss: 0.37767869234085083, mean loss: 0.3453088801776954
Epoch: 36, step: 58, loss: 0.3412764370441437, mean loss: 0.3453088026947845
Epoch: 36, step: 59, loss: 0.3197070062160492, mean loss: 0.3453083107687896
Epoch: 36, step: 60, loss: 0.3452080190181732, mean loss: 0.3453083088417697
Epoch: 36, step: 61, loss: 0.3264656662940979, mean loss: 0.3453079468035238
Epoch: 36, step: 62, loss: 0.3154338002204895, mean loss: 0.34530737281949814
Epoch: 36, step: 63, loss: 0.3323691785335541, mean loss: 0.34530712423752985
Epoch: 36, step: 64, loss: 0.29052120447158813, mean loss: 0.3453060716540073
Epoch: 36, step: 65, loss: 0.31672942638397217, mean loss: 0.3453055226310434
Epoch: 36, step: 66, loss: 0.34375613927841187, mean loss: 0.34530549286440393
Epoch: 36, step: 67, loss: 0.3389151692390442, mean loss: 0.34530537009633305
Epoch: 36, step: 68, loss: 0.34323492646217346, mean loss: 0.3453053303206499
Epoch: 36, step: 69, loss: 0.337184339761734, mean loss: 0.34530517430976587
Epoch: 36, step: 70, loss: 0.3127800226211548, mean loss: 0.34530454948694983
Epoch: 36, step: 71, loss: 0.33770665526390076, mean loss: 0.34530440353078296
Epoch: 36, step: 72, loss: 0.326908677816391, mean loss: 0.34530405015418203
Epoch: 36, step: 73, loss: 0.3248613476753235, mean loss: 0.34530365746328956
Epoch: 36, step: 74, loss: 0.36629703640937805, mean loss: 0.345304060724569
Epoch: 36, step: 75, loss: 0.33869469165802, mean loss: 0.34530393376780627
Epoch: 36, step: 76, loss: 0.3389969766139984, mean loss: 0.3453038126222817
Epoch: 36, step: 77, loss: 0.3632989227771759, mean loss: 0.34530415826997396
Epoch: 36, step: 78, loss: 0.37797069549560547, mean loss: 0.3453047857124422
Epoch: 36, step: 79, loss: 0.3098079562187195, mean loss: 0.3453041039202347
Epoch: 36, step: 80, loss: 0.3269970118999481, mean loss: 0.3453037523002977
Epoch: 36, step: 81, loss: 0.30572310090065, mean loss: 0.3453029920987958
Epoch: 36, step: 82, loss: 0.3130297064781189, mean loss: 0.34530237225732957
Epoch: 36, step: 83, loss: 0.3114076554775238, mean loss: 0.3453017212871218
Epoch: 36, step: 84, loss: 0.3159390687942505, mean loss: 0.34530115736900363
Epoch: 36, step: 85, loss: 0.3184410035610199, mean loss: 0.3453006415219937
Epoch: 36, step: 86, loss: 0.3047749400138855, mean loss: 0.34529986324422857
Epoch: 36, step: 87, loss: 0.30892685055732727, mean loss: 0.34529916473038835
Epoch: 36, step: 88, loss: 0.3349657654762268, mean loss: 0.34529896628975204
Epoch: 36, step: 89, loss: 0.3538122773170471, mean loss: 0.34529912977462024
Epoch: 36, step: 90, loss: 0.3358384370803833, mean loss: 0.34529894810025263
Epoch: 36, step: 91, loss: 0.3168109655380249, mean loss: 0.3452984010539633
Epoch: 36, step: 92, loss: 0.3328835964202881, mean loss: 0.3452981626607257
Epoch: 36, step: 93, loss: 0.29464513063430786, mean loss: 0.3452971900229127
Epoch: 36, step: 94, loss: 0.31187692284584045, mean loss: 0.3452965483003916
Epoch: 36, step: 95, loss: 0.35100406408309937, mean loss: 0.34529665789170844
Epoch: 36, step: 96, loss: 0.3001469373703003, mean loss: 0.3452957909782367
Epoch: 36, step: 97, loss: 0.33844438195228577, mean loss: 0.3452956594278157
Epoch: 36, step: 98, loss: 0.36765286326408386, mean loss: 0.3452960886888766
Epoch: 36, step: 99, loss: 0.33867335319519043, mean loss: 0.34529596153398273
Epoch: 36, step: 100, loss: 0.3686355948448181, mean loss: 0.3452964096406029
Epoch: 36, step: 101, loss: 0.33920469880104065, mean loss: 0.34529629268574286
Epoch: 36, step: 102, loss: 0.3485966622829437, mean loss: 0.3452963560483784
Epoch: 36, step: 103, loss: 0.32565730810165405, mean loss: 0.34529597901244025
Epoch: 36, step: 104, loss: 0.32214778661727905, mean loss: 0.34529553461549667
Epoch: 36, step: 105, loss: 0.3592131435871124, mean loss: 0.3452958017993894
Epoch: 36, step: 106, loss: 0.32438918948173523, mean loss: 0.3452954004515113
Epoch: 36, step: 107, loss: 0.3628166615962982, mean loss: 0.34529573680375625
Epoch: 36, step: 108, loss: 0.3810555934906006, mean loss: 0.34529642326559734
Epoch: 36, step: 109, loss: 0.3244715631008148, mean loss: 0.3452960235101521
Epoch: 36, step: 110, loss: 0.320735365152359, mean loss: 0.34529555205111845
Epoch: 36, step: 111, loss: 0.329833060503006, mean loss: 0.3452952552434643
Epoch: 36, step: 112, loss: 0.33478790521621704, mean loss: 0.3452950535552668
Epoch: 36, step: 113, loss: 0.3269728720188141, mean loss: 0.3452947018684163
Epoch: 36, step: 114, loss: 0.32025372982025146, mean loss: 0.34529422122633013
Epoch: 36, step: 115, loss: 0.3288048505783081, mean loss: 0.34529390473169197
Epoch: 36, step: 116, loss: 0.3252187669277191, mean loss: 0.34529351941974396
Epoch: 36, step: 117, loss: 0.3291430175304413, mean loss: 0.345293209441204
Epoch: 36, step: 118, loss: 0.33465802669525146, mean loss: 0.3452930053227704
Epoch: 36, step: 119, loss: 0.33479607105255127, mean loss: 0.34529280386157224
Epoch: 36, step: 120, loss: 0.3647683262825012, mean loss: 0.3452931776361125
Epoch: 36, step: 121, loss: 0.30991512537002563, mean loss: 0.3452924986729937
Epoch: 36, step: 122, loss: 0.34971410036087036, mean loss: 0.34529258352918746
Epoch: 36, step: 123, loss: 0.3119412958621979, mean loss: 0.34529194348758796
Epoch: 36, step: 124, loss: 0.3345922827720642, mean loss: 0.34529173815528996
Epoch: 36, step: 125, loss: 0.3308713138103485, mean loss: 0.3452914614248285
Epoch: 36, step: 126, loss: 0.3135603964328766, mean loss: 0.3452908525118353
Epoch: 36, step: 127, loss: 0.3323404788970947, mean loss: 0.345290604001442
Epoch: 36, step: 128, loss: 0.33695200085639954, mean loss: 0.34529044399140335
Epoch: 36, step: 129, loss: 0.32255104184150696, mean loss: 0.34529000765179885
Epoch: 36, step: 130, loss: 0.32768887281417847, mean loss: 0.3452896699153537
Epoch: 36, step: 131, loss: 0.3297896087169647, mean loss: 0.3452893725007172
Epoch: 36, step: 132, loss: 0.2941353917121887, mean loss: 0.34528839097874187
Epoch: 36, step: 133, loss: 0.3605674207210541, mean loss: 0.3452886841409841
Epoch: 36, step: 134, loss: 0.32968801259994507, mean loss: 0.3452883848130703
Epoch: 36, step: 135, loss: 0.3199092149734497, mean loss: 0.3452878978758132
Epoch: 36, step: 136, loss: 0.3938447833061218, mean loss: 0.345288829494267
Epoch: 36, step: 137, loss: 0.40459126234054565, mean loss: 0.34528996725630307
Epoch: 36, step: 138, loss: 0.3068227767944336, mean loss: 0.34528922924831307
Epoch: 36, step: 139, loss: 0.35531774163246155, mean loss: 0.3452894216455271
Epoch: 36, step: 140, loss: 0.33940017223358154, mean loss: 0.345289308662325
Epoch: 36, step: 141, loss: 0.3079056441783905, mean loss: 0.3452885914834798
Epoch: 36, step: 142, loss: 0.32470273971557617, mean loss: 0.34528819656622445
Epoch: 36, step: 143, loss: 0.29307374358177185, mean loss: 0.34528719490774945
Epoch: 36, step: 144, loss: 0.33569782972335815, mean loss: 0.3452870109532292
Epoch: 36, step: 145, loss: 0.2993372976779938, mean loss: 0.3452861295085088
Epoch: 36, step: 146, loss: 0.31277820467948914, mean loss: 0.3452855059270538
Epoch: 36, step: 147, loss: 0.3274068236351013, mean loss: 0.3452851629768065
Epoch: 36, step: 148, loss: 0.4256214201450348, mean loss: 0.3452867039634593
Epoch: 36, step: 149, loss: 0.3227769732475281, mean loss: 0.3452862721966523
Epoch: 36, step: 150, loss: 0.34381717443466187, mean loss: 0.34528624401792857
Epoch: 36, step: 151, loss: 0.3013252317905426, mean loss: 0.34528540081913645
Epoch: 36, step: 152, loss: 0.3563004732131958, mean loss: 0.3452856120908321
Epoch: 36, step: 153, loss: 0.33801430463790894, mean loss: 0.34528547262810905
Epoch: 36, step: 154, loss: 0.33941254019737244, mean loss: 0.34528535998819593
Epoch: 36, step: 155, loss: 0.36354950070381165, mean loss: 0.34528571027858174
Epoch: 36, step: 156, loss: 0.3733384609222412, mean loss: 0.34528624829570154
Epoch: 36, step: 157, loss: 0.3933861553668976, mean loss: 0.3452871707748368
Epoch: 36, step: 158, loss: 0.3096677362918854, mean loss: 0.3452864876642662
Epoch: 36, step: 159, loss: 0.3337751626968384, mean loss: 0.3452862669039684
Epoch: 36, step: 160, loss: 0.37166064977645874, mean loss: 0.345286772693265
Epoch: 36, step: 161, loss: 0.3431035578250885, mean loss: 0.3452867308259143
Epoch: 36, step: 162, loss: 0.32495826482772827, mean loss: 0.3452863409958954
Epoch: 36, step: 163, loss: 0.2749348282814026, mean loss: 0.3452849919218616
Epoch: 36, step: 164, loss: 0.3182772397994995, mean loss: 0.34528447402598395
Epoch: 36, step: 165, loss: 0.3229621946811676, mean loss: 0.34528404598611157
Epoch: 36, step: 166, loss: 0.34060734510421753, mean loss: 0.3452839563099619
Epoch: 36, step: 167, loss: 0.29863467812538147, mean loss: 0.3452830618231122
Epoch: 36, step: 168, loss: 0.3153645992279053, mean loss: 0.3452824881559675
Epoch: 36, step: 169, loss: 0.37104037404060364, mean loss: 0.34528298203727836
Epoch: 36, step: 170, loss: 0.3173769414424896, mean loss: 0.3452824469775411
Epoch: 36, step: 171, loss: 0.34400495886802673, mean loss: 0.34528242248394286
Epoch: 36, step: 172, loss: 0.31005117297172546, mean loss: 0.34528174699935765
Epoch: 36, step: 173, loss: 0.3183414936065674, mean loss: 0.3452812304869647
Epoch: 36, step: 174, loss: 0.3679070472717285, mean loss: 0.3452816642724434
Epoch: 36, step: 175, loss: 0.33224526047706604, mean loss: 0.34528141434138904
Epoch: 36, step: 176, loss: 0.3062131702899933, mean loss: 0.34528066534800217
Epoch: 36, step: 177, loss: 0.3750443756580353, mean loss: 0.34528123594940374
Epoch: 36, step: 178, loss: 0.2957976162433624, mean loss: 0.34528028731493665
Epoch: 36, step: 179, loss: 0.31267836689949036, mean loss: 0.34527966232604745
Epoch: 36, step: 180, loss: 0.3422549068927765, mean loss: 0.34527960434166266
Epoch: 36, step: 181, loss: 0.3258918821811676, mean loss: 0.345279232687287
Epoch: 36, step: 182, loss: 0.32860881090164185, mean loss: 0.3452789131285279
Epoch: 36, step: 183, loss: 0.3485828638076782, mean loss: 0.34527897646142697
Epoch: 36, step: 184, loss: 0.29587218165397644, mean loss: 0.345278029408679
Epoch: 36, step: 185, loss: 0.33720842003822327, mean loss: 0.34527787472956517
Epoch: 36, step: 186, loss: 0.3082166612148285, mean loss: 0.34527716434997663
Epoch: 36, step: 187, loss: 0.3527904152870178, mean loss: 0.34527730835923326
Epoch: 36, step: 188, loss: 0.31393322348594666, mean loss: 0.345276707587093
Epoch: 36, step: 189, loss: 0.35265836119651794, mean loss: 0.3452768490685514
Epoch: 36, step: 190, loss: 0.35836148262023926, mean loss: 0.34527709985213645
Epoch: 36, step: 191, loss: 0.33004531264305115, mean loss: 0.3452768079212255
Epoch: 36, step: 192, loss: 0.3215351998806, mean loss: 0.3452763529006601
Epoch: 36, step: 193, loss: 0.32644882798194885, mean loss: 0.34527599206803106
Epoch: 36, step: 194, loss: 0.3242996633052826, mean loss: 0.34527559006092545
Epoch: 36, step: 195, loss: 0.3227511942386627, mean loss: 0.34527515839370004
Epoch: 36, step: 196, loss: 0.3148978054523468, mean loss: 0.3452745762401779
Epoch: 36, step: 197, loss: 0.2853488326072693, mean loss: 0.3452734278414267
Epoch: 36, step: 198, loss: 0.31101396679878235, mean loss: 0.34527277131610157
Epoch: 36, step: 199, loss: 0.35814371705055237, mean loss: 0.34527301796154336
Epoch: 36, step: 200, loss: 0.3147026598453522, mean loss: 0.34527243215416353
Epoch: 36, step: 201, loss: 0.3091042935848236, mean loss: 0.345271739092067
Epoch: 36, step: 202, loss: 0.32106032967567444, mean loss: 0.3452712751564237
Epoch: 36, step: 203, loss: 0.297161728143692, mean loss: 0.3452703533056723
Epoch: 36, step: 204, loss: 0.30172356963157654, mean loss: 0.3452695189002674
Epoch: 36, step: 205, loss: 0.3132535219192505, mean loss: 0.3452689054494726
Epoch: 36, step: 206, loss: 0.3449607193470001, mean loss: 0.3452688995445062
Epoch: 36, step: 207, loss: 0.3575632870197296, mean loss: 0.34526913510527174
Epoch: 36, step: 208, loss: 0.34327706694602966, mean loss: 0.34526909693792823
Epoch: 36, step: 209, loss: 0.30681857466697693, mean loss: 0.34526836025320834
Epoch: 36, step: 210, loss: 0.3268229365348816, mean loss: 0.34526800685875064
Epoch: 36, step: 211, loss: 0.31527096033096313, mean loss: 0.3452674321586486
Epoch: 36, step: 212, loss: 0.34285926818847656, mean loss: 0.3452673860225877
Epoch: 36, step: 213, loss: 0.361828088760376, mean loss: 0.3452677032895853
Epoch: 36, step: 214, loss: 0.33315032720565796, mean loss: 0.34526747115149675
Epoch: 36, step: 215, loss: 0.2925277352333069, mean loss: 0.3452664608117282
Epoch: 36, step: 216, loss: 0.3161444067955017, mean loss: 0.3452659029286605
Epoch: 36, step: 217, loss: 0.38219141960144043, mean loss: 0.3452666102869355
Epoch: 36, step: 218, loss: 0.3146452307701111, mean loss: 0.3452660237041813
Epoch: 36, step: 219, loss: 0.30046793818473816, mean loss: 0.3452651655690668
Epoch: 36, step: 220, loss: 0.305869996547699, mean loss: 0.3452644109446243
Epoch: 36, step: 221, loss: 0.30974721908569336, mean loss: 0.34526373061684856
Epoch: 36, step: 222, loss: 0.3224019408226013, mean loss: 0.3452632927102499
Epoch: 36, step: 223, loss: 0.3346365988254547, mean loss: 0.34526308916493337
Epoch: 36, step: 224, loss: 0.30700621008872986, mean loss: 0.3452623564008682
Epoch: 36, step: 225, loss: 0.30884841084480286, mean loss: 0.3452616589493157
Epoch: 36, step: 226, loss: 0.33072277903556824, mean loss: 0.3452613804853921
Epoch: 36, step: 227, loss: 0.3325115442276001, mean loss: 0.34526113629179184
Epoch: 36, step: 228, loss: 0.31738945841789246, mean loss: 0.3452606024845432
Epoch: 36, step: 229, loss: 0.33689939975738525, mean loss: 0.3452604423511934
Epoch: 36, step: 230, loss: 0.32798299193382263, mean loss: 0.34526011146063673
Epoch: 36, step: 231, loss: 0.35685262084007263, mean loss: 0.34526033347131124
Epoch: 36, step: 232, loss: 0.3819763660430908, mean loss: 0.34526103661458973
Epoch: 36, step: 233, loss: 0.3740094304084778, mean loss: 0.3452615871602597
Epoch: 36, step: 234, loss: 0.4124748706817627, mean loss: 0.34526287430255503
Epoch: 36, step: 235, loss: 0.36569079756736755, mean loss: 0.3452632654922001
Epoch: 36, step: 236, loss: 0.30837422609329224, mean loss: 0.34526255908980646
Epoch: 36, step: 237, loss: 0.30845165252685547, mean loss: 0.34526185419710675
Epoch: 36, step: 238, loss: 0.31560301780700684, mean loss: 0.3452612862704003
Epoch: 36, step: 239, loss: 0.35438454151153564, mean loss: 0.34526146096508553
Epoch: 36, step: 240, loss: 0.3355390131473541, mean loss: 0.3452612748004552
Epoch: 36, step: 241, loss: 0.3390541970729828, mean loss: 0.3452611559501177
Epoch: 36, step: 242, loss: 0.3350433111190796, mean loss: 0.34526096030715847
Epoch: 36, step: 243, loss: 0.30082792043685913, mean loss: 0.3452601095558398
Epoch: 36, step: 244, loss: 0.30281731486320496, mean loss: 0.3452592969269422
Epoch: 36, step: 245, loss: 0.3218224048614502, mean loss: 0.34525884820222336
Epoch: 36, step: 246, loss: 0.3465622067451477, mean loss: 0.34525887315595855
Epoch: 36, step: 247, loss: 0.3281553387641907, mean loss: 0.3452585457027806
Epoch: 36, step: 248, loss: 0.33137550950050354, mean loss: 0.34525827991226116
Epoch: 36, step: 249, loss: 0.34970468282699585, mean loss: 0.3452583650369484
Epoch: 36, step: 250, loss: 0.34546568989753723, mean loss: 0.34525836900602774
Epoch: 36, step: 251, loss: 0.3438543677330017, mean loss: 0.3452583421279882
Epoch: 36, step: 252, loss: 0.32064422965049744, mean loss: 0.3452578709272593
Epoch: 36, step: 253, loss: 0.30498436093330383, mean loss: 0.345257099965316
Epoch: 36, step: 254, loss: 0.3190360367298126, mean loss: 0.3452565980211127
Epoch: 36, step: 255, loss: 0.32844415307044983, mean loss: 0.3452562761902369
Epoch: 36, step: 256, loss: 0.34468090534210205, mean loss: 0.3452562651764575
Epoch: 36, step: 257, loss: 0.3854497969150543, mean loss: 0.3452570345484521
Epoch: 36, step: 258, loss: 0.33389759063720703, mean loss: 0.345256817113697
Epoch: 36, step: 259, loss: 0.3602396547794342, mean loss: 0.3452571038995033
Epoch: 36, step: 260, loss: 0.3930841386318207, mean loss: 0.345258019337052
Epoch: 36, step: 261, loss: 0.3134610950946808, mean loss: 0.3452574107368866
Epoch: 36, step: 262, loss: 0.34844473004341125, mean loss: 0.3452574717417157
Epoch: 36, step: 263, loss: 0.31177523732185364, mean loss: 0.345256830908872
Epoch: 36, step: 264, loss: 0.31149089336395264, mean loss: 0.3452561846584644
Epoch: 36, step: 265, loss: 0.37401220202445984, mean loss: 0.34525673501286375
Epoch: 36, step: 266, loss: 0.337032288312912, mean loss: 0.3452565776101978
Epoch: 36, step: 267, loss: 0.3426222503185272, mean loss: 0.3452565271943804
Epoch: 36, step: 268, loss: 0.30955225229263306, mean loss: 0.3452558438982079
Epoch: 36, step: 269, loss: 0.3003501892089844, mean loss: 0.3452549845256299
Epoch: 36, step: 270, loss: 0.3335762023925781, mean loss: 0.3452547610296557
Epoch: 36, step: 271, loss: 0.35924360156059265, mean loss: 0.3452550287279206
Epoch: 36, step: 272, loss: 0.33311524987220764, mean loss: 0.34525479641877815
Epoch: 36, step: 273, loss: 0.3668789267539978, mean loss: 0.34525521021437566
Epoch: 36, step: 274, loss: 0.31169313192367554, mean loss: 0.3452545679885717
Epoch: 36, step: 275, loss: 0.348172664642334, mean loss: 0.34525462382662475
Epoch: 36, step: 276, loss: 0.3714236617088318, mean loss: 0.3452551245640366
Epoch: 36, step: 277, loss: 0.3216998875141144, mean loss: 0.345254673849616
Epoch: 36, step: 278, loss: 0.3407266139984131, mean loss: 0.3452545872097398
Epoch: 36, step: 279, loss: 0.3146081864833832, mean loss: 0.34525400083286995
Epoch: 36, step: 280, loss: 0.3119697570800781, mean loss: 0.34525336399667456
Epoch: 36, step: 281, loss: 0.31189122796058655, mean loss: 0.34525272568235865
Epoch: 36, step: 282, loss: 0.4002211093902588, mean loss: 0.3452537773666663
Epoch: 36, step: 283, loss: 0.37150734663009644, mean loss: 0.3452542796542852
Epoch: 36, step: 284, loss: 0.3575327694416046, mean loss: 0.34525451456388334
Epoch: 36, step: 285, loss: 0.3410956561565399, mean loss: 0.3452544349989626
Epoch: 36, step: 286, loss: 0.28366807103157043, mean loss: 0.34525325678611096
Epoch: 36, step: 287, loss: 0.3460872769355774, mean loss: 0.345253272741501
Epoch: 36, step: 288, loss: 0.3415779769420624, mean loss: 0.34525320243186125
Epoch: 36, step: 289, loss: 0.3133566081523895, mean loss: 0.3452525922510012
Epoch: 36, step: 290, loss: 0.3108372092247009, mean loss: 0.3452519338983847
Epoch: 36, step: 291, loss: 0.37246885895729065, mean loss: 0.345252454537398
Epoch: 36, step: 292, loss: 0.3427899181842804, mean loss: 0.34525240743185726
Epoch: 36, step: 293, loss: 0.3000927269458771, mean loss: 0.3452515435946698
Epoch: 36, step: 294, loss: 0.3611462414264679, mean loss: 0.34525184763066574
Epoch: 36, step: 295, loss: 0.3454965651035309, mean loss: 0.34525185231156613
Epoch: 36, step: 296, loss: 0.340511679649353, mean loss: 0.34525176164435123
Epoch: 36, step: 297, loss: 0.3299376368522644, mean loss: 0.34525146873044604
Epoch: 36, step: 298, loss: 0.2994926869869232, mean loss: 0.3452505935170546
Epoch: 36, step: 299, loss: 0.34330594539642334, mean loss: 0.3452505563231115
Epoch: 36, step: 300, loss: 0.3163352906703949, mean loss: 0.34525000329134997
Epoch: 36, step: 301, loss: 0.2990413010120392, mean loss: 0.3452491195231849
Epoch: 36, step: 302, loss: 0.3323826193809509, mean loss: 0.3452488734486321
Epoch: 36, step: 303, loss: 0.3193126320838928, mean loss: 0.3452483774219842
Epoch: 36, step: 304, loss: 0.3197159171104431, mean loss: 0.3452478891269258
Epoch: 36, step: 305, loss: 0.3339841961860657, mean loss: 0.3452476737187609
Epoch: 36, step: 306, loss: 0.3108143210411072, mean loss: 0.3452470152239401
Epoch: 36, step: 307, loss: 0.3104303181171417, mean loss: 0.3452463494108691
Epoch: 36, step: 308, loss: 0.3571443259716034, mean loss: 0.34524657693609356
Epoch: 36, step: 309, loss: 0.34106016159057617, mean loss: 0.3452464968807269
Epoch: 36, step: 310, loss: 0.3606012463569641, mean loss: 0.3452467904986536
Epoch: 36, step: 311, loss: 0.34478554129600525, mean loss: 0.3452467816786826
Epoch: 36, step: 312, loss: 0.3512369692325592, mean loss: 0.34524689622038773
Epoch: 36, step: 313, loss: 0.3274845778942108, mean loss: 0.34524655658372233
Epoch: 36, step: 314, loss: 0.30172446370124817, mean loss: 0.3452457244054229
Epoch: 36, step: 315, loss: 0.3241363763809204, mean loss: 0.34524532078500175
Epoch: 36, step: 316, loss: 0.32510197162628174, mean loss: 0.34524493564228637
Epoch: 36, step: 317, loss: 0.3576723337173462, mean loss: 0.345245173250754
Epoch: 36, step: 318, loss: 0.34878796339035034, mean loss: 0.3452452409866418
Epoch: 36, step: 319, loss: 0.4209998846054077, mean loss: 0.3452466893394182
Epoch: 36, step: 320, loss: 0.31988921761512756, mean loss: 0.3452462045392705
Epoch: 36, step: 321, loss: 0.3531125783920288, mean loss: 0.34524635493069505
Epoch: 36, step: 322, loss: 0.34326794743537903, mean loss: 0.3452463171076982
Epoch: 36, step: 323, loss: 0.33384329080581665, mean loss: 0.3452460991099483
Epoch: 36, step: 324, loss: 0.30567213892936707, mean loss: 0.3452453425678584
Epoch: 36, step: 325, loss: 0.3224383294582367, mean loss: 0.3452449065706665
Epoch: 36, step: 326, loss: 0.3370122015476227, mean loss: 0.3452447491906695
Epoch: 36, step: 327, loss: 0.360415518283844, mean loss: 0.3452450391961958
Epoch: 36, step: 328, loss: 0.3580511212348938, mean loss: 0.34524528399351273
Epoch: 36, step: 329, loss: 0.32976824045181274, mean loss: 0.3452449881445327
Epoch: 36, step: 330, loss: 0.3305976092815399, mean loss: 0.34524470816022873
Epoch: 36, step: 331, loss: 0.33004048466682434, mean loss: 0.3452444175374079
Epoch: 36, step: 332, loss: 0.3306402564048767, mean loss: 0.34524413838988166
Epoch: 36, step: 333, loss: 0.31896719336509705, mean loss: 0.3452436361354945
Epoch: 36, step: 334, loss: 0.3129644989967346, mean loss: 0.34524301916771727
Epoch: 36, step: 335, loss: 0.3516963720321655, mean loss: 0.3452431425116176
Epoch: 36, step: 336, loss: 0.3628476858139038, mean loss: 0.3452434789834607
Epoch: 36, step: 337, loss: 0.3267371356487274, mean loss: 0.3452431252824681
Epoch: 36, step: 338, loss: 0.3202284872531891, mean loss: 0.34524264720135595
Epoch: 36, step: 339, loss: 0.3316501975059509, mean loss: 0.34524238742668856
Epoch: 36, step: 340, loss: 0.3059733808040619, mean loss: 0.34524163694400106
Epoch: 36, step: 341, loss: 0.37368065118789673, mean loss: 0.3452421804408142
Epoch: 36, step: 342, loss: 0.3191845715045929, mean loss: 0.3452416824644552
Epoch: 36, step: 343, loss: 0.39361172914505005, mean loss: 0.34524260682706565
Epoch: 36, step: 344, loss: 0.3208520710468292, mean loss: 0.34524214072727816
Epoch: 36, step: 345, loss: 0.308846652507782, mean loss: 0.34524144522778993
Epoch: 36, step: 346, loss: 0.3611387014389038, mean loss: 0.34524174901056137
Epoch: 36, step: 347, loss: 0.3050106465816498, mean loss: 0.3452409802437948
Epoch: 36, step: 348, loss: 0.3421648144721985, mean loss: 0.3452409214631827
Epoch: 36, step: 349, loss: 0.3287493884563446, mean loss: 0.3452406063423624
Epoch: 36, step: 350, loss: 0.34951215982437134, mean loss: 0.3452406879618041
Epoch: 36, step: 351, loss: 0.33673450350761414, mean loss: 0.3452405254315295
Epoch: 36, step: 352, loss: 0.3087514340877533, mean loss: 0.34523982823659394
Epoch: 36, step: 353, loss: 0.35421469807624817, mean loss: 0.34523999971563096
Epoch: 36, step: 354, loss: 0.35396063327789307, mean loss: 0.3452401663338996
Epoch: 36, step: 355, loss: 0.3329850137233734, mean loss: 0.34523993218883636
Epoch: 36, step: 356, loss: 0.33515846729278564, mean loss: 0.3452397395775967
Epoch: 36, step: 357, loss: 0.37470632791519165, mean loss: 0.34524030254019533
Epoch: 36, step: 358, loss: 0.3294256329536438, mean loss: 0.3452400004048652
Epoch: 36, step: 359, loss: 0.32714414596557617, mean loss: 0.34523965469467033
Epoch: 36, step: 360, loss: 0.33190152049064636, mean loss: 0.3452393998826691
Epoch: 36, step: 361, loss: 0.36550718545913696, mean loss: 0.34523978707148156
Epoch: 36, step: 362, loss: 0.3932666480541229, mean loss: 0.3452407045426066
Epoch: 36, step: 363, loss: 0.3671998977661133, mean loss: 0.3452411240274622
Epoch: 36, step: 364, loss: 0.2990693747997284, mean loss: 0.34524024202877596
Epoch: 36, step: 365, loss: 0.3179870843887329, mean loss: 0.3452397214335966
Epoch: 36, step: 366, loss: 0.33545854687690735, mean loss: 0.34523953459524476
Epoch: 36, step: 367, loss: 0.30854830145835876, mean loss: 0.34523883373886605
Epoch: 36, step: 368, loss: 0.3273192048072815, mean loss: 0.34523849145420366
Epoch: 36, step: 369, loss: 0.34674885869026184, mean loss: 0.34523852030333146
Epoch: 36, step: 370, loss: 0.3518977463245392, mean loss: 0.34523864749702876
Epoch: 36, step: 371, loss: 0.33615341782569885, mean loss: 0.34523847396907265
Epoch: 36, step: 372, loss: 0.33640173077583313, mean loss: 0.3452383051904338
Epoch: 36, step: 373, loss: 0.3822559416294098, mean loss: 0.3452390122005648
Epoch: 36, step: 374, loss: 0.38838687539100647, mean loss: 0.34523983627786176
Epoch: 36, step: 375, loss: 0.3313204348087311, mean loss: 0.3452395704374976
Epoch: 36, step: 376, loss: 0.3345201015472412, mean loss: 0.3452393657151109
Epoch: 36, step: 377, loss: 0.3146924674510956, mean loss: 0.34523878233597594
Epoch: 36, step: 378, loss: 0.3132915794849396, mean loss: 0.34523817222572917
Epoch: 36, step: 379, loss: 0.33346056938171387, mean loss: 0.34523794730779234
Epoch: 36, step: 380, loss: 0.31561094522476196, mean loss: 0.3452373815290836
Epoch: 36, step: 381, loss: 0.32633090019226074, mean loss: 0.34523702048410526
Epoch: 36, step: 382, loss: 0.37781471014022827, mean loss: 0.3452376425875226
Epoch: 36, step: 383, loss: 0.31877195835113525, mean loss: 0.3452371372085844
Epoch: 36, step: 384, loss: 0.3309301733970642, mean loss: 0.3452368640133007
Epoch: 36, step: 385, loss: 0.3307393193244934, mean loss: 0.34523658718411054
Epoch: 36, step: 386, loss: 0.3507211208343506, mean loss: 0.34523669190874157
Epoch: 36, step: 387, loss: 0.3799116909503937, mean loss: 0.3452373539991533
Epoch: 36, step: 388, loss: 0.33462926745414734, mean loss: 0.34523715145038686
Epoch: 36, step: 389, loss: 0.33755940198898315, mean loss: 0.34523700485571274
Epoch: 36, step: 390, loss: 0.3250119388103485, mean loss: 0.34523661869693384
Epoch: 36, step: 391, loss: 0.3586401343345642, mean loss: 0.34523687460642744
Epoch: 36, step: 392, loss: 0.3033478260040283, mean loss: 0.3452360748460631
Epoch: 36, step: 393, loss: 0.3298817574977875, mean loss: 0.3452357817016638
Epoch: 36, step: 394, loss: 0.28554999828338623, mean loss: 0.34523464220332634
Epoch: 36, step: 395, loss: 0.3600051701068878, mean loss: 0.34523492419125884
Epoch: 36, step: 396, loss: 0.30304139852523804, mean loss: 0.34523411867922843
Epoch: 36, step: 397, loss: 0.2891550362110138, mean loss: 0.34523304809997474
Epoch: 36, step: 398, loss: 0.347332626581192, mean loss: 0.34523308818126985
Epoch: 36, step: 399, loss: 0.32156047224998474, mean loss: 0.34523263627580386
Epoch: 36, step: 400, loss: 0.38267606496810913, mean loss: 0.34523335104966457
Epoch: 36, step: 401, loss: 0.3123147785663605, mean loss: 0.34523272266474336
Epoch: 36, step: 402, loss: 0.3896861672401428, mean loss: 0.34523357122344256
Epoch: 36, step: 403, loss: 0.3428574502468109, mean loss: 0.3452335258672355
Epoch: 36, step: 404, loss: 0.3149120807647705, mean loss: 0.3452329470922044
Epoch: 36, step: 405, loss: 0.357571005821228, mean loss: 0.345233182596284
Epoch: 36, step: 406, loss: 0.31988444924354553, mean loss: 0.3452326987587288
Epoch: 36, step: 407, loss: 0.32473331689834595, mean loss: 0.3452323074894155
Epoch: 36, step: 408, loss: 0.3088107407093048, mean loss: 0.3452316123284822
Epoch: 36, step: 409, loss: 0.30455026030540466, mean loss: 0.3452308358778958
Epoch: 36, step: 410, loss: 0.3175240755081177, mean loss: 0.3452303070724684
Epoch: 36, step: 411, loss: 0.32795339822769165, mean loss: 0.34522997733529676
Epoch: 36, step: 412, loss: 0.3515677750110626, mean loss: 0.34523009829255913
Epoch: 36, step: 413, loss: 0.29715731739997864, mean loss: 0.3452291808380591
Epoch: 36, step: 414, loss: 0.317562073469162, mean loss: 0.34522865282975035
Epoch: 36, step: 415, loss: 0.3215791881084442, mean loss: 0.34522820150408773
Epoch: 36, step: 416, loss: 0.33015158772468567, mean loss: 0.3452279137879415
Epoch: 36, step: 417, loss: 0.3302830755710602, mean loss: 0.34522762859199063
Epoch: 36, step: 418, loss: 0.34112489223480225, mean loss: 0.34522755029997765
Epoch: 36, step: 419, loss: 0.32592150568962097, mean loss: 0.3452271818921345
Epoch: 36, step: 420, loss: 0.3289462625980377, mean loss: 0.3452268712172124
Epoch: 36, step: 421, loss: 0.3672719895839691, mean loss: 0.34522729187741097
Epoch: 36, step: 422, loss: 0.3478660583496094, mean loss: 0.3452273422288234
Epoch: 36, step: 423, loss: 0.3352018892765045, mean loss: 0.34522715093259093
Epoch: 36, step: 424, loss: 0.32025057077407837, mean loss: 0.34522667436215154
Epoch: 36, step: 425, loss: 0.32544443011283875, mean loss: 0.3452262969104391
Epoch: 36, step: 426, loss: 0.31614190340042114, mean loss: 0.3452257419812542
Epoch: 36, step: 427, loss: 0.3778335452079773, mean loss: 0.34522636412509966
Epoch: 36, step: 428, loss: 0.33304113149642944, mean loss: 0.3452261316401698
Epoch: 36, step: 429, loss: 0.32979661226272583, mean loss: 0.3452258372623437
Epoch: 36, step: 430, loss: 0.3811213970184326, mean loss: 0.34522652209606985
Epoch: 36, step: 431, loss: 0.33717140555381775, mean loss: 0.3452263684193959
Epoch: 36, step: 432, loss: 0.3324272036552429, mean loss: 0.34522612423974497
Epoch: 36, step: 433, loss: 0.32572802901268005, mean loss: 0.3452257522664681
Epoch: 36, step: 434, loss: 0.3253806233406067, mean loss: 0.3452253736799074
Epoch: 36, step: 435, loss: 0.3588425815105438, mean loss: 0.34522563345113655
Epoch: 36, step: 436, loss: 0.35359856486320496, mean loss: 0.34522579317589214
Epoch: 36, step: 437, loss: 0.33367249369621277, mean loss: 0.3452255727856079
Epoch: 36, step: 438, loss: 0.33110901713371277, mean loss: 0.345225303503887
Epoch: 36, step: 439, loss: 0.32819414138793945, mean loss: 0.3452249786305062
Epoch: 36, step: 440, loss: 0.33538007736206055, mean loss: 0.3452247908403056
Epoch: 36, step: 441, loss: 0.3377038240432739, mean loss: 0.3452246473815867
Epoch: 36, step: 442, loss: 0.33277028799057007, mean loss: 0.3452244098253773
Epoch: 36, step: 443, loss: 0.31988897919654846, mean loss: 0.3452239265830139
Epoch: 36, step: 444, loss: 0.329525351524353, mean loss: 0.34522362715759936
Epoch: 36, step: 445, loss: 0.3397350311279297, mean loss: 0.34522352247333404
Epoch: 36, step: 446, loss: 0.3292621374130249, mean loss: 0.3452232180468486
Epoch: 36, step: 447, loss: 0.31892529129981995, mean loss: 0.34522271648431524
Epoch: 36, step: 448, loss: 0.3420853912830353, mean loss: 0.3452226566493792
Epoch: 36, step: 449, loss: 0.3195209801197052, mean loss: 0.3452221664774196
Epoch: 36, step: 450, loss: 0.31252071261405945, mean loss: 0.3452215428204374
Epoch: 36, step: 451, loss: 0.3142624795436859, mean loss: 0.34522095240424855
Epoch: 36, step: 452, loss: 0.33676451444625854, mean loss: 0.3452207911357176
Epoch: 36, step: 453, loss: 0.3648834824562073, mean loss: 0.34522116610599335
Epoch: 36, step: 454, loss: 0.3317863643169403, mean loss: 0.34522090990732845
Epoch: 36, step: 455, loss: 0.3374691903591156, mean loss: 0.3452207620865895
Epoch: 36, step: 456, loss: 0.319305956363678, mean loss: 0.34522026791588867
Epoch: 36, step: 457, loss: 0.3412391245365143, mean loss: 0.345220192000718
Epoch: 36, step: 458, loss: 0.35633543133735657, mean loss: 0.34522040394967857
Epoch: 36, step: 459, loss: 0.32019364833831787, mean loss: 0.34521992674054863
Epoch: 36, step: 460, loss: 0.37665602564811707, mean loss: 0.34522052615133914
Epoch: 36, step: 461, loss: 0.3492283821105957, mean loss: 0.34522060257005477
Epoch: 36, step: 462, loss: 0.34784579277038574, mean loss: 0.3452206526242085
Epoch: 36, step: 463, loss: 0.2923930585384369, mean loss: 0.3452196453866763
Epoch: 36, step: 464, loss: 0.2976381778717041, mean loss: 0.34521873819173426
Epoch: 36, step: 465, loss: 0.3466925323009491, mean loss: 0.345218766290764
Epoch: 36, step: 466, loss: 0.3339869976043701, mean loss: 0.3452185521524504
Epoch: 36, step: 467, loss: 0.3240537941455841, mean loss: 0.34521814864528183
Epoch: 36, step: 468, loss: 0.3095839321613312, mean loss: 0.34521746929011654
Epoch: 36, step: 469, loss: 0.3574526011943817, mean loss: 0.3452177025446234
Epoch: 36, step: 470, loss: 0.3436114490032196, mean loss: 0.34521767192307085
Epoch: 36, step: 471, loss: 0.3171164095401764, mean loss: 0.34521713621195327
Epoch: 36, step: 472, loss: 0.35647052526474, mean loss: 0.3452173507379279
Epoch: 36, step: 473, loss: 0.31291845440864563, mean loss: 0.34521673502828726
Epoch: 36, step: 474, loss: 0.3348912000656128, mean loss: 0.34521653819771553
Epoch: 36, step: 475, loss: 0.3399693965911865, mean loss: 0.34521643817595404
Epoch: 36, step: 476, loss: 0.3189457654953003, mean loss: 0.3452159374101913
Epoch: 36, step: 477, loss: 0.31804361939430237, mean loss: 0.34521541946733714
Epoch: 36, step: 478, loss: 0.289053350687027, mean loss: 0.34521434895919273
Epoch: 36, step: 479, loss: 0.33024924993515015, mean loss: 0.34521406371409086
Epoch: 36, step: 480, loss: 0.3375937044620514, mean loss: 0.3452139184675598
Epoch: 36, step: 481, loss: 0.3586489260196686, mean loss: 0.34521417453830183
Epoch: 36, step: 482, loss: 0.3243250548839569, mean loss: 0.3452137764000501
Epoch: 36, step: 483, loss: 0.31672871112823486, mean loss: 0.34521323349646554
Epoch: 36, step: 484, loss: 0.2862505614757538, mean loss: 0.34521210973439614
Epoch: 36, step: 485, loss: 0.34742963314056396, mean loss: 0.3452121519970873
Epoch: 36, step: 486, loss: 0.3365384042263031, mean loss: 0.3452119866915324
Epoch: 36, step: 487, loss: 0.3617594540119171, mean loss: 0.3452123020495771
Epoch: 36, step: 488, loss: 0.3260481357574463, mean loss: 0.345211936830011
Epoch: 36, step: 489, loss: 0.32359007000923157, mean loss: 0.34521152478086625
Epoch: 36, step: 490, loss: 0.3203827738761902, mean loss: 0.3452110516269662
Epoch: 36, step: 491, loss: 0.3492181599140167, mean loss: 0.3452111279877461
Epoch: 36, step: 492, loss: 0.3261418044567108, mean loss: 0.345210764603339
Epoch: 36, step: 493, loss: 0.3296903967857361, mean loss: 0.345210468853352
Epoch: 36, step: 494, loss: 0.3180694282054901, mean loss: 0.34520995167427754
Epoch: 36, step: 495, loss: 0.29183223843574524, mean loss: 0.34520893456846125
Epoch: 36, step: 496, loss: 0.3760485053062439, mean loss: 0.34520952220152346
Epoch: 36, step: 497, loss: 0.3378579616546631, mean loss: 0.3452093821237721
Epoch: 36, step: 498, loss: 0.36479461193084717, mean loss: 0.34520975529660536
Epoch: 36, step: 499, loss: 0.35374507308006287, mean loss: 0.34520991792364947
Epoch: 36, step: 500, loss: 0.3303496837615967, mean loss: 0.34520963479067507
Epoch: 36, step: 501, loss: 0.35134243965148926, mean loss: 0.34520975163716483
Epoch: 36, step: 502, loss: 0.3211197853088379, mean loss: 0.3452092926670136
Epoch: 36, step: 503, loss: 0.3214191198348999, mean loss: 0.3452088394172645
Epoch: 36, step: 504, loss: 0.3199929893016815, mean loss: 0.34520835901470176
Epoch: 36, step: 505, loss: 0.3588961362838745, mean loss: 0.34520861978393913
Epoch: 36, step: 506, loss: 0.36931338906288147, mean loss: 0.3452090790011245
Epoch: 36, step: 507, loss: 0.32127028703689575, mean loss: 0.34520862295464194
Epoch: 36, step: 508, loss: 0.3241614103317261, mean loss: 0.3452082220018935
Epoch: 36, step: 509, loss: 0.3149928152561188, mean loss: 0.34520764640455387
Epoch: 36, step: 510, loss: 0.38706082105636597, mean loss: 0.3452084436838119
Epoch: 36, step: 511, loss: 0.3469187021255493, mean loss: 0.3452084762626454
Epoch: 36, step: 512, loss: 0.3157728314399719, mean loss: 0.34520791555165575
Epoch: 36, step: 513, loss: 0.31353265047073364, mean loss: 0.34520731219028805
Epoch: 36, step: 514, loss: 0.3107961416244507, mean loss: 0.3452066567269351
Epoch: 36, step: 515, loss: 0.2877558767795563, mean loss: 0.3452055624263647
Epoch: 36, step: 516, loss: 0.315929651260376, mean loss: 0.34520500480058297
Epoch: 36, step: 517, loss: 0.31074830889701843, mean loss: 0.34520434850756737
Epoch: 36, step: 518, loss: 0.36133795976638794, mean loss: 0.3452046557968891
Epoch: 36, step: 519, loss: 0.33339130878448486, mean loss: 0.3452044307978983
Epoch: 36, step: 520, loss: 0.3335762023925781, mean loss: 0.3452042093289257
Epoch: 36, step: 521, loss: 0.26867547631263733, mean loss: 0.34520275180534715
Epoch: 36, step: 522, loss: 0.3354431092739105, mean loss: 0.34520256593217724
Epoch: 36, step: 523, loss: 0.3258034288883209, mean loss: 0.3452021964811023
Epoch: 36, step: 524, loss: 0.3540208637714386, mean loss: 0.34520236442692664
Epoch: 36, step: 525, loss: 0.3230006694793701, mean loss: 0.3452019416180341
Epoch: 36, step: 526, loss: 0.29465630650520325, mean loss: 0.34520097904571373
Epoch: 36, step: 527, loss: 0.30887046456336975, mean loss: 0.3452002871940516
Epoch: 36, step: 528, loss: 0.3149142265319824, mean loss: 0.34519971045951614
Epoch: 36, step: 529, loss: 0.3224993348121643, mean loss: 0.34519927818668134
Epoch: 36, step: 530, loss: 0.3339156210422516, mean loss: 0.3451990633212687
Epoch: 36, step: 531, loss: 0.3745224177837372, mean loss: 0.34519962169118384
Epoch: 36, step: 532, loss: 0.3224988877773285, mean loss: 0.3451991894362204
Epoch: 36, step: 533, loss: 0.352533221244812, mean loss: 0.3451993290841851
Epoch: 36, step: 534, loss: 0.4150581359863281, mean loss: 0.34520065924673393
Epoch: 36, step: 535, loss: 0.3657108247280121, mean loss: 0.3452010497677827
Epoch: 36, step: 536, loss: 0.34579795598983765, mean loss: 0.345201061132879
Epoch: 36, step: 537, loss: 0.31203556060791016, mean loss: 0.345200429673671
Epoch: 36, step: 538, loss: 0.3716100752353668, mean loss: 0.34520093249425554
Epoch: 36, step: 539, loss: 0.3191990852355957, mean loss: 0.3452004374472816
Epoch: 36, step: 540, loss: 0.330321341753006, mean loss: 0.3452001541708286
Epoch: 36, step: 541, loss: 0.3136669397354126, mean loss: 0.3451995538354816
Epoch: 36, step: 542, loss: 0.3626963496208191, mean loss: 0.3451998869364732
Epoch: 36, step: 543, loss: 0.33018043637275696, mean loss: 0.3451996010041978
Epoch: 36, step: 544, loss: 0.2994751036167145, mean loss: 0.345198730542217
Epoch: 36, step: 545, loss: 0.33504459261894226, mean loss: 0.3451985372405242
Epoch: 36, step: 546, loss: 0.30556488037109375, mean loss: 0.3451977827592299
Epoch: 36, step: 547, loss: 0.32370972633361816, mean loss: 0.3451973737122409
Epoch: 36, step: 548, loss: 0.34625890851020813, mean loss: 0.3451973939192498
Epoch: 36, step: 549, loss: 0.3285433053970337, mean loss: 0.3451970769038213
Epoch: 36, step: 550, loss: 0.3078043758869171, mean loss: 0.3451963651364088
Epoch: 36, step: 551, loss: 0.33819085359573364, mean loss: 0.34519623178953157
Epoch: 36, step: 552, loss: 0.33737266063690186, mean loss: 0.3451960828740786
Epoch: 36, step: 553, loss: 0.3532455563545227, mean loss: 0.3451962360864864
Epoch: 36, step: 554, loss: 0.36419329047203064, mean loss: 0.34519659766653904
Epoch: 36, step: 555, loss: 0.3263692855834961, mean loss: 0.3451962393240936
Epoch: 36, step: 556, loss: 0.38679882884025574, mean loss: 0.3451970311360027
Epoch: 36, step: 557, loss: 0.3514673113822937, mean loss: 0.3451971504744414
Epoch: 36, step: 558, loss: 0.38004693388938904, mean loss: 0.34519781373659647
Epoch: 36, step: 559, loss: 0.3215968906879425, mean loss: 0.34519736457164807
Epoch: 36, step: 560, loss: 0.31328433752059937, mean loss: 0.34519675722504894
Epoch: 36, step: 561, loss: 0.31068578362464905, mean loss: 0.3451961004486321
Epoch: 36, step: 562, loss: 0.31949806213378906, mean loss: 0.34519561140000293
Epoch: 36, step: 563, loss: 0.36632460355758667, mean loss: 0.34519601348937184
Epoch: 36, step: 564, loss: 0.32645103335380554, mean loss: 0.34519565677506453
Epoch: 36, step: 565, loss: 0.2965836822986603, mean loss: 0.34519473171370435
Epoch: 36, step: 566, loss: 0.3227667212486267, mean loss: 0.3451943049280968
Epoch: 36, step: 567, loss: 0.31864163279533386, mean loss: 0.345193799663366
Epoch: 36, step: 568, loss: 0.30410540103912354, mean loss: 0.34519301781649475
Epoch: 36, step: 569, loss: 0.3409274220466614, mean loss: 0.3451929366505365
Epoch: 36, step: 570, loss: 0.41059061884880066, mean loss: 0.34519418101705157
Epoch: 36, step: 571, loss: 0.3001183867454529, mean loss: 0.34519332334534386
Epoch: 36, step: 572, loss: 0.3086036443710327, mean loss: 0.34519262715494153
Epoch: 36, step: 573, loss: 0.30373287200927734, mean loss: 0.34519183831679806
Epoch: 36, step: 574, loss: 0.3819863796234131, mean loss: 0.3451925383784679
Epoch: 36, step: 575, loss: 0.3352431356906891, mean loss: 0.3451923490823742
Epoch: 36, step: 576, loss: 0.32848456501960754, mean loss: 0.34519203120820774
Epoch: 36, step: 577, loss: 0.308455228805542, mean loss: 0.3451913322849856
Epoch: 36, step: 578, loss: 0.3184893727302551, mean loss: 0.34519082428583114
Epoch: 36, step: 579, loss: 0.36748063564300537, mean loss: 0.34519124833672826
Epoch: 36, step: 580, loss: 0.3195474147796631, mean loss: 0.34519076048676045
Epoch: 36, step: 581, loss: 0.32145950198173523, mean loss: 0.34519030903033415
Epoch: 36, step: 582, loss: 0.33156025409698486, mean loss: 0.3451900497411426
Epoch: 36, step: 583, loss: 0.3122938871383667, mean loss: 0.34518942395810726
Epoch: 36, step: 584, loss: 0.3447938859462738, mean loss: 0.3451894164339388
Epoch: 36, step: 585, loss: 0.35316526889801025, mean loss: 0.3451895681526465
Epoch: 36, step: 586, loss: 0.31435054540634155, mean loss: 0.34518898153601857
Epoch: 36, step: 587, loss: 0.3138561546802521, mean loss: 0.34518838553763814
Epoch: 36, step: 588, loss: 0.3364240825176239, mean loss: 0.3451882188303355
Epoch: 36, step: 589, loss: 0.310551255941391, mean loss: 0.34518756000728823
Epoch: 36, step: 590, loss: 0.35689377784729004, mean loss: 0.345187782664784
Epoch: 36, step: 591, loss: 0.34549611806869507, mean loss: 0.34518778852934967
Epoch: 36, step: 592, loss: 0.3370799124240875, mean loss: 0.34518763431978833
Epoch: 36, step: 593, loss: 0.3801090717315674, mean loss: 0.3451882985032379
Epoch: 36, step: 594, loss: 0.3633759319782257, mean loss: 0.3451886444138386
Epoch: 36, step: 595, loss: 0.3173234164714813, mean loss: 0.3451881144551482
Epoch: 36, step: 596, loss: 0.31395983695983887, mean loss: 0.34518752054713014
Epoch: 36, step: 597, loss: 0.3253122568130493, mean loss: 0.3451871425610563
Epoch: 36, step: 598, loss: 0.3339691460132599, mean loss: 0.34518692922221017
Epoch: 36, step: 599, loss: 0.3565540015697479, mean loss: 0.3451871453920023
Epoch: 36, step: 600, loss: 0.3230685293674469, mean loss: 0.34518672476604384
Epoch: 36, step: 601, loss: 0.36453714966773987, mean loss: 0.3451870927427848
Epoch: 36, step: 602, loss: 0.4110850393772125, mean loss: 0.3451883458651655
Epoch: 36, step: 603, loss: 0.37639713287353516, mean loss: 0.34518893932350214
Epoch: 36, step: 604, loss: 0.3440057337284088, mean loss: 0.34518891682439407
Epoch: 36, step: 605, loss: 0.3163284361362457, mean loss: 0.3451883680417227
Epoch: 36, step: 606, loss: 0.30467116832733154, mean loss: 0.3451875976209337
Epoch: 36, step: 607, loss: 0.3322981297969818, mean loss: 0.34518735253674176
Epoch: 36, step: 608, loss: 0.33358991146087646, mean loss: 0.3451871320237253
Epoch: 36, step: 609, loss: 0.33162227272987366, mean loss: 0.34518687410724636
Epoch: 36, step: 610, loss: 0.3278087377548218, mean loss: 0.34518654369301777
Epoch: 36, step: 611, loss: 0.35681644082069397, mean loss: 0.3451867648105386
Epoch: 36, step: 612, loss: 0.3227328062057495, mean loss: 0.3451863379048481
Epoch: 36, step: 613, loss: 0.33398374915122986, mean loss: 0.3451861249197773
Epoch: 36, step: 614, loss: 0.3855934143066406, mean loss: 0.34518689313380013
Epoch: 36, step: 615, loss: 0.26915544271469116, mean loss: 0.34518544766896325
Epoch: 36, step: 616, loss: 0.3201703429222107, mean loss: 0.3451849721056708
Epoch: 36, step: 617, loss: 0.32856059074401855, mean loss: 0.34518465606480997
Epoch: 36, step: 618, loss: 0.3370794355869293, mean loss: 0.3451845019819539
Epoch: 36, step: 619, loss: 0.3194619417190552, mean loss: 0.3451840129970808
Epoch: 36, step: 620, loss: 0.3067981004714966, mean loss: 0.34518328329624387
Epoch: 36, step: 621, loss: 0.3591116666793823, mean loss: 0.34518354806420537
Epoch: 36, step: 622, loss: 0.31638118624687195, mean loss: 0.3451830005636481
Epoch: 36, step: 623, loss: 0.3352738320827484, mean loss: 0.3451828122050623
Epoch: 36, step: 624, loss: 0.3447456657886505, mean loss: 0.3451828038957157
Epoch: 36, step: 625, loss: 0.30692026019096375, mean loss: 0.34518207660919786
Epoch: 36, step: 626, loss: 0.36750659346580505, mean loss: 0.34518250094093184
Epoch: 36, step: 627, loss: 0.3366868495941162, mean loss: 0.34518233946348664
Epoch: 36, step: 628, loss: 0.31868433952331543, mean loss: 0.34518183582370293
Epoch: 36, step: 629, loss: 0.32487785816192627, mean loss: 0.3451814499192353
Epoch: 36, step: 630, loss: 0.31726381182670593, mean loss: 0.3451809193169718
Epoch: 36, step: 631, loss: 0.31281232833862305, mean loss: 0.34518030413164835
Epoch: 36, step: 632, loss: 0.3630021810531616, mean loss: 0.34518064284113237
Epoch: 36, step: 633, loss: 0.3204284608364105, mean loss: 0.3451801724283078
Epoch: 36, step: 634, loss: 0.329943984746933, mean loss: 0.3451798828715378
Epoch: 36, step: 635, loss: 0.3364793658256531, mean loss: 0.34517971752533777
Epoch: 36, step: 636, loss: 0.3278757929801941, mean loss: 0.34517938868467446
Epoch: 36, step: 637, loss: 0.3076809346675873, mean loss: 0.3451786760843549
Epoch: 36, step: 638, loss: 0.31544795632362366, mean loss: 0.34517811110858837
Epoch: 36, step: 639, loss: 0.30892038345336914, mean loss: 0.3451774221125475
Epoch: 36, step: 640, loss: 0.33958810567855835, mean loss: 0.345177315902259
Epoch: 36, step: 641, loss: 0.33260032534599304, mean loss: 0.34517707691410565
Epoch: 36, step: 642, loss: 0.3438321053981781, mean loss: 0.34517705135742344
Epoch: 36, step: 643, loss: 0.30923333764076233, mean loss: 0.3451763683804204
Epoch: 36, step: 644, loss: 0.3079572916030884, mean loss: 0.34517566118330895
Epoch: 36, step: 645, loss: 0.35946962237358093, mean loss: 0.3451759327767194
Epoch: 36, step: 646, loss: 0.33153173327445984, mean loss: 0.3451756735340772
Epoch: 36, step: 647, loss: 0.3321042060852051, mean loss: 0.3451754251781825
Epoch: 36, step: 648, loss: 0.3177391290664673, mean loss: 0.34517490390263084
Epoch: 36, step: 649, loss: 0.3510156273841858, mean loss: 0.34517501487127245
Epoch: 36, step: 650, loss: 0.3222414255142212, mean loss: 0.3451745791613958
Epoch: 36, step: 651, loss: 0.31095069646835327, mean loss: 0.34517392896224136
Epoch: 36, step: 652, loss: 0.3463093340396881, mean loss: 0.3451739505327161
Epoch: 36, step: 653, loss: 0.3178034722805023, mean loss: 0.34517343055706634
Epoch: 36, step: 654, loss: 0.317763090133667, mean loss: 0.34517290983402027
Epoch: 36, step: 655, loss: 0.3346506655216217, mean loss: 0.34517270994336086
Epoch: 36, step: 656, loss: 0.3300820589065552, mean loss: 0.3451724232723053
Epoch: 36, step: 657, loss: 0.32326585054397583, mean loss: 0.34517200712981966
Epoch: 36, step: 658, loss: 0.3465731739997864, mean loss: 0.3451720337462144
Epoch: 36, step: 659, loss: 0.3078681230545044, mean loss: 0.34517132513914256
Epoch: 36, step: 660, loss: 0.3200780749320984, mean loss: 0.3451708484889344
Epoch: 36, step: 661, loss: 0.29668810963630676, mean loss: 0.3451699275692282
Epoch: 36, step: 662, loss: 0.3703550696372986, mean loss: 0.3451704059467629
Epoch: 36, step: 663, loss: 0.3115423023700714, mean loss: 0.34516976721208015
Epoch: 36, step: 664, loss: 0.3421315848827362, mean loss: 0.3451697095057167
Epoch: 36, step: 665, loss: 0.35409438610076904, mean loss: 0.34516987901524365
Epoch: 36, step: 666, loss: 0.3885636627674103, mean loss: 0.34517070319301335
Epoch: 36, step: 667, loss: 0.346192330121994, mean loss: 0.3451707225963965
Epoch: 36, step: 668, loss: 0.3491770625114441, mean loss: 0.34517079868588646
Epoch: 36, step: 669, loss: 0.36245661973953247, mean loss: 0.3451711269766346
Epoch: 36, step: 670, loss: 0.3454042673110962, mean loss: 0.34517113140433064
Epoch: 36, step: 671, loss: 0.3607873022556305, mean loss: 0.3451714279739685
Epoch: 36, step: 672, loss: 0.3796646296977997, mean loss: 0.34517208302840996
Epoch: 36, step: 673, loss: 0.39116236567497253, mean loss: 0.345172956405345
Epoch: 36, step: 674, loss: 0.37132591009140015, mean loss: 0.34517345305271174
Epoch: 36, step: 675, loss: 0.28432613611221313, mean loss: 0.3451722975776464
Epoch: 36, step: 676, loss: 0.3080771863460541, mean loss: 0.3451715931643001
Epoch: 36, step: 677, loss: 0.32421207427978516, mean loss: 0.3451711951634857
Epoch: 36, step: 678, loss: 0.2962268888950348, mean loss: 0.3451702657765106
Epoch: 36, step: 679, loss: 0.30994129180908203, mean loss: 0.3451695968380713
Epoch: 36, step: 680, loss: 0.3204770088195801, mean loss: 0.34516912797662597
Epoch: 36, step: 681, loss: 0.3736182153224945, mean loss: 0.34516966815600825
Epoch: 36, step: 682, loss: 0.3458559215068817, mean loss: 0.3451696811860527
Epoch: 36, step: 683, loss: 0.36889275908470154, mean loss: 0.34517013161283744
Epoch: 36, step: 684, loss: 0.3618471026420593, mean loss: 0.34517044825015786
Epoch: 36, step: 685, loss: 0.32901251316070557, mean loss: 0.34517014147333824
Epoch: 36, step: 686, loss: 0.33575570583343506, mean loss: 0.34516996273293765
Epoch: 36, step: 687, loss: 0.3126619756221771, mean loss: 0.3451693455551751
Epoch: 36, step: 688, loss: 0.33444899320602417, mean loss: 0.34516914202865584
Epoch: 36, step: 689, loss: 0.3306351900100708, mean loss: 0.3451688661059612
Epoch: 36, step: 690, loss: 0.3323674201965332, mean loss: 0.34516862307898616
Epoch: 36, step: 691, loss: 0.3923286497592926, mean loss: 0.34516951836387266
Epoch: 36, step: 692, loss: 0.3397453725337982, mean loss: 0.3451694153939649
Epoch: 36, step: 693, loss: 0.3763568699359894, mean loss: 0.3451700074334224
Epoch: 36, step: 694, loss: 0.3113328516483307, mean loss: 0.34516936510619933
Epoch: 36, step: 695, loss: 0.3122105300426483, mean loss: 0.345168739463924
Epoch: 36, step: 696, loss: 0.3385320007801056, mean loss: 0.345168613484184
Epoch: 36, step: 697, loss: 0.3043930232524872, mean loss: 0.3451678394894565
Epoch: 36, step: 698, loss: 0.35291919112205505, mean loss: 0.34516798662138964
Epoch: 36, step: 699, loss: 0.3117162883281708, mean loss: 0.3451673516715321
Epoch: 36, step: 700, loss: 0.3565492033958435, mean loss: 0.34516756770743845
Epoch: 36, step: 701, loss: 0.32176607847213745, mean loss: 0.3451671235384138
Epoch: 36, step: 702, loss: 0.33769115805625916, mean loss: 0.34516698164448395
Epoch: 36, step: 703, loss: 0.29567626118659973, mean loss: 0.3451660423277428
Epoch: 36, step: 704, loss: 0.33482927083969116, mean loss: 0.34516584614312196
Epoch: 36, step: 705, loss: 0.32143980264663696, mean loss: 0.34516539584812295
Epoch: 36, step: 706, loss: 0.34053733944892883, mean loss: 0.34516530801421585
Epoch: 36, step: 707, loss: 0.2793149948120117, mean loss: 0.34516405829294505
Epoch: 36, step: 708, loss: 0.35915952920913696, mean loss: 0.34516432389693263
Epoch: 36, step: 709, loss: 0.3327028751373291, mean loss: 0.34516408740987986
Epoch: 36, step: 710, loss: 0.3270666301250458, mean loss: 0.34516374397203403
Epoch: 36, step: 711, loss: 0.3320867121219635, mean loss: 0.34516349581217654
Epoch: 36, step: 712, loss: 0.3036870062351227, mean loss: 0.3451627087372088
Epoch: 36, step: 713, loss: 0.33085769414901733, mean loss: 0.3451624372845049
Epoch: 36, step: 714, loss: 0.3867698609828949, mean loss: 0.34516322681416767
Epoch: 36, step: 715, loss: 0.32076868414878845, mean loss: 0.3451627639196199
Epoch: 36, step: 716, loss: 0.2922110855579376, mean loss: 0.345161759163005
Epoch: 36, step: 717, loss: 0.2781992554664612, mean loss: 0.3451604885754809
Epoch: 36, step: 718, loss: 0.33926764130592346, mean loss: 0.3451603767631121
Epoch: 36, step: 719, loss: 0.36409449577331543, mean loss: 0.3451607360170399
Epoch: 36, step: 720, loss: 0.3291570544242859, mean loss: 0.3451604323706763
Epoch: 36, step: 721, loss: 0.3336638808250427, mean loss: 0.3451602142446272
Epoch: 36, step: 722, loss: 0.29293256998062134, mean loss: 0.3451592233393534
Epoch: 36, step: 723, loss: 0.31754860281944275, mean loss: 0.3451586994981809
Epoch: 36, step: 724, loss: 0.3546164929866791, mean loss: 0.34515887893230957
Epoch: 36, step: 725, loss: 0.3284887373447418, mean loss: 0.345158562670849
Epoch: 36, step: 726, loss: 0.31935447454452515, mean loss: 0.3451580731318889
Epoch: 36, step: 727, loss: 0.3357408344745636, mean loss: 0.3451578944773386
Epoch: 36, step: 728, loss: 0.34351539611816406, mean loss: 0.34515786331807313
Epoch: 36, step: 729, loss: 0.3265073299407959, mean loss: 0.34515750951199925
Epoch: 36, step: 730, loss: 0.3342569172382355, mean loss: 0.3451573027284979
Epoch: 36, step: 731, loss: 0.3106840252876282, mean loss: 0.3451566487851516
Epoch: 36, step: 732, loss: 0.37031057476997375, mean loss: 0.3451571259353306
Epoch: 36, step: 733, loss: 0.3230993151664734, mean loss: 0.34515670752395744
Epoch: 36, step: 734, loss: 0.3518410921096802, mean loss: 0.3451568343166619
Epoch: 36, step: 735, loss: 0.308057576417923, mean loss: 0.345156130612984
Epoch: 36, step: 736, loss: 0.29250481724739075, mean loss: 0.3451551319347843
Epoch: 36, step: 737, loss: 0.35064446926116943, mean loss: 0.3451552360533179
Epoch: 36, step: 738, loss: 0.31939736008644104, mean loss: 0.34515474750228764
Epoch: 36, step: 739, loss: 0.34138455986976624, mean loss: 0.34515467599429067
Epoch: 36, step: 740, loss: 0.3058769702911377, mean loss: 0.3451539310401759
Epoch: 36, step: 741, loss: 0.38199281692504883, mean loss: 0.3451546297255661
Epoch: 36, step: 742, loss: 0.3788799047470093, mean loss: 0.34515526934615937
Epoch: 36, step: 743, loss: 0.3534679412841797, mean loss: 0.3451554269981078
Epoch: 36, step: 744, loss: 0.3202448785305023, mean loss: 0.3451549545721474
Epoch: 36, step: 745, loss: 0.34084945917129517, mean loss: 0.3451548729204235
Epoch: 36, step: 746, loss: 0.3261047601699829, mean loss: 0.34515451165071975
Epoch: 36, step: 747, loss: 0.42163580656051636, mean loss: 0.3451559620280032
Epoch: 36, step: 748, loss: 0.330811083316803, mean loss: 0.3451556899995066
Epoch: 36, step: 749, loss: 0.30032116174697876, mean loss: 0.34515483979796197
Epoch: 36, step: 750, loss: 0.368774950504303, mean loss: 0.34515528769993803
Epoch: 36, step: 751, loss: 0.32023918628692627, mean loss: 0.3451548152313888
Epoch: 36, step: 752, loss: 0.3253494203090668, mean loss: 0.3451544396811125
Epoch: 36, step: 753, loss: 0.3336714506149292, mean loss: 0.3451542219445835
Epoch: 36, step: 754, loss: 0.3022109568119049, mean loss: 0.3451534076844509
Epoch: 36, step: 755, loss: 0.33304476737976074, mean loss: 0.34515317809324303
Epoch: 36, step: 756, loss: 0.3106495141983032, mean loss: 0.3451525238837306
Epoch: 36, step: 757, loss: 0.3320702910423279, mean loss: 0.3451522758416988
Epoch: 36, step: 758, loss: 0.30611202120780945, mean loss: 0.34515153564385953
Epoch: 36, step: 759, loss: 0.40905579924583435, mean loss: 0.3451527472369052
Epoch: 36, step: 760, loss: 0.35358917713165283, mean loss: 0.3451529071843864
Epoch: 36, step: 761, loss: 0.3248708248138428, mean loss: 0.3451525226607757
Epoch: 36, step: 762, loss: 0.3803353011608124, mean loss: 0.34515318967081415
Epoch: 36, step: 763, loss: 0.32493001222610474, mean loss: 0.3451528062785065
Epoch: 36, step: 764, loss: 0.3195333778858185, mean loss: 0.34515232059293155
Epoch: 36, step: 765, loss: 0.2958073019981384, mean loss: 0.34515138514234206
Epoch: 36, step: 766, loss: 0.34245437383651733, mean loss: 0.34515133401513487
Epoch: 36, step: 767, loss: 0.3086695969104767, mean loss: 0.3451506424444436
Epoch: 36, step: 768, loss: 0.3134556710720062, mean loss: 0.3451500416260755
Epoch: 36, step: 769, loss: 0.4087409973144531, mean loss: 0.34515124705041655
Epoch: 36, step: 770, loss: 0.33777517080307007, mean loss: 0.3451511072328401
Epoch: 36, step: 771, loss: 0.308010995388031, mean loss: 0.34515040323496604
Epoch: 36, step: 772, loss: 0.2928076684474945, mean loss: 0.34514941108729297
Epoch: 36, step: 773, loss: 0.3656686246395111, mean loss: 0.34514980001813855
Epoch: 36, step: 774, loss: 0.3568955361843109, mean loss: 0.3451500226481385
Epoch: 36, step: 775, loss: 0.33277639746665955, mean loss: 0.34514978812150504
Epoch: 36, step: 776, loss: 0.3361837863922119, mean loss: 0.3451496181853452
Epoch: 36, step: 777, loss: 0.3120497763156891, mean loss: 0.34514899084290424
Epoch: 36, step: 778, loss: 0.3370993137359619, mean loss: 0.3451488382799888
Epoch: 36, step: 779, loss: 0.3268132209777832, mean loss: 0.34514849077757614
Epoch: 36, step: 780, loss: 0.3326479494571686, mean loss: 0.3451482538678572
Epoch: 36, step: 781, loss: 0.33321723341941833, mean loss: 0.3451480277559585
Epoch: 36, step: 782, loss: 0.3543989658355713, mean loss: 0.34514820307269206
Epoch: 36, step: 783, loss: 0.31780368089675903, mean loss: 0.34514768486995223
Epoch: 36, step: 784, loss: 0.315047949552536, mean loss: 0.34514711446431035
Epoch: 36, step: 785, loss: 0.36278650164604187, mean loss: 0.34514744873353875
Epoch: 36, step: 786, loss: 0.3771531581878662, mean loss: 0.345148055235395
Epoch: 36, step: 787, loss: 0.34204408526420593, mean loss: 0.3451479964168933
Epoch: 36, step: 788, loss: 0.3334380090236664, mean loss: 0.34514777452336076
Epoch: 36, step: 789, loss: 0.34610503911972046, mean loss: 0.3451477926623041
Epoch: 36, step: 790, loss: 0.3636128902435303, mean loss: 0.34514814254572584
Epoch: 36, step: 791, loss: 0.3057154715061188, mean loss: 0.345147395375212
Epoch: 36, step: 792, loss: 0.3042551279067993, mean loss: 0.34514662056293643
Epoch: 36, step: 793, loss: 0.32259857654571533, mean loss: 0.3451461933386381
Epoch: 36, step: 794, loss: 0.34569406509399414, mean loss: 0.3451462037191257
Epoch: 36, step: 795, loss: 0.3384841978549957, mean loss: 0.3451460774969608
Epoch: 36, step: 796, loss: 0.3156012296676636, mean loss: 0.345145517734019
Epoch: 36, step: 797, loss: 0.31105053424835205, mean loss: 0.3451448717754823
Epoch: 36, step: 798, loss: 0.32523810863494873, mean loss: 0.34514449463202435
Epoch: 36, step: 799, loss: 0.3266286551952362, mean loss: 0.34514414384694864
Epoch: 36, step: 800, loss: 0.31421253085136414, mean loss: 0.3451435578544698
Epoch: 36, step: 801, loss: 0.32858097553253174, mean loss: 0.3451432440860024
Epoch: 36, step: 802, loss: 0.330706924200058, mean loss: 0.34514297060351834
Epoch: 36, step: 803, loss: 0.35776492953300476, mean loss: 0.3451432097101132
Epoch: 36, step: 804, loss: 0.34412986040115356, mean loss: 0.34514319051389225
Epoch: 36, step: 805, loss: 0.3041532337665558, mean loss: 0.3451424140418948
Epoch: 36, step: 806, loss: 0.35237306356430054, mean loss: 0.34514255100936125
Epoch: 36, step: 807, loss: 0.3348756730556488, mean loss: 0.3451423565314488
Epoch: 36, step: 808, loss: 0.30029305815696716, mean loss: 0.3451415070002918
Epoch: 36, step: 809, loss: 0.3164530396461487, mean loss: 0.3451409635963566
Epoch: 36, step: 810, loss: 0.3033657968044281, mean loss: 0.34514017232508487
Epoch: 36, step: 811, loss: 0.38823872804641724, mean loss: 0.3451409886474525
Epoch: 36, step: 812, loss: 0.33287981152534485, mean loss: 0.3451407564149938
Epoch: 36, step: 813, loss: 0.3123430609703064, mean loss: 0.3451401352229895
Epoch: 36, step: 814, loss: 0.31590020656585693, mean loss: 0.3451395814259733
Epoch: 36, step: 815, loss: 0.32305654883384705, mean loss: 0.34513916318671967
Epoch: 36, step: 816, loss: 0.3332585394382477, mean loss: 0.34513893817916774
Epoch: 36, step: 817, loss: 0.31003326177597046, mean loss: 0.34513827332411673
Epoch: 36, step: 818, loss: 0.32018232345581055, mean loss: 0.3451378007004047
Epoch: 36, step: 819, loss: 0.39275676012039185, mean loss: 0.3451387025063175
Epoch: 36, step: 820, loss: 0.33291271328926086, mean loss: 0.3451384709754167
Epoch: 36, step: 821, loss: 0.3061838746070862, mean loss: 0.34513773328279906
Epoch: 36, step: 822, loss: 0.34751611948013306, mean loss: 0.3451377783220211
Epoch: 36, step: 823, loss: 0.3931707739830017, mean loss: 0.34513868790003316
Epoch: 36, step: 824, loss: 0.3535997271537781, mean loss: 0.34513884811967854
Epoch: 36, step: 825, loss: 0.33472228050231934, mean loss: 0.34513865087355816
Epoch: 36, step: 826, loss: 0.33762097358703613, mean loss: 0.3451385085229629
Epoch: 36, step: 827, loss: 0.31277164816856384, mean loss: 0.3451378956535326
Epoch: 36, step: 828, loss: 0.35689854621887207, mean loss: 0.34513811833829894
Epoch: 36, step: 829, loss: 0.3259051442146301, mean loss: 0.3451377541739841
Epoch: 36, step: 830, loss: 0.32332322001457214, mean loss: 0.34513734113726807
Epoch: 36, step: 831, loss: 0.3312208652496338, mean loss: 0.34513707764749435
Epoch: 36, step: 832, loss: 0.3381626009941101, mean loss: 0.3451369455976495
Epoch: 36, step: 833, loss: 0.31582188606262207, mean loss: 0.3451363905774001
Epoch: 36, step: 834, loss: 0.3034650683403015, mean loss: 0.3451356016317132
Epoch: 36, step: 835, loss: 0.3154679834842682, mean loss: 0.3451350399577611
Epoch: 36, step: 836, loss: 0.36516493558883667, mean loss: 0.3451354191610256
Epoch: 36, step: 837, loss: 0.3105267286300659, mean loss: 0.34513476396639964
Epoch: 36, step: 838, loss: 0.30816352367401123, mean loss: 0.34513406405839947
Epoch: 36, step: 839, loss: 0.35700932145118713, mean loss: 0.3451342888663919
Epoch: 36, step: 840, loss: 0.35603851079940796, mean loss: 0.3451344952880092
Epoch: 36, step: 841, loss: 0.3213672935962677, mean loss: 0.3451340453731625
Epoch: 36, step: 842, loss: 0.32616740465164185, mean loss: 0.3451336863400786
Epoch: 36, step: 843, loss: 0.34092971682548523, mean loss: 0.34513360676164456
Epoch: 36, step: 844, loss: 0.3373943865299225, mean loss: 0.3451334602659655
Epoch: 36, step: 845, loss: 0.31709372997283936, mean loss: 0.3451329295120322
Epoch: 36, step: 846, loss: 0.32848554849624634, mean loss: 0.34513261440573073
Epoch: 36, step: 847, loss: 0.32109305262565613, mean loss: 0.3451321593867691
Epoch: 36, step: 848, loss: 0.3342667520046234, mean loss: 0.3451319537310732
Epoch: 36, step: 849, loss: 0.29984113574028015, mean loss: 0.34513109650243273
Epoch: 36, step: 850, loss: 0.3386189341545105, mean loss: 0.34513097324772757
Epoch: 36, step: 851, loss: 0.3515920042991638, mean loss: 0.34513109553236404
Epoch: 36, step: 852, loss: 0.3367721140384674, mean loss: 0.34513093732918265
Epoch: 36, step: 853, loss: 0.2912103235721588, mean loss: 0.3451299168398803
Epoch: 36, step: 854, loss: 0.29345864057540894, mean loss: 0.34512893893953656
Epoch: 36, step: 855, loss: 0.36919981241226196, mean loss: 0.34512939448218366
Epoch: 36, step: 856, loss: 0.3794553577899933, mean loss: 0.34513004409069425
Epoch: 36, step: 857, loss: 0.3204001486301422, mean loss: 0.34512957609373235
Epoch: 36, step: 858, loss: 0.36048653721809387, mean loss: 0.3451298667085938
Epoch: 36, step: 859, loss: 0.30849477648735046, mean loss: 0.345129173439912
Epoch: 36, step: 860, loss: 0.31731459498405457, mean loss: 0.3451286470972409
Epoch: 36, step: 861, loss: 0.3253355026245117, mean loss: 0.34512827255338757
Epoch: 36, step: 862, loss: 0.3691820204257965, mean loss: 0.34512872771163444
Epoch: 36, step: 863, loss: 0.3123778998851776, mean loss: 0.3451281079941839
Epoch: 36, step: 864, loss: 0.28557300567626953, mean loss: 0.34512698110242973
Epoch: 36, step: 865, loss: 0.3520752489566803, mean loss: 0.3451271125739123
Epoch: 36, step: 866, loss: 0.3129517734050751, mean loss: 0.3451265037805277
Epoch: 36, step: 867, loss: 0.3138396143913269, mean loss: 0.3451259118088069
Epoch: 36, step: 868, loss: 0.3510388433933258, mean loss: 0.3451260236838487
Epoch: 36, step: 869, loss: 0.36721178889274597, mean loss: 0.3451264415474959
Epoch: 36, step: 870, loss: 0.3890359699726105, mean loss: 0.34512727230198315
Epoch: 36, step: 871, loss: 0.3233291506767273, mean loss: 0.34512685989617065
Epoch: 36, step: 872, loss: 0.30736368894577026, mean loss: 0.3451261454558704
Epoch: 36, step: 873, loss: 0.3066219687461853, mean loss: 0.3451254170102858
Epoch: 36, step: 874, loss: 0.3670012056827545, mean loss: 0.34512583086201726
Epoch: 36, step: 875, loss: 0.3093758225440979, mean loss: 0.3451251545470661
Epoch: 36, step: 876, loss: 0.3068494498729706, mean loss: 0.3451244304649512
Epoch: 36, step: 877, loss: 0.3211650848388672, mean loss: 0.34512397722168336
Epoch: 36, step: 878, loss: 0.2994772493839264, mean loss: 0.34512311373062465
Epoch: 36, step: 879, loss: 0.3564835488796234, mean loss: 0.3451233286298973
Epoch: 36, step: 880, loss: 0.34762704372406006, mean loss: 0.3451233759904401
Epoch: 36, step: 881, loss: 0.3051227629184723, mean loss: 0.3451226193488732
Epoch: 36, step: 882, loss: 0.3301408290863037, mean loss: 0.34512233596244574
Epoch: 36, step: 883, loss: 0.34296783804893494, mean loss: 0.34512229521004517
Epoch: 36, step: 884, loss: 0.3132150173187256, mean loss: 0.3451216916942251
Epoch: 36, step: 885, loss: 0.41419553756713867, mean loss: 0.345122998178921
Epoch: 36, step: 886, loss: 0.3161924183368683, mean loss: 0.34512245098707967
Epoch: 36, step: 887, loss: 0.31577572226524353, mean loss: 0.34512189593471315
Epoch: 36, step: 888, loss: 0.3306165337562561, mean loss: 0.34512162159124526
Epoch: 36, step: 889, loss: 0.3673080801963806, mean loss: 0.34512204120123513
Epoch: 36, step: 890, loss: 0.31256920099258423, mean loss: 0.3451214255446827
Epoch: 36, step: 891, loss: 0.3611730933189392, mean loss: 0.3451217291165825
Epoch: 36, step: 892, loss: 0.3418391942977905, mean loss: 0.3451216670378939
Epoch: 36, step: 893, loss: 0.36381494998931885, mean loss: 0.3451220205551024
Epoch: 36, step: 894, loss: 0.3156323730945587, mean loss: 0.345121462873462
Epoch: 36, step: 895, loss: 0.33711501955986023, mean loss: 0.34512131146568376
Epoch: 36, step: 896, loss: 0.3106183707714081, mean loss: 0.34512065900183675
Epoch: 36, step: 897, loss: 0.3424660861492157, mean loss: 0.34512060880379486
Epoch: 36, step: 898, loss: 0.33495718240737915, mean loss: 0.34512041661677073
Epoch: 36, step: 899, loss: 0.3023698627948761, mean loss: 0.34511960823325544
Epoch: 36, step: 900, loss: 0.3191930055618286, mean loss: 0.345119117988334
Epoch: 36, step: 901, loss: 0.29531142115592957, mean loss: 0.3451181761947245
Epoch: 36, step: 902, loss: 0.33765292167663574, mean loss: 0.34511803503991295
Epoch: 36, step: 903, loss: 0.30284053087234497, mean loss: 0.34511723566190344
Epoch: 36, step: 904, loss: 0.3330483138561249, mean loss: 0.3451170074684832
Epoch: 36, step: 905, loss: 0.32466891407966614, mean loss: 0.34511662085299083
Epoch: 36, step: 906, loss: 0.32887354493141174, mean loss: 0.3451163137482675
Epoch: 36, step: 907, loss: 0.30813702940940857, mean loss: 0.34511561460124457
Epoch: 36, step: 908, loss: 0.35633715987205505, mean loss: 0.34511582675682795
Epoch: 36, step: 909, loss: 0.3257710039615631, mean loss: 0.3451154610287152
Epoch: 36, step: 910, loss: 0.39041057229042053, mean loss: 0.34511631734994147
Epoch: 36, step: 911, loss: 0.32374459505081177, mean loss: 0.3451159133170789
Epoch: 36, step: 912, loss: 0.3004756569862366, mean loss: 0.34511506940804193
Epoch: 36, step: 913, loss: 0.32162830233573914, mean loss: 0.34511462540700083
Epoch: 36, step: 914, loss: 0.37102359533309937, mean loss: 0.34511511518884785
Epoch: 36, step: 915, loss: 0.29715216159820557, mean loss: 0.3451142085167573
Epoch: 36, step: 916, loss: 0.37969210743904114, mean loss: 0.3451148621508837
Epoch: 36, step: 917, loss: 0.31029704213142395, mean loss: 0.34511420399391385
Epoch: 36, step: 918, loss: 0.3390025198459625, mean loss: 0.3451140884676838
Epoch: 36, step: 919, loss: 0.3958894610404968, mean loss: 0.3451150482320225
Epoch: 36, step: 920, loss: 0.3037198483943939, mean loss: 0.3451142657880222
Epoch: 36, step: 921, loss: 0.33327701687812805, mean loss: 0.34511404204687923
Epoch: 36, step: 922, loss: 0.32011815905570984, mean loss: 0.3451135695974304
Epoch: 36, step: 923, loss: 0.3285699188709259, mean loss: 0.3451132569102994
Epoch: 36, step: 924, loss: 0.3939957320690155, mean loss: 0.3451141808074655
Epoch: 36, step: 925, loss: 0.32229509949684143, mean loss: 0.34511374952639745
Epoch: 36, step: 926, loss: 0.40914374589920044, mean loss: 0.3451149596716673
Epoch: 36, step: 927, loss: 0.32501500844955444, mean loss: 0.34511457979656857
Epoch: 36, step: 928, loss: 0.3345957398414612, mean loss: 0.3451143810015663
Epoch: 36, step: 929, loss: 0.3696894943714142, mean loss: 0.3451148454365621
Epoch: 36, step: 930, loss: 0.3357008397579193, mean loss: 0.3451146675284892
Epoch: 36, step: 931, loss: 0.3365788459777832, mean loss: 0.345114506219593
Epoch: 36, step: 932, loss: 0.3023669719696045, mean loss: 0.34511369839726275
Epoch: 36, step: 933, loss: 0.347097247838974, mean loss: 0.3451137358807172
Epoch: 36, step: 934, loss: 0.3404959440231323, mean loss: 0.345113648619207
Epoch: 36, step: 935, loss: 0.29707035422325134, mean loss: 0.3451127407716183
Epoch: 36, step: 936, loss: 0.2994396686553955, mean loss: 0.3451118777291188
Epoch: 36, step: 937, loss: 0.3246477246284485, mean loss: 0.3451114910439387
Epoch: 36, step: 938, loss: 0.333281546831131, mean loss: 0.34511126751269117
Epoch: 36, step: 939, loss: 0.3376617133617401, mean loss: 0.3451111267532219
Epoch: 36, step: 940, loss: 0.3239349126815796, mean loss: 0.34511072663580916
Epoch: 36, step: 941, loss: 0.33725589513778687, mean loss: 0.3451105782242251
Epoch: 36, step: 942, loss: 0.34230974316596985, mean loss: 0.3451105253053924
Epoch: 36, step: 943, loss: 0.32365795969963074, mean loss: 0.3451101199893856
Epoch: 36, step: 944, loss: 0.3125416040420532, mean loss: 0.34510950466478196
Epoch: 36, step: 945, loss: 0.3164723217487335, mean loss: 0.34510896362599647
Epoch: 36, step: 946, loss: 0.3037834167480469, mean loss: 0.3451081828822569
Epoch: 36, step: 947, loss: 0.36760321259498596, mean loss: 0.3451086078620369
Epoch: 36, step: 948, loss: 0.32202890515327454, mean loss: 0.3451081718447564
Epoch: 36, step: 949, loss: 0.33742284774780273, mean loss: 0.34510802665784257
Epoch: 36, step: 950, loss: 0.3352055847644806, mean loss: 0.34510783958989333
Epoch: 36, step: 951, loss: 0.3291454017162323, mean loss: 0.3451075380476938
Epoch: 36, step: 952, loss: 0.33397650718688965, mean loss: 0.3451073277783007
Epoch: 36, step: 953, loss: 0.36457768082618713, mean loss: 0.3451076955737038
Epoch: 36, step: 954, loss: 0.3313475549221039, mean loss: 0.34510743564925017
Epoch: 36, step: 955, loss: 0.3139105439186096, mean loss: 0.3451068463615333
Epoch: 36, step: 956, loss: 0.33807721734046936, mean loss: 0.3451067135792092
Epoch: 36, step: 957, loss: 0.3351401090621948, mean loss: 0.3451065253240523
Epoch: 36, step: 958, loss: 0.3281894624233246, mean loss: 0.34510620579053697
Epoch: 36, step: 959, loss: 0.41258352994918823, mean loss: 0.345107480294242
Epoch: 36, step: 960, loss: 0.4143596589565277, mean loss: 0.3451087882964832
Epoch: 36, step: 961, loss: 0.3693666458129883, mean loss: 0.3451092464587149
Epoch: 36, step: 962, loss: 0.3061318099498749, mean loss: 0.345108510299225
Epoch: 36, step: 963, loss: 0.33444681763648987, mean loss: 0.3451083089376502
Epoch: 36, step: 964, loss: 0.3279505670070648, mean loss: 0.3451079848948556
Epoch: 36, step: 965, loss: 0.3550054132938385, mean loss: 0.34510817181512754
Epoch: 36, step: 966, loss: 0.3311874270439148, mean loss: 0.3451079089165086
Epoch: 36, step: 967, loss: 0.30469605326652527, mean loss: 0.34510714573748513
Epoch: 36, step: 968, loss: 0.31571733951568604, mean loss: 0.3451065907206547
Epoch: 36, step: 969, loss: 0.33223235607147217, mean loss: 0.3451063475995562
Epoch: 36, step: 970, loss: 0.3635692596435547, mean loss: 0.34510669625241325
Epoch: 36, step: 971, loss: 0.3628237247467041, mean loss: 0.34510703081371874
Epoch: 36, step: 972, loss: 0.31106749176979065, mean loss: 0.3451063880367668
Epoch: 36, step: 973, loss: 0.3300803601741791, mean loss: 0.3451061043019607
Epoch: 36, step: 974, loss: 0.3178887367248535, mean loss: 0.3451055903691527
Epoch: 36, step: 975, loss: 0.34894275665283203, mean loss: 0.3451056628231989
Epoch: 36, step: 976, loss: 0.332977831363678, mean loss: 0.34510543382768405
Epoch: 36, step: 977, loss: 0.30357542634010315, mean loss: 0.3451046496804183
Epoch: 36, step: 978, loss: 0.377774178981781, mean loss: 0.3451052665172535
Epoch: 36, step: 979, loss: 0.33690792322158813, mean loss: 0.3451051117452707
Epoch: 36, step: 980, loss: 0.33808064460754395, mean loss: 0.34510497912057253
Epoch: 36, step: 981, loss: 0.32169678807258606, mean loss: 0.345104537173077
Epoch: 36, step: 982, loss: 0.34823209047317505, mean loss: 0.34510459622028183
Epoch: 36, step: 983, loss: 0.354599267244339, mean loss: 0.34510477547324636
Epoch: 36, step: 984, loss: 0.33725881576538086, mean loss: 0.3451046273496324
Epoch: 36, step: 985, loss: 0.322607159614563, mean loss: 0.345104202628701
Epoch: 36, step: 986, loss: 0.37460651993751526, mean loss: 0.34510475958094483
Epoch: 36, step: 987, loss: 0.30055689811706543, mean loss: 0.3451039186109708
Epoch: 36, step: 988, loss: 0.3146900236606598, mean loss: 0.34510334447141006
Epoch: 36, step: 989, loss: 0.320383220911026, mean loss: 0.34510287782506355
Epoch: 36, step: 990, loss: 0.2936541736125946, mean loss: 0.34510190663668766
Epoch: 36, step: 991, loss: 0.32160380482673645, mean loss: 0.3451014630754182
Epoch: 36, step: 992, loss: 0.3139589726924896, mean loss: 0.3451008752261557
Epoch: 36, step: 993, loss: 0.30754679441452026, mean loss: 0.34510016636434865
Epoch: 36, step: 994, loss: 0.3159446120262146, mean loss: 0.34509961604149736
Epoch: 36, step: 995, loss: 0.3424718677997589, mean loss: 0.3450995664426253
Epoch: 36, step: 996, loss: 0.3260907828807831, mean loss: 0.3450992076577107
Epoch: 36, step: 997, loss: 0.30795496702194214, mean loss: 0.3450985065848815
Epoch: 36, step: 998, loss: 0.3298863470554352, mean loss: 0.3450982194709104
Epoch: 36, step: 999, loss: 0.3200269937515259, mean loss: 0.34509774628606743
Epoch: 36, step: 1000, loss: 0.31403830647468567, mean loss: 0.34509716009299746
Epoch: 36, step: 1001, loss: 0.3378256559371948, mean loss: 0.34509702285855526
Epoch: 36, step: 1002, loss: 0.37867099046707153, mean loss: 0.34509765648506
Epoch: 36, step: 1003, loss: 0.32963308691978455, mean loss: 0.34509736463464924
Epoch: 36, step: 1004, loss: 0.36128002405166626, mean loss: 0.34509767003123
Epoch: 36, step: 1005, loss: 0.30295583605766296, mean loss: 0.34509687475223444
Epoch: 36, step: 1006, loss: 0.30845531821250916, mean loss: 0.34509618328469205
Epoch: 36, step: 1007, loss: 0.3259575366973877, mean loss: 0.34509582212363776
Epoch: 36, step: 1008, loss: 0.33504387736320496, mean loss: 0.34509563243925
Epoch: 36, step: 1009, loss: 0.3058571517467499, mean loss: 0.34509489200673515
Epoch: 36, step: 1010, loss: 0.3317606747150421, mean loss: 0.3450946403939926
Epoch: 36, step: 1011, loss: 0.3197515904903412, mean loss: 0.34509416218714867
Epoch: 36, step: 1012, loss: 0.2986220419406891, mean loss: 0.34509328530505634
Epoch: 36, step: 1013, loss: 0.3364863693714142, mean loss: 0.34509312290428773
Epoch: 36, step: 1014, loss: 0.31539231538772583, mean loss: 0.3450925625011194
Epoch: 36, step: 1015, loss: 0.3303006589412689, mean loss: 0.34509228340859943
Epoch: 36, step: 1016, loss: 0.30204930901527405, mean loss: 0.34509147129233003
Epoch: 36, step: 1017, loss: 0.3080453872680664, mean loss: 0.3450907723359883
Epoch: 36, step: 1018, loss: 0.3250555098056793, mean loss: 0.3450903943335633
Epoch: 36, step: 1019, loss: 0.31097903847694397, mean loss: 0.34508975077164616
Epoch: 36, step: 1020, loss: 0.3252246081829071, mean loss: 0.34508937599299155
Epoch: 36, step: 1021, loss: 0.36814308166503906, mean loss: 0.34508981091933333
Epoch: 36, step: 1022, loss: 0.3526446521282196, mean loss: 0.34508995344468296
Epoch: 36, step: 1023, loss: 0.39351582527160645, mean loss: 0.3450908670024823
Epoch: 36, step: 1024, loss: 0.34671029448509216, mean loss: 0.3450908975525301
Epoch: 36, step: 1025, loss: 0.3633291721343994, mean loss: 0.3450912416060027
Epoch: 36, step: 1026, loss: 0.33688127994537354, mean loss: 0.3450910867332091
Epoch: 36, step: 1027, loss: 0.3187274634838104, mean loss: 0.34509058941895476
Epoch: 36, step: 1028, loss: 0.3008642792701721, mean loss: 0.3450897551649011
Epoch: 36, step: 1029, loss: 0.3427017033100128, mean loss: 0.3450897101192178
Epoch: 36, step: 1030, loss: 0.3186914026737213, mean loss: 0.34508921217887173
Epoch: 36, step: 1031, loss: 0.33855143189430237, mean loss: 0.34508908886175454
Epoch: 36, step: 1032, loss: 0.34502050280570984, mean loss: 0.345089087568093
Epoch: 36, step: 1033, loss: 0.3301391899585724, mean loss: 0.34508880559031924
Epoch: 36, step: 1034, loss: 0.30504322052001953, mean loss: 0.3450880502840126
Epoch: 36, step: 1035, loss: 0.333855003118515, mean loss: 0.3450878384196753
Epoch: 36, step: 1036, loss: 0.3575298488140106, mean loss: 0.3450880730816091
Epoch: 36, step: 1037, loss: 0.3099213242530823, mean loss: 0.3450874098333569
Epoch: 36, step: 1038, loss: 0.3355393707752228, mean loss: 0.34508722975982165
Epoch: 36, step: 1039, loss: 0.3038853108882904, mean loss: 0.3450864527169944
Epoch: 36, step: 1040, loss: 0.34747907519340515, mean loss: 0.3450864978395305
Epoch: 36, step: 1041, loss: 0.3569546341896057, mean loss: 0.3450867216568343
Epoch: 36, step: 1042, loss: 0.34317052364349365, mean loss: 0.3450866855205638
Epoch: 36, step: 1043, loss: 0.3293280601501465, mean loss: 0.34508638834500804
Epoch: 36, step: 1044, loss: 0.3765646815299988, mean loss: 0.34508698195026527
Epoch: 36, step: 1045, loss: 0.3495164215564728, mean loss: 0.345087065477318
Epoch: 36, step: 1046, loss: 0.3167371451854706, mean loss: 0.3450865308858471
Epoch: 36, step: 1047, loss: 0.3124375343322754, mean loss: 0.34508591523875565
Epoch: 36, step: 1048, loss: 0.30383896827697754, mean loss: 0.34508513747873903
Epoch: 36, step: 1049, loss: 0.3300422430038452, mean loss: 0.34508485383250315
Epoch: 36, step: 1050, loss: 0.32499030232429504, mean loss: 0.34508447494023375
Epoch: 36, step: 1051, loss: 0.33180177211761475, mean loss: 0.3450842244933143
Epoch: 36, step: 1052, loss: 0.32952603697776794, mean loss: 0.3450839311473951
Epoch: 36, step: 1053, loss: 0.3253307640552521, mean loss: 0.34508355871315755
Epoch: 36, step: 1054, loss: 0.35735946893692017, mean loss: 0.3450837901637924
Epoch: 36, step: 1055, loss: 0.42602527141571045, mean loss: 0.345085316209819
Epoch: 36, step: 1056, loss: 0.32047685980796814, mean loss: 0.3450848522582268
Epoch: 36, step: 1057, loss: 0.30834466218948364, mean loss: 0.3450841595959956
Epoch: 36, step: 1058, loss: 0.34732121229171753, mean loss: 0.3450842017703201
Epoch: 36, step: 1059, loss: 0.3522832989692688, mean loss: 0.3450843374896701
Epoch: 36, step: 1060, loss: 0.3256491422653198, mean loss: 0.3450839710989599
Epoch: 36, step: 1061, loss: 0.3149740695953369, mean loss: 0.34508340348026095
Epoch: 36, step: 1062, loss: 0.3805679678916931, mean loss: 0.3450840724071449
Epoch: 36, step: 1063, loss: 0.3602883815765381, mean loss: 0.3450843590213277
Epoch: 36, step: 1064, loss: 0.3251476585865021, mean loss: 0.34508398320462175
Epoch: 36, step: 1065, loss: 0.33500534296035767, mean loss: 0.34508379322082827
Epoch: 36, step: 1066, loss: 0.31452417373657227, mean loss: 0.34508321717853907
Epoch: 36, step: 1067, loss: 0.38191646337509155, mean loss: 0.3450839114642624
Epoch: 36, step: 1068, loss: 0.33556368947029114, mean loss: 0.34508373201687975
Epoch: 36, step: 1069, loss: 0.3202638030052185, mean loss: 0.34508326419298313
Epoch: 36, step: 1070, loss: 0.3133738040924072, mean loss: 0.3450826665215082
Epoch: 36, step: 1071, loss: 0.3469524383544922, mean loss: 0.3450827017629858
Epoch: 36, step: 1072, loss: 0.36656516790390015, mean loss: 0.34508310665708347
Epoch: 36, step: 1073, loss: 0.3339990973472595, mean loss: 0.34508289775344386
Epoch: 36, step: 1074, loss: 0.30853521823883057, mean loss: 0.34508220894137587
Epoch: 36, step: 1075, loss: 0.3323252499103546, mean loss: 0.3450819685162151
Epoch: 36, step: 1076, loss: 0.3545953035354614, mean loss: 0.345082147806749
Epoch: 36, step: 1077, loss: 0.30732059478759766, mean loss: 0.3450814361571124
Epoch: 36, step: 1078, loss: 0.38664036989212036, mean loss: 0.3450822193569642
Epoch: 36, step: 1079, loss: 0.3188212811946869, mean loss: 0.3450817244651701
Epoch: 36, step: 1080, loss: 0.31028321385383606, mean loss: 0.34508106869374616
Epoch: 36, step: 1081, loss: 0.3328927457332611, mean loss: 0.34508083901140796
Epoch: 36, step: 1082, loss: 0.3609848916530609, mean loss: 0.3450811387090099
Epoch: 36, step: 1083, loss: 0.3409704267978668, mean loss: 0.34508106124779203
Epoch: 36, step: 1084, loss: 0.3084182143211365, mean loss: 0.34508037039537487
Epoch: 36, step: 1085, loss: 0.37110981345176697, mean loss: 0.3450808608691464
Epoch: 36, step: 1086, loss: 0.343867689371109, mean loss: 0.3450808380097411
Epoch: 36, step: 1087, loss: 0.30828961730003357, mean loss: 0.34508014477751486
Epoch: 36, step: 1088, loss: 0.30283644795417786, mean loss: 0.34507934882294616
Epoch: 36, step: 1089, loss: 0.33314087986946106, mean loss: 0.3450791238828822
Epoch: 36, step: 1090, loss: 0.32114872336387634, mean loss: 0.3450786730039275
Epoch: 36, step: 1091, loss: 0.3208637237548828, mean loss: 0.34507821677231154
Epoch: 36, step: 1092, loss: 0.3642862141132355, mean loss: 0.34507857866159203
Epoch: 36, step: 1093, loss: 0.3124164342880249, mean loss: 0.34507796330034307
Epoch: 36, step: 1094, loss: 0.31956955790519714, mean loss: 0.345077482726003
Epoch: 36, step: 1095, loss: 0.34190383553504944, mean loss: 0.3450774229361162
Epoch: 36, step: 1096, loss: 0.3556804656982422, mean loss: 0.34507762268824527
Epoch: 36, step: 1097, loss: 0.33431103825569153, mean loss: 0.3450774198589541
Epoch: 36, step: 1098, loss: 0.3166965842247009, mean loss: 0.34507688520877167
Epoch: 36, step: 1099, loss: 0.30173006653785706, mean loss: 0.34507606863845536
Epoch: 36, step: 1100, loss: 0.3112500011920929, mean loss: 0.3450754314327015
Epoch: 36, step: 1101, loss: 0.3315991461277008, mean loss: 0.3450751775750873
Epoch: 36, step: 1102, loss: 0.3051179051399231, mean loss: 0.3450744248998102
Epoch: 36, step: 1103, loss: 0.3560210168361664, mean loss: 0.3450746310969157
Epoch: 36, step: 1104, loss: 0.3617485463619232, mean loss: 0.34507494517168197
Epoch: 36, step: 1105, loss: 0.3376997709274292, mean loss: 0.34507480625335
Epoch: 36, step: 1106, loss: 0.32198163866996765, mean loss: 0.34507437128004786
Epoch: 36, step: 1107, loss: 0.427165150642395, mean loss: 0.34507591747870986
Epoch: 36, step: 1108, loss: 0.3372919261455536, mean loss: 0.3450757708682088
Epoch: 36, step: 1109, loss: 0.3069935739040375, mean loss: 0.3450750536083119
Epoch: 36, step: 1110, loss: 0.3302561938762665, mean loss: 0.34507477450746
Epoch: 36, step: 1111, loss: 0.34648388624191284, mean loss: 0.3450748010464033
Epoch: 36, step: 1112, loss: 0.32097116112709045, mean loss: 0.3450743470915675
Epoch: 36, step: 1113, loss: 0.32437753677368164, mean loss: 0.3450739573064472
Epoch: 36, step: 1114, loss: 0.3461203873157501, mean loss: 0.34507397701359815
Epoch: 36, step: 1115, loss: 0.31209173798561096, mean loss: 0.34507335587915317
Epoch: 36, step: 1116, loss: 0.3516988158226013, mean loss: 0.3450734806500604
Epoch: 36, step: 1117, loss: 0.36311107873916626, mean loss: 0.34507382032837924
Epoch: 36, step: 1118, loss: 0.30267852544784546, mean loss: 0.3450730219686843
Epoch: 36, step: 1119, loss: 0.2964867353439331, mean loss: 0.3450721070416237
Epoch: 36, step: 1120, loss: 0.31981775164604187, mean loss: 0.3450716314864896
Epoch: 36, step: 1121, loss: 0.32991355657577515, mean loss: 0.3450713460559373
Epoch: 36, step: 1122, loss: 0.32454782724380493, mean loss: 0.34507095959993694
Epoch: 36, step: 1123, loss: 0.3376724123954773, mean loss: 0.3450708202885864
Epoch: 36, step: 1124, loss: 0.31103894114494324, mean loss: 0.3450701794955166
Epoch: 36, step: 1125, loss: 0.31988993287086487, mean loss: 0.3450697053805359
Epoch: 36, step: 1126, loss: 0.28757062554359436, mean loss: 0.345068622759613
Epoch: 36, step: 1127, loss: 0.30558475852012634, mean loss: 0.34506787935201694
Epoch: 36, step: 1128, loss: 0.34079691767692566, mean loss: 0.3450677989392804
Epoch: 36, step: 1129, loss: 0.3378411829471588, mean loss: 0.34506766288068963
Epoch: 36, step: 1130, loss: 0.33873024582862854, mean loss: 0.34506754356567404
Epoch: 36, step: 1131, loss: 0.3532993197441101, mean loss: 0.34506769854301
Epoch: 36, step: 1132, loss: 0.3312414288520813, mean loss: 0.34506743824461794
Epoch: 36, step: 1133, loss: 0.3377273678779602, mean loss: 0.3450673000603797
Epoch: 36, step: 1134, loss: 0.3729991912841797, mean loss: 0.3450678258965443
Epoch: 36, step: 1135, loss: 0.31948480010032654, mean loss: 0.34506734428837793
Epoch: 36, step: 1136, loss: 0.3526483476161957, mean loss: 0.34506748700036244
Epoch: 36, step: 1137, loss: 0.32181671261787415, mean loss: 0.3450670493140106
Epoch: 36, step: 1138, loss: 0.3734229803085327, mean loss: 0.3450675830928069
Epoch: 36, step: 1139, loss: 0.325390487909317, mean loss: 0.34506721269345475
Epoch: 36, step: 1140, loss: 0.2911289632320404, mean loss: 0.3450661973852296
Epoch: 36, step: 1141, loss: 0.35393422842025757, mean loss: 0.3450663643097305
Epoch: 36, step: 1142, loss: 0.3294782340526581, mean loss: 0.34506607089714825
Epoch: 36, step: 1143, loss: 0.30200573801994324, mean loss: 0.34506526039547536
Epoch: 36, step: 1144, loss: 0.3512992560863495, mean loss: 0.34506537773244184
Epoch: 36, step: 1145, loss: 0.32136866450309753, mean loss: 0.34506493171864117
Epoch: 36, step: 1146, loss: 0.3464707136154175, mean loss: 0.34506495817742977
Epoch: 36, step: 1147, loss: 0.32159364223480225, mean loss: 0.3450645164226315
Epoch: 36, step: 1148, loss: 0.3154110908508301, mean loss: 0.34506395832454606
Epoch: 36, step: 1149, loss: 0.33869239687919617, mean loss: 0.3450638384095868
Epoch: 36, step: 1150, loss: 0.30311548709869385, mean loss: 0.34506304894216777
Epoch: 36, step: 1151, loss: 0.37682732939720154, mean loss: 0.34506364673425705
Epoch: 36, step: 1152, loss: 0.3084964454174042, mean loss: 0.3450629585659126
Epoch: 36, step: 1153, loss: 0.3177584409713745, mean loss: 0.3450624447242627
Epoch: 36, step: 1154, loss: 0.311602920293808, mean loss: 0.34506181506385447
Epoch: 36, step: 1155, loss: 0.34055349230766296, mean loss: 0.3450617302252629
Epoch: 36, step: 1156, loss: 0.3398498296737671, mean loss: 0.345061632148438
Epoch: 36, step: 1157, loss: 0.33058151602745056, mean loss: 0.3450613596687398
Epoch: 36, step: 1158, loss: 0.367820143699646, mean loss: 0.34506178792427733
Epoch: 36, step: 1159, loss: 0.31641921401023865, mean loss: 0.34506124896270285
Epoch: 36, step: 1160, loss: 0.37473350763320923, mean loss: 0.34506180728914315
Epoch: 36, step: 1161, loss: 0.33980390429496765, mean loss: 0.34506170835595923
Epoch: 36, step: 1162, loss: 0.33154094219207764, mean loss: 0.34506145395277255
Epoch: 36, step: 1163, loss: 0.3081519603729248, mean loss: 0.3450607594864976
Epoch: 36, step: 1164, loss: 0.3559410572052002, mean loss: 0.34506096419961957
Epoch: 36, step: 1165, loss: 0.286733478307724, mean loss: 0.34505986678690287
Epoch: 36, step: 1166, loss: 0.31254735589027405, mean loss: 0.3450592550860713
Epoch: 36, step: 1167, loss: 0.3747715950012207, mean loss: 0.3450598140930685
Epoch: 36, step: 1168, loss: 0.35448044538497925, mean loss: 0.34505999132918486
Epoch: 36, step: 1169, loss: 0.3022172749042511, mean loss: 0.3450591853180394
Epoch: 36, step: 1170, loss: 0.3216419517993927, mean loss: 0.34505874477183457
Epoch: 36, step: 1171, loss: 0.3102464973926544, mean loss: 0.34505808986462977
Epoch: 36, step: 1172, loss: 0.34145858883857727, mean loss: 0.3450580221501044
Epoch: 36, step: 1173, loss: 0.32930925488471985, mean loss: 0.3450577258867524
Epoch: 36, step: 1174, loss: 0.35723763704299927, mean loss: 0.34505795500903
Epoch: 36, step: 1175, loss: 0.34995540976524353, mean loss: 0.3450580471357184
Epoch: 36, step: 1176, loss: 0.31056883931159973, mean loss: 0.34505739836673693
Epoch: 36, step: 1177, loss: 0.2940663695335388, mean loss: 0.3450564392036348
Epoch: 36, step: 1178, loss: 0.3381354808807373, mean loss: 0.3450563090198919
Epoch: 36, step: 1179, loss: 0.36192646622657776, mean loss: 0.3450566263428399
Epoch: 36, step: 1180, loss: 0.34042420983314514, mean loss: 0.3450565392100174
Epoch: 36, step: 1181, loss: 0.3538688123226166, mean loss: 0.3450567049601794
Epoch: 36, step: 1182, loss: 0.3179318606853485, mean loss: 0.34505619477821925
Epoch: 36, step: 1183, loss: 0.3496535122394562, mean loss: 0.3450562812459717
Epoch: 36, step: 1184, loss: 0.31368783116340637, mean loss: 0.3450556912696682
Epoch: 36, step: 1185, loss: 0.33470746874809265, mean loss: 0.34505549664445617
Epoch: 36, step: 1186, loss: 0.34238654375076294, mean loss: 0.3450554464488064
Epoch: 36, step: 1187, loss: 0.3870505690574646, mean loss: 0.34505623624649334
Epoch: 36, step: 1188, loss: 0.3968586325645447, mean loss: 0.3450572104701843
Epoch: 36, step: 1189, loss: 0.33968695998191833, mean loss: 0.34505710947626833
Epoch: 36, step: 1190, loss: 0.33410167694091797, mean loss: 0.3450569034502686
Epoch: 36, step: 1191, loss: 0.3295096755027771, mean loss: 0.34505661107724417
Epoch: 36, step: 1192, loss: 0.3381653428077698, mean loss: 0.3450564814861001
Epoch: 36, step: 1193, loss: 0.3502025902271271, mean loss: 0.34505657825748565
Epoch: 36, step: 1194, loss: 0.3680794835090637, mean loss: 0.34505701118975685
Epoch: 36, step: 1195, loss: 0.2916688919067383, mean loss: 0.345056007276269
Epoch: 36, step: 1196, loss: 0.3066779673099518, mean loss: 0.3450552856268084
Epoch: 36, step: 1197, loss: 0.33210569620132446, mean loss: 0.34505504213108756
Epoch: 36, step: 1198, loss: 0.3253503143787384, mean loss: 0.34505467162307274
Epoch: 36, step: 1199, loss: 0.3517008125782013, mean loss: 0.3450547965881178
Epoch: 36, step: 1200, loss: 0.33594468235969543, mean loss: 0.34505462529707276
Epoch: 36, step: 1201, loss: 0.33278927206993103, mean loss: 0.3450543946846329
Epoch: 36, step: 1202, loss: 0.3525278568267822, mean loss: 0.34505453519758045
Epoch: 36, step: 1203, loss: 0.29984164237976074, mean loss: 0.34505368513943163
Epoch: 36, step: 1204, loss: 0.3257230818271637, mean loss: 0.34505332170708075
Epoch: 36, step: 1205, loss: 0.32402291893959045, mean loss: 0.345052926324438
Epoch: 36, step: 1206, loss: 0.3180461823940277, mean loss: 0.34505241859298097
Epoch: 36, step: 1207, loss: 0.28739893436431885, mean loss: 0.3450513347178827
Epoch: 36, step: 1208, loss: 0.32312214374542236, mean loss: 0.3450509224608005
Epoch: 36, step: 1209, loss: 0.32506999373435974, mean loss: 0.34505054683706987
Epoch: 36, step: 1210, loss: 0.3464347720146179, mean loss: 0.34505057285878576
Epoch: 36, step: 1211, loss: 0.38447991013526917, mean loss: 0.3450513140674721
Epoch: 36, step: 1212, loss: 0.3111046254634857, mean loss: 0.34505067593583677
Epoch: 36, step: 1213, loss: 0.41845569014549255, mean loss: 0.34505205578121084
Epoch: 36, step: 1214, loss: 0.31970787048339844, mean loss: 0.3450515793777954
Epoch: 36, step: 1215, loss: 0.325289249420166, mean loss: 0.34505120790542776
Epoch: 36, step: 1216, loss: 0.3108707666397095, mean loss: 0.34505056542800694
Epoch: 36, step: 1217, loss: 0.3932584524154663, mean loss: 0.34505147155723115
Epoch: 36, step: 1218, loss: 0.3352258503437042, mean loss: 0.34505128687551745
Epoch: 36, step: 1219, loss: 0.32269713282585144, mean loss: 0.3450508667162428
Epoch: 36, step: 1220, loss: 0.32560816407203674, mean loss: 0.3450505012862523
Epoch: 36, step: 1221, loss: 0.31048232316970825, mean loss: 0.3450498515817431
Epoch: 36, step: 1222, loss: 0.35617706179618835, mean loss: 0.3450500607123127
Epoch: 36, step: 1223, loss: 0.3510412275791168, mean loss: 0.34505017331129906
Epoch: 36, step: 1224, loss: 0.3065488040447235, mean loss: 0.34504944972376184
Epoch: 36, step: 1225, loss: 0.3104906678199768, mean loss: 0.34504880024468076
Epoch: 36, step: 1226, loss: 0.2928360402584076, mean loss: 0.3450478190047118
Epoch: 36, step: 1227, loss: 0.3486573398113251, mean loss: 0.34504788683754667
Epoch: 36, step: 1228, loss: 0.35909217596054077, mean loss: 0.3450481507634505
Epoch: 36, step: 1229, loss: 0.32412928342819214, mean loss: 0.3450477576551081
Epoch: 36, step: 1230, loss: 0.3003186583518982, mean loss: 0.3450469171195579
Epoch: 36, step: 1231, loss: 0.3080124258995056, mean loss: 0.3450462211918065
Epoch: 36, step: 1232, loss: 0.32190194725990295, mean loss: 0.34504578628803645
Epoch: 36, step: 1233, loss: 0.351619154214859, mean loss: 0.34504590980579225
Epoch: 36, step: 1234, loss: 0.32410797476768494, mean loss: 0.3450455163760954
Epoch: 36, step: 1235, loss: 0.3427172303199768, mean loss: 0.34504547262776664
Epoch: 36, step: 1236, loss: 0.33901989459991455, mean loss: 0.3450453594097131
Epoch: 36, step: 1237, loss: 0.2993600070476532, mean loss: 0.3450445010174625
Epoch: 36, step: 1238, loss: 0.32411274313926697, mean loss: 0.34504410773339583
Epoch: 36, step: 1239, loss: 0.30707019567489624, mean loss: 0.34504339425992414
Epoch: 36, step: 1240, loss: 0.3495415449142456, mean loss: 0.3450434787719139
Epoch: 36, step: 1241, loss: 0.28833097219467163, mean loss: 0.3450424132680891
Epoch: 36, step: 1242, loss: 0.3254295289516449, mean loss: 0.3450420447918587
Epoch: 36, step: 1243, loss: 0.32236382365226746, mean loss: 0.34504161873374756
Epoch: 36, step: 1244, loss: 0.3047546446323395, mean loss: 0.3450408618723731
Epoch: 36, step: 1245, loss: 0.3202005922794342, mean loss: 0.34504039521316604
Epoch: 36, step: 1246, loss: 0.3304211497306824, mean loss: 0.34504012057535194
Epoch: 36, step: 1247, loss: 0.31031185388565063, mean loss: 0.34503946818080183
Epoch: 36, step: 1248, loss: 0.3231118619441986, mean loss: 0.34503905626326503
Epoch: 36, step: 1249, loss: 0.2899948060512543, mean loss: 0.3450380222577383
Epoch: 36, step: 1250, loss: 0.33046674728393555, mean loss: 0.3450377485416685
Epoch: 36, step: 1251, loss: 0.365591436624527, mean loss: 0.3450381346279275
Epoch: 36, step: 1252, loss: 0.3446688652038574, mean loss: 0.34503812769159703
Epoch: 36, step: 1253, loss: 0.29788991808891296, mean loss: 0.3450372420796356
Epoch: 36, step: 1254, loss: 0.3209632933139801, mean loss: 0.3450367898932917
Epoch: 36, step: 1255, loss: 0.3323347270488739, mean loss: 0.34503655131209626
Epoch: 36, step: 1256, loss: 0.31326043605804443, mean loss: 0.3450359544766639
Epoch: 36, step: 1257, loss: 0.30889031291007996, mean loss: 0.3450352755832796
Epoch: 36, step: 1258, loss: 0.36861929297447205, mean loss: 0.34503571853385323
Epoch: 36, step: 1259, loss: 0.3185526430606842, mean loss: 0.3450352211430585
Epoch: 36, step: 1260, loss: 0.3180004358291626, mean loss: 0.34503471339988423
Epoch: 36, step: 1261, loss: 0.3500511050224304, mean loss: 0.3450348076114987
Epoch: 36, step: 1262, loss: 0.32844266295433044, mean loss: 0.3450344960043723
Epoch: 36, step: 1263, loss: 0.37447452545166016, mean loss: 0.34503504888954073
Epoch: 36, step: 1264, loss: 0.32623112201690674, mean loss: 0.3450346957575219
Epoch: 36, step: 1265, loss: 0.346447616815567, mean loss: 0.34503472229125065
Epoch: 36, step: 1266, loss: 0.36899712681770325, mean loss: 0.3450351722810072
Epoch: 36, step: 1267, loss: 0.3309306204319, mean loss: 0.34503490741674203
Epoch: 36, step: 1268, loss: 0.3659498691558838, mean loss: 0.34503530016385
Epoch: 36, step: 1269, loss: 0.31710487604141235, mean loss: 0.3450347756882402
Epoch: 36, step: 1270, loss: 0.3185916244983673, mean loss: 0.3450342791498647
Epoch: 36, step: 1271, loss: 0.3161751925945282, mean loss: 0.34503373725624603
Epoch: 36, step: 1272, loss: 0.33203086256980896, mean loss: 0.3450334931029012
Epoch: 36, step: 1273, loss: 0.3293667733669281, mean loss: 0.34503319893639595
Epoch: 36, step: 1274, loss: 0.36107346415519714, mean loss: 0.3450335001111311
Epoch: 36, step: 1275, loss: 0.32927584648132324, mean loss: 0.3450332042483142
Epoch: 36, step: 1276, loss: 0.3423250615596771, mean loss: 0.345033153401678
Epoch: 36, step: 1277, loss: 0.3818681538105011, mean loss: 0.3450338449829256
Epoch: 36, step: 1278, loss: 0.32468900084495544, mean loss: 0.3450334630133757
Epoch: 36, step: 1279, loss: 0.3021562993526459, mean loss: 0.3450326580200657
Epoch: 36, step: 1280, loss: 0.32492053508758545, mean loss: 0.34503228043397854
Epoch: 36, step: 1281, loss: 0.35058924555778503, mean loss: 0.34503238475878467
Epoch: 36, step: 1282, loss: 0.300633043050766, mean loss: 0.34503155123443174
Epoch: 36, step: 1283, loss: 0.3346148431301117, mean loss: 0.3450313556816026
Epoch: 36, step: 1284, loss: 0.3841697871685028, mean loss: 0.3450320904134633
Epoch: 36, step: 1285, loss: 0.30682891607284546, mean loss: 0.34503137325231553
Epoch: 36, step: 1286, loss: 0.35857272148132324, mean loss: 0.345031627449688
Epoch: 36, step: 1287, loss: 0.3217921257019043, mean loss: 0.34503119120735154
Epoch: 36, step: 1288, loss: 0.3031003177165985, mean loss: 0.3450304041130732
Epoch: 36, step: 1289, loss: 0.34730595350265503, mean loss: 0.3450304468271436
Epoch: 36, step: 1290, loss: 0.3349660336971283, mean loss: 0.34503025791277236
Epoch: 36, step: 1291, loss: 0.30519869923591614, mean loss: 0.3450295102673283
Epoch: 36, step: 1292, loss: 0.3320606052875519, mean loss: 0.34502926684324325
Epoch: 36, step: 1293, loss: 0.30643168091773987, mean loss: 0.3450285423868837
Epoch: 36, step: 1294, loss: 0.35183578729629517, mean loss: 0.34502867015288735
Epoch: 36, step: 1295, loss: 0.35427799820899963, mean loss: 0.3450288437513869
Epoch: 36, step: 1296, loss: 0.33121737837791443, mean loss: 0.3450285845320522
Epoch: 36, step: 1297, loss: 0.33922725915908813, mean loss: 0.3450284756524048
Epoch: 36, step: 1298, loss: 0.316328227519989, mean loss: 0.3450279370144127
Epoch: 36, step: 1299, loss: 0.3033599853515625, mean loss: 0.3450271550169714
Epoch: 36, step: 1300, loss: 0.3746240735054016, mean loss: 0.34502771046256564
Epoch: 36, step: 1301, loss: 0.34865108132362366, mean loss: 0.345027778461118
Epoch: 36, step: 1302, loss: 0.2991238832473755, mean loss: 0.3450269170147012
Epoch: 36, step: 1303, loss: 0.3229770362377167, mean loss: 0.34502650322771766
Epoch: 36, step: 1304, loss: 0.3372556269168854, mean loss: 0.3450263574025697
Epoch: 36, step: 1305, loss: 0.3179283142089844, mean loss: 0.3450258489011024
Epoch: 36, step: 1306, loss: 0.31915220618247986, mean loss: 0.34502536338492296
Epoch: 36, step: 1307, loss: 0.3079979419708252, mean loss: 0.3450246685822994
Epoch: 36, step: 1308, loss: 0.2868088483810425, mean loss: 0.34502357620956375
Epoch: 36, step: 1309, loss: 0.3004997968673706, mean loss: 0.3450227407725663
Epoch: 36, step: 1310, loss: 0.3603350818157196, mean loss: 0.345023028085467
Epoch: 36, step: 1311, loss: 0.28813496232032776, mean loss: 0.345021960687055
Epoch: 36, step: 1312, loss: 0.3255811333656311, mean loss: 0.3450215959230472
Epoch: 36, step: 1313, loss: 0.3779817521572113, mean loss: 0.345022214335675
Epoch: 36, step: 1314, loss: 0.29919254779815674, mean loss: 0.34502135447589266
Epoch: 36, step: 1315, loss: 0.323392778635025, mean loss: 0.34502094868647726
Epoch: 36, step: 1316, loss: 0.35917046666145325, mean loss: 0.34502121415087705
Epoch: 36, step: 1317, loss: 0.3537931442260742, mean loss: 0.34502137872125105
Epoch: 36, step: 1318, loss: 0.3588767349720001, mean loss: 0.34502163865701924
Epoch: 36, step: 1319, loss: 0.3491174280643463, mean loss: 0.34502171549533167
Epoch: 36, step: 1320, loss: 0.33079928159713745, mean loss: 0.345021448682952
Epoch: 36, step: 1321, loss: 0.3678608238697052, mean loss: 0.3450218771408214
Epoch: 36, step: 1322, loss: 0.33453652262687683, mean loss: 0.34502168044330483
Epoch: 36, step: 1323, loss: 0.33751168847084045, mean loss: 0.3450215395640377
Epoch: 36, step: 1324, loss: 0.33355212211608887, mean loss: 0.3450213244142985
Epoch: 36, step: 1325, loss: 0.4690769612789154, mean loss: 0.345023651475579
Epoch: 36, step: 1326, loss: 0.32025834918022156, mean loss: 0.3450231869316332
Epoch: 36, step: 1327, loss: 0.3297814130783081, mean loss: 0.3450229010340144
Epoch: 36, step: 1328, loss: 0.32799220085144043, mean loss: 0.34502258158659665
Epoch: 36, step: 1329, loss: 0.3168063461780548, mean loss: 0.34502205234033095
Epoch: 36, step: 1330, loss: 0.31286823749542236, mean loss: 0.34502144924899
Epoch: 36, step: 1331, loss: 0.353880912065506, mean loss: 0.3450216154179227
Epoch: 36, step: 1332, loss: 0.29831501841545105, mean loss: 0.3450207394009487
Epoch: 36, step: 1333, loss: 0.32678502798080444, mean loss: 0.3450203973830294
Epoch: 36, step: 1334, loss: 0.3242422640323639, mean loss: 0.34502000768829866
Epoch: 36, step: 1335, loss: 0.3456510901451111, mean loss: 0.34502001952405364
Epoch: 36, step: 1336, loss: 0.32329821586608887, mean loss: 0.3450196121460289
Epoch: 36, step: 1337, loss: 0.3297814726829529, mean loss: 0.34501932637018656
Epoch: 36, step: 1338, loss: 0.31133803725242615, mean loss: 0.3450186947236341
Epoch: 36, step: 1339, loss: 0.2971230447292328, mean loss: 0.3450177965230116
Epoch: 36, step: 1340, loss: 0.3150862157344818, mean loss: 0.34501723521816796
Epoch: 36, step: 1341, loss: 0.33713674545288086, mean loss: 0.34501708743866516
Epoch: 36, step: 1342, loss: 0.36082229018211365, mean loss: 0.34501738382141206
Epoch: 36, step: 1343, loss: 0.34436318278312683, mean loss: 0.3450173715539158
Epoch: 36, step: 1344, loss: 0.28491416573524475, mean loss: 0.3450162445272358
Epoch: 36, step: 1345, loss: 0.3443557918071747, mean loss: 0.3450162321429733
Epoch: 36, step: 1346, loss: 0.32183602452278137, mean loss: 0.34501579749506456
Epoch: 36, step: 1347, loss: 0.3923425078392029, mean loss: 0.34501668489306847
Epoch: 36, step: 1348, loss: 0.3409327566623688, mean loss: 0.34501660831893555
Epoch: 36, step: 1349, loss: 0.30482304096221924, mean loss: 0.34501585469896784
Epoch: 36, step: 1350, loss: 0.3503510057926178, mean loss: 0.34501595472992486
Epoch: 36, step: 1351, loss: 0.31305041909217834, mean loss: 0.34501535540609785
Epoch: 36, step: 1352, loss: 0.356240451335907, mean loss: 0.3450155658621777
Epoch: 36, step: 1353, loss: 0.3488735854625702, mean loss: 0.34501563819371617
Epoch: 36, step: 1354, loss: 0.33839282393455505, mean loss: 0.34501551402914127
Epoch: 36, step: 1355, loss: 0.3367384374141693, mean loss: 0.3450153588533517
Epoch: 36, step: 1356, loss: 0.3535347878932953, mean loss: 0.345015518569687
Epoch: 36, step: 1357, loss: 0.3010779619216919, mean loss: 0.3450146948743503
Epoch: 36, step: 1358, loss: 0.3221990764141083, mean loss: 0.3450142671590276
Epoch: 36, step: 1359, loss: 0.33646559715270996, mean loss: 0.3450141069035161
Epoch: 36, step: 1360, loss: 0.3770390748977661, mean loss: 0.3450147072403423
Epoch: 36, step: 1361, loss: 0.35545283555984497, mean loss: 0.345014902908777
Epoch: 36, step: 1362, loss: 0.28311046957969666, mean loss: 0.34501374249800737
Epoch: 36, step: 1363, loss: 0.33224204182624817, mean loss: 0.3450135030944558
Epoch: 36, step: 1364, loss: 0.30290716886520386, mean loss: 0.3450127138325347
Epoch: 36, step: 1365, loss: 0.3538930118083954, mean loss: 0.345012880286105
Epoch: 36, step: 1366, loss: 0.29972532391548157, mean loss: 0.3450120314256081
Epoch: 36, step: 1367, loss: 0.322988897562027, mean loss: 0.3450116186363244
Epoch: 36, step: 1368, loss: 0.37971529364585876, mean loss: 0.3450122690903759
Epoch: 36, step: 1369, loss: 0.32212379574775696, mean loss: 0.3450118400977354
Epoch: 36, step: 1370, loss: 0.32776254415512085, mean loss: 0.3450115168047742
Epoch: 36, step: 1371, loss: 0.35130545496940613, mean loss: 0.3450116347659813
Epoch: 36, step: 1372, loss: 0.36021023988723755, mean loss: 0.34501191961342625
Epoch: 36, step: 1373, loss: 0.3185688555240631, mean loss: 0.34501142403517954
Epoch: 36, step: 1374, loss: 0.33585378527641296, mean loss: 0.34501125241204644
Epoch: 36, step: 1375, loss: 0.3069842457771301, mean loss: 0.3450105397619971
Epoch: 36, step: 1376, loss: 0.30425751209259033, mean loss: 0.34500977603890964
Epoch: 36, step: 1377, loss: 0.3365422189235687, mean loss: 0.34500961735750496
Epoch: 36, step: 1378, loss: 0.30218586325645447, mean loss: 0.34500881485850565
Epoch: 36, step: 1379, loss: 0.31347963213920593, mean loss: 0.3450082240260583
Epoch: 36, step: 1380, loss: 0.30290958285331726, mean loss: 0.3450074351449345
Epoch: 36, step: 1381, loss: 0.3263261914253235, mean loss: 0.34500708508602584
Epoch: 36, step: 1382, loss: 0.31368184089660645, mean loss: 0.34500649810822703
Epoch: 36, step: 1383, loss: 0.325560599565506, mean loss: 0.3450061337344723
Epoch: 36, step: 1384, loss: 0.3303202986717224, mean loss: 0.34500585855908844
Epoch: 36, step: 1385, loss: 0.31656986474990845, mean loss: 0.3450053257505104
Epoch: 36, step: 1386, loss: 0.3731880486011505, mean loss: 0.34500585380362636
Epoch: 36, step: 1387, loss: 0.29699620604515076, mean loss: 0.3450049542748892
Epoch: 36, step: 1388, loss: 0.37444978952407837, mean loss: 0.3450055059552379
Epoch: 36, step: 1389, loss: 0.30201512575149536, mean loss: 0.34500470049976883
Epoch: 36, step: 1390, loss: 0.325683057308197, mean loss: 0.3450043385017699
Epoch: 36, step: 1391, loss: 0.37436291575431824, mean loss: 0.3450048885350668
Epoch: 36, step: 1392, loss: 0.3415224254131317, mean loss: 0.34500482329230076
Epoch: 36, step: 1393, loss: 0.3363956809043884, mean loss: 0.3450046620059583
Epoch: 36, step: 1394, loss: 0.3375326693058014, mean loss: 0.34500452202595305
Epoch: 36, step: 1395, loss: 0.30446645617485046, mean loss: 0.34500376260171456
Epoch: 36, step: 1396, loss: 0.3183765113353729, mean loss: 0.34500326378656937
Epoch: 36, step: 1397, loss: 0.3390944004058838, mean loss: 0.3450031530963858
Epoch: 36, step: 1398, loss: 0.31477832794189453, mean loss: 0.3450025869081769
Epoch: 36, step: 1399, loss: 0.353727787733078, mean loss: 0.34500275035042227
Epoch: 36, step: 1400, loss: 0.3806151747703552, mean loss: 0.3450034174371399
Epoch: 36, step: 1401, loss: 0.3115971088409424, mean loss: 0.3450027916867822
Epoch: 36, step: 1402, loss: 0.3621046543121338, mean loss: 0.34500311202436673
Epoch: 36, step: 1403, loss: 0.3470724821090698, mean loss: 0.34500315078532584
Epoch: 36, step: 1404, loss: 0.3434062898159027, mean loss: 0.34500312087540114
Epoch: 36, step: 1405, loss: 0.3085699677467346, mean loss: 0.34500243847882633
Epoch: 36, step: 1406, loss: 0.3563916087150574, mean loss: 0.34500265179512
Epoch: 36, step: 1407, loss: 0.3186914026737213, mean loss: 0.34500215900127224
Epoch: 36, step: 1408, loss: 0.3270862400531769, mean loss: 0.34500182345318636
Epoch: 36, step: 1409, loss: 0.29865342378616333, mean loss: 0.3450009554080939
Epoch: 36, step: 1410, loss: 0.3491268455982208, mean loss: 0.34500103267919024
Epoch: 36, step: 1411, loss: 0.36029502749443054, mean loss: 0.34500131910504267
Epoch: 36, step: 1412, loss: 0.3027934432029724, mean loss: 0.345000528650974
Epoch: 36, step: 1413, loss: 0.3430202007293701, mean loss: 0.3450004915647925
Epoch: 36, step: 1414, loss: 0.3385426998138428, mean loss: 0.34500037063009803
Epoch: 36, step: 1415, loss: 0.3315557539463043, mean loss: 0.34500011885825
Epoch: 36, step: 1416, loss: 0.3374618589878082, mean loss: 0.3449999776949783
Epoch: 36, step: 1417, loss: 0.3267592489719391, mean loss: 0.34499963612109114
Epoch: 36, step: 1418, loss: 0.35958755016326904, mean loss: 0.3449999092876556
Epoch: 36, step: 1419, loss: 0.34099048376083374, mean loss: 0.34499983421040437
Epoch: 36, step: 1420, loss: 0.33765894174575806, mean loss: 0.34499969675337855
Epoch: 36, step: 1421, loss: 0.43139517307281494, mean loss: 0.3450013144644282
Epoch: 36, step: 1422, loss: 0.32300445437431335, mean loss: 0.34500090259220006
Epoch: 36, step: 1423, loss: 0.2984534800052643, mean loss: 0.34500003104818816
Epoch: 36, step: 1424, loss: 0.3341929018497467, mean loss: 0.3449998287015949
Epoch: 36, step: 1425, loss: 0.31460443139076233, mean loss: 0.3449992596059703
Epoch: 36, step: 1426, loss: 0.33127206563949585, mean loss: 0.3449990025953551
Epoch: 36, step: 1427, loss: 0.3047425150871277, mean loss: 0.344998248897918
Epoch: 36, step: 1428, loss: 0.336302250623703, mean loss: 0.344998086091143
Epoch: 36, step: 1429, loss: 0.32586240768432617, mean loss: 0.3449977278390292
Epoch: 36, step: 1430, loss: 0.3396194875240326, mean loss: 0.3449976271512015
Epoch: 36, step: 1431, loss: 0.3152828812599182, mean loss: 0.3449970708619644
Epoch: 36, step: 1432, loss: 0.4073190987110138, mean loss: 0.3449982375697138
Epoch: 36, step: 1433, loss: 0.3607303500175476, mean loss: 0.34499853207928827
Epoch: 36, step: 1434, loss: 0.3208231031894684, mean loss: 0.3449980795169249
Epoch: 36, step: 1435, loss: 0.34377941489219666, mean loss: 0.34499805670403416
Epoch: 36, step: 1436, loss: 0.35744455456733704, mean loss: 0.34499828969289364
Epoch: 36, step: 1437, loss: 0.3112041652202606, mean loss: 0.34499765710473757
Epoch: 36, step: 1438, loss: 0.3195672929286957, mean loss: 0.34499718108571625
Epoch: 36, step: 1439, loss: 0.28206682205200195, mean loss: 0.3449960031439853
Epoch: 36, step: 1440, loss: 0.3851950168609619, mean loss: 0.34499675558223925
Epoch: 36, step: 1441, loss: 0.35160452127456665, mean loss: 0.34499687926295075
Epoch: 36, step: 1442, loss: 0.31800591945648193, mean loss: 0.3449963740697
Epoch: 36, step: 1443, loss: 0.3585953414440155, mean loss: 0.34499662859854957
Valid: 36, mean loss: 0.18518995245297748
Epoch: 37, step: 0, loss: 0.3512265086174011, mean loss: 0.3449967451996467
Epoch: 37, step: 1, loss: 0.3316197693347931, mean loss: 0.3449964948351349
Epoch: 37, step: 2, loss: 0.3020298480987549, mean loss: 0.344995690683112
Epoch: 37, step: 3, loss: 0.35955458879470825, mean loss: 0.34499596315837233
Epoch: 37, step: 4, loss: 0.37587955594062805, mean loss: 0.34499654114562334
Epoch: 37, step: 5, loss: 0.3192300498485565, mean loss: 0.3449960589340858
Epoch: 37, step: 6, loss: 0.3065564036369324, mean loss: 0.3449953395618523
Epoch: 37, step: 7, loss: 0.330457478761673, mean loss: 0.34499506750068004
Epoch: 37, step: 8, loss: 0.3049848675727844, mean loss: 0.3449943187647868
Epoch: 37, step: 9, loss: 0.35431697964668274, mean loss: 0.34499449322230546
Epoch: 37, step: 10, loss: 0.3387775719165802, mean loss: 0.34499437688552326
Epoch: 37, step: 11, loss: 0.32230767607688904, mean loss: 0.34499395235893626
Epoch: 37, step: 12, loss: 0.3284342288970947, mean loss: 0.34499364248966996
Epoch: 37, step: 13, loss: 0.3554754853248596, mean loss: 0.3449938386245982
Epoch: 37, step: 14, loss: 0.3012125790119171, mean loss: 0.3449930194104895
Epoch: 37, step: 15, loss: 0.3257807195186615, mean loss: 0.34499265992579725
Epoch: 37, step: 16, loss: 0.34793567657470703, mean loss: 0.3449927149920644
Epoch: 37, step: 17, loss: 0.3206988275051117, mean loss: 0.3449922604419112
Epoch: 37, step: 18, loss: 0.30205038189888, mean loss: 0.3449914569940368
Epoch: 37, step: 19, loss: 0.34997275471687317, mean loss: 0.3449915501929914
Epoch: 37, step: 20, loss: 0.350867360830307, mean loss: 0.34499166012602356
Epoch: 37, step: 21, loss: 0.30227071046829224, mean loss: 0.3449908608566193
Epoch: 37, step: 22, loss: 0.3661513924598694, mean loss: 0.34499125674316217
Epoch: 37, step: 23, loss: 0.31407588720321655, mean loss: 0.34499067836687053
Epoch: 37, step: 24, loss: 0.3474041819572449, mean loss: 0.3449907235187533
Epoch: 37, step: 25, loss: 0.3195253908634186, mean loss: 0.3449902471216146
Epoch: 37, step: 26, loss: 0.29539480805397034, mean loss: 0.3449893193236711
Epoch: 37, step: 27, loss: 0.34176546335220337, mean loss: 0.3449892590150814
Epoch: 37, step: 28, loss: 0.31728291511535645, mean loss: 0.3449887407229232
Epoch: 37, step: 29, loss: 0.32275867462158203, mean loss: 0.3449883248812138
Epoch: 37, step: 30, loss: 0.3085869252681732, mean loss: 0.3449876439593931
Epoch: 37, step: 31, loss: 0.35961470007896423, mean loss: 0.3449879175668775
Epoch: 37, step: 32, loss: 0.35962581634521484, mean loss: 0.34498819137205844
Epoch: 37, step: 33, loss: 0.33022814989089966, mean loss: 0.3449879152873351
Epoch: 37, step: 34, loss: 0.3076716363430023, mean loss: 0.34498721730407667
Epoch: 37, step: 35, loss: 0.3420222997665405, mean loss: 0.34498716184774086
Epoch: 37, step: 36, loss: 0.3198282718658447, mean loss: 0.34498669128026715
Epoch: 37, step: 37, loss: 0.3371018171310425, mean loss: 0.3449865438057198
Epoch: 37, step: 38, loss: 0.34134283661842346, mean loss: 0.34498647565700774
Epoch: 37, step: 39, loss: 0.31738898158073425, mean loss: 0.3449859595072719
Epoch: 37, step: 40, loss: 0.34922048449516296, mean loss: 0.34498603870316086
Epoch: 37, step: 41, loss: 0.31182003021240234, mean loss: 0.34498541842995173
Epoch: 37, step: 42, loss: 0.34526413679122925, mean loss: 0.3449854236424662
Epoch: 37, step: 43, loss: 0.3184259235858917, mean loss: 0.3449849269432581
Epoch: 37, step: 44, loss: 0.36065244674682617, mean loss: 0.34498521994196407
Epoch: 37, step: 45, loss: 0.293724924325943, mean loss: 0.34498426133973464
Epoch: 37, step: 46, loss: 0.37405505776405334, mean loss: 0.3449848049731414
Epoch: 37, step: 47, loss: 0.32409629225730896, mean loss: 0.3449844143584223
Epoch: 37, step: 48, loss: 0.3613554537296295, mean loss: 0.3449847204907665
Epoch: 37, step: 49, loss: 0.33218345046043396, mean loss: 0.3449844811162568
Epoch: 37, step: 50, loss: 0.34288644790649414, mean loss: 0.3449844418852837
Epoch: 37, step: 51, loss: 0.3526604175567627, mean loss: 0.3449845854151205
Epoch: 37, step: 52, loss: 0.32839784026145935, mean loss: 0.34498427527235664
Epoch: 37, step: 53, loss: 0.32039114832878113, mean loss: 0.3449838154330286
Epoch: 37, step: 54, loss: 0.38034898042678833, mean loss: 0.344984476674264
Epoch: 37, step: 55, loss: 0.3246019780635834, mean loss: 0.34498409557900916
Epoch: 37, step: 56, loss: 0.3369631767272949, mean loss: 0.34498394561324586
Epoch: 37, step: 57, loss: 0.33714890480041504, mean loss: 0.34498379912555166
Epoch: 37, step: 58, loss: 0.33746039867401123, mean loss: 0.34498365846706547
Epoch: 37, step: 59, loss: 0.3442844748497009, mean loss: 0.3449836453952808
Epoch: 37, step: 60, loss: 0.3199367821216583, mean loss: 0.344983177133334
Epoch: 37, step: 61, loss: 0.3126906752586365, mean loss: 0.3449825734223249
Epoch: 37, step: 62, loss: 0.3466291129589081, mean loss: 0.34498260420394306
Epoch: 37, step: 63, loss: 0.3170629143714905, mean loss: 0.3449820822625344
Epoch: 37, step: 64, loss: 0.3870601952075958, mean loss: 0.34498286887223933
Epoch: 37, step: 65, loss: 0.2919906675815582, mean loss: 0.3449818782527065
Epoch: 37, step: 66, loss: 0.35444360971450806, mean loss: 0.3449820551240302
Epoch: 37, step: 67, loss: 0.3083244562149048, mean loss: 0.3449813698840326
Epoch: 37, step: 68, loss: 0.39176973700523376, mean loss: 0.34498224448199366
Epoch: 37, step: 69, loss: 0.3608089089393616, mean loss: 0.34498254031855685
Epoch: 37, step: 70, loss: 0.3346807658672333, mean loss: 0.3449823477584258
Epoch: 37, step: 71, loss: 0.3263263404369354, mean loss: 0.3449819990480086
Epoch: 37, step: 72, loss: 0.33648234605789185, mean loss: 0.3449818401789596
Epoch: 37, step: 73, loss: 0.39594823122024536, mean loss: 0.34498279278617133
Epoch: 37, step: 74, loss: 0.3190723657608032, mean loss: 0.34498230850628003
Epoch: 37, step: 75, loss: 0.38414520025253296, mean loss: 0.34498304046822204
Epoch: 37, step: 76, loss: 0.3299047648906708, mean loss: 0.3449827586576328
Epoch: 37, step: 77, loss: 0.2953231632709503, mean loss: 0.344981830544984
Epoch: 37, step: 78, loss: 0.3073596954345703, mean loss: 0.34498112741950304
Epoch: 37, step: 79, loss: 0.3008953928947449, mean loss: 0.3449803035102834
Epoch: 37, step: 80, loss: 0.3403952419757843, mean loss: 0.3449802178226134
Epoch: 37, step: 81, loss: 0.30768290162086487, mean loss: 0.3449795208067995
Epoch: 37, step: 82, loss: 0.33982178568840027, mean loss: 0.3449794244203534
Epoch: 37, step: 83, loss: 0.33479663729667664, mean loss: 0.34497923413056564
Epoch: 37, step: 84, loss: 0.32147106528282166, mean loss: 0.34497879483228583
Epoch: 37, step: 85, loss: 0.287677526473999, mean loss: 0.34497772406074273
Epoch: 37, step: 86, loss: 0.3585706353187561, mean loss: 0.34497797806263486
Epoch: 37, step: 87, loss: 0.32372036576271057, mean loss: 0.3449775808428819
Epoch: 37, step: 88, loss: 0.31698545813560486, mean loss: 0.3449770577918381
Epoch: 37, step: 89, loss: 0.31701919436454773, mean loss: 0.34497653539071277
Epoch: 37, step: 90, loss: 0.31169065833091736, mean loss: 0.3449759134456641
Epoch: 37, step: 91, loss: 0.3468097448348999, mean loss: 0.34497594771007717
Epoch: 37, step: 92, loss: 0.3060269355773926, mean loss: 0.34497521997681113
Epoch: 37, step: 93, loss: 0.323846697807312, mean loss: 0.3449748252134957
Epoch: 37, step: 94, loss: 0.3331097662448883, mean loss: 0.3449746035319949
Epoch: 37, step: 95, loss: 0.3444828987121582, mean loss: 0.3449745943453717
Epoch: 37, step: 96, loss: 0.32611268758773804, mean loss: 0.34497424195103715
Epoch: 37, step: 97, loss: 0.2997318208217621, mean loss: 0.34497339670907756
Epoch: 37, step: 98, loss: 0.3589145839214325, mean loss: 0.3449736571605733
Epoch: 37, step: 99, loss: 0.3596775531768799, mean loss: 0.34497393185598535
Epoch: 37, step: 100, loss: 0.34755241870880127, mean loss: 0.3449739800258905
Epoch: 37, step: 101, loss: 0.3029176890850067, mean loss: 0.34497319436755053
Epoch: 37, step: 102, loss: 0.3441002368927002, mean loss: 0.3449731780600376
Epoch: 37, step: 103, loss: 0.3438841700553894, mean loss: 0.3449731577169156
Epoch: 37, step: 104, loss: 0.3305666744709015, mean loss: 0.3449728886028505
Epoch: 37, step: 105, loss: 0.36843690276145935, mean loss: 0.3449733269040079
Epoch: 37, step: 106, loss: 0.37656158208847046, mean loss: 0.3449739169526711
Epoch: 37, step: 107, loss: 0.31958529353141785, mean loss: 0.3449734427180734
Epoch: 37, step: 108, loss: 0.3166324496269226, mean loss: 0.34497291334599256
Epoch: 37, step: 109, loss: 0.35843023657798767, mean loss: 0.3449731647062083
Epoch: 37, step: 110, loss: 0.29933029413223267, mean loss: 0.34497231218990104
Epoch: 37, step: 111, loss: 0.3392971158027649, mean loss: 0.3449722061907156
Epoch: 37, step: 112, loss: 0.29436853528022766, mean loss: 0.34497126105201986
Epoch: 37, step: 113, loss: 0.31228670477867126, mean loss: 0.34497065060496385
Epoch: 37, step: 114, loss: 0.3033861815929413, mean loss: 0.34496987394939704
Epoch: 37, step: 115, loss: 0.339148610830307, mean loss: 0.34496976523015455
Epoch: 37, step: 116, loss: 0.32347816228866577, mean loss: 0.3449693638555548
Epoch: 37, step: 117, loss: 0.31580403447151184, mean loss: 0.34496881917753247
Epoch: 37, step: 118, loss: 0.38763269782066345, mean loss: 0.3449696159332544
Epoch: 37, step: 119, loss: 0.32763952016830444, mean loss: 0.3449692922965964
Epoch: 37, step: 120, loss: 0.3348316252231598, mean loss: 0.3449691029808842
Epoch: 37, step: 121, loss: 0.36352136731147766, mean loss: 0.34496944942839736
Epoch: 37, step: 122, loss: 0.3319703936576843, mean loss: 0.3449692066867908
Epoch: 37, step: 123, loss: 0.32515576481819153, mean loss: 0.3449688367016947
Epoch: 37, step: 124, loss: 0.2987913489341736, mean loss: 0.3449679744253
Epoch: 37, step: 125, loss: 0.32892265915870667, mean loss: 0.3449676748152752
Epoch: 37, step: 126, loss: 0.3217483162879944, mean loss: 0.3449672412542906
Epoch: 37, step: 127, loss: 0.31448253989219666, mean loss: 0.3449666720425989
Epoch: 37, step: 128, loss: 0.29733824729919434, mean loss: 0.3449657827391513
Epoch: 37, step: 129, loss: 0.3550967574119568, mean loss: 0.34496597189809436
Epoch: 37, step: 130, loss: 0.31608474254608154, mean loss: 0.34496543265670915
Epoch: 37, step: 131, loss: 0.372111439704895, mean loss: 0.3449659394902985
Epoch: 37, step: 132, loss: 0.31148189306259155, mean loss: 0.34496531433306793
Epoch: 37, step: 133, loss: 0.32739973068237305, mean loss: 0.34496498638445416
Epoch: 37, step: 134, loss: 0.3311294615268707, mean loss: 0.3449647280806837
Epoch: 37, step: 135, loss: 0.3487752079963684, mean loss: 0.3449647992195067
Epoch: 37, step: 136, loss: 0.36723098158836365, mean loss: 0.34496521490479315
Epoch: 37, step: 137, loss: 0.3544946014881134, mean loss: 0.34496539280470323
Epoch: 37, step: 138, loss: 0.3402688801288605, mean loss: 0.3449653051292188
Epoch: 37, step: 139, loss: 0.324662983417511, mean loss: 0.34496492612829077
Epoch: 37, step: 140, loss: 0.3222138583660126, mean loss: 0.34496450142243923
Epoch: 37, step: 141, loss: 0.32283294200897217, mean loss: 0.34496408828897995
Epoch: 37, step: 142, loss: 0.35309097170829773, mean loss: 0.3449642399920174
Epoch: 37, step: 143, loss: 0.28779852390289307, mean loss: 0.34496317291003264
Epoch: 37, step: 144, loss: 0.35456612706184387, mean loss: 0.3449633521599188
Epoch: 37, step: 145, loss: 0.3856913149356842, mean loss: 0.3449641123787334
Epoch: 37, step: 146, loss: 0.38154077529907227, mean loss: 0.34496479509759337
Epoch: 37, step: 147, loss: 0.3472970128059387, mean loss: 0.34496483862860927
Epoch: 37, step: 148, loss: 0.3047366440296173, mean loss: 0.34496408778039833
Epoch: 37, step: 149, loss: 0.3313729465007782, mean loss: 0.3449638341102113
Epoch: 37, step: 150, loss: 0.34757834672927856, mean loss: 0.3449638829075502
Epoch: 37, step: 151, loss: 0.3295252323150635, mean loss: 0.34496359476550853
Epoch: 37, step: 152, loss: 0.31149908900260925, mean loss: 0.3449629702063222
Epoch: 37, step: 153, loss: 0.28536146879196167, mean loss: 0.3449618578644646
Epoch: 37, step: 154, loss: 0.31015345454216003, mean loss: 0.34496120824791976
Epoch: 37, step: 155, loss: 0.3930531442165375, mean loss: 0.3449621057534432
Epoch: 37, step: 156, loss: 0.3227282762527466, mean loss: 0.3449616908270739
Epoch: 37, step: 157, loss: 0.3115180730819702, mean loss: 0.34496106671596755
Epoch: 37, step: 158, loss: 0.31146544218063354, mean loss: 0.34496044164599654
Epoch: 37, step: 159, loss: 0.31466200947761536, mean loss: 0.3449598762501585
Epoch: 37, step: 160, loss: 0.3079891800880432, mean loss: 0.34495918635678186
Epoch: 37, step: 161, loss: 0.3313083052635193, mean loss: 0.34495893162864055
Epoch: 37, step: 162, loss: 0.32128286361694336, mean loss: 0.3449584898367723
Epoch: 37, step: 163, loss: 0.3285323679447174, mean loss: 0.34495818333352757
Epoch: 37, step: 164, loss: 0.3121042251586914, mean loss: 0.3449575703064872
Epoch: 37, step: 165, loss: 0.3589392900466919, mean loss: 0.3449578311886707
Epoch: 37, step: 166, loss: 0.3115375339984894, mean loss: 0.34495720761749443
Epoch: 37, step: 167, loss: 0.35236555337905884, mean loss: 0.3449573458432158
Epoch: 37, step: 168, loss: 0.3090645968914032, mean loss: 0.34495667616489517
Epoch: 37, step: 169, loss: 0.3486954867839813, mean loss: 0.3449567459214275
Epoch: 37, step: 170, loss: 0.3401230275630951, mean loss: 0.3449566557384323
Epoch: 37, step: 171, loss: 0.3671456277370453, mean loss: 0.3449570697117905
Epoch: 37, step: 172, loss: 0.315888911485672, mean loss: 0.34495652740552335
Epoch: 37, step: 173, loss: 0.4008151590824127, mean loss: 0.3449575695052897
Epoch: 37, step: 174, loss: 0.3018234372138977, mean loss: 0.3449567648090546
Epoch: 37, step: 175, loss: 0.3172333836555481, mean loss: 0.3449562476203904
Epoch: 37, step: 176, loss: 0.35252150893211365, mean loss: 0.3449563887501602
Epoch: 37, step: 177, loss: 0.3041202127933502, mean loss: 0.3449556269664801
Epoch: 37, step: 178, loss: 0.3274417519569397, mean loss: 0.34495530025774784
Epoch: 37, step: 179, loss: 0.3109644055366516, mean loss: 0.34495466619390064
Epoch: 37, step: 180, loss: 0.3486824631690979, mean loss: 0.3449547357306757
Epoch: 37, step: 181, loss: 0.3378736674785614, mean loss: 0.3449546036458361
Epoch: 37, step: 182, loss: 0.40304625034332275, mean loss: 0.34495568722283887
Epoch: 37, step: 183, loss: 0.3656836450099945, mean loss: 0.34495607385191046
Epoch: 37, step: 184, loss: 0.33120256662368774, mean loss: 0.34495581731884517
Epoch: 37, step: 185, loss: 0.3243810832500458, mean loss: 0.34495543356210123
Epoch: 37, step: 186, loss: 0.33660826086997986, mean loss: 0.3449552778748366
Epoch: 37, step: 187, loss: 0.329018235206604, mean loss: 0.3449549806306806
Epoch: 37, step: 188, loss: 0.3481837213039398, mean loss: 0.3449550408492805
Epoch: 37, step: 189, loss: 0.31633517146110535, mean loss: 0.34495450707574576
Epoch: 37, step: 190, loss: 0.35285046696662903, mean loss: 0.34495465433622974
Epoch: 37, step: 191, loss: 0.32861992716789246, mean loss: 0.34495434969752836
Epoch: 37, step: 192, loss: 0.35237181186676025, mean loss: 0.3449544880288196
Epoch: 37, step: 193, loss: 0.2909031808376312, mean loss: 0.3449534800226432
Epoch: 37, step: 194, loss: 0.36081987619400024, mean loss: 0.34495377591053034
Epoch: 37, step: 195, loss: 0.34522610902786255, mean loss: 0.34495378098909807
Epoch: 37, step: 196, loss: 0.2961145043373108, mean loss: 0.3449528702333563
Epoch: 37, step: 197, loss: 0.31858205795288086, mean loss: 0.34495237847912735
Epoch: 37, step: 198, loss: 0.3203027844429016, mean loss: 0.34495191883018117
Epoch: 37, step: 199, loss: 0.30935102701187134, mean loss: 0.3449512549812251
Epoch: 37, step: 200, loss: 0.3557186722755432, mean loss: 0.3449514557572473
Epoch: 37, step: 201, loss: 0.3289213478565216, mean loss: 0.34495115685536587
Epoch: 37, step: 202, loss: 0.3204192817211151, mean loss: 0.34495069943568074
Epoch: 37, step: 203, loss: 0.3339231610298157, mean loss: 0.3449504938207791
Epoch: 37, step: 204, loss: 0.3399369418621063, mean loss: 0.3449504003419142
Epoch: 37, step: 205, loss: 0.3125417232513428, mean loss: 0.3449497960857131
Epoch: 37, step: 206, loss: 0.3236123025417328, mean loss: 0.3449493982579226
Epoch: 37, step: 207, loss: 0.33198612928390503, mean loss: 0.3449491565682184
Epoch: 37, step: 208, loss: 0.34410327672958374, mean loss: 0.34494914079776445
Epoch: 37, step: 209, loss: 0.3357354402542114, mean loss: 0.3449489690221475
Epoch: 37, step: 210, loss: 0.4017553925514221, mean loss: 0.34495002807290404
Epoch: 37, step: 211, loss: 0.3296799063682556, mean loss: 0.3449497433950199
Epoch: 37, step: 212, loss: 0.3377205729484558, mean loss: 0.34494960862552554
Epoch: 37, step: 213, loss: 0.3260241746902466, mean loss: 0.3449492558155271
Epoch: 37, step: 214, loss: 0.3333108723163605, mean loss: 0.3449490388555603
Epoch: 37, step: 215, loss: 0.3120695948600769, mean loss: 0.3449484259362404
Epoch: 37, step: 216, loss: 0.3401137888431549, mean loss: 0.34494833581344997
Epoch: 37, step: 217, loss: 0.3457104563713074, mean loss: 0.34494835001992497
Epoch: 37, step: 218, loss: 0.3346445858478546, mean loss: 0.34494815795393485
Epoch: 37, step: 219, loss: 0.33325299620628357, mean loss: 0.34494793995584083
Epoch: 37, step: 220, loss: 0.32937705516815186, mean loss: 0.3449476497195869
Epoch: 37, step: 221, loss: 0.30334895849227905, mean loss: 0.34494687434789584
Epoch: 37, step: 222, loss: 0.33111461997032166, mean loss: 0.34494661652876146
Epoch: 37, step: 223, loss: 0.31638988852500916, mean loss: 0.3449460842703554
Epoch: 37, step: 224, loss: 0.3310467600822449, mean loss: 0.3449458252107653
Epoch: 37, step: 225, loss: 0.31784874200820923, mean loss: 0.34494532017697094
Epoch: 37, step: 226, loss: 0.3629894554615021, mean loss: 0.3449456564762028
Epoch: 37, step: 227, loss: 0.32448095083236694, mean loss: 0.3449452750704766
Epoch: 37, step: 228, loss: 0.3583984076976776, mean loss: 0.34494552579512816
Epoch: 37, step: 229, loss: 0.3044840395450592, mean loss: 0.3449447717326165
Epoch: 37, step: 230, loss: 0.31313666701316833, mean loss: 0.34494417895032986
Epoch: 37, step: 231, loss: 0.3303438425064087, mean loss: 0.3449439068605713
Epoch: 37, step: 232, loss: 0.3627839982509613, mean loss: 0.3449442393197389
Epoch: 37, step: 233, loss: 0.3538353443145752, mean loss: 0.34494440500691037
Epoch: 37, step: 234, loss: 0.3477167785167694, mean loss: 0.34494445666957385
Epoch: 37, step: 235, loss: 0.3220033645629883, mean loss: 0.3449440291745659
Epoch: 37, step: 236, loss: 0.30848732590675354, mean loss: 0.3449433498360162
Epoch: 37, step: 237, loss: 0.35534152388572693, mean loss: 0.3449435435932191
Epoch: 37, step: 238, loss: 0.3209276497364044, mean loss: 0.34494309609487084
Epoch: 37, step: 239, loss: 0.31274503469467163, mean loss: 0.3449424961458994
Epoch: 37, step: 240, loss: 0.3572523295879364, mean loss: 0.3449427255117054
Epoch: 37, step: 241, loss: 0.30030667781829834, mean loss: 0.3449418938357655
Epoch: 37, step: 242, loss: 0.3211689293384552, mean loss: 0.34494145089703704
Epoch: 37, step: 243, loss: 0.34411710500717163, mean loss: 0.344941435538081
Epoch: 37, step: 244, loss: 0.3644864857196808, mean loss: 0.34494179968858835
Epoch: 37, step: 245, loss: 0.3537456691265106, mean loss: 0.3449419637134316
Epoch: 37, step: 246, loss: 0.3395693302154541, mean loss: 0.3449418636177912
Epoch: 37, step: 247, loss: 0.3049086928367615, mean loss: 0.3449411177877968
Epoch: 37, step: 248, loss: 0.35608598589897156, mean loss: 0.34494132541616856
Epoch: 37, step: 249, loss: 0.29978734254837036, mean loss: 0.3449404842152507
Epoch: 37, step: 250, loss: 0.3192393183708191, mean loss: 0.34494000542157266
Epoch: 37, step: 251, loss: 0.32902446389198303, mean loss: 0.34493970893234893
Epoch: 37, step: 252, loss: 0.3462388813495636, mean loss: 0.3449397331340668
Epoch: 37, step: 253, loss: 0.29819291830062866, mean loss: 0.3449388623242081
Epoch: 37, step: 254, loss: 0.358171671628952, mean loss: 0.3449391088232731
Epoch: 37, step: 255, loss: 0.3189629018306732, mean loss: 0.34493862495085315
Epoch: 37, step: 256, loss: 0.3437053859233856, mean loss: 0.34493860197909143
Epoch: 37, step: 257, loss: 0.338890939950943, mean loss: 0.3449384893303184
Epoch: 37, step: 258, loss: 0.3412264585494995, mean loss: 0.34493842018823967
Epoch: 37, step: 259, loss: 0.33468517661094666, mean loss: 0.3449382292099284
Epoch: 37, step: 260, loss: 0.33720505237579346, mean loss: 0.3449380851734063
Epoch: 37, step: 261, loss: 0.33938124775886536, mean loss: 0.34493798167485135
Epoch: 37, step: 262, loss: 0.3179984390735626, mean loss: 0.34493747992329893
Epoch: 37, step: 263, loss: 0.31716689467430115, mean loss: 0.3449369627031311
Epoch: 37, step: 264, loss: 0.30995264649391174, mean loss: 0.3449363111411732
Epoch: 37, step: 265, loss: 0.36181411147117615, mean loss: 0.3449366254742519
Epoch: 37, step: 266, loss: 0.3376588225364685, mean loss: 0.34493648993457526
Epoch: 37, step: 267, loss: 0.3434389531612396, mean loss: 0.3449364620454071
Epoch: 37, step: 268, loss: 0.31982070207595825, mean loss: 0.34493599431424954
Epoch: 37, step: 269, loss: 0.34565964341163635, mean loss: 0.3449360077905261
Epoch: 37, step: 270, loss: 0.319243848323822, mean loss: 0.3449355293428927
Epoch: 37, step: 271, loss: 0.33720868825912476, mean loss: 0.34493538545385943
Epoch: 37, step: 272, loss: 0.31396040320396423, mean loss: 0.34493480864928877
Epoch: 37, step: 273, loss: 0.3187425136566162, mean loss: 0.3449343209152194
Epoch: 37, step: 274, loss: 0.34265124797821045, mean loss: 0.34493427840226976
Epoch: 37, step: 275, loss: 0.3078717887401581, mean loss: 0.3449335882769595
Epoch: 37, step: 276, loss: 0.3145650327205658, mean loss: 0.3449330228071605
Epoch: 37, step: 277, loss: 0.3133275806903839, mean loss: 0.34493243431719445
Epoch: 37, step: 278, loss: 0.3322536051273346, mean loss: 0.344932198243141
Epoch: 37, step: 279, loss: 0.32087400555610657, mean loss: 0.3449317502988368
Epoch: 37, step: 280, loss: 0.3029632270336151, mean loss: 0.3449309688930526
Epoch: 37, step: 281, loss: 0.4043736457824707, mean loss: 0.34493207562693623
Epoch: 37, step: 282, loss: 0.3336249887943268, mean loss: 0.3449318651097827
Epoch: 37, step: 283, loss: 0.30396029353141785, mean loss: 0.3449311023087033
Epoch: 37, step: 284, loss: 0.316742867231369, mean loss: 0.34493057751516953
Epoch: 37, step: 285, loss: 0.418212890625, mean loss: 0.34493194182080883
Epoch: 37, step: 286, loss: 0.33085647225379944, mean loss: 0.344931679780977
Epoch: 37, step: 287, loss: 0.3259451985359192, mean loss: 0.34493132632053236
Epoch: 37, step: 288, loss: 0.30150529742240906, mean loss: 0.34493051789807955
Epoch: 37, step: 289, loss: 0.33845752477645874, mean loss: 0.3449303973985613
Epoch: 37, step: 290, loss: 0.2937586307525635, mean loss: 0.34492944481629717
Epoch: 37, step: 291, loss: 0.3445653021335602, mean loss: 0.3449294380377662
Epoch: 37, step: 292, loss: 0.3354220688343048, mean loss: 0.3449292610609936
Epoch: 37, step: 293, loss: 0.3572200834751129, mean loss: 0.34492948984663846
Epoch: 37, step: 294, loss: 0.3243185579776764, mean loss: 0.3449291061947227
Epoch: 37, step: 295, loss: 0.33397018909454346, mean loss: 0.3449289022092209
Epoch: 37, step: 296, loss: 0.3236786425113678, mean loss: 0.3449285066715811
Epoch: 37, step: 297, loss: 0.3263287842273712, mean loss: 0.3449281604756528
Epoch: 37, step: 298, loss: 0.32603907585144043, mean loss: 0.34492780890038105
Epoch: 37, step: 299, loss: 0.3567342162132263, mean loss: 0.34492802864441235
Epoch: 37, step: 300, loss: 0.33389410376548767, mean loss: 0.34492782328185434
Epoch: 37, step: 301, loss: 0.34614214301109314, mean loss: 0.3449278458822588
Epoch: 37, step: 302, loss: 0.3421171307563782, mean loss: 0.3449277935713931
Epoch: 37, step: 303, loss: 0.32486492395401, mean loss: 0.34492742018366107
Epoch: 37, step: 304, loss: 0.31495431065559387, mean loss: 0.34492686236798864
Epoch: 37, step: 305, loss: 0.33254876732826233, mean loss: 0.3449266320092765
Epoch: 37, step: 306, loss: 0.3365136981010437, mean loss: 0.34492647544588373
Epoch: 37, step: 307, loss: 0.39552193880081177, mean loss: 0.3449274170020724
Epoch: 37, step: 308, loss: 0.3444057106971741, mean loss: 0.3449274072935605
Epoch: 37, step: 309, loss: 0.3159954249858856, mean loss: 0.3449268689039236
Epoch: 37, step: 310, loss: 0.3411458134651184, mean loss: 0.34492679854430697
Epoch: 37, step: 311, loss: 0.30442818999290466, mean loss: 0.34492604494161716
Epoch: 37, step: 312, loss: 0.37100693583488464, mean loss: 0.34492653024875497
Epoch: 37, step: 313, loss: 0.31682074069976807, mean loss: 0.34492600727250644
Epoch: 37, step: 314, loss: 0.347564160823822, mean loss: 0.34492605636082585
Epoch: 37, step: 315, loss: 0.34170007705688477, mean loss: 0.34492599633590576
Epoch: 37, step: 316, loss: 0.3565724194049835, mean loss: 0.3449262130337022
Epoch: 37, step: 317, loss: 0.448727011680603, mean loss: 0.3449281443550777
Epoch: 37, step: 318, loss: 0.3062785267829895, mean loss: 0.3449274252522892
Epoch: 37, step: 319, loss: 0.3551119565963745, mean loss: 0.3449276147389928
Epoch: 37, step: 320, loss: 0.2935332655906677, mean loss: 0.34492665854726556
Epoch: 37, step: 321, loss: 0.3119804859161377, mean loss: 0.3449260455952166
Epoch: 37, step: 322, loss: 0.3548516035079956, mean loss: 0.3449262302533237
Epoch: 37, step: 323, loss: 0.3681665062904358, mean loss: 0.3449266626144644
Epoch: 37, step: 324, loss: 0.32444292306900024, mean loss: 0.3449262815429048
Epoch: 37, step: 325, loss: 0.3392179012298584, mean loss: 0.3449261753483832
Epoch: 37, step: 326, loss: 0.32959961891174316, mean loss: 0.34492589022966985
Epoch: 37, step: 327, loss: 0.3217458128929138, mean loss: 0.34492545902055205
Epoch: 37, step: 328, loss: 0.3527899384498596, mean loss: 0.3449256053173958
Epoch: 37, step: 329, loss: 0.3175906538963318, mean loss: 0.34492509683584105
Epoch: 37, step: 330, loss: 0.3556171953678131, mean loss: 0.344925295725302
Epoch: 37, step: 331, loss: 0.35619044303894043, mean loss: 0.3449255052704529
Epoch: 37, step: 332, loss: 0.3088870644569397, mean loss: 0.3449248349250201
Epoch: 37, step: 333, loss: 0.3256109654903412, mean loss: 0.34492447567742074
Epoch: 37, step: 334, loss: 0.3154240548610687, mean loss: 0.3449239269650941
Epoch: 37, step: 335, loss: 0.35303205251693726, mean loss: 0.34492407777466094
Epoch: 37, step: 336, loss: 0.3189201056957245, mean loss: 0.3449235941148064
Epoch: 37, step: 337, loss: 0.3074322044849396, mean loss: 0.3449228968081511
Epoch: 37, step: 338, loss: 0.3510270416736603, mean loss: 0.34492301033772993
Epoch: 37, step: 339, loss: 0.3288164436817169, mean loss: 0.3449227107809925
Epoch: 37, step: 340, loss: 0.32959413528442383, mean loss: 0.34492242569896575
Epoch: 37, step: 341, loss: 0.32275694608688354, mean loss: 0.3449220134713367
Epoch: 37, step: 342, loss: 0.323068231344223, mean loss: 0.34492160704813224
Epoch: 37, step: 343, loss: 0.3297605812549591, mean loss: 0.34492132509793894
Epoch: 37, step: 344, loss: 0.34688395261764526, mean loss: 0.34492136159632136
Epoch: 37, step: 345, loss: 0.29084688425064087, mean loss: 0.34492035600854015
Epoch: 37, step: 346, loss: 0.38325926661491394, mean loss: 0.3449210689589931
Epoch: 37, step: 347, loss: 0.3197023570537567, mean loss: 0.34492060000050034
Epoch: 37, step: 348, loss: 0.3398009240627289, mean loss: 0.34492050479853786
Epoch: 37, step: 349, loss: 0.33603808283805847, mean loss: 0.34492033963021695
Epoch: 37, step: 350, loss: 0.31430715322494507, mean loss: 0.344919770389688
Epoch: 37, step: 351, loss: 0.3278760313987732, mean loss: 0.3449194534737529
Epoch: 37, step: 352, loss: 0.3436339199542999, mean loss: 0.3449194295706362
Epoch: 37, step: 353, loss: 0.35280561447143555, mean loss: 0.34491957620305785
Epoch: 37, step: 354, loss: 0.3006151020526886, mean loss: 0.34491875243952386
Epoch: 37, step: 355, loss: 0.32077714800834656, mean loss: 0.34491830357732634
Epoch: 37, step: 356, loss: 0.3416823446750641, mean loss: 0.3449182434126168
Epoch: 37, step: 357, loss: 0.33701393008232117, mean loss: 0.34491809645405264
Epoch: 37, step: 358, loss: 0.32650452852249146, mean loss: 0.3449177541117035
Epoch: 37, step: 359, loss: 0.3646206259727478, mean loss: 0.3449181204177915
Epoch: 37, step: 360, loss: 0.3461758494377136, mean loss: 0.3449181438004352
Epoch: 37, step: 361, loss: 0.3045838475227356, mean loss: 0.34491739395294907
Epoch: 37, step: 362, loss: 0.31679457426071167, mean loss: 0.3449168711364985
Epoch: 37, step: 363, loss: 0.3212011754512787, mean loss: 0.344916430258753
Epoch: 37, step: 364, loss: 0.28469207882881165, mean loss: 0.34491531070134906
Epoch: 37, step: 365, loss: 0.33102840185165405, mean loss: 0.3449150525515768
Epoch: 37, step: 366, loss: 0.3351821303367615, mean loss: 0.3449148716254272
Epoch: 37, step: 367, loss: 0.3760432302951813, mean loss: 0.3449154502624759
Epoch: 37, step: 368, loss: 0.30860117077827454, mean loss: 0.3449147752382276
Epoch: 37, step: 369, loss: 0.3397674858570099, mean loss: 0.344914679560147
Epoch: 37, step: 370, loss: 0.3172183334827423, mean loss: 0.3449141647486063
Epoch: 37, step: 371, loss: 0.3423300087451935, mean loss: 0.34491411671596683
Epoch: 37, step: 372, loss: 0.33726581931114197, mean loss: 0.3449139745569474
Epoch: 37, step: 373, loss: 0.3178844749927521, mean loss: 0.34491347216856844
Epoch: 37, step: 374, loss: 0.3043361306190491, mean loss: 0.34491271798494394
Epoch: 37, step: 375, loss: 0.3300938308238983, mean loss: 0.34491244256142223
Epoch: 37, step: 376, loss: 0.33724403381347656, mean loss: 0.3449123000391892
Epoch: 37, step: 377, loss: 0.33481621742248535, mean loss: 0.3449121124005873
Epoch: 37, step: 378, loss: 0.3463630676269531, mean loss: 0.3449121393665067
Epoch: 37, step: 379, loss: 0.3397482931613922, mean loss: 0.34491204339850556
Epoch: 37, step: 380, loss: 0.33511146903038025, mean loss: 0.34491186126216467
Epoch: 37, step: 381, loss: 0.32704871892929077, mean loss: 0.3449115292952007
Epoch: 37, step: 382, loss: 0.35463955998420715, mean loss: 0.3449117100766522
Epoch: 37, step: 383, loss: 0.32921841740608215, mean loss: 0.34491141844481044
Epoch: 37, step: 384, loss: 0.32245123386383057, mean loss: 0.34491100107011324
Epoch: 37, step: 385, loss: 0.34119951725006104, mean loss: 0.3449109321013724
Epoch: 37, step: 386, loss: 0.3338993787765503, mean loss: 0.34491072748270984
Epoch: 37, step: 387, loss: 0.3407024145126343, mean loss: 0.34491064928453513
Epoch: 37, step: 388, loss: 0.30862703919410706, mean loss: 0.344909975081029
Epoch: 37, step: 389, loss: 0.33002007007598877, mean loss: 0.3449096984095621
Epoch: 37, step: 390, loss: 0.3256150782108307, mean loss: 0.3449093399001101
Epoch: 37, step: 391, loss: 0.33483973145484924, mean loss: 0.34490915280221995
Epoch: 37, step: 392, loss: 0.32870757579803467, mean loss: 0.3449088517751672
Epoch: 37, step: 393, loss: 0.3542657792568207, mean loss: 0.3449090256246615
Epoch: 37, step: 394, loss: 0.28949952125549316, mean loss: 0.3449079961483341
Epoch: 37, step: 395, loss: 0.31551143527030945, mean loss: 0.34490744998749734
Epoch: 37, step: 396, loss: 0.3660443425178528, mean loss: 0.34490784268406083
Epoch: 37, step: 397, loss: 0.33941876888275146, mean loss: 0.3449077407059499
Epoch: 37, step: 398, loss: 0.3076632022857666, mean loss: 0.3449070487755354
Epoch: 37, step: 399, loss: 0.38278621435165405, mean loss: 0.3449077524830032
Epoch: 37, step: 400, loss: 0.3988487720489502, mean loss: 0.34490875456402953
Epoch: 37, step: 401, loss: 0.32503190636634827, mean loss: 0.3449083853117873
Epoch: 37, step: 402, loss: 0.319369375705719, mean loss: 0.3449079108823766
Epoch: 37, step: 403, loss: 0.3339861333370209, mean loss: 0.34490770799603493
Epoch: 37, step: 404, loss: 0.31993216276168823, mean loss: 0.3449072440511455
Epoch: 37, step: 405, loss: 0.3027275800704956, mean loss: 0.34490646053767854
Epoch: 37, step: 406, loss: 0.3362818658351898, mean loss: 0.3449063003334489
Epoch: 37, step: 407, loss: 0.33531492948532104, mean loss: 0.34490612217439454
Epoch: 37, step: 408, loss: 0.3298265337944031, mean loss: 0.34490584207727953
Epoch: 37, step: 409, loss: 0.3153204023838043, mean loss: 0.3449052925501854
Epoch: 37, step: 410, loss: 0.3336665630340576, mean loss: 0.34490508380318946
Epoch: 37, step: 411, loss: 0.3277711272239685, mean loss: 0.3449047655647686
Epoch: 37, step: 412, loss: 0.322083055973053, mean loss: 0.34490434169244844
Epoch: 37, step: 413, loss: 0.2929615080356598, mean loss: 0.3449033769654016
Epoch: 37, step: 414, loss: 0.3884294331073761, mean loss: 0.3449041853537927
Epoch: 37, step: 415, loss: 0.34865301847457886, mean loss: 0.34490425497776417
Epoch: 37, step: 416, loss: 0.31583499908447266, mean loss: 0.3449037151085861
Epoch: 37, step: 417, loss: 0.34554120898246765, mean loss: 0.34490372694779187
Epoch: 37, step: 418, loss: 0.323396235704422, mean loss: 0.3449033275292311
Epoch: 37, step: 419, loss: 0.32309791445732117, mean loss: 0.3449029225854435
Epoch: 37, step: 420, loss: 0.3169075548648834, mean loss: 0.3449024026989513
Epoch: 37, step: 421, loss: 0.3240160644054413, mean loss: 0.3449020148375159
Epoch: 37, step: 422, loss: 0.3297021985054016, mean loss: 0.34490173258061574
Epoch: 37, step: 423, loss: 0.33586129546165466, mean loss: 0.34490156470501004
Epoch: 37, step: 424, loss: 0.3285370469093323, mean loss: 0.34490126083117206
Epoch: 37, step: 425, loss: 0.35057222843170166, mean loss: 0.3449013661337977
Epoch: 37, step: 426, loss: 0.312058687210083, mean loss: 0.3449007562985192
Epoch: 37, step: 427, loss: 0.31152936816215515, mean loss: 0.3449001366574739
Epoch: 37, step: 428, loss: 0.31545066833496094, mean loss: 0.34489958984891933
Epoch: 37, step: 429, loss: 0.3605573773384094, mean loss: 0.3448998805724421
Epoch: 37, step: 430, loss: 0.36380890011787415, mean loss: 0.3449002316561894
Epoch: 37, step: 431, loss: 0.3280032277107239, mean loss: 0.3448999179353586
Epoch: 37, step: 432, loss: 0.36072584986686707, mean loss: 0.3449002117645102
Epoch: 37, step: 433, loss: 0.36778393387794495, mean loss: 0.3449006366228911
Epoch: 37, step: 434, loss: 0.3306432068347931, mean loss: 0.34490037192486483
Epoch: 37, step: 435, loss: 0.3745653033256531, mean loss: 0.34490092266248923
Epoch: 37, step: 436, loss: 0.3700622320175171, mean loss: 0.34490138978045737
Epoch: 37, step: 437, loss: 0.3230530917644501, mean loss: 0.34490098417584564
Epoch: 37, step: 438, loss: 0.3222130239009857, mean loss: 0.34490056299107064
Epoch: 37, step: 439, loss: 0.3302498757839203, mean loss: 0.3449002910172233
Epoch: 37, step: 440, loss: 0.30730071663856506, mean loss: 0.34489959303555706
Epoch: 37, step: 441, loss: 0.3537588119506836, mean loss: 0.34489975749107804
Epoch: 37, step: 442, loss: 0.31438350677490234, mean loss: 0.3448991910220926
Epoch: 37, step: 443, loss: 0.3391510844230652, mean loss: 0.3448990843227572
Epoch: 37, step: 444, loss: 0.28947576880455017, mean loss: 0.34489805554553077
Epoch: 37, step: 445, loss: 0.32410094141960144, mean loss: 0.34489766951304524
Epoch: 37, step: 446, loss: 0.3331952691078186, mean loss: 0.3448974522991166
Epoch: 37, step: 447, loss: 0.3084908425807953, mean loss: 0.34489677655092227
Epoch: 37, step: 448, loss: 0.3455897271633148, mean loss: 0.34489678941263713
Epoch: 37, step: 449, loss: 0.33435317873954773, mean loss: 0.34489659371846376
Epoch: 37, step: 450, loss: 0.3105064034461975, mean loss: 0.3448959554328558
Epoch: 37, step: 451, loss: 0.2766619324684143, mean loss: 0.34489468902559955
Epoch: 37, step: 452, loss: 0.35438576340675354, mean loss: 0.34489486517441603
Epoch: 37, step: 453, loss: 0.35929781198501587, mean loss: 0.34489513247976494
Epoch: 37, step: 454, loss: 0.3544572591781616, mean loss: 0.34489530994068396
Epoch: 37, step: 455, loss: 0.3229171931743622, mean loss: 0.3448949020623385
Epoch: 37, step: 456, loss: 0.32106950879096985, mean loss: 0.3448944599097307
Epoch: 37, step: 457, loss: 0.3492196202278137, mean loss: 0.3448945401747405
Epoch: 37, step: 458, loss: 0.32929834723472595, mean loss: 0.3448942507507062
Epoch: 37, step: 459, loss: 0.336736798286438, mean loss: 0.3448940993728027
Epoch: 37, step: 460, loss: 0.31611910462379456, mean loss: 0.34489356540492894
Epoch: 37, step: 461, loss: 0.31134718656539917, mean loss: 0.34489294290764116
Epoch: 37, step: 462, loss: 0.30145567655563354, mean loss: 0.34489213688685194
Epoch: 37, step: 463, loss: 0.32647204399108887, mean loss: 0.34489179509042767
Epoch: 37, step: 464, loss: 0.39107829332351685, mean loss: 0.34489265209408737
Epoch: 37, step: 465, loss: 0.3382713794708252, mean loss: 0.3448925292367633
Epoch: 37, step: 466, loss: 0.32479700446128845, mean loss: 0.34489215637240156
Epoch: 37, step: 467, loss: 0.3434821665287018, mean loss: 0.3448921302110938
Epoch: 37, step: 468, loss: 0.3769133985042572, mean loss: 0.3448927243307719
Epoch: 37, step: 469, loss: 0.35902929306030273, mean loss: 0.3448929866145065
Epoch: 37, step: 470, loss: 0.3616533875465393, mean loss: 0.3448932975739108
Epoch: 37, step: 471, loss: 0.3572625517845154, mean loss: 0.3448935270591466
Epoch: 37, step: 472, loss: 0.31954172253608704, mean loss: 0.3448930567189948
Epoch: 37, step: 473, loss: 0.3470933139324188, mean loss: 0.3448930975385787
Epoch: 37, step: 474, loss: 0.3362320363521576, mean loss: 0.3448929368599303
Epoch: 37, step: 475, loss: 0.3196943402290344, mean loss: 0.34489246938819107
Epoch: 37, step: 476, loss: 0.3557981252670288, mean loss: 0.3448926717007016
Epoch: 37, step: 477, loss: 0.3299493193626404, mean loss: 0.34489239448940157
Epoch: 37, step: 478, loss: 0.3616940379142761, mean loss: 0.3448927061677258
Epoch: 37, step: 479, loss: 0.3533889949321747, mean loss: 0.3448928637749226
Epoch: 37, step: 480, loss: 0.29689720273017883, mean loss: 0.34489197346604944
Epoch: 37, step: 481, loss: 0.3771836757659912, mean loss: 0.34489257245885785
Epoch: 37, step: 482, loss: 0.3495776951313019, mean loss: 0.34489265936362073
Epoch: 37, step: 483, loss: 0.3511641025543213, mean loss: 0.34489277569102816
Epoch: 37, step: 484, loss: 0.32898738980293274, mean loss: 0.3448924806715359
Epoch: 37, step: 485, loss: 0.3183467984199524, mean loss: 0.34489198830068135
Epoch: 37, step: 486, loss: 0.3272664248943329, mean loss: 0.3448916613867723
Epoch: 37, step: 487, loss: 0.3002128303050995, mean loss: 0.3448908327119618
Epoch: 37, step: 488, loss: 0.3670245409011841, mean loss: 0.34489124322642273
Epoch: 37, step: 489, loss: 0.304644912481308, mean loss: 0.3448904967905248
Epoch: 37, step: 490, loss: 0.33804622292518616, mean loss: 0.34489036985430815
Epoch: 37, step: 491, loss: 0.32040929794311523, mean loss: 0.34488991582849376
Epoch: 37, step: 492, loss: 0.315736323595047, mean loss: 0.3448893751561725
Epoch: 37, step: 493, loss: 0.3231081962585449, mean loss: 0.3448889712175408
Epoch: 37, step: 494, loss: 0.35433483123779297, mean loss: 0.34488914639065843
Epoch: 37, step: 495, loss: 0.3249242305755615, mean loss: 0.3448887761489142
Epoch: 37, step: 496, loss: 0.32005923986434937, mean loss: 0.34488831570317874
Epoch: 37, step: 497, loss: 0.3426464796066284, mean loss: 0.3448882741307258
Epoch: 37, step: 498, loss: 0.3226354420185089, mean loss: 0.3448878614834042
Epoch: 37, step: 499, loss: 0.36149662733078003, mean loss: 0.34488816946378265
Epoch: 37, step: 500, loss: 0.3421889543533325, mean loss: 0.34488811941250946
Epoch: 37, step: 501, loss: 0.33191823959350586, mean loss: 0.34488787891779743
Epoch: 37, step: 502, loss: 0.3147795498371124, mean loss: 0.3448873206427964
Epoch: 37, step: 503, loss: 0.3116379678249359, mean loss: 0.3448867041377008
Epoch: 37, step: 504, loss: 0.36913248896598816, mean loss: 0.3448871536914958
Epoch: 37, step: 505, loss: 0.3333544135093689, mean loss: 0.34488693986088464
Epoch: 37, step: 506, loss: 0.35503706336021423, mean loss: 0.34488712805266175
Epoch: 37, step: 507, loss: 0.3606020212173462, mean loss: 0.3448874194145196
Epoch: 37, step: 508, loss: 0.3266485631465912, mean loss: 0.34488708126341244
Epoch: 37, step: 509, loss: 0.361406534910202, mean loss: 0.3448873875308611
Epoch: 37, step: 510, loss: 0.3250270187854767, mean loss: 0.3448870193303245
Epoch: 37, step: 511, loss: 0.37131747603416443, mean loss: 0.34488750932766793
Epoch: 37, step: 512, loss: 0.34485936164855957, mean loss: 0.34488750880584446
Epoch: 37, step: 513, loss: 0.31335878372192383, mean loss: 0.3448869243127763
Epoch: 37, step: 514, loss: 0.32096150517463684, mean loss: 0.3448864807812868
Epoch: 37, step: 515, loss: 0.32392245531082153, mean loss: 0.34488609215557364
Epoch: 37, step: 516, loss: 0.32205015420913696, mean loss: 0.34488566883667576
Epoch: 37, step: 517, loss: 0.3700597584247589, mean loss: 0.3448861354901735
Epoch: 37, step: 518, loss: 0.3077605962753296, mean loss: 0.3448854473047468
Epoch: 37, step: 519, loss: 0.29462310671806335, mean loss: 0.3448845156234873
Epoch: 37, step: 520, loss: 0.3222898542881012, mean loss: 0.34488409680828525
Epoch: 37, step: 521, loss: 0.3088034987449646, mean loss: 0.3448834280298225
Epoch: 37, step: 522, loss: 0.32867109775543213, mean loss: 0.3448831275288073
Epoch: 37, step: 523, loss: 0.32831209897994995, mean loss: 0.34488282038489143
Epoch: 37, step: 524, loss: 0.3641822636127472, mean loss: 0.3448831780933271
Epoch: 37, step: 525, loss: 0.3222636878490448, mean loss: 0.3448827588567507
Epoch: 37, step: 526, loss: 0.363097220659256, mean loss: 0.3448830964429207
Epoch: 37, step: 527, loss: 0.3238930106163025, mean loss: 0.34488270742064653
Epoch: 37, step: 528, loss: 0.36965930461883545, mean loss: 0.34488316661217305
Epoch: 37, step: 529, loss: 0.36291155219078064, mean loss: 0.34488350073103546
Epoch: 37, step: 530, loss: 0.3254758417606354, mean loss: 0.34488314105685747
Epoch: 37, step: 531, loss: 0.3605468273162842, mean loss: 0.3448834313401462
Epoch: 37, step: 532, loss: 0.31772130727767944, mean loss: 0.34488292797430675
Epoch: 37, step: 533, loss: 0.32843369245529175, mean loss: 0.34488262314432416
Epoch: 37, step: 534, loss: 0.31653690338134766, mean loss: 0.3448820978636733
Epoch: 37, step: 535, loss: 0.31958404183387756, mean loss: 0.3448816290686242
Epoch: 37, step: 536, loss: 0.30943915247917175, mean loss: 0.34488097230078224
Epoch: 37, step: 537, loss: 0.3131771385669708, mean loss: 0.3448803848228566
Epoch: 37, step: 538, loss: 0.33787569403648376, mean loss: 0.3448802550270409
Epoch: 37, step: 539, loss: 0.322421133518219, mean loss: 0.3448798388707722
Epoch: 37, step: 540, loss: 0.367102712392807, mean loss: 0.3448802506418542
Epoch: 37, step: 541, loss: 0.3509399890899658, mean loss: 0.3448803629216105
Epoch: 37, step: 542, loss: 0.33960720896720886, mean loss: 0.34488026521814097
Epoch: 37, step: 543, loss: 0.31978750228881836, mean loss: 0.3448798002962754
Epoch: 37, step: 544, loss: 0.353119820356369, mean loss: 0.3448799529655741
Epoch: 37, step: 545, loss: 0.3470650315284729, mean loss: 0.34487999344948417
Epoch: 37, step: 546, loss: 0.33194470405578613, mean loss: 0.3448797537961374
Epoch: 37, step: 547, loss: 0.3216054439544678, mean loss: 0.3448793225987563
Epoch: 37, step: 548, loss: 0.3662395477294922, mean loss: 0.3448797183270319
Epoch: 37, step: 549, loss: 0.3215144872665405, mean loss: 0.3448792854612151
Epoch: 37, step: 550, loss: 0.34557339549064636, mean loss: 0.3448792983201052
Epoch: 37, step: 551, loss: 0.3174493610858917, mean loss: 0.34487879017010087
Epoch: 37, step: 552, loss: 0.3146560490131378, mean loss: 0.3448782302927152
Epoch: 37, step: 553, loss: 0.35117265582084656, mean loss: 0.34487834689501834
Epoch: 37, step: 554, loss: 0.3590462803840637, mean loss: 0.3448786093467807
Epoch: 37, step: 555, loss: 0.31894540786743164, mean loss: 0.34487812895997205
Epoch: 37, step: 556, loss: 0.33129599690437317, mean loss: 0.34487787736912173
Epoch: 37, step: 557, loss: 0.3813791871070862, mean loss: 0.34487855349459384
Epoch: 37, step: 558, loss: 0.32342660427093506, mean loss: 0.3448781561406156
Epoch: 37, step: 559, loss: 0.316739022731781, mean loss: 0.34487763492972784
Epoch: 37, step: 560, loss: 0.30616214871406555, mean loss: 0.3448769178302036
Epoch: 37, step: 561, loss: 0.3474201560020447, mean loss: 0.34487696493593006
Epoch: 37, step: 562, loss: 0.3073429763317108, mean loss: 0.34487626974620206
Epoch: 37, step: 563, loss: 0.3433324098587036, mean loss: 0.34487624115196797
Epoch: 37, step: 564, loss: 0.32475388050079346, mean loss: 0.34487586846734863
Epoch: 37, step: 565, loss: 0.33810028433799744, mean loss: 0.34487574297962537
Epoch: 37, step: 566, loss: 0.34401267766952515, mean loss: 0.34487572699545443
Epoch: 37, step: 567, loss: 0.3168277144432068, mean loss: 0.3448752075493371
Epoch: 37, step: 568, loss: 0.33121681213378906, mean loss: 0.34487495460203604
Epoch: 37, step: 569, loss: 0.338534951210022, mean loss: 0.3448748371902172
Epoch: 37, step: 570, loss: 0.32232388854026794, mean loss: 0.3448744195723234
Epoch: 37, step: 571, loss: 0.3307238519191742, mean loss: 0.34487415752477424
Epoch: 37, step: 572, loss: 0.32910123467445374, mean loss: 0.3448738654390193
Epoch: 37, step: 573, loss: 0.3494771420955658, mean loss: 0.3448739506817262
Epoch: 37, step: 574, loss: 0.34863409399986267, mean loss: 0.34487402031014164
Epoch: 37, step: 575, loss: 0.3608173131942749, mean loss: 0.3448743155344377
Epoch: 37, step: 576, loss: 0.33776524662971497, mean loss: 0.3448741838972022
Epoch: 37, step: 577, loss: 0.31694093346595764, mean loss: 0.3448736666722563
Epoch: 37, step: 578, loss: 0.3307822644710541, mean loss: 0.34487340575418635
Epoch: 37, step: 579, loss: 0.3042125701904297, mean loss: 0.3448726528872858
Epoch: 37, step: 580, loss: 0.3247215151786804, mean loss: 0.3448722797802535
Epoch: 37, step: 581, loss: 0.31979045271873474, mean loss: 0.3448718153879731
Epoch: 37, step: 582, loss: 0.3015262186527252, mean loss: 0.3448710128552162
Epoch: 37, step: 583, loss: 0.33659735321998596, mean loss: 0.34487085967333747
Epoch: 37, step: 584, loss: 0.32535138726234436, mean loss: 0.3448704982886262
Epoch: 37, step: 585, loss: 0.32019078731536865, mean loss: 0.3448700413754005
Epoch: 37, step: 586, loss: 0.3270162045955658, mean loss: 0.3448697108406087
Epoch: 37, step: 587, loss: 0.35366207361221313, mean loss: 0.34486987361391236
Epoch: 37, step: 588, loss: 0.3518162667751312, mean loss: 0.3448700022103387
Epoch: 37, step: 589, loss: 0.3193707764148712, mean loss: 0.34486953015980376
Epoch: 37, step: 590, loss: 0.31214120984077454, mean loss: 0.3448689242929732
Epoch: 37, step: 591, loss: 0.3146628141403198, mean loss: 0.3448683651276612
Epoch: 37, step: 592, loss: 0.32669585943222046, mean loss: 0.3448680287305991
Epoch: 37, step: 593, loss: 0.3957204520702362, mean loss: 0.34486897005863837
Epoch: 37, step: 594, loss: 0.3433338701725006, mean loss: 0.34486894164296567
Epoch: 37, step: 595, loss: 0.3069588541984558, mean loss: 0.34486823991618787
Epoch: 37, step: 596, loss: 0.28148460388183594, mean loss: 0.34486706668831124
Epoch: 37, step: 597, loss: 0.3255930244922638, mean loss: 0.3448667099333748
Epoch: 37, step: 598, loss: 0.3463708758354187, mean loss: 0.34486673777437843
Epoch: 37, step: 599, loss: 0.33369383215904236, mean loss: 0.3448665309759477
Epoch: 37, step: 600, loss: 0.3353555202484131, mean loss: 0.34486635494065687
Epoch: 37, step: 601, loss: 0.34359124302864075, mean loss: 0.3448663313405845
Epoch: 37, step: 602, loss: 0.33771151304244995, mean loss: 0.34486619891996856
Epoch: 37, step: 603, loss: 0.3225674629211426, mean loss: 0.34486578622497305
Epoch: 37, step: 604, loss: 0.3423866033554077, mean loss: 0.3448657403422186
Epoch: 37, step: 605, loss: 0.3829529881477356, mean loss: 0.34486644521781185
Epoch: 37, step: 606, loss: 0.3745104670524597, mean loss: 0.34486699382560004
Epoch: 37, step: 607, loss: 0.3883054852485657, mean loss: 0.3448677977061875
Epoch: 37, step: 608, loss: 0.2881292998790741, mean loss: 0.3448667477127047
Epoch: 37, step: 609, loss: 0.39643368124961853, mean loss: 0.3448677019843938
Epoch: 37, step: 610, loss: 0.3697327673435211, mean loss: 0.34486816211624965
Epoch: 37, step: 611, loss: 0.33137238025665283, mean loss: 0.34486791237935366
Epoch: 37, step: 612, loss: 0.3061981797218323, mean loss: 0.3448671968164911
Epoch: 37, step: 613, loss: 0.339782178401947, mean loss: 0.3448671027226675
Epoch: 37, step: 614, loss: 0.36336004734039307, mean loss: 0.3448674449121207
Epoch: 37, step: 615, loss: 0.3642945885658264, mean loss: 0.3448678043811395
Epoch: 37, step: 616, loss: 0.31619173288345337, mean loss: 0.3448672737849419
Epoch: 37, step: 617, loss: 0.3223787248134613, mean loss: 0.34486685768478703
Epoch: 37, step: 618, loss: 0.31777623295783997, mean loss: 0.3448663564428175
Epoch: 37, step: 619, loss: 0.32080331444740295, mean loss: 0.34486591122667637
Epoch: 37, step: 620, loss: 0.31765681505203247, mean loss: 0.3448654078113278
Epoch: 37, step: 621, loss: 0.31260037422180176, mean loss: 0.3448648108634353
Epoch: 37, step: 622, loss: 0.3250390291213989, mean loss: 0.344864444065749
Epoch: 37, step: 623, loss: 0.34574201703071594, mean loss: 0.34486446030146584
Epoch: 37, step: 624, loss: 0.30403903126716614, mean loss: 0.34486370501630065
Epoch: 37, step: 625, loss: 0.326734334230423, mean loss: 0.3448633696226057
Epoch: 37, step: 626, loss: 0.3115571439266205, mean loss: 0.34486275346821305
Epoch: 37, step: 627, loss: 0.3247789442539215, mean loss: 0.3448623819311179
Epoch: 37, step: 628, loss: 0.350155770778656, mean loss: 0.3448624798534748
Epoch: 37, step: 629, loss: 0.3603404760360718, mean loss: 0.34486276617550266
Epoch: 37, step: 630, loss: 0.336196631193161, mean loss: 0.3448626058666737
Epoch: 37, step: 631, loss: 0.35226160287857056, mean loss: 0.34486274273306317
Epoch: 37, step: 632, loss: 0.34750086069107056, mean loss: 0.34486279153197474
Epoch: 37, step: 633, loss: 0.32720938324928284, mean loss: 0.3448624649919229
Epoch: 37, step: 634, loss: 0.30649587512016296, mean loss: 0.3448617553274598
Epoch: 37, step: 635, loss: 0.3334375023841858, mean loss: 0.34486154401766134
Epoch: 37, step: 636, loss: 0.28528088331222534, mean loss: 0.34486044199859717
Epoch: 37, step: 637, loss: 0.32394319772720337, mean loss: 0.3448600551150794
Epoch: 37, step: 638, loss: 0.3420056998729706, mean loss: 0.3448600023221513
Epoch: 37, step: 639, loss: 0.3423650860786438, mean loss: 0.34485995617810594
Epoch: 37, step: 640, loss: 0.3094961941242218, mean loss: 0.34485930212935245
Epoch: 37, step: 641, loss: 0.33659976720809937, mean loss: 0.34485914937301954
Epoch: 37, step: 642, loss: 0.31514498591423035, mean loss: 0.34485859983327627
Epoch: 37, step: 643, loss: 0.35338473320007324, mean loss: 0.34485875751439343
Epoch: 37, step: 644, loss: 0.3677629828453064, mean loss: 0.34485918109409736
Epoch: 37, step: 645, loss: 0.33340466022491455, mean loss: 0.34485896926362675
Epoch: 37, step: 646, loss: 0.33786383271217346, mean loss: 0.3448588399037275
Epoch: 37, step: 647, loss: 0.3144688308238983, mean loss: 0.34485827791672624
Epoch: 37, step: 648, loss: 0.351420134305954, mean loss: 0.3448583992595594
Epoch: 37, step: 649, loss: 0.30759724974632263, mean loss: 0.34485771023353196
Epoch: 37, step: 650, loss: 0.31837528944015503, mean loss: 0.34485722053474327
Epoch: 37, step: 651, loss: 0.3099795877933502, mean loss: 0.34485657560810234
Epoch: 37, step: 652, loss: 0.3363972008228302, mean loss: 0.3448564191876444
Epoch: 37, step: 653, loss: 0.3008200228214264, mean loss: 0.3448556049352801
Epoch: 37, step: 654, loss: 0.3360889256000519, mean loss: 0.3448554428385152
Epoch: 37, step: 655, loss: 0.30869704484939575, mean loss: 0.34485477427853467
Epoch: 37, step: 656, loss: 0.4519251883029938, mean loss: 0.34485675394783344
Epoch: 37, step: 657, loss: 0.3031007945537567, mean loss: 0.34485598191885375
Epoch: 37, step: 658, loss: 0.3053850531578064, mean loss: 0.3448552521514649
Epoch: 37, step: 659, loss: 0.33007439970970154, mean loss: 0.34485497887731087
Epoch: 37, step: 660, loss: 0.3676975667476654, mean loss: 0.3448554011921599
Epoch: 37, step: 661, loss: 0.37375038862228394, mean loss: 0.344855935394183
Epoch: 37, step: 662, loss: 0.37607526779174805, mean loss: 0.34485651255734134
Epoch: 37, step: 663, loss: 0.3780438303947449, mean loss: 0.34485712609202
Epoch: 37, step: 664, loss: 0.32206255197525024, mean loss: 0.3448567046960147
Epoch: 37, step: 665, loss: 0.3198143243789673, mean loss: 0.3448562417540929
Epoch: 37, step: 666, loss: 0.3257434070110321, mean loss: 0.34485588843428994
Epoch: 37, step: 667, loss: 0.34032195806503296, mean loss: 0.34485580462161675
Epoch: 37, step: 668, loss: 0.31439894437789917, mean loss: 0.3448552416170094
Epoch: 37, step: 669, loss: 0.3497055768966675, mean loss: 0.34485533127531987
Epoch: 37, step: 670, loss: 0.3840421140193939, mean loss: 0.34485605562850097
Epoch: 37, step: 671, loss: 0.32019010186195374, mean loss: 0.344855599695899
Epoch: 37, step: 672, loss: 0.31609046459198, mean loss: 0.3448550680026752
Epoch: 37, step: 673, loss: 0.37390971183776855, mean loss: 0.3448556050372365
Epoch: 37, step: 674, loss: 0.38248035311698914, mean loss: 0.3448563004653658
Epoch: 37, step: 675, loss: 0.33267199993133545, mean loss: 0.3448560752638921
Epoch: 37, step: 676, loss: 0.3345213830471039, mean loss: 0.3448558842521147
Epoch: 37, step: 677, loss: 0.3173322379589081, mean loss: 0.34485537555351764
Epoch: 37, step: 678, loss: 0.33436548709869385, mean loss: 0.34485518168047985
Epoch: 37, step: 679, loss: 0.3415960669517517, mean loss: 0.3448551214469704
Epoch: 37, step: 680, loss: 0.3138974606990814, mean loss: 0.3448545493118219
Epoch: 37, step: 681, loss: 0.3081623613834381, mean loss: 0.3448538712081825
Epoch: 37, step: 682, loss: 0.3906124532222748, mean loss: 0.344854716851065
Epoch: 37, step: 683, loss: 0.32198116183280945, mean loss: 0.34485429414343977
Epoch: 37, step: 684, loss: 0.33380502462387085, mean loss: 0.3448540899546216
Epoch: 37, step: 685, loss: 0.33497369289398193, mean loss: 0.34485390736976257
Epoch: 37, step: 686, loss: 0.33295542001724243, mean loss: 0.3448536874956546
Epoch: 37, step: 687, loss: 0.3208082914352417, mean loss: 0.34485324316503035
Epoch: 37, step: 688, loss: 0.3340538442134857, mean loss: 0.3448530436085333
Epoch: 37, step: 689, loss: 0.3030564785003662, mean loss: 0.3448522712857367
Epoch: 37, step: 690, loss: 0.31535089015960693, mean loss: 0.34485172616514825
Epoch: 37, step: 691, loss: 0.34555739164352417, mean loss: 0.34485173920405215
Epoch: 37, step: 692, loss: 0.33110156655311584, mean loss: 0.3448514851405158
Epoch: 37, step: 693, loss: 0.36141839623451233, mean loss: 0.34485179124359944
Epoch: 37, step: 694, loss: 0.3503651022911072, mean loss: 0.3448518931099233
Epoch: 37, step: 695, loss: 0.32249119877815247, mean loss: 0.3448514799716791
Epoch: 37, step: 696, loss: 0.37843188643455505, mean loss: 0.34485210039489317
Epoch: 37, step: 697, loss: 0.337457537651062, mean loss: 0.3448519637773204
Epoch: 37, step: 698, loss: 0.3183393180370331, mean loss: 0.34485147395439025
Epoch: 37, step: 699, loss: 0.41633519530296326, mean loss: 0.3448527945965967
Epoch: 37, step: 700, loss: 0.3332177400588989, mean loss: 0.3448525796461166
Epoch: 37, step: 701, loss: 0.34347036480903625, mean loss: 0.34485255411101895
Epoch: 37, step: 702, loss: 0.35490304231643677, mean loss: 0.3448527397807499
Epoch: 37, step: 703, loss: 0.31848254799842834, mean loss: 0.34485225263466657
Epoch: 37, step: 704, loss: 0.364762544631958, mean loss: 0.3448526204378919
Epoch: 37, step: 705, loss: 0.3147881031036377, mean loss: 0.34485206506571664
Epoch: 37, step: 706, loss: 0.3121455907821655, mean loss: 0.34485146090067953
Epoch: 37, step: 707, loss: 0.31075528264045715, mean loss: 0.34485083107619563
Epoch: 37, step: 708, loss: 0.3403441309928894, mean loss: 0.34485074782998537
Epoch: 37, step: 709, loss: 0.30966803431510925, mean loss: 0.34485009795903493
Epoch: 37, step: 710, loss: 0.3734881579875946, mean loss: 0.34485062693186463
Epoch: 37, step: 711, loss: 0.33828166127204895, mean loss: 0.34485050559891933
Epoch: 37, step: 712, loss: 0.3178984522819519, mean loss: 0.34485000778666397
Epoch: 37, step: 713, loss: 0.3694072961807251, mean loss: 0.3448504613585378
Epoch: 37, step: 714, loss: 0.36040198802948, mean loss: 0.3448507485891433
Epoch: 37, step: 715, loss: 0.30677539110183716, mean loss: 0.3448500453651944
Epoch: 37, step: 716, loss: 0.332379013299942, mean loss: 0.34484981503862566
Epoch: 37, step: 717, loss: 0.32443252205848694, mean loss: 0.3448494379601161
Epoch: 37, step: 718, loss: 0.31819605827331543, mean loss: 0.3448489457190005
Epoch: 37, step: 719, loss: 0.3426617980003357, mean loss: 0.34484890532696905
Epoch: 37, step: 720, loss: 0.3304789960384369, mean loss: 0.3448486399497822
Epoch: 37, step: 721, loss: 0.31731924414634705, mean loss: 0.34484813155835464
Epoch: 37, step: 722, loss: 0.3523859977722168, mean loss: 0.34484827075922286
Epoch: 37, step: 723, loss: 0.30065375566482544, mean loss: 0.34484745463950256
Epoch: 37, step: 724, loss: 0.31916263699531555, mean loss: 0.34484698033858396
Epoch: 37, step: 725, loss: 0.39024868607521057, mean loss: 0.3448478187199729
Epoch: 37, step: 726, loss: 0.31493592262268066, mean loss: 0.3448472663813874
Epoch: 37, step: 727, loss: 0.35848841071128845, mean loss: 0.3448475182675003
Epoch: 37, step: 728, loss: 0.34885111451148987, mean loss: 0.34484759219323924
Epoch: 37, step: 729, loss: 0.3320934474468231, mean loss: 0.3448473566944256
Epoch: 37, step: 730, loss: 0.2980739176273346, mean loss: 0.34484649306254417
Epoch: 37, step: 731, loss: 0.3168518543243408, mean loss: 0.34484597617482743
Epoch: 37, step: 732, loss: 0.3209031820297241, mean loss: 0.3448455341077654
Epoch: 37, step: 733, loss: 0.3436714708805084, mean loss: 0.34484551243088446
Epoch: 37, step: 734, loss: 0.3505595326423645, mean loss: 0.3448456179276297
Epoch: 37, step: 735, loss: 0.33833950757980347, mean loss: 0.3448454978089097
Epoch: 37, step: 736, loss: 0.3319414258003235, mean loss: 0.3448452595725577
Epoch: 37, step: 737, loss: 0.30943891406059265, mean loss: 0.34484460590890315
Epoch: 37, step: 738, loss: 0.31172263622283936, mean loss: 0.3448439944301488
Epoch: 37, step: 739, loss: 0.3709271252155304, mean loss: 0.3448444759530181
Epoch: 37, step: 740, loss: 0.38011860847473145, mean loss: 0.3448451271397212
Epoch: 37, step: 741, loss: 0.3159453272819519, mean loss: 0.34484459363778547
Epoch: 37, step: 742, loss: 0.3553656339645386, mean loss: 0.3448447878568386
Epoch: 37, step: 743, loss: 0.3325318992137909, mean loss: 0.3448445605643509
Epoch: 37, step: 744, loss: 0.3073427677154541, mean loss: 0.34484386830450103
Epoch: 37, step: 745, loss: 0.30704766511917114, mean loss: 0.3448431706228976
Epoch: 37, step: 746, loss: 0.31671416759490967, mean loss: 0.34484265139810705
Epoch: 37, step: 747, loss: 0.31896960735321045, mean loss: 0.34484217382419896
Epoch: 37, step: 748, loss: 0.37876370549201965, mean loss: 0.34484279994841527
Epoch: 37, step: 749, loss: 0.37193742394447327, mean loss: 0.3448433000522212
Epoch: 37, step: 750, loss: 0.33584681153297424, mean loss: 0.34484313400101096
Epoch: 37, step: 751, loss: 0.33916082978248596, mean loss: 0.3448430291227493
Epoch: 37, step: 752, loss: 0.3029564917087555, mean loss: 0.34484225603739804
Epoch: 37, step: 753, loss: 0.30174723267555237, mean loss: 0.3448414606621191
Epoch: 37, step: 754, loss: 0.31882208585739136, mean loss: 0.34484098044923306
Epoch: 37, step: 755, loss: 0.3471457362174988, mean loss: 0.3448410229849589
Epoch: 37, step: 756, loss: 0.3840283751487732, mean loss: 0.34484174619898794
Epoch: 37, step: 757, loss: 0.3223418891429901, mean loss: 0.344841330965218
Epoch: 37, step: 758, loss: 0.3619022071361542, mean loss: 0.3448416458170491
Epoch: 37, step: 759, loss: 0.3447439968585968, mean loss: 0.34484164401500883
Epoch: 37, step: 760, loss: 0.34455883502960205, mean loss: 0.34484163879607166
Epoch: 37, step: 761, loss: 0.3395480513572693, mean loss: 0.34484154111038356
Epoch: 37, step: 762, loss: 0.29908862709999084, mean loss: 0.34484069682048285
Epoch: 37, step: 763, loss: 0.33853355050086975, mean loss: 0.3448405804352909
Epoch: 37, step: 764, loss: 0.31386759877204895, mean loss: 0.3448400089042507
Epoch: 37, step: 765, loss: 0.34782734513282776, mean loss: 0.3448400640272575
Epoch: 37, step: 766, loss: 0.35857683420181274, mean loss: 0.34484031749658445
Epoch: 37, step: 767, loss: 0.37515825033187866, mean loss: 0.344840876909324
Epoch: 37, step: 768, loss: 0.406237930059433, mean loss: 0.3448420097589864
Epoch: 37, step: 769, loss: 0.35045409202575684, mean loss: 0.34484211330676057
Epoch: 37, step: 770, loss: 0.3070467412471771, mean loss: 0.3448414159623066
Epoch: 37, step: 771, loss: 0.3608669936656952, mean loss: 0.344841711637172
Epoch: 37, step: 772, loss: 0.3370320200920105, mean loss: 0.3448415675495805
Epoch: 37, step: 773, loss: 0.382829487323761, mean loss: 0.34484226840784726
Epoch: 37, step: 774, loss: 0.3832353949546814, mean loss: 0.3448429767289097
Epoch: 37, step: 775, loss: 0.32626914978027344, mean loss: 0.3448426340636645
Epoch: 37, step: 776, loss: 0.3203757703304291, mean loss: 0.34484218268715433
Epoch: 37, step: 777, loss: 0.3724002242088318, mean loss: 0.3448426910818251
Epoch: 37, step: 778, loss: 0.28784239292144775, mean loss: 0.34484163955161384
Epoch: 37, step: 779, loss: 0.3026876747608185, mean loss: 0.34484086191796587
Epoch: 37, step: 780, loss: 0.3495999574661255, mean loss: 0.34484094970957885
Epoch: 37, step: 781, loss: 0.28972476720809937, mean loss: 0.3448399329934287
Epoch: 37, step: 782, loss: 0.3264588713645935, mean loss: 0.34483959392826424
Epoch: 37, step: 783, loss: 0.3076938986778259, mean loss: 0.3448389087350367
Epoch: 37, step: 784, loss: 0.33511462807655334, mean loss: 0.34483872936328713
Epoch: 37, step: 785, loss: 0.36878541111946106, mean loss: 0.34483917106988976
Epoch: 37, step: 786, loss: 0.35701489448547363, mean loss: 0.3448393956520795
Epoch: 37, step: 787, loss: 0.3771982192993164, mean loss: 0.34483999250215414
Epoch: 37, step: 788, loss: 0.34775927662849426, mean loss: 0.34484004634659643
Epoch: 37, step: 789, loss: 0.3474436104297638, mean loss: 0.34484009436688645
Epoch: 37, step: 790, loss: 0.3239416480064392, mean loss: 0.3448397089218144
Epoch: 37, step: 791, loss: 0.3294190764427185, mean loss: 0.34483942451324784
Epoch: 37, step: 792, loss: 0.33304131031036377, mean loss: 0.3448392069201713
Epoch: 37, step: 793, loss: 0.3232671916484833, mean loss: 0.34483880907399683
Epoch: 37, step: 794, loss: 0.32448476552963257, mean loss: 0.3448384336974307
Epoch: 37, step: 795, loss: 0.3363267779350281, mean loss: 0.3448382767253194
Epoch: 37, step: 796, loss: 0.35119640827178955, mean loss: 0.3448383939799353
Epoch: 37, step: 797, loss: 0.3440433442592621, mean loss: 0.3448383793181546
Epoch: 37, step: 798, loss: 0.3371071517467499, mean loss: 0.3448382367466022
Epoch: 37, step: 799, loss: 0.32989999651908875, mean loss: 0.3448379612756236
Epoch: 37, step: 800, loss: 0.35340815782546997, mean loss: 0.34483811931277253
Epoch: 37, step: 801, loss: 0.3567068576812744, mean loss: 0.3448383381720454
Epoch: 37, step: 802, loss: 0.29552021622657776, mean loss: 0.3448374287637375
Epoch: 37, step: 803, loss: 0.3607608377933502, mean loss: 0.3448377223802191
Epoch: 37, step: 804, loss: 0.3507382571697235, mean loss: 0.3448378311799313
Epoch: 37, step: 805, loss: 0.3210020661354065, mean loss: 0.3448373916813687
Epoch: 37, step: 806, loss: 0.3315703868865967, mean loss: 0.34483714706064783
Epoch: 37, step: 807, loss: 0.3494235873222351, mean loss: 0.34483723162514857
Epoch: 37, step: 808, loss: 0.3314135670661926, mean loss: 0.3448369841250184
Epoch: 37, step: 809, loss: 0.330881804227829, mean loss: 0.344836726829766
Epoch: 37, step: 810, loss: 0.3246127963066101, mean loss: 0.3448363539628156
Epoch: 37, step: 811, loss: 0.32922908663749695, mean loss: 0.3448360662182115
Epoch: 37, step: 812, loss: 0.323535680770874, mean loss: 0.34483567351923017
Epoch: 37, step: 813, loss: 0.34285974502563477, mean loss: 0.34483563709121323
Epoch: 37, step: 814, loss: 0.33303308486938477, mean loss: 0.34483541950457125
Epoch: 37, step: 815, loss: 0.33287763595581055, mean loss: 0.34483519906021703
Epoch: 37, step: 816, loss: 0.32664918899536133, mean loss: 0.3448348638033258
Epoch: 37, step: 817, loss: 0.33863565325737, mean loss: 0.3448347495237375
Epoch: 37, step: 818, loss: 0.34846553206443787, mean loss: 0.34483481645430586
Epoch: 37, step: 819, loss: 0.3426153063774109, mean loss: 0.34483477554016934
Epoch: 37, step: 820, loss: 0.35953137278556824, mean loss: 0.3448350464501814
Epoch: 37, step: 821, loss: 0.34767329692840576, mean loss: 0.3448350987681626
Epoch: 37, step: 822, loss: 0.37305712699890137, mean loss: 0.34483561898029197
Epoch: 37, step: 823, loss: 0.3080487847328186, mean loss: 0.34483494090696293
Epoch: 37, step: 824, loss: 0.3131219446659088, mean loss: 0.34483435636792836
Epoch: 37, step: 825, loss: 0.35707888007164, mean loss: 0.3448345820567938
Epoch: 37, step: 826, loss: 0.3223598599433899, mean loss: 0.34483416781438087
Epoch: 37, step: 827, loss: 0.3276884853839874, mean loss: 0.34483385179988607
Epoch: 37, step: 828, loss: 0.33885133266448975, mean loss: 0.3448337415372631
Epoch: 37, step: 829, loss: 0.29947879910469055, mean loss: 0.34483290562472607
Epoch: 37, step: 830, loss: 0.3077630400657654, mean loss: 0.34483222242257416
Epoch: 37, step: 831, loss: 0.2836022973060608, mean loss: 0.34483109396837003
Epoch: 37, step: 832, loss: 0.31441253423690796, mean loss: 0.344830533371261
Epoch: 37, step: 833, loss: 0.32960060238838196, mean loss: 0.3448302526972906
Epoch: 37, step: 834, loss: 0.3468500077724457, mean loss: 0.34483028991887943
Epoch: 37, step: 835, loss: 0.31872794032096863, mean loss: 0.3448298088937136
Epoch: 37, step: 836, loss: 0.3427106738090515, mean loss: 0.34482976984211344
Epoch: 37, step: 837, loss: 0.2929041087627411, mean loss: 0.34482881296928186
Epoch: 37, step: 838, loss: 0.31877776980400085, mean loss: 0.3448283329161526
Epoch: 37, step: 839, loss: 0.3275599777698517, mean loss: 0.34482801471103824
Epoch: 37, step: 840, loss: 0.336892306804657, mean loss: 0.34482786848192204
Epoch: 37, step: 841, loss: 0.330522745847702, mean loss: 0.3448276048902022
Epoch: 37, step: 842, loss: 0.34011510014533997, mean loss: 0.344827518057368
Epoch: 37, step: 843, loss: 0.3840312659740448, mean loss: 0.3448282404141619
Epoch: 37, step: 844, loss: 0.31553030014038086, mean loss: 0.34482770058882933
Epoch: 37, step: 845, loss: 0.34242916107177734, mean loss: 0.34482765639567026
Epoch: 37, step: 846, loss: 0.2981872856616974, mean loss: 0.34482679706134073
Epoch: 37, step: 847, loss: 0.2884121835231781, mean loss: 0.3448257576587772
Epoch: 37, step: 848, loss: 0.32847678661346436, mean loss: 0.3448254564451684
Epoch: 37, step: 849, loss: 0.4212464690208435, mean loss: 0.34482686440074106
Epoch: 37, step: 850, loss: 0.33228617906570435, mean loss: 0.34482663335954034
Epoch: 37, step: 851, loss: 0.30982834100723267, mean loss: 0.34482598858628405
Epoch: 37, step: 852, loss: 0.3620559275150299, mean loss: 0.3448263060074614
Epoch: 37, step: 853, loss: 0.324778288602829, mean loss: 0.3448259366766076
Epoch: 37, step: 854, loss: 0.3074050843715668, mean loss: 0.34482524731064945
Epoch: 37, step: 855, loss: 0.3705607056617737, mean loss: 0.34482572139985346
Epoch: 37, step: 856, loss: 0.3257121443748474, mean loss: 0.3448253693030123
Epoch: 37, step: 857, loss: 0.3305075466632843, mean loss: 0.344825105555036
Epoch: 37, step: 858, loss: 0.359848290681839, mean loss: 0.3448253822913656
Epoch: 37, step: 859, loss: 0.32697275280952454, mean loss: 0.34482505344098463
Epoch: 37, step: 860, loss: 0.3545284569263458, mean loss: 0.3448252321770727
Epoch: 37, step: 861, loss: 0.3108174502849579, mean loss: 0.344824605767386
Epoch: 37, step: 862, loss: 0.3152468800544739, mean loss: 0.3448240609675902
Epoch: 37, step: 863, loss: 0.30962663888931274, mean loss: 0.3448234126690918
Epoch: 37, step: 864, loss: 0.34794431924819946, mean loss: 0.34482347015176135
Epoch: 37, step: 865, loss: 0.3754331171512604, mean loss: 0.3448240339276298
Epoch: 37, step: 866, loss: 0.3218635022640228, mean loss: 0.3448236110428031
Epoch: 37, step: 867, loss: 0.3457179367542267, mean loss: 0.3448236275141032
Epoch: 37, step: 868, loss: 0.3070962727069855, mean loss: 0.3448229326809668
Epoch: 37, step: 869, loss: 0.35556620359420776, mean loss: 0.34482313053854746
Epoch: 37, step: 870, loss: 0.3158828020095825, mean loss: 0.3448225975576725
Epoch: 37, step: 871, loss: 0.32464590668678284, mean loss: 0.3448222259795718
Epoch: 37, step: 872, loss: 0.30735617876052856, mean loss: 0.344821536009825
Epoch: 37, step: 873, loss: 0.31538286805152893, mean loss: 0.34482099388121173
Epoch: 37, step: 874, loss: 0.3007487952709198, mean loss: 0.3448201822833514
Epoch: 37, step: 875, loss: 0.30848169326782227, mean loss: 0.34481951311553655
Epoch: 37, step: 876, loss: 0.35667356848716736, mean loss: 0.34481973140216526
Epoch: 37, step: 877, loss: 0.3410949110984802, mean loss: 0.3448196628126852
Epoch: 37, step: 878, loss: 0.36379626393318176, mean loss: 0.34482001224463915
Epoch: 37, step: 879, loss: 0.33910325169563293, mean loss: 0.34481990697910647
Epoch: 37, step: 880, loss: 0.3382321000099182, mean loss: 0.3448197856767999
Epoch: 37, step: 881, loss: 0.3543475568294525, mean loss: 0.34481996110989055
Epoch: 37, step: 882, loss: 0.31536468863487244, mean loss: 0.34481941876538436
Epoch: 37, step: 883, loss: 0.3393253684043884, mean loss: 0.34481931760817486
Epoch: 37, step: 884, loss: 0.34499096870422363, mean loss: 0.34481932076858024
Epoch: 37, step: 885, loss: 0.3187629282474518, mean loss: 0.34481884103237004
Epoch: 37, step: 886, loss: 0.32602694630622864, mean loss: 0.34481849505253526
Epoch: 37, step: 887, loss: 0.3076132833957672, mean loss: 0.3448178100755182
Epoch: 37, step: 888, loss: 0.3310701847076416, mean loss: 0.3448175569756532
Epoch: 37, step: 889, loss: 0.3366162180900574, mean loss: 0.34481740598815575
Epoch: 37, step: 890, loss: 0.34884750843048096, mean loss: 0.3448174801813928
Epoch: 37, step: 891, loss: 0.3185209631919861, mean loss: 0.34481699607761906
Epoch: 37, step: 892, loss: 0.29192760586738586, mean loss: 0.34481602243224785
Epoch: 37, step: 893, loss: 0.37752535939216614, mean loss: 0.34481662457018386
Epoch: 37, step: 894, loss: 0.33652761578559875, mean loss: 0.34481647198272025
Epoch: 37, step: 895, loss: 0.3268437087535858, mean loss: 0.34481614113883485
Epoch: 37, step: 896, loss: 0.29268503189086914, mean loss: 0.3448151815233862
Epoch: 37, step: 897, loss: 0.3341508209705353, mean loss: 0.3448149852203167
Epoch: 37, step: 898, loss: 0.3175400197505951, mean loss: 0.34481448316856583
Epoch: 37, step: 899, loss: 0.34834811091423035, mean loss: 0.34481454821104385
Epoch: 37, step: 900, loss: 0.347298264503479, mean loss: 0.3448145939272597
Epoch: 37, step: 901, loss: 0.34975358843803406, mean loss: 0.34481468483457633
Epoch: 37, step: 902, loss: 0.341521680355072, mean loss: 0.344814624224529
Epoch: 37, step: 903, loss: 0.3995606005191803, mean loss: 0.3448156318439116
Epoch: 37, step: 904, loss: 0.32074135541915894, mean loss: 0.34481518875635114
Epoch: 37, step: 905, loss: 0.3526630699634552, mean loss: 0.34481533319411034
Epoch: 37, step: 906, loss: 0.3588739037513733, mean loss: 0.3448155919328709
Epoch: 37, step: 907, loss: 0.3248848617076874, mean loss: 0.344815225127618
Epoch: 37, step: 908, loss: 0.3452131450176239, mean loss: 0.34481523245080276
Epoch: 37, step: 909, loss: 0.34871914982795715, mean loss: 0.3448153042958721
Epoch: 37, step: 910, loss: 0.3427674174308777, mean loss: 0.3448152666086334
Epoch: 37, step: 911, loss: 0.3342670798301697, mean loss: 0.34481507249404414
Epoch: 37, step: 912, loss: 0.36416569352149963, mean loss: 0.3448154285901967
Epoch: 37, step: 913, loss: 0.32720521092414856, mean loss: 0.3448151045274521
Epoch: 37, step: 914, loss: 0.29688966274261475, mean loss: 0.34481422262100997
Epoch: 37, step: 915, loss: 0.3634296655654907, mean loss: 0.34481456516927556
Epoch: 37, step: 916, loss: 0.3183205723762512, mean loss: 0.3448140776544574
Epoch: 37, step: 917, loss: 0.32721057534217834, mean loss: 0.34481375373913126
Epoch: 37, step: 918, loss: 0.32458677887916565, mean loss: 0.34481338155713664
Epoch: 37, step: 919, loss: 0.33356985449790955, mean loss: 0.34481317467690076
Epoch: 37, step: 920, loss: 0.3567577302455902, mean loss: 0.34481339445197606
Epoch: 37, step: 921, loss: 0.32540419697761536, mean loss: 0.3448130373370271
Epoch: 37, step: 922, loss: 0.3481418490409851, mean loss: 0.34481309858358566
Epoch: 37, step: 923, loss: 0.32025739550590515, mean loss: 0.3448126467933465
Epoch: 37, step: 924, loss: 0.3367900848388672, mean loss: 0.34481249919225815
Epoch: 37, step: 925, loss: 0.32657548785209656, mean loss: 0.3448121636693649
Epoch: 37, step: 926, loss: 0.3168427050113678, mean loss: 0.34481164909924883
Epoch: 37, step: 927, loss: 0.3450634181499481, mean loss: 0.34481165373110273
Epoch: 37, step: 928, loss: 0.33190232515335083, mean loss: 0.3448114162395455
Epoch: 37, step: 929, loss: 0.29212671518325806, mean loss: 0.3448104470224835
Epoch: 37, step: 930, loss: 0.36762943863868713, mean loss: 0.3448108668056218
Epoch: 37, step: 931, loss: 0.3432045578956604, mean loss: 0.3448108372561569
Epoch: 37, step: 932, loss: 0.31068339943885803, mean loss: 0.344810209463478
Epoch: 37, step: 933, loss: 0.3405130207538605, mean loss: 0.34481013041582137
Epoch: 37, step: 934, loss: 0.3171769976615906, mean loss: 0.34480962210809823
Epoch: 37, step: 935, loss: 0.31807321310043335, mean loss: 0.34480913030453325
Epoch: 37, step: 936, loss: 0.3813572824001312, mean loss: 0.34480980257809335
Epoch: 37, step: 937, loss: 0.3565560281276703, mean loss: 0.34481001863639354
Epoch: 37, step: 938, loss: 0.31385257840156555, mean loss: 0.3448094492203832
Epoch: 37, step: 939, loss: 0.31345459818840027, mean loss: 0.34480887250520087
Epoch: 37, step: 940, loss: 0.3017560839653015, mean loss: 0.3448080806424015
Epoch: 37, step: 941, loss: 0.3207462728023529, mean loss: 0.34480763808570036
Epoch: 37, step: 942, loss: 0.31899112462997437, mean loss: 0.3448071632643166
Epoch: 37, step: 943, loss: 0.33281201124191284, mean loss: 0.3448069426516479
Epoch: 37, step: 944, loss: 0.3635645806789398, mean loss: 0.34480728763239255
Epoch: 37, step: 945, loss: 0.30824947357177734, mean loss: 0.34480661529241274
Epoch: 37, step: 946, loss: 0.3389264941215515, mean loss: 0.3448065071522533
Epoch: 37, step: 947, loss: 0.3433692455291748, mean loss: 0.34480648072034176
Epoch: 37, step: 948, loss: 0.31538382172584534, mean loss: 0.34480593963387146
Epoch: 37, step: 949, loss: 0.31484317779541016, mean loss: 0.3448053886249738
Epoch: 37, step: 950, loss: 0.35219937562942505, mean loss: 0.3448055245963415
Epoch: 37, step: 951, loss: 0.31087470054626465, mean loss: 0.344804900638562
Epoch: 37, step: 952, loss: 0.30697235465049744, mean loss: 0.3448042049443676
Epoch: 37, step: 953, loss: 0.36327120661735535, mean loss: 0.34480454452367093
Epoch: 37, step: 954, loss: 0.34729769825935364, mean loss: 0.3448045903680292
Epoch: 37, step: 955, loss: 0.3017595410346985, mean loss: 0.34480379886594525
Epoch: 37, step: 956, loss: 0.2826206684112549, mean loss: 0.3448026554784219
Epoch: 37, step: 957, loss: 0.3226892948150635, mean loss: 0.3448022488781817
Epoch: 37, step: 958, loss: 0.2805326282978058, mean loss: 0.34480106716893905
Epoch: 37, step: 959, loss: 0.3533354103565216, mean loss: 0.34480122408486147
Epoch: 37, step: 960, loss: 0.32515987753868103, mean loss: 0.344800862957675
Epoch: 37, step: 961, loss: 0.31520402431488037, mean loss: 0.3448003187981118
Epoch: 37, step: 962, loss: 0.31571516394615173, mean loss: 0.3447997840560616
Epoch: 37, step: 963, loss: 0.343386709690094, mean loss: 0.34479975807660934
Epoch: 37, step: 964, loss: 0.3181855082511902, mean loss: 0.34479926878111494
Epoch: 37, step: 965, loss: 0.32658153772354126, mean loss: 0.34479893385941296
Epoch: 37, step: 966, loss: 0.3319859802722931, mean loss: 0.34479869830552773
Epoch: 37, step: 967, loss: 0.33772164583206177, mean loss: 0.344798568203085
Epoch: 37, step: 968, loss: 0.32031112909317017, mean loss: 0.3447981180415116
Epoch: 37, step: 969, loss: 0.3015473783016205, mean loss: 0.3447973229619179
Epoch: 37, step: 970, loss: 0.3055073916912079, mean loss: 0.3447966007072575
Epoch: 37, step: 971, loss: 0.3609410226345062, mean loss: 0.34479689747971937
Epoch: 37, step: 972, loss: 0.3240414261817932, mean loss: 0.3447965159523339
Epoch: 37, step: 973, loss: 0.3158109188079834, mean loss: 0.34479598314844534
Epoch: 37, step: 974, loss: 0.34642350673675537, mean loss: 0.3447960130645086
Epoch: 37, step: 975, loss: 0.35909125208854675, mean loss: 0.344796275825317
Epoch: 37, step: 976, loss: 0.28377458453178406, mean loss: 0.3447951542061406
Epoch: 37, step: 977, loss: 0.35966378450393677, mean loss: 0.3447954274964082
Epoch: 37, step: 978, loss: 0.333443284034729, mean loss: 0.34479521884414904
Epoch: 37, step: 979, loss: 0.3644479811191559, mean loss: 0.3447955800550422
Epoch: 37, step: 980, loss: 0.3550049960613251, mean loss: 0.3447957676970868
Epoch: 37, step: 981, loss: 0.31422159075737, mean loss: 0.3447952057750699
Epoch: 37, step: 982, loss: 0.2966206669807434, mean loss: 0.3447943203927245
Epoch: 37, step: 983, loss: 0.33234167098999023, mean loss: 0.34479409153421164
Epoch: 37, step: 984, loss: 0.3568282425403595, mean loss: 0.3447943126973713
Epoch: 37, step: 985, loss: 0.30120256543159485, mean loss: 0.3447935115846565
Epoch: 37, step: 986, loss: 0.3538016378879547, mean loss: 0.34479367712956693
Epoch: 37, step: 987, loss: 0.3391728103160858, mean loss: 0.34479357383519005
Epoch: 37, step: 988, loss: 0.3459281921386719, mean loss: 0.34479359468562837
Epoch: 37, step: 989, loss: 0.2874215841293335, mean loss: 0.34479254040192525
Epoch: 37, step: 990, loss: 0.29559504985809326, mean loss: 0.34479163635204296
Epoch: 37, step: 991, loss: 0.35856297612190247, mean loss: 0.3447918894086356
Epoch: 37, step: 992, loss: 0.3582446873188019, mean loss: 0.34479213660728886
Epoch: 37, step: 993, loss: 0.417856901884079, mean loss: 0.34479347916664493
Epoch: 37, step: 994, loss: 0.3340058922767639, mean loss: 0.3447932809492205
Epoch: 37, step: 995, loss: 0.3405938446521759, mean loss: 0.3447932037877422
Epoch: 37, step: 996, loss: 0.3435938358306885, mean loss: 0.3447931817506644
Epoch: 37, step: 997, loss: 0.35144323110580444, mean loss: 0.3447933039358214
Epoch: 37, step: 998, loss: 0.3400731086730957, mean loss: 0.34479321721056994
Epoch: 37, step: 999, loss: 0.3408944606781006, mean loss: 0.34479314557912044
Epoch: 37, step: 1000, loss: 0.31920528411865234, mean loss: 0.34479267546463255
Epoch: 37, step: 1001, loss: 0.3123961389064789, mean loss: 0.3447920802682967
Epoch: 37, step: 1002, loss: 0.32153207063674927, mean loss: 0.3447916529381056
Epoch: 37, step: 1003, loss: 0.3232238292694092, mean loss: 0.3447912567038377
Epoch: 37, step: 1004, loss: 0.3569507598876953, mean loss: 0.34479148008860766
Epoch: 37, step: 1005, loss: 0.2921164035797119, mean loss: 0.3447905124015645
Epoch: 37, step: 1006, loss: 0.34187114238739014, mean loss: 0.34479045877117936
Epoch: 37, step: 1007, loss: 0.37656986713409424, mean loss: 0.3447910425651459
Epoch: 37, step: 1008, loss: 0.32575106620788574, mean loss: 0.3447906928034699
Epoch: 37, step: 1009, loss: 0.31641364097595215, mean loss: 0.3447901715306122
Epoch: 37, step: 1010, loss: 0.3276856243610382, mean loss: 0.34478985733404044
Epoch: 37, step: 1011, loss: 0.35393548011779785, mean loss: 0.34479002532858094
Epoch: 37, step: 1012, loss: 0.31294122338294983, mean loss: 0.3447894403135749
Epoch: 37, step: 1013, loss: 0.3121500313282013, mean loss: 0.34478884078730865
Epoch: 37, step: 1014, loss: 0.3335399031639099, mean loss: 0.3447886341686869
Epoch: 37, step: 1015, loss: 0.3838866353034973, mean loss: 0.34478935230110064
Epoch: 37, step: 1016, loss: 0.3232370615005493, mean loss: 0.3447889564467375
Epoch: 37, step: 1017, loss: 0.3433900773525238, mean loss: 0.3447889307537739
Epoch: 37, step: 1018, loss: 0.3612571656703949, mean loss: 0.3447892332173608
Epoch: 37, step: 1019, loss: 0.3525700569152832, mean loss: 0.34478937612111665
Epoch: 37, step: 1020, loss: 0.3132777214050293, mean loss: 0.34478879738404683
Epoch: 37, step: 1021, loss: 0.3006117343902588, mean loss: 0.34478798605139316
Epoch: 37, step: 1022, loss: 0.32054486870765686, mean loss: 0.34478754082325513
Epoch: 37, step: 1023, loss: 0.3460180461406708, mean loss: 0.3447875634212372
Epoch: 37, step: 1024, loss: 0.3305988609790802, mean loss: 0.3447873028533632
Epoch: 37, step: 1025, loss: 0.3523957431316376, mean loss: 0.3447874425757027
Epoch: 37, step: 1026, loss: 0.3380187749862671, mean loss: 0.34478731827733544
Epoch: 37, step: 1027, loss: 0.3035796582698822, mean loss: 0.3447865615625564
Epoch: 37, step: 1028, loss: 0.3553372919559479, mean loss: 0.3447867553068022
Epoch: 37, step: 1029, loss: 0.30216825008392334, mean loss: 0.3447859727127807
Epoch: 37, step: 1030, loss: 0.28461629152297974, mean loss: 0.3447848678507526
Epoch: 37, step: 1031, loss: 0.3548196256160736, mean loss: 0.3447850521099844
Epoch: 37, step: 1032, loss: 0.3392983675003052, mean loss: 0.3447849513647794
Epoch: 37, step: 1033, loss: 0.3197517991065979, mean loss: 0.34478449172039877
Epoch: 37, step: 1034, loss: 0.3099077641963959, mean loss: 0.3447838513456944
Epoch: 37, step: 1035, loss: 0.40017181634902954, mean loss: 0.34478486831038674
Epoch: 37, step: 1036, loss: 0.34978634119033813, mean loss: 0.34478496013950416
Epoch: 37, step: 1037, loss: 0.3029938340187073, mean loss: 0.3447841928511753
Epoch: 37, step: 1038, loss: 0.30154258012771606, mean loss: 0.3447833989463756
Epoch: 37, step: 1039, loss: 0.35095661878585815, mean loss: 0.3447835122830107
Epoch: 37, step: 1040, loss: 0.34329673647880554, mean loss: 0.34478348498719463
Epoch: 37, step: 1041, loss: 0.31415313482284546, mean loss: 0.34478292265287913
Epoch: 37, step: 1042, loss: 0.3440721035003662, mean loss: 0.3447829096033821
Epoch: 37, step: 1043, loss: 0.3177010416984558, mean loss: 0.34478241243294766
Epoch: 37, step: 1044, loss: 0.36124131083488464, mean loss: 0.34478271458077137
Epoch: 37, step: 1045, loss: 0.36726081371307373, mean loss: 0.3447831272198126
Epoch: 37, step: 1046, loss: 0.3196244537830353, mean loss: 0.34478266538092434
Epoch: 37, step: 1047, loss: 0.3171408772468567, mean loss: 0.34478215796870365
Epoch: 37, step: 1048, loss: 0.40898457169532776, mean loss: 0.34478333649200205
Epoch: 37, step: 1049, loss: 0.31999441981315613, mean loss: 0.3447828814658139
Epoch: 37, step: 1050, loss: 0.34773391485214233, mean loss: 0.34478293563408763
Epoch: 37, step: 1051, loss: 0.3549306392669678, mean loss: 0.3447831218988386
Epoch: 37, step: 1052, loss: 0.3079264760017395, mean loss: 0.3447824453942609
Epoch: 37, step: 1053, loss: 0.33120912313461304, mean loss: 0.3447821962601935
Epoch: 37, step: 1054, loss: 0.3335241675376892, mean loss: 0.3447819896264046
Epoch: 37, step: 1055, loss: 0.31875598430633545, mean loss: 0.3447815119447858
Epoch: 37, step: 1056, loss: 0.33482295274734497, mean loss: 0.3447813291686236
Epoch: 37, step: 1057, loss: 0.33199360966682434, mean loss: 0.3447810944712793
Epoch: 37, step: 1058, loss: 0.2956010103225708, mean loss: 0.34478019186911457
Epoch: 37, step: 1059, loss: 0.3455815613269806, mean loss: 0.34478020657637964
Epoch: 37, step: 1060, loss: 0.3506275713443756, mean loss: 0.34478031388913577
Epoch: 37, step: 1061, loss: 0.3185079097747803, mean loss: 0.3447798317382069
Epoch: 37, step: 1062, loss: 0.3173171281814575, mean loss: 0.3447793277521623
Epoch: 37, step: 1063, loss: 0.31076836585998535, mean loss: 0.3447787036061979
Epoch: 37, step: 1064, loss: 0.33008840680122375, mean loss: 0.3447784340248424
Epoch: 37, step: 1065, loss: 0.3203098177909851, mean loss: 0.3447779850099741
Epoch: 37, step: 1066, loss: 0.3623298704624176, mean loss: 0.34477830709246704
Epoch: 37, step: 1067, loss: 0.33005908131599426, mean loss: 0.3447780369951062
Epoch: 37, step: 1068, loss: 0.3364715576171875, mean loss: 0.3447778845742504
Epoch: 37, step: 1069, loss: 0.3599432408809662, mean loss: 0.34477816284788076
Epoch: 37, step: 1070, loss: 0.34132033586502075, mean loss: 0.3447780994003499
Epoch: 37, step: 1071, loss: 0.30332863330841064, mean loss: 0.3447773388596877
Epoch: 37, step: 1072, loss: 0.35739168524742126, mean loss: 0.3447775703113379
Epoch: 37, step: 1073, loss: 0.3541110157966614, mean loss: 0.34477774156093394
Epoch: 37, step: 1074, loss: 0.3387625515460968, mean loss: 0.34477763119655
Epoch: 37, step: 1075, loss: 0.30483439564704895, mean loss: 0.3447768983469326
Epoch: 37, step: 1076, loss: 0.3402378559112549, mean loss: 0.34477681506939045
Epoch: 37, step: 1077, loss: 0.3130898177623749, mean loss: 0.3447762337205975
Epoch: 37, step: 1078, loss: 0.34023600816726685, mean loss: 0.34477615042440524
Epoch: 37, step: 1079, loss: 0.3044215738773346, mean loss: 0.3447754100821335
Epoch: 37, step: 1080, loss: 0.3528450131416321, mean loss: 0.34477555812379745
Epoch: 37, step: 1081, loss: 0.31516823172569275, mean loss: 0.34477501496976337
Epoch: 37, step: 1082, loss: 0.3034260869026184, mean loss: 0.34477425642693593
Epoch: 37, step: 1083, loss: 0.32620230317115784, mean loss: 0.34477391573216676
Epoch: 37, step: 1084, loss: 0.32474246621131897, mean loss: 0.3447735482702857
Epoch: 37, step: 1085, loss: 0.3575757145881653, mean loss: 0.34477378311209367
Epoch: 37, step: 1086, loss: 0.3231261968612671, mean loss: 0.3447733860179682
Epoch: 37, step: 1087, loss: 0.3285857141017914, mean loss: 0.3447730890836385
Epoch: 37, step: 1088, loss: 0.34866854548454285, mean loss: 0.34477316053761436
Epoch: 37, step: 1089, loss: 0.34488579630851746, mean loss: 0.3447731626036434
Epoch: 37, step: 1090, loss: 0.3255389630794525, mean loss: 0.34477280980554503
Epoch: 37, step: 1091, loss: 0.33245623111724854, mean loss: 0.34477258389617804
Epoch: 37, step: 1092, loss: 0.3244679570198059, mean loss: 0.3447722114777177
Epoch: 37, step: 1093, loss: 0.36805498600006104, mean loss: 0.3447726385122088
Epoch: 37, step: 1094, loss: 0.3427577316761017, mean loss: 0.34477260155703693
Epoch: 37, step: 1095, loss: 0.31963253021240234, mean loss: 0.34477214047436977
Epoch: 37, step: 1096, loss: 0.3050159513950348, mean loss: 0.34477141133747696
Epoch: 37, step: 1097, loss: 0.35427603125572205, mean loss: 0.34477158565101396
Epoch: 37, step: 1098, loss: 0.3256264328956604, mean loss: 0.34477123453775343
Epoch: 37, step: 1099, loss: 0.31944191455841064, mean loss: 0.3447707700182409
Epoch: 37, step: 1100, loss: 0.35014814138412476, mean loss: 0.34477086863313144
Epoch: 37, step: 1101, loss: 0.3645288050174713, mean loss: 0.34477123096462575
Epoch: 37, step: 1102, loss: 0.33199983835220337, mean loss: 0.3447709967603637
Epoch: 37, step: 1103, loss: 0.33598923683166504, mean loss: 0.3447708357217088
Epoch: 37, step: 1104, loss: 0.31320783495903015, mean loss: 0.3447702569345384
Epoch: 37, step: 1105, loss: 0.33301499485969543, mean loss: 0.3447700413761331
Epoch: 37, step: 1106, loss: 0.3110606074333191, mean loss: 0.3447694232513702
Epoch: 37, step: 1107, loss: 0.3228268623352051, mean loss: 0.3447690209013461
Epoch: 37, step: 1108, loss: 0.3117380142211914, mean loss: 0.34476841523901264
Epoch: 37, step: 1109, loss: 0.3272721469402313, mean loss: 0.34476809443024997
Epoch: 37, step: 1110, loss: 0.3235069513320923, mean loss: 0.3447677045964962
Epoch: 37, step: 1111, loss: 0.3337148427963257, mean loss: 0.34476750194043093
Epoch: 37, step: 1112, loss: 0.3212609887123108, mean loss: 0.3447670709524911
Epoch: 37, step: 1113, loss: 0.30454540252685547, mean loss: 0.34476633350853186
Epoch: 37, step: 1114, loss: 0.3050468862056732, mean loss: 0.3447656052858946
Epoch: 37, step: 1115, loss: 0.31497281789779663, mean loss: 0.34476505907022675
Epoch: 37, step: 1116, loss: 0.3188171982765198, mean loss: 0.34476458335548127
Epoch: 37, step: 1117, loss: 0.29598623514175415, mean loss: 0.3447636890947066
Epoch: 37, step: 1118, loss: 0.3536913990974426, mean loss: 0.3447638527647527
Epoch: 37, step: 1119, loss: 0.3225255012512207, mean loss: 0.34476344508066686
Epoch: 37, step: 1120, loss: 0.323265016078949, mean loss: 0.34476305096841914
Epoch: 37, step: 1121, loss: 0.34243136644363403, mean loss: 0.3447630082244315
Epoch: 37, step: 1122, loss: 0.3232455551624298, mean loss: 0.3447626137778941
Epoch: 37, step: 1123, loss: 0.32510149478912354, mean loss: 0.3447622533672952
Epoch: 37, step: 1124, loss: 0.3313116431236267, mean loss: 0.3447620068068816
Epoch: 37, step: 1125, loss: 0.3553154766559601, mean loss: 0.34476220025685506
Epoch: 37, step: 1126, loss: 0.2979254722595215, mean loss: 0.34476134173375
Epoch: 37, step: 1127, loss: 0.3180619776248932, mean loss: 0.3447608523400241
Epoch: 37, step: 1128, loss: 0.32863765954971313, mean loss: 0.34476055681071
Epoch: 37, step: 1129, loss: 0.32815083861351013, mean loss: 0.34476025236923125
Epoch: 37, step: 1130, loss: 0.3495045006275177, mean loss: 0.34476033932552186
Epoch: 37, step: 1131, loss: 0.4145102798938751, mean loss: 0.3447616177335235
Epoch: 37, step: 1132, loss: 0.3327052891254425, mean loss: 0.3447613967638087
Epoch: 37, step: 1133, loss: 0.3061337172985077, mean loss: 0.34476068880443284
Epoch: 37, step: 1134, loss: 0.4033181071281433, mean loss: 0.344761762011887
Epoch: 37, step: 1135, loss: 0.31047630310058594, mean loss: 0.34476113365878036
Epoch: 37, step: 1136, loss: 0.35301482677459717, mean loss: 0.34476128492228475
Epoch: 37, step: 1137, loss: 0.3425176739692688, mean loss: 0.3447612438049048
Epoch: 37, step: 1138, loss: 0.33184516429901123, mean loss: 0.34476100710361085
Epoch: 37, step: 1139, loss: 0.325766384601593, mean loss: 0.34476065901274255
Epoch: 37, step: 1140, loss: 0.35470813512802124, mean loss: 0.34476084130444873
Epoch: 37, step: 1141, loss: 0.3229237496852875, mean loss: 0.34476044113784404
Epoch: 37, step: 1142, loss: 0.3373614251613617, mean loss: 0.34476030555271686
Epoch: 37, step: 1143, loss: 0.30518481135368347, mean loss: 0.3447595803549195
Epoch: 37, step: 1144, loss: 0.34772709012031555, mean loss: 0.3447596347318049
Epoch: 37, step: 1145, loss: 0.34170958399772644, mean loss: 0.3447595788434563
Epoch: 37, step: 1146, loss: 0.31796619296073914, mean loss: 0.34475908789731097
Epoch: 37, step: 1147, loss: 0.3390684425830841, mean loss: 0.3447589836272048
Epoch: 37, step: 1148, loss: 0.35851871967315674, mean loss: 0.3447592357432252
Epoch: 37, step: 1149, loss: 0.33020713925361633, mean loss: 0.3447589691138784
Epoch: 37, step: 1150, loss: 0.3409673273563385, mean loss: 0.34475889964317064
Epoch: 37, step: 1151, loss: 0.3285202980041504, mean loss: 0.3447586021239028
Epoch: 37, step: 1152, loss: 0.3186926245689392, mean loss: 0.34475812455886085
Epoch: 37, step: 1153, loss: 0.31735193729400635, mean loss: 0.34475762244850827
Epoch: 37, step: 1154, loss: 0.3364577889442444, mean loss: 0.3447574703895613
Epoch: 37, step: 1155, loss: 0.33696240186691284, mean loss: 0.34475732758088984
Epoch: 37, step: 1156, loss: 0.3349444568157196, mean loss: 0.34475714780859407
Epoch: 37, step: 1157, loss: 0.3075282573699951, mean loss: 0.34475646578590624
Epoch: 37, step: 1158, loss: 0.3779923915863037, mean loss: 0.344757074647463
Epoch: 37, step: 1159, loss: 0.3091718554496765, mean loss: 0.34475642276024976
Epoch: 37, step: 1160, loss: 0.35755273699760437, mean loss: 0.3447566571722052
Epoch: 37, step: 1161, loss: 0.33743536472320557, mean loss: 0.3447565230580369
Epoch: 37, step: 1162, loss: 0.3378830552101135, mean loss: 0.3447563971495932
Epoch: 37, step: 1163, loss: 0.3454715311527252, mean loss: 0.34475641024920495
Epoch: 37, step: 1164, loss: 0.3136591613292694, mean loss: 0.34475584062949327
Epoch: 37, step: 1165, loss: 0.3997703492641449, mean loss: 0.344756848331963
Epoch: 37, step: 1166, loss: 0.34063488245010376, mean loss: 0.3447567728311684
Epoch: 37, step: 1167, loss: 0.3587484359741211, mean loss: 0.34475702910750994
Epoch: 37, step: 1168, loss: 0.30387577414512634, mean loss: 0.3447562803254347
Epoch: 37, step: 1169, loss: 0.32734039425849915, mean loss: 0.344755961341478
Epoch: 37, step: 1170, loss: 0.33814552426338196, mean loss: 0.3447558402689844
Epoch: 37, step: 1171, loss: 0.35817164182662964, mean loss: 0.34475608597963564
Epoch: 37, step: 1172, loss: 0.30790093541145325, mean loss: 0.34475541098924045
Epoch: 37, step: 1173, loss: 0.3033084273338318, mean loss: 0.3447546519147806
Epoch: 37, step: 1174, loss: 0.30794039368629456, mean loss: 0.3447539776980118
Epoch: 37, step: 1175, loss: 0.34192028641700745, mean loss: 0.344753925802706
Epoch: 37, step: 1176, loss: 0.37019437551498413, mean loss: 0.3447543917023436
Epoch: 37, step: 1177, loss: 0.35854917764663696, mean loss: 0.34475464432633995
Epoch: 37, step: 1178, loss: 0.35942599177360535, mean loss: 0.34475491299789207
Epoch: 37, step: 1179, loss: 0.420902818441391, mean loss: 0.3447563074438605
Epoch: 37, step: 1180, loss: 0.3704754412174225, mean loss: 0.34475677841263436
Epoch: 37, step: 1181, loss: 0.3343733251094818, mean loss: 0.3447565882743208
Epoch: 37, step: 1182, loss: 0.3320132791996002, mean loss: 0.344756354927393
Epoch: 37, step: 1183, loss: 0.32631585001945496, mean loss: 0.3447560172634197
Epoch: 37, step: 1184, loss: 0.3490654528141022, mean loss: 0.34475609617202296
Epoch: 37, step: 1185, loss: 0.3031635284423828, mean loss: 0.3447553345986584
Epoch: 37, step: 1186, loss: 0.35511836409568787, mean loss: 0.3447555243456052
Epoch: 37, step: 1187, loss: 0.3207347095012665, mean loss: 0.3447550845328242
Epoch: 37, step: 1188, loss: 0.3107989430427551, mean loss: 0.3447544628190448
Epoch: 37, step: 1189, loss: 0.32549482583999634, mean loss: 0.3447541101946906
Epoch: 37, step: 1190, loss: 0.3399800956249237, mean loss: 0.34475402278894224
Epoch: 37, step: 1191, loss: 0.40956300497055054, mean loss: 0.3447552093320067
Epoch: 37, step: 1192, loss: 0.34241172671318054, mean loss: 0.3447551664275813
Epoch: 37, step: 1193, loss: 0.3184913992881775, mean loss: 0.3447546855999452
Epoch: 37, step: 1194, loss: 0.3573974668979645, mean loss: 0.34475491705521677
Epoch: 37, step: 1195, loss: 0.29859793186187744, mean loss: 0.3447540720606138
Epoch: 37, step: 1196, loss: 0.34504255652427673, mean loss: 0.3447540773417939
Epoch: 37, step: 1197, loss: 0.30873358249664307, mean loss: 0.3447534179397721
Epoch: 37, step: 1198, loss: 0.3268025517463684, mean loss: 0.3447530893318274
Epoch: 37, step: 1199, loss: 0.34045854210853577, mean loss: 0.3447530107174314
Epoch: 37, step: 1200, loss: 0.2910047471523285, mean loss: 0.3447520268395723
Epoch: 37, step: 1201, loss: 0.3147191107273102, mean loss: 0.34475147708822484
Epoch: 37, step: 1202, loss: 0.31404078006744385, mean loss: 0.3447509149404146
Epoch: 37, step: 1203, loss: 0.31917086243629456, mean loss: 0.3447504467157019
Epoch: 37, step: 1204, loss: 0.32408931851387024, mean loss: 0.344750068535331
Epoch: 37, step: 1205, loss: 0.2894328236579895, mean loss: 0.3447490560294761
Epoch: 37, step: 1206, loss: 0.3762602210044861, mean loss: 0.3447496327873232
Epoch: 37, step: 1207, loss: 0.3230994641780853, mean loss: 0.3447492365253602
Epoch: 37, step: 1208, loss: 0.3360927402973175, mean loss: 0.34474907808883865
Epoch: 37, step: 1209, loss: 0.3667715787887573, mean loss: 0.344749481150823
Epoch: 37, step: 1210, loss: 0.32988831400871277, mean loss: 0.3447492091625519
Epoch: 37, step: 1211, loss: 0.350383996963501, mean loss: 0.34474931228824374
Epoch: 37, step: 1212, loss: 0.3405364453792572, mean loss: 0.34474923518740536
Epoch: 37, step: 1213, loss: 0.2885679006576538, mean loss: 0.34474820701613546
Epoch: 37, step: 1214, loss: 0.34612733125686646, mean loss: 0.34474823225494444
Epoch: 37, step: 1215, loss: 0.310151606798172, mean loss: 0.3447475991273283
Epoch: 37, step: 1216, loss: 0.3035550117492676, mean loss: 0.3447468453056176
Epoch: 37, step: 1217, loss: 0.3483790457248688, mean loss: 0.3447469117734363
Epoch: 37, step: 1218, loss: 0.3499992787837982, mean loss: 0.3447470078878984
Epoch: 37, step: 1219, loss: 0.37740764021873474, mean loss: 0.34474760554256706
Epoch: 37, step: 1220, loss: 0.34163767099380493, mean loss: 0.34474754863512963
Epoch: 37, step: 1221, loss: 0.31057804822921753, mean loss: 0.3447469233926702
Epoch: 37, step: 1222, loss: 0.33979639410972595, mean loss: 0.3447468328082475
Epoch: 37, step: 1223, loss: 0.3629726469516754, mean loss: 0.3447471662967593
Epoch: 37, step: 1224, loss: 0.3054640591144562, mean loss: 0.3447464475236419
Epoch: 37, step: 1225, loss: 0.3234183192253113, mean loss: 0.3447460572845323
Epoch: 37, step: 1226, loss: 0.2897038459777832, mean loss: 0.34474505019988666
Epoch: 37, step: 1227, loss: 0.33251088857650757, mean loss: 0.34474482636057124
Epoch: 37, step: 1228, loss: 0.3082444965839386, mean loss: 0.3447441585535241
Epoch: 37, step: 1229, loss: 0.3384966254234314, mean loss: 0.3447440442512604
Epoch: 37, step: 1230, loss: 0.37433454394340515, mean loss: 0.3447445856168121
Epoch: 37, step: 1231, loss: 0.32005587220191956, mean loss: 0.34474413393892306
Epoch: 37, step: 1232, loss: 0.3201325237751007, mean loss: 0.3447436836798688
Epoch: 37, step: 1233, loss: 0.2940620183944702, mean loss: 0.3447427564970858
Epoch: 37, step: 1234, loss: 0.3067873418331146, mean loss: 0.34474206214414754
Epoch: 37, step: 1235, loss: 0.30613428354263306, mean loss: 0.34474135586984267
Epoch: 37, step: 1236, loss: 0.30859723687171936, mean loss: 0.3447406946767758
Epoch: 37, step: 1237, loss: 0.32252106070518494, mean loss: 0.3447402882151
Epoch: 37, step: 1238, loss: 0.3024768829345703, mean loss: 0.34473951510874185
Epoch: 37, step: 1239, loss: 0.31552955508232117, mean loss: 0.34473898079323684
Epoch: 37, step: 1240, loss: 0.31254279613494873, mean loss: 0.34473839186377664
Epoch: 37, step: 1241, loss: 0.4019705057144165, mean loss: 0.3447394387288553
Epoch: 37, step: 1242, loss: 0.32344138622283936, mean loss: 0.34473904916121423
Epoch: 37, step: 1243, loss: 0.3395155072212219, mean loss: 0.34473895361793905
Epoch: 37, step: 1244, loss: 0.3234003782272339, mean loss: 0.3447385633233624
Epoch: 37, step: 1245, loss: 0.33808231353759766, mean loss: 0.3447384415790271
Epoch: 37, step: 1246, loss: 0.2985827326774597, mean loss: 0.3447375973959654
Epoch: 37, step: 1247, loss: 0.3315797448158264, mean loss: 0.34473735674462697
Epoch: 37, step: 1248, loss: 0.2942253649234772, mean loss: 0.3447364329194021
Epoch: 37, step: 1249, loss: 0.33792588114738464, mean loss: 0.34473630836196084
Epoch: 37, step: 1250, loss: 0.35905349254608154, mean loss: 0.34473657020259774
Epoch: 37, step: 1251, loss: 0.33282536268234253, mean loss: 0.3447363523677857
Epoch: 37, step: 1252, loss: 0.30778950452804565, mean loss: 0.344735676687973
Epoch: 37, step: 1253, loss: 0.31386682391166687, mean loss: 0.34473511217217667
Epoch: 37, step: 1254, loss: 0.3428242802619934, mean loss: 0.34473507722837493
Epoch: 37, step: 1255, loss: 0.3282592296600342, mean loss: 0.344734775936451
Epoch: 37, step: 1256, loss: 0.35026416182518005, mean loss: 0.3447348770498439
Epoch: 37, step: 1257, loss: 0.3195270001888275, mean loss: 0.34473441609316646
Epoch: 37, step: 1258, loss: 0.3424612283706665, mean loss: 0.3447343745259252
Epoch: 37, step: 1259, loss: 0.30976641178131104, mean loss: 0.3447337351175953
Epoch: 37, step: 1260, loss: 0.35887816548347473, mean loss: 0.34473399375151376
Epoch: 37, step: 1261, loss: 0.33008354902267456, mean loss: 0.3447337258699133
Epoch: 37, step: 1262, loss: 0.35611680150032043, mean loss: 0.3447339340042614
Epoch: 37, step: 1263, loss: 0.34101155400276184, mean loss: 0.34473386594348465
Epoch: 37, step: 1264, loss: 0.291482537984848, mean loss: 0.3447328923028367
Epoch: 37, step: 1265, loss: 0.32254084944725037, mean loss: 0.3447324865537078
Epoch: 37, step: 1266, loss: 0.3093646466732025, mean loss: 0.34473183991617457
Epoch: 37, step: 1267, loss: 0.3752492070198059, mean loss: 0.34473239786130955
Epoch: 37, step: 1268, loss: 0.3075047731399536, mean loss: 0.344731717245833
Epoch: 37, step: 1269, loss: 0.3524378538131714, mean loss: 0.3447318581309946
Epoch: 37, step: 1270, loss: 0.3235590159893036, mean loss: 0.3447314710518498
Epoch: 37, step: 1271, loss: 0.295515239238739, mean loss: 0.3447305713035534
Epoch: 37, step: 1272, loss: 0.3097998797893524, mean loss: 0.34472993272854535
Epoch: 37, step: 1273, loss: 0.3590167760848999, mean loss: 0.3447301939044321
Epoch: 37, step: 1274, loss: 0.2964436411857605, mean loss: 0.34472931120050876
Epoch: 37, step: 1275, loss: 0.326522558927536, mean loss: 0.3447289783774561
Epoch: 37, step: 1276, loss: 0.3862053453922272, mean loss: 0.3447297365598346
Epoch: 37, step: 1277, loss: 0.3281605541706085, mean loss: 0.3447294336829584
Epoch: 37, step: 1278, loss: 0.31728053092956543, mean loss: 0.3447289319390727
Epoch: 37, step: 1279, loss: 0.32784590125083923, mean loss: 0.3447286233364792
Epoch: 37, step: 1280, loss: 0.32965773344039917, mean loss: 0.34472834786279305
Epoch: 37, step: 1281, loss: 0.2970219850540161, mean loss: 0.34472747587663316
Epoch: 37, step: 1282, loss: 0.3195447325706482, mean loss: 0.34472701558997587
Epoch: 37, step: 1283, loss: 0.35625702142715454, mean loss: 0.34472722632995684
Epoch: 37, step: 1284, loss: 0.3219047784805298, mean loss: 0.34472680919969806
Epoch: 37, step: 1285, loss: 0.3142523467540741, mean loss: 0.3447262522222801
Epoch: 37, step: 1286, loss: 0.3138013184070587, mean loss: 0.344725687021991
Epoch: 37, step: 1287, loss: 0.35747307538986206, mean loss: 0.34472591999568003
Epoch: 37, step: 1288, loss: 0.33404025435447693, mean loss: 0.344725724705996
Epoch: 37, step: 1289, loss: 0.3036104738712311, mean loss: 0.34472497330333446
Epoch: 37, step: 1290, loss: 0.3375207185745239, mean loss: 0.3447248416442265
Epoch: 37, step: 1291, loss: 0.33506301045417786, mean loss: 0.34472466507567406
Epoch: 37, step: 1292, loss: 0.3922238349914551, mean loss: 0.34472553310019693
Epoch: 37, step: 1293, loss: 0.3439420759677887, mean loss: 0.34472551878315566
Epoch: 37, step: 1294, loss: 0.3063147962093353, mean loss: 0.34472481687129825
Epoch: 37, step: 1295, loss: 0.32299700379371643, mean loss: 0.3447244198277145
Epoch: 37, step: 1296, loss: 0.31980466842651367, mean loss: 0.34472396446450937
Epoch: 37, step: 1297, loss: 0.33725714683532715, mean loss: 0.3447238280244694
Epoch: 37, step: 1298, loss: 0.3611476421356201, mean loss: 0.3447241281288806
Epoch: 37, step: 1299, loss: 0.3386630415916443, mean loss: 0.3447240173796017
Epoch: 37, step: 1300, loss: 0.34214702248573303, mean loss: 0.3447239702931412
Epoch: 37, step: 1301, loss: 0.328896701335907, mean loss: 0.34472368110496365
Epoch: 37, step: 1302, loss: 0.3426603376865387, mean loss: 0.34472364340524286
Epoch: 37, step: 1303, loss: 0.322350412607193, mean loss: 0.34472323462736526
Epoch: 37, step: 1304, loss: 0.3198293447494507, mean loss: 0.3447227798032212
Epoch: 37, step: 1305, loss: 0.32520702481269836, mean loss: 0.34472242324687613
Epoch: 37, step: 1306, loss: 0.3204851448535919, mean loss: 0.34472198043554164
Epoch: 37, step: 1307, loss: 0.33193761110305786, mean loss: 0.34472174687135476
Epoch: 37, step: 1308, loss: 0.4199902415275574, mean loss: 0.3447231219648867
Epoch: 37, step: 1309, loss: 0.3088410496711731, mean loss: 0.3447224664408943
Epoch: 37, step: 1310, loss: 0.3274664580821991, mean loss: 0.34472215119932326
Epoch: 37, step: 1311, loss: 0.3203452527523041, mean loss: 0.34472170587783174
Epoch: 37, step: 1312, loss: 0.34736886620521545, mean loss: 0.3447217542357413
Epoch: 37, step: 1313, loss: 0.3802799582481384, mean loss: 0.3447224037955676
Epoch: 37, step: 1314, loss: 0.3587239384651184, mean loss: 0.3447226595640617
Epoch: 37, step: 1315, loss: 0.3554283082485199, mean loss: 0.344722855122455
Epoch: 37, step: 1316, loss: 0.3367716670036316, mean loss: 0.34472270988201076
Epoch: 37, step: 1317, loss: 0.3454909920692444, mean loss: 0.3447227239155874
Epoch: 37, step: 1318, loss: 0.3227216303348541, mean loss: 0.3447223220471091
Epoch: 37, step: 1319, loss: 0.35238850116729736, mean loss: 0.34472246207376067
Epoch: 37, step: 1320, loss: 0.3686113953590393, mean loss: 0.34472289840927883
Epoch: 37, step: 1321, loss: 0.36388731002807617, mean loss: 0.3447232484441942
Epoch: 37, step: 1322, loss: 0.37240684032440186, mean loss: 0.34472375407134037
Epoch: 37, step: 1323, loss: 0.29632568359375, mean loss: 0.34472287012060837
Epoch: 37, step: 1324, loss: 0.32846468687057495, mean loss: 0.34472257318376015
Epoch: 37, step: 1325, loss: 0.2967216670513153, mean loss: 0.3447216965189296
Epoch: 37, step: 1326, loss: 0.3582167327404022, mean loss: 0.3447219429811015
Epoch: 37, step: 1327, loss: 0.35072481632232666, mean loss: 0.3447220526106095
Epoch: 37, step: 1328, loss: 0.32800379395484924, mean loss: 0.34472174729332306
Epoch: 37, step: 1329, loss: 0.332176148891449, mean loss: 0.3447215181834505
Epoch: 37, step: 1330, loss: 0.29820001125335693, mean loss: 0.3447206686152164
Epoch: 37, step: 1331, loss: 0.3404453992843628, mean loss: 0.3447205905423652
Epoch: 37, step: 1332, loss: 0.38455602526664734, mean loss: 0.34472131798406136
Epoch: 37, step: 1333, loss: 0.41049015522003174, mean loss: 0.3447225189781309
Epoch: 37, step: 1334, loss: 0.3331769108772278, mean loss: 0.3447223081495039
Epoch: 37, step: 1335, loss: 0.33276674151420593, mean loss: 0.34472208983881375
Epoch: 37, step: 1336, loss: 0.33317282795906067, mean loss: 0.34472187895116874
Epoch: 37, step: 1337, loss: 0.3031049370765686, mean loss: 0.34472111904644914
Epoch: 37, step: 1338, loss: 0.32822659611701965, mean loss: 0.34472081787013986
Epoch: 37, step: 1339, loss: 0.310639888048172, mean loss: 0.34472019559198797
Epoch: 37, step: 1340, loss: 0.3384508490562439, mean loss: 0.3447200811230998
Epoch: 37, step: 1341, loss: 0.3015339970588684, mean loss: 0.3447192926242124
Epoch: 37, step: 1342, loss: 0.2902803122997284, mean loss: 0.3447182986861736
Epoch: 37, step: 1343, loss: 0.328708291053772, mean loss: 0.3447180063833979
Epoch: 37, step: 1344, loss: 0.36102524399757385, mean loss: 0.34471830410741544
Epoch: 37, step: 1345, loss: 0.3513077199459076, mean loss: 0.34471842440930756
Epoch: 37, step: 1346, loss: 0.32736146450042725, mean loss: 0.34471810753190163
Epoch: 37, step: 1347, loss: 0.35775524377822876, mean loss: 0.3447183455400849
Epoch: 37, step: 1348, loss: 0.32770490646362305, mean loss: 0.3447180349455091
Epoch: 37, step: 1349, loss: 0.3212326169013977, mean loss: 0.34471760620736525
Epoch: 37, step: 1350, loss: 0.32336410880088806, mean loss: 0.3447172163956234
Epoch: 37, step: 1351, loss: 0.36589643359184265, mean loss: 0.3447176030187924
Epoch: 37, step: 1352, loss: 0.3662185072898865, mean loss: 0.34471799550714183
Epoch: 37, step: 1353, loss: 0.3029611110687256, mean loss: 0.3447172332698296
Epoch: 37, step: 1354, loss: 0.34396007657051086, mean loss: 0.344717219448814
Epoch: 37, step: 1355, loss: 0.35788199305534363, mean loss: 0.3447174597520706
Epoch: 37, step: 1356, loss: 0.34704580903053284, mean loss: 0.34471750225182923
Epoch: 37, step: 1357, loss: 0.32985958456993103, mean loss: 0.34471723105266006
Epoch: 37, step: 1358, loss: 0.3259740173816681, mean loss: 0.3447168889420559
Epoch: 37, step: 1359, loss: 0.3452376425266266, mean loss: 0.34471689844693987
Epoch: 37, step: 1360, loss: 0.3369983434677124, mean loss: 0.34471675756911807
Epoch: 37, step: 1361, loss: 0.3343130350112915, mean loss: 0.344716567685516
Epoch: 37, step: 1362, loss: 0.4381716549396515, mean loss: 0.34471827335044736
Epoch: 37, step: 1363, loss: 0.31945401430130005, mean loss: 0.3447178122565094
Epoch: 37, step: 1364, loss: 0.2929932475090027, mean loss: 0.34471686825700676
Epoch: 37, step: 1365, loss: 0.3579190969467163, mean loss: 0.3447171091999693
Epoch: 37, step: 1366, loss: 0.3184606730937958, mean loss: 0.3447166300242031
Epoch: 37, step: 1367, loss: 0.3529764413833618, mean loss: 0.3447167807616905
Epoch: 37, step: 1368, loss: 0.2977151572704315, mean loss: 0.34471592302087456
Epoch: 37, step: 1369, loss: 0.3352772891521454, mean loss: 0.34471575077674393
Epoch: 37, step: 1370, loss: 0.3596220910549164, mean loss: 0.3447160227952165
Epoch: 37, step: 1371, loss: 0.30358341336250305, mean loss: 0.34471527220015385
Epoch: 37, step: 1372, loss: 0.3448210656642914, mean loss: 0.3447152741306563
Epoch: 37, step: 1373, loss: 0.36630716919898987, mean loss: 0.3447156681289605
Epoch: 37, step: 1374, loss: 0.3062078356742859, mean loss: 0.3447149654697547
Epoch: 37, step: 1375, loss: 0.33831703662872314, mean loss: 0.3447148487277497
Epoch: 37, step: 1376, loss: 0.3203281760215759, mean loss: 0.34471440375607365
Epoch: 37, step: 1377, loss: 0.3444635272026062, mean loss: 0.3447143991785355
Epoch: 37, step: 1378, loss: 0.364540159702301, mean loss: 0.34471476091627934
Epoch: 37, step: 1379, loss: 0.35311487317085266, mean loss: 0.34471491418062494
Epoch: 37, step: 1380, loss: 0.3141869902610779, mean loss: 0.3447143571931973
Epoch: 37, step: 1381, loss: 0.3773939311504364, mean loss: 0.344714953426986
Epoch: 37, step: 1382, loss: 0.3557044267654419, mean loss: 0.34471515392457475
Epoch: 37, step: 1383, loss: 0.43433624505996704, mean loss: 0.34471678898790276
Epoch: 37, step: 1384, loss: 0.33236071467399597, mean loss: 0.34471656356557023
Epoch: 37, step: 1385, loss: 0.3039967119693756, mean loss: 0.34471582069237
Epoch: 37, step: 1386, loss: 0.34953704476356506, mean loss: 0.3447159086468363
Epoch: 37, step: 1387, loss: 0.3073393702507019, mean loss: 0.34471522679229755
Epoch: 37, step: 1388, loss: 0.3254063129425049, mean loss: 0.3447148745491275
Epoch: 37, step: 1389, loss: 0.3075251579284668, mean loss: 0.34471419612750287
Epoch: 37, step: 1390, loss: 0.28502702713012695, mean loss: 0.344713107323092
Epoch: 37, step: 1391, loss: 0.31725528836250305, mean loss: 0.3447126064508016
Epoch: 37, step: 1392, loss: 0.30704382061958313, mean loss: 0.3447119193275125
Epoch: 37, step: 1393, loss: 0.32591572403907776, mean loss: 0.34471157646889206
Epoch: 37, step: 1394, loss: 0.3043923079967499, mean loss: 0.3447108410244897
Epoch: 37, step: 1395, loss: 0.30530911684036255, mean loss: 0.3447101223296811
Epoch: 37, step: 1396, loss: 0.33839380741119385, mean loss: 0.3447100071210187
Epoch: 37, step: 1397, loss: 0.3423396050930023, mean loss: 0.34470996388602015
Epoch: 37, step: 1398, loss: 0.3117630183696747, mean loss: 0.3447093629604631
Epoch: 37, step: 1399, loss: 0.33608534932136536, mean loss: 0.3447092056683197
Epoch: 37, step: 1400, loss: 0.3266247510910034, mean loss: 0.34470887583457155
Epoch: 37, step: 1401, loss: 0.29055821895599365, mean loss: 0.344707888224561
Epoch: 37, step: 1402, loss: 0.3003489673137665, mean loss: 0.34470707921285393
Epoch: 37, step: 1403, loss: 0.3220495283603668, mean loss: 0.34470666599519173
Epoch: 37, step: 1404, loss: 0.3438583016395569, mean loss: 0.3447066505234073
Epoch: 37, step: 1405, loss: 0.34426528215408325, mean loss: 0.344706642474234
Epoch: 37, step: 1406, loss: 0.3551867604255676, mean loss: 0.344706833595196
Epoch: 37, step: 1407, loss: 0.3142046332359314, mean loss: 0.3447062773511162
Epoch: 37, step: 1408, loss: 0.34318774938583374, mean loss: 0.3447062496594488
Epoch: 37, step: 1409, loss: 0.3265170753002167, mean loss: 0.34470591797021216
Epoch: 37, step: 1410, loss: 0.3325909674167633, mean loss: 0.3447056970516952
Epoch: 37, step: 1411, loss: 0.35995015501976013, mean loss: 0.3447059750323292
Epoch: 37, step: 1412, loss: 0.3103400766849518, mean loss: 0.3447053483862369
Epoch: 37, step: 1413, loss: 0.3196924328804016, mean loss: 0.3447048922957313
Epoch: 37, step: 1414, loss: 0.3427196145057678, mean loss: 0.34470485609643897
Epoch: 37, step: 1415, loss: 0.3295496106147766, mean loss: 0.3447045797627383
Epoch: 37, step: 1416, loss: 0.3156050145626068, mean loss: 0.3447040491844686
Epoch: 37, step: 1417, loss: 0.36401763558387756, mean loss: 0.34470440132658287
Epoch: 37, step: 1418, loss: 0.3349839746952057, mean loss: 0.344704224098537
Epoch: 37, step: 1419, loss: 0.3772704601287842, mean loss: 0.34470481785284035
Epoch: 37, step: 1420, loss: 0.3746589720249176, mean loss: 0.34470536397317386
Epoch: 37, step: 1421, loss: 0.2767506241798401, mean loss: 0.3447041250535787
Epoch: 37, step: 1422, loss: 0.3340226709842682, mean loss: 0.3447039303177659
Epoch: 37, step: 1423, loss: 0.2973717153072357, mean loss: 0.3447030674100322
Epoch: 37, step: 1424, loss: 0.29754260182380676, mean loss: 0.3447022076491151
Epoch: 37, step: 1425, loss: 0.30740442872047424, mean loss: 0.34470152770273144
Epoch: 37, step: 1426, loss: 0.31088563799858093, mean loss: 0.3447009112431616
Epoch: 37, step: 1427, loss: 0.32015979290008545, mean loss: 0.3447004638697049
Epoch: 37, step: 1428, loss: 0.36127039790153503, mean loss: 0.3447007659265806
Epoch: 37, step: 1429, loss: 0.3321138918399811, mean loss: 0.34470053648194016
Epoch: 37, step: 1430, loss: 0.3467179536819458, mean loss: 0.3447005732565296
Epoch: 37, step: 1431, loss: 0.3541845679283142, mean loss: 0.3447007461328451
Epoch: 37, step: 1432, loss: 0.33835217356681824, mean loss: 0.3447006304117944
Epoch: 37, step: 1433, loss: 0.34261077642440796, mean loss: 0.34470059231887057
Epoch: 37, step: 1434, loss: 0.31714075803756714, mean loss: 0.3447000899796933
Epoch: 37, step: 1435, loss: 0.33331725001335144, mean loss: 0.34469988250594064
Epoch: 37, step: 1436, loss: 0.3501719832420349, mean loss: 0.34469998224349163
Epoch: 37, step: 1437, loss: 0.3034449815750122, mean loss: 0.34469923032061284
Epoch: 37, step: 1438, loss: 0.31364917755126953, mean loss: 0.34469866440571373
Epoch: 37, step: 1439, loss: 0.308184415102005, mean loss: 0.34469799891308955
Epoch: 37, step: 1440, loss: 0.3049210011959076, mean loss: 0.3446972739682625
Epoch: 37, step: 1441, loss: 0.32096055150032043, mean loss: 0.344696841368983
Epoch: 37, step: 1442, loss: 0.2939051389694214, mean loss: 0.3446959157123994
Epoch: 37, step: 1443, loss: 0.3398316204547882, mean loss: 0.34469582706435925
Valid: 37, mean loss: 0.18614689509073892
Epoch: 38, step: 0, loss: 0.33317533135414124, mean loss: 0.34469561711601104
Epoch: 38, step: 1, loss: 0.32121217250823975, mean loss: 0.3446951891638915
Epoch: 38, step: 2, loss: 0.35223498940467834, mean loss: 0.3446953265634403
Epoch: 38, step: 3, loss: 0.31802693009376526, mean loss: 0.34469484058785044
Epoch: 38, step: 4, loss: 0.33776938915252686, mean loss: 0.34469471438832355
Epoch: 38, step: 5, loss: 0.3353569805622101, mean loss: 0.3446945442339115
Epoch: 38, step: 6, loss: 0.30794525146484375, mean loss: 0.3446938745917393
Epoch: 38, step: 7, loss: 0.3528333306312561, mean loss: 0.3446940229054426
Epoch: 38, step: 8, loss: 0.36605292558670044, mean loss: 0.3446944120911841
Epoch: 38, step: 9, loss: 0.2970864176750183, mean loss: 0.34469354463018753
Epoch: 38, step: 10, loss: 0.321128785610199, mean loss: 0.3446931152666502
Epoch: 38, step: 11, loss: 0.3379720151424408, mean loss: 0.34469299280655025
Epoch: 38, step: 12, loss: 0.3361743986606598, mean loss: 0.3446928375984944
Epoch: 38, step: 13, loss: 0.3346036672592163, mean loss: 0.344692653778024
Epoch: 38, step: 14, loss: 0.3583771586418152, mean loss: 0.3446929030994455
Epoch: 38, step: 15, loss: 0.3103662431240082, mean loss: 0.3446922777048242
Epoch: 38, step: 16, loss: 0.3295549154281616, mean loss: 0.34469200192347865
Epoch: 38, step: 17, loss: 0.29775023460388184, mean loss: 0.344691146726406
Epoch: 38, step: 18, loss: 0.30680954456329346, mean loss: 0.3446904566023025
Epoch: 38, step: 19, loss: 0.3251217305660248, mean loss: 0.34469010010725704
Epoch: 38, step: 20, loss: 0.3105885982513428, mean loss: 0.34468947887136436
Epoch: 38, step: 21, loss: 0.3249172866344452, mean loss: 0.3446891186827784
Epoch: 38, step: 22, loss: 0.30720070004463196, mean loss: 0.34468843577142694
Epoch: 38, step: 23, loss: 0.3109248876571655, mean loss: 0.34468782072573845
Epoch: 38, step: 24, loss: 0.27988719940185547, mean loss: 0.34468664032204926
Epoch: 38, step: 25, loss: 0.3113279640674591, mean loss: 0.3446860326737514
Epoch: 38, step: 26, loss: 0.34983521699905396, mean loss: 0.34468612646752406
Epoch: 38, step: 27, loss: 0.315364271402359, mean loss: 0.3446855923718034
Epoch: 38, step: 28, loss: 0.3474300503730774, mean loss: 0.3446856423610204
Epoch: 38, step: 29, loss: 0.36699533462524414, mean loss: 0.34468604871583924
Epoch: 38, step: 30, loss: 0.3200933337211609, mean loss: 0.3446856007855805
Epoch: 38, step: 31, loss: 0.30051231384277344, mean loss: 0.34468479623059467
Epoch: 38, step: 32, loss: 0.35347655415534973, mean loss: 0.34468495635732127
Epoch: 38, step: 33, loss: 0.3183378279209137, mean loss: 0.3446844764985001
Epoch: 38, step: 34, loss: 0.3400534987449646, mean loss: 0.34468439215628954
Epoch: 38, step: 35, loss: 0.3470395803451538, mean loss: 0.34468443504964186
Epoch: 38, step: 36, loss: 0.32825958728790283, mean loss: 0.34468413592112446
Epoch: 38, step: 37, loss: 0.3325478732585907, mean loss: 0.3446839149001326
Epoch: 38, step: 38, loss: 0.33095306158065796, mean loss: 0.3446836648436172
Epoch: 38, step: 39, loss: 0.3424488604068756, mean loss: 0.34468362414569254
Epoch: 38, step: 40, loss: 0.36318689584732056, mean loss: 0.3446839611018177
Epoch: 38, step: 41, loss: 0.35203877091407776, mean loss: 0.34468409503505537
Epoch: 38, step: 42, loss: 0.3248107433319092, mean loss: 0.34468373314209894
Epoch: 38, step: 43, loss: 0.3200187087059021, mean loss: 0.34468328400114845
Epoch: 38, step: 44, loss: 0.32036107778549194, mean loss: 0.34468284111085556
Epoch: 38, step: 45, loss: 0.3427831828594208, mean loss: 0.34468280652004285
Epoch: 38, step: 46, loss: 0.3521699905395508, mean loss: 0.34468294285144035
Epoch: 38, step: 47, loss: 0.3187715709209442, mean loss: 0.3446824710493295
Epoch: 38, step: 48, loss: 0.31430405378341675, mean loss: 0.3446819179199752
Epoch: 38, step: 49, loss: 0.3177834451198578, mean loss: 0.34468142816226793
Epoch: 38, step: 50, loss: 0.2869866192340851, mean loss: 0.3446803776950879
Epoch: 38, step: 51, loss: 0.2885500490665436, mean loss: 0.34467935573149044
Epoch: 38, step: 52, loss: 0.31730520725250244, mean loss: 0.34467885734007525
Epoch: 38, step: 53, loss: 0.32239285111427307, mean loss: 0.3446784515940492
Epoch: 38, step: 54, loss: 0.3246496617794037, mean loss: 0.3446780869502526
Epoch: 38, step: 55, loss: 0.3392271399497986, mean loss: 0.3446779877122137
Epoch: 38, step: 56, loss: 0.3145565688610077, mean loss: 0.3446774393421569
Epoch: 38, step: 57, loss: 0.33084115386009216, mean loss: 0.3446771874527434
Epoch: 38, step: 58, loss: 0.3213805854320526, mean loss: 0.34467676334610015
Epoch: 38, step: 59, loss: 0.3212191164493561, mean loss: 0.3446763363154641
Epoch: 38, step: 60, loss: 0.31301435828208923, mean loss: 0.34467575994100735
Epoch: 38, step: 61, loss: 0.2934194803237915, mean loss: 0.34467482688898826
Epoch: 38, step: 62, loss: 0.34425005316734314, mean loss: 0.3446748191566915
Epoch: 38, step: 63, loss: 0.3619314134120941, mean loss: 0.3446751332784742
Epoch: 38, step: 64, loss: 0.3135397136211395, mean loss: 0.34467456653075124
Epoch: 38, step: 65, loss: 0.2911794185638428, mean loss: 0.3446735927940304
Epoch: 38, step: 66, loss: 0.3277567923069, mean loss: 0.3446732848743288
Epoch: 38, step: 67, loss: 0.3201870322227478, mean loss: 0.344672839183527
Epoch: 38, step: 68, loss: 0.36657169461250305, mean loss: 0.3446732377721116
Epoch: 38, step: 69, loss: 0.32203689217567444, mean loss: 0.3446728257677143
Epoch: 38, step: 70, loss: 0.3114885091781616, mean loss: 0.3446722217905636
Epoch: 38, step: 71, loss: 0.2948431670665741, mean loss: 0.34467131488435504
Epoch: 38, step: 72, loss: 0.3102704882621765, mean loss: 0.3446706887886844
Epoch: 38, step: 73, loss: 0.36706671118736267, mean loss: 0.34467109638928134
Epoch: 38, step: 74, loss: 0.2996516227722168, mean loss: 0.3446702770638656
Epoch: 38, step: 75, loss: 0.34152695536613464, mean loss: 0.3446702198584769
Epoch: 38, step: 76, loss: 0.33993053436279297, mean loss: 0.34467013360239407
Epoch: 38, step: 77, loss: 0.33771950006484985, mean loss: 0.3446700071122478
Epoch: 38, step: 78, loss: 0.3255265951156616, mean loss: 0.3446696587398434
Epoch: 38, step: 79, loss: 0.3191474378108978, mean loss: 0.34466919429412846
Epoch: 38, step: 80, loss: 0.2850324511528015, mean loss: 0.3446681090623278
Epoch: 38, step: 81, loss: 0.35316795110702515, mean loss: 0.34466826373427245
Epoch: 38, step: 82, loss: 0.31519773602485657, mean loss: 0.3446677274677324
Epoch: 38, step: 83, loss: 0.30742764472961426, mean loss: 0.34466704983321134
Epoch: 38, step: 84, loss: 0.3209441304206848, mean loss: 0.3446666181699216
Epoch: 38, step: 85, loss: 0.3444836735725403, mean loss: 0.3446666148411142
Epoch: 38, step: 86, loss: 0.32821986079216003, mean loss: 0.3446663155861414
Epoch: 38, step: 87, loss: 0.32990503311157227, mean loss: 0.3446660470038548
Epoch: 38, step: 88, loss: 0.312794953584671, mean loss: 0.34466546711823737
Epoch: 38, step: 89, loss: 0.31532591581344604, mean loss: 0.3446649333030322
Epoch: 38, step: 90, loss: 0.3326527178287506, mean loss: 0.3446647147520893
Epoch: 38, step: 91, loss: 0.32616889476776123, mean loss: 0.34466437824419355
Epoch: 38, step: 92, loss: 0.29617589712142944, mean loss: 0.3446634960740649
Epoch: 38, step: 93, loss: 0.329216867685318, mean loss: 0.3446632150525536
Epoch: 38, step: 94, loss: 0.37072476744651794, mean loss: 0.3446636891834393
Epoch: 38, step: 95, loss: 0.3123185932636261, mean loss: 0.34466310074842404
Epoch: 38, step: 96, loss: 0.3107757270336151, mean loss: 0.3446624842668851
Epoch: 38, step: 97, loss: 0.3131157457828522, mean loss: 0.34466191037679084
Epoch: 38, step: 98, loss: 0.3095020651817322, mean loss: 0.34466127076963077
Epoch: 38, step: 99, loss: 0.29748860001564026, mean loss: 0.34466041264784597
Epoch: 38, step: 100, loss: 0.37786319851875305, mean loss: 0.3446610166313628
Epoch: 38, step: 101, loss: 0.33420148491859436, mean loss: 0.3446608263681163
Epoch: 38, step: 102, loss: 0.30552205443382263, mean loss: 0.3446601144304731
Epoch: 38, step: 103, loss: 0.3414804935455322, mean loss: 0.34466005659394655
Epoch: 38, step: 104, loss: 0.3594616651535034, mean loss: 0.34466032582669043
Epoch: 38, step: 105, loss: 0.34789180755615234, mean loss: 0.3446603846044148
Epoch: 38, step: 106, loss: 0.35425567626953125, mean loss: 0.3446605591309006
Epoch: 38, step: 107, loss: 0.3554700016975403, mean loss: 0.3446607557377134
Epoch: 38, step: 108, loss: 0.2712383568286896, mean loss: 0.3446594203236811
Epoch: 38, step: 109, loss: 0.3192758560180664, mean loss: 0.3446589586532379
Epoch: 38, step: 110, loss: 0.3164266049861908, mean loss: 0.3446584451790065
Epoch: 38, step: 111, loss: 0.3286384642124176, mean loss: 0.3446581538218669
Epoch: 38, step: 112, loss: 0.392940878868103, mean loss: 0.34465903192907876
Epoch: 38, step: 113, loss: 0.386474609375, mean loss: 0.34465979240588096
Epoch: 38, step: 114, loss: 0.3374849855899811, mean loss: 0.34465966192400677
Epoch: 38, step: 115, loss: 0.3293410539627075, mean loss: 0.3446593833430807
Epoch: 38, step: 116, loss: 0.2973916828632355, mean loss: 0.3446585237584278
Epoch: 38, step: 117, loss: 0.35722365975379944, mean loss: 0.3446587522569911
Epoch: 38, step: 118, loss: 0.3461052179336548, mean loss: 0.3446587785606713
Epoch: 38, step: 119, loss: 0.37055179476737976, mean loss: 0.3446592494112715
Epoch: 38, step: 120, loss: 0.3416071832180023, mean loss: 0.3446591939120954
Epoch: 38, step: 121, loss: 0.32447683811187744, mean loss: 0.3446588269201363
Epoch: 38, step: 122, loss: 0.2802875339984894, mean loss: 0.34465765642658375
Epoch: 38, step: 123, loss: 0.3459662199020386, mean loss: 0.3446576802203774
Epoch: 38, step: 124, loss: 0.34659597277641296, mean loss: 0.3446577154639826
Epoch: 38, step: 125, loss: 0.331839382648468, mean loss: 0.34465748239491073
Epoch: 38, step: 126, loss: 0.4045824110507965, mean loss: 0.3446585719588784
Epoch: 38, step: 127, loss: 0.34137189388275146, mean loss: 0.34465851220109517
Epoch: 38, step: 128, loss: 0.3162231743335724, mean loss: 0.3446579952043521
Epoch: 38, step: 129, loss: 0.3251725435256958, mean loss: 0.344657640936295
Epoch: 38, step: 130, loss: 0.3126015067100525, mean loss: 0.3446570581292803
Epoch: 38, step: 131, loss: 0.33680158853530884, mean loss: 0.34465691531294707
Epoch: 38, step: 132, loss: 0.29854676127433777, mean loss: 0.3446560770227182
Epoch: 38, step: 133, loss: 0.3522110879421234, mean loss: 0.3446562143715696
Epoch: 38, step: 134, loss: 0.31915563344955444, mean loss: 0.34465575078364585
Epoch: 38, step: 135, loss: 0.29292383790016174, mean loss: 0.3446548103402034
Epoch: 38, step: 136, loss: 0.3270730972290039, mean loss: 0.34465449072499293
Epoch: 38, step: 137, loss: 0.3273705840110779, mean loss: 0.3446541765292701
Epoch: 38, step: 138, loss: 0.3604557514190674, mean loss: 0.344654463773183
Epoch: 38, step: 139, loss: 0.3247925639152527, mean loss: 0.3446541027265048
Epoch: 38, step: 140, loss: 0.3026021718978882, mean loss: 0.34465333832662065
Epoch: 38, step: 141, loss: 0.32873502373695374, mean loss: 0.34465304897637183
Epoch: 38, step: 142, loss: 0.338704913854599, mean loss: 0.3446529408579474
Epoch: 38, step: 143, loss: 0.3091965913772583, mean loss: 0.34465229638453093
Epoch: 38, step: 144, loss: 0.35323888063430786, mean loss: 0.3446524524560043
Epoch: 38, step: 145, loss: 0.3321787714958191, mean loss: 0.3446522257360043
Epoch: 38, step: 146, loss: 0.3251870572566986, mean loss: 0.34465187194606844
Epoch: 38, step: 147, loss: 0.335225373506546, mean loss: 0.344651700617489
Epoch: 38, step: 148, loss: 0.33634820580482483, mean loss: 0.34465154970247813
Epoch: 38, step: 149, loss: 0.3699657917022705, mean loss: 0.34465200977739363
Epoch: 38, step: 150, loss: 0.31602513790130615, mean loss: 0.34465148950638197
Epoch: 38, step: 151, loss: 0.3247095048427582, mean loss: 0.344651127082991
Epoch: 38, step: 152, loss: 0.34122759103775024, mean loss: 0.34465106486516195
Epoch: 38, step: 153, loss: 0.3704502284526825, mean loss: 0.3446515337192234
Epoch: 38, step: 154, loss: 0.3337756097316742, mean loss: 0.3446513360721776
Epoch: 38, step: 155, loss: 0.3435792922973633, mean loss: 0.3446513165903906
Epoch: 38, step: 156, loss: 0.37578991055488586, mean loss: 0.3446518824482831
Epoch: 38, step: 157, loss: 0.3652079999446869, mean loss: 0.34465225599212274
Epoch: 38, step: 158, loss: 0.2875615060329437, mean loss: 0.3446512185632198
Epoch: 38, step: 159, loss: 0.3453059196472168, mean loss: 0.3446512304599541
Epoch: 38, step: 160, loss: 0.3380460739135742, mean loss: 0.3446511104382118
Epoch: 38, step: 161, loss: 0.32254743576049805, mean loss: 0.34465070880150217
Epoch: 38, step: 162, loss: 0.37166938185691833, mean loss: 0.34465119973768926
Epoch: 38, step: 163, loss: 0.3350890278816223, mean loss: 0.3446510259937425
Epoch: 38, step: 164, loss: 0.32568007707595825, mean loss: 0.3446506812992839
Epoch: 38, step: 165, loss: 0.36237266659736633, mean loss: 0.3446510032947288
Epoch: 38, step: 166, loss: 0.3059903383255005, mean loss: 0.3446503008716294
Epoch: 38, step: 167, loss: 0.3243066072463989, mean loss: 0.3446499312551028
Epoch: 38, step: 168, loss: 0.32190266251564026, mean loss: 0.34464951797647886
Epoch: 38, step: 169, loss: 0.31005406379699707, mean loss: 0.3446488894481881
Epoch: 38, step: 170, loss: 0.32417547702789307, mean loss: 0.3446485174951256
Epoch: 38, step: 171, loss: 0.3150472939014435, mean loss: 0.3446479797212793
Epoch: 38, step: 172, loss: 0.37800535559654236, mean loss: 0.3446485857232027
Epoch: 38, step: 173, loss: 0.3637748062610626, mean loss: 0.3446489331820651
Epoch: 38, step: 174, loss: 0.32776975631713867, mean loss: 0.3446486265499713
Epoch: 38, step: 175, loss: 0.35266590118408203, mean loss: 0.3446487721914957
Epoch: 38, step: 176, loss: 0.32367196679115295, mean loss: 0.344648391134521
Epoch: 38, step: 177, loss: 0.33203113079071045, mean loss: 0.34464816193814785
Epoch: 38, step: 178, loss: 0.3140767216682434, mean loss: 0.3446476066087211
Epoch: 38, step: 179, loss: 0.3582885265350342, mean loss: 0.34464785439118
Epoch: 38, step: 180, loss: 0.34406915307044983, mean loss: 0.3446478438794673
Epoch: 38, step: 181, loss: 0.3172616958618164, mean loss: 0.3446473464379005
Epoch: 38, step: 182, loss: 0.3063349723815918, mean loss: 0.344646650545174
Epoch: 38, step: 183, loss: 0.32672762870788574, mean loss: 0.3446463250761636
Epoch: 38, step: 184, loss: 0.329541951417923, mean loss: 0.3446460507355047
Epoch: 38, step: 185, loss: 0.3319460153579712, mean loss: 0.34464582006901884
Epoch: 38, step: 186, loss: 0.332951158285141, mean loss: 0.3446456076666544
Epoch: 38, step: 187, loss: 0.35135313868522644, mean loss: 0.3446457294888669
Epoch: 38, step: 188, loss: 0.30314046144485474, mean loss: 0.34464497568366825
Epoch: 38, step: 189, loss: 0.3393724262714386, mean loss: 0.34464487992707726
Epoch: 38, step: 190, loss: 0.36285561323165894, mean loss: 0.34464521065248827
Epoch: 38, step: 191, loss: 0.3296091854572296, mean loss: 0.3446449375879598
Epoch: 38, step: 192, loss: 0.3002891540527344, mean loss: 0.34464413207114264
Epoch: 38, step: 193, loss: 0.37746840715408325, mean loss: 0.3446447281608365
Epoch: 38, step: 194, loss: 0.3247744143009186, mean loss: 0.34464436732197007
Epoch: 38, step: 195, loss: 0.3338927924633026, mean loss: 0.34464417208018067
Epoch: 38, step: 196, loss: 0.3384712338447571, mean loss: 0.3446440599855678
Epoch: 38, step: 197, loss: 0.3175087869167328, mean loss: 0.34464356724409206
Epoch: 38, step: 198, loss: 0.316440612077713, mean loss: 0.3446430551241893
Epoch: 38, step: 199, loss: 0.3301159739494324, mean loss: 0.34464279134075715
Epoch: 38, step: 200, loss: 0.33697211742401123, mean loss: 0.3446426520588238
Epoch: 38, step: 201, loss: 0.3159847855567932, mean loss: 0.3446421317068155
Epoch: 38, step: 202, loss: 0.32278111577033997, mean loss: 0.34464173477506904
Epoch: 38, step: 203, loss: 0.3646593987941742, mean loss: 0.3446420982303675
Epoch: 38, step: 204, loss: 0.30891484022140503, mean loss: 0.344641449552008
Epoch: 38, step: 205, loss: 0.3064383864402771, mean loss: 0.3446407559345362
Epoch: 38, step: 206, loss: 0.31740108132362366, mean loss: 0.344640261378088
Epoch: 38, step: 207, loss: 0.317557692527771, mean loss: 0.34463976968293825
Epoch: 38, step: 208, loss: 0.31350383162498474, mean loss: 0.34463920440747015
Epoch: 38, step: 209, loss: 0.35315170884132385, mean loss: 0.34463935894986936
Epoch: 38, step: 210, loss: 0.3219361901283264, mean loss: 0.344638946786973
Epoch: 38, step: 211, loss: 0.30662673711776733, mean loss: 0.3446382567098241
Epoch: 38, step: 212, loss: 0.32482028007507324, mean loss: 0.34463789693898567
Epoch: 38, step: 213, loss: 0.3526274859905243, mean loss: 0.34463804197745374
Epoch: 38, step: 214, loss: 0.3131517767906189, mean loss: 0.34463747040403014
Epoch: 38, step: 215, loss: 0.35061851143836975, mean loss: 0.3446375789765148
Epoch: 38, step: 216, loss: 0.38594114780426025, mean loss: 0.3446383287372443
Epoch: 38, step: 217, loss: 0.3155757188796997, mean loss: 0.34463780118941606
Epoch: 38, step: 218, loss: 0.31299784779548645, mean loss: 0.3446372268677774
Epoch: 38, step: 219, loss: 0.3343745768070221, mean loss: 0.344637040585739
Epoch: 38, step: 220, loss: 0.3585303723812103, mean loss: 0.34463729276535887
Epoch: 38, step: 221, loss: 0.32107532024383545, mean loss: 0.34463686509678293
Epoch: 38, step: 222, loss: 0.400908499956131, mean loss: 0.34463788645325555
Epoch: 38, step: 223, loss: 0.34139004349708557, mean loss: 0.34463782750445787
Epoch: 38, step: 224, loss: 0.2962814271450043, mean loss: 0.34463694984505067
Epoch: 38, step: 225, loss: 0.30197402834892273, mean loss: 0.3446361755352482
Epoch: 38, step: 226, loss: 0.3428442180156708, mean loss: 0.3446361430127429
Epoch: 38, step: 227, loss: 0.3180857300758362, mean loss: 0.3446356611540689
Epoch: 38, step: 228, loss: 0.2991611063480377, mean loss: 0.3446348358595224
Epoch: 38, step: 229, loss: 0.33426520228385925, mean loss: 0.34463464766973667
Epoch: 38, step: 230, loss: 0.33325859904289246, mean loss: 0.34463444121911463
Epoch: 38, step: 231, loss: 0.35028886795043945, mean loss: 0.34463454383284015
Epoch: 38, step: 232, loss: 0.31898221373558044, mean loss: 0.3446340783155532
Epoch: 38, step: 233, loss: 0.3341788351535797, mean loss: 0.3446338885858838
Epoch: 38, step: 234, loss: 0.3899518549442291, mean loss: 0.34463471094903836
Epoch: 38, step: 235, loss: 0.34729957580566406, mean loss: 0.3446347593061708
Epoch: 38, step: 236, loss: 0.3665113151073456, mean loss: 0.3446351562750108
Epoch: 38, step: 237, loss: 0.3252403736114502, mean loss: 0.3446348043464558
Epoch: 38, step: 238, loss: 0.31735745072364807, mean loss: 0.3446343093934769
Epoch: 38, step: 239, loss: 0.3417433798313141, mean loss: 0.34463425693793975
Epoch: 38, step: 240, loss: 0.3536529242992401, mean loss: 0.34463442057750504
Epoch: 38, step: 241, loss: 0.39544031023979187, mean loss: 0.34463534241024557
Epoch: 38, step: 242, loss: 0.3040614724159241, mean loss: 0.34463460624277764
Epoch: 38, step: 243, loss: 0.34051716327667236, mean loss: 0.344634531537738
Epoch: 38, step: 244, loss: 0.3154749274253845, mean loss: 0.3446340024885497
Epoch: 38, step: 245, loss: 0.3157694339752197, mean loss: 0.3446334788017593
Epoch: 38, step: 246, loss: 0.3507484197616577, mean loss: 0.3446335897424687
Epoch: 38, step: 247, loss: 0.30462726950645447, mean loss: 0.3446328639384006
Epoch: 38, step: 248, loss: 0.4024502635002136, mean loss: 0.34463391285622796
Epoch: 38, step: 249, loss: 0.357242614030838, mean loss: 0.34463414159794953
Epoch: 38, step: 250, loss: 0.33636313676834106, mean loss: 0.34463399155160174
Epoch: 38, step: 251, loss: 0.3468565344810486, mean loss: 0.34463403187057223
Epoch: 38, step: 252, loss: 0.30156299471855164, mean loss: 0.34463325053656496
Epoch: 38, step: 253, loss: 0.3433923125267029, mean loss: 0.3446332280256262
Epoch: 38, step: 254, loss: 0.3360951840877533, mean loss: 0.3446330731460946
Epoch: 38, step: 255, loss: 0.311964213848114, mean loss: 0.3446324805459767
Epoch: 38, step: 256, loss: 0.36097240447998047, mean loss: 0.34463277694032335
Epoch: 38, step: 257, loss: 0.3630903661251068, mean loss: 0.34463311174150574
Epoch: 38, step: 258, loss: 0.3616441786289215, mean loss: 0.3446334202987038
Epoch: 38, step: 259, loss: 0.3094453811645508, mean loss: 0.3446327820479758
Epoch: 38, step: 260, loss: 0.3450770676136017, mean loss: 0.34463279010640846
Epoch: 38, step: 261, loss: 0.3347857594490051, mean loss: 0.3446326115046263
Epoch: 38, step: 262, loss: 0.3270215690135956, mean loss: 0.3446322920878767
Epoch: 38, step: 263, loss: 0.3331952691078186, mean loss: 0.34463208465492945
Epoch: 38, step: 264, loss: 0.3326249420642853, mean loss: 0.34463186688568936
Epoch: 38, step: 265, loss: 0.34078770875930786, mean loss: 0.3446317971668362
Epoch: 38, step: 266, loss: 0.326732337474823, mean loss: 0.3446314725425287
Epoch: 38, step: 267, loss: 0.3181856870651245, mean loss: 0.34463099293089505
Epoch: 38, step: 268, loss: 0.30366218090057373, mean loss: 0.3446302499481412
Epoch: 38, step: 269, loss: 0.32818517088890076, mean loss: 0.34462995171668315
Epoch: 38, step: 270, loss: 0.32138592004776, mean loss: 0.3446295301938848
Epoch: 38, step: 271, loss: 0.30669504404067993, mean loss: 0.3446288422770461
Epoch: 38, step: 272, loss: 0.3541398346424103, mean loss: 0.34462901474948
Epoch: 38, step: 273, loss: 0.314291775226593, mean loss: 0.3446284646236409
Epoch: 38, step: 274, loss: 0.33790647983551025, mean loss: 0.34462834273152004
Epoch: 38, step: 275, loss: 0.3513025641441345, mean loss: 0.3446284637553362
Epoch: 38, step: 276, loss: 0.33843177556991577, mean loss: 0.3446283513926789
Epoch: 38, step: 277, loss: 0.3492802381515503, mean loss: 0.3446284357423935
Epoch: 38, step: 278, loss: 0.33952826261520386, mean loss: 0.3446283432658631
Epoch: 38, step: 279, loss: 0.3049837648868561, mean loss: 0.34462762444191514
Epoch: 38, step: 280, loss: 0.3435502350330353, mean loss: 0.3446276049073584
Epoch: 38, step: 281, loss: 0.323810875415802, mean loss: 0.3446272274781694
Epoch: 38, step: 282, loss: 0.3442173898220062, mean loss: 0.34462722004751656
Epoch: 38, step: 283, loss: 0.3284721374511719, mean loss: 0.3446269271495073
Epoch: 38, step: 284, loss: 0.3388507068157196, mean loss: 0.3446268224262567
Epoch: 38, step: 285, loss: 0.34451982378959656, mean loss: 0.34462682048639964
Epoch: 38, step: 286, loss: 0.33949026465415955, mean loss: 0.3446267273636847
Epoch: 38, step: 287, loss: 0.32328957319259644, mean loss: 0.3446263405407302
Epoch: 38, step: 288, loss: 0.3157578408718109, mean loss: 0.34462581719090574
Epoch: 38, step: 289, loss: 0.3461102545261383, mean loss: 0.3446258441014118
Epoch: 38, step: 290, loss: 0.31394219398498535, mean loss: 0.34462528786534563
Epoch: 38, step: 291, loss: 0.35255783796310425, mean loss: 0.3446254316647456
Epoch: 38, step: 292, loss: 0.33328282833099365, mean loss: 0.344625226052431
Epoch: 38, step: 293, loss: 0.3407142162322998, mean loss: 0.34462515515713643
Epoch: 38, step: 294, loss: 0.3305529057979584, mean loss: 0.3446249000725866
Epoch: 38, step: 295, loss: 0.33962756395339966, mean loss: 0.34462480948862273
Epoch: 38, step: 296, loss: 0.3155014216899872, mean loss: 0.34462428159455544
Epoch: 38, step: 297, loss: 0.3158372938632965, mean loss: 0.34462375980757465
Epoch: 38, step: 298, loss: 0.3277732729911804, mean loss: 0.3446234543846746
Epoch: 38, step: 299, loss: 0.31528574228286743, mean loss: 0.34462292263465466
Epoch: 38, step: 300, loss: 0.3283608555793762, mean loss: 0.34462262788782094
Epoch: 38, step: 301, loss: 0.3146739602088928, mean loss: 0.34462208508382486
Epoch: 38, step: 302, loss: 0.33040809631347656, mean loss: 0.34462182746735415
Epoch: 38, step: 303, loss: 0.3352108299732208, mean loss: 0.3446216569041112
Epoch: 38, step: 304, loss: 0.3160121440887451, mean loss: 0.3446211383997921
Epoch: 38, step: 305, loss: 0.32688915729522705, mean loss: 0.3446208170401722
Epoch: 38, step: 306, loss: 0.3359609842300415, mean loss: 0.3446206600994373
Epoch: 38, step: 307, loss: 0.30000171065330505, mean loss: 0.3446198514921621
Epoch: 38, step: 308, loss: 0.32213231921195984, mean loss: 0.3446194439690603
Epoch: 38, step: 309, loss: 0.3137184977531433, mean loss: 0.3446188839867071
Epoch: 38, step: 310, loss: 0.31456348299980164, mean loss: 0.34461833933706887
Epoch: 38, step: 311, loss: 0.33351781964302063, mean loss: 0.3446181381823919
Epoch: 38, step: 312, loss: 0.3482316732406616, mean loss: 0.3446182036627771
Epoch: 38, step: 313, loss: 0.33578649163246155, mean loss: 0.3446180436274053
Epoch: 38, step: 314, loss: 0.32349666953086853, mean loss: 0.34461766090368234
Epoch: 38, step: 315, loss: 0.361919105052948, mean loss: 0.34461797440379377
Epoch: 38, step: 316, loss: 0.35868576169013977, mean loss: 0.34461822930580843
Epoch: 38, step: 317, loss: 0.3221927881240845, mean loss: 0.34461782297420523
Epoch: 38, step: 318, loss: 0.3411564528942108, mean loss: 0.34461776025800006
Epoch: 38, step: 319, loss: 0.29475438594818115, mean loss: 0.3446168568050665
Epoch: 38, step: 320, loss: 0.31683140993118286, mean loss: 0.34461635338168173
Epoch: 38, step: 321, loss: 0.33235472440719604, mean loss: 0.34461613122657475
Epoch: 38, step: 322, loss: 0.33719390630722046, mean loss: 0.3446159967537979
Epoch: 38, step: 323, loss: 0.31184613704681396, mean loss: 0.34461540305389743
Epoch: 38, step: 324, loss: 0.32599514722824097, mean loss: 0.34461506571208855
Epoch: 38, step: 325, loss: 0.3410516381263733, mean loss: 0.34461500115490196
Epoch: 38, step: 326, loss: 0.38538673520088196, mean loss: 0.3446157397866534
Epoch: 38, step: 327, loss: 0.3178008794784546, mean loss: 0.34461525401019855
Epoch: 38, step: 328, loss: 0.32333070039749146, mean loss: 0.3446148684274444
Epoch: 38, step: 329, loss: 0.36880502104759216, mean loss: 0.34461530663896967
Epoch: 38, step: 330, loss: 0.319344162940979, mean loss: 0.3446148488532751
Epoch: 38, step: 331, loss: 0.32099461555480957, mean loss: 0.34461442098150313
Epoch: 38, step: 332, loss: 0.30907565355300903, mean loss: 0.3446137772215642
Epoch: 38, step: 333, loss: 0.3008113503456116, mean loss: 0.34461298378558125
Epoch: 38, step: 334, loss: 0.3230714797973633, mean loss: 0.34461259359042506
Epoch: 38, step: 335, loss: 0.310000479221344, mean loss: 0.34461196665022853
Epoch: 38, step: 336, loss: 0.32414793968200684, mean loss: 0.34461159598553676
Epoch: 38, step: 337, loss: 0.2947940528392792, mean loss: 0.34461069365727837
Epoch: 38, step: 338, loss: 0.3359501361846924, mean loss: 0.34461053679438014
Epoch: 38, step: 339, loss: 0.3239397406578064, mean loss: 0.34461016240482467
Epoch: 38, step: 340, loss: 0.2945496737957001, mean loss: 0.34460925572544465
Epoch: 38, step: 341, loss: 0.3749958276748657, mean loss: 0.3446098060672411
Epoch: 38, step: 342, loss: 0.34666141867637634, mean loss: 0.34460984322403926
Epoch: 38, step: 343, loss: 0.37691372632980347, mean loss: 0.3446104282697344
Epoch: 38, step: 344, loss: 0.3581726849079132, mean loss: 0.34461067388714645
Epoch: 38, step: 345, loss: 0.3048442602157593, mean loss: 0.3446099537159401
Epoch: 38, step: 346, loss: 0.31575238704681396, mean loss: 0.3446094311138164
Epoch: 38, step: 347, loss: 0.3462674021720886, mean loss: 0.34460946113864543
Epoch: 38, step: 348, loss: 0.3293002247810364, mean loss: 0.3446091839028772
Epoch: 38, step: 349, loss: 0.31200912594795227, mean loss: 0.34460859355739976
Epoch: 38, step: 350, loss: 0.35441070795059204, mean loss: 0.34460877105797727
Epoch: 38, step: 351, loss: 0.3548336327075958, mean loss: 0.3446089562104771
Epoch: 38, step: 352, loss: 0.319963663816452, mean loss: 0.3446085099399041
Epoch: 38, step: 353, loss: 0.30369508266448975, mean loss: 0.34460776910357205
Epoch: 38, step: 354, loss: 0.3135021924972534, mean loss: 0.344607205872243
Epoch: 38, step: 355, loss: 0.3220236599445343, mean loss: 0.3446067969574547
Epoch: 38, step: 356, loss: 0.362793892621994, mean loss: 0.34460712626082185
Epoch: 38, step: 357, loss: 0.3848738372325897, mean loss: 0.3446078553339881
Epoch: 38, step: 358, loss: 0.38485944271087646, mean loss: 0.3446085841201295
Epoch: 38, step: 359, loss: 0.3833974003791809, mean loss: 0.3446092864089523
Epoch: 38, step: 360, loss: 0.3471812605857849, mean loss: 0.3446093329748491
Epoch: 38, step: 361, loss: 0.4262029826641083, mean loss: 0.3446108102107851
Epoch: 38, step: 362, loss: 0.3662351071834564, mean loss: 0.34461120170706416
Epoch: 38, step: 363, loss: 0.33028215169906616, mean loss: 0.3446109422920086
Epoch: 38, step: 364, loss: 0.35171568393707275, mean loss: 0.3446110709148818
Epoch: 38, step: 365, loss: 0.34999504685401917, mean loss: 0.3446111683835798
Epoch: 38, step: 366, loss: 0.3399314284324646, mean loss: 0.3446110836655373
Epoch: 38, step: 367, loss: 0.3346250057220459, mean loss: 0.3446109028893254
Epoch: 38, step: 368, loss: 0.30247583985328674, mean loss: 0.34461014013950125
Epoch: 38, step: 369, loss: 0.3059805631637573, mean loss: 0.34460944086038436
Epoch: 38, step: 370, loss: 0.3370128273963928, mean loss: 0.34460930334769563
Epoch: 38, step: 371, loss: 0.37905457615852356, mean loss: 0.34460992685925906
Epoch: 38, step: 372, loss: 0.33849018812179565, mean loss: 0.3446098160847322
Epoch: 38, step: 373, loss: 0.31242942810058594, mean loss: 0.3446092335920995
Epoch: 38, step: 374, loss: 0.33550164103507996, mean loss: 0.34460906873984404
Epoch: 38, step: 375, loss: 0.29287585616111755, mean loss: 0.34460813235820886
Epoch: 38, step: 376, loss: 0.3015211522579193, mean loss: 0.3446073524892501
Epoch: 38, step: 377, loss: 0.3680352568626404, mean loss: 0.34460777652371843
Epoch: 38, step: 378, loss: 0.33960384130477905, mean loss: 0.3446076859563944
Epoch: 38, step: 379, loss: 0.36256906390190125, mean loss: 0.34460801103744026
Epoch: 38, step: 380, loss: 0.3412654399871826, mean loss: 0.34460795054170157
Epoch: 38, step: 381, loss: 0.32448112964630127, mean loss: 0.3446075862817223
Epoch: 38, step: 382, loss: 0.3158431053161621, mean loss: 0.3446070657047434
Epoch: 38, step: 383, loss: 0.32715487480163574, mean loss: 0.3446067498622846
Epoch: 38, step: 384, loss: 0.3475220203399658, mean loss: 0.34460680262067683
Epoch: 38, step: 385, loss: 0.3430282473564148, mean loss: 0.34460677405367723
Epoch: 38, step: 386, loss: 0.3177187740802765, mean loss: 0.34460628747230637
Epoch: 38, step: 387, loss: 0.3096921145915985, mean loss: 0.34460565565593143
Epoch: 38, step: 388, loss: 0.3342130184173584, mean loss: 0.3446054675913427
Epoch: 38, step: 389, loss: 0.33133187890052795, mean loss: 0.34460522739756233
Epoch: 38, step: 390, loss: 0.3674320578575134, mean loss: 0.34460564045567466
Epoch: 38, step: 391, loss: 0.30770647525787354, mean loss: 0.3446049727666692
Epoch: 38, step: 392, loss: 0.31650763750076294, mean loss: 0.34460446435564474
Epoch: 38, step: 393, loss: 0.30123570561408997, mean loss: 0.3446036796279868
Epoch: 38, step: 394, loss: 0.3507937788963318, mean loss: 0.34460379163152
Epoch: 38, step: 395, loss: 0.318226158618927, mean loss: 0.344603314363788
Epoch: 38, step: 396, loss: 0.322496622800827, mean loss: 0.34460291438022467
Epoch: 38, step: 397, loss: 0.3131197988986969, mean loss: 0.34460234475627893
Epoch: 38, step: 398, loss: 0.3194046914577484, mean loss: 0.3446018888634364
Epoch: 38, step: 399, loss: 0.34981364011764526, mean loss: 0.3446019831562294
Epoch: 38, step: 400, loss: 0.32117941975593567, mean loss: 0.3446015593948378
Epoch: 38, step: 401, loss: 0.35869136452674866, mean loss: 0.34460181430320574
Epoch: 38, step: 402, loss: 0.35653218626976013, mean loss: 0.34460203013987634
Epoch: 38, step: 403, loss: 0.3496491312980652, mean loss: 0.3446021214471554
Epoch: 38, step: 404, loss: 0.35424211621284485, mean loss: 0.3446022958414743
Epoch: 38, step: 405, loss: 0.35163167119026184, mean loss: 0.3446024230055422
Epoch: 38, step: 406, loss: 0.3162183165550232, mean loss: 0.3446019095355726
Epoch: 38, step: 407, loss: 0.3377789855003357, mean loss: 0.3446017861107529
Epoch: 38, step: 408, loss: 0.303973525762558, mean loss: 0.34460105116998935
Epoch: 38, step: 409, loss: 0.3364275097846985, mean loss: 0.3446009033182223
Epoch: 38, step: 410, loss: 0.32788482308387756, mean loss: 0.3446006009453367
Epoch: 38, step: 411, loss: 0.31895533204078674, mean loss: 0.3446001370630397
Epoch: 38, step: 412, loss: 0.3583124279975891, mean loss: 0.34460038509217844
Epoch: 38, step: 413, loss: 0.32079240679740906, mean loss: 0.3445999544591376
Epoch: 38, step: 414, loss: 0.3302541971206665, mean loss: 0.3445996949811891
Epoch: 38, step: 415, loss: 0.34094738960266113, mean loss: 0.34459962892154905
Epoch: 38, step: 416, loss: 0.362209290266037, mean loss: 0.3445999474236262
Epoch: 38, step: 417, loss: 0.37593305110931396, mean loss: 0.3446005141283411
Epoch: 38, step: 418, loss: 0.3466636538505554, mean loss: 0.3446005514425463
Epoch: 38, step: 419, loss: 0.3112561106681824, mean loss: 0.34459994838169167
Epoch: 38, step: 420, loss: 0.330932080745697, mean loss: 0.34459970119185507
Epoch: 38, step: 421, loss: 0.32036513090133667, mean loss: 0.3445992629061407
Epoch: 38, step: 422, loss: 0.35278549790382385, mean loss: 0.344599410952709
Epoch: 38, step: 423, loss: 0.4052720069885254, mean loss: 0.34460050818571025
Epoch: 38, step: 424, loss: 0.37079036235809326, mean loss: 0.34460098180732035
Epoch: 38, step: 425, loss: 0.30929869413375854, mean loss: 0.3446003434065161
Epoch: 38, step: 426, loss: 0.31821954250335693, mean loss: 0.34459986634904843
Epoch: 38, step: 427, loss: 0.31905099749565125, mean loss: 0.34459940434418673
Epoch: 38, step: 428, loss: 0.3725663423538208, mean loss: 0.3445999100662896
Epoch: 38, step: 429, loss: 0.31221726536750793, mean loss: 0.34459932450618874
Epoch: 38, step: 430, loss: 0.3342662751674652, mean loss: 0.34459913766190653
Epoch: 38, step: 431, loss: 0.3154507875442505, mean loss: 0.34459861060509117
Epoch: 38, step: 432, loss: 0.34042632579803467, mean loss: 0.3445985351637241
Epoch: 38, step: 433, loss: 0.3394417464733124, mean loss: 0.3445984419226889
Epoch: 38, step: 434, loss: 0.31397321820259094, mean loss: 0.3445978881912676
Epoch: 38, step: 435, loss: 0.32081231474876404, mean loss: 0.3445974581346132
Epoch: 38, step: 436, loss: 0.35886871814727783, mean loss: 0.3445977161624208
Epoch: 38, step: 437, loss: 0.3080786168575287, mean loss: 0.3445970559002746
Epoch: 38, step: 438, loss: 0.33646953105926514, mean loss: 0.34459690895798756
Epoch: 38, step: 439, loss: 0.3493352234363556, mean loss: 0.3445969946232045
Epoch: 38, step: 440, loss: 0.31697726249694824, mean loss: 0.3445964952879284
Epoch: 38, step: 441, loss: 0.3079030215740204, mean loss: 0.3445958319210825
Epoch: 38, step: 442, loss: 0.33885276317596436, mean loss: 0.3445957280962837
Epoch: 38, step: 443, loss: 0.3213770091533661, mean loss: 0.3445953083493941
Epoch: 38, step: 444, loss: 0.3989109694957733, mean loss: 0.3445962902475655
Epoch: 38, step: 445, loss: 0.316437304019928, mean loss: 0.3445957812091652
Epoch: 38, step: 446, loss: 0.33313971757888794, mean loss: 0.3445955741182266
Epoch: 38, step: 447, loss: 0.3109892010688782, mean loss: 0.34459496662775213
Epoch: 38, step: 448, loss: 0.34969478845596313, mean loss: 0.34459505881375435
Epoch: 38, step: 449, loss: 0.31680089235305786, mean loss: 0.34459455640663855
Epoch: 38, step: 450, loss: 0.36647436022758484, mean loss: 0.3445949518986368
Epoch: 38, step: 451, loss: 0.3245064318180084, mean loss: 0.34459458879184623
Epoch: 38, step: 452, loss: 0.31854185461997986, mean loss: 0.3445941178883818
Epoch: 38, step: 453, loss: 0.338205486536026, mean loss: 0.3445940024158851
Epoch: 38, step: 454, loss: 0.3139518201351166, mean loss: 0.34459344857811547
Epoch: 38, step: 455, loss: 0.33995217084884644, mean loss: 0.34459336469151686
Epoch: 38, step: 456, loss: 0.3086174428462982, mean loss: 0.3445927144733339
Epoch: 38, step: 457, loss: 0.30365189909935, mean loss: 0.3445919745345055
Epoch: 38, step: 458, loss: 0.2778729796409607, mean loss: 0.34459076871868993
Epoch: 38, step: 459, loss: 0.3383616805076599, mean loss: 0.3445906561420939
Epoch: 38, step: 460, loss: 0.33294111490249634, mean loss: 0.3445904456069478
Epoch: 38, step: 461, loss: 0.35064980387687683, mean loss: 0.34459055511210324
Epoch: 38, step: 462, loss: 0.3338375985622406, mean loss: 0.34459036078741634
Epoch: 38, step: 463, loss: 0.33610841631889343, mean loss: 0.3445902075066503
Epoch: 38, step: 464, loss: 0.33472585678100586, mean loss: 0.34459002924706406
Epoch: 38, step: 465, loss: 0.33601313829421997, mean loss: 0.34458987425608223
Epoch: 38, step: 466, loss: 0.3360884189605713, mean loss: 0.3445897206310566
Epoch: 38, step: 467, loss: 0.34510132670402527, mean loss: 0.34458972987583564
Epoch: 38, step: 468, loss: 0.3113963305950165, mean loss: 0.3445891300782302
Epoch: 38, step: 469, loss: 0.34813183546066284, mean loss: 0.3445891940929999
Epoch: 38, step: 470, loss: 0.3076798617839813, mean loss: 0.34458852717338384
Epoch: 38, step: 471, loss: 0.3168375790119171, mean loss: 0.34458802574688485
Epoch: 38, step: 472, loss: 0.346031129360199, mean loss: 0.344588051821573
Epoch: 38, step: 473, loss: 0.3299586772918701, mean loss: 0.3445877874957946
Epoch: 38, step: 474, loss: 0.3401978015899658, mean loss: 0.3445877081782904
Epoch: 38, step: 475, loss: 0.37973320484161377, mean loss: 0.34458834316955766
Epoch: 38, step: 476, loss: 0.3371961712837219, mean loss: 0.3445882096139038
Epoch: 38, step: 477, loss: 0.31626904010772705, mean loss: 0.3445876979757917
Epoch: 38, step: 478, loss: 0.2893698215484619, mean loss: 0.3445867003808715
Epoch: 38, step: 479, loss: 0.3547171354293823, mean loss: 0.34458688339928184
Epoch: 38, step: 480, loss: 0.3316885530948639, mean loss: 0.3445866503797471
Epoch: 38, step: 481, loss: 0.3547169864177704, mean loss: 0.3445868333897561
Epoch: 38, step: 482, loss: 0.338879257440567, mean loss: 0.344586730281167
Epoch: 38, step: 483, loss: 0.2969689965248108, mean loss: 0.34458587007208835
Epoch: 38, step: 484, loss: 0.370385080575943, mean loss: 0.34458633612354533
Epoch: 38, step: 485, loss: 0.3300875723361969, mean loss: 0.3445860742144484
Epoch: 38, step: 486, loss: 0.3141174018383026, mean loss: 0.3445855238310893
Epoch: 38, step: 487, loss: 0.31631043553352356, mean loss: 0.34458501308166195
Epoch: 38, step: 488, loss: 0.3899671733379364, mean loss: 0.34458583283130984
Epoch: 38, step: 489, loss: 0.3496300280094147, mean loss: 0.3445859239442606
Epoch: 38, step: 490, loss: 0.3672270178794861, mean loss: 0.34458633290139684
Epoch: 38, step: 491, loss: 0.35391244292259216, mean loss: 0.3445865013521956
Epoch: 38, step: 492, loss: 0.31763094663619995, mean loss: 0.3445860144822468
Epoch: 38, step: 493, loss: 0.34827762842178345, mean loss: 0.3445860811587981
Epoch: 38, step: 494, loss: 0.3201906681060791, mean loss: 0.344585640545923
Epoch: 38, step: 495, loss: 0.3113137185573578, mean loss: 0.3445850396226101
Epoch: 38, step: 496, loss: 0.35948091745376587, mean loss: 0.34458530865181114
Epoch: 38, step: 497, loss: 0.30396756529808044, mean loss: 0.3445845750823086
Epoch: 38, step: 498, loss: 0.3186150789260864, mean loss: 0.34458410607332995
Epoch: 38, step: 499, loss: 0.33715376257896423, mean loss: 0.3445839718837848
Epoch: 38, step: 500, loss: 0.3053809702396393, mean loss: 0.34458326390333144
Epoch: 38, step: 501, loss: 0.3407258987426758, mean loss: 0.34458319424310896
Epoch: 38, step: 502, loss: 0.3173168897628784, mean loss: 0.3445827018493486
Epoch: 38, step: 503, loss: 0.29957714676856995, mean loss: 0.34458188912262433
Epoch: 38, step: 504, loss: 0.29652005434036255, mean loss: 0.3445810212201597
Epoch: 38, step: 505, loss: 0.3192441165447235, mean loss: 0.3445805636936207
Epoch: 38, step: 506, loss: 0.29674094915390015, mean loss: 0.344579699835217
Epoch: 38, step: 507, loss: 0.30591219663619995, mean loss: 0.3445790016137797
Epoch: 38, step: 508, loss: 0.31649890542030334, mean loss: 0.34457849457894474
Epoch: 38, step: 509, loss: 0.3572915494441986, mean loss: 0.3445787241310531
Epoch: 38, step: 510, loss: 0.32522156834602356, mean loss: 0.34457837461665725
Epoch: 38, step: 511, loss: 0.3390046954154968, mean loss: 0.3445782739796646
Epoch: 38, step: 512, loss: 0.310683012008667, mean loss: 0.344577661986129
Epoch: 38, step: 513, loss: 0.2903413474559784, mean loss: 0.3445766827438199
Epoch: 38, step: 514, loss: 0.31105491518974304, mean loss: 0.34457607751574193
Epoch: 38, step: 515, loss: 0.3084653913974762, mean loss: 0.3445754255570845
Epoch: 38, step: 516, loss: 0.31776759028434753, mean loss: 0.3445749415650414
Epoch: 38, step: 517, loss: 0.3328973054885864, mean loss: 0.3445747307393314
Epoch: 38, step: 518, loss: 0.3094760775566101, mean loss: 0.344574097086695
Epoch: 38, step: 519, loss: 0.3312021493911743, mean loss: 0.34457385568093796
Epoch: 38, step: 520, loss: 0.33055755496025085, mean loss: 0.3445736026471481
Epoch: 38, step: 521, loss: 0.31530165672302246, mean loss: 0.34457307421544203
Epoch: 38, step: 522, loss: 0.3353997766971588, mean loss: 0.34457290861750867
Epoch: 38, step: 523, loss: 0.29965466260910034, mean loss: 0.3445720977602986
Epoch: 38, step: 524, loss: 0.34819096326828003, mean loss: 0.3445721630863182
Epoch: 38, step: 525, loss: 0.39995917677879333, mean loss: 0.34457316288800227
Epoch: 38, step: 526, loss: 0.35255366563796997, mean loss: 0.34457330694299876
Epoch: 38, step: 527, loss: 0.3571789562702179, mean loss: 0.3445735344817953
Epoch: 38, step: 528, loss: 0.35504525899887085, mean loss: 0.3445737234986816
Epoch: 38, step: 529, loss: 0.31923216581344604, mean loss: 0.3445732660863556
Epoch: 38, step: 530, loss: 0.33944910764694214, mean loss: 0.34457317359752937
Epoch: 38, step: 531, loss: 0.3594890832901001, mean loss: 0.3445734428183382
Epoch: 38, step: 532, loss: 0.3111446797847748, mean loss: 0.3445728394655174
Epoch: 38, step: 533, loss: 0.3852596879005432, mean loss: 0.34457357380563286
Epoch: 38, step: 534, loss: 0.3006405532360077, mean loss: 0.3445727808910089
Epoch: 38, step: 535, loss: 0.3673606514930725, mean loss: 0.3445731921650235
Epoch: 38, step: 536, loss: 0.3434533178806305, mean loss: 0.34457317195396964
Epoch: 38, step: 537, loss: 0.3255482316017151, mean loss: 0.3445728286054702
Epoch: 38, step: 538, loss: 0.30538544058799744, mean loss: 0.3445721213923173
Epoch: 38, step: 539, loss: 0.299733966588974, mean loss: 0.3445713122146157
Epoch: 38, step: 540, loss: 0.332788348197937, mean loss: 0.34457109957563176
Epoch: 38, step: 541, loss: 0.32625433802604675, mean loss: 0.3445707690316979
Epoch: 38, step: 542, loss: 0.3266686797142029, mean loss: 0.34457044597676123
Epoch: 38, step: 543, loss: 0.3620140254497528, mean loss: 0.3445707607519069
Epoch: 38, step: 544, loss: 0.3068278729915619, mean loss: 0.34457007968133724
Epoch: 38, step: 545, loss: 0.37410831451416016, mean loss: 0.3445706126892919
Epoch: 38, step: 546, loss: 0.3479033410549164, mean loss: 0.34457067282621906
Epoch: 38, step: 547, loss: 0.33954548835754395, mean loss: 0.3445705821516527
Epoch: 38, step: 548, loss: 0.35211464762687683, mean loss: 0.34457071827452085
Epoch: 38, step: 549, loss: 0.31814706325531006, mean loss: 0.34457024150257076
Epoch: 38, step: 550, loss: 0.3318673074245453, mean loss: 0.3445700123028869
Epoch: 38, step: 551, loss: 0.3260571360588074, mean loss: 0.3445696782801487
Epoch: 38, step: 552, loss: 0.3183031380176544, mean loss: 0.3445692043687321
Epoch: 38, step: 553, loss: 0.34475192427635193, mean loss: 0.34456920766537824
Epoch: 38, step: 554, loss: 0.36188095808029175, mean loss: 0.34456951999962715
Epoch: 38, step: 555, loss: 0.29447099566459656, mean loss: 0.3445686161509526
Epoch: 38, step: 556, loss: 0.3795923888683319, mean loss: 0.3445692480182552
Epoch: 38, step: 557, loss: 0.32365256547927856, mean loss: 0.3445688706651515
Epoch: 38, step: 558, loss: 0.37720033526420593, mean loss: 0.34456945935134875
Epoch: 38, step: 559, loss: 0.34428033232688904, mean loss: 0.3445694541354622
Epoch: 38, step: 560, loss: 0.3039919137954712, mean loss: 0.34456872212492085
Epoch: 38, step: 561, loss: 0.338718056678772, mean loss: 0.34456861658201493
Epoch: 38, step: 562, loss: 0.3477880656719208, mean loss: 0.3445686746581237
Epoch: 38, step: 563, loss: 0.32611382007598877, mean loss: 0.34456834175433226
Epoch: 38, step: 564, loss: 0.34777840971946716, mean loss: 0.34456839965912445
Epoch: 38, step: 565, loss: 0.360718309879303, mean loss: 0.34456869097393056
Epoch: 38, step: 566, loss: 0.35817742347717285, mean loss: 0.34456893644611625
Epoch: 38, step: 567, loss: 0.2985229790210724, mean loss: 0.34456810589132864
Epoch: 38, step: 568, loss: 0.357104629278183, mean loss: 0.34456833201501663
Epoch: 38, step: 569, loss: 0.3446490168571472, mean loss: 0.3445683334703184
Epoch: 38, step: 570, loss: 0.359602153301239, mean loss: 0.3445686046284417
Epoch: 38, step: 571, loss: 0.3063511848449707, mean loss: 0.34456791533077585
Epoch: 38, step: 572, loss: 0.3809080719947815, mean loss: 0.34456857075789576
Epoch: 38, step: 573, loss: 0.3107861578464508, mean loss: 0.34456796147295343
Epoch: 38, step: 574, loss: 0.36838918924331665, mean loss: 0.34456839109453385
Epoch: 38, step: 575, loss: 0.3366684317588806, mean loss: 0.344568248619434
Epoch: 38, step: 576, loss: 0.32950398325920105, mean loss: 0.3445679769415794
Epoch: 38, step: 577, loss: 0.3623608946800232, mean loss: 0.3445682978237749
Epoch: 38, step: 578, loss: 0.3005465567111969, mean loss: 0.3445675039383425
Epoch: 38, step: 579, loss: 0.32829228043556213, mean loss: 0.3445672104372334
Epoch: 38, step: 580, loss: 0.3563600182533264, mean loss: 0.34456742310035016
Epoch: 38, step: 581, loss: 0.34900638461112976, mean loss: 0.3445675031479844
Epoch: 38, step: 582, loss: 0.31933197379112244, mean loss: 0.3445670480847916
Epoch: 38, step: 583, loss: 0.31550630927085876, mean loss: 0.34456652405242694
Epoch: 38, step: 584, loss: 0.3497335910797119, mean loss: 0.34456661722492143
Epoch: 38, step: 585, loss: 0.32544031739234924, mean loss: 0.3445662723459169
Epoch: 38, step: 586, loss: 0.3360355794429779, mean loss: 0.3445661185261058
Epoch: 38, step: 587, loss: 0.3172777593135834, mean loss: 0.34456562648933675
Epoch: 38, step: 588, loss: 0.3468829393386841, mean loss: 0.3445656682720823
Epoch: 38, step: 589, loss: 0.3369872272014618, mean loss: 0.34456553163003784
Epoch: 38, step: 590, loss: 0.3047861158847809, mean loss: 0.3445648144056586
Epoch: 38, step: 591, loss: 0.3435118496417999, mean loss: 0.34456479542100615
Epoch: 38, step: 592, loss: 0.3343162536621094, mean loss: 0.34456461064607136
Epoch: 38, step: 593, loss: 0.3287180960178375, mean loss: 0.34456432494826317
Epoch: 38, step: 594, loss: 0.37472495436668396, mean loss: 0.34456486870634306
Epoch: 38, step: 595, loss: 0.3170164227485657, mean loss: 0.3445643720515879
Epoch: 38, step: 596, loss: 0.34251490235328674, mean loss: 0.3445643351035683
Epoch: 38, step: 597, loss: 0.2962336838245392, mean loss: 0.34456346381005326
Epoch: 38, step: 598, loss: 0.30572423338890076, mean loss: 0.3445627636382442
Epoch: 38, step: 599, loss: 0.2885192334651947, mean loss: 0.3445617533352053
Epoch: 38, step: 600, loss: 0.3557472229003906, mean loss: 0.3445619549732917
Epoch: 38, step: 601, loss: 0.35539931058883667, mean loss: 0.34456215033248005
Epoch: 38, step: 602, loss: 0.29207444190979004, mean loss: 0.34456120418180997
Epoch: 38, step: 603, loss: 0.28794005513191223, mean loss: 0.34456018353956736
Epoch: 38, step: 604, loss: 0.35255885124206543, mean loss: 0.3445603277194564
Epoch: 38, step: 605, loss: 0.29356324672698975, mean loss: 0.34455940848875244
Epoch: 38, step: 606, loss: 0.38594961166381836, mean loss: 0.34456015454046884
Epoch: 38, step: 607, loss: 0.3124619424343109, mean loss: 0.3445595759858166
Epoch: 38, step: 608, loss: 0.32592183351516724, mean loss: 0.3445592400556338
Epoch: 38, step: 609, loss: 0.4028426706790924, mean loss: 0.3445602905482372
Epoch: 38, step: 610, loss: 0.31087419390678406, mean loss: 0.34455968340556936
Epoch: 38, step: 611, loss: 0.3215622305870056, mean loss: 0.34455926891755806
Epoch: 38, step: 612, loss: 0.3793223202228546, mean loss: 0.34455989544817545
Epoch: 38, step: 613, loss: 0.33271488547325134, mean loss: 0.3445596819707221
Epoch: 38, step: 614, loss: 0.3548314571380615, mean loss: 0.3445598670911137
Epoch: 38, step: 615, loss: 0.32896625995635986, mean loss: 0.34455958606445686
Epoch: 38, step: 616, loss: 0.34149420261383057, mean loss: 0.3445595308213735
Epoch: 38, step: 617, loss: 0.3844877779483795, mean loss: 0.3445602503788997
Epoch: 38, step: 618, loss: 0.35693901777267456, mean loss: 0.3445604734559283
Epoch: 38, step: 619, loss: 0.34463340044021606, mean loss: 0.3445604747701174
Epoch: 38, step: 620, loss: 0.33182281255722046, mean loss: 0.3445602452337396
Epoch: 38, step: 621, loss: 0.29174938797950745, mean loss: 0.344559293583881
Epoch: 38, step: 622, loss: 0.3915773928165436, mean loss: 0.3445601408331689
Epoch: 38, step: 623, loss: 0.3375987410545349, mean loss: 0.34456001539350156
Epoch: 38, step: 624, loss: 0.3350772261619568, mean loss: 0.3445598445231981
Epoch: 38, step: 625, loss: 0.33014482259750366, mean loss: 0.34455958478371335
Epoch: 38, step: 626, loss: 0.33738231658935547, mean loss: 0.34455945546123556
Epoch: 38, step: 627, loss: 0.3656297028064728, mean loss: 0.3445598351053319
Epoch: 38, step: 628, loss: 0.37118592858314514, mean loss: 0.34456031484611993
Epoch: 38, step: 629, loss: 0.34712255001068115, mean loss: 0.3445603610108557
Epoch: 38, step: 630, loss: 0.3317062258720398, mean loss: 0.3445601294173357
Epoch: 38, step: 631, loss: 0.31601619720458984, mean loss: 0.34455961514931516
Epoch: 38, step: 632, loss: 0.32120397686958313, mean loss: 0.34455919436491234
Epoch: 38, step: 633, loss: 0.33340901136398315, mean loss: 0.34455899348243113
Epoch: 38, step: 634, loss: 0.30040013790130615, mean loss: 0.34455819792771586
Epoch: 38, step: 635, loss: 0.33232438564300537, mean loss: 0.34455797753043466
Epoch: 38, step: 636, loss: 0.36878660321235657, mean loss: 0.34455841401146803
Epoch: 38, step: 637, loss: 0.3527831733226776, mean loss: 0.34455856217863273
Epoch: 38, step: 638, loss: 0.3394315540790558, mean loss: 0.34455846981841404
Epoch: 38, step: 639, loss: 0.3043646812438965, mean loss: 0.34455774576255993
Epoch: 38, step: 640, loss: 0.30400046706199646, mean loss: 0.3445570151719109
Epoch: 38, step: 641, loss: 0.30259785056114197, mean loss: 0.34455625934158685
Epoch: 38, step: 642, loss: 0.33415156602859497, mean loss: 0.34455607192028964
Epoch: 38, step: 643, loss: 0.3783746361732483, mean loss: 0.3445566810881737
Epoch: 38, step: 644, loss: 0.31088724732398987, mean loss: 0.3445560746174753
Epoch: 38, step: 645, loss: 0.3291938006877899, mean loss: 0.3445557979094899
Epoch: 38, step: 646, loss: 0.3352901339530945, mean loss: 0.3445556310177239
Epoch: 38, step: 647, loss: 0.35585513710975647, mean loss: 0.3445558345390872
Epoch: 38, step: 648, loss: 0.33686211705207825, mean loss: 0.34455569596598
Epoch: 38, step: 649, loss: 0.32485195994377136, mean loss: 0.3445553410843831
Epoch: 38, step: 650, loss: 0.3439229130744934, mean loss: 0.3445553296940042
Epoch: 38, step: 651, loss: 0.30572113394737244, mean loss: 0.3445546302812143
Epoch: 38, step: 652, loss: 0.29726195335388184, mean loss: 0.3445537785445745
Epoch: 38, step: 653, loss: 0.35079696774482727, mean loss: 0.3445538909817967
Epoch: 38, step: 654, loss: 0.35377389192581177, mean loss: 0.34455405702716096
Epoch: 38, step: 655, loss: 0.30490925908088684, mean loss: 0.3445533430666735
Epoch: 38, step: 656, loss: 0.3426744043827057, mean loss: 0.3445533092296031
Epoch: 38, step: 657, loss: 0.3351195156574249, mean loss: 0.34455313934317106
Epoch: 38, step: 658, loss: 0.3076159954071045, mean loss: 0.3445524741805783
Epoch: 38, step: 659, loss: 0.3162998855113983, mean loss: 0.34455196541826705
Epoch: 38, step: 660, loss: 0.3138684630393982, mean loss: 0.34455141289089813
Epoch: 38, step: 661, loss: 0.32298386096954346, mean loss: 0.3445510245242773
Epoch: 38, step: 662, loss: 0.29932668805122375, mean loss: 0.3445502101849153
Epoch: 38, step: 663, loss: 0.3271756172180176, mean loss: 0.34454989733211766
Epoch: 38, step: 664, loss: 0.3510860502719879, mean loss: 0.3445500150221791
Epoch: 38, step: 665, loss: 0.37087467312812805, mean loss: 0.344550489015807
Epoch: 38, step: 666, loss: 0.36966031789779663, mean loss: 0.34455094112745616
Epoch: 38, step: 667, loss: 0.3278995156288147, mean loss: 0.3445506413178505
Epoch: 38, step: 668, loss: 0.38621506094932556, mean loss: 0.34455139147394476
Epoch: 38, step: 669, loss: 0.3137059509754181, mean loss: 0.3445508361205095
Epoch: 38, step: 670, loss: 0.31622549891471863, mean loss: 0.3445503261491863
Epoch: 38, step: 671, loss: 0.31979089975357056, mean loss: 0.3445498803867926
Epoch: 38, step: 672, loss: 0.3356160819530487, mean loss: 0.34454971954786134
Epoch: 38, step: 673, loss: 0.3547927737236023, mean loss: 0.3445499039545545
Epoch: 38, step: 674, loss: 0.2884731590747833, mean loss: 0.34454889441767794
Epoch: 38, step: 675, loss: 0.33038780093193054, mean loss: 0.34454863948332415
Epoch: 38, step: 676, loss: 0.3361210227012634, mean loss: 0.3445484877683197
Epoch: 38, step: 677, loss: 0.38159796595573425, mean loss: 0.3445491547256228
Epoch: 38, step: 678, loss: 0.3164743483066559, mean loss: 0.34454864933766544
Epoch: 38, step: 679, loss: 0.3202418088912964, mean loss: 0.3445482117865341
Epoch: 38, step: 680, loss: 0.3800954222679138, mean loss: 0.3445488516657572
Epoch: 38, step: 681, loss: 0.3901834189891815, mean loss: 0.3445496731109695
Epoch: 38, step: 682, loss: 0.3142446279525757, mean loss: 0.3445491276147017
Epoch: 38, step: 683, loss: 0.3253605365753174, mean loss: 0.3445487822228261
Epoch: 38, step: 684, loss: 0.36202970147132874, mean loss: 0.34454909687119173
Epoch: 38, step: 685, loss: 0.3210592269897461, mean loss: 0.344548674072137
Epoch: 38, step: 686, loss: 0.32459455728530884, mean loss: 0.34454831492030225
Epoch: 38, step: 687, loss: 0.32667112350463867, mean loss: 0.34454799315659784
Epoch: 38, step: 688, loss: 0.32279568910598755, mean loss: 0.34454760165349224
Epoch: 38, step: 689, loss: 0.30325573682785034, mean loss: 0.3445468584861328
Epoch: 38, step: 690, loss: 0.3732120990753174, mean loss: 0.3445473743913321
Epoch: 38, step: 691, loss: 0.33235225081443787, mean loss: 0.3445471549124685
Epoch: 38, step: 692, loss: 0.3633764982223511, mean loss: 0.3445474937830401
Epoch: 38, step: 693, loss: 0.32088419795036316, mean loss: 0.34454706792377665
Epoch: 38, step: 694, loss: 0.3665183186531067, mean loss: 0.34454746332483716
Epoch: 38, step: 695, loss: 0.3650512099266052, mean loss: 0.3445478323096234
Epoch: 38, step: 696, loss: 0.3340078294277191, mean loss: 0.34454764263547266
Epoch: 38, step: 697, loss: 0.3024461269378662, mean loss: 0.344546885005174
Epoch: 38, step: 698, loss: 0.31187504529953003, mean loss: 0.34454629707550377
Epoch: 38, step: 699, loss: 0.3457496464252472, mean loss: 0.3445463187293825
Epoch: 38, step: 700, loss: 0.3707222640514374, mean loss: 0.34454678974849834
Epoch: 38, step: 701, loss: 0.34607434272766113, mean loss: 0.3445468172353263
Epoch: 38, step: 702, loss: 0.2932736873626709, mean loss: 0.34454589464189633
Epoch: 38, step: 703, loss: 0.311958909034729, mean loss: 0.3445453082919322
Epoch: 38, step: 704, loss: 0.33494487404823303, mean loss: 0.3445451355507939
Epoch: 38, step: 705, loss: 0.3273630142211914, mean loss: 0.3445448263975079
Epoch: 38, step: 706, loss: 0.307301789522171, mean loss: 0.3445441563056229
Epoch: 38, step: 707, loss: 0.3773089051246643, mean loss: 0.34454474581171896
Epoch: 38, step: 708, loss: 0.36559122800827026, mean loss: 0.3445451244749707
Epoch: 38, step: 709, loss: 0.36841437220573425, mean loss: 0.34454555391701547
Epoch: 38, step: 710, loss: 0.3261549770832062, mean loss: 0.34454522305008073
Epoch: 38, step: 711, loss: 0.35532525181770325, mean loss: 0.34454541699130065
Epoch: 38, step: 712, loss: 0.40539348125457764, mean loss: 0.34454651167627437
Epoch: 38, step: 713, loss: 0.3327968716621399, mean loss: 0.34454630029858907
Epoch: 38, step: 714, loss: 0.3237502872943878, mean loss: 0.34454592618210494
Epoch: 38, step: 715, loss: 0.3877503275871277, mean loss: 0.34454670340743065
Epoch: 38, step: 716, loss: 0.29592692852020264, mean loss: 0.3445458287780096
Epoch: 38, step: 717, loss: 0.3951282203197479, mean loss: 0.34454673869690766
Epoch: 38, step: 718, loss: 0.3382449448108673, mean loss: 0.34454662533694136
Epoch: 38, step: 719, loss: 0.2942359745502472, mean loss: 0.3445457203389059
Epoch: 38, step: 720, loss: 0.3316550552845001, mean loss: 0.34454548846321914
Epoch: 38, step: 721, loss: 0.36654573678970337, mean loss: 0.3445458841938434
Epoch: 38, step: 722, loss: 0.3335912525653839, mean loss: 0.344545687150375
Epoch: 38, step: 723, loss: 0.31271785497665405, mean loss: 0.34454511466616433
Epoch: 38, step: 724, loss: 0.311541885137558, mean loss: 0.3445445210508698
Epoch: 38, step: 725, loss: 0.3116197884082794, mean loss: 0.3445439288581175
Epoch: 38, step: 726, loss: 0.3308461904525757, mean loss: 0.3445436824914849
Epoch: 38, step: 727, loss: 0.37229791283607483, mean loss: 0.3445441816682897
Epoch: 38, step: 728, loss: 0.37183883786201477, mean loss: 0.34454467257054316
Epoch: 38, step: 729, loss: 0.27930599451065063, mean loss: 0.3445434992552297
Epoch: 38, step: 730, loss: 0.30687078833580017, mean loss: 0.3445428217250439
Epoch: 38, step: 731, loss: 0.32709887623786926, mean loss: 0.3445425080075868
Epoch: 38, step: 732, loss: 0.3352067470550537, mean loss: 0.3445423401133155
Epoch: 38, step: 733, loss: 0.31233981251716614, mean loss: 0.34454176099365946
Epoch: 38, step: 734, loss: 0.33490070700645447, mean loss: 0.3445415876152361
Epoch: 38, step: 735, loss: 0.31683549284935, mean loss: 0.3445410893758683
Epoch: 38, step: 736, loss: 0.3197081387042999, mean loss: 0.3445406428123503
Epoch: 38, step: 737, loss: 0.29816484451293945, mean loss: 0.3445398088652491
Epoch: 38, step: 738, loss: 0.3889062702655792, mean loss: 0.3445406066653498
Epoch: 38, step: 739, loss: 0.35403895378112793, mean loss: 0.3445407774620684
Epoch: 38, step: 740, loss: 0.3792111873626709, mean loss: 0.3445414008848275
Epoch: 38, step: 741, loss: 0.3252805471420288, mean loss: 0.34454105455380035
Epoch: 38, step: 742, loss: 0.35504937171936035, mean loss: 0.34454124350133547
Epoch: 38, step: 743, loss: 0.33094263076782227, mean loss: 0.34454099899233204
Epoch: 38, step: 744, loss: 0.3240405321121216, mean loss: 0.3445406303916006
Epoch: 38, step: 745, loss: 0.339738130569458, mean loss: 0.3445405440436589
Epoch: 38, step: 746, loss: 0.2964523434638977, mean loss: 0.34453967944342195
Epoch: 38, step: 747, loss: 0.31158363819122314, mean loss: 0.34453908692200425
Epoch: 38, step: 748, loss: 0.34580153226852417, mean loss: 0.3445391096192831
Epoch: 38, step: 749, loss: 0.3209669888019562, mean loss: 0.34453868582796277
Epoch: 38, step: 750, loss: 0.32629767060279846, mean loss: 0.34453835788780807
Epoch: 38, step: 751, loss: 0.2921639382839203, mean loss: 0.34453741630828116
Epoch: 38, step: 752, loss: 0.3093849718570709, mean loss: 0.34453678435422364
Epoch: 38, step: 753, loss: 0.3137037754058838, mean loss: 0.34453623006290396
Epoch: 38, step: 754, loss: 0.370868057012558, mean loss: 0.3445367034270428
Epoch: 38, step: 755, loss: 0.3287368714809418, mean loss: 0.34453641940043844
Epoch: 38, step: 756, loss: 0.34339144825935364, mean loss: 0.34453639881816767
Epoch: 38, step: 757, loss: 0.34492191672325134, mean loss: 0.3445364057482037
Epoch: 38, step: 758, loss: 0.3083271384239197, mean loss: 0.34453575486529087
Epoch: 38, step: 759, loss: 0.3061693608760834, mean loss: 0.34453506521915217
Epoch: 38, step: 760, loss: 0.3348107635974884, mean loss: 0.3445348904253855
Epoch: 38, step: 761, loss: 0.32903560996055603, mean loss: 0.3445346118317114
Epoch: 38, step: 762, loss: 0.35025808215141296, mean loss: 0.3445347147070654
Epoch: 38, step: 763, loss: 0.3230769634246826, mean loss: 0.3445343290260085
Epoch: 38, step: 764, loss: 0.34718066453933716, mean loss: 0.34453437659031844
Epoch: 38, step: 765, loss: 0.29924264550209045, mean loss: 0.34453356254719886
Epoch: 38, step: 766, loss: 0.34630751609802246, mean loss: 0.3445335944304741
Epoch: 38, step: 767, loss: 0.3265194296836853, mean loss: 0.3445332706676282
Epoch: 38, step: 768, loss: 0.3222074508666992, mean loss: 0.3445328694199906
Epoch: 38, step: 769, loss: 0.34851640462875366, mean loss: 0.34453294101222687
Epoch: 38, step: 770, loss: 0.3154721260070801, mean loss: 0.3445324187396139
Epoch: 38, step: 771, loss: 0.34194475412368774, mean loss: 0.34453237223568506
Epoch: 38, step: 772, loss: 0.3225260078907013, mean loss: 0.3445319767578462
Epoch: 38, step: 773, loss: 0.32496377825737, mean loss: 0.34453162510276764
Epoch: 38, step: 774, loss: 0.3090550899505615, mean loss: 0.3445309875745064
Epoch: 38, step: 775, loss: 0.349609911441803, mean loss: 0.3445310788432648
Epoch: 38, step: 776, loss: 0.3215165138244629, mean loss: 0.3445306652767134
Epoch: 38, step: 777, loss: 0.3254607319831848, mean loss: 0.34453032260046373
Epoch: 38, step: 778, loss: 0.31234267354011536, mean loss: 0.3445297442164444
Epoch: 38, step: 779, loss: 0.33788496255874634, mean loss: 0.34452962481765087
Epoch: 38, step: 780, loss: 0.32118722796440125, mean loss: 0.3445292053901833
Epoch: 38, step: 781, loss: 0.3077887296676636, mean loss: 0.3445285452314216
Epoch: 38, step: 782, loss: 0.34929218888282776, mean loss: 0.344528630823797
Epoch: 38, step: 783, loss: 0.3248719871044159, mean loss: 0.34452827764276134
Epoch: 38, step: 784, loss: 0.34304919838905334, mean loss: 0.34452825106786056
Epoch: 38, step: 785, loss: 0.3165215253829956, mean loss: 0.34452774787468643
Epoch: 38, step: 786, loss: 0.35668712854385376, mean loss: 0.3445279663367621
Epoch: 38, step: 787, loss: 0.36323562264442444, mean loss: 0.34452830244269644
Epoch: 38, step: 788, loss: 0.3347255289554596, mean loss: 0.34452812632704116
Epoch: 38, step: 789, loss: 0.32108843326568604, mean loss: 0.3445277052194083
Epoch: 38, step: 790, loss: 0.3734601140022278, mean loss: 0.3445282249975155
Epoch: 38, step: 791, loss: 0.3254704773426056, mean loss: 0.3445278826263662
Epoch: 38, step: 792, loss: 0.3574122190475464, mean loss: 0.3445281140884415
Epoch: 38, step: 793, loss: 0.3085038661956787, mean loss: 0.34452746693851344
Epoch: 38, step: 794, loss: 0.30852416157722473, mean loss: 0.34452682017642167
Epoch: 38, step: 795, loss: 0.3528832793235779, mean loss: 0.34452697028885876
Epoch: 38, step: 796, loss: 0.31426331400871277, mean loss: 0.3445264266531498
Epoch: 38, step: 797, loss: 0.3819607198238373, mean loss: 0.34452709908521684
Epoch: 38, step: 798, loss: 0.2960106432437897, mean loss: 0.34452622759995805
Epoch: 38, step: 799, loss: 0.37937667965888977, mean loss: 0.3445268535960074
Epoch: 38, step: 800, loss: 0.29191580414772034, mean loss: 0.3445259085948498
Epoch: 38, step: 801, loss: 0.3418499231338501, mean loss: 0.3445258605295866
Epoch: 38, step: 802, loss: 0.3168989419937134, mean loss: 0.34452536431192093
Epoch: 38, step: 803, loss: 0.3472919762134552, mean loss: 0.34452541400320447
Epoch: 38, step: 804, loss: 0.32132425904273987, mean loss: 0.34452499729334296
Epoch: 38, step: 805, loss: 0.29541435837745667, mean loss: 0.3445241152458751
Epoch: 38, step: 806, loss: 0.32173627614974976, mean loss: 0.3445237059741731
Epoch: 38, step: 807, loss: 0.326715350151062, mean loss: 0.3445233861401964
Epoch: 38, step: 808, loss: 0.3132043182849884, mean loss: 0.3445228236670394
Epoch: 38, step: 809, loss: 0.29465144872665405, mean loss: 0.34452192802078135
Epoch: 38, step: 810, loss: 0.35799920558929443, mean loss: 0.34452217005654756
Epoch: 38, step: 811, loss: 0.31227147579193115, mean loss: 0.3445215908830998
Epoch: 38, step: 812, loss: 0.304792195558548, mean loss: 0.34452087741636145
Epoch: 38, step: 813, loss: 0.2979658246040344, mean loss: 0.3445200413884045
Epoch: 38, step: 814, loss: 0.3433229327201843, mean loss: 0.3445200198913106
Epoch: 38, step: 815, loss: 0.3196217715740204, mean loss: 0.3445195727887334
Epoch: 38, step: 816, loss: 0.33685439825057983, mean loss: 0.3445194351462091
Epoch: 38, step: 817, loss: 0.3405066728591919, mean loss: 0.34451936309086184
Epoch: 38, step: 818, loss: 0.36672157049179077, mean loss: 0.344519761758643
Epoch: 38, step: 819, loss: 0.32624658942222595, mean loss: 0.34451943364738224
Epoch: 38, step: 820, loss: 0.3358566164970398, mean loss: 0.3445192781014941
Epoch: 38, step: 821, loss: 0.3408352732658386, mean loss: 0.34451921195424595
Epoch: 38, step: 822, loss: 0.3393409848213196, mean loss: 0.3445191189795241
Epoch: 38, step: 823, loss: 0.34776338934898376, mean loss: 0.3445191772291357
Epoch: 38, step: 824, loss: 0.36478808522224426, mean loss: 0.344519541142955
Epoch: 38, step: 825, loss: 0.3108133375644684, mean loss: 0.34451893598292094
Epoch: 38, step: 826, loss: 0.3260014057159424, mean loss: 0.34451860352578045
Epoch: 38, step: 827, loss: 0.33242836594581604, mean loss: 0.3445183864658598
Epoch: 38, step: 828, loss: 0.32768669724464417, mean loss: 0.3445180842865592
Epoch: 38, step: 829, loss: 0.31020838022232056, mean loss: 0.344517468335533
Epoch: 38, step: 830, loss: 0.3464040458202362, mean loss: 0.3445175022040407
Epoch: 38, step: 831, loss: 0.3206568658351898, mean loss: 0.344517073857129
Epoch: 38, step: 832, loss: 0.31214386224746704, mean loss: 0.34451649270262563
Epoch: 38, step: 833, loss: 0.38132891058921814, mean loss: 0.34451715353660917
Epoch: 38, step: 834, loss: 0.378484308719635, mean loss: 0.3445177632832332
Epoch: 38, step: 835, loss: 0.3559528589248657, mean loss: 0.3445179685516981
Epoch: 38, step: 836, loss: 0.31181129813194275, mean loss: 0.3445173814531966
Epoch: 38, step: 837, loss: 0.35178500413894653, mean loss: 0.3445175119077413
Epoch: 38, step: 838, loss: 0.2902941107749939, mean loss: 0.3445165386098086
Epoch: 38, step: 839, loss: 0.3300611674785614, mean loss: 0.3445162791437845
Epoch: 38, step: 840, loss: 0.28110796213150024, mean loss: 0.34451514101952246
Epoch: 38, step: 841, loss: 0.3382951617240906, mean loss: 0.3445150293782959
Epoch: 38, step: 842, loss: 0.3486497700214386, mean loss: 0.3445151035906381
Epoch: 38, step: 843, loss: 0.3779621422290802, mean loss: 0.3445157039036297
Epoch: 38, step: 844, loss: 0.3282153010368347, mean loss: 0.34451541134654895
Epoch: 38, step: 845, loss: 0.3687259256839752, mean loss: 0.3445158458652743
Epoch: 38, step: 846, loss: 0.3518621623516083, mean loss: 0.34451597771108067
Epoch: 38, step: 847, loss: 0.2901059091091156, mean loss: 0.3445150012202587
Epoch: 38, step: 848, loss: 0.30942976474761963, mean loss: 0.3445143715611271
Epoch: 38, step: 849, loss: 0.3310602009296417, mean loss: 0.3445141301094449
Epoch: 38, step: 850, loss: 0.30165398120880127, mean loss: 0.34451336094502627
Epoch: 38, step: 851, loss: 0.3336494266986847, mean loss: 0.34451316598532766
Epoch: 38, step: 852, loss: 0.3101765811443329, mean loss: 0.34451254980614704
Epoch: 38, step: 853, loss: 0.3411085605621338, mean loss: 0.3445124887217476
Epoch: 38, step: 854, loss: 0.3320164680480957, mean loss: 0.3445122644853689
Epoch: 38, step: 855, loss: 0.38464295864105225, mean loss: 0.34451298460261975
Epoch: 38, step: 856, loss: 0.31725865602493286, mean loss: 0.34451249555152286
Epoch: 38, step: 857, loss: 0.3216577172279358, mean loss: 0.3445120854532217
Epoch: 38, step: 858, loss: 0.350075364112854, mean loss: 0.3445121852769941
Epoch: 38, step: 859, loss: 0.33656367659568787, mean loss: 0.3445120426567996
Epoch: 38, step: 860, loss: 0.30478978157043457, mean loss: 0.3445113299325413
Epoch: 38, step: 861, loss: 0.35150375962257385, mean loss: 0.34451145539329575
Epoch: 38, step: 862, loss: 0.3768870532512665, mean loss: 0.34451203627780025
Epoch: 38, step: 863, loss: 0.31453657150268555, mean loss: 0.34451149846624624
Epoch: 38, step: 864, loss: 0.30059075355529785, mean loss: 0.3445107104664452
Epoch: 38, step: 865, loss: 0.3137821555137634, mean loss: 0.3445101591629368
Epoch: 38, step: 866, loss: 0.35132449865341187, mean loss: 0.3445102814173635
Epoch: 38, step: 867, loss: 0.31861412525177, mean loss: 0.34450981682898596
Epoch: 38, step: 868, loss: 0.30567508935928345, mean loss: 0.3445091201294745
Epoch: 38, step: 869, loss: 0.33941882848739624, mean loss: 0.3445090288106908
Epoch: 38, step: 870, loss: 0.29822102189064026, mean loss: 0.3445081984282765
Epoch: 38, step: 871, loss: 0.33398160338401794, mean loss: 0.3445080095901048
Epoch: 38, step: 872, loss: 0.33549168705940247, mean loss: 0.3445078478478404
Epoch: 38, step: 873, loss: 0.3416418135166168, mean loss: 0.34450779643546403
Epoch: 38, step: 874, loss: 0.2854361832141876, mean loss: 0.344506736797937
Epoch: 38, step: 875, loss: 0.31355684995651245, mean loss: 0.3445061816230995
Epoch: 38, step: 876, loss: 0.35501834750175476, mean loss: 0.344506370185511
Epoch: 38, step: 877, loss: 0.3052273392677307, mean loss: 0.3445056656289026
Epoch: 38, step: 878, loss: 0.30234295129776, mean loss: 0.3445049093605966
Epoch: 38, step: 879, loss: 0.30492785573005676, mean loss: 0.3445041994837557
Epoch: 38, step: 880, loss: 0.35390299558639526, mean loss: 0.3445043680629551
Epoch: 38, step: 881, loss: 0.350765585899353, mean loss: 0.34450448036373776
Epoch: 38, step: 882, loss: 0.30857789516448975, mean loss: 0.34450383599847545
Epoch: 38, step: 883, loss: 0.2964586019515991, mean loss: 0.3445029742932949
Epoch: 38, step: 884, loss: 0.3690963685512543, mean loss: 0.34450341537502915
Epoch: 38, step: 885, loss: 0.33340248465538025, mean loss: 0.3445032162837648
Epoch: 38, step: 886, loss: 0.32018837332725525, mean loss: 0.34450278021348096
Epoch: 38, step: 887, loss: 0.31282007694244385, mean loss: 0.34450221201578957
Epoch: 38, step: 888, loss: 0.35021311044692993, mean loss: 0.34450231443322166
Epoch: 38, step: 889, loss: 0.36267924308776855, mean loss: 0.34450264040662026
Epoch: 38, step: 890, loss: 0.3178257942199707, mean loss: 0.34450216200972295
Epoch: 38, step: 891, loss: 0.2939758598804474, mean loss: 0.3445012559358737
Epoch: 38, step: 892, loss: 0.33584415912628174, mean loss: 0.3445011006933953
Epoch: 38, step: 893, loss: 0.32835984230041504, mean loss: 0.3445008112471665
Epoch: 38, step: 894, loss: 0.33702534437179565, mean loss: 0.3445006771989503
Epoch: 38, step: 895, loss: 0.3415931165218353, mean loss: 0.3445006250622289
Epoch: 38, step: 896, loss: 0.3137386739253998, mean loss: 0.3445000734663398
Epoch: 38, step: 897, loss: 0.3456518054008484, mean loss: 0.3445000941178
Epoch: 38, step: 898, loss: 0.3552074432373047, mean loss: 0.34450028610555566
Epoch: 38, step: 899, loss: 0.3196781873703003, mean loss: 0.344499841041747
Epoch: 38, step: 900, loss: 0.34721261262893677, mean loss: 0.34449988968126055
Epoch: 38, step: 901, loss: 0.30891159176826477, mean loss: 0.3444992516008304
Epoch: 38, step: 902, loss: 0.32059216499328613, mean loss: 0.34449882296637757
Epoch: 38, step: 903, loss: 0.31208816170692444, mean loss: 0.34449824188022476
Epoch: 38, step: 904, loss: 0.37323418259620667, mean loss: 0.3444987570735969
Epoch: 38, step: 905, loss: 0.32851549983024597, mean loss: 0.34449847052231786
Epoch: 38, step: 906, loss: 0.31023192405700684, mean loss: 0.3444978561953047
Epoch: 38, step: 907, loss: 0.31011641025543213, mean loss: 0.3444972398194363
Epoch: 38, step: 908, loss: 0.3404610753059387, mean loss: 0.34449716746210113
Epoch: 38, step: 909, loss: 0.31832924485206604, mean loss: 0.3444966983515886
Epoch: 38, step: 910, loss: 0.31740787625312805, mean loss: 0.34449621274088105
Epoch: 38, step: 911, loss: 0.32246679067611694, mean loss: 0.34449581783513633
Epoch: 38, step: 912, loss: 0.3778438866138458, mean loss: 0.3444964156314755
Epoch: 38, step: 913, loss: 0.363875150680542, mean loss: 0.3444967630077894
Epoch: 38, step: 914, loss: 0.3012111485004425, mean loss: 0.3444959870991636
Epoch: 38, step: 915, loss: 0.28121933341026306, mean loss: 0.34449485286503284
Epoch: 38, step: 916, loss: 0.3498985171318054, mean loss: 0.3444949497239883
Epoch: 38, step: 917, loss: 0.33050376176834106, mean loss: 0.34449469894090967
Epoch: 38, step: 918, loss: 0.3446834981441498, mean loss: 0.34449470232495377
Epoch: 38, step: 919, loss: 0.3109666705131531, mean loss: 0.34449410137801134
Epoch: 38, step: 920, loss: 0.30722567439079285, mean loss: 0.3444934334012582
Epoch: 38, step: 921, loss: 0.32074499130249023, mean loss: 0.34449300775616915
Epoch: 38, step: 922, loss: 0.34806016087532043, mean loss: 0.34449307168937315
Epoch: 38, step: 923, loss: 0.32656943798065186, mean loss: 0.3444927504542719
Epoch: 38, step: 924, loss: 0.3402847349643707, mean loss: 0.34449267503775327
Epoch: 38, step: 925, loss: 0.33710771799087524, mean loss: 0.344492542686109
Epoch: 38, step: 926, loss: 0.31657660007476807, mean loss: 0.3444920423914333
Epoch: 38, step: 927, loss: 0.3586133122444153, mean loss: 0.34449229546078547
Epoch: 38, step: 928, loss: 0.38969120383262634, mean loss: 0.34449310546254835
Epoch: 38, step: 929, loss: 0.3658912479877472, mean loss: 0.3444934889280608
Epoch: 38, step: 930, loss: 0.36386480927467346, mean loss: 0.34449383606567613
Epoch: 38, step: 931, loss: 0.3112161457538605, mean loss: 0.34449323973404555
Epoch: 38, step: 932, loss: 0.3168478310108185, mean loss: 0.3444927443410033
Epoch: 38, step: 933, loss: 0.3082073926925659, mean loss: 0.3444920941357987
Epoch: 38, step: 934, loss: 0.29382097721099854, mean loss: 0.3444911861651691
Epoch: 38, step: 935, loss: 0.3180195689201355, mean loss: 0.3444907118314312
Epoch: 38, step: 936, loss: 0.33349230885505676, mean loss: 0.34449051475922104
Epoch: 38, step: 937, loss: 0.3383621573448181, mean loss: 0.344490404951706
Epoch: 38, step: 938, loss: 0.3233821988105774, mean loss: 0.3444900267429991
Epoch: 38, step: 939, loss: 0.29363906383514404, mean loss: 0.3444891156313581
Epoch: 38, step: 940, loss: 0.3076463043689728, mean loss: 0.34448845551971274
Epoch: 38, step: 941, loss: 0.34801819920539856, mean loss: 0.3444885187609011
Epoch: 38, step: 942, loss: 0.3190988600254059, mean loss: 0.3444880638713779
Epoch: 38, step: 943, loss: 0.3868902325630188, mean loss: 0.3444888235490455
Epoch: 38, step: 944, loss: 0.3318406045436859, mean loss: 0.3444885969474903
Epoch: 38, step: 945, loss: 0.31861987709999084, mean loss: 0.34448813349985963
Epoch: 38, step: 946, loss: 0.3114953637123108, mean loss: 0.34448754243284324
Epoch: 38, step: 947, loss: 0.3328571021556854, mean loss: 0.3444873340766935
Epoch: 38, step: 948, loss: 0.35029077529907227, mean loss: 0.3444874380418898
Epoch: 38, step: 949, loss: 0.35247769951820374, mean loss: 0.3444875811801055
Epoch: 38, step: 950, loss: 0.3583846986293793, mean loss: 0.34448783012977585
Epoch: 38, step: 951, loss: 0.3066355586051941, mean loss: 0.34448715206529595
Epoch: 38, step: 952, loss: 0.30612972378730774, mean loss: 0.34448646496402807
Epoch: 38, step: 953, loss: 0.38335245847702026, mean loss: 0.3444871611628156
Epoch: 38, step: 954, loss: 0.35815954208374023, mean loss: 0.34448740606906025
Epoch: 38, step: 955, loss: 0.3419796824455261, mean loss: 0.34448736115031653
Epoch: 38, step: 956, loss: 0.36051177978515625, mean loss: 0.3444876481771061
Epoch: 38, step: 957, loss: 0.3467564880847931, mean loss: 0.3444876888154709
Epoch: 38, step: 958, loss: 0.32183822989463806, mean loss: 0.34448728313656635
Epoch: 38, step: 959, loss: 0.3508995473384857, mean loss: 0.34448739798583206
Epoch: 38, step: 960, loss: 0.31969770789146423, mean loss: 0.34448695398873186
Epoch: 38, step: 961, loss: 0.30940455198287964, mean loss: 0.3444863256547059
Epoch: 38, step: 962, loss: 0.32768166065216064, mean loss: 0.34448602468461537
Epoch: 38, step: 963, loss: 0.35950055718421936, mean loss: 0.3444862935887722
Epoch: 38, step: 964, loss: 0.31530165672302246, mean loss: 0.34448577091318316
Epoch: 38, step: 965, loss: 0.3274141848087311, mean loss: 0.34448546517898593
Epoch: 38, step: 966, loss: 0.31621092557907104, mean loss: 0.34448495882071306
Epoch: 38, step: 967, loss: 0.31685352325439453, mean loss: 0.34448446398841426
Epoch: 38, step: 968, loss: 0.3201928436756134, mean loss: 0.3444840289743509
Epoch: 38, step: 969, loss: 0.3242875635623932, mean loss: 0.3444836673027522
Epoch: 38, step: 970, loss: 0.3460049033164978, mean loss: 0.344483694544054
Epoch: 38, step: 971, loss: 0.32699230313301086, mean loss: 0.34448338132524065
Epoch: 38, step: 972, loss: 0.3624601364135742, mean loss: 0.34448370322970995
Epoch: 38, step: 973, loss: 0.3474534749984741, mean loss: 0.3444837564075878
Epoch: 38, step: 974, loss: 0.32731330394744873, mean loss: 0.3444834489523537
Epoch: 38, step: 975, loss: 0.3048139810562134, mean loss: 0.3444827386410105
Epoch: 38, step: 976, loss: 0.35435768961906433, mean loss: 0.3444829154561903
Epoch: 38, step: 977, loss: 0.30707621574401855, mean loss: 0.3444822456853808
Epoch: 38, step: 978, loss: 0.316608190536499, mean loss: 0.3444817466064896
Epoch: 38, step: 979, loss: 0.3167159855365753, mean loss: 0.3444812494754814
Epoch: 38, step: 980, loss: 0.35779398679733276, mean loss: 0.34448148782861054
Epoch: 38, step: 981, loss: 0.3315944969654083, mean loss: 0.3444812571022371
Epoch: 38, step: 982, loss: 0.316733717918396, mean loss: 0.3444807603241656
Epoch: 38, step: 983, loss: 0.3164184093475342, mean loss: 0.3444802579188559
Epoch: 38, step: 984, loss: 0.3252783417701721, mean loss: 0.3444799141496569
Epoch: 38, step: 985, loss: 0.34844550490379333, mean loss: 0.34447998514379835
Epoch: 38, step: 986, loss: 0.3233812153339386, mean loss: 0.3444796074290199
Epoch: 38, step: 987, loss: 0.28399476408958435, mean loss: 0.344478524635548
Epoch: 38, step: 988, loss: 0.37335047125816345, mean loss: 0.34447904148892733
Epoch: 38, step: 989, loss: 0.3417178690433502, mean loss: 0.34447899206047067
Epoch: 38, step: 990, loss: 0.3322480320930481, mean loss: 0.3444787731148364
Epoch: 38, step: 991, loss: 0.3648073673248291, mean loss: 0.3444791370091907
Epoch: 38, step: 992, loss: 0.3735024631023407, mean loss: 0.34447965653529994
Epoch: 38, step: 993, loss: 0.2932896316051483, mean loss: 0.3444787402351365
Epoch: 38, step: 994, loss: 0.3148080110549927, mean loss: 0.34447820913933436
Epoch: 38, step: 995, loss: 0.3145067095756531, mean loss: 0.34447767266944884
Epoch: 38, step: 996, loss: 0.3553997576236725, mean loss: 0.3444778681639978
Epoch: 38, step: 997, loss: 0.3132968544960022, mean loss: 0.34447731006459437
Epoch: 38, step: 998, loss: 0.3067072927951813, mean loss: 0.34447663404273565
Epoch: 38, step: 999, loss: 0.3326341211795807, mean loss: 0.34447642208481644
Epoch: 38, step: 1000, loss: 0.31832775473594666, mean loss: 0.3444759540829667
Epoch: 38, step: 1001, loss: 0.31584012508392334, mean loss: 0.3444754415757362
Epoch: 38, step: 1002, loss: 0.3075568974018097, mean loss: 0.34447478084116484
Epoch: 38, step: 1003, loss: 0.3759225904941559, mean loss: 0.3444753436554259
Epoch: 38, step: 1004, loss: 0.357952743768692, mean loss: 0.34447558485305846
Epoch: 38, step: 1005, loss: 0.33417123556137085, mean loss: 0.34447540044507513
Epoch: 38, step: 1006, loss: 0.354289174079895, mean loss: 0.34447557607050927
Epoch: 38, step: 1007, loss: 0.3374011218547821, mean loss: 0.3444754494696822
Epoch: 38, step: 1008, loss: 0.33323636651039124, mean loss: 0.344475248344381
Epoch: 38, step: 1009, loss: 0.33498871326446533, mean loss: 0.34447507858426
Epoch: 38, step: 1010, loss: 0.3601393401622772, mean loss: 0.34447535888885317
Epoch: 38, step: 1011, loss: 0.3131919503211975, mean loss: 0.34447479909698847
Epoch: 38, step: 1012, loss: 0.2870093584060669, mean loss: 0.3444737708167578
Epoch: 38, step: 1013, loss: 0.32836636900901794, mean loss: 0.3444734825978513
Epoch: 38, step: 1014, loss: 0.3520393967628479, mean loss: 0.34447361797663645
Epoch: 38, step: 1015, loss: 0.3281652331352234, mean loss: 0.34447332617186904
Epoch: 38, step: 1016, loss: 0.33000311255455017, mean loss: 0.34447306726200094
Epoch: 38, step: 1017, loss: 0.35951340198516846, mean loss: 0.3444733363680078
Epoch: 38, step: 1018, loss: 0.3523699641227722, mean loss: 0.34447347765422126
Epoch: 38, step: 1019, loss: 0.3560456931591034, mean loss: 0.3444736847002297
Epoch: 38, step: 1020, loss: 0.3132922351360321, mean loss: 0.34447312682268577
Epoch: 38, step: 1021, loss: 0.3377750813961029, mean loss: 0.3444730069879016
Epoch: 38, step: 1022, loss: 0.3407289981842041, mean loss: 0.3444729400050086
Epoch: 38, step: 1023, loss: 0.34814390540122986, mean loss: 0.34447300567992983
Epoch: 38, step: 1024, loss: 0.3106842637062073, mean loss: 0.34447240119772193
Epoch: 38, step: 1025, loss: 0.309152752161026, mean loss: 0.34447176933881757
Epoch: 38, step: 1026, loss: 0.3534770607948303, mean loss: 0.3444719304381477
Epoch: 38, step: 1027, loss: 0.3584050238132477, mean loss: 0.34447217968847643
Epoch: 38, step: 1028, loss: 0.3555925786495209, mean loss: 0.34447237861870955
Epoch: 38, step: 1029, loss: 0.33277371525764465, mean loss: 0.3444721693477826
Epoch: 38, step: 1030, loss: 0.3288399875164032, mean loss: 0.3444718897173185
Epoch: 38, step: 1031, loss: 0.30133742094039917, mean loss: 0.3444711181362371
Epoch: 38, step: 1032, loss: 0.3215145766735077, mean loss: 0.344470707501384
Epoch: 38, step: 1033, loss: 0.42189809679985046, mean loss: 0.34447209245808447
Epoch: 38, step: 1034, loss: 0.3572928011417389, mean loss: 0.3444723217801494
Epoch: 38, step: 1035, loss: 0.31707698106765747, mean loss: 0.3444718317726243
Epoch: 38, step: 1036, loss: 0.3552572429180145, mean loss: 0.3444720246827308
Epoch: 38, step: 1037, loss: 0.3516225814819336, mean loss: 0.3444721525767891
Epoch: 38, step: 1038, loss: 0.34198009967803955, mean loss: 0.34447210800500716
Epoch: 38, step: 1039, loss: 0.2990688681602478, mean loss: 0.3444712959567913
Epoch: 38, step: 1040, loss: 0.31829604506492615, mean loss: 0.34447082781430405
Epoch: 38, step: 1041, loss: 0.3349597752094269, mean loss: 0.34447065771285174
Epoch: 38, step: 1042, loss: 0.31838077306747437, mean loss: 0.3444701911138238
Epoch: 38, step: 1043, loss: 0.38159888982772827, mean loss: 0.34447085512231357
Epoch: 38, step: 1044, loss: 0.29674163460731506, mean loss: 0.3444700015496878
Epoch: 38, step: 1045, loss: 0.33898302912712097, mean loss: 0.3444699034243539
Epoch: 38, step: 1046, loss: 0.3433336913585663, mean loss: 0.3444698831054629
Epoch: 38, step: 1047, loss: 0.3372655212879181, mean loss: 0.3444697542720971
Epoch: 38, step: 1048, loss: 0.3709346354007721, mean loss: 0.3444702275268874
Epoch: 38, step: 1049, loss: 0.31549927592277527, mean loss: 0.3444697094668823
Epoch: 38, step: 1050, loss: 0.29555895924568176, mean loss: 0.3444688348580412
Epoch: 38, step: 1051, loss: 0.3267243504524231, mean loss: 0.34446851756163166
Epoch: 38, step: 1052, loss: 0.36795124411582947, mean loss: 0.34446893745839613
Epoch: 38, step: 1053, loss: 0.3525751233100891, mean loss: 0.3444690824032492
Epoch: 38, step: 1054, loss: 0.3274317979812622, mean loss: 0.34446877776891477
Epoch: 38, step: 1055, loss: 0.34319159388542175, mean loss: 0.34446875493269885
Epoch: 38, step: 1056, loss: 0.314950555562973, mean loss: 0.34446822715284636
Epoch: 38, step: 1057, loss: 0.36618417501449585, mean loss: 0.34446861542296725
Epoch: 38, step: 1058, loss: 0.33781880140304565, mean loss: 0.34446849652979494
Epoch: 38, step: 1059, loss: 0.4084089696407318, mean loss: 0.3444696397121076
Epoch: 38, step: 1060, loss: 0.32367512583732605, mean loss: 0.34446926793669996
Epoch: 38, step: 1061, loss: 0.2941015958786011, mean loss: 0.34446836745269993
Epoch: 38, step: 1062, loss: 0.31020745635032654, mean loss: 0.34446775493976345
Epoch: 38, step: 1063, loss: 0.31610602140426636, mean loss: 0.3444672479007629
Epoch: 38, step: 1064, loss: 0.3632654547691345, mean loss: 0.3444675839610963
Epoch: 38, step: 1065, loss: 0.3557153642177582, mean loss: 0.3444677850369348
Epoch: 38, step: 1066, loss: 0.32722586393356323, mean loss: 0.34446747680973905
Epoch: 38, step: 1067, loss: 0.3398860692977905, mean loss: 0.34446739491114214
Epoch: 38, step: 1068, loss: 0.32936468720436096, mean loss: 0.3444671249354945
Epoch: 38, step: 1069, loss: 0.28252172470092773, mean loss: 0.34446601762077145
Epoch: 38, step: 1070, loss: 0.3156948983669281, mean loss: 0.3444655033273075
Epoch: 38, step: 1071, loss: 0.31948667764663696, mean loss: 0.344465056830352
Epoch: 38, step: 1072, loss: 0.32554054260253906, mean loss: 0.3444647185603685
Epoch: 38, step: 1073, loss: 0.3108135759830475, mean loss: 0.3444641170670968
Epoch: 38, step: 1074, loss: 0.3179386854171753, mean loss: 0.34446364294995646
Epoch: 38, step: 1075, loss: 0.3286588788032532, mean loss: 0.3444633604597129
Epoch: 38, step: 1076, loss: 0.32789838314056396, mean loss: 0.3444630643869087
Epoch: 38, step: 1077, loss: 0.32102158665657043, mean loss: 0.34446264541501004
Epoch: 38, step: 1078, loss: 0.3498547673225403, mean loss: 0.3444627417872269
Epoch: 38, step: 1079, loss: 0.33110901713371277, mean loss: 0.344462503123289
Epoch: 38, step: 1080, loss: 0.3171405792236328, mean loss: 0.3444620148219665
Epoch: 38, step: 1081, loss: 0.34368351101875305, mean loss: 0.34446200090868406
Epoch: 38, step: 1082, loss: 0.3133750557899475, mean loss: 0.34446144533822354
Epoch: 38, step: 1083, loss: 0.31646043062210083, mean loss: 0.3444609449269233
Epoch: 38, step: 1084, loss: 0.32744529843330383, mean loss: 0.34446064084259975
Epoch: 38, step: 1085, loss: 0.3618493676185608, mean loss: 0.34446095158863743
Epoch: 38, step: 1086, loss: 0.3496807813644409, mean loss: 0.34446104486817736
Epoch: 38, step: 1087, loss: 0.3050331473350525, mean loss: 0.3444603402953122
Epoch: 38, step: 1088, loss: 0.323737233877182, mean loss: 0.3444599699819436
Epoch: 38, step: 1089, loss: 0.33006593585014343, mean loss: 0.3444597127710839
Epoch: 38, step: 1090, loss: 0.2998054325580597, mean loss: 0.3444589148460225
Epoch: 38, step: 1091, loss: 0.31285372376441956, mean loss: 0.3444583501045622
Epoch: 38, step: 1092, loss: 0.3310871720314026, mean loss: 0.34445811118419994
Epoch: 38, step: 1093, loss: 0.3196209669113159, mean loss: 0.34445766739432265
Epoch: 38, step: 1094, loss: 0.2975675165653229, mean loss: 0.3444568295764866
Epoch: 38, step: 1095, loss: 0.335342675447464, mean loss: 0.34445666673067954
Epoch: 38, step: 1096, loss: 0.3435916304588318, mean loss: 0.3444566512750475
Epoch: 38, step: 1097, loss: 0.34538915753364563, mean loss: 0.34445666793587043
Epoch: 38, step: 1098, loss: 0.3266863524913788, mean loss: 0.3444563504443937
Epoch: 38, step: 1099, loss: 0.3259386420249939, mean loss: 0.3444560196056097
Epoch: 38, step: 1100, loss: 0.3092001676559448, mean loss: 0.34445538973313633
Epoch: 38, step: 1101, loss: 0.31235530972480774, mean loss: 0.3444548162511624
Epoch: 38, step: 1102, loss: 0.3139011263847351, mean loss: 0.34445427040587673
Epoch: 38, step: 1103, loss: 0.3339068591594696, mean loss: 0.34445408197849275
Epoch: 38, step: 1104, loss: 0.33322691917419434, mean loss: 0.34445388141106675
Epoch: 38, step: 1105, loss: 0.3305080533027649, mean loss: 0.34445363228054926
Epoch: 38, step: 1106, loss: 0.34312453866004944, mean loss: 0.3444536085378311
Epoch: 38, step: 1107, loss: 0.319474458694458, mean loss: 0.3444531623222212
Epoch: 38, step: 1108, loss: 0.3311503529548645, mean loss: 0.3444529246914292
Epoch: 38, step: 1109, loss: 0.32112938165664673, mean loss: 0.34445250806567385
Epoch: 38, step: 1110, loss: 0.33622992038726807, mean loss: 0.3444523611891635
Epoch: 38, step: 1111, loss: 0.33652353286743164, mean loss: 0.3444522195624787
Epoch: 38, step: 1112, loss: 0.3727825880050659, mean loss: 0.34445272559746026
Epoch: 38, step: 1113, loss: 0.32942187786102295, mean loss: 0.3444524571223462
Epoch: 38, step: 1114, loss: 0.3177919387817383, mean loss: 0.3444519809311171
Epoch: 38, step: 1115, loss: 0.31408101320266724, mean loss: 0.3444514384761673
Epoch: 38, step: 1116, loss: 0.32896578311920166, mean loss: 0.3444511618922784
Epoch: 38, step: 1117, loss: 0.32598423957824707, mean loss: 0.34445083206691113
Epoch: 38, step: 1118, loss: 0.36379802227020264, mean loss: 0.3444511776079839
Epoch: 38, step: 1119, loss: 0.3101269602775574, mean loss: 0.34445056458795725
Epoch: 38, step: 1120, loss: 0.327883780002594, mean loss: 0.3444502687155342
Epoch: 38, step: 1121, loss: 0.368895024061203, mean loss: 0.3444507052757968
Epoch: 38, step: 1122, loss: 0.3632410168647766, mean loss: 0.34445104084703687
Epoch: 38, step: 1123, loss: 0.3267483413219452, mean loss: 0.3444507247048209
Epoch: 38, step: 1124, loss: 0.3415890336036682, mean loss: 0.3444506736004564
Epoch: 38, step: 1125, loss: 0.3259837329387665, mean loss: 0.34445034382188106
Epoch: 38, step: 1126, loss: 0.31107330322265625, mean loss: 0.3444497477926555
Epoch: 38, step: 1127, loss: 0.3851793706417084, mean loss: 0.3444504751073493
Epoch: 38, step: 1128, loss: 0.36498841643333435, mean loss: 0.34445084184975255
Epoch: 38, step: 1129, loss: 0.35081660747528076, mean loss: 0.3444509555200791
Epoch: 38, step: 1130, loss: 0.3214746415615082, mean loss: 0.3444505452507371
Epoch: 38, step: 1131, loss: 0.3157338798046112, mean loss: 0.34445003248976563
Epoch: 38, step: 1132, loss: 0.3137992322444916, mean loss: 0.34444948520291185
Epoch: 38, step: 1133, loss: 0.3140256702899933, mean loss: 0.3444489419787053
Epoch: 38, step: 1134, loss: 0.3137173354625702, mean loss: 0.34444839326860627
Epoch: 38, step: 1135, loss: 0.30889055132865906, mean loss: 0.34444775839783887
Epoch: 38, step: 1136, loss: 0.3483796715736389, mean loss: 0.3444478285992918
Epoch: 38, step: 1137, loss: 0.3541082441806793, mean loss: 0.3444480010759135
Epoch: 38, step: 1138, loss: 0.3298695683479309, mean loss: 0.3444477407978837
Epoch: 38, step: 1139, loss: 0.30895960330963135, mean loss: 0.3444471072169102
Epoch: 38, step: 1140, loss: 0.29525813460350037, mean loss: 0.34444622904626027
Epoch: 38, step: 1141, loss: 0.33204036951065063, mean loss: 0.34444600756842375
Epoch: 38, step: 1142, loss: 0.3687655031681061, mean loss: 0.3444464417288379
Epoch: 38, step: 1143, loss: 0.28687405586242676, mean loss: 0.34444541394417166
Epoch: 38, step: 1144, loss: 0.28870904445648193, mean loss: 0.34444441895391
Epoch: 38, step: 1145, loss: 0.310495525598526, mean loss: 0.3444438129184686
Epoch: 38, step: 1146, loss: 0.3475371301174164, mean loss: 0.3444438681375407
Epoch: 38, step: 1147, loss: 0.35788223147392273, mean loss: 0.3444441080226413
Epoch: 38, step: 1148, loss: 0.33364173769950867, mean loss: 0.34444391519548145
Epoch: 38, step: 1149, loss: 0.32005375623703003, mean loss: 0.34444347982796586
Epoch: 38, step: 1150, loss: 0.33960777521133423, mean loss: 0.34444339351154907
Epoch: 38, step: 1151, loss: 0.3330828845500946, mean loss: 0.344443190732223
Epoch: 38, step: 1152, loss: 0.3366827964782715, mean loss: 0.34444305221559196
Epoch: 38, step: 1153, loss: 0.3291044235229492, mean loss: 0.3444427784386189
Epoch: 38, step: 1154, loss: 0.309183269739151, mean loss: 0.3444421491079623
Epoch: 38, step: 1155, loss: 0.31569525599479675, mean loss: 0.3444416360271257
Epoch: 38, step: 1156, loss: 0.336981862783432, mean loss: 0.34444150288583736
Epoch: 38, step: 1157, loss: 0.30723488330841064, mean loss: 0.3444408388376564
Epoch: 38, step: 1158, loss: 0.31379222869873047, mean loss: 0.34444029184384695
Epoch: 38, step: 1159, loss: 0.33502158522605896, mean loss: 0.3444401237487117
Epoch: 38, step: 1160, loss: 0.35701119899749756, mean loss: 0.34444034809999124
Epoch: 38, step: 1161, loss: 0.33217093348503113, mean loss: 0.34444012913624394
Epoch: 38, step: 1162, loss: 0.3204413652420044, mean loss: 0.3444397008545647
Epoch: 38, step: 1163, loss: 0.3039172887802124, mean loss: 0.3444389777049453
Epoch: 38, step: 1164, loss: 0.3998279571533203, mean loss: 0.34443996614079037
Epoch: 38, step: 1165, loss: 0.34364721179008484, mean loss: 0.34443995199406224
Epoch: 38, step: 1166, loss: 0.3375228941440582, mean loss: 0.3444398285611343
Epoch: 38, step: 1167, loss: 0.3580211400985718, mean loss: 0.34444007091144724
Epoch: 38, step: 1168, loss: 0.3166863024234772, mean loss: 0.3444395756710253
Epoch: 38, step: 1169, loss: 0.31758299469947815, mean loss: 0.344439096448639
Epoch: 38, step: 1170, loss: 0.31557440757751465, mean loss: 0.3444385814032476
Epoch: 38, step: 1171, loss: 0.31960397958755493, mean loss: 0.3444381382763863
Epoch: 38, step: 1172, loss: 0.34722983837127686, mean loss: 0.3444381880881464
Epoch: 38, step: 1173, loss: 0.30695098638534546, mean loss: 0.34443751922325505
Epoch: 38, step: 1174, loss: 0.32373905181884766, mean loss: 0.34443714991771857
Epoch: 38, step: 1175, loss: 0.33573171496391296, mean loss: 0.3444369945966553
Epoch: 38, step: 1176, loss: 0.2885708510875702, mean loss: 0.3444359978590951
Epoch: 38, step: 1177, loss: 0.29937636852264404, mean loss: 0.3444351939406413
Epoch: 38, step: 1178, loss: 0.3061443567276001, mean loss: 0.344434510797839
Epoch: 38, step: 1179, loss: 0.2907072603702545, mean loss: 0.34443355227271183
Epoch: 38, step: 1180, loss: 0.3101624846458435, mean loss: 0.34443294086801224
Epoch: 38, step: 1181, loss: 0.30758291482925415, mean loss: 0.3444322834657566
Epoch: 38, step: 1182, loss: 0.29285311698913574, mean loss: 0.3444313633129339
Epoch: 38, step: 1183, loss: 0.32498979568481445, mean loss: 0.3444310164889074
Epoch: 38, step: 1184, loss: 0.33414503931999207, mean loss: 0.3444308329975117
Epoch: 38, step: 1185, loss: 0.33826833963394165, mean loss: 0.34443072306684414
Epoch: 38, step: 1186, loss: 0.30338582396507263, mean loss: 0.3444299908936141
Epoch: 38, step: 1187, loss: 0.3455767333507538, mean loss: 0.3444300113492412
Epoch: 38, step: 1188, loss: 0.3315860629081726, mean loss: 0.3444297822425817
Epoch: 38, step: 1189, loss: 0.33608314394950867, mean loss: 0.34442963336030324
Epoch: 38, step: 1190, loss: 0.3635063171386719, mean loss: 0.34442997363256445
Epoch: 38, step: 1191, loss: 0.3939450681209564, mean loss: 0.34443085682132174
Epoch: 38, step: 1192, loss: 0.3140258491039276, mean loss: 0.34443031450423056
Epoch: 38, step: 1193, loss: 0.34733372926712036, mean loss: 0.34443036628988966
Epoch: 38, step: 1194, loss: 0.3712082505226135, mean loss: 0.34443084389497347
Epoch: 38, step: 1195, loss: 0.3292585611343384, mean loss: 0.3444305732899446
Epoch: 38, step: 1196, loss: 0.3110041618347168, mean loss: 0.3444299771243013
Epoch: 38, step: 1197, loss: 0.34021085500717163, mean loss: 0.34442990187689415
Epoch: 38, step: 1198, loss: 0.31258538365364075, mean loss: 0.3444293339448397
Epoch: 38, step: 1199, loss: 0.38313552737236023, mean loss: 0.3444300242393437
Epoch: 38, step: 1200, loss: 0.34095340967178345, mean loss: 0.34442996223776423
Epoch: 38, step: 1201, loss: 0.3344223201274872, mean loss: 0.3444297837657075
Epoch: 38, step: 1202, loss: 0.34485238790512085, mean loss: 0.3444297913021166
Epoch: 38, step: 1203, loss: 0.3172551393508911, mean loss: 0.3444293066981514
Epoch: 38, step: 1204, loss: 0.31401732563972473, mean loss: 0.3444287643727585
Epoch: 38, step: 1205, loss: 0.3554365038871765, mean loss: 0.34442896066612694
Epoch: 38, step: 1206, loss: 0.3649624288082123, mean loss: 0.3444293268186643
Epoch: 38, step: 1207, loss: 0.3187901973724365, mean loss: 0.3444288696301934
Epoch: 38, step: 1208, loss: 0.33636945486068726, mean loss: 0.34442872591993917
Epoch: 38, step: 1209, loss: 0.28821346163749695, mean loss: 0.3444277235436993
Epoch: 38, step: 1210, loss: 0.3221970498561859, mean loss: 0.34442732715488833
Epoch: 38, step: 1211, loss: 0.32043614983558655, mean loss: 0.34442689938266596
Epoch: 38, step: 1212, loss: 0.3715687394142151, mean loss: 0.3444273833238273
Epoch: 38, step: 1213, loss: 0.3509152829647064, mean loss: 0.3444274990015301
Epoch: 38, step: 1214, loss: 0.32460227608680725, mean loss: 0.3444271455288374
Epoch: 38, step: 1215, loss: 0.3253006637096405, mean loss: 0.34442680452038965
Epoch: 38, step: 1216, loss: 0.34667953848838806, mean loss: 0.3444268446839506
Epoch: 38, step: 1217, loss: 0.318248450756073, mean loss: 0.34442637796271813
Epoch: 38, step: 1218, loss: 0.3159867525100708, mean loss: 0.34442587093618177
Epoch: 38, step: 1219, loss: 0.29810652136802673, mean loss: 0.3444250451615692
Epoch: 38, step: 1220, loss: 0.3849393129348755, mean loss: 0.34442576743115316
Epoch: 38, step: 1221, loss: 0.34307676553726196, mean loss: 0.3444257433822015
Epoch: 38, step: 1222, loss: 0.3159823417663574, mean loss: 0.34442523632450267
Epoch: 38, step: 1223, loss: 0.3402033746242523, mean loss: 0.34442516106313464
Epoch: 38, step: 1224, loss: 0.4196248948574066, mean loss: 0.34442650159353366
Epoch: 38, step: 1225, loss: 0.34897926449775696, mean loss: 0.3444265827508459
Epoch: 38, step: 1226, loss: 0.33717429637908936, mean loss: 0.34442645347427464
Epoch: 38, step: 1227, loss: 0.37382280826568604, mean loss: 0.3444269774734688
Epoch: 38, step: 1228, loss: 0.33724936842918396, mean loss: 0.34442684953262914
Epoch: 38, step: 1229, loss: 0.3899845778942108, mean loss: 0.34442766158439847
Epoch: 38, step: 1230, loss: 0.3179807960987091, mean loss: 0.3444271901859797
Epoch: 38, step: 1231, loss: 0.3300682306289673, mean loss: 0.3444269342512949
Epoch: 38, step: 1232, loss: 0.3118419647216797, mean loss: 0.3444263534658118
Epoch: 38, step: 1233, loss: 0.3676423132419586, mean loss: 0.34442676725328153
Epoch: 38, step: 1234, loss: 0.35815104842185974, mean loss: 0.3444270118623529
Epoch: 38, step: 1235, loss: 0.3603552579879761, mean loss: 0.34442729574782605
Epoch: 38, step: 1236, loss: 0.36188411712646484, mean loss: 0.34442760687119983
Epoch: 38, step: 1237, loss: 0.34332311153411865, mean loss: 0.3444275871867347
Epoch: 38, step: 1238, loss: 0.34873297810554504, mean loss: 0.3444276639166258
Epoch: 38, step: 1239, loss: 0.3091979920864105, mean loss: 0.3444270360710343
Epoch: 38, step: 1240, loss: 0.36562448740005493, mean loss: 0.34442741383467784
Epoch: 38, step: 1241, loss: 0.3407602310180664, mean loss: 0.34442734848230916
Epoch: 38, step: 1242, loss: 0.368806928396225, mean loss: 0.34442778293976106
Epoch: 38, step: 1243, loss: 0.32046282291412354, mean loss: 0.34442735587867285
Epoch: 38, step: 1244, loss: 0.3115125000476837, mean loss: 0.3444267693388394
Epoch: 38, step: 1245, loss: 0.32679229974746704, mean loss: 0.3444264550997434
Epoch: 38, step: 1246, loss: 0.34334349632263184, mean loss: 0.3444264358022011
Epoch: 38, step: 1247, loss: 0.3237400949001312, mean loss: 0.344426067193133
Epoch: 38, step: 1248, loss: 0.35979020595550537, mean loss: 0.34442634096121916
Epoch: 38, step: 1249, loss: 0.2970825433731079, mean loss: 0.34442549737407707
Epoch: 38, step: 1250, loss: 0.36268478631973267, mean loss: 0.3444258227182131
Epoch: 38, step: 1251, loss: 0.386470764875412, mean loss: 0.3444265718619334
Epoch: 38, step: 1252, loss: 0.3672069311141968, mean loss: 0.344426977748067
Epoch: 38, step: 1253, loss: 0.3365893065929413, mean loss: 0.344426838103853
Epoch: 38, step: 1254, loss: 0.35153868794441223, mean loss: 0.34442696481381146
Epoch: 38, step: 1255, loss: 0.32928645610809326, mean loss: 0.34442669506415524
Epoch: 38, step: 1256, loss: 0.3544375002384186, mean loss: 0.34442687341768324
Epoch: 38, step: 1257, loss: 0.3149978816509247, mean loss: 0.34442634911709946
Epoch: 38, step: 1258, loss: 0.3218410611152649, mean loss: 0.3444259467496376
Epoch: 38, step: 1259, loss: 0.34689658880233765, mean loss: 0.34442599076449637
Epoch: 38, step: 1260, loss: 0.3104282319545746, mean loss: 0.3444253851001134
Epoch: 38, step: 1261, loss: 0.3249903619289398, mean loss: 0.3444250388745964
Epoch: 38, step: 1262, loss: 0.30636030435562134, mean loss: 0.3444243607818821
Epoch: 38, step: 1263, loss: 0.32114294171333313, mean loss: 0.3444239460494632
Epoch: 38, step: 1264, loss: 0.3351111114025116, mean loss: 0.3444237801546942
Epoch: 38, step: 1265, loss: 0.324096143245697, mean loss: 0.3444234180534988
Epoch: 38, step: 1266, loss: 0.32476919889450073, mean loss: 0.3444230679542958
Epoch: 38, step: 1267, loss: 0.30505937337875366, mean loss: 0.3444223667841038
Epoch: 38, step: 1268, loss: 0.33115649223327637, mean loss: 0.34442213048844555
Epoch: 38, step: 1269, loss: 0.30373668670654297, mean loss: 0.3444214058002659
Epoch: 38, step: 1270, loss: 0.3227847218513489, mean loss: 0.34442102041501843
Epoch: 38, step: 1271, loss: 0.3160746395587921, mean loss: 0.3444205155279271
Epoch: 38, step: 1272, loss: 0.40524691343307495, mean loss: 0.34442159890842233
Epoch: 38, step: 1273, loss: 0.3293973207473755, mean loss: 0.34442133131539415
Epoch: 38, step: 1274, loss: 0.347355455160141, mean loss: 0.34442138357328583
Epoch: 38, step: 1275, loss: 0.32255157828330994, mean loss: 0.34442099407044885
Epoch: 38, step: 1276, loss: 0.3266696631908417, mean loss: 0.34442067792357395
Epoch: 38, step: 1277, loss: 0.30459925532341003, mean loss: 0.34441996872637715
Epoch: 38, step: 1278, loss: 0.336622416973114, mean loss: 0.34441982985882796
Epoch: 38, step: 1279, loss: 0.32913532853126526, mean loss: 0.34441955766012927
Epoch: 38, step: 1280, loss: 0.30995476245880127, mean loss: 0.34441894389425387
Epoch: 38, step: 1281, loss: 0.320195734500885, mean loss: 0.34441851252321365
Epoch: 38, step: 1282, loss: 0.3167526125907898, mean loss: 0.34441801985292725
Epoch: 38, step: 1283, loss: 0.32064729928970337, mean loss: 0.3444175965549615
Epoch: 38, step: 1284, loss: 0.4058257043361664, mean loss: 0.344418690062588
Epoch: 38, step: 1285, loss: 0.3127768337726593, mean loss: 0.3444181266191554
Epoch: 38, step: 1286, loss: 0.36381179094314575, mean loss: 0.3444184719540852
Epoch: 38, step: 1287, loss: 0.37953314185142517, mean loss: 0.34441909721530134
Epoch: 38, step: 1288, loss: 0.3112025856971741, mean loss: 0.34441850576373323
Epoch: 38, step: 1289, loss: 0.33630648255348206, mean loss: 0.3444183613240194
Epoch: 38, step: 1290, loss: 0.31808987259864807, mean loss: 0.3444178925369402
Epoch: 38, step: 1291, loss: 0.3422123193740845, mean loss: 0.3444178532667108
Epoch: 38, step: 1292, loss: 0.3241845369338989, mean loss: 0.34441749301893493
Epoch: 38, step: 1293, loss: 0.31241410970687866, mean loss: 0.34441692321899703
Epoch: 38, step: 1294, loss: 0.3018880784511566, mean loss: 0.34441616603337616
Epoch: 38, step: 1295, loss: 0.3314436674118042, mean loss: 0.3444159350744917
Epoch: 38, step: 1296, loss: 0.3017506003379822, mean loss: 0.34441517548584427
Epoch: 38, step: 1297, loss: 0.3174203932285309, mean loss: 0.3444146948950973
Epoch: 38, step: 1298, loss: 0.35688021779060364, mean loss: 0.3444149168160689
Epoch: 38, step: 1299, loss: 0.34892991185188293, mean loss: 0.34441499719410484
Epoch: 38, step: 1300, loss: 0.3768619894981384, mean loss: 0.34441557482022955
Epoch: 38, step: 1301, loss: 0.3437817692756653, mean loss: 0.344415563537331
Epoch: 38, step: 1302, loss: 0.3898112177848816, mean loss: 0.34441637164866606
Epoch: 38, step: 1303, loss: 0.31304946541786194, mean loss: 0.3444158132802128
Epoch: 38, step: 1304, loss: 0.3465609550476074, mean loss: 0.34441585146562265
Epoch: 38, step: 1305, loss: 0.39808785915374756, mean loss: 0.3444168068575499
Epoch: 38, step: 1306, loss: 0.3311218023300171, mean loss: 0.3444165702032035
Epoch: 38, step: 1307, loss: 0.3766237795352936, mean loss: 0.34441714348923647
Epoch: 38, step: 1308, loss: 0.33642879128456116, mean loss: 0.34441700129966696
Epoch: 38, step: 1309, loss: 0.31664130091667175, mean loss: 0.3444165069117779
Epoch: 38, step: 1310, loss: 0.36958152055740356, mean loss: 0.34441695482331064
Epoch: 38, step: 1311, loss: 0.4009741544723511, mean loss: 0.34441796146576487
Epoch: 38, step: 1312, loss: 0.34429800510406494, mean loss: 0.3444179593307402
Epoch: 38, step: 1313, loss: 0.3386465013027191, mean loss: 0.34441785661016877
Epoch: 38, step: 1314, loss: 0.30174940824508667, mean loss: 0.3444170972094468
Epoch: 38, step: 1315, loss: 0.3489411175251007, mean loss: 0.3444171777252209
Epoch: 38, step: 1316, loss: 0.3092184364795685, mean loss: 0.3444165512904873
Epoch: 38, step: 1317, loss: 0.3245657682418823, mean loss: 0.34441619801084594
Epoch: 38, step: 1318, loss: 0.33944401144981384, mean loss: 0.3444161095236049
Epoch: 38, step: 1319, loss: 0.2902942895889282, mean loss: 0.3444151463647934
Epoch: 38, step: 1320, loss: 0.33561691641807556, mean loss: 0.3444149897931573
Epoch: 38, step: 1321, loss: 0.35744205117225647, mean loss: 0.3444152216161523
Epoch: 38, step: 1322, loss: 0.30568405985832214, mean loss: 0.34441453238825376
Epoch: 38, step: 1323, loss: 0.3132933974266052, mean loss: 0.3444139785919878
Epoch: 38, step: 1324, loss: 0.3698580265045166, mean loss: 0.34441443135722283
Epoch: 38, step: 1325, loss: 0.32713159918785095, mean loss: 0.34441412382257447
Epoch: 38, step: 1326, loss: 0.3121681809425354, mean loss: 0.3444135500411392
Epoch: 38, step: 1327, loss: 0.29478955268859863, mean loss: 0.34441266705186246
Epoch: 38, step: 1328, loss: 0.33295926451683044, mean loss: 0.34441246325829056
Epoch: 38, step: 1329, loss: 0.33575892448425293, mean loss: 0.34441230928621175
Epoch: 38, step: 1330, loss: 0.30859965085983276, mean loss: 0.344411672084311
Epoch: 38, step: 1331, loss: 0.349957138299942, mean loss: 0.34441177075106455
Epoch: 38, step: 1332, loss: 0.3261360824108124, mean loss: 0.3444114455898095
Epoch: 38, step: 1333, loss: 0.320766806602478, mean loss: 0.34441102491160813
Epoch: 38, step: 1334, loss: 0.3199998736381531, mean loss: 0.34441059060358115
Epoch: 38, step: 1335, loss: 0.34205737709999084, mean loss: 0.34441054873741433
Epoch: 38, step: 1336, loss: 0.3318808674812317, mean loss: 0.344410325825047
Epoch: 38, step: 1337, loss: 0.3021295666694641, mean loss: 0.34440957363221375
Epoch: 38, step: 1338, loss: 0.31170645356178284, mean loss: 0.3444089918400366
Epoch: 38, step: 1339, loss: 0.3532704710960388, mean loss: 0.3444091494839428
Epoch: 38, step: 1340, loss: 0.37624484300613403, mean loss: 0.34440971582435376
Epoch: 38, step: 1341, loss: 0.3425883948802948, mean loss: 0.3444096834245789
Epoch: 38, step: 1342, loss: 0.3356097936630249, mean loss: 0.3444095268846917
Epoch: 38, step: 1343, loss: 0.3882508873939514, mean loss: 0.3444103067580464
Epoch: 38, step: 1344, loss: 0.34162986278533936, mean loss: 0.34441025729891533
Epoch: 38, step: 1345, loss: 0.3401746451854706, mean loss: 0.34441018195628287
Epoch: 38, step: 1346, loss: 0.31758636236190796, mean loss: 0.3444097048254269
Epoch: 38, step: 1347, loss: 0.32168012857437134, mean loss: 0.34440930052844626
Epoch: 38, step: 1348, loss: 0.35403746366500854, mean loss: 0.3444094717840827
Epoch: 38, step: 1349, loss: 0.326023668050766, mean loss: 0.3444091447625656
Epoch: 38, step: 1350, loss: 0.35370832681655884, mean loss: 0.3444093101607488
Epoch: 38, step: 1351, loss: 0.3097330629825592, mean loss: 0.344408693409056
Epoch: 38, step: 1352, loss: 0.31744542717933655, mean loss: 0.344408213848963
Epoch: 38, step: 1353, loss: 0.3119000792503357, mean loss: 0.34440763567988464
Epoch: 38, step: 1354, loss: 0.3214327394962311, mean loss: 0.3444072270702099
Epoch: 38, step: 1355, loss: 0.2956275939941406, mean loss: 0.34440635953743126
Epoch: 38, step: 1356, loss: 0.3852640986442566, mean loss: 0.34440708616851323
Epoch: 38, step: 1357, loss: 0.282128244638443, mean loss: 0.3444059785953044
Epoch: 38, step: 1358, loss: 0.3228239417076111, mean loss: 0.34440559478500604
Epoch: 38, step: 1359, loss: 0.3193880617618561, mean loss: 0.3444051498864959
Epoch: 38, step: 1360, loss: 0.33638766407966614, mean loss: 0.3444050073103252
Epoch: 38, step: 1361, loss: 0.33992713689804077, mean loss: 0.34440492768109
Epoch: 38, step: 1362, loss: 0.31337040662765503, mean loss: 0.3444043758091054
Epoch: 38, step: 1363, loss: 0.3217974901199341, mean loss: 0.34440397380886195
Epoch: 38, step: 1364, loss: 0.33079540729522705, mean loss: 0.34440373182286493
Epoch: 38, step: 1365, loss: 0.3837684988975525, mean loss: 0.34440443179027264
Epoch: 38, step: 1366, loss: 0.33791109919548035, mean loss: 0.34440431633067
Epoch: 38, step: 1367, loss: 0.31117114424705505, mean loss: 0.3444037254136699
Epoch: 38, step: 1368, loss: 0.33218860626220703, mean loss: 0.3444035082212453
Epoch: 38, step: 1369, loss: 0.31808844208717346, mean loss: 0.34440304033130303
Epoch: 38, step: 1370, loss: 0.33082762360572815, mean loss: 0.344402798960524
Epoch: 38, step: 1371, loss: 0.35216569900512695, mean loss: 0.34440293698235824
Epoch: 38, step: 1372, loss: 0.32801660895347595, mean loss: 0.3444026456439632
Epoch: 38, step: 1373, loss: 0.33645740151405334, mean loss: 0.34440250438513365
Epoch: 38, step: 1374, loss: 0.3173184096813202, mean loss: 0.3444020228644356
Epoch: 38, step: 1375, loss: 0.30403760075569153, mean loss: 0.34440130524919405
Epoch: 38, step: 1376, loss: 0.37635448575019836, mean loss: 0.34440187331583527
Epoch: 38, step: 1377, loss: 0.2999096214771271, mean loss: 0.34440108234246924
Epoch: 38, step: 1378, loss: 0.3686881959438324, mean loss: 0.3444015141057019
Epoch: 38, step: 1379, loss: 0.31307274103164673, mean loss: 0.34440095716953834
Epoch: 38, step: 1380, loss: 0.30325043201446533, mean loss: 0.3444002256436614
Epoch: 38, step: 1381, loss: 0.3228112757205963, mean loss: 0.34439984186739797
Epoch: 38, step: 1382, loss: 0.3079952597618103, mean loss: 0.3443991947323503
Epoch: 38, step: 1383, loss: 0.3382633626461029, mean loss: 0.34439908566252514
Epoch: 38, step: 1384, loss: 0.3542984127998352, mean loss: 0.34439926162866513
Epoch: 38, step: 1385, loss: 0.32511332631111145, mean loss: 0.3443989188163484
Epoch: 38, step: 1386, loss: 0.3847706913948059, mean loss: 0.3443996364219329
Epoch: 38, step: 1387, loss: 0.33470115065574646, mean loss: 0.3443994640350547
Epoch: 38, step: 1388, loss: 0.3789846897125244, mean loss: 0.3444000787632977
Epoch: 38, step: 1389, loss: 0.34304293990135193, mean loss: 0.34440005464153056
Epoch: 38, step: 1390, loss: 0.2990427315235138, mean loss: 0.3443992484754335
Epoch: 38, step: 1391, loss: 0.316728800535202, mean loss: 0.34439875667876174
Epoch: 38, step: 1392, loss: 0.34436383843421936, mean loss: 0.34439875605815845
Epoch: 38, step: 1393, loss: 0.3441646993160248, mean loss: 0.34439875189833297
Epoch: 38, step: 1394, loss: 0.31199681758880615, mean loss: 0.34439817603798306
Epoch: 38, step: 1395, loss: 0.3734881579875946, mean loss: 0.344398693027781
Epoch: 38, step: 1396, loss: 0.30504927039146423, mean loss: 0.3443979937187007
Epoch: 38, step: 1397, loss: 0.32778167724609375, mean loss: 0.34439769842251317
Epoch: 38, step: 1398, loss: 0.3118424415588379, mean loss: 0.34439711987838095
Epoch: 38, step: 1399, loss: 0.3394184708595276, mean loss: 0.3443970314036685
Epoch: 38, step: 1400, loss: 0.3540065586566925, mean loss: 0.3443972021698842
Epoch: 38, step: 1401, loss: 0.28769442439079285, mean loss: 0.3443961945504191
Epoch: 38, step: 1402, loss: 0.3285726308822632, mean loss: 0.3443959133675907
Epoch: 38, step: 1403, loss: 0.3359115719795227, mean loss: 0.3443957626045409
Epoch: 38, step: 1404, loss: 0.3148306608200073, mean loss: 0.34439523725489923
Epoch: 38, step: 1405, loss: 0.3241965174674988, mean loss: 0.3443948783452047
Epoch: 38, step: 1406, loss: 0.35330384969711304, mean loss: 0.34439503664530513
Epoch: 38, step: 1407, loss: 0.32970383763313293, mean loss: 0.34439477560765386
Epoch: 38, step: 1408, loss: 0.33044397830963135, mean loss: 0.3443945277300878
Epoch: 38, step: 1409, loss: 0.3018827438354492, mean loss: 0.34439377239474267
Epoch: 38, step: 1410, loss: 0.3117994964122772, mean loss: 0.34439319328069434
Epoch: 38, step: 1411, loss: 0.3322708308696747, mean loss: 0.34439297790221357
Epoch: 38, step: 1412, loss: 0.30834928154945374, mean loss: 0.3443923375238472
Epoch: 38, step: 1413, loss: 0.2928609251976013, mean loss: 0.3443914219957882
Epoch: 38, step: 1414, loss: 0.3317999243736267, mean loss: 0.3443911982940876
Epoch: 38, step: 1415, loss: 0.3794791102409363, mean loss: 0.34439182165807186
Epoch: 38, step: 1416, loss: 0.32637909054756165, mean loss: 0.34439150165361077
Epoch: 38, step: 1417, loss: 0.3616887032985687, mean loss: 0.3443918089409024
Epoch: 38, step: 1418, loss: 0.3134230375289917, mean loss: 0.344391258785968
Epoch: 38, step: 1419, loss: 0.3245930075645447, mean loss: 0.34439090707966474
Epoch: 38, step: 1420, loss: 0.28508999943733215, mean loss: 0.3443898536465977
Epoch: 38, step: 1421, loss: 0.36566317081451416, mean loss: 0.34439023154330367
Epoch: 38, step: 1422, loss: 0.33379966020584106, mean loss: 0.34439004341698093
Epoch: 38, step: 1423, loss: 0.33350691199302673, mean loss: 0.3443898500971816
Epoch: 38, step: 1424, loss: 0.31562402844429016, mean loss: 0.3443893391317367
Epoch: 38, step: 1425, loss: 0.33021652698516846, mean loss: 0.3443890873854554
Epoch: 38, step: 1426, loss: 0.3038805425167084, mean loss: 0.34438836786033294
Epoch: 38, step: 1427, loss: 0.31085893511772156, mean loss: 0.3443877723109059
Epoch: 38, step: 1428, loss: 0.3049578070640564, mean loss: 0.34438707196872287
Epoch: 38, step: 1429, loss: 0.34637898206710815, mean loss: 0.344387107347752
Epoch: 38, step: 1430, loss: 0.318829208612442, mean loss: 0.34438665341281544
Epoch: 38, step: 1431, loss: 0.36603298783302307, mean loss: 0.344387037867462
Epoch: 38, step: 1432, loss: 0.3023243248462677, mean loss: 0.34438629081634714
Epoch: 38, step: 1433, loss: 0.3578912913799286, mean loss: 0.3443865306664619
Epoch: 38, step: 1434, loss: 0.3074566125869751, mean loss: 0.3443858747991971
Epoch: 38, step: 1435, loss: 0.3157184422016144, mean loss: 0.34438536568090844
Epoch: 38, step: 1436, loss: 0.32588863372802734, mean loss: 0.34438503719466373
Epoch: 38, step: 1437, loss: 0.349347323179245, mean loss: 0.3443851253190819
Epoch: 38, step: 1438, loss: 0.3694426715373993, mean loss: 0.3443855703040088
Epoch: 38, step: 1439, loss: 0.33425188064575195, mean loss: 0.34438539034787763
Epoch: 38, step: 1440, loss: 0.3345089554786682, mean loss: 0.3443852149632441
Epoch: 38, step: 1441, loss: 0.37563449144363403, mean loss: 0.3443857698745713
Epoch: 38, step: 1442, loss: 0.4142419397830963, mean loss: 0.3443870103286228
Epoch: 38, step: 1443, loss: 0.32099437713623047, mean loss: 0.3443865949469694
Valid: 38, mean loss: 0.18533487369616825
Epoch: 39, step: 0, loss: 0.31862348318099976, mean loss: 0.34438613748098634
Epoch: 39, step: 1, loss: 0.30473822355270386, mean loss: 0.34438543348024186
Epoch: 39, step: 2, loss: 0.32560428977012634, mean loss: 0.3443851000023088
Epoch: 39, step: 3, loss: 0.3198070228099823, mean loss: 0.3443846636017905
Epoch: 39, step: 4, loss: 0.3336731791496277, mean loss: 0.34438447341545764
Epoch: 39, step: 5, loss: 0.3156512379646301, mean loss: 0.34438396325538784
Epoch: 39, step: 6, loss: 0.301285982131958, mean loss: 0.3443831980621076
Epoch: 39, step: 7, loss: 0.32192423939704895, mean loss: 0.3443827993163036
Epoch: 39, step: 8, loss: 0.3581773042678833, mean loss: 0.3443830442254017
Epoch: 39, step: 9, loss: 0.31064867973327637, mean loss: 0.3443824453125641
Epoch: 39, step: 10, loss: 0.3102036714553833, mean loss: 0.3443818385205486
Epoch: 39, step: 11, loss: 0.33291375637054443, mean loss: 0.34438163492585055
Epoch: 39, step: 12, loss: 0.2983700931072235, mean loss: 0.34438081809008536
Epoch: 39, step: 13, loss: 0.32217711210250854, mean loss: 0.34438042391813456
Epoch: 39, step: 14, loss: 0.3158385455608368, mean loss: 0.3443799172365852
Epoch: 39, step: 15, loss: 0.33073341846466064, mean loss: 0.3443796749853111
Epoch: 39, step: 16, loss: 0.33420541882514954, mean loss: 0.34437949437614485
Epoch: 39, step: 17, loss: 0.3097369074821472, mean loss: 0.34437887942625856
Epoch: 39, step: 18, loss: 0.32596564292907715, mean loss: 0.3443785525737424
Epoch: 39, step: 19, loss: 0.31490933895111084, mean loss: 0.3443780294763691
Epoch: 39, step: 20, loss: 0.29785600304603577, mean loss: 0.3443772036953294
Epoch: 39, step: 21, loss: 0.3440135419368744, mean loss: 0.34437719724033
Epoch: 39, step: 22, loss: 0.32443076372146606, mean loss: 0.34437684319724227
Epoch: 39, step: 23, loss: 0.3068607747554779, mean loss: 0.3443761773103335
Epoch: 39, step: 24, loss: 0.311333030462265, mean loss: 0.344375590825414
Epoch: 39, step: 25, loss: 0.41772669553756714, mean loss: 0.3443768927157394
Epoch: 39, step: 26, loss: 0.32089951634407043, mean loss: 0.3443764760290814
Epoch: 39, step: 27, loss: 0.3321548402309418, mean loss: 0.34437625911803854
Epoch: 39, step: 28, loss: 0.29466721415519714, mean loss: 0.344375376891666
Epoch: 39, step: 29, loss: 0.313581645488739, mean loss: 0.34437483038026495
Epoch: 39, step: 30, loss: 0.3310590386390686, mean loss: 0.34437459406259513
Epoch: 39, step: 31, loss: 0.3393736183643341, mean loss: 0.3443745053109855
Epoch: 39, step: 32, loss: 0.28493428230285645, mean loss: 0.3443734504524608
Epoch: 39, step: 33, loss: 0.3864922821521759, mean loss: 0.34437419790289026
Epoch: 39, step: 34, loss: 0.3729463219642639, mean loss: 0.34437470494134675
Epoch: 39, step: 35, loss: 0.33250612020492554, mean loss: 0.34437449432620026
Epoch: 39, step: 36, loss: 0.3077748417854309, mean loss: 0.34437384485496464
Epoch: 39, step: 37, loss: 0.3571045994758606, mean loss: 0.3443740707618146
Epoch: 39, step: 38, loss: 0.3629334568977356, mean loss: 0.3443744000917079
Epoch: 39, step: 39, loss: 0.3648456037044525, mean loss: 0.3443747633396959
Epoch: 39, step: 40, loss: 0.2901342511177063, mean loss: 0.3443738008947073
Epoch: 39, step: 41, loss: 0.31934428215026855, mean loss: 0.3443733567781889
Epoch: 39, step: 42, loss: 0.3498063385486603, mean loss: 0.3443734531777306
Epoch: 39, step: 43, loss: 0.3248507082462311, mean loss: 0.3443731067841016
Epoch: 39, step: 44, loss: 0.3566034138202667, mean loss: 0.34437332378356994
Epoch: 39, step: 45, loss: 0.3096630573272705, mean loss: 0.3443727079383825
Epoch: 39, step: 46, loss: 0.3434397876262665, mean loss: 0.3443726913863836
Epoch: 39, step: 47, loss: 0.3285787105560303, mean loss: 0.3443724111724025
Epoch: 39, step: 48, loss: 0.4277838468551636, mean loss: 0.34437389101691035
Epoch: 39, step: 49, loss: 0.3075851500034332, mean loss: 0.344373238340811
Epoch: 39, step: 50, loss: 0.3282957673072815, mean loss: 0.34437295311237887
Epoch: 39, step: 51, loss: 0.3310694396495819, mean loss: 0.34437271710057316
Epoch: 39, step: 52, loss: 0.3317128121852875, mean loss: 0.34437249251072916
Epoch: 39, step: 53, loss: 0.3176637887954712, mean loss: 0.34437201870012574
Epoch: 39, step: 54, loss: 0.3110663592815399, mean loss: 0.3443714278704541
Epoch: 39, step: 55, loss: 0.3384024500846863, mean loss: 0.34437132198494735
Epoch: 39, step: 56, loss: 0.33127495646476746, mean loss: 0.3443710896686697
Epoch: 39, step: 57, loss: 0.3382422924041748, mean loss: 0.34437098095193386
Epoch: 39, step: 58, loss: 0.3305513262748718, mean loss: 0.3443707358139351
Epoch: 39, step: 59, loss: 0.38441482186317444, mean loss: 0.34437144611771775
Epoch: 39, step: 60, loss: 0.35169854760169983, mean loss: 0.344371576083865
Epoch: 39, step: 61, loss: 0.32143712043762207, mean loss: 0.3443711692859004
Epoch: 39, step: 62, loss: 0.38137853145599365, mean loss: 0.3443718256892096
Epoch: 39, step: 63, loss: 0.31071937084198, mean loss: 0.3443712288028164
Epoch: 39, step: 64, loss: 0.3850136697292328, mean loss: 0.34437194965631185
Epoch: 39, step: 65, loss: 0.3410874903202057, mean loss: 0.34437189140262564
Epoch: 39, step: 66, loss: 0.31888216733932495, mean loss: 0.34437143932089775
Epoch: 39, step: 67, loss: 0.32482460141181946, mean loss: 0.34437109264741045
Epoch: 39, step: 68, loss: 0.33308595418930054, mean loss: 0.3443708925030732
Epoch: 39, step: 69, loss: 0.3589775562286377, mean loss: 0.3443711515507752
Epoch: 39, step: 70, loss: 0.3313756287097931, mean loss: 0.344370921080581
Epoch: 39, step: 71, loss: 0.3455142080783844, mean loss: 0.34437094135594093
Epoch: 39, step: 72, loss: 0.34125620126724243, mean loss: 0.34437088611927974
Epoch: 39, step: 73, loss: 0.3159356713294983, mean loss: 0.34437038185939695
Epoch: 39, step: 74, loss: 0.3395483195781708, mean loss: 0.3443702963481934
Epoch: 39, step: 75, loss: 0.42952603101730347, mean loss: 0.344371806415839
Epoch: 39, step: 76, loss: 0.3665061295032501, mean loss: 0.3443721989170907
Epoch: 39, step: 77, loss: 0.36207467317581177, mean loss: 0.34437251282414216
Epoch: 39, step: 78, loss: 0.29151785373687744, mean loss: 0.34437157560170956
Epoch: 39, step: 79, loss: 0.32802286744117737, mean loss: 0.34437128571043785
Epoch: 39, step: 80, loss: 0.3428576588630676, mean loss: 0.3443712588716548
Epoch: 39, step: 81, loss: 0.3252016603946686, mean loss: 0.34437091897310385
Epoch: 39, step: 82, loss: 0.31810152530670166, mean loss: 0.3443704531954541
Epoch: 39, step: 83, loss: 0.30998364090919495, mean loss: 0.34436984350020083
Epoch: 39, step: 84, loss: 0.35371795296669006, mean loss: 0.3443700092438839
Epoch: 39, step: 85, loss: 0.3269924223423004, mean loss: 0.34436970114156656
Epoch: 39, step: 86, loss: 0.30766215920448303, mean loss: 0.3443690503332419
Epoch: 39, step: 87, loss: 0.32638075947761536, mean loss: 0.344368731414533
Epoch: 39, step: 88, loss: 0.3578638732433319, mean loss: 0.34436897066888683
Epoch: 39, step: 89, loss: 0.32924872636795044, mean loss: 0.344368702607966
Epoch: 39, step: 90, loss: 0.33307895064353943, mean loss: 0.34436850245989986
Epoch: 39, step: 91, loss: 0.2994137108325958, mean loss: 0.34436770550217
Epoch: 39, step: 92, loss: 0.3296782374382019, mean loss: 0.3443674450921634
Epoch: 39, step: 93, loss: 0.30269721150398254, mean loss: 0.34436670638921024
Epoch: 39, step: 94, loss: 0.3074911832809448, mean loss: 0.344366052695372
Epoch: 39, step: 95, loss: 0.30545032024383545, mean loss: 0.34436536284689206
Epoch: 39, step: 96, loss: 0.3330399990081787, mean loss: 0.3443651620888427
Epoch: 39, step: 97, loss: 0.32942619919776917, mean loss: 0.344364897279347
Epoch: 39, step: 98, loss: 0.30211278796195984, mean loss: 0.3443641483276618
Epoch: 39, step: 99, loss: 0.3178826868534088, mean loss: 0.3443636789313651
Epoch: 39, step: 100, loss: 0.3262683153152466, mean loss: 0.3443633581882626
Epoch: 39, step: 101, loss: 0.32867228984832764, mean loss: 0.3443630800665933
Epoch: 39, step: 102, loss: 0.3407943546772003, mean loss: 0.3443630168126294
Epoch: 39, step: 103, loss: 0.32731467485427856, mean loss: 0.34436271464421464
Epoch: 39, step: 104, loss: 0.306433767080307, mean loss: 0.34436204239544976
Epoch: 39, step: 105, loss: 0.33035051822662354, mean loss: 0.34436179406103823
Epoch: 39, step: 106, loss: 0.3322351574897766, mean loss: 0.3443615791373977
Epoch: 39, step: 107, loss: 0.31652525067329407, mean loss: 0.3443610857954073
Epoch: 39, step: 108, loss: 0.33370572328567505, mean loss: 0.3443608969542463
Epoch: 39, step: 109, loss: 0.3565724194049835, mean loss: 0.3443611133708353
Epoch: 39, step: 110, loss: 0.31898894906044006, mean loss: 0.34436066372502194
Epoch: 39, step: 111, loss: 0.34826192259788513, mean loss: 0.34436073286195523
Epoch: 39, step: 112, loss: 0.30301520228385925, mean loss: 0.34436000016191487
Epoch: 39, step: 113, loss: 0.3753781020641327, mean loss: 0.3443605498358809
Epoch: 39, step: 114, loss: 0.38136470317840576, mean loss: 0.34436120557746513
Epoch: 39, step: 115, loss: 0.27753350138664246, mean loss: 0.3443600213609888
Epoch: 39, step: 116, loss: 0.28551843762397766, mean loss: 0.34435897868057597
Epoch: 39, step: 117, loss: 0.3037512004375458, mean loss: 0.3443582591182865
Epoch: 39, step: 118, loss: 0.3297576904296875, mean loss: 0.34435800040350506
Epoch: 39, step: 119, loss: 0.3560061752796173, mean loss: 0.34435820679968615
Epoch: 39, step: 120, loss: 0.3314902186393738, mean loss: 0.34435797879344626
Epoch: 39, step: 121, loss: 0.3358895182609558, mean loss: 0.3443578287445336
Epoch: 39, step: 122, loss: 0.31888318061828613, mean loss: 0.34435737737849015
Epoch: 39, step: 123, loss: 0.3163668215274811, mean loss: 0.34435688144376564
Epoch: 39, step: 124, loss: 0.3081769049167633, mean loss: 0.344356240420812
Epoch: 39, step: 125, loss: 0.32337698340415955, mean loss: 0.3443558687249646
Epoch: 39, step: 126, loss: 0.3274327218532562, mean loss: 0.34435556889776064
Epoch: 39, step: 127, loss: 0.4141319990158081, mean loss: 0.3443568051040911
Epoch: 39, step: 128, loss: 0.3372640311717987, mean loss: 0.3443566794459472
Epoch: 39, step: 129, loss: 0.31992512941360474, mean loss: 0.3443562466154538
Epoch: 39, step: 130, loss: 0.30110540986061096, mean loss: 0.34435548039516295
Epoch: 39, step: 131, loss: 0.2921256721019745, mean loss: 0.3443545551221986
Epoch: 39, step: 132, loss: 0.3258515000343323, mean loss: 0.3443542273386225
Epoch: 39, step: 133, loss: 0.3394418954849243, mean loss: 0.3443541403176862
Epoch: 39, step: 134, loss: 0.3681899607181549, mean loss: 0.3443545625568033
Epoch: 39, step: 135, loss: 0.3780069351196289, mean loss: 0.34435515868045813
Epoch: 39, step: 136, loss: 0.3447149991989136, mean loss: 0.34435516505461927
Epoch: 39, step: 137, loss: 0.379198282957077, mean loss: 0.34435578224946645
Epoch: 39, step: 138, loss: 0.3781439960002899, mean loss: 0.3443563807476287
Epoch: 39, step: 139, loss: 0.3018619120121002, mean loss: 0.34435562804696385
Epoch: 39, step: 140, loss: 0.3661385476589203, mean loss: 0.34435601387900616
Epoch: 39, step: 141, loss: 0.3228382170200348, mean loss: 0.3443556327497267
Epoch: 39, step: 142, loss: 0.3202768862247467, mean loss: 0.3443552062677393
Epoch: 39, step: 143, loss: 0.34387001395225525, mean loss: 0.34435519767418077
Epoch: 39, step: 144, loss: 0.3361050486564636, mean loss: 0.34435505155298174
Epoch: 39, step: 145, loss: 0.31926023960113525, mean loss: 0.34435460709809257
Epoch: 39, step: 146, loss: 0.3142305612564087, mean loss: 0.34435407357975595
Epoch: 39, step: 147, loss: 0.29501745104789734, mean loss: 0.34435319980845863
Epoch: 39, step: 148, loss: 0.35507887601852417, mean loss: 0.3443533897611056
Epoch: 39, step: 149, loss: 0.3228524923324585, mean loss: 0.3443530089851089
Epoch: 39, step: 150, loss: 0.33380502462387085, mean loss: 0.3443528221860163
Epoch: 39, step: 151, loss: 0.3187488317489624, mean loss: 0.34435236876123704
Epoch: 39, step: 152, loss: 0.3132062554359436, mean loss: 0.3443518171999676
Epoch: 39, step: 153, loss: 0.3091980814933777, mean loss: 0.3443511946794132
Epoch: 39, step: 154, loss: 0.37226805090904236, mean loss: 0.34435168903680424
Epoch: 39, step: 155, loss: 0.36221009492874146, mean loss: 0.3443520052715027
Epoch: 39, step: 156, loss: 0.34590691328048706, mean loss: 0.34435203280515614
Epoch: 39, step: 157, loss: 0.3426772654056549, mean loss: 0.34435200314960845
Epoch: 39, step: 158, loss: 0.34272003173828125, mean loss: 0.3443519742523723
Epoch: 39, step: 159, loss: 0.31323689222335815, mean loss: 0.34435142330892676
Epoch: 39, step: 160, loss: 0.33623647689819336, mean loss: 0.34435127962306505
Epoch: 39, step: 161, loss: 0.3304423689842224, mean loss: 0.34435103335176226
Epoch: 39, step: 162, loss: 0.3503311276435852, mean loss: 0.34435113923349336
Epoch: 39, step: 163, loss: 0.3157615065574646, mean loss: 0.34435063304311314
Epoch: 39, step: 164, loss: 0.3441324532032013, mean loss: 0.344350629180224
Epoch: 39, step: 165, loss: 0.32066717743873596, mean loss: 0.34435020987050163
Epoch: 39, step: 166, loss: 0.31717273592948914, mean loss: 0.34434972870848934
Epoch: 39, step: 167, loss: 0.3328915238380432, mean loss: 0.34434952585095674
Epoch: 39, step: 168, loss: 0.31374070048332214, mean loss: 0.3443489839579698
Epoch: 39, step: 169, loss: 0.30742087960243225, mean loss: 0.34434833020120964
Epoch: 39, step: 170, loss: 0.3144461512565613, mean loss: 0.3443478008373039
Epoch: 39, step: 171, loss: 0.31758859753608704, mean loss: 0.3443473271224742
Epoch: 39, step: 172, loss: 0.341988742351532, mean loss: 0.34434728536948206
Epoch: 39, step: 173, loss: 0.3354074954986572, mean loss: 0.344347127115103
Epoch: 39, step: 174, loss: 0.32904252409935, mean loss: 0.34434685619401795
Epoch: 39, step: 175, loss: 0.34700238704681396, mean loss: 0.3443469032012199
Epoch: 39, step: 176, loss: 0.3297231197357178, mean loss: 0.34434664434112283
Epoch: 39, step: 177, loss: 0.32482725381851196, mean loss: 0.34434629882849277
Epoch: 39, step: 178, loss: 0.28207069635391235, mean loss: 0.34434519650788964
Epoch: 39, step: 179, loss: 0.347928524017334, mean loss: 0.3443452599341058
Epoch: 39, step: 180, loss: 0.36494606733322144, mean loss: 0.34434562456952716
Epoch: 39, step: 181, loss: 0.3212098479270935, mean loss: 0.34434521507225924
Epoch: 39, step: 182, loss: 0.3593263030052185, mean loss: 0.34434548022895106
Epoch: 39, step: 183, loss: 0.35053300857543945, mean loss: 0.3443455897427271
Epoch: 39, step: 184, loss: 0.36156049370765686, mean loss: 0.34434589442590025
Epoch: 39, step: 185, loss: 0.32686683535575867, mean loss: 0.34434558507297347
Epoch: 39, step: 186, loss: 0.33097726106643677, mean loss: 0.3443453484780315
Epoch: 39, step: 187, loss: 0.3754481077194214, mean loss: 0.3443458989303754
Epoch: 39, step: 188, loss: 0.3648988902568817, mean loss: 0.34434626266794427
Epoch: 39, step: 189, loss: 0.3144530653953552, mean loss: 0.34434573364098653
Epoch: 39, step: 190, loss: 0.3473467528820038, mean loss: 0.3443457867497915
Epoch: 39, step: 191, loss: 0.3219020366668701, mean loss: 0.3443453895715144
Epoch: 39, step: 192, loss: 0.3217260539531708, mean loss: 0.34434498929305224
Epoch: 39, step: 193, loss: 0.3759145438671112, mean loss: 0.34434554794735367
Epoch: 39, step: 194, loss: 0.3307357430458069, mean loss: 0.34434530711273914
Epoch: 39, step: 195, loss: 0.32704031467437744, mean loss: 0.3443450008947246
Epoch: 39, step: 196, loss: 0.360864520072937, mean loss: 0.344345293208337
Epoch: 39, step: 197, loss: 0.3155728876590729, mean loss: 0.3443447840883747
Epoch: 39, step: 198, loss: 0.3397388756275177, mean loss: 0.34434470258950783
Epoch: 39, step: 199, loss: 0.304671972990036, mean loss: 0.34434400061609144
Epoch: 39, step: 200, loss: 0.32440322637557983, mean loss: 0.3443436477881947
Epoch: 39, step: 201, loss: 0.3099891245365143, mean loss: 0.344343039937187
Epoch: 39, step: 202, loss: 0.3195977210998535, mean loss: 0.3443426021141746
Epoch: 39, step: 203, loss: 0.35669973492622375, mean loss: 0.3443428207470977
Epoch: 39, step: 204, loss: 0.32958731055259705, mean loss: 0.3443425596846573
Epoch: 39, step: 205, loss: 0.326433390378952, mean loss: 0.3443422428315859
Epoch: 39, step: 206, loss: 0.28546833992004395, mean loss: 0.34434120123961603
Epoch: 39, step: 207, loss: 0.3032841086387634, mean loss: 0.3443404748739554
Epoch: 39, step: 208, loss: 0.3412591516971588, mean loss: 0.3443404203613826
Epoch: 39, step: 209, loss: 0.38208910822868347, mean loss: 0.3443410881724407
Epoch: 39, step: 210, loss: 0.37463125586509705, mean loss: 0.344341624025532
Epoch: 39, step: 211, loss: 0.3160776197910309, mean loss: 0.3443411240254571
Epoch: 39, step: 212, loss: 0.31713470816612244, mean loss: 0.3443406427430028
Epoch: 39, step: 213, loss: 0.3499343693256378, mean loss: 0.3443407416944725
Epoch: 39, step: 214, loss: 0.31098470091819763, mean loss: 0.3443401516458129
Epoch: 39, step: 215, loss: 0.3205495774745941, mean loss: 0.344339730812052
Epoch: 39, step: 216, loss: 0.3349074721336365, mean loss: 0.34433956396686993
Epoch: 39, step: 217, loss: 0.33164840936660767, mean loss: 0.3443393394797542
Epoch: 39, step: 218, loss: 0.30721473693847656, mean loss: 0.344338682813927
Epoch: 39, step: 219, loss: 0.32740119099617004, mean loss: 0.3443383832261985
Epoch: 39, step: 220, loss: 0.3211555480957031, mean loss: 0.3443379731790589
Epoch: 39, step: 221, loss: 0.3093172609806061, mean loss: 0.34433735376004515
Epoch: 39, step: 222, loss: 0.3392970561981201, mean loss: 0.34433726461277403
Epoch: 39, step: 223, loss: 0.34548017382621765, mean loss: 0.34433728482694476
Epoch: 39, step: 224, loss: 0.3551710247993469, mean loss: 0.3443374764355115
Epoch: 39, step: 225, loss: 0.32999157905578613, mean loss: 0.3443372227144302
Epoch: 39, step: 226, loss: 0.36748355627059937, mean loss: 0.3443376320725038
Epoch: 39, step: 227, loss: 0.332026869058609, mean loss: 0.3443374143524448
Epoch: 39, step: 228, loss: 0.3190348744392395, mean loss: 0.3443369668762769
Epoch: 39, step: 229, loss: 0.3584854006767273, mean loss: 0.3443372170873228
Epoch: 39, step: 230, loss: 0.3590945303440094, mean loss: 0.3443374780616142
Epoch: 39, step: 231, loss: 0.3597358167171478, mean loss: 0.34433775036724223
Epoch: 39, step: 232, loss: 0.3412390947341919, mean loss: 0.34433769557130184
Epoch: 39, step: 233, loss: 0.32647550106048584, mean loss: 0.34433737970579326
Epoch: 39, step: 234, loss: 0.32487136125564575, mean loss: 0.34433703548520567
Epoch: 39, step: 235, loss: 0.30155056715011597, mean loss: 0.3443362788989075
Epoch: 39, step: 236, loss: 0.31001755595207214, mean loss: 0.3443356720571317
Epoch: 39, step: 237, loss: 0.3334910273551941, mean loss: 0.34433548029979005
Epoch: 39, step: 238, loss: 0.32965996861457825, mean loss: 0.34433522080882223
Epoch: 39, step: 239, loss: 0.3635430634021759, mean loss: 0.34433556043401836
Epoch: 39, step: 240, loss: 0.3277931809425354, mean loss: 0.34433526794361946
Epoch: 39, step: 241, loss: 0.3352160155773163, mean loss: 0.3443351067064405
Epoch: 39, step: 242, loss: 0.327588826417923, mean loss: 0.3443348106212854
Epoch: 39, step: 243, loss: 0.26952865719795227, mean loss: 0.344333488023099
Epoch: 39, step: 244, loss: 0.32437896728515625, mean loss: 0.3443331352266361
Epoch: 39, step: 245, loss: 0.2998814284801483, mean loss: 0.34433234933316087
Epoch: 39, step: 246, loss: 0.35523298382759094, mean loss: 0.3443325420498572
Epoch: 39, step: 247, loss: 0.3441297113895416, mean loss: 0.34433253846399586
Epoch: 39, step: 248, loss: 0.3237450420856476, mean loss: 0.34433217450224607
Epoch: 39, step: 249, loss: 0.2825285494327545, mean loss: 0.34433108190907935
Epoch: 39, step: 250, loss: 0.3459818959236145, mean loss: 0.3443311110924197
Epoch: 39, step: 251, loss: 0.3154396116733551, mean loss: 0.3443306003531427
Epoch: 39, step: 252, loss: 0.3562890887260437, mean loss: 0.34433081174963853
Epoch: 39, step: 253, loss: 0.35406893491744995, mean loss: 0.3443309838925264
Epoch: 39, step: 254, loss: 0.3957644999027252, mean loss: 0.3443318930777275
Epoch: 39, step: 255, loss: 0.29920169711112976, mean loss: 0.3443310953297962
Epoch: 39, step: 256, loss: 0.3621462881565094, mean loss: 0.34433141023607355
Epoch: 39, step: 257, loss: 0.2946241497993469, mean loss: 0.3443305316123164
Epoch: 39, step: 258, loss: 0.3441998362541199, mean loss: 0.34433052930219077
Epoch: 39, step: 259, loss: 0.33700287342071533, mean loss: 0.3443303997833863
Epoch: 39, step: 260, loss: 0.37138471007347107, mean loss: 0.34433087796904993
Epoch: 39, step: 261, loss: 0.33517277240753174, mean loss: 0.34433071610214827
Epoch: 39, step: 262, loss: 0.30354806780815125, mean loss: 0.34432999529322106
Epoch: 39, step: 263, loss: 0.3342961370944977, mean loss: 0.3443298179539104
Epoch: 39, step: 264, loss: 0.34065675735473633, mean loss: 0.34432975303705493
Epoch: 39, step: 265, loss: 0.30746370553970337, mean loss: 0.3443291014862526
Epoch: 39, step: 266, loss: 0.28546616435050964, mean loss: 0.3443280611925754
Epoch: 39, step: 267, loss: 0.33570265769958496, mean loss: 0.34432790875719627
Epoch: 39, step: 268, loss: 0.29878920316696167, mean loss: 0.34432710397314414
Epoch: 39, step: 269, loss: 0.36513620615005493, mean loss: 0.34432747171608724
Epoch: 39, step: 270, loss: 0.3440276086330414, mean loss: 0.3443274664169358
Epoch: 39, step: 271, loss: 0.3655790388584137, mean loss: 0.3443278419660353
Epoch: 39, step: 272, loss: 0.3711816966533661, mean loss: 0.34432831650799023
Epoch: 39, step: 273, loss: 0.361312597990036, mean loss: 0.34432861663666103
Epoch: 39, step: 274, loss: 0.35146212577819824, mean loss: 0.34432874269043534
Epoch: 39, step: 275, loss: 0.284552663564682, mean loss: 0.34432768642666794
Epoch: 39, step: 276, loss: 0.3660159111022949, mean loss: 0.34432806965824564
Epoch: 39, step: 277, loss: 0.3467869758605957, mean loss: 0.3443281131064239
Epoch: 39, step: 278, loss: 0.34585800766944885, mean loss: 0.3443281401387512
Epoch: 39, step: 279, loss: 0.30590692162513733, mean loss: 0.34432746127065955
Epoch: 39, step: 280, loss: 0.3560013473033905, mean loss: 0.34432766753399563
Epoch: 39, step: 281, loss: 0.29716044664382935, mean loss: 0.34432683416142257
Epoch: 39, step: 282, loss: 0.31160658597946167, mean loss: 0.34432625605495104
Epoch: 39, step: 283, loss: 0.36224305629730225, mean loss: 0.3443265726061921
Epoch: 39, step: 284, loss: 0.3551894426345825, mean loss: 0.3443267645263
Epoch: 39, step: 285, loss: 0.3250728249549866, mean loss: 0.3443264243627091
Epoch: 39, step: 286, loss: 0.32261401414871216, mean loss: 0.34432604077155293
Epoch: 39, step: 287, loss: 0.3160150647163391, mean loss: 0.3443255406129766
Epoch: 39, step: 288, loss: 0.3671209514141083, mean loss: 0.34432594332317534
Epoch: 39, step: 289, loss: 0.33156195282936096, mean loss: 0.34432571783487914
Epoch: 39, step: 290, loss: 0.3749620318412781, mean loss: 0.34432625904557757
Epoch: 39, step: 291, loss: 0.3203740119934082, mean loss: 0.3443258359208063
Epoch: 39, step: 292, loss: 0.31450948119163513, mean loss: 0.3443253092138387
Epoch: 39, step: 293, loss: 0.3693777322769165, mean loss: 0.3443257517579663
Epoch: 39, step: 294, loss: 0.3256179690361023, mean loss: 0.34432542129599386
Epoch: 39, step: 295, loss: 0.30353787541389465, mean loss: 0.3443247008207257
Epoch: 39, step: 296, loss: 0.36339905858039856, mean loss: 0.34432503774612727
Epoch: 39, step: 297, loss: 0.3665946424007416, mean loss: 0.34432543110474273
Epoch: 39, step: 298, loss: 0.32236242294311523, mean loss: 0.34432504316853924
Epoch: 39, step: 299, loss: 0.33439669013023376, mean loss: 0.34432486780551397
Epoch: 39, step: 300, loss: 0.342314749956131, mean loss: 0.344324832301728
Epoch: 39, step: 301, loss: 0.3170487582683563, mean loss: 0.3443243505455015
Epoch: 39, step: 302, loss: 0.3306858241558075, mean loss: 0.3443241096629993
Epoch: 39, step: 303, loss: 0.35566097497940063, mean loss: 0.34432430989022145
Epoch: 39, step: 304, loss: 0.31736868619918823, mean loss: 0.3443238338190872
Epoch: 39, step: 305, loss: 0.31751012802124023, mean loss: 0.34432336026276994
Epoch: 39, step: 306, loss: 0.36554017663002014, mean loss: 0.3443237349659183
Epoch: 39, step: 307, loss: 0.34037914872169495, mean loss: 0.3443236653031208
Epoch: 39, step: 308, loss: 0.3098728358745575, mean loss: 0.3443230568999521
Epoch: 39, step: 309, loss: 0.32454755902290344, mean loss: 0.3443227076699539
Epoch: 39, step: 310, loss: 0.3349069058895111, mean loss: 0.3443225413923517
Epoch: 39, step: 311, loss: 0.3243599236011505, mean loss: 0.3443221888703168
Epoch: 39, step: 312, loss: 0.3110230565071106, mean loss: 0.34432160084770713
Epoch: 39, step: 313, loss: 0.30176904797554016, mean loss: 0.3443208494340947
Epoch: 39, step: 314, loss: 0.3435063362121582, mean loss: 0.34432083505127925
Epoch: 39, step: 315, loss: 0.3154275715351105, mean loss: 0.34432032485804015
Epoch: 39, step: 316, loss: 0.31788939237594604, mean loss: 0.3443198581525419
Epoch: 39, step: 317, loss: 0.32539406418800354, mean loss: 0.3443195239752992
Epoch: 39, step: 318, loss: 0.31120041012763977, mean loss: 0.34431893919355916
Epoch: 39, step: 319, loss: 0.3292568027973175, mean loss: 0.34431867324722826
Epoch: 39, step: 320, loss: 0.35722222924232483, mean loss: 0.3443189010763152
Epoch: 39, step: 321, loss: 0.30000996589660645, mean loss: 0.3443181187581687
Epoch: 39, step: 322, loss: 0.32467490434646606, mean loss: 0.3443177719438815
Epoch: 39, step: 323, loss: 0.32971182465553284, mean loss: 0.34431751407051836
Epoch: 39, step: 324, loss: 0.32671859860420227, mean loss: 0.3443172033606886
Epoch: 39, step: 325, loss: 0.3986806869506836, mean loss: 0.3443181631340651
Epoch: 39, step: 326, loss: 0.3366664946079254, mean loss: 0.34431802804820233
Epoch: 39, step: 327, loss: 0.3388890027999878, mean loss: 0.34431793220353657
Epoch: 39, step: 328, loss: 0.349235475063324, mean loss: 0.344318019016898
Epoch: 39, step: 329, loss: 0.33185654878616333, mean loss: 0.34431779902836873
Epoch: 39, step: 330, loss: 0.3042152225971222, mean loss: 0.34431709109014724
Epoch: 39, step: 331, loss: 0.3768444359302521, mean loss: 0.3443176652912636
Epoch: 39, step: 332, loss: 0.35023069381713867, mean loss: 0.34431776967136785
Epoch: 39, step: 333, loss: 0.3403799831867218, mean loss: 0.3443177001605738
Epoch: 39, step: 334, loss: 0.30690738558769226, mean loss: 0.3443170397959805
Epoch: 39, step: 335, loss: 0.40252143144607544, mean loss: 0.3443180671982196
Epoch: 39, step: 336, loss: 0.35191163420677185, mean loss: 0.3443182012346697
Epoch: 39, step: 337, loss: 0.3902585208415985, mean loss: 0.3443190121274506
Epoch: 39, step: 338, loss: 0.32336947321891785, mean loss: 0.34431864235357523
Epoch: 39, step: 339, loss: 0.3505970537662506, mean loss: 0.3443187531699303
Epoch: 39, step: 340, loss: 0.33955657482147217, mean loss: 0.3443186691171505
Epoch: 39, step: 341, loss: 0.3252002000808716, mean loss: 0.34431833168079484
Epoch: 39, step: 342, loss: 0.3001319169998169, mean loss: 0.3443175518150245
Epoch: 39, step: 343, loss: 0.34852179884910583, mean loss: 0.3443176260163488
Epoch: 39, step: 344, loss: 0.3087420165538788, mean loss: 0.34431699814868916
Epoch: 39, step: 345, loss: 0.3013622760772705, mean loss: 0.3443162400617513
Epoch: 39, step: 346, loss: 0.32743510603904724, mean loss: 0.3443159421401089
Epoch: 39, step: 347, loss: 0.28930842876434326, mean loss: 0.3443149713736015
Epoch: 39, step: 348, loss: 0.38391396403312683, mean loss: 0.34431567019990805
Epoch: 39, step: 349, loss: 0.33959269523620605, mean loss: 0.3443155868523105
Epoch: 39, step: 350, loss: 0.27654680609703064, mean loss: 0.3443143909396849
Epoch: 39, step: 351, loss: 0.3587128221988678, mean loss: 0.3443146450236699
Epoch: 39, step: 352, loss: 0.3256104588508606, mean loss: 0.34431431496338694
Epoch: 39, step: 353, loss: 0.3013146221637726, mean loss: 0.34431355618991244
Epoch: 39, step: 354, loss: 0.3079887330532074, mean loss: 0.3443129152126377
Epoch: 39, step: 355, loss: 0.3388522267341614, mean loss: 0.3443128188566157
Epoch: 39, step: 356, loss: 0.33400824666023254, mean loss: 0.34431263703154563
Epoch: 39, step: 357, loss: 0.39008405804634094, mean loss: 0.34431344465798835
Epoch: 39, step: 358, loss: 0.3046305179595947, mean loss: 0.34431274447401483
Epoch: 39, step: 359, loss: 0.31307101249694824, mean loss: 0.34431219324012435
Epoch: 39, step: 360, loss: 0.3144671320915222, mean loss: 0.34431166665859836
Epoch: 39, step: 361, loss: 0.29863011837005615, mean loss: 0.3443108606748253
Epoch: 39, step: 362, loss: 0.3173448145389557, mean loss: 0.34431038490697236
Epoch: 39, step: 363, loss: 0.34129923582077026, mean loss: 0.3443103317815474
Epoch: 39, step: 364, loss: 0.3454916179180145, mean loss: 0.3443103526225018
Epoch: 39, step: 365, loss: 0.3101702332496643, mean loss: 0.34430975031278493
Epoch: 39, step: 366, loss: 0.29536256194114685, mean loss: 0.3443088867877709
Epoch: 39, step: 367, loss: 0.29793426394462585, mean loss: 0.3443080686623238
Epoch: 39, step: 368, loss: 0.3477378487586975, mean loss: 0.3443081291682794
Epoch: 39, step: 369, loss: 0.39169660210609436, mean loss: 0.3443089651502315
Epoch: 39, step: 370, loss: 0.3088580071926117, mean loss: 0.34430833976949243
Epoch: 39, step: 371, loss: 0.3057668209075928, mean loss: 0.34430765988099993
Epoch: 39, step: 372, loss: 0.30239158868789673, mean loss: 0.3443069204770381
Epoch: 39, step: 373, loss: 0.3436723053455353, mean loss: 0.344306909282557
Epoch: 39, step: 374, loss: 0.29737111926078796, mean loss: 0.3443060813594295
Epoch: 39, step: 375, loss: 0.3494251072406769, mean loss: 0.34430617165481303
Epoch: 39, step: 376, loss: 0.34633389115333557, mean loss: 0.34430620742147733
Epoch: 39, step: 377, loss: 0.30670270323753357, mean loss: 0.3443055441501579
Epoch: 39, step: 378, loss: 0.3184128403663635, mean loss: 0.344305087448442
Epoch: 39, step: 379, loss: 0.3346158266067505, mean loss: 0.3443049165499511
Epoch: 39, step: 380, loss: 0.32582539319992065, mean loss: 0.3443045906151865
Epoch: 39, step: 381, loss: 0.3360188901424408, mean loss: 0.3443044444777483
Epoch: 39, step: 382, loss: 0.31357860565185547, mean loss: 0.3443039025662714
Epoch: 39, step: 383, loss: 0.3892858326435089, mean loss: 0.34430469589837154
Epoch: 39, step: 384, loss: 0.336519718170166, mean loss: 0.3443045585995985
Epoch: 39, step: 385, loss: 0.3426910936832428, mean loss: 0.34430453014443085
Epoch: 39, step: 386, loss: 0.3571251928806305, mean loss: 0.344304756246449
Epoch: 39, step: 387, loss: 0.2879056930541992, mean loss: 0.34430376162414383
Epoch: 39, step: 388, loss: 0.3257025182247162, mean loss: 0.3443034335888136
Epoch: 39, step: 389, loss: 0.2962091267108917, mean loss: 0.3443025854544561
Epoch: 39, step: 390, loss: 0.335234135389328, mean loss: 0.34430242553680807
Epoch: 39, step: 391, loss: 0.34223800897598267, mean loss: 0.34430238913248135
Epoch: 39, step: 392, loss: 0.33015215396881104, mean loss: 0.34430213960885786
Epoch: 39, step: 393, loss: 0.31609535217285156, mean loss: 0.34430164222237514
Epoch: 39, step: 394, loss: 0.35273221135139465, mean loss: 0.3443017908808211
Epoch: 39, step: 395, loss: 0.34818580746650696, mean loss: 0.3443018593675009
Epoch: 39, step: 396, loss: 0.33661115169525146, mean loss: 0.3443017237600093
Epoch: 39, step: 397, loss: 0.360081285238266, mean loss: 0.34430200199045463
Epoch: 39, step: 398, loss: 0.3369128704071045, mean loss: 0.34430187170514065
Epoch: 39, step: 399, loss: 0.3377324640750885, mean loss: 0.3443017558752579
Epoch: 39, step: 400, loss: 0.31061041355133057, mean loss: 0.3443011618497925
Epoch: 39, step: 401, loss: 0.33146196603775024, mean loss: 0.3443009354808124
Epoch: 39, step: 402, loss: 0.3383283019065857, mean loss: 0.34430083017864604
Epoch: 39, step: 403, loss: 0.28976696729660034, mean loss: 0.34429986872126095
Epoch: 39, step: 404, loss: 0.3615025281906128, mean loss: 0.3443001720068072
Epoch: 39, step: 405, loss: 0.3284759521484375, mean loss: 0.34429989302828284
Epoch: 39, step: 406, loss: 0.32575511932373047, mean loss: 0.34429956609258294
Epoch: 39, step: 407, loss: 0.3044496774673462, mean loss: 0.34429886357004175
Epoch: 39, step: 408, loss: 0.3242168426513672, mean loss: 0.34429850954587393
Epoch: 39, step: 409, loss: 0.3315149247646332, mean loss: 0.34429828418916303
Epoch: 39, step: 410, loss: 0.334247350692749, mean loss: 0.3442981070083938
Epoch: 39, step: 411, loss: 0.36073294281959534, mean loss: 0.34429839672133644
Epoch: 39, step: 412, loss: 0.3490923345088959, mean loss: 0.344298481227282
Epoch: 39, step: 413, loss: 0.3365943431854248, mean loss: 0.3442983454236853
Epoch: 39, step: 414, loss: 0.34557196497917175, mean loss: 0.344298367873837
Epoch: 39, step: 415, loss: 0.3134313225746155, mean loss: 0.3442978237885712
Epoch: 39, step: 416, loss: 0.32971903681755066, mean loss: 0.34429756681666823
Epoch: 39, step: 417, loss: 0.33241915702819824, mean loss: 0.34429735744645307
Epoch: 39, step: 418, loss: 0.2778327465057373, mean loss: 0.3442961859542359
Epoch: 39, step: 419, loss: 0.3412097096443176, mean loss: 0.3442961315535677
Epoch: 39, step: 420, loss: 0.34596243500709534, mean loss: 0.3442961609224708
Epoch: 39, step: 421, loss: 0.3382130265235901, mean loss: 0.3442960537080043
Epoch: 39, step: 422, loss: 0.30628371238708496, mean loss: 0.3442953837571536
Epoch: 39, step: 423, loss: 0.33870089054107666, mean loss: 0.3442952851584011
Epoch: 39, step: 424, loss: 0.31248176097869873, mean loss: 0.34429472447874826
Epoch: 39, step: 425, loss: 0.330924928188324, mean loss: 0.34429448885440844
Epoch: 39, step: 426, loss: 0.2961430847644806, mean loss: 0.3442936402668454
Epoch: 39, step: 427, loss: 0.34553369879722595, mean loss: 0.3442936621204075
Epoch: 39, step: 428, loss: 0.34440672397613525, mean loss: 0.34429366411286244
Epoch: 39, step: 429, loss: 0.3645278215408325, mean loss: 0.34429402068702497
Epoch: 39, step: 430, loss: 0.3186657428741455, mean loss: 0.3442935690635416
Epoch: 39, step: 431, loss: 0.31074610352516174, mean loss: 0.34429297789794033
Epoch: 39, step: 432, loss: 0.3793337643146515, mean loss: 0.34429359536761234
Epoch: 39, step: 433, loss: 0.32143527269363403, mean loss: 0.34429319257778546
Epoch: 39, step: 434, loss: 0.3486519753932953, mean loss: 0.3442932693831777
Epoch: 39, step: 435, loss: 0.3400682508945465, mean loss: 0.3442931949361364
Epoch: 39, step: 436, loss: 0.37416911125183105, mean loss: 0.34429372135617264
Epoch: 39, step: 437, loss: 0.3363748788833618, mean loss: 0.34429358182693287
Epoch: 39, step: 438, loss: 0.2980303466320038, mean loss: 0.3442927666875585
Epoch: 39, step: 439, loss: 0.3521170914173126, mean loss: 0.3442929045465466
Epoch: 39, step: 440, loss: 0.34398892521858215, mean loss: 0.3442928991907433
Epoch: 39, step: 441, loss: 0.32456174492836, mean loss: 0.3442925515542117
Epoch: 39, step: 442, loss: 0.3267962634563446, mean loss: 0.344292243298462
Epoch: 39, step: 443, loss: 0.30094146728515625, mean loss: 0.34429147954271827
Epoch: 39, step: 444, loss: 0.3098345696926117, mean loss: 0.3442908724901672
Epoch: 39, step: 445, loss: 0.338281512260437, mean loss: 0.3442907666207435
Epoch: 39, step: 446, loss: 0.35825780034065247, mean loss: 0.34429101267950923
Epoch: 39, step: 447, loss: 0.296228289604187, mean loss: 0.34429016596815915
Epoch: 39, step: 448, loss: 0.301848828792572, mean loss: 0.3442894183008082
Epoch: 39, step: 449, loss: 0.31430575251579285, mean loss: 0.34428889010319375
Epoch: 39, step: 450, loss: 0.3929533362388611, mean loss: 0.3442897473696714
Epoch: 39, step: 451, loss: 0.37019863724708557, mean loss: 0.3442902037692253
Epoch: 39, step: 452, loss: 0.3356429934501648, mean loss: 0.3442900514464731
Epoch: 39, step: 453, loss: 0.3154096007347107, mean loss: 0.3442895427191398
Epoch: 39, step: 454, loss: 0.36369118094444275, mean loss: 0.34428988447176395
Epoch: 39, step: 455, loss: 0.3388214409351349, mean loss: 0.34428978814886646
Epoch: 39, step: 456, loss: 0.31689003109931946, mean loss: 0.3442893055293634
Epoch: 39, step: 457, loss: 0.3051965534687042, mean loss: 0.34428861696149676
Epoch: 39, step: 458, loss: 0.3517351746559143, mean loss: 0.3442887481205931
Epoch: 39, step: 459, loss: 0.33242207765579224, mean loss: 0.344288539112025
Epoch: 39, step: 460, loss: 0.3435060977935791, mean loss: 0.34428852533106935
Epoch: 39, step: 461, loss: 0.31949377059936523, mean loss: 0.3442880886345543
Epoch: 39, step: 462, loss: 0.2972586452960968, mean loss: 0.34428726034516316
Epoch: 39, step: 463, loss: 0.37444257736206055, mean loss: 0.3442877914356355
Epoch: 39, step: 464, loss: 0.3147216737270355, mean loss: 0.34428727073121485
Epoch: 39, step: 465, loss: 0.35015279054641724, mean loss: 0.34428737403014437
Epoch: 39, step: 466, loss: 0.36540353298187256, mean loss: 0.3442877459048067
Epoch: 39, step: 467, loss: 0.3558262288570404, mean loss: 0.3442879491043515
Epoch: 39, step: 468, loss: 0.2994813919067383, mean loss: 0.344287160048136
Epoch: 39, step: 469, loss: 0.30082935094833374, mean loss: 0.34428639475723505
Epoch: 39, step: 470, loss: 0.3188532292842865, mean loss: 0.34428594688773195
Epoch: 39, step: 471, loss: 0.30410200357437134, mean loss: 0.3442852392744455
Epoch: 39, step: 472, loss: 0.3246029317378998, mean loss: 0.34428489268782597
Epoch: 39, step: 473, loss: 0.3349723815917969, mean loss: 0.34428472870629584
Epoch: 39, step: 474, loss: 0.3084248900413513, mean loss: 0.34428409727105674
Epoch: 39, step: 475, loss: 0.3000706434249878, mean loss: 0.3442833187555291
Epoch: 39, step: 476, loss: 0.32805097103118896, mean loss: 0.3442830329395355
Epoch: 39, step: 477, loss: 0.31866151094436646, mean loss: 0.3442825818087471
Epoch: 39, step: 478, loss: 0.3410504162311554, mean loss: 0.3442825248994139
Epoch: 39, step: 479, loss: 0.328094482421875, mean loss: 0.3442822398785942
Epoch: 39, step: 480, loss: 0.2903214395046234, mean loss: 0.34428128981432365
Epoch: 39, step: 481, loss: 0.33678632974624634, mean loss: 0.34428115785615493
Epoch: 39, step: 482, loss: 0.32394853234291077, mean loss: 0.3442807998810935
Epoch: 39, step: 483, loss: 0.3330143690109253, mean loss: 0.3442806015284373
Epoch: 39, step: 484, loss: 0.3090013861656189, mean loss: 0.34427998042642566
Epoch: 39, step: 485, loss: 0.3417636454105377, mean loss: 0.3442799361263127
Epoch: 39, step: 486, loss: 0.32107558846473694, mean loss: 0.3442795276206411
Epoch: 39, step: 487, loss: 0.3143479526042938, mean loss: 0.3442790006933998
Epoch: 39, step: 488, loss: 0.32577770948410034, mean loss: 0.3442786749951125
Epoch: 39, step: 489, loss: 0.3253861367702484, mean loss: 0.3442783424151346
Epoch: 39, step: 490, loss: 0.32473477721214294, mean loss: 0.34427799838068107
Epoch: 39, step: 491, loss: 0.34846043586730957, mean loss: 0.3442780720047743
Epoch: 39, step: 492, loss: 0.35241422057151794, mean loss: 0.3442782152241333
Epoch: 39, step: 493, loss: 0.3525330424308777, mean loss: 0.3442783605300162
Epoch: 39, step: 494, loss: 0.3213485777378082, mean loss: 0.3442779569148221
Epoch: 39, step: 495, loss: 0.3399008810520172, mean loss: 0.34427787986990444
Epoch: 39, step: 496, loss: 0.3150215744972229, mean loss: 0.3442773649119657
Epoch: 39, step: 497, loss: 0.31262508034706116, mean loss: 0.34427680779075326
Epoch: 39, step: 498, loss: 0.36007317900657654, mean loss: 0.3442770858224564
Epoch: 39, step: 499, loss: 0.33222854137420654, mean loss: 0.34427687375993093
Epoch: 39, step: 500, loss: 0.3238478899002075, mean loss: 0.3442765142023362
Epoch: 39, step: 501, loss: 0.31656771898269653, mean loss: 0.3442760265259798
Epoch: 39, step: 502, loss: 0.3185569643974304, mean loss: 0.34427557387700447
Epoch: 39, step: 503, loss: 0.3456208109855652, mean loss: 0.34427559755242
Epoch: 39, step: 504, loss: 0.31034842133522034, mean loss: 0.34427500046373416
Epoch: 39, step: 505, loss: 0.33958038687705994, mean loss: 0.3442749178440871
Epoch: 39, step: 506, loss: 0.32959264516830444, mean loss: 0.3442746594579991
Epoch: 39, step: 507, loss: 0.3825206160545349, mean loss: 0.34427533251791387
Epoch: 39, step: 508, loss: 0.3699914515018463, mean loss: 0.34427578506730205
Epoch: 39, step: 509, loss: 0.35294437408447266, mean loss: 0.3442759376134784
Epoch: 39, step: 510, loss: 0.3414292335510254, mean loss: 0.3442758875192615
Epoch: 39, step: 511, loss: 0.3996961712837219, mean loss: 0.3442768627477363
Epoch: 39, step: 512, loss: 0.34956657886505127, mean loss: 0.3442769558290173
Epoch: 39, step: 513, loss: 0.31839627027511597, mean loss: 0.34427650042367586
Epoch: 39, step: 514, loss: 0.32439282536506653, mean loss: 0.34427615054992633
Epoch: 39, step: 515, loss: 0.3419954180717468, mean loss: 0.3442761104187946
Epoch: 39, step: 516, loss: 0.34623977541923523, mean loss: 0.3442761449702876
Epoch: 39, step: 517, loss: 0.3216317594051361, mean loss: 0.34427574654002463
Epoch: 39, step: 518, loss: 0.3498709201812744, mean loss: 0.3442758449859407
Epoch: 39, step: 519, loss: 0.30454838275909424, mean loss: 0.3442751460018069
Epoch: 39, step: 520, loss: 0.3085053265094757, mean loss: 0.3442745166614214
Epoch: 39, step: 521, loss: 0.4170404374599457, mean loss: 0.3442757968950819
Epoch: 39, step: 522, loss: 0.3506264090538025, mean loss: 0.3442759086249181
Epoch: 39, step: 523, loss: 0.3941849172115326, mean loss: 0.34427678668629363
Epoch: 39, step: 524, loss: 0.3459474742412567, mean loss: 0.3442768160785907
Epoch: 39, step: 525, loss: 0.32194527983665466, mean loss: 0.3442764232082441
Epoch: 39, step: 526, loss: 0.34310832619667053, mean loss: 0.34427640265871273
Epoch: 39, step: 527, loss: 0.3672747015953064, mean loss: 0.34427680724493004
Epoch: 39, step: 528, loss: 0.3044549524784088, mean loss: 0.34427610671093817
Epoch: 39, step: 529, loss: 0.3164982199668884, mean loss: 0.3442756180593753
Epoch: 39, step: 530, loss: 0.35992515087127686, mean loss: 0.3442758933515246
Epoch: 39, step: 531, loss: 0.3063170313835144, mean loss: 0.34427522562597634
Epoch: 39, step: 532, loss: 0.34189116954803467, mean loss: 0.3442751836893358
Epoch: 39, step: 533, loss: 0.3434998393058777, mean loss: 0.3442751700509122
Epoch: 39, step: 534, loss: 0.3370571732521057, mean loss: 0.34427504308750256
Epoch: 39, step: 535, loss: 0.34927892684936523, mean loss: 0.3442751311034697
Epoch: 39, step: 536, loss: 0.40429842472076416, mean loss: 0.34427618686646577
Epoch: 39, step: 537, loss: 0.3236006200313568, mean loss: 0.3442758232057412
Epoch: 39, step: 538, loss: 0.3796848952770233, mean loss: 0.34427644600183777
Epoch: 39, step: 539, loss: 0.33051759004592896, mean loss: 0.3442762040070447
Epoch: 39, step: 540, loss: 0.34928351640701294, mean loss: 0.3442762920755745
Epoch: 39, step: 541, loss: 0.377361923456192, mean loss: 0.3442768739748917
Epoch: 39, step: 542, loss: 0.31003037095069885, mean loss: 0.34427627166913494
Epoch: 39, step: 543, loss: 0.30320802330970764, mean loss: 0.34427554939955424
Epoch: 39, step: 544, loss: 0.32394224405288696, mean loss: 0.344275191802865
Epoch: 39, step: 545, loss: 0.35943323373794556, mean loss: 0.3442754583788197
Epoch: 39, step: 546, loss: 0.316724956035614, mean loss: 0.3442749738721573
Epoch: 39, step: 547, loss: 0.35980260372161865, mean loss: 0.34427524693824213
Epoch: 39, step: 548, loss: 0.3773263394832611, mean loss: 0.3442758281585454
Epoch: 39, step: 549, loss: 0.30903515219688416, mean loss: 0.34427520844420006
Epoch: 39, step: 550, loss: 0.322598934173584, mean loss: 0.3442748272692784
Epoch: 39, step: 551, loss: 0.4152772128582001, mean loss: 0.3442760758165385
Epoch: 39, step: 552, loss: 0.3118361830711365, mean loss: 0.3442755053846205
Epoch: 39, step: 553, loss: 0.3311176598072052, mean loss: 0.3442752740175451
Epoch: 39, step: 554, loss: 0.32055899500846863, mean loss: 0.34427485699869526
Epoch: 39, step: 555, loss: 0.2911277413368225, mean loss: 0.34427392249462185
Epoch: 39, step: 556, loss: 0.3456747829914093, mean loss: 0.34427394712600223
Epoch: 39, step: 557, loss: 0.3612675368785858, mean loss: 0.344274245919647
Epoch: 39, step: 558, loss: 0.3271721303462982, mean loss: 0.34427394522310945
Epoch: 39, step: 559, loss: 0.3547106087207794, mean loss: 0.34427412872165886
Epoch: 39, step: 560, loss: 0.33727532625198364, mean loss: 0.34427400567011834
Epoch: 39, step: 561, loss: 0.33660179376602173, mean loss: 0.34427387078119986
Epoch: 39, step: 562, loss: 0.36203762888908386, mean loss: 0.3442741830890482
Epoch: 39, step: 563, loss: 0.30066365003585815, mean loss: 0.34427341637784825
Epoch: 39, step: 564, loss: 0.3151766359806061, mean loss: 0.34427290484006945
Epoch: 39, step: 565, loss: 0.3299526572227478, mean loss: 0.34427265308648103
Epoch: 39, step: 566, loss: 0.33180469274520874, mean loss: 0.3442724339004265
Epoch: 39, step: 567, loss: 0.3266671895980835, mean loss: 0.3442721244066444
Epoch: 39, step: 568, loss: 0.3475923240184784, mean loss: 0.3442721827735181
Epoch: 39, step: 569, loss: 0.34948843717575073, mean loss: 0.3442722744701465
Epoch: 39, step: 570, loss: 0.34913334250450134, mean loss: 0.34427235992144534
Epoch: 39, step: 571, loss: 0.3777797222137451, mean loss: 0.34427294892725135
Epoch: 39, step: 572, loss: 0.3761860132217407, mean loss: 0.344273509897989
Epoch: 39, step: 573, loss: 0.33158817887306213, mean loss: 0.3442732869180096
Epoch: 39, step: 574, loss: 0.34439951181411743, mean loss: 0.3442732891367243
Epoch: 39, step: 575, loss: 0.3047706186771393, mean loss: 0.3442725947918171
Epoch: 39, step: 576, loss: 0.3166082501411438, mean loss: 0.3442721085396481
Epoch: 39, step: 577, loss: 0.3253239393234253, mean loss: 0.34427177549628296
Epoch: 39, step: 578, loss: 0.3301159739494324, mean loss: 0.34427152669056105
Epoch: 39, step: 579, loss: 0.32454726099967957, mean loss: 0.3442711800182872
Epoch: 39, step: 580, loss: 0.34535348415374756, mean loss: 0.34427119904045245
Epoch: 39, step: 581, loss: 0.31588879227638245, mean loss: 0.3442707002108492
Epoch: 39, step: 582, loss: 0.3360147476196289, mean loss: 0.34427055511247157
Epoch: 39, step: 583, loss: 0.3785346448421478, mean loss: 0.3442711572933104
Epoch: 39, step: 584, loss: 0.33475378155708313, mean loss: 0.3442709900312986
Epoch: 39, step: 585, loss: 0.3547089695930481, mean loss: 0.3442711734691314
Epoch: 39, step: 586, loss: 0.3158531188964844, mean loss: 0.3442706740568935
Epoch: 39, step: 587, loss: 0.3353016972541809, mean loss: 0.34427051644096485
Epoch: 39, step: 588, loss: 0.3343822956085205, mean loss: 0.3442703426737944
Epoch: 39, step: 589, loss: 0.355117529630661, mean loss: 0.34427053328966895
Epoch: 39, step: 590, loss: 0.3150481581687927, mean loss: 0.34427001977858734
Epoch: 39, step: 591, loss: 0.32538625597953796, mean loss: 0.34426968794890084
Epoch: 39, step: 592, loss: 0.3110639750957489, mean loss: 0.3442691044610017
Epoch: 39, step: 593, loss: 0.3480370342731476, mean loss: 0.3442691706695733
Epoch: 39, step: 594, loss: 0.3322760760784149, mean loss: 0.3442689599353639
Epoch: 39, step: 595, loss: 0.31098848581314087, mean loss: 0.34426837516459285
Epoch: 39, step: 596, loss: 0.32616838812828064, mean loss: 0.34426805713554787
Epoch: 39, step: 597, loss: 0.33002081513404846, mean loss: 0.34426780680624397
Epoch: 39, step: 598, loss: 0.3323034644126892, mean loss: 0.3442675965920229
Epoch: 39, step: 599, loss: 0.4199521541595459, mean loss: 0.34426892635092315
Epoch: 39, step: 600, loss: 0.31011977791786194, mean loss: 0.3442683263693986
Epoch: 39, step: 601, loss: 0.3303889334201813, mean loss: 0.34426808252047647
Epoch: 39, step: 602, loss: 0.35135847330093384, mean loss: 0.34426820709031747
Epoch: 39, step: 603, loss: 0.3409014940261841, mean loss: 0.34426814794216104
Epoch: 39, step: 604, loss: 0.30934756994247437, mean loss: 0.34426753445016334
Epoch: 39, step: 605, loss: 0.3501625657081604, mean loss: 0.3442676380134826
Epoch: 39, step: 606, loss: 0.3089295029640198, mean loss: 0.34426701720756847
Epoch: 39, step: 607, loss: 0.32967501878738403, mean loss: 0.34426676086580715
Epoch: 39, step: 608, loss: 0.3114262819290161, mean loss: 0.3442661839579646
Epoch: 39, step: 609, loss: 0.3335837423801422, mean loss: 0.34426599630308674
Epoch: 39, step: 610, loss: 0.3185551166534424, mean loss: 0.34426554465659825
Epoch: 39, step: 611, loss: 0.3244923949241638, mean loss: 0.3442651973204942
Epoch: 39, step: 612, loss: 0.3595517575740814, mean loss: 0.34426546584023376
Epoch: 39, step: 613, loss: 0.29768162965774536, mean loss: 0.3442646475750628
Epoch: 39, step: 614, loss: 0.37113437056541443, mean loss: 0.34426511954504385
Epoch: 39, step: 615, loss: 0.3581254780292511, mean loss: 0.34426536299966487
Epoch: 39, step: 616, loss: 0.31409594416618347, mean loss: 0.3442648330887374
Epoch: 39, step: 617, loss: 0.3291435241699219, mean loss: 0.34426456749508655
Epoch: 39, step: 618, loss: 0.2937762439250946, mean loss: 0.3442636807237935
Epoch: 39, step: 619, loss: 0.3189809024333954, mean loss: 0.3442632366676903
Epoch: 39, step: 620, loss: 0.33534204959869385, mean loss: 0.3442630799824581
Epoch: 39, step: 621, loss: 0.35896989703178406, mean loss: 0.3442633382777451
Epoch: 39, step: 622, loss: 0.33958402276039124, mean loss: 0.34426325609654207
Epoch: 39, step: 623, loss: 0.30000004172325134, mean loss: 0.3442624787306416
Epoch: 39, step: 624, loss: 0.3252100348472595, mean loss: 0.34426214413090006
Epoch: 39, step: 625, loss: 0.31505563855171204, mean loss: 0.34426163121415004
Epoch: 39, step: 626, loss: 0.3458435535430908, mean loss: 0.34426165899495415
Epoch: 39, step: 627, loss: 0.3402048945426941, mean loss: 0.3442615877536565
Epoch: 39, step: 628, loss: 0.363598495721817, mean loss: 0.3442619273253128
Epoch: 39, step: 629, loss: 0.30969393253326416, mean loss: 0.3442613202941817
Epoch: 39, step: 630, loss: 0.33114227652549744, mean loss: 0.34426108992131277
Epoch: 39, step: 631, loss: 0.31153446435928345, mean loss: 0.34426051524572165
Epoch: 39, step: 632, loss: 0.3001248240470886, mean loss: 0.3442597402419253
Epoch: 39, step: 633, loss: 0.39366626739501953, mean loss: 0.34426060778410533
Epoch: 39, step: 634, loss: 0.3109897971153259, mean loss: 0.34426002358346497
Epoch: 39, step: 635, loss: 0.30867910385131836, mean loss: 0.3442593988306954
Epoch: 39, step: 636, loss: 0.31234511733055115, mean loss: 0.3442588384689673
Epoch: 39, step: 637, loss: 0.34509164094924927, mean loss: 0.34425885309133764
Epoch: 39, step: 638, loss: 0.3373328149318695, mean loss: 0.3442587314858919
Epoch: 39, step: 639, loss: 0.3257211744785309, mean loss: 0.34425840601435237
Epoch: 39, step: 640, loss: 0.310847669839859, mean loss: 0.34425781941856654
Epoch: 39, step: 641, loss: 0.3161720633506775, mean loss: 0.34425732632267014
Epoch: 39, step: 642, loss: 0.34556981921195984, mean loss: 0.3442573493654358
Epoch: 39, step: 643, loss: 0.33052363991737366, mean loss: 0.3442571082539637
Epoch: 39, step: 644, loss: 0.3151233196258545, mean loss: 0.3442565967849125
Epoch: 39, step: 645, loss: 0.2950805425643921, mean loss: 0.34425573347157695
Epoch: 39, step: 646, loss: 0.3555445671081543, mean loss: 0.34425593164993196
Epoch: 39, step: 647, loss: 0.31018269062042236, mean loss: 0.34425533349599213
Epoch: 39, step: 648, loss: 0.3085193932056427, mean loss: 0.3442547061644677
Epoch: 39, step: 649, loss: 0.33456873893737793, mean loss: 0.3442545361337963
Epoch: 39, step: 650, loss: 0.3402010202407837, mean loss: 0.3442544649782871
Epoch: 39, step: 651, loss: 0.3382900357246399, mean loss: 0.34425436028039963
Epoch: 39, step: 652, loss: 0.3476872146129608, mean loss: 0.34425442053868627
Epoch: 39, step: 653, loss: 0.3574037551879883, mean loss: 0.3442546513502476
Epoch: 39, step: 654, loss: 0.33342719078063965, mean loss: 0.3442544612981058
Epoch: 39, step: 655, loss: 0.29667600989341736, mean loss: 0.34425362617819766
Epoch: 39, step: 656, loss: 0.3313411474227905, mean loss: 0.3442533995361259
Epoch: 39, step: 657, loss: 0.30786454677581787, mean loss: 0.34425276084386697
Epoch: 39, step: 658, loss: 0.34042561054229736, mean loss: 0.34425269367141764
Epoch: 39, step: 659, loss: 0.35315272212028503, mean loss: 0.34425284987803884
Epoch: 39, step: 660, loss: 0.32469677925109863, mean loss: 0.34425250665058515
Epoch: 39, step: 661, loss: 0.31507745385169983, mean loss: 0.34425199460992384
Epoch: 39, step: 662, loss: 0.28210368752479553, mean loss: 0.3442509038869016
Epoch: 39, step: 663, loss: 0.3398292362689972, mean loss: 0.3442508262865573
Epoch: 39, step: 664, loss: 0.34836867451667786, mean loss: 0.3442508985535977
Epoch: 39, step: 665, loss: 0.38675937056541443, mean loss: 0.344251644551843
Epoch: 39, step: 666, loss: 0.34017515182495117, mean loss: 0.3442515730130906
Epoch: 39, step: 667, loss: 0.3163790702819824, mean loss: 0.34425108388451536
Epoch: 39, step: 668, loss: 0.32049670815467834, mean loss: 0.3442506670313833
Epoch: 39, step: 669, loss: 0.363413542509079, mean loss: 0.3442510033047746
Epoch: 39, step: 670, loss: 0.3306688666343689, mean loss: 0.34425076496731744
Epoch: 39, step: 671, loss: 0.30945566296577454, mean loss: 0.34425015439839063
Epoch: 39, step: 672, loss: 0.36290791630744934, mean loss: 0.3442504817907279
Epoch: 39, step: 673, loss: 0.2854194939136505, mean loss: 0.3442494494870277
Epoch: 39, step: 674, loss: 0.31475821137428284, mean loss: 0.34424893201517925
Epoch: 39, step: 675, loss: 0.3203881084918976, mean loss: 0.34424851334547957
Epoch: 39, step: 676, loss: 0.3493897318840027, mean loss: 0.3442486035533742
Epoch: 39, step: 677, loss: 0.29960641264915466, mean loss: 0.34424782027459216
Epoch: 39, step: 678, loss: 0.3468303382396698, mean loss: 0.34424786558589954
Epoch: 39, step: 679, loss: 0.3417043089866638, mean loss: 0.34424782095896783
Epoch: 39, step: 680, loss: 0.3061559200286865, mean loss: 0.3442471526448297
Epoch: 39, step: 681, loss: 0.31906846165657043, mean loss: 0.3442467108979089
Epoch: 39, step: 682, loss: 0.38362494111061096, mean loss: 0.34424740175617335
Epoch: 39, step: 683, loss: 0.38573676347732544, mean loss: 0.3442481296397123
Epoch: 39, step: 684, loss: 0.30092158913612366, mean loss: 0.3442473695383017
Epoch: 39, step: 685, loss: 0.3914124369621277, mean loss: 0.34424819696659237
Epoch: 39, step: 686, loss: 0.30931830406188965, mean loss: 0.3442475841937049
Epoch: 39, step: 687, loss: 0.31440410017967224, mean loss: 0.34424706066054905
Epoch: 39, step: 688, loss: 0.35834333300590515, mean loss: 0.3442473079418813
Epoch: 39, step: 689, loss: 0.339364618062973, mean loss: 0.34424722228967136
Epoch: 39, step: 690, loss: 0.3289296627044678, mean loss: 0.3442469535935536
Epoch: 39, step: 691, loss: 0.33024075627326965, mean loss: 0.3442467079052762
Epoch: 39, step: 692, loss: 0.3333396017551422, mean loss: 0.3442465165827455
Epoch: 39, step: 693, loss: 0.3146655857563019, mean loss: 0.3442459977100771
Epoch: 39, step: 694, loss: 0.301548570394516, mean loss: 0.34424524877693585
Epoch: 39, step: 695, loss: 0.3422923982143402, mean loss: 0.3442452145236109
Epoch: 39, step: 696, loss: 0.3603692948818207, mean loss: 0.3442454973377122
Epoch: 39, step: 697, loss: 0.35447901487350464, mean loss: 0.34424567682902196
Epoch: 39, step: 698, loss: 0.32505351305007935, mean loss: 0.3442453402129774
Epoch: 39, step: 699, loss: 0.2900305986404419, mean loss: 0.3442443893440709
Epoch: 39, step: 700, loss: 0.31064608693122864, mean loss: 0.3442438000759156
Epoch: 39, step: 701, loss: 0.35403046011924744, mean loss: 0.3442439717175032
Epoch: 39, step: 702, loss: 0.3051542341709137, mean loss: 0.34424328616115274
Epoch: 39, step: 703, loss: 0.31743013858795166, mean loss: 0.34424281592005185
Epoch: 39, step: 704, loss: 0.3351883292198181, mean loss: 0.34424265712791036
Epoch: 39, step: 705, loss: 0.3306834101676941, mean loss: 0.34424241933816324
Epoch: 39, step: 706, loss: 0.3203100264072418, mean loss: 0.3442419996409721
Epoch: 39, step: 707, loss: 0.31274935603141785, mean loss: 0.34424144737098733
Epoch: 39, step: 708, loss: 0.3328939378261566, mean loss: 0.34424124837914966
Epoch: 39, step: 709, loss: 0.3791877329349518, mean loss: 0.3442418611958395
Epoch: 39, step: 710, loss: 0.36372750997543335, mean loss: 0.3442422028874729
Epoch: 39, step: 711, loss: 0.32556024193763733, mean loss: 0.3442418752946948
Epoch: 39, step: 712, loss: 0.29653528332710266, mean loss: 0.3442410387625451
Epoch: 39, step: 713, loss: 0.3160420060157776, mean loss: 0.34424054430291423
Epoch: 39, step: 714, loss: 0.2988957464694977, mean loss: 0.3442397492125628
Epoch: 39, step: 715, loss: 0.34660688042640686, mean loss: 0.34423979071787936
Epoch: 39, step: 716, loss: 0.3207809627056122, mean loss: 0.34423937939762594
Epoch: 39, step: 717, loss: 0.37030261754989624, mean loss: 0.3442398363748352
Epoch: 39, step: 718, loss: 0.37973278760910034, mean loss: 0.3442404586760754
Epoch: 39, step: 719, loss: 0.3582977056503296, mean loss: 0.3442407051387827
Epoch: 39, step: 720, loss: 0.33424806594848633, mean loss: 0.34424052994304677
Epoch: 39, step: 721, loss: 0.3186097741127014, mean loss: 0.34424008058023897
Epoch: 39, step: 722, loss: 0.3125513792037964, mean loss: 0.3442395250182309
Epoch: 39, step: 723, loss: 0.31456267833709717, mean loss: 0.3442390047369076
Epoch: 39, step: 724, loss: 0.3183779716491699, mean loss: 0.34423855136068543
Epoch: 39, step: 725, loss: 0.3132186233997345, mean loss: 0.344238007552124
Epoch: 39, step: 726, loss: 0.3040691912174225, mean loss: 0.34423730336727515
Epoch: 39, step: 727, loss: 0.35568803548812866, mean loss: 0.344237504102359
Epoch: 39, step: 728, loss: 0.31647035479545593, mean loss: 0.34423701734367185
Epoch: 39, step: 729, loss: 0.35392844676971436, mean loss: 0.3442371872316469
Epoch: 39, step: 730, loss: 0.35912641882896423, mean loss: 0.3442374482310263
Epoch: 39, step: 731, loss: 0.3219684064388275, mean loss: 0.34423705787480363
Epoch: 39, step: 732, loss: 0.3640269637107849, mean loss: 0.3442374047679277
Epoch: 39, step: 733, loss: 0.3658626079559326, mean loss: 0.3442377838249511
Epoch: 39, step: 734, loss: 0.32283923029899597, mean loss: 0.34423740874732717
Epoch: 39, step: 735, loss: 0.30538225173950195, mean loss: 0.34423672769921304
Epoch: 39, step: 736, loss: 0.35659876465797424, mean loss: 0.3442369443755834
Epoch: 39, step: 737, loss: 0.3230579197406769, mean loss: 0.34423657316542045
Epoch: 39, step: 738, loss: 0.3181445896625519, mean loss: 0.3442361158525907
Epoch: 39, step: 739, loss: 0.3409665524959564, mean loss: 0.34423605854812916
Epoch: 39, step: 740, loss: 0.3333735167980194, mean loss: 0.3442358681676018
Epoch: 39, step: 741, loss: 0.30828535556793213, mean loss: 0.34423523809797796
Epoch: 39, step: 742, loss: 0.33953964710235596, mean loss: 0.34423515580436964
Epoch: 39, step: 743, loss: 0.3719974160194397, mean loss: 0.34423564234941373
Epoch: 39, step: 744, loss: 0.32691097259521484, mean loss: 0.3442353387327622
Epoch: 39, step: 745, loss: 0.32354283332824707, mean loss: 0.34423497610079334
Epoch: 39, step: 746, loss: 0.3981185853481293, mean loss: 0.34423592038359035
Epoch: 39, step: 747, loss: 0.3376191258430481, mean loss: 0.3442358044296695
Epoch: 39, step: 748, loss: 0.32750293612480164, mean loss: 0.3442355112049555
Epoch: 39, step: 749, loss: 0.3612418472766876, mean loss: 0.34423580921666247
Epoch: 39, step: 750, loss: 0.3292703628540039, mean loss: 0.34423554697322295
Epoch: 39, step: 751, loss: 0.3012842833995819, mean loss: 0.3442347943401611
Epoch: 39, step: 752, loss: 0.35048890113830566, mean loss: 0.3442349039286732
Epoch: 39, step: 753, loss: 0.3070682883262634, mean loss: 0.34423425268256136
Epoch: 39, step: 754, loss: 0.2896997034549713, mean loss: 0.34423329712633793
Epoch: 39, step: 755, loss: 0.3269611597061157, mean loss: 0.34423299448866235
Epoch: 39, step: 756, loss: 0.3756953179836273, mean loss: 0.34423354575324444
Epoch: 39, step: 757, loss: 0.34158727526664734, mean loss: 0.34423349938764036
Epoch: 39, step: 758, loss: 0.3283754587173462, mean loss: 0.34423322154198693
Epoch: 39, step: 759, loss: 0.3001399040222168, mean loss: 0.3442324490050621
Epoch: 39, step: 760, loss: 0.34207460284233093, mean loss: 0.34423241119918296
Epoch: 39, step: 761, loss: 0.3546879291534424, mean loss: 0.3442325943786559
Epoch: 39, step: 762, loss: 0.28603628277778625, mean loss: 0.344231574803828
Epoch: 39, step: 763, loss: 0.35729143023490906, mean loss: 0.3442318036029771
Epoch: 39, step: 764, loss: 0.3345406949520111, mean loss: 0.34423163382479083
Epoch: 39, step: 765, loss: 0.3020152151584625, mean loss: 0.34423089424981684
Epoch: 39, step: 766, loss: 0.3322451114654541, mean loss: 0.34423068427867337
Epoch: 39, step: 767, loss: 0.3216095268726349, mean loss: 0.344230288000252
Epoch: 39, step: 768, loss: 0.36458033323287964, mean loss: 0.3442306444869864
Epoch: 39, step: 769, loss: 0.35048720240592957, mean loss: 0.34423075408580084
Epoch: 39, step: 770, loss: 0.3559594750404358, mean loss: 0.3442309595392483
Epoch: 39, step: 771, loss: 0.3960050940513611, mean loss: 0.3442318664572436
Epoch: 39, step: 772, loss: 0.3082740008831024, mean loss: 0.3442312366009565
Epoch: 39, step: 773, loss: 0.3571307957172394, mean loss: 0.34423146255224596
Epoch: 39, step: 774, loss: 0.34387898445129395, mean loss: 0.3442314563782763
Epoch: 39, step: 775, loss: 0.30345073342323303, mean loss: 0.344230742079899
Epoch: 39, step: 776, loss: 0.3225710093975067, mean loss: 0.3442303627035712
Epoch: 39, step: 777, loss: 0.3197684586048126, mean loss: 0.34422993425392506
Epoch: 39, step: 778, loss: 0.30264097452163696, mean loss: 0.34422920583708067
Epoch: 39, step: 779, loss: 0.3290782868862152, mean loss: 0.3442289404784049
Epoch: 39, step: 780, loss: 0.3181905746459961, mean loss: 0.3442284844410329
Epoch: 39, step: 781, loss: 0.339010626077652, mean loss: 0.3442283930567749
Epoch: 39, step: 782, loss: 0.3494049906730652, mean loss: 0.34422848371681475
Epoch: 39, step: 783, loss: 0.3554421365261078, mean loss: 0.3442286801030286
Epoch: 39, step: 784, loss: 0.3269862234592438, mean loss: 0.34422837813884855
Epoch: 39, step: 785, loss: 0.34063130617141724, mean loss: 0.34422831514504854
Epoch: 39, step: 786, loss: 0.29694393277168274, mean loss: 0.34422748709078915
Epoch: 39, step: 787, loss: 0.342271089553833, mean loss: 0.3442274528305353
Epoch: 39, step: 788, loss: 0.2897087335586548, mean loss: 0.3442264981204526
Epoch: 39, step: 789, loss: 0.31449949741363525, mean loss: 0.34422597756218015
Epoch: 39, step: 790, loss: 0.3332803547382355, mean loss: 0.34422578589350866
Epoch: 39, step: 791, loss: 0.31199923157691956, mean loss: 0.3442252215845797
Epoch: 39, step: 792, loss: 0.33845189213752747, mean loss: 0.3442251204914167
Epoch: 39, step: 793, loss: 0.3628440201282501, mean loss: 0.3442254465096208
Epoch: 39, step: 794, loss: 0.29635149240493774, mean loss: 0.34422460824809314
Epoch: 39, step: 795, loss: 0.31371667981147766, mean loss: 0.34422407407088984
Epoch: 39, step: 796, loss: 0.3491955101490021, mean loss: 0.34422416111650256
Epoch: 39, step: 797, loss: 0.32852116227149963, mean loss: 0.3442238861751774
Epoch: 39, step: 798, loss: 0.3271626830101013, mean loss: 0.3442235874584976
Epoch: 39, step: 799, loss: 0.3135021924972534, mean loss: 0.3442230495812835
Epoch: 39, step: 800, loss: 0.30627667903900146, mean loss: 0.3442223852191752
Epoch: 39, step: 801, loss: 0.2905917465686798, mean loss: 0.3442214462745579
Epoch: 39, step: 802, loss: 0.35358452796936035, mean loss: 0.34422161019692515
Epoch: 39, step: 803, loss: 0.3214755356311798, mean loss: 0.34422121198133404
Epoch: 39, step: 804, loss: 0.32724106311798096, mean loss: 0.3442209147150246
Epoch: 39, step: 805, loss: 0.35519668459892273, mean loss: 0.3442211068611309
Epoch: 39, step: 806, loss: 0.3153943419456482, mean loss: 0.34422060221738116
Epoch: 39, step: 807, loss: 0.3415420651435852, mean loss: 0.3442205553275087
Epoch: 39, step: 808, loss: 0.3282764256000519, mean loss: 0.34422027621801676
Epoch: 39, step: 809, loss: 0.34668615460395813, mean loss: 0.34422031938362235
Epoch: 39, step: 810, loss: 0.3293924629688263, mean loss: 0.3442200598241073
Epoch: 39, step: 811, loss: 0.3189791142940521, mean loss: 0.34421961799268436
Epoch: 39, step: 812, loss: 0.33101800084114075, mean loss: 0.34421938690834625
Epoch: 39, step: 813, loss: 0.32182782888412476, mean loss: 0.3442189949678942
Epoch: 39, step: 814, loss: 0.27486759424209595, mean loss: 0.344217781066497
Epoch: 39, step: 815, loss: 0.3090294301509857, mean loss: 0.34421716515333245
Epoch: 39, step: 816, loss: 0.37572288513183594, mean loss: 0.3442177165985564
Epoch: 39, step: 817, loss: 0.29183077812194824, mean loss: 0.34421679968501145
Epoch: 39, step: 818, loss: 0.34003403782844543, mean loss: 0.34421672647661283
Epoch: 39, step: 819, loss: 0.36289528012275696, mean loss: 0.3442170533905313
Epoch: 39, step: 820, loss: 0.3414258062839508, mean loss: 0.34421700453869963
Epoch: 39, step: 821, loss: 0.3104182779788971, mean loss: 0.34421641301070494
Epoch: 39, step: 822, loss: 0.34423941373825073, mean loss: 0.3442164134132448
Epoch: 39, step: 823, loss: 0.3075513541698456, mean loss: 0.3442157717426245
Epoch: 39, step: 824, loss: 0.31164753437042236, mean loss: 0.34421520177994674
Epoch: 39, step: 825, loss: 0.3633928596973419, mean loss: 0.3442155373939945
Epoch: 39, step: 826, loss: 0.3151439428329468, mean loss: 0.3442150286423616
Epoch: 39, step: 827, loss: 0.34631383419036865, mean loss: 0.3442150653707241
Epoch: 39, step: 828, loss: 0.30434998869895935, mean loss: 0.3442143677580428
Epoch: 39, step: 829, loss: 0.33576416969299316, mean loss: 0.34421421988770956
Epoch: 39, step: 830, loss: 0.29855531454086304, mean loss: 0.3442134209147915
Epoch: 39, step: 831, loss: 0.3352973759174347, mean loss: 0.34421326489804555
Epoch: 39, step: 832, loss: 0.31449151039123535, mean loss: 0.3442127448232497
Epoch: 39, step: 833, loss: 0.3517124056816101, mean loss: 0.3442128760509113
Epoch: 39, step: 834, loss: 0.33142390847206116, mean loss: 0.3442126522758666
Epoch: 39, step: 835, loss: 0.3347589373588562, mean loss: 0.34421248686232175
Epoch: 39, step: 836, loss: 0.3073670268058777, mean loss: 0.34421184218120165
Epoch: 39, step: 837, loss: 0.29529064893722534, mean loss: 0.3442109862272309
Epoch: 39, step: 838, loss: 0.31803998351097107, mean loss: 0.3442105283319861
Epoch: 39, step: 839, loss: 0.33218643069267273, mean loss: 0.3442103179586633
Epoch: 39, step: 840, loss: 0.3471781313419342, mean loss: 0.34421036988254633
Epoch: 39, step: 841, loss: 0.3394835889339447, mean loss: 0.3442102871857944
Epoch: 39, step: 842, loss: 0.29655709862709045, mean loss: 0.3442094534905135
Epoch: 39, step: 843, loss: 0.30870312452316284, mean loss: 0.34420883231610894
Epoch: 39, step: 844, loss: 0.3392331004142761, mean loss: 0.3442087452684383
Epoch: 39, step: 845, loss: 0.3560793995857239, mean loss: 0.34420895293532044
Epoch: 39, step: 846, loss: 0.3195315897464752, mean loss: 0.3442085212336395
Epoch: 39, step: 847, loss: 0.35715800523757935, mean loss: 0.34420874776579263
Epoch: 39, step: 848, loss: 0.3110399842262268, mean loss: 0.34420816753726924
Epoch: 39, step: 849, loss: 0.33468255400657654, mean loss: 0.34420800090651793
Epoch: 39, step: 850, loss: 0.3426869809627533, mean loss: 0.3442079742999102
Epoch: 39, step: 851, loss: 0.43927237391471863, mean loss: 0.3442096371952295
Epoch: 39, step: 852, loss: 0.3558502793312073, mean loss: 0.34420984081331163
Epoch: 39, step: 853, loss: 0.2986466586589813, mean loss: 0.34420904383618806
Epoch: 39, step: 854, loss: 0.3100922703742981, mean loss: 0.3442084470865517
Epoch: 39, step: 855, loss: 0.3235710859298706, mean loss: 0.344208086116826
Epoch: 39, step: 856, loss: 0.3535229563713074, mean loss: 0.3442082490411129
Epoch: 39, step: 857, loss: 0.32182857394218445, mean loss: 0.34420785761012856
Epoch: 39, step: 858, loss: 0.32032540440559387, mean loss: 0.34420743990215824
Epoch: 39, step: 859, loss: 0.33016738295555115, mean loss: 0.34420719434358565
Epoch: 39, step: 860, loss: 0.40109580755233765, mean loss: 0.34420818929983044
Epoch: 39, step: 861, loss: 0.3361543118953705, mean loss: 0.3442080484436024
Epoch: 39, step: 862, loss: 0.3548380434513092, mean loss: 0.3442082343509287
Epoch: 39, step: 863, loss: 0.31891706585884094, mean loss: 0.34420779204298024
Epoch: 39, step: 864, loss: 0.33920273184776306, mean loss: 0.3442077045128532
Epoch: 39, step: 865, loss: 0.36579617857933044, mean loss: 0.34420808205253467
Epoch: 39, step: 866, loss: 0.33890682458877563, mean loss: 0.34420798934565566
Epoch: 39, step: 867, loss: 0.3407083749771118, mean loss: 0.3442079281464676
Epoch: 39, step: 868, loss: 0.3435187339782715, mean loss: 0.344207916094458
Epoch: 39, step: 869, loss: 0.3263092339038849, mean loss: 0.3442076031038276
Epoch: 39, step: 870, loss: 0.33950936794281006, mean loss: 0.3442075209481775
Epoch: 39, step: 871, loss: 0.33484989404678345, mean loss: 0.34420735731897384
Epoch: 39, step: 872, loss: 0.3202451765537262, mean loss: 0.3442069383191528
Epoch: 39, step: 873, loss: 0.42577865719795227, mean loss: 0.34420836464751225
Epoch: 39, step: 874, loss: 0.3623296618461609, mean loss: 0.3442086815032623
Epoch: 39, step: 875, loss: 0.3235835134983063, mean loss: 0.34420832087296427
Epoch: 39, step: 876, loss: 0.3683216869831085, mean loss: 0.344208742486905
Epoch: 39, step: 877, loss: 0.34447070956230164, mean loss: 0.3442087470672294
Epoch: 39, step: 878, loss: 0.32098737359046936, mean loss: 0.3442083410636718
Epoch: 39, step: 879, loss: 0.30884233117103577, mean loss: 0.3442077227335457
Epoch: 39, step: 880, loss: 0.37754565477371216, mean loss: 0.3442083055950951
Epoch: 39, step: 881, loss: 0.33739644289016724, mean loss: 0.3442081865024222
Epoch: 39, step: 882, loss: 0.30019044876098633, mean loss: 0.3442074169480988
Epoch: 39, step: 883, loss: 0.35641351342201233, mean loss: 0.3442076303413938
Epoch: 39, step: 884, loss: 0.3060358762741089, mean loss: 0.3442069630147025
Epoch: 39, step: 885, loss: 0.3338290750980377, mean loss: 0.3442067815894391
Epoch: 39, step: 886, loss: 0.3775755763053894, mean loss: 0.34420736492938137
Epoch: 39, step: 887, loss: 0.321115106344223, mean loss: 0.3442069612467965
Epoch: 39, step: 888, loss: 0.30891481041908264, mean loss: 0.3442063443050811
Epoch: 39, step: 889, loss: 0.3399122655391693, mean loss: 0.3442062692416478
Epoch: 39, step: 890, loss: 0.3258078396320343, mean loss: 0.34420594763013856
Epoch: 39, step: 891, loss: 0.36721187829971313, mean loss: 0.3442063497754796
Epoch: 39, step: 892, loss: 0.3990578353404999, mean loss: 0.3442073085666762
Epoch: 39, step: 893, loss: 0.3174901604652405, mean loss: 0.344206841565311
Epoch: 39, step: 894, loss: 0.3632621169090271, mean loss: 0.34420717463544337
Epoch: 39, step: 895, loss: 0.300552099943161, mean loss: 0.3442064115949153
Epoch: 39, step: 896, loss: 0.31923285126686096, mean loss: 0.3442059750934151
Epoch: 39, step: 897, loss: 0.36231279373168945, mean loss: 0.3442062915687295
Epoch: 39, step: 898, loss: 0.320267915725708, mean loss: 0.3442058731753739
Epoch: 39, step: 899, loss: 0.3691348135471344, mean loss: 0.34420630887413595
Epoch: 39, step: 900, loss: 0.30277833342552185, mean loss: 0.34420558482402064
Epoch: 39, step: 901, loss: 0.3352099657058716, mean loss: 0.3442054276074259
Epoch: 39, step: 902, loss: 0.33511680364608765, mean loss: 0.3442052687681599
Epoch: 39, step: 903, loss: 0.34039419889450073, mean loss: 0.34420520216435224
Epoch: 39, step: 904, loss: 0.3506028652191162, mean loss: 0.3442053139705607
Epoch: 39, step: 905, loss: 0.3872499167919159, mean loss: 0.3442060662092595
Epoch: 39, step: 906, loss: 0.3406812846660614, mean loss: 0.34420600461197265
Epoch: 39, step: 907, loss: 0.3241957724094391, mean loss: 0.34420565492945826
Epoch: 39, step: 908, loss: 0.3671965003013611, mean loss: 0.344206056691719
Epoch: 39, step: 909, loss: 0.3217726945877075, mean loss: 0.34420566467826175
Epoch: 39, step: 910, loss: 0.32284173369407654, mean loss: 0.3442052913591819
Epoch: 39, step: 911, loss: 0.38505783677101135, mean loss: 0.34420600521508127
Epoch: 39, step: 912, loss: 0.29049351811408997, mean loss: 0.34420506666142664
Epoch: 39, step: 913, loss: 0.30001309514045715, mean loss: 0.34420429447950246
Epoch: 39, step: 914, loss: 0.35141071677207947, mean loss: 0.3442044203976638
Epoch: 39, step: 915, loss: 0.3725214898586273, mean loss: 0.34420491517452745
Epoch: 39, step: 916, loss: 0.34565669298171997, mean loss: 0.34420494054062406
Epoch: 39, step: 917, loss: 0.32723289728164673, mean loss: 0.3442046440028448
Epoch: 39, step: 918, loss: 0.3468598425388336, mean loss: 0.3442046903940134
Epoch: 39, step: 919, loss: 0.32859569787979126, mean loss: 0.34420441768116633
Epoch: 39, step: 920, loss: 0.3065148890018463, mean loss: 0.3442037591992634
Epoch: 39, step: 921, loss: 0.308345764875412, mean loss: 0.3442031327274383
Epoch: 39, step: 922, loss: 0.3399197459220886, mean loss: 0.34420305789407635
Epoch: 39, step: 923, loss: 0.33918213844299316, mean loss: 0.34420297017710483
Epoch: 39, step: 924, loss: 0.3105739951133728, mean loss: 0.3442023826790691
Epoch: 39, step: 925, loss: 0.2955906093120575, mean loss: 0.34420153344645377
Epoch: 39, step: 926, loss: 0.33554163575172424, mean loss: 0.3442013821633677
Epoch: 39, step: 927, loss: 0.35982954502105713, mean loss: 0.3442016551729907
Epoch: 39, step: 928, loss: 0.3015049695968628, mean loss: 0.34420090931421565
Epoch: 39, step: 929, loss: 0.3329855799674988, mean loss: 0.34420071339957803
Epoch: 39, step: 930, loss: 0.3456243872642517, mean loss: 0.34420073826854697
Epoch: 39, step: 931, loss: 0.33342474699020386, mean loss: 0.34420055003504924
Epoch: 39, step: 932, loss: 0.35145241022109985, mean loss: 0.34420067670730875
Epoch: 39, step: 933, loss: 0.3704155683517456, mean loss: 0.3442011346093462
Epoch: 39, step: 934, loss: 0.3249032497406006, mean loss: 0.34420079753427557
Epoch: 39, step: 935, loss: 0.3387220501899719, mean loss: 0.34420070183897505
Epoch: 39, step: 936, loss: 0.3319483697414398, mean loss: 0.34420048783565477
Epoch: 39, step: 937, loss: 0.3669759929180145, mean loss: 0.34420088563327733
Epoch: 39, step: 938, loss: 0.32677462697029114, mean loss: 0.34420058127106157
Epoch: 39, step: 939, loss: 0.31773775815963745, mean loss: 0.344200119086782
Epoch: 39, step: 940, loss: 0.3337470591068268, mean loss: 0.3441999365229037
Epoch: 39, step: 941, loss: 0.39471954107284546, mean loss: 0.34420081883811815
Epoch: 39, step: 942, loss: 0.37458863854408264, mean loss: 0.3442013495462986
Epoch: 39, step: 943, loss: 0.3436586558818817, mean loss: 0.34420134006858877
Epoch: 39, step: 944, loss: 0.31755849719047546, mean loss: 0.34420087478082084
Epoch: 39, step: 945, loss: 0.2997686266899109, mean loss: 0.3442000988343277
Epoch: 39, step: 946, loss: 0.3601905405521393, mean loss: 0.3442003780799438
Epoch: 39, step: 947, loss: 0.32768964767456055, mean loss: 0.34420008975341393
Epoch: 39, step: 948, loss: 0.3214168846607208, mean loss: 0.3441996918977413
Epoch: 39, step: 949, loss: 0.3449349105358124, mean loss: 0.34419970473640016
Epoch: 39, step: 950, loss: 0.33012905716896057, mean loss: 0.3441994590338565
Epoch: 39, step: 951, loss: 0.3195170760154724, mean loss: 0.3441990280360389
Epoch: 39, step: 952, loss: 0.3258345127105713, mean loss: 0.34419870736490227
Epoch: 39, step: 953, loss: 0.3206467628479004, mean loss: 0.34419829612089115
Epoch: 39, step: 954, loss: 0.3373155891895294, mean loss: 0.3441981759430187
Epoch: 39, step: 955, loss: 0.32959628105163574, mean loss: 0.34419792098606083
Epoch: 39, step: 956, loss: 0.32076922059059143, mean loss: 0.3441975119154622
Epoch: 39, step: 957, loss: 0.34319597482681274, mean loss: 0.3441974944286953
Epoch: 39, step: 958, loss: 0.3243541121482849, mean loss: 0.3441971479706895
Epoch: 39, step: 959, loss: 0.3715333938598633, mean loss: 0.3441976252429482
Epoch: 39, step: 960, loss: 0.35166653990745544, mean loss: 0.3441977556428411
Epoch: 39, step: 961, loss: 0.3094145655632019, mean loss: 0.3441971483732074
Epoch: 39, step: 962, loss: 0.3094003200531006, mean loss: 0.34419654087607376
Epoch: 39, step: 963, loss: 0.3213953971862793, mean loss: 0.34419614281141436
Epoch: 39, step: 964, loss: 0.3147502541542053, mean loss: 0.34419562875110365
Epoch: 39, step: 965, loss: 0.3423561155796051, mean loss: 0.344195596637819
Epoch: 39, step: 966, loss: 0.29634395241737366, mean loss: 0.34419476128275345
Epoch: 39, step: 967, loss: 0.3281196057796478, mean loss: 0.3441944806606687
Epoch: 39, step: 968, loss: 0.3559269905090332, mean loss: 0.34419468547012755
Epoch: 39, step: 969, loss: 0.3067411780357361, mean loss: 0.34419403167151297
Epoch: 39, step: 970, loss: 0.31701886653900146, mean loss: 0.34419355730271844
Epoch: 39, step: 971, loss: 0.37581464648246765, mean loss: 0.3441941092697827
Epoch: 39, step: 972, loss: 0.31977787613868713, mean loss: 0.3441936830756943
Epoch: 39, step: 973, loss: 0.3318116366863251, mean loss: 0.3441934669464154
Epoch: 39, step: 974, loss: 0.3686898946762085, mean loss: 0.34419389452540217
Epoch: 39, step: 975, loss: 0.3103681802749634, mean loss: 0.34419330411637034
Epoch: 39, step: 976, loss: 0.314285010099411, mean loss: 0.3441927820928419
Epoch: 39, step: 977, loss: 0.3244464099407196, mean loss: 0.3441924374429282
Epoch: 39, step: 978, loss: 0.3286301791667938, mean loss: 0.3441921658265869
Epoch: 39, step: 979, loss: 0.32245221734046936, mean loss: 0.34419178639436676
Epoch: 39, step: 980, loss: 0.38452956080436707, mean loss: 0.34419249040634664
Epoch: 39, step: 981, loss: 0.3878024220466614, mean loss: 0.34419325151374375
Epoch: 39, step: 982, loss: 0.3369295001029968, mean loss: 0.34419312474449104
Epoch: 39, step: 983, loss: 0.3567250967025757, mean loss: 0.34419334345255315
Epoch: 39, step: 984, loss: 0.3101506531238556, mean loss: 0.34419274934965216
Epoch: 39, step: 985, loss: 0.34865012764930725, mean loss: 0.3441928271371343
Epoch: 39, step: 986, loss: 0.31364378333091736, mean loss: 0.3441922940229203
Epoch: 39, step: 987, loss: 0.38043326139450073, mean loss: 0.34419292645638694
Epoch: 39, step: 988, loss: 0.33508408069610596, mean loss: 0.34419276750261746
Epoch: 39, step: 989, loss: 0.31690514087677, mean loss: 0.3441922913286282
Epoch: 39, step: 990, loss: 0.3360341787338257, mean loss: 0.3441921489705813
Epoch: 39, step: 991, loss: 0.31387320160865784, mean loss: 0.34419161991796454
Epoch: 39, step: 992, loss: 0.3087259829044342, mean loss: 0.34419100106862127
Epoch: 39, step: 993, loss: 0.34273087978363037, mean loss: 0.34419097559102074
Epoch: 39, step: 994, loss: 0.32704371213912964, mean loss: 0.3441906763942967
Epoch: 39, step: 995, loss: 0.3152434229850769, mean loss: 0.3441901713124044
Epoch: 39, step: 996, loss: 0.3606211841106415, mean loss: 0.3441904580015116
Epoch: 39, step: 997, loss: 0.3352191150188446, mean loss: 0.34419030147181584
Epoch: 39, step: 998, loss: 0.3389645516872406, mean loss: 0.34419021029586216
Epoch: 39, step: 999, loss: 0.3028780221939087, mean loss: 0.3441894895165318
Epoch: 39, step: 1000, loss: 0.35611680150032043, mean loss: 0.34418969761032564
Epoch: 39, step: 1001, loss: 0.36768823862075806, mean loss: 0.34419010757824164
Epoch: 39, step: 1002, loss: 0.36196842789649963, mean loss: 0.3441904177427651
Epoch: 39, step: 1003, loss: 0.3679260015487671, mean loss: 0.34419083183180565
Epoch: 39, step: 1004, loss: 0.35028472542762756, mean loss: 0.3441909381435168
Epoch: 39, step: 1005, loss: 0.3791530728340149, mean loss: 0.3441915480687583
Epoch: 39, step: 1006, loss: 0.31801408529281616, mean loss: 0.34419109140279913
Epoch: 39, step: 1007, loss: 0.3281370997428894, mean loss: 0.344190811345726
Epoch: 39, step: 1008, loss: 0.30837133526802063, mean loss: 0.3441901864966012
Epoch: 39, step: 1009, loss: 0.3160442113876343, mean loss: 0.34418969551563083
Epoch: 39, step: 1010, loss: 0.34563279151916504, mean loss: 0.3441897206886907
Epoch: 39, step: 1011, loss: 0.33016860485076904, mean loss: 0.34418947611159334
Epoch: 39, step: 1012, loss: 0.322544664144516, mean loss: 0.34418909855726715
Epoch: 39, step: 1013, loss: 0.32273995876312256, mean loss: 0.3441887244226117
Epoch: 39, step: 1014, loss: 0.3498258590698242, mean loss: 0.3441888227487293
Epoch: 39, step: 1015, loss: 0.3160828948020935, mean loss: 0.34418833251765507
Epoch: 39, step: 1016, loss: 0.30792728066444397, mean loss: 0.3441877000537712
Epoch: 39, step: 1017, loss: 0.34594807028770447, mean loss: 0.34418773075754616
Epoch: 39, step: 1018, loss: 0.36412855982780457, mean loss: 0.34418807855259403
Epoch: 39, step: 1019, loss: 0.31242212653160095, mean loss: 0.3441875245210603
Epoch: 39, step: 1020, loss: 0.2944311499595642, mean loss: 0.344186656732816
Epoch: 39, step: 1021, loss: 0.3264453113079071, mean loss: 0.34418634731592973
Epoch: 39, step: 1022, loss: 0.36437806487083435, mean loss: 0.3441866994622447
Epoch: 39, step: 1023, loss: 0.30821284651756287, mean loss: 0.3441860720842722
Epoch: 39, step: 1024, loss: 0.42955976724624634, mean loss: 0.3441875609612566
Epoch: 39, step: 1025, loss: 0.3334577679634094, mean loss: 0.3441873738419898
Epoch: 39, step: 1026, loss: 0.32463034987449646, mean loss: 0.3441870327886098
Epoch: 39, step: 1027, loss: 0.3564743101596832, mean loss: 0.34418724706172243
Epoch: 39, step: 1028, loss: 0.3242672383785248, mean loss: 0.34418689969039656
Epoch: 39, step: 1029, loss: 0.34142452478408813, mean loss: 0.34418685152008116
Epoch: 39, step: 1030, loss: 0.32834669947624207, mean loss: 0.3441865753042016
Epoch: 39, step: 1031, loss: 0.3731715977191925, mean loss: 0.3441870807276238
Epoch: 39, step: 1032, loss: 0.2874099016189575, mean loss: 0.34418609069851935
Epoch: 39, step: 1033, loss: 0.3809393644332886, mean loss: 0.3441867315576952
Epoch: 39, step: 1034, loss: 0.32938921451568604, mean loss: 0.34418647354097287
Epoch: 39, step: 1035, loss: 0.3178376853466034, mean loss: 0.3441860141186651
Epoch: 39, step: 1036, loss: 0.3277421295642853, mean loss: 0.34418572740507464
Epoch: 39, step: 1037, loss: 0.34677135944366455, mean loss: 0.3441857724870574
Epoch: 39, step: 1038, loss: 0.34015336632728577, mean loss: 0.344185702180961
Epoch: 39, step: 1039, loss: 0.33038532733917236, mean loss: 0.3441854615718732
Epoch: 39, step: 1040, loss: 0.3341863751411438, mean loss: 0.344185287241165
Epoch: 39, step: 1041, loss: 0.3512403666973114, mean loss: 0.3441854102419575
Epoch: 39, step: 1042, loss: 0.33129554986953735, mean loss: 0.34418518551941396
Epoch: 39, step: 1043, loss: 0.29877734184265137, mean loss: 0.3441843938903401
Epoch: 39, step: 1044, loss: 0.37494567036628723, mean loss: 0.3441849301654482
Epoch: 39, step: 1045, loss: 0.31800201535224915, mean loss: 0.3441844737149267
Epoch: 39, step: 1046, loss: 0.3523443043231964, mean loss: 0.344184615963948
Epoch: 39, step: 1047, loss: 0.3360915780067444, mean loss: 0.3441844748817718
Epoch: 39, step: 1048, loss: 0.31292077898979187, mean loss: 0.3441839298857656
Epoch: 39, step: 1049, loss: 0.3340311050415039, mean loss: 0.3441837529024507
Epoch: 39, step: 1050, loss: 0.31053030490875244, mean loss: 0.3441831662681837
Epoch: 39, step: 1051, loss: 0.3208361566066742, mean loss: 0.3441827592989733
Epoch: 39, step: 1052, loss: 0.3409573435783386, mean loss: 0.34418270307669785
Epoch: 39, step: 1053, loss: 0.32948964834213257, mean loss: 0.3441824469662789
Epoch: 39, step: 1054, loss: 0.2991867661476135, mean loss: 0.34418166267315486
Epoch: 39, step: 1055, loss: 0.32663989067077637, mean loss: 0.3441813569182221
Epoch: 39, step: 1056, loss: 0.3318118155002594, mean loss: 0.34418114131957084
Epoch: 39, step: 1057, loss: 0.3387756943702698, mean loss: 0.34418104710534575
Epoch: 39, step: 1058, loss: 0.3603406250476837, mean loss: 0.34418132875376306
Epoch: 39, step: 1059, loss: 0.34757113456726074, mean loss: 0.3441813878343161
Epoch: 39, step: 1060, loss: 0.33287709951400757, mean loss: 0.3441811908165508
Epoch: 39, step: 1061, loss: 0.3382127583026886, mean loss: 0.34418108679702214
Epoch: 39, step: 1062, loss: 0.33708664774894714, mean loss: 0.3441809631552883
Epoch: 39, step: 1063, loss: 0.3469722270965576, mean loss: 0.3441810118005295
Epoch: 39, step: 1064, loss: 0.33596429228782654, mean loss: 0.34418086860470665
Epoch: 39, step: 1065, loss: 0.3851170539855957, mean loss: 0.3441815820023815
Epoch: 39, step: 1066, loss: 0.3296540081501007, mean loss: 0.34418132883378016
Epoch: 39, step: 1067, loss: 0.33839160203933716, mean loss: 0.3441812279393358
Epoch: 39, step: 1068, loss: 0.3707614839076996, mean loss: 0.3441816911310404
Epoch: 39, step: 1069, loss: 0.31913629174232483, mean loss: 0.34418125469359245
Epoch: 39, step: 1070, loss: 0.325213760137558, mean loss: 0.3441809241745802
Epoch: 39, step: 1071, loss: 0.3776993453502655, mean loss: 0.3441815082413045
Epoch: 39, step: 1072, loss: 0.30903783440589905, mean loss: 0.3441808958648241
Epoch: 39, step: 1073, loss: 0.28472426533699036, mean loss: 0.34417985985453436
Epoch: 39, step: 1074, loss: 0.34314092993736267, mean loss: 0.3441798417518716
Epoch: 39, step: 1075, loss: 0.3236854374408722, mean loss: 0.344179484656731
Epoch: 39, step: 1076, loss: 0.321045458316803, mean loss: 0.344179081575757
Epoch: 39, step: 1077, loss: 0.33331233263015747, mean loss: 0.34417889223978204
Epoch: 39, step: 1078, loss: 0.37646666169166565, mean loss: 0.3441794547934793
Epoch: 39, step: 1079, loss: 0.3443203568458557, mean loss: 0.34417945724838994
Epoch: 39, step: 1080, loss: 0.33573949337005615, mean loss: 0.3441793102030064
Epoch: 39, step: 1081, loss: 0.33613330125808716, mean loss: 0.34417917002375026
Epoch: 39, step: 1082, loss: 0.34354397654533386, mean loss: 0.344179158957469
Epoch: 39, step: 1083, loss: 0.35042804479599, mean loss: 0.3441792678230759
Epoch: 39, step: 1084, loss: 0.3255545496940613, mean loss: 0.34417894335628735
Epoch: 39, step: 1085, loss: 0.313890665769577, mean loss: 0.3441784157043312
Epoch: 39, step: 1086, loss: 0.32159560918807983, mean loss: 0.34417802229620764
Epoch: 39, step: 1087, loss: 0.30830320715904236, mean loss: 0.344177397342979
Epoch: 39, step: 1088, loss: 0.33772531151771545, mean loss: 0.34417728494709315
Epoch: 39, step: 1089, loss: 0.33041930198669434, mean loss: 0.34417704528603055
Epoch: 39, step: 1090, loss: 0.30448609590530396, mean loss: 0.3441763538903927
Epoch: 39, step: 1091, loss: 0.3347876965999603, mean loss: 0.34417619034772806
Epoch: 39, step: 1092, loss: 0.30500346422195435, mean loss: 0.34417550800304125
Epoch: 39, step: 1093, loss: 0.32635000348091125, mean loss: 0.34417519750827513
Epoch: 39, step: 1094, loss: 0.3312341272830963, mean loss: 0.34417497209728726
Epoch: 39, step: 1095, loss: 0.3226169943809509, mean loss: 0.3441745966012635
Epoch: 39, step: 1096, loss: 0.3306501805782318, mean loss: 0.34417436103761023
Epoch: 39, step: 1097, loss: 0.3446623980998993, mean loss: 0.34417436953792485
Epoch: 39, step: 1098, loss: 0.3274092376232147, mean loss: 0.34417407753876234
Epoch: 39, step: 1099, loss: 0.287742018699646, mean loss: 0.3441730946758175
Epoch: 39, step: 1100, loss: 0.3180825114250183, mean loss: 0.34417264027061956
Epoch: 39, step: 1101, loss: 0.33582934737205505, mean loss: 0.3441724949626517
Epoch: 39, step: 1102, loss: 0.33016130328178406, mean loss: 0.3441722509460077
Epoch: 39, step: 1103, loss: 0.34423935413360596, mean loss: 0.3441722521146456
Epoch: 39, step: 1104, loss: 0.3636433780193329, mean loss: 0.34417259120880805
Epoch: 39, step: 1105, loss: 0.3501729667186737, mean loss: 0.344172695704916
Epoch: 39, step: 1106, loss: 0.33006414771080017, mean loss: 0.34417245000984614
Epoch: 39, step: 1107, loss: 0.3144194781780243, mean loss: 0.34417193188202794
Epoch: 39, step: 1108, loss: 0.30094611644744873, mean loss: 0.3441711791468876
Epoch: 39, step: 1109, loss: 0.3381391167640686, mean loss: 0.3441710741062722
Epoch: 39, step: 1110, loss: 0.33926114439964294, mean loss: 0.3441709886076442
Epoch: 39, step: 1111, loss: 0.3599940836429596, mean loss: 0.3441712641369163
Epoch: 39, step: 1112, loss: 0.3236020505428314, mean loss: 0.3441709059692032
Epoch: 39, step: 1113, loss: 0.33528295159339905, mean loss: 0.34417075120767826
Epoch: 39, step: 1114, loss: 0.3295806646347046, mean loss: 0.3441704971621876
Epoch: 39, step: 1115, loss: 0.3338591158390045, mean loss: 0.34417031762149036
Epoch: 39, step: 1116, loss: 0.29299700260162354, mean loss: 0.34416942661257527
Epoch: 39, step: 1117, loss: 0.3409780263900757, mean loss: 0.34416937104618217
Epoch: 39, step: 1118, loss: 0.39261898398399353, mean loss: 0.34417021460173086
Epoch: 39, step: 1119, loss: 0.30020490288734436, mean loss: 0.34416944913561703
Epoch: 39, step: 1120, loss: 0.32740360498428345, mean loss: 0.3441691572358982
Epoch: 39, step: 1121, loss: 0.3098386228084564, mean loss: 0.344168559538652
Epoch: 39, step: 1122, loss: 0.3267717659473419, mean loss: 0.3441682566644099
Epoch: 39, step: 1123, loss: 0.3077634871006012, mean loss: 0.344167622876639
Epoch: 39, step: 1124, loss: 0.3363409638404846, mean loss: 0.34416748662101954
Epoch: 39, step: 1125, loss: 0.3268957734107971, mean loss: 0.344167185940103
Epoch: 39, step: 1126, loss: 0.3946215808391571, mean loss: 0.3441680642785411
Epoch: 39, step: 1127, loss: 0.30480530858039856, mean loss: 0.3441673790415155
Epoch: 39, step: 1128, loss: 0.3211217522621155, mean loss: 0.34416697786427153
Epoch: 39, step: 1129, loss: 0.3277435302734375, mean loss: 0.34416669197060457
Epoch: 39, step: 1130, loss: 0.31731364130973816, mean loss: 0.3441662245301697
Epoch: 39, step: 1131, loss: 0.36208221316337585, mean loss: 0.34416653639461464
Epoch: 39, step: 1132, loss: 0.31247949600219727, mean loss: 0.3441659848264343
Epoch: 39, step: 1133, loss: 0.3433948755264282, mean loss: 0.3441659714041662
Epoch: 39, step: 1134, loss: 0.3506878614425659, mean loss: 0.3441660849250804
Epoch: 39, step: 1135, loss: 0.3367331624031067, mean loss: 0.3441659555488616
Epoch: 39, step: 1136, loss: 0.373759925365448, mean loss: 0.3441664706476348
Epoch: 39, step: 1137, loss: 0.34464240074157715, mean loss: 0.3441664789313068
Epoch: 39, step: 1138, loss: 0.3503575026988983, mean loss: 0.34416658668561484
Epoch: 39, step: 1139, loss: 0.3513723909854889, mean loss: 0.34416671209991967
Epoch: 39, step: 1140, loss: 0.44002488255500793, mean loss: 0.34416838044616915
Epoch: 39, step: 1141, loss: 0.336355596780777, mean loss: 0.3441682444723506
Epoch: 39, step: 1142, loss: 0.38329634070396423, mean loss: 0.3441689254465449
Epoch: 39, step: 1143, loss: 0.3586372435092926, mean loss: 0.34416917724463164
Epoch: 39, step: 1144, loss: 0.33919793367385864, mean loss: 0.34416909072954194
Epoch: 39, step: 1145, loss: 0.33099305629730225, mean loss: 0.34416886142957964
Epoch: 39, step: 1146, loss: 0.32896026968955994, mean loss: 0.34416859676202416
Epoch: 39, step: 1147, loss: 0.32083892822265625, mean loss: 0.34416819077447475
Epoch: 39, step: 1148, loss: 0.3060838282108307, mean loss: 0.3441675280343275
Epoch: 39, step: 1149, loss: 0.3141765296459198, mean loss: 0.3441670061431503
Epoch: 39, step: 1150, loss: 0.3235233724117279, mean loss: 0.34416664691726884
Epoch: 39, step: 1151, loss: 0.32324889302253723, mean loss: 0.3441662829276765
Epoch: 39, step: 1152, loss: 0.31490081548690796, mean loss: 0.344165773688479
Epoch: 39, step: 1153, loss: 0.31809383630752563, mean loss: 0.344165320026788
Epoch: 39, step: 1154, loss: 0.32483094930648804, mean loss: 0.34416498360718994
Epoch: 39, step: 1155, loss: 0.3739166259765625, mean loss: 0.344165501279141
Epoch: 39, step: 1156, loss: 0.34107914566993713, mean loss: 0.34416544757817513
Epoch: 39, step: 1157, loss: 0.3367098271846771, mean loss: 0.344165317856555
Epoch: 39, step: 1158, loss: 0.311044305562973, mean loss: 0.34416474158839855
Epoch: 39, step: 1159, loss: 0.3487008213996887, mean loss: 0.34416482050968417
Epoch: 39, step: 1160, loss: 0.33919596672058105, mean loss: 0.3441647340602559
Epoch: 39, step: 1161, loss: 0.31471502780914307, mean loss: 0.3441642216954163
Epoch: 39, step: 1162, loss: 0.32442405819892883, mean loss: 0.3441638782627975
Epoch: 39, step: 1163, loss: 0.39994117617607117, mean loss: 0.3441648486402838
Epoch: 39, step: 1164, loss: 0.3245462477207184, mean loss: 0.344164507334445
Epoch: 39, step: 1165, loss: 0.36635372042655945, mean loss: 0.34416489335464423
Epoch: 39, step: 1166, loss: 0.31581011414527893, mean loss: 0.3441644000822122
Epoch: 39, step: 1167, loss: 0.3241097927093506, mean loss: 0.34416405120935417
Epoch: 39, step: 1168, loss: 0.3357902765274048, mean loss: 0.3441639055404896
Epoch: 39, step: 1169, loss: 0.34123021364212036, mean loss: 0.34416385450733544
Epoch: 39, step: 1170, loss: 0.3111918270587921, mean loss: 0.34416328095109755
Epoch: 39, step: 1171, loss: 0.33623212575912476, mean loss: 0.3441631429891717
Epoch: 39, step: 1172, loss: 0.3523228168487549, mean loss: 0.3441632849236959
Epoch: 39, step: 1173, loss: 0.3479718267917633, mean loss: 0.3441633511707279
Epoch: 39, step: 1174, loss: 0.3187868893146515, mean loss: 0.344162909771868
Epoch: 39, step: 1175, loss: 0.34903445839881897, mean loss: 0.34416299450624194
Epoch: 39, step: 1176, loss: 0.30333074927330017, mean loss: 0.34416228429377727
Epoch: 39, step: 1177, loss: 0.3245360553264618, mean loss: 0.3441619429324358
Epoch: 39, step: 1178, loss: 0.33637571334838867, mean loss: 0.3441618075079713
Epoch: 39, step: 1179, loss: 0.30655330419540405, mean loss: 0.3441611534015411
Epoch: 39, step: 1180, loss: 0.35869091749191284, mean loss: 0.34416140610627505
Epoch: 39, step: 1181, loss: 0.32227379083633423, mean loss: 0.34416102543885585
Epoch: 39, step: 1182, loss: 0.32793334126472473, mean loss: 0.34416074321335327
Epoch: 39, step: 1183, loss: 0.3407849669456482, mean loss: 0.3441606845042008
Epoch: 39, step: 1184, loss: 0.3241409659385681, mean loss: 0.34416033634123727
Epoch: 39, step: 1185, loss: 0.346698135137558, mean loss: 0.3441603804753334
Epoch: 39, step: 1186, loss: 0.32568982243537903, mean loss: 0.3441600592649959
Epoch: 39, step: 1187, loss: 0.36477115750312805, mean loss: 0.34416041769394407
Epoch: 39, step: 1188, loss: 0.3085290193557739, mean loss: 0.34415979807133146
Epoch: 39, step: 1189, loss: 0.3173259496688843, mean loss: 0.3441593314443986
Epoch: 39, step: 1190, loss: 0.3521521985530853, mean loss: 0.34415947043386264
Epoch: 39, step: 1191, loss: 0.3178211450576782, mean loss: 0.34415901243975094
Epoch: 39, step: 1192, loss: 0.3607041835784912, mean loss: 0.3441593001368269
Epoch: 39, step: 1193, loss: 0.3462972342967987, mean loss: 0.3441593373118253
Epoch: 39, step: 1194, loss: 0.36873751878738403, mean loss: 0.3441597646767029
Epoch: 39, step: 1195, loss: 0.3243308961391449, mean loss: 0.3441594198987689
Epoch: 39, step: 1196, loss: 0.3074396550655365, mean loss: 0.34415878143851064
Epoch: 39, step: 1197, loss: 0.3230125904083252, mean loss: 0.34415841376818634
Epoch: 39, step: 1198, loss: 0.34483930468559265, mean loss: 0.3441584256066792
Epoch: 39, step: 1199, loss: 0.3534393012523651, mean loss: 0.34415858696831153
Epoch: 39, step: 1200, loss: 0.3396453261375427, mean loss: 0.34415850850001817
Epoch: 39, step: 1201, loss: 0.3345889747142792, mean loss: 0.3441583421254261
Epoch: 39, step: 1202, loss: 0.37897804379463196, mean loss: 0.34415894748542314
Epoch: 39, step: 1203, loss: 0.3806709349155426, mean loss: 0.3441595822557192
Epoch: 39, step: 1204, loss: 0.37345632910728455, mean loss: 0.3441600915783466
Epoch: 39, step: 1205, loss: 0.3266375958919525, mean loss: 0.3441597869558424
Epoch: 39, step: 1206, loss: 0.33572152256965637, mean loss: 0.3441596402620958
Epoch: 39, step: 1207, loss: 0.38245323300361633, mean loss: 0.3441603059597653
Epoch: 39, step: 1208, loss: 0.3225657343864441, mean loss: 0.3441599305652139
Epoch: 39, step: 1209, loss: 0.32393360137939453, mean loss: 0.344159578961953
Epoch: 39, step: 1210, loss: 0.35064977407455444, mean loss: 0.3441596917819351
Epoch: 39, step: 1211, loss: 0.3196580410003662, mean loss: 0.3441592658736682
Epoch: 39, step: 1212, loss: 0.31837189197540283, mean loss: 0.3441588176236743
Epoch: 39, step: 1213, loss: 0.3710114061832428, mean loss: 0.3441592843816885
Epoch: 39, step: 1214, loss: 0.3518884778022766, mean loss: 0.3441594187300124
Epoch: 39, step: 1215, loss: 0.3302019238471985, mean loss: 0.34415917612598534
Epoch: 39, step: 1216, loss: 0.3354666233062744, mean loss: 0.34415902503786516
Epoch: 39, step: 1217, loss: 0.3372775912284851, mean loss: 0.3441589054314792
Epoch: 39, step: 1218, loss: 0.3834802508354187, mean loss: 0.3441595888649615
Epoch: 39, step: 1219, loss: 0.31007707118988037, mean loss: 0.3441589964963979
Epoch: 39, step: 1220, loss: 0.3303634524345398, mean loss: 0.34415875672817814
Epoch: 39, step: 1221, loss: 0.3683602511882782, mean loss: 0.3441591773457606
Epoch: 39, step: 1222, loss: 0.36339855194091797, mean loss: 0.3441595117167889
Epoch: 39, step: 1223, loss: 0.32066041231155396, mean loss: 0.3441591033209007
Epoch: 39, step: 1224, loss: 0.3425661623477936, mean loss: 0.34415907563731907
Epoch: 39, step: 1225, loss: 0.30918028950691223, mean loss: 0.34415846775462244
Epoch: 39, step: 1226, loss: 0.33293235301971436, mean loss: 0.3441582726637385
Epoch: 39, step: 1227, loss: 0.3805222511291504, mean loss: 0.34415890459718884
Epoch: 39, step: 1228, loss: 0.3461362421512604, mean loss: 0.34415893895877636
Epoch: 39, step: 1229, loss: 0.3358537554740906, mean loss: 0.3441587946362607
Epoch: 39, step: 1230, loss: 0.29964882135391235, mean loss: 0.34415802118198363
Epoch: 39, step: 1231, loss: 0.31898385286331177, mean loss: 0.3441575837355334
Epoch: 39, step: 1232, loss: 0.34593668580055237, mean loss: 0.3441576146500943
Epoch: 39, step: 1233, loss: 0.3891265392303467, mean loss: 0.3441583960388794
Epoch: 39, step: 1234, loss: 0.38242506980895996, mean loss: 0.3441590609564963
Epoch: 39, step: 1235, loss: 0.33730924129486084, mean loss: 0.344158941936833
Epoch: 39, step: 1236, loss: 0.34530124068260193, mean loss: 0.34415896178460365
Epoch: 39, step: 1237, loss: 0.41522762179374695, mean loss: 0.3441601966016452
Epoch: 39, step: 1238, loss: 0.33701467514038086, mean loss: 0.34416007245046004
Epoch: 39, step: 1239, loss: 0.3287351429462433, mean loss: 0.34415980445182387
Epoch: 39, step: 1240, loss: 0.34776851534843445, mean loss: 0.3441598671498605
Epoch: 39, step: 1241, loss: 0.3277578055858612, mean loss: 0.3441595821840597
Epoch: 39, step: 1242, loss: 0.3305441737174988, mean loss: 0.344159345637065
Epoch: 39, step: 1243, loss: 0.3161638081073761, mean loss: 0.3441588592656694
Epoch: 39, step: 1244, loss: 0.3468520939350128, mean loss: 0.34415890605489596
Epoch: 39, step: 1245, loss: 0.3264586925506592, mean loss: 0.3441585985566592
Epoch: 39, step: 1246, loss: 0.3185099959373474, mean loss: 0.3441581529821996
Epoch: 39, step: 1247, loss: 0.3318946063518524, mean loss: 0.34415793994025273
Epoch: 39, step: 1248, loss: 0.3435012996196747, mean loss: 0.3441579285333159
Epoch: 39, step: 1249, loss: 0.3375436067581177, mean loss: 0.34415781363351783
Epoch: 39, step: 1250, loss: 0.332574725151062, mean loss: 0.3441576124229548
Epoch: 39, step: 1251, loss: 0.3284810781478882, mean loss: 0.3441573401096162
Epoch: 39, step: 1252, loss: 0.3404328525066376, mean loss: 0.344157275413554
Epoch: 39, step: 1253, loss: 0.33365994691848755, mean loss: 0.3441570930732988
Epoch: 39, step: 1254, loss: 0.3407424986362457, mean loss: 0.3441570337622839
Epoch: 39, step: 1255, loss: 0.30910277366638184, mean loss: 0.34415642488539766
Epoch: 39, step: 1256, loss: 0.3329879939556122, mean loss: 0.3441562308980958
Epoch: 39, step: 1257, loss: 0.31110259890556335, mean loss: 0.3441556567911727
Epoch: 39, step: 1258, loss: 0.35351771116256714, mean loss: 0.3441558193974145
Epoch: 39, step: 1259, loss: 0.34211090207099915, mean loss: 0.34415578388057894
Epoch: 39, step: 1260, loss: 0.3378376066684723, mean loss: 0.3441556741461848
Epoch: 39, step: 1261, loss: 0.31685930490493774, mean loss: 0.34415520006981465
Epoch: 39, step: 1262, loss: 0.3254474997520447, mean loss: 0.3441548751648959
Epoch: 39, step: 1263, loss: 0.3507084250450134, mean loss: 0.34415498898132313
Epoch: 39, step: 1264, loss: 0.32695290446281433, mean loss: 0.34415469023547784
Epoch: 39, step: 1265, loss: 0.32661500573158264, mean loss: 0.34415438563187767
Epoch: 39, step: 1266, loss: 0.3354881703853607, mean loss: 0.3441542351323336
Epoch: 39, step: 1267, loss: 0.3475686013698578, mean loss: 0.3441542944259957
Epoch: 39, step: 1268, loss: 0.3335971534252167, mean loss: 0.34415411109455524
Epoch: 39, step: 1269, loss: 0.3193647265434265, mean loss: 0.34415368061866614
Epoch: 39, step: 1270, loss: 0.3120405972003937, mean loss: 0.34415312297399947
Epoch: 39, step: 1271, loss: 0.2951717674732208, mean loss: 0.34415227242604673
Epoch: 39, step: 1272, loss: 0.3576878309249878, mean loss: 0.34415250746326737
Epoch: 39, step: 1273, loss: 0.38504236936569214, mean loss: 0.34415321747996996
Epoch: 39, step: 1274, loss: 0.31138157844543457, mean loss: 0.34415264843899074
Epoch: 39, step: 1275, loss: 0.36054253578186035, mean loss: 0.34415293302517186
Epoch: 39, step: 1276, loss: 0.3367122709751129, mean loss: 0.34415280383131064
Epoch: 39, step: 1277, loss: 0.33395957946777344, mean loss: 0.344152626847174
Epoch: 39, step: 1278, loss: 0.3190765678882599, mean loss: 0.3441521914611343
Epoch: 39, step: 1279, loss: 0.35196325182914734, mean loss: 0.34415232707923915
Epoch: 39, step: 1280, loss: 0.3326650559902191, mean loss: 0.3441521276370618
Epoch: 39, step: 1281, loss: 0.33062925934791565, mean loss: 0.34415189285689085
Epoch: 39, step: 1282, loss: 0.2947942018508911, mean loss: 0.34415103593765606
Epoch: 39, step: 1283, loss: 0.32166698575019836, mean loss: 0.34415064558956254
Epoch: 39, step: 1284, loss: 0.3604162335395813, mean loss: 0.34415092797333974
Epoch: 39, step: 1285, loss: 0.3432537317276001, mean loss: 0.34415091239755685
Epoch: 39, step: 1286, loss: 0.3354336619377136, mean loss: 0.344150761064285
Epoch: 39, step: 1287, loss: 0.314196914434433, mean loss: 0.3441502410683363
Epoch: 39, step: 1288, loss: 0.3574814796447754, mean loss: 0.3441504724933615
Epoch: 39, step: 1289, loss: 0.3058297336101532, mean loss: 0.3441498072720498
Epoch: 39, step: 1290, loss: 0.3269430696964264, mean loss: 0.3441495085802662
Epoch: 39, step: 1291, loss: 0.3063630163669586, mean loss: 0.344148852655877
Epoch: 39, step: 1292, loss: 0.29226887226104736, mean loss: 0.3441479521024844
Epoch: 39, step: 1293, loss: 0.3230181932449341, mean loss: 0.3441475853300689
Epoch: 39, step: 1294, loss: 0.3477996587753296, mean loss: 0.34414764872201564
Epoch: 39, step: 1295, loss: 0.36412501335144043, mean loss: 0.34414799547902164
Epoch: 39, step: 1296, loss: 0.3356688916683197, mean loss: 0.3441478483055745
Epoch: 39, step: 1297, loss: 0.3307727575302124, mean loss: 0.3441476161555628
Epoch: 39, step: 1298, loss: 0.3436376750469208, mean loss: 0.34414760730472344
Epoch: 39, step: 1299, loss: 0.34312042593955994, mean loss: 0.34414758947666585
Epoch: 39, step: 1300, loss: 0.3213483691215515, mean loss: 0.3441471937736554
Epoch: 39, step: 1301, loss: 0.3970833420753479, mean loss: 0.3441481125169006
Epoch: 39, step: 1302, loss: 0.3325136601924896, mean loss: 0.34414791059648675
Epoch: 39, step: 1303, loss: 0.36975252628326416, mean loss: 0.34414835496676943
Epoch: 39, step: 1304, loss: 0.3797507882118225, mean loss: 0.3441489728393028
Epoch: 39, step: 1305, loss: 0.35649773478507996, mean loss: 0.3441491871456779
Epoch: 39, step: 1306, loss: 0.3808521628379822, mean loss: 0.34414982409577927
Epoch: 39, step: 1307, loss: 0.35451292991638184, mean loss: 0.3441500039358775
Epoch: 39, step: 1308, loss: 0.31078699231147766, mean loss: 0.34414942496821377
Epoch: 39, step: 1309, loss: 0.3086310625076294, mean loss: 0.3441488086081947
Epoch: 39, step: 1310, loss: 0.33891749382019043, mean loss: 0.34414871782931
Epoch: 39, step: 1311, loss: 0.3098808825016022, mean loss: 0.3441481231906738
Epoch: 39, step: 1312, loss: 0.34280312061309814, mean loss: 0.3441480998516851
Epoch: 39, step: 1313, loss: 0.3309272229671478, mean loss: 0.3441478704420567
Epoch: 39, step: 1314, loss: 0.3430798649787903, mean loss: 0.34414785191026886
Epoch: 39, step: 1315, loss: 0.3424833416938782, mean loss: 0.34414782302856745
Epoch: 39, step: 1316, loss: 0.3093584179878235, mean loss: 0.3441472193916747
Epoch: 39, step: 1317, loss: 0.31761130690574646, mean loss: 0.344146758970526
Epoch: 39, step: 1318, loss: 0.3029276430606842, mean loss: 0.34414604379544295
Epoch: 39, step: 1319, loss: 0.3458802402019501, mean loss: 0.344146073884214
Epoch: 39, step: 1320, loss: 0.3847558796405792, mean loss: 0.3441467784629699
Epoch: 39, step: 1321, loss: 0.3410506248474121, mean loss: 0.34414672474574143
Epoch: 39, step: 1322, loss: 0.32461783289909363, mean loss: 0.3441463859318854
Epoch: 39, step: 1323, loss: 0.3325129747390747, mean loss: 0.34414618410309994
Epoch: 39, step: 1324, loss: 0.30549415946006775, mean loss: 0.3441455135383172
Epoch: 39, step: 1325, loss: 0.32065874338150024, mean loss: 0.3441451060789966
Epoch: 39, step: 1326, loss: 0.3491893708705902, mean loss: 0.34414519358771045
Epoch: 39, step: 1327, loss: 0.34786373376846313, mean loss: 0.3441452580964222
Epoch: 39, step: 1328, loss: 0.29392075538635254, mean loss: 0.3441443868239318
Epoch: 39, step: 1329, loss: 0.34862199425697327, mean loss: 0.34414446449814046
Epoch: 39, step: 1330, loss: 0.34295475482940674, mean loss: 0.34414444386029863
Epoch: 39, step: 1331, loss: 0.3123491406440735, mean loss: 0.34414389231812514
Epoch: 39, step: 1332, loss: 0.2998106777667999, mean loss: 0.34414312329846214
Epoch: 39, step: 1333, loss: 0.33598199486732483, mean loss: 0.3441429817350895
Epoch: 39, step: 1334, loss: 0.3390756845474243, mean loss: 0.34414289383900465
Epoch: 39, step: 1335, loss: 0.3236103951931, mean loss: 0.3441425376935345
Epoch: 39, step: 1336, loss: 0.3178568482398987, mean loss: 0.34414208176427746
Epoch: 39, step: 1337, loss: 0.335901141166687, mean loss: 0.3441419388263964
Epoch: 39, step: 1338, loss: 0.35224488377571106, mean loss: 0.34414207936832597
Epoch: 39, step: 1339, loss: 0.3392423391342163, mean loss: 0.34414199438601306
Epoch: 39, step: 1340, loss: 0.3245954215526581, mean loss: 0.3441416553712736
Epoch: 39, step: 1341, loss: 0.3244054317474365, mean loss: 0.3441413130731775
Epoch: 39, step: 1342, loss: 0.35396185517311096, mean loss: 0.3441414833942393
Epoch: 39, step: 1343, loss: 0.3462879955768585, mean loss: 0.3441415206212976
Epoch: 39, step: 1344, loss: 0.3158591389656067, mean loss: 0.3441410301271741
Epoch: 39, step: 1345, loss: 0.3128858208656311, mean loss: 0.344140488085461
Epoch: 39, step: 1346, loss: 0.3340629041194916, mean loss: 0.3441403133185573
Epoch: 39, step: 1347, loss: 0.31491532921791077, mean loss: 0.34413980650348897
Epoch: 39, step: 1348, loss: 0.3353496491909027, mean loss: 0.3441396540686097
Epoch: 39, step: 1349, loss: 0.35192951560020447, mean loss: 0.3441397891544754
Epoch: 39, step: 1350, loss: 0.3388403356075287, mean loss: 0.34413969725696825
Epoch: 39, step: 1351, loss: 0.33767399191856384, mean loss: 0.3441395851375027
Epoch: 39, step: 1352, loss: 0.29585036635398865, mean loss: 0.34413874778608716
Epoch: 39, step: 1353, loss: 0.35089412331581116, mean loss: 0.34413886492455653
Epoch: 39, step: 1354, loss: 0.3210912048816681, mean loss: 0.34413846528418196
Epoch: 39, step: 1355, loss: 0.31870996952056885, mean loss: 0.34413802436838636
Epoch: 39, step: 1356, loss: 0.3254415690898895, mean loss: 0.3441377001880025
Epoch: 39, step: 1357, loss: 0.3144664764404297, mean loss: 0.34413718572353413
Epoch: 39, step: 1358, loss: 0.3701803386211395, mean loss: 0.3441376372736494
Epoch: 39, step: 1359, loss: 0.301585853099823, mean loss: 0.3441368995008466
Epoch: 39, step: 1360, loss: 0.32493719458580017, mean loss: 0.34413656661763636
Epoch: 39, step: 1361, loss: 0.34572502970695496, mean loss: 0.34413659415782655
Epoch: 39, step: 1362, loss: 0.3121807873249054, mean loss: 0.3441360401293789
Epoch: 39, step: 1363, loss: 0.34786921739578247, mean loss: 0.34413610485159224
Epoch: 39, step: 1364, loss: 0.33768516778945923, mean loss: 0.34413599301342956
Epoch: 39, step: 1365, loss: 0.3511093556880951, mean loss: 0.34413611390664883
Epoch: 39, step: 1366, loss: 0.3375841975212097, mean loss: 0.3441360003217731
Epoch: 39, step: 1367, loss: 0.30559462308883667, mean loss: 0.3441353321750213
Epoch: 39, step: 1368, loss: 0.2911316752433777, mean loss: 0.3441344133285806
Epoch: 39, step: 1369, loss: 0.3266729414463043, mean loss: 0.3441341106299729
Epoch: 39, step: 1370, loss: 0.37160566449165344, mean loss: 0.3441345868473852
Epoch: 39, step: 1371, loss: 0.30601415038108826, mean loss: 0.3441339260438131
Epoch: 39, step: 1372, loss: 0.3425561785697937, mean loss: 0.3441338986946222
Epoch: 39, step: 1373, loss: 0.31979498267173767, mean loss: 0.3441334768032021
Epoch: 39, step: 1374, loss: 0.32474908232688904, mean loss: 0.3441331407994151
Epoch: 39, step: 1375, loss: 0.3626428246498108, mean loss: 0.3441334616356463
Epoch: 39, step: 1376, loss: 0.2826169431209564, mean loss: 0.34413239536212065
Epoch: 39, step: 1377, loss: 0.3189278244972229, mean loss: 0.34413195849570705
Epoch: 39, step: 1378, loss: 0.3733939528465271, mean loss: 0.34413246567994055
Epoch: 39, step: 1379, loss: 0.3674579858779907, mean loss: 0.3441328699630832
Epoch: 39, step: 1380, loss: 0.30145663022994995, mean loss: 0.3441321303017536
Epoch: 39, step: 1381, loss: 0.3735359311103821, mean loss: 0.3441326399173522
Epoch: 39, step: 1382, loss: 0.35443130135536194, mean loss: 0.344132818406779
Epoch: 39, step: 1383, loss: 0.35988661646842957, mean loss: 0.3441330914362081
Epoch: 39, step: 1384, loss: 0.3581099510192871, mean loss: 0.3441333336652784
Epoch: 39, step: 1385, loss: 0.32994315028190613, mean loss: 0.3441330877434146
Epoch: 39, step: 1386, loss: 0.34477880597114563, mean loss: 0.34413309893378996
Epoch: 39, step: 1387, loss: 0.3262663781642914, mean loss: 0.34413278930671437
Epoch: 39, step: 1388, loss: 0.3590804636478424, mean loss: 0.3441330483427484
Epoch: 39, step: 1389, loss: 0.32297655940055847, mean loss: 0.34413268171728584
Epoch: 39, step: 1390, loss: 0.3416450023651123, mean loss: 0.34413263860848875
Epoch: 39, step: 1391, loss: 0.3508414626121521, mean loss: 0.3441327548631502
Epoch: 39, step: 1392, loss: 0.385393351316452, mean loss: 0.34413346983995546
Epoch: 39, step: 1393, loss: 0.3383067846298218, mean loss: 0.34413336887504103
Epoch: 39, step: 1394, loss: 0.3308999538421631, mean loss: 0.3441331395701419
Epoch: 39, step: 1395, loss: 0.33793067932128906, mean loss: 0.34413303209751495
Epoch: 39, step: 1396, loss: 0.33090513944625854, mean loss: 0.3441328028962492
Epoch: 39, step: 1397, loss: 0.38030388951301575, mean loss: 0.34413342962610016
Epoch: 39, step: 1398, loss: 0.33754274249076843, mean loss: 0.3441333154324393
Epoch: 39, step: 1399, loss: 0.315799355506897, mean loss: 0.3441328245120719
Epoch: 39, step: 1400, loss: 0.33290237188339233, mean loss: 0.3441326299341723
Epoch: 39, step: 1401, loss: 0.33207011222839355, mean loss: 0.3441324209436026
Epoch: 39, step: 1402, loss: 0.379453182220459, mean loss: 0.3441330328870056
Epoch: 39, step: 1403, loss: 0.3373572528362274, mean loss: 0.3441329154964988
Epoch: 39, step: 1404, loss: 0.3492111563682556, mean loss: 0.3441330034755857
Epoch: 39, step: 1405, loss: 0.30942943692207336, mean loss: 0.34413240225652614
Epoch: 39, step: 1406, loss: 0.3228452801704407, mean loss: 0.3441320334759346
Epoch: 39, step: 1407, loss: 0.34219396114349365, mean loss: 0.3441319999011246
Epoch: 39, step: 1408, loss: 0.34861278533935547, mean loss: 0.3441320775240858
Epoch: 39, step: 1409, loss: 0.2892400920391083, mean loss: 0.344131126618333
Epoch: 39, step: 1410, loss: 0.3482091724872589, mean loss: 0.344131197261981
Epoch: 39, step: 1411, loss: 0.292116641998291, mean loss: 0.34413029623379254
Epoch: 39, step: 1412, loss: 0.33918628096580505, mean loss: 0.34413021059199606
Epoch: 39, step: 1413, loss: 0.3433854281902313, mean loss: 0.34413019769086317
Epoch: 39, step: 1414, loss: 0.31927379965782166, mean loss: 0.3441297671353898
Epoch: 39, step: 1415, loss: 0.33874350786209106, mean loss: 0.34412967383775117
Epoch: 39, step: 1416, loss: 0.37839335203170776, mean loss: 0.3441302673229017
Epoch: 39, step: 1417, loss: 0.3115265965461731, mean loss: 0.3441297026007141
Epoch: 39, step: 1418, loss: 0.3221251666545868, mean loss: 0.3441293214707939
Epoch: 39, step: 1419, loss: 0.30333632230758667, mean loss: 0.34412861492723074
Epoch: 39, step: 1420, loss: 0.279554158449173, mean loss: 0.3441274965030577
Epoch: 39, step: 1421, loss: 0.3119416832923889, mean loss: 0.3441269390571259
Epoch: 39, step: 1422, loss: 0.30853572487831116, mean loss: 0.3441263226416324
Epoch: 39, step: 1423, loss: 0.3039456307888031, mean loss: 0.34412562675157604
Epoch: 39, step: 1424, loss: 0.3166232407093048, mean loss: 0.3441251504455536
Epoch: 39, step: 1425, loss: 0.29336097836494446, mean loss: 0.34412427129048306
Epoch: 39, step: 1426, loss: 0.2966274917125702, mean loss: 0.3441234487357218
Epoch: 39, step: 1427, loss: 0.3491453230381012, mean loss: 0.3441235357036198
Epoch: 39, step: 1428, loss: 0.31226831674575806, mean loss: 0.34412298405033453
Epoch: 39, step: 1429, loss: 0.3229277431964874, mean loss: 0.34412261700775404
Epoch: 39, step: 1430, loss: 0.3657125234603882, mean loss: 0.3441229908783699
Epoch: 39, step: 1431, loss: 0.3366815745830536, mean loss: 0.3441228620182138
Epoch: 39, step: 1432, loss: 0.31723904609680176, mean loss: 0.3441223964895307
Epoch: 39, step: 1433, loss: 0.40486013889312744, mean loss: 0.34412344822532986
Epoch: 39, step: 1434, loss: 0.352817565202713, mean loss: 0.34412359877020315
Epoch: 39, step: 1435, loss: 0.31244486570358276, mean loss: 0.34412305023970957
Epoch: 39, step: 1436, loss: 0.347842276096344, mean loss: 0.3441231146385435
Epoch: 39, step: 1437, loss: 0.3198838233947754, mean loss: 0.34412269493962666
Epoch: 39, step: 1438, loss: 0.2964722812175751, mean loss: 0.3441218698956699
Epoch: 39, step: 1439, loss: 0.39554357528686523, mean loss: 0.3441227602223094
Epoch: 39, step: 1440, loss: 0.36521774530410767, mean loss: 0.34412312545916524
Epoch: 39, step: 1441, loss: 0.3040635585784912, mean loss: 0.3441224318830913
Epoch: 39, step: 1442, loss: 0.35411807894706726, mean loss: 0.34412260494091884
Epoch: 39, step: 1443, loss: 0.3471023440361023, mean loss: 0.3441226565291996
Valid: 39, mean loss: 0.1851575324932734
Epoch: 40, step: 0, loss: 0.34136128425598145, mean loss: 0.3441226087223356
Epoch: 40, step: 1, loss: 0.33874809741973877, mean loss: 0.344122515676539
Epoch: 40, step: 2, loss: 0.27767473459243774, mean loss: 0.34412136532456483
Epoch: 40, step: 3, loss: 0.3210468292236328, mean loss: 0.3441209658623375
Epoch: 40, step: 4, loss: 0.2928787171840668, mean loss: 0.34412007878108275
Epoch: 40, step: 5, loss: 0.32635438442230225, mean loss: 0.34411977123521914
Epoch: 40, step: 6, loss: 0.3277493417263031, mean loss: 0.3441194878479996
Epoch: 40, step: 7, loss: 0.3281409442424774, mean loss: 0.34411921124947437
Epoch: 40, step: 8, loss: 0.3579123914241791, mean loss: 0.34411945001386657
Epoch: 40, step: 9, loss: 0.3253891170024872, mean loss: 0.34411912579138065
Epoch: 40, step: 10, loss: 0.32536986470222473, mean loss: 0.34411880124686717
Epoch: 40, step: 11, loss: 0.3127621114253998, mean loss: 0.3441182584806513
Epoch: 40, step: 12, loss: 0.3244832754135132, mean loss: 0.34411791861630175
Epoch: 40, step: 13, loss: 0.3514486849308014, mean loss: 0.344118045503246
Epoch: 40, step: 14, loss: 0.3548959791660309, mean loss: 0.3441182320533743
Epoch: 40, step: 15, loss: 0.31327739357948303, mean loss: 0.3441176982532068
Epoch: 40, step: 16, loss: 0.29744598269462585, mean loss: 0.3441168904626404
Epoch: 40, step: 17, loss: 0.3207376301288605, mean loss: 0.34411648582315246
Epoch: 40, step: 18, loss: 0.34691381454467773, mean loss: 0.3441165342374331
Epoch: 40, step: 19, loss: 0.34530526399612427, mean loss: 0.3441165548108107
Epoch: 40, step: 20, loss: 0.3232592046260834, mean loss: 0.3441161938383425
Epoch: 40, step: 21, loss: 0.3592453896999359, mean loss: 0.34411645567067545
Epoch: 40, step: 22, loss: 0.3328028619289398, mean loss: 0.3441162598761729
Epoch: 40, step: 23, loss: 0.3406517207622528, mean loss: 0.3441161999194528
Epoch: 40, step: 24, loss: 0.351430743932724, mean loss: 0.3441163265015072
Epoch: 40, step: 25, loss: 0.32505232095718384, mean loss: 0.34411599659451336
Epoch: 40, step: 26, loss: 0.3621215522289276, mean loss: 0.34411630817939637
Epoch: 40, step: 27, loss: 0.2956378161907196, mean loss: 0.34411546927699466
Epoch: 40, step: 28, loss: 0.3361753225326538, mean loss: 0.34411533187806503
Epoch: 40, step: 29, loss: 0.3588554859161377, mean loss: 0.3441155869421598
Epoch: 40, step: 30, loss: 0.36604446172714233, mean loss: 0.34411596639354125
Epoch: 40, step: 31, loss: 0.33000800013542175, mean loss: 0.3441157222772923
Epoch: 40, step: 32, loss: 0.3232448995113373, mean loss: 0.3441153611466577
Epoch: 40, step: 33, loss: 0.3260047137737274, mean loss: 0.3441150477811289
Epoch: 40, step: 34, loss: 0.3337940573692322, mean loss: 0.3441148692018329
Epoch: 40, step: 35, loss: 0.38542625308036804, mean loss: 0.34411558398112346
Epoch: 40, step: 36, loss: 0.3525993227958679, mean loss: 0.3441157307662302
Epoch: 40, step: 37, loss: 0.3061070442199707, mean loss: 0.3441150731537428
Epoch: 40, step: 38, loss: 0.3565734624862671, mean loss: 0.34411528870054003
Epoch: 40, step: 39, loss: 0.32046815752983093, mean loss: 0.3441148795806236
Epoch: 40, step: 40, loss: 0.33371952176094055, mean loss: 0.3441146997332538
Epoch: 40, step: 41, loss: 0.36973336338996887, mean loss: 0.3441151429473927
Epoch: 40, step: 42, loss: 0.32311317324638367, mean loss: 0.34411477961037384
Epoch: 40, step: 43, loss: 0.3552655577659607, mean loss: 0.3441149725170612
Epoch: 40, step: 44, loss: 0.3455449640750885, mean loss: 0.34411499725525957
Epoch: 40, step: 45, loss: 0.3321320712566376, mean loss: 0.34411478995971934
Epoch: 40, step: 46, loss: 0.31695979833602905, mean loss: 0.3441143202070661
Epoch: 40, step: 47, loss: 0.3174039125442505, mean loss: 0.3441138581532386
Epoch: 40, step: 48, loss: 0.3042359948158264, mean loss: 0.3441131683322187
Epoch: 40, step: 49, loss: 0.3463415503501892, mean loss: 0.34411320687887187
Epoch: 40, step: 50, loss: 0.3211601972579956, mean loss: 0.34411280984353915
Epoch: 40, step: 51, loss: 0.32350924611091614, mean loss: 0.3441124534544896
Epoch: 40, step: 52, loss: 0.324663370847702, mean loss: 0.3441121170408351
Epoch: 40, step: 53, loss: 0.3387453854084015, mean loss: 0.34411202421329107
Epoch: 40, step: 54, loss: 0.38966163992881775, mean loss: 0.34411281206446664
Epoch: 40, step: 55, loss: 0.3215444087982178, mean loss: 0.34411242171571776
Epoch: 40, step: 56, loss: 0.3457161784172058, mean loss: 0.3441124494542151
Epoch: 40, step: 57, loss: 0.34170934557914734, mean loss: 0.34411240789096703
Epoch: 40, step: 58, loss: 0.33007892966270447, mean loss: 0.34411216517701093
Epoch: 40, step: 59, loss: 0.3176019787788391, mean loss: 0.3441117066819158
Epoch: 40, step: 60, loss: 0.3203604221343994, mean loss: 0.34411129590928047
Epoch: 40, step: 61, loss: 0.31465211510658264, mean loss: 0.344110786428792
Epoch: 40, step: 62, loss: 0.3057806193828583, mean loss: 0.34411012354089193
Epoch: 40, step: 63, loss: 0.3352707326412201, mean loss: 0.3441099706737278
Epoch: 40, step: 64, loss: 0.3368189334869385, mean loss: 0.3441098445857522
Epoch: 40, step: 65, loss: 0.3132883608341217, mean loss: 0.34410931158184827
Epoch: 40, step: 66, loss: 0.3459870517253876, mean loss: 0.34410934405353355
Epoch: 40, step: 67, loss: 0.3242298364639282, mean loss: 0.3441090002839481
Epoch: 40, step: 68, loss: 0.32059547305107117, mean loss: 0.3441085936795241
Epoch: 40, step: 69, loss: 0.33563169836997986, mean loss: 0.3441084470965169
Epoch: 40, step: 70, loss: 0.3308122456073761, mean loss: 0.34410821718173956
Epoch: 40, step: 71, loss: 0.32767969369888306, mean loss: 0.34410793310850185
Epoch: 40, step: 72, loss: 0.33181032538414, mean loss: 0.344107720468526
Epoch: 40, step: 73, loss: 0.350197434425354, mean loss: 0.34410782576495985
Epoch: 40, step: 74, loss: 0.32820695638656616, mean loss: 0.3441075508298967
Epoch: 40, step: 75, loss: 0.3524567782878876, mean loss: 0.34410769519028567
Epoch: 40, step: 76, loss: 0.299385130405426, mean loss: 0.34410692193847825
Epoch: 40, step: 77, loss: 0.3242047131061554, mean loss: 0.3441065778358324
Epoch: 40, step: 78, loss: 0.30756551027297974, mean loss: 0.34410594606371386
Epoch: 40, step: 79, loss: 0.32298731803894043, mean loss: 0.34410558094220584
Epoch: 40, step: 80, loss: 0.37515705823898315, mean loss: 0.3441061177841916
Epoch: 40, step: 81, loss: 0.3517991006374359, mean loss: 0.3441062507841372
Epoch: 40, step: 82, loss: 0.34822219610214233, mean loss: 0.3441063219413268
Epoch: 40, step: 83, loss: 0.35035285353660583, mean loss: 0.3441064299306013
Epoch: 40, step: 84, loss: 0.35914772748947144, mean loss: 0.34410668995821925
Epoch: 40, step: 85, loss: 0.31244412064552307, mean loss: 0.3441061425985174
Epoch: 40, step: 86, loss: 0.3349711000919342, mean loss: 0.34410598468120956
Epoch: 40, step: 87, loss: 0.32135167717933655, mean loss: 0.3441055913347239
Epoch: 40, step: 88, loss: 0.3519284129142761, mean loss: 0.3441057265630179
Epoch: 40, step: 89, loss: 0.3540993928909302, mean loss: 0.3441058993143805
Epoch: 40, step: 90, loss: 0.3137357831001282, mean loss: 0.34410537434305394
Epoch: 40, step: 91, loss: 0.31118521094322205, mean loss: 0.344104805301994
Epoch: 40, step: 92, loss: 0.3469429016113281, mean loss: 0.34410485435902316
Epoch: 40, step: 93, loss: 0.31640270352363586, mean loss: 0.3441043755304057
Epoch: 40, step: 94, loss: 0.33065709471702576, mean loss: 0.34410414309965964
Epoch: 40, step: 95, loss: 0.32746386528015137, mean loss: 0.3441038554842383
Epoch: 40, step: 96, loss: 0.3391779363155365, mean loss: 0.3441037703446844
Epoch: 40, step: 97, loss: 0.34286195039749146, mean loss: 0.34410374888144774
Epoch: 40, step: 98, loss: 0.3726534843444824, mean loss: 0.34410424231782694
Epoch: 40, step: 99, loss: 0.33524978160858154, mean loss: 0.34410408928532243
Epoch: 40, step: 100, loss: 0.34073150157928467, mean loss: 0.3441040309975689
Epoch: 40, step: 101, loss: 0.2981131672859192, mean loss: 0.3441032361604787
Epoch: 40, step: 102, loss: 0.29650282859802246, mean loss: 0.3441024135206646
Epoch: 40, step: 103, loss: 0.3259607255458832, mean loss: 0.3441020999977838
Epoch: 40, step: 104, loss: 0.37707391381263733, mean loss: 0.3441026698036045
Epoch: 40, step: 105, loss: 0.3431089222431183, mean loss: 0.3441026526303497
Epoch: 40, step: 106, loss: 0.33214977383613586, mean loss: 0.34410244607257423
Epoch: 40, step: 107, loss: 0.3291305601596832, mean loss: 0.3441021873477883
Epoch: 40, step: 108, loss: 0.3406047224998474, mean loss: 0.34410212691016456
Epoch: 40, step: 109, loss: 0.320531964302063, mean loss: 0.344101719615148
Epoch: 40, step: 110, loss: 0.29904285073280334, mean loss: 0.344100941006365
Epoch: 40, step: 111, loss: 0.3333330452442169, mean loss: 0.3441007549423658
Epoch: 40, step: 112, loss: 0.3582090139389038, mean loss: 0.3441009987220039
Epoch: 40, step: 113, loss: 0.3491722047328949, mean loss: 0.3441010863469479
Epoch: 40, step: 114, loss: 0.3370589315891266, mean loss: 0.344100964668248
Epoch: 40, step: 115, loss: 0.33802318572998047, mean loss: 0.3441008596544437
Epoch: 40, step: 116, loss: 0.322427898645401, mean loss: 0.3441004851885763
Epoch: 40, step: 117, loss: 0.347773015499115, mean loss: 0.3441005486415344
Epoch: 40, step: 118, loss: 0.30318692326545715, mean loss: 0.34409984175949815
Epoch: 40, step: 119, loss: 0.3091946542263031, mean loss: 0.34409923869820697
Epoch: 40, step: 120, loss: 0.31777626276016235, mean loss: 0.3440987839207163
Epoch: 40, step: 121, loss: 0.3558899760246277, mean loss: 0.34409898763157815
Epoch: 40, step: 122, loss: 0.2977074086666107, mean loss: 0.3440981861600068
Epoch: 40, step: 123, loss: 0.36314141750335693, mean loss: 0.3440985151495608
Epoch: 40, step: 124, loss: 0.2978784739971161, mean loss: 0.34409771666910555
Epoch: 40, step: 125, loss: 0.3215347230434418, mean loss: 0.3440973268858484
Epoch: 40, step: 126, loss: 0.3149562478065491, mean loss: 0.3440968234726627
Epoch: 40, step: 127, loss: 0.3321145474910736, mean loss: 0.34409661648199136
Epoch: 40, step: 128, loss: 0.28772789239883423, mean loss: 0.344095642743905
Epoch: 40, step: 129, loss: 0.3544301986694336, mean loss: 0.3440958212644772
Epoch: 40, step: 130, loss: 0.3413729965686798, mean loss: 0.344095774230833
Epoch: 40, step: 131, loss: 0.3624417185783386, mean loss: 0.344096091130307
Epoch: 40, step: 132, loss: 0.3141675889492035, mean loss: 0.34409557416794223
Epoch: 40, step: 133, loss: 0.355074405670166, mean loss: 0.3440957638047181
Epoch: 40, step: 134, loss: 0.33381086587905884, mean loss: 0.3440955861572887
Epoch: 40, step: 135, loss: 0.2990155816078186, mean loss: 0.3440948075196531
Epoch: 40, step: 136, loss: 0.34498488903045654, mean loss: 0.3440948228931873
Epoch: 40, step: 137, loss: 0.31642845273017883, mean loss: 0.34409434504645403
Epoch: 40, step: 138, loss: 0.35490405559539795, mean loss: 0.3440945317458884
Epoch: 40, step: 139, loss: 0.3313351571559906, mean loss: 0.34409431137672447
Epoch: 40, step: 140, loss: 0.3446148633956909, mean loss: 0.3440943203671049
Epoch: 40, step: 141, loss: 0.3274663984775543, mean loss: 0.34409403319357224
Epoch: 40, step: 142, loss: 0.28726306557655334, mean loss: 0.3440930517078527
Epoch: 40, step: 143, loss: 0.3660571575164795, mean loss: 0.34409343102717105
Epoch: 40, step: 144, loss: 0.30380281805992126, mean loss: 0.34409273522174894
Epoch: 40, step: 145, loss: 0.3369060456752777, mean loss: 0.3440926111121654
Epoch: 40, step: 146, loss: 0.3465309143066406, mean loss: 0.34409265321939236
Epoch: 40, step: 147, loss: 0.31491419672966003, mean loss: 0.3440921493433046
Epoch: 40, step: 148, loss: 0.305116206407547, mean loss: 0.3440914762882884
Epoch: 40, step: 149, loss: 0.3170425593852997, mean loss: 0.3440910092028644
Epoch: 40, step: 150, loss: 0.3076443076133728, mean loss: 0.34409037984572
Epoch: 40, step: 151, loss: 0.3307173252105713, mean loss: 0.3440901489254507
Epoch: 40, step: 152, loss: 0.30590713024139404, mean loss: 0.34408948960856706
Epoch: 40, step: 153, loss: 0.337828665971756, mean loss: 0.34408938150303753
Epoch: 40, step: 154, loss: 0.3550489544868469, mean loss: 0.34408957073852026
Epoch: 40, step: 155, loss: 0.3038809597492218, mean loss: 0.3440888764811304
Epoch: 40, step: 156, loss: 0.3105338215827942, mean loss: 0.3440882971166105
Epoch: 40, step: 157, loss: 0.2866981625556946, mean loss: 0.34408730623062406
Epoch: 40, step: 158, loss: 0.3105785548686981, mean loss: 0.34408672768556353
Epoch: 40, step: 159, loss: 0.3335464894771576, mean loss: 0.3440865457063127
Epoch: 40, step: 160, loss: 0.35149040818214417, mean loss: 0.3440866735332231
Epoch: 40, step: 161, loss: 0.30905869603157043, mean loss: 0.3440860687893002
Epoch: 40, step: 162, loss: 0.3163575530052185, mean loss: 0.34408559007590855
Epoch: 40, step: 163, loss: 0.3124244511127472, mean loss: 0.34408504347797053
Epoch: 40, step: 164, loss: 0.3224821090698242, mean loss: 0.3440846705313256
Epoch: 40, step: 165, loss: 0.32479768991470337, mean loss: 0.3440843375723673
Epoch: 40, step: 166, loss: 0.3106193542480469, mean loss: 0.34408375986277895
Epoch: 40, step: 167, loss: 0.30305248498916626, mean loss: 0.3440830515477176
Epoch: 40, step: 168, loss: 0.36010637879371643, mean loss: 0.3440833281505805
Epoch: 40, step: 169, loss: 0.3445374369621277, mean loss: 0.3440833359895035
Epoch: 40, step: 170, loss: 0.3605780601501465, mean loss: 0.34408362072003057
Epoch: 40, step: 171, loss: 0.33336368203163147, mean loss: 0.3440834356765539
Epoch: 40, step: 172, loss: 0.3255557119846344, mean loss: 0.3440831158636029
Epoch: 40, step: 173, loss: 0.3979577124118805, mean loss: 0.344084045794154
Epoch: 40, step: 174, loss: 0.34177032113075256, mean loss: 0.34408400585759297
Epoch: 40, step: 175, loss: 0.31492340564727783, mean loss: 0.34408350253323144
Epoch: 40, step: 176, loss: 0.29249489307403564, mean loss: 0.3440826121072608
Epoch: 40, step: 177, loss: 0.3414536416530609, mean loss: 0.3440825667316791
Epoch: 40, step: 178, loss: 0.30688396096229553, mean loss: 0.3440819247011682
Epoch: 40, step: 179, loss: 0.3361070156097412, mean loss: 0.34408178706034853
Epoch: 40, step: 180, loss: 0.3371388018131256, mean loss: 0.34408166723181177
Epoch: 40, step: 181, loss: 0.32053157687187195, mean loss: 0.3440812607893286
Epoch: 40, step: 182, loss: 0.2990482449531555, mean loss: 0.3440804835942259
Epoch: 40, step: 183, loss: 0.32572197914123535, mean loss: 0.3440801667623804
Epoch: 40, step: 184, loss: 0.3099738359451294, mean loss: 0.3440795781640403
Epoch: 40, step: 185, loss: 0.32197660207748413, mean loss: 0.34407919672311105
Epoch: 40, step: 186, loss: 0.31746047735214233, mean loss: 0.3440787373599107
Epoch: 40, step: 187, loss: 0.34295159578323364, mean loss: 0.34407871790899647
Epoch: 40, step: 188, loss: 0.33528614044189453, mean loss: 0.34407856617941585
Epoch: 40, step: 189, loss: 0.322119802236557, mean loss: 0.34407818725337713
Epoch: 40, step: 190, loss: 0.3307859003543854, mean loss: 0.3440779578822377
Epoch: 40, step: 191, loss: 0.3400370180606842, mean loss: 0.34407788815315465
Epoch: 40, step: 192, loss: 0.30827945470809937, mean loss: 0.34407727043822284
Epoch: 40, step: 193, loss: 0.3306019604206085, mean loss: 0.3440770379208812
Epoch: 40, step: 194, loss: 0.3777323365211487, mean loss: 0.34407761863520436
Epoch: 40, step: 195, loss: 0.2833729684352875, mean loss: 0.34407657120870494
Epoch: 40, step: 196, loss: 0.3362457752227783, mean loss: 0.3440764360948104
Epoch: 40, step: 197, loss: 0.3290212154388428, mean loss: 0.3440761763339378
Epoch: 40, step: 198, loss: 0.3074239194393158, mean loss: 0.3440755439514451
Epoch: 40, step: 199, loss: 0.323007196187973, mean loss: 0.34407518045338154
Epoch: 40, step: 200, loss: 0.3187595307826996, mean loss: 0.34407474368297264
Epoch: 40, step: 201, loss: 0.27709537744522095, mean loss: 0.3440735881092133
Epoch: 40, step: 202, loss: 0.33034324645996094, mean loss: 0.34407335122807103
Epoch: 40, step: 203, loss: 0.3256795108318329, mean loss: 0.344073033895927
Epoch: 40, step: 204, loss: 0.336169958114624, mean loss: 0.3440728975537243
Epoch: 40, step: 205, loss: 0.33055809140205383, mean loss: 0.34407266440315065
Epoch: 40, step: 206, loss: 0.31894204020500183, mean loss: 0.34407223086986105
Epoch: 40, step: 207, loss: 0.33298298716545105, mean loss: 0.34407203957045956
Epoch: 40, step: 208, loss: 0.31874504685401917, mean loss: 0.34407160266465275
Epoch: 40, step: 209, loss: 0.32522985339164734, mean loss: 0.34407127763878986
Epoch: 40, step: 210, loss: 0.31502434611320496, mean loss: 0.3440707765790958
Epoch: 40, step: 211, loss: 0.301866352558136, mean loss: 0.34407004856515766
Epoch: 40, step: 212, loss: 0.3066819906234741, mean loss: 0.34406940364324673
Epoch: 40, step: 213, loss: 0.35235294699668884, mean loss: 0.34406954652701105
Epoch: 40, step: 214, loss: 0.3401445150375366, mean loss: 0.3440694788248724
Epoch: 40, step: 215, loss: 0.3051050901412964, mean loss: 0.34406880674696627
Epoch: 40, step: 216, loss: 0.3207930326461792, mean loss: 0.3440684052813144
Epoch: 40, step: 217, loss: 0.3252275884151459, mean loss: 0.3440680803163817
Epoch: 40, step: 218, loss: 0.3119196593761444, mean loss: 0.3440675258325006
Epoch: 40, step: 219, loss: 0.336648553609848, mean loss: 0.3440673978750632
Epoch: 40, step: 220, loss: 0.3352499306201935, mean loss: 0.34406724579994796
Epoch: 40, step: 221, loss: 0.33410531282424927, mean loss: 0.34406707398916225
Epoch: 40, step: 222, loss: 0.32405078411102295, mean loss: 0.3440667287795339
Epoch: 40, step: 223, loss: 0.36029940843582153, mean loss: 0.34406700873054896
Epoch: 40, step: 224, loss: 0.3366037905216217, mean loss: 0.34406688002108604
Epoch: 40, step: 225, loss: 0.3191404938697815, mean loss: 0.34406645015204607
Epoch: 40, step: 226, loss: 0.3109598159790039, mean loss: 0.34406587922004106
Epoch: 40, step: 227, loss: 0.3527306020259857, mean loss: 0.3440660286427286
Epoch: 40, step: 228, loss: 0.3509809672832489, mean loss: 0.3440661478884242
Epoch: 40, step: 229, loss: 0.33518731594085693, mean loss: 0.3440659947787165
Epoch: 40, step: 230, loss: 0.3429562747478485, mean loss: 0.34406597564264313
Epoch: 40, step: 231, loss: 0.33799803256988525, mean loss: 0.34406587100850267
Epoch: 40, step: 232, loss: 0.3400736153125763, mean loss: 0.3440658021681996
Epoch: 40, step: 233, loss: 0.3193298280239105, mean loss: 0.3440653756417633
Epoch: 40, step: 234, loss: 0.3204042315483093, mean loss: 0.3440649676558319
Epoch: 40, step: 235, loss: 0.34451037645339966, mean loss: 0.3440649753358236
Epoch: 40, step: 236, loss: 0.35170185565948486, mean loss: 0.34406510701298487
Epoch: 40, step: 237, loss: 0.30584368109703064, mean loss: 0.3440644480001583
Epoch: 40, step: 238, loss: 0.327502578496933, mean loss: 0.3440641624457607
Epoch: 40, step: 239, loss: 0.32199302315711975, mean loss: 0.34406378190887643
Epoch: 40, step: 240, loss: 0.31632545590400696, mean loss: 0.34406330367012183
Epoch: 40, step: 241, loss: 0.33200567960739136, mean loss: 0.34406309578722016
Epoch: 40, step: 242, loss: 0.3318469226360321, mean loss: 0.3440628851744389
Epoch: 40, step: 243, loss: 0.3331068158149719, mean loss: 0.34406269628971786
Epoch: 40, step: 244, loss: 0.3390127122402191, mean loss: 0.3440626092285326
Epoch: 40, step: 245, loss: 0.3219865560531616, mean loss: 0.3440622286462967
Epoch: 40, step: 246, loss: 0.364623099565506, mean loss: 0.3440625831012921
Epoch: 40, step: 247, loss: 0.3204185664653778, mean loss: 0.3440621755020535
Epoch: 40, step: 248, loss: 0.28053611516952515, mean loss: 0.3440610803950816
Epoch: 40, step: 249, loss: 0.3517635762691498, mean loss: 0.3440612131738417
Epoch: 40, step: 250, loss: 0.36564114689826965, mean loss: 0.34406158517111335
Epoch: 40, step: 251, loss: 0.3152618408203125, mean loss: 0.34406108872650965
Epoch: 40, step: 252, loss: 0.33764007687568665, mean loss: 0.34406097804421687
Epoch: 40, step: 253, loss: 0.3717249631881714, mean loss: 0.34406145489437623
Epoch: 40, step: 254, loss: 0.31643351912498474, mean loss: 0.3440609786738166
Epoch: 40, step: 255, loss: 0.3413657546043396, mean loss: 0.34406093221725165
Epoch: 40, step: 256, loss: 0.3178403675556183, mean loss: 0.3440604802710176
Epoch: 40, step: 257, loss: 0.3238241970539093, mean loss: 0.344060131477829
Epoch: 40, step: 258, loss: 0.3355244994163513, mean loss: 0.3440599843599528
Epoch: 40, step: 259, loss: 0.3643498122692108, mean loss: 0.3440603340639843
Epoch: 40, step: 260, loss: 0.3192830979824066, mean loss: 0.3440599070248764
Epoch: 40, step: 261, loss: 0.3584796190261841, mean loss: 0.3440601555463338
Epoch: 40, step: 262, loss: 0.32088395953178406, mean loss: 0.34405975611514245
Epoch: 40, step: 263, loss: 0.29371413588523865, mean loss: 0.3440588884462428
Epoch: 40, step: 264, loss: 0.31449395418167114, mean loss: 0.34405837892561786
Epoch: 40, step: 265, loss: 0.34213367104530334, mean loss: 0.3440583457558684
Epoch: 40, step: 266, loss: 0.3519197702407837, mean loss: 0.3440584812346022
Epoch: 40, step: 267, loss: 0.37626203894615173, mean loss: 0.3440590362004413
Epoch: 40, step: 268, loss: 0.3455515503883362, mean loss: 0.3440590619205845
Epoch: 40, step: 269, loss: 0.39098429679870605, mean loss: 0.3440598705580975
Epoch: 40, step: 270, loss: 0.3137563169002533, mean loss: 0.3440593483621392
Epoch: 40, step: 271, loss: 0.3349471688270569, mean loss: 0.3440591913422272
Epoch: 40, step: 272, loss: 0.3409978449344635, mean loss: 0.34405913859040654
Epoch: 40, step: 273, loss: 0.39767253398895264, mean loss: 0.3440600624177388
Epoch: 40, step: 274, loss: 0.3392907977104187, mean loss: 0.34405998023862777
Epoch: 40, step: 275, loss: 0.317542165517807, mean loss: 0.3440595233185313
Epoch: 40, step: 276, loss: 0.35334497690200806, mean loss: 0.34405968331049475
Epoch: 40, step: 277, loss: 0.33993667364120483, mean loss: 0.34405961227066445
Epoch: 40, step: 278, loss: 0.33814045786857605, mean loss: 0.3440595102848549
Epoch: 40, step: 279, loss: 0.32038411498069763, mean loss: 0.3440591023697049
Epoch: 40, step: 280, loss: 0.3315388262271881, mean loss: 0.34405888665536255
Epoch: 40, step: 281, loss: 0.38651445508003235, mean loss: 0.3440596181182416
Epoch: 40, step: 282, loss: 0.2997826933860779, mean loss: 0.34405885528853375
Epoch: 40, step: 283, loss: 0.3115611672401428, mean loss: 0.3440582954083041
Epoch: 40, step: 284, loss: 0.32496511936187744, mean loss: 0.34405796647082376
Epoch: 40, step: 285, loss: 0.34005141258239746, mean loss: 0.34405789744705145
Epoch: 40, step: 286, loss: 0.37619900703430176, mean loss: 0.3440584511554186
Epoch: 40, step: 287, loss: 0.32682231068611145, mean loss: 0.34405815422631736
Epoch: 40, step: 288, loss: 0.36105531454086304, mean loss: 0.344058447033434
Epoch: 40, step: 289, loss: 0.3303339183330536, mean loss: 0.34405821060744435
Epoch: 40, step: 290, loss: 0.3419229984283447, mean loss: 0.34405817382578374
Epoch: 40, step: 291, loss: 0.3566800057888031, mean loss: 0.34405839124864535
Epoch: 40, step: 292, loss: 0.3138481080532074, mean loss: 0.3440578708572238
Epoch: 40, step: 293, loss: 0.3466135859489441, mean loss: 0.3440579148802901
Epoch: 40, step: 294, loss: 0.30261465907096863, mean loss: 0.34405720101833487
Epoch: 40, step: 295, loss: 0.3182857036590576, mean loss: 0.3440567571107739
Epoch: 40, step: 296, loss: 0.3320826590061188, mean loss: 0.34405655086349785
Epoch: 40, step: 297, loss: 0.2983899414539337, mean loss: 0.34405576429473195
Epoch: 40, step: 298, loss: 0.346145898103714, mean loss: 0.3440558002949009
Epoch: 40, step: 299, loss: 0.3266862630844116, mean loss: 0.34405550112960276
Epoch: 40, step: 300, loss: 0.34540262818336487, mean loss: 0.34405552433152925
Epoch: 40, step: 301, loss: 0.3667575716972351, mean loss: 0.3440559153281771
Epoch: 40, step: 302, loss: 0.30719542503356934, mean loss: 0.34405528049204576
Epoch: 40, step: 303, loss: 0.32066336274147034, mean loss: 0.344054877627659
Epoch: 40, step: 304, loss: 0.3392397463321686, mean loss: 0.34405479470108885
Epoch: 40, step: 305, loss: 0.3297540843486786, mean loss: 0.34405454841737115
Epoch: 40, step: 306, loss: 0.34046417474746704, mean loss: 0.34405448658580295
Epoch: 40, step: 307, loss: 0.2944873869419098, mean loss: 0.3440536329814142
Epoch: 40, step: 308, loss: 0.3067096471786499, mean loss: 0.34405298988465344
Epoch: 40, step: 309, loss: 0.3199208080768585, mean loss: 0.34405257431410396
Epoch: 40, step: 310, loss: 0.3416723906993866, mean loss: 0.3440525333266298
Epoch: 40, step: 311, loss: 0.3814246654510498, mean loss: 0.34405317687484793
Epoch: 40, step: 312, loss: 0.32681456208229065, mean loss: 0.34405288003096535
Epoch: 40, step: 313, loss: 0.345929890871048, mean loss: 0.34405291235198404
Epoch: 40, step: 314, loss: 0.3055382966995239, mean loss: 0.34405224916445665
Epoch: 40, step: 315, loss: 0.345177561044693, mean loss: 0.3440522685409957
Epoch: 40, step: 316, loss: 0.3175230622291565, mean loss: 0.34405181174731986
Epoch: 40, step: 317, loss: 0.3457268476486206, mean loss: 0.34405184058846283
Epoch: 40, step: 318, loss: 0.3551653325557709, mean loss: 0.34405203193975964
Epoch: 40, step: 319, loss: 0.3214600086212158, mean loss: 0.3440516429586419
Epoch: 40, step: 320, loss: 0.3193386495113373, mean loss: 0.34405121746676937
Epoch: 40, step: 321, loss: 0.37964287400245667, mean loss: 0.34405183024967173
Epoch: 40, step: 322, loss: 0.3118498623371124, mean loss: 0.34405127583671247
Epoch: 40, step: 323, loss: 0.36771586537361145, mean loss: 0.3440516832568202
Epoch: 40, step: 324, loss: 0.375363826751709, mean loss: 0.3440522223313402
Epoch: 40, step: 325, loss: 0.32770437002182007, mean loss: 0.3440519408891285
Epoch: 40, step: 326, loss: 0.31433144211769104, mean loss: 0.3440514292342183
Epoch: 40, step: 327, loss: 0.3318895995616913, mean loss: 0.3440512198651632
Epoch: 40, step: 328, loss: 0.3182838261127472, mean loss: 0.3440507762804268
Epoch: 40, step: 329, loss: 0.36374810338020325, mean loss: 0.3440511153633516
Epoch: 40, step: 330, loss: 0.29937347769737244, mean loss: 0.3440503462659412
Epoch: 40, step: 331, loss: 0.34540513157844543, mean loss: 0.34405036958731616
Epoch: 40, step: 332, loss: 0.3394377529621124, mean loss: 0.344050290186758
Epoch: 40, step: 333, loss: 0.31092700362205505, mean loss: 0.3440497200196742
Epoch: 40, step: 334, loss: 0.33424508571624756, mean loss: 0.34404955125068715
Epoch: 40, step: 335, loss: 0.33999085426330566, mean loss: 0.3440494813887864
Epoch: 40, step: 336, loss: 0.2973273694515228, mean loss: 0.344048677180102
Epoch: 40, step: 337, loss: 0.3160703480243683, mean loss: 0.344048195608806
Epoch: 40, step: 338, loss: 0.33997842669487, mean loss: 0.34404812555994263
Epoch: 40, step: 339, loss: 0.3438134789466858, mean loss: 0.34404812152127456
Epoch: 40, step: 340, loss: 0.3817586302757263, mean loss: 0.3440487705722161
Epoch: 40, step: 341, loss: 0.31484726071357727, mean loss: 0.3440482679817742
Epoch: 40, step: 342, loss: 0.29898443818092346, mean loss: 0.3440474923965238
Epoch: 40, step: 343, loss: 0.33273226022720337, mean loss: 0.3440472976555048
Epoch: 40, step: 344, loss: 0.3394908010959625, mean loss: 0.3440472192371835
Epoch: 40, step: 345, loss: 0.4028469920158386, mean loss: 0.34404823117696215
Epoch: 40, step: 346, loss: 0.3664620816707611, mean loss: 0.34404861691104743
Epoch: 40, step: 347, loss: 0.35754644870758057, mean loss: 0.3440488491997477
Epoch: 40, step: 348, loss: 0.29175809025764465, mean loss: 0.34404794932608024
Epoch: 40, step: 349, loss: 0.32111018896102905, mean loss: 0.3440475545960791
Epoch: 40, step: 350, loss: 0.29997727274894714, mean loss: 0.34404679621501794
Epoch: 40, step: 351, loss: 0.3710520565509796, mean loss: 0.34404726092558263
Epoch: 40, step: 352, loss: 0.32281336188316345, mean loss: 0.3440468955357552
Epoch: 40, step: 353, loss: 0.332061231136322, mean loss: 0.34404668929174514
Epoch: 40, step: 354, loss: 0.32157960534095764, mean loss: 0.3440463026947573
Epoch: 40, step: 355, loss: 0.3070525825023651, mean loss: 0.3440456661450947
Epoch: 40, step: 356, loss: 0.34512418508529663, mean loss: 0.34404568470281344
Epoch: 40, step: 357, loss: 0.3302043378353119, mean loss: 0.3440454465434331
Epoch: 40, step: 358, loss: 0.354383647441864, mean loss: 0.3440456244233157
Epoch: 40, step: 359, loss: 0.30486735701560974, mean loss: 0.34404495033062116
Epoch: 40, step: 360, loss: 0.34978997707366943, mean loss: 0.34404504917659323
Epoch: 40, step: 361, loss: 0.3237074613571167, mean loss: 0.3440446992645493
Epoch: 40, step: 362, loss: 0.2879403233528137, mean loss: 0.34404373399476085
Epoch: 40, step: 363, loss: 0.3330062925815582, mean loss: 0.3440435441000287
Epoch: 40, step: 364, loss: 0.30519986152648926, mean loss: 0.3440428758216188
Epoch: 40, step: 365, loss: 0.3069208860397339, mean loss: 0.34404223717471755
Epoch: 40, step: 366, loss: 0.3735940754413605, mean loss: 0.34404274557594705
Epoch: 40, step: 367, loss: 0.334553986787796, mean loss: 0.34404258233690926
Epoch: 40, step: 368, loss: 0.3639370799064636, mean loss: 0.3440429245842827
Epoch: 40, step: 369, loss: 0.3877032995223999, mean loss: 0.34404367566590904
Epoch: 40, step: 370, loss: 0.3327653706073761, mean loss: 0.3440434816505806
Epoch: 40, step: 371, loss: 0.32384875416755676, mean loss: 0.34404313425624555
Epoch: 40, step: 372, loss: 0.35108697414398193, mean loss: 0.34404325542391084
Epoch: 40, step: 373, loss: 0.3075786232948303, mean loss: 0.3440426281725239
Epoch: 40, step: 374, loss: 0.35123440623283386, mean loss: 0.3440427518807558
Epoch: 40, step: 375, loss: 0.3405737578868866, mean loss: 0.34404269221043116
Epoch: 40, step: 376, loss: 0.37275317311286926, mean loss: 0.34404318605223416
Epoch: 40, step: 377, loss: 0.3817797303199768, mean loss: 0.3440438351379314
Epoch: 40, step: 378, loss: 0.3472706973552704, mean loss: 0.3440438906404722
Epoch: 40, step: 379, loss: 0.3102765679359436, mean loss: 0.344043309847168
Epoch: 40, step: 380, loss: 0.3354175090789795, mean loss: 0.3440431614871335
Epoch: 40, step: 381, loss: 0.32955849170684814, mean loss: 0.3440429123613762
Epoch: 40, step: 382, loss: 0.31457826495170593, mean loss: 0.3440424055996437
Epoch: 40, step: 383, loss: 0.33224985003471375, mean loss: 0.3440422027832643
Epoch: 40, step: 384, loss: 0.32056131958961487, mean loss: 0.3440417989500337
Epoch: 40, step: 385, loss: 0.34056782722473145, mean loss: 0.3440417392043637
Epoch: 40, step: 386, loss: 0.3399280607700348, mean loss: 0.34404166845817846
Epoch: 40, step: 387, loss: 0.3160063624382019, mean loss: 0.3440411863211141
Epoch: 40, step: 388, loss: 0.3249737024307251, mean loss: 0.34404085841377446
Epoch: 40, step: 389, loss: 0.35033491253852844, mean loss: 0.34404096665202255
Epoch: 40, step: 390, loss: 0.36434540152549744, mean loss: 0.3440413158194466
Epoch: 40, step: 391, loss: 0.3099985122680664, mean loss: 0.34404073040873756
Epoch: 40, step: 392, loss: 0.31918269395828247, mean loss: 0.34404030294951016
Epoch: 40, step: 393, loss: 0.3182157278060913, mean loss: 0.3440398588773029
Epoch: 40, step: 394, loss: 0.3362045884132385, mean loss: 0.3440397241464893
Epoch: 40, step: 395, loss: 0.30605271458625793, mean loss: 0.3440390709549087
Epoch: 40, step: 396, loss: 0.3473047614097595, mean loss: 0.3440391271079162
Epoch: 40, step: 397, loss: 0.31888094544410706, mean loss: 0.34403869452458
Epoch: 40, step: 398, loss: 0.35136014223098755, mean loss: 0.3440388204113337
Epoch: 40, step: 399, loss: 0.3229326903820038, mean loss: 0.3440384575136372
Epoch: 40, step: 400, loss: 0.34053969383239746, mean loss: 0.34403839735711167
Epoch: 40, step: 401, loss: 0.3019253611564636, mean loss: 0.34403767329266755
Epoch: 40, step: 402, loss: 0.31869402527809143, mean loss: 0.3440372375577843
Epoch: 40, step: 403, loss: 0.3963545858860016, mean loss: 0.34403813703767444
Epoch: 40, step: 404, loss: 0.3377312123775482, mean loss: 0.3440380286060633
Epoch: 40, step: 405, loss: 0.3748995363712311, mean loss: 0.3440385591824785
Epoch: 40, step: 406, loss: 0.3615886867046356, mean loss: 0.34403886090213953
Epoch: 40, step: 407, loss: 0.3214150369167328, mean loss: 0.3440384719627917
Epoch: 40, step: 408, loss: 0.3873676657676697, mean loss: 0.3440392168474176
Epoch: 40, step: 409, loss: 0.3039776086807251, mean loss: 0.34403852814863534
Epoch: 40, step: 410, loss: 0.33422335982322693, mean loss: 0.3440383594190566
Epoch: 40, step: 411, loss: 0.3113204538822174, mean loss: 0.3440377969851445
Epoch: 40, step: 412, loss: 0.3086636960506439, mean loss: 0.34403718890062185
Epoch: 40, step: 413, loss: 0.3272785544395447, mean loss: 0.3440369008228816
Epoch: 40, step: 414, loss: 0.3500898480415344, mean loss: 0.3440370048701049
Epoch: 40, step: 415, loss: 0.3175661563873291, mean loss: 0.3440365498568953
Epoch: 40, step: 416, loss: 0.3293309509754181, mean loss: 0.3440362970834817
Epoch: 40, step: 417, loss: 0.37444886565208435, mean loss: 0.34403681983380946
Epoch: 40, step: 418, loss: 0.38859447836875916, mean loss: 0.34403758570566245
Epoch: 40, step: 419, loss: 0.3339887261390686, mean loss: 0.3440374129854911
Epoch: 40, step: 420, loss: 0.3361174166202545, mean loss: 0.34403727685863933
Epoch: 40, step: 421, loss: 0.3544430136680603, mean loss: 0.3440374557066818
Epoch: 40, step: 422, loss: 0.3270624577999115, mean loss: 0.3440371639548315
Epoch: 40, step: 423, loss: 0.3325885832309723, mean loss: 0.34403696718972904
Epoch: 40, step: 424, loss: 0.31196531653404236, mean loss: 0.3440364159883772
Epoch: 40, step: 425, loss: 0.3479105234146118, mean loss: 0.34403648256981306
Epoch: 40, step: 426, loss: 0.31235623359680176, mean loss: 0.34403593811402444
Epoch: 40, step: 427, loss: 0.33948832750320435, mean loss: 0.3440358599602709
Epoch: 40, step: 428, loss: 0.3494172692298889, mean loss: 0.34403595244182705
Epoch: 40, step: 429, loss: 0.32653793692588806, mean loss: 0.344035651736972
Epoch: 40, step: 430, loss: 0.4216865301132202, mean loss: 0.34403698615085687
Epoch: 40, step: 431, loss: 0.3313349485397339, mean loss: 0.3440367678727841
Epoch: 40, step: 432, loss: 0.35620203614234924, mean loss: 0.3440369769231556
Epoch: 40, step: 433, loss: 0.29850733280181885, mean loss: 0.34403619454620743
Epoch: 40, step: 434, loss: 0.38643792271614075, mean loss: 0.3440369231608336
Epoch: 40, step: 435, loss: 0.3417204022407532, mean loss: 0.3440368833553329
Epoch: 40, step: 436, loss: 0.353020578622818, mean loss: 0.34403703772231514
Epoch: 40, step: 437, loss: 0.3082415461540222, mean loss: 0.3440364226583685
Epoch: 40, step: 438, loss: 0.3225024342536926, mean loss: 0.3440360526522102
Epoch: 40, step: 439, loss: 0.3320590853691101, mean loss: 0.34403584686239436
Epoch: 40, step: 440, loss: 0.3180150091648102, mean loss: 0.344035399776645
Epoch: 40, step: 441, loss: 0.42488545179367065, mean loss: 0.3440367889050601
Epoch: 40, step: 442, loss: 0.31136903166770935, mean loss: 0.34403622763232095
Epoch: 40, step: 443, loss: 0.33071190118789673, mean loss: 0.34403599870773766
Epoch: 40, step: 444, loss: 0.3501633405685425, mean loss: 0.3440361039794817
Epoch: 40, step: 445, loss: 0.36370575428009033, mean loss: 0.3440364419111434
Epoch: 40, step: 446, loss: 0.3199857473373413, mean loss: 0.3440360287186653
Epoch: 40, step: 447, loss: 0.3310632109642029, mean loss: 0.3440358058486516
Epoch: 40, step: 448, loss: 0.329873651266098, mean loss: 0.34403556255028567
Epoch: 40, step: 449, loss: 0.3576664924621582, mean loss: 0.3440357967184683
Epoch: 40, step: 450, loss: 0.3572338819503784, mean loss: 0.34403602344683976
Epoch: 40, step: 451, loss: 0.31667569279670715, mean loss: 0.3440355534349754
Epoch: 40, step: 452, loss: 0.32268521189689636, mean loss: 0.34403518667254196
Epoch: 40, step: 453, loss: 0.31857892870903015, mean loss: 0.3440347493849829
Epoch: 40, step: 454, loss: 0.340415358543396, mean loss: 0.34403468721216074
Epoch: 40, step: 455, loss: 0.33638808131217957, mean loss: 0.3440345558632893
Epoch: 40, step: 456, loss: 0.32041653990745544, mean loss: 0.34403415017395533
Epoch: 40, step: 457, loss: 0.32038336992263794, mean loss: 0.3440337439288035
Epoch: 40, step: 458, loss: 0.3315999209880829, mean loss: 0.3440335303589562
Epoch: 40, step: 459, loss: 0.3258972764015198, mean loss: 0.3440332188465213
Epoch: 40, step: 460, loss: 0.32828599214553833, mean loss: 0.3440329483732093
Epoch: 40, step: 461, loss: 0.2896755039691925, mean loss: 0.3440320147494175
Epoch: 40, step: 462, loss: 0.3218823969364166, mean loss: 0.3440316343221326
Epoch: 40, step: 463, loss: 0.3612813651561737, mean loss: 0.3440319305870892
Epoch: 40, step: 464, loss: 0.35454726219177246, mean loss: 0.3440321111853134
Epoch: 40, step: 465, loss: 0.3422330617904663, mean loss: 0.3440320802876149
Epoch: 40, step: 466, loss: 0.3245692551136017, mean loss: 0.34403174602987924
Epoch: 40, step: 467, loss: 0.3448816239833832, mean loss: 0.3440317606255712
Epoch: 40, step: 468, loss: 0.3679589629173279, mean loss: 0.3440321715411338
Epoch: 40, step: 469, loss: 0.34800419211387634, mean loss: 0.3440322397537488
Epoch: 40, step: 470, loss: 0.3155389428138733, mean loss: 0.34403175043883166
Epoch: 40, step: 471, loss: 0.3071179986000061, mean loss: 0.3440311165304679
Epoch: 40, step: 472, loss: 0.3493504226207733, mean loss: 0.3440312078756861
Epoch: 40, step: 473, loss: 0.32227838039398193, mean loss: 0.34403083433398396
Epoch: 40, step: 474, loss: 0.34956875443458557, mean loss: 0.3440309294300619
Epoch: 40, step: 475, loss: 0.39019137620925903, mean loss: 0.3440317220745907
Epoch: 40, step: 476, loss: 0.29079023003578186, mean loss: 0.34403080785352785
Epoch: 40, step: 477, loss: 0.3067673444747925, mean loss: 0.3440301680056042
Epoch: 40, step: 478, loss: 0.3460178077220917, mean loss: 0.34403020213461943
Epoch: 40, step: 479, loss: 0.33455002307891846, mean loss: 0.3440300393568197
Epoch: 40, step: 480, loss: 0.3655705749988556, mean loss: 0.3440304092085675
Epoch: 40, step: 481, loss: 0.30757424235343933, mean loss: 0.34402978326565936
Epoch: 40, step: 482, loss: 0.33234673738479614, mean loss: 0.3440295826742427
Epoch: 40, step: 483, loss: 0.3319116532802582, mean loss: 0.3440293746196896
Epoch: 40, step: 484, loss: 0.30153414607048035, mean loss: 0.34402864502524283
Epoch: 40, step: 485, loss: 0.3550336956977844, mean loss: 0.3440288339661259
Epoch: 40, step: 486, loss: 0.3248474597930908, mean loss: 0.3440285046551884
Epoch: 40, step: 487, loss: 0.32166269421577454, mean loss: 0.3440281206795937
Epoch: 40, step: 488, loss: 0.36498650908470154, mean loss: 0.34402848048643
Epoch: 40, step: 489, loss: 0.35755252838134766, mean loss: 0.34402871265892604
Epoch: 40, step: 490, loss: 0.35740119218826294, mean loss: 0.344028942225449
Epoch: 40, step: 491, loss: 0.3774096369743347, mean loss: 0.34402951526491116
Epoch: 40, step: 492, loss: 0.31298723816871643, mean loss: 0.3440289823777277
Epoch: 40, step: 493, loss: 0.3311047852039337, mean loss: 0.3440287605183331
Epoch: 40, step: 494, loss: 0.2905394434928894, mean loss: 0.344027842325611
Epoch: 40, step: 495, loss: 0.3237046003341675, mean loss: 0.344027493464687
Epoch: 40, step: 496, loss: 0.3241432011127472, mean loss: 0.3440271521444619
Epoch: 40, step: 497, loss: 0.3196049630641937, mean loss: 0.3440267329369869
Epoch: 40, step: 498, loss: 0.3225741684436798, mean loss: 0.3440263647095114
Epoch: 40, step: 499, loss: 0.3233538269996643, mean loss: 0.3440260098770756
Epoch: 40, step: 500, loss: 0.3407171368598938, mean loss: 0.3440259530831136
Epoch: 40, step: 501, loss: 0.35006457567214966, mean loss: 0.34402605672910225
Epoch: 40, step: 502, loss: 0.34101295471191406, mean loss: 0.34402600501357067
Epoch: 40, step: 503, loss: 0.3484766483306885, mean loss: 0.3440260814011053
Epoch: 40, step: 504, loss: 0.3042440414428711, mean loss: 0.3440253986234522
Epoch: 40, step: 505, loss: 0.31244954466819763, mean loss: 0.3440248566975614
Epoch: 40, step: 506, loss: 0.311886191368103, mean loss: 0.34402430512179244
Epoch: 40, step: 507, loss: 0.3734699785709381, mean loss: 0.34402481047075667
Epoch: 40, step: 508, loss: 0.34126555919647217, mean loss: 0.3440247631170819
Epoch: 40, step: 509, loss: 0.29913076758384705, mean loss: 0.34402399266924366
Epoch: 40, step: 510, loss: 0.3401409685611725, mean loss: 0.34402392603190934
Epoch: 40, step: 511, loss: 0.31687813997268677, mean loss: 0.34402346018577296
Epoch: 40, step: 512, loss: 0.32548946142196655, mean loss: 0.34402314213112045
Epoch: 40, step: 513, loss: 0.3317452073097229, mean loss: 0.3440229314379327
Epoch: 40, step: 514, loss: 0.32040727138519287, mean loss: 0.344022526192801
Epoch: 40, step: 515, loss: 0.34092605113983154, mean loss: 0.34402247305814776
Epoch: 40, step: 516, loss: 0.3252764940261841, mean loss: 0.3440221513878656
Epoch: 40, step: 517, loss: 0.37304142117500305, mean loss: 0.3440226493333989
Epoch: 40, step: 518, loss: 0.33847954869270325, mean loss: 0.3440225542202253
Epoch: 40, step: 519, loss: 0.32647421956062317, mean loss: 0.34402225311633616
Epoch: 40, step: 520, loss: 0.3388180136680603, mean loss: 0.34402216382069184
Epoch: 40, step: 521, loss: 0.3799736797809601, mean loss: 0.344022780675226
Epoch: 40, step: 522, loss: 0.3192097842693329, mean loss: 0.3440223549422266
Epoch: 40, step: 523, loss: 0.32597801089286804, mean loss: 0.3440220453487867
Epoch: 40, step: 524, loss: 0.34549230337142944, mean loss: 0.34402207057411094
Epoch: 40, step: 525, loss: 0.32263514399528503, mean loss: 0.3440217036433458
Epoch: 40, step: 526, loss: 0.3586205542087555, mean loss: 0.3440219541082962
Epoch: 40, step: 527, loss: 0.37728163599967957, mean loss: 0.34402252471771655
Epoch: 40, step: 528, loss: 0.31582024693489075, mean loss: 0.3440220408823826
Epoch: 40, step: 529, loss: 0.313464492559433, mean loss: 0.3440215166492667
Epoch: 40, step: 530, loss: 0.32860133051872253, mean loss: 0.34402125211123974
Epoch: 40, step: 531, loss: 0.3546932339668274, mean loss: 0.34402143518922396
Epoch: 40, step: 532, loss: 0.3874146044254303, mean loss: 0.3440221795868229
Epoch: 40, step: 533, loss: 0.34117498993873596, mean loss: 0.3440221307449241
Epoch: 40, step: 534, loss: 0.325909286737442, mean loss: 0.34402182003484594
Epoch: 40, step: 535, loss: 0.33953195810317993, mean loss: 0.3440217430164925
Epoch: 40, step: 536, loss: 0.33663690090179443, mean loss: 0.34402161634029793
Epoch: 40, step: 537, loss: 0.30262070894241333, mean loss: 0.3440209061803028
Epoch: 40, step: 538, loss: 0.2985606789588928, mean loss: 0.3440201264031673
Epoch: 40, step: 539, loss: 0.3435196280479431, mean loss: 0.34402011781828984
Epoch: 40, step: 540, loss: 0.3527103066444397, mean loss: 0.34402026687557574
Epoch: 40, step: 541, loss: 0.3512451648712158, mean loss: 0.34402039079753377
Epoch: 40, step: 542, loss: 0.3594782054424286, mean loss: 0.34402065592650904
Epoch: 40, step: 543, loss: 0.3590421974658966, mean loss: 0.3440209135682067
Epoch: 40, step: 544, loss: 0.3257814049720764, mean loss: 0.34402060073897084
Epoch: 40, step: 545, loss: 0.34064462780952454, mean loss: 0.3440205428380185
Epoch: 40, step: 546, loss: 0.3560674786567688, mean loss: 0.34402074945018885
Epoch: 40, step: 547, loss: 0.31526339054107666, mean loss: 0.34402025625270466
Epoch: 40, step: 548, loss: 0.3426606357097626, mean loss: 0.3440202329351972
Epoch: 40, step: 549, loss: 0.29849371314048767, mean loss: 0.34401945216826535
Epoch: 40, step: 550, loss: 0.3472382426261902, mean loss: 0.3440195073686642
Epoch: 40, step: 551, loss: 0.3845413625240326, mean loss: 0.3440202022831785
Epoch: 40, step: 552, loss: 0.3169340491294861, mean loss: 0.3440197377872144
Epoch: 40, step: 553, loss: 0.3083881735801697, mean loss: 0.3440191267578868
Epoch: 40, step: 554, loss: 0.3790178596973419, mean loss: 0.34401972692478966
Epoch: 40, step: 555, loss: 0.2970060706138611, mean loss: 0.34401892073684276
Epoch: 40, step: 556, loss: 0.37584128975868225, mean loss: 0.344019466415959
Epoch: 40, step: 557, loss: 0.33566251397132874, mean loss: 0.3440193231162497
Epoch: 40, step: 558, loss: 0.3334682583808899, mean loss: 0.3440191421963997
Epoch: 40, step: 559, loss: 0.3555243909358978, mean loss: 0.3440193394743273
Epoch: 40, step: 560, loss: 0.32807326316833496, mean loss: 0.34401906605521054
Epoch: 40, step: 561, loss: 0.3636161684989929, mean loss: 0.34401940207082116
Epoch: 40, step: 562, loss: 0.3111782968044281, mean loss: 0.3440188389806978
Epoch: 40, step: 563, loss: 0.2954482138156891, mean loss: 0.34401800620816564
Epoch: 40, step: 564, loss: 0.36471322178840637, mean loss: 0.34401836103397926
Epoch: 40, step: 565, loss: 0.2936561107635498, mean loss: 0.34401749757256805
Epoch: 40, step: 566, loss: 0.38474541902542114, mean loss: 0.34401819584131926
Epoch: 40, step: 567, loss: 0.2974463999271393, mean loss: 0.3440173973946742
Epoch: 40, step: 568, loss: 0.3294890224933624, mean loss: 0.3440171483183159
Epoch: 40, step: 569, loss: 0.36170291900634766, mean loss: 0.3440174515202821
Epoch: 40, step: 570, loss: 0.33867305517196655, mean loss: 0.34401735989839416
Epoch: 40, step: 571, loss: 0.3768272399902344, mean loss: 0.3440179223663379
Epoch: 40, step: 572, loss: 0.3096369504928589, mean loss: 0.3440173329748807
Epoch: 40, step: 573, loss: 0.33430662751197815, mean loss: 0.34401716650754666
Epoch: 40, step: 574, loss: 0.3279695212841034, mean loss: 0.34401689141291697
Epoch: 40, step: 575, loss: 0.35346946120262146, mean loss: 0.3440170534495631
Epoch: 40, step: 576, loss: 0.2908612787723541, mean loss: 0.344016142264986
Epoch: 40, step: 577, loss: 0.3553929924964905, mean loss: 0.344016337281103
Epoch: 40, step: 578, loss: 0.32743629813194275, mean loss: 0.3440160530794686
Epoch: 40, step: 579, loss: 0.31209638714790344, mean loss: 0.34401550594772484
Epoch: 40, step: 580, loss: 0.3141922950744629, mean loss: 0.34401499475986597
Epoch: 40, step: 581, loss: 0.3014693856239319, mean loss: 0.34401426551491143
Epoch: 40, step: 582, loss: 0.3357773423194885, mean loss: 0.3440141243339095
Epoch: 40, step: 583, loss: 0.33520644903182983, mean loss: 0.3440139733727943
Epoch: 40, step: 584, loss: 0.325288325548172, mean loss: 0.34401365242587817
Epoch: 40, step: 585, loss: 0.2850622236728668, mean loss: 0.3440126420493527
Epoch: 40, step: 586, loss: 0.32211554050445557, mean loss: 0.3440122667583944
Epoch: 40, step: 587, loss: 0.29506051540374756, mean loss: 0.34401142779645305
Epoch: 40, step: 588, loss: 0.35473451018333435, mean loss: 0.34401161157136584
Epoch: 40, step: 589, loss: 0.3386879861354828, mean loss: 0.344011520335283
Epoch: 40, step: 590, loss: 0.3410872519016266, mean loss: 0.3440114702201447
Epoch: 40, step: 591, loss: 0.33732134103775024, mean loss: 0.3440113555689043
Epoch: 40, step: 592, loss: 0.35744884610176086, mean loss: 0.3440115858482478
Epoch: 40, step: 593, loss: 0.29672476649284363, mean loss: 0.3440107755041522
Epoch: 40, step: 594, loss: 0.3115844428539276, mean loss: 0.34401021983055696
Epoch: 40, step: 595, loss: 0.35471874475479126, mean loss: 0.34401040333396576
Epoch: 40, step: 596, loss: 0.33147671818733215, mean loss: 0.34401018855792953
Epoch: 40, step: 597, loss: 0.3627825677394867, mean loss: 0.344010510234121
Epoch: 40, step: 598, loss: 0.32340264320373535, mean loss: 0.3440101571117743
Epoch: 40, step: 599, loss: 0.29469504952430725, mean loss: 0.34400931209622276
Epoch: 40, step: 600, loss: 0.2900024950504303, mean loss: 0.3440083867039737
Epoch: 40, step: 601, loss: 0.33689889311790466, mean loss: 0.34400826488680525
Epoch: 40, step: 602, loss: 0.33276045322418213, mean loss: 0.34400807216518947
Epoch: 40, step: 603, loss: 0.297293484210968, mean loss: 0.3440072717644638
Epoch: 40, step: 604, loss: 0.32860442996025085, mean loss: 0.3440070078590101
Epoch: 40, step: 605, loss: 0.30350056290626526, mean loss: 0.34400631385145514
Epoch: 40, step: 606, loss: 0.33075860142707825, mean loss: 0.34400608687880924
Epoch: 40, step: 607, loss: 0.35032886266708374, mean loss: 0.3440061952048747
Epoch: 40, step: 608, loss: 0.3906174302101135, mean loss: 0.34400699376635435
Epoch: 40, step: 609, loss: 0.3499755859375, mean loss: 0.34400709602080304
Epoch: 40, step: 610, loss: 0.3431234657764435, mean loss: 0.34400708088263093
Epoch: 40, step: 611, loss: 0.33536186814308167, mean loss: 0.3440069327771567
Epoch: 40, step: 612, loss: 0.319621205329895, mean loss: 0.3440065150201895
Epoch: 40, step: 613, loss: 0.3099042475223541, mean loss: 0.34400593081716246
Epoch: 40, step: 614, loss: 0.3378342390060425, mean loss: 0.3440058250922492
Epoch: 40, step: 615, loss: 0.34384530782699585, mean loss: 0.34400582234253585
Epoch: 40, step: 616, loss: 0.3319661617279053, mean loss: 0.3440056161027391
Epoch: 40, step: 617, loss: 0.3434259295463562, mean loss: 0.34400560617285875
Epoch: 40, step: 618, loss: 0.304898738861084, mean loss: 0.3440049362938387
Epoch: 40, step: 619, loss: 0.362946093082428, mean loss: 0.34400526073982685
Epoch: 40, step: 620, loss: 0.2979751229286194, mean loss: 0.3440044722960213
Epoch: 40, step: 621, loss: 0.31518930196762085, mean loss: 0.34400397873344507
Epoch: 40, step: 622, loss: 0.3224775493144989, mean loss: 0.34400361002287144
Epoch: 40, step: 623, loss: 0.36427173018455505, mean loss: 0.3440039571748337
Epoch: 40, step: 624, loss: 0.27848121523857117, mean loss: 0.3440028349218246
Epoch: 40, step: 625, loss: 0.3042990565299988, mean loss: 0.3440021548995865
Epoch: 40, step: 626, loss: 0.31695204973220825, mean loss: 0.3440016916097246
Epoch: 40, step: 627, loss: 0.33621564507484436, mean loss: 0.34400155825960926
Epoch: 40, step: 628, loss: 0.33471405506134033, mean loss: 0.34400139919705985
Epoch: 40, step: 629, loss: 0.3014846444129944, mean loss: 0.3440006710457534
Epoch: 40, step: 630, loss: 0.3388781249523163, mean loss: 0.34400058331740324
Epoch: 40, step: 631, loss: 0.3335813581943512, mean loss: 0.3440004048815709
Epoch: 40, step: 632, loss: 0.32304996252059937, mean loss: 0.34400004609811463
Epoch: 40, step: 633, loss: 0.3568393886089325, mean loss: 0.3440002659724598
Epoch: 40, step: 634, loss: 0.34859156608581543, mean loss: 0.344000344597344
Epoch: 40, step: 635, loss: 0.320553183555603, mean loss: 0.34399994307735904
Epoch: 40, step: 636, loss: 0.3050684630870819, mean loss: 0.343999276408181
Epoch: 40, step: 637, loss: 0.33061841130256653, mean loss: 0.3439990472759315
Epoch: 40, step: 638, loss: 0.3624590039253235, mean loss: 0.3439993633764923
Epoch: 40, step: 639, loss: 0.3109394311904907, mean loss: 0.3439987972817631
Epoch: 40, step: 640, loss: 0.34046754240989685, mean loss: 0.34399873681610543
Epoch: 40, step: 641, loss: 0.313151478767395, mean loss: 0.3439982086277206
Epoch: 40, step: 642, loss: 0.36347830295562744, mean loss: 0.34399854217384546
Epoch: 40, step: 643, loss: 0.31556662917137146, mean loss: 0.3439980553593635
Epoch: 40, step: 644, loss: 0.34761422872543335, mean loss: 0.34399811727483937
Epoch: 40, step: 645, loss: 0.32996249198913574, mean loss: 0.3439978769634795
Epoch: 40, step: 646, loss: 0.30329081416130066, mean loss: 0.34399718000827206
Epoch: 40, step: 647, loss: 0.3153195381164551, mean loss: 0.3439966890200189
Epoch: 40, step: 648, loss: 0.2837968170642853, mean loss: 0.3439956583591284
Epoch: 40, step: 649, loss: 0.3452015519142151, mean loss: 0.34399567900445543
Epoch: 40, step: 650, loss: 0.3190836012363434, mean loss: 0.3439952525081145
Epoch: 40, step: 651, loss: 0.31736093759536743, mean loss: 0.3439947965347715
Epoch: 40, step: 652, loss: 0.2946205735206604, mean loss: 0.34399395127390464
Epoch: 40, step: 653, loss: 0.3323705494403839, mean loss: 0.34399375229075274
Epoch: 40, step: 654, loss: 0.32111918926239014, mean loss: 0.34399336070360853
Epoch: 40, step: 655, loss: 0.33176273107528687, mean loss: 0.343993151332381
Epoch: 40, step: 656, loss: 0.30282241106033325, mean loss: 0.3439924465591083
Epoch: 40, step: 657, loss: 0.36452803015708923, mean loss: 0.34399279808746597
Epoch: 40, step: 658, loss: 0.34348705410957336, mean loss: 0.3439927894302829
Epoch: 40, step: 659, loss: 0.32030409574508667, mean loss: 0.3439923839408326
Epoch: 40, step: 660, loss: 0.31796589493751526, mean loss: 0.34399193844197085
Epoch: 40, step: 661, loss: 0.31749558448791504, mean loss: 0.34399148490813164
Epoch: 40, step: 662, loss: 0.3279961943626404, mean loss: 0.34399121112399617
Epoch: 40, step: 663, loss: 0.31034255027770996, mean loss: 0.343990635184984
Epoch: 40, step: 664, loss: 0.3120107650756836, mean loss: 0.34399008781878615
Epoch: 40, step: 665, loss: 0.34406355023384094, mean loss: 0.3439900890761444
Epoch: 40, step: 666, loss: 0.38062557578086853, mean loss: 0.3439907161062282
Epoch: 40, step: 667, loss: 0.32644879817962646, mean loss: 0.3439904158748678
Epoch: 40, step: 668, loss: 0.329728364944458, mean loss: 0.343990171782877
Epoch: 40, step: 669, loss: 0.34701183438301086, mean loss: 0.3439902234971094
Epoch: 40, step: 670, loss: 0.320997953414917, mean loss: 0.34398983000273
Epoch: 40, step: 671, loss: 0.3541543185710907, mean loss: 0.3439900039568744
Epoch: 40, step: 672, loss: 0.32093191146850586, mean loss: 0.3439896093495038
Epoch: 40, step: 673, loss: 0.3266472816467285, mean loss: 0.34398931256462334
Epoch: 40, step: 674, loss: 0.29826849699020386, mean loss: 0.34398853014286285
Epoch: 40, step: 675, loss: 0.3158577084541321, mean loss: 0.34398804874746125
Epoch: 40, step: 676, loss: 0.3403405547142029, mean loss: 0.343987986329917
Epoch: 40, step: 677, loss: 0.33860835433006287, mean loss: 0.3439878942728309
Epoch: 40, step: 678, loss: 0.30582964420318604, mean loss: 0.34398724131418906
Epoch: 40, step: 679, loss: 0.3235815167427063, mean loss: 0.3439868921402573
Epoch: 40, step: 680, loss: 0.29277047514915466, mean loss: 0.34398601576208115
Epoch: 40, step: 681, loss: 0.37664589285850525, mean loss: 0.34398657460464466
Epoch: 40, step: 682, loss: 0.3295992612838745, mean loss: 0.3439863284278002
Epoch: 40, step: 683, loss: 0.37700825929641724, mean loss: 0.34398689344612315
Epoch: 40, step: 684, loss: 0.3578668236732483, mean loss: 0.34398713093316613
Epoch: 40, step: 685, loss: 0.3927685618400574, mean loss: 0.3439879655742178
Epoch: 40, step: 686, loss: 0.33211490511894226, mean loss: 0.3439877624318759
Epoch: 40, step: 687, loss: 0.3990800082683563, mean loss: 0.3439887050175219
Epoch: 40, step: 688, loss: 0.32836467027664185, mean loss: 0.34398843770696497
Epoch: 40, step: 689, loss: 0.3068327009677887, mean loss: 0.34398780202284623
Epoch: 40, step: 690, loss: 0.3246249854564667, mean loss: 0.3439874707570584
Epoch: 40, step: 691, loss: 0.3767837882041931, mean loss: 0.3439880318382437
Epoch: 40, step: 692, loss: 0.35373520851135254, mean loss: 0.3439881985906204
Epoch: 40, step: 693, loss: 0.31917402148246765, mean loss: 0.34398777408285175
Epoch: 40, step: 694, loss: 0.30205824971199036, mean loss: 0.3439870567870794
Epoch: 40, step: 695, loss: 0.35106226801872253, mean loss: 0.34398717782189586
Epoch: 40, step: 696, loss: 0.2810397446155548, mean loss: 0.34398610100589083
Epoch: 40, step: 697, loss: 0.342518150806427, mean loss: 0.3439860758946965
Epoch: 40, step: 698, loss: 0.31180906295776367, mean loss: 0.34398552547452277
Epoch: 40, step: 699, loss: 0.3232609033584595, mean loss: 0.3439851709650784
Epoch: 40, step: 700, loss: 0.3380531370639801, mean loss: 0.3439850694951429
Epoch: 40, step: 701, loss: 0.28397467732429504, mean loss: 0.3439840430096964
Epoch: 40, step: 702, loss: 0.33727821707725525, mean loss: 0.34398392830764674
Epoch: 40, step: 703, loss: 0.3022990822792053, mean loss: 0.3439832153074068
Epoch: 40, step: 704, loss: 0.33861491084098816, mean loss: 0.34398312348658294
Epoch: 40, step: 705, loss: 0.3427576422691345, mean loss: 0.34398310252600384
Epoch: 40, step: 706, loss: 0.3278122544288635, mean loss: 0.3439828259452301
Epoch: 40, step: 707, loss: 0.3616577982902527, mean loss: 0.3439831282468711
Epoch: 40, step: 708, loss: 0.29070019721984863, mean loss: 0.343982216944625
Epoch: 40, step: 709, loss: 0.3210197985172272, mean loss: 0.3439818242232563
Epoch: 40, step: 710, loss: 0.34357476234436035, mean loss: 0.3439818172614824
Epoch: 40, step: 711, loss: 0.3237343430519104, mean loss: 0.34398147098507303
Epoch: 40, step: 712, loss: 0.34010136127471924, mean loss: 0.34398140462778487
Epoch: 40, step: 713, loss: 0.3330419659614563, mean loss: 0.3439812175456857
Epoch: 40, step: 714, loss: 0.33116111159324646, mean loss: 0.34398099830488277
Epoch: 40, step: 715, loss: 0.32146281003952026, mean loss: 0.34398061322060436
Epoch: 40, step: 716, loss: 0.30335986614227295, mean loss: 0.3439799185757512
Epoch: 40, step: 717, loss: 0.35282647609710693, mean loss: 0.3439800698558484
Epoch: 40, step: 718, loss: 0.3585595488548279, mean loss: 0.343980319167208
Epoch: 40, step: 719, loss: 0.3202754855155945, mean loss: 0.34397991381779536
Epoch: 40, step: 720, loss: 0.3325676918029785, mean loss: 0.34397971867369703
Epoch: 40, step: 721, loss: 0.33821526169776917, mean loss: 0.3439796201056423
Epoch: 40, step: 722, loss: 0.33283206820487976, mean loss: 0.3439794294938081
Epoch: 40, step: 723, loss: 0.34089478850364685, mean loss: 0.3439793767504768
Epoch: 40, step: 724, loss: 0.30152109265327454, mean loss: 0.3439786507816968
Epoch: 40, step: 725, loss: 0.31840434670448303, mean loss: 0.3439782135094594
Epoch: 40, step: 726, loss: 0.32423269748687744, mean loss: 0.3439778759042476
Epoch: 40, step: 727, loss: 0.3670591115951538, mean loss: 0.3439782705362352
Epoch: 40, step: 728, loss: 0.3658028244972229, mean loss: 0.34397864367569664
Epoch: 40, step: 729, loss: 0.3079381287097931, mean loss: 0.3439780274931874
Epoch: 40, step: 730, loss: 0.3795080780982971, mean loss: 0.34397863493793285
Epoch: 40, step: 731, loss: 0.34142789244651794, mean loss: 0.34397859132953357
Epoch: 40, step: 732, loss: 0.3269690275192261, mean loss: 0.34397830053296286
Epoch: 40, step: 733, loss: 0.35599422454833984, mean loss: 0.34397850595444224
Epoch: 40, step: 734, loss: 0.32183369994163513, mean loss: 0.3439781273783928
Epoch: 40, step: 735, loss: 0.29550671577453613, mean loss: 0.34397729875059596
Epoch: 40, step: 736, loss: 0.32682427763938904, mean loss: 0.3439770055215225
Epoch: 40, step: 737, loss: 0.3362111449241638, mean loss: 0.3439768727672301
Epoch: 40, step: 738, loss: 0.3489989638328552, mean loss: 0.34397695861640815
Epoch: 40, step: 739, loss: 0.29246506094932556, mean loss: 0.3439760780711489
Epoch: 40, step: 740, loss: 0.32463541626930237, mean loss: 0.3439757474671968
Epoch: 40, step: 741, loss: 0.32651287317276, mean loss: 0.3439754489667302
Epoch: 40, step: 742, loss: 0.3022630512714386, mean loss: 0.3439747359708549
Epoch: 40, step: 743, loss: 0.32428234815597534, mean loss: 0.34397439937185625
Epoch: 40, step: 744, loss: 0.3361356258392334, mean loss: 0.3439742653871792
Epoch: 40, step: 745, loss: 0.33303168416023254, mean loss: 0.34397407835369154
Epoch: 40, step: 746, loss: 0.3198738098144531, mean loss: 0.3439736664325789
Epoch: 40, step: 747, loss: 0.33380842208862305, mean loss: 0.34397349269147776
Epoch: 40, step: 748, loss: 0.3250924050807953, mean loss: 0.34397316998749017
Epoch: 40, step: 749, loss: 0.33620384335517883, mean loss: 0.34397303720118644
Epoch: 40, step: 750, loss: 0.35169151425361633, mean loss: 0.3439731691161606
Epoch: 40, step: 751, loss: 0.31579744815826416, mean loss: 0.3439726875786818
Epoch: 40, step: 752, loss: 0.30947983264923096, mean loss: 0.34397209808822793
Epoch: 40, step: 753, loss: 0.352641761302948, mean loss: 0.34397224625214107
Epoch: 40, step: 754, loss: 0.35034868121147156, mean loss: 0.343972355223088
Epoch: 40, step: 755, loss: 0.3232775032520294, mean loss: 0.3439720015616626
Epoch: 40, step: 756, loss: 0.34932613372802734, mean loss: 0.34397209305870047
Epoch: 40, step: 757, loss: 0.3329967260360718, mean loss: 0.3439719055032983
Epoch: 40, step: 758, loss: 0.3280661106109619, mean loss: 0.34397163369764727
Epoch: 40, step: 759, loss: 0.31415170431137085, mean loss: 0.34397112412947595
Epoch: 40, step: 760, loss: 0.3033665418624878, mean loss: 0.3439704302831256
Epoch: 40, step: 761, loss: 0.3667629361152649, mean loss: 0.34397081975214294
Epoch: 40, step: 762, loss: 0.35030338168144226, mean loss: 0.34397092795852213
Epoch: 40, step: 763, loss: 0.3018350303173065, mean loss: 0.3439702079821425
Epoch: 40, step: 764, loss: 0.29462912678718567, mean loss: 0.34396936490514646
Epoch: 40, step: 765, loss: 0.36669182777404785, mean loss: 0.34396975315076156
Epoch: 40, step: 766, loss: 0.34635356068611145, mean loss: 0.34396979388080984
Epoch: 40, step: 767, loss: 0.3260217607021332, mean loss: 0.3439694872236
Epoch: 40, step: 768, loss: 0.3618013858795166, mean loss: 0.3439697918913486
Epoch: 40, step: 769, loss: 0.35065603256225586, mean loss: 0.34396990612747824
Epoch: 40, step: 770, loss: 0.30428239703178406, mean loss: 0.343969228067833
Epoch: 40, step: 771, loss: 0.3141079545021057, mean loss: 0.34396871789777955
Epoch: 40, step: 772, loss: 0.3226441442966461, mean loss: 0.34396835358066613
Epoch: 40, step: 773, loss: 0.3598514497280121, mean loss: 0.34396862492887653
Epoch: 40, step: 774, loss: 0.33755889534950256, mean loss: 0.34396851542636386
Epoch: 40, step: 775, loss: 0.3385128080844879, mean loss: 0.3439684222237647
Epoch: 40, step: 776, loss: 0.34527716040611267, mean loss: 0.34396844458121695
Epoch: 40, step: 777, loss: 0.356607049703598, mean loss: 0.34396866048550345
Epoch: 40, step: 778, loss: 0.3094281554222107, mean loss: 0.3439680704428812
Epoch: 40, step: 779, loss: 0.3436070382595062, mean loss: 0.34396806427560783
Epoch: 40, step: 780, loss: 0.2980445325374603, mean loss: 0.34396727980776926
Epoch: 40, step: 781, loss: 0.3374977111816406, mean loss: 0.3439671692961942
Epoch: 40, step: 782, loss: 0.32573050260543823, mean loss: 0.3439668577872744
Epoch: 40, step: 783, loss: 0.3059327304363251, mean loss: 0.34396620811989004
Epoch: 40, step: 784, loss: 0.3319392204284668, mean loss: 0.34396600268838107
Epoch: 40, step: 785, loss: 0.2841300368309021, mean loss: 0.343964980655008
Epoch: 40, step: 786, loss: 0.3042733073234558, mean loss: 0.34396430270953976
Epoch: 40, step: 787, loss: 0.332889199256897, mean loss: 0.3439641135467425
Epoch: 40, step: 788, loss: 0.32933154702186584, mean loss: 0.3439638636267349
Epoch: 40, step: 789, loss: 0.3151306211948395, mean loss: 0.3439633711716977
Epoch: 40, step: 790, loss: 0.32606565952301025, mean loss: 0.3439630654943967
Epoch: 40, step: 791, loss: 0.3248869776725769, mean loss: 0.34396273969702307
Epoch: 40, step: 792, loss: 0.34054169058799744, mean loss: 0.34396268127048457
Epoch: 40, step: 793, loss: 0.31591078639030457, mean loss: 0.3439622021931392
Epoch: 40, step: 794, loss: 0.3071799576282501, mean loss: 0.343961574027405
Epoch: 40, step: 795, loss: 0.3331875205039978, mean loss: 0.3439613900316826
Epoch: 40, step: 796, loss: 0.34512099623680115, mean loss: 0.3439614098347156
Epoch: 40, step: 797, loss: 0.33342650532722473, mean loss: 0.3439612299292457
Epoch: 40, step: 798, loss: 0.32418543100357056, mean loss: 0.3439608922219945
Epoch: 40, step: 799, loss: 0.34191280603408813, mean loss: 0.3439608572478451
Epoch: 40, step: 800, loss: 0.34013840556144714, mean loss: 0.3439607919748531
Epoch: 40, step: 801, loss: 0.3277948200702667, mean loss: 0.34396051592601756
Epoch: 40, step: 802, loss: 0.30289986729621887, mean loss: 0.3439598147896579
Epoch: 40, step: 803, loss: 0.35619106888771057, mean loss: 0.34396002364243605
Epoch: 40, step: 804, loss: 0.3073275685310364, mean loss: 0.3439593981416231
Epoch: 40, step: 805, loss: 0.3202298879623413, mean loss: 0.34395899296609156
Epoch: 40, step: 806, loss: 0.2873130440711975, mean loss: 0.3439580257670051
Epoch: 40, step: 807, loss: 0.3119291067123413, mean loss: 0.34395747889979
Epoch: 40, step: 808, loss: 0.3207039535045624, mean loss: 0.3439570818719187
Epoch: 40, step: 809, loss: 0.3443371653556824, mean loss: 0.3439570883613072
Epoch: 40, step: 810, loss: 0.3261583745479584, mean loss: 0.3439567844786039
Epoch: 40, step: 811, loss: 0.3231697678565979, mean loss: 0.3439564295817825
Epoch: 40, step: 812, loss: 0.3239766061306, mean loss: 0.34395608847199727
Epoch: 40, step: 813, loss: 0.33565661311149597, mean loss: 0.3439559467798581
Epoch: 40, step: 814, loss: 0.32006537914276123, mean loss: 0.3439555389169876
Epoch: 40, step: 815, loss: 0.34459665417671204, mean loss: 0.34395554986200366
Epoch: 40, step: 816, loss: 0.33973318338394165, mean loss: 0.3439554777796765
Epoch: 40, step: 817, loss: 0.3718077540397644, mean loss: 0.34395595325299855
Epoch: 40, step: 818, loss: 0.34077900648117065, mean loss: 0.34395589901945456
Epoch: 40, step: 819, loss: 0.30637937784194946, mean loss: 0.3439552575629647
Epoch: 40, step: 820, loss: 0.38101136684417725, mean loss: 0.3439558901248752
Epoch: 40, step: 821, loss: 0.33648478984832764, mean loss: 0.34395576259252264
Epoch: 40, step: 822, loss: 0.35511425137519836, mean loss: 0.34395595306567667
Epoch: 40, step: 823, loss: 0.30667126178741455, mean loss: 0.3439553166343767
Epoch: 40, step: 824, loss: 0.285504013299942, mean loss: 0.3439543189164739
Epoch: 40, step: 825, loss: 0.3238792419433594, mean loss: 0.34395397625650437
Epoch: 40, step: 826, loss: 0.3574911653995514, mean loss: 0.34395420731781734
Epoch: 40, step: 827, loss: 0.3413164019584656, mean loss: 0.34395416229485426
Epoch: 40, step: 828, loss: 0.3612304627895355, mean loss: 0.3439544571676204
Epoch: 40, step: 829, loss: 0.37957891821861267, mean loss: 0.34395506519733626
Epoch: 40, step: 830, loss: 0.34164124727249146, mean loss: 0.3439550257063236
Epoch: 40, step: 831, loss: 0.3132788836956024, mean loss: 0.34395450215119644
Epoch: 40, step: 832, loss: 0.31817102432250977, mean loss: 0.34395406210754226
Epoch: 40, step: 833, loss: 0.34335586428642273, mean loss: 0.343954051898343
Epoch: 40, step: 834, loss: 0.3303511440753937, mean loss: 0.34395381974700207
Epoch: 40, step: 835, loss: 0.3708585500717163, mean loss: 0.34395427890343466
Epoch: 40, step: 836, loss: 0.3589939475059509, mean loss: 0.34395453556620925
Epoch: 40, step: 837, loss: 0.31369563937187195, mean loss: 0.34395401918516905
Epoch: 40, step: 838, loss: 0.3528161644935608, mean loss: 0.3439541704188984
Epoch: 40, step: 839, loss: 0.329566091299057, mean loss: 0.343953924888538
Epoch: 40, step: 840, loss: 0.2977111339569092, mean loss: 0.34395313577587894
Epoch: 40, step: 841, loss: 0.32090815901756287, mean loss: 0.3439527425303112
Epoch: 40, step: 842, loss: 0.3168150782585144, mean loss: 0.3439522794539453
Epoch: 40, step: 843, loss: 0.4117564260959625, mean loss: 0.34395343644231885
Epoch: 40, step: 844, loss: 0.370620459318161, mean loss: 0.34395389147214356
Epoch: 40, step: 845, loss: 0.3218300938606262, mean loss: 0.3439535139715871
Epoch: 40, step: 846, loss: 0.3742341101169586, mean loss: 0.3439540306435912
Epoch: 40, step: 847, loss: 0.36292126774787903, mean loss: 0.3439543542723979
Epoch: 40, step: 848, loss: 0.31267237663269043, mean loss: 0.3439538205322276
Epoch: 40, step: 849, loss: 0.3231622278690338, mean loss: 0.34395346578742875
Epoch: 40, step: 850, loss: 0.32404401898384094, mean loss: 0.34395312609954076
Epoch: 40, step: 851, loss: 0.37352418899536133, mean loss: 0.3439536306218723
Epoch: 40, step: 852, loss: 0.317115843296051, mean loss: 0.3439531727407311
Epoch: 40, step: 853, loss: 0.34156733751296997, mean loss: 0.34395313203654393
Epoch: 40, step: 854, loss: 0.30998364090919495, mean loss: 0.34395255250074036
Epoch: 40, step: 855, loss: 0.3174663782119751, mean loss: 0.34395210064161846
Epoch: 40, step: 856, loss: 0.34421950578689575, mean loss: 0.34395210520352276
Epoch: 40, step: 857, loss: 0.3656676709651947, mean loss: 0.34395247566252446
Epoch: 40, step: 858, loss: 0.3614676594734192, mean loss: 0.34395277445956657
Epoch: 40, step: 859, loss: 0.32517334818840027, mean loss: 0.3439524541008789
Epoch: 40, step: 860, loss: 0.31451547145843506, mean loss: 0.34395195194324524
Epoch: 40, step: 861, loss: 0.34210947155952454, mean loss: 0.34395192051340007
Epoch: 40, step: 862, loss: 0.3039570450782776, mean loss: 0.34395123827476615
Epoch: 40, step: 863, loss: 0.3324328660964966, mean loss: 0.34395104179598307
Epoch: 40, step: 864, loss: 0.3429437279701233, mean loss: 0.3439510246136577
Epoch: 40, step: 865, loss: 0.30894890427589417, mean loss: 0.3439504275727486
Epoch: 40, step: 866, loss: 0.28822728991508484, mean loss: 0.34394947710389195
Epoch: 40, step: 867, loss: 0.3218829929828644, mean loss: 0.3439491007225704
Epoch: 40, step: 868, loss: 0.3397788405418396, mean loss: 0.34394902959292156
Epoch: 40, step: 869, loss: 0.3412807881832123, mean loss: 0.34394898408309027
Epoch: 40, step: 870, loss: 0.34311559796333313, mean loss: 0.34394896986900353
Epoch: 40, step: 871, loss: 0.32146722078323364, mean loss: 0.34394858643079423
Epoch: 40, step: 872, loss: 0.33963364362716675, mean loss: 0.34394851283840083
Epoch: 40, step: 873, loss: 0.3335154354572296, mean loss: 0.34394833490277676
Epoch: 40, step: 874, loss: 0.3368138372898102, mean loss: 0.3439482132263444
Epoch: 40, step: 875, loss: 0.31769922375679016, mean loss: 0.34394776556638346
Epoch: 40, step: 876, loss: 0.33911702036857605, mean loss: 0.3439476831824757
Epoch: 40, step: 877, loss: 0.3478357493877411, mean loss: 0.34394774948873114
Epoch: 40, step: 878, loss: 0.31057989597320557, mean loss: 0.3439471804501473
Epoch: 40, step: 879, loss: 0.3103930652141571, mean loss: 0.34394660824490797
Epoch: 40, step: 880, loss: 0.30044612288475037, mean loss: 0.34394586643482017
Epoch: 40, step: 881, loss: 0.3206864297389984, mean loss: 0.3439454698003825
Epoch: 40, step: 882, loss: 0.29766497015953064, mean loss: 0.3439446806098629
Epoch: 40, step: 883, loss: 0.39033564925193787, mean loss: 0.3439454716706473
Epoch: 40, step: 884, loss: 0.3660643994808197, mean loss: 0.3439458488371203
Epoch: 40, step: 885, loss: 0.2973015606403351, mean loss: 0.3439450534838448
Epoch: 40, step: 886, loss: 0.31832459568977356, mean loss: 0.34394461662504905
Epoch: 40, step: 887, loss: 0.32844123244285583, mean loss: 0.34394435227870845
Epoch: 40, step: 888, loss: 0.3456612229347229, mean loss: 0.34394438155236456
Epoch: 40, step: 889, loss: 0.3413478434085846, mean loss: 0.34394433728061446
Epoch: 40, step: 890, loss: 0.3365461826324463, mean loss: 0.34394421114202095
Epoch: 40, step: 891, loss: 0.34070295095443726, mean loss: 0.3439441558794521
Epoch: 40, step: 892, loss: 0.35037800669670105, mean loss: 0.34394426557291735
Epoch: 40, step: 893, loss: 0.3313550055027008, mean loss: 0.3439440509369152
Epoch: 40, step: 894, loss: 0.2953346371650696, mean loss: 0.34394322220255713
Epoch: 40, step: 895, loss: 0.36459439992904663, mean loss: 0.3439435742752816
Epoch: 40, step: 896, loss: 0.34826934337615967, mean loss: 0.3439436480221337
Epoch: 40, step: 897, loss: 0.3288023769855499, mean loss: 0.3439433898941539
Epoch: 40, step: 898, loss: 0.35472986102104187, mean loss: 0.34394357377848755
Epoch: 40, step: 899, loss: 0.34984055161476135, mean loss: 0.34394367430657885
Epoch: 40, step: 900, loss: 0.36454474925994873, mean loss: 0.34394402549518716
Epoch: 40, step: 901, loss: 0.31034916639328003, mean loss: 0.3439434528099889
Epoch: 40, step: 902, loss: 0.36387327313423157, mean loss: 0.3439437925440687
Epoch: 40, step: 903, loss: 0.31006988883018494, mean loss: 0.3439432151217362
Epoch: 40, step: 904, loss: 0.32578569650650024, mean loss: 0.343942905609785
Epoch: 40, step: 905, loss: 0.33339083194732666, mean loss: 0.3439427257428491
Epoch: 40, step: 906, loss: 0.30723410844802856, mean loss: 0.3439421000313368
Epoch: 40, step: 907, loss: 0.31141674518585205, mean loss: 0.34394154563447915
Epoch: 40, step: 908, loss: 0.3445497453212738, mean loss: 0.343941556001107
Epoch: 40, step: 909, loss: 0.33333519101142883, mean loss: 0.34394137522106627
Epoch: 40, step: 910, loss: 0.31671690940856934, mean loss: 0.34394091120194586
Epoch: 40, step: 911, loss: 0.40065181255340576, mean loss: 0.3439418777771666
Epoch: 40, step: 912, loss: 0.352745920419693, mean loss: 0.34394202782987643
Epoch: 40, step: 913, loss: 0.31995490193367004, mean loss: 0.3439416190095148
Epoch: 40, step: 914, loss: 0.3156014680862427, mean loss: 0.3439411360073687
Epoch: 40, step: 915, loss: 0.3513711392879486, mean loss: 0.3439412626350066
Epoch: 40, step: 916, loss: 0.3241990804672241, mean loss: 0.3439409261797998
Epoch: 40, step: 917, loss: 0.33716246485710144, mean loss: 0.34394081066016174
Epoch: 40, step: 918, loss: 0.3696645498275757, mean loss: 0.3439412490408289
Epoch: 40, step: 919, loss: 0.35980701446533203, mean loss: 0.34394151941856277
Epoch: 40, step: 920, loss: 0.35125070810317993, mean loss: 0.34394164397657445
Epoch: 40, step: 921, loss: 0.35128340125083923, mean loss: 0.34394176908746493
Epoch: 40, step: 922, loss: 0.3582009971141815, mean loss: 0.3439420120748382
Epoch: 40, step: 923, loss: 0.31369832158088684, mean loss: 0.34394149670965357
Epoch: 40, step: 924, loss: 0.35530373454093933, mean loss: 0.3439416903236577
Epoch: 40, step: 925, loss: 0.36122289299964905, mean loss: 0.3439419847925715
Epoch: 40, step: 926, loss: 0.31959280371665955, mean loss: 0.3439415698935125
Epoch: 40, step: 927, loss: 0.3232347071170807, mean loss: 0.34394121706392594
Epoch: 40, step: 928, loss: 0.32134997844696045, mean loss: 0.34394083213253135
Epoch: 40, step: 929, loss: 0.3276306986808777, mean loss: 0.3439405542294226
Epoch: 40, step: 930, loss: 0.30896830558776855, mean loss: 0.34393995835869895
Epoch: 40, step: 931, loss: 0.31592175364494324, mean loss: 0.3439394809818041
Epoch: 40, step: 932, loss: 0.3222253620624542, mean loss: 0.3439391110208391
Epoch: 40, step: 933, loss: 0.31493669748306274, mean loss: 0.34393861689173666
Epoch: 40, step: 934, loss: 0.35269612073898315, mean loss: 0.3439387660953119
Epoch: 40, step: 935, loss: 0.3194299340248108, mean loss: 0.34393834853990657
Epoch: 40, step: 936, loss: 0.3023530840873718, mean loss: 0.34393764006648453
Epoch: 40, step: 937, loss: 0.30532708764076233, mean loss: 0.34393698228338415
Epoch: 40, step: 938, loss: 0.3231094479560852, mean loss: 0.34393662746414827
Epoch: 40, step: 939, loss: 0.3299247622489929, mean loss: 0.34393638876116334
Epoch: 40, step: 940, loss: 0.3285577595233917, mean loss: 0.34393612677875696
Epoch: 40, step: 941, loss: 0.3378564715385437, mean loss: 0.34393602321064615
Epoch: 40, step: 942, loss: 0.33620110154151917, mean loss: 0.34393589144699405
Epoch: 40, step: 943, loss: 0.33123764395713806, mean loss: 0.3439356751372453
Epoch: 40, step: 944, loss: 0.3452233374118805, mean loss: 0.3439356970717019
Epoch: 40, step: 945, loss: 0.3284723460674286, mean loss: 0.34393543366845514
Epoch: 40, step: 946, loss: 0.3309016227722168, mean loss: 0.343935211653859
Epoch: 40, step: 947, loss: 0.33527871966362, mean loss: 0.34393506420390346
Epoch: 40, step: 948, loss: 0.31387728452682495, mean loss: 0.34393455222482566
Epoch: 40, step: 949, loss: 0.3702229857444763, mean loss: 0.3439349999923869
Epoch: 40, step: 950, loss: 0.37156999111175537, mean loss: 0.34393547068767605
Epoch: 40, step: 951, loss: 0.35998469591140747, mean loss: 0.34393574404278615
Epoch: 40, step: 952, loss: 0.37653592228889465, mean loss: 0.3439362992891242
Epoch: 40, step: 953, loss: 0.33722132444381714, mean loss: 0.3439361849215995
Epoch: 40, step: 954, loss: 0.3043938875198364, mean loss: 0.343935511460007
Epoch: 40, step: 955, loss: 0.2925815284252167, mean loss: 0.34393463684349646
Epoch: 40, step: 956, loss: 0.31305715441703796, mean loss: 0.34393411097394544
Epoch: 40, step: 957, loss: 0.41586410999298096, mean loss: 0.3439353359815925
Epoch: 40, step: 958, loss: 0.2904405891895294, mean loss: 0.34393442495199744
Epoch: 40, step: 959, loss: 0.35394468903541565, mean loss: 0.34393459542652205
Epoch: 40, step: 960, loss: 0.3582831621170044, mean loss: 0.3439348397780605
Epoch: 40, step: 961, loss: 0.3564949929714203, mean loss: 0.343935053669842
Epoch: 40, step: 962, loss: 0.3598034977912903, mean loss: 0.3439353238952072
Epoch: 40, step: 963, loss: 0.3456341028213501, mean loss: 0.34393535282339543
Epoch: 40, step: 964, loss: 0.34815874695777893, mean loss: 0.34393542474155864
Epoch: 40, step: 965, loss: 0.30877918004989624, mean loss: 0.3439348260928393
Epoch: 40, step: 966, loss: 0.31862157583236694, mean loss: 0.3439343950602604
Epoch: 40, step: 967, loss: 0.3184598982334137, mean loss: 0.3439339612893704
Epoch: 40, step: 968, loss: 0.33233487606048584, mean loss: 0.3439337637875361
Epoch: 40, step: 969, loss: 0.34757834672927856, mean loss: 0.3439338258441161
Epoch: 40, step: 970, loss: 0.32049086689949036, mean loss: 0.3439334266859382
Epoch: 40, step: 971, loss: 0.3229854702949524, mean loss: 0.34393307001570067
Epoch: 40, step: 972, loss: 0.3158879280090332, mean loss: 0.3439325925134105
Epoch: 40, step: 973, loss: 0.32844337821006775, mean loss: 0.34393232879538854
Epoch: 40, step: 974, loss: 0.3362905979156494, mean loss: 0.34393219869015523
Epoch: 40, step: 975, loss: 0.3084845244884491, mean loss: 0.34393159518167316
Epoch: 40, step: 976, loss: 0.32247960567474365, mean loss: 0.3439312299606114
Epoch: 40, step: 977, loss: 0.35307610034942627, mean loss: 0.34393138564978004
Epoch: 40, step: 978, loss: 0.30183523893356323, mean loss: 0.3439306689854392
Epoch: 40, step: 979, loss: 0.3401642441749573, mean loss: 0.34393060486516663
Epoch: 40, step: 980, loss: 0.3277696967124939, mean loss: 0.34393032974373267
Epoch: 40, step: 981, loss: 0.3297615647315979, mean loss: 0.3439300885404197
Epoch: 40, step: 982, loss: 0.3467603027820587, mean loss: 0.34393013672001965
Epoch: 40, step: 983, loss: 0.31313997507095337, mean loss: 0.34392961257863247
Epoch: 40, step: 984, loss: 0.3556874394416809, mean loss: 0.34392981272888973
Epoch: 40, step: 985, loss: 0.3123493790626526, mean loss: 0.3439292751529924
Epoch: 40, step: 986, loss: 0.3439156413078308, mean loss: 0.3439292749209151
Epoch: 40, step: 987, loss: 0.3137205243110657, mean loss: 0.34392876071191036
Epoch: 40, step: 988, loss: 0.3312585949897766, mean loss: 0.3439285450458442
Epoch: 40, step: 989, loss: 0.30761030316352844, mean loss: 0.34392792686300366
Epoch: 40, step: 990, loss: 0.28942224383354187, mean loss: 0.3439269991224881
Epoch: 40, step: 991, loss: 0.33762848377227783, mean loss: 0.3439268919173657
Epoch: 40, step: 992, loss: 0.3399219810962677, mean loss: 0.34392682375215167
Epoch: 40, step: 993, loss: 0.3521457016468048, mean loss: 0.34392696363842146
Epoch: 40, step: 994, loss: 0.32680994272232056, mean loss: 0.3439266723096679
Epoch: 40, step: 995, loss: 0.3668523132801056, mean loss: 0.3439270624934954
Epoch: 40, step: 996, loss: 0.3874865174293518, mean loss: 0.3439278038426953
Epoch: 40, step: 997, loss: 0.3803631663322449, mean loss: 0.34392842393464
Epoch: 40, step: 998, loss: 0.34570759534835815, mean loss: 0.3439284542137703
Epoch: 40, step: 999, loss: 0.3182157278060913, mean loss: 0.3439280166248253
Epoch: 40, step: 1000, loss: 0.29015102982521057, mean loss: 0.34392710144321165
Epoch: 40, step: 1001, loss: 0.3038195073604584, mean loss: 0.3439264189001722
Epoch: 40, step: 1002, loss: 0.3366297483444214, mean loss: 0.34392629472900066
Epoch: 40, step: 1003, loss: 0.31446805596351624, mean loss: 0.3439257934316287
Epoch: 40, step: 1004, loss: 0.3265681862831116, mean loss: 0.34392549805841083
Epoch: 40, step: 1005, loss: 0.33991360664367676, mean loss: 0.34392542978948976
Epoch: 40, step: 1006, loss: 0.3750678300857544, mean loss: 0.3439259597195576
Epoch: 40, step: 1007, loss: 0.3329947590827942, mean loss: 0.3439257737135571
Epoch: 40, step: 1008, loss: 0.3331514596939087, mean loss: 0.3439255903802688
Epoch: 40, step: 1009, loss: 0.3554951548576355, mean loss: 0.3439257872420091
Epoch: 40, step: 1010, loss: 0.3252462148666382, mean loss: 0.3439254694054507
Epoch: 40, step: 1011, loss: 0.31568917632102966, mean loss: 0.3439249889676047
Epoch: 40, step: 1012, loss: 0.301577091217041, mean loss: 0.34392426843440493
Epoch: 40, step: 1013, loss: 0.3999404013156891, mean loss: 0.34392522151115457
Epoch: 40, step: 1014, loss: 0.3125600218772888, mean loss: 0.34392468786250063
Epoch: 40, step: 1015, loss: 0.37071672081947327, mean loss: 0.34392514369537386
Epoch: 40, step: 1016, loss: 0.36845335364341736, mean loss: 0.3439255610050349
Epoch: 40, step: 1017, loss: 0.31406253576278687, mean loss: 0.34392505294036374
Epoch: 40, step: 1018, loss: 0.3626311123371124, mean loss: 0.3439253711842841
Epoch: 40, step: 1019, loss: 0.3327518105506897, mean loss: 0.34392518109308584
Epoch: 40, step: 1020, loss: 0.36660611629486084, mean loss: 0.34392556694795734
Epoch: 40, step: 1021, loss: 0.34014421701431274, mean loss: 0.34392550261959265
Epoch: 40, step: 1022, loss: 0.305819571018219, mean loss: 0.3439248543721129
Epoch: 40, step: 1023, loss: 0.32811856269836426, mean loss: 0.3439245854844619
Epoch: 40, step: 1024, loss: 0.3080614507198334, mean loss: 0.34392397541157316
Epoch: 40, step: 1025, loss: 0.33843186497688293, mean loss: 0.3439238819860903
Epoch: 40, step: 1026, loss: 0.33044004440307617, mean loss: 0.34392365261841407
Epoch: 40, step: 1027, loss: 0.29688552021980286, mean loss: 0.34392285248688387
Epoch: 40, step: 1028, loss: 0.3247990012168884, mean loss: 0.3439225271904633
Epoch: 40, step: 1029, loss: 0.3363531529903412, mean loss: 0.34392239843771283
Epoch: 40, step: 1030, loss: 0.3514188230037689, mean loss: 0.3439225259474433
Epoch: 40, step: 1031, loss: 0.3256884813308716, mean loss: 0.34392221580244714
Epoch: 40, step: 1032, loss: 0.31486454606056213, mean loss: 0.34392172156555256
Epoch: 40, step: 1033, loss: 0.3318021297454834, mean loss: 0.34392151542901106
Epoch: 40, step: 1034, loss: 0.3448479175567627, mean loss: 0.3439215311854891
Epoch: 40, step: 1035, loss: 0.34630751609802246, mean loss: 0.3439215717662244
Epoch: 40, step: 1036, loss: 0.3805764615535736, mean loss: 0.34392219518051065
Epoch: 40, step: 1037, loss: 0.30928412079811096, mean loss: 0.3439216060775755
Epoch: 40, step: 1038, loss: 0.3759792149066925, mean loss: 0.3439221512842768
Epoch: 40, step: 1039, loss: 0.32787609100341797, mean loss: 0.34392187839209515
Epoch: 40, step: 1040, loss: 0.32226690649986267, mean loss: 0.34392151011652344
Epoch: 40, step: 1041, loss: 0.332734078168869, mean loss: 0.34392131986054664
Epoch: 40, step: 1042, loss: 0.4093805253505707, mean loss: 0.34392243305554504
Epoch: 40, step: 1043, loss: 0.3165391981601715, mean loss: 0.3439219673859495
Epoch: 40, step: 1044, loss: 0.3241298496723175, mean loss: 0.3439216308139282
Epoch: 40, step: 1045, loss: 0.35187727212905884, mean loss: 0.34392176610014585
Epoch: 40, step: 1046, loss: 0.299520879983902, mean loss: 0.3439210110729192
Epoch: 40, step: 1047, loss: 0.39420270919799805, mean loss: 0.3439218660875112
Epoch: 40, step: 1048, loss: 0.3463059067726135, mean loss: 0.3439219066262159
Epoch: 40, step: 1049, loss: 0.3270561099052429, mean loss: 0.3439216198417112
Epoch: 40, step: 1050, loss: 0.2910080552101135, mean loss: 0.3439207201194716
Epoch: 40, step: 1051, loss: 0.3026660084724426, mean loss: 0.343920018651886
Epoch: 40, step: 1052, loss: 0.32979440689086914, mean loss: 0.3439197784734941
Epoch: 40, step: 1053, loss: 0.3616648018360138, mean loss: 0.343920080187769
Epoch: 40, step: 1054, loss: 0.3252885341644287, mean loss: 0.3439197634055532
Epoch: 40, step: 1055, loss: 0.317743718624115, mean loss: 0.34391931835582557
Epoch: 40, step: 1056, loss: 0.30765652656555176, mean loss: 0.3439187018199297
Epoch: 40, step: 1057, loss: 0.32785117626190186, mean loss: 0.3439184286463169
Epoch: 40, step: 1058, loss: 0.31606683135032654, mean loss: 0.3439179551327023
Epoch: 40, step: 1059, loss: 0.34310805797576904, mean loss: 0.34391794136362447
Epoch: 40, step: 1060, loss: 0.34453538060188293, mean loss: 0.3439179518605429
Epoch: 40, step: 1061, loss: 0.373687744140625, mean loss: 0.3439184579601703
Epoch: 40, step: 1062, loss: 0.32578590512275696, mean loss: 0.34391814970399776
Epoch: 40, step: 1063, loss: 0.3398374021053314, mean loss: 0.34391808033184357
Epoch: 40, step: 1064, loss: 0.3631208837032318, mean loss: 0.3439184067713399
Epoch: 40, step: 1065, loss: 0.29264867305755615, mean loss: 0.3439175352224718
Epoch: 40, step: 1066, loss: 0.349641352891922, mean loss: 0.34391763252163154
Epoch: 40, step: 1067, loss: 0.31275150179862976, mean loss: 0.34391710273767284
Epoch: 40, step: 1068, loss: 0.3495739698410034, mean loss: 0.3439171988954709
Epoch: 40, step: 1069, loss: 0.37567517161369324, mean loss: 0.34391773872162623
Epoch: 40, step: 1070, loss: 0.3288875222206116, mean loss: 0.34391748324039184
Epoch: 40, step: 1071, loss: 0.319767028093338, mean loss: 0.34391707274176614
Epoch: 40, step: 1072, loss: 0.3389725685119629, mean loss: 0.34391698869872517
Epoch: 40, step: 1073, loss: 0.3953549861907959, mean loss: 0.34391786298905885
Epoch: 40, step: 1074, loss: 0.35007810592651367, mean loss: 0.34391796769277155
Epoch: 40, step: 1075, loss: 0.3118716776371002, mean loss: 0.34391742302131095
Epoch: 40, step: 1076, loss: 0.3332279622554779, mean loss: 0.34391724134208246
Epoch: 40, step: 1077, loss: 0.3263501226902008, mean loss: 0.343916942774513
Epoch: 40, step: 1078, loss: 0.3026461601257324, mean loss: 0.34391624135568116
Epoch: 40, step: 1079, loss: 0.3403315544128418, mean loss: 0.3439161804330615
Epoch: 40, step: 1080, loss: 0.3639802038669586, mean loss: 0.3439165214201867
Epoch: 40, step: 1081, loss: 0.31929609179496765, mean loss: 0.34391610300426567
Epoch: 40, step: 1082, loss: 0.3137548863887787, mean loss: 0.3439155904332442
Epoch: 40, step: 1083, loss: 0.3097333014011383, mean loss: 0.34391500953648274
Epoch: 40, step: 1084, loss: 0.32067617774009705, mean loss: 0.34391461462048656
Epoch: 40, step: 1085, loss: 0.3135931193828583, mean loss: 0.3439140993519001
Epoch: 40, step: 1086, loss: 0.32784101366996765, mean loss: 0.34391382621842376
Epoch: 40, step: 1087, loss: 0.3374788165092468, mean loss: 0.34391371686874816
Epoch: 40, step: 1088, loss: 0.29034653306007385, mean loss: 0.3439128066207608
Epoch: 40, step: 1089, loss: 0.3264809846878052, mean loss: 0.3439125104130814
Epoch: 40, step: 1090, loss: 0.30323660373687744, mean loss: 0.3439118192454432
Epoch: 40, step: 1091, loss: 0.3112255036830902, mean loss: 0.3439112638468915
Epoch: 40, step: 1092, loss: 0.339197039604187, mean loss: 0.34391118374521035
Epoch: 40, step: 1093, loss: 0.40935200452804565, mean loss: 0.34391229566319015
Epoch: 40, step: 1094, loss: 0.3448026478290558, mean loss: 0.34391231079108353
Epoch: 40, step: 1095, loss: 0.3303287923336029, mean loss: 0.3439120799986672
Epoch: 40, step: 1096, loss: 0.35841378569602966, mean loss: 0.3439123263874688
Epoch: 40, step: 1097, loss: 0.3015589714050293, mean loss: 0.34391160680211114
Epoch: 40, step: 1098, loss: 0.3462526500225067, mean loss: 0.3439116465758623
Epoch: 40, step: 1099, loss: 0.2967425584793091, mean loss: 0.3439108451982188
Epoch: 40, step: 1100, loss: 0.32238703966140747, mean loss: 0.3439104795264576
Epoch: 40, step: 1101, loss: 0.3321365714073181, mean loss: 0.3439102795008363
Epoch: 40, step: 1102, loss: 0.3042481243610382, mean loss: 0.34390960569632173
Epoch: 40, step: 1103, loss: 0.37660253047943115, mean loss: 0.34391016109392947
Epoch: 40, step: 1104, loss: 0.35379695892333984, mean loss: 0.34391032905108276
Epoch: 40, step: 1105, loss: 0.3197495937347412, mean loss: 0.3439099186149173
Epoch: 40, step: 1106, loss: 0.30968526005744934, mean loss: 0.3439093372253687
Epoch: 40, step: 1107, loss: 0.3310466408729553, mean loss: 0.3439091187247172
Epoch: 40, step: 1108, loss: 0.32805177569389343, mean loss: 0.34390884935810606
Epoch: 40, step: 1109, loss: 0.3361620008945465, mean loss: 0.34390871776564025
Epoch: 40, step: 1110, loss: 0.3720134496688843, mean loss: 0.3439091951608247
Epoch: 40, step: 1111, loss: 0.3350255787372589, mean loss: 0.34390904426368474
Epoch: 40, step: 1112, loss: 0.3249451220035553, mean loss: 0.3439087221479057
Epoch: 40, step: 1113, loss: 0.36488112807273865, mean loss: 0.34390907837316514
Epoch: 40, step: 1114, loss: 0.34268054366111755, mean loss: 0.3439090575063335
Epoch: 40, step: 1115, loss: 0.3200784921646118, mean loss: 0.34390865274776733
Epoch: 40, step: 1116, loss: 0.35190480947494507, mean loss: 0.3439087885589793
Epoch: 40, step: 1117, loss: 0.3185664117336273, mean loss: 0.3439083581371439
Epoch: 40, step: 1118, loss: 0.3588932752609253, mean loss: 0.3439086126407381
Epoch: 40, step: 1119, loss: 0.3430490493774414, mean loss: 0.3439085980421772
Epoch: 40, step: 1120, loss: 0.31866151094436646, mean loss: 0.3439081692606161
Epoch: 40, step: 1121, loss: 0.30353742837905884, mean loss: 0.3439074836395285
Epoch: 40, step: 1122, loss: 0.3951960504055023, mean loss: 0.3439083546645572
Epoch: 40, step: 1123, loss: 0.2981535792350769, mean loss: 0.34390757763216423
Epoch: 40, step: 1124, loss: 0.3506505787372589, mean loss: 0.34390769214351863
Epoch: 40, step: 1125, loss: 0.3261025846004486, mean loss: 0.3439073897778028
Epoch: 40, step: 1126, loss: 0.30992621183395386, mean loss: 0.3439068127204226
Epoch: 40, step: 1127, loss: 0.3315117061138153, mean loss: 0.3439066022343031
Epoch: 40, step: 1128, loss: 0.3701475262641907, mean loss: 0.34390704783405907
Epoch: 40, step: 1129, loss: 0.3140290379524231, mean loss: 0.3439065404811998
Epoch: 40, step: 1130, loss: 0.31808680295944214, mean loss: 0.34390610204854416
Epoch: 40, step: 1131, loss: 0.3414326310157776, mean loss: 0.3439060600484247
Epoch: 40, step: 1132, loss: 0.3318624198436737, mean loss: 0.3439058555480562
Epoch: 40, step: 1133, loss: 0.3171978294849396, mean loss: 0.34390540205489795
Epoch: 40, step: 1134, loss: 0.34492355585098267, mean loss: 0.343905419342508
Epoch: 40, step: 1135, loss: 0.31948140263557434, mean loss: 0.3439050046451312
Epoch: 40, step: 1136, loss: 0.3268733620643616, mean loss: 0.3439047154683891
Epoch: 40, step: 1137, loss: 0.32422497868537903, mean loss: 0.34390438133587553
Epoch: 40, step: 1138, loss: 0.36396077275276184, mean loss: 0.3439047218576402
Epoch: 40, step: 1139, loss: 0.3700914680957794, mean loss: 0.34390516645435054
Epoch: 40, step: 1140, loss: 0.3240077495574951, mean loss: 0.34390482864316063
Epoch: 40, step: 1141, loss: 0.3695400357246399, mean loss: 0.34390526386110026
Epoch: 40, step: 1142, loss: 0.33908548951148987, mean loss: 0.3439051820354827
Epoch: 40, step: 1143, loss: 0.36450180411338806, mean loss: 0.3439055316997174
Epoch: 40, step: 1144, loss: 0.3578837811946869, mean loss: 0.3439057690012961
Epoch: 40, step: 1145, loss: 0.3457232713699341, mean loss: 0.3439057998555787
Epoch: 40, step: 1146, loss: 0.38728368282318115, mean loss: 0.3439065362346672
Epoch: 40, step: 1147, loss: 0.31203338503837585, mean loss: 0.3439059951680685
Epoch: 40, step: 1148, loss: 0.32424402236938477, mean loss: 0.3439056613994967
Epoch: 40, step: 1149, loss: 0.3159944713115692, mean loss: 0.343905187605742
Epoch: 40, step: 1150, loss: 0.30563420057296753, mean loss: 0.3439045379649783
Epoch: 40, step: 1151, loss: 0.3161090314388275, mean loss: 0.3439040661509756
Epoch: 40, step: 1152, loss: 0.35908740758895874, mean loss: 0.34390432387578057
Epoch: 40, step: 1153, loss: 0.30246663093566895, mean loss: 0.34390362051676676
Epoch: 40, step: 1154, loss: 0.37523865699768066, mean loss: 0.34390415238533134
Epoch: 40, step: 1155, loss: 0.3743704557418823, mean loss: 0.3439046694995848
Epoch: 40, step: 1156, loss: 0.33160191774368286, mean loss: 0.34390446068461195
Epoch: 40, step: 1157, loss: 0.3550303876399994, mean loss: 0.3439046495220972
Epoch: 40, step: 1158, loss: 0.3626442551612854, mean loss: 0.3439049675791864
Epoch: 40, step: 1159, loss: 0.32449135184288025, mean loss: 0.3439046380880843
Epoch: 40, step: 1160, loss: 0.3663202226161957, mean loss: 0.3439050185226412
Epoch: 40, step: 1161, loss: 0.29644080996513367, mean loss: 0.34390421297957485
Epoch: 40, step: 1162, loss: 0.35563018918037415, mean loss: 0.34390441198465266
Epoch: 40, step: 1163, loss: 0.3434504270553589, mean loss: 0.3439044042800683
Epoch: 40, step: 1164, loss: 0.3353082537651062, mean loss: 0.34390425839715755
Epoch: 40, step: 1165, loss: 0.3279203474521637, mean loss: 0.34390398714319587
Epoch: 40, step: 1166, loss: 0.33593395352363586, mean loss: 0.34390385189053374
Epoch: 40, step: 1167, loss: 0.2894775867462158, mean loss: 0.3439029282843509
Epoch: 40, step: 1168, loss: 0.3831522464752197, mean loss: 0.3439035943285429
Epoch: 40, step: 1169, loss: 0.30417993664741516, mean loss: 0.3439029202464509
Epoch: 40, step: 1170, loss: 0.34445199370384216, mean loss: 0.34390292956367713
Epoch: 40, step: 1171, loss: 0.386244535446167, mean loss: 0.3439036480460956
Epoch: 40, step: 1172, loss: 0.30102235078811646, mean loss: 0.3439029204181578
Epoch: 40, step: 1173, loss: 0.2964465618133545, mean loss: 0.3439021151723132
Epoch: 40, step: 1174, loss: 0.34262824058532715, mean loss: 0.3439020935574055
Epoch: 40, step: 1175, loss: 0.32421818375587463, mean loss: 0.3439017595695237
Epoch: 40, step: 1176, loss: 0.3261845111846924, mean loss: 0.3439014589561843
Epoch: 40, step: 1177, loss: 0.3538453280925751, mean loss: 0.34390162767363547
Epoch: 40, step: 1178, loss: 0.334683358669281, mean loss: 0.3439014712700826
Epoch: 40, step: 1179, loss: 0.3891303241252899, mean loss: 0.34390223864118635
Epoch: 40, step: 1180, loss: 0.3169306516647339, mean loss: 0.34390178103804125
Epoch: 40, step: 1181, loss: 0.36201179027557373, mean loss: 0.34390208828939406
Epoch: 40, step: 1182, loss: 0.3108876943588257, mean loss: 0.3439015281822748
Epoch: 40, step: 1183, loss: 0.3500623404979706, mean loss: 0.3439016327020277
Epoch: 40, step: 1184, loss: 0.3490447998046875, mean loss: 0.34390171995568963
Epoch: 40, step: 1185, loss: 0.331601083278656, mean loss: 0.34390151127933033
Epoch: 40, step: 1186, loss: 0.322905957698822, mean loss: 0.34390115510253455
Epoch: 40, step: 1187, loss: 0.31803688406944275, mean loss: 0.343900716338352
Epoch: 40, step: 1188, loss: 0.3251047432422638, mean loss: 0.3439003974869195
Epoch: 40, step: 1189, loss: 0.3373430669307709, mean loss: 0.34390028625145624
Epoch: 40, step: 1190, loss: 0.3108418881893158, mean loss: 0.3438997254738942
Epoch: 40, step: 1191, loss: 0.3279561400413513, mean loss: 0.34389945502360525
Epoch: 40, step: 1192, loss: 0.37108948826789856, mean loss: 0.34389991623903526
Epoch: 40, step: 1193, loss: 0.333532452583313, mean loss: 0.34389974038220356
Epoch: 40, step: 1194, loss: 0.32606181502342224, mean loss: 0.343899437813713
Epoch: 40, step: 1195, loss: 0.31046220660209656, mean loss: 0.34389887065801705
Epoch: 40, step: 1196, loss: 0.28433433175086975, mean loss: 0.34389786035323716
Epoch: 40, step: 1197, loss: 0.3600175976753235, mean loss: 0.34389813376375516
Epoch: 40, step: 1198, loss: 0.3406714200973511, mean loss: 0.3438980790356616
Epoch: 40, step: 1199, loss: 0.30938270688056946, mean loss: 0.34389749363247035
Epoch: 40, step: 1200, loss: 0.3575384318828583, mean loss: 0.34389772498774335
Epoch: 40, step: 1201, loss: 0.32560041546821594, mean loss: 0.34389741466398366
Epoch: 40, step: 1202, loss: 0.3434518277645111, mean loss: 0.3438974071069242
Epoch: 40, step: 1203, loss: 0.35386741161346436, mean loss: 0.3438975761932227
Epoch: 40, step: 1204, loss: 0.3442624807357788, mean loss: 0.3438975823817166
Epoch: 40, step: 1205, loss: 0.32105568051338196, mean loss: 0.3438971950076049
Epoch: 40, step: 1206, loss: 0.3133910000324249, mean loss: 0.34389667766409115
Epoch: 40, step: 1207, loss: 0.3711540400981903, mean loss: 0.34389713990399134
Epoch: 40, step: 1208, loss: 0.34089580178260803, mean loss: 0.34389708900711125
Epoch: 40, step: 1209, loss: 0.3605778217315674, mean loss: 0.34389737187522595
Epoch: 40, step: 1210, loss: 0.30262866616249084, mean loss: 0.34389667206166147
Epoch: 40, step: 1211, loss: 0.32640376687049866, mean loss: 0.34389637543096907
Epoch: 40, step: 1212, loss: 0.32588574290275574, mean loss: 0.3438960700262495
Epoch: 40, step: 1213, loss: 0.33523598313331604, mean loss: 0.343895923180404
Epoch: 40, step: 1214, loss: 0.29560720920562744, mean loss: 0.3438951043806757
Epoch: 40, step: 1215, loss: 0.32792434096336365, mean loss: 0.343894833579614
Epoch: 40, step: 1216, loss: 0.33282995223999023, mean loss: 0.3438946459661148
Epoch: 40, step: 1217, loss: 0.33942416310310364, mean loss: 0.34389457016695474
Epoch: 40, step: 1218, loss: 0.3283620774745941, mean loss: 0.3438943068106297
Epoch: 40, step: 1219, loss: 0.3400706350803375, mean loss: 0.34389424198065804
Epoch: 40, step: 1220, loss: 0.3017631471157074, mean loss: 0.34389352766427034
Epoch: 40, step: 1221, loss: 0.3093704283237457, mean loss: 0.34389294234842244
Epoch: 40, step: 1222, loss: 0.3225325345993042, mean loss: 0.34389258020326624
Epoch: 40, step: 1223, loss: 0.325133740901947, mean loss: 0.34389226217059127
Epoch: 40, step: 1224, loss: 0.37289923429489136, mean loss: 0.34389275393921254
Epoch: 40, step: 1225, loss: 0.35316434502601624, mean loss: 0.34389291112212184
Epoch: 40, step: 1226, loss: 0.3536420166492462, mean loss: 0.3438930763976152
Epoch: 40, step: 1227, loss: 0.2959335446357727, mean loss: 0.34389226335883166
Epoch: 40, step: 1228, loss: 0.31438496708869934, mean loss: 0.3438917631419053
Epoch: 40, step: 1229, loss: 0.31229686737060547, mean loss: 0.34389122754441803
Epoch: 40, step: 1230, loss: 0.3273819386959076, mean loss: 0.3438909476832723
Epoch: 40, step: 1231, loss: 0.32099783420562744, mean loss: 0.3438905596117799
Epoch: 40, step: 1232, loss: 0.31524550914764404, mean loss: 0.34389007404484034
Epoch: 40, step: 1233, loss: 0.3691227436065674, mean loss: 0.34389050176070235
Epoch: 40, step: 1234, loss: 0.33414486050605774, mean loss: 0.3438903365663426
Epoch: 40, step: 1235, loss: 0.28684690594673157, mean loss: 0.3438893696629827
Epoch: 40, step: 1236, loss: 0.29440224170684814, mean loss: 0.3438885308554509
Epoch: 40, step: 1237, loss: 0.35803449153900146, mean loss: 0.3438887706256242
Epoch: 40, step: 1238, loss: 0.30399855971336365, mean loss: 0.34388809450889485
Epoch: 40, step: 1239, loss: 0.374081552028656, mean loss: 0.34388860626241213
Epoch: 40, step: 1240, loss: 0.34530800580978394, mean loss: 0.34388863031962386
Epoch: 40, step: 1241, loss: 0.3633553981781006, mean loss: 0.3438889602536576
Epoch: 40, step: 1242, loss: 0.34702691435813904, mean loss: 0.3438890134366162
Epoch: 40, step: 1243, loss: 0.2906840145587921, mean loss: 0.3438881117181077
Epoch: 40, step: 1244, loss: 0.30295851826667786, mean loss: 0.3438874180549698
Epoch: 40, step: 1245, loss: 0.2992728054523468, mean loss: 0.343886661951987
Epoch: 40, step: 1246, loss: 0.3065706193447113, mean loss: 0.34388602955171915
Epoch: 40, step: 1247, loss: 0.3363584280014038, mean loss: 0.3438859019825497
Epoch: 40, step: 1248, loss: 0.3371119797229767, mean loss: 0.3438857871878191
Epoch: 40, step: 1249, loss: 0.34153756499290466, mean loss: 0.3438857473941876
Epoch: 40, step: 1250, loss: 0.329706072807312, mean loss: 0.34388550710551957
Epoch: 40, step: 1251, loss: 0.3336961567401886, mean loss: 0.34388533443978436
Epoch: 40, step: 1252, loss: 0.35462456941604614, mean loss: 0.3438855164206187
Epoch: 40, step: 1253, loss: 0.37406736612319946, mean loss: 0.3438860278560358
Epoch: 40, step: 1254, loss: 0.3376985490322113, mean loss: 0.34388592301016907
Epoch: 40, step: 1255, loss: 0.3401722311973572, mean loss: 0.34388586008330496
Epoch: 40, step: 1256, loss: 0.30830466747283936, mean loss: 0.34388525718595997
Epoch: 40, step: 1257, loss: 0.3095346689224243, mean loss: 0.3438846751501698
Epoch: 40, step: 1258, loss: 0.31957346200942993, mean loss: 0.3438842632283626
Epoch: 40, step: 1259, loss: 0.4117976725101471, mean loss: 0.34388541391303357
Epoch: 40, step: 1260, loss: 0.3252700865268707, mean loss: 0.3438850985112717
Epoch: 40, step: 1261, loss: 0.3021351993083954, mean loss: 0.34388439114962344
Epoch: 40, step: 1262, loss: 0.33033376932144165, mean loss: 0.3438841615675651
Epoch: 40, step: 1263, loss: 0.3642657995223999, mean loss: 0.3438845068785904
Epoch: 40, step: 1264, loss: 0.3267839550971985, mean loss: 0.3438842171614912
Epoch: 40, step: 1265, loss: 0.3372156620025635, mean loss: 0.3438841041849189
Epoch: 40, step: 1266, loss: 0.34726154804229736, mean loss: 0.3438841614035452
Epoch: 40, step: 1267, loss: 0.35451748967170715, mean loss: 0.3438843415439577
Epoch: 40, step: 1268, loss: 0.3310537338256836, mean loss: 0.3438841241828688
Epoch: 40, step: 1269, loss: 0.3299599587917328, mean loss: 0.343883888300006
Epoch: 40, step: 1270, loss: 0.30912867188453674, mean loss: 0.34388329953789093
Epoch: 40, step: 1271, loss: 0.35762566328048706, mean loss: 0.3438835323330485
Epoch: 40, step: 1272, loss: 0.340779572725296, mean loss: 0.34388347975297284
Epoch: 40, step: 1273, loss: 0.3251260817050934, mean loss: 0.3438831620140758
Epoch: 40, step: 1274, loss: 0.343349814414978, mean loss: 0.3438831529796454
Epoch: 40, step: 1275, loss: 0.330337792634964, mean loss: 0.3438829235372654
Epoch: 40, step: 1276, loss: 0.3319490849971771, mean loss: 0.3438827213955824
Epoch: 40, step: 1277, loss: 0.34530970454216003, mean loss: 0.34388274556616993
Epoch: 40, step: 1278, loss: 0.37363922595977783, mean loss: 0.3438832495801335
Epoch: 40, step: 1279, loss: 0.33872875571250916, mean loss: 0.3438831622750206
Epoch: 40, step: 1280, loss: 0.3075040578842163, mean loss: 0.3438825461082146
Epoch: 40, step: 1281, loss: 0.33263063430786133, mean loss: 0.3438823555335085
Epoch: 40, step: 1282, loss: 0.3058595061302185, mean loss: 0.3438817115477794
Epoch: 40, step: 1283, loss: 0.33209240436553955, mean loss: 0.34388151187791993
Epoch: 40, step: 1284, loss: 0.34301143884658813, mean loss: 0.34388149714215854
Epoch: 40, step: 1285, loss: 0.31688785552978516, mean loss: 0.3438810399792413
Epoch: 40, step: 1286, loss: 0.32719895243644714, mean loss: 0.3438807574570549
Epoch: 40, step: 1287, loss: 0.3776210844516754, mean loss: 0.343881328862132
Epoch: 40, step: 1288, loss: 0.32434794306755066, mean loss: 0.34388099806252836
Epoch: 40, step: 1289, loss: 0.32749029994010925, mean loss: 0.34388072048931717
Epoch: 40, step: 1290, loss: 0.34263014793395996, mean loss: 0.3438806993114784
Epoch: 40, step: 1291, loss: 0.32956957817077637, mean loss: 0.3438804569636978
Epoch: 40, step: 1292, loss: 0.33499976992607117, mean loss: 0.34388030657867014
Epoch: 40, step: 1293, loss: 0.34408602118492126, mean loss: 0.34388031006217007
Epoch: 40, step: 1294, loss: 0.30177220702171326, mean loss: 0.3438795970301992
Epoch: 40, step: 1295, loss: 0.33674582839012146, mean loss: 0.34387947623352083
Epoch: 40, step: 1296, loss: 0.3137868344783783, mean loss: 0.34387896668102486
Epoch: 40, step: 1297, loss: 0.3586660921573639, mean loss: 0.3438792170641309
Epoch: 40, step: 1298, loss: 0.34374532103538513, mean loss: 0.3438792147969738
Epoch: 40, step: 1299, loss: 0.3171160817146301, mean loss: 0.34387876164538084
Epoch: 40, step: 1300, loss: 0.35379716753959656, mean loss: 0.3438789295803277
Epoch: 40, step: 1301, loss: 0.37431269884109497, mean loss: 0.34387944486543925
Epoch: 40, step: 1302, loss: 0.340144544839859, mean loss: 0.34387938162957205
Epoch: 40, step: 1303, loss: 0.30002716183662415, mean loss: 0.34387863917698175
Epoch: 40, step: 1304, loss: 0.3256874680519104, mean loss: 0.34387833119135364
Epoch: 40, step: 1305, loss: 0.33720922470092773, mean loss: 0.34387821828195586
Epoch: 40, step: 1306, loss: 0.3666102886199951, mean loss: 0.34387860313424795
Epoch: 40, step: 1307, loss: 0.3219490647315979, mean loss: 0.34387823187504835
Epoch: 40, step: 1308, loss: 0.3126280605792999, mean loss: 0.343877702829842
Epoch: 40, step: 1309, loss: 0.3230530023574829, mean loss: 0.3438773502870881
Epoch: 40, step: 1310, loss: 0.2968237102031708, mean loss: 0.34387655372633774
Epoch: 40, step: 1311, loss: 0.3220615088939667, mean loss: 0.3438761844304813
Epoch: 40, step: 1312, loss: 0.3707362413406372, mean loss: 0.3438766391230974
Epoch: 40, step: 1313, loss: 0.29895156621932983, mean loss: 0.3438758786350163
Epoch: 40, step: 1314, loss: 0.37436503171920776, mean loss: 0.34387639474425175
Epoch: 40, step: 1315, loss: 0.36640557646751404, mean loss: 0.34387677610354694
Epoch: 40, step: 1316, loss: 0.36375370621681213, mean loss: 0.3438771125615613
Epoch: 40, step: 1317, loss: 0.35328394174575806, mean loss: 0.3438772717888402
Epoch: 40, step: 1318, loss: 0.358560711145401, mean loss: 0.3438775203279041
Epoch: 40, step: 1319, loss: 0.3106502890586853, mean loss: 0.34387695791708367
Epoch: 40, step: 1320, loss: 0.36984458565711975, mean loss: 0.34387739744295054
Epoch: 40, step: 1321, loss: 0.3197864592075348, mean loss: 0.3438769896886728
Epoch: 40, step: 1322, loss: 0.3492335379123688, mean loss: 0.34387708035008513
Epoch: 40, step: 1323, loss: 0.3532349467277527, mean loss: 0.34387723873249626
Epoch: 40, step: 1324, loss: 0.34991371631622314, mean loss: 0.34387734089848737
Epoch: 40, step: 1325, loss: 0.39184287190437317, mean loss: 0.3438781526902994
Epoch: 40, step: 1326, loss: 0.3244529664516449, mean loss: 0.34387782393463
Epoch: 40, step: 1327, loss: 0.35452625155448914, mean loss: 0.34387800414766173
Epoch: 40, step: 1328, loss: 0.3153975009918213, mean loss: 0.3438775221543439
Epoch: 40, step: 1329, loss: 0.35283178091049194, mean loss: 0.34387767369028494
Epoch: 40, step: 1330, loss: 0.32821792364120483, mean loss: 0.343877408679538
Epoch: 40, step: 1331, loss: 0.3546861708164215, mean loss: 0.3438775915936742
Epoch: 40, step: 1332, loss: 0.3348274230957031, mean loss: 0.34387743844239577
Epoch: 40, step: 1333, loss: 0.31545355916023254, mean loss: 0.3438769574480599
Epoch: 40, step: 1334, loss: 0.32509884238243103, mean loss: 0.34387663968657306
Epoch: 40, step: 1335, loss: 0.2825183570384979, mean loss: 0.3438756014050879
Epoch: 40, step: 1336, loss: 0.3095432221889496, mean loss: 0.34387502045547597
Epoch: 40, step: 1337, loss: 0.39081308245658875, mean loss: 0.3438758146966009
Epoch: 40, step: 1338, loss: 0.32817938923835754, mean loss: 0.3438755491011516
Epoch: 40, step: 1339, loss: 0.35559794306755066, mean loss: 0.34387574744961125
Epoch: 40, step: 1340, loss: 0.35022953152656555, mean loss: 0.343875854956829
Epoch: 40, step: 1341, loss: 0.3599748909473419, mean loss: 0.34387612735092715
Epoch: 40, step: 1342, loss: 0.2824803590774536, mean loss: 0.3438750885581709
Epoch: 40, step: 1343, loss: 0.3581492006778717, mean loss: 0.3438753300665649
Epoch: 40, step: 1344, loss: 0.33480554819107056, mean loss: 0.3438751766145409
Epoch: 40, step: 1345, loss: 0.3404202163219452, mean loss: 0.34387511816091026
Epoch: 40, step: 1346, loss: 0.35458898544311523, mean loss: 0.3438752994231513
Epoch: 40, step: 1347, loss: 0.32795754075050354, mean loss: 0.34387503012358656
Epoch: 40, step: 1348, loss: 0.33903050422668457, mean loss: 0.3438749481643943
Epoch: 40, step: 1349, loss: 0.33537524938583374, mean loss: 0.34387480436979473
Epoch: 40, step: 1350, loss: 0.34203091263771057, mean loss: 0.34387477317607895
Epoch: 40, step: 1351, loss: 0.3543107807636261, mean loss: 0.34387494972242466
Epoch: 40, step: 1352, loss: 0.3171386420726776, mean loss: 0.3438744974309211
Epoch: 40, step: 1353, loss: 0.3022514283657074, mean loss: 0.3438737933156681
Epoch: 40, step: 1354, loss: 0.3663034737110138, mean loss: 0.34387417274018633
Epoch: 40, step: 1355, loss: 0.3477162718772888, mean loss: 0.34387423773272874
Epoch: 40, step: 1356, loss: 0.33789706230163574, mean loss: 0.343874136625172
Epoch: 40, step: 1357, loss: 0.3023737072944641, mean loss: 0.34387343463205094
Epoch: 40, step: 1358, loss: 0.2896369397640228, mean loss: 0.34387251721979994
Epoch: 40, step: 1359, loss: 0.3333725333213806, mean loss: 0.34387233961520086
Epoch: 40, step: 1360, loss: 0.34704747796058655, mean loss: 0.3438723933209627
Epoch: 40, step: 1361, loss: 0.3442912995815277, mean loss: 0.34387240040641753
Epoch: 40, step: 1362, loss: 0.3615736663341522, mean loss: 0.3438726998037067
Epoch: 40, step: 1363, loss: 0.3201873004436493, mean loss: 0.3438722991982105
Epoch: 40, step: 1364, loss: 0.3264771103858948, mean loss: 0.3438720049878289
Epoch: 40, step: 1365, loss: 0.3197672367095947, mean loss: 0.34387159730308314
Epoch: 40, step: 1366, loss: 0.33334746956825256, mean loss: 0.34387141931117193
Epoch: 40, step: 1367, loss: 0.3071295917034149, mean loss: 0.3438707979164417
Epoch: 40, step: 1368, loss: 0.3645690381526947, mean loss: 0.3438711479687043
Epoch: 40, step: 1369, loss: 0.3631359934806824, mean loss: 0.34387147377363436
Epoch: 40, step: 1370, loss: 0.3374187648296356, mean loss: 0.3438713646479821
Epoch: 40, step: 1371, loss: 0.3329116702079773, mean loss: 0.3438711793051146
Epoch: 40, step: 1372, loss: 0.283486008644104, mean loss: 0.3438701581296177
Epoch: 40, step: 1373, loss: 0.3573356866836548, mean loss: 0.3438703858417385
Epoch: 40, step: 1374, loss: 0.34152838587760925, mean loss: 0.34387034623744384
Epoch: 40, step: 1375, loss: 0.3503554165363312, mean loss: 0.34387045590110554
Epoch: 40, step: 1376, loss: 0.3322652578353882, mean loss: 0.3438702596585152
Epoch: 40, step: 1377, loss: 0.34704160690307617, mean loss: 0.3438703132847326
Epoch: 40, step: 1378, loss: 0.30633121728897095, mean loss: 0.34386967852432077
Epoch: 40, step: 1379, loss: 0.3345834016799927, mean loss: 0.34386952150239236
Epoch: 40, step: 1380, loss: 0.35563039779663086, mean loss: 0.34386972036403307
Epoch: 40, step: 1381, loss: 0.32966163754463196, mean loss: 0.343869480127267
Epoch: 40, step: 1382, loss: 0.35639137029647827, mean loss: 0.3438696918495362
Epoch: 40, step: 1383, loss: 0.3262284994125366, mean loss: 0.34386939357426843
Epoch: 40, step: 1384, loss: 0.35675695538520813, mean loss: 0.34386961147200806
Epoch: 40, step: 1385, loss: 0.3409328758716583, mean loss: 0.3438695618196968
Epoch: 40, step: 1386, loss: 0.34505176544189453, mean loss: 0.34386958180724686
Epoch: 40, step: 1387, loss: 0.3018811047077179, mean loss: 0.3438688719188804
Epoch: 40, step: 1388, loss: 0.3137516379356384, mean loss: 0.34386836274317184
Epoch: 40, step: 1389, loss: 0.31602349877357483, mean loss: 0.343867891993147
Epoch: 40, step: 1390, loss: 0.32059767842292786, mean loss: 0.34386749858959387
Epoch: 40, step: 1391, loss: 0.3737148344516754, mean loss: 0.3438680031766892
Epoch: 40, step: 1392, loss: 0.35561344027519226, mean loss: 0.3438682017369837
Epoch: 40, step: 1393, loss: 0.3143240213394165, mean loss: 0.34386770229179997
Epoch: 40, step: 1394, loss: 0.3052813410758972, mean loss: 0.3438670499993274
Epoch: 40, step: 1395, loss: 0.40104955434799194, mean loss: 0.34386801663845695
Epoch: 40, step: 1396, loss: 0.3231119215488434, mean loss: 0.34386766577389166
Epoch: 40, step: 1397, loss: 0.33555305004119873, mean loss: 0.3438675252245875
Epoch: 40, step: 1398, loss: 0.31445416808128357, mean loss: 0.34386702803299973
Epoch: 40, step: 1399, loss: 0.33929380774497986, mean loss: 0.34386695073042556
Epoch: 40, step: 1400, loss: 0.326158344745636, mean loss: 0.34386665140137457
Epoch: 40, step: 1401, loss: 0.34184396266937256, mean loss: 0.34386661721238954
Epoch: 40, step: 1402, loss: 0.29689133167266846, mean loss: 0.34386582321469605
Epoch: 40, step: 1403, loss: 0.36732497811317444, mean loss: 0.34386621972532583
Epoch: 40, step: 1404, loss: 0.31823328137397766, mean loss: 0.34386578648036087
Epoch: 40, step: 1405, loss: 0.3146924078464508, mean loss: 0.3438652934036169
Epoch: 40, step: 1406, loss: 0.39665767550468445, mean loss: 0.343866185664203
Epoch: 40, step: 1407, loss: 0.33011019229888916, mean loss: 0.3438659531737797
Epoch: 40, step: 1408, loss: 0.35038626194000244, mean loss: 0.34386606337183556
Epoch: 40, step: 1409, loss: 0.31067588925361633, mean loss: 0.3438655024427479
Epoch: 40, step: 1410, loss: 0.33457285165786743, mean loss: 0.34386534539536345
Epoch: 40, step: 1411, loss: 0.33344459533691406, mean loss: 0.343865169285885
Epoch: 40, step: 1412, loss: 0.34709596633911133, mean loss: 0.3438652238850612
Epoch: 40, step: 1413, loss: 0.3277427554130554, mean loss: 0.34386495142640583
Epoch: 40, step: 1414, loss: 0.3258283734321594, mean loss: 0.34386464662576377
Epoch: 40, step: 1415, loss: 0.3109000027179718, mean loss: 0.3438640895647271
Epoch: 40, step: 1416, loss: 0.29677504301071167, mean loss: 0.34386329383249065
Epoch: 40, step: 1417, loss: 0.33164164423942566, mean loss: 0.34386308730895837
Epoch: 40, step: 1418, loss: 0.36191338300704956, mean loss: 0.3438633923207987
Epoch: 40, step: 1419, loss: 0.32245784997940063, mean loss: 0.3438630306184949
Epoch: 40, step: 1420, loss: 0.296962171792984, mean loss: 0.34386223811990874
Epoch: 40, step: 1421, loss: 0.2954099476337433, mean loss: 0.34386141942012693
Epoch: 40, step: 1422, loss: 0.35115811228752136, mean loss: 0.34386154271047836
Epoch: 40, step: 1423, loss: 0.3370698094367981, mean loss: 0.34386142795423896
Epoch: 40, step: 1424, loss: 0.27598440647125244, mean loss: 0.3438602810923401
Epoch: 40, step: 1425, loss: 0.338510125875473, mean loss: 0.34386019069671925
Epoch: 40, step: 1426, loss: 0.29840710759162903, mean loss: 0.34385942273951403
Epoch: 40, step: 1427, loss: 0.33091554045677185, mean loss: 0.3438592040485246
Epoch: 40, step: 1428, loss: 0.32820478081703186, mean loss: 0.3438589395665561
Epoch: 40, step: 1429, loss: 0.335265189409256, mean loss: 0.3438587943773323
Epoch: 40, step: 1430, loss: 0.34273260831832886, mean loss: 0.3438587753510266
Epoch: 40, step: 1431, loss: 0.32732829451560974, mean loss: 0.3438584960821924
Epoch: 40, step: 1432, loss: 0.3894645571708679, mean loss: 0.34385926654594806
Epoch: 40, step: 1433, loss: 0.3399450182914734, mean loss: 0.34385920042018775
Epoch: 40, step: 1434, loss: 0.3490491807460785, mean loss: 0.3438592880961794
Epoch: 40, step: 1435, loss: 0.32620227336883545, mean loss: 0.3438589898156414
Epoch: 40, step: 1436, loss: 0.32556846737861633, mean loss: 0.3438586808384561
Epoch: 40, step: 1437, loss: 0.3373650014400482, mean loss: 0.34385857114421986
Epoch: 40, step: 1438, loss: 0.34458231925964355, mean loss: 0.34385858336990127
Epoch: 40, step: 1439, loss: 0.2941809296607971, mean loss: 0.3438577442203454
Epoch: 40, step: 1440, loss: 0.3677963614463806, mean loss: 0.34385814858204916
Epoch: 40, step: 1441, loss: 0.3285536766052246, mean loss: 0.3438578900692966
Epoch: 40, step: 1442, loss: 0.31015121936798096, mean loss: 0.34385732072871084
Epoch: 40, step: 1443, loss: 0.3355677127838135, mean loss: 0.34385718071101024
Valid: 40, mean loss: 0.18521206577618918
Epoch: 41, step: 0, loss: 0.29681864380836487, mean loss: 0.3438563862082334
Epoch: 41, step: 1, loss: 0.3130645751953125, mean loss: 0.3438558661290013
Epoch: 41, step: 2, loss: 0.34885936975479126, mean loss: 0.34385595063765106
Epoch: 41, step: 3, loss: 0.35924312472343445, mean loss: 0.3438562105210129
Epoch: 41, step: 4, loss: 0.32644587755203247, mean loss: 0.34385591647225394
Epoch: 41, step: 5, loss: 0.32653337717056274, mean loss: 0.3438556239112119
Epoch: 41, step: 6, loss: 0.34532999992370605, mean loss: 0.3438556488115853
Epoch: 41, step: 7, loss: 0.3246326446533203, mean loss: 0.34385532416448406
Epoch: 41, step: 8, loss: 0.35610365867614746, mean loss: 0.3438555310166029
Epoch: 41, step: 9, loss: 0.30702924728393555, mean loss: 0.3438549090980746
Epoch: 41, step: 10, loss: 0.3245770037174225, mean loss: 0.3438545835402703
Epoch: 41, step: 11, loss: 0.2982686460018158, mean loss: 0.34385381371560236
Epoch: 41, step: 12, loss: 0.3508046567440033, mean loss: 0.3438539310947845
Epoch: 41, step: 13, loss: 0.29608461260795593, mean loss: 0.34385312442589183
Epoch: 41, step: 14, loss: 0.3117285370826721, mean loss: 0.34385258195493923
Epoch: 41, step: 15, loss: 0.3379119634628296, mean loss: 0.3438524816405439
Epoch: 41, step: 16, loss: 0.3575940728187561, mean loss: 0.3438527136797053
Epoch: 41, step: 17, loss: 0.3382415175437927, mean loss: 0.3438526189311974
Epoch: 41, step: 18, loss: 0.31651461124420166, mean loss: 0.34385215731986923
Epoch: 41, step: 19, loss: 0.3357487916946411, mean loss: 0.343852020494163
Epoch: 41, step: 20, loss: 0.34115758538246155, mean loss: 0.3438519749992688
Epoch: 41, step: 21, loss: 0.38400372862815857, mean loss: 0.34385265294060585
Epoch: 41, step: 22, loss: 0.33943507075309753, mean loss: 0.34385257835330296
Epoch: 41, step: 23, loss: 0.29505687952041626, mean loss: 0.34385175449129796
Epoch: 41, step: 24, loss: 0.3375190496444702, mean loss: 0.3438516475723082
Epoch: 41, step: 25, loss: 0.3399197459220886, mean loss: 0.3438515811886909
Epoch: 41, step: 26, loss: 0.31282228231430054, mean loss: 0.34385105731945226
Epoch: 41, step: 27, loss: 0.32854437828063965, mean loss: 0.3438507989003707
Epoch: 41, step: 28, loss: 0.2930196225643158, mean loss: 0.3438499407439995
Epoch: 41, step: 29, loss: 0.3388233780860901, mean loss: 0.34384985588458333
Epoch: 41, step: 30, loss: 0.3461804986000061, mean loss: 0.3438498952302863
Epoch: 41, step: 31, loss: 0.3327666223049164, mean loss: 0.3438497081266175
Epoch: 41, step: 32, loss: 0.3775865137577057, mean loss: 0.34385027764913945
Epoch: 41, step: 33, loss: 0.3432832956314087, mean loss: 0.3438502680778842
Epoch: 41, step: 34, loss: 0.35201549530029297, mean loss: 0.34385040591321603
Epoch: 41, step: 35, loss: 0.3265317678451538, mean loss: 0.34385011356618583
Epoch: 41, step: 36, loss: 0.3594880700111389, mean loss: 0.34385037753803716
Epoch: 41, step: 37, loss: 0.3164058029651642, mean loss: 0.34384991427591616
Epoch: 41, step: 38, loss: 0.30117151141166687, mean loss: 0.34384919388020924
Epoch: 41, step: 39, loss: 0.3718726933002472, mean loss: 0.34384966689856417
Epoch: 41, step: 40, loss: 0.2905183434486389, mean loss: 0.3438487667158745
Epoch: 41, step: 41, loss: 0.32395637035369873, mean loss: 0.34384843095655976
Epoch: 41, step: 42, loss: 0.30721646547317505, mean loss: 0.343847812664233
Epoch: 41, step: 43, loss: 0.3590848743915558, mean loss: 0.34384806983851274
Epoch: 41, step: 44, loss: 0.40757280588150024, mean loss: 0.3438491453796365
Epoch: 41, step: 45, loss: 0.33469563722610474, mean loss: 0.34384899089004745
Epoch: 41, step: 46, loss: 0.315340131521225, mean loss: 0.34384850973598474
Epoch: 41, step: 47, loss: 0.35468533635139465, mean loss: 0.34384869262983836
Epoch: 41, step: 48, loss: 0.3309932053089142, mean loss: 0.3438484756705735
Epoch: 41, step: 49, loss: 0.3413901627063751, mean loss: 0.34384843418286015
Epoch: 41, step: 50, loss: 0.3725636899471283, mean loss: 0.34384891878763213
Epoch: 41, step: 51, loss: 0.3196253180503845, mean loss: 0.34384850999188593
Epoch: 41, step: 52, loss: 0.3295064866542816, mean loss: 0.3438482679610147
Epoch: 41, step: 53, loss: 0.3707274794578552, mean loss: 0.34384872155734764
Epoch: 41, step: 54, loss: 0.36872562766075134, mean loss: 0.34384914135697475
Epoch: 41, step: 55, loss: 0.2912226915359497, mean loss: 0.3438482532967348
Epoch: 41, step: 56, loss: 0.352472186088562, mean loss: 0.3438483988213259
Epoch: 41, step: 57, loss: 0.3236873745918274, mean loss: 0.34384805861977635
Epoch: 41, step: 58, loss: 0.32123810052871704, mean loss: 0.34384767710081693
Epoch: 41, step: 59, loss: 0.31994888186454773, mean loss: 0.34384727384090813
Epoch: 41, step: 60, loss: 0.3579716682434082, mean loss: 0.34384751216697584
Epoch: 41, step: 61, loss: 0.37014374136924744, mean loss: 0.3438479558653729
Epoch: 41, step: 62, loss: 0.2997666001319885, mean loss: 0.34384721208965063
Epoch: 41, step: 63, loss: 0.3431326150894165, mean loss: 0.34384720003260466
Epoch: 41, step: 64, loss: 0.36792126297950745, mean loss: 0.3438476062156505
Epoch: 41, step: 65, loss: 0.3740720748901367, mean loss: 0.3438481161611318
Epoch: 41, step: 66, loss: 0.3467383086681366, mean loss: 0.3438481649234693
Epoch: 41, step: 67, loss: 0.30730873346328735, mean loss: 0.34384754845310456
Epoch: 41, step: 68, loss: 0.3326578438282013, mean loss: 0.343847359670613
Epoch: 41, step: 69, loss: 0.3281015455722809, mean loss: 0.34384709402607916
Epoch: 41, step: 70, loss: 0.303447425365448, mean loss: 0.3438464124627108
Epoch: 41, step: 71, loss: 0.33020296692848206, mean loss: 0.3438461822945899
Epoch: 41, step: 72, loss: 0.30503931641578674, mean loss: 0.34384552762472
Epoch: 41, step: 73, loss: 0.2874104976654053, mean loss: 0.3438445755846721
Epoch: 41, step: 74, loss: 0.36511605978012085, mean loss: 0.3438449344214304
Epoch: 41, step: 75, loss: 0.34999245405197144, mean loss: 0.34384503812452805
Epoch: 41, step: 76, loss: 0.3508698046207428, mean loss: 0.3438451566239882
Epoch: 41, step: 77, loss: 0.2754162847995758, mean loss: 0.34384400232973655
Epoch: 41, step: 78, loss: 0.30885541439056396, mean loss: 0.34384341213376235
Epoch: 41, step: 79, loss: 0.3298676908016205, mean loss: 0.3438431763918871
Epoch: 41, step: 80, loss: 0.31194010376930237, mean loss: 0.3438426382612871
Epoch: 41, step: 81, loss: 0.3333315849304199, mean loss: 0.34384246096726606
Epoch: 41, step: 82, loss: 0.3205825686454773, mean loss: 0.3438420686402412
Epoch: 41, step: 83, loss: 0.29804229736328125, mean loss: 0.3438412961437617
Epoch: 41, step: 84, loss: 0.3040509819984436, mean loss: 0.34384062501903123
Epoch: 41, step: 85, loss: 0.34530144929885864, mean loss: 0.34384064965765965
Epoch: 41, step: 86, loss: 0.30944937467575073, mean loss: 0.3438400696155794
Epoch: 41, step: 87, loss: 0.3471131920814514, mean loss: 0.3438401248190211
Epoch: 41, step: 88, loss: 0.3267274498939514, mean loss: 0.34383983620696024
Epoch: 41, step: 89, loss: 0.33958399295806885, mean loss: 0.3438397644316837
Epoch: 41, step: 90, loss: 0.35278210043907166, mean loss: 0.34383991524264595
Epoch: 41, step: 91, loss: 0.3466028869152069, mean loss: 0.34383996183890325
Epoch: 41, step: 92, loss: 0.3239441514015198, mean loss: 0.34383962631079157
Epoch: 41, step: 93, loss: 0.3248567283153534, mean loss: 0.343839306183671
Epoch: 41, step: 94, loss: 0.33725297451019287, mean loss: 0.3438391951138102
Epoch: 41, step: 95, loss: 0.3711564540863037, mean loss: 0.34383965577585024
Epoch: 41, step: 96, loss: 0.3275604248046875, mean loss: 0.34383938125719166
Epoch: 41, step: 97, loss: 0.333955317735672, mean loss: 0.3438392145838329
Epoch: 41, step: 98, loss: 0.31692999601364136, mean loss: 0.34383876082569975
Epoch: 41, step: 99, loss: 0.3194367289543152, mean loss: 0.3438383493520745
Epoch: 41, step: 100, loss: 0.31503087282180786, mean loss: 0.3438378636008473
Epoch: 41, step: 101, loss: 0.30907142162323, mean loss: 0.34383727737952097
Epoch: 41, step: 102, loss: 0.33274388313293457, mean loss: 0.34383709032918547
Epoch: 41, step: 103, loss: 0.32267242670059204, mean loss: 0.34383673346900423
Epoch: 41, step: 104, loss: 0.3224039375782013, mean loss: 0.3438363720939028
Epoch: 41, step: 105, loss: 0.3621253967285156, mean loss: 0.34383668045715743
Epoch: 41, step: 106, loss: 0.35220760107040405, mean loss: 0.3438368215932134
Epoch: 41, step: 107, loss: 0.29970109462738037, mean loss: 0.34383607746509487
Epoch: 41, step: 108, loss: 0.3591143488883972, mean loss: 0.3438363350523257
Epoch: 41, step: 109, loss: 0.3070238530635834, mean loss: 0.3438357144150059
Epoch: 41, step: 110, loss: 0.3612297773361206, mean loss: 0.34383600766398037
Epoch: 41, step: 111, loss: 0.3240847587585449, mean loss: 0.34383567468048676
Epoch: 41, step: 112, loss: 0.3033548593521118, mean loss: 0.3438349922316891
Epoch: 41, step: 113, loss: 0.3689887821674347, mean loss: 0.34383541628155484
Epoch: 41, step: 114, loss: 0.3166900873184204, mean loss: 0.3438349586654628
Epoch: 41, step: 115, loss: 0.35167771577835083, mean loss: 0.3438350908764728
Epoch: 41, step: 116, loss: 0.3352385461330414, mean loss: 0.3438349459607643
Epoch: 41, step: 117, loss: 0.30758488178253174, mean loss: 0.3438343348879047
Epoch: 41, step: 118, loss: 0.35449743270874023, mean loss: 0.34383451463434067
Epoch: 41, step: 119, loss: 0.2966236174106598, mean loss: 0.34383371881987734
Epoch: 41, step: 120, loss: 0.34208136796951294, mean loss: 0.34383368928172564
Epoch: 41, step: 121, loss: 0.4351542890071869, mean loss: 0.3438352285832077
Epoch: 41, step: 122, loss: 0.33431771397590637, mean loss: 0.34383506815853415
Epoch: 41, step: 123, loss: 0.32531774044036865, mean loss: 0.3438347560406856
Epoch: 41, step: 124, loss: 0.3480275869369507, mean loss: 0.3438348267115362
Epoch: 41, step: 125, loss: 0.31953442096710205, mean loss: 0.3438344171311259
Epoch: 41, step: 126, loss: 0.35463467240333557, mean loss: 0.34383459916505876
Epoch: 41, step: 127, loss: 0.3591000437736511, mean loss: 0.34383485645361483
Epoch: 41, step: 128, loss: 0.3271578848361969, mean loss: 0.3438345753794804
Epoch: 41, step: 129, loss: 0.364328533411026, mean loss: 0.3438349207793866
Epoch: 41, step: 130, loss: 0.33350232243537903, mean loss: 0.34383474663936225
Epoch: 41, step: 131, loss: 0.3125755488872528, mean loss: 0.34383421982262785
Epoch: 41, step: 132, loss: 0.32648321986198425, mean loss: 0.3438339274081148
Epoch: 41, step: 133, loss: 0.33377477526664734, mean loss: 0.343833757885176
Epoch: 41, step: 134, loss: 0.31526610255241394, mean loss: 0.34383327645381834
Epoch: 41, step: 135, loss: 0.3881533145904541, mean loss: 0.34383402333683377
Epoch: 41, step: 136, loss: 0.3330393135547638, mean loss: 0.34383384142702805
Epoch: 41, step: 137, loss: 0.36148226261138916, mean loss: 0.3438341388288882
Epoch: 41, step: 138, loss: 0.3478887975215912, mean loss: 0.3438342071547007
Epoch: 41, step: 139, loss: 0.3397083580493927, mean loss: 0.34383413763041676
Epoch: 41, step: 140, loss: 0.31465792655944824, mean loss: 0.34383364599319255
Epoch: 41, step: 141, loss: 0.3045291006565094, mean loss: 0.34383298369842397
Epoch: 41, step: 142, loss: 0.32996127009391785, mean loss: 0.3438327499593368
Epoch: 41, step: 143, loss: 0.3760187029838562, mean loss: 0.3438332922851612
Epoch: 41, step: 144, loss: 0.33188116550445557, mean loss: 0.34383309089799746
Epoch: 41, step: 145, loss: 0.34529244899749756, mean loss: 0.34383311548701345
Epoch: 41, step: 146, loss: 0.38262224197387695, mean loss: 0.3438337690417385
Epoch: 41, step: 147, loss: 0.33229541778564453, mean loss: 0.3438335746363056
Epoch: 41, step: 148, loss: 0.34139424562454224, mean loss: 0.34383353353764146
Epoch: 41, step: 149, loss: 0.3203597068786621, mean loss: 0.34383313804910387
Epoch: 41, step: 150, loss: 0.3584144115447998, mean loss: 0.3438333837111963
Epoch: 41, step: 151, loss: 0.34682074189186096, mean loss: 0.3438334340407027
Epoch: 41, step: 152, loss: 0.349259614944458, mean loss: 0.3438335254567262
Epoch: 41, step: 153, loss: 0.3206847310066223, mean loss: 0.34383313547063415
Epoch: 41, step: 154, loss: 0.32454028725624084, mean loss: 0.34383281045086944
Epoch: 41, step: 155, loss: 0.37027508020401, mean loss: 0.3438332559068963
Epoch: 41, step: 156, loss: 0.37634992599487305, mean loss: 0.3438338036852371
Epoch: 41, step: 157, loss: 0.3650171458721161, mean loss: 0.3438341605354474
Epoch: 41, step: 158, loss: 0.3282627761363983, mean loss: 0.34383389822753846
Epoch: 41, step: 159, loss: 0.35610121488571167, mean loss: 0.34383410487326077
Epoch: 41, step: 160, loss: 0.3549664616584778, mean loss: 0.34383429239716856
Epoch: 41, step: 161, loss: 0.3250083923339844, mean loss: 0.34383397528130993
Epoch: 41, step: 162, loss: 0.3204325735569, mean loss: 0.34383358109932793
Epoch: 41, step: 163, loss: 0.3190453350543976, mean loss: 0.3438331635638535
Epoch: 41, step: 164, loss: 0.37759968638420105, mean loss: 0.3438337323206596
Epoch: 41, step: 165, loss: 0.29739242792129517, mean loss: 0.3438329500854499
Epoch: 41, step: 166, loss: 0.3179284632205963, mean loss: 0.34383251376996143
Epoch: 41, step: 167, loss: 0.3201078176498413, mean loss: 0.343832114175942
Epoch: 41, step: 168, loss: 0.35463351011276245, mean loss: 0.34383229610031735
Epoch: 41, step: 169, loss: 0.31387636065483093, mean loss: 0.34383179157080196
Epoch: 41, step: 170, loss: 0.34506338834762573, mean loss: 0.34383181231348453
Epoch: 41, step: 171, loss: 0.3377188444137573, mean loss: 0.34383170935996965
Epoch: 41, step: 172, loss: 0.30629995465278625, mean loss: 0.3438310772674977
Epoch: 41, step: 173, loss: 0.3070790469646454, mean loss: 0.34383045831720793
Epoch: 41, step: 174, loss: 0.33406710624694824, mean loss: 0.34383029389288167
Epoch: 41, step: 175, loss: 0.2846381664276123, mean loss: 0.3438292970567842
Epoch: 41, step: 176, loss: 0.3360764682292938, mean loss: 0.3438291664960185
Epoch: 41, step: 177, loss: 0.38016214966773987, mean loss: 0.34382977834781153
Epoch: 41, step: 178, loss: 0.32620957493782043, mean loss: 0.34382948162647026
Epoch: 41, step: 179, loss: 0.35158464312553406, mean loss: 0.34382961221992137
Epoch: 41, step: 180, loss: 0.30423277616500854, mean loss: 0.3438289454381405
Epoch: 41, step: 181, loss: 0.33972352743148804, mean loss: 0.34382887630706577
Epoch: 41, step: 182, loss: 0.3246123194694519, mean loss: 0.3438285527251903
Epoch: 41, step: 183, loss: 0.3160257935523987, mean loss: 0.3438280845706949
Epoch: 41, step: 184, loss: 0.3581556975841522, mean loss: 0.34382832582097717
Epoch: 41, step: 185, loss: 0.31802937388420105, mean loss: 0.34382789142205583
Epoch: 41, step: 186, loss: 0.32010266184806824, mean loss: 0.34382749194689
Epoch: 41, step: 187, loss: 0.328644722700119, mean loss: 0.34382723631028494
Epoch: 41, step: 188, loss: 0.3478781580924988, mean loss: 0.343827304515659
Epoch: 41, step: 189, loss: 0.3463691174983978, mean loss: 0.34382734731144615
Epoch: 41, step: 190, loss: 0.3397010862827301, mean loss: 0.3438272778399245
Epoch: 41, step: 191, loss: 0.30387961864471436, mean loss: 0.3438266052751189
Epoch: 41, step: 192, loss: 0.3499423861503601, mean loss: 0.3438267082395931
Epoch: 41, step: 193, loss: 0.34477317333221436, mean loss: 0.3438267241738854
Epoch: 41, step: 194, loss: 0.37446433305740356, mean loss: 0.3438272399672301
Epoch: 41, step: 195, loss: 0.3145318925380707, mean loss: 0.34382674677956293
Epoch: 41, step: 196, loss: 0.32993799448013306, mean loss: 0.3438265129661204
Epoch: 41, step: 197, loss: 0.2910245358943939, mean loss: 0.3438256240738765
Epoch: 41, step: 198, loss: 0.3613196313381195, mean loss: 0.3438259185709097
Epoch: 41, step: 199, loss: 0.3825985789299011, mean loss: 0.3438265712653471
Epoch: 41, step: 200, loss: 0.3209969699382782, mean loss: 0.3438261869609733
Epoch: 41, step: 201, loss: 0.3274943232536316, mean loss: 0.34382591204154245
Epoch: 41, step: 202, loss: 0.30130934715270996, mean loss: 0.3438251963587965
Epoch: 41, step: 203, loss: 0.35229429602622986, mean loss: 0.3438253389170322
Epoch: 41, step: 204, loss: 0.3271026313304901, mean loss: 0.3438250574326176
Epoch: 41, step: 205, loss: 0.34734025597572327, mean loss: 0.3438251166010832
Epoch: 41, step: 206, loss: 0.32992076873779297, mean loss: 0.34382488256449295
Epoch: 41, step: 207, loss: 0.34635189175605774, mean loss: 0.34382492509814255
Epoch: 41, step: 208, loss: 0.32094135880470276, mean loss: 0.34382453993721324
Epoch: 41, step: 209, loss: 0.3772355616092682, mean loss: 0.3438251022797869
Epoch: 41, step: 210, loss: 0.3580595850944519, mean loss: 0.34382534185704544
Epoch: 41, step: 211, loss: 0.32210057973861694, mean loss: 0.3438249762187979
Epoch: 41, step: 212, loss: 0.32089564204216003, mean loss: 0.34382459031351525
Epoch: 41, step: 213, loss: 0.38730868697166443, mean loss: 0.34382532214724676
Epoch: 41, step: 214, loss: 0.3059285879135132, mean loss: 0.34382468435909425
Epoch: 41, step: 215, loss: 0.32562828063964844, mean loss: 0.34382437812544026
Epoch: 41, step: 216, loss: 0.3159870207309723, mean loss: 0.343823909648683
Epoch: 41, step: 217, loss: 0.3291070759296417, mean loss: 0.3438236619822679
Epoch: 41, step: 218, loss: 0.3303449749946594, mean loss: 0.3438234351561738
Epoch: 41, step: 219, loss: 0.32703638076782227, mean loss: 0.34382315265997043
Epoch: 41, step: 220, loss: 0.3842218220233917, mean loss: 0.34382383248612713
Epoch: 41, step: 221, loss: 0.3043486475944519, mean loss: 0.34382316821148484
Epoch: 41, step: 222, loss: 0.3300771713256836, mean loss: 0.3438229369025363
Epoch: 41, step: 223, loss: 0.3591063618659973, mean loss: 0.34382319407802536
Epoch: 41, step: 224, loss: 0.3099823594093323, mean loss: 0.34382262464501
Epoch: 41, step: 225, loss: 0.3417108356952667, mean loss: 0.343822589110954
Epoch: 41, step: 226, loss: 0.3281942903995514, mean loss: 0.34382232614551994
Epoch: 41, step: 227, loss: 0.3290819525718689, mean loss: 0.34382207812469656
Epoch: 41, step: 228, loss: 0.3179683983325958, mean loss: 0.3438216431192317
Epoch: 41, step: 229, loss: 0.31356310844421387, mean loss: 0.3438211340077017
Epoch: 41, step: 230, loss: 0.32250910997390747, mean loss: 0.34382077543070105
Epoch: 41, step: 231, loss: 0.2986859977245331, mean loss: 0.34382001604619156
Epoch: 41, step: 232, loss: 0.33805811405181885, mean loss: 0.3438199191048588
Epoch: 41, step: 233, loss: 0.3385588526725769, mean loss: 0.3438198305913417
Epoch: 41, step: 234, loss: 0.31098437309265137, mean loss: 0.3438192781685637
Epoch: 41, step: 235, loss: 0.33044031262397766, mean loss: 0.343819053085025
Epoch: 41, step: 236, loss: 0.33256542682647705, mean loss: 0.34381886376071585
Epoch: 41, step: 237, loss: 0.2993417978286743, mean loss: 0.34381811551762287
Epoch: 41, step: 238, loss: 0.32442596554756165, mean loss: 0.34381778928661216
Epoch: 41, step: 239, loss: 0.3466433584690094, mean loss: 0.3438178368199071
Epoch: 41, step: 240, loss: 0.3220996856689453, mean loss: 0.34381747147124614
Epoch: 41, step: 241, loss: 0.3179001808166504, mean loss: 0.3438170354908496
Epoch: 41, step: 242, loss: 0.31992363929748535, mean loss: 0.343816633563146
Epoch: 41, step: 243, loss: 0.33921146392822266, mean loss: 0.34381655609763606
Epoch: 41, step: 244, loss: 0.3278922736644745, mean loss: 0.34381628823303895
Epoch: 41, step: 245, loss: 0.41144874691963196, mean loss: 0.3438174258690135
Epoch: 41, step: 246, loss: 0.3285049498081207, mean loss: 0.3438171683043626
Epoch: 41, step: 247, loss: 0.3066762387752533, mean loss: 0.3438165435830828
Epoch: 41, step: 248, loss: 0.3171869218349457, mean loss: 0.34381609567260313
Epoch: 41, step: 249, loss: 0.3108549118041992, mean loss: 0.3438155412745161
Epoch: 41, step: 250, loss: 0.31295299530029297, mean loss: 0.3438150221836747
Epoch: 41, step: 251, loss: 0.31400734186172485, mean loss: 0.3438145208435186
Epoch: 41, step: 252, loss: 0.328142911195755, mean loss: 0.3438142572646356
Epoch: 41, step: 253, loss: 0.29493293166160583, mean loss: 0.3438134351494349
Epoch: 41, step: 254, loss: 0.3220484256744385, mean loss: 0.3438130690987197
Epoch: 41, step: 255, loss: 0.35878464579582214, mean loss: 0.3438133208911297
Epoch: 41, step: 256, loss: 0.31918463110923767, mean loss: 0.34381290669207853
Epoch: 41, step: 257, loss: 0.3029758334159851, mean loss: 0.34381221991609934
Epoch: 41, step: 258, loss: 0.3535473644733429, mean loss: 0.34381238363378186
Epoch: 41, step: 259, loss: 0.3617510199546814, mean loss: 0.3438126853059923
Epoch: 41, step: 260, loss: 0.32789191603660583, mean loss: 0.34381241757254793
Epoch: 41, step: 261, loss: 0.30467915534973145, mean loss: 0.3438117594946173
Epoch: 41, step: 262, loss: 0.3122219741344452, mean loss: 0.3438112282792313
Epoch: 41, step: 263, loss: 0.37869778275489807, mean loss: 0.34381181492338403
Epoch: 41, step: 264, loss: 0.321664959192276, mean loss: 0.34381144251329254
Epoch: 41, step: 265, loss: 0.3104349374771118, mean loss: 0.3438108812806536
Epoch: 41, step: 266, loss: 0.33011600375175476, mean loss: 0.34381065100240826
Epoch: 41, step: 267, loss: 0.3392362892627716, mean loss: 0.34381057408618315
Epoch: 41, step: 268, loss: 0.3185402750968933, mean loss: 0.34381014918246233
Epoch: 41, step: 269, loss: 0.3545602262020111, mean loss: 0.34381032993501
Epoch: 41, step: 270, loss: 0.29347091913223267, mean loss: 0.34380948353886365
Epoch: 41, step: 271, loss: 0.3047850430011749, mean loss: 0.3438088274012529
Epoch: 41, step: 272, loss: 0.36015933752059937, mean loss: 0.34380910230600803
Epoch: 41, step: 273, loss: 0.3399195671081543, mean loss: 0.34380903691148906
Epoch: 41, step: 274, loss: 0.3226691782474518, mean loss: 0.34380868149430543
Epoch: 41, step: 275, loss: 0.3295136094093323, mean loss: 0.34380844116020853
Epoch: 41, step: 276, loss: 0.3643887937068939, mean loss: 0.3438087871589736
Epoch: 41, step: 277, loss: 0.32739126682281494, mean loss: 0.34380851115076383
Epoch: 41, step: 278, loss: 0.3170459270477295, mean loss: 0.3438080612308858
Epoch: 41, step: 279, loss: 0.3073129653930664, mean loss: 0.34380744770294824
Epoch: 41, step: 280, loss: 0.34001705050468445, mean loss: 0.34380738398272975
Epoch: 41, step: 281, loss: 0.3751067817211151, mean loss: 0.3438079101468312
Epoch: 41, step: 282, loss: 0.3695935010910034, mean loss: 0.3438083436128144
Epoch: 41, step: 283, loss: 0.36100447177886963, mean loss: 0.34380863268167144
Epoch: 41, step: 284, loss: 0.3318425416946411, mean loss: 0.34380843153371154
Epoch: 41, step: 285, loss: 0.3242402672767639, mean loss: 0.3438081026017187
Epoch: 41, step: 286, loss: 0.3365199565887451, mean loss: 0.343807980093339
Epoch: 41, step: 287, loss: 0.3245454430580139, mean loss: 0.34380765630968685
Epoch: 41, step: 288, loss: 0.3259434998035431, mean loss: 0.3438073560364361
Epoch: 41, step: 289, loss: 0.31289058923721313, mean loss: 0.34380683637450715
Epoch: 41, step: 290, loss: 0.3406161665916443, mean loss: 0.34380678274529825
Epoch: 41, step: 291, loss: 0.35429155826568604, mean loss: 0.34380695897186003
Epoch: 41, step: 292, loss: 0.34460771083831787, mean loss: 0.3438069724305532
Epoch: 41, step: 293, loss: 0.31705242395401, mean loss: 0.3438065227591613
Epoch: 41, step: 294, loss: 0.34060320258140564, mean loss: 0.3438064689209425
Epoch: 41, step: 295, loss: 0.3459048569202423, mean loss: 0.3438065041879677
Epoch: 41, step: 296, loss: 0.3302341401576996, mean loss: 0.3438062760848429
Epoch: 41, step: 297, loss: 0.3239147961139679, mean loss: 0.34380594178549206
Epoch: 41, step: 298, loss: 0.2982203960418701, mean loss: 0.3438051756804933
Epoch: 41, step: 299, loss: 0.3450251519680023, mean loss: 0.3438051961829181
Epoch: 41, step: 300, loss: 0.3090781569480896, mean loss: 0.3438046125842418
Epoch: 41, step: 301, loss: 0.29644790291786194, mean loss: 0.3438038167534068
Epoch: 41, step: 302, loss: 0.3195889890193939, mean loss: 0.34380340982938556
Epoch: 41, step: 303, loss: 0.3108724057674408, mean loss: 0.3438028564415375
Epoch: 41, step: 304, loss: 0.3599705994129181, mean loss: 0.3438031281272148
Epoch: 41, step: 305, loss: 0.31774142384529114, mean loss: 0.3438026901889812
Epoch: 41, step: 306, loss: 0.3182888925075531, mean loss: 0.3438022614649187
Epoch: 41, step: 307, loss: 0.3215334117412567, mean loss: 0.3438018872740039
Epoch: 41, step: 308, loss: 0.34135860204696655, mean loss: 0.34380184621935655
Epoch: 41, step: 309, loss: 0.38907015323638916, mean loss: 0.34380260685226677
Epoch: 41, step: 310, loss: 0.37303677201271057, mean loss: 0.34380309805894005
Epoch: 41, step: 311, loss: 0.3252432644367218, mean loss: 0.343802786212821
Epoch: 41, step: 312, loss: 0.3055954873561859, mean loss: 0.3438021442567604
Epoch: 41, step: 313, loss: 0.31438329815864563, mean loss: 0.34380164997190377
Epoch: 41, step: 314, loss: 0.3677234351634979, mean loss: 0.34380205189037
Epoch: 41, step: 315, loss: 0.31187477707862854, mean loss: 0.3438015154778228
Epoch: 41, step: 316, loss: 0.35716015100479126, mean loss: 0.343801739913493
Epoch: 41, step: 317, loss: 0.3347243070602417, mean loss: 0.3438015874079849
Epoch: 41, step: 318, loss: 0.3246261477470398, mean loss: 0.3438012652562173
Epoch: 41, step: 319, loss: 0.33106309175491333, mean loss: 0.3438010512555873
Epoch: 41, step: 320, loss: 0.3544275164604187, mean loss: 0.3438012297766323
Epoch: 41, step: 321, loss: 0.3711738884449005, mean loss: 0.34380168962037566
Epoch: 41, step: 322, loss: 0.31958261132240295, mean loss: 0.3438012827616679
Epoch: 41, step: 323, loss: 0.31953829526901245, mean loss: 0.3438008751721723
Epoch: 41, step: 324, loss: 0.38412511348724365, mean loss: 0.34380155256030775
Epoch: 41, step: 325, loss: 0.34158292412757874, mean loss: 0.34380151529122605
Epoch: 41, step: 326, loss: 0.34536802768707275, mean loss: 0.34380154160545556
Epoch: 41, step: 327, loss: 0.3255693316459656, mean loss: 0.3438012353464695
Epoch: 41, step: 328, loss: 0.409260094165802, mean loss: 0.34380233488552886
Epoch: 41, step: 329, loss: 0.31031352281570435, mean loss: 0.34380177236978876
Epoch: 41, step: 330, loss: 0.3293650150299072, mean loss: 0.34380152987785395
Epoch: 41, step: 331, loss: 0.3250632882118225, mean loss: 0.3438012151398523
Epoch: 41, step: 332, loss: 0.32303404808044434, mean loss: 0.34380086632874224
Epoch: 41, step: 333, loss: 0.3144204020500183, mean loss: 0.3438003728545866
Epoch: 41, step: 334, loss: 0.3049458861351013, mean loss: 0.3437997202657504
Epoch: 41, step: 335, loss: 0.3629934787750244, mean loss: 0.3438000426332094
Epoch: 41, step: 336, loss: 0.3431462347507477, mean loss: 0.34380003165240824
Epoch: 41, step: 337, loss: 0.34061065316200256, mean loss: 0.3437999780872191
Epoch: 41, step: 338, loss: 0.29789894819259644, mean loss: 0.3437992071984514
Epoch: 41, step: 339, loss: 0.3218495547771454, mean loss: 0.34379883856932975
Epoch: 41, step: 340, loss: 0.3685663342475891, mean loss: 0.3437992545151804
Epoch: 41, step: 341, loss: 0.3370940387248993, mean loss: 0.3437991419095345
Epoch: 41, step: 342, loss: 0.3435085713863373, mean loss: 0.3437991370298508
Epoch: 41, step: 343, loss: 0.31476891040802, mean loss: 0.34379864952016753
Epoch: 41, step: 344, loss: 0.39343443512916565, mean loss: 0.3437994830486165
Epoch: 41, step: 345, loss: 0.33406397700309753, mean loss: 0.3437993195640482
Epoch: 41, step: 346, loss: 0.3294437825679779, mean loss: 0.3437990785011442
Epoch: 41, step: 347, loss: 0.39681529998779297, mean loss: 0.3437999687520424
Epoch: 41, step: 348, loss: 0.31871816515922546, mean loss: 0.3437995475842827
Epoch: 41, step: 349, loss: 0.32042792439460754, mean loss: 0.3437991551400608
Epoch: 41, step: 350, loss: 0.3559911251068115, mean loss: 0.3437993598578841
Epoch: 41, step: 351, loss: 0.33125603199005127, mean loss: 0.343799149243876
Epoch: 41, step: 352, loss: 0.3427756428718567, mean loss: 0.3437991320585515
Epoch: 41, step: 353, loss: 0.3460260033607483, mean loss: 0.3437991694485126
Epoch: 41, step: 354, loss: 0.3039303123950958, mean loss: 0.343798500047464
Epoch: 41, step: 355, loss: 0.38741448521614075, mean loss: 0.3437992323507744
Epoch: 41, step: 356, loss: 0.3362496793270111, mean loss: 0.34379910559747906
Epoch: 41, step: 357, loss: 0.3586004376411438, mean loss: 0.3437993541004179
Epoch: 41, step: 358, loss: 0.30132028460502625, mean loss: 0.3437986409216073
Epoch: 41, step: 359, loss: 0.33893635869026184, mean loss: 0.3437985592903832
Epoch: 41, step: 360, loss: 0.33775654435157776, mean loss: 0.34379845785472574
Epoch: 41, step: 361, loss: 0.3480362892150879, mean loss: 0.3437985289998649
Epoch: 41, step: 362, loss: 0.3133038878440857, mean loss: 0.34379801706135604
Epoch: 41, step: 363, loss: 0.32905134558677673, mean loss: 0.34379776950106405
Epoch: 41, step: 364, loss: 0.3300623297691345, mean loss: 0.34379753892073317
Epoch: 41, step: 365, loss: 0.3142683804035187, mean loss: 0.34379704321553733
Epoch: 41, step: 366, loss: 0.3291838467121124, mean loss: 0.34379679790831563
Epoch: 41, step: 367, loss: 0.34704679250717163, mean loss: 0.34379685246405656
Epoch: 41, step: 368, loss: 0.30258792638778687, mean loss: 0.34379616072575103
Epoch: 41, step: 369, loss: 0.3246988356113434, mean loss: 0.3437958401609893
Epoch: 41, step: 370, loss: 0.321982741355896, mean loss: 0.34379547401581423
Epoch: 41, step: 371, loss: 0.3181564211845398, mean loss: 0.3437950436570652
Epoch: 41, step: 372, loss: 0.3345816135406494, mean loss: 0.3437948890096322
Epoch: 41, step: 373, loss: 0.392709881067276, mean loss: 0.34379571003403814
Epoch: 41, step: 374, loss: 0.3688187003135681, mean loss: 0.3437961300308538
Epoch: 41, step: 375, loss: 0.34914886951446533, mean loss: 0.34379621987206704
Epoch: 41, step: 376, loss: 0.3189411759376526, mean loss: 0.34379580270814003
Epoch: 41, step: 377, loss: 0.33708345890045166, mean loss: 0.3437956900508978
Epoch: 41, step: 378, loss: 0.34940293431282043, mean loss: 0.34379578415902023
Epoch: 41, step: 379, loss: 0.33015871047973633, mean loss: 0.3437955552876172
Epoch: 41, step: 380, loss: 0.31802523136138916, mean loss: 0.34379512279078195
Epoch: 41, step: 381, loss: 0.3730504810810089, mean loss: 0.3437956137678284
Epoch: 41, step: 382, loss: 0.3243853747844696, mean loss: 0.3437952880216257
Epoch: 41, step: 383, loss: 0.35655829310417175, mean loss: 0.34379550220913124
Epoch: 41, step: 384, loss: 0.3233700096607208, mean loss: 0.34379515943626127
Epoch: 41, step: 385, loss: 0.30484235286712646, mean loss: 0.34379450575600334
Epoch: 41, step: 386, loss: 0.35318976640701294, mean loss: 0.34379466341841297
Epoch: 41, step: 387, loss: 0.35578086972236633, mean loss: 0.34379486455625535
Epoch: 41, step: 388, loss: 0.3071623146533966, mean loss: 0.34379424984395857
Epoch: 41, step: 389, loss: 0.3526385426521301, mean loss: 0.34379439825307373
Epoch: 41, step: 390, loss: 0.3103429079055786, mean loss: 0.3437938369393671
Epoch: 41, step: 391, loss: 0.3296903371810913, mean loss: 0.34379360028758243
Epoch: 41, step: 392, loss: 0.29766666889190674, mean loss: 0.34379282630682173
Epoch: 41, step: 393, loss: 0.305627703666687, mean loss: 0.3437921859309259
Epoch: 41, step: 394, loss: 0.3220488429069519, mean loss: 0.343791821103613
Epoch: 41, step: 395, loss: 0.2803618311882019, mean loss: 0.34379075684203725
Epoch: 41, step: 396, loss: 0.31904420256614685, mean loss: 0.34379034163836153
Epoch: 41, step: 397, loss: 0.3191518783569336, mean loss: 0.34378992825519855
Epoch: 41, step: 398, loss: 0.3461546301841736, mean loss: 0.3437899679294084
Epoch: 41, step: 399, loss: 0.3681796193122864, mean loss: 0.3437903771242843
Epoch: 41, step: 400, loss: 0.3022877275943756, mean loss: 0.3437896808295182
Epoch: 41, step: 401, loss: 0.32985010743141174, mean loss: 0.34378944696760166
Epoch: 41, step: 402, loss: 0.3218238055706024, mean loss: 0.3437890784598526
Epoch: 41, step: 403, loss: 0.36962854862213135, mean loss: 0.34378951194982316
Epoch: 41, step: 404, loss: 0.3329092860221863, mean loss: 0.34378932942325957
Epoch: 41, step: 405, loss: 0.32054173946380615, mean loss: 0.3437889394284607
Epoch: 41, step: 406, loss: 0.3386463522911072, mean loss: 0.3437888531593638
Epoch: 41, step: 407, loss: 0.32120054960250854, mean loss: 0.34378847423727504
Epoch: 41, step: 408, loss: 0.35996213555336, mean loss: 0.3437887455482528
Epoch: 41, step: 409, loss: 0.31567615270614624, mean loss: 0.3437882739712265
Epoch: 41, step: 410, loss: 0.3591993451118469, mean loss: 0.3437885324811844
Epoch: 41, step: 411, loss: 0.30201852321624756, mean loss: 0.343787831830197
Epoch: 41, step: 412, loss: 0.3395310640335083, mean loss: 0.34378776042828485
Epoch: 41, step: 413, loss: 0.3586425185203552, mean loss: 0.34378800959394107
Epoch: 41, step: 414, loss: 0.34609365463256836, mean loss: 0.3437880482669319
Epoch: 41, step: 415, loss: 0.33309704065322876, mean loss: 0.34378786894778374
Epoch: 41, step: 416, loss: 0.32599329948425293, mean loss: 0.34378757048634456
Epoch: 41, step: 417, loss: 0.314191609621048, mean loss: 0.3437870740930524
Epoch: 41, step: 418, loss: 0.33418798446655273, mean loss: 0.3437869130966311
Epoch: 41, step: 419, loss: 0.3223661184310913, mean loss: 0.34378655383199497
Epoch: 41, step: 420, loss: 0.3160736560821533, mean loss: 0.3437860890454499
Epoch: 41, step: 421, loss: 0.38144394755363464, mean loss: 0.3437867206131973
Epoch: 41, step: 422, loss: 0.3687194883823395, mean loss: 0.3437871387587986
Epoch: 41, step: 423, loss: 0.344606876373291, mean loss: 0.34378715250632685
Epoch: 41, step: 424, loss: 0.3460434377193451, mean loss: 0.34378719034504984
Epoch: 41, step: 425, loss: 0.35734084248542786, mean loss: 0.34378741764091
Epoch: 41, step: 426, loss: 0.33102700114250183, mean loss: 0.34378720365126536
Epoch: 41, step: 427, loss: 0.31398749351501465, mean loss: 0.34378670392443855
Epoch: 41, step: 428, loss: 0.35600408911705017, mean loss: 0.3437869088006848
Epoch: 41, step: 429, loss: 0.31930145621299744, mean loss: 0.3437864982051757
Epoch: 41, step: 430, loss: 0.34196174144744873, mean loss: 0.3437864676064207
Epoch: 41, step: 431, loss: 0.30666935443878174, mean loss: 0.34378584521200845
Epoch: 41, step: 432, loss: 0.37787845730781555, mean loss: 0.34378641688080624
Epoch: 41, step: 433, loss: 0.3794528543949127, mean loss: 0.3437870149296596
Epoch: 41, step: 434, loss: 0.33085817098617554, mean loss: 0.3437867981446038
Epoch: 41, step: 435, loss: 0.37949466705322266, mean loss: 0.3437873968680932
Epoch: 41, step: 436, loss: 0.2995706796646118, mean loss: 0.3437866554868755
Epoch: 41, step: 437, loss: 0.31855374574661255, mean loss: 0.34378623241404527
Epoch: 41, step: 438, loss: 0.3444003760814667, mean loss: 0.3437862427110402
Epoch: 41, step: 439, loss: 0.3185086250305176, mean loss: 0.34378581890281673
Epoch: 41, step: 440, loss: 0.32409241795539856, mean loss: 0.34378548872592096
Epoch: 41, step: 441, loss: 0.32274168729782104, mean loss: 0.34378513591430865
Epoch: 41, step: 442, loss: 0.36397671699523926, mean loss: 0.34378547443227403
Epoch: 41, step: 443, loss: 0.33215436339378357, mean loss: 0.3437852794364479
Epoch: 41, step: 444, loss: 0.3343099057674408, mean loss: 0.34378512058426813
Epoch: 41, step: 445, loss: 0.36224067211151123, mean loss: 0.34378542998161143
Epoch: 41, step: 446, loss: 0.30751481652259827, mean loss: 0.3437848219345802
Epoch: 41, step: 447, loss: 0.3398537039756775, mean loss: 0.3437847560337226
Epoch: 41, step: 448, loss: 0.29774153232574463, mean loss: 0.3437839841827896
Epoch: 41, step: 449, loss: 0.3612433075904846, mean loss: 0.3437842768592808
Epoch: 41, step: 450, loss: 0.33428868651390076, mean loss: 0.34378411768418493
Epoch: 41, step: 451, loss: 0.42338821291923523, mean loss: 0.3437854520695818
Epoch: 41, step: 452, loss: 0.3474651277065277, mean loss: 0.3437855137501161
Epoch: 41, step: 453, loss: 0.33441489934921265, mean loss: 0.3437853566778978
Epoch: 41, step: 454, loss: 0.3303774893283844, mean loss: 0.3437851319361597
Epoch: 41, step: 455, loss: 0.32090288400650024, mean loss: 0.3437847483919437
Epoch: 41, step: 456, loss: 0.3368081748485565, mean loss: 0.34378463145502436
Epoch: 41, step: 457, loss: 0.31948181986808777, mean loss: 0.34378422411347387
Epoch: 41, step: 458, loss: 0.3446156978607178, mean loss: 0.3437842380496445
Epoch: 41, step: 459, loss: 0.3503522574901581, mean loss: 0.3437843481331025
Epoch: 41, step: 460, loss: 0.33629104495048523, mean loss: 0.34378422254350754
Epoch: 41, step: 461, loss: 0.32621726393699646, mean loss: 0.34378392812191727
Epoch: 41, step: 462, loss: 0.29546675086021423, mean loss: 0.3437831183413474
Epoch: 41, step: 463, loss: 0.34718456864356995, mean loss: 0.3437831753476205
Epoch: 41, step: 464, loss: 0.40584978461265564, mean loss: 0.34378421552944466
Epoch: 41, step: 465, loss: 0.35484257340431213, mean loss: 0.34378440085469814
Epoch: 41, step: 466, loss: 0.32951819896698, mean loss: 0.3437841617737059
Epoch: 41, step: 467, loss: 0.3658907413482666, mean loss: 0.34378453224192507
Epoch: 41, step: 468, loss: 0.34775254130363464, mean loss: 0.34378459873781203
Epoch: 41, step: 469, loss: 0.3409639596939087, mean loss: 0.34378455147034137
Epoch: 41, step: 470, loss: 0.33307984471321106, mean loss: 0.34378437208690177
Epoch: 41, step: 471, loss: 0.3141863942146301, mean loss: 0.34378387610898986
Epoch: 41, step: 472, loss: 0.31849536299705505, mean loss: 0.34378345235254915
Epoch: 41, step: 473, loss: 0.3634513318538666, mean loss: 0.34378378191921527
Epoch: 41, step: 474, loss: 0.35832348465919495, mean loss: 0.34378402555102444
Epoch: 41, step: 475, loss: 0.32603925466537476, mean loss: 0.3437837282190726
Epoch: 41, step: 476, loss: 0.3467962443828583, mean loss: 0.3437837786960446
Epoch: 41, step: 477, loss: 0.38715019822120667, mean loss: 0.3437845053208146
Epoch: 41, step: 478, loss: 0.3556930124759674, mean loss: 0.34378470485011364
Epoch: 41, step: 479, loss: 0.3298635482788086, mean loss: 0.3437844716023995
Epoch: 41, step: 480, loss: 0.32371634244918823, mean loss: 0.3437841353683515
Epoch: 41, step: 481, loss: 0.3301290273666382, mean loss: 0.34378390658592345
Epoch: 41, step: 482, loss: 0.3375667333602905, mean loss: 0.34378380242298634
Epoch: 41, step: 483, loss: 0.32903727889060974, mean loss: 0.3437835553628816
Epoch: 41, step: 484, loss: 0.33215412497520447, mean loss: 0.34378336052915365
Epoch: 41, step: 485, loss: 0.32811781764030457, mean loss: 0.34378309808078894
Epoch: 41, step: 486, loss: 0.3229961693286896, mean loss: 0.34378274983852875
Epoch: 41, step: 487, loss: 0.3348085880279541, mean loss: 0.3437825994974142
Epoch: 41, step: 488, loss: 0.3195626139640808, mean loss: 0.3437821937549396
Epoch: 41, step: 489, loss: 0.32620251178741455, mean loss: 0.3437818992583073
Epoch: 41, step: 490, loss: 0.3242337703704834, mean loss: 0.34378157179153646
Epoch: 41, step: 491, loss: 0.3998883068561554, mean loss: 0.34378251166581725
Epoch: 41, step: 492, loss: 0.32215484976768494, mean loss: 0.34378214937521806
Epoch: 41, step: 493, loss: 0.38322803378105164, mean loss: 0.34378281013243617
Epoch: 41, step: 494, loss: 0.34976619482040405, mean loss: 0.3437829103583141
Epoch: 41, step: 495, loss: 0.4065488278865814, mean loss: 0.34378396171371656
Epoch: 41, step: 496, loss: 0.394715815782547, mean loss: 0.3437848148293104
Epoch: 41, step: 497, loss: 0.3632139265537262, mean loss: 0.34378514026416557
Epoch: 41, step: 498, loss: 0.32613563537597656, mean loss: 0.34378484464242315
Epoch: 41, step: 499, loss: 0.3501046895980835, mean loss: 0.3437849504953803
Epoch: 41, step: 500, loss: 0.3138369023799896, mean loss: 0.3437844488950434
Epoch: 41, step: 501, loss: 0.29318392276763916, mean loss: 0.34378360140021663
Epoch: 41, step: 502, loss: 0.32786133885383606, mean loss: 0.3437833347269196
Epoch: 41, step: 503, loss: 0.3127300441265106, mean loss: 0.34378281464099136
Epoch: 41, step: 504, loss: 0.3156615197658539, mean loss: 0.343782343668527
Epoch: 41, step: 505, loss: 0.35589513182640076, mean loss: 0.34378254652882106
Epoch: 41, step: 506, loss: 0.30696433782577515, mean loss: 0.34378192992201995
Epoch: 41, step: 507, loss: 0.29330646991729736, mean loss: 0.3437810846068403
Epoch: 41, step: 508, loss: 0.29169052839279175, mean loss: 0.34378021225816896
Epoch: 41, step: 509, loss: 0.3336590528488159, mean loss: 0.34378004276425783
Epoch: 41, step: 510, loss: 0.3022891581058502, mean loss: 0.3437793479491417
Epoch: 41, step: 511, loss: 0.3475218415260315, mean loss: 0.34377941062067996
Epoch: 41, step: 512, loss: 0.3931257426738739, mean loss: 0.34378023695710097
Epoch: 41, step: 513, loss: 0.3403572738170624, mean loss: 0.34378017963831703
Epoch: 41, step: 514, loss: 0.33327069878578186, mean loss: 0.34378000365611955
Epoch: 41, step: 515, loss: 0.3025246262550354, mean loss: 0.34377931284270025
Epoch: 41, step: 516, loss: 0.2930876910686493, mean loss: 0.3437784640353833
Epoch: 41, step: 517, loss: 0.32992562651634216, mean loss: 0.34377823208003155
Epoch: 41, step: 518, loss: 0.32299789786338806, mean loss: 0.3437778841347807
Epoch: 41, step: 519, loss: 0.32306286692619324, mean loss: 0.34377753728900334
Epoch: 41, step: 520, loss: 0.3759390711784363, mean loss: 0.3437780757826641
Epoch: 41, step: 521, loss: 0.3227815628051758, mean loss: 0.3437777242353819
Epoch: 41, step: 522, loss: 0.2988045811653137, mean loss: 0.3437769712569455
Epoch: 41, step: 523, loss: 0.32326146960258484, mean loss: 0.3437766277747989
Epoch: 41, step: 524, loss: 0.3253161609172821, mean loss: 0.34377631870438324
Epoch: 41, step: 525, loss: 0.37656813859939575, mean loss: 0.3437768677052186
Epoch: 41, step: 526, loss: 0.3112049698829651, mean loss: 0.3437763223954494
Epoch: 41, step: 527, loss: 0.31934934854507446, mean loss: 0.3437759134526072
Epoch: 41, step: 528, loss: 0.32193228602409363, mean loss: 0.3437755477648395
Epoch: 41, step: 529, loss: 0.3147635757923126, mean loss: 0.343775062078765
Epoch: 41, step: 530, loss: 0.38478168845176697, mean loss: 0.3437757485544723
Epoch: 41, step: 531, loss: 0.37497612833976746, mean loss: 0.3437762708589417
Epoch: 41, step: 532, loss: 0.36703240871429443, mean loss: 0.34377666016770936
Epoch: 41, step: 533, loss: 0.3116917014122009, mean loss: 0.3437761230730836
Epoch: 41, step: 534, loss: 0.3196413516998291, mean loss: 0.34377571906947835
Epoch: 41, step: 535, loss: 0.3749949336051941, mean loss: 0.34377624165425463
Epoch: 41, step: 536, loss: 0.3435240089893341, mean loss: 0.34377623743215147
Epoch: 41, step: 537, loss: 0.31098809838294983, mean loss: 0.34377568860320284
Epoch: 41, step: 538, loss: 0.3398304879665375, mean loss: 0.34377562256700384
Epoch: 41, step: 539, loss: 0.32364144921302795, mean loss: 0.34377528555954945
Epoch: 41, step: 540, loss: 0.3362114727497101, mean loss: 0.3437751589579458
Epoch: 41, step: 541, loss: 0.3691083490848541, mean loss: 0.3437755829727774
Epoch: 41, step: 542, loss: 0.3124193847179413, mean loss: 0.34377505815649784
Epoch: 41, step: 543, loss: 0.31201979517936707, mean loss: 0.34377452666987107
Epoch: 41, step: 544, loss: 0.30691245198249817, mean loss: 0.3437739097210571
Epoch: 41, step: 545, loss: 0.34855780005455017, mean loss: 0.3437739897861673
Epoch: 41, step: 546, loss: 0.33724597096443176, mean loss: 0.34377388053245067
Epoch: 41, step: 547, loss: 0.37258848547935486, mean loss: 0.34377436276911133
Epoch: 41, step: 548, loss: 0.3504129946231842, mean loss: 0.3437744738703423
Epoch: 41, step: 549, loss: 0.32635390758514404, mean loss: 0.3437741823322648
Epoch: 41, step: 550, loss: 0.37042248249053955, mean loss: 0.3437746282916014
Epoch: 41, step: 551, loss: 0.3485935628414154, mean loss: 0.34377470893512757
Epoch: 41, step: 552, loss: 0.3065967559814453, mean loss: 0.34377408678286164
Epoch: 41, step: 553, loss: 0.32327908277511597, mean loss: 0.3437737438161625
Epoch: 41, step: 554, loss: 0.37482550740242004, mean loss: 0.34377426343268197
Epoch: 41, step: 555, loss: 0.34649839997291565, mean loss: 0.3437743090172961
Epoch: 41, step: 556, loss: 0.324807733297348, mean loss: 0.34377399164349515
Epoch: 41, step: 557, loss: 0.32497015595436096, mean loss: 0.34377367699814043
Epoch: 41, step: 558, loss: 0.31132617592811584, mean loss: 0.3437731340618576
Epoch: 41, step: 559, loss: 0.3103007972240448, mean loss: 0.34377257398661437
Epoch: 41, step: 560, loss: 0.39302554726600647, mean loss: 0.3437733980972691
Epoch: 41, step: 561, loss: 0.30746421217918396, mean loss: 0.34377279057483295
Epoch: 41, step: 562, loss: 0.38064056634902954, mean loss: 0.3437734074332293
Epoch: 41, step: 563, loss: 0.3513512909412384, mean loss: 0.3437735342215359
Epoch: 41, step: 564, loss: 0.3453887403011322, mean loss: 0.34377356124568015
Epoch: 41, step: 565, loss: 0.36956700682640076, mean loss: 0.3437739927906957
Epoch: 41, step: 566, loss: 0.33744698762893677, mean loss: 0.3437738869365999
Epoch: 41, step: 567, loss: 0.31051599979400635, mean loss: 0.3437733305241134
Epoch: 41, step: 568, loss: 0.3460725247859955, mean loss: 0.3437733689895453
Epoch: 41, step: 569, loss: 0.35813233256340027, mean loss: 0.34377360921043687
Epoch: 41, step: 570, loss: 0.3521733283996582, mean loss: 0.34377374973271524
Epoch: 41, step: 571, loss: 0.2836819887161255, mean loss: 0.34377274445031064
Epoch: 41, step: 572, loss: 0.3159189820289612, mean loss: 0.3437722784891145
Epoch: 41, step: 573, loss: 0.303645521402359, mean loss: 0.3437716072261568
Epoch: 41, step: 574, loss: 0.3449038863182068, mean loss: 0.34377162616724133
Epoch: 41, step: 575, loss: 0.3097558319568634, mean loss: 0.34377105715094475
Epoch: 41, step: 576, loss: 0.36711975932121277, mean loss: 0.3437714477215637
Epoch: 41, step: 577, loss: 0.3312177360057831, mean loss: 0.343771237730066
Epoch: 41, step: 578, loss: 0.2905174791812897, mean loss: 0.3437703469457536
Epoch: 41, step: 579, loss: 0.3292880058288574, mean loss: 0.3437701047013217
Epoch: 41, step: 580, loss: 0.3058961033821106, mean loss: 0.34376947119791246
Epoch: 41, step: 581, loss: 0.2930617928504944, mean loss: 0.3437686230448608
Epoch: 41, step: 582, loss: 0.3201725482940674, mean loss: 0.34376822837587334
Epoch: 41, step: 583, loss: 0.35790175199508667, mean loss: 0.34376846476985906
Epoch: 41, step: 584, loss: 0.3099459707736969, mean loss: 0.3437678990722559
Epoch: 41, step: 585, loss: 0.34913378953933716, mean loss: 0.34376798881787335
Epoch: 41, step: 586, loss: 0.3610657751560211, mean loss: 0.34376827812205524
Epoch: 41, step: 587, loss: 0.3307328224182129, mean loss: 0.3437680601086805
Epoch: 41, step: 588, loss: 0.3172227740287781, mean loss: 0.34376761615560775
Epoch: 41, step: 589, loss: 0.32817307114601135, mean loss: 0.3437673553510954
Epoch: 41, step: 590, loss: 0.29637518525123596, mean loss: 0.3437665627736207
Epoch: 41, step: 591, loss: 0.3362479507923126, mean loss: 0.3437664370359128
Epoch: 41, step: 592, loss: 0.3288280665874481, mean loss: 0.34376618721785424
Epoch: 41, step: 593, loss: 0.3244097828865051, mean loss: 0.3437658635213371
Epoch: 41, step: 594, loss: 0.3060254752635956, mean loss: 0.3437652324006117
Epoch: 41, step: 595, loss: 0.3158213496208191, mean loss: 0.343764765111602
Epoch: 41, step: 596, loss: 0.3137281537055969, mean loss: 0.3437642628355296
Epoch: 41, step: 597, loss: 0.34654971957206726, mean loss: 0.3437643094135159
Epoch: 41, step: 598, loss: 0.30689573287963867, mean loss: 0.34376369291306386
Epoch: 41, step: 599, loss: 0.3989834487438202, mean loss: 0.34376461625858973
Epoch: 41, step: 600, loss: 0.3353155255317688, mean loss: 0.3437644749812596
Epoch: 41, step: 601, loss: 0.3225770890712738, mean loss: 0.34376412071269274
Epoch: 41, step: 602, loss: 0.3947902023792267, mean loss: 0.3437649738917799
Epoch: 41, step: 603, loss: 0.297703355550766, mean loss: 0.3437642037336348
Epoch: 41, step: 604, loss: 0.3496355414390564, mean loss: 0.3437643019017651
Epoch: 41, step: 605, loss: 0.3130252957344055, mean loss: 0.3437637879575055
Epoch: 41, step: 606, loss: 0.3236854672431946, mean loss: 0.34376345226138416
Epoch: 41, step: 607, loss: 0.3210734724998474, mean loss: 0.34376307290640923
Epoch: 41, step: 608, loss: 0.33408936858177185, mean loss: 0.3437629111739376
Epoch: 41, step: 609, loss: 0.35482561588287354, mean loss: 0.3437630961256999
Epoch: 41, step: 610, loss: 0.3429447114467621, mean loss: 0.3437630824437693
Epoch: 41, step: 611, loss: 0.3514246344566345, mean loss: 0.34376321052909786
Epoch: 41, step: 612, loss: 0.3645792603492737, mean loss: 0.34376355852464796
Epoch: 41, step: 613, loss: 0.33152395486831665, mean loss: 0.34376335391059104
Epoch: 41, step: 614, loss: 0.33920443058013916, mean loss: 0.34376327769862947
Epoch: 41, step: 615, loss: 0.310470849275589, mean loss: 0.34376272115519213
Epoch: 41, step: 616, loss: 0.32212725281715393, mean loss: 0.3437623594850706
Epoch: 41, step: 617, loss: 0.3356441557407379, mean loss: 0.34376222377908044
Epoch: 41, step: 618, loss: 0.34184542298316956, mean loss: 0.343762191737879
Epoch: 41, step: 619, loss: 0.33493128418922424, mean loss: 0.3437620441230831
Epoch: 41, step: 620, loss: 0.32575199007987976, mean loss: 0.343761743077466
Epoch: 41, step: 621, loss: 0.338660329580307, mean loss: 0.34376165780662227
Epoch: 41, step: 622, loss: 0.33753061294555664, mean loss: 0.34376155365557237
Epoch: 41, step: 623, loss: 0.37106335163116455, mean loss: 0.34376200999370793
Epoch: 41, step: 624, loss: 0.35119393467903137, mean loss: 0.3437621342131447
Epoch: 41, step: 625, loss: 0.3353170156478882, mean loss: 0.3437619930612382
Epoch: 41, step: 626, loss: 0.3624407947063446, mean loss: 0.34376230525394175
Epoch: 41, step: 627, loss: 0.39163386821746826, mean loss: 0.34376310535360355
Epoch: 41, step: 628, loss: 0.3330143094062805, mean loss: 0.343762925706988
Epoch: 41, step: 629, loss: 0.3378992974758148, mean loss: 0.3437628277087223
Epoch: 41, step: 630, loss: 0.3377337157726288, mean loss: 0.34376272694642707
Epoch: 41, step: 631, loss: 0.33104854822158813, mean loss: 0.3437625144626594
Epoch: 41, step: 632, loss: 0.3380284607410431, mean loss: 0.3437624186347649
Epoch: 41, step: 633, loss: 0.2745409309864044, mean loss: 0.343761261819904
Epoch: 41, step: 634, loss: 0.2941023111343384, mean loss: 0.34376043194389194
Epoch: 41, step: 635, loss: 0.3590851426124573, mean loss: 0.3437606880386558
Epoch: 41, step: 636, loss: 0.30337777733802795, mean loss: 0.34376001320182653
Epoch: 41, step: 637, loss: 0.3420676589012146, mean loss: 0.3437599849214499
Epoch: 41, step: 638, loss: 0.313086599111557, mean loss: 0.3437594723571431
Epoch: 41, step: 639, loss: 0.3045516610145569, mean loss: 0.34375881719018664
Epoch: 41, step: 640, loss: 0.33715343475341797, mean loss: 0.3437587068153444
Epoch: 41, step: 641, loss: 0.3386908769607544, mean loss: 0.3437586221341651
Epoch: 41, step: 642, loss: 0.3670997619628906, mean loss: 0.3437590121476967
Epoch: 41, step: 643, loss: 0.3592039942741394, mean loss: 0.3437592702178432
Epoch: 41, step: 644, loss: 0.3348528742790222, mean loss: 0.34375912140339454
Epoch: 41, step: 645, loss: 0.34908929467201233, mean loss: 0.3437592104622629
Epoch: 41, step: 646, loss: 0.3026700019836426, mean loss: 0.3437585239372511
Epoch: 41, step: 647, loss: 0.3658159673213959, mean loss: 0.3437588924703558
Epoch: 41, step: 648, loss: 0.330171138048172, mean loss: 0.3437586654515861
Epoch: 41, step: 649, loss: 0.3450040817260742, mean loss: 0.3437586862591558
Epoch: 41, step: 650, loss: 0.3343372046947479, mean loss: 0.34375852885406744
Epoch: 41, step: 651, loss: 0.30407193303108215, mean loss: 0.3437578658195208
Epoch: 41, step: 652, loss: 0.3402145802974701, mean loss: 0.34375780662367866
Epoch: 41, step: 653, loss: 0.3829661011695862, mean loss: 0.3437584616454727
Epoch: 41, step: 654, loss: 0.31919562816619873, mean loss: 0.3437580513006043
Epoch: 41, step: 655, loss: 0.35148561000823975, mean loss: 0.3437581803944684
Epoch: 41, step: 656, loss: 0.3448876738548279, mean loss: 0.3437581992630717
Epoch: 41, step: 657, loss: 0.2927834987640381, mean loss: 0.34375734772619526
Epoch: 41, step: 658, loss: 0.3060673177242279, mean loss: 0.343756718121431
Epoch: 41, step: 659, loss: 0.35810086131095886, mean loss: 0.3437569577336051
Epoch: 41, step: 660, loss: 0.35650259256362915, mean loss: 0.3437571706398914
Epoch: 41, step: 661, loss: 0.37661826610565186, mean loss: 0.3437577195507167
Epoch: 41, step: 662, loss: 0.3166442811489105, mean loss: 0.3437572666561604
Epoch: 41, step: 663, loss: 0.3433217406272888, mean loss: 0.3437572593813888
Epoch: 41, step: 664, loss: 0.32354235649108887, mean loss: 0.3437569217291332
Epoch: 41, step: 665, loss: 0.3134938180446625, mean loss: 0.34375641624886455
Epoch: 41, step: 666, loss: 0.3794197738170624, mean loss: 0.34375701191884783
Epoch: 41, step: 667, loss: 0.34629377722740173, mean loss: 0.34375705428865855
Epoch: 41, step: 668, loss: 0.31000208854675293, mean loss: 0.3437564905125701
Epoch: 41, step: 669, loss: 0.37883511185646057, mean loss: 0.34375707638659464
Epoch: 41, step: 670, loss: 0.39569082856178284, mean loss: 0.3437579437561508
Epoch: 41, step: 671, loss: 0.3272136449813843, mean loss: 0.3437576674467986
Epoch: 41, step: 672, loss: 0.3092550039291382, mean loss: 0.343757091221144
Epoch: 41, step: 673, loss: 0.30411162972450256, mean loss: 0.3437564291171743
Epoch: 41, step: 674, loss: 0.34184888005256653, mean loss: 0.3437563972604455
Epoch: 41, step: 675, loss: 0.3352653384208679, mean loss: 0.34375625545919564
Epoch: 41, step: 676, loss: 0.3347194194793701, mean loss: 0.34375610454595135
Epoch: 41, step: 677, loss: 0.354932576417923, mean loss: 0.34375629118754436
Epoch: 41, step: 678, loss: 0.29798486828804016, mean loss: 0.34375552684001837
Epoch: 41, step: 679, loss: 0.352077841758728, mean loss: 0.34375566581394995
Epoch: 41, step: 680, loss: 0.31945568323135376, mean loss: 0.34375526003650014
Epoch: 41, step: 681, loss: 0.36010435223579407, mean loss: 0.34375553304007694
Epoch: 41, step: 682, loss: 0.2968367338180542, mean loss: 0.3437547495845821
Epoch: 41, step: 683, loss: 0.36211419105529785, mean loss: 0.34375505614752405
Epoch: 41, step: 684, loss: 0.3001413941383362, mean loss: 0.34375432790591026
Epoch: 41, step: 685, loss: 0.3322214186191559, mean loss: 0.34375413533771376
Epoch: 41, step: 686, loss: 0.3434528410434723, mean loss: 0.3437541303070031
Epoch: 41, step: 687, loss: 0.3036988377571106, mean loss: 0.3437534615149683
Epoch: 41, step: 688, loss: 0.31039944291114807, mean loss: 0.3437529046215316
Epoch: 41, step: 689, loss: 0.3082923889160156, mean loss: 0.3437523125669734
Epoch: 41, step: 690, loss: 0.3071100413799286, mean loss: 0.34375170079184714
Epoch: 41, step: 691, loss: 0.32327696681022644, mean loss: 0.3437513589537614
Epoch: 41, step: 692, loss: 0.321503221988678, mean loss: 0.34375098751384014
Epoch: 41, step: 693, loss: 0.3141796588897705, mean loss: 0.343750493819082
Epoch: 41, step: 694, loss: 0.3441813290119171, mean loss: 0.3437505010117763
Epoch: 41, step: 695, loss: 0.33124735951423645, mean loss: 0.34375029227819537
Epoch: 41, step: 696, loss: 0.33438098430633545, mean loss: 0.3437501358649807
Epoch: 41, step: 697, loss: 0.34352177381515503, mean loss: 0.34375013205271987
Epoch: 41, step: 698, loss: 0.3251720368862152, mean loss: 0.3437498219164134
Epoch: 41, step: 699, loss: 0.32676318287849426, mean loss: 0.3437495383520598
Epoch: 41, step: 700, loss: 0.31149202585220337, mean loss: 0.3437489998742616
Epoch: 41, step: 701, loss: 0.3193073868751526, mean loss: 0.34374859187484585
Epoch: 41, step: 702, loss: 0.35036543011665344, mean loss: 0.3437487023266836
Epoch: 41, step: 703, loss: 0.35379308462142944, mean loss: 0.34374886999013915
Epoch: 41, step: 704, loss: 0.32263368368148804, mean loss: 0.3437485175358116
Epoch: 41, step: 705, loss: 0.34373733401298523, mean loss: 0.3437485173491395
Epoch: 41, step: 706, loss: 0.32590097188949585, mean loss: 0.3437482194481621
Epoch: 41, step: 707, loss: 0.3459480106830597, mean loss: 0.343748256165201
Epoch: 41, step: 708, loss: 0.3349546492099762, mean loss: 0.3437481093922643
Epoch: 41, step: 709, loss: 0.3193148076534271, mean loss: 0.3437477015860464
Epoch: 41, step: 710, loss: 0.38703784346580505, mean loss: 0.34374842411198947
Epoch: 41, step: 711, loss: 0.3222869038581848, mean loss: 0.34374806591851437
Epoch: 41, step: 712, loss: 0.32723313570022583, mean loss: 0.34374779028838903
Epoch: 41, step: 713, loss: 0.34910058975219727, mean loss: 0.34374787962380515
Epoch: 41, step: 714, loss: 0.31413793563842773, mean loss: 0.34374738545761435
Epoch: 41, step: 715, loss: 0.3713115155696869, mean loss: 0.3437478454731369
Epoch: 41, step: 716, loss: 0.37521153688430786, mean loss: 0.3437483705593573
Epoch: 41, step: 717, loss: 0.3117018938064575, mean loss: 0.3437478357561673
Epoch: 41, step: 718, loss: 0.31287693977355957, mean loss: 0.3437473205800916
Epoch: 41, step: 719, loss: 0.32178106904029846, mean loss: 0.3437469540115792
Epoch: 41, step: 720, loss: 0.3315275311470032, mean loss: 0.3437467500996415
Epoch: 41, step: 721, loss: 0.34541791677474976, mean loss: 0.3437467779868136
Epoch: 41, step: 722, loss: 0.34003016352653503, mean loss: 0.3437467159677828
Epoch: 41, step: 723, loss: 0.30605828762054443, mean loss: 0.34374608707263615
Epoch: 41, step: 724, loss: 0.3392724096775055, mean loss: 0.34374601242301084
Epoch: 41, step: 725, loss: 0.3188968002796173, mean loss: 0.3437455977857316
Epoch: 41, step: 726, loss: 0.3480139672756195, mean loss: 0.3437456690071277
Epoch: 41, step: 727, loss: 0.31690216064453125, mean loss: 0.34374522110770234
Epoch: 41, step: 728, loss: 0.39218029379844666, mean loss: 0.3437460292613521
Epoch: 41, step: 729, loss: 0.34839412569999695, mean loss: 0.34374610681493506
Epoch: 41, step: 730, loss: 0.33427366614341736, mean loss: 0.3437459487697082
Epoch: 41, step: 731, loss: 0.37134596705436707, mean loss: 0.34374640926120387
Epoch: 41, step: 732, loss: 0.3319438099861145, mean loss: 0.34374621234445335
Epoch: 41, step: 733, loss: 0.3703320026397705, mean loss: 0.34374665589929826
Epoch: 41, step: 734, loss: 0.3273448944091797, mean loss: 0.3437463822584052
Epoch: 41, step: 735, loss: 0.34366869926452637, mean loss: 0.34374638096239263
Epoch: 41, step: 736, loss: 0.34926509857177734, mean loss: 0.34374647303155415
Epoch: 41, step: 737, loss: 0.334722101688385, mean loss: 0.3437463224798318
Epoch: 41, step: 738, loss: 0.30504435300827026, mean loss: 0.3437456768336434
Epoch: 41, step: 739, loss: 0.3310575485229492, mean loss: 0.34374546516728294
Epoch: 41, step: 740, loss: 0.34027454257011414, mean loss: 0.34374540726549635
Epoch: 41, step: 741, loss: 0.3168569505214691, mean loss: 0.3437449587208604
Epoch: 41, step: 742, loss: 0.3083743155002594, mean loss: 0.3437443686889452
Epoch: 41, step: 743, loss: 0.349001944065094, mean loss: 0.3437444563912101
Epoch: 41, step: 744, loss: 0.33997491002082825, mean loss: 0.34374439351198993
Epoch: 41, step: 745, loss: 0.2943160831928253, mean loss: 0.34374356901974107
Epoch: 41, step: 746, loss: 0.3756989538669586, mean loss: 0.34374410204479233
Epoch: 41, step: 747, loss: 0.37434902787208557, mean loss: 0.3437446125352818
Epoch: 41, step: 748, loss: 0.32936498522758484, mean loss: 0.3437443726869455
Epoch: 41, step: 749, loss: 0.37729838490486145, mean loss: 0.34374493234955716
Epoch: 41, step: 750, loss: 0.3528623580932617, mean loss: 0.3437450844207063
Epoch: 41, step: 751, loss: 0.27622145414352417, mean loss: 0.34374395820097386
Epoch: 41, step: 752, loss: 0.3180263936519623, mean loss: 0.34374352926749574
Epoch: 41, step: 753, loss: 0.3807128965854645, mean loss: 0.3437441458552291
Epoch: 41, step: 754, loss: 0.3361218273639679, mean loss: 0.3437440187297185
Epoch: 41, step: 755, loss: 0.3010125160217285, mean loss: 0.3437433060628955
Epoch: 41, step: 756, loss: 0.3417351245880127, mean loss: 0.3437432725714348
Epoch: 41, step: 757, loss: 0.32757434248924255, mean loss: 0.34374300291848653
Epoch: 41, step: 758, loss: 0.32554545998573303, mean loss: 0.34374269943895863
Epoch: 41, step: 759, loss: 0.35052093863487244, mean loss: 0.343742812477435
Epoch: 41, step: 760, loss: 0.32042574882507324, mean loss: 0.34374242363288143
Epoch: 41, step: 761, loss: 0.31262943148612976, mean loss: 0.3437419047890008
Epoch: 41, step: 762, loss: 0.3493193984031677, mean loss: 0.3437419977983829
Epoch: 41, step: 763, loss: 0.35086557269096375, mean loss: 0.34374211658798554
Epoch: 41, step: 764, loss: 0.3344801068305969, mean loss: 0.3437419621413588
Epoch: 41, step: 765, loss: 0.3274679183959961, mean loss: 0.34374169077161154
Epoch: 41, step: 766, loss: 0.3835904002189636, mean loss: 0.34374235523792773
Epoch: 41, step: 767, loss: 0.34361255168914795, mean loss: 0.3437423530735252
Epoch: 41, step: 768, loss: 0.33740437030792236, mean loss: 0.3437422473929228
Epoch: 41, step: 769, loss: 0.3683677017688751, mean loss: 0.34374265799509
Epoch: 41, step: 770, loss: 0.3530137240886688, mean loss: 0.34374281257726746
Epoch: 41, step: 771, loss: 0.3313872516155243, mean loss: 0.3437426065688481
Epoch: 41, step: 772, loss: 0.3159094452857971, mean loss: 0.3437421425049355
Epoch: 41, step: 773, loss: 0.3327603042125702, mean loss: 0.34374195940716146
Epoch: 41, step: 774, loss: 0.3683876395225525, mean loss: 0.3437423703123135
Epoch: 41, step: 775, loss: 0.37805575132369995, mean loss: 0.3437429423926905
Epoch: 41, step: 776, loss: 0.2937486469745636, mean loss: 0.34374210889049117
Epoch: 41, step: 777, loss: 0.33557918667793274, mean loss: 0.34374197280096075
Epoch: 41, step: 778, loss: 0.3183520436286926, mean loss: 0.3437415495155437
Epoch: 41, step: 779, loss: 0.2882727086544037, mean loss: 0.3437406247882687
Epoch: 41, step: 780, loss: 0.33557620644569397, mean loss: 0.34374048868060275
Epoch: 41, step: 781, loss: 0.3057209253311157, mean loss: 0.3437398548733252
Epoch: 41, step: 782, loss: 0.32750746607780457, mean loss: 0.34373958427488227
Epoch: 41, step: 783, loss: 0.3556792736053467, mean loss: 0.3437397833095114
Epoch: 41, step: 784, loss: 0.34619972109794617, mean loss: 0.34373982431599237
Epoch: 41, step: 785, loss: 0.30861490964889526, mean loss: 0.34373923880316243
Epoch: 41, step: 786, loss: 0.3485167920589447, mean loss: 0.3437393184409957
Epoch: 41, step: 787, loss: 0.3306950032711029, mean loss: 0.34373910100675165
Epoch: 41, step: 788, loss: 0.2817375659942627, mean loss: 0.34373806752726216
Epoch: 41, step: 789, loss: 0.3490397334098816, mean loss: 0.3437381558971972
Epoch: 41, step: 790, loss: 0.2926454544067383, mean loss: 0.34373730428120436
Epoch: 41, step: 791, loss: 0.36869391798973083, mean loss: 0.3437377202524976
Epoch: 41, step: 792, loss: 0.336579293012619, mean loss: 0.3437376009394113
Epoch: 41, step: 793, loss: 0.37935706973075867, mean loss: 0.34373819461701377
Epoch: 41, step: 794, loss: 0.3303724229335785, mean loss: 0.3437379718504396
Epoch: 41, step: 795, loss: 0.3283836245536804, mean loss: 0.3437377159446513
Epoch: 41, step: 796, loss: 0.411281019449234, mean loss: 0.34373884164761465
Epoch: 41, step: 797, loss: 0.30476415157318115, mean loss: 0.3437381920910986
Epoch: 41, step: 798, loss: 0.30930060148239136, mean loss: 0.3437376181599517
Epoch: 41, step: 799, loss: 0.28427842259407043, mean loss: 0.3437366272394203
Epoch: 41, step: 800, loss: 0.35639941692352295, mean loss: 0.3437368382683293
Epoch: 41, step: 801, loss: 0.371075838804245, mean loss: 0.3437372938727778
Epoch: 41, step: 802, loss: 0.3243238925933838, mean loss: 0.34373697035383366
Epoch: 41, step: 803, loss: 0.3573375642299652, mean loss: 0.34373719700017874
Epoch: 41, step: 804, loss: 0.35403168201446533, mean loss: 0.3437373685491966
Epoch: 41, step: 805, loss: 0.30762606859207153, mean loss: 0.3437367667944898
Epoch: 41, step: 806, loss: 0.3589833974838257, mean loss: 0.3437370208584229
Epoch: 41, step: 807, loss: 0.3436275124549866, mean loss: 0.3437370190336478
Epoch: 41, step: 808, loss: 0.3136228024959564, mean loss: 0.34373651723876103
Epoch: 41, step: 809, loss: 0.3425818085670471, mean loss: 0.34373649799810596
Epoch: 41, step: 810, loss: 0.3361112177371979, mean loss: 0.34373637094186565
Epoch: 41, step: 811, loss: 0.38419607281684875, mean loss: 0.34373704509045727
Epoch: 41, step: 812, loss: 0.315638929605484, mean loss: 0.3437365769211805
Epoch: 41, step: 813, loss: 0.31725773215293884, mean loss: 0.34373613573945555
Epoch: 41, step: 814, loss: 0.3238159716129303, mean loss: 0.343735803841821
Epoch: 41, step: 815, loss: 0.35463747382164, mean loss: 0.343735985475776
Epoch: 41, step: 816, loss: 0.3682100772857666, mean loss: 0.3437363932345906
Epoch: 41, step: 817, loss: 0.29827606678009033, mean loss: 0.3437356358401943
Epoch: 41, step: 818, loss: 0.3534594774246216, mean loss: 0.34373579784211994
Epoch: 41, step: 819, loss: 0.30501410365104675, mean loss: 0.3437351527385915
Epoch: 41, step: 820, loss: 0.3101443946361542, mean loss: 0.34373459312579513
Epoch: 41, step: 821, loss: 0.3003532886505127, mean loss: 0.3437338704172276
Epoch: 41, step: 822, loss: 0.3682924211025238, mean loss: 0.3437342795422994
Epoch: 41, step: 823, loss: 0.2733103334903717, mean loss: 0.3437331063573515
Epoch: 41, step: 824, loss: 0.353836327791214, mean loss: 0.34373327466302767
Epoch: 41, step: 825, loss: 0.3020034730434418, mean loss: 0.34373257951390856
Epoch: 41, step: 826, loss: 0.3649235963821411, mean loss: 0.3437329325151391
Epoch: 41, step: 827, loss: 0.3408234417438507, mean loss: 0.3437328840494746
Epoch: 41, step: 828, loss: 0.32021331787109375, mean loss: 0.3437324922721825
Epoch: 41, step: 829, loss: 0.3442451059818268, mean loss: 0.34373250081090573
Epoch: 41, step: 830, loss: 0.3544008135795593, mean loss: 0.3437326785124593
Epoch: 41, step: 831, loss: 0.31251853704452515, mean loss: 0.3437321585887224
Epoch: 41, step: 832, loss: 0.36050882935523987, mean loss: 0.34373243802758124
Epoch: 41, step: 833, loss: 0.29665058851242065, mean loss: 0.34373165382674986
Epoch: 41, step: 834, loss: 0.35092973709106445, mean loss: 0.3437317737168757
Epoch: 41, step: 835, loss: 0.37788069248199463, mean loss: 0.3437323424863421
Epoch: 41, step: 836, loss: 0.3182360529899597, mean loss: 0.34373191783835993
Epoch: 41, step: 837, loss: 0.3592907190322876, mean loss: 0.34373217697032077
Epoch: 41, step: 838, loss: 0.35677823424339294, mean loss: 0.34373239424889235
Epoch: 41, step: 839, loss: 0.29284876585006714, mean loss: 0.34373154680987433
Epoch: 41, step: 840, loss: 0.2992004454135895, mean loss: 0.3437308051810727
Epoch: 41, step: 841, loss: 0.33711016178131104, mean loss: 0.34373069492154834
Epoch: 41, step: 842, loss: 0.30219772458076477, mean loss: 0.34373000324718755
Epoch: 41, step: 843, loss: 0.3195418417453766, mean loss: 0.34372960043341355
Epoch: 41, step: 844, loss: 0.33013102412223816, mean loss: 0.34372937397541575
Epoch: 41, step: 845, loss: 0.30291008949279785, mean loss: 0.34372869422047014
Epoch: 41, step: 846, loss: 0.3000413179397583, mean loss: 0.343727966715911
Epoch: 41, step: 847, loss: 0.33069783449172974, mean loss: 0.3437277497350906
Epoch: 41, step: 848, loss: 0.35376065969467163, mean loss: 0.3437279168026802
Epoch: 41, step: 849, loss: 0.36221247911453247, mean loss: 0.34372822460169966
Epoch: 41, step: 850, loss: 0.34123390913009644, mean loss: 0.34372818306784786
Epoch: 41, step: 851, loss: 0.32778435945510864, mean loss: 0.3437279175852381
Epoch: 41, step: 852, loss: 0.3333292305469513, mean loss: 0.343727744438277
Epoch: 41, step: 853, loss: 0.31703463196754456, mean loss: 0.34372729998270957
Epoch: 41, step: 854, loss: 0.31552451848983765, mean loss: 0.34372683039810953
Epoch: 41, step: 855, loss: 0.3128320872783661, mean loss: 0.3437263160001222
Epoch: 41, step: 856, loss: 0.36394041776657104, mean loss: 0.34372665255964946
Epoch: 41, step: 857, loss: 0.32379233837127686, mean loss: 0.34372632066403846
Epoch: 41, step: 858, loss: 0.34170880913734436, mean loss: 0.3437262870741158
Epoch: 41, step: 859, loss: 0.38342931866645813, mean loss: 0.3437269480862294
Epoch: 41, step: 860, loss: 0.3360103964805603, mean loss: 0.3437268196162118
Epoch: 41, step: 861, loss: 0.3909255862236023, mean loss: 0.34372760539796204
Epoch: 41, step: 862, loss: 0.3181290328502655, mean loss: 0.34372717923097273
Epoch: 41, step: 863, loss: 0.34158194065093994, mean loss: 0.3437271435174717
Epoch: 41, step: 864, loss: 0.33241623640060425, mean loss: 0.34372695521889646
Epoch: 41, step: 865, loss: 0.33552154898643494, mean loss: 0.34372681862148957
Epoch: 41, step: 866, loss: 0.3362988531589508, mean loss: 0.34372669496838804
Epoch: 41, step: 867, loss: 0.4092158377170563, mean loss: 0.34372778514588753
Epoch: 41, step: 868, loss: 0.31999507546424866, mean loss: 0.343727390081388
Epoch: 41, step: 869, loss: 0.3047870397567749, mean loss: 0.3437267418750038
Epoch: 41, step: 870, loss: 0.37746530771255493, mean loss: 0.34372730348242514
Epoch: 41, step: 871, loss: 0.35398921370506287, mean loss: 0.3437274742978959
Epoch: 41, step: 872, loss: 0.36802852153778076, mean loss: 0.34372787879624367
Epoch: 41, step: 873, loss: 0.30466124415397644, mean loss: 0.3437272285310111
Epoch: 41, step: 874, loss: 0.35385292768478394, mean loss: 0.343727397070753
Epoch: 41, step: 875, loss: 0.3150993287563324, mean loss: 0.3437269205716133
Epoch: 41, step: 876, loss: 0.3100641369819641, mean loss: 0.34372636028161163
Epoch: 41, step: 877, loss: 0.3245958983898163, mean loss: 0.3437260418757348
Epoch: 41, step: 878, loss: 0.3083494305610657, mean loss: 0.3437254530800469
Epoch: 41, step: 879, loss: 0.34988775849342346, mean loss: 0.34372555564155105
Epoch: 41, step: 880, loss: 0.3512840270996094, mean loss: 0.3437256814378639
Epoch: 41, step: 881, loss: 0.3512641489505768, mean loss: 0.34372580689916127
Epoch: 41, step: 882, loss: 0.337950736284256, mean loss: 0.3437257107873465
Epoch: 41, step: 883, loss: 0.333769291639328, mean loss: 0.34372554509005004
Epoch: 41, step: 884, loss: 0.3383653461933136, mean loss: 0.3437254558857215
Epoch: 41, step: 885, loss: 0.3307311534881592, mean loss: 0.34372523963838586
Epoch: 41, step: 886, loss: 0.34453412890434265, mean loss: 0.3437252530994577
Epoch: 41, step: 887, loss: 0.339751660823822, mean loss: 0.34372518697431165
Epoch: 41, step: 888, loss: 0.3464493751525879, mean loss: 0.343725232307182
Epoch: 41, step: 889, loss: 0.3448135256767273, mean loss: 0.3437252504170327
Epoch: 41, step: 890, loss: 0.30305320024490356, mean loss: 0.34372457362112335
Epoch: 41, step: 891, loss: 0.31853625178337097, mean loss: 0.343724154486375
Epoch: 41, step: 892, loss: 0.3155517876148224, mean loss: 0.3437236857047907
Epoch: 41, step: 893, loss: 0.34825509786605835, mean loss: 0.3437237611051728
Epoch: 41, step: 894, loss: 0.35954082012176514, mean loss: 0.34372402428857046
Epoch: 41, step: 895, loss: 0.31348901987075806, mean loss: 0.343723521210294
Epoch: 41, step: 896, loss: 0.3179209530353546, mean loss: 0.3437230918901799
Epoch: 41, step: 897, loss: 0.3382226824760437, mean loss: 0.3437230003722701
Epoch: 41, step: 898, loss: 0.3427973687648773, mean loss: 0.3437229849715146
Epoch: 41, step: 899, loss: 0.3478284478187561, mean loss: 0.34372305327749836
Epoch: 41, step: 900, loss: 0.3798944652080536, mean loss: 0.3437236550812074
Epoch: 41, step: 901, loss: 0.3028362989425659, mean loss: 0.3437229748270541
Epoch: 41, step: 902, loss: 0.3352198898792267, mean loss: 0.3437228333612523
Epoch: 41, step: 903, loss: 0.3231239318847656, mean loss: 0.3437224906630844
Epoch: 41, step: 904, loss: 0.3237297832965851, mean loss: 0.343722158055532
Epoch: 41, step: 905, loss: 0.2999293804168701, mean loss: 0.34372142951156864
Epoch: 41, step: 906, loss: 0.3328700661659241, mean loss: 0.34372124898947876
Epoch: 41, step: 907, loss: 0.311065673828125, mean loss: 0.343720705743951
Epoch: 41, step: 908, loss: 0.37122130393981934, mean loss: 0.3437211632256637
Epoch: 41, step: 909, loss: 0.3005618751049042, mean loss: 0.34372044526831397
Epoch: 41, step: 910, loss: 0.32628336548805237, mean loss: 0.34372015520626986
Epoch: 41, step: 911, loss: 0.34913694858551025, mean loss: 0.34372024531195516
Epoch: 41, step: 912, loss: 0.32795894145965576, mean loss: 0.34371998313480306
Epoch: 41, step: 913, loss: 0.35265520215034485, mean loss: 0.34372013176281824
Epoch: 41, step: 914, loss: 0.3211512565612793, mean loss: 0.34371975635944824
Epoch: 41, step: 915, loss: 0.3026180565357208, mean loss: 0.3437190726984399
Epoch: 41, step: 916, loss: 0.3537987172603607, mean loss: 0.3437192403544097
Epoch: 41, step: 917, loss: 0.3546026051044464, mean loss: 0.3437194213757455
Epoch: 41, step: 918, loss: 0.29479771852493286, mean loss: 0.3437186076821033
Epoch: 41, step: 919, loss: 0.39742621779441833, mean loss: 0.34371950096282505
Epoch: 41, step: 920, loss: 0.32009047269821167, mean loss: 0.34371910796443395
Epoch: 41, step: 921, loss: 0.3505113422870636, mean loss: 0.3437192209311093
Epoch: 41, step: 922, loss: 0.30805379152297974, mean loss: 0.34371862776282536
Epoch: 41, step: 923, loss: 0.32376977801322937, mean loss: 0.3437182959897787
Epoch: 41, step: 924, loss: 0.32134389877319336, mean loss: 0.3437179238831876
Epoch: 41, step: 925, loss: 0.3284468352794647, mean loss: 0.34371766991530794
Epoch: 41, step: 926, loss: 0.3011421859264374, mean loss: 0.3437169618698075
Epoch: 41, step: 927, loss: 0.3179054856300354, mean loss: 0.34371653262288004
Epoch: 41, step: 928, loss: 0.306763231754303, mean loss: 0.34371591809673185
Epoch: 41, step: 929, loss: 0.3883483111858368, mean loss: 0.34371666031233516
Epoch: 41, step: 930, loss: 0.3106096386909485, mean loss: 0.34371610976736766
Epoch: 41, step: 931, loss: 0.2853531241416931, mean loss: 0.3437151392507782
Epoch: 41, step: 932, loss: 0.3051569163799286, mean loss: 0.34371449807774207
Epoch: 41, step: 933, loss: 0.3545491099357605, mean loss: 0.34371467824023266
Epoch: 41, step: 934, loss: 0.3439132571220398, mean loss: 0.34371468154223106
Epoch: 41, step: 935, loss: 0.29962223768234253, mean loss: 0.3437139483788812
Epoch: 41, step: 936, loss: 0.27938157320022583, mean loss: 0.34371287868640554
Epoch: 41, step: 937, loss: 0.3071526288986206, mean loss: 0.3437122707876029
Epoch: 41, step: 938, loss: 0.33796024322509766, mean loss: 0.34371217514841695
Epoch: 41, step: 939, loss: 0.30401885509490967, mean loss: 0.3437115151770141
Epoch: 41, step: 940, loss: 0.34957659244537354, mean loss: 0.3437116126926391
Epoch: 41, step: 941, loss: 0.35807231068611145, mean loss: 0.3437118514566133
Epoch: 41, step: 942, loss: 0.32648760080337524, mean loss: 0.3437115650873737
Epoch: 41, step: 943, loss: 0.29300254583358765, mean loss: 0.34371072201662733
Epoch: 41, step: 944, loss: 0.3624449372291565, mean loss: 0.34371103348008
Epoch: 41, step: 945, loss: 0.3641813397407532, mean loss: 0.34371137380104855
Epoch: 41, step: 946, loss: 0.32516026496887207, mean loss: 0.343711065392064
Epoch: 41, step: 947, loss: 0.31362152099609375, mean loss: 0.34371056516689447
Epoch: 41, step: 948, loss: 0.3745342195034027, mean loss: 0.34371107758779346
Epoch: 41, step: 949, loss: 0.3521523177623749, mean loss: 0.3437112179149566
Epoch: 41, step: 950, loss: 0.34701135754585266, mean loss: 0.3437112727755606
Epoch: 41, step: 951, loss: 0.3455784320831299, mean loss: 0.34371130381418197
Epoch: 41, step: 952, loss: 0.31145280599594116, mean loss: 0.343710767575709
Epoch: 41, step: 953, loss: 0.35226941108703613, mean loss: 0.34371090984512476
Epoch: 41, step: 954, loss: 0.34057995676994324, mean loss: 0.34371085780049176
Epoch: 41, step: 955, loss: 0.3219539523124695, mean loss: 0.34371049614980215
Epoch: 41, step: 956, loss: 0.30639633536338806, mean loss: 0.34370987591142865
Epoch: 41, step: 957, loss: 0.3452296257019043, mean loss: 0.34370990117238726
Epoch: 41, step: 958, loss: 0.3203367292881012, mean loss: 0.3437095126749406
Epoch: 41, step: 959, loss: 0.32809963822364807, mean loss: 0.3437092532195445
Epoch: 41, step: 960, loss: 0.3706856667995453, mean loss: 0.34370970159340936
Epoch: 41, step: 961, loss: 0.3228243291378021, mean loss: 0.3437093544642591
Epoch: 41, step: 962, loss: 0.30075979232788086, mean loss: 0.3437086406250759
Epoch: 41, step: 963, loss: 0.34510546922683716, mean loss: 0.34370866384054927
Epoch: 41, step: 964, loss: 0.31009772419929504, mean loss: 0.34370810523163703
Epoch: 41, step: 965, loss: 0.3805219233036041, mean loss: 0.3437087170617529
Epoch: 41, step: 966, loss: 0.31252872943878174, mean loss: 0.3437081988721329
Epoch: 41, step: 967, loss: 0.34702596068382263, mean loss: 0.3437082540101009
Epoch: 41, step: 968, loss: 0.3405425250530243, mean loss: 0.3437082013996451
Epoch: 41, step: 969, loss: 0.29862597584724426, mean loss: 0.3437074522018927
Epoch: 41, step: 970, loss: 0.2893693447113037, mean loss: 0.34370654920052185
Epoch: 41, step: 971, loss: 0.3319700062274933, mean loss: 0.34370635416358064
Epoch: 41, step: 972, loss: 0.2994365990161896, mean loss: 0.3437056185045224
Epoch: 41, step: 973, loss: 0.3653479516506195, mean loss: 0.3437059781431469
Epoch: 41, step: 974, loss: 0.31992316246032715, mean loss: 0.34370558294190257
Epoch: 41, step: 975, loss: 0.32472047209739685, mean loss: 0.3437052674698048
Epoch: 41, step: 976, loss: 0.3468415141105652, mean loss: 0.34370531958337286
Epoch: 41, step: 977, loss: 0.3090161979198456, mean loss: 0.3437047431797694
Epoch: 41, step: 978, loss: 0.3426991403102875, mean loss: 0.3437047264706843
Epoch: 41, step: 979, loss: 0.3147293031215668, mean loss: 0.34370424502340013
Epoch: 41, step: 980, loss: 0.3287317156791687, mean loss: 0.34370399624830095
Epoch: 41, step: 981, loss: 0.3063788115978241, mean loss: 0.3437033760843982
Epoch: 41, step: 982, loss: 0.3453900218009949, mean loss: 0.3437034041078205
Epoch: 41, step: 983, loss: 0.3175290524959564, mean loss: 0.3437029692312403
Epoch: 41, step: 984, loss: 0.3584156930446625, mean loss: 0.3437032136733113
Epoch: 41, step: 985, loss: 0.32693609595298767, mean loss: 0.3437029351034871
Epoch: 41, step: 986, loss: 0.3416356146335602, mean loss: 0.3437029007574807
Epoch: 41, step: 987, loss: 0.32369181513786316, mean loss: 0.34370256830324064
Epoch: 41, step: 988, loss: 0.3438130021095276, mean loss: 0.34370257013790256
Epoch: 41, step: 989, loss: 0.3852784037590027, mean loss: 0.3437032608352083
Epoch: 41, step: 990, loss: 0.3103320300579071, mean loss: 0.3437027064497813
Epoch: 41, step: 991, loss: 0.32637545466423035, mean loss: 0.34370241860255246
Epoch: 41, step: 992, loss: 0.31077930331230164, mean loss: 0.34370187167969435
Epoch: 41, step: 993, loss: 0.34495845437049866, mean loss: 0.34370189255385447
Epoch: 41, step: 994, loss: 0.3313320577144623, mean loss: 0.3437016870714571
Epoch: 41, step: 995, loss: 0.3587213456630707, mean loss: 0.34370193656744696
Epoch: 41, step: 996, loss: 0.3284779191017151, mean loss: 0.34370168368099213
Epoch: 41, step: 997, loss: 0.36673703789711, mean loss: 0.34370206631536004
Epoch: 41, step: 998, loss: 0.30777707695961, mean loss: 0.34370146958447695
Epoch: 41, step: 999, loss: 0.3020026385784149, mean loss: 0.3437007769588872
Epoch: 41, step: 1000, loss: 0.3759367763996124, mean loss: 0.34370131239613394
Epoch: 41, step: 1001, loss: 0.35602396726608276, mean loss: 0.34370151707099805
Epoch: 41, step: 1002, loss: 0.34795746207237244, mean loss: 0.3437015877595393
Epoch: 41, step: 1003, loss: 0.3189486861228943, mean loss: 0.34370117663640554
Epoch: 41, step: 1004, loss: 0.34429898858070374, mean loss: 0.3437011865653521
Epoch: 41, step: 1005, loss: 0.3372359573841095, mean loss: 0.3437010791873554
Epoch: 41, step: 1006, loss: 0.36675581336021423, mean loss: 0.3437014620863966
Epoch: 41, step: 1007, loss: 0.3791366219520569, mean loss: 0.34370205059300435
Epoch: 41, step: 1008, loss: 0.31290191411972046, mean loss: 0.34370153907329143
Epoch: 41, step: 1009, loss: 0.31503480672836304, mean loss: 0.3437010629924407
Epoch: 41, step: 1010, loss: 0.3211677074432373, mean loss: 0.3437006887774519
Epoch: 41, step: 1011, loss: 0.31742554903030396, mean loss: 0.34370025242930946
Epoch: 41, step: 1012, loss: 0.32662203907966614, mean loss: 0.34369996881814735
Epoch: 41, step: 1013, loss: 0.3809542655944824, mean loss: 0.34370058747530596
Epoch: 41, step: 1014, loss: 0.3479059636592865, mean loss: 0.34370065731001237
Epoch: 41, step: 1015, loss: 0.36833634972572327, mean loss: 0.34370106640487147
Epoch: 41, step: 1016, loss: 0.3086181879043579, mean loss: 0.34370048383602503
Epoch: 41, step: 1017, loss: 0.355165034532547, mean loss: 0.3437006742074955
Epoch: 41, step: 1018, loss: 0.3455953001976013, mean loss: 0.34370070566766836
Epoch: 41, step: 1019, loss: 0.33994609117507935, mean loss: 0.3437006433235117
Epoch: 41, step: 1020, loss: 0.34635716676712036, mean loss: 0.34370068743348997
Epoch: 41, step: 1021, loss: 0.3356774151325226, mean loss: 0.3437005542140781
Epoch: 41, step: 1022, loss: 0.35804691910743713, mean loss: 0.3437007924189512
Epoch: 41, step: 1023, loss: 0.3241557478904724, mean loss: 0.3437004679013758
Epoch: 41, step: 1024, loss: 0.3275086581707001, mean loss: 0.34370019906394317
Epoch: 41, step: 1025, loss: 0.3373444974422455, mean loss: 0.3437000935400909
Epoch: 41, step: 1026, loss: 0.33564475178718567, mean loss: 0.3436999597992971
Epoch: 41, step: 1027, loss: 0.32004889845848083, mean loss: 0.3436995671332501
Epoch: 41, step: 1028, loss: 0.34288695454597473, mean loss: 0.34369955364209764
Epoch: 41, step: 1029, loss: 0.37143632769584656, mean loss: 0.34370001412577883
Epoch: 41, step: 1030, loss: 0.34666985273361206, mean loss: 0.34370006342998083
Epoch: 41, step: 1031, loss: 0.3522271513938904, mean loss: 0.34370020499130566
Epoch: 41, step: 1032, loss: 0.3392869830131531, mean loss: 0.34370013172700004
Epoch: 41, step: 1033, loss: 0.3327392339706421, mean loss: 0.34369994976714485
Epoch: 41, step: 1034, loss: 0.34531694650650024, mean loss: 0.3436999766101658
Epoch: 41, step: 1035, loss: 0.3685263693332672, mean loss: 0.343700388734879
Epoch: 41, step: 1036, loss: 0.2980961501598358, mean loss: 0.34369963170497286
Epoch: 41, step: 1037, loss: 0.32377350330352783, mean loss: 0.34369930093693063
Epoch: 41, step: 1038, loss: 0.32261067628860474, mean loss: 0.34369895087759345
Epoch: 41, step: 1039, loss: 0.32920533418655396, mean loss: 0.3436987102956817
Epoch: 41, step: 1040, loss: 0.35101380944252014, mean loss: 0.34369883171819227
Epoch: 41, step: 1041, loss: 0.3539372384548187, mean loss: 0.34369900166153683
Epoch: 41, step: 1042, loss: 0.3010282516479492, mean loss: 0.3436982933980546
Epoch: 41, step: 1043, loss: 0.3539228141307831, mean loss: 0.34369846310527696
Epoch: 41, step: 1044, loss: 0.3456905782222748, mean loss: 0.34369849616997705
Epoch: 41, step: 1045, loss: 0.3540711998939514, mean loss: 0.3436986683310347
Epoch: 41, step: 1046, loss: 0.3846333920955658, mean loss: 0.3436993477342606
Epoch: 41, step: 1047, loss: 0.3183025121688843, mean loss: 0.3436989262240109
Epoch: 41, step: 1048, loss: 0.3691045939922333, mean loss: 0.3436993478738502
Epoch: 41, step: 1049, loss: 0.29798850417137146, mean loss: 0.34369858923801355
Epoch: 41, step: 1050, loss: 0.3106960356235504, mean loss: 0.34369804152324107
Epoch: 41, step: 1051, loss: 0.3355479836463928, mean loss: 0.3436979062660405
Epoch: 41, step: 1052, loss: 0.3377455174922943, mean loss: 0.343697807482683
Epoch: 41, step: 1053, loss: 0.33180996775627136, mean loss: 0.343697610200335
Epoch: 41, step: 1054, loss: 0.35769104957580566, mean loss: 0.3436978424219015
Epoch: 41, step: 1055, loss: 0.3005513846874237, mean loss: 0.34369712641696065
Epoch: 41, step: 1056, loss: 0.34326693415641785, mean loss: 0.3436971192781435
Epoch: 41, step: 1057, loss: 0.31580328941345215, mean loss: 0.34369665640220404
Epoch: 41, step: 1058, loss: 0.3266459107398987, mean loss: 0.3436963734633251
Epoch: 41, step: 1059, loss: 0.34976333379745483, mean loss: 0.3436964741363693
Epoch: 41, step: 1060, loss: 0.3587837219238281, mean loss: 0.34369672448479355
Epoch: 41, step: 1061, loss: 0.3149568736553192, mean loss: 0.3436962476014625
Epoch: 41, step: 1062, loss: 0.317158043384552, mean loss: 0.34369580725758914
Epoch: 41, step: 1063, loss: 0.3050667941570282, mean loss: 0.3436951663036318
Epoch: 41, step: 1064, loss: 0.3251950144767761, mean loss: 0.3436948593439705
Epoch: 41, step: 1065, loss: 0.3471028208732605, mean loss: 0.34369491588887724
Epoch: 41, step: 1066, loss: 0.321164071559906, mean loss: 0.34369454206325084
Epoch: 41, step: 1067, loss: 0.3591785430908203, mean loss: 0.34369479896531197
Epoch: 41, step: 1068, loss: 0.30333900451660156, mean loss: 0.3436941294151909
Epoch: 41, step: 1069, loss: 0.37036922574043274, mean loss: 0.34369457197908787
Epoch: 41, step: 1070, loss: 0.3686642646789551, mean loss: 0.3436949862419282
Epoch: 41, step: 1071, loss: 0.30456534028053284, mean loss: 0.34369433706736513
Epoch: 41, step: 1072, loss: 0.32923486828804016, mean loss: 0.3436940971836818
Epoch: 41, step: 1073, loss: 0.33733510971069336, mean loss: 0.34369399168934767
Epoch: 41, step: 1074, loss: 0.3508765995502472, mean loss: 0.343694110845403
Epoch: 41, step: 1075, loss: 0.31561610102653503, mean loss: 0.34369364505227396
Epoch: 41, step: 1076, loss: 0.3455928862094879, mean loss: 0.34369367655873795
Epoch: 41, step: 1077, loss: 0.31441885232925415, mean loss: 0.34369319092746775
Epoch: 41, step: 1078, loss: 0.4134342074394226, mean loss: 0.3436943478210615
Epoch: 41, step: 1079, loss: 0.3369811773300171, mean loss: 0.34369423646198627
Epoch: 41, step: 1080, loss: 0.37164852023124695, mean loss: 0.34369470016413056
Epoch: 41, step: 1081, loss: 0.33139142394065857, mean loss: 0.34369449608231684
Epoch: 41, step: 1082, loss: 0.34671884775161743, mean loss: 0.34369454624821777
Epoch: 41, step: 1083, loss: 0.33834242820739746, mean loss: 0.3436944574723745
Epoch: 41, step: 1084, loss: 0.32878589630126953, mean loss: 0.34369421018744406
Epoch: 41, step: 1085, loss: 0.34545189142227173, mean loss: 0.3436942393412214
Epoch: 41, step: 1086, loss: 0.3252038061618805, mean loss: 0.3436939326547644
Epoch: 41, step: 1087, loss: 0.3511618673801422, mean loss: 0.3436940565175443
Epoch: 41, step: 1088, loss: 0.3147943913936615, mean loss: 0.3436935771971402
Epoch: 41, step: 1089, loss: 0.332735151052475, mean loss: 0.3436933954472788
Epoch: 41, step: 1090, loss: 0.3604888916015625, mean loss: 0.3436936740026508
Epoch: 41, step: 1091, loss: 0.33029037714004517, mean loss: 0.3436934517110085
Epoch: 41, step: 1092, loss: 0.371550977230072, mean loss: 0.3436939137161749
Epoch: 41, step: 1093, loss: 0.3494572043418884, mean loss: 0.34369400929630406
Epoch: 41, step: 1094, loss: 0.30749765038490295, mean loss: 0.34369340901505707
Epoch: 41, step: 1095, loss: 0.31456801295280457, mean loss: 0.3436929260068305
Epoch: 41, step: 1096, loss: 0.36507952213287354, mean loss: 0.343693280670868
Epoch: 41, step: 1097, loss: 0.31866222620010376, mean loss: 0.343692865575938
Epoch: 41, step: 1098, loss: 0.30190300941467285, mean loss: 0.343692172577975
Epoch: 41, step: 1099, loss: 0.31525251269340515, mean loss: 0.34369170097310825
Epoch: 41, step: 1100, loss: 0.42061281204223633, mean loss: 0.3436929765076588
Epoch: 41, step: 1101, loss: 0.3563784658908844, mean loss: 0.3436931868596865
Epoch: 41, step: 1102, loss: 0.30507799983024597, mean loss: 0.34369254654948983
Epoch: 41, step: 1103, loss: 0.30460622906684875, mean loss: 0.34369189843783826
Epoch: 41, step: 1104, loss: 0.35322776436805725, mean loss: 0.3436920565546356
Epoch: 41, step: 1105, loss: 0.3166233003139496, mean loss: 0.34369160772763774
Epoch: 41, step: 1106, loss: 0.34441077709198, mean loss: 0.3436916196519859
Epoch: 41, step: 1107, loss: 0.3118321895599365, mean loss: 0.3436910914083513
Epoch: 41, step: 1108, loss: 0.32863563299179077, mean loss: 0.3436908417862397
Epoch: 41, step: 1109, loss: 0.32463714480400085, mean loss: 0.34369052587787713
Epoch: 41, step: 1110, loss: 0.33711227774620056, mean loss: 0.3436904168129989
Epoch: 41, step: 1111, loss: 0.31378236413002014, mean loss: 0.34368992095696266
Epoch: 41, step: 1112, loss: 0.35493239760398865, mean loss: 0.3436901073468137
Epoch: 41, step: 1113, loss: 0.3335270285606384, mean loss: 0.34368993885517296
Epoch: 41, step: 1114, loss: 0.30223792791366577, mean loss: 0.34368925164200725
Epoch: 41, step: 1115, loss: 0.3020813465118408, mean loss: 0.3436885618557816
Epoch: 41, step: 1116, loss: 0.3513173460960388, mean loss: 0.34368868832557226
Epoch: 41, step: 1117, loss: 0.3251849114894867, mean loss: 0.34368838157551695
Epoch: 41, step: 1118, loss: 0.36066290736198425, mean loss: 0.3436886629694428
Epoch: 41, step: 1119, loss: 0.33143019676208496, mean loss: 0.343688459759009
Epoch: 41, step: 1120, loss: 0.3085830807685852, mean loss: 0.3436878778215206
Epoch: 41, step: 1121, loss: 0.32572513818740845, mean loss: 0.3436875800603623
Epoch: 41, step: 1122, loss: 0.3174157440662384, mean loss: 0.3436871445698524
Epoch: 41, step: 1123, loss: 0.34015795588493347, mean loss: 0.34368708606984105
Epoch: 41, step: 1124, loss: 0.3102360665798187, mean loss: 0.34368653159322965
Epoch: 41, step: 1125, loss: 0.3154064416885376, mean loss: 0.3436860628365596
Epoch: 41, step: 1126, loss: 0.3271789848804474, mean loss: 0.3436857892280009
Epoch: 41, step: 1127, loss: 0.3254699409008026, mean loss: 0.3436854873011905
Epoch: 41, step: 1128, loss: 0.30906206369400024, mean loss: 0.34368491342912033
Epoch: 41, step: 1129, loss: 0.3279445469379425, mean loss: 0.34368465254195074
Epoch: 41, step: 1130, loss: 0.32986295223236084, mean loss: 0.3436844234593236
Epoch: 41, step: 1131, loss: 0.33060482144355774, mean loss: 0.34368420667992133
Epoch: 41, step: 1132, loss: 0.3565967082977295, mean loss: 0.34368442068627925
Epoch: 41, step: 1133, loss: 0.3581659197807312, mean loss: 0.3436846606925621
Epoch: 41, step: 1134, loss: 0.3184778094291687, mean loss: 0.34368424293868377
Epoch: 41, step: 1135, loss: 0.32241347432136536, mean loss: 0.34368389042345976
Epoch: 41, step: 1136, loss: 0.3479977548122406, mean loss: 0.3436839619148899
Epoch: 41, step: 1137, loss: 0.31583520770072937, mean loss: 0.34368350039962337
Epoch: 41, step: 1138, loss: 0.2987973690032959, mean loss: 0.34368275654977504
Epoch: 41, step: 1139, loss: 0.33005744218826294, mean loss: 0.3436825307557547
Epoch: 41, step: 1140, loss: 0.40146103501319885, mean loss: 0.34368348822537537
Epoch: 41, step: 1141, loss: 0.324542760848999, mean loss: 0.34368317104234125
Epoch: 41, step: 1142, loss: 0.3373531997203827, mean loss: 0.34368306614944977
Epoch: 41, step: 1143, loss: 0.34255674481391907, mean loss: 0.3436830474856774
Epoch: 41, step: 1144, loss: 0.35374048352241516, mean loss: 0.34368321414023734
Epoch: 41, step: 1145, loss: 0.3221016824245453, mean loss: 0.343682856534078
Epoch: 41, step: 1146, loss: 0.34887173771858215, mean loss: 0.3436829425124575
Epoch: 41, step: 1147, loss: 0.3086397647857666, mean loss: 0.34368236186595486
Epoch: 41, step: 1148, loss: 0.3204268515110016, mean loss: 0.3436819765411101
Epoch: 41, step: 1149, loss: 0.3450298309326172, mean loss: 0.34368199887358836
Epoch: 41, step: 1150, loss: 0.32050275802612305, mean loss: 0.3436816148251939
Epoch: 41, step: 1151, loss: 0.311987042427063, mean loss: 0.3436810896980748
Epoch: 41, step: 1152, loss: 0.36455902457237244, mean loss: 0.34368143560550685
Epoch: 41, step: 1153, loss: 0.3222566545009613, mean loss: 0.3436810806437602
Epoch: 41, step: 1154, loss: 0.3233056664466858, mean loss: 0.34368074307332
Epoch: 41, step: 1155, loss: 0.290351539850235, mean loss: 0.34367985955437996
Epoch: 41, step: 1156, loss: 0.3650655448436737, mean loss: 0.34368021385078473
Epoch: 41, step: 1157, loss: 0.32737407088279724, mean loss: 0.3436799437115752
Epoch: 41, step: 1158, loss: 0.3210281431674957, mean loss: 0.34367956845188724
Epoch: 41, step: 1159, loss: 0.3166821599006653, mean loss: 0.3436791212083555
Epoch: 41, step: 1160, loss: 0.30101603269577026, mean loss: 0.34367841445628866
Epoch: 41, step: 1161, loss: 0.32517364621162415, mean loss: 0.3436781079133962
Epoch: 41, step: 1162, loss: 0.33578160405158997, mean loss: 0.34367797710510917
Epoch: 41, step: 1163, loss: 0.3113076686859131, mean loss: 0.34367744088876245
Epoch: 41, step: 1164, loss: 0.3292659521102905, mean loss: 0.3436772021654313
Epoch: 41, step: 1165, loss: 0.3167110085487366, mean loss: 0.34367675548341015
Epoch: 41, step: 1166, loss: 0.2950229048728943, mean loss: 0.34367594956913655
Epoch: 41, step: 1167, loss: 0.32550886273384094, mean loss: 0.3436756486500543
Epoch: 41, step: 1168, loss: 0.3038974702358246, mean loss: 0.34367498977641187
Epoch: 41, step: 1169, loss: 0.30674901604652405, mean loss: 0.3436743781559506
Epoch: 41, step: 1170, loss: 0.3130624294281006, mean loss: 0.34367387112574393
Epoch: 41, step: 1171, loss: 0.34426426887512207, mean loss: 0.3436738809044267
Epoch: 41, step: 1172, loss: 0.2871018052101135, mean loss: 0.34367294392385966
Epoch: 41, step: 1173, loss: 0.30834269523620605, mean loss: 0.34367235877283303
Epoch: 41, step: 1174, loss: 0.3368639349937439, mean loss: 0.3436722460113799
Epoch: 41, step: 1175, loss: 0.3157002627849579, mean loss: 0.3436717827456756
Epoch: 41, step: 1176, loss: 0.302912175655365, mean loss: 0.34367110770539655
Epoch: 41, step: 1177, loss: 0.3438999056816101, mean loss: 0.34367111149457175
Epoch: 41, step: 1178, loss: 0.30726727843284607, mean loss: 0.34367050861241843
Epoch: 41, step: 1179, loss: 0.3100228011608124, mean loss: 0.34366995138355894
Epoch: 41, step: 1180, loss: 0.3025682270526886, mean loss: 0.3436692707223959
Epoch: 41, step: 1181, loss: 0.29401206970214844, mean loss: 0.34366844839269994
Epoch: 41, step: 1182, loss: 0.3527662456035614, mean loss: 0.343668599050908
Epoch: 41, step: 1183, loss: 0.30865219235420227, mean loss: 0.3436680191938719
Epoch: 41, step: 1184, loss: 0.31170517206192017, mean loss: 0.3436674899112686
Epoch: 41, step: 1185, loss: 0.32185879349708557, mean loss: 0.34366712878034605
Epoch: 41, step: 1186, loss: 0.3334293067455292, mean loss: 0.3436669592547208
Epoch: 41, step: 1187, loss: 0.3412652015686035, mean loss: 0.3436669194852532
Epoch: 41, step: 1188, loss: 0.3784205913543701, mean loss: 0.3436674949438638
Epoch: 41, step: 1189, loss: 0.3178439736366272, mean loss: 0.34366706735964503
Epoch: 41, step: 1190, loss: 0.32375243306159973, mean loss: 0.34366673761986033
Epoch: 41, step: 1191, loss: 0.33941400051116943, mean loss: 0.3436666672056424
Epoch: 41, step: 1192, loss: 0.33114486932754517, mean loss: 0.3436664598808104
Epoch: 41, step: 1193, loss: 0.31363949179649353, mean loss: 0.34366596272911526
Epoch: 41, step: 1194, loss: 0.2986481487751007, mean loss: 0.34366521738872957
Epoch: 41, step: 1195, loss: 0.3306027948856354, mean loss: 0.3436650011234563
Epoch: 41, step: 1196, loss: 0.3451950252056122, mean loss: 0.3436650264545615
Epoch: 41, step: 1197, loss: 0.3342902660369873, mean loss: 0.3436648712484356
Epoch: 41, step: 1198, loss: 0.3601597547531128, mean loss: 0.3436651443289697
Epoch: 41, step: 1199, loss: 0.3097124695777893, mean loss: 0.34366458223581775
Epoch: 41, step: 1200, loss: 0.32746443152427673, mean loss: 0.3436643140436033
Epoch: 41, step: 1201, loss: 0.2927739918231964, mean loss: 0.3436634715722889
Epoch: 41, step: 1202, loss: 0.3482336699962616, mean loss: 0.3436635472290575
Epoch: 41, step: 1203, loss: 0.33348822593688965, mean loss: 0.34366337878578357
Epoch: 41, step: 1204, loss: 0.3374446630477905, mean loss: 0.343663275842253
Epoch: 41, step: 1205, loss: 0.36354750394821167, mean loss: 0.3436636049968318
Epoch: 41, step: 1206, loss: 0.3086642026901245, mean loss: 0.3436630256420403
Epoch: 41, step: 1207, loss: 0.3144809305667877, mean loss: 0.3436625425907413
Epoch: 41, step: 1208, loss: 0.3603169918060303, mean loss: 0.3436628182673211
Epoch: 41, step: 1209, loss: 0.33067378401756287, mean loss: 0.3436626032669197
Epoch: 41, step: 1210, loss: 0.34556785225868225, mean loss: 0.3436626348029454
Epoch: 41, step: 1211, loss: 0.31588828563690186, mean loss: 0.34366217508450714
Epoch: 41, step: 1212, loss: 0.31428369879722595, mean loss: 0.3436616888227549
Epoch: 41, step: 1213, loss: 0.3133638799190521, mean loss: 0.34366118735284684
Epoch: 41, step: 1214, loss: 0.3708857297897339, mean loss: 0.3436616379485607
Epoch: 41, step: 1215, loss: 0.32475462555885315, mean loss: 0.3436613250221722
Epoch: 41, step: 1216, loss: 0.3712241053581238, mean loss: 0.3436617812009898
Epoch: 41, step: 1217, loss: 0.3025500178337097, mean loss: 0.3436611007904875
Epoch: 41, step: 1218, loss: 0.3162783682346344, mean loss: 0.3436606476065583
Epoch: 41, step: 1219, loss: 0.34379056096076965, mean loss: 0.34366064975658733
Epoch: 41, step: 1220, loss: 0.31108933687210083, mean loss: 0.3436601107195516
Epoch: 41, step: 1221, loss: 0.3554762899875641, mean loss: 0.34366030626748245
Epoch: 41, step: 1222, loss: 0.3120148181915283, mean loss: 0.343659782569664
Epoch: 41, step: 1223, loss: 0.3468661606311798, mean loss: 0.3436598356307956
Epoch: 41, step: 1224, loss: 0.3441988527774811, mean loss: 0.34365984455063786
Epoch: 41, step: 1225, loss: 0.32595938444137573, mean loss: 0.3436595516421469
Epoch: 41, step: 1226, loss: 0.32715559005737305, mean loss: 0.34365927853791917
Epoch: 41, step: 1227, loss: 0.3339095115661621, mean loss: 0.3436591172034114
Epoch: 41, step: 1228, loss: 0.33424627780914307, mean loss: 0.3436589614467984
Epoch: 41, step: 1229, loss: 0.3572143614292145, mean loss: 0.34365918574768833
Epoch: 41, step: 1230, loss: 0.3500317633152008, mean loss: 0.3436592911928371
Epoch: 41, step: 1231, loss: 0.3249351978302002, mean loss: 0.34365898137595047
Epoch: 41, step: 1232, loss: 0.3166888654232025, mean loss: 0.343658535124218
Epoch: 41, step: 1233, loss: 0.31239694356918335, mean loss: 0.34365801787362144
Epoch: 41, step: 1234, loss: 0.38176265358924866, mean loss: 0.34365864833798576
Epoch: 41, step: 1235, loss: 0.3299035429954529, mean loss: 0.3436584207551707
Epoch: 41, step: 1236, loss: 0.3301956057548523, mean loss: 0.3436581980120824
Epoch: 41, step: 1237, loss: 0.3007219433784485, mean loss: 0.3436574876409062
Epoch: 41, step: 1238, loss: 0.3037030100822449, mean loss: 0.3436568266135323
Epoch: 41, step: 1239, loss: 0.31238603591918945, mean loss: 0.34365630926208807
Epoch: 41, step: 1240, loss: 0.3127843141555786, mean loss: 0.3436557985168634
Epoch: 41, step: 1241, loss: 0.30385634303092957, mean loss: 0.34365514008693443
Epoch: 41, step: 1242, loss: 0.37354910373687744, mean loss: 0.34365563463527676
Epoch: 41, step: 1243, loss: 0.3655489683151245, mean loss: 0.34365599681985987
Epoch: 41, step: 1244, loss: 0.3277395963668823, mean loss: 0.34365573351690276
Epoch: 41, step: 1245, loss: 0.3168525993824005, mean loss: 0.3436552901234514
Epoch: 41, step: 1246, loss: 0.3001427948474884, mean loss: 0.34365457032567676
Epoch: 41, step: 1247, loss: 0.3257027864456177, mean loss: 0.34365427336637216
Epoch: 41, step: 1248, loss: 0.294039249420166, mean loss: 0.3436534526457471
Epoch: 41, step: 1249, loss: 0.33258360624313354, mean loss: 0.3436532695338537
Epoch: 41, step: 1250, loss: 0.33425283432006836, mean loss: 0.34365311403910204
Epoch: 41, step: 1251, loss: 0.3033548593521118, mean loss: 0.3436524474674683
Epoch: 41, step: 1252, loss: 0.36258628964424133, mean loss: 0.34365276064612715
Epoch: 41, step: 1253, loss: 0.41355109214782715, mean loss: 0.3436539167930639
Epoch: 41, step: 1254, loss: 0.32362785935401917, mean loss: 0.34365358555937764
Epoch: 41, step: 1255, loss: 0.3241580128669739, mean loss: 0.3436532631053139
Epoch: 41, step: 1256, loss: 0.34299227595329285, mean loss: 0.3436532521728591
Epoch: 41, step: 1257, loss: 0.30723151564598083, mean loss: 0.34365264978232407
Epoch: 41, step: 1258, loss: 0.31748515367507935, mean loss: 0.3436522169970487
Epoch: 41, step: 1259, loss: 0.3263474106788635, mean loss: 0.34365193079689127
Epoch: 41, step: 1260, loss: 0.366566002368927, mean loss: 0.34365230976111144
Epoch: 41, step: 1261, loss: 0.3281615972518921, mean loss: 0.3436520535723027
Epoch: 41, step: 1262, loss: 0.32512903213500977, mean loss: 0.34365174723956854
Epoch: 41, step: 1263, loss: 0.36194390058517456, mean loss: 0.3436520497492157
Epoch: 41, step: 1264, loss: 0.28577032685279846, mean loss: 0.34365109253605036
Epoch: 41, step: 1265, loss: 0.33783718943595886, mean loss: 0.34365099639080315
Epoch: 41, step: 1266, loss: 0.3016239404678345, mean loss: 0.34365030139558356
Epoch: 41, step: 1267, loss: 0.3452126681804657, mean loss: 0.3436503272317852
Epoch: 41, step: 1268, loss: 0.33565694093704224, mean loss: 0.34365019505070776
Epoch: 41, step: 1269, loss: 0.32461485266685486, mean loss: 0.3436498802816767
Epoch: 41, step: 1270, loss: 0.3382095694541931, mean loss: 0.34364979032201026
Epoch: 41, step: 1271, loss: 0.3182311952114105, mean loss: 0.3436493700132082
Epoch: 41, step: 1272, loss: 0.33198630809783936, mean loss: 0.34364917716201
Epoch: 41, step: 1273, loss: 0.385578453540802, mean loss: 0.3436498704600089
Epoch: 41, step: 1274, loss: 0.3076138198375702, mean loss: 0.3436492746159866
Epoch: 41, step: 1275, loss: 0.297016978263855, mean loss: 0.34364850357934057
Epoch: 41, step: 1276, loss: 0.33558809757232666, mean loss: 0.3436483703076353
Epoch: 41, step: 1277, loss: 0.3041679859161377, mean loss: 0.3436477175450879
Epoch: 41, step: 1278, loss: 0.34343767166137695, mean loss: 0.3436477140722793
Epoch: 41, step: 1279, loss: 0.33952847123146057, mean loss: 0.3436476459676096
Epoch: 41, step: 1280, loss: 0.39469581842422485, mean loss: 0.3436484899483066
Epoch: 41, step: 1281, loss: 0.3473448157310486, mean loss: 0.3436485510587418
Epoch: 41, step: 1282, loss: 0.30514514446258545, mean loss: 0.3436479145020173
Epoch: 41, step: 1283, loss: 0.31831249594688416, mean loss: 0.3436474956516907
Epoch: 41, step: 1284, loss: 0.320301353931427, mean loss: 0.3436471096948768
Epoch: 41, step: 1285, loss: 0.348548948764801, mean loss: 0.34364719073040445
Epoch: 41, step: 1286, loss: 0.31751561164855957, mean loss: 0.34364675873921435
Epoch: 41, step: 1287, loss: 0.3186272084712982, mean loss: 0.3436463451382379
Epoch: 41, step: 1288, loss: 0.3033652603626251, mean loss: 0.34364567925813977
Epoch: 41, step: 1289, loss: 0.33557620644569397, mean loss: 0.3436455458651948
Epoch: 41, step: 1290, loss: 0.3201102316379547, mean loss: 0.34364515681958396
Epoch: 41, step: 1291, loss: 0.32151034474372864, mean loss: 0.3436447909307306
Epoch: 41, step: 1292, loss: 0.2929842174053192, mean loss: 0.3436439535243546
Epoch: 41, step: 1293, loss: 0.33313894271850586, mean loss: 0.3436437798820721
Epoch: 41, step: 1294, loss: 0.337705135345459, mean loss: 0.3436436817210358
Epoch: 41, step: 1295, loss: 0.31014344096183777, mean loss: 0.3436431279980481
Epoch: 41, step: 1296, loss: 0.32209616899490356, mean loss: 0.343642771855852
Epoch: 41, step: 1297, loss: 0.3205147087574005, mean loss: 0.3436423895864543
Epoch: 41, step: 1298, loss: 0.3575657606124878, mean loss: 0.34364261971340715
Epoch: 41, step: 1299, loss: 0.35043802857398987, mean loss: 0.3436427320267891
Epoch: 41, step: 1300, loss: 0.29254642128944397, mean loss: 0.3436418875294626
Epoch: 41, step: 1301, loss: 0.328605592250824, mean loss: 0.34364163902030187
Epoch: 41, step: 1302, loss: 0.31749656796455383, mean loss: 0.3436412069203621
Epoch: 41, step: 1303, loss: 0.32228347659111023, mean loss: 0.3436408539467003
Epoch: 41, step: 1304, loss: 0.30680975317955017, mean loss: 0.34364024525872383
Epoch: 41, step: 1305, loss: 0.3302651345729828, mean loss: 0.34364002421904966
Epoch: 41, step: 1306, loss: 0.2984839677810669, mean loss: 0.3436392779736325
Epoch: 41, step: 1307, loss: 0.3071235418319702, mean loss: 0.3436386745274376
Epoch: 41, step: 1308, loss: 0.4205995500087738, mean loss: 0.3436399463347432
Epoch: 41, step: 1309, loss: 0.3184594213962555, mean loss: 0.3436395302240095
Epoch: 41, step: 1310, loss: 0.36334332823753357, mean loss: 0.34363985582589357
Epoch: 41, step: 1311, loss: 0.30077970027923584, mean loss: 0.34363914758087494
Epoch: 41, step: 1312, loss: 0.36946702003479004, mean loss: 0.343639574367934
Epoch: 41, step: 1313, loss: 0.36012691259384155, mean loss: 0.3436398468048656
Epoch: 41, step: 1314, loss: 0.3433176279067993, mean loss: 0.34363984148060545
Epoch: 41, step: 1315, loss: 0.2861645221710205, mean loss: 0.34363889178927515
Epoch: 41, step: 1316, loss: 0.31512102484703064, mean loss: 0.34363842058313276
Epoch: 41, step: 1317, loss: 0.34245526790618896, mean loss: 0.34363840103399895
Epoch: 41, step: 1318, loss: 0.35462450981140137, mean loss: 0.34363858255356633
Epoch: 41, step: 1319, loss: 0.3066093623638153, mean loss: 0.34363797074304175
Epoch: 41, step: 1320, loss: 0.32299044728279114, mean loss: 0.34363762960262934
Epoch: 41, step: 1321, loss: 0.3238612711429596, mean loss: 0.3436373028610892
Epoch: 41, step: 1322, loss: 0.37310895323753357, mean loss: 0.3436377897785042
Epoch: 41, step: 1323, loss: 0.3028569519519806, mean loss: 0.34363711602688796
Epoch: 41, step: 1324, loss: 0.37036609649658203, mean loss: 0.34363755761654696
Epoch: 41, step: 1325, loss: 0.30146798491477966, mean loss: 0.3436368609442737
Epoch: 41, step: 1326, loss: 0.36041319370269775, mean loss: 0.3436371380970179
Epoch: 41, step: 1327, loss: 0.31378427147865295, mean loss: 0.3436366449220589
Epoch: 41, step: 1328, loss: 0.3530931770801544, mean loss: 0.3436368011431641
Epoch: 41, step: 1329, loss: 0.30375275015830994, mean loss: 0.3436361422729261
Epoch: 41, step: 1330, loss: 0.31437191367149353, mean loss: 0.3436356588463365
Epoch: 41, step: 1331, loss: 0.3416244685649872, mean loss: 0.34363562562329103
Epoch: 41, step: 1332, loss: 0.3440544605255127, mean loss: 0.34363563254195073
Epoch: 41, step: 1333, loss: 0.31862950325012207, mean loss: 0.3436352194769454
Epoch: 41, step: 1334, loss: 0.3679044842720032, mean loss: 0.3436356203633954
Epoch: 41, step: 1335, loss: 0.33001288771629333, mean loss: 0.34363539534303456
Epoch: 41, step: 1336, loss: 0.3524649143218994, mean loss: 0.34363554118666084
Epoch: 41, step: 1337, loss: 0.36487725377082825, mean loss: 0.34363589204577655
Epoch: 41, step: 1338, loss: 0.35136592388153076, mean loss: 0.3436360197241512
Epoch: 41, step: 1339, loss: 0.35002073645591736, mean loss: 0.343636125179964
Epoch: 41, step: 1340, loss: 0.3942786157131195, mean loss: 0.34363696162377494
Epoch: 41, step: 1341, loss: 0.30701351165771484, mean loss: 0.3436363567374081
Epoch: 41, step: 1342, loss: 0.37701931595802307, mean loss: 0.3436369080935318
Epoch: 41, step: 1343, loss: 0.3519006371498108, mean loss: 0.3436370445758113
Epoch: 41, step: 1344, loss: 0.36995774507522583, mean loss: 0.34363747927664035
Epoch: 41, step: 1345, loss: 0.31011873483657837, mean loss: 0.3436369257053036
Epoch: 41, step: 1346, loss: 0.3064763844013214, mean loss: 0.3436363119988197
Epoch: 41, step: 1347, loss: 0.34787774085998535, mean loss: 0.343636382044877
Epoch: 41, step: 1348, loss: 0.3253040611743927, mean loss: 0.34363607929652645
Epoch: 41, step: 1349, loss: 0.3365027904510498, mean loss: 0.3436359614960699
Epoch: 41, step: 1350, loss: 0.3357549011707306, mean loss: 0.34363583134892556
Epoch: 41, step: 1351, loss: 0.32978543639183044, mean loss: 0.3436356026284857
Epoch: 41, step: 1352, loss: 0.36304113268852234, mean loss: 0.3436359230791365
Epoch: 41, step: 1353, loss: 0.314638614654541, mean loss: 0.3436354442438311
Epoch: 41, step: 1354, loss: 0.3421354293823242, mean loss: 0.3436354194743524
Epoch: 41, step: 1355, loss: 0.3418845236301422, mean loss: 0.343635390562598
Epoch: 41, step: 1356, loss: 0.34702879190444946, mean loss: 0.34363544659538053
Epoch: 41, step: 1357, loss: 0.33542031049728394, mean loss: 0.34363531094701855
Epoch: 41, step: 1358, loss: 0.31862974166870117, mean loss: 0.3436348980617705
Epoch: 41, step: 1359, loss: 0.34841808676719666, mean loss: 0.3436349770391945
Epoch: 41, step: 1360, loss: 0.3481645882129669, mean loss: 0.34363505182844856
Epoch: 41, step: 1361, loss: 0.32050231099128723, mean loss: 0.34363466988576064
Epoch: 41, step: 1362, loss: 0.31891024112701416, mean loss: 0.34363426166959077
Epoch: 41, step: 1363, loss: 0.3233237862586975, mean loss: 0.3436339263361571
Epoch: 41, step: 1364, loss: 0.35890993475914, mean loss: 0.3436341785445215
Epoch: 41, step: 1365, loss: 0.3192797899246216, mean loss: 0.3436337764578677
Epoch: 41, step: 1366, loss: 0.3338087201118469, mean loss: 0.34363361425060107
Epoch: 41, step: 1367, loss: 0.3035837709903717, mean loss: 0.34363295305659625
Epoch: 41, step: 1368, loss: 0.2980339527130127, mean loss: 0.34363220026244135
Epoch: 41, step: 1369, loss: 0.3556668162345886, mean loss: 0.3436323989387046
Epoch: 41, step: 1370, loss: 0.34138616919517517, mean loss: 0.34363236185690943
Epoch: 41, step: 1371, loss: 0.3486558496952057, mean loss: 0.3436324447855914
Epoch: 41, step: 1372, loss: 0.3123541474342346, mean loss: 0.3436319284461003
Epoch: 41, step: 1373, loss: 0.33220604062080383, mean loss: 0.34363173983162265
Epoch: 41, step: 1374, loss: 0.3057478964328766, mean loss: 0.34363111446898215
Epoch: 41, step: 1375, loss: 0.3731241822242737, mean loss: 0.34363160131394344
Epoch: 41, step: 1376, loss: 0.3324321210384369, mean loss: 0.34363141644607603
Epoch: 41, step: 1377, loss: 0.35132449865341187, mean loss: 0.343631543432346
Epoch: 41, step: 1378, loss: 0.2993449568748474, mean loss: 0.3436308124255197
Epoch: 41, step: 1379, loss: 0.3032039999961853, mean loss: 0.3436301451402228
Epoch: 41, step: 1380, loss: 0.332611083984375, mean loss: 0.3436299632625112
Epoch: 41, step: 1381, loss: 0.29278624057769775, mean loss: 0.343629124063312
Epoch: 41, step: 1382, loss: 0.3274378180503845, mean loss: 0.3436288568227156
Epoch: 41, step: 1383, loss: 0.36779123544692993, mean loss: 0.3436292556208047
Epoch: 41, step: 1384, loss: 0.3508285880088806, mean loss: 0.3436293744432376
Epoch: 41, step: 1385, loss: 0.32354459166526794, mean loss: 0.3436290429564778
Epoch: 41, step: 1386, loss: 0.4183669090270996, mean loss: 0.34363027643778804
Epoch: 41, step: 1387, loss: 0.2986520230770111, mean loss: 0.3436295341243909
Epoch: 41, step: 1388, loss: 0.3101886212825775, mean loss: 0.34362898223039584
Epoch: 41, step: 1389, loss: 0.3252100944519043, mean loss: 0.34362867825825705
Epoch: 41, step: 1390, loss: 0.3272964358329773, mean loss: 0.34362840872706757
Epoch: 41, step: 1391, loss: 0.30192849040031433, mean loss: 0.3436277205641801
Epoch: 41, step: 1392, loss: 0.33497899770736694, mean loss: 0.34362757783891557
Epoch: 41, step: 1393, loss: 0.3307286500930786, mean loss: 0.3436273649782973
Epoch: 41, step: 1394, loss: 0.3097524046897888, mean loss: 0.34362680597632883
Epoch: 41, step: 1395, loss: 0.3538518249988556, mean loss: 0.34362697470601566
Epoch: 41, step: 1396, loss: 0.3134363889694214, mean loss: 0.3436264765197525
Epoch: 41, step: 1397, loss: 0.28040528297424316, mean loss: 0.34362543330016326
Epoch: 41, step: 1398, loss: 0.32815513014793396, mean loss: 0.34362517802727
Epoch: 41, step: 1399, loss: 0.3452025353908539, mean loss: 0.34362520405455144
Epoch: 41, step: 1400, loss: 0.3456052839756012, mean loss: 0.3436252367264419
Epoch: 41, step: 1401, loss: 0.3003033697605133, mean loss: 0.34362452191492215
Epoch: 41, step: 1402, loss: 0.3398900628089905, mean loss: 0.343624460297302
Epoch: 41, step: 1403, loss: 0.3545168936252594, mean loss: 0.34362464001670084
Epoch: 41, step: 1404, loss: 0.3192857503890991, mean loss: 0.34362423844449824
Epoch: 41, step: 1405, loss: 0.30127912759780884, mean loss: 0.34362353979558147
Epoch: 41, step: 1406, loss: 0.3372379243373871, mean loss: 0.3436234344415128
Epoch: 41, step: 1407, loss: 0.3050578236579895, mean loss: 0.3436227981712893
Epoch: 41, step: 1408, loss: 0.3258410692214966, mean loss: 0.3436225048063519
Epoch: 41, step: 1409, loss: 0.30571311712265015, mean loss: 0.34362187938338556
Epoch: 41, step: 1410, loss: 0.34459254145622253, mean loss: 0.34362189539694776
Epoch: 41, step: 1411, loss: 0.36328819394111633, mean loss: 0.34362221983766544
Epoch: 41, step: 1412, loss: 0.38550007343292236, mean loss: 0.3436229106975496
Epoch: 41, step: 1413, loss: 0.34378287196159363, mean loss: 0.34362291333639056
Epoch: 41, step: 1414, loss: 0.29965677857398987, mean loss: 0.3436221880500156
Epoch: 41, step: 1415, loss: 0.3405860364437103, mean loss: 0.34362213796503366
Epoch: 41, step: 1416, loss: 0.3381713032722473, mean loss: 0.34362204804842567
Epoch: 41, step: 1417, loss: 0.31595882773399353, mean loss: 0.34362159172530343
Epoch: 41, step: 1418, loss: 0.35566994547843933, mean loss: 0.3436217904675919
Epoch: 41, step: 1419, loss: 0.3371054530143738, mean loss: 0.3436216829798403
Epoch: 41, step: 1420, loss: 0.31547480821609497, mean loss: 0.3436212187014937
Epoch: 41, step: 1421, loss: 0.3430827558040619, mean loss: 0.343621209819778
Epoch: 41, step: 1422, loss: 0.3456501066684723, mean loss: 0.34362124328501376
Epoch: 41, step: 1423, loss: 0.3648957908153534, mean loss: 0.34362159418802113
Epoch: 41, step: 1424, loss: 0.34566253423690796, mean loss: 0.3436216278507906
Epoch: 41, step: 1425, loss: 0.33403438329696655, mean loss: 0.34362146972371566
Epoch: 41, step: 1426, loss: 0.3452870547771454, mean loss: 0.3436214971945648
Epoch: 41, step: 1427, loss: 0.31796979904174805, mean loss: 0.34362107412262005
Epoch: 41, step: 1428, loss: 0.29938241839408875, mean loss: 0.3436203445091137
Epoch: 41, step: 1429, loss: 0.3156961500644684, mean loss: 0.3436198839722129
Epoch: 41, step: 1430, loss: 0.30364343523979187, mean loss: 0.3436192246756229
Epoch: 41, step: 1431, loss: 0.3100523054599762, mean loss: 0.3436186710949247
Epoch: 41, step: 1432, loss: 0.3348114788532257, mean loss: 0.34361852585040004
Epoch: 41, step: 1433, loss: 0.3191165626049042, mean loss: 0.3436181217809511
Epoch: 41, step: 1434, loss: 0.3003888428211212, mean loss: 0.343617408885307
Epoch: 41, step: 1435, loss: 0.33276107907295227, mean loss: 0.3436172298561214
Epoch: 41, step: 1436, loss: 0.27089160680770874, mean loss: 0.34361603057472684
Epoch: 41, step: 1437, loss: 0.29515936970710754, mean loss: 0.34361523151366574
Epoch: 41, step: 1438, loss: 0.3326452076435089, mean loss: 0.3436150506185275
Epoch: 41, step: 1439, loss: 0.3543553054332733, mean loss: 0.34361522772186526
Epoch: 41, step: 1440, loss: 0.3334715962409973, mean loss: 0.3436150604594119
Epoch: 41, step: 1441, loss: 0.34167686104774475, mean loss: 0.3436150285001828
Epoch: 41, step: 1442, loss: 0.3277389705181122, mean loss: 0.3436147667220572
Epoch: 41, step: 1443, loss: 0.3164138197898865, mean loss: 0.34361431821679844
Valid: 41, mean loss: 0.18570480247338614
Epoch: 42, step: 0, loss: 0.3488284647464752, mean loss: 0.34361440418930467
Epoch: 42, step: 1, loss: 0.30117812752723694, mean loss: 0.3436137044980159
Epoch: 42, step: 2, loss: 0.31239596009254456, mean loss: 0.34361318978689154
Epoch: 42, step: 3, loss: 0.3305005729198456, mean loss: 0.3436129735925885
Epoch: 42, step: 4, loss: 0.2850251793861389, mean loss: 0.34361200764211275
Epoch: 42, step: 5, loss: 0.3220873475074768, mean loss: 0.3436116527659276
Epoch: 42, step: 6, loss: 0.3675435185432434, mean loss: 0.343612047323108
Epoch: 42, step: 7, loss: 0.3036602735519409, mean loss: 0.34361138866157787
Epoch: 42, step: 8, loss: 0.28991007804870605, mean loss: 0.3436105033340705
Epoch: 42, step: 9, loss: 0.32800501585006714, mean loss: 0.3436102460640075
Epoch: 42, step: 10, loss: 0.33401861786842346, mean loss: 0.3436100879402633
Epoch: 42, step: 11, loss: 0.308838814496994, mean loss: 0.3436095147244136
Epoch: 42, step: 12, loss: 0.30814704298973083, mean loss: 0.34360893012357063
Epoch: 42, step: 13, loss: 0.3679308295249939, mean loss: 0.343609331064842
Epoch: 42, step: 14, loss: 0.3256112337112427, mean loss: 0.34360903437497575
Epoch: 42, step: 15, loss: 0.300027459859848, mean loss: 0.34360831596579544
Epoch: 42, step: 16, loss: 0.3186943531036377, mean loss: 0.3436079052847955
Epoch: 42, step: 17, loss: 0.33383071422576904, mean loss: 0.3436077441205345
Epoch: 42, step: 18, loss: 0.319492369890213, mean loss: 0.34360734661654996
Epoch: 42, step: 19, loss: 0.2993902862071991, mean loss: 0.34360661777992424
Epoch: 42, step: 20, loss: 0.3200383186340332, mean loss: 0.34360622930641804
Epoch: 42, step: 21, loss: 0.33012887835502625, mean loss: 0.3436060071644871
Epoch: 42, step: 22, loss: 0.34221041202545166, mean loss: 0.34360598416181465
Epoch: 42, step: 23, loss: 0.3074781894683838, mean loss: 0.3436053887010635
Epoch: 42, step: 24, loss: 0.3203861713409424, mean loss: 0.343605006006663
Epoch: 42, step: 25, loss: 0.33079543709754944, mean loss: 0.3436047948854429
Epoch: 42, step: 26, loss: 0.3205263614654541, mean loss: 0.34360441452395263
Epoch: 42, step: 27, loss: 0.32772332429885864, mean loss: 0.3436041527880072
Epoch: 42, step: 28, loss: 0.341620534658432, mean loss: 0.3436041200965734
Epoch: 42, step: 29, loss: 0.35316067934036255, mean loss: 0.34360427759285284
Epoch: 42, step: 30, loss: 0.32864436507225037, mean loss: 0.34360403105100934
Epoch: 42, step: 31, loss: 0.34992095828056335, mean loss: 0.34360413515330385
Epoch: 42, step: 32, loss: 0.3018200099468231, mean loss: 0.3436034465666753
Epoch: 42, step: 33, loss: 0.3136095106601715, mean loss: 0.34360295228606647
Epoch: 42, step: 34, loss: 0.345225989818573, mean loss: 0.34360297903223147
Epoch: 42, step: 35, loss: 0.3312613368034363, mean loss: 0.3436027756566757
Epoch: 42, step: 36, loss: 0.33474859595298767, mean loss: 0.3436026297527504
Epoch: 42, step: 37, loss: 0.3520396649837494, mean loss: 0.3436027687804542
Epoch: 42, step: 38, loss: 0.33914363384246826, mean loss: 0.34360269530285703
Epoch: 42, step: 39, loss: 0.3153724670410156, mean loss: 0.34360223013300034
Epoch: 42, step: 40, loss: 0.3175744116306305, mean loss: 0.3436018012609065
Epoch: 42, step: 41, loss: 0.3768106997013092, mean loss: 0.34360234844987403
Epoch: 42, step: 42, loss: 0.31363770365715027, mean loss: 0.3436018547251901
Epoch: 42, step: 43, loss: 0.34823694825172424, mean loss: 0.34360193109593956
Epoch: 42, step: 44, loss: 0.36028149724006653, mean loss: 0.34360220591455365
Epoch: 42, step: 45, loss: 0.34724730253219604, mean loss: 0.3436022659715052
Epoch: 42, step: 46, loss: 0.2908753454685211, mean loss: 0.34360139725216254
Epoch: 42, step: 47, loss: 0.3255336582660675, mean loss: 0.34360109957622037
Epoch: 42, step: 48, loss: 0.3485891819000244, mean loss: 0.3436011817562675
Epoch: 42, step: 49, loss: 0.37072205543518066, mean loss: 0.34360162857286247
Epoch: 42, step: 50, loss: 0.340011328458786, mean loss: 0.34360156942361597
Epoch: 42, step: 51, loss: 0.3112558126449585, mean loss: 0.3436010365445916
Epoch: 42, step: 52, loss: 0.34278079867362976, mean loss: 0.3436010230318345
Epoch: 42, step: 53, loss: 0.3596559762954712, mean loss: 0.3436012875198788
Epoch: 42, step: 54, loss: 0.33275720477104187, mean loss: 0.34360110887825074
Epoch: 42, step: 55, loss: 0.3266924321651459, mean loss: 0.34360083033521055
Epoch: 42, step: 56, loss: 0.3655155301094055, mean loss: 0.3436011913384191
Epoch: 42, step: 57, loss: 0.33793503046035767, mean loss: 0.34360109800067856
Epoch: 42, step: 58, loss: 0.3717643916606903, mean loss: 0.3436015619223624
Epoch: 42, step: 59, loss: 0.3586137592792511, mean loss: 0.3436018092076849
Epoch: 42, step: 60, loss: 0.3106313645839691, mean loss: 0.3436012661177868
Epoch: 42, step: 61, loss: 0.33062744140625, mean loss: 0.34360105241617733
Epoch: 42, step: 62, loss: 0.3206811547279358, mean loss: 0.3436006748915494
Epoch: 42, step: 63, loss: 0.33658021688461304, mean loss: 0.343600559256123
Epoch: 42, step: 64, loss: 0.3523840308189392, mean loss: 0.34360070392813
Epoch: 42, step: 65, loss: 0.3095671534538269, mean loss: 0.34360014337289607
Epoch: 42, step: 66, loss: 0.3307344615459442, mean loss: 0.3435999314700413
Epoch: 42, step: 67, loss: 0.32447534799575806, mean loss: 0.3435996164857954
Epoch: 42, step: 68, loss: 0.31332576274871826, mean loss: 0.3435991178799068
Epoch: 42, step: 69, loss: 0.378479540348053, mean loss: 0.343599692345839
Epoch: 42, step: 70, loss: 0.29894858598709106, mean loss: 0.34359895697295145
Epoch: 42, step: 71, loss: 0.33501997590065, mean loss: 0.34359881568538436
Epoch: 42, step: 72, loss: 0.32443487644195557, mean loss: 0.3435985000789345
Epoch: 42, step: 73, loss: 0.31783849000930786, mean loss: 0.3435980758503177
Epoch: 42, step: 74, loss: 0.36333006620407104, mean loss: 0.3435984008011659
Epoch: 42, step: 75, loss: 0.33238181471824646, mean loss: 0.3435982160869494
Epoch: 42, step: 76, loss: 0.31726330518722534, mean loss: 0.3435977824120066
Epoch: 42, step: 77, loss: 0.3030780255794525, mean loss: 0.3435971151565175
Epoch: 42, step: 78, loss: 0.30874311923980713, mean loss: 0.34359654121089334
Epoch: 42, step: 79, loss: 0.3839002251625061, mean loss: 0.34359720488636347
Epoch: 42, step: 80, loss: 0.34916919469833374, mean loss: 0.34359729663807703
Epoch: 42, step: 81, loss: 0.31421294808387756, mean loss: 0.3435968127858038
Epoch: 42, step: 82, loss: 0.34598854184150696, mean loss: 0.3435968521681465
Epoch: 42, step: 83, loss: 0.32017067074775696, mean loss: 0.3435964664377009
Epoch: 42, step: 84, loss: 0.2970097064971924, mean loss: 0.34359569936280027
Epoch: 42, step: 85, loss: 0.38379979133605957, mean loss: 0.34359636133289895
Epoch: 42, step: 86, loss: 0.30579105019569397, mean loss: 0.34359573886955597
Epoch: 42, step: 87, loss: 0.31411272287368774, mean loss: 0.3435952534405518
Epoch: 42, step: 88, loss: 0.32154232263565063, mean loss: 0.3435948903516471
Epoch: 42, step: 89, loss: 0.31864407658576965, mean loss: 0.34359447955751876
Epoch: 42, step: 90, loss: 0.3313814699649811, mean loss: 0.34359427848391544
Epoch: 42, step: 91, loss: 0.34740814566612244, mean loss: 0.34359434127395794
Epoch: 42, step: 92, loss: 0.34142544865608215, mean loss: 0.3435943055667319
Epoch: 42, step: 93, loss: 0.3119186460971832, mean loss: 0.3435937840880274
Epoch: 42, step: 94, loss: 0.3421170115470886, mean loss: 0.343593759776213
Epoch: 42, step: 95, loss: 0.34108978509902954, mean loss: 0.34359371855445153
Epoch: 42, step: 96, loss: 0.3110898733139038, mean loss: 0.34359318346769147
Epoch: 42, step: 97, loss: 0.33110058307647705, mean loss: 0.34359297781463793
Epoch: 42, step: 98, loss: 0.29604557156562805, mean loss: 0.3435921951026316
Epoch: 42, step: 99, loss: 0.3078393340110779, mean loss: 0.3435916065587933
Epoch: 42, step: 100, loss: 0.30059653520584106, mean loss: 0.343590898809343
Epoch: 42, step: 101, loss: 0.2989625334739685, mean loss: 0.3435901641860453
Epoch: 42, step: 102, loss: 0.3408110439777374, mean loss: 0.3435901184399636
Epoch: 42, step: 103, loss: 0.3014090657234192, mean loss: 0.34358942412450544
Epoch: 42, step: 104, loss: 0.37147969007492065, mean loss: 0.343589883200863
Epoch: 42, step: 105, loss: 0.3586655855178833, mean loss: 0.3435901313442332
Epoch: 42, step: 106, loss: 0.3480362594127655, mean loss: 0.3435902045255034
Epoch: 42, step: 107, loss: 0.34444504976272583, mean loss: 0.34359021859564026
Epoch: 42, step: 108, loss: 0.3480089604854584, mean loss: 0.3435902913237521
Epoch: 42, step: 109, loss: 0.3520899713039398, mean loss: 0.34359043121775745
Epoch: 42, step: 110, loss: 0.33768194913864136, mean loss: 0.34359033397319977
Epoch: 42, step: 111, loss: 0.3425339460372925, mean loss: 0.3435903165869599
Epoch: 42, step: 112, loss: 0.35743874311447144, mean loss: 0.3435905445033294
Epoch: 42, step: 113, loss: 0.3168445825576782, mean loss: 0.3435901043275296
Epoch: 42, step: 114, loss: 0.3208601474761963, mean loss: 0.34358973025191036
Epoch: 42, step: 115, loss: 0.3194560706615448, mean loss: 0.3435893330815531
Epoch: 42, step: 116, loss: 0.343253493309021, mean loss: 0.34358932755469107
Epoch: 42, step: 117, loss: 0.32763776183128357, mean loss: 0.34358906504661546
Epoch: 42, step: 118, loss: 0.3207603394985199, mean loss: 0.3435886893702525
Epoch: 42, step: 119, loss: 0.3542482256889343, mean loss: 0.3435888647838965
Epoch: 42, step: 120, loss: 0.33045125007629395, mean loss: 0.3435886485944791
Epoch: 42, step: 121, loss: 0.3489234149456024, mean loss: 0.34358873638066223
Epoch: 42, step: 122, loss: 0.3211946487426758, mean loss: 0.3435883678810878
Epoch: 42, step: 123, loss: 0.33852142095565796, mean loss: 0.343588284504748
Epoch: 42, step: 124, loss: 0.3205159604549408, mean loss: 0.3435879048571405
Epoch: 42, step: 125, loss: 0.3195081353187561, mean loss: 0.343587508638864
Epoch: 42, step: 126, loss: 0.359269917011261, mean loss: 0.3435877666793144
Epoch: 42, step: 127, loss: 0.34271398186683655, mean loss: 0.3435877523021785
Epoch: 42, step: 128, loss: 0.3103577494621277, mean loss: 0.34358720554924826
Epoch: 42, step: 129, loss: 0.3025114834308624, mean loss: 0.3435865297171689
Epoch: 42, step: 130, loss: 0.3100229501724243, mean loss: 0.3435859774938756
Epoch: 42, step: 131, loss: 0.3398127555847168, mean loss: 0.34358591541388367
Epoch: 42, step: 132, loss: 0.3102758824825287, mean loss: 0.3435853673802394
Epoch: 42, step: 133, loss: 0.3765391707420349, mean loss: 0.34358590954409324
Epoch: 42, step: 134, loss: 0.3460935354232788, mean loss: 0.3435859507994752
Epoch: 42, step: 135, loss: 0.364295095205307, mean loss: 0.343586291500061
Epoch: 42, step: 136, loss: 0.3304678797721863, mean loss: 0.34358607568346594
Epoch: 42, step: 137, loss: 0.3303951025009155, mean loss: 0.3435858586767015
Epoch: 42, step: 138, loss: 0.3052534759044647, mean loss: 0.343585228075047
Epoch: 42, step: 139, loss: 0.3636280298233032, mean loss: 0.34358555779146716
Epoch: 42, step: 140, loss: 0.31362488865852356, mean loss: 0.34358506492813445
Epoch: 42, step: 141, loss: 0.33321893215179443, mean loss: 0.3435848944044829
Epoch: 42, step: 142, loss: 0.30470946431159973, mean loss: 0.34358425491129985
Epoch: 42, step: 143, loss: 0.3289680778980255, mean loss: 0.34358401448201614
Epoch: 42, step: 144, loss: 0.3442380428314209, mean loss: 0.34358402524029996
Epoch: 42, step: 145, loss: 0.31779953837394714, mean loss: 0.3435836011114901
Epoch: 42, step: 146, loss: 0.3666933476924896, mean loss: 0.3435839812372666
Epoch: 42, step: 147, loss: 0.3234562277793884, mean loss: 0.343583650166909
Epoch: 42, step: 148, loss: 0.31063348054885864, mean loss: 0.3435831081965878
Epoch: 42, step: 149, loss: 0.3769122362136841, mean loss: 0.3435836563910682
Epoch: 42, step: 150, loss: 0.3125666677951813, mean loss: 0.3435831462348387
Epoch: 42, step: 151, loss: 0.3133852481842041, mean loss: 0.34358264955888396
Epoch: 42, step: 152, loss: 0.3040015995502472, mean loss: 0.3435819985654791
Epoch: 42, step: 153, loss: 0.35611411929130554, mean loss: 0.3435822046791057
Epoch: 42, step: 154, loss: 0.3332306146621704, mean loss: 0.34358203443109137
Epoch: 42, step: 155, loss: 0.310160368680954, mean loss: 0.3435814847688035
Epoch: 42, step: 156, loss: 0.31742432713508606, mean loss: 0.3435810545877718
Epoch: 42, step: 157, loss: 0.3175402879714966, mean loss: 0.3435806263279518
Epoch: 42, step: 158, loss: 0.3182328939437866, mean loss: 0.3435802094724518
Epoch: 42, step: 159, loss: 0.330028772354126, mean loss: 0.3435799866162961
Epoch: 42, step: 160, loss: 0.350144624710083, mean loss: 0.34358009457133715
Epoch: 42, step: 161, loss: 0.3517687916755676, mean loss: 0.3435802292317072
Epoch: 42, step: 162, loss: 0.3358675539493561, mean loss: 0.3435801024014416
Epoch: 42, step: 163, loss: 0.3382275700569153, mean loss: 0.3435800143837421
Epoch: 42, step: 164, loss: 0.3608093559741974, mean loss: 0.34358029770049325
Epoch: 42, step: 165, loss: 0.3209736943244934, mean loss: 0.3435799259669553
Epoch: 42, step: 166, loss: 0.3295145332813263, mean loss: 0.3435796946853194
Epoch: 42, step: 167, loss: 0.3237111568450928, mean loss: 0.34357936798613103
Epoch: 42, step: 168, loss: 0.34248900413513184, mean loss: 0.343579350057528
Epoch: 42, step: 169, loss: 0.319583922624588, mean loss: 0.3435789555126986
Epoch: 42, step: 170, loss: 0.3173956871032715, mean loss: 0.3435785250013714
Epoch: 42, step: 171, loss: 0.3081649839878082, mean loss: 0.3435779427333508
Epoch: 42, step: 172, loss: 0.34152254462242126, mean loss: 0.34357790893913315
Epoch: 42, step: 173, loss: 0.3622370958328247, mean loss: 0.34357821572264724
Epoch: 42, step: 174, loss: 0.37121281027793884, mean loss: 0.34357867006713133
Epoch: 42, step: 175, loss: 0.34738093614578247, mean loss: 0.3435787325797263
Epoch: 42, step: 176, loss: 0.3178298771381378, mean loss: 0.34357830925287974
Epoch: 42, step: 177, loss: 0.2966573238372803, mean loss: 0.3435775378560196
Epoch: 42, step: 178, loss: 0.33811092376708984, mean loss: 0.3435774479845137
Epoch: 42, step: 179, loss: 0.3220641314983368, mean loss: 0.34357709430994793
Epoch: 42, step: 180, loss: 0.32455047965049744, mean loss: 0.3435767815213987
Epoch: 42, step: 181, loss: 0.31440359354019165, mean loss: 0.3435763019358656
Epoch: 42, step: 182, loss: 0.30640900135040283, mean loss: 0.3435756909431055
Epoch: 42, step: 183, loss: 0.31287914514541626, mean loss: 0.3435751863312927
Epoch: 42, step: 184, loss: 0.31022724509239197, mean loss: 0.34357463814295347
Epoch: 42, step: 185, loss: 0.3051181435585022, mean loss: 0.3435740059883264
Epoch: 42, step: 186, loss: 0.3629247546195984, mean loss: 0.34357432407410976
Epoch: 42, step: 187, loss: 0.3353349268436432, mean loss: 0.34357418863790046
Epoch: 42, step: 188, loss: 0.32693231105804443, mean loss: 0.3435739150892774
Epoch: 42, step: 189, loss: 0.36014482378959656, mean loss: 0.3435741874668819
Epoch: 42, step: 190, loss: 0.318173348903656, mean loss: 0.34357376995774197
Epoch: 42, step: 191, loss: 0.34909436106681824, mean loss: 0.34357386069724083
Epoch: 42, step: 192, loss: 0.33767956495285034, mean loss: 0.3435737638169176
Epoch: 42, step: 193, loss: 0.3421799838542938, mean loss: 0.34357374090872983
Epoch: 42, step: 194, loss: 0.3290994167327881, mean loss: 0.3435735030124365
Epoch: 42, step: 195, loss: 0.36581170558929443, mean loss: 0.34357386850784405
Epoch: 42, step: 196, loss: 0.345990926027298, mean loss: 0.34357390823267797
Epoch: 42, step: 197, loss: 0.351397305727005, mean loss: 0.3435740368097002
Epoch: 42, step: 198, loss: 0.3053785264492035, mean loss: 0.3435734090793214
Epoch: 42, step: 199, loss: 0.3366032838821411, mean loss: 0.3435732945295384
Epoch: 42, step: 200, loss: 0.33592358231544495, mean loss: 0.3435731688132207
Epoch: 42, step: 201, loss: 0.3125568628311157, mean loss: 0.34357265909578466
Epoch: 42, step: 202, loss: 0.3224913477897644, mean loss: 0.3435723126542914
Epoch: 42, step: 203, loss: 0.3666492998600006, mean loss: 0.34357269188565936
Epoch: 42, step: 204, loss: 0.3501286506652832, mean loss: 0.3435727996200156
Epoch: 42, step: 205, loss: 0.29690852761268616, mean loss: 0.34357203279660203
Epoch: 42, step: 206, loss: 0.3308669924736023, mean loss: 0.3435718240209826
Epoch: 42, step: 207, loss: 0.36930084228515625, mean loss: 0.3435722468062176
Epoch: 42, step: 208, loss: 0.3434019386768341, mean loss: 0.3435722440077207
Epoch: 42, step: 209, loss: 0.37101489305496216, mean loss: 0.3435726949369173
Epoch: 42, step: 210, loss: 0.35713478922843933, mean loss: 0.3435729177814315
Epoch: 42, step: 211, loss: 0.3038019835948944, mean loss: 0.34357226429910837
Epoch: 42, step: 212, loss: 0.3695216178894043, mean loss: 0.3435726906699138
Epoch: 42, step: 213, loss: 0.33831775188446045, mean loss: 0.34357260432804554
Epoch: 42, step: 214, loss: 0.3594571650028229, mean loss: 0.3435728653168347
Epoch: 42, step: 215, loss: 0.29657331109046936, mean loss: 0.34357209311069925
Epoch: 42, step: 216, loss: 0.3295328617095947, mean loss: 0.3435718624488837
Epoch: 42, step: 217, loss: 0.34098246693611145, mean loss: 0.3435718199063228
Epoch: 42, step: 218, loss: 0.31984931230545044, mean loss: 0.3435714301629873
Epoch: 42, step: 219, loss: 0.32974451780319214, mean loss: 0.34357120300072863
Epoch: 42, step: 220, loss: 0.37017059326171875, mean loss: 0.3435716399947693
Epoch: 42, step: 221, loss: 0.3310028314590454, mean loss: 0.3435714335086754
Epoch: 42, step: 222, loss: 0.35628005862236023, mean loss: 0.3435716422883096
Epoch: 42, step: 223, loss: 0.3027220368385315, mean loss: 0.3435709712144916
Epoch: 42, step: 224, loss: 0.3332940936088562, mean loss: 0.34357080238960036
Epoch: 42, step: 225, loss: 0.3401086926460266, mean loss: 0.3435707455162268
Epoch: 42, step: 226, loss: 0.32421842217445374, mean loss: 0.34357042761358464
Epoch: 42, step: 227, loss: 0.3480256199836731, mean loss: 0.34357050079829404
Epoch: 42, step: 228, loss: 0.33103981614112854, mean loss: 0.3435702949621875
Epoch: 42, step: 229, loss: 0.3048384487628937, mean loss: 0.3435696587414477
Epoch: 42, step: 230, loss: 0.31806111335754395, mean loss: 0.3435692397374334
Epoch: 42, step: 231, loss: 0.3046509921550751, mean loss: 0.34356860047581084
Epoch: 42, step: 232, loss: 0.33738037943840027, mean loss: 0.34356849883127416
Epoch: 42, step: 233, loss: 0.3683902621269226, mean loss: 0.3435689065340976
Epoch: 42, step: 234, loss: 0.4031996726989746, mean loss: 0.34356988596622423
Epoch: 42, step: 235, loss: 0.33376577496528625, mean loss: 0.3435697249368733
Epoch: 42, step: 236, loss: 0.3172677755355835, mean loss: 0.3435692929429602
Epoch: 42, step: 237, loss: 0.30687156319618225, mean loss: 0.3435686902144225
Epoch: 42, step: 238, loss: 0.30999207496643066, mean loss: 0.34356813875655384
Epoch: 42, step: 239, loss: 0.3285243511199951, mean loss: 0.34356789168344193
Epoch: 42, step: 240, loss: 0.33416539430618286, mean loss: 0.3435677372631464
Epoch: 42, step: 241, loss: 0.29863855242729187, mean loss: 0.34356699938853913
Epoch: 42, step: 242, loss: 0.3170742690563202, mean loss: 0.3435665643040384
Epoch: 42, step: 243, loss: 0.32775062322616577, mean loss: 0.3435663045664526
Epoch: 42, step: 244, loss: 0.2959310710430145, mean loss: 0.34356552228879306
Epoch: 42, step: 245, loss: 0.31040164828300476, mean loss: 0.34356497767234473
Epoch: 42, step: 246, loss: 0.36325693130493164, mean loss: 0.3435653010478868
Epoch: 42, step: 247, loss: 0.3444312810897827, mean loss: 0.34356531526852596
Epoch: 42, step: 248, loss: 0.30365443229675293, mean loss: 0.34356465988512497
Epoch: 42, step: 249, loss: 0.32797563076019287, mean loss: 0.3435644038992285
Epoch: 42, step: 250, loss: 0.35045742988586426, mean loss: 0.34356451708706387
Epoch: 42, step: 251, loss: 0.3053419291973114, mean loss: 0.3435638894583629
Epoch: 42, step: 252, loss: 0.30398139357566833, mean loss: 0.34356323951015383
Epoch: 42, step: 253, loss: 0.30784448981285095, mean loss: 0.3435626530146414
Epoch: 42, step: 254, loss: 0.31029248237609863, mean loss: 0.34356210673333115
Epoch: 42, step: 255, loss: 0.32514506578445435, mean loss: 0.34356180433872735
Epoch: 42, step: 256, loss: 0.3644079566001892, mean loss: 0.34356214661197687
Epoch: 42, step: 257, loss: 0.30872732400894165, mean loss: 0.3435615746679549
Epoch: 42, step: 258, loss: 0.3419249355792999, mean loss: 0.34356154779683845
Epoch: 42, step: 259, loss: 0.3092740774154663, mean loss: 0.34356098485813774
Epoch: 42, step: 260, loss: 0.3648228645324707, mean loss: 0.3435613339342952
Epoch: 42, step: 261, loss: 0.36063867807388306, mean loss: 0.34356161430441734
Epoch: 42, step: 262, loss: 0.31910157203674316, mean loss: 0.34356121273422036
Epoch: 42, step: 263, loss: 0.36578768491744995, mean loss: 0.3435615776290224
Epoch: 42, step: 264, loss: 0.3977946639060974, mean loss: 0.34356246796583517
Epoch: 42, step: 265, loss: 0.36631524562835693, mean loss: 0.34356284148879646
Epoch: 42, step: 266, loss: 0.2930499315261841, mean loss: 0.3435620122528125
Epoch: 42, step: 267, loss: 0.2948697507381439, mean loss: 0.3435612129182943
Epoch: 42, step: 268, loss: 0.3096972107887268, mean loss: 0.3435606570143245
Epoch: 42, step: 269, loss: 0.3495252728462219, mean loss: 0.3435607549265316
Epoch: 42, step: 270, loss: 0.3648811876773834, mean loss: 0.3435611049065502
Epoch: 42, step: 271, loss: 0.3285273015499115, mean loss: 0.3435608581271123
Epoch: 42, step: 272, loss: 0.3188230097293854, mean loss: 0.3435604520627273
Epoch: 42, step: 273, loss: 0.3674793839454651, mean loss: 0.34356084467839787
Epoch: 42, step: 274, loss: 0.3204897344112396, mean loss: 0.3435604659854532
Epoch: 42, step: 275, loss: 0.3398352861404419, mean loss: 0.34356040484075084
Epoch: 42, step: 276, loss: 0.3534868657588959, mean loss: 0.34356056776994115
Epoch: 42, step: 277, loss: 0.3433021008968353, mean loss: 0.34356056352763287
Epoch: 42, step: 278, loss: 0.3644544184207916, mean loss: 0.343560906460239
Epoch: 42, step: 279, loss: 0.32112595438957214, mean loss: 0.3435605382395183
Epoch: 42, step: 280, loss: 0.37153029441833496, mean loss: 0.34356099729442124
Epoch: 42, step: 281, loss: 0.3148961067199707, mean loss: 0.3435605268383147
Epoch: 42, step: 282, loss: 0.3070150911808014, mean loss: 0.34355992705436794
Epoch: 42, step: 283, loss: 0.3148208558559418, mean loss: 0.3435594553962704
Epoch: 42, step: 284, loss: 0.34337830543518066, mean loss: 0.3435594524233336
Epoch: 42, step: 285, loss: 0.3190224766731262, mean loss: 0.34355904974214163
Epoch: 42, step: 286, loss: 0.35832464694976807, mean loss: 0.34355929205931907
Epoch: 42, step: 287, loss: 0.3331233561038971, mean loss: 0.34355912079871853
Epoch: 42, step: 288, loss: 0.33729398250579834, mean loss: 0.3435590179853491
Epoch: 42, step: 289, loss: 0.3722403943538666, mean loss: 0.3435594886502276
Epoch: 42, step: 290, loss: 0.31003978848457336, mean loss: 0.3435589385968929
Epoch: 42, step: 291, loss: 0.30821940302848816, mean loss: 0.34355835868984386
Epoch: 42, step: 292, loss: 0.3462541401386261, mean loss: 0.34355840292576795
Epoch: 42, step: 293, loss: 0.349987655878067, mean loss: 0.3435585084236668
Epoch: 42, step: 294, loss: 0.3308146595954895, mean loss: 0.3435582993127135
Epoch: 42, step: 295, loss: 0.3535437285900116, mean loss: 0.3435584631586914
Epoch: 42, step: 296, loss: 0.3106338679790497, mean loss: 0.3435579229241327
Epoch: 42, step: 297, loss: 0.33181750774383545, mean loss: 0.34355773028777953
Epoch: 42, step: 298, loss: 0.32864058017730713, mean loss: 0.34355748553167814
Epoch: 42, step: 299, loss: 0.3910069465637207, mean loss: 0.3435582640553546
Epoch: 42, step: 300, loss: 0.32409054040908813, mean loss: 0.34355794464529626
Epoch: 42, step: 301, loss: 0.3384627401828766, mean loss: 0.34355786104883257
Epoch: 42, step: 302, loss: 0.3122570812702179, mean loss: 0.3435573475087794
Epoch: 42, step: 303, loss: 0.3378397226333618, mean loss: 0.34355725370341
Epoch: 42, step: 304, loss: 0.3917900621891022, mean loss: 0.34355804501488746
Epoch: 42, step: 305, loss: 0.35177209973335266, mean loss: 0.3435581797731432
Epoch: 42, step: 306, loss: 0.3083938956260681, mean loss: 0.3435576028838946
Epoch: 42, step: 307, loss: 0.38172683119773865, mean loss: 0.3435582290606174
Epoch: 42, step: 308, loss: 0.3390411138534546, mean loss: 0.3435581549573117
Epoch: 42, step: 309, loss: 0.35602930188179016, mean loss: 0.3435583595432056
Epoch: 42, step: 310, loss: 0.3203565776348114, mean loss: 0.3435579789303034
Epoch: 42, step: 311, loss: 0.32940012216567993, mean loss: 0.34355774668199685
Epoch: 42, step: 312, loss: 0.30570486187934875, mean loss: 0.3435571257459098
Epoch: 42, step: 313, loss: 0.3171981871128082, mean loss: 0.3435566933628083
Epoch: 42, step: 314, loss: 0.3261454999446869, mean loss: 0.3435564077601736
Epoch: 42, step: 315, loss: 0.34676051139831543, mean loss: 0.34355646031748016
Epoch: 42, step: 316, loss: 0.3086031675338745, mean loss: 0.3435558869837184
Epoch: 42, step: 317, loss: 0.3645800054073334, mean loss: 0.3435562318336089
Epoch: 42, step: 318, loss: 0.3139232099056244, mean loss: 0.34355574578341896
Epoch: 42, step: 319, loss: 0.3290828466415405, mean loss: 0.3435555083982474
Epoch: 42, step: 320, loss: 0.329558402299881, mean loss: 0.3435552788208212
Epoch: 42, step: 321, loss: 0.3302489221096039, mean loss: 0.34355506057649265
Epoch: 42, step: 322, loss: 0.3481861650943756, mean loss: 0.34355513653234904
Epoch: 42, step: 323, loss: 0.3476497530937195, mean loss: 0.34355520368803627
Epoch: 42, step: 324, loss: 0.31881067156791687, mean loss: 0.3435547978603401
Epoch: 42, step: 325, loss: 0.32942721247673035, mean loss: 0.34355456616182295
Epoch: 42, step: 326, loss: 0.3142615258693695, mean loss: 0.34355408575115803
Epoch: 42, step: 327, loss: 0.32432320713996887, mean loss: 0.34355377036676726
Epoch: 42, step: 328, loss: 0.3077690303325653, mean loss: 0.34355318351041103
Epoch: 42, step: 329, loss: 0.3426632881164551, mean loss: 0.3435531689166986
Epoch: 42, step: 330, loss: 0.3344888985157013, mean loss: 0.34355302027092877
Epoch: 42, step: 331, loss: 0.35557159781455994, mean loss: 0.34355321736141
Epoch: 42, step: 332, loss: 0.3427731990814209, mean loss: 0.3435532045702409
Epoch: 42, step: 333, loss: 0.3547014892101288, mean loss: 0.3435533873829502
Epoch: 42, step: 334, loss: 0.41212621331214905, mean loss: 0.34355451184101116
Epoch: 42, step: 335, loss: 0.32442596554756165, mean loss: 0.34355419817601224
Epoch: 42, step: 336, loss: 0.349004328250885, mean loss: 0.3435542875443827
Epoch: 42, step: 337, loss: 0.3770312964916229, mean loss: 0.34355483647379187
Epoch: 42, step: 338, loss: 0.32770901918411255, mean loss: 0.3435545766509232
Epoch: 42, step: 339, loss: 0.3193686902523041, mean loss: 0.3435541800829689
Epoch: 42, step: 340, loss: 0.33985790610313416, mean loss: 0.3435541194773846
Epoch: 42, step: 341, loss: 0.36315247416496277, mean loss: 0.34355444081456593
Epoch: 42, step: 342, loss: 0.3112576901912689, mean loss: 0.34355391128150986
Epoch: 42, step: 343, loss: 0.3591969907283783, mean loss: 0.3435541677590716
Epoch: 42, step: 344, loss: 0.3637809157371521, mean loss: 0.34355449938315924
Epoch: 42, step: 345, loss: 0.3226156532764435, mean loss: 0.3435541560896204
Epoch: 42, step: 346, loss: 0.37012749910354614, mean loss: 0.3435545917539046
Epoch: 42, step: 347, loss: 0.3687874376773834, mean loss: 0.34355500543424305
Epoch: 42, step: 348, loss: 0.3391067087650299, mean loss: 0.3435549325077603
Epoch: 42, step: 349, loss: 0.32465165853500366, mean loss: 0.3435546226078624
Epoch: 42, step: 350, loss: 0.3335924446582794, mean loss: 0.3435544592907925
Epoch: 42, step: 351, loss: 0.32156866788864136, mean loss: 0.3435540988679826
Epoch: 42, step: 352, loss: 0.33345186710357666, mean loss: 0.34355393326034067
Epoch: 42, step: 353, loss: 0.3750326633453369, mean loss: 0.34355444928817724
Epoch: 42, step: 354, loss: 0.31103402376174927, mean loss: 0.3435539161926651
Epoch: 42, step: 355, loss: 0.3476729989051819, mean loss: 0.3435539837141836
Epoch: 42, step: 356, loss: 0.32295602560043335, mean loss: 0.34355364607041483
Epoch: 42, step: 357, loss: 0.36565354466438293, mean loss: 0.3435540083282025
Epoch: 42, step: 358, loss: 0.35496506094932556, mean loss: 0.3435541953731747
Epoch: 42, step: 359, loss: 0.3713970482349396, mean loss: 0.3435546517535324
Epoch: 42, step: 360, loss: 0.3641826808452606, mean loss: 0.343554989868058
Epoch: 42, step: 361, loss: 0.3607234060764313, mean loss: 0.34355527127137236
Epoch: 42, step: 362, loss: 0.35119175910949707, mean loss: 0.3435553964371267
Epoch: 42, step: 363, loss: 0.33007556200027466, mean loss: 0.3435551754996974
Epoch: 42, step: 364, loss: 0.34539344906806946, mean loss: 0.3435552056289087
Epoch: 42, step: 365, loss: 0.3076860308647156, mean loss: 0.3435546177445745
Epoch: 42, step: 366, loss: 0.3305169343948364, mean loss: 0.34355440406460486
Epoch: 42, step: 367, loss: 0.30858761072158813, mean loss: 0.34355383098879944
Epoch: 42, step: 368, loss: 0.31175652146339417, mean loss: 0.34355330986666094
Epoch: 42, step: 369, loss: 0.35223013162612915, mean loss: 0.3435534520676796
Epoch: 42, step: 370, loss: 0.3441142439842224, mean loss: 0.34355346125812714
Epoch: 42, step: 371, loss: 0.33388856053352356, mean loss: 0.3435533028690625
Epoch: 42, step: 372, loss: 0.373155415058136, mean loss: 0.3435537879825839
Epoch: 42, step: 373, loss: 0.31263020634651184, mean loss: 0.343553281221389
Epoch: 42, step: 374, loss: 0.31673264503479004, mean loss: 0.34355284170454803
Epoch: 42, step: 375, loss: 0.3321154713630676, mean loss: 0.3435526542804142
Epoch: 42, step: 376, loss: 0.29002052545547485, mean loss: 0.3435517770640467
Epoch: 42, step: 377, loss: 0.36856353282928467, mean loss: 0.3435521869181378
Epoch: 42, step: 378, loss: 0.3474835455417633, mean loss: 0.3435522513381261
Epoch: 42, step: 379, loss: 0.32518768310546875, mean loss: 0.3435519504177579
Epoch: 42, step: 380, loss: 0.3023097515106201, mean loss: 0.3435512746374091
Epoch: 42, step: 381, loss: 0.3212537169456482, mean loss: 0.34355090928335874
Epoch: 42, step: 382, loss: 0.3778700530529022, mean loss: 0.34355147160650223
Epoch: 42, step: 383, loss: 0.3521312475204468, mean loss: 0.3435516121848204
Epoch: 42, step: 384, loss: 0.3324287533760071, mean loss: 0.34355142994146337
Epoch: 42, step: 385, loss: 0.332480788230896, mean loss: 0.34355124855663344
Epoch: 42, step: 386, loss: 0.3153313994407654, mean loss: 0.3435507862014419
Epoch: 42, step: 387, loss: 0.3706623911857605, mean loss: 0.3435512303918375
Epoch: 42, step: 388, loss: 0.3074282705783844, mean loss: 0.34355063857114165
Epoch: 42, step: 389, loss: 0.32473278045654297, mean loss: 0.3435503302737185
Epoch: 42, step: 390, loss: 0.3928510844707489, mean loss: 0.34355113796641
Epoch: 42, step: 391, loss: 0.347604364156723, mean loss: 0.34355120436919817
Epoch: 42, step: 392, loss: 0.34100016951560974, mean loss: 0.3435511625770445
Epoch: 42, step: 393, loss: 0.31264856457710266, mean loss: 0.3435506563256438
Epoch: 42, step: 394, loss: 0.3055289387702942, mean loss: 0.34355003345786933
Epoch: 42, step: 395, loss: 0.32841092348098755, mean loss: 0.34354978545462617
Epoch: 42, step: 396, loss: 0.3511732518672943, mean loss: 0.34354991033735877
Epoch: 42, step: 397, loss: 0.33457183837890625, mean loss: 0.34354976326675696
Epoch: 42, step: 398, loss: 0.3436420261859894, mean loss: 0.34354976477809934
Epoch: 42, step: 399, loss: 0.3460918068885803, mean loss: 0.34354980641815486
Epoch: 42, step: 400, loss: 0.32335227727890015, mean loss: 0.34354947557687754
Epoch: 42, step: 401, loss: 0.33125871419906616, mean loss: 0.34354927425400483
Epoch: 42, step: 402, loss: 0.37528350949287415, mean loss: 0.3435497940527835
Epoch: 42, step: 403, loss: 0.3184168040752411, mean loss: 0.34354938238748217
Epoch: 42, step: 404, loss: 0.3373584747314453, mean loss: 0.34354928098529625
Epoch: 42, step: 405, loss: 0.34522852301597595, mean loss: 0.34354930848950616
Epoch: 42, step: 406, loss: 0.31195715069770813, mean loss: 0.34354879105182223
Epoch: 42, step: 407, loss: 0.3273196816444397, mean loss: 0.34354852524486784
Epoch: 42, step: 408, loss: 0.3103312849998474, mean loss: 0.3435479812083078
Epoch: 42, step: 409, loss: 0.351033091545105, mean loss: 0.3435481037984735
Epoch: 42, step: 410, loss: 0.35664159059524536, mean loss: 0.34354831823838894
Epoch: 42, step: 411, loss: 0.30341386795043945, mean loss: 0.3435476609431009
Epoch: 42, step: 412, loss: 0.3327072262763977, mean loss: 0.3435474834085917
Epoch: 42, step: 413, loss: 0.32737216353416443, mean loss: 0.343547218508656
Epoch: 42, step: 414, loss: 0.3045108914375305, mean loss: 0.3435465792291075
Epoch: 42, step: 415, loss: 0.32136595249176025, mean loss: 0.3435462159933755
Epoch: 42, step: 416, loss: 0.30345654487609863, mean loss: 0.34354555948521015
Epoch: 42, step: 417, loss: 0.33933714032173157, mean loss: 0.34354549056929684
Epoch: 42, step: 418, loss: 0.3437838554382324, mean loss: 0.3435454944726304
Epoch: 42, step: 419, loss: 0.35776451230049133, mean loss: 0.34354572731172495
Epoch: 42, step: 420, loss: 0.3606787919998169, mean loss: 0.3435460078642915
Epoch: 42, step: 421, loss: 0.3471403419971466, mean loss: 0.3435460667202623
Epoch: 42, step: 422, loss: 0.3322802186012268, mean loss: 0.34354588224894006
Epoch: 42, step: 423, loss: 0.29809290170669556, mean loss: 0.3435451379965733
Epoch: 42, step: 424, loss: 0.31437045335769653, mean loss: 0.34354466029473063
Epoch: 42, step: 425, loss: 0.3567529320716858, mean loss: 0.34354487656141985
Epoch: 42, step: 426, loss: 0.3374691307544708, mean loss: 0.3435447770813411
Epoch: 42, step: 427, loss: 0.33220192790031433, mean loss: 0.343544591364379
Epoch: 42, step: 428, loss: 0.30249837040901184, mean loss: 0.34354391932382433
Epoch: 42, step: 429, loss: 0.33282577991485596, mean loss: 0.3435437438410088
Epoch: 42, step: 430, loss: 0.30785948038101196, mean loss: 0.3435431596097106
Epoch: 42, step: 431, loss: 0.3462214767932892, mean loss: 0.3435432034590424
Epoch: 42, step: 432, loss: 0.32729700207710266, mean loss: 0.3435429374810561
Epoch: 42, step: 433, loss: 0.35058844089508057, mean loss: 0.3435430528260581
Epoch: 42, step: 434, loss: 0.3563731610774994, mean loss: 0.3435432628699042
Epoch: 42, step: 435, loss: 0.3193295896053314, mean loss: 0.34354286647030263
Epoch: 42, step: 436, loss: 0.34044674038887024, mean loss: 0.34354281578476475
Epoch: 42, step: 437, loss: 0.3288717567920685, mean loss: 0.34354257561420204
Epoch: 42, step: 438, loss: 0.30452045798301697, mean loss: 0.343541936818425
Epoch: 42, step: 439, loss: 0.35555851459503174, mean loss: 0.34354213352772595
Epoch: 42, step: 440, loss: 0.3219965398311615, mean loss: 0.3435417808358551
Epoch: 42, step: 441, loss: 0.31570157408714294, mean loss: 0.3435413251114035
Epoch: 42, step: 442, loss: 0.3236396908760071, mean loss: 0.3435409993410898
Epoch: 42, step: 443, loss: 0.37005993723869324, mean loss: 0.34354143342309557
Epoch: 42, step: 444, loss: 0.3307909369468689, mean loss: 0.3435412247167548
Epoch: 42, step: 445, loss: 0.3369148075580597, mean loss: 0.3435411162541045
Epoch: 42, step: 446, loss: 0.3490554690361023, mean loss: 0.34354120651276365
Epoch: 42, step: 447, loss: 0.32383519411087036, mean loss: 0.34354088397098675
Epoch: 42, step: 448, loss: 0.32232657074928284, mean loss: 0.34354053674750246
Epoch: 42, step: 449, loss: 0.35891884565353394, mean loss: 0.34354078844655817
Epoch: 42, step: 450, loss: 0.3425247073173523, mean loss: 0.3435407718164803
Epoch: 42, step: 451, loss: 0.3524901568889618, mean loss: 0.3435409182875944
Epoch: 42, step: 452, loss: 0.32126131653785706, mean loss: 0.34354055365196245
Epoch: 42, step: 453, loss: 0.35565412044525146, mean loss: 0.343540751903522
Epoch: 42, step: 454, loss: 0.32986441254615784, mean loss: 0.3435405280791704
Epoch: 42, step: 455, loss: 0.31646788120269775, mean loss: 0.34354008502066563
Epoch: 42, step: 456, loss: 0.31732070446014404, mean loss: 0.34353965593334773
Epoch: 42, step: 457, loss: 0.3347245454788208, mean loss: 0.3435395116740204
Epoch: 42, step: 458, loss: 0.3669060170650482, mean loss: 0.3435398940607419
Epoch: 42, step: 459, loss: 0.31038805842399597, mean loss: 0.34353935154854
Epoch: 42, step: 460, loss: 0.36038950085639954, mean loss: 0.3435396272877815
Epoch: 42, step: 461, loss: 0.34661123156547546, mean loss: 0.3435396775513108
Epoch: 42, step: 462, loss: 0.30606162548065186, mean loss: 0.3435390642729801
Epoch: 42, step: 463, loss: 0.3670741617679596, mean loss: 0.34353944938715564
Epoch: 42, step: 464, loss: 0.30174487829208374, mean loss: 0.3435387654971307
Epoch: 42, step: 465, loss: 0.3266855478286743, mean loss: 0.3435384897302415
Epoch: 42, step: 466, loss: 0.33265602588653564, mean loss: 0.34353831166489185
Epoch: 42, step: 467, loss: 0.28538778424263, mean loss: 0.343537360186925
Epoch: 42, step: 468, loss: 0.28323444724082947, mean loss: 0.34353637350706595
Epoch: 42, step: 469, loss: 0.36086374521255493, mean loss: 0.3435366570139167
Epoch: 42, step: 470, loss: 0.3296812176704407, mean loss: 0.34353643031781006
Epoch: 42, step: 471, loss: 0.34254154562950134, mean loss: 0.34353641404024643
Epoch: 42, step: 472, loss: 0.3196704089641571, mean loss: 0.3435360235688033
Epoch: 42, step: 473, loss: 0.3597669303417206, mean loss: 0.34353628911814355
Epoch: 42, step: 474, loss: 0.35256704688072205, mean loss: 0.3435364368654361
Epoch: 42, step: 475, loss: 0.3480859398841858, mean loss: 0.34353651129615104
Epoch: 42, step: 476, loss: 0.3420538008213043, mean loss: 0.343536487039129
Epoch: 42, step: 477, loss: 0.3453412652015686, mean loss: 0.34353651656466905
Epoch: 42, step: 478, loss: 0.3366006016731262, mean loss: 0.3435364030973814
Epoch: 42, step: 479, loss: 0.3519192636013031, mean loss: 0.34353654023356295
Epoch: 42, step: 480, loss: 0.2998960614204407, mean loss: 0.34353582632561724
Epoch: 42, step: 481, loss: 0.3113603889942169, mean loss: 0.3435352999811492
Epoch: 42, step: 482, loss: 0.28758084774017334, mean loss: 0.343534384660735
Epoch: 42, step: 483, loss: 0.315836638212204, mean loss: 0.3435339315797553
Epoch: 42, step: 484, loss: 0.3334876298904419, mean loss: 0.34353376724458956
Epoch: 42, step: 485, loss: 0.2929261028766632, mean loss: 0.34353293942922714
Epoch: 42, step: 486, loss: 0.28915464878082275, mean loss: 0.34353204995035824
Epoch: 42, step: 487, loss: 0.30703163146972656, mean loss: 0.34353145291393977
Epoch: 42, step: 488, loss: 0.3197750747203827, mean loss: 0.34353106433782066
Epoch: 42, step: 489, loss: 0.392399400472641, mean loss: 0.3435318636498056
Epoch: 42, step: 490, loss: 0.31276994943618774, mean loss: 0.3435313605026456
Epoch: 42, step: 491, loss: 0.3045458495616913, mean loss: 0.3435307228593525
Epoch: 42, step: 492, loss: 0.31637948751449585, mean loss: 0.34353027878360387
Epoch: 42, step: 493, loss: 0.3285049498081207, mean loss: 0.3435300330387971
Epoch: 42, step: 494, loss: 0.3857249319553375, mean loss: 0.3435307231406717
Epoch: 42, step: 495, loss: 0.34865760803222656, mean loss: 0.34353080699002553
Epoch: 42, step: 496, loss: 0.3655787706375122, mean loss: 0.3435311675749245
Epoch: 42, step: 497, loss: 0.344694048166275, mean loss: 0.34353118659302206
Epoch: 42, step: 498, loss: 0.35377204418182373, mean loss: 0.34353135407233565
Epoch: 42, step: 499, loss: 0.33803004026412964, mean loss: 0.34353126410514445
Epoch: 42, step: 500, loss: 0.39186033606529236, mean loss: 0.3435320544544872
Epoch: 42, step: 501, loss: 0.3648650050163269, mean loss: 0.34353240331712925
Epoch: 42, step: 502, loss: 0.3410593271255493, mean loss: 0.34353236287500744
Epoch: 42, step: 503, loss: 0.34571146965026855, mean loss: 0.34353239850927575
Epoch: 42, step: 504, loss: 0.35272446274757385, mean loss: 0.3435325488218399
Epoch: 42, step: 505, loss: 0.3745787739753723, mean loss: 0.34353305649468474
Epoch: 42, step: 506, loss: 0.32550519704818726, mean loss: 0.3435327617050609
Epoch: 42, step: 507, loss: 0.30874890089035034, mean loss: 0.3435321929324006
Epoch: 42, step: 508, loss: 0.39750659465789795, mean loss: 0.343533075487165
Epoch: 42, step: 509, loss: 0.31637871265411377, mean loss: 0.34353263148371765
Epoch: 42, step: 510, loss: 0.3667911887168884, mean loss: 0.34353301178027634
Epoch: 42, step: 511, loss: 0.31276628375053406, mean loss: 0.34353250872716923
Epoch: 42, step: 512, loss: 0.3406839370727539, mean loss: 0.3435324621522006
Epoch: 42, step: 513, loss: 0.3472886383533478, mean loss: 0.34353252356576136
Epoch: 42, step: 514, loss: 0.32535675168037415, mean loss: 0.34353222639636344
Epoch: 42, step: 515, loss: 0.3440282642841339, mean loss: 0.34353223450632825
Epoch: 42, step: 516, loss: 0.32251450419425964, mean loss: 0.3435318908828457
Epoch: 42, step: 517, loss: 0.31463998556137085, mean loss: 0.3435314185304715
Epoch: 42, step: 518, loss: 0.3096745014190674, mean loss: 0.34353086501440705
Epoch: 42, step: 519, loss: 0.3624423146247864, mean loss: 0.3435311741866803
Epoch: 42, step: 520, loss: 0.3208189904689789, mean loss: 0.34353080288448934
Epoch: 42, step: 521, loss: 0.3469313979148865, mean loss: 0.34353085847701886
Epoch: 42, step: 522, loss: 0.30513113737106323, mean loss: 0.3435302307331352
Epoch: 42, step: 523, loss: 0.3527736961841583, mean loss: 0.3435303818392859
Epoch: 42, step: 524, loss: 0.3618144392967224, mean loss: 0.3435306807302584
Epoch: 42, step: 525, loss: 0.33569279313087463, mean loss: 0.3435305526057676
Epoch: 42, step: 526, loss: 0.2962871193885803, mean loss: 0.3435297803387759
Epoch: 42, step: 527, loss: 0.34823811054229736, mean loss: 0.3435298573024578
Epoch: 42, step: 528, loss: 0.3542834222316742, mean loss: 0.34353003308036334
Epoch: 42, step: 529, loss: 0.363852858543396, mean loss: 0.34353036527209013
Epoch: 42, step: 530, loss: 0.3265417218208313, mean loss: 0.34353008758459197
Epoch: 42, step: 531, loss: 0.33513081073760986, mean loss: 0.3435299502966409
Epoch: 42, step: 532, loss: 0.33325737714767456, mean loss: 0.3435297823920112
Epoch: 42, step: 533, loss: 0.33550703525543213, mean loss: 0.3435296512628043
Epoch: 42, step: 534, loss: 0.316132515668869, mean loss: 0.3435292034728039
Epoch: 42, step: 535, loss: 0.32957887649536133, mean loss: 0.3435289754666752
Epoch: 42, step: 536, loss: 0.3251896798610687, mean loss: 0.3435286757315178
Epoch: 42, step: 537, loss: 0.3190598487854004, mean loss: 0.3435282758226016
Epoch: 42, step: 538, loss: 0.35331329703330994, mean loss: 0.343528435742539
Epoch: 42, step: 539, loss: 0.37766116857528687, mean loss: 0.34352899357631084
Epoch: 42, step: 540, loss: 0.33498963713645935, mean loss: 0.3435288540192591
Epoch: 42, step: 541, loss: 0.32088175415992737, mean loss: 0.3435284839081321
Epoch: 42, step: 542, loss: 0.34673595428466797, mean loss: 0.34352853632548724
Epoch: 42, step: 543, loss: 0.3027488887310028, mean loss: 0.3435278699042623
Epoch: 42, step: 544, loss: 0.29884129762649536, mean loss: 0.34352713964798665
Epoch: 42, step: 545, loss: 0.3705202341079712, mean loss: 0.3435275807548674
Epoch: 42, step: 546, loss: 0.3627769351005554, mean loss: 0.3435278953125003
Epoch: 42, step: 547, loss: 0.32620251178741455, mean loss: 0.3435276121994941
Epoch: 42, step: 548, loss: 0.33512067794799805, mean loss: 0.3435274748245533
Epoch: 42, step: 549, loss: 0.3365662395954132, mean loss: 0.34352736107516235
Epoch: 42, step: 550, loss: 0.36704984307289124, mean loss: 0.3435277454357238
Epoch: 42, step: 551, loss: 0.33036008477211, mean loss: 0.3435275302778698
Epoch: 42, step: 552, loss: 0.35014086961746216, mean loss: 0.34352763833720446
Epoch: 42, step: 553, loss: 0.3083925247192383, mean loss: 0.3435270642528017
Epoch: 42, step: 554, loss: 0.35114336013793945, mean loss: 0.34352718869598076
Epoch: 42, step: 555, loss: 0.384706974029541, mean loss: 0.3435278615243144
Epoch: 42, step: 556, loss: 0.3226390779018402, mean loss: 0.34352752023220395
Epoch: 42, step: 557, loss: 0.32551679015159607, mean loss: 0.3435272259680782
Epoch: 42, step: 558, loss: 0.35806024074554443, mean loss: 0.3435274634084817
Epoch: 42, step: 559, loss: 0.3300577700138092, mean loss: 0.34352724334421897
Epoch: 42, step: 560, loss: 0.3372015058994293, mean loss: 0.343527139997694
Epoch: 42, step: 561, loss: 0.3177713453769684, mean loss: 0.34352671922013117
Epoch: 42, step: 562, loss: 0.3174645006656647, mean loss: 0.3435262934434153
Epoch: 42, step: 563, loss: 0.29232823848724365, mean loss: 0.34352545703789095
Epoch: 42, step: 564, loss: 0.35427528619766235, mean loss: 0.3435256326513907
Epoch: 42, step: 565, loss: 0.3728606402873993, mean loss: 0.3435261118719552
Epoch: 42, step: 566, loss: 0.31502074003219604, mean loss: 0.34352564621203785
Epoch: 42, step: 567, loss: 0.3538685739040375, mean loss: 0.34352581516995234
Epoch: 42, step: 568, loss: 0.3324744403362274, mean loss: 0.3435256346420788
Epoch: 42, step: 569, loss: 0.33766689896583557, mean loss: 0.3435255389392516
Epoch: 42, step: 570, loss: 0.3807201087474823, mean loss: 0.3435261465050369
Epoch: 42, step: 571, loss: 0.3788876533508301, mean loss: 0.3435267241186737
Epoch: 42, step: 572, loss: 0.3435560166835785, mean loss: 0.34352672459714617
Epoch: 42, step: 573, loss: 0.35093286633491516, mean loss: 0.3435268455690474
Epoch: 42, step: 574, loss: 0.34548476338386536, mean loss: 0.3435268775491499
Epoch: 42, step: 575, loss: 0.3212115168571472, mean loss: 0.3435265130620094
Epoch: 42, step: 576, loss: 0.3400501310825348, mean loss: 0.3435264562815769
Epoch: 42, step: 577, loss: 0.33230629563331604, mean loss: 0.3435262730234733
Epoch: 42, step: 578, loss: 0.2768823802471161, mean loss: 0.34352518455118536
Epoch: 42, step: 579, loss: 0.30571305751800537, mean loss: 0.3435245669885174
Epoch: 42, step: 580, loss: 0.29268521070480347, mean loss: 0.3435237366735313
Epoch: 42, step: 581, loss: 0.3575368821620941, mean loss: 0.34352396553431014
Epoch: 42, step: 582, loss: 0.31580471992492676, mean loss: 0.3435235128347689
Epoch: 42, step: 583, loss: 0.3276903033256531, mean loss: 0.34352325425739905
Epoch: 42, step: 584, loss: 0.3518995940685272, mean loss: 0.34352339105193486
Epoch: 42, step: 585, loss: 0.36212098598480225, mean loss: 0.34352369476547523
Epoch: 42, step: 586, loss: 0.33653563261032104, mean loss: 0.34352358064671706
Epoch: 42, step: 587, loss: 0.34705856442451477, mean loss: 0.34352363837393274
Epoch: 42, step: 588, loss: 0.3086555600166321, mean loss: 0.34352306897833274
Epoch: 42, step: 589, loss: 0.3580339252948761, mean loss: 0.3435233059366971
Epoch: 42, step: 590, loss: 0.3337118327617645, mean loss: 0.3435231457206065
Epoch: 42, step: 591, loss: 0.3252795934677124, mean loss: 0.34352284781805503
Epoch: 42, step: 592, loss: 0.31517669558525085, mean loss: 0.34352238495572046
Epoch: 42, step: 593, loss: 0.33690345287323, mean loss: 0.34352227687740683
Epoch: 42, step: 594, loss: 0.30215543508529663, mean loss: 0.3435216014232032
Epoch: 42, step: 595, loss: 0.3507225215435028, mean loss: 0.3435217190007638
Epoch: 42, step: 596, loss: 0.3314022123813629, mean loss: 0.343521521115114
Epoch: 42, step: 597, loss: 0.3479234576225281, mean loss: 0.34352159298815893
Epoch: 42, step: 598, loss: 0.3777257204055786, mean loss: 0.3435221514502455
Epoch: 42, step: 599, loss: 0.34682902693748474, mean loss: 0.3435222054418124
Epoch: 42, step: 600, loss: 0.36698731780052185, mean loss: 0.3435225885519425
Epoch: 42, step: 601, loss: 0.3094530403614044, mean loss: 0.343522032314421
Epoch: 42, step: 602, loss: 0.4283076822757721, mean loss: 0.3435234165473309
Epoch: 42, step: 603, loss: 0.2983419597148895, mean loss: 0.34352267891497873
Epoch: 42, step: 604, loss: 0.3130754828453064, mean loss: 0.3435221818422465
Epoch: 42, step: 605, loss: 0.3252345323562622, mean loss: 0.34352188328787475
Epoch: 42, step: 606, loss: 0.3458821177482605, mean loss: 0.3435219218191695
Epoch: 42, step: 607, loss: 0.3896876871585846, mean loss: 0.34352267547212334
Epoch: 42, step: 608, loss: 0.35639268159866333, mean loss: 0.3435228855706611
Epoch: 42, step: 609, loss: 0.30677905678749084, mean loss: 0.34352228574975957
Epoch: 42, step: 610, loss: 0.30150288343429565, mean loss: 0.3435215998194911
Epoch: 42, step: 611, loss: 0.3141045868396759, mean loss: 0.34352111962012805
Epoch: 42, step: 612, loss: 0.2911681532859802, mean loss: 0.34352026503129773
Epoch: 42, step: 613, loss: 0.3462357521057129, mean loss: 0.3435203093570963
Epoch: 42, step: 614, loss: 0.31894001364707947, mean loss: 0.34351990813130406
Epoch: 42, step: 615, loss: 0.3108355700969696, mean loss: 0.3435193746314014
Epoch: 42, step: 616, loss: 0.3324577212333679, mean loss: 0.34351919407719594
Epoch: 42, step: 617, loss: 0.37536853551864624, mean loss: 0.3435197139306455
Epoch: 42, step: 618, loss: 0.3251063823699951, mean loss: 0.34351941338823994
Epoch: 42, step: 619, loss: 0.3043346703052521, mean loss: 0.3435187738252857
Epoch: 42, step: 620, loss: 0.32093554735183716, mean loss: 0.3435184052338859
Epoch: 42, step: 621, loss: 0.3028622269630432, mean loss: 0.3435177416762187
Epoch: 42, step: 622, loss: 0.343391478061676, mean loss: 0.34351773961547843
Epoch: 42, step: 623, loss: 0.369034081697464, mean loss: 0.34351815605923874
Epoch: 42, step: 624, loss: 0.3644305467605591, mean loss: 0.3435184973578646
Epoch: 42, step: 625, loss: 0.3365054428577423, mean loss: 0.3435183829038629
Epoch: 42, step: 626, loss: 0.37483400106430054, mean loss: 0.3435188939706627
Epoch: 42, step: 627, loss: 0.3266143798828125, mean loss: 0.34351861809570206
Epoch: 42, step: 628, loss: 0.3512798547744751, mean loss: 0.3435187447539373
Epoch: 42, step: 629, loss: 0.33802559971809387, mean loss: 0.3435186551109164
Epoch: 42, step: 630, loss: 0.307114839553833, mean loss: 0.3435180610441797
Epoch: 42, step: 631, loss: 0.3159135580062866, mean loss: 0.3435176105790518
Epoch: 42, step: 632, loss: 0.32478806376457214, mean loss: 0.3435173049452205
Epoch: 42, step: 633, loss: 0.30046144127845764, mean loss: 0.3435166023594095
Epoch: 42, step: 634, loss: 0.34438249468803406, mean loss: 0.34351661648881454
Epoch: 42, step: 635, loss: 0.3394491374492645, mean loss: 0.34351655011783616
Epoch: 42, step: 636, loss: 0.3534616529941559, mean loss: 0.3435167123941334
Epoch: 42, step: 637, loss: 0.42192158102989197, mean loss: 0.34351799172169
Epoch: 42, step: 638, loss: 0.35118454694747925, mean loss: 0.3435181168143724
Epoch: 42, step: 639, loss: 0.3119252324104309, mean loss: 0.3435176013319875
Epoch: 42, step: 640, loss: 0.2916962802410126, mean loss: 0.3435167558079768
Epoch: 42, step: 641, loss: 0.33619847893714905, mean loss: 0.34351663640388364
Epoch: 42, step: 642, loss: 0.2872582972049713, mean loss: 0.3435157185148102
Epoch: 42, step: 643, loss: 0.3256332576274872, mean loss: 0.34351542675632807
Epoch: 42, step: 644, loss: 0.3900239169597626, mean loss: 0.34351618554591584
Epoch: 42, step: 645, loss: 0.3647010922431946, mean loss: 0.3435165311736559
Epoch: 42, step: 646, loss: 0.363066166639328, mean loss: 0.343516850117052
Epoch: 42, step: 647, loss: 0.3317696154117584, mean loss: 0.3435166584693963
Epoch: 42, step: 648, loss: 0.34198522567749023, mean loss: 0.34351663348558314
Epoch: 42, step: 649, loss: 0.33113211393356323, mean loss: 0.3435164314476773
Epoch: 42, step: 650, loss: 0.3197517395019531, mean loss: 0.3435160437628546
Epoch: 42, step: 651, loss: 0.3160317838191986, mean loss: 0.34351559540624865
Epoch: 42, step: 652, loss: 0.3184257447719574, mean loss: 0.3435151861168303
Epoch: 42, step: 653, loss: 0.3651711642742157, mean loss: 0.3435155393839041
Epoch: 42, step: 654, loss: 0.3255772590637207, mean loss: 0.34351524676722434
Epoch: 42, step: 655, loss: 0.3643403947353363, mean loss: 0.34351558647014696
Epoch: 42, step: 656, loss: 0.2903357148170471, mean loss: 0.3435147190062916
Epoch: 42, step: 657, loss: 0.33371615409851074, mean loss: 0.3435145591758524
Epoch: 42, step: 658, loss: 0.31598034501075745, mean loss: 0.3435141100556187
Epoch: 42, step: 659, loss: 0.343624472618103, mean loss: 0.34351411185575187
Epoch: 42, step: 660, loss: 0.36780017614364624, mean loss: 0.34351450798134986
Epoch: 42, step: 661, loss: 0.3969084918498993, mean loss: 0.34351537886674977
Epoch: 42, step: 662, loss: 0.3770260512828827, mean loss: 0.343515925435431
Epoch: 42, step: 663, loss: 0.33749815821647644, mean loss: 0.34351582728552205
Epoch: 42, step: 664, loss: 0.30956751108169556, mean loss: 0.3435152735968067
Epoch: 42, step: 665, loss: 0.32156798243522644, mean loss: 0.34351491564770603
Epoch: 42, step: 666, loss: 0.3808290362358093, mean loss: 0.34351552421201476
Epoch: 42, step: 667, loss: 0.3081311285495758, mean loss: 0.3435149471294317
Epoch: 42, step: 668, loss: 0.3421153724193573, mean loss: 0.3435149243042004
Epoch: 42, step: 669, loss: 0.3529662489891052, mean loss: 0.3435150784404195
Epoch: 42, step: 670, loss: 0.31282445788383484, mean loss: 0.3435145779329005
Epoch: 42, step: 671, loss: 0.3547176122665405, mean loss: 0.34351476063078595
Epoch: 42, step: 672, loss: 0.3587900996208191, mean loss: 0.3435150097353177
Epoch: 42, step: 673, loss: 0.38469111919403076, mean loss: 0.34351568120900505
Epoch: 42, step: 674, loss: 0.32315361499786377, mean loss: 0.34351534916285253
Epoch: 42, step: 675, loss: 0.3425747752189636, mean loss: 0.34351533382507377
Epoch: 42, step: 676, loss: 0.32031530141830444, mean loss: 0.3435149555122746
Epoch: 42, step: 677, loss: 0.34612107276916504, mean loss: 0.3435149980083979
Epoch: 42, step: 678, loss: 0.3512501120567322, mean loss: 0.34351512413741203
Epoch: 42, step: 679, loss: 0.34132489562034607, mean loss: 0.343515088424059
Epoch: 42, step: 680, loss: 0.3116999864578247, mean loss: 0.3435145696629188
Epoch: 42, step: 681, loss: 0.3732324242591858, mean loss: 0.3435150542194914
Epoch: 42, step: 682, loss: 0.2860228717327118, mean loss: 0.3435141168112886
Epoch: 42, step: 683, loss: 0.33455416560173035, mean loss: 0.34351397072195167
Epoch: 42, step: 684, loss: 0.3118833005428314, mean loss: 0.3435134550017003
Epoch: 42, step: 685, loss: 0.3217322826385498, mean loss: 0.34351309987775
Epoch: 42, step: 686, loss: 0.30038347840309143, mean loss: 0.34351239669650807
Epoch: 42, step: 687, loss: 0.30885782837867737, mean loss: 0.34351183170093746
Epoch: 42, step: 688, loss: 0.3423742949962616, mean loss: 0.3435118131552521
Epoch: 42, step: 689, loss: 0.3264440596103668, mean loss: 0.3435115348978334
Epoch: 42, step: 690, loss: 0.3394961953163147, mean loss: 0.34351146943638833
Epoch: 42, step: 691, loss: 0.31184279918670654, mean loss: 0.34351095315549085
Epoch: 42, step: 692, loss: 0.33657461404800415, mean loss: 0.3435108400771402
Epoch: 42, step: 693, loss: 0.3701823055744171, mean loss: 0.3435112748765517
Epoch: 42, step: 694, loss: 0.31155210733413696, mean loss: 0.34351075388528063
Epoch: 42, step: 695, loss: 0.3845411241054535, mean loss: 0.34351142274238516
Epoch: 42, step: 696, loss: 0.34136563539505005, mean loss: 0.34351138776337553
Epoch: 42, step: 697, loss: 0.3018677532672882, mean loss: 0.34351070893126756
Epoch: 42, step: 698, loss: 0.35860979557037354, mean loss: 0.3435109550571847
Epoch: 42, step: 699, loss: 0.3353422284126282, mean loss: 0.3435108219032654
Epoch: 42, step: 700, loss: 0.3237030506134033, mean loss: 0.3435104990329449
Epoch: 42, step: 701, loss: 0.3441080152988434, mean loss: 0.34351050877241135
Epoch: 42, step: 702, loss: 0.27502360939979553, mean loss: 0.34350939245972906
Epoch: 42, step: 703, loss: 0.35250794887542725, mean loss: 0.3435095391306838
Epoch: 42, step: 704, loss: 0.3529033660888672, mean loss: 0.34350969224181055
Epoch: 42, step: 705, loss: 0.30325737595558167, mean loss: 0.34350903617511097
Epoch: 42, step: 706, loss: 0.33475950360298157, mean loss: 0.34350889357006537
Epoch: 42, step: 707, loss: 0.34699147939682007, mean loss: 0.34350895033037937
Epoch: 42, step: 708, loss: 0.31152164936065674, mean loss: 0.3435084289994641
Epoch: 42, step: 709, loss: 0.33623209595680237, mean loss: 0.3435083104112923
Epoch: 42, step: 710, loss: 0.3623487949371338, mean loss: 0.3435086174646101
Epoch: 42, step: 711, loss: 0.3124978840351105, mean loss: 0.3435081120745607
Epoch: 42, step: 712, loss: 0.35115671157836914, mean loss: 0.3435082367237598
Epoch: 42, step: 713, loss: 0.3296353816986084, mean loss: 0.343508010641575
Epoch: 42, step: 714, loss: 0.33949679136276245, mean loss: 0.3435079452728792
Epoch: 42, step: 715, loss: 0.32580849528312683, mean loss: 0.3435076568391071
Epoch: 42, step: 716, loss: 0.35062575340270996, mean loss: 0.3435077728351401
Epoch: 42, step: 717, loss: 0.2991509735584259, mean loss: 0.34350705001143844
Epoch: 42, step: 718, loss: 0.3505117893218994, mean loss: 0.3435071641564889
Epoch: 42, step: 719, loss: 0.31535080075263977, mean loss: 0.34350670534467487
Epoch: 42, step: 720, loss: 0.33304470777511597, mean loss: 0.34350653486776356
Epoch: 42, step: 721, loss: 0.3096334934234619, mean loss: 0.34350598291988277
Epoch: 42, step: 722, loss: 0.3251577317714691, mean loss: 0.34350568394722225
Epoch: 42, step: 723, loss: 0.3278369903564453, mean loss: 0.3435054286403463
Epoch: 42, step: 724, loss: 0.31490835547447205, mean loss: 0.3435049626850701
Epoch: 42, step: 725, loss: 0.3080679774284363, mean loss: 0.34350438529097393
Epoch: 42, step: 726, loss: 0.3745536506175995, mean loss: 0.34350489118531735
Epoch: 42, step: 727, loss: 0.3331136405467987, mean loss: 0.34350472188052983
Epoch: 42, step: 728, loss: 0.3478432595729828, mean loss: 0.34350479256723154
Epoch: 42, step: 729, loss: 0.3862021267414093, mean loss: 0.3435054882128077
Epoch: 42, step: 730, loss: 0.35260647535324097, mean loss: 0.343505636488067
Epoch: 42, step: 731, loss: 0.33584973216056824, mean loss: 0.34350551175844285
Epoch: 42, step: 732, loss: 0.3367007374763489, mean loss: 0.34350540089719456
Epoch: 42, step: 733, loss: 0.300429105758667, mean loss: 0.343504699123138
Epoch: 42, step: 734, loss: 0.32398468255996704, mean loss: 0.3435043811195122
Epoch: 42, step: 735, loss: 0.3226744532585144, mean loss: 0.3435040417814459
Epoch: 42, step: 736, loss: 0.3439881503582001, mean loss: 0.34350404966787706
Epoch: 42, step: 737, loss: 0.34487026929855347, mean loss: 0.34350407192408583
Epoch: 42, step: 738, loss: 0.2893756330013275, mean loss: 0.34350319016672803
Epoch: 42, step: 739, loss: 0.29632169008255005, mean loss: 0.3435024215881771
Epoch: 42, step: 740, loss: 0.3404292166233063, mean loss: 0.3435023715270104
Epoch: 42, step: 741, loss: 0.3307444751262665, mean loss: 0.34350216370983494
Epoch: 42, step: 742, loss: 0.34675613045692444, mean loss: 0.3435022167138053
Epoch: 42, step: 743, loss: 0.3262249231338501, mean loss: 0.3435019352879912
Epoch: 42, step: 744, loss: 0.3207986056804657, mean loss: 0.34350156548476274
Epoch: 42, step: 745, loss: 0.3186016082763672, mean loss: 0.3435011599083675
Epoch: 42, step: 746, loss: 0.33335041999816895, mean loss: 0.3435009945734068
Epoch: 42, step: 747, loss: 0.3328132629394531, mean loss: 0.34350082049477576
Epoch: 42, step: 748, loss: 0.3207273781299591, mean loss: 0.3435004495736825
Epoch: 42, step: 749, loss: 0.34496548771858215, mean loss: 0.34350047343501583
Epoch: 42, step: 750, loss: 0.32681235671043396, mean loss: 0.34350020163715717
Epoch: 42, step: 751, loss: 0.31799060106277466, mean loss: 0.34349978617134974
Epoch: 42, step: 752, loss: 0.3149201571941376, mean loss: 0.34349932071266054
Epoch: 42, step: 753, loss: 0.30979710817337036, mean loss: 0.3434987718345696
Epoch: 42, step: 754, loss: 0.3386252522468567, mean loss: 0.3434986924651644
Epoch: 42, step: 755, loss: 0.3202025294303894, mean loss: 0.3434983130735444
Epoch: 42, step: 756, loss: 0.34732893109321594, mean loss: 0.34349837545638
Epoch: 42, step: 757, loss: 0.3141396939754486, mean loss: 0.34349789734867914
Epoch: 42, step: 758, loss: 0.3233610987663269, mean loss: 0.34349756942517556
Epoch: 42, step: 759, loss: 0.3360941708087921, mean loss: 0.3434974488643591
Epoch: 42, step: 760, loss: 0.3100375533103943, mean loss: 0.343496903994787
Epoch: 42, step: 761, loss: 0.33030325174331665, mean loss: 0.34349668914944825
Epoch: 42, step: 762, loss: 0.3500778377056122, mean loss: 0.3434967963150791
Epoch: 42, step: 763, loss: 0.3434634804725647, mean loss: 0.34349679577258185
Epoch: 42, step: 764, loss: 0.3319863975048065, mean loss: 0.3434966083464951
Epoch: 42, step: 765, loss: 0.3658238351345062, mean loss: 0.3434969718992158
Epoch: 42, step: 766, loss: 0.3309536576271057, mean loss: 0.34349676766060516
Epoch: 42, step: 767, loss: 0.309096097946167, mean loss: 0.3434962075350725
Epoch: 42, step: 768, loss: 0.3643704056739807, mean loss: 0.3434965474116236
Epoch: 42, step: 769, loss: 0.3375990390777588, mean loss: 0.3434964513891492
Epoch: 42, step: 770, loss: 0.3086884319782257, mean loss: 0.3434958846586682
Epoch: 42, step: 771, loss: 0.3514755070209503, mean loss: 0.3434960145776256
Epoch: 42, step: 772, loss: 0.30414578318595886, mean loss: 0.3434953739134978
Epoch: 42, step: 773, loss: 0.3669498860836029, mean loss: 0.34349575577198777
Epoch: 42, step: 774, loss: 0.3211526870727539, mean loss: 0.34349539201462165
Epoch: 42, step: 775, loss: 0.3025665581226349, mean loss: 0.34349472568169165
Epoch: 42, step: 776, loss: 0.3244931399822235, mean loss: 0.3434944163355671
Epoch: 42, step: 777, loss: 0.3068539500236511, mean loss: 0.34349381983789
Epoch: 42, step: 778, loss: 0.3759396970272064, mean loss: 0.3434943480401006
Epoch: 42, step: 779, loss: 0.3265249729156494, mean loss: 0.3434940717918893
Epoch: 42, step: 780, loss: 0.32757216691970825, mean loss: 0.34349381259989736
Epoch: 42, step: 781, loss: 0.31907355785369873, mean loss: 0.3434934150701115
Epoch: 42, step: 782, loss: 0.32524237036705017, mean loss: 0.3434931179718272
Epoch: 42, step: 783, loss: 0.3180403709411621, mean loss: 0.34349270364790757
Epoch: 42, step: 784, loss: 0.3562341034412384, mean loss: 0.3434929110510914
Epoch: 42, step: 785, loss: 0.3423647880554199, mean loss: 0.34349289268792127
Epoch: 42, step: 786, loss: 0.3232633173465729, mean loss: 0.3434925634037129
Epoch: 42, step: 787, loss: 0.3725441098213196, mean loss: 0.34349303627867905
Epoch: 42, step: 788, loss: 0.3279542326927185, mean loss: 0.3434927833561147
Epoch: 42, step: 789, loss: 0.32986316084861755, mean loss: 0.3434925615125894
Epoch: 42, step: 790, loss: 0.3214716613292694, mean loss: 0.34349220309366685
Epoch: 42, step: 791, loss: 0.3163376450538635, mean loss: 0.3434917611249487
Epoch: 42, step: 792, loss: 0.33502402901649475, mean loss: 0.3434916233060312
Epoch: 42, step: 793, loss: 0.37836262583732605, mean loss: 0.34349219084944665
Epoch: 42, step: 794, loss: 0.41732078790664673, mean loss: 0.34349339242809773
Epoch: 42, step: 795, loss: 0.3145626187324524, mean loss: 0.3434929215802738
Epoch: 42, step: 796, loss: 0.3166359066963196, mean loss: 0.343492484489951
Epoch: 42, step: 797, loss: 0.31328731775283813, mean loss: 0.3434919929174038
Epoch: 42, step: 798, loss: 0.30048108100891113, mean loss: 0.3434912929497584
Epoch: 42, step: 799, loss: 0.3657742142677307, mean loss: 0.3434916555802967
Epoch: 42, step: 800, loss: 0.3238799571990967, mean loss: 0.3434913364262278
Epoch: 42, step: 801, loss: 0.3354204595088959, mean loss: 0.3434912050856759
Epoch: 42, step: 802, loss: 0.3504759669303894, mean loss: 0.3434913187496007
Epoch: 42, step: 803, loss: 0.3399598300457001, mean loss: 0.3434912612821675
Epoch: 42, step: 804, loss: 0.35685789585113525, mean loss: 0.3434914787920461
Epoch: 42, step: 805, loss: 0.320842444896698, mean loss: 0.3434911102394068
Epoch: 42, step: 806, loss: 0.319009006023407, mean loss: 0.3434907118649179
Epoch: 42, step: 807, loss: 0.33326223492622375, mean loss: 0.3434905454291437
Epoch: 42, step: 808, loss: 0.3193335235118866, mean loss: 0.3434901523572086
Epoch: 42, step: 809, loss: 0.3423171043395996, mean loss: 0.34349013327022204
Epoch: 42, step: 810, loss: 0.32075244188308716, mean loss: 0.34348976330501946
Epoch: 42, step: 811, loss: 0.3148301839828491, mean loss: 0.34348929699230674
Epoch: 42, step: 812, loss: 0.30205193161964417, mean loss: 0.3434886227864628
Epoch: 42, step: 813, loss: 0.35062023997306824, mean loss: 0.34348873881941305
Epoch: 42, step: 814, loss: 0.3164971172809601, mean loss: 0.34348829966705247
Epoch: 42, step: 815, loss: 0.3493904173374176, mean loss: 0.3434883956926556
Epoch: 42, step: 816, loss: 0.3730401396751404, mean loss: 0.34348887648243814
Epoch: 42, step: 817, loss: 0.31857606768608093, mean loss: 0.34348847117204223
Epoch: 42, step: 818, loss: 0.30640724301338196, mean loss: 0.3434878679015368
Epoch: 42, step: 819, loss: 0.3371050953865051, mean loss: 0.34348776406258785
Epoch: 42, step: 820, loss: 0.32715973258018494, mean loss: 0.343487498432246
Epoch: 42, step: 821, loss: 0.3331287205219269, mean loss: 0.3434873299146291
Epoch: 42, step: 822, loss: 0.33925384283065796, mean loss: 0.34348726104496563
Epoch: 42, step: 823, loss: 0.36726194620132446, mean loss: 0.34348764780129626
Epoch: 42, step: 824, loss: 0.37119439244270325, mean loss: 0.34348809851534373
Epoch: 42, step: 825, loss: 0.3164374530315399, mean loss: 0.3434876584814191
Epoch: 42, step: 826, loss: 0.313663125038147, mean loss: 0.3434871733324408
Epoch: 42, step: 827, loss: 0.33693554997444153, mean loss: 0.3434870667603906
Epoch: 42, step: 828, loss: 0.3673865497112274, mean loss: 0.34348745551525744
Epoch: 42, step: 829, loss: 0.33395934104919434, mean loss: 0.3434873005311255
Epoch: 42, step: 830, loss: 0.3436124324798584, mean loss: 0.3434873025664863
Epoch: 42, step: 831, loss: 0.34358060359954834, mean loss: 0.3434873040840698
Epoch: 42, step: 832, loss: 0.3229823708534241, mean loss: 0.3434869705674837
Epoch: 42, step: 833, loss: 0.34162959456443787, mean loss: 0.3434869403574059
Epoch: 42, step: 834, loss: 0.33658716082572937, mean loss: 0.34348682813484793
Epoch: 42, step: 835, loss: 0.33894097805023193, mean loss: 0.34348675419935115
Epoch: 42, step: 836, loss: 0.34415340423583984, mean loss: 0.3434867650418337
Epoch: 42, step: 837, loss: 0.4176850914955139, mean loss: 0.34348797179339424
Epoch: 42, step: 838, loss: 0.36732345819473267, mean loss: 0.3434883594442213
Epoch: 42, step: 839, loss: 0.3156028091907501, mean loss: 0.3434879059321498
Epoch: 42, step: 840, loss: 0.3281281292438507, mean loss: 0.34348765613500415
Epoch: 42, step: 841, loss: 0.33935070037841797, mean loss: 0.3434875888564913
Epoch: 42, step: 842, loss: 0.3299112617969513, mean loss: 0.3434873680708957
Epoch: 42, step: 843, loss: 0.3382439911365509, mean loss: 0.3434872828016422
Epoch: 42, step: 844, loss: 0.3192999064922333, mean loss: 0.3434868894662006
Epoch: 42, step: 845, loss: 0.33261948823928833, mean loss: 0.3434867127432483
Epoch: 42, step: 846, loss: 0.3491976857185364, mean loss: 0.34348680561214784
Epoch: 42, step: 847, loss: 0.3143526017665863, mean loss: 0.34348633185444255
Epoch: 42, step: 848, loss: 0.3368173837661743, mean loss: 0.34348622341097235
Epoch: 42, step: 849, loss: 0.33905860781669617, mean loss: 0.34348615141488154
Epoch: 42, step: 850, loss: 0.33499443531036377, mean loss: 0.34348601333595175
Epoch: 42, step: 851, loss: 0.323845237493515, mean loss: 0.3434856939737429
Epoch: 42, step: 852, loss: 0.3270830810070038, mean loss: 0.3434854272689256
Epoch: 42, step: 853, loss: 0.3053276240825653, mean loss: 0.34348480683701793
Epoch: 42, step: 854, loss: 0.3440210521221161, mean loss: 0.34348481555602817
Epoch: 42, step: 855, loss: 0.32169216871261597, mean loss: 0.34348446122709275
Epoch: 42, step: 856, loss: 0.3585066795349121, mean loss: 0.34348470547094784
Epoch: 42, step: 857, loss: 0.35551974177360535, mean loss: 0.34348490114350505
Epoch: 42, step: 858, loss: 0.36666104197502136, mean loss: 0.3434852779484351
Epoch: 42, step: 859, loss: 0.3177682161331177, mean loss: 0.3434848598392165
Epoch: 42, step: 860, loss: 0.3145294785499573, mean loss: 0.34348438908889883
Epoch: 42, step: 861, loss: 0.4018227756023407, mean loss: 0.343485337526332
Epoch: 42, step: 862, loss: 0.3300078511238098, mean loss: 0.3434851184194015
Epoch: 42, step: 863, loss: 0.3353370726108551, mean loss: 0.34348498595669813
Epoch: 42, step: 864, loss: 0.335013210773468, mean loss: 0.3434848482333684
Epoch: 42, step: 865, loss: 0.3324582874774933, mean loss: 0.3434846689805031
Epoch: 42, step: 866, loss: 0.314269483089447, mean loss: 0.34348419405266617
Epoch: 42, step: 867, loss: 0.3125913143157959, mean loss: 0.34348369186007016
Epoch: 42, step: 868, loss: 0.32989007234573364, mean loss: 0.34348347088668857
Epoch: 42, step: 869, loss: 0.32666853070259094, mean loss: 0.34348319755302714
Epoch: 42, step: 870, loss: 0.32218703627586365, mean loss: 0.3434828513809295
Epoch: 42, step: 871, loss: 0.32234546542167664, mean loss: 0.34348250779533196
Epoch: 42, step: 872, loss: 0.3394504189491272, mean loss: 0.34348244225529123
Epoch: 42, step: 873, loss: 0.3309182822704315, mean loss: 0.34348223803306205
Epoch: 42, step: 874, loss: 0.3121805787086487, mean loss: 0.3434817292532671
Epoch: 42, step: 875, loss: 0.3442942798137665, mean loss: 0.3434817424603174
Epoch: 42, step: 876, loss: 0.36865219473838806, mean loss: 0.34348215156965956
Epoch: 42, step: 877, loss: 0.36286571621894836, mean loss: 0.34348246661638204
Epoch: 42, step: 878, loss: 0.29060545563697815, mean loss: 0.34348160720488824
Epoch: 42, step: 879, loss: 0.3045446276664734, mean loss: 0.343480974371389
Epoch: 42, step: 880, loss: 0.33076274394989014, mean loss: 0.3434807676683641
Epoch: 42, step: 881, loss: 0.31906038522720337, mean loss: 0.34348037078257765
Epoch: 42, step: 882, loss: 0.30923062562942505, mean loss: 0.343479814156728
Epoch: 42, step: 883, loss: 0.35778871178627014, mean loss: 0.3434800467007316
Epoch: 42, step: 884, loss: 0.3295530080795288, mean loss: 0.34347982036626684
Epoch: 42, step: 885, loss: 0.312679260969162, mean loss: 0.3434793198208871
Epoch: 42, step: 886, loss: 0.33941733837127686, mean loss: 0.3434792538099754
Epoch: 42, step: 887, loss: 0.31617072224617004, mean loss: 0.3434788100285862
Epoch: 42, step: 888, loss: 0.33552613854408264, mean loss: 0.3434786807946053
Epoch: 42, step: 889, loss: 0.34448471665382385, mean loss: 0.34347869714281065
Epoch: 42, step: 890, loss: 0.3140541613101959, mean loss: 0.3434782189982871
Epoch: 42, step: 891, loss: 0.30897313356399536, mean loss: 0.34347765830466614
Epoch: 42, step: 892, loss: 0.36213237047195435, mean loss: 0.3434779614312349
Epoch: 42, step: 893, loss: 0.3179660141468048, mean loss: 0.34347754688592785
Epoch: 42, step: 894, loss: 0.32259032130241394, mean loss: 0.3434772074935423
Epoch: 42, step: 895, loss: 0.3137120306491852, mean loss: 0.34347672385294625
Epoch: 42, step: 896, loss: 0.34416306018829346, mean loss: 0.3434767350047268
Epoch: 42, step: 897, loss: 0.3020668625831604, mean loss: 0.3434760621767214
Epoch: 42, step: 898, loss: 0.3222501277923584, mean loss: 0.34347571730313886
Epoch: 42, step: 899, loss: 0.3843742609024048, mean loss: 0.3434763818014751
Epoch: 42, step: 900, loss: 0.3690793812274933, mean loss: 0.3434767977789796
Epoch: 42, step: 901, loss: 0.32726237177848816, mean loss: 0.34347653434395115
Epoch: 42, step: 902, loss: 0.32265084981918335, mean loss: 0.3434761959955161
Epoch: 42, step: 903, loss: 0.3213927447795868, mean loss: 0.34347583721836483
Epoch: 42, step: 904, loss: 0.3732870817184448, mean loss: 0.34347632153666774
Epoch: 42, step: 905, loss: 0.3366814851760864, mean loss: 0.3434762111484499
Epoch: 42, step: 906, loss: 0.3223532736301422, mean loss: 0.3434758679929383
Epoch: 42, step: 907, loss: 0.3211287260055542, mean loss: 0.3434755049553467
Epoch: 42, step: 908, loss: 0.3178427517414093, mean loss: 0.3434750885485495
Epoch: 42, step: 909, loss: 0.3048609495162964, mean loss: 0.34347446126795184
Epoch: 42, step: 910, loss: 0.2978067696094513, mean loss: 0.3434737194155556
Epoch: 42, step: 911, loss: 0.33621931076049805, mean loss: 0.34347360157266
Epoch: 42, step: 912, loss: 0.32591184973716736, mean loss: 0.3434733162986743
Epoch: 42, step: 913, loss: 0.36197736859321594, mean loss: 0.3434736168745538
Epoch: 42, step: 914, loss: 0.35059890151023865, mean loss: 0.34347373261427794
Epoch: 42, step: 915, loss: 0.37481337785720825, mean loss: 0.3434742416722541
Epoch: 42, step: 916, loss: 0.31813275814056396, mean loss: 0.3434738300506585
Epoch: 42, step: 917, loss: 0.31808874011039734, mean loss: 0.3434734177274616
Epoch: 42, step: 918, loss: 0.3429124653339386, mean loss: 0.34347340861621056
Epoch: 42, step: 919, loss: 0.36210542917251587, mean loss: 0.34347371124128456
Epoch: 42, step: 920, loss: 0.36177870631217957, mean loss: 0.34347400854991506
Epoch: 42, step: 921, loss: 0.35763612389564514, mean loss: 0.34347423856640596
Epoch: 42, step: 922, loss: 0.35862237215042114, mean loss: 0.3434744845934899
Epoch: 42, step: 923, loss: 0.3558664619922638, mean loss: 0.34347468585343593
Epoch: 42, step: 924, loss: 0.3713415861129761, mean loss: 0.34347513843655286
Epoch: 42, step: 925, loss: 0.30327850580215454, mean loss: 0.3434744856182751
Epoch: 42, step: 926, loss: 0.33102577924728394, mean loss: 0.34347428344683584
Epoch: 42, step: 927, loss: 0.38109439611434937, mean loss: 0.34347489440098466
Epoch: 42, step: 928, loss: 0.3128730356693268, mean loss: 0.3434743974320071
Epoch: 42, step: 929, loss: 0.34975937008857727, mean loss: 0.34347449949723585
Epoch: 42, step: 930, loss: 0.32270005345344543, mean loss: 0.3434741621347252
Epoch: 42, step: 931, loss: 0.36370140314102173, mean loss: 0.34347449060567364
Epoch: 42, step: 932, loss: 0.3247586488723755, mean loss: 0.3434741866833318
Epoch: 42, step: 933, loss: 0.31344926357269287, mean loss: 0.34347369912327996
Epoch: 42, step: 934, loss: 0.3694382309913635, mean loss: 0.3434741207417764
Epoch: 42, step: 935, loss: 0.3460244834423065, mean loss: 0.34347416215452486
Epoch: 42, step: 936, loss: 0.316448450088501, mean loss: 0.34347372331857345
Epoch: 42, step: 937, loss: 0.3262302875518799, mean loss: 0.3434734433290342
Epoch: 42, step: 938, loss: 0.33360663056373596, mean loss: 0.3434732831196919
Epoch: 42, step: 939, loss: 0.34893450140953064, mean loss: 0.343473371793107
Epoch: 42, step: 940, loss: 0.33836033940315247, mean loss: 0.34347328877450967
Epoch: 42, step: 941, loss: 0.3368193805217743, mean loss: 0.3434731807389803
Epoch: 42, step: 942, loss: 0.3226442337036133, mean loss: 0.3434728425573136
Epoch: 42, step: 943, loss: 0.2939114570617676, mean loss: 0.3434720378848643
Epoch: 42, step: 944, loss: 0.3324844539165497, mean loss: 0.3434718594947231
Epoch: 42, step: 945, loss: 0.34825319051742554, mean loss: 0.3434719371212942
Epoch: 42, step: 946, loss: 0.3233686685562134, mean loss: 0.34347161074304006
Epoch: 42, step: 947, loss: 0.3483841121196747, mean loss: 0.34347169049661785
Epoch: 42, step: 948, loss: 0.3629193902015686, mean loss: 0.34347200622140484
Epoch: 42, step: 949, loss: 0.3096265196800232, mean loss: 0.3434714567638487
Epoch: 42, step: 950, loss: 0.2988305389881134, mean loss: 0.34347073206186046
Epoch: 42, step: 951, loss: 0.3338169753551483, mean loss: 0.3434705753450308
Epoch: 42, step: 952, loss: 0.3379763960838318, mean loss: 0.3434704861552569
Epoch: 42, step: 953, loss: 0.34661391377449036, mean loss: 0.34347053718326925
Epoch: 42, step: 954, loss: 0.2919996678829193, mean loss: 0.34346970165790036
Epoch: 42, step: 955, loss: 0.30447784066200256, mean loss: 0.34346906871424415
Epoch: 42, step: 956, loss: 0.3381771445274353, mean loss: 0.34346898281335647
Epoch: 42, step: 957, loss: 0.3014960289001465, mean loss: 0.34346830150059615
Epoch: 42, step: 958, loss: 0.3423067331314087, mean loss: 0.34346828264610935
Epoch: 42, step: 959, loss: 0.31603068113327026, mean loss: 0.343467837288339
Epoch: 42, step: 960, loss: 0.34735938906669617, mean loss: 0.34346790045365216
Epoch: 42, step: 961, loss: 0.31865379214286804, mean loss: 0.3434674976926018
Epoch: 42, step: 962, loss: 0.3151338994503021, mean loss: 0.34346703781371263
Epoch: 42, step: 963, loss: 0.337589830160141, mean loss: 0.34346694242308007
Epoch: 42, step: 964, loss: 0.3396592140197754, mean loss: 0.34346688062234965
Epoch: 42, step: 965, loss: 0.3633011281490326, mean loss: 0.34346720253372576
Epoch: 42, step: 966, loss: 0.34276896715164185, mean loss: 0.34346719120149527
Epoch: 42, step: 967, loss: 0.3271900415420532, mean loss: 0.34346692703066856
Epoch: 42, step: 968, loss: 0.313754677772522, mean loss: 0.34346644482203686
Epoch: 42, step: 969, loss: 0.35552316904067993, mean loss: 0.3434666404909034
Epoch: 42, step: 970, loss: 0.3103088438510895, mean loss: 0.3434661023809594
Epoch: 42, step: 971, loss: 0.408171683549881, mean loss: 0.3434671524553049
Epoch: 42, step: 972, loss: 0.33059436082839966, mean loss: 0.3434669435526317
Epoch: 42, step: 973, loss: 0.3466013967990875, mean loss: 0.3434669944184466
Epoch: 42, step: 974, loss: 0.3209598958492279, mean loss: 0.3434666291798414
Epoch: 42, step: 975, loss: 0.3220531642436981, mean loss: 0.3434662816940414
Epoch: 42, step: 976, loss: 0.3242133855819702, mean loss: 0.34346596927382056
Epoch: 42, step: 977, loss: 0.30721771717071533, mean loss: 0.34346538107643465
Epoch: 42, step: 978, loss: 0.33987146615982056, mean loss: 0.34346532275922115
Epoch: 42, step: 979, loss: 0.3047894537448883, mean loss: 0.34346469518946365
Epoch: 42, step: 980, loss: 0.3351593017578125, mean loss: 0.3434645604250925
Epoch: 42, step: 981, loss: 0.3340286314487457, mean loss: 0.34346440731899197
Epoch: 42, step: 982, loss: 0.31291037797927856, mean loss: 0.3434639115615105
Epoch: 42, step: 983, loss: 0.31259772181510925, mean loss: 0.34346341074716497
Epoch: 42, step: 984, loss: 0.3106929659843445, mean loss: 0.34346287904426615
Epoch: 42, step: 985, loss: 0.3802756369113922, mean loss: 0.34346347632430424
Epoch: 42, step: 986, loss: 0.3421870470046997, mean loss: 0.3434634556148158
Epoch: 42, step: 987, loss: 0.3042858839035034, mean loss: 0.34346281998674594
Epoch: 42, step: 988, loss: 0.3768090605735779, mean loss: 0.34346336099686303
Epoch: 42, step: 989, loss: 0.347711443901062, mean loss: 0.34346342991673234
Epoch: 42, step: 990, loss: 0.36053240299224854, mean loss: 0.3434637068351294
Epoch: 42, step: 991, loss: 0.32233262062072754, mean loss: 0.34346336402062233
Epoch: 42, step: 992, loss: 0.2957308292388916, mean loss: 0.34346258965721516
Epoch: 42, step: 993, loss: 0.3170475661754608, mean loss: 0.34346216113407374
Epoch: 42, step: 994, loss: 0.33449411392211914, mean loss: 0.3434620156504469
Epoch: 42, step: 995, loss: 0.306160569190979, mean loss: 0.3434614105397068
Epoch: 42, step: 996, loss: 0.3535275161266327, mean loss: 0.34346157383122417
Epoch: 42, step: 997, loss: 0.283209890127182, mean loss: 0.3434605964493388
Epoch: 42, step: 998, loss: 0.3290552496910095, mean loss: 0.3434603627745978
Epoch: 42, step: 999, loss: 0.3451424241065979, mean loss: 0.3434603900595273
Epoch: 42, step: 1000, loss: 0.3136729300022125, mean loss: 0.3434599068812104
Epoch: 42, step: 1001, loss: 0.34354913234710693, mean loss: 0.34345990832850104
Epoch: 42, step: 1002, loss: 0.31083083152770996, mean loss: 0.3434593790738774
Epoch: 42, step: 1003, loss: 0.2988828122615814, mean loss: 0.34345865603866665
Epoch: 42, step: 1004, loss: 0.3419165313243866, mean loss: 0.34345863102569546
Epoch: 42, step: 1005, loss: 0.3472040295600891, mean loss: 0.343458691774366
Epoch: 42, step: 1006, loss: 0.32840481400489807, mean loss: 0.3434584476112362
Epoch: 42, step: 1007, loss: 0.33215829730033875, mean loss: 0.3434582643338534
Epoch: 42, step: 1008, loss: 0.35781896114349365, mean loss: 0.3434584972465285
Epoch: 42, step: 1009, loss: 0.32555142045021057, mean loss: 0.34345820682068273
Epoch: 42, step: 1010, loss: 0.32761090993881226, mean loss: 0.34345794980553684
Epoch: 42, step: 1011, loss: 0.3043506145477295, mean loss: 0.343457315563966
Epoch: 42, step: 1012, loss: 0.3422926962375641, mean loss: 0.3434572966765116
Epoch: 42, step: 1013, loss: 0.33426177501678467, mean loss: 0.3434571475486588
Epoch: 42, step: 1014, loss: 0.2983197271823883, mean loss: 0.34345641554696626
Epoch: 42, step: 1015, loss: 0.31306999921798706, mean loss: 0.3434559227729599
Epoch: 42, step: 1016, loss: 0.3364669978618622, mean loss: 0.34345580943597925
Epoch: 42, step: 1017, loss: 0.3392806947231293, mean loss: 0.3434557417306844
Epoch: 42, step: 1018, loss: 0.35063812136650085, mean loss: 0.34345585820107594
Epoch: 42, step: 1019, loss: 0.33673015236854553, mean loss: 0.3434557491379341
Epoch: 42, step: 1020, loss: 0.3272762894630432, mean loss: 0.34345548677824483
Epoch: 42, step: 1021, loss: 0.32697051763534546, mean loss: 0.34345521946887003
Epoch: 42, step: 1022, loss: 0.3301905393600464, mean loss: 0.34345500438106363
Epoch: 42, step: 1023, loss: 0.3032826781272888, mean loss: 0.34345435299427135
Epoch: 42, step: 1024, loss: 0.3165011405944824, mean loss: 0.34345391596003594
Epoch: 42, step: 1025, loss: 0.3337852358818054, mean loss: 0.3434537591892723
Epoch: 42, step: 1026, loss: 0.36305782198905945, mean loss: 0.3434540770500392
Epoch: 42, step: 1027, loss: 0.32943230867385864, mean loss: 0.34345384970442056
Epoch: 42, step: 1028, loss: 0.3539368212223053, mean loss: 0.34345401967007255
Epoch: 42, step: 1029, loss: 0.3053577244281769, mean loss: 0.3434534020058285
Epoch: 42, step: 1030, loss: 0.3460597097873688, mean loss: 0.34345344426182783
Epoch: 42, step: 1031, loss: 0.3313881754875183, mean loss: 0.3434532486511149
Epoch: 42, step: 1032, loss: 0.30574342608451843, mean loss: 0.3434526372825805
Epoch: 42, step: 1033, loss: 0.3433775007724762, mean loss: 0.34345263606445353
Epoch: 42, step: 1034, loss: 0.3234519064426422, mean loss: 0.34345231181418
Epoch: 42, step: 1035, loss: 0.31480535864830017, mean loss: 0.3434518473995317
Epoch: 42, step: 1036, loss: 0.32079246640205383, mean loss: 0.3434514800593194
Epoch: 42, step: 1037, loss: 0.3359689712524414, mean loss: 0.34345135875936794
Epoch: 42, step: 1038, loss: 0.3064010739326477, mean loss: 0.34345075814197973
Epoch: 42, step: 1039, loss: 0.3660130798816681, mean loss: 0.343451123890938
Epoch: 42, step: 1040, loss: 0.32154718041419983, mean loss: 0.3434507688204477
Epoch: 42, step: 1041, loss: 0.36005669832229614, mean loss: 0.3434510380039378
Epoch: 42, step: 1042, loss: 0.3346237540245056, mean loss: 0.3434508949152542
Epoch: 42, step: 1043, loss: 0.3287356495857239, mean loss: 0.343450656387644
Epoch: 42, step: 1044, loss: 0.3280853033065796, mean loss: 0.3434504073261122
Epoch: 42, step: 1045, loss: 0.3303076922893524, mean loss: 0.3434501942954279
Epoch: 42, step: 1046, loss: 0.32281914353370667, mean loss: 0.343449859891493
Epoch: 42, step: 1047, loss: 0.33668842911720276, mean loss: 0.3434497502988002
Epoch: 42, step: 1048, loss: 0.3119729459285736, mean loss: 0.34344924011509
Epoch: 42, step: 1049, loss: 0.31322914361953735, mean loss: 0.34344875030834593
Epoch: 42, step: 1050, loss: 0.3568703830242157, mean loss: 0.34344896784238566
Epoch: 42, step: 1051, loss: 0.3537887930870056, mean loss: 0.34344913542464245
Epoch: 42, step: 1052, loss: 0.3720591068267822, mean loss: 0.3434495991119636
Epoch: 42, step: 1053, loss: 0.3187432587146759, mean loss: 0.34344919869803214
Epoch: 42, step: 1054, loss: 0.3264409005641937, mean loss: 0.34344892305020086
Epoch: 42, step: 1055, loss: 0.32464492321014404, mean loss: 0.34344861830496815
Epoch: 42, step: 1056, loss: 0.39008772373199463, mean loss: 0.3434493741449394
Epoch: 42, step: 1057, loss: 0.30732882022857666, mean loss: 0.34344878877959545
Epoch: 42, step: 1058, loss: 0.3508451282978058, mean loss: 0.3434489086418399
Epoch: 42, step: 1059, loss: 0.3290359675884247, mean loss: 0.34344867507502436
Epoch: 42, step: 1060, loss: 0.29711252450942993, mean loss: 0.3434479241934582
Epoch: 42, step: 1061, loss: 0.3160529136657715, mean loss: 0.34344748026199606
Epoch: 42, step: 1062, loss: 0.34211599826812744, mean loss: 0.34344745868590765
Epoch: 42, step: 1063, loss: 0.33856600522994995, mean loss: 0.34344737958535254
Epoch: 42, step: 1064, loss: 0.3044739067554474, mean loss: 0.3434467480575897
Epoch: 42, step: 1065, loss: 0.32605230808258057, mean loss: 0.34344646620193336
Epoch: 42, step: 1066, loss: 0.3408493995666504, mean loss: 0.34344642412032217
Epoch: 42, step: 1067, loss: 0.3146722614765167, mean loss: 0.34344595788526733
Epoch: 42, step: 1068, loss: 0.3269892930984497, mean loss: 0.3434456912380747
Epoch: 42, step: 1069, loss: 0.35461661219596863, mean loss: 0.3434458722374745
Epoch: 42, step: 1070, loss: 0.2947614789009094, mean loss: 0.343445083430246
Epoch: 42, step: 1071, loss: 0.3270115256309509, mean loss: 0.3434448171703983
Epoch: 42, step: 1072, loss: 0.37912678718566895, mean loss: 0.343445395287571
Epoch: 42, step: 1073, loss: 0.3424485921859741, mean loss: 0.34344537913768763
Epoch: 42, step: 1074, loss: 0.2896438539028168, mean loss: 0.34344450747679567
Epoch: 42, step: 1075, loss: 0.2694964110851288, mean loss: 0.34344330943233337
Epoch: 42, step: 1076, loss: 0.33043521642684937, mean loss: 0.34344309868963585
Epoch: 42, step: 1077, loss: 0.37964513897895813, mean loss: 0.3434436851854446
Epoch: 42, step: 1078, loss: 0.3098733425140381, mean loss: 0.34344314133360226
Epoch: 42, step: 1079, loss: 0.33664974570274353, mean loss: 0.3434430312798887
Epoch: 42, step: 1080, loss: 0.3609636127948761, mean loss: 0.34344331511052767
Epoch: 42, step: 1081, loss: 0.3309459984302521, mean loss: 0.3434431126592612
Epoch: 42, step: 1082, loss: 0.3239021897315979, mean loss: 0.34344279610966816
Epoch: 42, step: 1083, loss: 0.35583823919296265, mean loss: 0.3434429969041197
Epoch: 42, step: 1084, loss: 0.32628533244132996, mean loss: 0.3434427189706893
Epoch: 42, step: 1085, loss: 0.31119513511657715, mean loss: 0.34344219660726144
Epoch: 42, step: 1086, loss: 0.33315855264663696, mean loss: 0.343442030030053
Epoch: 42, step: 1087, loss: 0.34831520915031433, mean loss: 0.3434421089658299
Epoch: 42, step: 1088, loss: 0.3319862484931946, mean loss: 0.34344192340675717
Epoch: 42, step: 1089, loss: 0.34303709864616394, mean loss: 0.34344191684961634
Epoch: 42, step: 1090, loss: 0.3233667016029358, mean loss: 0.3434415916869923
Epoch: 42, step: 1091, loss: 0.328308641910553, mean loss: 0.34344134657928616
Epoch: 42, step: 1092, loss: 0.35051605105400085, mean loss: 0.3434414611661
Epoch: 42, step: 1093, loss: 0.3040655851364136, mean loss: 0.3434408234174681
Epoch: 42, step: 1094, loss: 0.3435826599597931, mean loss: 0.3434408257146766
Epoch: 42, step: 1095, loss: 0.3423056900501251, mean loss: 0.34344080733012644
Epoch: 42, step: 1096, loss: 0.2994519770145416, mean loss: 0.3434400949027183
Epoch: 42, step: 1097, loss: 0.30521199107170105, mean loss: 0.3434394757840089
Epoch: 42, step: 1098, loss: 0.3531830310821533, mean loss: 0.34343963358204443
Epoch: 42, step: 1099, loss: 0.35261908173561096, mean loss: 0.34343978224189015
Epoch: 42, step: 1100, loss: 0.33203908801078796, mean loss: 0.343439597612273
Epoch: 42, step: 1101, loss: 0.34554919600486755, mean loss: 0.3434396317758097
Epoch: 42, step: 1102, loss: 0.3430175483226776, mean loss: 0.34343962494056085
Epoch: 42, step: 1103, loss: 0.3066980540752411, mean loss: 0.34343902995463543
Epoch: 42, step: 1104, loss: 0.3724629580974579, mean loss: 0.34343949995492923
Epoch: 42, step: 1105, loss: 0.36973974108695984, mean loss: 0.34343992584217753
Epoch: 42, step: 1106, loss: 0.2981024384498596, mean loss: 0.3434391916913008
Epoch: 42, step: 1107, loss: 0.321052223443985, mean loss: 0.3434388291845282
Epoch: 42, step: 1108, loss: 0.4123685359954834, mean loss: 0.3434399453285574
Epoch: 42, step: 1109, loss: 0.3504604399204254, mean loss: 0.34344005900605007
Epoch: 42, step: 1110, loss: 0.33939605951309204, mean loss: 0.3434399935257234
Epoch: 42, step: 1111, loss: 0.32175132632255554, mean loss: 0.3434396423491171
Epoch: 42, step: 1112, loss: 0.29852738976478577, mean loss: 0.3434389151547293
Epoch: 42, step: 1113, loss: 0.3557749390602112, mean loss: 0.3434391148895809
Epoch: 42, step: 1114, loss: 0.3354843854904175, mean loss: 0.34343898609516677
Epoch: 42, step: 1115, loss: 0.3281126618385315, mean loss: 0.3434387379518429
Epoch: 42, step: 1116, loss: 0.34049680829048157, mean loss: 0.3434386903208276
Epoch: 42, step: 1117, loss: 0.34464725852012634, mean loss: 0.34343870988771225
Epoch: 42, step: 1118, loss: 0.3082636892795563, mean loss: 0.34343814040853066
Epoch: 42, step: 1119, loss: 0.3022194802761078, mean loss: 0.34343747309438527
Epoch: 42, step: 1120, loss: 0.37256258726119995, mean loss: 0.3434379446110711
Epoch: 42, step: 1121, loss: 0.31499022245407104, mean loss: 0.34343748406837793
Epoch: 42, step: 1122, loss: 0.28786107897758484, mean loss: 0.34343658435159996
Epoch: 42, step: 1123, loss: 0.34606796503067017, mean loss: 0.34343662694987553
Epoch: 42, step: 1124, loss: 0.3141099214553833, mean loss: 0.34343615220030055
Epoch: 42, step: 1125, loss: 0.3115693926811218, mean loss: 0.343435636339914
Epoch: 42, step: 1126, loss: 0.3084634244441986, mean loss: 0.3434350702175037
Epoch: 42, step: 1127, loss: 0.311639666557312, mean loss: 0.34343455552889224
Epoch: 42, step: 1128, loss: 0.36481621861457825, mean loss: 0.3434349016393069
Epoch: 42, step: 1129, loss: 0.33232080936431885, mean loss: 0.3434347217355827
Epoch: 42, step: 1130, loss: 0.3000123202800751, mean loss: 0.34343401886888925
Epoch: 42, step: 1131, loss: 0.32352766394615173, mean loss: 0.34343369665531004
Epoch: 42, step: 1132, loss: 0.3146308660507202, mean loss: 0.34343323044675717
Epoch: 42, step: 1133, loss: 0.3303923010826111, mean loss: 0.3434330193670031
Epoch: 42, step: 1134, loss: 0.3350769281387329, mean loss: 0.3434328841179665
Epoch: 42, step: 1135, loss: 0.3115604519844055, mean loss: 0.3434323682492605
Epoch: 42, step: 1136, loss: 0.32911044359207153, mean loss: 0.34343213644664405
Epoch: 42, step: 1137, loss: 0.34341534972190857, mean loss: 0.34343213617495266
Epoch: 42, step: 1138, loss: 0.35631364583969116, mean loss: 0.3434323446574759
Epoch: 42, step: 1139, loss: 0.3444456458091736, mean loss: 0.34343236105711905
Epoch: 42, step: 1140, loss: 0.3523743152618408, mean loss: 0.3434325057746935
Epoch: 42, step: 1141, loss: 0.34447309374809265, mean loss: 0.34343252261541163
Epoch: 42, step: 1142, loss: 0.3062500059604645, mean loss: 0.3434319208689331
Epoch: 42, step: 1143, loss: 0.3332284986972809, mean loss: 0.343431755743639
Epoch: 42, step: 1144, loss: 0.3204132616519928, mean loss: 0.3434313832339034
Epoch: 42, step: 1145, loss: 0.36738887429237366, mean loss: 0.3434317709332117
Epoch: 42, step: 1146, loss: 0.32234153151512146, mean loss: 0.34343142963958895
Epoch: 42, step: 1147, loss: 0.3364827334880829, mean loss: 0.34343131719386183
Epoch: 42, step: 1148, loss: 0.33853283524513245, mean loss: 0.34343123792655195
Epoch: 42, step: 1149, loss: 0.35086366534233093, mean loss: 0.34343135819626
Epoch: 42, step: 1150, loss: 0.35555607080459595, mean loss: 0.3434315543921953
Epoch: 42, step: 1151, loss: 0.3583166301250458, mean loss: 0.3434317952510259
Epoch: 42, step: 1152, loss: 0.34980785846710205, mean loss: 0.3434318984219004
Epoch: 42, step: 1153, loss: 0.29322168231010437, mean loss: 0.343431085985149
Epoch: 42, step: 1154, loss: 0.3450285792350769, mean loss: 0.34343111183329955
Epoch: 42, step: 1155, loss: 0.34269505739212036, mean loss: 0.34343109992380433
Epoch: 42, step: 1156, loss: 0.32719433307647705, mean loss: 0.34343083721420403
Epoch: 42, step: 1157, loss: 0.32783401012420654, mean loss: 0.34343058486286127
Epoch: 42, step: 1158, loss: 0.3690371811389923, mean loss: 0.3434309991621522
Epoch: 42, step: 1159, loss: 0.31531620025634766, mean loss: 0.3434305442890143
Epoch: 42, step: 1160, loss: 0.31109997630119324, mean loss: 0.3434300212168406
Epoch: 42, step: 1161, loss: 0.3178499937057495, mean loss: 0.3434296073675037
Epoch: 42, step: 1162, loss: 0.29126226902008057, mean loss: 0.3434287633860385
Epoch: 42, step: 1163, loss: 0.31078508496284485, mean loss: 0.34342823527372335
Epoch: 42, step: 1164, loss: 0.32621070742607117, mean loss: 0.34342795673154214
Epoch: 42, step: 1165, loss: 0.3010508120059967, mean loss: 0.3434272711725308
Epoch: 42, step: 1166, loss: 0.3684728741645813, mean loss: 0.3434276763428453
Epoch: 42, step: 1167, loss: 0.32843488454818726, mean loss: 0.3434274338038296
Epoch: 42, step: 1168, loss: 0.3275773525238037, mean loss: 0.3434271774005541
Epoch: 42, step: 1169, loss: 0.3229750394821167, mean loss: 0.34342684655617356
Epoch: 42, step: 1170, loss: 0.3884345591068268, mean loss: 0.34342757461247586
Epoch: 42, step: 1171, loss: 0.35861262679100037, mean loss: 0.3434278202458013
Epoch: 42, step: 1172, loss: 0.3936534523963928, mean loss: 0.343428632682225
Epoch: 42, step: 1173, loss: 0.2990912199020386, mean loss: 0.3434279155036675
Epoch: 42, step: 1174, loss: 0.33683064579963684, mean loss: 0.34342780879144547
Epoch: 42, step: 1175, loss: 0.3365470767021179, mean loss: 0.3434276974959601
Epoch: 42, step: 1176, loss: 0.3276059031486511, mean loss: 0.34342744158339483
Epoch: 42, step: 1177, loss: 0.3568260371685028, mean loss: 0.3434276582979742
Epoch: 42, step: 1178, loss: 0.3376123309135437, mean loss: 0.34342756423991894
Epoch: 42, step: 1179, loss: 0.32679805159568787, mean loss: 0.34342729527581456
Epoch: 42, step: 1180, loss: 0.31296056509017944, mean loss: 0.34342680251788243
Epoch: 42, step: 1181, loss: 0.3151985704898834, mean loss: 0.3434263459719981
Epoch: 42, step: 1182, loss: 0.3159901201725006, mean loss: 0.34342590224270697
Epoch: 42, step: 1183, loss: 0.3314550518989563, mean loss: 0.34342570863987437
Epoch: 42, step: 1184, loss: 0.3428466022014618, mean loss: 0.3434256992742211
Epoch: 42, step: 1185, loss: 0.33374086022377014, mean loss: 0.343425542647785
Epoch: 42, step: 1186, loss: 0.3742122948169708, mean loss: 0.3434260405333218
Epoch: 42, step: 1187, loss: 0.3177025020122528, mean loss: 0.3434256245371623
Epoch: 42, step: 1188, loss: 0.34695300459861755, mean loss: 0.3434256815803575
Epoch: 42, step: 1189, loss: 0.3191879987716675, mean loss: 0.34342528962585045
Epoch: 42, step: 1190, loss: 0.3071635365486145, mean loss: 0.34342470323614366
Epoch: 42, step: 1191, loss: 0.3711608052253723, mean loss: 0.3434251517500827
Epoch: 42, step: 1192, loss: 0.3376213312149048, mean loss: 0.3434250578993925
Epoch: 42, step: 1193, loss: 0.3394935727119446, mean loss: 0.34342499432633233
Epoch: 42, step: 1194, loss: 0.33661022782325745, mean loss: 0.34342488413170236
Epoch: 42, step: 1195, loss: 0.3223617672920227, mean loss: 0.3434245435470565
Epoch: 42, step: 1196, loss: 0.3562989830970764, mean loss: 0.343424751719739
Epoch: 42, step: 1197, loss: 0.3591213822364807, mean loss: 0.34342500552161004
Epoch: 42, step: 1198, loss: 0.3457809090614319, mean loss: 0.34342504361405657
Epoch: 42, step: 1199, loss: 0.35032719373703003, mean loss: 0.3434251552126551
Epoch: 42, step: 1200, loss: 0.31404751539230347, mean loss: 0.34342468022292494
Epoch: 42, step: 1201, loss: 0.35025495290756226, mean loss: 0.3434247906557897
Epoch: 42, step: 1202, loss: 0.30944326519966125, mean loss: 0.3434242412463144
Epoch: 42, step: 1203, loss: 0.3730160593986511, mean loss: 0.3434247196757613
Epoch: 42, step: 1204, loss: 0.35298195481300354, mean loss: 0.34342487419106593
Epoch: 42, step: 1205, loss: 0.3557962477207184, mean loss: 0.34342507420033824
Epoch: 42, step: 1206, loss: 0.3343987464904785, mean loss: 0.34342492827312604
Epoch: 42, step: 1207, loss: 0.3422667384147644, mean loss: 0.3434249095491565
Epoch: 42, step: 1208, loss: 0.32266050577163696, mean loss: 0.34342457386517933
Epoch: 42, step: 1209, loss: 0.396531343460083, mean loss: 0.34342543239228324
Epoch: 42, step: 1210, loss: 0.3400179445743561, mean loss: 0.3434253773075289
Epoch: 42, step: 1211, loss: 0.32984307408332825, mean loss: 0.3434251577423297
Epoch: 42, step: 1212, loss: 0.35021883249282837, mean loss: 0.34342526756394187
Epoch: 42, step: 1213, loss: 0.32387998700141907, mean loss: 0.3434249516142383
Epoch: 42, step: 1214, loss: 0.34275123476982117, mean loss: 0.34342494072377316
Epoch: 42, step: 1215, loss: 0.38153359293937683, mean loss: 0.343425556730695
Epoch: 42, step: 1216, loss: 0.30916187167167664, mean loss: 0.3434250028846583
Epoch: 42, step: 1217, loss: 0.340178906917572, mean loss: 0.3434249504148693
Epoch: 42, step: 1218, loss: 0.3087235689163208, mean loss: 0.3434243895119405
Epoch: 42, step: 1219, loss: 0.317417711019516, mean loss: 0.34342396915442946
Epoch: 42, step: 1220, loss: 0.3531995713710785, mean loss: 0.34342412715928194
Epoch: 42, step: 1221, loss: 0.3032122850418091, mean loss: 0.343423477218404
Epoch: 42, step: 1222, loss: 0.2961369454860687, mean loss: 0.34342271294222076
Epoch: 42, step: 1223, loss: 0.35807397961616516, mean loss: 0.3434229497418502
Epoch: 42, step: 1224, loss: 0.3444516658782959, mean loss: 0.343422966368103
Epoch: 42, step: 1225, loss: 0.3244829773902893, mean loss: 0.3434226602623239
Epoch: 42, step: 1226, loss: 0.335793673992157, mean loss: 0.34342253696557606
Epoch: 42, step: 1227, loss: 0.34315651655197144, mean loss: 0.3434225326663257
Epoch: 42, step: 1228, loss: 0.34737640619277954, mean loss: 0.3434225965652466
Epoch: 42, step: 1229, loss: 0.3041302263736725, mean loss: 0.3434219615678292
Epoch: 42, step: 1230, loss: 0.3092029094696045, mean loss: 0.34342140856839326
Epoch: 42, step: 1231, loss: 0.3237866759300232, mean loss: 0.3434210912650216
Epoch: 42, step: 1232, loss: 0.3141283690929413, mean loss: 0.3434206178931923
Epoch: 42, step: 1233, loss: 0.3205910921096802, mean loss: 0.34342024897289586
Epoch: 42, step: 1234, loss: 0.3167833089828491, mean loss: 0.34341981853254894
Epoch: 42, step: 1235, loss: 0.33353662490844727, mean loss: 0.343419658827397
Epoch: 42, step: 1236, loss: 0.3449437618255615, mean loss: 0.3434196834553844
Epoch: 42, step: 1237, loss: 0.3150022327899933, mean loss: 0.34341922426508825
Epoch: 42, step: 1238, loss: 0.35130950808525085, mean loss: 0.34341935176010047
Epoch: 42, step: 1239, loss: 0.31962528824806213, mean loss: 0.34341896729035654
Epoch: 42, step: 1240, loss: 0.3265572786331177, mean loss: 0.343418694839862
Epoch: 42, step: 1241, loss: 0.36822807788848877, mean loss: 0.3434190957024092
Epoch: 42, step: 1242, loss: 0.3619239628314972, mean loss: 0.34341939469365396
Epoch: 42, step: 1243, loss: 0.3545520603656769, mean loss: 0.3434195745661039
Epoch: 42, step: 1244, loss: 0.31616804003715515, mean loss: 0.34341913426535053
Epoch: 42, step: 1245, loss: 0.3570791482925415, mean loss: 0.3434193549654835
Epoch: 42, step: 1246, loss: 0.31609395146369934, mean loss: 0.34341891348550124
Epoch: 42, step: 1247, loss: 0.33916616439819336, mean loss: 0.34341884477752194
Epoch: 42, step: 1248, loss: 0.32830119132995605, mean loss: 0.34341860053865014
Epoch: 42, step: 1249, loss: 0.35730621218681335, mean loss: 0.3434188249014995
Epoch: 42, step: 1250, loss: 0.33297744393348694, mean loss: 0.3434186562173371
Epoch: 42, step: 1251, loss: 0.3679063022136688, mean loss: 0.34341905181743393
Epoch: 42, step: 1252, loss: 0.37085244059562683, mean loss: 0.34341949499910757
Epoch: 42, step: 1253, loss: 0.3812188506126404, mean loss: 0.34342010563132647
Epoch: 42, step: 1254, loss: 0.29856815934181213, mean loss: 0.34341938107926456
Epoch: 42, step: 1255, loss: 0.36683711409568787, mean loss: 0.3434197593703769
Epoch: 42, step: 1256, loss: 0.30913349986076355, mean loss: 0.3434192055175458
Epoch: 42, step: 1257, loss: 0.3336835205554962, mean loss: 0.34341904825193403
Epoch: 42, step: 1258, loss: 0.3149145543575287, mean loss: 0.3434185878113717
Epoch: 42, step: 1259, loss: 0.3153019845485687, mean loss: 0.34341813364384466
Epoch: 42, step: 1260, loss: 0.3474871516227722, mean loss: 0.3434181993696354
Epoch: 42, step: 1261, loss: 0.3429224193096161, mean loss: 0.3434181913615582
Epoch: 42, step: 1262, loss: 0.29833874106407166, mean loss: 0.3434174632284268
Epoch: 42, step: 1263, loss: 0.31319817900657654, mean loss: 0.3434169751278288
Epoch: 42, step: 1264, loss: 0.3625366687774658, mean loss: 0.3434172839433223
Epoch: 42, step: 1265, loss: 0.3362042009830475, mean loss: 0.3434171674416755
Epoch: 42, step: 1266, loss: 0.3327025771141052, mean loss: 0.3434169943884521
Epoch: 42, step: 1267, loss: 0.3506131172180176, mean loss: 0.34341711061241403
Epoch: 42, step: 1268, loss: 0.3388682007789612, mean loss: 0.34341703714454846
Epoch: 42, step: 1269, loss: 0.33819466829299927, mean loss: 0.34341695280124196
Epoch: 42, step: 1270, loss: 0.3408429026603699, mean loss: 0.3434169112299934
Epoch: 42, step: 1271, loss: 0.3279024660587311, mean loss: 0.34341666067370835
Epoch: 42, step: 1272, loss: 0.3152792155742645, mean loss: 0.34341620626494396
Epoch: 42, step: 1273, loss: 0.3291188180446625, mean loss: 0.3434159753714292
Epoch: 42, step: 1274, loss: 0.37330085039138794, mean loss: 0.34341645798491727
Epoch: 42, step: 1275, loss: 0.35147878527641296, mean loss: 0.34341658818205073
Epoch: 42, step: 1276, loss: 0.3091515898704529, mean loss: 0.34341603485143607
Epoch: 42, step: 1277, loss: 0.3294154703617096, mean loss: 0.34341580876603595
Epoch: 42, step: 1278, loss: 0.3129940927028656, mean loss: 0.3434153175147875
Epoch: 42, step: 1279, loss: 0.3133351802825928, mean loss: 0.343414831787213
Epoch: 42, step: 1280, loss: 0.32352331280708313, mean loss: 0.3434145105884373
Epoch: 42, step: 1281, loss: 0.3183133602142334, mean loss: 0.34341410527355964
Epoch: 42, step: 1282, loss: 0.37556201219558716, mean loss: 0.34341462436588693
Epoch: 42, step: 1283, loss: 0.31895244121551514, mean loss: 0.3434142293813369
Epoch: 42, step: 1284, loss: 0.3131716549396515, mean loss: 0.34341374107018713
Epoch: 42, step: 1285, loss: 0.31105878949165344, mean loss: 0.34341321866001534
Epoch: 42, step: 1286, loss: 0.312787264585495, mean loss: 0.343412724174602
Epoch: 42, step: 1287, loss: 0.3342727720737457, mean loss: 0.34341257660368846
Epoch: 42, step: 1288, loss: 0.41915321350097656, mean loss: 0.3434137994694536
Epoch: 42, step: 1289, loss: 0.3377548158168793, mean loss: 0.34341370810415844
Epoch: 42, step: 1290, loss: 0.35261327028274536, mean loss: 0.34341385663032414
Epoch: 42, step: 1291, loss: 0.3374350666999817, mean loss: 0.3434137601048167
Epoch: 42, step: 1292, loss: 0.31362611055374146, mean loss: 0.34341327920122217
Epoch: 42, step: 1293, loss: 0.3192756474018097, mean loss: 0.3434128895200398
Epoch: 42, step: 1294, loss: 0.3509853184223175, mean loss: 0.3434130117683794
Epoch: 42, step: 1295, loss: 0.32130637764930725, mean loss: 0.3434126548874205
Epoch: 42, step: 1296, loss: 0.31933948397636414, mean loss: 0.3434122662657253
Epoch: 42, step: 1297, loss: 0.36840328574180603, mean loss: 0.3434126696980611
Epoch: 42, step: 1298, loss: 0.3089093863964081, mean loss: 0.34341211271736305
Epoch: 42, step: 1299, loss: 0.3426153063774109, mean loss: 0.34341209985486
Epoch: 42, step: 1300, loss: 0.29968827962875366, mean loss: 0.34341139405137283
Epoch: 42, step: 1301, loss: 0.3237772583961487, mean loss: 0.3434110771161726
Epoch: 42, step: 1302, loss: 0.31629225611686707, mean loss: 0.3434106393698731
Epoch: 42, step: 1303, loss: 0.33252111077308655, mean loss: 0.3434104635962323
Epoch: 42, step: 1304, loss: 0.28939369320869446, mean loss: 0.3434095916970444
Epoch: 42, step: 1305, loss: 0.3828912377357483, mean loss: 0.3434102289706028
Epoch: 42, step: 1306, loss: 0.31247156858444214, mean loss: 0.3434097295975032
Epoch: 42, step: 1307, loss: 0.32453829050064087, mean loss: 0.34340942500328964
Epoch: 42, step: 1308, loss: 0.34117841720581055, mean loss: 0.34340938899431894
Epoch: 42, step: 1309, loss: 0.31412947177886963, mean loss: 0.34340891641745697
Epoch: 42, step: 1310, loss: 0.3507411479949951, mean loss: 0.3434090347575137
Epoch: 42, step: 1311, loss: 0.31184452772140503, mean loss: 0.34340852532389465
Epoch: 42, step: 1312, loss: 0.28772351145744324, mean loss: 0.3434076266131917
Epoch: 42, step: 1313, loss: 0.33135929703712463, mean loss: 0.3434074321661181
Epoch: 42, step: 1314, loss: 0.3025422990322113, mean loss: 0.3434067726574898
Epoch: 42, step: 1315, loss: 0.3151453137397766, mean loss: 0.343406316562678
Epoch: 42, step: 1316, loss: 0.334545373916626, mean loss: 0.3434061735635229
Epoch: 42, step: 1317, loss: 0.30276787281036377, mean loss: 0.343405517747418
Epoch: 42, step: 1318, loss: 0.35470741987228394, mean loss: 0.3434057001332383
Epoch: 42, step: 1319, loss: 0.3381977677345276, mean loss: 0.343405616090952
Epoch: 42, step: 1320, loss: 0.30897051095962524, mean loss: 0.34340506040818913
Epoch: 42, step: 1321, loss: 0.33918946981430054, mean loss: 0.3434049923818765
Epoch: 42, step: 1322, loss: 0.29791712760925293, mean loss: 0.34340425836330696
Epoch: 42, step: 1323, loss: 0.34797951579093933, mean loss: 0.3434043321911232
Epoch: 42, step: 1324, loss: 0.3832746744155884, mean loss: 0.3434049755413277
Epoch: 42, step: 1325, loss: 0.30820831656455994, mean loss: 0.3434044076151171
Epoch: 42, step: 1326, loss: 0.4379432499408722, mean loss: 0.3434059330502494
Epoch: 42, step: 1327, loss: 0.309533029794693, mean loss: 0.3434053865015329
Epoch: 42, step: 1328, loss: 0.32357245683670044, mean loss: 0.34340506649685915
Epoch: 42, step: 1329, loss: 0.3212617337703705, mean loss: 0.34340470921955546
Epoch: 42, step: 1330, loss: 0.3180992901325226, mean loss: 0.3434043009293429
Epoch: 42, step: 1331, loss: 0.325759619474411, mean loss: 0.34340401624587313
Epoch: 42, step: 1332, loss: 0.336626261472702, mean loss: 0.3434039068937366
Epoch: 42, step: 1333, loss: 0.31900089979171753, mean loss: 0.34340351318254464
Epoch: 42, step: 1334, loss: 0.34066304564476013, mean loss: 0.3434034689693323
Epoch: 42, step: 1335, loss: 0.30126628279685974, mean loss: 0.3434027891618631
Epoch: 42, step: 1336, loss: 0.34070125222206116, mean loss: 0.3434027455781422
Epoch: 42, step: 1337, loss: 0.33098483085632324, mean loss: 0.34340254524395836
Epoch: 42, step: 1338, loss: 0.31928202509880066, mean loss: 0.3434021561217207
Epoch: 42, step: 1339, loss: 0.3492662012577057, mean loss: 0.34340225072140346
Epoch: 42, step: 1340, loss: 0.31883203983306885, mean loss: 0.3434018543573568
Epoch: 42, step: 1341, loss: 0.3253471255302429, mean loss: 0.34340156310507697
Epoch: 42, step: 1342, loss: 0.36887457966804504, mean loss: 0.34340197401983175
Epoch: 42, step: 1343, loss: 0.3076936602592468, mean loss: 0.3434013980049627
Epoch: 42, step: 1344, loss: 0.3136228919029236, mean loss: 0.34340091765224384
Epoch: 42, step: 1345, loss: 0.3294009268283844, mean loss: 0.3434006918240859
Epoch: 42, step: 1346, loss: 0.3399558663368225, mean loss: 0.34340063625790335
Epoch: 42, step: 1347, loss: 0.3420887887477875, mean loss: 0.34340061509770736
Epoch: 42, step: 1348, loss: 0.31737327575683594, mean loss: 0.3434001952815979
Epoch: 42, step: 1349, loss: 0.31787168979644775, mean loss: 0.3433997835182267
Epoch: 42, step: 1350, loss: 0.32870200276374817, mean loss: 0.3433995464534232
Epoch: 42, step: 1351, loss: 0.30619144439697266, mean loss: 0.34339894632274487
Epoch: 42, step: 1352, loss: 0.31014284491539, mean loss: 0.3433984099426638
Epoch: 42, step: 1353, loss: 0.35756441950798035, mean loss: 0.34339863841931884
Epoch: 42, step: 1354, loss: 0.30219927430152893, mean loss: 0.3433979739455979
Epoch: 42, step: 1355, loss: 0.3648342788219452, mean loss: 0.34339831967014595
Epoch: 42, step: 1356, loss: 0.33031758666038513, mean loss: 0.3433981087075944
Epoch: 42, step: 1357, loss: 0.30920735001564026, mean loss: 0.34339755729710686
Epoch: 42, step: 1358, loss: 0.3276110887527466, mean loss: 0.3433973027053907
Epoch: 42, step: 1359, loss: 0.3343883156776428, mean loss: 0.3433971574178951
Epoch: 42, step: 1360, loss: 0.33155179023742676, mean loss: 0.3433969663913154
Epoch: 42, step: 1361, loss: 0.31662148237228394, mean loss: 0.343396534598314
Epoch: 42, step: 1362, loss: 0.3090488016605377, mean loss: 0.34339598070089355
Epoch: 42, step: 1363, loss: 0.3604006767272949, mean loss: 0.3433962549171102
Epoch: 42, step: 1364, loss: 0.35036566853523254, mean loss: 0.34339636730344236
Epoch: 42, step: 1365, loss: 0.3174888789653778, mean loss: 0.34339594953506203
Epoch: 42, step: 1366, loss: 0.33777564764022827, mean loss: 0.3433958589069576
Epoch: 42, step: 1367, loss: 0.3228713870048523, mean loss: 0.34339552795249584
Epoch: 42, step: 1368, loss: 0.34317150712013245, mean loss: 0.34339552434024706
Epoch: 42, step: 1369, loss: 0.349035382270813, mean loss: 0.3433956152792959
Epoch: 42, step: 1370, loss: 0.3480435609817505, mean loss: 0.3433956902231954
Epoch: 42, step: 1371, loss: 0.33640146255493164, mean loss: 0.3433955774494503
Epoch: 42, step: 1372, loss: 0.3225245475769043, mean loss: 0.3433952409339173
Epoch: 42, step: 1373, loss: 0.34913402795791626, mean loss: 0.3433953334621658
Epoch: 42, step: 1374, loss: 0.31352755427360535, mean loss: 0.3433948519024349
Epoch: 42, step: 1375, loss: 0.35464078187942505, mean loss: 0.3433950332182155
Epoch: 42, step: 1376, loss: 0.34123462438583374, mean loss: 0.34339499838695664
Epoch: 42, step: 1377, loss: 0.3369450271129608, mean loss: 0.34339489439876986
Epoch: 42, step: 1378, loss: 0.32500791549682617, mean loss: 0.3433945979636867
Epoch: 42, step: 1379, loss: 0.3243817985057831, mean loss: 0.34339429144405914
Epoch: 42, step: 1380, loss: 0.31649067997932434, mean loss: 0.34339385771771397
Epoch: 42, step: 1381, loss: 0.3244899809360504, mean loss: 0.34339355296393703
Epoch: 42, step: 1382, loss: 0.3142528831958771, mean loss: 0.34339308318802225
Epoch: 42, step: 1383, loss: 0.33778613805770874, mean loss: 0.34339299280007524
Epoch: 42, step: 1384, loss: 0.3645564913749695, mean loss: 0.3433933339652385
Epoch: 42, step: 1385, loss: 0.30959925055503845, mean loss: 0.34339278919812033
Epoch: 42, step: 1386, loss: 0.3242405652999878, mean loss: 0.34339248046556775
Epoch: 42, step: 1387, loss: 0.3588795065879822, mean loss: 0.343392730111356
Epoch: 42, step: 1388, loss: 0.333224892616272, mean loss: 0.3433925662117881
Epoch: 42, step: 1389, loss: 0.3362800180912018, mean loss: 0.3433924515635383
Epoch: 42, step: 1390, loss: 0.31680595874786377, mean loss: 0.3433920230187066
Epoch: 42, step: 1391, loss: 0.36543336510658264, mean loss: 0.3433923782950136
Epoch: 42, step: 1392, loss: 0.3091316521167755, mean loss: 0.3433918260678384
Epoch: 42, step: 1393, loss: 0.30689916014671326, mean loss: 0.3433912378749059
Epoch: 42, step: 1394, loss: 0.30673322081565857, mean loss: 0.3433906470263483
Epoch: 42, step: 1395, loss: 0.31720083951950073, mean loss: 0.34339022490966487
Epoch: 42, step: 1396, loss: 0.3304545283317566, mean loss: 0.3433900164207201
Epoch: 42, step: 1397, loss: 0.36589178442955017, mean loss: 0.3433903790833899
Epoch: 42, step: 1398, loss: 0.33376678824424744, mean loss: 0.34339022398175983
Epoch: 42, step: 1399, loss: 0.37414678931236267, mean loss: 0.3433907196716343
Epoch: 42, step: 1400, loss: 0.3190804719924927, mean loss: 0.34339032788050666
Epoch: 42, step: 1401, loss: 0.35299935936927795, mean loss: 0.34339048273999884
Epoch: 42, step: 1402, loss: 0.31063881516456604, mean loss: 0.3433899549214693
Epoch: 42, step: 1403, loss: 0.30756714940071106, mean loss: 0.3433893776184731
Epoch: 42, step: 1404, loss: 0.3183428943157196, mean loss: 0.3433889739879749
Epoch: 42, step: 1405, loss: 0.33070236444473267, mean loss: 0.34338876954330505
Epoch: 42, step: 1406, loss: 0.33158785104751587, mean loss: 0.343388579374608
Epoch: 42, step: 1407, loss: 0.31552383303642273, mean loss: 0.3433881303487871
Epoch: 42, step: 1408, loss: 0.32980573177337646, mean loss: 0.3433879114790613
Epoch: 42, step: 1409, loss: 0.35722416639328003, mean loss: 0.3433881344358906
Epoch: 42, step: 1410, loss: 0.34031203389167786, mean loss: 0.3433880848685346
Epoch: 42, step: 1411, loss: 0.34735432267189026, mean loss: 0.34338814877826396
Epoch: 42, step: 1412, loss: 0.3432301878929138, mean loss: 0.34338814623301195
Epoch: 42, step: 1413, loss: 0.3211536109447479, mean loss: 0.3433877879697383
Epoch: 42, step: 1414, loss: 0.3514176905155182, mean loss: 0.3433879173528256
Epoch: 42, step: 1415, loss: 0.3163377344608307, mean loss: 0.34338748150945597
Epoch: 42, step: 1416, loss: 0.31606847047805786, mean loss: 0.343387041341712
Epoch: 42, step: 1417, loss: 0.3296923041343689, mean loss: 0.34338682069373716
Epoch: 42, step: 1418, loss: 0.33100759983062744, mean loss: 0.3433866212444185
Epoch: 42, step: 1419, loss: 0.3645719289779663, mean loss: 0.3433869625685748
Epoch: 42, step: 1420, loss: 0.34702491760253906, mean loss: 0.34338702118004
Epoch: 42, step: 1421, loss: 0.3296152949333191, mean loss: 0.34338679930592614
Epoch: 42, step: 1422, loss: 0.3369606137275696, mean loss: 0.34338669577632974
Epoch: 42, step: 1423, loss: 0.32054129242897034, mean loss: 0.34338632772949146
Epoch: 42, step: 1424, loss: 0.31238093972206116, mean loss: 0.3433858282307076
Epoch: 42, step: 1425, loss: 0.31352895498275757, mean loss: 0.3433853472423188
Epoch: 42, step: 1426, loss: 0.3475710451602936, mean loss: 0.34338541467200734
Epoch: 42, step: 1427, loss: 0.32754456996917725, mean loss: 0.3433851594873192
Epoch: 42, step: 1428, loss: 0.3081565201282501, mean loss: 0.34338459198825577
Epoch: 42, step: 1429, loss: 0.32572558522224426, mean loss: 0.34338430752344107
Epoch: 42, step: 1430, loss: 0.3137497007846832, mean loss: 0.34338383015417384
Epoch: 42, step: 1431, loss: 0.3999245762825012, mean loss: 0.34338474092650195
Epoch: 42, step: 1432, loss: 0.29885491728782654, mean loss: 0.3433840236406393
Epoch: 42, step: 1433, loss: 0.325871080160141, mean loss: 0.3433837415469007
Epoch: 42, step: 1434, loss: 0.291420042514801, mean loss: 0.3433829045432277
Epoch: 42, step: 1435, loss: 0.31348052620887756, mean loss: 0.34338242289935267
Epoch: 42, step: 1436, loss: 0.33895695209503174, mean loss: 0.34338235161851505
Epoch: 42, step: 1437, loss: 0.29569298028945923, mean loss: 0.34338158350056047
Epoch: 42, step: 1438, loss: 0.3034221827983856, mean loss: 0.34338093989721835
Epoch: 42, step: 1439, loss: 0.3290838897228241, mean loss: 0.34338070962647077
Epoch: 42, step: 1440, loss: 0.36484694480895996, mean loss: 0.3433810553597759
Epoch: 42, step: 1441, loss: 0.3445413410663605, mean loss: 0.34338107404693496
Epoch: 42, step: 1442, loss: 0.29333946108818054, mean loss: 0.3433802681070571
Epoch: 42, step: 1443, loss: 0.32574620842933655, mean loss: 0.3433799841081574
Valid: 42, mean loss: 0.18588629613320032
Epoch: 43, step: 0, loss: 0.32870301604270935, mean loss: 0.34337974773742214
Epoch: 43, step: 1, loss: 0.3113906979560852, mean loss: 0.34337923256607256
Epoch: 43, step: 2, loss: 0.32561126351356506, mean loss: 0.3433789464243695
Epoch: 43, step: 3, loss: 0.35580724477767944, mean loss: 0.34337914657089025
Epoch: 43, step: 4, loss: 0.3504347801208496, mean loss: 0.3433792601936667
Epoch: 43, step: 5, loss: 0.33765631914138794, mean loss: 0.34337916803383783
Epoch: 43, step: 6, loss: 0.3518134355545044, mean loss: 0.3433793038535374
Epoch: 43, step: 7, loss: 0.33792901039123535, mean loss: 0.343379216087137
Epoch: 43, step: 8, loss: 0.33589136600494385, mean loss: 0.34337909551178264
Epoch: 43, step: 9, loss: 0.3740144670009613, mean loss: 0.3433795888191075
Epoch: 43, step: 10, loss: 0.3246782720088959, mean loss: 0.3433792876852362
Epoch: 43, step: 11, loss: 0.3398296535015106, mean loss: 0.343379230528947
Epoch: 43, step: 12, loss: 0.3129620850086212, mean loss: 0.3433787407592743
Epoch: 43, step: 13, loss: 0.34837228059768677, mean loss: 0.3433788211627754
Epoch: 43, step: 14, loss: 0.30849942564964294, mean loss: 0.34337825956109586
Epoch: 43, step: 15, loss: 0.33591172099113464, mean loss: 0.3433781393424675
Epoch: 43, step: 16, loss: 0.3124275207519531, mean loss: 0.34337764101503365
Epoch: 43, step: 17, loss: 0.34310516715049744, mean loss: 0.3433776366280772
Epoch: 43, step: 18, loss: 0.3111211359500885, mean loss: 0.3433771172917168
Epoch: 43, step: 19, loss: 0.3464074432849884, mean loss: 0.34337716607980917
Epoch: 43, step: 20, loss: 0.30460771918296814, mean loss: 0.3433765419037607
Epoch: 43, step: 21, loss: 0.3021279573440552, mean loss: 0.3433758778250577
Epoch: 43, step: 22, loss: 0.31838423013687134, mean loss: 0.34337547548025066
Epoch: 43, step: 23, loss: 0.32646480202674866, mean loss: 0.3433752032368117
Epoch: 43, step: 24, loss: 0.28279605507850647, mean loss: 0.3433742279941542
Epoch: 43, step: 25, loss: 0.3161393404006958, mean loss: 0.34337378955622005
Epoch: 43, step: 26, loss: 0.3824070692062378, mean loss: 0.34337441791919515
Epoch: 43, step: 27, loss: 0.35687726736068726, mean loss: 0.3433746352863787
Epoch: 43, step: 28, loss: 0.35028308629989624, mean loss: 0.3433747464959699
Epoch: 43, step: 29, loss: 0.33254092931747437, mean loss: 0.3433745721001491
Epoch: 43, step: 30, loss: 0.33611875772476196, mean loss: 0.34337445530259625
Epoch: 43, step: 31, loss: 0.3382473886013031, mean loss: 0.3433743727730312
Epoch: 43, step: 32, loss: 0.3378978967666626, mean loss: 0.3433742846204999
Epoch: 43, step: 33, loss: 0.34092092514038086, mean loss: 0.3433742451304397
Epoch: 43, step: 34, loss: 0.3213765025138855, mean loss: 0.3433738910534262
Epoch: 43, step: 35, loss: 0.3362593948841095, mean loss: 0.343373776539903
Epoch: 43, step: 36, loss: 0.36187297105789185, mean loss: 0.34337407429448646
Epoch: 43, step: 37, loss: 0.32410353422164917, mean loss: 0.3433737641296696
Epoch: 43, step: 38, loss: 0.3430044651031494, mean loss: 0.3433737581857925
Epoch: 43, step: 39, loss: 0.30290669202804565, mean loss: 0.34337310687783273
Epoch: 43, step: 40, loss: 0.3726598620414734, mean loss: 0.3433735782337171
Epoch: 43, step: 41, loss: 0.30645760893821716, mean loss: 0.3433729840989552
Epoch: 43, step: 42, loss: 0.3639351427555084, mean loss: 0.3433733150261083
Epoch: 43, step: 43, loss: 0.29719823598861694, mean loss: 0.34337257189685894
Epoch: 43, step: 44, loss: 0.3706724941730499, mean loss: 0.3433730112473631
Epoch: 43, step: 45, loss: 0.318816214799881, mean loss: 0.3433726160496347
Epoch: 43, step: 46, loss: 0.3167755603790283, mean loss: 0.3433721880244706
Epoch: 43, step: 47, loss: 0.34247028827667236, mean loss: 0.34337217351047405
Epoch: 43, step: 48, loss: 0.34341609477996826, mean loss: 0.34337217421727423
Epoch: 43, step: 49, loss: 0.3367204964160919, mean loss: 0.34337206717730445
Epoch: 43, step: 50, loss: 0.32151633501052856, mean loss: 0.3433717154766758
Epoch: 43, step: 51, loss: 0.3366835117340088, mean loss: 0.34337160785238796
Epoch: 43, step: 52, loss: 0.33023321628570557, mean loss: 0.3433713964372851
Epoch: 43, step: 53, loss: 0.31155693531036377, mean loss: 0.34337088450633013
Epoch: 43, step: 54, loss: 0.2844226062297821, mean loss: 0.34336993597658166
Epoch: 43, step: 55, loss: 0.3152153789997101, mean loss: 0.3433694829522369
Epoch: 43, step: 56, loss: 0.3745422959327698, mean loss: 0.3433699845341285
Epoch: 43, step: 57, loss: 0.32725411653518677, mean loss: 0.34336972522812687
Epoch: 43, step: 58, loss: 0.32524728775024414, mean loss: 0.34336943364090416
Epoch: 43, step: 59, loss: 0.34420329332351685, mean loss: 0.34336944705736194
Epoch: 43, step: 60, loss: 0.3441723585128784, mean loss: 0.34336945997566765
Epoch: 43, step: 61, loss: 0.3024957478046417, mean loss: 0.34336880235568873
Epoch: 43, step: 62, loss: 0.36558446288108826, mean loss: 0.3433691597792351
Epoch: 43, step: 63, loss: 0.320221483707428, mean loss: 0.34336878736665916
Epoch: 43, step: 64, loss: 0.3118897080421448, mean loss: 0.3433682809220218
Epoch: 43, step: 65, loss: 0.3118194341659546, mean loss: 0.34336777336311136
Epoch: 43, step: 66, loss: 0.3497479557991028, mean loss: 0.34336787600605023
Epoch: 43, step: 67, loss: 0.33031004667282104, mean loss: 0.34336766593801077
Epoch: 43, step: 68, loss: 0.32709386944770813, mean loss: 0.34336740413725964
Epoch: 43, step: 69, loss: 0.34578263759613037, mean loss: 0.34336744299111666
Epoch: 43, step: 70, loss: 0.3288576006889343, mean loss: 0.34336720957506045
Epoch: 43, step: 71, loss: 0.33906933665275574, mean loss: 0.3433671404374097
Epoch: 43, step: 72, loss: 0.3676306903362274, mean loss: 0.3433675307462635
Epoch: 43, step: 73, loss: 0.37248504161834717, mean loss: 0.34336799912947735
Epoch: 43, step: 74, loss: 0.32003551721572876, mean loss: 0.3433676238100649
Epoch: 43, step: 75, loss: 0.30391037464141846, mean loss: 0.3433669891226185
Epoch: 43, step: 76, loss: 0.32050636410713196, mean loss: 0.3433666214051867
Epoch: 43, step: 77, loss: 0.37726807594299316, mean loss: 0.3433671667076563
Epoch: 43, step: 78, loss: 0.3207188546657562, mean loss: 0.3433668024170378
Epoch: 43, step: 79, loss: 0.31313076615333557, mean loss: 0.3433663160882039
Epoch: 43, step: 80, loss: 0.308933287858963, mean loss: 0.3433657622621342
Epoch: 43, step: 81, loss: 0.37516719102859497, mean loss: 0.3433662737529305
Epoch: 43, step: 82, loss: 0.3063786029815674, mean loss: 0.34336567885673797
Epoch: 43, step: 83, loss: 0.32062828540802, mean loss: 0.3433653131626848
Epoch: 43, step: 84, loss: 0.3447183668613434, mean loss: 0.3433653349240065
Epoch: 43, step: 85, loss: 0.3440503180027008, mean loss: 0.3433653459404927
Epoch: 43, step: 86, loss: 0.2904275357723236, mean loss: 0.3433644945628545
Epoch: 43, step: 87, loss: 0.42212265729904175, mean loss: 0.34336576117853057
Epoch: 43, step: 88, loss: 0.35383516550064087, mean loss: 0.3433659295483593
Epoch: 43, step: 89, loss: 0.35087838768959045, mean loss: 0.3433660503623914
Epoch: 43, step: 90, loss: 0.30197346210479736, mean loss: 0.34336538470476374
Epoch: 43, step: 91, loss: 0.3366299867630005, mean loss: 0.3433652763907611
Epoch: 43, step: 92, loss: 0.3278008997440338, mean loss: 0.3433650260992656
Epoch: 43, step: 93, loss: 0.3227822780609131, mean loss: 0.34336469511241907
Epoch: 43, step: 94, loss: 0.3344976007938385, mean loss: 0.34336455252483133
Epoch: 43, step: 95, loss: 0.3201393485069275, mean loss: 0.3433641790572167
Epoch: 43, step: 96, loss: 0.3018537759780884, mean loss: 0.3433635115693478
Epoch: 43, step: 97, loss: 0.30469271540641785, mean loss: 0.3433628897523971
Epoch: 43, step: 98, loss: 0.3245740532875061, mean loss: 0.3433625876373569
Epoch: 43, step: 99, loss: 0.3364672064781189, mean loss: 0.34336247676487874
Epoch: 43, step: 100, loss: 0.3411093056201935, mean loss: 0.3433624405361851
Epoch: 43, step: 101, loss: 0.3232262432575226, mean loss: 0.3433621167718786
Epoch: 43, step: 102, loss: 0.33366304636001587, mean loss: 0.34336196082573484
Epoch: 43, step: 103, loss: 0.3295885920524597, mean loss: 0.3433617393746966
Epoch: 43, step: 104, loss: 0.3406596779823303, mean loss: 0.3433616959310998
Epoch: 43, step: 105, loss: 0.32514163851737976, mean loss: 0.3433614029947125
Epoch: 43, step: 106, loss: 0.2993856370449066, mean loss: 0.3433606959774622
Epoch: 43, step: 107, loss: 0.38652291893959045, mean loss: 0.3433613899038764
Epoch: 43, step: 108, loss: 0.3287633955478668, mean loss: 0.34336115521320654
Epoch: 43, step: 109, loss: 0.3124445974826813, mean loss: 0.343360658178421
Epoch: 43, step: 110, loss: 0.3040395975112915, mean loss: 0.34336002603751675
Epoch: 43, step: 111, loss: 0.31884390115737915, mean loss: 0.3433596319129447
Epoch: 43, step: 112, loss: 0.3259698748588562, mean loss: 0.34335935235732934
Epoch: 43, step: 113, loss: 0.380815714597702, mean loss: 0.34335995449156465
Epoch: 43, step: 114, loss: 0.32858046889305115, mean loss: 0.34335971690599393
Epoch: 43, step: 115, loss: 0.32955193519592285, mean loss: 0.34335949494448237
Epoch: 43, step: 116, loss: 0.29717791080474854, mean loss: 0.34335875258269966
Epoch: 43, step: 117, loss: 0.3176192343235016, mean loss: 0.34335833883059774
Epoch: 43, step: 118, loss: 0.3195462226867676, mean loss: 0.34335795606683983
Epoch: 43, step: 119, loss: 0.317722350358963, mean loss: 0.34335754399833684
Epoch: 43, step: 120, loss: 0.31711864471435547, mean loss: 0.3433571222392305
Epoch: 43, step: 121, loss: 0.35397830605506897, mean loss: 0.343357292959387
Epoch: 43, step: 122, loss: 0.3714938759803772, mean loss: 0.34335774520696427
Epoch: 43, step: 123, loss: 0.3276411294937134, mean loss: 0.34335749259323606
Epoch: 43, step: 124, loss: 0.32982102036476135, mean loss: 0.3433572750245293
Epoch: 43, step: 125, loss: 0.33188316226005554, mean loss: 0.3433570906066315
Epoch: 43, step: 126, loss: 0.3192251920700073, mean loss: 0.34335670275246255
Epoch: 43, step: 127, loss: 0.321514368057251, mean loss: 0.34335635170240314
Epoch: 43, step: 128, loss: 0.3395918905735016, mean loss: 0.3433562912009466
Epoch: 43, step: 129, loss: 0.4112958610057831, mean loss: 0.34335738309078945
Epoch: 43, step: 130, loss: 0.32714954018592834, mean loss: 0.3433571226108559
Epoch: 43, step: 131, loss: 0.30969756841659546, mean loss: 0.34335658166919036
Epoch: 43, step: 132, loss: 0.2967371940612793, mean loss: 0.3433558324624791
Epoch: 43, step: 133, loss: 0.32748863101005554, mean loss: 0.343355577469366
Epoch: 43, step: 134, loss: 0.3862259089946747, mean loss: 0.3433562664039366
Epoch: 43, step: 135, loss: 0.3375793695449829, mean loss: 0.3433561735695717
Epoch: 43, step: 136, loss: 0.33724188804626465, mean loss: 0.34335607531497137
Epoch: 43, step: 137, loss: 0.3136438727378845, mean loss: 0.34335559785711217
Epoch: 43, step: 138, loss: 0.3491705358028412, mean loss: 0.34335569129829013
Epoch: 43, step: 139, loss: 0.29759860038757324, mean loss: 0.34335495603201377
Epoch: 43, step: 140, loss: 0.2958245575428009, mean loss: 0.34335419228290176
Epoch: 43, step: 141, loss: 0.30825546383857727, mean loss: 0.34335362830294797
Epoch: 43, step: 142, loss: 0.35115182399749756, mean loss: 0.3433537536053613
Epoch: 43, step: 143, loss: 0.3479744791984558, mean loss: 0.3433538278505826
Epoch: 43, step: 144, loss: 0.31979385018348694, mean loss: 0.3433534492979906
Epoch: 43, step: 145, loss: 0.32305097579956055, mean loss: 0.3433531230909547
Epoch: 43, step: 146, loss: 0.32750627398490906, mean loss: 0.34335286847810575
Epoch: 43, step: 147, loss: 0.3250706195831299, mean loss: 0.3433525747401736
Epoch: 43, step: 148, loss: 0.3274896442890167, mean loss: 0.34335231987713394
Epoch: 43, step: 149, loss: 0.32137995958328247, mean loss: 0.34335196686212327
Epoch: 43, step: 150, loss: 0.37295809388160706, mean loss: 0.3433524425160445
Epoch: 43, step: 151, loss: 0.3222988247871399, mean loss: 0.3433521042727162
Epoch: 43, step: 152, loss: 0.35891905426979065, mean loss: 0.34335235436428974
Epoch: 43, step: 153, loss: 0.35326817631721497, mean loss: 0.34335251366483843
Epoch: 43, step: 154, loss: 0.34263476729393005, mean loss: 0.3433525021342206
Epoch: 43, step: 155, loss: 0.34367796778678894, mean loss: 0.34335250736275247
Epoch: 43, step: 156, loss: 0.3493591547012329, mean loss: 0.3433526038566293
Epoch: 43, step: 157, loss: 0.33735719323158264, mean loss: 0.34335250754481206
Epoch: 43, step: 158, loss: 0.30733928084373474, mean loss: 0.34335192902837536
Epoch: 43, step: 159, loss: 0.30968597531318665, mean loss: 0.3433513882272169
Epoch: 43, step: 160, loss: 0.32621920108795166, mean loss: 0.343351113024622
Epoch: 43, step: 161, loss: 0.3299172520637512, mean loss: 0.34335089723349277
Epoch: 43, step: 162, loss: 0.3523429036140442, mean loss: 0.343351041671793
Epoch: 43, step: 163, loss: 0.32827600836753845, mean loss: 0.3433507995259226
Epoch: 43, step: 164, loss: 0.3098095655441284, mean loss: 0.3433502607715017
Epoch: 43, step: 165, loss: 0.30659019947052, mean loss: 0.34334967032430935
Epoch: 43, step: 166, loss: 0.300464928150177, mean loss: 0.34334898151237575
Epoch: 43, step: 167, loss: 0.35856008529663086, mean loss: 0.3433492258282091
Epoch: 43, step: 168, loss: 0.32365113496780396, mean loss: 0.34334890944892094
Epoch: 43, step: 169, loss: 0.3175811469554901, mean loss: 0.3433484955887415
Epoch: 43, step: 170, loss: 0.32118505239486694, mean loss: 0.3433481396238314
Epoch: 43, step: 171, loss: 0.33513930439949036, mean loss: 0.3433480077846431
Epoch: 43, step: 172, loss: 0.30918899178504944, mean loss: 0.3433474591776247
Epoch: 43, step: 173, loss: 0.33506229519844055, mean loss: 0.3433473261168214
Epoch: 43, step: 174, loss: 0.33648598194122314, mean loss: 0.34334721592451767
Epoch: 43, step: 175, loss: 0.38101518154144287, mean loss: 0.34334782085747867
Epoch: 43, step: 176, loss: 0.3434545695781708, mean loss: 0.3433478225717943
Epoch: 43, step: 177, loss: 0.32368963956832886, mean loss: 0.3433475068791172
Epoch: 43, step: 178, loss: 0.3582456111907959, mean loss: 0.3433477461253845
Epoch: 43, step: 179, loss: 0.3058997094631195, mean loss: 0.343347144763028
Epoch: 43, step: 180, loss: 0.35074472427368164, mean loss: 0.3433472635557554
Epoch: 43, step: 181, loss: 0.31450769305229187, mean loss: 0.3433468004480298
Epoch: 43, step: 182, loss: 0.27706119418144226, mean loss: 0.34334573604648394
Epoch: 43, step: 183, loss: 0.3628566265106201, mean loss: 0.3433460493435882
Epoch: 43, step: 184, loss: 0.3155076205730438, mean loss: 0.34334560233379696
Epoch: 43, step: 185, loss: 0.34877675771713257, mean loss: 0.3433456895420468
Epoch: 43, step: 186, loss: 0.30733010172843933, mean loss: 0.3433451112477933
Epoch: 43, step: 187, loss: 0.34766989946365356, mean loss: 0.34334518068883724
Epoch: 43, step: 188, loss: 0.288502961397171, mean loss: 0.34334430012784284
Epoch: 43, step: 189, loss: 0.32573482394218445, mean loss: 0.3433440173900344
Epoch: 43, step: 190, loss: 0.34831228852272034, mean loss: 0.3433440971593315
Epoch: 43, step: 191, loss: 0.3501526713371277, mean loss: 0.3433442064743109
Epoch: 43, step: 192, loss: 0.33054107427597046, mean loss: 0.34334400091707884
Epoch: 43, step: 193, loss: 0.3573029935359955, mean loss: 0.34334422502831763
Epoch: 43, step: 194, loss: 0.3149630129337311, mean loss: 0.3433437693760612
Epoch: 43, step: 195, loss: 0.3847665786743164, mean loss: 0.3433444343967602
Epoch: 43, step: 196, loss: 0.36089956760406494, mean loss: 0.3433447162303618
Epoch: 43, step: 197, loss: 0.30419331789016724, mean loss: 0.34334408769611324
Epoch: 43, step: 198, loss: 0.3258265554904938, mean loss: 0.3433438064751952
Epoch: 43, step: 199, loss: 0.3215128481388092, mean loss: 0.3433434560135254
Epoch: 43, step: 200, loss: 0.35544246435165405, mean loss: 0.34334365024094
Epoch: 43, step: 201, loss: 0.37847480177879333, mean loss: 0.34334421419816763
Epoch: 43, step: 202, loss: 0.3293409049510956, mean loss: 0.3433439894079076
Epoch: 43, step: 203, loss: 0.34747782349586487, mean loss: 0.3433440557658453
Epoch: 43, step: 204, loss: 0.3486325740814209, mean loss: 0.34334414065786767
Epoch: 43, step: 205, loss: 0.4251091778278351, mean loss: 0.34334545314040593
Epoch: 43, step: 206, loss: 0.2980446219444275, mean loss: 0.34334472598858656
Epoch: 43, step: 207, loss: 0.3773633539676666, mean loss: 0.34334527203397947
Epoch: 43, step: 208, loss: 0.36115285754203796, mean loss: 0.34334555786543497
Epoch: 43, step: 209, loss: 0.3320296108722687, mean loss: 0.3433453762348775
Epoch: 43, step: 210, loss: 0.3249727189540863, mean loss: 0.34334508134286135
Epoch: 43, step: 211, loss: 0.35779374837875366, mean loss: 0.3433453132487909
Epoch: 43, step: 212, loss: 0.32390761375427246, mean loss: 0.34334500127223216
Epoch: 43, step: 213, loss: 0.34095752239227295, mean loss: 0.34334496295362915
Epoch: 43, step: 214, loss: 0.32868027687072754, mean loss: 0.3433447275918547
Epoch: 43, step: 215, loss: 0.3319718539714813, mean loss: 0.34334454506515477
Epoch: 43, step: 216, loss: 0.3010408878326416, mean loss: 0.3433438661318188
Epoch: 43, step: 217, loss: 0.32598772644996643, mean loss: 0.34334358758680705
Epoch: 43, step: 218, loss: 0.3525339663028717, mean loss: 0.34334373507888255
Epoch: 43, step: 219, loss: 0.33856332302093506, mean loss: 0.3433436583615238
Epoch: 43, step: 220, loss: 0.30055949091911316, mean loss: 0.3433429717605346
Epoch: 43, step: 221, loss: 0.3317386209964752, mean loss: 0.34334278553672026
Epoch: 43, step: 222, loss: 0.32667824625968933, mean loss: 0.3433425181125162
Epoch: 43, step: 223, loss: 0.3636084198951721, mean loss: 0.34334284332436843
Epoch: 43, step: 224, loss: 0.3334594964981079, mean loss: 0.34334268472644447
Epoch: 43, step: 225, loss: 0.36202526092529297, mean loss: 0.3433429845206644
Epoch: 43, step: 226, loss: 0.32324326038360596, mean loss: 0.3433426619910324
Epoch: 43, step: 227, loss: 0.3110101819038391, mean loss: 0.3433421431771671
Epoch: 43, step: 228, loss: 0.3209245800971985, mean loss: 0.3433417834659449
Epoch: 43, step: 229, loss: 0.3429476320743561, mean loss: 0.34334177714151065
Epoch: 43, step: 230, loss: 0.32099926471710205, mean loss: 0.3433414186460527
Epoch: 43, step: 231, loss: 0.3563189208507538, mean loss: 0.34334162687245356
Epoch: 43, step: 232, loss: 0.33580395579338074, mean loss: 0.3433415059310805
Epoch: 43, step: 233, loss: 0.3723165690898895, mean loss: 0.3433419708263595
Epoch: 43, step: 234, loss: 0.3601244390010834, mean loss: 0.3433422400911753
Epoch: 43, step: 235, loss: 0.35305458307266235, mean loss: 0.34334239591749705
Epoch: 43, step: 236, loss: 0.3580303192138672, mean loss: 0.34334263156901235
Epoch: 43, step: 237, loss: 0.3606748580932617, mean loss: 0.3433429096409925
Epoch: 43, step: 238, loss: 0.37722259759902954, mean loss: 0.34334345318574483
Epoch: 43, step: 239, loss: 0.3416011929512024, mean loss: 0.343343425234448
Epoch: 43, step: 240, loss: 0.32080405950546265, mean loss: 0.3433430636384117
Epoch: 43, step: 241, loss: 0.2985900938510895, mean loss: 0.34334234568400823
Epoch: 43, step: 242, loss: 0.3182654082775116, mean loss: 0.3433419433909561
Epoch: 43, step: 243, loss: 0.3490530252456665, mean loss: 0.34334203500867067
Epoch: 43, step: 244, loss: 0.3563210368156433, mean loss: 0.3433422432157035
Epoch: 43, step: 245, loss: 0.3303106427192688, mean loss: 0.34334203416824455
Epoch: 43, step: 246, loss: 0.3550526201725006, mean loss: 0.3433422220215307
Epoch: 43, step: 247, loss: 0.32256293296813965, mean loss: 0.3433418886996017
Epoch: 43, step: 248, loss: 0.3609884977340698, mean loss: 0.34334217176546583
Epoch: 43, step: 249, loss: 0.36076393723487854, mean loss: 0.34334245122017487
Epoch: 43, step: 250, loss: 0.3171307146549225, mean loss: 0.34334203077623465
Epoch: 43, step: 251, loss: 0.3083304166793823, mean loss: 0.3433414691886866
Epoch: 43, step: 252, loss: 0.3371274471282959, mean loss: 0.3433413695171482
Epoch: 43, step: 253, loss: 0.36217835545539856, mean loss: 0.3433416716533869
Epoch: 43, step: 254, loss: 0.32795029878616333, mean loss: 0.34334142478709234
Epoch: 43, step: 255, loss: 0.3469758629798889, mean loss: 0.34334148307987145
Epoch: 43, step: 256, loss: 0.3090936839580536, mean loss: 0.34334093378799635
Epoch: 43, step: 257, loss: 0.37612026929855347, mean loss: 0.3433414595191192
Epoch: 43, step: 258, loss: 0.3115878105163574, mean loss: 0.34334095024662953
Epoch: 43, step: 259, loss: 0.3786504566669464, mean loss: 0.3433415165397143
Epoch: 43, step: 260, loss: 0.31757596135139465, mean loss: 0.343341103318936
Epoch: 43, step: 261, loss: 0.329571932554245, mean loss: 0.34334088249636224
Epoch: 43, step: 262, loss: 0.3272492587566376, mean loss: 0.34334062443167235
Epoch: 43, step: 263, loss: 0.31659552454948425, mean loss: 0.34334019552186607
Epoch: 43, step: 264, loss: 0.3588777184486389, mean loss: 0.34334044469233493
Epoch: 43, step: 265, loss: 0.3245702087879181, mean loss: 0.34334014368467103
Epoch: 43, step: 266, loss: 0.327886164188385, mean loss: 0.34333989586191094
Epoch: 43, step: 267, loss: 0.3316926658153534, mean loss: 0.3433397090878563
Epoch: 43, step: 268, loss: 0.37522169947624207, mean loss: 0.34334022033672
Epoch: 43, step: 269, loss: 0.3484836220741272, mean loss: 0.343340302813256
Epoch: 43, step: 270, loss: 0.4283403754234314, mean loss: 0.3433416658020893
Epoch: 43, step: 271, loss: 0.35448336601257324, mean loss: 0.34334184445804805
Epoch: 43, step: 272, loss: 0.3134300410747528, mean loss: 0.34334136483320427
Epoch: 43, step: 273, loss: 0.35798677802085876, mean loss: 0.343341599663291
Epoch: 43, step: 274, loss: 0.37282681465148926, mean loss: 0.34334207243278425
Epoch: 43, step: 275, loss: 0.37141332030296326, mean loss: 0.3433425225233414
Epoch: 43, step: 276, loss: 0.31966128945350647, mean loss: 0.34334214282777037
Epoch: 43, step: 277, loss: 0.32596033811569214, mean loss: 0.3433418641392228
Epoch: 43, step: 278, loss: 0.32680052518844604, mean loss: 0.3433415989304086
Epoch: 43, step: 279, loss: 0.3135148584842682, mean loss: 0.3433411207231931
Epoch: 43, step: 280, loss: 0.33298900723457336, mean loss: 0.34334095475212406
Epoch: 43, step: 281, loss: 0.35102319717407227, mean loss: 0.3433410779163018
Epoch: 43, step: 282, loss: 0.32568123936653137, mean loss: 0.3433407947926377
Epoch: 43, step: 283, loss: 0.3110258877277374, mean loss: 0.343340276726281
Epoch: 43, step: 284, loss: 0.3390140235424042, mean loss: 0.34334020736973636
Epoch: 43, step: 285, loss: 0.3366454243659973, mean loss: 0.3433401000437079
Epoch: 43, step: 286, loss: 0.36868947744369507, mean loss: 0.34334050642049174
Epoch: 43, step: 287, loss: 0.28467345237731934, mean loss: 0.3433395659419082
Epoch: 43, step: 288, loss: 0.2992021143436432, mean loss: 0.34333885839551426
Epoch: 43, step: 289, loss: 0.3576241433620453, mean loss: 0.34333908739241986
Epoch: 43, step: 290, loss: 0.32554003596305847, mean loss: 0.34333880207347994
Epoch: 43, step: 291, loss: 0.3107486367225647, mean loss: 0.3433382796612372
Epoch: 43, step: 292, loss: 0.3251816928386688, mean loss: 0.34333798862033277
Epoch: 43, step: 293, loss: 0.33211803436279297, mean loss: 0.34333780877302317
Epoch: 43, step: 294, loss: 0.32556799054145813, mean loss: 0.34333752394095507
Epoch: 43, step: 295, loss: 0.32108572125434875, mean loss: 0.34333716727296304
Epoch: 43, step: 296, loss: 0.3403821885585785, mean loss: 0.34333711990918553
Epoch: 43, step: 297, loss: 0.3595046103000641, mean loss: 0.343337379045111
Epoch: 43, step: 298, loss: 0.3122497797012329, mean loss: 0.34333688077453767
Epoch: 43, step: 299, loss: 0.3783973753452301, mean loss: 0.34333744271348127
Epoch: 43, step: 300, loss: 0.3098435699939728, mean loss: 0.3433369058924802
Epoch: 43, step: 301, loss: 0.3067202568054199, mean loss: 0.3433363190307774
Epoch: 43, step: 302, loss: 0.37334632873535156, mean loss: 0.3433367999989592
Epoch: 43, step: 303, loss: 0.3457786738872528, mean loss: 0.34333683913406227
Epoch: 43, step: 304, loss: 0.32964226603507996, mean loss: 0.3433366196591981
Epoch: 43, step: 305, loss: 0.2853877544403076, mean loss: 0.3433356909617203
Epoch: 43, step: 306, loss: 0.3380233347415924, mean loss: 0.3433356058264422
Epoch: 43, step: 307, loss: 0.35041123628616333, mean loss: 0.34333571921795597
Epoch: 43, step: 308, loss: 0.4117840528488159, mean loss: 0.34333681612880085
Epoch: 43, step: 309, loss: 0.35460177063941956, mean loss: 0.34333699665113204
Epoch: 43, step: 310, loss: 0.32191002368927, mean loss: 0.343336653286663
Epoch: 43, step: 311, loss: 0.3490307033061981, mean loss: 0.34333674453161556
Epoch: 43, step: 312, loss: 0.3181493580341339, mean loss: 0.34333634091994186
Epoch: 43, step: 313, loss: 0.3465195596218109, mean loss: 0.34333639192815746
Epoch: 43, step: 314, loss: 0.3012305796146393, mean loss: 0.34333571723121137
Epoch: 43, step: 315, loss: 0.3130234479904175, mean loss: 0.3433352315199365
Epoch: 43, step: 316, loss: 0.3373645544052124, mean loss: 0.34333513584980696
Epoch: 43, step: 317, loss: 0.3866427540779114, mean loss: 0.34333582977094507
Epoch: 43, step: 318, loss: 0.3502618074417114, mean loss: 0.3433359407446143
Epoch: 43, step: 319, loss: 0.3402945399284363, mean loss: 0.343335892013588
Epoch: 43, step: 320, loss: 0.3283483684062958, mean loss: 0.3433356518789428
Epoch: 43, step: 321, loss: 0.31904250383377075, mean loss: 0.3433352626529992
Epoch: 43, step: 322, loss: 0.3590758442878723, mean loss: 0.34333551484528685
Epoch: 43, step: 323, loss: 0.29233047366142273, mean loss: 0.3433346976663394
Epoch: 43, step: 324, loss: 0.31782227754592896, mean loss: 0.3433342889248087
Epoch: 43, step: 325, loss: 0.2911081910133362, mean loss: 0.3433334522094716
Epoch: 43, step: 326, loss: 0.32716548442840576, mean loss: 0.3433331931862931
Epoch: 43, step: 327, loss: 0.3493979573249817, mean loss: 0.34333329034688487
Epoch: 43, step: 328, loss: 0.3538297116756439, mean loss: 0.3433334585021744
Epoch: 43, step: 329, loss: 0.32354864478111267, mean loss: 0.34333314154959804
Epoch: 43, step: 330, loss: 0.3662920892238617, mean loss: 0.34333350934588586
Epoch: 43, step: 331, loss: 0.3443542420864105, mean loss: 0.34333352569749326
Epoch: 43, step: 332, loss: 0.3514633774757385, mean loss: 0.3433336559314024
Epoch: 43, step: 333, loss: 0.36160513758659363, mean loss: 0.3433339486216542
Epoch: 43, step: 334, loss: 0.35832080245018005, mean loss: 0.3433341886917173
Epoch: 43, step: 335, loss: 0.32670971751213074, mean loss: 0.34333392239340277
Epoch: 43, step: 336, loss: 0.30018123984336853, mean loss: 0.3433332311652468
Epoch: 43, step: 337, loss: 0.32894641160964966, mean loss: 0.343333000718033
Epoch: 43, step: 338, loss: 0.3658500611782074, mean loss: 0.34333336138918136
Epoch: 43, step: 339, loss: 0.34125199913978577, mean loss: 0.34333332805111355
Epoch: 43, step: 340, loss: 0.29337286949157715, mean loss: 0.3433325278259352
Epoch: 43, step: 341, loss: 0.3846287727355957, mean loss: 0.3433331892643327
Epoch: 43, step: 342, loss: 0.29837289452552795, mean loss: 0.3433324691506987
Epoch: 43, step: 343, loss: 0.33232784271240234, mean loss: 0.34333229289619105
Epoch: 43, step: 344, loss: 0.32261326909065247, mean loss: 0.34333196105731656
Epoch: 43, step: 345, loss: 0.3313896656036377, mean loss: 0.34333176979085295
Epoch: 43, step: 346, loss: 0.3466746211051941, mean loss: 0.3433318233287269
Epoch: 43, step: 347, loss: 0.35014212131500244, mean loss: 0.34333193239820137
Epoch: 43, step: 348, loss: 0.33576861023902893, mean loss: 0.34333181127070245
Epoch: 43, step: 349, loss: 0.33487334847450256, mean loss: 0.3433316758095898
Epoch: 43, step: 350, loss: 0.361007422208786, mean loss: 0.3433319588796921
Epoch: 43, step: 351, loss: 0.31380513310432434, mean loss: 0.3433314860268035
Epoch: 43, step: 352, loss: 0.2950494885444641, mean loss: 0.3433307128344345
Epoch: 43, step: 353, loss: 0.30313947796821594, mean loss: 0.34333006921859255
Epoch: 43, step: 354, loss: 0.3359159827232361, mean loss: 0.3433299504925289
Epoch: 43, step: 355, loss: 0.34833917021751404, mean loss: 0.34333003070678275
Epoch: 43, step: 356, loss: 0.3363799452781677, mean loss: 0.34332991941460145
Epoch: 43, step: 357, loss: 0.2951178252696991, mean loss: 0.34332914740348625
Epoch: 43, step: 358, loss: 0.3258485794067383, mean loss: 0.34332886749495
Epoch: 43, step: 359, loss: 0.3189951181411743, mean loss: 0.3433284778557174
Epoch: 43, step: 360, loss: 0.3506273925304413, mean loss: 0.34332859472623883
Epoch: 43, step: 361, loss: 0.3052169978618622, mean loss: 0.34332798449155627
Epoch: 43, step: 362, loss: 0.3252171277999878, mean loss: 0.3433276945090618
Epoch: 43, step: 363, loss: 0.3267432749271393, mean loss: 0.34332742897141
Epoch: 43, step: 364, loss: 0.38109612464904785, mean loss: 0.3433280336865849
Epoch: 43, step: 365, loss: 0.3160977363586426, mean loss: 0.3433275977088506
Epoch: 43, step: 366, loss: 0.3361794948577881, mean loss: 0.3433274832641292
Epoch: 43, step: 367, loss: 0.3923940658569336, mean loss: 0.3433282688322143
Epoch: 43, step: 368, loss: 0.32224041223526, mean loss: 0.3433279312158361
Epoch: 43, step: 369, loss: 0.36430418491363525, mean loss: 0.3433282670400764
Epoch: 43, step: 370, loss: 0.3418694734573364, mean loss: 0.3433282436855532
Epoch: 43, step: 371, loss: 0.35153108835220337, mean loss: 0.3433283750067089
Epoch: 43, step: 372, loss: 0.33077704906463623, mean loss: 0.3433281740729709
Epoch: 43, step: 373, loss: 0.33483806252479553, mean loss: 0.343328038157248
Epoch: 43, step: 374, loss: 0.3181286156177521, mean loss: 0.34332763475349015
Epoch: 43, step: 375, loss: 0.34919437766075134, mean loss: 0.34332772866946165
Epoch: 43, step: 376, loss: 0.28912612795829773, mean loss: 0.3433268610134929
Epoch: 43, step: 377, loss: 0.3261086940765381, mean loss: 0.3433265853905229
Epoch: 43, step: 378, loss: 0.3270251750946045, mean loss: 0.3433263244468803
Epoch: 43, step: 379, loss: 0.3283522129058838, mean loss: 0.3433260847537131
Epoch: 43, step: 380, loss: 0.31131505966186523, mean loss: 0.34332557235595584
Epoch: 43, step: 381, loss: 0.3400156497955322, mean loss: 0.3433255193751549
Epoch: 43, step: 382, loss: 0.3167189657688141, mean loss: 0.3433250934999471
Epoch: 43, step: 383, loss: 0.32888829708099365, mean loss: 0.3433248624224707
Epoch: 43, step: 384, loss: 0.3180526793003082, mean loss: 0.3433244579186833
Epoch: 43, step: 385, loss: 0.3009320795536041, mean loss: 0.34332377940179154
Epoch: 43, step: 386, loss: 0.38120728731155396, mean loss: 0.3433243857416483
Epoch: 43, step: 387, loss: 0.335616797208786, mean loss: 0.3433242623807563
Epoch: 43, step: 388, loss: 0.3192858397960663, mean loss: 0.3433238776490365
Epoch: 43, step: 389, loss: 0.3621232211589813, mean loss: 0.343324178525185
Epoch: 43, step: 390, loss: 0.3129726052284241, mean loss: 0.34332369276788627
Epoch: 43, step: 391, loss: 0.280337393283844, mean loss: 0.3433226847290366
Epoch: 43, step: 392, loss: 0.3098811209201813, mean loss: 0.3433221495355692
Epoch: 43, step: 393, loss: 0.3138381242752075, mean loss: 0.3433216776854706
Epoch: 43, step: 394, loss: 0.45156171917915344, mean loss: 0.34332340988643234
Epoch: 43, step: 395, loss: 0.3236137330532074, mean loss: 0.34332309447104326
Epoch: 43, step: 396, loss: 0.358571320772171, mean loss: 0.34332333848561064
Epoch: 43, step: 397, loss: 0.33370256423950195, mean loss: 0.34332318452858956
Epoch: 43, step: 398, loss: 0.35351935029029846, mean loss: 0.3433233476907371
Epoch: 43, step: 399, loss: 0.3239051103591919, mean loss: 0.34332303695916616
Epoch: 43, step: 400, loss: 0.3418230712413788, mean loss: 0.34332301295702644
Epoch: 43, step: 401, loss: 0.30975934863090515, mean loss: 0.3433224758868385
Epoch: 43, step: 402, loss: 0.3438887894153595, mean loss: 0.3433224849485799
Epoch: 43, step: 403, loss: 0.3186745345592499, mean loss: 0.34332209055613255
Epoch: 43, step: 404, loss: 0.33897727727890015, mean loss: 0.34332202103578313
Epoch: 43, step: 405, loss: 0.35119879245758057, mean loss: 0.3433221470681589
Epoch: 43, step: 406, loss: 0.31057989597320557, mean loss: 0.3433216231837592
Epoch: 43, step: 407, loss: 0.3479718863964081, mean loss: 0.3433216975879706
Epoch: 43, step: 408, loss: 0.3244726359844208, mean loss: 0.3433213960078102
Epoch: 43, step: 409, loss: 0.3276713788509369, mean loss: 0.3433211456155482
Epoch: 43, step: 410, loss: 0.31454703211784363, mean loss: 0.34332068525182974
Epoch: 43, step: 411, loss: 0.3037484586238861, mean loss: 0.34332005213672306
Epoch: 43, step: 412, loss: 0.3173743486404419, mean loss: 0.34331963703867496
Epoch: 43, step: 413, loss: 0.3338625133037567, mean loss: 0.34331948573921994
Epoch: 43, step: 414, loss: 0.36554262042045593, mean loss: 0.34331984126955545
Epoch: 43, step: 415, loss: 0.3600625693798065, mean loss: 0.34332010911892047
Epoch: 43, step: 416, loss: 0.3020203113555908, mean loss: 0.3433194484172973
Epoch: 43, step: 417, loss: 0.326022744178772, mean loss: 0.34331917171430193
Epoch: 43, step: 418, loss: 0.37039119005203247, mean loss: 0.34331960479037393
Epoch: 43, step: 419, loss: 0.2964853048324585, mean loss: 0.34331885558542197
Epoch: 43, step: 420, loss: 0.3205818831920624, mean loss: 0.3433184918695166
Epoch: 43, step: 421, loss: 0.3193865418434143, mean loss: 0.34331810904406906
Epoch: 43, step: 422, loss: 0.3291630446910858, mean loss: 0.34331788261738183
Epoch: 43, step: 423, loss: 0.39145275950431824, mean loss: 0.343318652578302
Epoch: 43, step: 424, loss: 0.3042013347148895, mean loss: 0.3433180268714085
Epoch: 43, step: 425, loss: 0.31892380118370056, mean loss: 0.3433176366761737
Epoch: 43, step: 426, loss: 0.296431303024292, mean loss: 0.3433168867228211
Epoch: 43, step: 427, loss: 0.315072625875473, mean loss: 0.34331643495921194
Epoch: 43, step: 428, loss: 0.3162519037723541, mean loss: 0.343316002072163
Epoch: 43, step: 429, loss: 0.3422345817089081, mean loss: 0.3433159847755256
Epoch: 43, step: 430, loss: 0.3440370559692383, mean loss: 0.3433159963084206
Epoch: 43, step: 431, loss: 0.3051157295703888, mean loss: 0.3433153853387651
Epoch: 43, step: 432, loss: 0.33843469619750977, mean loss: 0.34331530727896276
Epoch: 43, step: 433, loss: 0.3317701816558838, mean loss: 0.3433151226337652
Epoch: 43, step: 434, loss: 0.3058544099330902, mean loss: 0.3433145235211786
Epoch: 43, step: 435, loss: 0.33113664388656616, mean loss: 0.3433143287623564
Epoch: 43, step: 436, loss: 0.3202110528945923, mean loss: 0.3433139592813817
Epoch: 43, step: 437, loss: 0.31620362401008606, mean loss: 0.3433135257241248
Epoch: 43, step: 438, loss: 0.37462106347084045, mean loss: 0.3433140263963953
Epoch: 43, step: 439, loss: 0.32100218534469604, mean loss: 0.34331366958962356
Epoch: 43, step: 440, loss: 0.35559558868408203, mean loss: 0.34331386599662617
Epoch: 43, step: 441, loss: 0.33775565028190613, mean loss: 0.3433137771135271
Epoch: 43, step: 442, loss: 0.34696388244628906, mean loss: 0.3433138354825258
Epoch: 43, step: 443, loss: 0.310799777507782, mean loss: 0.3433133155570753
Epoch: 43, step: 444, loss: 0.34540286660194397, mean loss: 0.3433133489701115
Epoch: 43, step: 445, loss: 0.3010498881340027, mean loss: 0.34331267316562725
Epoch: 43, step: 446, loss: 0.31994393467903137, mean loss: 0.34331229949897946
Epoch: 43, step: 447, loss: 0.3341500759124756, mean loss: 0.3433121529971632
Epoch: 43, step: 448, loss: 0.30306917428970337, mean loss: 0.3433115095316173
Epoch: 43, step: 449, loss: 0.3633720874786377, mean loss: 0.343311830285318
Epoch: 43, step: 450, loss: 0.395207017660141, mean loss: 0.3433126600374465
Epoch: 43, step: 451, loss: 0.36308181285858154, mean loss: 0.3433129761213685
Epoch: 43, step: 452, loss: 0.29993191361427307, mean loss: 0.34331228252375867
Epoch: 43, step: 453, loss: 0.3160246014595032, mean loss: 0.34331184624196504
Epoch: 43, step: 454, loss: 0.29916831851005554, mean loss: 0.34331114047625716
Epoch: 43, step: 455, loss: 0.3559907078742981, mean loss: 0.3433113431936486
Epoch: 43, step: 456, loss: 0.31635528802871704, mean loss: 0.34331091223463783
Epoch: 43, step: 457, loss: 0.3456306755542755, mean loss: 0.3433109493211817
Epoch: 43, step: 458, loss: 0.39678525924682617, mean loss: 0.3433118042125492
Epoch: 43, step: 459, loss: 0.29868772625923157, mean loss: 0.3433110908208438
Epoch: 43, step: 460, loss: 0.3999614417552948, mean loss: 0.34331199645847804
Epoch: 43, step: 461, loss: 0.3096908926963806, mean loss: 0.3433114589851948
Epoch: 43, step: 462, loss: 0.3321904242038727, mean loss: 0.34331128120508475
Epoch: 43, step: 463, loss: 0.34176772832870483, mean loss: 0.3433112565303473
Epoch: 43, step: 464, loss: 0.33987152576446533, mean loss: 0.3433112015448018
Epoch: 43, step: 465, loss: 0.3071678876876831, mean loss: 0.3433106237879385
Epoch: 43, step: 466, loss: 0.36218202114105225, mean loss: 0.3433109254455314
Epoch: 43, step: 467, loss: 0.36597707867622375, mean loss: 0.3433112877561649
Epoch: 43, step: 468, loss: 0.3169613182544708, mean loss: 0.34331086656773274
Epoch: 43, step: 469, loss: 0.3031761646270752, mean loss: 0.34331022504888836
Epoch: 43, step: 470, loss: 0.32233765721321106, mean loss: 0.343309889825708
Epoch: 43, step: 471, loss: 0.31633663177490234, mean loss: 0.34330945869505697
Epoch: 43, step: 472, loss: 0.3628294765949249, mean loss: 0.3433097706908677
Epoch: 43, step: 473, loss: 0.35812798142433167, mean loss: 0.3433100075321351
Epoch: 43, step: 474, loss: 0.2845990061759949, mean loss: 0.3433090691620461
Epoch: 43, step: 475, loss: 0.4006185233592987, mean loss: 0.34330998511675453
Epoch: 43, step: 476, loss: 0.32067155838012695, mean loss: 0.34330962330137094
Epoch: 43, step: 477, loss: 0.32763829827308655, mean loss: 0.34330937284068647
Epoch: 43, step: 478, loss: 0.3115885853767395, mean loss: 0.34330886588398984
Epoch: 43, step: 479, loss: 0.36296263337135315, mean loss: 0.3433091799824282
Epoch: 43, step: 480, loss: 0.33284133672714233, mean loss: 0.34330901269233094
Epoch: 43, step: 481, loss: 0.3350260555744171, mean loss: 0.34330888032174384
Epoch: 43, step: 482, loss: 0.35495951771736145, mean loss: 0.34330906650851806
Epoch: 43, step: 483, loss: 0.3101719915866852, mean loss: 0.34330853695925123
Epoch: 43, step: 484, loss: 0.2863415777683258, mean loss: 0.34330762660945513
Epoch: 43, step: 485, loss: 0.34732669591903687, mean loss: 0.3433076908344113
Epoch: 43, step: 486, loss: 0.35682523250579834, mean loss: 0.34330790684204443
Epoch: 43, step: 487, loss: 0.3587234318256378, mean loss: 0.3433081531751378
Epoch: 43, step: 488, loss: 0.3165534734725952, mean loss: 0.34330772565432954
Epoch: 43, step: 489, loss: 0.35554832220077515, mean loss: 0.34330792124725634
Epoch: 43, step: 490, loss: 0.3322208821773529, mean loss: 0.34330774408989617
Epoch: 43, step: 491, loss: 0.303168922662735, mean loss: 0.34330710273074005
Epoch: 43, step: 492, loss: 0.29942595958709717, mean loss: 0.3433064015860066
Epoch: 43, step: 493, loss: 0.30015555024147034, mean loss: 0.34330571212108885
Epoch: 43, step: 494, loss: 0.3398208022117615, mean loss: 0.3433056564400383
Epoch: 43, step: 495, loss: 0.28941023349761963, mean loss: 0.34330479532572017
Epoch: 43, step: 496, loss: 0.33055806159973145, mean loss: 0.34330459166798916
Epoch: 43, step: 497, loss: 0.3836199939250946, mean loss: 0.34330523578689404
Epoch: 43, step: 498, loss: 0.32785001397132874, mean loss: 0.34330498886286637
Epoch: 43, step: 499, loss: 0.34061360359191895, mean loss: 0.34330494586399635
Epoch: 43, step: 500, loss: 0.30455026030540466, mean loss: 0.34330432671032807
Epoch: 43, step: 501, loss: 0.32230645418167114, mean loss: 0.3433039912489016
Epoch: 43, step: 502, loss: 0.3592292368412018, mean loss: 0.3433042456661169
Epoch: 43, step: 503, loss: 0.3027476966381073, mean loss: 0.3433035977565216
Epoch: 43, step: 504, loss: 0.3115042746067047, mean loss: 0.34330308975576834
Epoch: 43, step: 505, loss: 0.3681659400463104, mean loss: 0.3433034869385903
Epoch: 43, step: 506, loss: 0.3871936500072479, mean loss: 0.3433041880706063
Epoch: 43, step: 507, loss: 0.3098462224006653, mean loss: 0.3433036535983113
Epoch: 43, step: 508, loss: 0.3466460406780243, mean loss: 0.3433037069902232
Epoch: 43, step: 509, loss: 0.33285412192344666, mean loss: 0.34330354006927716
Epoch: 43, step: 510, loss: 0.37019044160842896, mean loss: 0.3433039695519144
Epoch: 43, step: 511, loss: 0.31327056884765625, mean loss: 0.34330348981578407
Epoch: 43, step: 512, loss: 0.30457884073257446, mean loss: 0.3433028712605715
Epoch: 43, step: 513, loss: 0.33552634716033936, mean loss: 0.3433027470468524
Epoch: 43, step: 514, loss: 0.3510929346084595, mean loss: 0.34330287147682925
Epoch: 43, step: 515, loss: 0.3152053654193878, mean loss: 0.3433024226922321
Epoch: 43, step: 516, loss: 0.319629043340683, mean loss: 0.3433020445775944
Epoch: 43, step: 517, loss: 0.2939348816871643, mean loss: 0.34330125609072504
Epoch: 43, step: 518, loss: 0.38270291686058044, mean loss: 0.34330188539964474
Epoch: 43, step: 519, loss: 0.3107013404369354, mean loss: 0.34330136472397615
Epoch: 43, step: 520, loss: 0.3082990050315857, mean loss: 0.34330080569694194
Epoch: 43, step: 521, loss: 0.34218913316726685, mean loss: 0.34330078794256547
Epoch: 43, step: 522, loss: 0.2956860363483429, mean loss: 0.34330002750574373
Epoch: 43, step: 523, loss: 0.3754082918167114, mean loss: 0.34330054028625206
Epoch: 43, step: 524, loss: 0.3248338997364044, mean loss: 0.3433002453720826
Epoch: 43, step: 525, loss: 0.33375027775764465, mean loss: 0.3433000928605425
Epoch: 43, step: 526, loss: 0.3420487940311432, mean loss: 0.3433000728778084
Epoch: 43, step: 527, loss: 0.35003983974456787, mean loss: 0.3433001805074294
Epoch: 43, step: 528, loss: 0.3188714385032654, mean loss: 0.3432997904027999
Epoch: 43, step: 529, loss: 0.30567753314971924, mean loss: 0.343299189619413
Epoch: 43, step: 530, loss: 0.31399214267730713, mean loss: 0.3432987216276697
Epoch: 43, step: 531, loss: 0.35194990038871765, mean loss: 0.34329885977245067
Epoch: 43, step: 532, loss: 0.33520427346229553, mean loss: 0.3432987305175795
Epoch: 43, step: 533, loss: 0.33552131056785583, mean loss: 0.343298606329224
Epoch: 43, step: 534, loss: 0.34861132502555847, mean loss: 0.3432986911603463
Epoch: 43, step: 535, loss: 0.3523365557193756, mean loss: 0.3432988354706318
Epoch: 43, step: 536, loss: 0.30694347620010376, mean loss: 0.3432982549830099
Epoch: 43, step: 537, loss: 0.3164757490158081, mean loss: 0.34329782671371456
Epoch: 43, step: 538, loss: 0.354209840297699, mean loss: 0.343298000940752
Epoch: 43, step: 539, loss: 0.3535381853580475, mean loss: 0.34329816443839567
Epoch: 43, step: 540, loss: 0.3375636041164398, mean loss: 0.3432980728802662
Epoch: 43, step: 541, loss: 0.3472518026828766, mean loss: 0.34329813600460446
Epoch: 43, step: 542, loss: 0.30983859300613403, mean loss: 0.34329760180578595
Epoch: 43, step: 543, loss: 0.39850306510925293, mean loss: 0.3432984831753387
Epoch: 43, step: 544, loss: 0.29274290800094604, mean loss: 0.3432976760553429
Epoch: 43, step: 545, loss: 0.3636992573738098, mean loss: 0.34329800176148484
Epoch: 43, step: 546, loss: 0.3426145017147064, mean loss: 0.34329799084975177
Epoch: 43, step: 547, loss: 0.32719433307647705, mean loss: 0.34329773376709255
Epoch: 43, step: 548, loss: 0.33281657099723816, mean loss: 0.3432975664459647
Epoch: 43, step: 549, loss: 0.3564826250076294, mean loss: 0.34329777692868496
Epoch: 43, step: 550, loss: 0.315053790807724, mean loss: 0.3432973260565026
Epoch: 43, step: 551, loss: 0.36839383840560913, mean loss: 0.343297726677669
Epoch: 43, step: 552, loss: 0.3606777787208557, mean loss: 0.34329800411484745
Epoch: 43, step: 553, loss: 0.33980172872543335, mean loss: 0.34329794830481347
Epoch: 43, step: 554, loss: 0.3331899046897888, mean loss: 0.343297786955609
Epoch: 43, step: 555, loss: 0.3187538981437683, mean loss: 0.34329739518111
Epoch: 43, step: 556, loss: 0.3483336865901947, mean loss: 0.34329747557012513
Epoch: 43, step: 557, loss: 0.30150750279426575, mean loss: 0.34329680853145356
Epoch: 43, step: 558, loss: 0.33550307154655457, mean loss: 0.3432966841322104
Epoch: 43, step: 559, loss: 0.35478025674819946, mean loss: 0.34329686742360754
Epoch: 43, step: 560, loss: 0.34600794315338135, mean loss: 0.3432969106948911
Epoch: 43, step: 561, loss: 0.33244335651397705, mean loss: 0.343296737464863
Epoch: 43, step: 562, loss: 0.3140734136104584, mean loss: 0.34329627104839416
Epoch: 43, step: 563, loss: 0.3268545866012573, mean loss: 0.3432960086364233
Epoch: 43, step: 564, loss: 0.3120352625846863, mean loss: 0.3432955097177701
Epoch: 43, step: 565, loss: 0.3641927242279053, mean loss: 0.34329584323008316
Epoch: 43, step: 566, loss: 0.31090161204338074, mean loss: 0.343295326237613
Epoch: 43, step: 567, loss: 0.3545047342777252, mean loss: 0.34329550513017665
Epoch: 43, step: 568, loss: 0.3152012825012207, mean loss: 0.3432950567775709
Epoch: 43, step: 569, loss: 0.3203817307949066, mean loss: 0.34329469111215993
Epoch: 43, step: 570, loss: 0.30896294116973877, mean loss: 0.34329414323302965
Epoch: 43, step: 571, loss: 0.3375062346458435, mean loss: 0.34329405086885584
Epoch: 43, step: 572, loss: 0.3342629373073578, mean loss: 0.34329390675150867
Epoch: 43, step: 573, loss: 0.3100907504558563, mean loss: 0.34329337690827155
Epoch: 43, step: 574, loss: 0.31284454464912415, mean loss: 0.34329289102523486
Epoch: 43, step: 575, loss: 0.3151506185531616, mean loss: 0.34329244195597347
Epoch: 43, step: 576, loss: 0.3526824116706848, mean loss: 0.3432925917903368
Epoch: 43, step: 577, loss: 0.34014537930488586, mean loss: 0.34329254157153216
Epoch: 43, step: 578, loss: 0.3104300796985626, mean loss: 0.3432920172068041
Epoch: 43, step: 579, loss: 0.37434571981430054, mean loss: 0.3432925127024418
Epoch: 43, step: 580, loss: 0.31811264157295227, mean loss: 0.3432921109365916
Epoch: 43, step: 581, loss: 0.3261867165565491, mean loss: 0.3432918380101089
Epoch: 43, step: 582, loss: 0.3338259160518646, mean loss: 0.34329168697824675
Epoch: 43, step: 583, loss: 0.32590922713279724, mean loss: 0.3432914096398741
Epoch: 43, step: 584, loss: 0.3164008855819702, mean loss: 0.34329098060651164
Epoch: 43, step: 585, loss: 0.346717894077301, mean loss: 0.3432910352814131
Epoch: 43, step: 586, loss: 0.3193395733833313, mean loss: 0.3432906531524401
Epoch: 43, step: 587, loss: 0.32990849018096924, mean loss: 0.3432904396527118
Epoch: 43, step: 588, loss: 0.3155863285064697, mean loss: 0.34328999766692425
Epoch: 43, step: 589, loss: 0.32491588592529297, mean loss: 0.34328970453473734
Epoch: 43, step: 590, loss: 0.2999185025691986, mean loss: 0.3432890126214281
Epoch: 43, step: 591, loss: 0.32820838689804077, mean loss: 0.34328877203968916
Epoch: 43, step: 592, loss: 0.32202452421188354, mean loss: 0.34328843281582655
Epoch: 43, step: 593, loss: 0.3055388629436493, mean loss: 0.3432878306148587
Epoch: 43, step: 594, loss: 0.32802990078926086, mean loss: 0.34328758721623015
Epoch: 43, step: 595, loss: 0.3279908001422882, mean loss: 0.3432873432016329
Epoch: 43, step: 596, loss: 0.31021252274513245, mean loss: 0.34328681559997304
Epoch: 43, step: 597, loss: 0.329581618309021, mean loss: 0.3432865969814168
Epoch: 43, step: 598, loss: 0.32652947306632996, mean loss: 0.3432863296842941
Epoch: 43, step: 599, loss: 0.3187800943851471, mean loss: 0.34328593878537084
Epoch: 43, step: 600, loss: 0.3198093771934509, mean loss: 0.3432855643167445
Epoch: 43, step: 601, loss: 0.32639390230178833, mean loss: 0.34328529488646387
Epoch: 43, step: 602, loss: 0.285648375749588, mean loss: 0.3432843755640436
Epoch: 43, step: 603, loss: 0.3614448010921478, mean loss: 0.3432846652224832
Epoch: 43, step: 604, loss: 0.2980119287967682, mean loss: 0.343283943134721
Epoch: 43, step: 605, loss: 0.3348737061023712, mean loss: 0.34328380899588035
Epoch: 43, step: 606, loss: 0.3420780301094055, mean loss: 0.3432837897646504
Epoch: 43, step: 607, loss: 0.31877920031547546, mean loss: 0.34328339894185217
Epoch: 43, step: 608, loss: 0.34456512331962585, mean loss: 0.3432834193837012
Epoch: 43, step: 609, loss: 0.31842413544654846, mean loss: 0.34328302291654006
Epoch: 43, step: 610, loss: 0.32155027985572815, mean loss: 0.3432826763184018
Epoch: 43, step: 611, loss: 0.3632556200027466, mean loss: 0.34328299484582725
Epoch: 43, step: 612, loss: 0.3238714635372162, mean loss: 0.343282685276713
Epoch: 43, step: 613, loss: 0.3434339463710785, mean loss: 0.3432826876889398
Epoch: 43, step: 614, loss: 0.31242769956588745, mean loss: 0.3432821956387999
Epoch: 43, step: 615, loss: 0.34050828218460083, mean loss: 0.34328215140340007
Epoch: 43, step: 616, loss: 0.3029095232486725, mean loss: 0.3432815075942474
Epoch: 43, step: 617, loss: 0.31480562686920166, mean loss: 0.34328105350589266
Epoch: 43, step: 618, loss: 0.36529994010925293, mean loss: 0.34328140462270795
Epoch: 43, step: 619, loss: 0.3965925872325897, mean loss: 0.34328225471810614
Epoch: 43, step: 620, loss: 0.30664679408073425, mean loss: 0.34328167054160946
Epoch: 43, step: 621, loss: 0.316913366317749, mean loss: 0.34328125008837373
Epoch: 43, step: 622, loss: 0.34677886962890625, mean loss: 0.34328130585843736
Epoch: 43, step: 623, loss: 0.3814883828163147, mean loss: 0.3432819150662465
Epoch: 43, step: 624, loss: 0.31839972734451294, mean loss: 0.3432815183287157
Epoch: 43, step: 625, loss: 0.34155213832855225, mean loss: 0.34328149075481346
Epoch: 43, step: 626, loss: 0.32047832012176514, mean loss: 0.3432811271780563
Epoch: 43, step: 627, loss: 0.3377588391304016, mean loss: 0.34328103913137187
Epoch: 43, step: 628, loss: 0.2989140748977661, mean loss: 0.34328033176120504
Epoch: 43, step: 629, loss: 0.3091144859790802, mean loss: 0.34327978704251333
Epoch: 43, step: 630, loss: 0.3299035131931305, mean loss: 0.3432795737830415
Epoch: 43, step: 631, loss: 0.32302990555763245, mean loss: 0.3432792509454
Epoch: 43, step: 632, loss: 0.3162834644317627, mean loss: 0.34327882056219533
Epoch: 43, step: 633, loss: 0.29728078842163086, mean loss: 0.3432780872453548
Epoch: 43, step: 634, loss: 0.3513143062591553, mean loss: 0.3432782153595483
Epoch: 43, step: 635, loss: 0.38834547996520996, mean loss: 0.343278933814857
Epoch: 43, step: 636, loss: 0.3209891617298126, mean loss: 0.34327857848044896
Epoch: 43, step: 637, loss: 0.3529594838619232, mean loss: 0.3432787328070133
Epoch: 43, step: 638, loss: 0.3985247313976288, mean loss: 0.34327961348799385
Epoch: 43, step: 639, loss: 0.30972757935523987, mean loss: 0.3432790786408005
Epoch: 43, step: 640, loss: 0.3618624210357666, mean loss: 0.3432793748699366
Epoch: 43, step: 641, loss: 0.29974186420440674, mean loss: 0.3432786808681088
Epoch: 43, step: 642, loss: 0.3104991912841797, mean loss: 0.3432781583609026
Epoch: 43, step: 643, loss: 0.31587836146354675, mean loss: 0.34327772161331116
Epoch: 43, step: 644, loss: 0.35844194889068604, mean loss: 0.3432779633243792
Epoch: 43, step: 645, loss: 0.3180118501186371, mean loss: 0.3432775606001418
Epoch: 43, step: 646, loss: 0.32921186089515686, mean loss: 0.3432773364062639
Epoch: 43, step: 647, loss: 0.3969954550266266, mean loss: 0.34327819260834586
Epoch: 43, step: 648, loss: 0.33644184470176697, mean loss: 0.3432780836469346
Epoch: 43, step: 649, loss: 0.31249547004699707, mean loss: 0.34327759302480587
Epoch: 43, step: 650, loss: 0.38924652338027954, mean loss: 0.3432783256791315
Epoch: 43, step: 651, loss: 0.3235079050064087, mean loss: 0.3432780105825379
Epoch: 43, step: 652, loss: 0.33607807755470276, mean loss: 0.34327789583342594
Epoch: 43, step: 653, loss: 0.3112627863883972, mean loss: 0.34327738559995374
Epoch: 43, step: 654, loss: 0.4389570355415344, mean loss: 0.34327891044815273
Epoch: 43, step: 655, loss: 0.31911689043045044, mean loss: 0.3432785253837679
Epoch: 43, step: 656, loss: 0.3128717541694641, mean loss: 0.34327804080598634
Epoch: 43, step: 657, loss: 0.32757124304771423, mean loss: 0.34327779049845236
Epoch: 43, step: 658, loss: 0.36813485622406006, mean loss: 0.3432781866206771
Epoch: 43, step: 659, loss: 0.3218350410461426, mean loss: 0.3432778449081329
Epoch: 43, step: 660, loss: 0.32036295533180237, mean loss: 0.3432774797480676
Epoch: 43, step: 661, loss: 0.34554898738861084, mean loss: 0.34327751594508515
Epoch: 43, step: 662, loss: 0.3455543518066406, mean loss: 0.343277552226431
Epoch: 43, step: 663, loss: 0.2904965579509735, mean loss: 0.3432767111754674
Epoch: 43, step: 664, loss: 0.3292887806892395, mean loss: 0.34327648828510476
Epoch: 43, step: 665, loss: 0.3512912392616272, mean loss: 0.3432766159939383
Epoch: 43, step: 666, loss: 0.31140175461769104, mean loss: 0.34327610810086523
Epoch: 43, step: 667, loss: 0.32877010107040405, mean loss: 0.34327587696627265
Epoch: 43, step: 668, loss: 0.3129023611545563, mean loss: 0.34327539301101684
Epoch: 43, step: 669, loss: 0.32186275720596313, mean loss: 0.3432750518390369
Epoch: 43, step: 670, loss: 0.3124556541442871, mean loss: 0.34327456079498714
Epoch: 43, step: 671, loss: 0.3348526954650879, mean loss: 0.3432744266119311
Epoch: 43, step: 672, loss: 0.315777450799942, mean loss: 0.343273988517837
Epoch: 43, step: 673, loss: 0.38799765706062317, mean loss: 0.3432747010639375
Epoch: 43, step: 674, loss: 0.3135744035243988, mean loss: 0.343274227880616
Epoch: 43, step: 675, loss: 0.3506696820259094, mean loss: 0.3432743457026614
Epoch: 43, step: 676, loss: 0.3219652771949768, mean loss: 0.34327400621870424
Epoch: 43, step: 677, loss: 0.37864434719085693, mean loss: 0.3432745697098779
Epoch: 43, step: 678, loss: 0.3239766061306, mean loss: 0.3432742622754961
Epoch: 43, step: 679, loss: 0.34293514490127563, mean loss: 0.34327425687312924
Epoch: 43, step: 680, loss: 0.35868409276008606, mean loss: 0.34327450235822454
Epoch: 43, step: 681, loss: 0.38142064213752747, mean loss: 0.34327511003241734
Epoch: 43, step: 682, loss: 0.339847207069397, mean loss: 0.34327505542623715
Epoch: 43, step: 683, loss: 0.34621191024780273, mean loss: 0.3432751022093202
Epoch: 43, step: 684, loss: 0.31744813919067383, mean loss: 0.3432746908012724
Epoch: 43, step: 685, loss: 0.3245381712913513, mean loss: 0.34327439234449597
Epoch: 43, step: 686, loss: 0.33731451630592346, mean loss: 0.34327429741026577
Epoch: 43, step: 687, loss: 0.3141111135482788, mean loss: 0.3432738328804177
Epoch: 43, step: 688, loss: 0.33600449562072754, mean loss: 0.34327371709160803
Epoch: 43, step: 689, loss: 0.28728359937667847, mean loss: 0.3432728252736074
Epoch: 43, step: 690, loss: 0.3310478925704956, mean loss: 0.34327263055636387
Epoch: 43, step: 691, loss: 0.3103587329387665, mean loss: 0.3432721063161495
Epoch: 43, step: 692, loss: 0.326107382774353, mean loss: 0.34327183292722635
Epoch: 43, step: 693, loss: 0.3281496465206146, mean loss: 0.34327159207438646
Epoch: 43, step: 694, loss: 0.3253666162490845, mean loss: 0.34327130690427443
Epoch: 43, step: 695, loss: 0.3669500946998596, mean loss: 0.3432716840270972
Epoch: 43, step: 696, loss: 0.32363414764404297, mean loss: 0.3432713712726914
Epoch: 43, step: 697, loss: 0.31999722123146057, mean loss: 0.3432710006061834
Epoch: 43, step: 698, loss: 0.3775703012943268, mean loss: 0.3432715468516754
Epoch: 43, step: 699, loss: 0.36643826961517334, mean loss: 0.3432719157955339
Epoch: 43, step: 700, loss: 0.34911489486694336, mean loss: 0.3432720088469739
Epoch: 43, step: 701, loss: 0.3349084258079529, mean loss: 0.3432718756561748
Epoch: 43, step: 702, loss: 0.31039363145828247, mean loss: 0.3432713520755681
Epoch: 43, step: 703, loss: 0.33975380659103394, mean loss: 0.34327129606012946
Epoch: 43, step: 704, loss: 0.3416398763656616, mean loss: 0.3432712700808678
Epoch: 43, step: 705, loss: 0.30093395709991455, mean loss: 0.3432705958983623
Epoch: 43, step: 706, loss: 0.35107967257499695, mean loss: 0.3432707202486971
Epoch: 43, step: 707, loss: 0.32884296774864197, mean loss: 0.34327049050741526
Epoch: 43, step: 708, loss: 0.3216935694217682, mean loss: 0.3432701469313403
Epoch: 43, step: 709, loss: 0.3082214295864105, mean loss: 0.34326958884851894
Epoch: 43, step: 710, loss: 0.32983162999153137, mean loss: 0.34326937487850384
Epoch: 43, step: 711, loss: 0.3219035565853119, mean loss: 0.34326903468013603
Epoch: 43, step: 712, loss: 0.3447466790676117, mean loss: 0.34326905820763204
Epoch: 43, step: 713, loss: 0.35454413294792175, mean loss: 0.34326923772988693
Epoch: 43, step: 714, loss: 0.3422701358795166, mean loss: 0.34326922182239494
Epoch: 43, step: 715, loss: 0.3300364911556244, mean loss: 0.34326901113696207
Epoch: 43, step: 716, loss: 0.33063316345214844, mean loss: 0.3432688099580278
Epoch: 43, step: 717, loss: 0.2945992946624756, mean loss: 0.3432680350891328
Epoch: 43, step: 718, loss: 0.3447560966014862, mean loss: 0.3432680587802301
Epoch: 43, step: 719, loss: 0.3870706558227539, mean loss: 0.34326875614056
Epoch: 43, step: 720, loss: 0.34460896253585815, mean loss: 0.3432687774770094
Epoch: 43, step: 721, loss: 0.34932833909988403, mean loss: 0.3432688739453385
Epoch: 43, step: 722, loss: 0.3172033131122589, mean loss: 0.34326845898775143
Epoch: 43, step: 723, loss: 0.344441682100296, mean loss: 0.3432684776648896
Epoch: 43, step: 724, loss: 0.369928777217865, mean loss: 0.3432689020770639
Epoch: 43, step: 725, loss: 0.3664877116680145, mean loss: 0.34326927169738913
Epoch: 43, step: 726, loss: 0.31482818722724915, mean loss: 0.3432688189508559
Epoch: 43, step: 727, loss: 0.4142591655254364, mean loss: 0.3432699490104958
Epoch: 43, step: 728, loss: 0.38576775789260864, mean loss: 0.34327062550098275
Epoch: 43, step: 729, loss: 0.30864065885543823, mean loss: 0.34327007426150224
Epoch: 43, step: 730, loss: 0.31716251373291016, mean loss: 0.3432696586882165
Epoch: 43, step: 731, loss: 0.3244175612926483, mean loss: 0.3432693586102623
Epoch: 43, step: 732, loss: 0.3745000660419464, mean loss: 0.3432698557166281
Epoch: 43, step: 733, loss: 0.31931132078170776, mean loss: 0.34326947436917743
Epoch: 43, step: 734, loss: 0.31359609961509705, mean loss: 0.3432690020662702
Epoch: 43, step: 735, loss: 0.3654548227787018, mean loss: 0.3432693551862281
Epoch: 43, step: 736, loss: 0.3324117064476013, mean loss: 0.34326918237353427
Epoch: 43, step: 737, loss: 0.3510323166847229, mean loss: 0.34326930593129823
Epoch: 43, step: 738, loss: 0.35462746024131775, mean loss: 0.3432694867043929
Epoch: 43, step: 739, loss: 0.3472449481487274, mean loss: 0.34326954997567893
Epoch: 43, step: 740, loss: 0.296268105506897, mean loss: 0.3432688019381116
Epoch: 43, step: 741, loss: 0.3158763349056244, mean loss: 0.3432683659883546
Epoch: 43, step: 742, loss: 0.3090991675853729, mean loss: 0.3432678221959077
Epoch: 43, step: 743, loss: 0.3384617567062378, mean loss: 0.3432677457100478
Epoch: 43, step: 744, loss: 0.3421240448951721, mean loss: 0.34326772750897494
Epoch: 43, step: 745, loss: 0.340925395488739, mean loss: 0.3432676902332497
Epoch: 43, step: 746, loss: 0.32214584946632385, mean loss: 0.34326735410694653
Epoch: 43, step: 747, loss: 0.35466623306274414, mean loss: 0.34326753550221956
Epoch: 43, step: 748, loss: 0.3157638907432556, mean loss: 0.34326709783183307
Epoch: 43, step: 749, loss: 0.29424721002578735, mean loss: 0.3432663177820605
Epoch: 43, step: 750, loss: 0.30642059445381165, mean loss: 0.34326573146817785
Epoch: 43, step: 751, loss: 0.3194204866886139, mean loss: 0.3432653520326744
Epoch: 43, step: 752, loss: 0.3359653949737549, mean loss: 0.34326523587455426
Epoch: 43, step: 753, loss: 0.3067271411418915, mean loss: 0.34326465448361876
Epoch: 43, step: 754, loss: 0.48745810985565186, mean loss: 0.3432669488406346
Epoch: 43, step: 755, loss: 0.39951539039611816, mean loss: 0.3432678438323854
Epoch: 43, step: 756, loss: 0.33054986596107483, mean loss: 0.34326764147470473
Epoch: 43, step: 757, loss: 0.3393491804599762, mean loss: 0.34326757912846745
Epoch: 43, step: 758, loss: 0.3272101879119873, mean loss: 0.3432673236450031
Epoch: 43, step: 759, loss: 0.35297006368637085, mean loss: 0.34326747801940716
Epoch: 43, step: 760, loss: 0.30159464478492737, mean loss: 0.34326681499881573
Epoch: 43, step: 761, loss: 0.35726651549339294, mean loss: 0.34326703773246026
Epoch: 43, step: 762, loss: 0.3619038760662079, mean loss: 0.3432673342377237
Epoch: 43, step: 763, loss: 0.279568612575531, mean loss: 0.3432663208305444
Epoch: 43, step: 764, loss: 0.30391448736190796, mean loss: 0.34326569477722546
Epoch: 43, step: 765, loss: 0.3647365868091583, mean loss: 0.3432660363549408
Epoch: 43, step: 766, loss: 0.3303206264972687, mean loss: 0.3432658304113232
Epoch: 43, step: 767, loss: 0.36654284596443176, mean loss: 0.34326620071064795
Epoch: 43, step: 768, loss: 0.29135626554489136, mean loss: 0.34326537492144377
Epoch: 43, step: 769, loss: 0.33216363191604614, mean loss: 0.3432651983164518
Epoch: 43, step: 770, loss: 0.29059720039367676, mean loss: 0.3432643604945546
Epoch: 43, step: 771, loss: 0.3215857148170471, mean loss: 0.3432640156446297
Epoch: 43, step: 772, loss: 0.3717627227306366, mean loss: 0.34326446897648505
Epoch: 43, step: 773, loss: 0.3157331049442291, mean loss: 0.34326403103922115
Epoch: 43, step: 774, loss: 0.3516448140144348, mean loss: 0.343264164348954
Epoch: 43, step: 775, loss: 0.3262196481227875, mean loss: 0.343263893233025
Epoch: 43, step: 776, loss: 0.3564753830432892, mean loss: 0.34326410337617674
Epoch: 43, step: 777, loss: 0.32279202342033386, mean loss: 0.34326377775060085
Epoch: 43, step: 778, loss: 0.3054269552230835, mean loss: 0.34326317593382477
Epoch: 43, step: 779, loss: 0.3354417085647583, mean loss: 0.34326305153079373
Epoch: 43, step: 780, loss: 0.3034168779850006, mean loss: 0.3432624177742759
Epoch: 43, step: 781, loss: 0.3060440719127655, mean loss: 0.3432618258229787
Epoch: 43, step: 782, loss: 0.31895580887794495, mean loss: 0.3432614392461684
Epoch: 43, step: 783, loss: 0.32161062955856323, mean loss: 0.34326109490477125
Epoch: 43, step: 784, loss: 0.3583410680294037, mean loss: 0.3432613347376692
Epoch: 43, step: 785, loss: 0.3293173313140869, mean loss: 0.343261112974836
Epoch: 43, step: 786, loss: 0.3305613398551941, mean loss: 0.343260911003222
Epoch: 43, step: 787, loss: 0.33100831508636475, mean loss: 0.3432607161464167
Epoch: 43, step: 788, loss: 0.3190271258354187, mean loss: 0.34326033075829765
Epoch: 43, step: 789, loss: 0.3381810784339905, mean loss: 0.34326024998395327
Epoch: 43, step: 790, loss: 0.3273414075374603, mean loss: 0.3432599968337784
Epoch: 43, step: 791, loss: 0.30771249532699585, mean loss: 0.343259431546877
Epoch: 43, step: 792, loss: 0.3329337239265442, mean loss: 0.34325926734702616
Epoch: 43, step: 793, loss: 0.33135268092155457, mean loss: 0.34325907801098277
Epoch: 43, step: 794, loss: 0.32745781540870667, mean loss: 0.3432588267466101
Epoch: 43, step: 795, loss: 0.3191691040992737, mean loss: 0.343258443689069
Epoch: 43, step: 796, loss: 0.3383481800556183, mean loss: 0.34325836561080997
Epoch: 43, step: 797, loss: 0.4190271198749542, mean loss: 0.3432595703930371
Epoch: 43, step: 798, loss: 0.31023702025413513, mean loss: 0.3432590453171099
Epoch: 43, step: 799, loss: 0.30386778712272644, mean loss: 0.34325841898533166
Epoch: 43, step: 800, loss: 0.3056785762310028, mean loss: 0.34325782146505507
Epoch: 43, step: 801, loss: 0.3532472848892212, mean loss: 0.3432579802952046
Epoch: 43, step: 802, loss: 0.3095247447490692, mean loss: 0.34325744395311786
Epoch: 43, step: 803, loss: 0.3017941415309906, mean loss: 0.3432567847171979
Epoch: 43, step: 804, loss: 0.2780916094779968, mean loss: 0.3432557486554582
Epoch: 43, step: 805, loss: 0.3771042227745056, mean loss: 0.34325628680411346
Epoch: 43, step: 806, loss: 0.3068571090698242, mean loss: 0.34325570811164247
Epoch: 43, step: 807, loss: 0.31095391511917114, mean loss: 0.3432551945696235
Epoch: 43, step: 808, loss: 0.352664589881897, mean loss: 0.3432553441601755
Epoch: 43, step: 809, loss: 0.3398306369781494, mean loss: 0.34325528971505165
Epoch: 43, step: 810, loss: 0.32944783568382263, mean loss: 0.3432550702111483
Epoch: 43, step: 811, loss: 0.3335806131362915, mean loss: 0.34325491641398004
Epoch: 43, step: 812, loss: 0.3153620660305023, mean loss: 0.34325447300168554
Epoch: 43, step: 813, loss: 0.33716514706611633, mean loss: 0.34325437620128596
Epoch: 43, step: 814, loss: 0.3188590705394745, mean loss: 0.343253988401746
Epoch: 43, step: 815, loss: 0.3253883123397827, mean loss: 0.34325370440486064
Epoch: 43, step: 816, loss: 0.3259778618812561, mean loss: 0.3432534297884699
Epoch: 43, step: 817, loss: 0.32042592763900757, mean loss: 0.343253066928795
Epoch: 43, step: 818, loss: 0.34154602885246277, mean loss: 0.3432530397946201
Epoch: 43, step: 819, loss: 0.36442211270332336, mean loss: 0.343253376281664
Epoch: 43, step: 820, loss: 0.29175543785095215, mean loss: 0.3432525577236803
Epoch: 43, step: 821, loss: 0.36048486828804016, mean loss: 0.34325283162631826
Epoch: 43, step: 822, loss: 0.3537974953651428, mean loss: 0.3432529992280625
Epoch: 43, step: 823, loss: 0.3078608810901642, mean loss: 0.34325243669836997
Epoch: 43, step: 824, loss: 0.32069581747055054, mean loss: 0.34325207818446707
Epoch: 43, step: 825, loss: 0.3764742612838745, mean loss: 0.34325260620797543
Epoch: 43, step: 826, loss: 0.3026711940765381, mean loss: 0.3432519612293182
Epoch: 43, step: 827, loss: 0.3484157919883728, mean loss: 0.3432520432991014
Epoch: 43, step: 828, loss: 0.31333333253860474, mean loss: 0.3432515678026732
Epoch: 43, step: 829, loss: 0.3194551169872284, mean loss: 0.34325118961299683
Epoch: 43, step: 830, loss: 0.3407304584980011, mean loss: 0.3432511495524289
Epoch: 43, step: 831, loss: 0.29718467593193054, mean loss: 0.34325041745539725
Epoch: 43, step: 832, loss: 0.3314702808856964, mean loss: 0.34325023024623447
Epoch: 43, step: 833, loss: 0.3323787748813629, mean loss: 0.34325005748051973
Epoch: 43, step: 834, loss: 0.3314560055732727, mean loss: 0.34324987005617236
Epoch: 43, step: 835, loss: 0.34266898036003113, mean loss: 0.34324986082515124
Epoch: 43, step: 836, loss: 0.3101312518119812, mean loss: 0.3432493345398295
Epoch: 43, step: 837, loss: 0.36934545636177063, mean loss: 0.3432497492247464
Epoch: 43, step: 838, loss: 0.3180781602859497, mean loss: 0.3432493492376345
Epoch: 43, step: 839, loss: 0.3541414737701416, mean loss: 0.3432495223153141
Epoch: 43, step: 840, loss: 0.33048075437545776, mean loss: 0.34324931942068104
Epoch: 43, step: 841, loss: 0.34590646624565125, mean loss: 0.3432493616418465
Epoch: 43, step: 842, loss: 0.327777236700058, mean loss: 0.34324911579891426
Epoch: 43, step: 843, loss: 0.32376033067703247, mean loss: 0.3432488061385431
Epoch: 43, step: 844, loss: 0.34841954708099365, mean loss: 0.34324888829595357
Epoch: 43, step: 845, loss: 0.3099917769432068, mean loss: 0.34324835988527397
Epoch: 43, step: 846, loss: 0.334639310836792, mean loss: 0.34324822310126013
Epoch: 43, step: 847, loss: 0.37703606486320496, mean loss: 0.3432487599274718
Epoch: 43, step: 848, loss: 0.3145540654659271, mean loss: 0.3432483040291788
Epoch: 43, step: 849, loss: 0.31247982382774353, mean loss: 0.34324781519056224
Epoch: 43, step: 850, loss: 0.3316086232662201, mean loss: 0.34324763027417876
Epoch: 43, step: 851, loss: 0.33175599575042725, mean loss: 0.3432474477049978
Epoch: 43, step: 852, loss: 0.3301207721233368, mean loss: 0.3432472391630075
Epoch: 43, step: 853, loss: 0.3060734272003174, mean loss: 0.3432466485963001
Epoch: 43, step: 854, loss: 0.3616465926170349, mean loss: 0.34324694090481395
Epoch: 43, step: 855, loss: 0.31240180134773254, mean loss: 0.3432464508949716
Epoch: 43, step: 856, loss: 0.34291067719459534, mean loss: 0.34324644556091227
Epoch: 43, step: 857, loss: 0.31391915678977966, mean loss: 0.3432459796786443
Epoch: 43, step: 858, loss: 0.30230361223220825, mean loss: 0.34324532929394114
Epoch: 43, step: 859, loss: 0.28507575392723083, mean loss: 0.34324440526332467
Epoch: 43, step: 860, loss: 0.31764036417007446, mean loss: 0.34324399854655036
Epoch: 43, step: 861, loss: 0.35544586181640625, mean loss: 0.34324419236844045
Epoch: 43, step: 862, loss: 0.3483181297779083, mean loss: 0.3432442729646982
Epoch: 43, step: 863, loss: 0.3104404807090759, mean loss: 0.3432437519056688
Epoch: 43, step: 864, loss: 0.3491632044315338, mean loss: 0.34324384592940765
Epoch: 43, step: 865, loss: 0.390507310628891, mean loss: 0.3432445966436092
Epoch: 43, step: 866, loss: 0.33164072036743164, mean loss: 0.3432444123351501
Epoch: 43, step: 867, loss: 0.3473914563655853, mean loss: 0.3432444782030667
Epoch: 43, step: 868, loss: 0.32430300116539, mean loss: 0.3432441773584639
Epoch: 43, step: 869, loss: 0.3876437544822693, mean loss: 0.3432448825390033
Epoch: 43, step: 870, loss: 0.3629970848560333, mean loss: 0.34324519625026734
Epoch: 43, step: 871, loss: 0.3207521140575409, mean loss: 0.3432448390130811
Epoch: 43, step: 872, loss: 0.30689942836761475, mean loss: 0.3432442617811166
Epoch: 43, step: 873, loss: 0.3513491749763489, mean loss: 0.3432443904999997
Epoch: 43, step: 874, loss: 0.33099693059921265, mean loss: 0.3432441959939902
Epoch: 43, step: 875, loss: 0.33536234498023987, mean loss: 0.34324407082166436
Epoch: 43, step: 876, loss: 0.31930646300315857, mean loss: 0.343243690672578
Epoch: 43, step: 877, loss: 0.310679167509079, mean loss: 0.34324317352912614
Epoch: 43, step: 878, loss: 0.35902950167655945, mean loss: 0.34324342422116133
Epoch: 43, step: 879, loss: 0.3381216526031494, mean loss: 0.34324334288705066
Epoch: 43, step: 880, loss: 0.3132512867450714, mean loss: 0.3432428666185524
Epoch: 43, step: 881, loss: 0.326679527759552, mean loss: 0.3432426035998644
Epoch: 43, step: 882, loss: 0.3261004686355591, mean loss: 0.343242331394466
Epoch: 43, step: 883, loss: 0.33247360587120056, mean loss: 0.34324216039717304
Epoch: 43, step: 884, loss: 0.3415865898132324, mean loss: 0.3432421341086775
Epoch: 43, step: 885, loss: 0.3575419485569, mean loss: 0.3432423611691502
Epoch: 43, step: 886, loss: 0.3259003460407257, mean loss: 0.3432420858072815
Epoch: 43, step: 887, loss: 0.3333064913749695, mean loss: 0.3432419280493515
Epoch: 43, step: 888, loss: 0.32597586512565613, mean loss: 0.34324165390218137
Epoch: 43, step: 889, loss: 0.36717984080314636, mean loss: 0.34324203398199626
Epoch: 43, step: 890, loss: 0.33123549818992615, mean loss: 0.34324184335062286
Epoch: 43, step: 891, loss: 0.31886494159698486, mean loss: 0.34324145631738023
Epoch: 43, step: 892, loss: 0.3232506811618805, mean loss: 0.34324113892791996
Epoch: 43, step: 893, loss: 0.3282320499420166, mean loss: 0.34324090063545837
Epoch: 43, step: 894, loss: 0.29732269048690796, mean loss: 0.343240171624549
Epoch: 43, step: 895, loss: 0.32413288950920105, mean loss: 0.34323986827657615
Epoch: 43, step: 896, loss: 0.3386300206184387, mean loss: 0.3432397950916128
Epoch: 43, step: 897, loss: 0.2673012316226959, mean loss: 0.3432385895262299
Epoch: 43, step: 898, loss: 0.3272097110748291, mean loss: 0.3432383350632359
Epoch: 43, step: 899, loss: 0.36229634284973145, mean loss: 0.3432386376097146
Epoch: 43, step: 900, loss: 0.33010509610176086, mean loss: 0.343238429117636
Epoch: 43, step: 901, loss: 0.3517199158668518, mean loss: 0.34323856375723266
Epoch: 43, step: 902, loss: 0.30660897493362427, mean loss: 0.34323798228903957
Epoch: 43, step: 903, loss: 0.29991358518600464, mean loss: 0.3432372945565311
Epoch: 43, step: 904, loss: 0.3709595501422882, mean loss: 0.34323773461328916
Epoch: 43, step: 905, loss: 0.2949441969394684, mean loss: 0.343236968024863
Epoch: 43, step: 906, loss: 0.30841007828712463, mean loss: 0.3432364152083145
Epoch: 43, step: 907, loss: 0.336736798286438, mean loss: 0.34323631203979194
Epoch: 43, step: 908, loss: 0.330661416053772, mean loss: 0.3432361124414366
Epoch: 43, step: 909, loss: 0.3384200632572174, mean loss: 0.3432360359986382
Epoch: 43, step: 910, loss: 0.39453402161598206, mean loss: 0.34323685021360606
Epoch: 43, step: 911, loss: 0.34097278118133545, mean loss: 0.343236814278284
Epoch: 43, step: 912, loss: 0.31947773694992065, mean loss: 0.3432364371800009
Epoch: 43, step: 913, loss: 0.33093249797821045, mean loss: 0.34323624189797697
Epoch: 43, step: 914, loss: 0.3244410753250122, mean loss: 0.34323594359514437
Epoch: 43, step: 915, loss: 0.32734590768814087, mean loss: 0.34323569140437643
Epoch: 43, step: 916, loss: 0.3821769058704376, mean loss: 0.3432363094306023
Epoch: 43, step: 917, loss: 0.28999748826026917, mean loss: 0.3432354645040641
Epoch: 43, step: 918, loss: 0.3705417513847351, mean loss: 0.34323589786152364
Epoch: 43, step: 919, loss: 0.33013731241226196, mean loss: 0.34323568998706405
Epoch: 43, step: 920, loss: 0.31461068987846375, mean loss: 0.3432352357157215
Epoch: 43, step: 921, loss: 0.37274107336997986, mean loss: 0.34323570395829706
Epoch: 43, step: 922, loss: 0.35908016562461853, mean loss: 0.34323595539782203
Epoch: 43, step: 923, loss: 0.3328990936279297, mean loss: 0.3432357913623109
Epoch: 43, step: 924, loss: 0.3624415993690491, mean loss: 0.3432360961341662
Epoch: 43, step: 925, loss: 0.3350802958011627, mean loss: 0.34323596671399526
Epoch: 43, step: 926, loss: 0.2945473790168762, mean loss: 0.34323519411227676
Epoch: 43, step: 927, loss: 0.31800663471221924, mean loss: 0.34323479378604066
Epoch: 43, step: 928, loss: 0.31338757276535034, mean loss: 0.3432343201784968
Epoch: 43, step: 929, loss: 0.34906187653541565, mean loss: 0.34323441264710075
Epoch: 43, step: 930, loss: 0.3125784695148468, mean loss: 0.34323392622241244
Epoch: 43, step: 931, loss: 0.31241193413734436, mean loss: 0.3432334371707482
Epoch: 43, step: 932, loss: 0.35161855816841125, mean loss: 0.3432335702151115
Epoch: 43, step: 933, loss: 0.33145710825920105, mean loss: 0.343233383364257
Epoch: 43, step: 934, loss: 0.35144591331481934, mean loss: 0.34323351366603166
Epoch: 43, step: 935, loss: 0.2988223433494568, mean loss: 0.34323280903998743
Epoch: 43, step: 936, loss: 0.32468342781066895, mean loss: 0.34323251474083577
Epoch: 43, step: 937, loss: 0.3326485753059387, mean loss: 0.34323234682175857
Epoch: 43, step: 938, loss: 0.3369365930557251, mean loss: 0.3432322469383081
Epoch: 43, step: 939, loss: 0.3178287744522095, mean loss: 0.34323184391329725
Epoch: 43, step: 940, loss: 0.3279877007007599, mean loss: 0.3432316020694502
Epoch: 43, step: 941, loss: 0.31428468227386475, mean loss: 0.34323114284236966
Epoch: 43, step: 942, loss: 0.32101258635520935, mean loss: 0.3432307903626919
Epoch: 43, step: 943, loss: 0.40799668431282043, mean loss: 0.3432318178056443
Epoch: 43, step: 944, loss: 0.31925976276397705, mean loss: 0.3432314375201764
Epoch: 43, step: 945, loss: 0.29268592596054077, mean loss: 0.3432306356941102
Epoch: 43, step: 946, loss: 0.376571387052536, mean loss: 0.3432311645849771
Epoch: 43, step: 947, loss: 0.33385342359542847, mean loss: 0.3432310158263954
Epoch: 43, step: 948, loss: 0.3383992612361908, mean loss: 0.34323093918175795
Epoch: 43, step: 949, loss: 0.34387344121932983, mean loss: 0.3432309493734086
Epoch: 43, step: 950, loss: 0.34201186895370483, mean loss: 0.3432309300361242
Epoch: 43, step: 951, loss: 0.3390880227088928, mean loss: 0.3432308643215863
Epoch: 43, step: 952, loss: 0.31651392579078674, mean loss: 0.3432304405458938
Epoch: 43, step: 953, loss: 0.3669561743736267, mean loss: 0.34323081687006707
Epoch: 43, step: 954, loss: 0.3710559904575348, mean loss: 0.3432312582102353
Epoch: 43, step: 955, loss: 0.32757967710494995, mean loss: 0.34323100996158185
Epoch: 43, step: 956, loss: 0.3534221351146698, mean loss: 0.3432311715997546
Epoch: 43, step: 957, loss: 0.3306642472743988, mean loss: 0.34323097228295324
Epoch: 43, step: 958, loss: 0.33537590503692627, mean loss: 0.34323084770019885
Epoch: 43, step: 959, loss: 0.3381429612636566, mean loss: 0.34323076700670085
Epoch: 43, step: 960, loss: 0.32419684529304504, mean loss: 0.343230465134915
Epoch: 43, step: 961, loss: 0.3598175644874573, mean loss: 0.3432307281967248
Epoch: 43, step: 962, loss: 0.330971360206604, mean loss: 0.3432305337733168
Epoch: 43, step: 963, loss: 0.33981966972351074, mean loss: 0.3432304796806999
Epoch: 43, step: 964, loss: 0.39221295714378357, mean loss: 0.343231256477526
Epoch: 43, step: 965, loss: 0.28893473744392395, mean loss: 0.34323039542073647
Epoch: 43, step: 966, loss: 0.32768818736076355, mean loss: 0.34323014894984316
Epoch: 43, step: 967, loss: 0.33491581678390503, mean loss: 0.3432300171018862
Epoch: 43, step: 968, loss: 0.36861324310302734, mean loss: 0.3432304196204952
Epoch: 43, step: 969, loss: 0.33758825063705444, mean loss: 0.3432303301503074
Epoch: 43, step: 970, loss: 0.34612470865249634, mean loss: 0.3432303760469267
Epoch: 43, step: 971, loss: 0.3244222104549408, mean loss: 0.343230077807589
Epoch: 43, step: 972, loss: 0.35889115929603577, mean loss: 0.3432303261399681
Epoch: 43, step: 973, loss: 0.3250647783279419, mean loss: 0.3432300380996958
Epoch: 43, step: 974, loss: 0.3483152687549591, mean loss: 0.343230118731891
Epoch: 43, step: 975, loss: 0.3077738583087921, mean loss: 0.34322955654091586
Epoch: 43, step: 976, loss: 0.342693030834198, mean loss: 0.34322954803395195
Epoch: 43, step: 977, loss: 0.3102875351905823, mean loss: 0.34322902572520225
Epoch: 43, step: 978, loss: 0.2950310707092285, mean loss: 0.34322826153952235
Epoch: 43, step: 979, loss: 0.337268203496933, mean loss: 0.34322816704342196
Epoch: 43, step: 980, loss: 0.3575230538845062, mean loss: 0.34322839368377267
Epoch: 43, step: 981, loss: 0.34724560379981995, mean loss: 0.3432284573742016
Epoch: 43, step: 982, loss: 0.3493289053440094, mean loss: 0.3432285540915693
Epoch: 43, step: 983, loss: 0.3224536180496216, mean loss: 0.34322822472800724
Epoch: 43, step: 984, loss: 0.40126878023147583, mean loss: 0.3432291448820333
Epoch: 43, step: 985, loss: 0.3710351288318634, mean loss: 0.343229585701082
Epoch: 43, step: 986, loss: 0.3132457137107849, mean loss: 0.34322911036266524
Epoch: 43, step: 987, loss: 0.31369104981422424, mean loss: 0.3432286420991816
Epoch: 43, step: 988, loss: 0.37224116921424866, mean loss: 0.3432291020241529
Epoch: 43, step: 989, loss: 0.34314674139022827, mean loss: 0.3432291007185406
Epoch: 43, step: 990, loss: 0.33717289566993713, mean loss: 0.3432290047147829
Epoch: 43, step: 991, loss: 0.2837948501110077, mean loss: 0.34322806257169425
Epoch: 43, step: 992, loss: 0.3061860203742981, mean loss: 0.343227475394993
Epoch: 43, step: 993, loss: 0.2969745993614197, mean loss: 0.3432267422231952
Epoch: 43, step: 994, loss: 0.3156927824020386, mean loss: 0.34322630577892266
Epoch: 43, step: 995, loss: 0.32646864652633667, mean loss: 0.34322604015536107
Epoch: 43, step: 996, loss: 0.30998075008392334, mean loss: 0.34322551319677763
Epoch: 43, step: 997, loss: 0.3669857978820801, mean loss: 0.3432258898061402
Epoch: 43, step: 998, loss: 0.32764190435409546, mean loss: 0.3432256427980812
Epoch: 43, step: 999, loss: 0.3272666931152344, mean loss: 0.3432253898508029
Epoch: 43, step: 1000, loss: 0.3192252814769745, mean loss: 0.34322500945823364
Epoch: 43, step: 1001, loss: 0.3200918436050415, mean loss: 0.34322464281218407
Epoch: 43, step: 1002, loss: 0.30837282538414, mean loss: 0.3432240904416725
Epoch: 43, step: 1003, loss: 0.3473550081253052, mean loss: 0.34322415591203015
Epoch: 43, step: 1004, loss: 0.31694403290748596, mean loss: 0.34322373940850376
Epoch: 43, step: 1005, loss: 0.3060302138328552, mean loss: 0.34322314995201425
Epoch: 43, step: 1006, loss: 0.31482404470443726, mean loss: 0.3432226998798222
Epoch: 43, step: 1007, loss: 0.37607020139694214, mean loss: 0.3432232204424453
Epoch: 43, step: 1008, loss: 0.3029683530330658, mean loss: 0.34322258249903065
Epoch: 43, step: 1009, loss: 0.35327404737472534, mean loss: 0.34322274178819545
Epoch: 43, step: 1010, loss: 0.32989245653152466, mean loss: 0.3432225305417372
Epoch: 43, step: 1011, loss: 0.29047316312789917, mean loss: 0.34322169463010854
Epoch: 43, step: 1012, loss: 0.36931151151657104, mean loss: 0.34322210806512776
Epoch: 43, step: 1013, loss: 0.3137449324131012, mean loss: 0.3432216409593747
Epoch: 43, step: 1014, loss: 0.305522620677948, mean loss: 0.3432210435768295
Epoch: 43, step: 1015, loss: 0.3118383288383484, mean loss: 0.3432205462909903
Epoch: 43, step: 1016, loss: 0.3390587866306305, mean loss: 0.3432204803454095
Epoch: 43, step: 1017, loss: 0.3277921676635742, mean loss: 0.34322023587840456
Epoch: 43, step: 1018, loss: 0.3134039640426636, mean loss: 0.34321976343664584
Epoch: 43, step: 1019, loss: 0.29680830240249634, mean loss: 0.34321902805413484
Epoch: 43, step: 1020, loss: 0.3410080373287201, mean loss: 0.3432189930218796
Epoch: 43, step: 1021, loss: 0.3251454830169678, mean loss: 0.34321870665894894
Epoch: 43, step: 1022, loss: 0.3675929009914398, mean loss: 0.3432190928459779
Epoch: 43, step: 1023, loss: 0.3673776388168335, mean loss: 0.3432194756101894
Epoch: 43, step: 1024, loss: 0.325295627117157, mean loss: 0.34321919163204573
Epoch: 43, step: 1025, loss: 0.34697484970092773, mean loss: 0.34321925113421736
Epoch: 43, step: 1026, loss: 0.32449373602867126, mean loss: 0.3432189544641956
Epoch: 43, step: 1027, loss: 0.3059890568256378, mean loss: 0.34321836463691996
Epoch: 43, step: 1028, loss: 0.32355761528015137, mean loss: 0.3432180531597672
Epoch: 43, step: 1029, loss: 0.3609837293624878, mean loss: 0.3432183346095978
Epoch: 43, step: 1030, loss: 0.3242546319961548, mean loss: 0.3432180341849885
Epoch: 43, step: 1031, loss: 0.32518279552459717, mean loss: 0.3432177484737113
Epoch: 43, step: 1032, loss: 0.2969421148300171, mean loss: 0.34321701539436644
Epoch: 43, step: 1033, loss: 0.29113301634788513, mean loss: 0.34321619031438283
Epoch: 43, step: 1034, loss: 0.3248099386692047, mean loss: 0.34321589873943636
Epoch: 43, step: 1035, loss: 0.3353833556175232, mean loss: 0.3432157746654419
Epoch: 43, step: 1036, loss: 0.32893696427345276, mean loss: 0.3432155484807979
Epoch: 43, step: 1037, loss: 0.3230629861354828, mean loss: 0.3432152292575705
Epoch: 43, step: 1038, loss: 0.32351046800613403, mean loss: 0.3432149171326041
Epoch: 43, step: 1039, loss: 0.32422590255737305, mean loss: 0.34321461634988576
Epoch: 43, step: 1040, loss: 0.3503546118736267, mean loss: 0.34321472944439296
Epoch: 43, step: 1041, loss: 0.3411213159561157, mean loss: 0.34321469628613455
Epoch: 43, step: 1042, loss: 0.32422223687171936, mean loss: 0.34321439546314547
Epoch: 43, step: 1043, loss: 0.3243855834007263, mean loss: 0.3432140972369027
Epoch: 43, step: 1044, loss: 0.3249223828315735, mean loss: 0.343213807522244
Epoch: 43, step: 1045, loss: 0.31414100527763367, mean loss: 0.34321334705782885
Epoch: 43, step: 1046, loss: 0.3111252784729004, mean loss: 0.3432128388447025
Epoch: 43, step: 1047, loss: 0.3294956684112549, mean loss: 0.34321262159461646
Epoch: 43, step: 1048, loss: 0.3314206898212433, mean loss: 0.34321243483907293
Epoch: 43, step: 1049, loss: 0.34392720460891724, mean loss: 0.34321244615910984
Epoch: 43, step: 1050, loss: 0.37894153594970703, mean loss: 0.3432130120031431
Epoch: 43, step: 1051, loss: 0.2928728461265564, mean loss: 0.34321221477512653
Epoch: 43, step: 1052, loss: 0.3322916030883789, mean loss: 0.3432120418301319
Epoch: 43, step: 1053, loss: 0.3341441750526428, mean loss: 0.3432118982285296
Epoch: 43, step: 1054, loss: 0.31675592064857483, mean loss: 0.34321147926994755
Epoch: 43, step: 1055, loss: 0.32862889766693115, mean loss: 0.34321124834289357
Epoch: 43, step: 1056, loss: 0.3223054111003876, mean loss: 0.34321091728718023
Epoch: 43, step: 1057, loss: 0.32132861018180847, mean loss: 0.3432105707740036
Epoch: 43, step: 1058, loss: 0.33919981122016907, mean loss: 0.3432105072633774
Epoch: 43, step: 1059, loss: 0.3202001750469208, mean loss: 0.34321014289910995
Epoch: 43, step: 1060, loss: 0.3219214975833893, mean loss: 0.3432098058027675
Epoch: 43, step: 1061, loss: 0.33557605743408203, mean loss: 0.34320968492763104
Epoch: 43, step: 1062, loss: 0.32725533843040466, mean loss: 0.34320943230556633
Epoch: 43, step: 1063, loss: 0.355377197265625, mean loss: 0.34320962496762475
Epoch: 43, step: 1064, loss: 0.3785597085952759, mean loss: 0.34321018468521153
Epoch: 43, step: 1065, loss: 0.31676986813545227, mean loss: 0.34320976604756387
Epoch: 43, step: 1066, loss: 0.31623998284339905, mean loss: 0.34320933903346923
Epoch: 43, step: 1067, loss: 0.3513820171356201, mean loss: 0.34320946842989264
Epoch: 43, step: 1068, loss: 0.31332477927207947, mean loss: 0.3432089952789109
Epoch: 43, step: 1069, loss: 0.40261486172676086, mean loss: 0.3432099358106618
Epoch: 43, step: 1070, loss: 0.2958308160305023, mean loss: 0.34320918570189907
Epoch: 43, step: 1071, loss: 0.29231002926826477, mean loss: 0.34320837987648534
Epoch: 43, step: 1072, loss: 0.3078523576259613, mean loss: 0.34320782013577056
Epoch: 43, step: 1073, loss: 0.2957589328289032, mean loss: 0.34320706895812264
Epoch: 43, step: 1074, loss: 0.3069627285003662, mean loss: 0.34320649517211954
Epoch: 43, step: 1075, loss: 0.34933388233184814, mean loss: 0.3432065921735627
Epoch: 43, step: 1076, loss: 0.320710152387619, mean loss: 0.34320623604255246
Epoch: 43, step: 1077, loss: 0.30895787477493286, mean loss: 0.34320569388074673
Epoch: 43, step: 1078, loss: 0.29788175225257874, mean loss: 0.3432049764005481
Epoch: 43, step: 1079, loss: 0.32143470644950867, mean loss: 0.3432046317815721
Epoch: 43, step: 1080, loss: 0.31976717710494995, mean loss: 0.3432042607772716
Epoch: 43, step: 1081, loss: 0.32190582156181335, mean loss: 0.34320392363795454
Epoch: 43, step: 1082, loss: 0.32011544704437256, mean loss: 0.3432035581693895
Epoch: 43, step: 1083, loss: 0.35476502776145935, mean loss: 0.3432037411735302
Epoch: 43, step: 1084, loss: 0.33772775530815125, mean loss: 0.3432036544966404
Epoch: 43, step: 1085, loss: 0.3228257894515991, mean loss: 0.34320333194978797
Epoch: 43, step: 1086, loss: 0.3589332699775696, mean loss: 0.3432035809239412
Epoch: 43, step: 1087, loss: 0.3304009437561035, mean loss: 0.3432033782864425
Epoch: 43, step: 1088, loss: 0.32179322838783264, mean loss: 0.34320303941637237
Epoch: 43, step: 1089, loss: 0.3159603774547577, mean loss: 0.34320260823879073
Epoch: 43, step: 1090, loss: 0.31944483518600464, mean loss: 0.3432022322235168
Epoch: 43, step: 1091, loss: 0.33229097723960876, mean loss: 0.34320205953335814
Epoch: 43, step: 1092, loss: 0.3099004328250885, mean loss: 0.34320153248379404
Epoch: 43, step: 1093, loss: 0.3571167290210724, mean loss: 0.3432017527097387
Epoch: 43, step: 1094, loss: 0.3031206429004669, mean loss: 0.3432011183844849
Epoch: 43, step: 1095, loss: 0.3532349467277527, mean loss: 0.34320127717774224
Epoch: 43, step: 1096, loss: 0.3435624837875366, mean loss: 0.3432012828940316
Epoch: 43, step: 1097, loss: 0.30992794036865234, mean loss: 0.34320075633377645
Epoch: 43, step: 1098, loss: 0.3135487139225006, mean loss: 0.34320028708906736
Epoch: 43, step: 1099, loss: 0.31411507725715637, mean loss: 0.34319982682178934
Epoch: 43, step: 1100, loss: 0.30174604058265686, mean loss: 0.34319917083479334
Epoch: 43, step: 1101, loss: 0.2915048897266388, mean loss: 0.34319835280964683
Epoch: 43, step: 1102, loss: 0.3556348979473114, mean loss: 0.34319854960599366
Epoch: 43, step: 1103, loss: 0.3558446764945984, mean loss: 0.34319874971560327
Epoch: 43, step: 1104, loss: 0.323041170835495, mean loss: 0.34319843075142964
Epoch: 43, step: 1105, loss: 0.3125935196876526, mean loss: 0.34319794648118274
Epoch: 43, step: 1106, loss: 0.3333219885826111, mean loss: 0.3431977902135535
Epoch: 43, step: 1107, loss: 0.3369561433792114, mean loss: 0.3431976914533188
Epoch: 43, step: 1108, loss: 0.3405737280845642, mean loss: 0.343197649935568
Epoch: 43, step: 1109, loss: 0.34558406472206116, mean loss: 0.34319768769410075
Epoch: 43, step: 1110, loss: 0.3163926303386688, mean loss: 0.3431972635835782
Epoch: 43, step: 1111, loss: 0.3371039628982544, mean loss: 0.3431971671766944
Epoch: 43, step: 1112, loss: 0.3473351299762726, mean loss: 0.3431972326456098
Epoch: 43, step: 1113, loss: 0.37068742513656616, mean loss: 0.3431976675757191
Epoch: 43, step: 1114, loss: 0.36569473147392273, mean loss: 0.3431980235024978
Epoch: 43, step: 1115, loss: 0.39198562502861023, mean loss: 0.34319879536051456
Epoch: 43, step: 1116, loss: 0.32933104038238525, mean loss: 0.3431985759652547
Epoch: 43, step: 1117, loss: 0.3493630290031433, mean loss: 0.3431986734886377
Epoch: 43, step: 1118, loss: 0.34189218282699585, mean loss: 0.3431986528199145
Epoch: 43, step: 1119, loss: 0.31538888812065125, mean loss: 0.3431982128755258
Epoch: 43, step: 1120, loss: 0.31826335191726685, mean loss: 0.34319781841772506
Epoch: 43, step: 1121, loss: 0.3160700500011444, mean loss: 0.34319738927594606
Epoch: 43, step: 1122, loss: 0.3340781629085541, mean loss: 0.3431972450186279
Epoch: 43, step: 1123, loss: 0.35627177357673645, mean loss: 0.3431974518417195
Epoch: 43, step: 1124, loss: 0.332635760307312, mean loss: 0.34319728477128697
Epoch: 43, step: 1125, loss: 0.33278337121009827, mean loss: 0.3431971200410905
Epoch: 43, step: 1126, loss: 0.329754114151001, mean loss: 0.3431969073992282
Epoch: 43, step: 1127, loss: 0.3974703848361969, mean loss: 0.34319776588510986
Epoch: 43, step: 1128, loss: 0.3424266278743744, mean loss: 0.343197753687612
Epoch: 43, step: 1129, loss: 0.33562344312667847, mean loss: 0.3431976338826302
Epoch: 43, step: 1130, loss: 0.3074551522731781, mean loss: 0.3431970685427759
Epoch: 43, step: 1131, loss: 0.38879474997520447, mean loss: 0.3431977897512004
Epoch: 43, step: 1132, loss: 0.36339080333709717, mean loss: 0.3431981091345707
Epoch: 43, step: 1133, loss: 0.3270384967327118, mean loss: 0.34319785354964677
Epoch: 43, step: 1134, loss: 0.33338749408721924, mean loss: 0.3431976983887272
Epoch: 43, step: 1135, loss: 0.3602701723575592, mean loss: 0.34319796840318234
Epoch: 43, step: 1136, loss: 0.3648297190666199, mean loss: 0.34319831052073385
Epoch: 43, step: 1137, loss: 0.3524211049079895, mean loss: 0.3431984563817869
Epoch: 43, step: 1138, loss: 0.31484556198120117, mean loss: 0.343198007979984
Epoch: 43, step: 1139, loss: 0.334232896566391, mean loss: 0.34319786619874326
Epoch: 43, step: 1140, loss: 0.35216251015663147, mean loss: 0.3431980079703492
Epoch: 43, step: 1141, loss: 0.3631595969200134, mean loss: 0.3431983236484488
Epoch: 43, step: 1142, loss: 0.31334418058395386, mean loss: 0.3431978515342231
Epoch: 43, step: 1143, loss: 0.3212251365184784, mean loss: 0.34319750406260857
Epoch: 43, step: 1144, loss: 0.3535013496875763, mean loss: 0.34319766700274845
Epoch: 43, step: 1145, loss: 0.3587184548377991, mean loss: 0.34319791243726305
Epoch: 43, step: 1146, loss: 0.33750343322753906, mean loss: 0.3431978223903109
Epoch: 43, step: 1147, loss: 0.3503471314907074, mean loss: 0.3431979354407394
Epoch: 43, step: 1148, loss: 0.31483936309814453, mean loss: 0.34319748702005753
Epoch: 43, step: 1149, loss: 0.29845431447029114, mean loss: 0.3431967795286349
Epoch: 43, step: 1150, loss: 0.34184736013412476, mean loss: 0.3431967581915795
Epoch: 43, step: 1151, loss: 0.3613470792770386, mean loss: 0.34319704518040195
Epoch: 43, step: 1152, loss: 0.38011568784713745, mean loss: 0.3431976289205026
Epoch: 43, step: 1153, loss: 0.30823996663093567, mean loss: 0.34319707619523476
Epoch: 43, step: 1154, loss: 0.34864136576652527, mean loss: 0.34319716227504204
Epoch: 43, step: 1155, loss: 0.32938867807388306, mean loss: 0.3431969439521828
Epoch: 43, step: 1156, loss: 0.3535396158695221, mean loss: 0.34319710747527277
Epoch: 43, step: 1157, loss: 0.2785934805870056, mean loss: 0.34319608607405716
Epoch: 43, step: 1158, loss: 0.33076465129852295, mean loss: 0.3431958895327412
Epoch: 43, step: 1159, loss: 0.3409700393676758, mean loss: 0.343195854342547
Epoch: 43, step: 1160, loss: 0.33745628595352173, mean loss: 0.3431957636026866
Epoch: 43, step: 1161, loss: 0.3457522392272949, mean loss: 0.34319580401871763
Epoch: 43, step: 1162, loss: 0.3835930824279785, mean loss: 0.3431964426603809
Epoch: 43, step: 1163, loss: 0.33366650342941284, mean loss: 0.34319629200369645
Epoch: 43, step: 1164, loss: 0.3254465162754059, mean loss: 0.34319601140588546
Epoch: 43, step: 1165, loss: 0.3563114106655121, mean loss: 0.34319621873775275
Epoch: 43, step: 1166, loss: 0.32718560099601746, mean loss: 0.34319596564147015
Epoch: 43, step: 1167, loss: 0.3816854655742645, mean loss: 0.3431965740749183
Epoch: 43, step: 1168, loss: 0.3472231924533844, mean loss: 0.3431966377257993
Epoch: 43, step: 1169, loss: 0.3386671543121338, mean loss: 0.3431965661269973
Epoch: 43, step: 1170, loss: 0.32869619131088257, mean loss: 0.3431963369191694
Epoch: 43, step: 1171, loss: 0.29960593581199646, mean loss: 0.3431956478953785
Epoch: 43, step: 1172, loss: 0.2971084415912628, mean loss: 0.3431949194166572
Epoch: 43, step: 1173, loss: 0.3348931670188904, mean loss: 0.3431947881968488
Epoch: 43, step: 1174, loss: 0.3715105950832367, mean loss: 0.34319523575729716
Epoch: 43, step: 1175, loss: 0.3016636371612549, mean loss: 0.34319457931804515
Epoch: 43, step: 1176, loss: 0.35070231556892395, mean loss: 0.3431946979817865
Epoch: 43, step: 1177, loss: 0.332503080368042, mean loss: 0.3431945289977875
Epoch: 43, step: 1178, loss: 0.3147478401660919, mean loss: 0.343194079397041
Epoch: 43, step: 1179, loss: 0.3204974830150604, mean loss: 0.34319372068234283
Epoch: 43, step: 1180, loss: 0.3021825850009918, mean loss: 0.3431930725206359
Epoch: 43, step: 1181, loss: 0.33139437437057495, mean loss: 0.3431928860507091
Epoch: 43, step: 1182, loss: 0.36812731623649597, mean loss: 0.34319328011519246
Epoch: 43, step: 1183, loss: 0.31187888979911804, mean loss: 0.3431927852294488
Epoch: 43, step: 1184, loss: 0.32424068450927734, mean loss: 0.34319248571934685
Epoch: 43, step: 1185, loss: 0.30313223600387573, mean loss: 0.34319185263597324
Epoch: 43, step: 1186, loss: 0.3274730443954468, mean loss: 0.343191604231159
Epoch: 43, step: 1187, loss: 0.31868883967399597, mean loss: 0.34319121701932975
Epoch: 43, step: 1188, loss: 0.31249094009399414, mean loss: 0.3431907318772346
Epoch: 43, step: 1189, loss: 0.3490216135978699, mean loss: 0.34319082401847095
Epoch: 43, step: 1190, loss: 0.3159961998462677, mean loss: 0.34319039428814574
Epoch: 43, step: 1191, loss: 0.3289923369884491, mean loss: 0.3431901699335332
Epoch: 43, step: 1192, loss: 0.3053278923034668, mean loss: 0.34318957165151326
Epoch: 43, step: 1193, loss: 0.2946183979511261, mean loss: 0.34318880416464886
Epoch: 43, step: 1194, loss: 0.3161552846431732, mean loss: 0.3431883770071043
Epoch: 43, step: 1195, loss: 0.3346273601055145, mean loss: 0.34318824173632784
Epoch: 43, step: 1196, loss: 0.3139011263847351, mean loss: 0.3431877789842643
Epoch: 43, step: 1197, loss: 0.31475934386253357, mean loss: 0.34318732980690414
Epoch: 43, step: 1198, loss: 0.3588525950908661, mean loss: 0.34318757731864014
Epoch: 43, step: 1199, loss: 0.3010494112968445, mean loss: 0.3431869115446715
Epoch: 43, step: 1200, loss: 0.3462529480457306, mean loss: 0.343186959986624
Epoch: 43, step: 1201, loss: 0.3235112428665161, mean loss: 0.3431866491243445
Epoch: 43, step: 1202, loss: 0.3566989302635193, mean loss: 0.34318686260536413
Epoch: 43, step: 1203, loss: 0.3221847414970398, mean loss: 0.34318653079733347
Epoch: 43, step: 1204, loss: 0.3905565142631531, mean loss: 0.34318727917377256
Epoch: 43, step: 1205, loss: 0.32766470313072205, mean loss: 0.343187033943654
Epoch: 43, step: 1206, loss: 0.352592408657074, mean loss: 0.34318718253012004
Epoch: 43, step: 1207, loss: 0.32246851921081543, mean loss: 0.34318685522106285
Epoch: 43, step: 1208, loss: 0.3277953863143921, mean loss: 0.34318661207373646
Epoch: 43, step: 1209, loss: 0.3603900074958801, mean loss: 0.3431868838407489
Epoch: 43, step: 1210, loss: 0.3500062823295593, mean loss: 0.3431869915670571
Epoch: 43, step: 1211, loss: 0.3552166819572449, mean loss: 0.34318718159755107
Epoch: 43, step: 1212, loss: 0.34581756591796875, mean loss: 0.3431872231485237
Epoch: 43, step: 1213, loss: 0.3674658536911011, mean loss: 0.3431876066608376
Epoch: 43, step: 1214, loss: 0.35100966691970825, mean loss: 0.34318773021842613
Epoch: 43, step: 1215, loss: 0.3442334234714508, mean loss: 0.34318774673597924
Epoch: 43, step: 1216, loss: 0.32913699746131897, mean loss: 0.34318752479677195
Epoch: 43, step: 1217, loss: 0.2924688756465912, mean loss: 0.3431867236808479
Epoch: 43, step: 1218, loss: 0.3441067337989807, mean loss: 0.3431867382124478
Epoch: 43, step: 1219, loss: 0.3150804340839386, mean loss: 0.343186294279163
Epoch: 43, step: 1220, loss: 0.3385676443576813, mean loss: 0.34318622132969095
Epoch: 43, step: 1221, loss: 0.32343557476997375, mean loss: 0.34318590938215077
Epoch: 43, step: 1222, loss: 0.35158422589302063, mean loss: 0.3431860420255451
Epoch: 43, step: 1223, loss: 0.3389665186405182, mean loss: 0.3431859753832527
Epoch: 43, step: 1224, loss: 0.3614315688610077, mean loss: 0.3431862635458864
Epoch: 43, step: 1225, loss: 0.33054402470588684, mean loss: 0.3431860638832495
Epoch: 43, step: 1226, loss: 0.3149595856666565, mean loss: 0.34318561810112697
Epoch: 43, step: 1227, loss: 0.3372361958026886, mean loss: 0.3431855241430995
Epoch: 43, step: 1228, loss: 0.3413016200065613, mean loss: 0.34318549439145096
Epoch: 43, step: 1229, loss: 0.3431902229785919, mean loss: 0.34318549446612623
Epoch: 43, step: 1230, loss: 0.30188241600990295, mean loss: 0.34318484220583445
Epoch: 43, step: 1231, loss: 0.32174497842788696, mean loss: 0.3431845036317744
Epoch: 43, step: 1232, loss: 0.3057747781276703, mean loss: 0.3431839128741667
Epoch: 43, step: 1233, loss: 0.3630526065826416, mean loss: 0.3431842266267124
Epoch: 43, step: 1234, loss: 0.3400060832500458, mean loss: 0.34318417644048255
Epoch: 43, step: 1235, loss: 0.3084367513656616, mean loss: 0.3431836277507233
Epoch: 43, step: 1236, loss: 0.3089219629764557, mean loss: 0.34318308674005243
Epoch: 43, step: 1237, loss: 0.316137433052063, mean loss: 0.3431826596809385
Epoch: 43, step: 1238, loss: 0.34400320053100586, mean loss: 0.343182672637324
Epoch: 43, step: 1239, loss: 0.3474122881889343, mean loss: 0.34318273942213345
Epoch: 43, step: 1240, loss: 0.3399112820625305, mean loss: 0.3431826877672717
Epoch: 43, step: 1241, loss: 0.3517998158931732, mean loss: 0.34318282382575727
Epoch: 43, step: 1242, loss: 0.33020249009132385, mean loss: 0.3431826188785127
Epoch: 43, step: 1243, loss: 0.29395315051078796, mean loss: 0.3431818416038448
Epoch: 43, step: 1244, loss: 0.3620782792568207, mean loss: 0.3431821399513771
Epoch: 43, step: 1245, loss: 0.30111929774284363, mean loss: 0.3431814758501707
Epoch: 43, step: 1246, loss: 0.26985442638397217, mean loss: 0.3431803181582358
Epoch: 43, step: 1247, loss: 0.35429880023002625, mean loss: 0.34318049369473835
Epoch: 43, step: 1248, loss: 0.3828442394733429, mean loss: 0.3431811198886061
Epoch: 43, step: 1249, loss: 0.3354727029800415, mean loss: 0.3431809981934132
Epoch: 43, step: 1250, loss: 0.2973799407482147, mean loss: 0.34318027512918436
Epoch: 43, step: 1251, loss: 0.3233943283557892, mean loss: 0.343179962772106
Epoch: 43, step: 1252, loss: 0.3006385266780853, mean loss: 0.343179291188933
Epoch: 43, step: 1253, loss: 0.3060835003852844, mean loss: 0.3431787055830415
Epoch: 43, step: 1254, loss: 0.32945504784584045, mean loss: 0.343178488940458
Epoch: 43, step: 1255, loss: 0.33691930770874023, mean loss: 0.3431783901341621
Epoch: 43, step: 1256, loss: 0.3153046667575836, mean loss: 0.34317795013158314
Epoch: 43, step: 1257, loss: 0.2977599799633026, mean loss: 0.3431772331944061
Epoch: 43, step: 1258, loss: 0.32400310039520264, mean loss: 0.34317693052936843
Epoch: 43, step: 1259, loss: 0.30083736777305603, mean loss: 0.34317626220693576
Epoch: 43, step: 1260, loss: 0.3010794520378113, mean loss: 0.34317559772679795
Epoch: 43, step: 1261, loss: 0.305329829454422, mean loss: 0.34317500035696696
Epoch: 43, step: 1262, loss: 0.31343454122543335, mean loss: 0.34317453093136313
Epoch: 43, step: 1263, loss: 0.33126315474510193, mean loss: 0.34317434292428906
Epoch: 43, step: 1264, loss: 0.31275674700737, mean loss: 0.343173862825864
Epoch: 43, step: 1265, loss: 0.28256329894065857, mean loss: 0.3431729061895452
Epoch: 43, step: 1266, loss: 0.3157137632369995, mean loss: 0.3431724727997671
Epoch: 43, step: 1267, loss: 0.31271979212760925, mean loss: 0.3431719921703373
Epoch: 43, step: 1268, loss: 0.3463863134384155, mean loss: 0.34317204290061726
Epoch: 43, step: 1269, loss: 0.3257615864276886, mean loss: 0.34317176812304595
Epoch: 43, step: 1270, loss: 0.33292078971862793, mean loss: 0.3431716063412742
Epoch: 43, step: 1271, loss: 0.31430909037590027, mean loss: 0.34317115083789745
Epoch: 43, step: 1272, loss: 0.3299712538719177, mean loss: 0.3431709425226293
Epoch: 43, step: 1273, loss: 0.32689589262008667, mean loss: 0.3431706856806336
Epoch: 43, step: 1274, loss: 0.3608270585536957, mean loss: 0.343170964317351
Epoch: 43, step: 1275, loss: 0.36269885301589966, mean loss: 0.3431712724837552
Epoch: 43, step: 1276, loss: 0.3610415756702423, mean loss: 0.3431715544876244
Epoch: 43, step: 1277, loss: 0.302501380443573, mean loss: 0.34317091269854366
Epoch: 43, step: 1278, loss: 0.3095138370990753, mean loss: 0.3431703815869059
Epoch: 43, step: 1279, loss: 0.3158182203769684, mean loss: 0.34316994997418715
Epoch: 43, step: 1280, loss: 0.2968425452709198, mean loss: 0.34316921894670377
Epoch: 43, step: 1281, loss: 0.3470706641674042, mean loss: 0.34316928050894097
Epoch: 43, step: 1282, loss: 0.3325927257537842, mean loss: 0.343169113620503
Epoch: 43, step: 1283, loss: 0.34308212995529175, mean loss: 0.34316911224800134
Epoch: 43, step: 1284, loss: 0.32502320408821106, mean loss: 0.34316882593106995
Epoch: 43, step: 1285, loss: 0.33210399746894836, mean loss: 0.3431686513463803
Epoch: 43, step: 1286, loss: 0.316276878118515, mean loss: 0.34316822704537797
Epoch: 43, step: 1287, loss: 0.29611364006996155, mean loss: 0.3431674846252616
Epoch: 43, step: 1288, loss: 0.34986138343811035, mean loss: 0.3431675902389126
Epoch: 43, step: 1289, loss: 0.3257242441177368, mean loss: 0.343167315029135
Epoch: 43, step: 1290, loss: 0.3670247495174408, mean loss: 0.3431676914302913
Epoch: 43, step: 1291, loss: 0.30661740899086, mean loss: 0.3431671147818873
Epoch: 43, step: 1292, loss: 0.3027465045452118, mean loss: 0.3431664770819545
Epoch: 43, step: 1293, loss: 0.35646870732307434, mean loss: 0.3431666869426531
Epoch: 43, step: 1294, loss: 0.28698885440826416, mean loss: 0.3431658006752397
Epoch: 43, step: 1295, loss: 0.36425673961639404, mean loss: 0.3431661334028686
Epoch: 43, step: 1296, loss: 0.3845420479774475, mean loss: 0.34316678613306745
Epoch: 43, step: 1297, loss: 0.33022770285606384, mean loss: 0.34316658201438505
Epoch: 43, step: 1298, loss: 0.3232058584690094, mean loss: 0.34316626713177484
Epoch: 43, step: 1299, loss: 0.3284991383552551, mean loss: 0.34316603575985444
Epoch: 43, step: 1300, loss: 0.302102267742157, mean loss: 0.34316538799483276
Epoch: 43, step: 1301, loss: 0.3153776228427887, mean loss: 0.3431649496605243
Epoch: 43, step: 1302, loss: 0.3495062589645386, mean loss: 0.34316504968906447
Epoch: 43, step: 1303, loss: 0.33071181178092957, mean loss: 0.3431648532533602
Epoch: 43, step: 1304, loss: 0.30124446749687195, mean loss: 0.3431641920172488
Epoch: 43, step: 1305, loss: 0.3812696039676666, mean loss: 0.3431647930679436
Epoch: 43, step: 1306, loss: 0.32206296920776367, mean loss: 0.3431644602263553
Epoch: 43, step: 1307, loss: 0.3412379324436188, mean loss: 0.34316442983948175
Epoch: 43, step: 1308, loss: 0.3581409454345703, mean loss: 0.34316466605839935
Epoch: 43, step: 1309, loss: 0.32996758818626404, mean loss: 0.34316445790916317
Epoch: 43, step: 1310, loss: 0.32790762186050415, mean loss: 0.34316421727644786
Epoch: 43, step: 1311, loss: 0.31843987107276917, mean loss: 0.34316382732713546
Epoch: 43, step: 1312, loss: 0.3141389787197113, mean loss: 0.34316336955805404
Epoch: 43, step: 1313, loss: 0.31542250514030457, mean loss: 0.3431629320463924
Epoch: 43, step: 1314, loss: 0.3260030746459961, mean loss: 0.3431626614160614
Epoch: 43, step: 1315, loss: 0.33145612478256226, mean loss: 0.34316247679366935
Epoch: 43, step: 1316, loss: 0.3436632454395294, mean loss: 0.34316248469110733
Epoch: 43, step: 1317, loss: 0.32375168800354004, mean loss: 0.34316217857540493
Epoch: 43, step: 1318, loss: 0.3320225775241852, mean loss: 0.34316200290239784
Epoch: 43, step: 1319, loss: 0.3951141834259033, mean loss: 0.3431628221823531
Epoch: 43, step: 1320, loss: 0.3823888301849365, mean loss: 0.3431634407622658
Epoch: 43, step: 1321, loss: 0.34759989380836487, mean loss: 0.3431635107224173
Epoch: 43, step: 1322, loss: 0.3293532133102417, mean loss: 0.3431632929459068
Epoch: 43, step: 1323, loss: 0.309865802526474, mean loss: 0.34316276788140543
Epoch: 43, step: 1324, loss: 0.39176642894744873, mean loss: 0.3431635342951599
Epoch: 43, step: 1325, loss: 0.3224566876888275, mean loss: 0.3431632077814476
Epoch: 43, step: 1326, loss: 0.3636780381202698, mean loss: 0.343163531262271
Epoch: 43, step: 1327, loss: 0.33751121163368225, mean loss: 0.3431634421370798
Epoch: 43, step: 1328, loss: 0.30766624212265015, mean loss: 0.3431628824297271
Epoch: 43, step: 1329, loss: 0.32472681999206543, mean loss: 0.34316259174096864
Epoch: 43, step: 1330, loss: 0.321663498878479, mean loss: 0.3431622527615312
Epoch: 43, step: 1331, loss: 0.33054226636886597, mean loss: 0.343162053783441
Epoch: 43, step: 1332, loss: 0.34472039341926575, mean loss: 0.34316207835324214
Epoch: 43, step: 1333, loss: 0.33832263946533203, mean loss: 0.34316200205268893
Epoch: 43, step: 1334, loss: 0.334408700466156, mean loss: 0.34316186404676735
Epoch: 43, step: 1335, loss: 0.3080931603908539, mean loss: 0.3431613111568188
Epoch: 43, step: 1336, loss: 0.3594522774219513, mean loss: 0.34316156799464165
Epoch: 43, step: 1337, loss: 0.2871433198451996, mean loss: 0.3431606848439535
Epoch: 43, step: 1338, loss: 0.33142635226249695, mean loss: 0.34316049985029773
Epoch: 43, step: 1339, loss: 0.326469361782074, mean loss: 0.3431602367159481
Epoch: 43, step: 1340, loss: 0.3000061810016632, mean loss: 0.3431595564067129
Epoch: 43, step: 1341, loss: 0.2889149785041809, mean loss: 0.3431587012725908
Epoch: 43, step: 1342, loss: 0.3522428274154663, mean loss: 0.34315884447628187
Epoch: 43, step: 1343, loss: 0.3428986668586731, mean loss: 0.34315884037486283
Epoch: 43, step: 1344, loss: 0.3353469967842102, mean loss: 0.34315871723153024
Epoch: 43, step: 1345, loss: 0.3066248297691345, mean loss: 0.3431581413324246
Epoch: 43, step: 1346, loss: 0.35873258113861084, mean loss: 0.34315838683503036
Epoch: 43, step: 1347, loss: 0.32520148158073425, mean loss: 0.34315810378166883
Epoch: 43, step: 1348, loss: 0.386582612991333, mean loss: 0.3431587882681872
Epoch: 43, step: 1349, loss: 0.32150375843048096, mean loss: 0.3431584469323239
Epoch: 43, step: 1350, loss: 0.34357380867004395, mean loss: 0.34315845347933044
Epoch: 43, step: 1351, loss: 0.3192876875400543, mean loss: 0.3431580772299461
Epoch: 43, step: 1352, loss: 0.3536633551120758, mean loss: 0.3431582428108096
Epoch: 43, step: 1353, loss: 0.3483065962791443, mean loss: 0.34315832395624773
Epoch: 43, step: 1354, loss: 0.367397665977478, mean loss: 0.343158705997038
Epoch: 43, step: 1355, loss: 0.33123037219047546, mean loss: 0.3431585179953074
Epoch: 43, step: 1356, loss: 0.2954392433166504, mean loss: 0.34315776590662705
Epoch: 43, step: 1357, loss: 0.3196844756603241, mean loss: 0.3431573959572142
Epoch: 43, step: 1358, loss: 0.3227784037590027, mean loss: 0.34315707478036594
Epoch: 43, step: 1359, loss: 0.3410739302635193, mean loss: 0.3431570419501239
Epoch: 43, step: 1360, loss: 0.367145299911499, mean loss: 0.34315741999778065
Epoch: 43, step: 1361, loss: 0.32176563143730164, mean loss: 0.34315708287500574
Epoch: 43, step: 1362, loss: 0.32230710983276367, mean loss: 0.3431567542961224
Epoch: 43, step: 1363, loss: 0.3174830675125122, mean loss: 0.34315634970574826
Epoch: 43, step: 1364, loss: 0.32304441928863525, mean loss: 0.3431560327678152
Epoch: 43, step: 1365, loss: 0.3412982225418091, mean loss: 0.34315600349159747
Epoch: 43, step: 1366, loss: 0.3622181713581085, mean loss: 0.34315630387716717
Epoch: 43, step: 1367, loss: 0.3532412052154541, mean loss: 0.34315646279461653
Epoch: 43, step: 1368, loss: 0.3698565363883972, mean loss: 0.3431568835266188
Epoch: 43, step: 1369, loss: 0.32060688734054565, mean loss: 0.34315652819592973
Epoch: 43, step: 1370, loss: 0.3288581967353821, mean loss: 0.3431563028940773
Epoch: 43, step: 1371, loss: 0.29945313930511475, mean loss: 0.3431556142648767
Epoch: 43, step: 1372, loss: 0.3619990646839142, mean loss: 0.34315591117577904
Epoch: 43, step: 1373, loss: 0.3878459632396698, mean loss: 0.34315661533315567
Epoch: 43, step: 1374, loss: 0.30791381001472473, mean loss: 0.34315606003976984
Epoch: 43, step: 1375, loss: 0.3123514652252197, mean loss: 0.3431555746834515
Epoch: 43, step: 1376, loss: 0.3191734552383423, mean loss: 0.34315519682781415
Epoch: 43, step: 1377, loss: 0.32501721382141113, mean loss: 0.34315491105527585
Epoch: 43, step: 1378, loss: 0.31776267290115356, mean loss: 0.3431545109948049
Epoch: 43, step: 1379, loss: 0.380830854177475, mean loss: 0.34315510458478443
Epoch: 43, step: 1380, loss: 0.32514092326164246, mean loss: 0.34315482077621506
Epoch: 43, step: 1381, loss: 0.3233223855495453, mean loss: 0.34315450832646827
Epoch: 43, step: 1382, loss: 0.3273848593235016, mean loss: 0.3431542598877286
Epoch: 43, step: 1383, loss: 0.32273831963539124, mean loss: 0.3431539382552966
Epoch: 43, step: 1384, loss: 0.31698334217071533, mean loss: 0.34315352597059373
Epoch: 43, step: 1385, loss: 0.323402464389801, mean loss: 0.34315321482245453
Epoch: 43, step: 1386, loss: 0.3283299207687378, mean loss: 0.34315298130752747
Epoch: 43, step: 1387, loss: 0.3160169720649719, mean loss: 0.343152553834162
Epoch: 43, step: 1388, loss: 0.3260229229927063, mean loss: 0.34315228399545683
Epoch: 43, step: 1389, loss: 0.3263111412525177, mean loss: 0.3431520187054102
Epoch: 43, step: 1390, loss: 0.30420970916748047, mean loss: 0.343151405276468
Epoch: 43, step: 1391, loss: 0.3097139894962311, mean loss: 0.34315087857027776
Epoch: 43, step: 1392, loss: 0.30287662148475647, mean loss: 0.3431502441801528
Epoch: 43, step: 1393, loss: 0.36353397369384766, mean loss: 0.34315056525455523
Epoch: 43, step: 1394, loss: 0.3729456961154938, mean loss: 0.34315103456529383
Epoch: 43, step: 1395, loss: 0.3336549401283264, mean loss: 0.3431508849922338
Epoch: 43, step: 1396, loss: 0.3188919126987457, mean loss: 0.34315050289498394
Epoch: 43, step: 1397, loss: 0.33653879165649414, mean loss: 0.3431503987571475
Epoch: 43, step: 1398, loss: 0.2945542633533478, mean loss: 0.3431496333551944
Epoch: 43, step: 1399, loss: 0.3326402008533478, mean loss: 0.34314946783146694
Epoch: 43, step: 1400, loss: 0.3450623154640198, mean loss: 0.3431494979583728
Epoch: 43, step: 1401, loss: 0.3738548755645752, mean loss: 0.34314998155332044
Epoch: 43, step: 1402, loss: 0.3202923536300659, mean loss: 0.34314962156233025
Epoch: 43, step: 1403, loss: 0.30651119351387024, mean loss: 0.3431490445428637
Epoch: 43, step: 1404, loss: 0.3384099304676056, mean loss: 0.3431489699076199
Epoch: 43, step: 1405, loss: 0.3348747193813324, mean loss: 0.34314883960035786
Epoch: 43, step: 1406, loss: 0.33299195766448975, mean loss: 0.3431486796469423
Epoch: 43, step: 1407, loss: 0.32471567392349243, mean loss: 0.3431483893633876
Epoch: 43, step: 1408, loss: 0.3231145739555359, mean loss: 0.3431480738751999
Epoch: 43, step: 1409, loss: 0.32958969473838806, mean loss: 0.34314786036414296
Epoch: 43, step: 1410, loss: 0.33132293820381165, mean loss: 0.3431476741536937
Epoch: 43, step: 1411, loss: 0.2889978885650635, mean loss: 0.343146821454878
Epoch: 43, step: 1412, loss: 0.32843017578125, mean loss: 0.3431465897149257
Epoch: 43, step: 1413, loss: 0.3718631863594055, mean loss: 0.34314704190206774
Epoch: 43, step: 1414, loss: 0.30533263087272644, mean loss: 0.34314644646517056
Epoch: 43, step: 1415, loss: 0.33795785903930664, mean loss: 0.34314636476542526
Epoch: 43, step: 1416, loss: 0.3440730571746826, mean loss: 0.3431463793569384
Epoch: 43, step: 1417, loss: 0.3460729718208313, mean loss: 0.3431464254377519
Epoch: 43, step: 1418, loss: 0.32033786177635193, mean loss: 0.3431460663099841
Epoch: 43, step: 1419, loss: 0.32892003655433655, mean loss: 0.3431458423203482
Epoch: 43, step: 1420, loss: 0.316439151763916, mean loss: 0.3431454218286291
Epoch: 43, step: 1421, loss: 0.35099294781684875, mean loss: 0.3431455453844749
Epoch: 43, step: 1422, loss: 0.2967583239078522, mean loss: 0.3431448150495701
Epoch: 43, step: 1423, loss: 0.3046517074108124, mean loss: 0.34314420901160114
Epoch: 43, step: 1424, loss: 0.309647798538208, mean loss: 0.3431436816502574
Epoch: 43, step: 1425, loss: 0.36351004242897034, mean loss: 0.3431440022894585
Epoch: 43, step: 1426, loss: 0.3471171259880066, mean loss: 0.34314406483961984
Epoch: 43, step: 1427, loss: 0.32264092564582825, mean loss: 0.34314374205720183
Epoch: 43, step: 1428, loss: 0.34989216923713684, mean loss: 0.34314384829651134
Epoch: 43, step: 1429, loss: 0.2954734265804291, mean loss: 0.343143097841209
Epoch: 43, step: 1430, loss: 0.32934364676475525, mean loss: 0.3431428806057025
Epoch: 43, step: 1431, loss: 0.3137328624725342, mean loss: 0.3431424176307933
Epoch: 43, step: 1432, loss: 0.3001210391521454, mean loss: 0.34314174039539813
Epoch: 43, step: 1433, loss: 0.3152872622013092, mean loss: 0.34314130192173076
Epoch: 43, step: 1434, loss: 0.35504937171936035, mean loss: 0.3431414893706863
Epoch: 43, step: 1435, loss: 0.3548431992530823, mean loss: 0.34314167356836106
Epoch: 43, step: 1436, loss: 0.3320457339286804, mean loss: 0.3431414989089199
Epoch: 43, step: 1437, loss: 0.33072879910469055, mean loss: 0.3431413035256395
Epoch: 43, step: 1438, loss: 0.35480982065200806, mean loss: 0.34314148719215076
Epoch: 43, step: 1439, loss: 0.3122377097606659, mean loss: 0.34314100076361975
Epoch: 43, step: 1440, loss: 0.33773714303970337, mean loss: 0.3431409157077004
Epoch: 43, step: 1441, loss: 0.31745630502700806, mean loss: 0.3431405114420996
Epoch: 43, step: 1442, loss: 0.30969053506851196, mean loss: 0.34313998496100456
Epoch: 43, step: 1443, loss: 0.3640907108783722, mean loss: 0.3431403147067537
Valid: 43, mean loss: 0.18558472146590552
Epoch: 44, step: 0, loss: 0.3534313440322876, mean loss: 0.343140476675832
Epoch: 44, step: 1, loss: 0.3607345521450043, mean loss: 0.3431407535821789
Epoch: 44, step: 2, loss: 0.343656450510025, mean loss: 0.34314076169840557
Epoch: 44, step: 3, loss: 0.31306788325309753, mean loss: 0.3431402884079044
Epoch: 44, step: 4, loss: 0.32849282026290894, mean loss: 0.3431400578879544
Epoch: 44, step: 5, loss: 0.31729912757873535, mean loss: 0.34313965121315176
Epoch: 44, step: 6, loss: 0.31486228108406067, mean loss: 0.3431392062015828
Epoch: 44, step: 7, loss: 0.3602408170700073, mean loss: 0.34313947533180544
Epoch: 44, step: 8, loss: 0.32835209369659424, mean loss: 0.34313924262456436
Epoch: 44, step: 9, loss: 0.320865273475647, mean loss: 0.3431388921073147
Epoch: 44, step: 10, loss: 0.35872745513916016, mean loss: 0.34313913741493
Epoch: 44, step: 11, loss: 0.354487806558609, mean loss: 0.34313931599913633
Epoch: 44, step: 12, loss: 0.3443182110786438, mean loss: 0.34313933455009826
Epoch: 44, step: 13, loss: 0.357467383146286, mean loss: 0.34313956001113044
Epoch: 44, step: 14, loss: 0.2866259515285492, mean loss: 0.343138670747256
Epoch: 44, step: 15, loss: 0.332848459482193, mean loss: 0.34313850882927915
Epoch: 44, step: 16, loss: 0.30332452058792114, mean loss: 0.343137882360218
Epoch: 44, step: 17, loss: 0.33543917536735535, mean loss: 0.3431377612237515
Epoch: 44, step: 18, loss: 0.318610280752182, mean loss: 0.3431373752984825
Epoch: 44, step: 19, loss: 0.31564414501190186, mean loss: 0.3431369427157163
Epoch: 44, step: 20, loss: 0.31111598014831543, mean loss: 0.34313643890083256
Epoch: 44, step: 21, loss: 0.36697298288345337, mean loss: 0.3431368139369253
Epoch: 44, step: 22, loss: 0.3299049139022827, mean loss: 0.34313660575397664
Epoch: 44, step: 23, loss: 0.3373335003852844, mean loss: 0.3431365144527594
Epoch: 44, step: 24, loss: 0.3951294422149658, mean loss: 0.34313733245322764
Epoch: 44, step: 25, loss: 0.32542160153388977, mean loss: 0.34313705373747105
Epoch: 44, step: 26, loss: 0.32804831862449646, mean loss: 0.34313681635510845
Epoch: 44, step: 27, loss: 0.3484381139278412, mean loss: 0.34313689975605194
Epoch: 44, step: 28, loss: 0.33398380875587463, mean loss: 0.34313675576028385
Epoch: 44, step: 29, loss: 0.3389461040496826, mean loss: 0.34313668983429024
Epoch: 44, step: 30, loss: 0.34789130091667175, mean loss: 0.3431367646311358
Epoch: 44, step: 31, loss: 0.3338311016559601, mean loss: 0.3431366182420253
Epoch: 44, step: 32, loss: 0.3274921178817749, mean loss: 0.34313637213935955
Epoch: 44, step: 33, loss: 0.35359644889831543, mean loss: 0.34313653668359045
Epoch: 44, step: 34, loss: 0.31681492924690247, mean loss: 0.34313612263304166
Epoch: 44, step: 35, loss: 0.37834861874580383, mean loss: 0.343136676532496
Epoch: 44, step: 36, loss: 0.34403860569000244, mean loss: 0.34313669071979497
Epoch: 44, step: 37, loss: 0.3527003526687622, mean loss: 0.3431368411533362
Epoch: 44, step: 38, loss: 0.3060379922389984, mean loss: 0.34313625760872096
Epoch: 44, step: 39, loss: 0.3503020405769348, mean loss: 0.34313637032079736
Epoch: 44, step: 40, loss: 0.32080158591270447, mean loss: 0.34313601901789836
Epoch: 44, step: 41, loss: 0.37241360545158386, mean loss: 0.3431364795165997
Epoch: 44, step: 42, loss: 0.3181353211402893, mean loss: 0.3431360862867852
Epoch: 44, step: 43, loss: 0.3156966269016266, mean loss: 0.34313565471302954
Epoch: 44, step: 44, loss: 0.3553125858306885, mean loss: 0.34313584623142523
Epoch: 44, step: 45, loss: 0.34317079186439514, mean loss: 0.3431358467810404
Epoch: 44, step: 46, loss: 0.36308690905570984, mean loss: 0.3431361605608601
Epoch: 44, step: 47, loss: 0.3147667944431305, mean loss: 0.34313571438940005
Epoch: 44, step: 48, loss: 0.34213733673095703, mean loss: 0.3431356986879349
Epoch: 44, step: 49, loss: 0.36264216899871826, mean loss: 0.3431360054609716
Epoch: 44, step: 50, loss: 0.3644963204860687, mean loss: 0.3431363413836449
Epoch: 44, step: 51, loss: 0.3558023273944855, mean loss: 0.34313654057195103
Epoch: 44, step: 52, loss: 0.3562556207180023, mean loss: 0.34313674688247875
Epoch: 44, step: 53, loss: 0.42422226071357727, mean loss: 0.34313802201243365
Epoch: 44, step: 54, loss: 0.309377521276474, mean loss: 0.34313749111182296
Epoch: 44, step: 55, loss: 0.35239627957344055, mean loss: 0.34313763670857195
Epoch: 44, step: 56, loss: 0.31250593066215515, mean loss: 0.34313715502495823
Epoch: 44, step: 57, loss: 0.36279061436653137, mean loss: 0.3431374640707698
Epoch: 44, step: 58, loss: 0.38668784499168396, mean loss: 0.3431381488790239
Epoch: 44, step: 59, loss: 0.27970725297927856, mean loss: 0.3431371514751636
Epoch: 44, step: 60, loss: 0.3267289102077484, mean loss: 0.3431368934717787
Epoch: 44, step: 61, loss: 0.35532405972480774, mean loss: 0.34313708509991564
Epoch: 44, step: 62, loss: 0.36291083693504333, mean loss: 0.3431373960128519
Epoch: 44, step: 63, loss: 0.35405322909355164, mean loss: 0.34313756764544756
Epoch: 44, step: 64, loss: 0.30806297063827515, mean loss: 0.3431370161667443
Epoch: 44, step: 65, loss: 0.3425910472869873, mean loss: 0.3431370075825979
Epoch: 44, step: 66, loss: 0.3769959509372711, mean loss: 0.3431375399308103
Epoch: 44, step: 67, loss: 0.3623362183570862, mean loss: 0.34313784177783924
Epoch: 44, step: 68, loss: 0.3645665645599365, mean loss: 0.34313817868095664
Epoch: 44, step: 69, loss: 0.2914056181907654, mean loss: 0.34313736535264655
Epoch: 44, step: 70, loss: 0.33164671063423157, mean loss: 0.34313718470185783
Epoch: 44, step: 71, loss: 0.3732636868953705, mean loss: 0.34313765832942345
Epoch: 44, step: 72, loss: 0.3219880163669586, mean loss: 0.3431373258349343
Epoch: 44, step: 73, loss: 0.31087636947631836, mean loss: 0.3431368186669362
Epoch: 44, step: 74, loss: 0.3120616376399994, mean loss: 0.3431363301479532
Epoch: 44, step: 75, loss: 0.3197823464870453, mean loss: 0.3431359630162224
Epoch: 44, step: 76, loss: 0.3011428117752075, mean loss: 0.343135302881482
Epoch: 44, step: 77, loss: 0.29959815740585327, mean loss: 0.3431346184858226
Epoch: 44, step: 78, loss: 0.3334044814109802, mean loss: 0.3431344655323199
Epoch: 44, step: 79, loss: 0.32048383355140686, mean loss: 0.34313410947988054
Epoch: 44, step: 80, loss: 0.3386954963207245, mean loss: 0.3431340397090149
Epoch: 44, step: 81, loss: 0.3114076554775238, mean loss: 0.34313354100763743
Epoch: 44, step: 82, loss: 0.3562818169593811, mean loss: 0.3431337476797944
Epoch: 44, step: 83, loss: 0.33761924505233765, mean loss: 0.3431336610010357
Epoch: 44, step: 84, loss: 0.29198911786079407, mean loss: 0.3431328571069891
Epoch: 44, step: 85, loss: 0.32405614852905273, mean loss: 0.34313255726246084
Epoch: 44, step: 86, loss: 0.3580273389816284, mean loss: 0.34313279137247954
Epoch: 44, step: 87, loss: 0.35434848070144653, mean loss: 0.343132967653275
Epoch: 44, step: 88, loss: 0.29975053668022156, mean loss: 0.3431322858076016
Epoch: 44, step: 89, loss: 0.3356627821922302, mean loss: 0.34313216841056865
Epoch: 44, step: 90, loss: 0.3175338804721832, mean loss: 0.34313176609255996
Epoch: 44, step: 91, loss: 0.31445232033729553, mean loss: 0.34313131535631564
Epoch: 44, step: 92, loss: 0.3488108515739441, mean loss: 0.34313140461649916
Epoch: 44, step: 93, loss: 0.35291576385498047, mean loss: 0.3431315583860927
Epoch: 44, step: 94, loss: 0.32633674144744873, mean loss: 0.3431312944452944
Epoch: 44, step: 95, loss: 0.32360705733299255, mean loss: 0.34313098761481425
Epoch: 44, step: 96, loss: 0.3751946985721588, mean loss: 0.34313149149976324
Epoch: 44, step: 97, loss: 0.40132027864456177, mean loss: 0.34313240592895433
Epoch: 44, step: 98, loss: 0.30032840371131897, mean loss: 0.34313173328021984
Epoch: 44, step: 99, loss: 0.3086603283882141, mean loss: 0.343131191583619
Epoch: 44, step: 100, loss: 0.3242378532886505, mean loss: 0.34313089469127184
Epoch: 44, step: 101, loss: 0.34415140748023987, mean loss: 0.343130910727489
Epoch: 44, step: 102, loss: 0.34276044368743896, mean loss: 0.34313090490610526
Epoch: 44, step: 103, loss: 0.3735554814338684, mean loss: 0.3431313829792751
Epoch: 44, step: 104, loss: 0.3186195194721222, mean loss: 0.3431309978209101
Epoch: 44, step: 105, loss: 0.2984693646430969, mean loss: 0.3431302960574021
Epoch: 44, step: 106, loss: 0.435756653547287, mean loss: 0.3431317514626704
Epoch: 44, step: 107, loss: 0.3306328058242798, mean loss: 0.3431315550742341
Epoch: 44, step: 108, loss: 0.33545365929603577, mean loss: 0.34313143443795824
Epoch: 44, step: 109, loss: 0.33995428681373596, mean loss: 0.3431313845189119
Epoch: 44, step: 110, loss: 0.37442588806152344, mean loss: 0.34313187620749963
Epoch: 44, step: 111, loss: 0.33440732955932617, mean loss: 0.343131739132546
Epoch: 44, step: 112, loss: 0.35677865147590637, mean loss: 0.3431319535414502
Epoch: 44, step: 113, loss: 0.29884210228919983, mean loss: 0.3431312577071807
Epoch: 44, step: 114, loss: 0.32587844133377075, mean loss: 0.3431309866538371
Epoch: 44, step: 115, loss: 0.32834091782569885, mean loss: 0.34313075429556356
Epoch: 44, step: 116, loss: 0.35957175493240356, mean loss: 0.3431310125866203
Epoch: 44, step: 117, loss: 0.33748525381088257, mean loss: 0.3431309238921349
Epoch: 44, step: 118, loss: 0.3147650361061096, mean loss: 0.34313047827297244
Epoch: 44, step: 119, loss: 0.35181552171707153, mean loss: 0.34313061471012596
Epoch: 44, step: 120, loss: 0.33693447709083557, mean loss: 0.34313051737381384
Epoch: 44, step: 121, loss: 0.3065865933895111, mean loss: 0.3431299433073338
Epoch: 44, step: 122, loss: 0.30868837237358093, mean loss: 0.34312940227510064
Epoch: 44, step: 123, loss: 0.3213530480861664, mean loss: 0.3431290602023047
Epoch: 44, step: 124, loss: 0.308171808719635, mean loss: 0.3431285110866533
Epoch: 44, step: 125, loss: 0.32969456911087036, mean loss: 0.3431283000668617
Epoch: 44, step: 126, loss: 0.3372029662132263, mean loss: 0.34312820699343044
Epoch: 44, step: 127, loss: 0.3117683231830597, mean loss: 0.3431277144091786
Epoch: 44, step: 128, loss: 0.31228092312812805, mean loss: 0.3431272298919198
Epoch: 44, step: 129, loss: 0.30582836270332336, mean loss: 0.3431266440397037
Epoch: 44, step: 130, loss: 0.34259873628616333, mean loss: 0.34312663574800234
Epoch: 44, step: 131, loss: 0.33542588353157043, mean loss: 0.34312651479631207
Epoch: 44, step: 132, loss: 0.31982195377349854, mean loss: 0.34312614876950115
Epoch: 44, step: 133, loss: 0.37868568301200867, mean loss: 0.3431267072669763
Epoch: 44, step: 134, loss: 0.3160267472267151, mean loss: 0.3431262816421229
Epoch: 44, step: 135, loss: 0.3204919695854187, mean loss: 0.3431259261591468
Epoch: 44, step: 136, loss: 0.3376561999320984, mean loss: 0.34312584025576187
Epoch: 44, step: 137, loss: 0.3262586295604706, mean loss: 0.3431255753562629
Epoch: 44, step: 138, loss: 0.3286016285419464, mean loss: 0.34312534726129923
Epoch: 44, step: 139, loss: 0.31418517231941223, mean loss: 0.3431248927702046
Epoch: 44, step: 140, loss: 0.33967325091362, mean loss: 0.3431248385647323
Epoch: 44, step: 141, loss: 0.32998427748680115, mean loss: 0.34312463220521916
Epoch: 44, step: 142, loss: 0.36319199204444885, mean loss: 0.34312494733830606
Epoch: 44, step: 143, loss: 0.337678998708725, mean loss: 0.343124861817756
Epoch: 44, step: 144, loss: 0.3674159348011017, mean loss: 0.3431252432670577
Epoch: 44, step: 145, loss: 0.31107258796691895, mean loss: 0.34312473994342935
Epoch: 44, step: 146, loss: 0.322298139333725, mean loss: 0.3431244129079472
Epoch: 44, step: 147, loss: 0.3040764331817627, mean loss: 0.3431237997558254
Epoch: 44, step: 148, loss: 0.32323116064071655, mean loss: 0.34312348739594295
Epoch: 44, step: 149, loss: 0.3331136703491211, mean loss: 0.34312333022141406
Epoch: 44, step: 150, loss: 0.35327377915382385, mean loss: 0.34312348960164757
Epoch: 44, step: 151, loss: 0.33882901072502136, mean loss: 0.3431234221716941
Epoch: 44, step: 152, loss: 0.31599631905555725, mean loss: 0.3431229962409507
Epoch: 44, step: 153, loss: 0.2977572977542877, mean loss: 0.3431222839517611
Epoch: 44, step: 154, loss: 0.2892897427082062, mean loss: 0.34312143873750406
Epoch: 44, step: 155, loss: 0.3396967649459839, mean loss: 0.3431213849682113
Epoch: 44, step: 156, loss: 0.3425770699977875, mean loss: 0.34312137642229623
Epoch: 44, step: 157, loss: 0.32553014159202576, mean loss: 0.3431211002387494
Epoch: 44, step: 158, loss: 0.32813000679016113, mean loss: 0.3431208648812889
Epoch: 44, step: 159, loss: 0.3461301326751709, mean loss: 0.3431209121255082
Epoch: 44, step: 160, loss: 0.32825273275375366, mean loss: 0.3431206787051058
Epoch: 44, step: 161, loss: 0.3525509834289551, mean loss: 0.34312082675221445
Epoch: 44, step: 162, loss: 0.29656052589416504, mean loss: 0.3431200958098
Epoch: 44, step: 163, loss: 0.3452586531639099, mean loss: 0.343120129382129
Epoch: 44, step: 164, loss: 0.33447906374931335, mean loss: 0.3431199937317368
Epoch: 44, step: 165, loss: 0.3045981526374817, mean loss: 0.34311938901224454
Epoch: 44, step: 166, loss: 0.3301577568054199, mean loss: 0.3431191855425146
Epoch: 44, step: 167, loss: 0.3503194749355316, mean loss: 0.3431192985697875
Epoch: 44, step: 168, loss: 0.35083580017089844, mean loss: 0.34311941969845244
Epoch: 44, step: 169, loss: 0.3661029040813446, mean loss: 0.34311978047270264
Epoch: 44, step: 170, loss: 0.3606311082839966, mean loss: 0.3431200553456022
Epoch: 44, step: 171, loss: 0.2977295219898224, mean loss: 0.34311934286783874
Epoch: 44, step: 172, loss: 0.33509886264801025, mean loss: 0.3431192169754182
Epoch: 44, step: 173, loss: 0.35516732931137085, mean loss: 0.34311940608407204
Epoch: 44, step: 174, loss: 0.31601595878601074, mean loss: 0.34311898067170526
Epoch: 44, step: 175, loss: 0.3473142683506012, mean loss: 0.34311904651938985
Epoch: 44, step: 176, loss: 0.34078308939933777, mean loss: 0.34311900985564586
Epoch: 44, step: 177, loss: 0.3089905381202698, mean loss: 0.3431184742045843
Epoch: 44, step: 178, loss: 0.32297205924987793, mean loss: 0.34311815800879125
Epoch: 44, step: 179, loss: 0.33285242319107056, mean loss: 0.3431179968917278
Epoch: 44, step: 180, loss: 0.2924765348434448, mean loss: 0.3431172021044332
Epoch: 44, step: 181, loss: 0.2948820888996124, mean loss: 0.3431164450952175
Epoch: 44, step: 182, loss: 0.3257450759410858, mean loss: 0.3431161724705819
Epoch: 44, step: 183, loss: 0.3375591039657593, mean loss: 0.3431160852598395
Epoch: 44, step: 184, loss: 0.32910221815109253, mean loss: 0.34311586533442856
Epoch: 44, step: 185, loss: 0.3046402931213379, mean loss: 0.3431152615308409
Epoch: 44, step: 186, loss: 0.36094290018081665, mean loss: 0.3431155412985645
Epoch: 44, step: 187, loss: 0.3112049698829651, mean loss: 0.34311504053634906
Epoch: 44, step: 188, loss: 0.346723347902298, mean loss: 0.34311509715945404
Epoch: 44, step: 189, loss: 0.28097429871559143, mean loss: 0.34311412203472563
Epoch: 44, step: 190, loss: 0.3516307473182678, mean loss: 0.3431142556770638
Epoch: 44, step: 191, loss: 0.30798810720443726, mean loss: 0.34311370448844225
Epoch: 44, step: 192, loss: 0.325900673866272, mean loss: 0.34311343439114556
Epoch: 44, step: 193, loss: 0.3511812090873718, mean loss: 0.3431135609841896
Epoch: 44, step: 194, loss: 0.3103314936161041, mean loss: 0.3431130466023759
Epoch: 44, step: 195, loss: 0.30678918957710266, mean loss: 0.3431124766554572
Epoch: 44, step: 196, loss: 0.315638929605484, mean loss: 0.3431120455829037
Epoch: 44, step: 197, loss: 0.31614866852760315, mean loss: 0.34311162252178945
Epoch: 44, step: 198, loss: 0.32466384768486023, mean loss: 0.34311133307682457
Epoch: 44, step: 199, loss: 0.2973327040672302, mean loss: 0.3431106148229491
Epoch: 44, step: 200, loss: 0.3149731755256653, mean loss: 0.3431101733613287
Epoch: 44, step: 201, loss: 0.3427947759628296, mean loss: 0.3431101684129871
Epoch: 44, step: 202, loss: 0.31681281328201294, mean loss: 0.34310975583426556
Epoch: 44, step: 203, loss: 0.33360418677330017, mean loss: 0.3431096067039069
Epoch: 44, step: 204, loss: 0.2982838749885559, mean loss: 0.343108903455892
Epoch: 44, step: 205, loss: 0.3793049454689026, mean loss: 0.3431094713082031
Epoch: 44, step: 206, loss: 0.31287407875061035, mean loss: 0.3431089969754519
Epoch: 44, step: 207, loss: 0.3449415862560272, mean loss: 0.34310902572465624
Epoch: 44, step: 208, loss: 0.29799026250839233, mean loss: 0.3431083179238371
Epoch: 44, step: 209, loss: 0.33616137504577637, mean loss: 0.34310820894534627
Epoch: 44, step: 210, loss: 0.3506280183792114, mean loss: 0.34310832690869253
Epoch: 44, step: 211, loss: 0.3288487195968628, mean loss: 0.3431081032215602
Epoch: 44, step: 212, loss: 0.3512028455734253, mean loss: 0.34310823019990266
Epoch: 44, step: 213, loss: 0.34265244007110596, mean loss: 0.34310822305025357
Epoch: 44, step: 214, loss: 0.3341166377067566, mean loss: 0.34310808200799003
Epoch: 44, step: 215, loss: 0.3248421251773834, mean loss: 0.34310779549216575
Epoch: 44, step: 216, loss: 0.3436102867126465, mean loss: 0.34310780337401003
Epoch: 44, step: 217, loss: 0.33070147037506104, mean loss: 0.34310760877707497
Epoch: 44, step: 218, loss: 0.39505353569984436, mean loss: 0.3431084235512405
Epoch: 44, step: 219, loss: 0.30516523122787476, mean loss: 0.34310782841992227
Epoch: 44, step: 220, loss: 0.30841267108917236, mean loss: 0.3431072842419131
Epoch: 44, step: 221, loss: 0.3357280492782593, mean loss: 0.3431071685037318
Epoch: 44, step: 222, loss: 0.3000730574131012, mean loss: 0.34310649355413897
Epoch: 44, step: 223, loss: 0.34677183628082275, mean loss: 0.34310655104069365
Epoch: 44, step: 224, loss: 0.34563690423965454, mean loss: 0.3431065907256609
Epoch: 44, step: 225, loss: 0.3529888093471527, mean loss: 0.34310674571168115
Epoch: 44, step: 226, loss: 0.3365257680416107, mean loss: 0.34310664250170564
Epoch: 44, step: 227, loss: 0.3504749834537506, mean loss: 0.3431067580581474
Epoch: 44, step: 228, loss: 0.3411671817302704, mean loss: 0.34310672764057776
Epoch: 44, step: 229, loss: 0.3019944131374359, mean loss: 0.34310608290334316
Epoch: 44, step: 230, loss: 0.3087378144264221, mean loss: 0.3431055439369738
Epoch: 44, step: 231, loss: 0.3219006359577179, mean loss: 0.34310521140485767
Epoch: 44, step: 232, loss: 0.31306666135787964, mean loss: 0.34310474035230787
Epoch: 44, step: 233, loss: 0.3142411410808563, mean loss: 0.3431042877319649
Epoch: 44, step: 234, loss: 0.354168564081192, mean loss: 0.343104461232088
Epoch: 44, step: 235, loss: 0.3285974860191345, mean loss: 0.34310423375019605
Epoch: 44, step: 236, loss: 0.3020364046096802, mean loss: 0.3431035897812885
Epoch: 44, step: 237, loss: 0.3783620297908783, mean loss: 0.34310414264671973
Epoch: 44, step: 238, loss: 0.32970136404037476, mean loss: 0.3431039324894699
Epoch: 44, step: 239, loss: 0.3430302143096924, mean loss: 0.34310393133357775
Epoch: 44, step: 240, loss: 0.39107975363731384, mean loss: 0.34310468357689905
Epoch: 44, step: 241, loss: 0.32920563220977783, mean loss: 0.34310446564828156
Epoch: 44, step: 242, loss: 0.3084637224674225, mean loss: 0.34310392251114896
Epoch: 44, step: 243, loss: 0.3645855486392975, mean loss: 0.34310425931933536
Epoch: 44, step: 244, loss: 0.33407020568847656, mean loss: 0.34310411767756693
Epoch: 44, step: 245, loss: 0.31401124596595764, mean loss: 0.3431036615477543
Epoch: 44, step: 246, loss: 0.31270885467529297, mean loss: 0.34310318501314674
Epoch: 44, step: 247, loss: 0.34597542881965637, mean loss: 0.3431032300439351
Epoch: 44, step: 248, loss: 0.33522313833236694, mean loss: 0.34310310650248005
Epoch: 44, step: 249, loss: 0.32532912492752075, mean loss: 0.34310282785228136
Epoch: 44, step: 250, loss: 0.34337422251701355, mean loss: 0.34310283210698317
Epoch: 44, step: 251, loss: 0.3449862003326416, mean loss: 0.3431028616324147
Epoch: 44, step: 252, loss: 0.34321144223213196, mean loss: 0.3431028633345985
Epoch: 44, step: 253, loss: 0.3497210144996643, mean loss: 0.34310296708363697
Epoch: 44, step: 254, loss: 0.3702753186225891, mean loss: 0.3431033930426522
Epoch: 44, step: 255, loss: 0.34726226329803467, mean loss: 0.34310345823688115
Epoch: 44, step: 256, loss: 0.3963821828365326, mean loss: 0.3431042934182427
Epoch: 44, step: 257, loss: 0.2978208065032959, mean loss: 0.3431035835789645
Epoch: 44, step: 258, loss: 0.2960888147354126, mean loss: 0.3431028466126059
Epoch: 44, step: 259, loss: 0.31299594044685364, mean loss: 0.3431023746879372
Epoch: 44, step: 260, loss: 0.3163210153579712, mean loss: 0.3431019548976754
Epoch: 44, step: 261, loss: 0.3256986439228058, mean loss: 0.3431016821099552
Epoch: 44, step: 262, loss: 0.33861392736434937, mean loss: 0.3431016117678692
Epoch: 44, step: 263, loss: 0.34018751978874207, mean loss: 0.3431015660924463
Epoch: 44, step: 264, loss: 0.3651708662509918, mean loss: 0.34310191200082013
Epoch: 44, step: 265, loss: 0.3405489921569824, mean loss: 0.34310187198765685
Epoch: 44, step: 266, loss: 0.30263426899909973, mean loss: 0.34310123772903284
Epoch: 44, step: 267, loss: 0.3929750323295593, mean loss: 0.3431020194009437
Epoch: 44, step: 268, loss: 0.3086627721786499, mean loss: 0.34310147964313126
Epoch: 44, step: 269, loss: 0.3246690630912781, mean loss: 0.3431011907609485
Epoch: 44, step: 270, loss: 0.32240742444992065, mean loss: 0.3431008664428281
Epoch: 44, step: 271, loss: 0.3366268277168274, mean loss: 0.3431007649815893
Epoch: 44, step: 272, loss: 0.4072767496109009, mean loss: 0.34310177073288817
Epoch: 44, step: 273, loss: 0.37506282329559326, mean loss: 0.3431022716113173
Epoch: 44, step: 274, loss: 0.33652299642562866, mean loss: 0.3431021685056586
Epoch: 44, step: 275, loss: 0.35449326038360596, mean loss: 0.34310234701584286
Epoch: 44, step: 276, loss: 0.3074410855770111, mean loss: 0.343101788175772
Epoch: 44, step: 277, loss: 0.3009714186191559, mean loss: 0.34310112797002473
Epoch: 44, step: 278, loss: 0.2923676073551178, mean loss: 0.34310033296069126
Epoch: 44, step: 279, loss: 0.3421954810619354, mean loss: 0.3431003187816155
Epoch: 44, step: 280, loss: 0.2978039085865021, mean loss: 0.343099608995662
Epoch: 44, step: 281, loss: 0.3077017366886139, mean loss: 0.34309905432656695
Epoch: 44, step: 282, loss: 0.3238266706466675, mean loss: 0.3430987523415205
Epoch: 44, step: 283, loss: 0.3868945837020874, mean loss: 0.34309943858143527
Epoch: 44, step: 284, loss: 0.332210510969162, mean loss: 0.34309926796474777
Epoch: 44, step: 285, loss: 0.3367462456226349, mean loss: 0.3430991684219202
Epoch: 44, step: 286, loss: 0.389838308095932, mean loss: 0.34309990074631225
Epoch: 44, step: 287, loss: 0.3454071581363678, mean loss: 0.3430999368966223
Epoch: 44, step: 288, loss: 0.3201301097869873, mean loss: 0.34309957700900606
Epoch: 44, step: 289, loss: 0.29913944005966187, mean loss: 0.34309888825932805
Epoch: 44, step: 290, loss: 0.32425081729888916, mean loss: 0.3430985929599883
Epoch: 44, step: 291, loss: 0.36686456203460693, mean loss: 0.3430989653039294
Epoch: 44, step: 292, loss: 0.30928850173950195, mean loss: 0.34309843560013387
Epoch: 44, step: 293, loss: 0.3259812295436859, mean loss: 0.3430981674314662
Epoch: 44, step: 294, loss: 0.30638813972473145, mean loss: 0.34309759231862597
Epoch: 44, step: 295, loss: 0.326324999332428, mean loss: 0.3430973295571116
Epoch: 44, step: 296, loss: 0.3084010183811188, mean loss: 0.3430967860089284
Epoch: 44, step: 297, loss: 0.32097628712654114, mean loss: 0.343096439477317
Epoch: 44, step: 298, loss: 0.3404160141944885, mean loss: 0.3430963974874167
Epoch: 44, step: 299, loss: 0.3739413619041443, mean loss: 0.343096880678162
Epoch: 44, step: 300, loss: 0.3579370081424713, mean loss: 0.3430971131472233
Epoch: 44, step: 301, loss: 0.4020178020000458, mean loss: 0.3430980361192596
Epoch: 44, step: 302, loss: 0.35356515645980835, mean loss: 0.34309820008047986
Epoch: 44, step: 303, loss: 0.3424427807331085, mean loss: 0.34309818981388607
Epoch: 44, step: 304, loss: 0.3357388377189636, mean loss: 0.3430980745376201
Epoch: 44, step: 305, loss: 0.3207094669342041, mean loss: 0.3430977238498659
Epoch: 44, step: 306, loss: 0.32338207960128784, mean loss: 0.34309741503536395
Epoch: 44, step: 307, loss: 0.32352373003959656, mean loss: 0.3430971084492322
Epoch: 44, step: 308, loss: 0.3575780391693115, mean loss: 0.3430973352630895
Epoch: 44, step: 309, loss: 0.3071998357772827, mean loss: 0.34309677301174274
Epoch: 44, step: 310, loss: 0.3118681013584137, mean loss: 0.3430962838944521
Epoch: 44, step: 311, loss: 0.33704420924186707, mean loss: 0.3430961891056623
Epoch: 44, step: 312, loss: 0.3274565637111664, mean loss: 0.3430959441585935
Epoch: 44, step: 313, loss: 0.32790040969848633, mean loss: 0.34309570617058316
Epoch: 44, step: 314, loss: 0.3373733162879944, mean loss: 0.34309561654959236
Epoch: 44, step: 315, loss: 0.3675289452075958, mean loss: 0.34309599920524386
Epoch: 44, step: 316, loss: 0.31984108686447144, mean loss: 0.34309563501072926
Epoch: 44, step: 317, loss: 0.3332015872001648, mean loss: 0.34309548006275714
Epoch: 44, step: 318, loss: 0.33054319024086, mean loss: 0.34309528348786367
Epoch: 44, step: 319, loss: 0.32987895607948303, mean loss: 0.3430950765170636
Epoch: 44, step: 320, loss: 0.3908033072948456, mean loss: 0.3430958236274944
Epoch: 44, step: 321, loss: 0.33852142095565796, mean loss: 0.3430957519935148
Epoch: 44, step: 322, loss: 0.34937340021133423, mean loss: 0.343095850298346
Epoch: 44, step: 323, loss: 0.32686951756477356, mean loss: 0.34309559620607016
Epoch: 44, step: 324, loss: 0.33769866824150085, mean loss: 0.3430955116955244
Epoch: 44, step: 325, loss: 0.3146331012248993, mean loss: 0.34309506600934997
Epoch: 44, step: 326, loss: 0.3310912251472473, mean loss: 0.3430948780469795
Epoch: 44, step: 327, loss: 0.3279906213283539, mean loss: 0.3430946415403918
Epoch: 44, step: 328, loss: 0.3514634370803833, mean loss: 0.3430947725792322
Epoch: 44, step: 329, loss: 0.30165889859199524, mean loss: 0.34309412378528886
Epoch: 44, step: 330, loss: 0.3226281702518463, mean loss: 0.3430938033388371
Epoch: 44, step: 331, loss: 0.34748321771621704, mean loss: 0.3430938720651848
Epoch: 44, step: 332, loss: 0.3148573637008667, mean loss: 0.34309342996481745
Epoch: 44, step: 333, loss: 0.3685644567012787, mean loss: 0.3430938287596622
Epoch: 44, step: 334, loss: 0.3603059947490692, mean loss: 0.343094098242933
Epoch: 44, step: 335, loss: 0.3292800784111023, mean loss: 0.3430938819663199
Epoch: 44, step: 336, loss: 0.3035769462585449, mean loss: 0.3430932632865067
Epoch: 44, step: 337, loss: 0.3481299877166748, mean loss: 0.34309334214056986
Epoch: 44, step: 338, loss: 0.31588560342788696, mean loss: 0.3430929161877133
Epoch: 44, step: 339, loss: 0.3695976138114929, mean loss: 0.34309333112755963
Epoch: 44, step: 340, loss: 0.37923139333724976, mean loss: 0.34309389687207187
Epoch: 44, step: 341, loss: 0.3519597053527832, mean loss: 0.3430940356649032
Epoch: 44, step: 342, loss: 0.3413037955760956, mean loss: 0.3430940076394161
Epoch: 44, step: 343, loss: 0.31226983666419983, mean loss: 0.3430935251069963
Epoch: 44, step: 344, loss: 0.366157591342926, mean loss: 0.34309388615435366
Epoch: 44, step: 345, loss: 0.3415575921535492, mean loss: 0.34309386210541964
Epoch: 44, step: 346, loss: 0.3054262697696686, mean loss: 0.3430932724713646
Epoch: 44, step: 347, loss: 0.36636924743652344, mean loss: 0.3430936368188533
Epoch: 44, step: 348, loss: 0.33197021484375, mean loss: 0.34309346270251967
Epoch: 44, step: 349, loss: 0.37902799248695374, mean loss: 0.34309402518146315
Epoch: 44, step: 350, loss: 0.357863187789917, mean loss: 0.3430942563577996
Epoch: 44, step: 351, loss: 0.3631375730037689, mean loss: 0.3430945700836424
Epoch: 44, step: 352, loss: 0.3460271954536438, mean loss: 0.3430946159855249
Epoch: 44, step: 353, loss: 0.3081260621547699, mean loss: 0.3430940686611575
Epoch: 44, step: 354, loss: 0.305805504322052, mean loss: 0.3430934850333486
Epoch: 44, step: 355, loss: 0.35649845004081726, mean loss: 0.3430936948399755
Epoch: 44, step: 356, loss: 0.2831071615219116, mean loss: 0.3430927559807371
Epoch: 44, step: 357, loss: 0.39137840270996094, mean loss: 0.34309351169561997
Epoch: 44, step: 358, loss: 0.3506551682949066, mean loss: 0.3430936300406642
Epoch: 44, step: 359, loss: 0.37058863043785095, mean loss: 0.3430940603492969
Epoch: 44, step: 360, loss: 0.328007310628891, mean loss: 0.34309382423884227
Epoch: 44, step: 361, loss: 0.3259330093860626, mean loss: 0.34309355567308353
Epoch: 44, step: 362, loss: 0.3063637912273407, mean loss: 0.3430929808633925
Epoch: 44, step: 363, loss: 0.32917121052742004, mean loss: 0.34309276299531216
Epoch: 44, step: 364, loss: 0.29597046971321106, mean loss: 0.34309202556877294
Epoch: 44, step: 365, loss: 0.32717618346214294, mean loss: 0.34309177650235706
Epoch: 44, step: 366, loss: 0.33115485310554504, mean loss: 0.34309158970481396
Epoch: 44, step: 367, loss: 0.359619677066803, mean loss: 0.343091848344138
Epoch: 44, step: 368, loss: 0.3059840798377991, mean loss: 0.3430912676733218
Epoch: 44, step: 369, loss: 0.3596068322658539, mean loss: 0.3430915261085954
Epoch: 44, step: 370, loss: 0.3218255043029785, mean loss: 0.34309119334345534
Epoch: 44, step: 371, loss: 0.3129631280899048, mean loss: 0.343090721914757
Epoch: 44, step: 372, loss: 0.3239232301712036, mean loss: 0.34309042199625184
Epoch: 44, step: 373, loss: 0.34039759635925293, mean loss: 0.3430903798615994
Epoch: 44, step: 374, loss: 0.3449437618255615, mean loss: 0.34309040886101994
Epoch: 44, step: 375, loss: 0.3613170385360718, mean loss: 0.34309069404423553
Epoch: 44, step: 376, loss: 0.3244105577468872, mean loss: 0.34309040176979533
Epoch: 44, step: 377, loss: 0.31578150391578674, mean loss: 0.34308997449411466
Epoch: 44, step: 378, loss: 0.30782219767570496, mean loss: 0.3430894227022533
Epoch: 44, step: 379, loss: 0.3454526662826538, mean loss: 0.34308945967646287
Epoch: 44, step: 380, loss: 0.28316742181777954, mean loss: 0.34308852217880403
Epoch: 44, step: 381, loss: 0.35894501209259033, mean loss: 0.3430887702543057
Epoch: 44, step: 382, loss: 0.3724530339241028, mean loss: 0.34308922965235117
Epoch: 44, step: 383, loss: 0.3171555995941162, mean loss: 0.34308882393223133
Epoch: 44, step: 384, loss: 0.30507126450538635, mean loss: 0.34308822917371024
Epoch: 44, step: 385, loss: 0.3207760155200958, mean loss: 0.34308788011996266
Epoch: 44, step: 386, loss: 0.3566705584526062, mean loss: 0.3430880926049576
Epoch: 44, step: 387, loss: 0.31022223830223083, mean loss: 0.34308757846544347
Epoch: 44, step: 388, loss: 0.3059130609035492, mean loss: 0.3430869969321222
Epoch: 44, step: 389, loss: 0.34160467982292175, mean loss: 0.34308697374410624
Epoch: 44, step: 390, loss: 0.31535688042640686, mean loss: 0.3430865399666207
Epoch: 44, step: 391, loss: 0.3150186836719513, mean loss: 0.34308610091243014
Epoch: 44, step: 392, loss: 0.37569543719291687, mean loss: 0.343086610999187
Epoch: 44, step: 393, loss: 0.3362388610839844, mean loss: 0.3430865038859395
Epoch: 44, step: 394, loss: 0.3336324691772461, mean loss: 0.3430863560072154
Epoch: 44, step: 395, loss: 0.3173610270023346, mean loss: 0.34308595362141475
Epoch: 44, step: 396, loss: 0.3299759328365326, mean loss: 0.3430857485626691
Epoch: 44, step: 397, loss: 0.31952977180480957, mean loss: 0.3430853801205764
Epoch: 44, step: 398, loss: 0.3134384751319885, mean loss: 0.3430849164167367
Epoch: 44, step: 399, loss: 0.31886595487594604, mean loss: 0.3430845376166626
Epoch: 44, step: 400, loss: 0.3160442113876343, mean loss: 0.34308411469525196
Epoch: 44, step: 401, loss: 0.35474786162376404, mean loss: 0.3430842971180198
Epoch: 44, step: 402, loss: 0.3846285939216614, mean loss: 0.3430849468669493
Epoch: 44, step: 403, loss: 0.32250258326530457, mean loss: 0.3430846249657356
Epoch: 44, step: 404, loss: 0.3228641152381897, mean loss: 0.34308430872874013
Epoch: 44, step: 405, loss: 0.32104629278182983, mean loss: 0.34308396407239616
Epoch: 44, step: 406, loss: 0.30663585662841797, mean loss: 0.34308339406305277
Epoch: 44, step: 407, loss: 0.3324984610080719, mean loss: 0.34308322852863116
Epoch: 44, step: 408, loss: 0.3671382665634155, mean loss: 0.34308360471188293
Epoch: 44, step: 409, loss: 0.331169992685318, mean loss: 0.34308341840449813
Epoch: 44, step: 410, loss: 0.31967684626579285, mean loss: 0.3430830523736892
Epoch: 44, step: 411, loss: 0.31945547461509705, mean loss: 0.3430826828925833
Epoch: 44, step: 412, loss: 0.313207745552063, mean loss: 0.3430822157244127
Epoch: 44, step: 413, loss: 0.356502890586853, mean loss: 0.3430824255864121
Epoch: 44, step: 414, loss: 0.3501996397972107, mean loss: 0.34308253687809187
Epoch: 44, step: 415, loss: 0.33256515860557556, mean loss: 0.3430823724207133
Epoch: 44, step: 416, loss: 0.3609771728515625, mean loss: 0.3430826522324568
Epoch: 44, step: 417, loss: 0.3191334009170532, mean loss: 0.3430822777562502
Epoch: 44, step: 418, loss: 0.31913813948631287, mean loss: 0.3430819033658465
Epoch: 44, step: 419, loss: 0.30760085582733154, mean loss: 0.34308134859307243
Epoch: 44, step: 420, loss: 0.29298561811447144, mean loss: 0.3430805653210228
Epoch: 44, step: 421, loss: 0.34442296624183655, mean loss: 0.3430805863098111
Epoch: 44, step: 422, loss: 0.3787479102611542, mean loss: 0.34308114396899825
Epoch: 44, step: 423, loss: 0.3206087350845337, mean loss: 0.34308079261801505
Epoch: 44, step: 424, loss: 0.34047967195510864, mean loss: 0.3430807519507231
Epoch: 44, step: 425, loss: 0.3678044080734253, mean loss: 0.3430811384873561
Epoch: 44, step: 426, loss: 0.3561549782752991, mean loss: 0.3430813428842698
Epoch: 44, step: 427, loss: 0.34828221797943115, mean loss: 0.3430814241936797
Epoch: 44, step: 428, loss: 0.3889909088611603, mean loss: 0.34308214192188524
Epoch: 44, step: 429, loss: 0.3284132778644562, mean loss: 0.34308191259905657
Epoch: 44, step: 430, loss: 0.32483282685279846, mean loss: 0.3430816273099896
Epoch: 44, step: 431, loss: 0.3528028130531311, mean loss: 0.34308177927950156
Epoch: 44, step: 432, loss: 0.319932222366333, mean loss: 0.34308141739238573
Epoch: 44, step: 433, loss: 0.3342490792274475, mean loss: 0.3430812793223816
Epoch: 44, step: 434, loss: 0.33442047238349915, mean loss: 0.3430811439359262
Epoch: 44, step: 435, loss: 0.34432223439216614, mean loss: 0.34308116333645233
Epoch: 44, step: 436, loss: 0.3007131516933441, mean loss: 0.3430805010568712
Epoch: 44, step: 437, loss: 0.32477867603302, mean loss: 0.3430802149746343
Epoch: 44, step: 438, loss: 0.3206180930137634, mean loss: 0.3430798638668272
Epoch: 44, step: 439, loss: 0.3239370584487915, mean loss: 0.3430795646482856
Epoch: 44, step: 440, loss: 0.3192915618419647, mean loss: 0.3430791928271185
Epoch: 44, step: 441, loss: 0.31272605061531067, mean loss: 0.3430787183961858
Epoch: 44, step: 442, loss: 0.3212348222732544, mean loss: 0.3430783769732795
Epoch: 44, step: 443, loss: 0.32870757579803467, mean loss: 0.34307815235931927
Epoch: 44, step: 444, loss: 0.3159366846084595, mean loss: 0.3430777281479479
Epoch: 44, step: 445, loss: 0.30242717266082764, mean loss: 0.343077092804328
Epoch: 44, step: 446, loss: 0.3922438621520996, mean loss: 0.3430778612392146
Epoch: 44, step: 447, loss: 0.3545975685119629, mean loss: 0.3430780412796508
Epoch: 44, step: 448, loss: 0.35897424817085266, mean loss: 0.34307828971611076
Epoch: 44, step: 449, loss: 0.35642868280410767, mean loss: 0.34307849836164395
Epoch: 44, step: 450, loss: 0.31167444586753845, mean loss: 0.34307800757363244
Epoch: 44, step: 451, loss: 0.31307411193847656, mean loss: 0.34307753867484464
Epoch: 44, step: 452, loss: 0.32333827018737793, mean loss: 0.3430772301957547
Epoch: 44, step: 453, loss: 0.33428654074668884, mean loss: 0.34307709281976706
Epoch: 44, step: 454, loss: 0.3708014190196991, mean loss: 0.34307752607329023
Epoch: 44, step: 455, loss: 0.3877066671848297, mean loss: 0.3430782234907973
Epoch: 44, step: 456, loss: 0.31158629059791565, mean loss: 0.3430777313755207
Epoch: 44, step: 457, loss: 0.34009799361228943, mean loss: 0.3430776848127529
Epoch: 44, step: 458, loss: 0.32051390409469604, mean loss: 0.34307733222613335
Epoch: 44, step: 459, loss: 0.34858986735343933, mean loss: 0.3430774183648784
Epoch: 44, step: 460, loss: 0.3231494128704071, mean loss: 0.3430771069751961
Epoch: 44, step: 461, loss: 0.32144293189048767, mean loss: 0.34307676893064654
Epoch: 44, step: 462, loss: 0.28194913268089294, mean loss: 0.34307581379640617
Epoch: 44, step: 463, loss: 0.29463234543800354, mean loss: 0.34307505686721307
Epoch: 44, step: 464, loss: 0.3116559088230133, mean loss: 0.34307456595069546
Epoch: 44, step: 465, loss: 0.3155404329299927, mean loss: 0.34307413574331097
Epoch: 44, step: 466, loss: 0.3403484523296356, mean loss: 0.3430740931565039
Epoch: 44, step: 467, loss: 0.35968780517578125, mean loss: 0.34307435272953085
Epoch: 44, step: 468, loss: 0.2982040047645569, mean loss: 0.343073651685113
Epoch: 44, step: 469, loss: 0.31884291768074036, mean loss: 0.3430732731153851
Epoch: 44, step: 470, loss: 0.3551309108734131, mean loss: 0.343073461495371
Epoch: 44, step: 471, loss: 0.3479554355144501, mean loss: 0.34307353776668115
Epoch: 44, step: 472, loss: 0.31173020601272583, mean loss: 0.34307304809598244
Epoch: 44, step: 473, loss: 0.36588552594184875, mean loss: 0.34307340448526297
Epoch: 44, step: 474, loss: 0.275000661611557, mean loss: 0.3430723410314367
Epoch: 44, step: 475, loss: 0.3197883367538452, mean loss: 0.3430719772870719
Epoch: 44, step: 476, loss: 0.30510327219963074, mean loss: 0.3430713841465366
Epoch: 44, step: 477, loss: 0.3204386234283447, mean loss: 0.3430710305869915
Epoch: 44, step: 478, loss: 0.3577955961227417, mean loss: 0.34307126060441767
Epoch: 44, step: 479, loss: 0.3095335066318512, mean loss: 0.34307073670798593
Epoch: 44, step: 480, loss: 0.3124777376651764, mean loss: 0.3430702588193151
Epoch: 44, step: 481, loss: 0.328482449054718, mean loss: 0.34307003094887606
Epoch: 44, step: 482, loss: 0.32086870074272156, mean loss: 0.3430696841560457
Epoch: 44, step: 483, loss: 0.34353944659233093, mean loss: 0.34306969149379074
Epoch: 44, step: 484, loss: 0.30478426814079285, mean loss: 0.34306909348027403
Epoch: 44, step: 485, loss: 0.30351337790489197, mean loss: 0.34306847563460263
Epoch: 44, step: 486, loss: 0.3370334804058075, mean loss: 0.34306838137167794
Epoch: 44, step: 487, loss: 0.32680463790893555, mean loss: 0.343068127345946
Epoch: 44, step: 488, loss: 0.3456360697746277, mean loss: 0.34306816745437907
Epoch: 44, step: 489, loss: 0.33130156993865967, mean loss: 0.34306798367595287
Epoch: 44, step: 490, loss: 0.33485618233680725, mean loss: 0.34306785542066465
Epoch: 44, step: 491, loss: 0.3402443528175354, mean loss: 0.34306781132272934
Epoch: 44, step: 492, loss: 0.31333673000335693, mean loss: 0.34306734698498675
Epoch: 44, step: 493, loss: 0.29120784997940063, mean loss: 0.3430665370599984
Epoch: 44, step: 494, loss: 0.380502313375473, mean loss: 0.3430671217108131
Epoch: 44, step: 495, loss: 0.35435277223587036, mean loss: 0.34306729796097746
Epoch: 44, step: 496, loss: 0.32636311650276184, mean loss: 0.3430670370926524
Epoch: 44, step: 497, loss: 0.3283815085887909, mean loss: 0.34306680775310616
Epoch: 44, step: 498, loss: 0.306045800447464, mean loss: 0.3430662296160357
Epoch: 44, step: 499, loss: 0.3491877019405365, mean loss: 0.34306632521026903
Epoch: 44, step: 500, loss: 0.2822911739349365, mean loss: 0.34306537614720745
Epoch: 44, step: 501, loss: 0.3233124613761902, mean loss: 0.34306506769106
Epoch: 44, step: 502, loss: 0.3693370819091797, mean loss: 0.3430654779412859
Epoch: 44, step: 503, loss: 0.3475361764431, mean loss: 0.34306554775231807
Epoch: 44, step: 504, loss: 0.32374149560928345, mean loss: 0.34306524600730876
Epoch: 44, step: 505, loss: 0.29616591334342957, mean loss: 0.34306451368582186
Epoch: 44, step: 506, loss: 0.28639212250709534, mean loss: 0.34306362877425967
Epoch: 44, step: 507, loss: 0.3298953175544739, mean loss: 0.34306342316075616
Epoch: 44, step: 508, loss: 0.3485637903213501, mean loss: 0.34306350904360666
Epoch: 44, step: 509, loss: 0.3428358733654022, mean loss: 0.3430635054893538
Epoch: 44, step: 510, loss: 0.3165273666381836, mean loss: 0.34306309116645267
Epoch: 44, step: 511, loss: 0.33153948187828064, mean loss: 0.34306291124499866
Epoch: 44, step: 512, loss: 0.32067349553108215, mean loss: 0.34306256167801535
Epoch: 44, step: 513, loss: 0.3764379620552063, mean loss: 0.34306308276154973
Epoch: 44, step: 514, loss: 0.3356213867664337, mean loss: 0.34306296657763385
Epoch: 44, step: 515, loss: 0.34340324997901917, mean loss: 0.3430629718902455
Epoch: 44, step: 516, loss: 0.29293638467788696, mean loss: 0.3430621893103942
Epoch: 44, step: 517, loss: 0.2937528192996979, mean loss: 0.3430614195010145
Epoch: 44, step: 518, loss: 0.34417057037353516, mean loss: 0.34306143681661627
Epoch: 44, step: 519, loss: 0.34420400857925415, mean loss: 0.34306145465369264
Epoch: 44, step: 520, loss: 0.3256082832813263, mean loss: 0.3430611821905524
Epoch: 44, step: 521, loss: 0.34813445806503296, mean loss: 0.3430612613887146
Epoch: 44, step: 522, loss: 0.35181760787963867, mean loss: 0.3430613980806157
Epoch: 44, step: 523, loss: 0.3415195345878601, mean loss: 0.34306137401156334
Epoch: 44, step: 524, loss: 0.3152426779270172, mean loss: 0.3430609397583346
Epoch: 44, step: 525, loss: 0.3173760175704956, mean loss: 0.3430605388198346
Epoch: 44, step: 526, loss: 0.3340761065483093, mean loss: 0.34306039857613274
Epoch: 44, step: 527, loss: 0.3466643989086151, mean loss: 0.3430604548323817
Epoch: 44, step: 528, loss: 0.36174046993255615, mean loss: 0.3430607464114826
Epoch: 44, step: 529, loss: 0.29546260833740234, mean loss: 0.34306000345674725
Epoch: 44, step: 530, loss: 0.346273809671402, mean loss: 0.34306005361995473
Epoch: 44, step: 531, loss: 0.3355506360530853, mean loss: 0.343059936409841
Epoch: 44, step: 532, loss: 0.32246100902557373, mean loss: 0.34305961489823034
Epoch: 44, step: 533, loss: 0.30693063139915466, mean loss: 0.34305905099962725
Epoch: 44, step: 534, loss: 0.349081426858902, mean loss: 0.343059144994974
Epoch: 44, step: 535, loss: 0.372638463973999, mean loss: 0.3430596066524683
Epoch: 44, step: 536, loss: 0.3709092140197754, mean loss: 0.34306004130680584
Epoch: 44, step: 537, loss: 0.30816254019737244, mean loss: 0.3430594966630953
Epoch: 44, step: 538, loss: 0.33901047706604004, mean loss: 0.3430594334712171
Epoch: 44, step: 539, loss: 0.35291096568107605, mean loss: 0.34305958721883256
Epoch: 44, step: 540, loss: 0.33696797490119934, mean loss: 0.3430594921517677
Epoch: 44, step: 541, loss: 0.3338262736797333, mean loss: 0.34305934805834293
Epoch: 44, step: 542, loss: 0.35408827662467957, mean loss: 0.34305952017289787
Epoch: 44, step: 543, loss: 0.3239678144454956, mean loss: 0.34305922223741525
Epoch: 44, step: 544, loss: 0.3685273826122284, mean loss: 0.3430596196744149
Epoch: 44, step: 545, loss: 0.32271164655685425, mean loss: 0.3430593021441706
Epoch: 44, step: 546, loss: 0.3333527445793152, mean loss: 0.34305915067564435
Epoch: 44, step: 547, loss: 0.3362967371940613, mean loss: 0.3430590451514342
Epoch: 44, step: 548, loss: 0.36316487193107605, mean loss: 0.34305935888829586
Epoch: 44, step: 549, loss: 0.35134074091911316, mean loss: 0.34305948811124676
Epoch: 44, step: 550, loss: 0.35190844535827637, mean loss: 0.343059626188505
Epoch: 44, step: 551, loss: 0.3038199245929718, mean loss: 0.34305901391005045
Epoch: 44, step: 552, loss: 0.3267724812030792, mean loss: 0.34305875978636763
Epoch: 44, step: 553, loss: 0.3848895728588104, mean loss: 0.3430594124749785
Epoch: 44, step: 554, loss: 0.33485037088394165, mean loss: 0.3430592843908233
Epoch: 44, step: 555, loss: 0.31352129578590393, mean loss: 0.3430588235222499
Epoch: 44, step: 556, loss: 0.33319398760795593, mean loss: 0.34305866960784565
Epoch: 44, step: 557, loss: 0.3266604542732239, mean loss: 0.34305841376150537
Epoch: 44, step: 558, loss: 0.3236153721809387, mean loss: 0.3430581104142617
Epoch: 44, step: 559, loss: 0.3806557059288025, mean loss: 0.3430586969968178
Epoch: 44, step: 560, loss: 0.3310394287109375, mean loss: 0.3430585094799561
Epoch: 44, step: 561, loss: 0.33608531951904297, mean loss: 0.3430584006904469
Epoch: 44, step: 562, loss: 0.2860727906227112, mean loss: 0.3430575116655001
Epoch: 44, step: 563, loss: 0.32297590374946594, mean loss: 0.3430571983798852
Epoch: 44, step: 564, loss: 0.3286272883415222, mean loss: 0.34305697326779583
Epoch: 44, step: 565, loss: 0.40365657210350037, mean loss: 0.34305791862985685
Epoch: 44, step: 566, loss: 0.29357078671455383, mean loss: 0.3430571466358485
Epoch: 44, step: 567, loss: 0.3269236385822296, mean loss: 0.34305689495876046
Epoch: 44, step: 568, loss: 0.33889633417129517, mean loss: 0.34305683005647847
Epoch: 44, step: 569, loss: 0.3734121322631836, mean loss: 0.34305730357381237
Epoch: 44, step: 570, loss: 0.29329678416252136, mean loss: 0.3430565273634233
Epoch: 44, step: 571, loss: 0.30044302344322205, mean loss: 0.3430558626491299
Epoch: 44, step: 572, loss: 0.31700098514556885, mean loss: 0.3430554562338449
Epoch: 44, step: 573, loss: 0.3808978796005249, mean loss: 0.34305604650717775
Epoch: 44, step: 574, loss: 0.31205621361732483, mean loss: 0.3430555629734177
Epoch: 44, step: 575, loss: 0.35764214396476746, mean loss: 0.34305579049059065
Epoch: 44, step: 576, loss: 0.33550167083740234, mean loss: 0.34305567266550596
Epoch: 44, step: 577, loss: 0.3126322031021118, mean loss: 0.3430551981440354
Epoch: 44, step: 578, loss: 0.319665789604187, mean loss: 0.34305483334003417
Epoch: 44, step: 579, loss: 0.32887858152389526, mean loss: 0.3430546122368491
Epoch: 44, step: 580, loss: 0.3683800995349884, mean loss: 0.3430550072254995
Epoch: 44, step: 581, loss: 0.3088509440422058, mean loss: 0.34305447377056975
Epoch: 44, step: 582, loss: 0.360116571187973, mean loss: 0.3430547398710613
Epoch: 44, step: 583, loss: 0.32876741886138916, mean loss: 0.343054517049461
Epoch: 44, step: 584, loss: 0.34159499406814575, mean loss: 0.34305449428744883
Epoch: 44, step: 585, loss: 0.3035270869731903, mean loss: 0.3430538778467995
Epoch: 44, step: 586, loss: 0.2999385595321655, mean loss: 0.34305320546219004
Epoch: 44, step: 587, loss: 0.30025944113731384, mean loss: 0.3430525381026316
Epoch: 44, step: 588, loss: 0.35632166266441345, mean loss: 0.34305274502855065
Epoch: 44, step: 589, loss: 0.3776208460330963, mean loss: 0.34305328409384406
Epoch: 44, step: 590, loss: 0.36496078968048096, mean loss: 0.343053625720703
Epoch: 44, step: 591, loss: 0.3606782853603363, mean loss: 0.3430539005563386
Epoch: 44, step: 592, loss: 0.2996175289154053, mean loss: 0.3430532232282711
Epoch: 44, step: 593, loss: 0.37850096821784973, mean loss: 0.34305377597651665
Epoch: 44, step: 594, loss: 0.35648950934410095, mean loss: 0.343053985481021
Epoch: 44, step: 595, loss: 0.3466187119483948, mean loss: 0.34305404106522963
Epoch: 44, step: 596, loss: 0.30501559376716614, mean loss: 0.34305344794706427
Epoch: 44, step: 597, loss: 0.2970702052116394, mean loss: 0.34305273096008804
Epoch: 44, step: 598, loss: 0.34559166431427, mean loss: 0.3430527705474172
Epoch: 44, step: 599, loss: 0.2987739145755768, mean loss: 0.3430520801573715
Epoch: 44, step: 600, loss: 0.29157787561416626, mean loss: 0.3430512775909193
Epoch: 44, step: 601, loss: 0.35736438632011414, mean loss: 0.343051500752052
Epoch: 44, step: 602, loss: 0.316111296415329, mean loss: 0.3430510807236085
Epoch: 44, step: 603, loss: 0.29189273715019226, mean loss: 0.34305028311924973
Epoch: 44, step: 604, loss: 0.34738680720329285, mean loss: 0.34305035072848694
Epoch: 44, step: 605, loss: 0.32880809903144836, mean loss: 0.343050128685961
Epoch: 44, step: 606, loss: 0.2963889241218567, mean loss: 0.343049401230049
Epoch: 44, step: 607, loss: 0.32367828488349915, mean loss: 0.34304909923584304
Epoch: 44, step: 608, loss: 0.34084686636924744, mean loss: 0.34304906490373815
Epoch: 44, step: 609, loss: 0.32002872228622437, mean loss: 0.34304870602956644
Epoch: 44, step: 610, loss: 0.3347536027431488, mean loss: 0.34304857671559563
Epoch: 44, step: 611, loss: 0.31766948103904724, mean loss: 0.3430481810821281
Epoch: 44, step: 612, loss: 0.31370118260383606, mean loss: 0.34304772360035163
Epoch: 44, step: 613, loss: 0.3535454273223877, mean loss: 0.3430478872434338
Epoch: 44, step: 614, loss: 0.3519166111946106, mean loss: 0.34304802549106755
Epoch: 44, step: 615, loss: 0.3173723518848419, mean loss: 0.3430476252592181
Epoch: 44, step: 616, loss: 0.30597513914108276, mean loss: 0.3430470473831076
Epoch: 44, step: 617, loss: 0.3582243025302887, mean loss: 0.34304728395845985
Epoch: 44, step: 618, loss: 0.3319210410118103, mean loss: 0.3430471105309336
Epoch: 44, step: 619, loss: 0.3148808479309082, mean loss: 0.34304667150321055
Epoch: 44, step: 620, loss: 0.3232320249080658, mean loss: 0.3430463626569959
Epoch: 44, step: 621, loss: 0.28235241770744324, mean loss: 0.3430454166495619
Epoch: 44, step: 622, loss: 0.3474663496017456, mean loss: 0.3430454855554512
Epoch: 44, step: 623, loss: 0.3229576349258423, mean loss: 0.34304517246551
Epoch: 44, step: 624, loss: 0.32856303453445435, mean loss: 0.3430449467499206
Epoch: 44, step: 625, loss: 0.30566513538360596, mean loss: 0.343044364165036
Epoch: 44, step: 626, loss: 0.34612664580345154, mean loss: 0.34304441220333903
Epoch: 44, step: 627, loss: 0.2999506890773773, mean loss: 0.34304374058493736
Epoch: 44, step: 628, loss: 0.306854248046875, mean loss: 0.34304317657819633
Epoch: 44, step: 629, loss: 0.3184526562690735, mean loss: 0.3430427933453268
Epoch: 44, step: 630, loss: 0.2977452874183655, mean loss: 0.3430420874138366
Epoch: 44, step: 631, loss: 0.3514728248119354, mean loss: 0.3430422187992218
Epoch: 44, step: 632, loss: 0.3514482080936432, mean loss: 0.3430423497968888
Epoch: 44, step: 633, loss: 0.3295391798019409, mean loss: 0.34304213936880723
Epoch: 44, step: 634, loss: 0.32804781198501587, mean loss: 0.34304190570675763
Epoch: 44, step: 635, loss: 0.3280107080936432, mean loss: 0.343041671473796
Epoch: 44, step: 636, loss: 0.3540479838848114, mean loss: 0.3430418429838144
Epoch: 44, step: 637, loss: 0.3824533224105835, mean loss: 0.3430424571185018
Epoch: 44, step: 638, loss: 0.3253242075443268, mean loss: 0.3430421810257932
Epoch: 44, step: 639, loss: 0.330511212348938, mean loss: 0.343041985766371
Epoch: 44, step: 640, loss: 0.32613641023635864, mean loss: 0.3430417223452773
Epoch: 44, step: 641, loss: 0.31668147444725037, mean loss: 0.34304131160876483
Epoch: 44, step: 642, loss: 0.33274731040000916, mean loss: 0.3430411512136012
Epoch: 44, step: 643, loss: 0.3499467968940735, mean loss: 0.3430412588116953
Epoch: 44, step: 644, loss: 0.31795772910118103, mean loss: 0.3430408679868451
Epoch: 44, step: 645, loss: 0.32716211676597595, mean loss: 0.34304062058490653
Epoch: 44, step: 646, loss: 0.366566002368927, mean loss: 0.34304098712093295
Epoch: 44, step: 647, loss: 0.3120875358581543, mean loss: 0.34304050485975784
Epoch: 44, step: 648, loss: 0.31145551800727844, mean loss: 0.3430400127667945
Epoch: 44, step: 649, loss: 0.3033497929573059, mean loss: 0.3430393944042262
Epoch: 44, step: 650, loss: 0.35140854120254517, mean loss: 0.34303952479117056
Epoch: 44, step: 651, loss: 0.325544536113739, mean loss: 0.3430392522326132
Epoch: 44, step: 652, loss: 0.32919132709503174, mean loss: 0.34303903649588047
Epoch: 44, step: 653, loss: 0.3468988239765167, mean loss: 0.3430390966265469
Epoch: 44, step: 654, loss: 0.36532777547836304, mean loss: 0.3430394438509063
Epoch: 44, step: 655, loss: 0.30370622873306274, mean loss: 0.3430388311076498
Epoch: 44, step: 656, loss: 0.34409499168395996, mean loss: 0.3430388475605431
Epoch: 44, step: 657, loss: 0.35743555426597595, mean loss: 0.3430390718292708
Epoch: 44, step: 658, loss: 0.3094029426574707, mean loss: 0.3430385478612176
Epoch: 44, step: 659, loss: 0.30769458413124084, mean loss: 0.34303799729788453
Epoch: 44, step: 660, loss: 0.3048085570335388, mean loss: 0.3430374017959099
Epoch: 44, step: 661, loss: 0.3616757094860077, mean loss: 0.3430376921212735
Epoch: 44, step: 662, loss: 0.34108567237854004, mean loss: 0.3430376617155079
Epoch: 44, step: 663, loss: 0.3321618437767029, mean loss: 0.3430374923102441
Epoch: 44, step: 664, loss: 0.30439645051956177, mean loss: 0.34303689043423297
Epoch: 44, step: 665, loss: 0.33303648233413696, mean loss: 0.34303673466948886
Epoch: 44, step: 666, loss: 0.31887510418891907, mean loss: 0.34303635833769003
Epoch: 44, step: 667, loss: 0.2980217933654785, mean loss: 0.34303565721992524
Epoch: 44, step: 668, loss: 0.34780558943748474, mean loss: 0.34303573151214883
Epoch: 44, step: 669, loss: 0.3328646719455719, mean loss: 0.34303557309923466
Epoch: 44, step: 670, loss: 0.3337310254573822, mean loss: 0.3430354281843867
Epoch: 44, step: 671, loss: 0.31706178188323975, mean loss: 0.3430350236608647
Epoch: 44, step: 672, loss: 0.3216322064399719, mean loss: 0.343034690330378
Epoch: 44, step: 673, loss: 0.35540199279785156, mean loss: 0.34303488293748696
Epoch: 44, step: 674, loss: 0.3357831537723541, mean loss: 0.3430347700015544
Epoch: 44, step: 675, loss: 0.3417053818702698, mean loss: 0.3430347492984439
Epoch: 44, step: 676, loss: 0.3271333575248718, mean loss: 0.34303450166335797
Epoch: 44, step: 677, loss: 0.3363341689109802, mean loss: 0.3430343973195583
Epoch: 44, step: 678, loss: 0.35813480615615845, mean loss: 0.3430346324734762
Epoch: 44, step: 679, loss: 0.3640824258327484, mean loss: 0.3430349602390387
Epoch: 44, step: 680, loss: 0.34033820033073425, mean loss: 0.3430349182445527
Epoch: 44, step: 681, loss: 0.3555065989494324, mean loss: 0.343035112453041
Epoch: 44, step: 682, loss: 0.30143916606903076, mean loss: 0.3430344647327965
Epoch: 44, step: 683, loss: 0.337293416261673, mean loss: 0.34303437533621484
Epoch: 44, step: 684, loss: 0.3213993012905121, mean loss: 0.34303403845148794
Epoch: 44, step: 685, loss: 0.3598995506763458, mean loss: 0.3430343010641787
Epoch: 44, step: 686, loss: 0.3388356566429138, mean loss: 0.3430342356881542
Epoch: 44, step: 687, loss: 0.35939499735832214, mean loss: 0.3430344904334468
Epoch: 44, step: 688, loss: 0.34337010979652405, mean loss: 0.3430344956591278
Epoch: 44, step: 689, loss: 0.31006693840026855, mean loss: 0.34303398235365556
Epoch: 44, step: 690, loss: 0.293503999710083, mean loss: 0.34303321118292296
Epoch: 44, step: 691, loss: 0.3601667582988739, mean loss: 0.34303347794425937
Epoch: 44, step: 692, loss: 0.33118048310279846, mean loss: 0.34303329340153194
Epoch: 44, step: 693, loss: 0.337839275598526, mean loss: 0.34303321253561564
Epoch: 44, step: 694, loss: 0.34808608889579773, mean loss: 0.34303329120286913
Epoch: 44, step: 695, loss: 0.376630574464798, mean loss: 0.34303381426432233
Epoch: 44, step: 696, loss: 0.32596826553344727, mean loss: 0.3430335485823718
Epoch: 44, step: 697, loss: 0.34193670749664307, mean loss: 0.3430335315066629
Epoch: 44, step: 698, loss: 0.29522398114204407, mean loss: 0.343032787215383
Epoch: 44, step: 699, loss: 0.3376697897911072, mean loss: 0.3430327037264138
Epoch: 44, step: 700, loss: 0.33860188722610474, mean loss: 0.343032634750333
Epoch: 44, step: 701, loss: 0.29489666223526, mean loss: 0.34303188541236307
Epoch: 44, step: 702, loss: 0.30650725960731506, mean loss: 0.3430313168383534
Epoch: 44, step: 703, loss: 0.3410016894340515, mean loss: 0.3430312852439044
Epoch: 44, step: 704, loss: 0.3521096408367157, mean loss: 0.3430314265610631
Epoch: 44, step: 705, loss: 0.32305049896240234, mean loss: 0.34303111553513616
Epoch: 44, step: 706, loss: 0.3118366003036499, mean loss: 0.34303062996448674
Epoch: 44, step: 707, loss: 0.3267943263053894, mean loss: 0.3430303772357703
Epoch: 44, step: 708, loss: 0.35214105248451233, mean loss: 0.34303051904719917
Epoch: 44, step: 709, loss: 0.31358739733695984, mean loss: 0.343030060759964
Epoch: 44, step: 710, loss: 0.3252519369125366, mean loss: 0.3430297840447268
Epoch: 44, step: 711, loss: 0.31250280141830444, mean loss: 0.34302930890180205
Epoch: 44, step: 712, loss: 0.35190239548683167, mean loss: 0.3430294470064665
Epoch: 44, step: 713, loss: 0.32673919200897217, mean loss: 0.3430291934616416
Epoch: 44, step: 714, loss: 0.3058690130710602, mean loss: 0.34302861510207694
Epoch: 44, step: 715, loss: 0.3466910421848297, mean loss: 0.34302867210305876
Epoch: 44, step: 716, loss: 0.32645198702812195, mean loss: 0.3430284141122245
Epoch: 44, step: 717, loss: 0.34771597385406494, mean loss: 0.3430284870658109
Epoch: 44, step: 718, loss: 0.29327741265296936, mean loss: 0.3430277127902773
Epoch: 44, step: 719, loss: 0.269209086894989, mean loss: 0.34302656396953063
Epoch: 44, step: 720, loss: 0.31569400429725647, mean loss: 0.34302613860638465
Epoch: 44, step: 721, loss: 0.3180171549320221, mean loss: 0.34302574940996283
Epoch: 44, step: 722, loss: 0.31229493021965027, mean loss: 0.34302527117626497
Epoch: 44, step: 723, loss: 0.3119668662548065, mean loss: 0.3430247878521921
Epoch: 44, step: 724, loss: 0.3230104148387909, mean loss: 0.34302447639776384
Epoch: 44, step: 725, loss: 0.343395471572876, mean loss: 0.34302448217092957
Epoch: 44, step: 726, loss: 0.3293469250202179, mean loss: 0.343024269333727
Epoch: 44, step: 727, loss: 0.2873445749282837, mean loss: 0.3430234029124895
Epoch: 44, step: 728, loss: 0.3662375509738922, mean loss: 0.3430237641378542
Epoch: 44, step: 729, loss: 0.34944653511047363, mean loss: 0.3430238640782733
Epoch: 44, step: 730, loss: 0.321745365858078, mean loss: 0.34302353298302657
Epoch: 44, step: 731, loss: 0.3616047203540802, mean loss: 0.3430238221033877
Epoch: 44, step: 732, loss: 0.29823869466781616, mean loss: 0.34302312526467177
Epoch: 44, step: 733, loss: 0.34863337874412537, mean loss: 0.3430232125566195
Epoch: 44, step: 734, loss: 0.3530668020248413, mean loss: 0.34302336882600176
Epoch: 44, step: 735, loss: 0.31719085574150085, mean loss: 0.34302296690116535
Epoch: 44, step: 736, loss: 0.3405062258243561, mean loss: 0.3430229277441153
Epoch: 44, step: 737, loss: 0.31668025255203247, mean loss: 0.3430225178944842
Epoch: 44, step: 738, loss: 0.3703981041908264, mean loss: 0.34302294380792325
Epoch: 44, step: 739, loss: 0.33686363697052, mean loss: 0.3430228479820032
Epoch: 44, step: 740, loss: 0.35384446382522583, mean loss: 0.3430230163410717
Epoch: 44, step: 741, loss: 0.3705701529979706, mean loss: 0.34302344490351383
Epoch: 44, step: 742, loss: 0.33515486121177673, mean loss: 0.34302332249053774
Epoch: 44, step: 743, loss: 0.31492000818252563, mean loss: 0.3430228852890084
Epoch: 44, step: 744, loss: 0.3421338200569153, mean loss: 0.3430228714580905
Epoch: 44, step: 745, loss: 0.3651100695133209, mean loss: 0.3430232150565793
Epoch: 44, step: 746, loss: 0.32343292236328125, mean loss: 0.3430229103058257
Epoch: 44, step: 747, loss: 0.2936509847640991, mean loss: 0.3430221422776143
Epoch: 44, step: 748, loss: 0.321967214345932, mean loss: 0.34302181475287397
Epoch: 44, step: 749, loss: 0.3129388093948364, mean loss: 0.3430213467970926
Epoch: 44, step: 750, loss: 0.30761411786079407, mean loss: 0.3430207960289912
Epoch: 44, step: 751, loss: 0.34744784235954285, mean loss: 0.3430208648917079
Epoch: 44, step: 752, loss: 0.3454359471797943, mean loss: 0.3430209024577346
Epoch: 44, step: 753, loss: 0.3385400176048279, mean loss: 0.34302083275972783
Epoch: 44, step: 754, loss: 0.341632217168808, mean loss: 0.3430208111608168
Epoch: 44, step: 755, loss: 0.30833205580711365, mean loss: 0.34302027161071175
Epoch: 44, step: 756, loss: 0.361723393201828, mean loss: 0.34302056251518953
Epoch: 44, step: 757, loss: 0.28644680976867676, mean loss: 0.34301968259244797
Epoch: 44, step: 758, loss: 0.35443294048309326, mean loss: 0.34301986010637425
Epoch: 44, step: 759, loss: 0.3128970265388489, mean loss: 0.3430193916039236
Epoch: 44, step: 760, loss: 0.37668952345848083, mean loss: 0.3430199152695978
Epoch: 44, step: 761, loss: 0.3427121341228485, mean loss: 0.3430199104828059
Epoch: 44, step: 762, loss: 0.31363967061042786, mean loss: 0.3430194535512848
Epoch: 44, step: 763, loss: 0.3891350030899048, mean loss: 0.34302017074490126
Epoch: 44, step: 764, loss: 0.3377307057380676, mean loss: 0.3430200884838943
Epoch: 44, step: 765, loss: 0.31699755787849426, mean loss: 0.34301968379149583
Epoch: 44, step: 766, loss: 0.35736942291259766, mean loss: 0.3430199069496552
Epoch: 44, step: 767, loss: 0.38809654116630554, mean loss: 0.3430206079423495
Epoch: 44, step: 768, loss: 0.30253273248672485, mean loss: 0.34301997831984027
Epoch: 44, step: 769, loss: 0.30195119976997375, mean loss: 0.3430193396737023
Epoch: 44, step: 770, loss: 0.35652440786361694, mean loss: 0.3430195496830044
Epoch: 44, step: 771, loss: 0.3180214464664459, mean loss: 0.3430191609583789
Epoch: 44, step: 772, loss: 0.3416246771812439, mean loss: 0.34301913927426353
Epoch: 44, step: 773, loss: 0.2888035178184509, mean loss: 0.3430182962386321
Epoch: 44, step: 774, loss: 0.3399454653263092, mean loss: 0.3430182484578339
Epoch: 44, step: 775, loss: 0.32682350277900696, mean loss: 0.3430179966425323
Epoch: 44, step: 776, loss: 0.3359145224094391, mean loss: 0.34301788619092477
Epoch: 44, step: 777, loss: 0.32258591055870056, mean loss: 0.3430175684999767
Epoch: 44, step: 778, loss: 0.28933438658714294, mean loss: 0.3430167338085064
Epoch: 44, step: 779, loss: 0.33247292041778564, mean loss: 0.34301656987086426
Epoch: 44, step: 780, loss: 0.33089742064476013, mean loss: 0.343016381442467
Epoch: 44, step: 781, loss: 0.3381597697734833, mean loss: 0.34301630593309684
Epoch: 44, step: 782, loss: 0.3530213534832001, mean loss: 0.3430164614866277
Epoch: 44, step: 783, loss: 0.31934550404548645, mean loss: 0.34301609346801076
Epoch: 44, step: 784, loss: 0.42929941415786743, mean loss: 0.343017434916693
Epoch: 44, step: 785, loss: 0.3378789722919464, mean loss: 0.3430173550301437
Epoch: 44, step: 786, loss: 0.33643463253974915, mean loss: 0.34301725269159467
Epoch: 44, step: 787, loss: 0.37250816822052, mean loss: 0.3430177111661225
Epoch: 44, step: 788, loss: 0.3262408971786499, mean loss: 0.34301745035284636
Epoch: 44, step: 789, loss: 0.3319390118122101, mean loss: 0.34301727812950683
Epoch: 44, step: 790, loss: 0.31525182723999023, mean loss: 0.34301684649969527
Epoch: 44, step: 791, loss: 0.31029313802719116, mean loss: 0.3430163377988423
Epoch: 44, step: 792, loss: 0.36951425671577454, mean loss: 0.34301674971133767
Epoch: 44, step: 793, loss: 0.3341324031352997, mean loss: 0.3430166116055305
Epoch: 44, step: 794, loss: 0.34067824482917786, mean loss: 0.34301657525654206
Epoch: 44, step: 795, loss: 0.3437425494194031, mean loss: 0.3430165865413484
Epoch: 44, step: 796, loss: 0.342321515083313, mean loss: 0.3430165757370729
Epoch: 44, step: 797, loss: 0.36685433983802795, mean loss: 0.3430169462684265
Epoch: 44, step: 798, loss: 0.29274487495422363, mean loss: 0.34301616485750996
Epoch: 44, step: 799, loss: 0.2933627963066101, mean loss: 0.343015393075482
Epoch: 44, step: 800, loss: 0.37154620885849, mean loss: 0.34301583653439033
Epoch: 44, step: 801, loss: 0.30225804448127747, mean loss: 0.3430152030395342
Epoch: 44, step: 802, loss: 0.3207738399505615, mean loss: 0.3430148573493138
Epoch: 44, step: 803, loss: 0.395288348197937, mean loss: 0.3430156698064299
Epoch: 44, step: 804, loss: 0.34014976024627686, mean loss: 0.34301562526392104
Epoch: 44, step: 805, loss: 0.37120991945266724, mean loss: 0.34301606345816726
Epoch: 44, step: 806, loss: 0.3605247735977173, mean loss: 0.34301633557339567
Epoch: 44, step: 807, loss: 0.30188265442848206, mean loss: 0.34301569629574513
Epoch: 44, step: 808, loss: 0.34164029359817505, mean loss: 0.343015674920305
Epoch: 44, step: 809, loss: 0.33158838748931885, mean loss: 0.34301549732904163
Epoch: 44, step: 810, loss: 0.3774772882461548, mean loss: 0.3430160328907759
Epoch: 44, step: 811, loss: 0.3525558412075043, mean loss: 0.3430161811441531
Epoch: 44, step: 812, loss: 0.3273628056049347, mean loss: 0.3430159378866737
Epoch: 44, step: 813, loss: 0.3609870672225952, mean loss: 0.3430162171583029
Epoch: 44, step: 814, loss: 0.3016281723976135, mean loss: 0.34301557399743887
Epoch: 44, step: 815, loss: 0.3340643346309662, mean loss: 0.3430154348993632
Epoch: 44, step: 816, loss: 0.3589717447757721, mean loss: 0.3430156828491072
Epoch: 44, step: 817, loss: 0.378498911857605, mean loss: 0.34301623422476385
Epoch: 44, step: 818, loss: 0.3607056140899658, mean loss: 0.3430165090966443
Epoch: 44, step: 819, loss: 0.37155064940452576, mean loss: 0.34301695247628733
Epoch: 44, step: 820, loss: 0.3158721625804901, mean loss: 0.3430165306917123
Epoch: 44, step: 821, loss: 0.3213365375995636, mean loss: 0.3430161938261619
Epoch: 44, step: 822, loss: 0.3168773651123047, mean loss: 0.3430157876851604
Epoch: 44, step: 823, loss: 0.33749154210090637, mean loss: 0.3430157018516367
Epoch: 44, step: 824, loss: 0.33111372590065, mean loss: 0.3430155169263566
Epoch: 44, step: 825, loss: 0.31062212586402893, mean loss: 0.34301501362641157
Epoch: 44, step: 826, loss: 0.3633027672767639, mean loss: 0.3430153288347401
Epoch: 44, step: 827, loss: 0.31961479783058167, mean loss: 0.34301496526922204
Epoch: 44, step: 828, loss: 0.34929773211479187, mean loss: 0.34301506288076317
Epoch: 44, step: 829, loss: 0.3424209654331207, mean loss: 0.34301505365077456
Epoch: 44, step: 830, loss: 0.33098074793815613, mean loss: 0.3430148666868689
Epoch: 44, step: 831, loss: 0.30135494470596313, mean loss: 0.34301421947207306
Epoch: 44, step: 832, loss: 0.335145503282547, mean loss: 0.343014097228195
Epoch: 44, step: 833, loss: 0.3394692540168762, mean loss: 0.3430140421583921
Epoch: 44, step: 834, loss: 0.326986163854599, mean loss: 0.34301379316617037
Epoch: 44, step: 835, loss: 0.31656739115715027, mean loss: 0.34301338232912926
Epoch: 44, step: 836, loss: 0.32643336057662964, mean loss: 0.3430131247673914
Epoch: 44, step: 837, loss: 0.3905344009399414, mean loss: 0.34301386297344
Epoch: 44, step: 838, loss: 0.3275523781776428, mean loss: 0.3430136227950354
Epoch: 44, step: 839, loss: 0.3253265619277954, mean loss: 0.3430133480488432
Epoch: 44, step: 840, loss: 0.33331170678138733, mean loss: 0.34301319734841806
Epoch: 44, step: 841, loss: 0.3366357982158661, mean loss: 0.34301309828664023
Epoch: 44, step: 842, loss: 0.32942092418670654, mean loss: 0.34301288715919026
Epoch: 44, step: 843, loss: 0.3562808632850647, mean loss: 0.3430130932476669
Epoch: 44, step: 844, loss: 0.31324124336242676, mean loss: 0.3430126308154293
Epoch: 44, step: 845, loss: 0.3412852883338928, mean loss: 0.34301260398584216
Epoch: 44, step: 846, loss: 0.33994677662849426, mean loss: 0.3430125563672572
Epoch: 44, step: 847, loss: 0.31459274888038635, mean loss: 0.34301211495623135
Epoch: 44, step: 848, loss: 0.3477974832057953, mean loss: 0.3430121892805033
Epoch: 44, step: 849, loss: 0.3278423249721527, mean loss: 0.34301195367238496
Epoch: 44, step: 850, loss: 0.33680734038352966, mean loss: 0.34301185730800565
Epoch: 44, step: 851, loss: 0.3019809126853943, mean loss: 0.343011220062795
Epoch: 44, step: 852, loss: 0.32519426941871643, mean loss: 0.3430109433548069
Epoch: 44, step: 853, loss: 0.3134540319442749, mean loss: 0.3430104843252773
Epoch: 44, step: 854, loss: 0.3459928631782532, mean loss: 0.3430105306419808
Epoch: 44, step: 855, loss: 0.34153589606285095, mean loss: 0.3430105077410835
Epoch: 44, step: 856, loss: 0.32702237367630005, mean loss: 0.34301025945114416
Epoch: 44, step: 857, loss: 0.28742432594299316, mean loss: 0.34300939623510684
Epoch: 44, step: 858, loss: 0.3317658305168152, mean loss: 0.3430092216320209
Epoch: 44, step: 859, loss: 0.3592270612716675, mean loss: 0.34300947347747157
Epoch: 44, step: 860, loss: 0.3456800580024719, mean loss: 0.3430095149481072
Epoch: 44, step: 861, loss: 0.31867966055870056, mean loss: 0.34300913714360415
Epoch: 44, step: 862, loss: 0.3668835759162903, mean loss: 0.34300950787045975
Epoch: 44, step: 863, loss: 0.3108433783054352, mean loss: 0.3430090083963982
Epoch: 44, step: 864, loss: 0.333578497171402, mean loss: 0.3430088619621623
Epoch: 44, step: 865, loss: 0.3524587154388428, mean loss: 0.3430090086944606
Epoch: 44, step: 866, loss: 0.3400101661682129, mean loss: 0.343008962130752
Epoch: 44, step: 867, loss: 0.3342084288597107, mean loss: 0.34300882548499595
Epoch: 44, step: 868, loss: 0.35429081320762634, mean loss: 0.34300900065754036
Epoch: 44, step: 869, loss: 0.3286002576351166, mean loss: 0.3430087769401379
Epoch: 44, step: 870, loss: 0.34696364402770996, mean loss: 0.3430088383444432
Epoch: 44, step: 871, loss: 0.32724177837371826, mean loss: 0.3430085935447293
Epoch: 44, step: 872, loss: 0.3666350841522217, mean loss: 0.34300896036443784
Epoch: 44, step: 873, loss: 0.3359966576099396, mean loss: 0.3430088514946544
Epoch: 44, step: 874, loss: 0.3645133376121521, mean loss: 0.3430091853582199
Epoch: 44, step: 875, loss: 0.34731370210647583, mean loss: 0.3430092521860897
Epoch: 44, step: 876, loss: 0.3246007263660431, mean loss: 0.34300896639710576
Epoch: 44, step: 877, loss: 0.3363218903541565, mean loss: 0.3430088625830895
Epoch: 44, step: 878, loss: 0.3470233380794525, mean loss: 0.3430089249051495
Epoch: 44, step: 879, loss: 0.3563230037689209, mean loss: 0.34300913159415325
Epoch: 44, step: 880, loss: 0.30318281054496765, mean loss: 0.3430085133362237
Epoch: 44, step: 881, loss: 0.3088431656360626, mean loss: 0.3430079829666422
Epoch: 44, step: 882, loss: 0.3184872269630432, mean loss: 0.34300760232186345
Epoch: 44, step: 883, loss: 0.30740463733673096, mean loss: 0.34300704965242873
Epoch: 44, step: 884, loss: 0.3683261275291443, mean loss: 0.3430074426776515
Epoch: 44, step: 885, loss: 0.3638652265071869, mean loss: 0.3430077664456784
Epoch: 44, step: 886, loss: 0.3119298815727234, mean loss: 0.3430072840421133
Epoch: 44, step: 887, loss: 0.33273935317993164, mean loss: 0.3430071246615895
Epoch: 44, step: 888, loss: 0.3104817867279053, mean loss: 0.34300661980574265
Epoch: 44, step: 889, loss: 0.30933043360710144, mean loss: 0.34300609709462915
Epoch: 44, step: 890, loss: 0.3225794732570648, mean loss: 0.34300578004395416
Epoch: 44, step: 891, loss: 0.3542892038822174, mean loss: 0.3430059551762544
Epoch: 44, step: 892, loss: 0.3481273055076599, mean loss: 0.34300603466453344
Epoch: 44, step: 893, loss: 0.33279240131378174, mean loss: 0.3430058761415884
Epoch: 44, step: 894, loss: 0.3416047990322113, mean loss: 0.3430058543962002
Epoch: 44, step: 895, loss: 0.35110822319984436, mean loss: 0.34300598014689554
Epoch: 44, step: 896, loss: 0.32194891571998596, mean loss: 0.34300565334130795
Epoch: 44, step: 897, loss: 0.3412071168422699, mean loss: 0.34300562542845914
Epoch: 44, step: 898, loss: 0.32304447889328003, mean loss: 0.3430053156411303
Epoch: 44, step: 899, loss: 0.2991170287132263, mean loss: 0.34300463452673885
Epoch: 44, step: 900, loss: 0.3006732761859894, mean loss: 0.34300397758494544
Epoch: 44, step: 901, loss: 0.3634646236896515, mean loss: 0.34300429510948227
Epoch: 44, step: 902, loss: 0.33814385533332825, mean loss: 0.3430042196824928
Epoch: 44, step: 903, loss: 0.3222348690032959, mean loss: 0.3430038973772371
Epoch: 44, step: 904, loss: 0.3251185417175293, mean loss: 0.3430036198310218
Epoch: 44, step: 905, loss: 0.340933233499527, mean loss: 0.3430035877031187
Epoch: 44, step: 906, loss: 0.32780885696411133, mean loss: 0.34300335191752923
Epoch: 44, step: 907, loss: 0.32633528113365173, mean loss: 0.3430030932732678
Epoch: 44, step: 908, loss: 0.3317070007324219, mean loss: 0.34300291799058424
Epoch: 44, step: 909, loss: 0.3566299080848694, mean loss: 0.34300312943877487
Epoch: 44, step: 910, loss: 0.32530781626701355, mean loss: 0.34300285486721727
Epoch: 44, step: 911, loss: 0.38428762555122375, mean loss: 0.3430034954576263
Epoch: 44, step: 912, loss: 0.347351610660553, mean loss: 0.34300356292361034
Epoch: 44, step: 913, loss: 0.37043851613998413, mean loss: 0.3430039886017052
Epoch: 44, step: 914, loss: 0.3178691267967224, mean loss: 0.34300359861765833
Epoch: 44, step: 915, loss: 0.39154142141342163, mean loss: 0.343004351702478
Epoch: 44, step: 916, loss: 0.31447461247444153, mean loss: 0.34300390905839273
Epoch: 44, step: 917, loss: 0.2741960883140564, mean loss: 0.34300284150912125
Epoch: 44, step: 918, loss: 0.3271181583404541, mean loss: 0.34300259506302444
Epoch: 44, step: 919, loss: 0.30950599908828735, mean loss: 0.3430020753814436
Epoch: 44, step: 920, loss: 0.30038002133369446, mean loss: 0.3430014141335722
Epoch: 44, step: 921, loss: 0.35385391116142273, mean loss: 0.3430015824989734
Epoch: 44, step: 922, loss: 0.3341941833496094, mean loss: 0.3430014458632957
Epoch: 44, step: 923, loss: 0.35132601857185364, mean loss: 0.3430015750065273
Epoch: 44, step: 924, loss: 0.3463905155658722, mean loss: 0.34300162758003
Epoch: 44, step: 925, loss: 0.31686729192733765, mean loss: 0.34300122215767803
Epoch: 44, step: 926, loss: 0.3690190017223358, mean loss: 0.3430016257656324
Epoch: 44, step: 927, loss: 0.3051898181438446, mean loss: 0.34300103920867625
Epoch: 44, step: 928, loss: 0.31478142738342285, mean loss: 0.3430006014577754
Epoch: 44, step: 929, loss: 0.3609749376773834, mean loss: 0.34300088027662906
Epoch: 44, step: 930, loss: 0.3418939411640167, mean loss: 0.34300086310599737
Epoch: 44, step: 931, loss: 0.34955182671546936, mean loss: 0.34300096472173863
Epoch: 44, step: 932, loss: 0.36891970038414, mean loss: 0.3430013667558273
Epoch: 44, step: 933, loss: 0.32873299717903137, mean loss: 0.34300114543785654
Epoch: 44, step: 934, loss: 0.306289941072464, mean loss: 0.3430005760158782
Epoch: 44, step: 935, loss: 0.3414572477340698, mean loss: 0.34300055207791624
Epoch: 44, step: 936, loss: 0.3655298948287964, mean loss: 0.34300090151632845
Epoch: 44, step: 937, loss: 0.315399706363678, mean loss: 0.3430004734182555
Epoch: 44, step: 938, loss: 0.4012269377708435, mean loss: 0.34300137650417023
Epoch: 44, step: 939, loss: 0.3197881579399109, mean loss: 0.34300101647534453
Epoch: 44, step: 940, loss: 0.32898202538490295, mean loss: 0.3430007990491136
Epoch: 44, step: 941, loss: 0.323872447013855, mean loss: 0.34300050238432817
Epoch: 44, step: 942, loss: 0.34278401732444763, mean loss: 0.3430004990268775
Epoch: 44, step: 943, loss: 0.3203713893890381, mean loss: 0.3430001480791474
Epoch: 44, step: 944, loss: 0.33171987533569336, mean loss: 0.34299997313966535
Epoch: 44, step: 945, loss: 0.34078463912010193, mean loss: 0.3429999387838138
Epoch: 44, step: 946, loss: 0.3202550709247589, mean loss: 0.3429995860572369
Epoch: 44, step: 947, loss: 0.3446110486984253, mean loss: 0.34299961104735294
Epoch: 44, step: 948, loss: 0.3401355743408203, mean loss: 0.34299956663335424
Epoch: 44, step: 949, loss: 0.3042677342891693, mean loss: 0.34299896600946156
Epoch: 44, step: 950, loss: 0.3242700397968292, mean loss: 0.3429986755799764
Epoch: 44, step: 951, loss: 0.35271239280700684, mean loss: 0.3429988262082673
Epoch: 44, step: 952, loss: 0.33283373713493347, mean loss: 0.3429986685831053
Epoch: 44, step: 953, loss: 0.3688134253025055, mean loss: 0.34299906887395226
Epoch: 44, step: 954, loss: 0.3368556797504425, mean loss: 0.3429989736143172
Epoch: 44, step: 955, loss: 0.30395013093948364, mean loss: 0.3429983681308049
Epoch: 44, step: 956, loss: 0.3223739266395569, mean loss: 0.34299804833731584
Epoch: 44, step: 957, loss: 0.3415376842021942, mean loss: 0.3429980256939051
Epoch: 44, step: 958, loss: 0.3569071590900421, mean loss: 0.3429982413561021
Epoch: 44, step: 959, loss: 0.34510892629623413, mean loss: 0.3429982740819291
Epoch: 44, step: 960, loss: 0.34603753685951233, mean loss: 0.342998321204474
Epoch: 44, step: 961, loss: 0.3154720664024353, mean loss: 0.34299789442760026
Epoch: 44, step: 962, loss: 0.30170977115631104, mean loss: 0.3429972542917335
Epoch: 44, step: 963, loss: 0.33857491612434387, mean loss: 0.3429971857283511
Epoch: 44, step: 964, loss: 0.2973268926143646, mean loss: 0.3429964776727688
Epoch: 44, step: 965, loss: 0.34618911147117615, mean loss: 0.34299652716943246
Epoch: 44, step: 966, loss: 0.3041193187236786, mean loss: 0.3429959244500482
Epoch: 44, step: 967, loss: 0.31411632895469666, mean loss: 0.34299547673214703
Epoch: 44, step: 968, loss: 0.3463013470172882, mean loss: 0.342995527981977
Epoch: 44, step: 969, loss: 0.3877914845943451, mean loss: 0.3429962224283326
Epoch: 44, step: 970, loss: 0.28870531916618347, mean loss: 0.34299538080024167
Epoch: 44, step: 971, loss: 0.34202441573143005, mean loss: 0.34299536574838657
Epoch: 44, step: 972, loss: 0.34669649600982666, mean loss: 0.34299542312224546
Epoch: 44, step: 973, loss: 0.3384503722190857, mean loss: 0.3429953526672632
Epoch: 44, step: 974, loss: 0.31936022639274597, mean loss: 0.34299498629367925
Epoch: 44, step: 975, loss: 0.32365065813064575, mean loss: 0.34299468643740194
Epoch: 44, step: 976, loss: 0.32969504594802856, mean loss: 0.34299448028297586
Epoch: 44, step: 977, loss: 0.37508565187454224, mean loss: 0.3429949777125507
Epoch: 44, step: 978, loss: 0.3731015622615814, mean loss: 0.3429954443727778
Epoch: 44, step: 979, loss: 0.31226933002471924, mean loss: 0.3429949681170529
Epoch: 44, step: 980, loss: 0.33333900570869446, mean loss: 0.342994818451656
Epoch: 44, step: 981, loss: 0.3957771956920624, mean loss: 0.34299563655477827
Epoch: 44, step: 982, loss: 0.373958557844162, mean loss: 0.34299611645870254
Epoch: 44, step: 983, loss: 0.33704376220703125, mean loss: 0.342996024202747
Epoch: 44, step: 984, loss: 0.3312400281429291, mean loss: 0.3429958419985645
Epoch: 44, step: 985, loss: 0.34063413739204407, mean loss: 0.342995805395474
Epoch: 44, step: 986, loss: 0.3041657507419586, mean loss: 0.3429952035937187
Epoch: 44, step: 987, loss: 0.3484998643398285, mean loss: 0.34299528890555225
Epoch: 44, step: 988, loss: 0.36486899852752686, mean loss: 0.34299562790143945
Epoch: 44, step: 989, loss: 0.3487277925014496, mean loss: 0.342995716736399
Epoch: 44, step: 990, loss: 0.32412004470825195, mean loss: 0.3429954242127728
Epoch: 44, step: 991, loss: 0.3535919487476349, mean loss: 0.3429955884286874
Epoch: 44, step: 992, loss: 0.3135279417037964, mean loss: 0.3429951317712663
Epoch: 44, step: 993, loss: 0.2977474629878998, mean loss: 0.3429944305831556
Epoch: 44, step: 994, loss: 0.3281952738761902, mean loss: 0.34299420124908814
Epoch: 44, step: 995, loss: 0.334993451833725, mean loss: 0.34299407726797154
Epoch: 44, step: 996, loss: 0.3013470768928528, mean loss: 0.3429934319082273
Epoch: 44, step: 997, loss: 0.32085537910461426, mean loss: 0.3429930888634322
Epoch: 44, step: 998, loss: 0.3642925024032593, mean loss: 0.3429934189078041
Epoch: 44, step: 999, loss: 0.3310602307319641, mean loss: 0.3429932340003389
Epoch: 44, step: 1000, loss: 0.35979634523391724, mean loss: 0.34299349436433524
Epoch: 44, step: 1001, loss: 0.3590497374534607, mean loss: 0.3429937431517642
Epoch: 44, step: 1002, loss: 0.32076939940452576, mean loss: 0.34299339879651003
Epoch: 44, step: 1003, loss: 0.30882754921913147, mean loss: 0.34299286942171026
Epoch: 44, step: 1004, loss: 0.3115137219429016, mean loss: 0.3429923816829476
Epoch: 44, step: 1005, loss: 0.32995399832725525, mean loss: 0.3429921796690132
Epoch: 44, step: 1006, loss: 0.37551867961883545, mean loss: 0.3429926836198669
Epoch: 44, step: 1007, loss: 0.3830811679363251, mean loss: 0.3429933047230572
Epoch: 44, step: 1008, loss: 0.35694196820259094, mean loss: 0.342993520830633
Epoch: 44, step: 1009, loss: 0.31981948018074036, mean loss: 0.34299316179923445
Epoch: 44, step: 1010, loss: 0.3477195203304291, mean loss: 0.34299323502275425
Epoch: 44, step: 1011, loss: 0.32127729058265686, mean loss: 0.3429928985918123
Epoch: 44, step: 1012, loss: 0.3228985667228699, mean loss: 0.3429925872882775
Epoch: 44, step: 1013, loss: 0.339923620223999, mean loss: 0.3429925397442486
Epoch: 44, step: 1014, loss: 0.3526916801929474, mean loss: 0.3429926899997125
Epoch: 44, step: 1015, loss: 0.36402109265327454, mean loss: 0.34299301575883157
Epoch: 44, step: 1016, loss: 0.3244118094444275, mean loss: 0.34299272791463664
Epoch: 44, step: 1017, loss: 0.3256111741065979, mean loss: 0.3429924586586059
Epoch: 44, step: 1018, loss: 0.3298562169075012, mean loss: 0.34299225516946097
Epoch: 44, step: 1019, loss: 0.366822749376297, mean loss: 0.34299262431398986
Epoch: 44, step: 1020, loss: 0.3627055883407593, mean loss: 0.3429929296714883
Epoch: 44, step: 1021, loss: 0.36710476875305176, mean loss: 0.34299330316259835
Epoch: 44, step: 1022, loss: 0.34216588735580444, mean loss: 0.3429932903461699
Epoch: 44, step: 1023, loss: 0.3521311581134796, mean loss: 0.3429934318868726
Epoch: 44, step: 1024, loss: 0.3486012816429138, mean loss: 0.3429935187481318
Epoch: 44, step: 1025, loss: 0.34604400396347046, mean loss: 0.3429935659970586
Epoch: 44, step: 1026, loss: 0.33494895696640015, mean loss: 0.3429934413961412
Epoch: 44, step: 1027, loss: 0.3299148678779602, mean loss: 0.3429932388285568
Epoch: 44, step: 1028, loss: 0.35111021995544434, mean loss: 0.3429933645465329
Epoch: 44, step: 1029, loss: 0.3404157757759094, mean loss: 0.3429933246247665
Epoch: 44, step: 1030, loss: 0.3584732711315155, mean loss: 0.34299356437489437
Epoch: 44, step: 1031, loss: 0.35934093594551086, mean loss: 0.34299381755559644
Epoch: 44, step: 1032, loss: 0.3389160931110382, mean loss: 0.3429937544026214
Epoch: 44, step: 1033, loss: 0.3705894649028778, mean loss: 0.34299418177927465
Epoch: 44, step: 1034, loss: 0.3539736568927765, mean loss: 0.3429943518165222
Epoch: 44, step: 1035, loss: 0.31232649087905884, mean loss: 0.3429938768759762
Epoch: 44, step: 1036, loss: 0.3356606960296631, mean loss: 0.34299376331177994
Epoch: 44, step: 1037, loss: 0.3024098873138428, mean loss: 0.3429931348254542
Epoch: 44, step: 1038, loss: 0.3318575918674469, mean loss: 0.3429929623818931
Epoch: 44, step: 1039, loss: 0.2967525124549866, mean loss: 0.3429922463194252
Epoch: 44, step: 1040, loss: 0.31897392868995667, mean loss: 0.34299187438642076
Epoch: 44, step: 1041, loss: 0.3447231650352478, mean loss: 0.3429919011957157
Epoch: 44, step: 1042, loss: 0.3325158655643463, mean loss: 0.34299173897524726
Epoch: 44, step: 1043, loss: 0.32851335406303406, mean loss: 0.3429915147822322
Epoch: 44, step: 1044, loss: 0.32076969742774963, mean loss: 0.3429911706900479
Epoch: 44, step: 1045, loss: 0.3447984457015991, mean loss: 0.3429911986742387
Epoch: 44, step: 1046, loss: 0.3128846287727356, mean loss: 0.34299073250558904
Epoch: 44, step: 1047, loss: 0.3336643576622009, mean loss: 0.34299058809869504
Epoch: 44, step: 1048, loss: 0.31455856561660767, mean loss: 0.34299014787228826
Epoch: 44, step: 1049, loss: 0.338664174079895, mean loss: 0.3429900808922339
Epoch: 44, step: 1050, loss: 0.3157497048377991, mean loss: 0.34298965912971113
Epoch: 44, step: 1051, loss: 0.34670010209083557, mean loss: 0.3429897165775801
Epoch: 44, step: 1052, loss: 0.3080551028251648, mean loss: 0.3429891757019859
Epoch: 44, step: 1053, loss: 0.32500049471855164, mean loss: 0.34298889719631964
Epoch: 44, step: 1054, loss: 0.3366745412349701, mean loss: 0.34298879943725163
Epoch: 44, step: 1055, loss: 0.34111014008522034, mean loss: 0.3429887703522357
Epoch: 44, step: 1056, loss: 0.327394962310791, mean loss: 0.3429885289358586
Epoch: 44, step: 1057, loss: 0.3199255168437958, mean loss: 0.3429881718901254
Epoch: 44, step: 1058, loss: 0.3232434093952179, mean loss: 0.3429878662199885
Epoch: 44, step: 1059, loss: 0.30879175662994385, mean loss: 0.3429873368356676
Epoch: 44, step: 1060, loss: 0.352737694978714, mean loss: 0.3429874877770139
Epoch: 44, step: 1061, loss: 0.31530705094337463, mean loss: 0.34298705927401324
Epoch: 44, step: 1062, loss: 0.3626304864883423, mean loss: 0.34298736335654106
Epoch: 44, step: 1063, loss: 0.32019495964050293, mean loss: 0.3429870105329541
Epoch: 44, step: 1064, loss: 0.3127521872520447, mean loss: 0.34298654250887894
Epoch: 44, step: 1065, loss: 0.3383811414241791, mean loss: 0.34298647122004755
Epoch: 44, step: 1066, loss: 0.3115732669830322, mean loss: 0.3429859849701174
Epoch: 44, step: 1067, loss: 0.3034985065460205, mean loss: 0.34298537374668814
Epoch: 44, step: 1068, loss: 0.3191778361797333, mean loss: 0.34298500523747727
Epoch: 44, step: 1069, loss: 0.3033101558685303, mean loss: 0.3429843911327599
Epoch: 44, step: 1070, loss: 0.34480711817741394, mean loss: 0.3429844193452918
Epoch: 44, step: 1071, loss: 0.30528444051742554, mean loss: 0.3429838358265506
Epoch: 44, step: 1072, loss: 0.37689128518104553, mean loss: 0.34298436063655163
Epoch: 44, step: 1073, loss: 0.3559509813785553, mean loss: 0.3429845613271683
Epoch: 44, step: 1074, loss: 0.31102654337882996, mean loss: 0.3429840667052317
Epoch: 44, step: 1075, loss: 0.3539489805698395, mean loss: 0.34298423640921644
Epoch: 44, step: 1076, loss: 0.332981675863266, mean loss: 0.3429840816019711
Epoch: 44, step: 1077, loss: 0.32408952713012695, mean loss: 0.3429837891799809
Epoch: 44, step: 1078, loss: 0.2987169921398163, mean loss: 0.34298310409452026
Epoch: 44, step: 1079, loss: 0.2995336949825287, mean loss: 0.3429824316695928
Epoch: 44, step: 1080, loss: 0.3585246801376343, mean loss: 0.3429826721983773
Epoch: 44, step: 1081, loss: 0.38854122161865234, mean loss: 0.34298337724262845
Epoch: 44, step: 1082, loss: 0.28560879826545715, mean loss: 0.3429824893523953
Epoch: 44, step: 1083, loss: 0.3091687262058258, mean loss: 0.3429819660815326
Epoch: 44, step: 1084, loss: 0.334973007440567, mean loss: 0.3429818421441339
Epoch: 44, step: 1085, loss: 0.35412728786468506, mean loss: 0.34298201461551703
Epoch: 44, step: 1086, loss: 0.3409339189529419, mean loss: 0.3429819829225337
Epoch: 44, step: 1087, loss: 0.32176509499549866, mean loss: 0.34298165460970986
Epoch: 44, step: 1088, loss: 0.3477659523487091, mean loss: 0.34298172864139637
Epoch: 44, step: 1089, loss: 0.3119370639324188, mean loss: 0.3429812482671707
Epoch: 44, step: 1090, loss: 0.34263548254966736, mean loss: 0.34298124291699633
Epoch: 44, step: 1091, loss: 0.3472810685634613, mean loss: 0.34298130944892746
Epoch: 44, step: 1092, loss: 0.31233933568000793, mean loss: 0.34298083532780893
Epoch: 44, step: 1093, loss: 0.31317687034606934, mean loss: 0.3429803741802771
Epoch: 44, step: 1094, loss: 0.3003983199596405, mean loss: 0.3429797153315169
Epoch: 44, step: 1095, loss: 0.30234643816947937, mean loss: 0.34297908664484217
Epoch: 44, step: 1096, loss: 0.3361716866493225, mean loss: 0.3429789813209365
Epoch: 44, step: 1097, loss: 0.31263506412506104, mean loss: 0.34297851184794714
Epoch: 44, step: 1098, loss: 0.3050589859485626, mean loss: 0.3429779251762383
Epoch: 44, step: 1099, loss: 0.3008727729320526, mean loss: 0.342977273756716
Epoch: 44, step: 1100, loss: 0.37157583236694336, mean loss: 0.34297771620544676
Epoch: 44, step: 1101, loss: 0.3168386220932007, mean loss: 0.34297731181338464
Epoch: 44, step: 1102, loss: 0.30474451184272766, mean loss: 0.3429767203314624
Epoch: 44, step: 1103, loss: 0.3020828068256378, mean loss: 0.3429760876904738
Epoch: 44, step: 1104, loss: 0.3400118350982666, mean loss: 0.34297604183331515
Epoch: 44, step: 1105, loss: 0.3803516924381256, mean loss: 0.342976620027842
Epoch: 44, step: 1106, loss: 0.30600136518478394, mean loss: 0.3429760480362135
Epoch: 44, step: 1107, loss: 0.3074745833873749, mean loss: 0.3429754988519946
Epoch: 44, step: 1108, loss: 0.34837862849235535, mean loss: 0.34297558243354986
Epoch: 44, step: 1109, loss: 0.3029385805130005, mean loss: 0.342974963106725
Epoch: 44, step: 1110, loss: 0.33495083451271057, mean loss: 0.3429748389845137
Epoch: 44, step: 1111, loss: 0.29921311140060425, mean loss: 0.34297416206136705
Epoch: 44, step: 1112, loss: 0.3196635842323303, mean loss: 0.3429738014900074
Epoch: 44, step: 1113, loss: 0.35906872153282166, mean loss: 0.3429740504446871
Epoch: 44, step: 1114, loss: 0.367825984954834, mean loss: 0.34297443484608087
Epoch: 44, step: 1115, loss: 0.3380894362926483, mean loss: 0.3429743592877292
Epoch: 44, step: 1116, loss: 0.3234575092792511, mean loss: 0.34297405741697284
Epoch: 44, step: 1117, loss: 0.28477340936660767, mean loss: 0.34297315723062627
Epoch: 44, step: 1118, loss: 0.3486756980419159, mean loss: 0.34297324543015933
Epoch: 44, step: 1119, loss: 0.3022474944591522, mean loss: 0.34297261554660685
Epoch: 44, step: 1120, loss: 0.32787537574768066, mean loss: 0.3429723820492315
Epoch: 44, step: 1121, loss: 0.32688695192337036, mean loss: 0.3429721332721254
Epoch: 44, step: 1122, loss: 0.34976089000701904, mean loss: 0.3429722382653473
Epoch: 44, step: 1123, loss: 0.35145482420921326, mean loss: 0.34297236945288123
Epoch: 44, step: 1124, loss: 0.3105643391609192, mean loss: 0.3429718682538541
Epoch: 44, step: 1125, loss: 0.31772810220718384, mean loss: 0.34297147785816506
Epoch: 44, step: 1126, loss: 0.35521015524864197, mean loss: 0.34297166712679455
Epoch: 44, step: 1127, loss: 0.33720308542251587, mean loss: 0.3429715779182441
Epoch: 44, step: 1128, loss: 0.294904500246048, mean loss: 0.34297083459376143
Epoch: 44, step: 1129, loss: 0.320024698972702, mean loss: 0.3429704797529545
Epoch: 44, step: 1130, loss: 0.2861289381980896, mean loss: 0.3429696007645748
Epoch: 44, step: 1131, loss: 0.34883958101272583, mean loss: 0.34296969153559365
Epoch: 44, step: 1132, loss: 0.32374465465545654, mean loss: 0.3429693942519356
Epoch: 44, step: 1133, loss: 0.3319675624370575, mean loss: 0.342969224129285
Epoch: 44, step: 1134, loss: 0.30264660716056824, mean loss: 0.34296860062544293
Epoch: 44, step: 1135, loss: 0.3441656529903412, mean loss: 0.3429686191350354
Epoch: 44, step: 1136, loss: 0.34863215684890747, mean loss: 0.3429687067069389
Epoch: 44, step: 1137, loss: 0.3358873128890991, mean loss: 0.3429685972132657
Epoch: 44, step: 1138, loss: 0.30831611156463623, mean loss: 0.3429680614191312
Epoch: 44, step: 1139, loss: 0.33785268664360046, mean loss: 0.34296798232681297
Epoch: 44, step: 1140, loss: 0.32730674743652344, mean loss: 0.3429677401814616
Epoch: 44, step: 1141, loss: 0.3542253375053406, mean loss: 0.3429679142375135
Epoch: 44, step: 1142, loss: 0.3148353695869446, mean loss: 0.3429674792811188
Epoch: 44, step: 1143, loss: 0.31438207626342773, mean loss: 0.34296703732992806
Epoch: 44, step: 1144, loss: 0.33270785212516785, mean loss: 0.34296687871789044
Epoch: 44, step: 1145, loss: 0.3374902606010437, mean loss: 0.3429667940479959
Epoch: 44, step: 1146, loss: 0.3523555099964142, mean loss: 0.34296693919766347
Epoch: 44, step: 1147, loss: 0.3362658619880676, mean loss: 0.3429668356005265
Epoch: 44, step: 1148, loss: 0.3060437738895416, mean loss: 0.3429662647871739
Epoch: 44, step: 1149, loss: 0.3260366916656494, mean loss: 0.3429660030678974
Epoch: 44, step: 1150, loss: 0.3089951276779175, mean loss: 0.342965477910209
Epoch: 44, step: 1151, loss: 0.31636956334114075, mean loss: 0.34296506676881383
Epoch: 44, step: 1152, loss: 0.36810606718063354, mean loss: 0.34296545541294826
Epoch: 44, step: 1153, loss: 0.4391334652900696, mean loss: 0.34296694201072037
Epoch: 44, step: 1154, loss: 0.3558034896850586, mean loss: 0.3429671404393685
Epoch: 44, step: 1155, loss: 0.3192809820175171, mean loss: 0.3429667743020034
Epoch: 44, step: 1156, loss: 0.31785935163497925, mean loss: 0.3429663862009312
Epoch: 44, step: 1157, loss: 0.33416879177093506, mean loss: 0.34296625021313587
Epoch: 44, step: 1158, loss: 0.3244590759277344, mean loss: 0.3429659641450582
Epoch: 44, step: 1159, loss: 0.31815603375434875, mean loss: 0.34296558066029265
Epoch: 44, step: 1160, loss: 0.28992384672164917, mean loss: 0.34296476081186167
Epoch: 44, step: 1161, loss: 0.36589592695236206, mean loss: 0.3429651152457876
Epoch: 44, step: 1162, loss: 0.3165781497955322, mean loss: 0.3429647074038511
Epoch: 44, step: 1163, loss: 0.3140197694301605, mean loss: 0.3429642600323214
Epoch: 44, step: 1164, loss: 0.29336225986480713, mean loss: 0.3429634933981091
Epoch: 44, step: 1165, loss: 0.32115983963012695, mean loss: 0.3429631564123317
Epoch: 44, step: 1166, loss: 0.374333918094635, mean loss: 0.3429636412547916
Epoch: 44, step: 1167, loss: 0.32372426986694336, mean loss: 0.34296334391040195
Epoch: 44, step: 1168, loss: 0.3420908451080322, mean loss: 0.3429633304261457
Epoch: 44, step: 1169, loss: 0.34251782298088074, mean loss: 0.34296332354104314
Epoch: 44, step: 1170, loss: 0.35792234539985657, mean loss: 0.3429635547219333
Epoch: 44, step: 1171, loss: 0.35262158513069153, mean loss: 0.3429637039775185
Epoch: 44, step: 1172, loss: 0.33107802271842957, mean loss: 0.34296352029856725
Epoch: 44, step: 1173, loss: 0.32547661662101746, mean loss: 0.3429632500636163
Epoch: 44, step: 1174, loss: 0.3083246350288391, mean loss: 0.34296271478190166
Epoch: 44, step: 1175, loss: 0.37335872650146484, mean loss: 0.3429631844940373
Epoch: 44, step: 1176, loss: 0.31939151883125305, mean loss: 0.3429628202447263
Epoch: 44, step: 1177, loss: 0.3126777112483978, mean loss: 0.34296235226084343
Epoch: 44, step: 1178, loss: 0.30959832668304443, mean loss: 0.34296183670763974
Epoch: 44, step: 1179, loss: 0.32536059617996216, mean loss: 0.3429615647309952
Epoch: 44, step: 1180, loss: 0.3086666464805603, mean loss: 0.3429610348096724
Epoch: 44, step: 1181, loss: 0.3135718107223511, mean loss: 0.34296058069761565
Epoch: 44, step: 1182, loss: 0.3269737660884857, mean loss: 0.34296033367874007
Epoch: 44, step: 1183, loss: 0.32715606689453125, mean loss: 0.3429600894842595
Epoch: 44, step: 1184, loss: 0.2939385771751404, mean loss: 0.342959332056032
Epoch: 44, step: 1185, loss: 0.30639177560806274, mean loss: 0.34295876706180367
Epoch: 44, step: 1186, loss: 0.28383731842041016, mean loss: 0.34295785360833825
Epoch: 44, step: 1187, loss: 0.3169795274734497, mean loss: 0.3429574522375
Epoch: 44, step: 1188, loss: 0.336600124835968, mean loss: 0.34295735401691446
Epoch: 44, step: 1189, loss: 0.3047011196613312, mean loss: 0.3429567629679642
Epoch: 44, step: 1190, loss: 0.35020285844802856, mean loss: 0.3429568749165402
Epoch: 44, step: 1191, loss: 0.3169425427913666, mean loss: 0.3429564730142394
Epoch: 44, step: 1192, loss: 0.3378477096557617, mean loss: 0.3429563940888218
Epoch: 44, step: 1193, loss: 0.3209571838378906, mean loss: 0.3429560542277025
Epoch: 44, step: 1194, loss: 0.3233925402164459, mean loss: 0.3429557519998053
Epoch: 44, step: 1195, loss: 0.303219199180603, mean loss: 0.34295513813722084
Epoch: 44, step: 1196, loss: 0.37057071924209595, mean loss: 0.34295556474468697
Epoch: 44, step: 1197, loss: 0.32861173152923584, mean loss: 0.34295534316355164
Epoch: 44, step: 1198, loss: 0.32870253920555115, mean loss: 0.3429551229920222
Epoch: 44, step: 1199, loss: 0.32180190086364746, mean loss: 0.34295479623068187
Epoch: 44, step: 1200, loss: 0.3379852771759033, mean loss: 0.34295471946594064
Epoch: 44, step: 1201, loss: 0.3323865532875061, mean loss: 0.34295455622076504
Epoch: 44, step: 1202, loss: 0.2806580662727356, mean loss: 0.3429535939493375
Epoch: 44, step: 1203, loss: 0.3268378674983978, mean loss: 0.34295334501936453
Epoch: 44, step: 1204, loss: 0.306863009929657, mean loss: 0.3429527875621876
Epoch: 44, step: 1205, loss: 0.2995307147502899, mean loss: 0.3429521168681588
Epoch: 44, step: 1206, loss: 0.3493807315826416, mean loss: 0.34295221616251825
Epoch: 44, step: 1207, loss: 0.3696226477622986, mean loss: 0.34295262809924754
Epoch: 44, step: 1208, loss: 0.33680784702301025, mean loss: 0.34295253319182495
Epoch: 44, step: 1209, loss: 0.36891916394233704, mean loss: 0.3429529342456468
Epoch: 44, step: 1210, loss: 0.3183842897415161, mean loss: 0.3429525547895407
Epoch: 44, step: 1211, loss: 0.5145537257194519, mean loss: 0.3429552050825371
Epoch: 44, step: 1212, loss: 0.33824679255485535, mean loss: 0.3429551323646182
Epoch: 44, step: 1213, loss: 0.3173637092113495, mean loss: 0.3429547371302838
Epoch: 44, step: 1214, loss: 0.3145027458667755, mean loss: 0.3429542977240775
Epoch: 44, step: 1215, loss: 0.3036046624183655, mean loss: 0.3429536900264727
Epoch: 44, step: 1216, loss: 0.3484925925731659, mean loss: 0.34295377556540596
Epoch: 44, step: 1217, loss: 0.3416156768798828, mean loss: 0.3429537549010658
Epoch: 44, step: 1218, loss: 0.3263150155544281, mean loss: 0.34295349795195995
Epoch: 44, step: 1219, loss: 0.3530025780200958, mean loss: 0.34295365313572773
Epoch: 44, step: 1220, loss: 0.3183613419532776, mean loss: 0.3429532733727495
Epoch: 44, step: 1221, loss: 0.3289954364299774, mean loss: 0.34295305783433044
Epoch: 44, step: 1222, loss: 0.36839038133621216, mean loss: 0.3429534506341498
Epoch: 44, step: 1223, loss: 0.32666176557540894, mean loss: 0.34295319906396665
Epoch: 44, step: 1224, loss: 0.31955021619796753, mean loss: 0.34295283768932966
Epoch: 44, step: 1225, loss: 0.32920292019844055, mean loss: 0.3429526253747395
Epoch: 44, step: 1226, loss: 0.3321773409843445, mean loss: 0.34295245899448545
Epoch: 44, step: 1227, loss: 0.3160088360309601, mean loss: 0.3429520429667082
Epoch: 44, step: 1228, loss: 0.34599295258522034, mean loss: 0.3429520899196862
Epoch: 44, step: 1229, loss: 0.3240869641304016, mean loss: 0.342951798638369
Epoch: 44, step: 1230, loss: 0.3182852566242218, mean loss: 0.34295141778790483
Epoch: 44, step: 1231, loss: 0.3194984495639801, mean loss: 0.34295105568056444
Epoch: 44, step: 1232, loss: 0.35462722182273865, mean loss: 0.34295123595455573
Epoch: 44, step: 1233, loss: 0.3423204720020294, mean loss: 0.3429512262160355
Epoch: 44, step: 1234, loss: 0.3629903793334961, mean loss: 0.3429515356006848
Epoch: 44, step: 1235, loss: 0.3460719883441925, mean loss: 0.3429515837766365
Epoch: 44, step: 1236, loss: 0.3321448564529419, mean loss: 0.34295141693663644
Epoch: 44, step: 1237, loss: 0.31266075372695923, mean loss: 0.34295094930049835
Epoch: 44, step: 1238, loss: 0.31964629888534546, mean loss: 0.342950589522028
Epoch: 44, step: 1239, loss: 0.33621567487716675, mean loss: 0.34295048554965174
Epoch: 44, step: 1240, loss: 0.32770389318466187, mean loss: 0.34295025017919056
Epoch: 44, step: 1241, loss: 0.31132057309150696, mean loss: 0.3429497619011164
Epoch: 44, step: 1242, loss: 0.3298942744731903, mean loss: 0.34294956036223145
Epoch: 44, step: 1243, loss: 0.3300186097621918, mean loss: 0.34294936074891563
Epoch: 44, step: 1244, loss: 0.2939414083957672, mean loss: 0.3429486042315363
Epoch: 44, step: 1245, loss: 0.3221544027328491, mean loss: 0.34294828324420185
Epoch: 44, step: 1246, loss: 0.30532318353652954, mean loss: 0.3429477024575802
Epoch: 44, step: 1247, loss: 0.3322931230068207, mean loss: 0.34294753799444966
Epoch: 44, step: 1248, loss: 0.3047335147857666, mean loss: 0.34294694813532783
Epoch: 44, step: 1249, loss: 0.3570924401283264, mean loss: 0.34294716647712997
Epoch: 44, step: 1250, loss: 0.36143258213996887, mean loss: 0.3429474518031315
Epoch: 44, step: 1251, loss: 0.2906447649002075, mean loss: 0.34294664451340345
Epoch: 44, step: 1252, loss: 0.35093823075294495, mean loss: 0.3429467678612903
Epoch: 44, step: 1253, loss: 0.3373555839061737, mean loss: 0.34294668156426983
Epoch: 44, step: 1254, loss: 0.34803304076194763, mean loss: 0.34294676006837066
Epoch: 44, step: 1255, loss: 0.35319089889526367, mean loss: 0.34294691817645234
Epoch: 44, step: 1256, loss: 0.3225870430469513, mean loss: 0.34294660394690396
Epoch: 44, step: 1257, loss: 0.3781713843345642, mean loss: 0.34294714758953115
Epoch: 44, step: 1258, loss: 0.33101025223731995, mean loss: 0.3429469633639682
Epoch: 44, step: 1259, loss: 0.338286429643631, mean loss: 0.3429468914377116
Epoch: 44, step: 1260, loss: 0.3246506154537201, mean loss: 0.34294660907470126
Epoch: 44, step: 1261, loss: 0.3028647303581238, mean loss: 0.34294599050809865
Epoch: 44, step: 1262, loss: 0.3356601595878601, mean loss: 0.34294587807070115
Epoch: 44, step: 1263, loss: 0.3216642439365387, mean loss: 0.3429455496504213
Epoch: 44, step: 1264, loss: 0.3094540238380432, mean loss: 0.342945032813863
Epoch: 44, step: 1265, loss: 0.3060457408428192, mean loss: 0.3429444633979195
Epoch: 44, step: 1266, loss: 0.323331743478775, mean loss: 0.3429441607465003
Epoch: 44, step: 1267, loss: 0.33462026715278625, mean loss: 0.3429440322992811
Epoch: 44, step: 1268, loss: 0.32264259457588196, mean loss: 0.34294371902966114
Epoch: 44, step: 1269, loss: 0.3534272015094757, mean loss: 0.34294388079681976
Epoch: 44, step: 1270, loss: 0.3948557376861572, mean loss: 0.3429446818191922
Epoch: 44, step: 1271, loss: 0.3052482604980469, mean loss: 0.3429441001561055
Epoch: 44, step: 1272, loss: 0.32630041241645813, mean loss: 0.3429438433447407
Epoch: 44, step: 1273, loss: 0.32311779260635376, mean loss: 0.342943537434376
Epoch: 44, step: 1274, loss: 0.3281935751438141, mean loss: 0.34294330985013427
Epoch: 44, step: 1275, loss: 0.34394559264183044, mean loss: 0.34294332531459754
Epoch: 44, step: 1276, loss: 0.3247121572494507, mean loss: 0.34294304402584275
Epoch: 44, step: 1277, loss: 0.3338862955570221, mean loss: 0.3429429042913954
Epoch: 44, step: 1278, loss: 0.32793551683425903, mean loss: 0.3429426727495076
Epoch: 44, step: 1279, loss: 0.3178498446941376, mean loss: 0.34294228561009676
Epoch: 44, step: 1280, loss: 0.38361871242523193, mean loss: 0.34294291316809566
Epoch: 44, step: 1281, loss: 0.3094954788684845, mean loss: 0.3429423971473252
Epoch: 44, step: 1282, loss: 0.3311898708343506, mean loss: 0.34294221583434115
Epoch: 44, step: 1283, loss: 0.3058869242668152, mean loss: 0.34294164416986156
Epoch: 44, step: 1284, loss: 0.34685876965522766, mean loss: 0.34294170459974516
Epoch: 44, step: 1285, loss: 0.3739653527736664, mean loss: 0.34294218319726105
Epoch: 44, step: 1286, loss: 0.34128475189208984, mean loss: 0.34294215762869273
Epoch: 44, step: 1287, loss: 0.2945522964000702, mean loss: 0.3429414111480493
Epoch: 44, step: 1288, loss: 0.33389952778816223, mean loss: 0.3429412716666246
Epoch: 44, step: 1289, loss: 0.3527807891368866, mean loss: 0.3429414234501292
Epoch: 44, step: 1290, loss: 0.32542017102241516, mean loss: 0.3429411531730467
Epoch: 44, step: 1291, loss: 0.3165416717529297, mean loss: 0.3429407459496028
Epoch: 44, step: 1292, loss: 0.3352784514427185, mean loss: 0.3429406277572119
Epoch: 44, step: 1293, loss: 0.35015225410461426, mean loss: 0.3429407389962424
Epoch: 44, step: 1294, loss: 0.3137059509754181, mean loss: 0.342940288057833
Epoch: 44, step: 1295, loss: 0.3097011148929596, mean loss: 0.34293977536081355
Epoch: 44, step: 1296, loss: 0.31517350673675537, mean loss: 0.34293934708711615
Epoch: 44, step: 1297, loss: 0.3369908928871155, mean loss: 0.34293925533812336
Epoch: 44, step: 1298, loss: 0.3352935314178467, mean loss: 0.34293913741225124
Epoch: 44, step: 1299, loss: 0.3065918982028961, mean loss: 0.3429385768095119
Epoch: 44, step: 1300, loss: 0.3324286639690399, mean loss: 0.34293841471205455
Epoch: 44, step: 1301, loss: 0.34504014253616333, mean loss: 0.3429384471271171
Epoch: 44, step: 1302, loss: 0.2981241047382355, mean loss: 0.34293775596373716
Epoch: 44, step: 1303, loss: 0.3422650694847107, mean loss: 0.342937745589177
Epoch: 44, step: 1304, loss: 0.34854856133461, mean loss: 0.34293783212108964
Epoch: 44, step: 1305, loss: 0.3210156261920929, mean loss: 0.34293749403457274
Epoch: 44, step: 1306, loss: 0.32779979705810547, mean loss: 0.34293726058305174
Epoch: 44, step: 1307, loss: 0.33199062943458557, mean loss: 0.3429370917681861
Epoch: 44, step: 1308, loss: 0.2942122220993042, mean loss: 0.3429363403629942
Epoch: 44, step: 1309, loss: 0.36885079741477966, mean loss: 0.34293673999376634
Epoch: 44, step: 1310, loss: 0.32177025079727173, mean loss: 0.3429364135871601
Epoch: 44, step: 1311, loss: 0.3419407308101654, mean loss: 0.34293639823305855
Epoch: 44, step: 1312, loss: 0.27402979135513306, mean loss: 0.34293533566298223
Epoch: 44, step: 1313, loss: 0.34089601039886475, mean loss: 0.34293530421617785
Epoch: 44, step: 1314, loss: 0.29210683703422546, mean loss: 0.3429345204431106
Epoch: 44, step: 1315, loss: 0.31295162439346313, mean loss: 0.34293405811510147
Epoch: 44, step: 1316, loss: 0.33521121740341187, mean loss: 0.34293393903285835
Epoch: 44, step: 1317, loss: 0.3280789852142334, mean loss: 0.3429337099806207
Epoch: 44, step: 1318, loss: 0.32165858149528503, mean loss: 0.34293338193916695
Epoch: 44, step: 1319, loss: 0.3579763174057007, mean loss: 0.3429336138827877
Epoch: 44, step: 1320, loss: 0.3383953273296356, mean loss: 0.34293354390905234
Epoch: 44, step: 1321, loss: 0.2940704822540283, mean loss: 0.3429327905237852
Epoch: 44, step: 1322, loss: 0.3116694688796997, mean loss: 0.3429323085039939
Epoch: 44, step: 1323, loss: 0.2976300120353699, mean loss: 0.3429316100412053
Epoch: 44, step: 1324, loss: 0.3312017321586609, mean loss: 0.3429314291948125
Epoch: 44, step: 1325, loss: 0.34920161962509155, mean loss: 0.34293152586451786
Epoch: 44, step: 1326, loss: 0.329269140958786, mean loss: 0.3429313152300282
Epoch: 44, step: 1327, loss: 0.3173222243785858, mean loss: 0.3429309204179467
Epoch: 44, step: 1328, loss: 0.3210495710372925, mean loss: 0.34293058308117985
Epoch: 44, step: 1329, loss: 0.36541086435317993, mean loss: 0.34293092964611793
Epoch: 44, step: 1330, loss: 0.36108410358428955, mean loss: 0.34293120949833766
Epoch: 44, step: 1331, loss: 0.3080413341522217, mean loss: 0.34293067163875596
Epoch: 44, step: 1332, loss: 0.307102769613266, mean loss: 0.34293011932714296
Epoch: 44, step: 1333, loss: 0.35865336656570435, mean loss: 0.34293036170801605
Epoch: 44, step: 1334, loss: 0.3342835009098053, mean loss: 0.3429302284148527
Epoch: 44, step: 1335, loss: 0.3660266399383545, mean loss: 0.342930584445367
Epoch: 44, step: 1336, loss: 0.3267357349395752, mean loss: 0.3429303348060794
Epoch: 44, step: 1337, loss: 0.3164803385734558, mean loss: 0.34292992709272374
Epoch: 44, step: 1338, loss: 0.33884117007255554, mean loss: 0.34292986406756737
Epoch: 44, step: 1339, loss: 0.3425638675689697, mean loss: 0.3429298584260898
Epoch: 44, step: 1340, loss: 0.32338759303092957, mean loss: 0.3429295572058516
Epoch: 44, step: 1341, loss: 0.3380756974220276, mean loss: 0.34292948239066334
Epoch: 44, step: 1342, loss: 0.3170246183872223, mean loss: 0.34292908311101966
Epoch: 44, step: 1343, loss: 0.33194831013679504, mean loss: 0.34292891386359403
Epoch: 44, step: 1344, loss: 0.326999694108963, mean loss: 0.3429286683491945
Epoch: 44, step: 1345, loss: 0.3002408742904663, mean loss: 0.3429280104195059
Epoch: 44, step: 1346, loss: 0.3084724247455597, mean loss: 0.3429274793776972
Epoch: 44, step: 1347, loss: 0.33055976033210754, mean loss: 0.342927288764926
Epoch: 44, step: 1348, loss: 0.33063551783561707, mean loss: 0.34292709932559595
Epoch: 44, step: 1349, loss: 0.3384900987148285, mean loss: 0.34292703094411753
Epoch: 44, step: 1350, loss: 0.31298723816871643, mean loss: 0.3429265695297699
Epoch: 44, step: 1351, loss: 0.3496505618095398, mean loss: 0.3429266731543581
Epoch: 44, step: 1352, loss: 0.3496614396572113, mean loss: 0.3429267769433902
Epoch: 44, step: 1353, loss: 0.309382826089859, mean loss: 0.34292626000779375
Epoch: 44, step: 1354, loss: 0.31595584750175476, mean loss: 0.34292584438139706
Epoch: 44, step: 1355, loss: 0.2987264394760132, mean loss: 0.34292516325884104
Epoch: 44, step: 1356, loss: 0.28708910942077637, mean loss: 0.34292430282622366
Epoch: 44, step: 1357, loss: 0.42047810554504395, mean loss: 0.3429254979105569
Epoch: 44, step: 1358, loss: 0.33292680978775024, mean loss: 0.3429253438356956
Epoch: 44, step: 1359, loss: 0.31356164813041687, mean loss: 0.3429248913625739
Epoch: 44, step: 1360, loss: 0.3190920948982239, mean loss: 0.34292452412223207
Epoch: 44, step: 1361, loss: 0.38605162501335144, mean loss: 0.3429251886589033
Epoch: 44, step: 1362, loss: 0.3155977129936218, mean loss: 0.3429247675819119
Epoch: 44, step: 1363, loss: 0.3591269552707672, mean loss: 0.3429250172304125
Epoch: 44, step: 1364, loss: 0.32673829793930054, mean loss: 0.34292476782409687
Epoch: 44, step: 1365, loss: 0.33483707904815674, mean loss: 0.34292464321023636
Epoch: 44, step: 1366, loss: 0.33444637060165405, mean loss: 0.34292451258033313
Epoch: 44, step: 1367, loss: 0.3725500702857971, mean loss: 0.3429249690322884
Epoch: 44, step: 1368, loss: 0.32203906774520874, mean loss: 0.34292464724041893
Epoch: 44, step: 1369, loss: 0.2984928786754608, mean loss: 0.34292396268477593
Epoch: 44, step: 1370, loss: 0.3220674991607666, mean loss: 0.3429236413563595
Epoch: 44, step: 1371, loss: 0.34817591309547424, mean loss: 0.3429237222750712
Epoch: 44, step: 1372, loss: 0.3247939348220825, mean loss: 0.34292344296422905
Epoch: 44, step: 1373, loss: 0.31022411584854126, mean loss: 0.34292293920013855
Epoch: 44, step: 1374, loss: 0.34545379877090454, mean loss: 0.34292297818982553
Epoch: 44, step: 1375, loss: 0.31772804260253906, mean loss: 0.3429225900499502
Epoch: 44, step: 1376, loss: 0.31828537583351135, mean loss: 0.34292221050788285
Epoch: 44, step: 1377, loss: 0.36186957359313965, mean loss: 0.34292250239196154
Epoch: 44, step: 1378, loss: 0.2872510552406311, mean loss: 0.34292164478667536
Epoch: 44, step: 1379, loss: 0.33623063564300537, mean loss: 0.34292154171487266
Epoch: 44, step: 1380, loss: 0.393331378698349, mean loss: 0.34292231824239217
Epoch: 44, step: 1381, loss: 0.35555127263069153, mean loss: 0.3429225127794141
Epoch: 44, step: 1382, loss: 0.37154093384742737, mean loss: 0.3429229536121606
Epoch: 44, step: 1383, loss: 0.3065347671508789, mean loss: 0.3429223931040512
Epoch: 44, step: 1384, loss: 0.3334944248199463, mean loss: 0.3429222478818845
Epoch: 44, step: 1385, loss: 0.3490822911262512, mean loss: 0.3429223427656411
Epoch: 44, step: 1386, loss: 0.3049613833427429, mean loss: 0.34292175805822733
Epoch: 44, step: 1387, loss: 0.31388187408447266, mean loss: 0.34292131076779586
Epoch: 44, step: 1388, loss: 0.3795580267906189, mean loss: 0.342921875060688
Epoch: 44, step: 1389, loss: 0.33487099409103394, mean loss: 0.34292175105981054
Epoch: 44, step: 1390, loss: 0.3357870578765869, mean loss: 0.34292164117188745
Epoch: 44, step: 1391, loss: 0.3580664098262787, mean loss: 0.34292187442670286
Epoch: 44, step: 1392, loss: 0.34875422716140747, mean loss: 0.3429219642533248
Epoch: 44, step: 1393, loss: 0.3508552610874176, mean loss: 0.3429220864356262
Epoch: 44, step: 1394, loss: 0.35134920477867126, mean loss: 0.3429222162213733
Epoch: 44, step: 1395, loss: 0.3242758810520172, mean loss: 0.3429219290542574
Epoch: 44, step: 1396, loss: 0.32173213362693787, mean loss: 0.3429216027210304
Epoch: 44, step: 1397, loss: 0.38055968284606934, mean loss: 0.34292218235697036
Epoch: 44, step: 1398, loss: 0.3433305621147156, mean loss: 0.3429221886460249
Epoch: 44, step: 1399, loss: 0.3360580801963806, mean loss: 0.34292208294027693
Epoch: 44, step: 1400, loss: 0.33062130212783813, mean loss: 0.34292189351389735
Epoch: 44, step: 1401, loss: 0.3529793918132782, mean loss: 0.34292204839237067
Epoch: 44, step: 1402, loss: 0.3224685490131378, mean loss: 0.3429217334275671
Epoch: 44, step: 1403, loss: 0.32239529490470886, mean loss: 0.34292141734443615
Epoch: 44, step: 1404, loss: 0.31949758529663086, mean loss: 0.3429210566503901
Epoch: 44, step: 1405, loss: 0.30324670672416687, mean loss: 0.34292044573064745
Epoch: 44, step: 1406, loss: 0.3351830244064331, mean loss: 0.3429203265889182
Epoch: 44, step: 1407, loss: 0.3040980398654938, mean loss: 0.3429197288079573
Epoch: 44, step: 1408, loss: 0.3678382933139801, mean loss: 0.34292011249514653
Epoch: 44, step: 1409, loss: 0.3134101331233978, mean loss: 0.3429196581179813
Epoch: 44, step: 1410, loss: 0.27774864435195923, mean loss: 0.3429186546688033
Epoch: 44, step: 1411, loss: 0.3153817057609558, mean loss: 0.3429182306842478
Epoch: 44, step: 1412, loss: 0.36448195576667786, mean loss: 0.3429185626943647
Epoch: 44, step: 1413, loss: 0.34533730149269104, mean loss: 0.342918599934377
Epoch: 44, step: 1414, loss: 0.36758139729499817, mean loss: 0.34291897964827456
Epoch: 44, step: 1415, loss: 0.3410463035106659, mean loss: 0.34291895081658136
Epoch: 44, step: 1416, loss: 0.3287632465362549, mean loss: 0.3429187328789298
Epoch: 44, step: 1417, loss: 0.32931023836135864, mean loss: 0.3429185233692073
Epoch: 44, step: 1418, loss: 0.3092564642429352, mean loss: 0.3429180051325954
Epoch: 44, step: 1419, loss: 0.2977599799633026, mean loss: 0.34291730992314334
Epoch: 44, step: 1420, loss: 0.3221888840198517, mean loss: 0.3429169908131798
Epoch: 44, step: 1421, loss: 0.3083898425102234, mean loss: 0.34291645928283243
Epoch: 44, step: 1422, loss: 0.33004504442214966, mean loss: 0.3429162611360805
Epoch: 44, step: 1423, loss: 0.2997286915779114, mean loss: 0.34291559630280527
Epoch: 44, step: 1424, loss: 0.3264249265193939, mean loss: 0.34291534244788024
Epoch: 44, step: 1425, loss: 0.310588538646698, mean loss: 0.34291484482151713
Epoch: 44, step: 1426, loss: 0.3194258213043213, mean loss: 0.3429144832461047
Epoch: 44, step: 1427, loss: 0.3128524124622345, mean loss: 0.3429140204964159
Epoch: 44, step: 1428, loss: 0.3720296025276184, mean loss: 0.34291446866977127
Epoch: 44, step: 1429, loss: 0.29951614141464233, mean loss: 0.34291380065377436
Epoch: 44, step: 1430, loss: 0.34205034375190735, mean loss: 0.34291378736307443
Epoch: 44, step: 1431, loss: 0.3136143088340759, mean loss: 0.3429133363798438
Epoch: 44, step: 1432, loss: 0.34574830532073975, mean loss: 0.34291338001556143
Epoch: 44, step: 1433, loss: 0.35883405804634094, mean loss: 0.34291362506216805
Epoch: 44, step: 1434, loss: 0.3150143325328827, mean loss: 0.3429131956506994
Epoch: 44, step: 1435, loss: 0.3154398798942566, mean loss: 0.342912772802153
Epoch: 44, step: 1436, loss: 0.3633788824081421, mean loss: 0.34291308779622137
Epoch: 44, step: 1437, loss: 0.35900694131851196, mean loss: 0.3429133354930466
Epoch: 44, step: 1438, loss: 0.32413798570632935, mean loss: 0.3429130465303719
Epoch: 44, step: 1439, loss: 0.34551116824150085, mean loss: 0.3429130865162392
Epoch: 44, step: 1440, loss: 0.347504198551178, mean loss: 0.34291315717373394
Epoch: 44, step: 1441, loss: 0.35053175687789917, mean loss: 0.3429132744226444
Epoch: 44, step: 1442, loss: 0.301337331533432, mean loss: 0.3429126345860374
Epoch: 44, step: 1443, loss: 0.3252250850200653, mean loss: 0.34291236238613637
Valid: 44, mean loss: 0.18574969470500946
Epoch: 45, step: 0, loss: 0.3380279242992401, mean loss: 0.3429122872189631
Epoch: 45, step: 1, loss: 0.2860964834690094, mean loss: 0.3429114128875521
Epoch: 45, step: 2, loss: 0.33989307284355164, mean loss: 0.34291136643940345
Epoch: 45, step: 3, loss: 0.32304292917251587, mean loss: 0.34291106069587785
Epoch: 45, step: 4, loss: 0.3691848814487457, mean loss: 0.3429114650018062
Epoch: 45, step: 5, loss: 0.2969634532928467, mean loss: 0.3429107579570318
Epoch: 45, step: 6, loss: 0.3373970091342926, mean loss: 0.34291067311315804
Epoch: 45, step: 7, loss: 0.40971165895462036, mean loss: 0.34291170101039814
Epoch: 45, step: 8, loss: 0.31651514768600464, mean loss: 0.3429112948408414
Epoch: 45, step: 9, loss: 0.33218422532081604, mean loss: 0.34291112978360916
Epoch: 45, step: 10, loss: 0.3589383661746979, mean loss: 0.3429113763906223
Epoch: 45, step: 11, loss: 0.33274126052856445, mean loss: 0.34291121990804196
Epoch: 45, step: 12, loss: 0.32099297642707825, mean loss: 0.3429108826679779
Epoch: 45, step: 13, loss: 0.31856462359428406, mean loss: 0.3429105080755683
Epoch: 45, step: 14, loss: 0.3191336989402771, mean loss: 0.34291014225036426
Epoch: 45, step: 15, loss: 0.30959588289260864, mean loss: 0.34290962969175515
Epoch: 45, step: 16, loss: 0.29353922605514526, mean loss: 0.3429088701120263
Epoch: 45, step: 17, loss: 0.3109143376350403, mean loss: 0.3429083778733039
Epoch: 45, step: 18, loss: 0.3742479681968689, mean loss: 0.34290886002826515
Epoch: 45, step: 19, loss: 0.31519266963005066, mean loss: 0.34290843362533596
Epoch: 45, step: 20, loss: 0.34984833002090454, mean loss: 0.3429085403913303
Epoch: 45, step: 21, loss: 0.3308386206626892, mean loss: 0.3429083547059709
Epoch: 45, step: 22, loss: 0.3829422891139984, mean loss: 0.342908970584229
Epoch: 45, step: 23, loss: 0.33380287885665894, mean loss: 0.34290883049913073
Epoch: 45, step: 24, loss: 0.29343467950820923, mean loss: 0.34290806941689106
Epoch: 45, step: 25, loss: 0.2985566258430481, mean loss: 0.34290738714996843
Epoch: 45, step: 26, loss: 0.33323460817337036, mean loss: 0.3429072383540084
Epoch: 45, step: 27, loss: 0.33133652806282043, mean loss: 0.3429070603649872
Epoch: 45, step: 28, loss: 0.3595174252986908, mean loss: 0.34290731587368495
Epoch: 45, step: 29, loss: 0.410258024930954, mean loss: 0.3429083518790542
Epoch: 45, step: 30, loss: 0.3226126730442047, mean loss: 0.34290803969067324
Epoch: 45, step: 31, loss: 0.3284401595592499, mean loss: 0.3429078171489866
Epoch: 45, step: 32, loss: 0.3884626030921936, mean loss: 0.34290851785170673
Epoch: 45, step: 33, loss: 0.3396872282028198, mean loss: 0.34290846830407623
Epoch: 45, step: 34, loss: 0.31670206785202026, mean loss: 0.3429080652217037
Epoch: 45, step: 35, loss: 0.3155060410499573, mean loss: 0.3429076437558465
Epoch: 45, step: 36, loss: 0.33982500433921814, mean loss: 0.342907596343025
Epoch: 45, step: 37, loss: 0.3179710805416107, mean loss: 0.3429072128105293
Epoch: 45, step: 38, loss: 0.3153463900089264, mean loss: 0.3429067889217768
Epoch: 45, step: 39, loss: 0.31996554136276245, mean loss: 0.34290643608807087
Epoch: 45, step: 40, loss: 0.3369584083557129, mean loss: 0.34290634460950653
Epoch: 45, step: 41, loss: 0.36084774136543274, mean loss: 0.342906620537604
Epoch: 45, step: 42, loss: 0.316479355096817, mean loss: 0.34290621410810307
Epoch: 45, step: 43, loss: 0.3150964379310608, mean loss: 0.34290578642330705
Epoch: 45, step: 44, loss: 0.33666345477104187, mean loss: 0.34290569042435814
Epoch: 45, step: 45, loss: 0.31041449308395386, mean loss: 0.34290519075964954
Epoch: 45, step: 46, loss: 0.31241634488105774, mean loss: 0.34290472189524124
Epoch: 45, step: 47, loss: 0.3367382884025574, mean loss: 0.3429046270678824
Epoch: 45, step: 48, loss: 0.32589560747146606, mean loss: 0.34290436550735404
Epoch: 45, step: 49, loss: 0.34684985876083374, mean loss: 0.3429044261792478
Epoch: 45, step: 50, loss: 0.34657788276672363, mean loss: 0.3429044826670242
Epoch: 45, step: 51, loss: 0.3177720010280609, mean loss: 0.3429040962037194
Epoch: 45, step: 52, loss: 0.2957758605480194, mean loss: 0.3429033715218555
Epoch: 45, step: 53, loss: 0.35234543681144714, mean loss: 0.34290351670845465
Epoch: 45, step: 54, loss: 0.3196195065975189, mean loss: 0.342903158685696
Epoch: 45, step: 55, loss: 0.35759812593460083, mean loss: 0.34290338463697295
Epoch: 45, step: 56, loss: 0.3336115777492523, mean loss: 0.3429032417674235
Epoch: 45, step: 57, loss: 0.33822911977767944, mean loss: 0.3429031698998693
Epoch: 45, step: 58, loss: 0.3639983534812927, mean loss: 0.34290349424654715
Epoch: 45, step: 59, loss: 0.3586121201515198, mean loss: 0.34290373576908567
Epoch: 45, step: 60, loss: 0.31749939918518066, mean loss: 0.3429033451795101
Epoch: 45, step: 61, loss: 0.35035109519958496, mean loss: 0.34290345968629066
Epoch: 45, step: 62, loss: 0.3306453824043274, mean loss: 0.3429032712251606
Epoch: 45, step: 63, loss: 0.36086606979370117, mean loss: 0.34290354738896617
Epoch: 45, step: 64, loss: 0.34801703691482544, mean loss: 0.3429036260036103
Epoch: 45, step: 65, loss: 0.3050357699394226, mean loss: 0.3429030438332068
Epoch: 45, step: 66, loss: 0.2847221791744232, mean loss: 0.34290214938973274
Epoch: 45, step: 67, loss: 0.39340823888778687, mean loss: 0.34290292583312065
Epoch: 45, step: 68, loss: 0.3293999135494232, mean loss: 0.34290271825095514
Epoch: 45, step: 69, loss: 0.3406077027320862, mean loss: 0.34290268297016313
Epoch: 45, step: 70, loss: 0.35435226559638977, mean loss: 0.3429028589794885
Epoch: 45, step: 71, loss: 0.35359033942222595, mean loss: 0.3429030232708315
Epoch: 45, step: 72, loss: 0.3597448170185089, mean loss: 0.342903282164253
Epoch: 45, step: 73, loss: 0.35706549882888794, mean loss: 0.3429034998636514
Epoch: 45, step: 74, loss: 0.36996990442276, mean loss: 0.34290391591782954
Epoch: 45, step: 75, loss: 0.32004714012145996, mean loss: 0.3429035645778179
Epoch: 45, step: 76, loss: 0.31320589780807495, mean loss: 0.3429031080909407
Epoch: 45, step: 77, loss: 0.31724512577056885, mean loss: 0.3429027137046651
Epoch: 45, step: 78, loss: 0.304543137550354, mean loss: 0.342902124092526
Epoch: 45, step: 79, loss: 0.3144969344139099, mean loss: 0.3429016874926232
Epoch: 45, step: 80, loss: 0.35625147819519043, mean loss: 0.34290189268145677
Epoch: 45, step: 81, loss: 0.3457905650138855, mean loss: 0.34290193708022
Epoch: 45, step: 82, loss: 0.34998247027397156, mean loss: 0.3429020459060226
Epoch: 45, step: 83, loss: 0.3313938081264496, mean loss: 0.34290186903036507
Epoch: 45, step: 84, loss: 0.36032161116600037, mean loss: 0.3429021367586696
Epoch: 45, step: 85, loss: 0.33717605471611023, mean loss: 0.34290204875445784
Epoch: 45, step: 86, loss: 0.30500513315200806, mean loss: 0.3429014663253371
Epoch: 45, step: 87, loss: 0.3802986145019531, mean loss: 0.34290204106481237
Epoch: 45, step: 88, loss: 0.30351898074150085, mean loss: 0.34290143581407356
Epoch: 45, step: 89, loss: 0.33689063787460327, mean loss: 0.34290134343973916
Epoch: 45, step: 90, loss: 0.3670025169849396, mean loss: 0.3429017138224526
Epoch: 45, step: 91, loss: 0.28422269225120544, mean loss: 0.342900812067142
Epoch: 45, step: 92, loss: 0.353744775056839, mean loss: 0.3429009787101889
Epoch: 45, step: 93, loss: 0.38121336698532104, mean loss: 0.3429015674612765
Epoch: 45, step: 94, loss: 0.3649393320083618, mean loss: 0.34290190611305593
Epoch: 45, step: 95, loss: 0.36252596974372864, mean loss: 0.34290220766913854
Epoch: 45, step: 96, loss: 0.30128324031829834, mean loss: 0.3429015681349352
Epoch: 45, step: 97, loss: 0.3434588313102722, mean loss: 0.34290157669793925
Epoch: 45, step: 98, loss: 0.36020204424858093, mean loss: 0.34290184253588313
Epoch: 45, step: 99, loss: 0.31003451347351074, mean loss: 0.34290133750624174
Epoch: 45, step: 100, loss: 0.35234808921813965, mean loss: 0.34290148265999953
Epoch: 45, step: 101, loss: 0.32899123430252075, mean loss: 0.3429012689258126
Epoch: 45, step: 102, loss: 0.33634188771247864, mean loss: 0.34290116814094995
Epoch: 45, step: 103, loss: 0.3053429126739502, mean loss: 0.3429005910673917
Epoch: 45, step: 104, loss: 0.33329033851623535, mean loss: 0.3429004434104423
Epoch: 45, step: 105, loss: 0.33825311064720154, mean loss: 0.34290037200748674
Epoch: 45, step: 106, loss: 0.3061065673828125, mean loss: 0.3428998067055889
Epoch: 45, step: 107, loss: 0.314220666885376, mean loss: 0.34289936608458627
Epoch: 45, step: 108, loss: 0.2993263006210327, mean loss: 0.3428986966463484
Epoch: 45, step: 109, loss: 0.3307584226131439, mean loss: 0.3428985101311536
Epoch: 45, step: 110, loss: 0.3205109238624573, mean loss: 0.34289816618826946
Epoch: 45, step: 111, loss: 0.3194849193096161, mean loss: 0.34289780649357765
Epoch: 45, step: 112, loss: 0.3563106656074524, mean loss: 0.3428980125504365
Epoch: 45, step: 113, loss: 0.3195359706878662, mean loss: 0.3428976536534281
Epoch: 45, step: 114, loss: 0.34441304206848145, mean loss: 0.34289767693307194
Epoch: 45, step: 115, loss: 0.3475038409233093, mean loss: 0.34289774769262693
Epoch: 45, step: 116, loss: 0.3544383645057678, mean loss: 0.3428979249760165
Epoch: 45, step: 117, loss: 0.383606880903244, mean loss: 0.3428985503248126
Epoch: 45, step: 118, loss: 0.32006901502609253, mean loss: 0.3428981996353197
Epoch: 45, step: 119, loss: 0.3064838945865631, mean loss: 0.34289764027579517
Epoch: 45, step: 120, loss: 0.3884138762950897, mean loss: 0.34289833943918774
Epoch: 45, step: 121, loss: 0.3235357105731964, mean loss: 0.34289804201931023
Epoch: 45, step: 122, loss: 0.33120566606521606, mean loss: 0.3428978624211972
Epoch: 45, step: 123, loss: 0.33161357045173645, mean loss: 0.3428976890940288
Epoch: 45, step: 124, loss: 0.32903242111206055, mean loss: 0.34289747612623855
Epoch: 45, step: 125, loss: 0.33509519696235657, mean loss: 0.3428973562866053
Epoch: 45, step: 126, loss: 0.34522342681884766, mean loss: 0.34289739201349384
Epoch: 45, step: 127, loss: 0.3031276762485504, mean loss: 0.3428967811866252
Epoch: 45, step: 128, loss: 0.30240151286125183, mean loss: 0.3428961592254781
Epoch: 45, step: 129, loss: 0.3273366391658783, mean loss: 0.34289592025266197
Epoch: 45, step: 130, loss: 0.3281266987323761, mean loss: 0.34289569342122767
Epoch: 45, step: 131, loss: 0.3301530182361603, mean loss: 0.34289549771728395
Epoch: 45, step: 132, loss: 0.3621053099632263, mean loss: 0.3428957927399714
Epoch: 45, step: 133, loss: 0.3183680474758148, mean loss: 0.3428954160506993
Epoch: 45, step: 134, loss: 0.3288041949272156, mean loss: 0.34289519964555265
Epoch: 45, step: 135, loss: 0.2858208417892456, mean loss: 0.3428943231427291
Epoch: 45, step: 136, loss: 0.3575086295604706, mean loss: 0.34289454757423576
Epoch: 45, step: 137, loss: 0.3125763237476349, mean loss: 0.3428940819852461
Epoch: 45, step: 138, loss: 0.3710470199584961, mean loss: 0.3428945143158712
Epoch: 45, step: 139, loss: 0.3175267279148102, mean loss: 0.34289412476141173
Epoch: 45, step: 140, loss: 0.37867507338523865, mean loss: 0.3428946742147159
Epoch: 45, step: 141, loss: 0.3088870346546173, mean loss: 0.34289415200041723
Epoch: 45, step: 142, loss: 0.3536185622215271, mean loss: 0.3428943166797198
Epoch: 45, step: 143, loss: 0.2978692054748535, mean loss: 0.3428936253046322
Epoch: 45, step: 144, loss: 0.34456416964530945, mean loss: 0.34289365095598484
Epoch: 45, step: 145, loss: 0.3808206617832184, mean loss: 0.3428942333195697
Epoch: 45, step: 146, loss: 0.328309565782547, mean loss: 0.34289400937761727
Epoch: 45, step: 147, loss: 0.36233049631118774, mean loss: 0.34289430781280544
Epoch: 45, step: 148, loss: 0.3522929251194, mean loss: 0.34289445212052255
Epoch: 45, step: 149, loss: 0.3427720367908478, mean loss: 0.3428944502409689
Epoch: 45, step: 150, loss: 0.3141259551048279, mean loss: 0.3428940085389355
Epoch: 45, step: 151, loss: 0.31588664650917053, mean loss: 0.34289359388312834
Epoch: 45, step: 152, loss: 0.3450835645198822, mean loss: 0.34289362750618635
Epoch: 45, step: 153, loss: 0.31653469800949097, mean loss: 0.3428932228184734
Epoch: 45, step: 154, loss: 0.31173479557037354, mean loss: 0.3428927444515854
Epoch: 45, step: 155, loss: 0.37393805384635925, mean loss: 0.34289322107448816
Epoch: 45, step: 156, loss: 0.3608950078487396, mean loss: 0.3428934974425551
Epoch: 45, step: 157, loss: 0.36136776208877563, mean loss: 0.34289378105986984
Epoch: 45, step: 158, loss: 0.299410343170166, mean loss: 0.342893113511429
Epoch: 45, step: 159, loss: 0.33242520689964294, mean loss: 0.34289295281283194
Epoch: 45, step: 160, loss: 0.3277660310268402, mean loss: 0.34289272059469306
Epoch: 45, step: 161, loss: 0.31809002161026, mean loss: 0.34289233984649703
Epoch: 45, step: 162, loss: 0.33833882212638855, mean loss: 0.342892269946159
Epoch: 45, step: 163, loss: 0.3188730776309967, mean loss: 0.34289190123695606
Epoch: 45, step: 164, loss: 0.31523382663726807, mean loss: 0.34289147667521536
Epoch: 45, step: 165, loss: 0.36806562542915344, mean loss: 0.34289186310183795
Epoch: 45, step: 166, loss: 0.3255596458911896, mean loss: 0.3428915970540198
Epoch: 45, step: 167, loss: 0.3536621928215027, mean loss: 0.3428917623790607
Epoch: 45, step: 168, loss: 0.3244331479072571, mean loss: 0.34289147904985423
Epoch: 45, step: 169, loss: 0.36174261569976807, mean loss: 0.34289176839961094
Epoch: 45, step: 170, loss: 0.29678377509117126, mean loss: 0.34289106068993175
Epoch: 45, step: 171, loss: 0.32430222630500793, mean loss: 0.34289077537506213
Epoch: 45, step: 172, loss: 0.3300124406814575, mean loss: 0.3428905777121043
Epoch: 45, step: 173, loss: 0.3521423935890198, mean loss: 0.3428907197113043
Epoch: 45, step: 174, loss: 0.3160347044467926, mean loss: 0.3428903075247451
Epoch: 45, step: 175, loss: 0.3068641424179077, mean loss: 0.34288975460306315
Epoch: 45, step: 176, loss: 0.3305187225341797, mean loss: 0.3428895647380898
Epoch: 45, step: 177, loss: 0.31611332297325134, mean loss: 0.34288915379481705
Epoch: 45, step: 178, loss: 0.3601325452327728, mean loss: 0.34288941843042287
Epoch: 45, step: 179, loss: 0.27818188071250916, mean loss: 0.3428884253742885
Epoch: 45, step: 180, loss: 0.33018219470977783, mean loss: 0.3428882303768105
Epoch: 45, step: 181, loss: 0.320227712392807, mean loss: 0.34288788262017345
Epoch: 45, step: 182, loss: 0.31688159704208374, mean loss: 0.34288748352428194
Epoch: 45, step: 183, loss: 0.31592920422554016, mean loss: 0.3428870698253178
Epoch: 45, step: 184, loss: 0.3273778557777405, mean loss: 0.3428868318261764
Epoch: 45, step: 185, loss: 0.3226809501647949, mean loss: 0.3428865217583241
Epoch: 45, step: 186, loss: 0.3425263464450836, mean loss: 0.3428865162313655
Epoch: 45, step: 187, loss: 0.35042768716812134, mean loss: 0.342886631950291
Epoch: 45, step: 188, loss: 0.31156954169273376, mean loss: 0.3428861513983375
Epoch: 45, step: 189, loss: 0.3562445640563965, mean loss: 0.34288635637628223
Epoch: 45, step: 190, loss: 0.3106542229652405, mean loss: 0.3428858617984269
Epoch: 45, step: 191, loss: 0.3269546329975128, mean loss: 0.3428856173494488
Epoch: 45, step: 192, loss: 0.32484257221221924, mean loss: 0.3428853405009818
Epoch: 45, step: 193, loss: 0.3260297179222107, mean loss: 0.34288508187603045
Epoch: 45, step: 194, loss: 0.30862483382225037, mean loss: 0.34288455621054437
Epoch: 45, step: 195, loss: 0.3049660921096802, mean loss: 0.34288397442485485
Epoch: 45, step: 196, loss: 0.3364885151386261, mean loss: 0.34288387630037404
Epoch: 45, step: 197, loss: 0.31888872385025024, mean loss: 0.3428835081523417
Epoch: 45, step: 198, loss: 0.2987527549266815, mean loss: 0.3428828310822236
Epoch: 45, step: 199, loss: 0.2956346869468689, mean loss: 0.34288210619507825
Epoch: 45, step: 200, loss: 0.32029038667678833, mean loss: 0.34288175959530964
Epoch: 45, step: 201, loss: 0.3710136115550995, mean loss: 0.34288219118458213
Epoch: 45, step: 202, loss: 0.30884331464767456, mean loss: 0.3428816689797659
Epoch: 45, step: 203, loss: 0.3239693343639374, mean loss: 0.34288137884208464
Epoch: 45, step: 204, loss: 0.3626387417316437, mean loss: 0.34288168193885366
Epoch: 45, step: 205, loss: 0.3802388906478882, mean loss: 0.3428822550252328
Epoch: 45, step: 206, loss: 0.327053040266037, mean loss: 0.34288201219744874
Epoch: 45, step: 207, loss: 0.3516930341720581, mean loss: 0.3428821473606993
Epoch: 45, step: 208, loss: 0.3320354223251343, mean loss: 0.3428819809718141
Epoch: 45, step: 209, loss: 0.2947884500026703, mean loss: 0.3428812432278201
Epoch: 45, step: 210, loss: 0.3242732882499695, mean loss: 0.3428809577903367
Epoch: 45, step: 211, loss: 0.3507058024406433, mean loss: 0.3428810778180188
Epoch: 45, step: 212, loss: 0.3167230784893036, mean loss: 0.34288067657863225
Epoch: 45, step: 213, loss: 0.3197430372238159, mean loss: 0.34288032167420307
Epoch: 45, step: 214, loss: 0.3281412422657013, mean loss: 0.34288009559736576
Epoch: 45, step: 215, loss: 0.32156309485435486, mean loss: 0.34287976862944225
Epoch: 45, step: 216, loss: 0.31575462222099304, mean loss: 0.342879352580446
Epoch: 45, step: 217, loss: 0.3255912661552429, mean loss: 0.3428790874176124
Epoch: 45, step: 218, loss: 0.349197655916214, mean loss: 0.3428791843296586
Epoch: 45, step: 219, loss: 0.32504457235336304, mean loss: 0.3428789107926651
Epoch: 45, step: 220, loss: 0.3613949716091156, mean loss: 0.3428791947769723
Epoch: 45, step: 221, loss: 0.3271512985229492, mean loss: 0.34287895355896897
Epoch: 45, step: 222, loss: 0.31981581449508667, mean loss: 0.34287859984611735
Epoch: 45, step: 223, loss: 0.3154866695404053, mean loss: 0.34287817975025964
Epoch: 45, step: 224, loss: 0.31044480204582214, mean loss: 0.342877682343961
Epoch: 45, step: 225, loss: 0.35604605078697205, mean loss: 0.3428778842942178
Epoch: 45, step: 226, loss: 0.3152875304222107, mean loss: 0.342877461174708
Epoch: 45, step: 227, loss: 0.3246106207370758, mean loss: 0.34287718104281567
Epoch: 45, step: 228, loss: 0.34922319650650024, mean loss: 0.3428772783609077
Epoch: 45, step: 229, loss: 0.306855708360672, mean loss: 0.34287672596756313
Epoch: 45, step: 230, loss: 0.3637992739677429, mean loss: 0.3428770468114085
Epoch: 45, step: 231, loss: 0.33598098158836365, mean loss: 0.3428769410629999
Epoch: 45, step: 232, loss: 0.3127936124801636, mean loss: 0.34287647975423347
Epoch: 45, step: 233, loss: 0.32930126786231995, mean loss: 0.34287627159015993
Epoch: 45, step: 234, loss: 0.34577107429504395, mean loss: 0.34287631597876234
Epoch: 45, step: 235, loss: 0.32388022541999817, mean loss: 0.3428760246991598
Epoch: 45, step: 236, loss: 0.2932361364364624, mean loss: 0.34287526354963954
Epoch: 45, step: 237, loss: 0.34989258646965027, mean loss: 0.34287537114758676
Epoch: 45, step: 238, loss: 0.3359348177909851, mean loss: 0.34287526472839364
Epoch: 45, step: 239, loss: 0.30532997846603394, mean loss: 0.3428746890570311
Epoch: 45, step: 240, loss: 0.3610805571079254, mean loss: 0.34287496819822877
Epoch: 45, step: 241, loss: 0.31795933842658997, mean loss: 0.3428745861855678
Epoch: 45, step: 242, loss: 0.3231993317604065, mean loss: 0.34287428452427615
Epoch: 45, step: 243, loss: 0.3121579885482788, mean loss: 0.34287381358879265
Epoch: 45, step: 244, loss: 0.315690815448761, mean loss: 0.34287339683144286
Epoch: 45, step: 245, loss: 0.39491546154022217, mean loss: 0.34287419470444913
Epoch: 45, step: 246, loss: 0.3186261057853699, mean loss: 0.3428738229551901
Epoch: 45, step: 247, loss: 0.3134450912475586, mean loss: 0.34287337178802707
Epoch: 45, step: 248, loss: 0.38337668776512146, mean loss: 0.3428739927283447
Epoch: 45, step: 249, loss: 0.3748112916946411, mean loss: 0.34287448233893747
Epoch: 45, step: 250, loss: 0.3123787045478821, mean loss: 0.3428740148345639
Epoch: 45, step: 251, loss: 0.31838297843933105, mean loss: 0.3428736393894389
Epoch: 45, step: 252, loss: 0.3284032344818115, mean loss: 0.34287341756298745
Epoch: 45, step: 253, loss: 0.34554028511047363, mean loss: 0.34287345844454536
Epoch: 45, step: 254, loss: 0.29954683780670166, mean loss: 0.34287279428235273
Epoch: 45, step: 255, loss: 0.28692102432250977, mean loss: 0.34287193659993875
Epoch: 45, step: 256, loss: 0.3411843776702881, mean loss: 0.34287191073181283
Epoch: 45, step: 257, loss: 0.31316304206848145, mean loss: 0.34287145533973057
Epoch: 45, step: 258, loss: 0.33100467920303345, mean loss: 0.342871273442765
Epoch: 45, step: 259, loss: 0.31566253304481506, mean loss: 0.3428708563866584
Epoch: 45, step: 260, loss: 0.31036561727523804, mean loss: 0.34287035815335243
Epoch: 45, step: 261, loss: 0.3259814977645874, mean loss: 0.3428700992885048
Epoch: 45, step: 262, loss: 0.3687366843223572, mean loss: 0.34287049575379663
Epoch: 45, step: 263, loss: 0.31348270177841187, mean loss: 0.34287004532473075
Epoch: 45, step: 264, loss: 0.34380361437797546, mean loss: 0.3428700596333989
Epoch: 45, step: 265, loss: 0.32312190532684326, mean loss: 0.3428697569611384
Epoch: 45, step: 266, loss: 0.29805654287338257, mean loss: 0.34286907013700724
Epoch: 45, step: 267, loss: 0.3080381751060486, mean loss: 0.34286853631382447
Epoch: 45, step: 268, loss: 0.3218773901462555, mean loss: 0.34286821460550454
Epoch: 45, step: 269, loss: 0.3305521309375763, mean loss: 0.3428680258532644
Epoch: 45, step: 270, loss: 0.3324959874153137, mean loss: 0.342867866897257
Epoch: 45, step: 271, loss: 0.3065544366836548, mean loss: 0.3428673103866487
Epoch: 45, step: 272, loss: 0.37220093607902527, mean loss: 0.3428677599234622
Epoch: 45, step: 273, loss: 0.3287186026573181, mean loss: 0.34286754309143247
Epoch: 45, step: 274, loss: 0.34545308351516724, mean loss: 0.3428675827135369
Epoch: 45, step: 275, loss: 0.29981714487075806, mean loss: 0.34286692299737526
Epoch: 45, step: 276, loss: 0.31968578696250916, mean loss: 0.3428665677690314
Epoch: 45, step: 277, loss: 0.31408530473709106, mean loss: 0.3428661267309513
Epoch: 45, step: 278, loss: 0.3164041042327881, mean loss: 0.34286572123864373
Epoch: 45, step: 279, loss: 0.29479560256004333, mean loss: 0.34286498464473203
Epoch: 45, step: 280, loss: 0.3372662663459778, mean loss: 0.3428648988550828
Epoch: 45, step: 281, loss: 0.32293182611465454, mean loss: 0.3428645934235493
Epoch: 45, step: 282, loss: 0.3248211145401001, mean loss: 0.3428643169502201
Epoch: 45, step: 283, loss: 0.4167836010456085, mean loss: 0.3428654495697975
Epoch: 45, step: 284, loss: 0.3077687919139862, mean loss: 0.3428649118136088
Epoch: 45, step: 285, loss: 0.3350500166416168, mean loss: 0.34286479207446174
Epoch: 45, step: 286, loss: 0.319279283285141, mean loss: 0.34286443070487543
Epoch: 45, step: 287, loss: 0.3179945647716522, mean loss: 0.3428640496626199
Epoch: 45, step: 288, loss: 0.3136405050754547, mean loss: 0.3428636019225812
Epoch: 45, step: 289, loss: 0.3469371795654297, mean loss: 0.34286366433376003
Epoch: 45, step: 290, loss: 0.30662211775779724, mean loss: 0.3428631090864592
Epoch: 45, step: 291, loss: 0.31828901171684265, mean loss: 0.34286273259887845
Epoch: 45, step: 292, loss: 0.33071765303611755, mean loss: 0.3428625465329773
Epoch: 45, step: 293, loss: 0.3100566864013672, mean loss: 0.3428620439460341
Epoch: 45, step: 294, loss: 0.33605924248695374, mean loss: 0.34286193972847057
Epoch: 45, step: 295, loss: 0.35528936982154846, mean loss: 0.34286213011130795
Epoch: 45, step: 296, loss: 0.34564343094825745, mean loss: 0.3428621727189774
Epoch: 45, step: 297, loss: 0.3234900236129761, mean loss: 0.3428618759551503
Epoch: 45, step: 298, loss: 0.33100128173828125, mean loss: 0.3428616942643429
Epoch: 45, step: 299, loss: 0.32274186611175537, mean loss: 0.34286138605619104
Epoch: 45, step: 300, loss: 0.3173101246356964, mean loss: 0.3428609946519322
Epoch: 45, step: 301, loss: 0.31874561309814453, mean loss: 0.34286062524870387
Epoch: 45, step: 302, loss: 0.37184566259384155, mean loss: 0.3428610692392886
Epoch: 45, step: 303, loss: 0.3415849804878235, mean loss: 0.34286104969255815
Epoch: 45, step: 304, loss: 0.32467398047447205, mean loss: 0.34286077111295765
Epoch: 45, step: 305, loss: 0.3161150813102722, mean loss: 0.3428603614433531
Epoch: 45, step: 306, loss: 0.3105396628379822, mean loss: 0.3428598663876972
Epoch: 45, step: 307, loss: 0.3176601827144623, mean loss: 0.3428594804104323
Epoch: 45, step: 308, loss: 0.337955504655838, mean loss: 0.3428594052986102
Epoch: 45, step: 309, loss: 0.31572824716567993, mean loss: 0.34285898975016277
Epoch: 45, step: 310, loss: 0.34755411744117737, mean loss: 0.34285906166095736
Epoch: 45, step: 311, loss: 0.4161434471607208, mean loss: 0.34286018407083146
Epoch: 45, step: 312, loss: 0.29412388801574707, mean loss: 0.34285943764631344
Epoch: 45, step: 313, loss: 0.4180348217487335, mean loss: 0.3428605889830994
Epoch: 45, step: 314, loss: 0.39833611249923706, mean loss: 0.34286143859675305
Epoch: 45, step: 315, loss: 0.30033913254737854, mean loss: 0.342860787373002
Epoch: 45, step: 316, loss: 0.3271205425262451, mean loss: 0.3428605463168303
Epoch: 45, step: 317, loss: 0.3259493112564087, mean loss: 0.3428602873313321
Epoch: 45, step: 318, loss: 0.34035488963127136, mean loss: 0.3428602489632453
Epoch: 45, step: 319, loss: 0.3331083655357361, mean loss: 0.3428600996235297
Epoch: 45, step: 320, loss: 0.34777384996414185, mean loss: 0.34286017487123405
Epoch: 45, step: 321, loss: 0.4190651476383209, mean loss: 0.34286134183354405
Epoch: 45, step: 322, loss: 0.3163732588291168, mean loss: 0.34286093621537944
Epoch: 45, step: 323, loss: 0.32345741987228394, mean loss: 0.34286063908937886
Epoch: 45, step: 324, loss: 0.31832072138786316, mean loss: 0.34286026331543046
Epoch: 45, step: 325, loss: 0.3270154893398285, mean loss: 0.34286002069187405
Epoch: 45, step: 326, loss: 0.3284659683704376, mean loss: 0.34285980028590957
Epoch: 45, step: 327, loss: 0.31163161993026733, mean loss: 0.3428593221181452
Epoch: 45, step: 328, loss: 0.33358466625213623, mean loss: 0.3428591801062346
Epoch: 45, step: 329, loss: 0.3222399950027466, mean loss: 0.34285886439370816
Epoch: 45, step: 330, loss: 0.3556618094444275, mean loss: 0.34285906042416325
Epoch: 45, step: 331, loss: 0.2824796736240387, mean loss: 0.34285813594800574
Epoch: 45, step: 332, loss: 0.3332556486129761, mean loss: 0.34285798892540176
Epoch: 45, step: 333, loss: 0.31912651658058167, mean loss: 0.34285762558105987
Epoch: 45, step: 334, loss: 0.35932543873786926, mean loss: 0.342857877710175
Epoch: 45, step: 335, loss: 0.36338943243026733, mean loss: 0.34285819205206247
Epoch: 45, step: 336, loss: 0.36012136936187744, mean loss: 0.3428584563504428
Epoch: 45, step: 337, loss: 0.29722967743873596, mean loss: 0.342857757786817
Epoch: 45, step: 338, loss: 0.377560555934906, mean loss: 0.3428582890686515
Epoch: 45, step: 339, loss: 0.309092253446579, mean loss: 0.3428577721360792
Epoch: 45, step: 340, loss: 0.3271785378456116, mean loss: 0.34285753210248676
Epoch: 45, step: 341, loss: 0.3383023142814636, mean loss: 0.3428574623676682
Epoch: 45, step: 342, loss: 0.3068121671676636, mean loss: 0.3428569105666915
Epoch: 45, step: 343, loss: 0.274941086769104, mean loss: 0.342855870890251
Epoch: 45, step: 344, loss: 0.34540629386901855, mean loss: 0.34285590993231724
Epoch: 45, step: 345, loss: 0.32344159483909607, mean loss: 0.34285561274107496
Epoch: 45, step: 346, loss: 0.34792283177375793, mean loss: 0.34285569030806917
Epoch: 45, step: 347, loss: 0.3219369947910309, mean loss: 0.3428553700978145
Epoch: 45, step: 348, loss: 0.2988671064376831, mean loss: 0.3428546967634047
Epoch: 45, step: 349, loss: 0.32317787408828735, mean loss: 0.3428543955721805
Epoch: 45, step: 350, loss: 0.3488159477710724, mean loss: 0.3428544868236874
Epoch: 45, step: 351, loss: 0.3452669382095337, mean loss: 0.3428545237497173
Epoch: 45, step: 352, loss: 0.31033122539520264, mean loss: 0.3428540259415904
Epoch: 45, step: 353, loss: 0.3553886115550995, mean loss: 0.342854217795535
Epoch: 45, step: 354, loss: 0.3246035873889923, mean loss: 0.3428539384562772
Epoch: 45, step: 355, loss: 0.3245239853858948, mean loss: 0.342853657907222
Epoch: 45, step: 356, loss: 0.32305169105529785, mean loss: 0.3428533548329019
Epoch: 45, step: 357, loss: 0.32391947507858276, mean loss: 0.3428530650493188
Epoch: 45, step: 358, loss: 0.3027594983577728, mean loss: 0.3428524514255001
Epoch: 45, step: 359, loss: 0.3783409595489502, mean loss: 0.3428529945615289
Epoch: 45, step: 360, loss: 0.3090439736843109, mean loss: 0.34285247713723366
Epoch: 45, step: 361, loss: 0.3134693503379822, mean loss: 0.34285202745514864
Epoch: 45, step: 362, loss: 0.33584830164909363, mean loss: 0.3428519202711227
Epoch: 45, step: 363, loss: 0.34279972314834595, mean loss: 0.3428519194723176
Epoch: 45, step: 364, loss: 0.3261259198188782, mean loss: 0.34285166350782675
Epoch: 45, step: 365, loss: 0.31156495213508606, mean loss: 0.3428511847224172
Epoch: 45, step: 366, loss: 0.33138006925582886, mean loss: 0.34285100918083966
Epoch: 45, step: 367, loss: 0.3509601652622223, mean loss: 0.34285113327271827
Epoch: 45, step: 368, loss: 0.3325786888599396, mean loss: 0.34285097607912063
Epoch: 45, step: 369, loss: 0.3687928318977356, mean loss: 0.342851373047075
Epoch: 45, step: 370, loss: 0.36020761728286743, mean loss: 0.3428516386320582
Epoch: 45, step: 371, loss: 0.3226920962333679, mean loss: 0.3428513301557698
Epoch: 45, step: 372, loss: 0.33215847611427307, mean loss: 0.34285116653888853
Epoch: 45, step: 373, loss: 0.3616964817047119, mean loss: 0.3428514548963749
Epoch: 45, step: 374, loss: 0.3220802843570709, mean loss: 0.342851137075695
Epoch: 45, step: 375, loss: 0.3465908169746399, mean loss: 0.34285119429584154
Epoch: 45, step: 376, loss: 0.36023542284965515, mean loss: 0.3428514602846194
Epoch: 45, step: 377, loss: 0.2964749038219452, mean loss: 0.34285075070726906
Epoch: 45, step: 378, loss: 0.35870641469955444, mean loss: 0.34285099330069907
Epoch: 45, step: 379, loss: 0.3138361871242523, mean loss: 0.342850549377716
Epoch: 45, step: 380, loss: 0.34566351771354675, mean loss: 0.3428505924151287
Epoch: 45, step: 381, loss: 0.3517695963382721, mean loss: 0.34285072887062157
Epoch: 45, step: 382, loss: 0.33478787541389465, mean loss: 0.3428506055156125
Epoch: 45, step: 383, loss: 0.33221572637557983, mean loss: 0.3428504428132207
Epoch: 45, step: 384, loss: 0.34548884630203247, mean loss: 0.3428504831773833
Epoch: 45, step: 385, loss: 0.37547141313552856, mean loss: 0.34285098222780647
Epoch: 45, step: 386, loss: 0.341228723526001, mean loss: 0.34285095741010485
Epoch: 45, step: 387, loss: 0.35009607672691345, mean loss: 0.3428510682459774
Epoch: 45, step: 388, loss: 0.29656273126602173, mean loss: 0.34285036013759296
Epoch: 45, step: 389, loss: 0.3206270635128021, mean loss: 0.34285002017588845
Epoch: 45, step: 390, loss: 0.29940909147262573, mean loss: 0.3428493556468358
Epoch: 45, step: 391, loss: 0.34864333271980286, mean loss: 0.3428494442777033
Epoch: 45, step: 392, loss: 0.29321375489234924, mean loss: 0.34284868500874843
Epoch: 45, step: 393, loss: 0.3231740891933441, mean loss: 0.3428483840543045
Epoch: 45, step: 394, loss: 0.35828664898872375, mean loss: 0.3428486202036725
Epoch: 45, step: 395, loss: 0.34479478001594543, mean loss: 0.3428486499723921
Epoch: 45, step: 396, loss: 0.32433924078941345, mean loss: 0.34284836685433556
Epoch: 45, step: 397, loss: 0.29858171939849854, mean loss: 0.3428476897665162
Epoch: 45, step: 398, loss: 0.3094380795955658, mean loss: 0.34284717875212056
Epoch: 45, step: 399, loss: 0.35277849435806274, mean loss: 0.3428473306535523
Epoch: 45, step: 400, loss: 0.3641188442707062, mean loss: 0.3428476560005738
Epoch: 45, step: 401, loss: 0.34511440992355347, mean loss: 0.3428476906699618
Epoch: 45, step: 402, loss: 0.3301607370376587, mean loss: 0.3428474966294064
Epoch: 45, step: 403, loss: 0.3406575620174408, mean loss: 0.3428474631359736
Epoch: 45, step: 404, loss: 0.28540152311325073, mean loss: 0.34284658455617667
Epoch: 45, step: 405, loss: 0.30780550837516785, mean loss: 0.34284604864518375
Epoch: 45, step: 406, loss: 0.3411640226840973, mean loss: 0.342846022921019
Epoch: 45, step: 407, loss: 0.33758753538131714, mean loss: 0.34284594250125483
Epoch: 45, step: 408, loss: 0.34484192728996277, mean loss: 0.34284597302603403
Epoch: 45, step: 409, loss: 0.33235156536102295, mean loss: 0.34284581253654534
Epoch: 45, step: 410, loss: 0.32824140787124634, mean loss: 0.3428455891968707
Epoch: 45, step: 411, loss: 0.3128286600112915, mean loss: 0.3428451301662678
Epoch: 45, step: 412, loss: 0.30453985929489136, mean loss: 0.342844544396065
Epoch: 45, step: 413, loss: 0.29554539918899536, mean loss: 0.34284382110118766
Epoch: 45, step: 414, loss: 0.34115296602249146, mean loss: 0.34284379524515773
Epoch: 45, step: 415, loss: 0.321793794631958, mean loss: 0.34284347336001775
Epoch: 45, step: 416, loss: 0.37210577726364136, mean loss: 0.34284392081638276
Epoch: 45, step: 417, loss: 0.3261217772960663, mean loss: 0.34284366511829534
Epoch: 45, step: 418, loss: 0.33728909492492676, mean loss: 0.3428435801847307
Epoch: 45, step: 419, loss: 0.33075687289237976, mean loss: 0.3428433953726926
Epoch: 45, step: 420, loss: 0.33730894327163696, mean loss: 0.34284331074933666
Epoch: 45, step: 421, loss: 0.32187381386756897, mean loss: 0.3428429901246328
Epoch: 45, step: 422, loss: 0.34335771203041077, mean loss: 0.34284299799463736
Epoch: 45, step: 423, loss: 0.3608521819114685, mean loss: 0.34284327334758086
Epoch: 45, step: 424, loss: 0.32035505771636963, mean loss: 0.34284292951735945
Epoch: 45, step: 425, loss: 0.35066109895706177, mean loss: 0.34284304905026836
Epoch: 45, step: 426, loss: 0.3337700664997101, mean loss: 0.34284291033449554
Epoch: 45, step: 427, loss: 0.31303834915161133, mean loss: 0.34284245466299995
Epoch: 45, step: 428, loss: 0.35001835227012634, mean loss: 0.3428425643711075
Epoch: 45, step: 429, loss: 0.3537846803665161, mean loss: 0.34284273165617085
Epoch: 45, step: 430, loss: 0.3205356299877167, mean loss: 0.34284239062634914
Epoch: 45, step: 431, loss: 0.33774128556251526, mean loss: 0.3428423126421098
Epoch: 45, step: 432, loss: 0.3373098075389862, mean loss: 0.3428422280640427
Epoch: 45, step: 433, loss: 0.32648345828056335, mean loss: 0.3428419779834822
Epoch: 45, step: 434, loss: 0.3418305218219757, mean loss: 0.34284196252133803
Epoch: 45, step: 435, loss: 0.30903100967407227, mean loss: 0.3428414456607405
Epoch: 45, step: 436, loss: 0.34665030241012573, mean loss: 0.34284150388500556
Epoch: 45, step: 437, loss: 0.3880476653575897, mean loss: 0.34284219492052287
Epoch: 45, step: 438, loss: 0.3376295566558838, mean loss: 0.34284211523972274
Epoch: 45, step: 439, loss: 0.33695361018180847, mean loss: 0.34284202522894536
Epoch: 45, step: 440, loss: 0.3254203796386719, mean loss: 0.3428417589284365
Epoch: 45, step: 441, loss: 0.3803851008415222, mean loss: 0.3428423327926093
Epoch: 45, step: 442, loss: 0.3494192659854889, mean loss: 0.3428424333219826
Epoch: 45, step: 443, loss: 0.3118690848350525, mean loss: 0.3428419598971158
Epoch: 45, step: 444, loss: 0.3399670422077179, mean loss: 0.3428419159549272
Epoch: 45, step: 445, loss: 0.3277387320995331, mean loss: 0.34284168511116697
Epoch: 45, step: 446, loss: 0.3188680410385132, mean loss: 0.3428413186929593
Epoch: 45, step: 447, loss: 0.298359751701355, mean loss: 0.3428406388377445
Epoch: 45, step: 448, loss: 0.31320494413375854, mean loss: 0.3428401858934124
Epoch: 45, step: 449, loss: 0.29930993914604187, mean loss: 0.34283952059849043
Epoch: 45, step: 450, loss: 0.3553103506565094, mean loss: 0.34283971119362205
Epoch: 45, step: 451, loss: 0.39808329939842224, mean loss: 0.3428405554836973
Epoch: 45, step: 452, loss: 0.3222639262676239, mean loss: 0.3428402410150161
Epoch: 45, step: 453, loss: 0.393039345741272, mean loss: 0.34284100818658936
Epoch: 45, step: 454, loss: 0.3573603928089142, mean loss: 0.34284123007677997
Epoch: 45, step: 455, loss: 0.3415711224079132, mean loss: 0.3428412106668578
Epoch: 45, step: 456, loss: 0.3522949516773224, mean loss: 0.34284135513773834
Epoch: 45, step: 457, loss: 0.29354196786880493, mean loss: 0.3428406017622185
Epoch: 45, step: 458, loss: 0.3595205247402191, mean loss: 0.3428408566549121
Epoch: 45, step: 459, loss: 0.3373681902885437, mean loss: 0.34284077302614735
Epoch: 45, step: 460, loss: 0.3318014144897461, mean loss: 0.34284060433437097
Epoch: 45, step: 461, loss: 0.3324265778064728, mean loss: 0.3428404452006873
Epoch: 45, step: 462, loss: 0.3166796863079071, mean loss: 0.3428400454519152
Epoch: 45, step: 463, loss: 0.37536606192588806, mean loss: 0.34284054245724
Epoch: 45, step: 464, loss: 0.3532971441745758, mean loss: 0.3428407022341781
Epoch: 45, step: 465, loss: 0.3198038637638092, mean loss: 0.34284035023652404
Epoch: 45, step: 466, loss: 0.3201945722103119, mean loss: 0.3428400042194717
Epoch: 45, step: 467, loss: 0.3391190469264984, mean loss: 0.3428399473658277
Epoch: 45, step: 468, loss: 0.32945093512535095, mean loss: 0.34283974279414225
Epoch: 45, step: 469, loss: 0.29268500208854675, mean loss: 0.34283897648794354
Epoch: 45, step: 470, loss: 0.3183325529098511, mean loss: 0.34283860206396866
Epoch: 45, step: 471, loss: 0.30850404500961304, mean loss: 0.3428380774878357
Epoch: 45, step: 472, loss: 0.3322293162345886, mean loss: 0.3428379154057118
Epoch: 45, step: 473, loss: 0.34579578042030334, mean loss: 0.34283796059569277
Epoch: 45, step: 474, loss: 0.4332413375377655, mean loss: 0.3428393417488047
Epoch: 45, step: 475, loss: 0.3502095639705658, mean loss: 0.3428394543469198
Epoch: 45, step: 476, loss: 0.30199089646339417, mean loss: 0.34283883029513185
Epoch: 45, step: 477, loss: 0.28604280948638916, mean loss: 0.342837962623941
Epoch: 45, step: 478, loss: 0.3431708514690399, mean loss: 0.34283796770939673
Epoch: 45, step: 479, loss: 0.34744998812675476, mean loss: 0.34283803816494846
Epoch: 45, step: 480, loss: 0.27327537536621094, mean loss: 0.3428369755068345
Epoch: 45, step: 481, loss: 0.31307435035705566, mean loss: 0.3428365208518415
Epoch: 45, step: 482, loss: 0.33855485916137695, mean loss: 0.34283645544601393
Epoch: 45, step: 483, loss: 0.35242822766304016, mean loss: 0.3428366019658144
Epoch: 45, step: 484, loss: 0.3182479441165924, mean loss: 0.3428362263657556
Epoch: 45, step: 485, loss: 0.29235753417015076, mean loss: 0.3428354552984505
Epoch: 45, step: 486, loss: 0.3113022446632385, mean loss: 0.3428349736327161
Epoch: 45, step: 487, loss: 0.3196146786212921, mean loss: 0.3428346189511157
Epoch: 45, step: 488, loss: 0.3683528006076813, mean loss: 0.342835008726149
Epoch: 45, step: 489, loss: 0.325918048620224, mean loss: 0.3428347503336012
Epoch: 45, step: 490, loss: 0.31520023941993713, mean loss: 0.3428343282457927
Epoch: 45, step: 491, loss: 0.32847121357917786, mean loss: 0.3428341088678194
Epoch: 45, step: 492, loss: 0.371355801820755, mean loss: 0.34283454449308404
Epoch: 45, step: 493, loss: 0.3294462561607361, mean loss: 0.34283434001056684
Epoch: 45, step: 494, loss: 0.30834659934043884, mean loss: 0.34283381327913237
Epoch: 45, step: 495, loss: 0.378720223903656, mean loss: 0.34283436136408907
Epoch: 45, step: 496, loss: 0.33893683552742004, mean loss: 0.3428343018389759
Epoch: 45, step: 497, loss: 0.3238850235939026, mean loss: 0.3428340124398152
Epoch: 45, step: 498, loss: 0.33063340187072754, mean loss: 0.3428338261112126
Epoch: 45, step: 499, loss: 0.3153180480003357, mean loss: 0.3428334058946868
Epoch: 45, step: 500, loss: 0.321626752614975, mean loss: 0.34283308203504387
Epoch: 45, step: 501, loss: 0.39279940724372864, mean loss: 0.34283384508939785
Epoch: 45, step: 502, loss: 0.35669878125190735, mean loss: 0.34283405682276624
Epoch: 45, step: 503, loss: 0.3199460208415985, mean loss: 0.34283370730172325
Epoch: 45, step: 504, loss: 0.3644617199897766, mean loss: 0.3428340375760256
Epoch: 45, step: 505, loss: 0.3170984089374542, mean loss: 0.34283364458166593
Epoch: 45, step: 506, loss: 0.3306772708892822, mean loss: 0.34283345895133177
Epoch: 45, step: 507, loss: 0.3094756305217743, mean loss: 0.34283294957818816
Epoch: 45, step: 508, loss: 0.33703410625457764, mean loss: 0.34283286103135857
Epoch: 45, step: 509, loss: 0.32889387011528015, mean loss: 0.34283264818984205
Epoch: 45, step: 510, loss: 0.30882588028907776, mean loss: 0.34283212893119736
Epoch: 45, step: 511, loss: 0.31296032667160034, mean loss: 0.34283167281743904
Epoch: 45, step: 512, loss: 0.33450549840927124, mean loss: 0.342831545686686
Epoch: 45, step: 513, loss: 0.36712396144866943, mean loss: 0.34283191659723905
Epoch: 45, step: 514, loss: 0.3232462406158447, mean loss: 0.3428316175564576
Epoch: 45, step: 515, loss: 0.32350295782089233, mean loss: 0.3428313224443937
Epoch: 45, step: 516, loss: 0.32534360885620117, mean loss: 0.342831055444171
Epoch: 45, step: 517, loss: 0.3005679249763489, mean loss: 0.3428304101858353
Epoch: 45, step: 518, loss: 0.36188074946403503, mean loss: 0.34283070103515023
Epoch: 45, step: 519, loss: 0.3399255871772766, mean loss: 0.3428306566822669
Epoch: 45, step: 520, loss: 0.36281129717826843, mean loss: 0.34283096172555627
Epoch: 45, step: 521, loss: 0.37920841574668884, mean loss: 0.342831517089576
Epoch: 45, step: 522, loss: 0.37436068058013916, mean loss: 0.3428319984288046
Epoch: 45, step: 523, loss: 0.30674779415130615, mean loss: 0.34283144755856343
Epoch: 45, step: 524, loss: 0.32730063796043396, mean loss: 0.34283121046506526
Epoch: 45, step: 525, loss: 0.32484179735183716, mean loss: 0.3428309358426931
Epoch: 45, step: 526, loss: 0.34734413027763367, mean loss: 0.342831004739062
Epoch: 45, step: 527, loss: 0.30400845408439636, mean loss: 0.34283041210074827
Epoch: 45, step: 528, loss: 0.28730639815330505, mean loss: 0.34282956452234
Epoch: 45, step: 529, loss: 0.3550981879234314, mean loss: 0.3428297518009753
Epoch: 45, step: 530, loss: 0.3509635627269745, mean loss: 0.34282987596044356
Epoch: 45, step: 531, loss: 0.34084001183509827, mean loss: 0.3428298455864033
Epoch: 45, step: 532, loss: 0.37528014183044434, mean loss: 0.34283034091246445
Epoch: 45, step: 533, loss: 0.29911404848098755, mean loss: 0.3428296736307776
Epoch: 45, step: 534, loss: 0.3402504622936249, mean loss: 0.3428296342625209
Epoch: 45, step: 535, loss: 0.3229578137397766, mean loss: 0.34282933095003965
Epoch: 45, step: 536, loss: 0.3674357831478119, mean loss: 0.34282970652358846
Epoch: 45, step: 537, loss: 0.3027746379375458, mean loss: 0.34282909516383103
Epoch: 45, step: 538, loss: 0.29501911997795105, mean loss: 0.34282836545221784
Epoch: 45, step: 539, loss: 0.3571304976940155, mean loss: 0.3428285837387295
Epoch: 45, step: 540, loss: 0.40225157141685486, mean loss: 0.3428294906691438
Epoch: 45, step: 541, loss: 0.31156477332115173, mean loss: 0.34282901350548356
Epoch: 45, step: 542, loss: 0.32902732491493225, mean loss: 0.3428288028666454
Epoch: 45, step: 543, loss: 0.3181951344013214, mean loss: 0.3428284269178562
Epoch: 45, step: 544, loss: 0.3052069842815399, mean loss: 0.34282785276382893
Epoch: 45, step: 545, loss: 0.33775004744529724, mean loss: 0.3428277752708442
Epoch: 45, step: 546, loss: 0.3725512623786926, mean loss: 0.34282822887755754
Epoch: 45, step: 547, loss: 0.3277204632759094, mean loss: 0.34282799832320515
Epoch: 45, step: 548, loss: 0.30896884202957153, mean loss: 0.3428274816182914
Epoch: 45, step: 549, loss: 0.31016942858695984, mean loss: 0.34282698325032207
Epoch: 45, step: 550, loss: 0.3461460471153259, mean loss: 0.34282703389908165
Epoch: 45, step: 551, loss: 0.31533244252204895, mean loss: 0.34282661433930356
Epoch: 45, step: 552, loss: 0.29919007420539856, mean loss: 0.3428259484680611
Epoch: 45, step: 553, loss: 0.3705422580242157, mean loss: 0.342826371398289
Epoch: 45, step: 554, loss: 0.4441370368003845, mean loss: 0.3428279172999507
Epoch: 45, step: 555, loss: 0.37356117367744446, mean loss: 0.342828386252227
Epoch: 45, step: 556, loss: 0.3458431661128998, mean loss: 0.342828432253415
Epoch: 45, step: 557, loss: 0.3587781488895416, mean loss: 0.3428286756193498
Epoch: 45, step: 558, loss: 0.374741792678833, mean loss: 0.34282916255258133
Epoch: 45, step: 559, loss: 0.30457571148872375, mean loss: 0.34282857888686474
Epoch: 45, step: 560, loss: 0.3183304965496063, mean loss: 0.3428282051043113
Epoch: 45, step: 561, loss: 0.33617058396339417, mean loss: 0.3428281035263744
Epoch: 45, step: 562, loss: 0.33760297298431396, mean loss: 0.3428280238057247
Epoch: 45, step: 563, loss: 0.36422693729400635, mean loss: 0.34282835028737807
Epoch: 45, step: 564, loss: 0.3732379674911499, mean loss: 0.3428288142375986
Epoch: 45, step: 565, loss: 0.35878264904022217, mean loss: 0.34282905763665883
Epoch: 45, step: 566, loss: 0.31998392939567566, mean loss: 0.3428287091061656
Epoch: 45, step: 567, loss: 0.30929163098335266, mean loss: 0.3428281974646491
Epoch: 45, step: 568, loss: 0.3353073298931122, mean loss: 0.3428280827280769
Epoch: 45, step: 569, loss: 0.34009280800819397, mean loss: 0.342828041000011
Epoch: 45, step: 570, loss: 0.32403814792633057, mean loss: 0.34282775435460405
Epoch: 45, step: 571, loss: 0.2973456382751465, mean loss: 0.3428270605219814
Epoch: 45, step: 572, loss: 0.34654998779296875, mean loss: 0.34282711731461135
Epoch: 45, step: 573, loss: 0.3332701623439789, mean loss: 0.3428269715270931
Epoch: 45, step: 574, loss: 0.3410595655441284, mean loss: 0.3428269445664344
Epoch: 45, step: 575, loss: 0.31408536434173584, mean loss: 0.34282650613852206
Epoch: 45, step: 576, loss: 0.34797239303588867, mean loss: 0.3428265846333723
Epoch: 45, step: 577, loss: 0.3257649540901184, mean loss: 0.3428263243809158
Epoch: 45, step: 578, loss: 0.3461467921733856, mean loss: 0.34282637502945823
Epoch: 45, step: 579, loss: 0.3373289108276367, mean loss: 0.3428262911755198
Epoch: 45, step: 580, loss: 0.31623736023902893, mean loss: 0.3428258856153402
Epoch: 45, step: 581, loss: 0.3157139718532562, mean loss: 0.34282547208442654
Epoch: 45, step: 582, loss: 0.3122212290763855, mean loss: 0.3428250052930502
Epoch: 45, step: 583, loss: 0.36961281299591064, mean loss: 0.34282541386799537
Epoch: 45, step: 584, loss: 0.30638208985328674, mean loss: 0.3428248580329612
Epoch: 45, step: 585, loss: 0.31904488801956177, mean loss: 0.34282449534544
Epoch: 45, step: 586, loss: 0.30552658438682556, mean loss: 0.34282392649356397
Epoch: 45, step: 587, loss: 0.3278432786464691, mean loss: 0.3428236980185785
Epoch: 45, step: 588, loss: 0.2900506258010864, mean loss: 0.3428228931706745
Epoch: 45, step: 589, loss: 0.33409032225608826, mean loss: 0.34282275999131023
Epoch: 45, step: 590, loss: 0.3616962730884552, mean loss: 0.3428230478245459
Epoch: 45, step: 591, loss: 0.3397265672683716, mean loss: 0.34282300060194243
Epoch: 45, step: 592, loss: 0.336398184299469, mean loss: 0.34282290262234255
Epoch: 45, step: 593, loss: 0.33909276127815247, mean loss: 0.34282284573788613
Epoch: 45, step: 594, loss: 0.3687920868396759, mean loss: 0.3428232417613875
Epoch: 45, step: 595, loss: 0.3226642310619354, mean loss: 0.34282293434692646
Epoch: 45, step: 596, loss: 0.29626011848449707, mean loss: 0.3428222242989544
Epoch: 45, step: 597, loss: 0.34011054039001465, mean loss: 0.3428221829484419
Epoch: 45, step: 598, loss: 0.34738266468048096, mean loss: 0.34282225249024234
Epoch: 45, step: 599, loss: 0.35373377799987793, mean loss: 0.3428224188751998
Epoch: 45, step: 600, loss: 0.3248633146286011, mean loss: 0.3428221450290516
Epoch: 45, step: 601, loss: 0.3003802001476288, mean loss: 0.34282149787061056
Epoch: 45, step: 602, loss: 0.2885090708732605, mean loss: 0.3428206697226607
Epoch: 45, step: 603, loss: 0.3184766471385956, mean loss: 0.3428202985342217
Epoch: 45, step: 604, loss: 0.3449417054653168, mean loss: 0.34282033088013814
Epoch: 45, step: 605, loss: 0.28657859563827515, mean loss: 0.3428194733536044
Epoch: 45, step: 606, loss: 0.31793177127838135, mean loss: 0.342819093892704
Epoch: 45, step: 607, loss: 0.30367177724838257, mean loss: 0.3428184970256453
Epoch: 45, step: 608, loss: 0.36760595440864563, mean loss: 0.3428188749465983
Epoch: 45, step: 609, loss: 0.3796103000640869, mean loss: 0.3428194358770011
Epoch: 45, step: 610, loss: 0.3430089056491852, mean loss: 0.3428194387656561
Epoch: 45, step: 611, loss: 0.30127716064453125, mean loss: 0.34281880542198434
Epoch: 45, step: 612, loss: 0.3070933520793915, mean loss: 0.3428182607685405
Epoch: 45, step: 613, loss: 0.39538758993148804, mean loss: 0.3428190622035675
Epoch: 45, step: 614, loss: 0.34932219982147217, mean loss: 0.34281916134431933
Epoch: 45, step: 615, loss: 0.31161895394325256, mean loss: 0.3428186857023991
Epoch: 45, step: 616, loss: 0.35106539726257324, mean loss: 0.34281881142021486
Epoch: 45, step: 617, loss: 0.3106216788291931, mean loss: 0.34281832059530265
Epoch: 45, step: 618, loss: 0.32368505001068115, mean loss: 0.34281802892514635
Epoch: 45, step: 619, loss: 0.3154848515987396, mean loss: 0.34281761226085783
Epoch: 45, step: 620, loss: 0.3611624836921692, mean loss: 0.34281789190402534
Epoch: 45, step: 621, loss: 0.3724840581417084, mean loss: 0.3428183441183822
Epoch: 45, step: 622, loss: 0.3020048439502716, mean loss: 0.3428177219898184
Epoch: 45, step: 623, loss: 0.37316790223121643, mean loss: 0.3428181846167961
Epoch: 45, step: 624, loss: 0.3283292055130005, mean loss: 0.3428179637650454
Epoch: 45, step: 625, loss: 0.3089337944984436, mean loss: 0.3428174472853139
Epoch: 45, step: 626, loss: 0.33217719197273254, mean loss: 0.34281728510360593
Epoch: 45, step: 627, loss: 0.367575079202652, mean loss: 0.34281766246298434
Epoch: 45, step: 628, loss: 0.354409784078598, mean loss: 0.342817839147915
Epoch: 45, step: 629, loss: 0.3317733705043793, mean loss: 0.34281767081277337
Epoch: 45, step: 630, loss: 0.3299635946750641, mean loss: 0.3428174748993421
Epoch: 45, step: 631, loss: 0.38740748167037964, mean loss: 0.34281815450073777
Epoch: 45, step: 632, loss: 0.36599209904670715, mean loss: 0.3428185076920954
Epoch: 45, step: 633, loss: 0.3360763490200043, mean loss: 0.34281840493721577
Epoch: 45, step: 634, loss: 0.2979985177516937, mean loss: 0.34281772186341886
Epoch: 45, step: 635, loss: 0.35237741470336914, mean loss: 0.34281786755490934
Epoch: 45, step: 636, loss: 0.28528445959091187, mean loss: 0.34281699074847255
Epoch: 45, step: 637, loss: 0.3811967372894287, mean loss: 0.3428175756450945
Epoch: 45, step: 638, loss: 0.33910202980041504, mean loss: 0.34281751902207613
Epoch: 45, step: 639, loss: 0.31308212876319885, mean loss: 0.3428170658768421
Epoch: 45, step: 640, loss: 0.3461425304412842, mean loss: 0.3428171165536767
Epoch: 45, step: 641, loss: 0.3370855450630188, mean loss: 0.3428170292114517
Epoch: 45, step: 642, loss: 0.32244157791137695, mean loss: 0.3428167187189216
Epoch: 45, step: 643, loss: 0.32326921820640564, mean loss: 0.34281642084770814
Epoch: 45, step: 644, loss: 0.3385598361492157, mean loss: 0.3428163559854651
Epoch: 45, step: 645, loss: 0.34857526421546936, mean loss: 0.34281644373892
Epoch: 45, step: 646, loss: 0.35947495698928833, mean loss: 0.3428166975751955
Epoch: 45, step: 647, loss: 0.2996337413787842, mean loss: 0.34281603957927614
Epoch: 45, step: 648, loss: 0.34421879053115845, mean loss: 0.342816060953226
Epoch: 45, step: 649, loss: 0.34087029099464417, mean loss: 0.3428160313056569
Epoch: 45, step: 650, loss: 0.32900115847587585, mean loss: 0.34281582081255413
Epoch: 45, step: 651, loss: 0.3055835962295532, mean loss: 0.3428152535248807
Epoch: 45, step: 652, loss: 0.3655882477760315, mean loss: 0.34281560049963805
Epoch: 45, step: 653, loss: 0.3080965280532837, mean loss: 0.34281507151965135
Epoch: 45, step: 654, loss: 0.32886451482772827, mean loss: 0.34281485897212804
Epoch: 45, step: 655, loss: 0.33825474977493286, mean loss: 0.34281478949639527
Epoch: 45, step: 656, loss: 0.33922362327575684, mean loss: 0.342814734783867
Epoch: 45, step: 657, loss: 0.30992835760116577, mean loss: 0.3428142337573704
Epoch: 45, step: 658, loss: 0.3263486921787262, mean loss: 0.34281398290739434
Epoch: 45, step: 659, loss: 0.3368512690067291, mean loss: 0.3428138920677554
Epoch: 45, step: 660, loss: 0.3650626838207245, mean loss: 0.3428142310143247
Epoch: 45, step: 661, loss: 0.3657679557800293, mean loss: 0.3428145806947848
Epoch: 45, step: 662, loss: 0.33550822734832764, mean loss: 0.3428144693904059
Epoch: 45, step: 663, loss: 0.33283302187919617, mean loss: 0.3428143173361814
Epoch: 45, step: 664, loss: 0.30668818950653076, mean loss: 0.34281376701052324
Epoch: 45, step: 665, loss: 0.3512302339076996, mean loss: 0.3428138952204202
Epoch: 45, step: 666, loss: 0.39775508642196655, mean loss: 0.34281473213895725
Epoch: 45, step: 667, loss: 0.31183668971061707, mean loss: 0.34281426025797945
Epoch: 45, step: 668, loss: 0.3017515242099762, mean loss: 0.34281363476884713
Epoch: 45, step: 669, loss: 0.31446510553359985, mean loss: 0.342813202955759
Epoch: 45, step: 670, loss: 0.3308860957622528, mean loss: 0.34281302128134133
Epoch: 45, step: 671, loss: 0.3405953645706177, mean loss: 0.3428129875023748
Epoch: 45, step: 672, loss: 0.30778437852859497, mean loss: 0.34281245396073967
Epoch: 45, step: 673, loss: 0.34821709990501404, mean loss: 0.34281253628087166
Epoch: 45, step: 674, loss: 0.3184008300304413, mean loss: 0.3428121644629408
Epoch: 45, step: 675, loss: 0.3057025074958801, mean loss: 0.3428115992494498
Epoch: 45, step: 676, loss: 0.34423109889030457, mean loss: 0.3428116208693782
Epoch: 45, step: 677, loss: 0.30278071761131287, mean loss: 0.34281101118124796
Epoch: 45, step: 678, loss: 0.3294079899787903, mean loss: 0.34281080705049355
Epoch: 45, step: 679, loss: 0.2986771762371063, mean loss: 0.34281013489650614
Epoch: 45, step: 680, loss: 0.33883824944496155, mean loss: 0.34281007440572087
Epoch: 45, step: 681, loss: 0.3433094024658203, mean loss: 0.3428100820102419
Epoch: 45, step: 682, loss: 0.3288571536540985, mean loss: 0.3428098695172343
Epoch: 45, step: 683, loss: 0.3388410806655884, mean loss: 0.34280980907637093
Epoch: 45, step: 684, loss: 0.3592185080051422, mean loss: 0.34281005896137706
Epoch: 45, step: 685, loss: 0.3528526723384857, mean loss: 0.3428102118961283
Epoch: 45, step: 686, loss: 0.3455042243003845, mean loss: 0.34281025292148964
Epoch: 45, step: 687, loss: 0.31200459599494934, mean loss: 0.3428097838093357
Epoch: 45, step: 688, loss: 0.3405154347419739, mean loss: 0.34280974887125126
Epoch: 45, step: 689, loss: 0.3371959924697876, mean loss: 0.34280966338691443
Epoch: 45, step: 690, loss: 0.32425442337989807, mean loss: 0.3428093808384531
Epoch: 45, step: 691, loss: 0.3418422043323517, mean loss: 0.342809366111073
Epoch: 45, step: 692, loss: 0.3770132064819336, mean loss: 0.3428098869315071
Epoch: 45, step: 693, loss: 0.31928128004074097, mean loss: 0.342809528667858
Epoch: 45, step: 694, loss: 0.3180357813835144, mean loss: 0.3428091514505412
Epoch: 45, step: 695, loss: 0.35801780223846436, mean loss: 0.34280938302144665
Epoch: 45, step: 696, loss: 0.3450923562049866, mean loss: 0.3428094177820658
Epoch: 45, step: 697, loss: 0.2990204989910126, mean loss: 0.34280875106080766
Epoch: 45, step: 698, loss: 0.3471416234970093, mean loss: 0.34280881703124627
Epoch: 45, step: 699, loss: 0.33620017766952515, mean loss: 0.3428087164124984
Epoch: 45, step: 700, loss: 0.36778831481933594, mean loss: 0.34280909672946075
Epoch: 45, step: 701, loss: 0.32805928587913513, mean loss: 0.3428088721654881
Epoch: 45, step: 702, loss: 0.3370278775691986, mean loss: 0.3428087841519291
Epoch: 45, step: 703, loss: 0.34007224440574646, mean loss: 0.34280874248973214
Epoch: 45, step: 704, loss: 0.3273267447948456, mean loss: 0.34280850678907454
Epoch: 45, step: 705, loss: 0.3117203414440155, mean loss: 0.34280803350457945
Epoch: 45, step: 706, loss: 0.3126322627067566, mean loss: 0.3428075741173217
Epoch: 45, step: 707, loss: 0.35256311297416687, mean loss: 0.3428077226305792
Epoch: 45, step: 708, loss: 0.3091773986816406, mean loss: 0.3428072106677856
Epoch: 45, step: 709, loss: 0.3192104995250702, mean loss: 0.34280685145464596
Epoch: 45, step: 710, loss: 0.3248237073421478, mean loss: 0.3428065777011011
Epoch: 45, step: 711, loss: 0.3200590908527374, mean loss: 0.3428062314262602
Epoch: 45, step: 712, loss: 0.3585432767868042, mean loss: 0.3428064709806322
Epoch: 45, step: 713, loss: 0.3118142783641815, mean loss: 0.3428059992146777
Epoch: 45, step: 714, loss: 0.32011255621910095, mean loss: 0.3428056537782975
Epoch: 45, step: 715, loss: 0.35573306679725647, mean loss: 0.34280585055455515
Epoch: 45, step: 716, loss: 0.34692880511283875, mean loss: 0.34280591331167587
Epoch: 45, step: 717, loss: 0.3131507337093353, mean loss: 0.34280546192533834
Epoch: 45, step: 718, loss: 0.323353111743927, mean loss: 0.34280516584244236
Epoch: 45, step: 719, loss: 0.3337031304836273, mean loss: 0.34280502730309137
Epoch: 45, step: 720, loss: 0.36033540964126587, mean loss: 0.3428052941237233
Epoch: 45, step: 721, loss: 0.31687119603157043, mean loss: 0.34280489940060843
Epoch: 45, step: 722, loss: 0.3876080811023712, mean loss: 0.3428055813052658
Epoch: 45, step: 723, loss: 0.3482784330844879, mean loss: 0.34280566460083045
Epoch: 45, step: 724, loss: 0.33934131264686584, mean loss: 0.34280561187498076
Epoch: 45, step: 725, loss: 0.3336937725543976, mean loss: 0.3428054731990711
Epoch: 45, step: 726, loss: 0.33524203300476074, mean loss: 0.34280535809048
Epoch: 45, step: 727, loss: 0.3591374158859253, mean loss: 0.34280560664556914
Epoch: 45, step: 728, loss: 0.332875519990921, mean loss: 0.34280545552339936
Epoch: 45, step: 729, loss: 0.320839524269104, mean loss: 0.34280512123742685
Epoch: 45, step: 730, loss: 0.3454783260822296, mean loss: 0.34280516191866506
Epoch: 45, step: 731, loss: 0.3420971632003784, mean loss: 0.34280515114439675
Epoch: 45, step: 732, loss: 0.3157314360141754, mean loss: 0.3428047391450187
Epoch: 45, step: 733, loss: 0.30344948172569275, mean loss: 0.3428041402580628
Epoch: 45, step: 734, loss: 0.36106282472610474, mean loss: 0.34280441810458895
Epoch: 45, step: 735, loss: 0.33844077587127686, mean loss: 0.3428043517030698
Epoch: 45, step: 736, loss: 0.2942940890789032, mean loss: 0.34280361353391076
Epoch: 45, step: 737, loss: 0.29852595925331116, mean loss: 0.3428029397816012
Epoch: 45, step: 738, loss: 0.29640600085258484, mean loss: 0.3428022337918733
Epoch: 45, step: 739, loss: 0.33064424991607666, mean loss: 0.34280204879516185
Epoch: 45, step: 740, loss: 0.3323715031147003, mean loss: 0.3428018900856827
Epoch: 45, step: 741, loss: 0.3063301146030426, mean loss: 0.3428013351455487
Epoch: 45, step: 742, loss: 0.3752114176750183, mean loss: 0.34280182827706324
Epoch: 45, step: 743, loss: 0.36918312311172485, mean loss: 0.3428022296722132
Epoch: 45, step: 744, loss: 0.398105263710022, mean loss: 0.3428030711029327
Epoch: 45, step: 745, loss: 0.3471672534942627, mean loss: 0.3428031375025674
Epoch: 45, step: 746, loss: 0.3339988887310028, mean loss: 0.34280300355078547
Epoch: 45, step: 747, loss: 0.2812521457672119, mean loss: 0.3428020671027301
Epoch: 45, step: 748, loss: 0.3687005937099457, mean loss: 0.3428024611225175
Epoch: 45, step: 749, loss: 0.3247006833553314, mean loss: 0.3428021857265375
Epoch: 45, step: 750, loss: 0.3306918740272522, mean loss: 0.3428020014860467
Epoch: 45, step: 751, loss: 0.3531970977783203, mean loss: 0.34280215962966465
Epoch: 45, step: 752, loss: 0.32828328013420105, mean loss: 0.3428019387530959
Epoch: 45, step: 753, loss: 0.2856042981147766, mean loss: 0.34280106861525794
Epoch: 45, step: 754, loss: 0.37430137395858765, mean loss: 0.34280154781667793
Epoch: 45, step: 755, loss: 0.3196662664413452, mean loss: 0.3428011958743423
Epoch: 45, step: 756, loss: 0.3027310073375702, mean loss: 0.34280058632129706
Epoch: 45, step: 757, loss: 0.33188772201538086, mean loss: 0.342800420315877
Epoch: 45, step: 758, loss: 0.342388391494751, mean loss: 0.34280041404823036
Epoch: 45, step: 759, loss: 0.3338616192340851, mean loss: 0.3428002780762983
Epoch: 45, step: 760, loss: 0.3019600510597229, mean loss: 0.342799656847126
Epoch: 45, step: 761, loss: 0.2950506806373596, mean loss: 0.34279893053858335
Epoch: 45, step: 762, loss: 0.36901992559432983, mean loss: 0.3427993293794494
Epoch: 45, step: 763, loss: 0.3206222951412201, mean loss: 0.34279899205537057
Epoch: 45, step: 764, loss: 0.28936445713043213, mean loss: 0.34279817930101775
Epoch: 45, step: 765, loss: 0.3290230929851532, mean loss: 0.3427979697812551
Epoch: 45, step: 766, loss: 0.33280491828918457, mean loss: 0.3427978177887461
Epoch: 45, step: 767, loss: 0.3129900395870209, mean loss: 0.3427973644247167
Epoch: 45, step: 768, loss: 0.33937251567840576, mean loss: 0.34279731233497013
Epoch: 45, step: 769, loss: 0.3852579891681671, mean loss: 0.34279795812473185
Epoch: 45, step: 770, loss: 0.3380033075809479, mean loss: 0.3427978852033992
Epoch: 45, step: 771, loss: 0.3239503800868988, mean loss: 0.34279759855804826
Epoch: 45, step: 772, loss: 0.342655211687088, mean loss: 0.3427975963925673
Epoch: 45, step: 773, loss: 0.3206256031990051, mean loss: 0.3427972591964546
Epoch: 45, step: 774, loss: 0.3191535174846649, mean loss: 0.3427968996231642
Epoch: 45, step: 775, loss: 0.33371034264564514, mean loss: 0.34279676143718907
Epoch: 45, step: 776, loss: 0.31455308198928833, mean loss: 0.3427963319212524
Epoch: 45, step: 777, loss: 0.31773537397384644, mean loss: 0.34279595081236913
Epoch: 45, step: 778, loss: 0.33939337730407715, mean loss: 0.3427958990692844
Epoch: 45, step: 779, loss: 0.3689923882484436, mean loss: 0.3427962974343875
Epoch: 45, step: 780, loss: 0.3757200837135315, mean loss: 0.3427967980926238
Epoch: 45, step: 781, loss: 0.3292435109615326, mean loss: 0.34279659199659374
Epoch: 45, step: 782, loss: 0.3421383798122406, mean loss: 0.342796581987741
Epoch: 45, step: 783, loss: 0.3545711636543274, mean loss: 0.3427967610307078
Epoch: 45, step: 784, loss: 0.35462960600852966, mean loss: 0.34279694095688396
Epoch: 45, step: 785, loss: 0.37886375188827515, mean loss: 0.34279748936808324
Epoch: 45, step: 786, loss: 0.3687278926372528, mean loss: 0.3427978836448979
Epoch: 45, step: 787, loss: 0.3412298262119293, mean loss: 0.34279785980264277
Epoch: 45, step: 788, loss: 0.3490968942642212, mean loss: 0.3427979555777718
Epoch: 45, step: 789, loss: 0.3211762011051178, mean loss: 0.3427976268297944
Epoch: 45, step: 790, loss: 0.3130037486553192, mean loss: 0.3427971738356454
Epoch: 45, step: 791, loss: 0.33078545331954956, mean loss: 0.34279699120898793
Epoch: 45, step: 792, loss: 0.3333097994327545, mean loss: 0.34279684696755486
Epoch: 45, step: 793, loss: 0.337787926197052, mean loss: 0.34279677081404786
Epoch: 45, step: 794, loss: 0.3734592795372009, mean loss: 0.3427972369867384
Epoch: 45, step: 795, loss: 0.3702956736087799, mean loss: 0.34279765504859416
Epoch: 45, step: 796, loss: 0.33050331473350525, mean loss: 0.3427974681391833
Epoch: 45, step: 797, loss: 0.3314652144908905, mean loss: 0.3427972958588822
Epoch: 45, step: 798, loss: 0.3340274393558502, mean loss: 0.3427971625358383
Epoch: 45, step: 799, loss: 0.35821405053138733, mean loss: 0.3427973969062852
Epoch: 45, step: 800, loss: 0.36123883724212646, mean loss: 0.3427976772522869
Epoch: 45, step: 801, loss: 0.3367255628108978, mean loss: 0.3427975849456613
Epoch: 45, step: 802, loss: 0.2945910096168518, mean loss: 0.3427968521336076
Epoch: 45, step: 803, loss: 0.3060539662837982, mean loss: 0.3427962935952723
Epoch: 45, step: 804, loss: 0.3357055187225342, mean loss: 0.34279618580816473
Epoch: 45, step: 805, loss: 0.32964348793029785, mean loss: 0.3427959858766006
Epoch: 45, step: 806, loss: 0.35518166422843933, mean loss: 0.34279617414599045
Epoch: 45, step: 807, loss: 0.36362406611442566, mean loss: 0.34279649073704
Epoch: 45, step: 808, loss: 0.31360381841659546, mean loss: 0.34279604700522587
Epoch: 45, step: 809, loss: 0.33205685019493103, mean loss: 0.3427958837707402
Epoch: 45, step: 810, loss: 0.3115703761577606, mean loss: 0.3427954091540356
Epoch: 45, step: 811, loss: 0.38775724172592163, mean loss: 0.34279609254764837
Epoch: 45, step: 812, loss: 0.3440738916397095, mean loss: 0.34279611196915355
Epoch: 45, step: 813, loss: 0.33025360107421875, mean loss: 0.3427959213361035
Epoch: 45, step: 814, loss: 0.3125460147857666, mean loss: 0.34279546157614377
Epoch: 45, step: 815, loss: 0.3235717713832855, mean loss: 0.34279516940503624
Epoch: 45, step: 816, loss: 0.3383060395717621, mean loss: 0.34279510117806794
Epoch: 45, step: 817, loss: 0.3070014715194702, mean loss: 0.3427945571853986
Epoch: 45, step: 818, loss: 0.3147987127304077, mean loss: 0.3427941317101717
Epoch: 45, step: 819, loss: 0.349043607711792, mean loss: 0.34279422668701065
Epoch: 45, step: 820, loss: 0.31407222151756287, mean loss: 0.3427937901890065
Epoch: 45, step: 821, loss: 0.3213155269622803, mean loss: 0.34279346378155345
Epoch: 45, step: 822, loss: 0.32562950253486633, mean loss: 0.34279320294297094
Epoch: 45, step: 823, loss: 0.343539297580719, mean loss: 0.342793214281106
Epoch: 45, step: 824, loss: 0.33095061779022217, mean loss: 0.3427930343161111
Epoch: 45, step: 825, loss: 0.2915334403514862, mean loss: 0.3427922553659551
Epoch: 45, step: 826, loss: 0.352047860622406, mean loss: 0.34279239601368644
Epoch: 45, step: 827, loss: 0.31749969720840454, mean loss: 0.34279201167289497
Epoch: 45, step: 828, loss: 0.32091182470321655, mean loss: 0.3427916791927331
Epoch: 45, step: 829, loss: 0.3389139473438263, mean loss: 0.34279162026959303
Epoch: 45, step: 830, loss: 0.3724622428417206, mean loss: 0.34279207111553933
Epoch: 45, step: 831, loss: 0.3474843502044678, mean loss: 0.342792142413769
Epoch: 45, step: 832, loss: 0.2913496792316437, mean loss: 0.3427913607678452
Epoch: 45, step: 833, loss: 0.3414747714996338, mean loss: 0.3427913407631461
Epoch: 45, step: 834, loss: 0.3289494812488556, mean loss: 0.3427911304484836
Epoch: 45, step: 835, loss: 0.3266075551509857, mean loss: 0.3427908845572824
Epoch: 45, step: 836, loss: 0.31243738532066345, mean loss: 0.3427904233770518
Epoch: 45, step: 837, loss: 0.3427557945251465, mean loss: 0.3427904228509214
Epoch: 45, step: 838, loss: 0.3475808799266815, mean loss: 0.34279049563320424
Epoch: 45, step: 839, loss: 0.33094581961631775, mean loss: 0.3427903156776282
Epoch: 45, step: 840, loss: 0.32562828063964844, mean loss: 0.34279005493964126
Epoch: 45, step: 841, loss: 0.29385870695114136, mean loss: 0.3427893115506833
Epoch: 45, step: 842, loss: 0.35292354226112366, mean loss: 0.34278946551253114
Epoch: 45, step: 843, loss: 0.3139851987361908, mean loss: 0.34278902791732613
Epoch: 45, step: 844, loss: 0.297975093126297, mean loss: 0.34278834711315154
Epoch: 45, step: 845, loss: 0.32709208130836487, mean loss: 0.3427881086622992
Epoch: 45, step: 846, loss: 0.32453909516334534, mean loss: 0.34278783143542424
Epoch: 45, step: 847, loss: 0.3386520445346832, mean loss: 0.34278776860825494
Epoch: 45, step: 848, loss: 0.28976860642433167, mean loss: 0.3427869632008785
Epoch: 45, step: 849, loss: 0.3557227849960327, mean loss: 0.34278715970432366
Epoch: 45, step: 850, loss: 0.32751232385635376, mean loss: 0.3427869276732768
Epoch: 45, step: 851, loss: 0.32919666171073914, mean loss: 0.3427867212346761
Epoch: 45, step: 852, loss: 0.3372279703617096, mean loss: 0.3427866367975264
Epoch: 45, step: 853, loss: 0.28702130913734436, mean loss: 0.34278578973783597
Epoch: 45, step: 854, loss: 0.3301427960395813, mean loss: 0.34278559769722383
Epoch: 45, step: 855, loss: 0.3579745888710022, mean loss: 0.3427858284067319
Epoch: 45, step: 856, loss: 0.3425128757953644, mean loss: 0.3427858242608472
Epoch: 45, step: 857, loss: 0.3683322072029114, mean loss: 0.3427862122796652
Epoch: 45, step: 858, loss: 0.32841843366622925, mean loss: 0.3427859940537108
Epoch: 45, step: 859, loss: 0.3147940933704376, mean loss: 0.3427855689033359
Epoch: 45, step: 860, loss: 0.3151260316371918, mean loss: 0.3427851488073886
Epoch: 45, step: 861, loss: 0.3254720866680145, mean loss: 0.34278488585878225
Epoch: 45, step: 862, loss: 0.33771470189094543, mean loss: 0.3427848088546365
Epoch: 45, step: 863, loss: 0.31466957926750183, mean loss: 0.3427843818570424
Epoch: 45, step: 864, loss: 0.31118446588516235, mean loss: 0.3427839019433668
Epoch: 45, step: 865, loss: 0.36139577627182007, mean loss: 0.34278418460099713
Epoch: 45, step: 866, loss: 0.3619811534881592, mean loss: 0.3427844761400025
Epoch: 45, step: 867, loss: 0.3463217616081238, mean loss: 0.34278452985895325
Epoch: 45, step: 868, loss: 0.34706825017929077, mean loss: 0.3427845949126415
Epoch: 45, step: 869, loss: 0.35394349694252014, mean loss: 0.3427847643720497
Epoch: 45, step: 870, loss: 0.364568293094635, mean loss: 0.34278509517232186
Epoch: 45, step: 871, loss: 0.3561798334121704, mean loss: 0.3427852985790254
Epoch: 45, step: 872, loss: 0.33143770694732666, mean loss: 0.3427851262620219
Epoch: 45, step: 873, loss: 0.3413276970386505, mean loss: 0.342785104130804
Epoch: 45, step: 874, loss: 0.2893463671207428, mean loss: 0.34278429267021615
Epoch: 45, step: 875, loss: 0.3358222246170044, mean loss: 0.3427841869536823
Epoch: 45, step: 876, loss: 0.34434840083122253, mean loss: 0.34278421070535453
Epoch: 45, step: 877, loss: 0.3293636739253998, mean loss: 0.34278400692545263
Epoch: 45, step: 878, loss: 0.31561318039894104, mean loss: 0.3427835943648834
Epoch: 45, step: 879, loss: 0.31692397594451904, mean loss: 0.3427832017195992
Epoch: 45, step: 880, loss: 0.3145390748977661, mean loss: 0.3427827728751112
Epoch: 45, step: 881, loss: 0.32772043347358704, mean loss: 0.3427825441796662
Epoch: 45, step: 882, loss: 0.34454798698425293, mean loss: 0.3427825709844398
Epoch: 45, step: 883, loss: 0.32756730914115906, mean loss: 0.34278233997414825
Epoch: 45, step: 884, loss: 0.32508713006973267, mean loss: 0.34278207131537797
Epoch: 45, step: 885, loss: 0.3247915506362915, mean loss: 0.342781798177178
Epoch: 45, step: 886, loss: 0.3217020332813263, mean loss: 0.3427814781418812
Epoch: 45, step: 887, loss: 0.3105684220790863, mean loss: 0.34278098908716476
Epoch: 45, step: 888, loss: 0.3559302091598511, mean loss: 0.34278118871400093
Epoch: 45, step: 889, loss: 0.35095205903053284, mean loss: 0.34278131275939816
Epoch: 45, step: 890, loss: 0.3088010549545288, mean loss: 0.3427807968987341
Epoch: 45, step: 891, loss: 0.3400743007659912, mean loss: 0.34278075581153267
Epoch: 45, step: 892, loss: 0.2955782413482666, mean loss: 0.34278003924306816
Epoch: 45, step: 893, loss: 0.32973435521125793, mean loss: 0.3427798412031126
Epoch: 45, step: 894, loss: 0.3244374990463257, mean loss: 0.34277956276148597
Epoch: 45, step: 895, loss: 0.2947096526622772, mean loss: 0.3427788330585578
Epoch: 45, step: 896, loss: 0.32724255323410034, mean loss: 0.3427785972208629
Epoch: 45, step: 897, loss: 0.30981752276420593, mean loss: 0.34277809688578204
Epoch: 45, step: 898, loss: 0.34140872955322266, mean loss: 0.3427780760996843
Epoch: 45, step: 899, loss: 0.35459208488464355, mean loss: 0.342778255425865
Epoch: 45, step: 900, loss: 0.32759585976600647, mean loss: 0.3427780249740555
Epoch: 45, step: 901, loss: 0.34168925881385803, mean loss: 0.34277800844805206
Epoch: 45, step: 902, loss: 0.3629905581474304, mean loss: 0.3427783152426683
Epoch: 45, step: 903, loss: 0.3211105465888977, mean loss: 0.342777986365116
Epoch: 45, step: 904, loss: 0.3413146436214447, mean loss: 0.3427779641545561
Epoch: 45, step: 905, loss: 0.3413773775100708, mean loss: 0.34277794289682845
Epoch: 45, step: 906, loss: 0.3318714201450348, mean loss: 0.34277777736306986
Epoch: 45, step: 907, loss: 0.30158594250679016, mean loss: 0.34277715218344906
Epoch: 45, step: 908, loss: 0.37646540999412537, mean loss: 0.34277766347149125
Epoch: 45, step: 909, loss: 0.3276463747024536, mean loss: 0.34277743382679904
Epoch: 45, step: 910, loss: 0.30172285437583923, mean loss: 0.3427768107587101
Epoch: 45, step: 911, loss: 0.3439820110797882, mean loss: 0.342776829049251
Epoch: 45, step: 912, loss: 0.33434683084487915, mean loss: 0.34277670111459624
Epoch: 45, step: 913, loss: 0.31452861428260803, mean loss: 0.34277627242477876
Epoch: 45, step: 914, loss: 0.32759758830070496, mean loss: 0.3427760420782559
Epoch: 45, step: 915, loss: 0.3254605233669281, mean loss: 0.34277577930784936
Epoch: 45, step: 916, loss: 0.343474417924881, mean loss: 0.3427757899098285
Epoch: 45, step: 917, loss: 0.3062822222709656, mean loss: 0.3427752361211302
Epoch: 45, step: 918, loss: 0.375485360622406, mean loss: 0.34277573248866994
Epoch: 45, step: 919, loss: 0.36528775095939636, mean loss: 0.3427760740974479
Epoch: 45, step: 920, loss: 0.32469043135643005, mean loss: 0.3427757996609031
Epoch: 45, step: 921, loss: 0.35376814007759094, mean loss: 0.3427759664591857
Epoch: 45, step: 922, loss: 0.36441078782081604, mean loss: 0.34277629474198557
Epoch: 45, step: 923, loss: 0.33570125699043274, mean loss: 0.3427761873882931
Epoch: 45, step: 924, loss: 0.3125397264957428, mean loss: 0.3427757285997202
Epoch: 45, step: 925, loss: 0.34071603417396545, mean loss: 0.3427756973477185
Epoch: 45, step: 926, loss: 0.3141254782676697, mean loss: 0.34277526264094865
Epoch: 45, step: 927, loss: 0.3178114593029022, mean loss: 0.3427748838735253
Epoch: 45, step: 928, loss: 0.30705198645591736, mean loss: 0.3427743418701962
Epoch: 45, step: 929, loss: 0.3375260531902313, mean loss: 0.34277426224208696
Epoch: 45, step: 930, loss: 0.3196457624435425, mean loss: 0.34277391133708174
Epoch: 45, step: 931, loss: 0.29255837202072144, mean loss: 0.34277314947976717
Epoch: 45, step: 932, loss: 0.3182108998298645, mean loss: 0.3427727768332536
Epoch: 45, step: 933, loss: 0.33721911907196045, mean loss: 0.3427726925771356
Epoch: 45, step: 934, loss: 0.34339189529418945, mean loss: 0.3427727019710932
Epoch: 45, step: 935, loss: 0.3396477699279785, mean loss: 0.3427726545633008
Epoch: 45, step: 936, loss: 0.3068417012691498, mean loss: 0.3427721094694207
Epoch: 45, step: 937, loss: 0.32511916756629944, mean loss: 0.3427718416678809
Epoch: 45, step: 938, loss: 0.35392484068870544, mean loss: 0.34277201086035985
Epoch: 45, step: 939, loss: 0.31972700357437134, mean loss: 0.3427716612698367
Epoch: 45, step: 940, loss: 0.30694305896759033, mean loss: 0.34277111776166325
Epoch: 45, step: 941, loss: 0.3115884065628052, mean loss: 0.3427706447373133
Epoch: 45, step: 942, loss: 0.31591570377349854, mean loss: 0.34277023736900536
Epoch: 45, step: 943, loss: 0.29227006435394287, mean loss: 0.3427694713327664
Epoch: 45, step: 944, loss: 0.3330540359020233, mean loss: 0.3427693239617322
Epoch: 45, step: 945, loss: 0.34006017446517944, mean loss: 0.34276928286793773
Epoch: 45, step: 946, loss: 0.33370453119277954, mean loss: 0.34276914537113556
Epoch: 45, step: 947, loss: 0.32282155752182007, mean loss: 0.34276884280488373
Epoch: 45, step: 948, loss: 0.34153202176094055, mean loss: 0.3427688240449899
Epoch: 45, step: 949, loss: 0.3139759302139282, mean loss: 0.34276838732583575
Epoch: 45, step: 950, loss: 0.3220124840736389, mean loss: 0.34276807251333097
Epoch: 45, step: 951, loss: 0.33839598298072815, mean loss: 0.3427680062012286
Epoch: 45, step: 952, loss: 0.34349048137664795, mean loss: 0.3427680171589459
Epoch: 45, step: 953, loss: 0.31179553270339966, mean loss: 0.34276754740912857
Epoch: 45, step: 954, loss: 0.31909695267677307, mean loss: 0.34276718841019427
Epoch: 45, step: 955, loss: 0.3744426667690277, mean loss: 0.3427676688075244
Epoch: 45, step: 956, loss: 0.2967396080493927, mean loss: 0.3427669707463333
Epoch: 45, step: 957, loss: 0.3251316249370575, mean loss: 0.3427667032928799
Epoch: 45, step: 958, loss: 0.37018883228302, mean loss: 0.34276711916404856
Epoch: 45, step: 959, loss: 0.2926008403301239, mean loss: 0.3427663583772904
Epoch: 45, step: 960, loss: 0.3299940526485443, mean loss: 0.3427661646843569
Epoch: 45, step: 961, loss: 0.360969603061676, mean loss: 0.34276644073662066
Epoch: 45, step: 962, loss: 0.30492833256721497, mean loss: 0.3427658669363967
Epoch: 45, step: 963, loss: 0.31451013684272766, mean loss: 0.3427654384557147
Epoch: 45, step: 964, loss: 0.3215569257736206, mean loss: 0.3427651168466059
Epoch: 45, step: 965, loss: 0.3544289469718933, mean loss: 0.3427652937160161
Epoch: 45, step: 966, loss: 0.2953520119190216, mean loss: 0.34276457475561156
Epoch: 45, step: 967, loss: 0.34222277998924255, mean loss: 0.34276456654012716
Epoch: 45, step: 968, loss: 0.3901154398918152, mean loss: 0.3427652845324144
Epoch: 45, step: 969, loss: 0.3342273533344269, mean loss: 0.3427651550717442
Epoch: 45, step: 970, loss: 0.3357691764831543, mean loss: 0.34276504899331345
Epoch: 45, step: 971, loss: 0.3220396637916565, mean loss: 0.34276473474378044
Epoch: 45, step: 972, loss: 0.312740683555603, mean loss: 0.34276427950973215
Epoch: 45, step: 973, loss: 0.332391619682312, mean loss: 0.3427641222386064
Epoch: 45, step: 974, loss: 0.29958680272102356, mean loss: 0.3427634675904445
Epoch: 45, step: 975, loss: 0.3418985903263092, mean loss: 0.34276345447750156
Epoch: 45, step: 976, loss: 0.30746862292289734, mean loss: 0.34276291935868847
Epoch: 45, step: 977, loss: 0.32421624660491943, mean loss: 0.3427626381695567
Epoch: 45, step: 978, loss: 0.3283616006374359, mean loss: 0.3427624198363871
Epoch: 45, step: 979, loss: 0.2984534204006195, mean loss: 0.3427617480807862
Epoch: 45, step: 980, loss: 0.34311795234680176, mean loss: 0.34276175348101157
Epoch: 45, step: 981, loss: 0.3193473815917969, mean loss: 0.34276139851342585
Epoch: 45, step: 982, loss: 0.2919307053089142, mean loss: 0.3427606279194079
Epoch: 45, step: 983, loss: 0.3029867708683014, mean loss: 0.34276002495632124
Epoch: 45, step: 984, loss: 0.3804597556591034, mean loss: 0.3427605964674363
Epoch: 45, step: 985, loss: 0.34172961115837097, mean loss: 0.34276058083839545
Epoch: 45, step: 986, loss: 0.3380449116230011, mean loss: 0.34276050935311925
Epoch: 45, step: 987, loss: 0.3698411285877228, mean loss: 0.34276091986456775
Epoch: 45, step: 988, loss: 0.3296133875846863, mean loss: 0.3427607205659232
Epoch: 45, step: 989, loss: 0.4169580042362213, mean loss: 0.3427618452784239
Epoch: 45, step: 990, loss: 0.3278723657131195, mean loss: 0.34276161958107865
Epoch: 45, step: 991, loss: 0.3422659635543823, mean loss: 0.34276161206795147
Epoch: 45, step: 992, loss: 0.34376198053359985, mean loss: 0.3427616272312526
Epoch: 45, step: 993, loss: 0.3649918735027313, mean loss: 0.3427619641859055
Epoch: 45, step: 994, loss: 0.30121129751205444, mean loss: 0.34276133439179146
Epoch: 45, step: 995, loss: 0.30732032656669617, mean loss: 0.3427607972114861
Epoch: 45, step: 996, loss: 0.3717525899410248, mean loss: 0.3427612366342051
Epoch: 45, step: 997, loss: 0.33266836404800415, mean loss: 0.3427610836609021
Epoch: 45, step: 998, loss: 0.3581445515155792, mean loss: 0.3427613168179347
Epoch: 45, step: 999, loss: 0.3769402801990509, mean loss: 0.342761834837992
Epoch: 45, step: 1000, loss: 0.3484845459461212, mean loss: 0.34276192157070456
Epoch: 45, step: 1001, loss: 0.32513144612312317, mean loss: 0.34276165436941564
Epoch: 45, step: 1002, loss: 0.37090328335762024, mean loss: 0.34276208086758925
Epoch: 45, step: 1003, loss: 0.2977193295955658, mean loss: 0.34276139823617446
Epoch: 45, step: 1004, loss: 0.32873621582984924, mean loss: 0.34276118568510366
Epoch: 45, step: 1005, loss: 0.3338753283023834, mean loss: 0.34276105102233606
Epoch: 45, step: 1006, loss: 0.3089286983013153, mean loss: 0.3427605383099424
Epoch: 45, step: 1007, loss: 0.31359559297561646, mean loss: 0.3427600963364725
Epoch: 45, step: 1008, loss: 0.3225879967212677, mean loss: 0.3427597906476514
Epoch: 45, step: 1009, loss: 0.32735809683799744, mean loss: 0.3427595572532915
Epoch: 45, step: 1010, loss: 0.3409501016139984, mean loss: 0.3427595298335579
Epoch: 45, step: 1011, loss: 0.35721176862716675, mean loss: 0.34275974883341837
Epoch: 45, step: 1012, loss: 0.32064154744148254, mean loss: 0.34275941367360757
Epoch: 45, step: 1013, loss: 0.307171493768692, mean loss: 0.3427588744136763
Epoch: 45, step: 1014, loss: 0.34573403000831604, mean loss: 0.34275891949520665
Epoch: 45, step: 1015, loss: 0.29800137877464294, mean loss: 0.34275824130954813
Epoch: 45, step: 1016, loss: 0.33688098192214966, mean loss: 0.3427581522561156
Epoch: 45, step: 1017, loss: 0.3382573127746582, mean loss: 0.34275808405951147
Epoch: 45, step: 1018, loss: 0.34938672184944153, mean loss: 0.3427581844949391
Epoch: 45, step: 1019, loss: 0.3032990097999573, mean loss: 0.34275758662865585
Epoch: 45, step: 1020, loss: 0.31351861357688904, mean loss: 0.34275714362062487
Epoch: 45, step: 1021, loss: 0.32335615158081055, mean loss: 0.34275684967510744
Epoch: 45, step: 1022, loss: 0.3401709794998169, mean loss: 0.3427568104970371
Epoch: 45, step: 1023, loss: 0.373489111661911, mean loss: 0.3427572761097449
Epoch: 45, step: 1024, loss: 0.3710086941719055, mean loss: 0.342757704129108
Epoch: 45, step: 1025, loss: 0.36336418986320496, mean loss: 0.3427580163202078
Epoch: 45, step: 1026, loss: 0.346526563167572, mean loss: 0.34275807341334713
Epoch: 45, step: 1027, loss: 0.3214229941368103, mean loss: 0.3427577501937483
Epoch: 45, step: 1028, loss: 0.3180404007434845, mean loss: 0.34275737573951554
Epoch: 45, step: 1029, loss: 0.32471364736557007, mean loss: 0.3427571023911081
Epoch: 45, step: 1030, loss: 0.30082136392593384, mean loss: 0.3427564671070121
Epoch: 45, step: 1031, loss: 0.3394113779067993, mean loss: 0.3427564164330558
Epoch: 45, step: 1032, loss: 0.31901904940605164, mean loss: 0.34275605684680727
Epoch: 45, step: 1033, loss: 0.3571236729621887, mean loss: 0.3427562744917934
Epoch: 45, step: 1034, loss: 0.3135431110858917, mean loss: 0.34275583196867887
Epoch: 45, step: 1035, loss: 0.3550117015838623, mean loss: 0.342756017618667
Epoch: 45, step: 1036, loss: 0.32358118891716003, mean loss: 0.342755727165773
Epoch: 45, step: 1037, loss: 0.32773175835609436, mean loss: 0.34275549959194757
Epoch: 45, step: 1038, loss: 0.3587036728858948, mean loss: 0.3427557411613941
Epoch: 45, step: 1039, loss: 0.35058316588401794, mean loss: 0.3427558597228107
Epoch: 45, step: 1040, loss: 0.3253314793109894, mean loss: 0.342755595801022
Epoch: 45, step: 1041, loss: 0.35140281915664673, mean loss: 0.3427557267758994
Epoch: 45, step: 1042, loss: 0.337263822555542, mean loss: 0.34275564359421695
Epoch: 45, step: 1043, loss: 0.2896440327167511, mean loss: 0.3427548391653596
Epoch: 45, step: 1044, loss: 0.40052708983421326, mean loss: 0.3427557141710494
Epoch: 45, step: 1045, loss: 0.33005616068840027, mean loss: 0.3427555218293433
Epoch: 45, step: 1046, loss: 0.327111154794693, mean loss: 0.34275528489040874
Epoch: 45, step: 1047, loss: 0.3945803940296173, mean loss: 0.3427560697863489
Epoch: 45, step: 1048, loss: 0.32264453172683716, mean loss: 0.34275576519990875
Epoch: 45, step: 1049, loss: 0.31141066551208496, mean loss: 0.34275529048993314
Epoch: 45, step: 1050, loss: 0.299434632062912, mean loss: 0.34275463442447257
Epoch: 45, step: 1051, loss: 0.3120059370994568, mean loss: 0.34275416876089543
Epoch: 45, step: 1052, loss: 0.29842668771743774, mean loss: 0.3427534974680412
Epoch: 45, step: 1053, loss: 0.3254576623439789, mean loss: 0.34275323554486337
Epoch: 45, step: 1054, loss: 0.33325716853141785, mean loss: 0.34275309174131957
Epoch: 45, step: 1055, loss: 0.35235127806663513, mean loss: 0.3427532370891045
Epoch: 45, step: 1056, loss: 0.34238141775131226, mean loss: 0.3427532314586346
Epoch: 45, step: 1057, loss: 0.33926406502723694, mean loss: 0.34275317862289717
Epoch: 45, step: 1058, loss: 0.3365898132324219, mean loss: 0.3427530852937221
Epoch: 45, step: 1059, loss: 0.32066795229911804, mean loss: 0.34275275087317403
Epoch: 45, step: 1060, loss: 0.32644736766815186, mean loss: 0.3427525039752893
Epoch: 45, step: 1061, loss: 0.32396191358566284, mean loss: 0.34275221945043555
Epoch: 45, step: 1062, loss: 0.31007713079452515, mean loss: 0.34275172469567494
Epoch: 45, step: 1063, loss: 0.3440922200679779, mean loss: 0.3427517449926796
Epoch: 45, step: 1064, loss: 0.37522950768470764, mean loss: 0.3427522367447076
Epoch: 45, step: 1065, loss: 0.37116095423698425, mean loss: 0.34275266688002987
Epoch: 45, step: 1066, loss: 0.35284751653671265, mean loss: 0.34275281972345434
Epoch: 45, step: 1067, loss: 0.3463863432407379, mean loss: 0.34275287473683125
Epoch: 45, step: 1068, loss: 0.32237204909324646, mean loss: 0.3427525661655335
Epoch: 45, step: 1069, loss: 0.34798890352249146, mean loss: 0.3427526454439189
Epoch: 45, step: 1070, loss: 0.3063400387763977, mean loss: 0.3427520941637465
Epoch: 45, step: 1071, loss: 0.4057489335536957, mean loss: 0.3427530479098767
Epoch: 45, step: 1072, loss: 0.34297001361846924, mean loss: 0.3427530511945982
Epoch: 45, step: 1073, loss: 0.34919866919517517, mean loss: 0.34275314877563795
Epoch: 45, step: 1074, loss: 0.3573339283466339, mean loss: 0.34275336951259305
Epoch: 45, step: 1075, loss: 0.29352402687072754, mean loss: 0.3427526242458097
Epoch: 45, step: 1076, loss: 0.3276815414428711, mean loss: 0.34275239609311126
Epoch: 45, step: 1077, loss: 0.32045963406562805, mean loss: 0.3427520586205564
Epoch: 45, step: 1078, loss: 0.33385100960731506, mean loss: 0.34275192387663034
Epoch: 45, step: 1079, loss: 0.3065283000469208, mean loss: 0.34275137553233986
Epoch: 45, step: 1080, loss: 0.31302890181541443, mean loss: 0.34275092560766846
Epoch: 45, step: 1081, loss: 0.3815667927265167, mean loss: 0.3427515131749101
Epoch: 45, step: 1082, loss: 0.3018284738063812, mean loss: 0.34275089372015677
Epoch: 45, step: 1083, loss: 0.3278850018978119, mean loss: 0.3427506686975753
Epoch: 45, step: 1084, loss: 0.34210169315338135, mean loss: 0.34275065887428696
Epoch: 45, step: 1085, loss: 0.34684082865715027, mean loss: 0.342750720784646
Epoch: 45, step: 1086, loss: 0.3198947608470917, mean loss: 0.34275037483341564
Epoch: 45, step: 1087, loss: 0.3212394416332245, mean loss: 0.3427500492456394
Epoch: 45, step: 1088, loss: 0.37080079317092896, mean loss: 0.3427504738130451
Epoch: 45, step: 1089, loss: 0.37167322635650635, mean loss: 0.3427509115722784
Epoch: 45, step: 1090, loss: 0.3416535258293152, mean loss: 0.34275089496308914
Epoch: 45, step: 1091, loss: 0.3041738271713257, mean loss: 0.3427503110990046
Epoch: 45, step: 1092, loss: 0.3463633358478546, mean loss: 0.3427503657813219
Epoch: 45, step: 1093, loss: 0.35499101877212524, mean loss: 0.3427505510380491
Epoch: 45, step: 1094, loss: 0.36715757846832275, mean loss: 0.3427509204217408
Epoch: 45, step: 1095, loss: 0.4021795690059662, mean loss: 0.3427518198201394
Epoch: 45, step: 1096, loss: 0.34411919116973877, mean loss: 0.3427518405137446
Epoch: 45, step: 1097, loss: 0.36681947112083435, mean loss: 0.34275220474436
Epoch: 45, step: 1098, loss: 0.3513373136520386, mean loss: 0.34275233466625515
Epoch: 45, step: 1099, loss: 0.32553717494010925, mean loss: 0.3427520741462835
Epoch: 45, step: 1100, loss: 0.34300634264945984, mean loss: 0.3427520779941142
Epoch: 45, step: 1101, loss: 0.3385680615901947, mean loss: 0.342752014678591
Epoch: 45, step: 1102, loss: 0.33987289667129517, mean loss: 0.34275197111038125
Epoch: 45, step: 1103, loss: 0.3100166618824005, mean loss: 0.3427514757513045
Epoch: 45, step: 1104, loss: 0.32512611150741577, mean loss: 0.342751209043818
Epoch: 45, step: 1105, loss: 0.3332933485507965, mean loss: 0.34275106592938387
Epoch: 45, step: 1106, loss: 0.3078904449939728, mean loss: 0.34275053843349307
Epoch: 45, step: 1107, loss: 0.38299497961997986, mean loss: 0.342751147385817
Epoch: 45, step: 1108, loss: 0.3356117904186249, mean loss: 0.34275103935941376
Epoch: 45, step: 1109, loss: 0.3223313093185425, mean loss: 0.3427507303908854
Epoch: 45, step: 1110, loss: 0.3059345781803131, mean loss: 0.3427501733384545
Epoch: 45, step: 1111, loss: 0.3151906430721283, mean loss: 0.34274975635106925
Epoch: 45, step: 1112, loss: 0.3984156847000122, mean loss: 0.34275059858743845
Epoch: 45, step: 1113, loss: 0.3153207004070282, mean loss: 0.34275018357400033
Epoch: 45, step: 1114, loss: 0.3083658814430237, mean loss: 0.342749663348535
Epoch: 45, step: 1115, loss: 0.32973015308380127, mean loss: 0.3427494663697426
Epoch: 45, step: 1116, loss: 0.2952525019645691, mean loss: 0.3427487477748834
Epoch: 45, step: 1117, loss: 0.3552190065383911, mean loss: 0.34274893643806176
Epoch: 45, step: 1118, loss: 0.32625895738601685, mean loss: 0.34274868696410526
Epoch: 45, step: 1119, loss: 0.3273298144340515, mean loss: 0.3427484536982576
Epoch: 45, step: 1120, loss: 0.313228577375412, mean loss: 0.3427480071108184
Epoch: 45, step: 1121, loss: 0.37590375542640686, mean loss: 0.3427485086954651
Epoch: 45, step: 1122, loss: 0.34966328740119934, mean loss: 0.34274861330159045
Epoch: 45, step: 1123, loss: 0.3238147795200348, mean loss: 0.3427483268766573
Epoch: 45, step: 1124, loss: 0.32686641812324524, mean loss: 0.3427480866238965
Epoch: 45, step: 1125, loss: 0.33604052662849426, mean loss: 0.3427479851571613
Epoch: 45, step: 1126, loss: 0.37600570917129517, mean loss: 0.34274848824645615
Epoch: 45, step: 1127, loss: 0.3628925383090973, mean loss: 0.34274879296071253
Epoch: 45, step: 1128, loss: 0.30847445130348206, mean loss: 0.3427482745087369
Epoch: 45, step: 1129, loss: 0.3069831132888794, mean loss: 0.34274773351401266
Epoch: 45, step: 1130, loss: 0.368014395236969, mean loss: 0.3427481156994542
Epoch: 45, step: 1131, loss: 0.43238770961761475, mean loss: 0.3427494715742412
Epoch: 45, step: 1132, loss: 0.2949966788291931, mean loss: 0.3427487492837273
Epoch: 45, step: 1133, loss: 0.3352009654045105, mean loss: 0.3427486351205564
Epoch: 45, step: 1134, loss: 0.32818928360939026, mean loss: 0.34274841490802505
Epoch: 45, step: 1135, loss: 0.3264816701412201, mean loss: 0.3427481688746176
Epoch: 45, step: 1136, loss: 0.356783926486969, mean loss: 0.34274838116128536
Epoch: 45, step: 1137, loss: 0.37286514043807983, mean loss: 0.3427488366614408
Epoch: 45, step: 1138, loss: 0.3835705518722534, mean loss: 0.34274945405909063
Epoch: 45, step: 1139, loss: 0.3020334541797638, mean loss: 0.34274883826961877
Epoch: 45, step: 1140, loss: 0.2803167402744293, mean loss: 0.3427478940597914
Epoch: 45, step: 1141, loss: 0.3324390649795532, mean loss: 0.3427477381536016
Epoch: 45, step: 1142, loss: 0.3741016685962677, mean loss: 0.3427482123294624
Epoch: 45, step: 1143, loss: 0.3609986901283264, mean loss: 0.3427484883333006
Epoch: 45, step: 1144, loss: 0.3794618248939514, mean loss: 0.3427490435444395
Epoch: 45, step: 1145, loss: 0.3104743957519531, mean loss: 0.3427485554664098
Epoch: 45, step: 1146, loss: 0.32565510272979736, mean loss: 0.3427482969721074
Epoch: 45, step: 1147, loss: 0.328124076128006, mean loss: 0.3427480758219011
Epoch: 45, step: 1148, loss: 0.3550572693347931, mean loss: 0.34274826196101577
Epoch: 45, step: 1149, loss: 0.4141143560409546, mean loss: 0.3427493411398163
Epoch: 45, step: 1150, loss: 0.38297945261001587, mean loss: 0.3427499494794977
Epoch: 45, step: 1151, loss: 0.35952720046043396, mean loss: 0.3427502031728834
Epoch: 45, step: 1152, loss: 0.34167715907096863, mean loss: 0.3427501869473364
Epoch: 45, step: 1153, loss: 0.3313142955303192, mean loss: 0.3427500140273343
Epoch: 45, step: 1154, loss: 0.32237741351127625, mean loss: 0.3427497059816623
Epoch: 45, step: 1155, loss: 0.35988372564315796, mean loss: 0.34274996505417443
Epoch: 45, step: 1156, loss: 0.3772212266921997, mean loss: 0.342750486264112
Epoch: 45, step: 1157, loss: 0.36099502444267273, mean loss: 0.3427507621197196
Epoch: 45, step: 1158, loss: 0.3108999729156494, mean loss: 0.34275028054622736
Epoch: 45, step: 1159, loss: 0.34573423862457275, mean loss: 0.34275032566201324
Epoch: 45, step: 1160, loss: 0.31472712755203247, mean loss: 0.3427499019732557
Epoch: 45, step: 1161, loss: 0.32254689931869507, mean loss: 0.3427495965243329
Epoch: 45, step: 1162, loss: 0.31803032755851746, mean loss: 0.34274922279969133
Epoch: 45, step: 1163, loss: 0.30269524455070496, mean loss: 0.3427486172424488
Epoch: 45, step: 1164, loss: 0.38126060366630554, mean loss: 0.34274919947824023
Epoch: 45, step: 1165, loss: 0.3353450298309326, mean loss: 0.3427490875414693
Epoch: 45, step: 1166, loss: 0.326766699552536, mean loss: 0.3427488459222275
Epoch: 45, step: 1167, loss: 0.32357504963874817, mean loss: 0.3427485560601563
Epoch: 45, step: 1168, loss: 0.30876263976097107, mean loss: 0.34274804228192385
Epoch: 45, step: 1169, loss: 0.33475783467292786, mean loss: 0.3427479214926932
Epoch: 45, step: 1170, loss: 0.364676833152771, mean loss: 0.34274825299050365
Epoch: 45, step: 1171, loss: 0.356526643037796, mean loss: 0.3427484612743053
Epoch: 45, step: 1172, loss: 0.3201437294483185, mean loss: 0.3427481195705001
Epoch: 45, step: 1173, loss: 0.3321707844734192, mean loss: 0.3427479596809228
Epoch: 45, step: 1174, loss: 0.31894755363464355, mean loss: 0.34274759991361803
Epoch: 45, step: 1175, loss: 0.3229745626449585, mean loss: 0.34274730102859974
Epoch: 45, step: 1176, loss: 0.3301219642162323, mean loss: 0.34274711018958326
Epoch: 45, step: 1177, loss: 0.357912540435791, mean loss: 0.3427473394200655
Epoch: 45, step: 1178, loss: 0.3259945511817932, mean loss: 0.3427470861999709
Epoch: 45, step: 1179, loss: 0.35660693049430847, mean loss: 0.3427472956897577
Epoch: 45, step: 1180, loss: 0.29675933718681335, mean loss: 0.34274660059811
Epoch: 45, step: 1181, loss: 0.3504985570907593, mean loss: 0.3427467177644063
Epoch: 45, step: 1182, loss: 0.3164733350276947, mean loss: 0.3427463206635684
Epoch: 45, step: 1183, loss: 0.28622835874557495, mean loss: 0.34274546645339493
Epoch: 45, step: 1184, loss: 0.360371857881546, mean loss: 0.3427457328539304
Epoch: 45, step: 1185, loss: 0.372029185295105, mean loss: 0.34274617542945923
Epoch: 45, step: 1186, loss: 0.3186807632446289, mean loss: 0.34274581172229124
Epoch: 45, step: 1187, loss: 0.3438373804092407, mean loss: 0.34274582821921856
Epoch: 45, step: 1188, loss: 0.3244447708129883, mean loss: 0.34274555163868375
Epoch: 45, step: 1189, loss: 0.3214215934276581, mean loss: 0.342745229378472
Epoch: 45, step: 1190, loss: 0.2804093360900879, mean loss: 0.34274428733598683
Epoch: 45, step: 1191, loss: 0.3263792097568512, mean loss: 0.34274404002477393
Epoch: 45, step: 1192, loss: 0.3552130460739136, mean loss: 0.3427442284551919
Epoch: 45, step: 1193, loss: 0.32057812809944153, mean loss: 0.3427438934882811
Epoch: 45, step: 1194, loss: 0.32933515310287476, mean loss: 0.3427436908628125
Epoch: 45, step: 1195, loss: 0.3270765542984009, mean loss: 0.3427434541132875
Epoch: 45, step: 1196, loss: 0.36378204822540283, mean loss: 0.3427437720272774
Epoch: 45, step: 1197, loss: 0.36959072947502136, mean loss: 0.3427441777052587
Epoch: 45, step: 1198, loss: 0.3488684594631195, mean loss: 0.34274427024642373
Epoch: 45, step: 1199, loss: 0.3527250289916992, mean loss: 0.34274442105873476
Epoch: 45, step: 1200, loss: 0.3047681748867035, mean loss: 0.34274384723473433
Epoch: 45, step: 1201, loss: 0.3264056146144867, mean loss: 0.3427436003665131
Epoch: 45, step: 1202, loss: 0.31396061182022095, mean loss: 0.3427431654664852
Epoch: 45, step: 1203, loss: 0.3018615245819092, mean loss: 0.34274254776974755
Epoch: 45, step: 1204, loss: 0.3712952733039856, mean loss: 0.342742979177552
Epoch: 45, step: 1205, loss: 0.34654030203819275, mean loss: 0.34274303655105787
Epoch: 45, step: 1206, loss: 0.31339311599731445, mean loss: 0.3427425931117034
Epoch: 45, step: 1207, loss: 0.3144531548023224, mean loss: 0.3427421657013222
Epoch: 45, step: 1208, loss: 0.3200407326221466, mean loss: 0.3427418227223819
Epoch: 45, step: 1209, loss: 0.3346051573753357, mean loss: 0.3427416997934599
Epoch: 45, step: 1210, loss: 0.3130779266357422, mean loss: 0.3427412516392825
Epoch: 45, step: 1211, loss: 0.3739834427833557, mean loss: 0.3427417236327431
Epoch: 45, step: 1212, loss: 0.33573290705680847, mean loss: 0.3427416177481847
Epoch: 45, step: 1213, loss: 0.30932655930519104, mean loss: 0.342741112943241
Epoch: 45, step: 1214, loss: 0.33989301323890686, mean loss: 0.34274106991733716
Epoch: 45, step: 1215, loss: 0.3535628020763397, mean loss: 0.3427412333974894
Epoch: 45, step: 1216, loss: 0.3468503952026367, mean loss: 0.34274129547223303
Epoch: 45, step: 1217, loss: 0.3244500160217285, mean loss: 0.34274101916057026
Epoch: 45, step: 1218, loss: 0.3514039218425751, mean loss: 0.34274115002210415
Epoch: 45, step: 1219, loss: 0.3185531198978424, mean loss: 0.3427407846440056
Epoch: 45, step: 1220, loss: 0.3031890392303467, mean loss: 0.34274018719464056
Epoch: 45, step: 1221, loss: 0.326355904340744, mean loss: 0.34273993970539773
Epoch: 45, step: 1222, loss: 0.32477933168411255, mean loss: 0.34273966840941383
Epoch: 45, step: 1223, loss: 0.39268603920936584, mean loss: 0.34274042284072914
Epoch: 45, step: 1224, loss: 0.33856576681137085, mean loss: 0.3427403597842224
Epoch: 45, step: 1225, loss: 0.34842807054519653, mean loss: 0.342740445693517
Epoch: 45, step: 1226, loss: 0.33322715759277344, mean loss: 0.3427403020034525
Epoch: 45, step: 1227, loss: 0.3199499249458313, mean loss: 0.3427399577795361
Epoch: 45, step: 1228, loss: 0.31060990691185, mean loss: 0.34273947249731057
Epoch: 45, step: 1229, loss: 0.31570324301719666, mean loss: 0.34273906415673544
Epoch: 45, step: 1230, loss: 0.34023427963256836, mean loss: 0.3427390263263972
Epoch: 45, step: 1231, loss: 0.2989337742328644, mean loss: 0.3427383647355663
Epoch: 45, step: 1232, loss: 0.3007717430591583, mean loss: 0.34273773092314763
Epoch: 45, step: 1233, loss: 0.34041282534599304, mean loss: 0.34273769581115354
Epoch: 45, step: 1234, loss: 0.3357114791870117, mean loss: 0.3427375896989943
Epoch: 45, step: 1235, loss: 0.2992430627346039, mean loss: 0.342736932840728
Epoch: 45, step: 1236, loss: 0.36178305745124817, mean loss: 0.34273722047267463
Epoch: 45, step: 1237, loss: 0.3455134630203247, mean loss: 0.34273726239847346
Epoch: 45, step: 1238, loss: 0.28161653876304626, mean loss: 0.34273633938961445
Epoch: 45, step: 1239, loss: 0.3476041257381439, mean loss: 0.34273641289892204
Epoch: 45, step: 1240, loss: 0.345581978559494, mean loss: 0.3427364558696664
Epoch: 45, step: 1241, loss: 0.3292710781097412, mean loss: 0.3427362525327427
Epoch: 45, step: 1242, loss: 0.3625081181526184, mean loss: 0.34273655109767664
Epoch: 45, step: 1243, loss: 0.3526279926300049, mean loss: 0.3427367004610726
Epoch: 45, step: 1244, loss: 0.34304800629615784, mean loss: 0.34273670516180244
Epoch: 45, step: 1245, loss: 0.30600622296333313, mean loss: 0.3427361505385095
Epoch: 45, step: 1246, loss: 0.35928860306739807, mean loss: 0.3427364004736195
Epoch: 45, step: 1247, loss: 0.32521700859069824, mean loss: 0.342736135942124
Epoch: 45, step: 1248, loss: 0.3251032829284668, mean loss: 0.3427358697014588
Epoch: 45, step: 1249, loss: 0.3250104784965515, mean loss: 0.3427356020675889
Epoch: 45, step: 1250, loss: 0.316832035779953, mean loss: 0.3427352109581947
Epoch: 45, step: 1251, loss: 0.35702207684516907, mean loss: 0.34273542666760837
Epoch: 45, step: 1252, loss: 0.31695556640625, mean loss: 0.3427350374377643
Epoch: 45, step: 1253, loss: 0.296163946390152, mean loss: 0.342734334308087
Epoch: 45, step: 1254, loss: 0.37723249197006226, mean loss: 0.34273485515292224
Epoch: 45, step: 1255, loss: 0.3455812335014343, mean loss: 0.3427348981262049
Epoch: 45, step: 1256, loss: 0.41390183568000793, mean loss: 0.3427359725549615
Epoch: 45, step: 1257, loss: 0.33832883834838867, mean loss: 0.34273590602012943
Epoch: 45, step: 1258, loss: 0.37640082836151123, mean loss: 0.3427364142542867
Epoch: 45, step: 1259, loss: 0.326131135225296, mean loss: 0.34273616357072645
Epoch: 45, step: 1260, loss: 0.32434895634651184, mean loss: 0.34273588599026683
Epoch: 45, step: 1261, loss: 0.3040388822555542, mean loss: 0.342735301814008
Epoch: 45, step: 1262, loss: 0.32360273599624634, mean loss: 0.34273501299004444
Epoch: 45, step: 1263, loss: 0.3077671527862549, mean loss: 0.34273448512548005
Epoch: 45, step: 1264, loss: 0.3255804181098938, mean loss: 0.3427342261766233
Epoch: 45, step: 1265, loss: 0.3107245862483978, mean loss: 0.3427337429830731
Epoch: 45, step: 1266, loss: 0.3142869770526886, mean loss: 0.34273331357848225
Epoch: 45, step: 1267, loss: 0.324799507856369, mean loss: 0.34273304287135564
Epoch: 45, step: 1268, loss: 0.3283456563949585, mean loss: 0.3427328256999798
Epoch: 45, step: 1269, loss: 0.33268213272094727, mean loss: 0.34273267399140656
Epoch: 45, step: 1270, loss: 0.34698596596717834, mean loss: 0.3427327381910711
Epoch: 45, step: 1271, loss: 0.3271605670452118, mean loss: 0.3427325031465268
Epoch: 45, step: 1272, loss: 0.34656867384910583, mean loss: 0.3427325610483683
Epoch: 45, step: 1273, loss: 0.35004696249961853, mean loss: 0.3427326714477623
Epoch: 45, step: 1274, loss: 0.3170273005962372, mean loss: 0.3427322834714458
Epoch: 45, step: 1275, loss: 0.34581464529037476, mean loss: 0.3427323299934486
Epoch: 45, step: 1276, loss: 0.3043366074562073, mean loss: 0.3427317504966024
Epoch: 45, step: 1277, loss: 0.3075011670589447, mean loss: 0.3427312187784184
Epoch: 45, step: 1278, loss: 0.3559272885322571, mean loss: 0.34273141793732137
Epoch: 45, step: 1279, loss: 0.3045872449874878, mean loss: 0.34273084226311445
Epoch: 45, step: 1280, loss: 0.3580659329891205, mean loss: 0.34273107369775513
Epoch: 45, step: 1281, loss: 0.32030412554740906, mean loss: 0.34273073523908876
Epoch: 45, step: 1282, loss: 0.3356514275074005, mean loss: 0.34273062840257773
Epoch: 45, step: 1283, loss: 0.35440751910209656, mean loss: 0.3427308046202932
Epoch: 45, step: 1284, loss: 0.32972249388694763, mean loss: 0.34273060831288005
Epoch: 45, step: 1285, loss: 0.33993422985076904, mean loss: 0.3427305661135854
Epoch: 45, step: 1286, loss: 0.32023411989212036, mean loss: 0.34273022663169816
Epoch: 45, step: 1287, loss: 0.3195342719554901, mean loss: 0.3427298765991836
Epoch: 45, step: 1288, loss: 0.3714785575866699, mean loss: 0.3427303104171224
Epoch: 45, step: 1289, loss: 0.3070463240146637, mean loss: 0.3427297719534676
Epoch: 45, step: 1290, loss: 0.3199886381626129, mean loss: 0.34272942879984397
Epoch: 45, step: 1291, loss: 0.34582439064979553, mean loss: 0.342729475500741
Epoch: 45, step: 1292, loss: 0.30894705653190613, mean loss: 0.34272896575440437
Epoch: 45, step: 1293, loss: 0.3322219252586365, mean loss: 0.3427288072149998
Epoch: 45, step: 1294, loss: 0.3058726489543915, mean loss: 0.3427282511054825
Epoch: 45, step: 1295, loss: 0.35311898589134216, mean loss: 0.3427284078852336
Epoch: 45, step: 1296, loss: 0.30755048990249634, mean loss: 0.3427278771141066
Epoch: 45, step: 1297, loss: 0.31794893741607666, mean loss: 0.34272750325038565
Epoch: 45, step: 1298, loss: 0.3660115599632263, mean loss: 0.34272785455406723
Epoch: 45, step: 1299, loss: 0.37585628032684326, mean loss: 0.342728354379441
Epoch: 45, step: 1300, loss: 0.3659759759902954, mean loss: 0.34272870512281556
Epoch: 45, step: 1301, loss: 0.30509495735168457, mean loss: 0.342728137340495
Epoch: 45, step: 1302, loss: 0.3197784423828125, mean loss: 0.3427277911024708
Epoch: 45, step: 1303, loss: 0.3113287687301636, mean loss: 0.342727317398072
Epoch: 45, step: 1304, loss: 0.3228905498981476, mean loss: 0.3427270181332685
Epoch: 45, step: 1305, loss: 0.3189571499824524, mean loss: 0.34272665953766535
Epoch: 45, step: 1306, loss: 0.2914656400680542, mean loss: 0.3427258862183196
Epoch: 45, step: 1307, loss: 0.37104159593582153, mean loss: 0.3427263133802451
Epoch: 45, step: 1308, loss: 0.3171174228191376, mean loss: 0.3427259270583733
Epoch: 45, step: 1309, loss: 0.29787299036979675, mean loss: 0.34272525044143726
Epoch: 45, step: 1310, loss: 0.41240596771240234, mean loss: 0.34272630157533585
Epoch: 45, step: 1311, loss: 0.3239481449127197, mean loss: 0.34272601831104055
Epoch: 45, step: 1312, loss: 0.3297889828681946, mean loss: 0.3427258231616968
Epoch: 45, step: 1313, loss: 0.32246699929237366, mean loss: 0.34272551757108727
Epoch: 45, step: 1314, loss: 0.3202977776527405, mean loss: 0.3427251792689541
Epoch: 45, step: 1315, loss: 0.397117555141449, mean loss: 0.3427259997162793
Epoch: 45, step: 1316, loss: 0.29409918189048767, mean loss: 0.34272526624692434
Epoch: 45, step: 1317, loss: 0.3495587706565857, mean loss: 0.3427253693194817
Epoch: 45, step: 1318, loss: 0.35403063893318176, mean loss: 0.3427255398389407
Epoch: 45, step: 1319, loss: 0.28234800696372986, mean loss: 0.3427246291672533
Epoch: 45, step: 1320, loss: 0.32348060607910156, mean loss: 0.3427243389148727
Epoch: 45, step: 1321, loss: 0.354877233505249, mean loss: 0.3427245222109209
Epoch: 45, step: 1322, loss: 0.28798019886016846, mean loss: 0.34272369654204693
Epoch: 45, step: 1323, loss: 0.33928197622299194, mean loss: 0.3427236446338616
Epoch: 45, step: 1324, loss: 0.366585373878479, mean loss: 0.34272400451213997
Epoch: 45, step: 1325, loss: 0.3346081078052521, mean loss: 0.3427238821115019
Epoch: 45, step: 1326, loss: 0.3232865035533905, mean loss: 0.3427235889693215
Epoch: 45, step: 1327, loss: 0.39261865615844727, mean loss: 0.34272434144364117
Epoch: 45, step: 1328, loss: 0.3586888909339905, mean loss: 0.3427245822035605
Epoch: 45, step: 1329, loss: 0.2929135859012604, mean loss: 0.34272383101978277
Epoch: 45, step: 1330, loss: 0.3580857813358307, mean loss: 0.3427240626849713
Epoch: 45, step: 1331, loss: 0.29967671632766724, mean loss: 0.3427234135212248
Epoch: 45, step: 1332, loss: 0.32245734333992004, mean loss: 0.3427231079088987
Epoch: 45, step: 1333, loss: 0.3249460458755493, mean loss: 0.3427228398348565
Epoch: 45, step: 1334, loss: 0.29735758900642395, mean loss: 0.34272215574753345
Epoch: 45, step: 1335, loss: 0.34599632024765015, mean loss: 0.34272220511969853
Epoch: 45, step: 1336, loss: 0.31623977422714233, mean loss: 0.3427218057887443
Epoch: 45, step: 1337, loss: 0.36792466044425964, mean loss: 0.342722185819123
Epoch: 45, step: 1338, loss: 0.30696359276771545, mean loss: 0.34272164662834737
Epoch: 45, step: 1339, loss: 0.32764437794685364, mean loss: 0.3427214192871429
Epoch: 45, step: 1340, loss: 0.3464127779006958, mean loss: 0.3427214749461139
Epoch: 45, step: 1341, loss: 0.3065270185470581, mean loss: 0.34272092920780084
Epoch: 45, step: 1342, loss: 0.3220856189727783, mean loss: 0.34272061807425386
Epoch: 45, step: 1343, loss: 0.32999181747436523, mean loss: 0.3427204261557839
Epoch: 45, step: 1344, loss: 0.3231215476989746, mean loss: 0.34272013065818185
Epoch: 45, step: 1345, loss: 0.3535112738609314, mean loss: 0.34272029335671944
Epoch: 45, step: 1346, loss: 0.31248679757118225, mean loss: 0.342719837531855
Epoch: 45, step: 1347, loss: 0.3417210578918457, mean loss: 0.3427198224736648
Epoch: 45, step: 1348, loss: 0.35807305574417114, mean loss: 0.34272005394456395
Epoch: 45, step: 1349, loss: 0.3052266538143158, mean loss: 0.3427194886890215
Epoch: 45, step: 1350, loss: 0.3014126718044281, mean loss: 0.34271886595128376
Epoch: 45, step: 1351, loss: 0.3728513717651367, mean loss: 0.3427193202192964
Epoch: 45, step: 1352, loss: 0.3555317521095276, mean loss: 0.34271951337250656
Epoch: 45, step: 1353, loss: 0.32202643156051636, mean loss: 0.3427192014196345
Epoch: 45, step: 1354, loss: 0.3712631165981293, mean loss: 0.342719631719102
Epoch: 45, step: 1355, loss: 0.30105146765708923, mean loss: 0.3427190035810765
Epoch: 45, step: 1356, loss: 0.3145383596420288, mean loss: 0.34271857877073025
Epoch: 45, step: 1357, loss: 0.32260116934776306, mean loss: 0.3427182755145359
Epoch: 45, step: 1358, loss: 0.38522815704345703, mean loss: 0.34271891631227974
Epoch: 45, step: 1359, loss: 0.3363873064517975, mean loss: 0.34271882087046696
Epoch: 45, step: 1360, loss: 0.3247842490673065, mean loss: 0.342718550531283
Epoch: 45, step: 1361, loss: 0.35717451572418213, mean loss: 0.34271876843193705
Epoch: 45, step: 1362, loss: 0.3071359694004059, mean loss: 0.342718232085992
Epoch: 45, step: 1363, loss: 0.32803836464881897, mean loss: 0.34271801081703873
Epoch: 45, step: 1364, loss: 0.3222719132900238, mean loss: 0.34271770263861495
Epoch: 45, step: 1365, loss: 0.30320432782173157, mean loss: 0.34271710707332365
Epoch: 45, step: 1366, loss: 0.425194650888443, mean loss: 0.34271835019726016
Epoch: 45, step: 1367, loss: 0.31356093287467957, mean loss: 0.3427179107353725
Epoch: 45, step: 1368, loss: 0.36590301990509033, mean loss: 0.3427182601770999
Epoch: 45, step: 1369, loss: 0.36823272705078125, mean loss: 0.34271864472068503
Epoch: 45, step: 1370, loss: 0.32346415519714355, mean loss: 0.3427183545292859
Epoch: 45, step: 1371, loss: 0.3488837480545044, mean loss: 0.3427184474487687
Epoch: 45, step: 1372, loss: 0.35260507464408875, mean loss: 0.3427185964492238
Epoch: 45, step: 1373, loss: 0.3631158173084259, mean loss: 0.3427189038492428
Epoch: 45, step: 1374, loss: 0.36305999755859375, mean loss: 0.34271921039876746
Epoch: 45, step: 1375, loss: 0.3399776816368103, mean loss: 0.34271916908330596
Epoch: 45, step: 1376, loss: 0.3032824993133545, mean loss: 0.3427185747726866
Epoch: 45, step: 1377, loss: 0.29719114303588867, mean loss: 0.3427178886846228
Epoch: 45, step: 1378, loss: 0.33526840806007385, mean loss: 0.34271777642433215
Epoch: 45, step: 1379, loss: 0.3198919892311096, mean loss: 0.34271743245526654
Epoch: 45, step: 1380, loss: 0.3202040195465088, mean loss: 0.342717093198581
Epoch: 45, step: 1381, loss: 0.32682374119758606, mean loss: 0.3427168537038099
Epoch: 45, step: 1382, loss: 0.35113194584846497, mean loss: 0.34271698050778415
Epoch: 45, step: 1383, loss: 0.31476664543151855, mean loss: 0.34271655934065925
Epoch: 45, step: 1384, loss: 0.3302103579044342, mean loss: 0.34271637089492074
Epoch: 45, step: 1385, loss: 0.3190757930278778, mean loss: 0.3427160146797222
Epoch: 45, step: 1386, loss: 0.3510308563709259, mean loss: 0.34271613996550715
Epoch: 45, step: 1387, loss: 0.3305116891860962, mean loss: 0.3427159560749156
Epoch: 45, step: 1388, loss: 0.33111459016799927, mean loss: 0.34271578127394065
Epoch: 45, step: 1389, loss: 0.300884872674942, mean loss: 0.3427151510056176
Epoch: 45, step: 1390, loss: 0.33285507559776306, mean loss: 0.3427150024456229
Epoch: 45, step: 1391, loss: 0.30668365955352783, mean loss: 0.3427144595759958
Epoch: 45, step: 1392, loss: 0.31425976753234863, mean loss: 0.3427140308671527
Epoch: 45, step: 1393, loss: 0.3579716980457306, mean loss: 0.3427142607413079
Epoch: 45, step: 1394, loss: 0.3218594789505005, mean loss: 0.34271394654497206
Epoch: 45, step: 1395, loss: 0.3104203939437866, mean loss: 0.34271346002043607
Epoch: 45, step: 1396, loss: 0.3303544223308563, mean loss: 0.34271327382585526
Epoch: 45, step: 1397, loss: 0.32184499502182007, mean loss: 0.3427129594403841
Epoch: 45, step: 1398, loss: 0.32538074254989624, mean loss: 0.3427126983304413
Epoch: 45, step: 1399, loss: 0.3366777002811432, mean loss: 0.3427126074145322
Epoch: 45, step: 1400, loss: 0.30279627442359924, mean loss: 0.342712006092874
Epoch: 45, step: 1401, loss: 0.38072913885116577, mean loss: 0.34271257879530476
Epoch: 45, step: 1402, loss: 0.3210529685020447, mean loss: 0.3427122525128184
Epoch: 45, step: 1403, loss: 0.3105337619781494, mean loss: 0.342711767780194
Epoch: 45, step: 1404, loss: 0.3477807939052582, mean loss: 0.34271184413819844
Epoch: 45, step: 1405, loss: 0.331632137298584, mean loss: 0.3427116772399542
Epoch: 45, step: 1406, loss: 0.31626346707344055, mean loss: 0.34271127884553715
Epoch: 45, step: 1407, loss: 0.32417356967926025, mean loss: 0.3427109996127064
Epoch: 45, step: 1408, loss: 0.3155061602592468, mean loss: 0.3427105898333852
Epoch: 45, step: 1409, loss: 0.34524664282798767, mean loss: 0.3427106280327073
Epoch: 45, step: 1410, loss: 0.3694365620613098, mean loss: 0.3427110305862767
Epoch: 45, step: 1411, loss: 0.30340394377708435, mean loss: 0.342710438540747
Epoch: 45, step: 1412, loss: 0.3837627172470093, mean loss: 0.342711056863141
Epoch: 45, step: 1413, loss: 0.32074296474456787, mean loss: 0.3427107259884819
Epoch: 45, step: 1414, loss: 0.33339813351631165, mean loss: 0.3427105857280335
Epoch: 45, step: 1415, loss: 0.33959901332855225, mean loss: 0.34271053886418024
Epoch: 45, step: 1416, loss: 0.4009169638156891, mean loss: 0.34271141550657297
Epoch: 45, step: 1417, loss: 0.31146305799484253, mean loss: 0.34271094488460374
Epoch: 45, step: 1418, loss: 0.33069589734077454, mean loss: 0.3427107639323674
Epoch: 45, step: 1419, loss: 0.3287172317504883, mean loss: 0.34271055318640076
Epoch: 45, step: 1420, loss: 0.3309548795223236, mean loss: 0.342710376145789
Epoch: 45, step: 1421, loss: 0.3427031636238098, mean loss: 0.3427103760371699
Epoch: 45, step: 1422, loss: 0.34944388270378113, mean loss: 0.34271047744082134
Epoch: 45, step: 1423, loss: 0.3443174660205841, mean loss: 0.34271050164099875
Epoch: 45, step: 1424, loss: 0.3233518898487091, mean loss: 0.3427102101175925
Epoch: 45, step: 1425, loss: 0.3621843457221985, mean loss: 0.342710503376268
Epoch: 45, step: 1426, loss: 0.358477383852005, mean loss: 0.3427107408042572
Epoch: 45, step: 1427, loss: 0.3124658763408661, mean loss: 0.34271028536418274
Epoch: 45, step: 1428, loss: 0.3367880582809448, mean loss: 0.3427101961861032
Epoch: 45, step: 1429, loss: 0.33467623591423035, mean loss: 0.34271007521094476
Epoch: 45, step: 1430, loss: 0.3212185204029083, mean loss: 0.3427097515965615
Epoch: 45, step: 1431, loss: 0.3308064639568329, mean loss: 0.34270957236257305
Epoch: 45, step: 1432, loss: 0.3597128391265869, mean loss: 0.34270982838574265
Epoch: 45, step: 1433, loss: 0.3342015743255615, mean loss: 0.34270970027639736
Epoch: 45, step: 1434, loss: 0.31439003348350525, mean loss: 0.3427092738717178
Epoch: 45, step: 1435, loss: 0.3037870228290558, mean loss: 0.342708687834452
Epoch: 45, step: 1436, loss: 0.27329424023628235, mean loss: 0.34270764270372345
Epoch: 45, step: 1437, loss: 0.3663373291492462, mean loss: 0.34270799847605093
Epoch: 45, step: 1438, loss: 0.30589982867240906, mean loss: 0.3427074442947202
Epoch: 45, step: 1439, loss: 0.31815454363822937, mean loss: 0.3427070746334637
Epoch: 45, step: 1440, loss: 0.31285360455513, mean loss: 0.3427066251751587
Epoch: 45, step: 1441, loss: 0.3799516558647156, mean loss: 0.34270718590851046
Epoch: 45, step: 1442, loss: 0.2894018292427063, mean loss: 0.3427063833949735
Epoch: 45, step: 1443, loss: 0.35596442222595215, mean loss: 0.34270658299208945
Valid: 45, mean loss: 0.18510274092356366
Epoch: 46, step: 0, loss: 0.32292819023132324, mean loss: 0.3427062852368352
Epoch: 46, step: 1, loss: 0.3246734142303467, mean loss: 0.3427060137637523
Epoch: 46, step: 2, loss: 0.33610108494758606, mean loss: 0.34270591433236425
Epoch: 46, step: 3, loss: 0.333674818277359, mean loss: 0.3427057783792111
Epoch: 46, step: 4, loss: 0.3472349941730499, mean loss: 0.3427058465605144
Epoch: 46, step: 5, loss: 0.28522178530693054, mean loss: 0.34270498122766396
Epoch: 46, step: 6, loss: 0.31925636529922485, mean loss: 0.3427046282506513
Epoch: 46, step: 7, loss: 0.32876092195510864, mean loss: 0.3427044183562285
Epoch: 46, step: 8, loss: 0.2973669469356537, mean loss: 0.3427037359021557
Epoch: 46, step: 9, loss: 0.3298690915107727, mean loss: 0.34270354270824305
Epoch: 46, step: 10, loss: 0.3299095332622528, mean loss: 0.3427033501288881
Epoch: 46, step: 11, loss: 0.378105491399765, mean loss: 0.3427038830047577
Epoch: 46, step: 12, loss: 0.3535152077674866, mean loss: 0.3427040457352356
Epoch: 46, step: 13, loss: 0.35317543148994446, mean loss: 0.342704203346629
Epoch: 46, step: 14, loss: 0.36074012517929077, mean loss: 0.3427044748125125
Epoch: 46, step: 15, loss: 0.3282964527606964, mean loss: 0.3427042579548657
Epoch: 46, step: 16, loss: 0.38493964076042175, mean loss: 0.34270489363739315
Epoch: 46, step: 17, loss: 0.3300982117652893, mean loss: 0.34270470389774244
Epoch: 46, step: 18, loss: 0.3432045578956604, mean loss: 0.34270471142079223
Epoch: 46, step: 19, loss: 0.3285505771636963, mean loss: 0.34270449839727984
Epoch: 46, step: 20, loss: 0.2928631603717804, mean loss: 0.34270374828307976
Epoch: 46, step: 21, loss: 0.35020869970321655, mean loss: 0.3427038612312094
Epoch: 46, step: 22, loss: 0.37437373399734497, mean loss: 0.342704337849759
Epoch: 46, step: 23, loss: 0.323661208152771, mean loss: 0.34270405126280834
Epoch: 46, step: 24, loss: 0.36732304096221924, mean loss: 0.3427044217573184
Epoch: 46, step: 25, loss: 0.30141621828079224, mean loss: 0.3427038004149034
Epoch: 46, step: 26, loss: 0.32634782791137695, mean loss: 0.3427035542790664
Epoch: 46, step: 27, loss: 0.31719833612442017, mean loss: 0.3427031704649125
Epoch: 46, step: 28, loss: 0.32592400908470154, mean loss: 0.34270291796824
Epoch: 46, step: 29, loss: 0.30307143926620483, mean loss: 0.3427023215936244
Epoch: 46, step: 30, loss: 0.34682735800743103, mean loss: 0.3427023836662512
Epoch: 46, step: 31, loss: 0.3382522761821747, mean loss: 0.3427023167030352
Epoch: 46, step: 32, loss: 0.3237326145172119, mean loss: 0.3427020312597834
Epoch: 46, step: 33, loss: 0.3286375403404236, mean loss: 0.34270181963001844
Epoch: 46, step: 34, loss: 0.3363214433193207, mean loss: 0.34270172362531914
Epoch: 46, step: 35, loss: 0.31775540113449097, mean loss: 0.3427013482668706
Epoch: 46, step: 36, loss: 0.33663660287857056, mean loss: 0.3427012570141752
Epoch: 46, step: 37, loss: 0.3340742886066437, mean loss: 0.3427011272111538
Epoch: 46, step: 38, loss: 0.2968853712081909, mean loss: 0.3427004378688731
Epoch: 46, step: 39, loss: 0.3585999310016632, mean loss: 0.3427006770884978
Epoch: 46, step: 40, loss: 0.2812568247318268, mean loss: 0.3426997526342383
Epoch: 46, step: 41, loss: 0.3097359538078308, mean loss: 0.342699256684447
Epoch: 46, step: 42, loss: 0.3258224129676819, mean loss: 0.3426990027713214
Epoch: 46, step: 43, loss: 0.3323279023170471, mean loss: 0.3426988467398408
Epoch: 46, step: 44, loss: 0.35582926869392395, mean loss: 0.34269904428188225
Epoch: 46, step: 45, loss: 0.31473955512046814, mean loss: 0.34269862364867687
Epoch: 46, step: 46, loss: 0.3586018681526184, mean loss: 0.3426988628995457
Epoch: 46, step: 47, loss: 0.3399381637573242, mean loss: 0.34269882136778584
Epoch: 46, step: 48, loss: 0.33847808837890625, mean loss: 0.3426987578723367
Epoch: 46, step: 49, loss: 0.32071739435195923, mean loss: 0.34269842719622995
Epoch: 46, step: 50, loss: 0.3036342263221741, mean loss: 0.34269783954371585
Epoch: 46, step: 51, loss: 0.3204737603664398, mean loss: 0.3426975052263806
Epoch: 46, step: 52, loss: 0.326503723859787, mean loss: 0.3426972616266188
Epoch: 46, step: 53, loss: 0.3433211147785187, mean loss: 0.3426972710109738
Epoch: 46, step: 54, loss: 0.3421449661254883, mean loss: 0.3426972627030136
Epoch: 46, step: 55, loss: 0.34046661853790283, mean loss: 0.342697229149401
Epoch: 46, step: 56, loss: 0.3279232084751129, mean loss: 0.3426970069201825
Epoch: 46, step: 57, loss: 0.3812093138694763, mean loss: 0.3426975862094179
Epoch: 46, step: 58, loss: 0.30900391936302185, mean loss: 0.34269707940817784
Epoch: 46, step: 59, loss: 0.30669495463371277, mean loss: 0.3426965378925534
Epoch: 46, step: 60, loss: 0.31869393587112427, mean loss: 0.3426961768697359
Epoch: 46, step: 61, loss: 0.3384378254413605, mean loss: 0.34269611282089213
Epoch: 46, step: 62, loss: 0.3415400981903076, mean loss: 0.3426960954338145
Epoch: 46, step: 63, loss: 0.34392935037612915, mean loss: 0.3426961139823487
Epoch: 46, step: 64, loss: 0.3286266326904297, mean loss: 0.34269590237619896
Epoch: 46, step: 65, loss: 0.31852060556411743, mean loss: 0.3426955387832254
Epoch: 46, step: 66, loss: 0.3210665285587311, mean loss: 0.3426952134909268
Epoch: 46, step: 67, loss: 0.375457227230072, mean loss: 0.34269570621206225
Epoch: 46, step: 68, loss: 0.32815301418304443, mean loss: 0.34269548750194195
Epoch: 46, step: 69, loss: 0.3335053026676178, mean loss: 0.3426953492912036
Epoch: 46, step: 70, loss: 0.3171786367893219, mean loss: 0.3426949655523886
Epoch: 46, step: 71, loss: 0.3622741103172302, mean loss: 0.3426952599933289
Epoch: 46, step: 72, loss: 0.32358497381210327, mean loss: 0.3426949726076396
Epoch: 46, step: 73, loss: 0.33266887068748474, mean loss: 0.34269482183465516
Epoch: 46, step: 74, loss: 0.31421542167663574, mean loss: 0.3426943935665585
Epoch: 46, step: 75, loss: 0.3190308213233948, mean loss: 0.3426940377233669
Epoch: 46, step: 76, loss: 0.3214442729949951, mean loss: 0.3426937181828377
Epoch: 46, step: 77, loss: 0.3147345781326294, mean loss: 0.34269329775728585
Epoch: 46, step: 78, loss: 0.35100409388542175, mean loss: 0.34269342272602604
Epoch: 46, step: 79, loss: 0.34801289439201355, mean loss: 0.3426935027132699
Epoch: 46, step: 80, loss: 0.33096280694007874, mean loss: 0.342693326325092
Epoch: 46, step: 81, loss: 0.30208006501197815, mean loss: 0.342692715654456
Epoch: 46, step: 82, loss: 0.4027336537837982, mean loss: 0.342693618430677
Epoch: 46, step: 83, loss: 0.3481476902961731, mean loss: 0.34269370043692987
Epoch: 46, step: 84, loss: 0.31864801049232483, mean loss: 0.3426933388965377
Epoch: 46, step: 85, loss: 0.36462387442588806, mean loss: 0.34269366862944295
Epoch: 46, step: 86, loss: 0.2820289433002472, mean loss: 0.34269275652880804
Epoch: 46, step: 87, loss: 0.36006733775138855, mean loss: 0.3426930177535678
Epoch: 46, step: 88, loss: 0.31739476323127747, mean loss: 0.342692637403042
Epoch: 46, step: 89, loss: 0.37866491079330444, mean loss: 0.34269317822562656
Epoch: 46, step: 90, loss: 0.3594420552253723, mean loss: 0.3426934300316402
Epoch: 46, step: 91, loss: 0.3211343288421631, mean loss: 0.34269310591261337
Epoch: 46, step: 92, loss: 0.34885716438293457, mean loss: 0.34269319858153213
Epoch: 46, step: 93, loss: 0.3885679244995117, mean loss: 0.34269388824036007
Epoch: 46, step: 94, loss: 0.3303728699684143, mean loss: 0.3426937030148114
Epoch: 46, step: 95, loss: 0.3184472322463989, mean loss: 0.34269333851585215
Epoch: 46, step: 96, loss: 0.31781554222106934, mean loss: 0.34269296453175246
Epoch: 46, step: 97, loss: 0.3907237648963928, mean loss: 0.34269368656056043
Epoch: 46, step: 98, loss: 0.3788376748561859, mean loss: 0.3426942298912625
Epoch: 46, step: 99, loss: 0.3184317946434021, mean loss: 0.3426938651742394
Epoch: 46, step: 100, loss: 0.31958693265914917, mean loss: 0.34269351783214974
Epoch: 46, step: 101, loss: 0.35150277614593506, mean loss: 0.34269365025042703
Epoch: 46, step: 102, loss: 0.3858345150947571, mean loss: 0.3426942987219475
Epoch: 46, step: 103, loss: 0.3309398293495178, mean loss: 0.34269412203740307
Epoch: 46, step: 104, loss: 0.36254680156707764, mean loss: 0.3426944204438052
Epoch: 46, step: 105, loss: 0.31779733300209045, mean loss: 0.3426940462203355
Epoch: 46, step: 106, loss: 0.34133180975914, mean loss: 0.34269402574512153
Epoch: 46, step: 107, loss: 0.3291186988353729, mean loss: 0.3426938217030529
Epoch: 46, step: 108, loss: 0.34390944242477417, mean loss: 0.342693839973997
Epoch: 46, step: 109, loss: 0.3232147991657257, mean loss: 0.3426935472057761
Epoch: 46, step: 110, loss: 0.3555898666381836, mean loss: 0.34269374103337713
Epoch: 46, step: 111, loss: 0.34566664695739746, mean loss: 0.34269378571454107
Epoch: 46, step: 112, loss: 0.3611757159233093, mean loss: 0.3426940634837553
Epoch: 46, step: 113, loss: 0.3762240409851074, mean loss: 0.34269456740598775
Epoch: 46, step: 114, loss: 0.3235248327255249, mean loss: 0.3426942793082604
Epoch: 46, step: 115, loss: 0.33140426874160767, mean loss: 0.3426941096357241
Epoch: 46, step: 116, loss: 0.3172034025192261, mean loss: 0.34269372655300645
Epoch: 46, step: 117, loss: 0.3677121698856354, mean loss: 0.3426941025327385
Epoch: 46, step: 118, loss: 0.31976941227912903, mean loss: 0.34269375802331975
Epoch: 46, step: 119, loss: 0.3396335542201996, mean loss: 0.34269371203564536
Epoch: 46, step: 120, loss: 0.3514202833175659, mean loss: 0.34269384317354123
Epoch: 46, step: 121, loss: 0.3407565653324127, mean loss: 0.34269381406168115
Epoch: 46, step: 122, loss: 0.3197065591812134, mean loss: 0.34269346863281314
Epoch: 46, step: 123, loss: 0.3145798444747925, mean loss: 0.3426930461764785
Epoch: 46, step: 124, loss: 0.31003186106681824, mean loss: 0.34269255539246807
Epoch: 46, step: 125, loss: 0.3525371849536896, mean loss: 0.34269270332078605
Epoch: 46, step: 126, loss: 0.34738147258758545, mean loss: 0.34269277377456236
Epoch: 46, step: 127, loss: 0.3514408469200134, mean loss: 0.3426929052217487
Epoch: 46, step: 128, loss: 0.3330989181995392, mean loss: 0.3426927610661581
Epoch: 46, step: 129, loss: 0.2901356816291809, mean loss: 0.34269197137538915
Epoch: 46, step: 130, loss: 0.31132176518440247, mean loss: 0.34269150003279747
Epoch: 46, step: 131, loss: 0.3114400804042816, mean loss: 0.3426910304820488
Epoch: 46, step: 132, loss: 0.324983686208725, mean loss: 0.3426907644342361
Epoch: 46, step: 133, loss: 0.32264307141304016, mean loss: 0.3426904632278744
Epoch: 46, step: 134, loss: 0.3349740505218506, mean loss: 0.3426903472944513
Epoch: 46, step: 135, loss: 0.32299715280532837, mean loss: 0.34269005142313985
Epoch: 46, step: 136, loss: 0.30229735374450684, mean loss: 0.34268944457081374
Epoch: 46, step: 137, loss: 0.31403401494026184, mean loss: 0.34268901406347274
Epoch: 46, step: 138, loss: 0.35793426632881165, mean loss: 0.34268924309840604
Epoch: 46, step: 139, loss: 0.34011727571487427, mean loss: 0.3426892044593912
Epoch: 46, step: 140, loss: 0.36461636424064636, mean loss: 0.3426895338691378
Epoch: 46, step: 141, loss: 0.3233698606491089, mean loss: 0.3426892436357871
Epoch: 46, step: 142, loss: 0.325221449136734, mean loss: 0.3426889812265679
Epoch: 46, step: 143, loss: 0.3000829815864563, mean loss: 0.3426883411893181
Epoch: 46, step: 144, loss: 0.3128662705421448, mean loss: 0.3426878932019569
Epoch: 46, step: 145, loss: 0.3022022843360901, mean loss: 0.3426872850359833
Epoch: 46, step: 146, loss: 0.3241715729236603, mean loss: 0.34268700690117815
Epoch: 46, step: 147, loss: 0.32204195857048035, mean loss: 0.34268669678508834
Epoch: 46, step: 148, loss: 0.33341115713119507, mean loss: 0.3426865574562365
Epoch: 46, step: 149, loss: 0.32779544591903687, mean loss: 0.3426863337786516
Epoch: 46, step: 150, loss: 0.36649638414382935, mean loss: 0.34268669142116553
Epoch: 46, step: 151, loss: 0.3385971188545227, mean loss: 0.34268662999403615
Epoch: 46, step: 152, loss: 0.33021801710128784, mean loss: 0.3426864427129497
Epoch: 46, step: 153, loss: 0.3685174882411957, mean loss: 0.3426868306946483
Epoch: 46, step: 154, loss: 0.3371673822402954, mean loss: 0.342686747793907
Epoch: 46, step: 155, loss: 0.343197226524353, mean loss: 0.34268675546105526
Epoch: 46, step: 156, loss: 0.364246666431427, mean loss: 0.3426870792758218
Epoch: 46, step: 157, loss: 0.29894256591796875, mean loss: 0.3426864222737288
Epoch: 46, step: 158, loss: 0.3794497549533844, mean loss: 0.34268697441665835
Epoch: 46, step: 159, loss: 0.37692341208457947, mean loss: 0.3426874886008117
Epoch: 46, step: 160, loss: 0.35442373156547546, mean loss: 0.34268766486037416
Epoch: 46, step: 161, loss: 0.31373563408851624, mean loss: 0.34268723005379664
Epoch: 46, step: 162, loss: 0.2962828576564789, mean loss: 0.34268653315541714
Epoch: 46, step: 163, loss: 0.33339670300483704, mean loss: 0.34268639364334064
Epoch: 46, step: 164, loss: 0.3307771682739258, mean loss: 0.34268621479660366
Epoch: 46, step: 165, loss: 0.3076167404651642, mean loss: 0.34268568814884376
Epoch: 46, step: 166, loss: 0.3069831430912018, mean loss: 0.3426851520021414
Epoch: 46, step: 167, loss: 0.28723764419555664, mean loss: 0.3426843193569617
Epoch: 46, step: 168, loss: 0.28829023241996765, mean loss: 0.3426835025430783
Epoch: 46, step: 169, loss: 0.31075024604797363, mean loss: 0.3426830230215524
Epoch: 46, step: 170, loss: 0.3814328610897064, mean loss: 0.342683604894637
Epoch: 46, step: 171, loss: 0.31544652581214905, mean loss: 0.3426831959049217
Epoch: 46, step: 172, loss: 0.3483143746852875, mean loss: 0.34268328046096447
Epoch: 46, step: 173, loss: 0.3000138998031616, mean loss: 0.342682639760333
Epoch: 46, step: 174, loss: 0.3268255293369293, mean loss: 0.3426824016620068
Epoch: 46, step: 175, loss: 0.3209133744239807, mean loss: 0.34268207479973595
Epoch: 46, step: 176, loss: 0.3788570165634155, mean loss: 0.34268261795887417
Epoch: 46, step: 177, loss: 0.32719776034355164, mean loss: 0.3426823854604865
Epoch: 46, step: 178, loss: 0.30076903104782104, mean loss: 0.3426817561591876
Epoch: 46, step: 179, loss: 0.30827683210372925, mean loss: 0.34268123959976093
Epoch: 46, step: 180, loss: 0.4376057982444763, mean loss: 0.3426826647864383
Epoch: 46, step: 181, loss: 0.3442005217075348, mean loss: 0.34268268757502973
Epoch: 46, step: 182, loss: 0.35051578283309937, mean loss: 0.3426828051767121
Epoch: 46, step: 183, loss: 0.3104020655155182, mean loss: 0.34268232053913616
Epoch: 46, step: 184, loss: 0.33227092027664185, mean loss: 0.34268216423292736
Epoch: 46, step: 185, loss: 0.317466676235199, mean loss: 0.3426817856788364
Epoch: 46, step: 186, loss: 0.3598126471042633, mean loss: 0.3426820428565011
Epoch: 46, step: 187, loss: 0.36371684074401855, mean loss: 0.34268235863740976
Epoch: 46, step: 188, loss: 0.3109714686870575, mean loss: 0.34268188259084303
Epoch: 46, step: 189, loss: 0.33501434326171875, mean loss: 0.34268176748682094
Epoch: 46, step: 190, loss: 0.3338726758956909, mean loss: 0.34268163524796197
Epoch: 46, step: 191, loss: 0.3644377589225769, mean loss: 0.3426819618380255
Epoch: 46, step: 192, loss: 0.35027411580085754, mean loss: 0.3426820758052405
Epoch: 46, step: 193, loss: 0.3269799053668976, mean loss: 0.3426818401006196
Epoch: 46, step: 194, loss: 0.32072797417640686, mean loss: 0.342681510557007
Epoch: 46, step: 195, loss: 0.2823832333087921, mean loss: 0.34268060544927287
Epoch: 46, step: 196, loss: 0.354926198720932, mean loss: 0.3426807892590817
Epoch: 46, step: 197, loss: 0.3612588047981262, mean loss: 0.342681068116149
Epoch: 46, step: 198, loss: 0.30647069215774536, mean loss: 0.34268052460450954
Epoch: 46, step: 199, loss: 0.32925835251808167, mean loss: 0.34268032314299285
Epoch: 46, step: 200, loss: 0.35401567816734314, mean loss: 0.3426804932796536
Epoch: 46, step: 201, loss: 0.3674229681491852, mean loss: 0.3426808646433085
Epoch: 46, step: 202, loss: 0.3066575229167938, mean loss: 0.34268032397148285
Epoch: 46, step: 203, loss: 0.3382052779197693, mean loss: 0.34268025680683656
Epoch: 46, step: 204, loss: 0.29800546169281006, mean loss: 0.3426795863060769
Epoch: 46, step: 205, loss: 0.33026939630508423, mean loss: 0.3426794000507865
Epoch: 46, step: 206, loss: 0.311221718788147, mean loss: 0.34267892793298455
Epoch: 46, step: 207, loss: 0.34074506163597107, mean loss: 0.3426788989098981
Epoch: 46, step: 208, loss: 0.3257777988910675, mean loss: 0.34267864526530734
Epoch: 46, step: 209, loss: 0.32786083221435547, mean loss: 0.34267842288914724
Epoch: 46, step: 210, loss: 0.31975358724594116, mean loss: 0.3426780788531955
Epoch: 46, step: 211, loss: 0.3193494975566864, mean loss: 0.3426777287634348
Epoch: 46, step: 212, loss: 0.3537812829017639, mean loss: 0.34267789539089605
Epoch: 46, step: 213, loss: 0.3087591230869293, mean loss: 0.3426773863904413
Epoch: 46, step: 214, loss: 0.3584927022457123, mean loss: 0.3426776237186704
Epoch: 46, step: 215, loss: 0.3284528851509094, mean loss: 0.34267741026220927
Epoch: 46, step: 216, loss: 0.31949737668037415, mean loss: 0.3426770624277893
Epoch: 46, step: 217, loss: 0.33707040548324585, mean loss: 0.34267697829680666
Epoch: 46, step: 218, loss: 0.32836073637008667, mean loss: 0.34267676347691667
Epoch: 46, step: 219, loss: 0.3137738108634949, mean loss: 0.34267632978517226
Epoch: 46, step: 220, loss: 0.3193730115890503, mean loss: 0.3426759801217587
Epoch: 46, step: 221, loss: 0.31886669993400574, mean loss: 0.3426756228718084
Epoch: 46, step: 222, loss: 0.3259366750717163, mean loss: 0.3426753717134997
Epoch: 46, step: 223, loss: 0.35363802313804626, mean loss: 0.3426755361993271
Epoch: 46, step: 224, loss: 0.33141541481018066, mean loss: 0.34267536725273545
Epoch: 46, step: 225, loss: 0.3085378110408783, mean loss: 0.34267485506134443
Epoch: 46, step: 226, loss: 0.3453517556190491, mean loss: 0.34267489522429107
Epoch: 46, step: 227, loss: 0.32217997312545776, mean loss: 0.34267458773281145
Epoch: 46, step: 228, loss: 0.3336375057697296, mean loss: 0.3426744521487873
Epoch: 46, step: 229, loss: 0.34562674164772034, mean loss: 0.3426744964415454
Epoch: 46, step: 230, loss: 0.3111693263053894, mean loss: 0.3426740237812778
Epoch: 46, step: 231, loss: 0.3417818248271942, mean loss: 0.34267401039615186
Epoch: 46, step: 232, loss: 0.32357099652290344, mean loss: 0.3426737238093887
Epoch: 46, step: 233, loss: 0.31110507249832153, mean loss: 0.34267325021805217
Epoch: 46, step: 234, loss: 0.3147404193878174, mean loss: 0.34267283117740005
Epoch: 46, step: 235, loss: 0.3033832311630249, mean loss: 0.34267224177445954
Epoch: 46, step: 236, loss: 0.2954254150390625, mean loss: 0.3426715330118137
Epoch: 46, step: 237, loss: 0.349249005317688, mean loss: 0.3426716316808051
Epoch: 46, step: 238, loss: 0.3247201442718506, mean loss: 0.3426713623936832
Epoch: 46, step: 239, loss: 0.3255464434623718, mean loss: 0.3426711055096238
Epoch: 46, step: 240, loss: 0.32086580991744995, mean loss: 0.34267077842201277
Epoch: 46, step: 241, loss: 0.3846410810947418, mean loss: 0.34267140798284845
Epoch: 46, step: 242, loss: 0.32842588424682617, mean loss: 0.3426711943010608
Epoch: 46, step: 243, loss: 0.35224637389183044, mean loss: 0.34267133792588217
Epoch: 46, step: 244, loss: 0.33374911546707153, mean loss: 0.3426712040972293
Epoch: 46, step: 245, loss: 0.32364708185195923, mean loss: 0.342670918749663
Epoch: 46, step: 246, loss: 0.3193902373313904, mean loss: 0.3426705695621389
Epoch: 46, step: 247, loss: 0.3151091933250427, mean loss: 0.34267015617456636
Epoch: 46, step: 248, loss: 0.3114510476589203, mean loss: 0.34266968793242164
Epoch: 46, step: 249, loss: 0.33595985174179077, mean loss: 0.3426695872959488
Epoch: 46, step: 250, loss: 0.3045434057712555, mean loss: 0.34266901547470363
Epoch: 46, step: 251, loss: 0.31554052233695984, mean loss: 0.3426686086042684
Epoch: 46, step: 252, loss: 0.39489421248435974, mean loss: 0.3426693918669209
Epoch: 46, step: 253, loss: 0.3578210473060608, mean loss: 0.3426696191031223
Epoch: 46, step: 254, loss: 0.295057475566864, mean loss: 0.3426689050530685
Epoch: 46, step: 255, loss: 0.35291996598243713, mean loss: 0.34266905878823545
Epoch: 46, step: 256, loss: 0.34862977266311646, mean loss: 0.3426691481797244
Epoch: 46, step: 257, loss: 0.3062909245491028, mean loss: 0.34266860263184595
Epoch: 46, step: 258, loss: 0.33829131722450256, mean loss: 0.3426685369886474
Epoch: 46, step: 259, loss: 0.3030722439289093, mean loss: 0.3426679431986369
Epoch: 46, step: 260, loss: 0.34142982959747314, mean loss: 0.3426679246320387
Epoch: 46, step: 261, loss: 0.3028131127357483, mean loss: 0.3426673269831784
Epoch: 46, step: 262, loss: 0.3054550290107727, mean loss: 0.3426667689689032
Epoch: 46, step: 263, loss: 0.37267550826072693, mean loss: 0.3426672189559967
Epoch: 46, step: 264, loss: 0.33397340774536133, mean loss: 0.34266708859250034
Epoch: 46, step: 265, loss: 0.29686984419822693, mean loss: 0.34266640187418584
Epoch: 46, step: 266, loss: 0.32986992597579956, mean loss: 0.3426662099970825
Epoch: 46, step: 267, loss: 0.34000667929649353, mean loss: 0.3426661701192756
Epoch: 46, step: 268, loss: 0.3459942638874054, mean loss: 0.3426662200209709
Epoch: 46, step: 269, loss: 0.33929526805877686, mean loss: 0.34266616947741435
Epoch: 46, step: 270, loss: 0.3676920235157013, mean loss: 0.34266654470575286
Epoch: 46, step: 271, loss: 0.35605525970458984, mean loss: 0.3426667454481512
Epoch: 46, step: 272, loss: 0.3382873237133026, mean loss: 0.3426666797867011
Epoch: 46, step: 273, loss: 0.32879090309143066, mean loss: 0.34266647174782894
Epoch: 46, step: 274, loss: 0.3062026798725128, mean loss: 0.3426659250560963
Epoch: 46, step: 275, loss: 0.32275715470314026, mean loss: 0.34266562657378213
Epoch: 46, step: 276, loss: 0.37431570887565613, mean loss: 0.3426661010806456
Epoch: 46, step: 277, loss: 0.3562856614589691, mean loss: 0.34266630526583314
Epoch: 46, step: 278, loss: 0.3026387095451355, mean loss: 0.3426657051789447
Epoch: 46, step: 279, loss: 0.37118643522262573, mean loss: 0.34266613275045527
Epoch: 46, step: 280, loss: 0.38448894023895264, mean loss: 0.3426667597320532
Epoch: 46, step: 281, loss: 0.3580251932144165, mean loss: 0.34266698997271344
Epoch: 46, step: 282, loss: 0.33458343148231506, mean loss: 0.34266686879265
Epoch: 46, step: 283, loss: 0.3468424379825592, mean loss: 0.34266693138737914
Epoch: 46, step: 284, loss: 0.33332619071006775, mean loss: 0.3426667913651831
Epoch: 46, step: 285, loss: 0.33656373620033264, mean loss: 0.34266669987882176
Epoch: 46, step: 286, loss: 0.3601479232311249, mean loss: 0.34266696192291274
Epoch: 46, step: 287, loss: 0.2928682267665863, mean loss: 0.34266621544948733
Epoch: 46, step: 288, loss: 0.3021450638771057, mean loss: 0.34266560805435337
Epoch: 46, step: 289, loss: 0.3590775728225708, mean loss: 0.3426658540591615
Epoch: 46, step: 290, loss: 0.3160723149776459, mean loss: 0.3426654554450705
Epoch: 46, step: 291, loss: 0.3428199589252472, mean loss: 0.34266545776090895
Epoch: 46, step: 292, loss: 0.3221902847290039, mean loss: 0.34266515086501986
Epoch: 46, step: 293, loss: 0.3134259581565857, mean loss: 0.3426647126145821
Epoch: 46, step: 294, loss: 0.3749946355819702, mean loss: 0.34266519718304034
Epoch: 46, step: 295, loss: 0.33571505546569824, mean loss: 0.34266509301424963
Epoch: 46, step: 296, loss: 0.41317981481552124, mean loss: 0.34266614987373617
Epoch: 46, step: 297, loss: 0.323359876871109, mean loss: 0.3426658605198049
Epoch: 46, step: 298, loss: 0.3262442350387573, mean loss: 0.34266561440339105
Epoch: 46, step: 299, loss: 0.348193496465683, mean loss: 0.3426656972503736
Epoch: 46, step: 300, loss: 0.3612116277217865, mean loss: 0.3426659751961281
Epoch: 46, step: 301, loss: 0.3362125754356384, mean loss: 0.342665878481208
Epoch: 46, step: 302, loss: 0.30271902680397034, mean loss: 0.34266527982022105
Epoch: 46, step: 303, loss: 0.31527164578437805, mean loss: 0.3426648692933952
Epoch: 46, step: 304, loss: 0.3415474593639374, mean loss: 0.3426648525479033
Epoch: 46, step: 305, loss: 0.325176864862442, mean loss: 0.34266459047705533
Epoch: 46, step: 306, loss: 0.3351656198501587, mean loss: 0.34266447810093886
Epoch: 46, step: 307, loss: 0.3574347198009491, mean loss: 0.3426646994376544
Epoch: 46, step: 308, loss: 0.31372231245040894, mean loss: 0.3426642657333853
Epoch: 46, step: 309, loss: 0.35568031668663025, mean loss: 0.3426644607771554
Epoch: 46, step: 310, loss: 0.33760032057762146, mean loss: 0.34266438489283385
Epoch: 46, step: 311, loss: 0.3206689953804016, mean loss: 0.34266405530476274
Epoch: 46, step: 312, loss: 0.3185296654701233, mean loss: 0.3426636936704394
Epoch: 46, step: 313, loss: 0.3175109922885895, mean loss: 0.34266331678318807
Epoch: 46, step: 314, loss: 0.32959166169166565, mean loss: 0.3426631209208723
Epoch: 46, step: 315, loss: 0.31271693110466003, mean loss: 0.3426626722215943
Epoch: 46, step: 316, loss: 0.3584384024143219, mean loss: 0.34266290859399196
Epoch: 46, step: 317, loss: 0.3289686441421509, mean loss: 0.342662703411881
Epoch: 46, step: 318, loss: 0.31740233302116394, mean loss: 0.3426623249396758
Epoch: 46, step: 319, loss: 0.31139668822288513, mean loss: 0.34266185649851677
Epoch: 46, step: 320, loss: 0.3411503732204437, mean loss: 0.34266183385287624
Epoch: 46, step: 321, loss: 0.33145663142204285, mean loss: 0.3426616659746149
Epoch: 46, step: 322, loss: 0.33685651421546936, mean loss: 0.34266157900214034
Epoch: 46, step: 323, loss: 0.29413485527038574, mean loss: 0.3426608519882413
Epoch: 46, step: 324, loss: 0.32935550808906555, mean loss: 0.34266065265426027
Epoch: 46, step: 325, loss: 0.35646384954452515, mean loss: 0.34266085944372676
Epoch: 46, step: 326, loss: 0.3179405629634857, mean loss: 0.34266048910775454
Epoch: 46, step: 327, loss: 0.2867696285247803, mean loss: 0.3426596518165785
Epoch: 46, step: 328, loss: 0.30733832716941833, mean loss: 0.34265912268193816
Epoch: 46, step: 329, loss: 0.34141045808792114, mean loss: 0.3426591039764734
Epoch: 46, step: 330, loss: 0.34506961703300476, mean loss: 0.3426591400863237
Epoch: 46, step: 331, loss: 0.35029226541519165, mean loss: 0.34265925442998313
Epoch: 46, step: 332, loss: 0.3182215094566345, mean loss: 0.3426588883598336
Epoch: 46, step: 333, loss: 0.33095142245292664, mean loss: 0.34265871298810424
Epoch: 46, step: 334, loss: 0.31512686610221863, mean loss: 0.342658300581584
Epoch: 46, step: 335, loss: 0.35979515314102173, mean loss: 0.3426585572750016
Epoch: 46, step: 336, loss: 0.31619182229042053, mean loss: 0.34265816083493955
Epoch: 46, step: 337, loss: 0.37871289253234863, mean loss: 0.34265870088364536
Epoch: 46, step: 338, loss: 0.3258940577507019, mean loss: 0.3426584497768477
Epoch: 46, step: 339, loss: 0.30144819617271423, mean loss: 0.34265783252423243
Epoch: 46, step: 340, loss: 0.3204750120639801, mean loss: 0.3426575002719976
Epoch: 46, step: 341, loss: 0.30837199091911316, mean loss: 0.34265698675449835
Epoch: 46, step: 342, loss: 0.3648802638053894, mean loss: 0.34265731960271756
Epoch: 46, step: 343, loss: 0.3562568128108978, mean loss: 0.34265752328551785
Epoch: 46, step: 344, loss: 0.34907352924346924, mean loss: 0.34265761937810507
Epoch: 46, step: 345, loss: 0.38238465785980225, mean loss: 0.3426582143614581
Epoch: 46, step: 346, loss: 0.35173702239990234, mean loss: 0.3426583503307867
Epoch: 46, step: 347, loss: 0.33425644040107727, mean loss: 0.34265822450094885
Epoch: 46, step: 348, loss: 0.31985044479370117, mean loss: 0.3426578829290604
Epoch: 46, step: 349, loss: 0.3169018030166626, mean loss: 0.34265749720887123
Epoch: 46, step: 350, loss: 0.3410255014896393, mean loss: 0.34265747276865083
Epoch: 46, step: 351, loss: 0.33506712317466736, mean loss: 0.3426573590998238
Epoch: 46, step: 352, loss: 0.33931705355644226, mean loss: 0.3426573090780267
Epoch: 46, step: 353, loss: 0.3123577833175659, mean loss: 0.342656855342878
Epoch: 46, step: 354, loss: 0.3351212441921234, mean loss: 0.3426567424988529
Epoch: 46, step: 355, loss: 0.30550333857536316, mean loss: 0.342656186143598
Epoch: 46, step: 356, loss: 0.32531702518463135, mean loss: 0.34265592650146987
Epoch: 46, step: 357, loss: 0.3442903161048889, mean loss: 0.34265595097497475
Epoch: 46, step: 358, loss: 0.33785566687583923, mean loss: 0.3426558790961418
Epoch: 46, step: 359, loss: 0.3776627480983734, mean loss: 0.3426564032766192
Epoch: 46, step: 360, loss: 0.3342357873916626, mean loss: 0.3426562771911826
Epoch: 46, step: 361, loss: 0.3211328983306885, mean loss: 0.3426559549173698
Epoch: 46, step: 362, loss: 0.3440816104412079, mean loss: 0.34265597626367256
Epoch: 46, step: 363, loss: 0.30553317070007324, mean loss: 0.3426554204332006
Epoch: 46, step: 364, loss: 0.34399738907814026, mean loss: 0.3426554405258602
Epoch: 46, step: 365, loss: 0.3169935941696167, mean loss: 0.34265505630896614
Epoch: 46, step: 366, loss: 0.35044294595718384, mean loss: 0.3426551729098502
Epoch: 46, step: 367, loss: 0.3371211588382721, mean loss: 0.3426550900554055
Epoch: 46, step: 368, loss: 0.35432949662208557, mean loss: 0.34265526484028663
Epoch: 46, step: 369, loss: 0.3019408881664276, mean loss: 0.34265465528887973
Epoch: 46, step: 370, loss: 0.33425915241241455, mean loss: 0.34265452959829096
Epoch: 46, step: 371, loss: 0.33437713980674744, mean loss: 0.3426544056778497
Epoch: 46, step: 372, loss: 0.3212868571281433, mean loss: 0.3426540857900022
Epoch: 46, step: 373, loss: 0.3186948597431183, mean loss: 0.3426537271082146
Epoch: 46, step: 374, loss: 0.33034855127334595, mean loss: 0.3426535428962379
Epoch: 46, step: 375, loss: 0.332077294588089, mean loss: 0.34265338456916744
Epoch: 46, step: 376, loss: 0.325501024723053, mean loss: 0.3426531278011573
Epoch: 46, step: 377, loss: 0.3547060787677765, mean loss: 0.34265330822915296
Epoch: 46, step: 378, loss: 0.32484927773475647, mean loss: 0.34265304171371963
Epoch: 46, step: 379, loss: 0.3554089367389679, mean loss: 0.34265323265879816
Epoch: 46, step: 380, loss: 0.34445396065711975, mean loss: 0.3426532596137865
Epoch: 46, step: 381, loss: 0.3002447783946991, mean loss: 0.3426526248133012
Epoch: 46, step: 382, loss: 0.33154478669166565, mean loss: 0.3426524585457226
Epoch: 46, step: 383, loss: 0.36830055713653564, mean loss: 0.3426528424533174
Epoch: 46, step: 384, loss: 0.34678521752357483, mean loss: 0.3426529043068861
Epoch: 46, step: 385, loss: 0.34758585691452026, mean loss: 0.3426529781424288
Epoch: 46, step: 386, loss: 0.3023955821990967, mean loss: 0.34265237558602424
Epoch: 46, step: 387, loss: 0.28396865725517273, mean loss: 0.34265149724503263
Epoch: 46, step: 388, loss: 0.3206038773059845, mean loss: 0.3426511672550615
Epoch: 46, step: 389, loss: 0.3343459367752075, mean loss: 0.3426510429513156
Epoch: 46, step: 390, loss: 0.2879602313041687, mean loss: 0.34265022441039444
Epoch: 46, step: 391, loss: 0.33020684123039246, mean loss: 0.34265003817680995
Epoch: 46, step: 392, loss: 0.3401588201522827, mean loss: 0.34265000089261544
Epoch: 46, step: 393, loss: 0.3409571349620819, mean loss: 0.342649975557138
Epoch: 46, step: 394, loss: 0.36087214946746826, mean loss: 0.3426502482666055
Epoch: 46, step: 395, loss: 0.32312777638435364, mean loss: 0.342649956101507
Epoch: 46, step: 396, loss: 0.32284054160118103, mean loss: 0.34264965964658267
Epoch: 46, step: 397, loss: 0.359316885471344, mean loss: 0.3426499090738046
Epoch: 46, step: 398, loss: 0.3744603097438812, mean loss: 0.34265038511350154
Epoch: 46, step: 399, loss: 0.3237168490886688, mean loss: 0.3426501017791303
Epoch: 46, step: 400, loss: 0.38001343607902527, mean loss: 0.3426506609012298
Epoch: 46, step: 401, loss: 0.3150551915168762, mean loss: 0.34265024795612786
Epoch: 46, step: 402, loss: 0.33659082651138306, mean loss: 0.34265015728287535
Epoch: 46, step: 403, loss: 0.28723710775375366, mean loss: 0.34264932809377
Epoch: 46, step: 404, loss: 0.34295204281806946, mean loss: 0.3426493326234611
Epoch: 46, step: 405, loss: 0.35083577036857605, mean loss: 0.34264945511991096
Epoch: 46, step: 406, loss: 0.3316662013530731, mean loss: 0.3426492907762117
Epoch: 46, step: 407, loss: 0.38168424367904663, mean loss: 0.34264987485199727
Epoch: 46, step: 408, loss: 0.3151700496673584, mean loss: 0.3426494636804924
Epoch: 46, step: 409, loss: 0.32517263293266296, mean loss: 0.34264920218438644
Epoch: 46, step: 410, loss: 0.3588823676109314, mean loss: 0.34264944506858525
Epoch: 46, step: 411, loss: 0.3369086682796478, mean loss: 0.34264935917510286
Epoch: 46, step: 412, loss: 0.3272785544395447, mean loss: 0.34264912920061663
Epoch: 46, step: 413, loss: 0.3421018421649933, mean loss: 0.34264912101235495
Epoch: 46, step: 414, loss: 0.4144856035709381, mean loss: 0.34265019578131556
Epoch: 46, step: 415, loss: 0.33005452156066895, mean loss: 0.34265000733615963
Epoch: 46, step: 416, loss: 0.38796326518058777, mean loss: 0.34265068526225056
Epoch: 46, step: 417, loss: 0.3023282289505005, mean loss: 0.3426500820119542
Epoch: 46, step: 418, loss: 0.3123982846736908, mean loss: 0.3426496294320679
Epoch: 46, step: 419, loss: 0.3166877031326294, mean loss: 0.3426492410363061
Epoch: 46, step: 420, loss: 0.406097948551178, mean loss: 0.3426501902278315
Epoch: 46, step: 421, loss: 0.3055875301361084, mean loss: 0.3426496357793964
Epoch: 46, step: 422, loss: 0.33543235063552856, mean loss: 0.34264952781217056
Epoch: 46, step: 423, loss: 0.28270423412323, mean loss: 0.34264863107189875
Epoch: 46, step: 424, loss: 0.31887659430503845, mean loss: 0.342648275463935
Epoch: 46, step: 425, loss: 0.321584016084671, mean loss: 0.3426479603665621
Epoch: 46, step: 426, loss: 0.3459341824054718, mean loss: 0.34264800952397245
Epoch: 46, step: 427, loss: 0.29571887850761414, mean loss: 0.34264730753852674
Epoch: 46, step: 428, loss: 0.34427961707115173, mean loss: 0.3426473319549259
Epoch: 46, step: 429, loss: 0.3107328712940216, mean loss: 0.3426468545794411
Epoch: 46, step: 430, loss: 0.3306366801261902, mean loss: 0.34264667493432177
Epoch: 46, step: 431, loss: 0.30978864431381226, mean loss: 0.34264618345965053
Epoch: 46, step: 432, loss: 0.2955797612667084, mean loss: 0.34264547947319896
Epoch: 46, step: 433, loss: 0.31838488578796387, mean loss: 0.34264511660572333
Epoch: 46, step: 434, loss: 0.31589287519454956, mean loss: 0.34264471647647504
Epoch: 46, step: 435, loss: 0.35331693291664124, mean loss: 0.34264487609682265
Epoch: 46, step: 436, loss: 0.3241615295410156, mean loss: 0.34264459965245964
Epoch: 46, step: 437, loss: 0.33331191539764404, mean loss: 0.342644460071169
Epoch: 46, step: 438, loss: 0.37892794609069824, mean loss: 0.34264500272534276
Epoch: 46, step: 439, loss: 0.3544682264328003, mean loss: 0.3426451795502965
Epoch: 46, step: 440, loss: 0.32331448793411255, mean loss: 0.34264489044999563
Epoch: 46, step: 441, loss: 0.3432048261165619, mean loss: 0.3426448988239924
Epoch: 46, step: 442, loss: 0.36954155564308167, mean loss: 0.34264530106511015
Epoch: 46, step: 443, loss: 0.31906867027282715, mean loss: 0.3426449484804539
Epoch: 46, step: 444, loss: 0.32517343759536743, mean loss: 0.34264468720077446
Epoch: 46, step: 445, loss: 0.3262726664543152, mean loss: 0.34264444236720565
Epoch: 46, step: 446, loss: 0.35282668471336365, mean loss: 0.34264459463414265
Epoch: 46, step: 447, loss: 0.2843093276023865, mean loss: 0.3426437222919511
Epoch: 46, step: 448, loss: 0.31972554326057434, mean loss: 0.3426433795799593
Epoch: 46, step: 449, loss: 0.32515838742256165, mean loss: 0.3426431181182229
Epoch: 46, step: 450, loss: 0.408524751663208, mean loss: 0.3426441032641451
Epoch: 46, step: 451, loss: 0.3088272511959076, mean loss: 0.34264359759915214
Epoch: 46, step: 452, loss: 0.3271556794643402, mean loss: 0.3426433660110406
Epoch: 46, step: 453, loss: 0.3847843408584595, mean loss: 0.34264399612819196
Epoch: 46, step: 454, loss: 0.3518138527870178, mean loss: 0.34264413323934284
Epoch: 46, step: 455, loss: 0.3168153166770935, mean loss: 0.34264374704292294
Epoch: 46, step: 456, loss: 0.36530938744544983, mean loss: 0.34264408593798135
Epoch: 46, step: 457, loss: 0.2819293439388275, mean loss: 0.34264317814900974
Epoch: 46, step: 458, loss: 0.32753774523735046, mean loss: 0.3426429523003948
Epoch: 46, step: 459, loss: 0.3631899058818817, mean loss: 0.34264325950321733
Epoch: 46, step: 460, loss: 0.33951959013938904, mean loss: 0.34264321280112625
Epoch: 46, step: 461, loss: 0.3191460967063904, mean loss: 0.342642861500165
Epoch: 46, step: 462, loss: 0.36090347170829773, mean loss: 0.34264313450703043
Epoch: 46, step: 463, loss: 0.2815580368041992, mean loss: 0.34264222126253663
Epoch: 46, step: 464, loss: 0.3473691940307617, mean loss: 0.34264229193144735
Epoch: 46, step: 465, loss: 0.3102257251739502, mean loss: 0.3426418073064398
Epoch: 46, step: 466, loss: 0.32388535141944885, mean loss: 0.3426415269031585
Epoch: 46, step: 467, loss: 0.2992233633995056, mean loss: 0.3426408778245915
Epoch: 46, step: 468, loss: 0.31004512310028076, mean loss: 0.34264039054259304
Epoch: 46, step: 469, loss: 0.3597691059112549, mean loss: 0.34264064660016724
Epoch: 46, step: 470, loss: 0.32840797305107117, mean loss: 0.3426404338387718
Epoch: 46, step: 471, loss: 0.3460046947002411, mean loss: 0.34264048412968395
Epoch: 46, step: 472, loss: 0.3254137933254242, mean loss: 0.3426402266190212
Epoch: 46, step: 473, loss: 0.30318066477775574, mean loss: 0.34263963677236153
Epoch: 46, step: 474, loss: 0.34504544734954834, mean loss: 0.3426396727341932
Epoch: 46, step: 475, loss: 0.33523163199424744, mean loss: 0.34263956200114776
Epoch: 46, step: 476, loss: 0.31084558367729187, mean loss: 0.3426390867619387
Epoch: 46, step: 477, loss: 0.32043400406837463, mean loss: 0.3426387548573216
Epoch: 46, step: 478, loss: 0.327924907207489, mean loss: 0.34263853492925184
Epoch: 46, step: 479, loss: 0.34295475482940674, mean loss: 0.3426385396557241
Epoch: 46, step: 480, loss: 0.35140979290008545, mean loss: 0.34263867075583987
Epoch: 46, step: 481, loss: 0.3366364538669586, mean loss: 0.3426385810446497
Epoch: 46, step: 482, loss: 0.2938992381095886, mean loss: 0.3426378525806185
Epoch: 46, step: 483, loss: 0.33399268984794617, mean loss: 0.34263772337091664
Epoch: 46, step: 484, loss: 0.39135685563087463, mean loss: 0.34263845151111094
Epoch: 46, step: 485, loss: 0.3193797767162323, mean loss: 0.3426381038997704
Epoch: 46, step: 486, loss: 0.30671197175979614, mean loss: 0.3426375669756153
Epoch: 46, step: 487, loss: 0.3061652183532715, mean loss: 0.3426370218962779
Epoch: 46, step: 488, loss: 0.31439295411109924, mean loss: 0.34263659979492567
Epoch: 46, step: 489, loss: 0.3413163721561432, mean loss: 0.3426365800647102
Epoch: 46, step: 490, loss: 0.3223889470100403, mean loss: 0.3426362774773523
Epoch: 46, step: 491, loss: 0.3061487674713135, mean loss: 0.3426357322040245
Epoch: 46, step: 492, loss: 0.3010155260562897, mean loss: 0.3426351102364206
Epoch: 46, step: 493, loss: 0.36001524329185486, mean loss: 0.34263536995926136
Epoch: 46, step: 494, loss: 0.36568352580070496, mean loss: 0.34263571437797413
Epoch: 46, step: 495, loss: 0.32582491636276245, mean loss: 0.34263546317059196
Epoch: 46, step: 496, loss: 0.3397231101989746, mean loss: 0.3426354196513234
Epoch: 46, step: 497, loss: 0.30558061599731445, mean loss: 0.34263486594994486
Epoch: 46, step: 498, loss: 0.3173927068710327, mean loss: 0.34263448876782393
Epoch: 46, step: 499, loss: 0.32948485016822815, mean loss: 0.34263429228168146
Epoch: 46, step: 500, loss: 0.3333323895931244, mean loss: 0.3426341532917272
Epoch: 46, step: 501, loss: 0.30123239755630493, mean loss: 0.3426335346718226
Epoch: 46, step: 502, loss: 0.34259745478630066, mean loss: 0.3426335341327295
Epoch: 46, step: 503, loss: 0.2978273332118988, mean loss: 0.342632864664033
Epoch: 46, step: 504, loss: 0.3387818932533264, mean loss: 0.34263280712587446
Epoch: 46, step: 505, loss: 0.35179296135902405, mean loss: 0.3426329439875842
Epoch: 46, step: 506, loss: 0.36516669392585754, mean loss: 0.3426332806589314
Epoch: 46, step: 507, loss: 0.30787739157676697, mean loss: 0.34263276138729626
Epoch: 46, step: 508, loss: 0.3501994013786316, mean loss: 0.34263287443526946
Epoch: 46, step: 509, loss: 0.38188397884368896, mean loss: 0.34263346085031127
Epoch: 46, step: 510, loss: 0.3232032060623169, mean loss: 0.3426331705648883
Epoch: 46, step: 511, loss: 0.3322025537490845, mean loss: 0.34263301473518804
Epoch: 46, step: 512, loss: 0.3076125681400299, mean loss: 0.342632491550005
Epoch: 46, step: 513, loss: 0.3422822654247284, mean loss: 0.34263248631790777
Epoch: 46, step: 514, loss: 0.33416634798049927, mean loss: 0.3426323598424848
Epoch: 46, step: 515, loss: 0.2811878025531769, mean loss: 0.34263144193753575
Epoch: 46, step: 516, loss: 0.32871708273887634, mean loss: 0.34263123407749185
Epoch: 46, step: 517, loss: 0.3372534215450287, mean loss: 0.3426311537420891
Epoch: 46, step: 518, loss: 0.3361572325229645, mean loss: 0.3426310570341253
Epoch: 46, step: 519, loss: 0.3556708097457886, mean loss: 0.3426312518201063
Epoch: 46, step: 520, loss: 0.34620150923728943, mean loss: 0.3426313051513098
Epoch: 46, step: 521, loss: 0.3569033145904541, mean loss: 0.3426315183381983
Epoch: 46, step: 522, loss: 0.3268844187259674, mean loss: 0.34263128312079333
Epoch: 46, step: 523, loss: 0.3240814208984375, mean loss: 0.3426310060421319
Epoch: 46, step: 524, loss: 0.38203686475753784, mean loss: 0.3426315946373121
Epoch: 46, step: 525, loss: 0.3520912826061249, mean loss: 0.34263173593212864
Epoch: 46, step: 526, loss: 0.32412174344062805, mean loss: 0.34263145946138895
Epoch: 46, step: 527, loss: 0.3236442506313324, mean loss: 0.34263117586704034
Epoch: 46, step: 528, loss: 0.29822298884391785, mean loss: 0.342630512592997
Epoch: 46, step: 529, loss: 0.33763396739959717, mean loss: 0.3426304379664595
Epoch: 46, step: 530, loss: 0.3429623246192932, mean loss: 0.34263044292332084
Epoch: 46, step: 531, loss: 0.41406935453414917, mean loss: 0.34263150987641855
Epoch: 46, step: 532, loss: 0.3148609399795532, mean loss: 0.3426310951241164
Epoch: 46, step: 533, loss: 0.3219895660877228, mean loss: 0.34263078684834597
Epoch: 46, step: 534, loss: 0.310433566570282, mean loss: 0.3426303059985681
Epoch: 46, step: 535, loss: 0.307534396648407, mean loss: 0.34262978186611065
Epoch: 46, step: 536, loss: 0.3264129161834717, mean loss: 0.34262953968236665
Epoch: 46, step: 537, loss: 0.3265729248523712, mean loss: 0.3426292998954005
Epoch: 46, step: 538, loss: 0.3225085437297821, mean loss: 0.3426289994196726
Epoch: 46, step: 539, loss: 0.3028646409511566, mean loss: 0.3426284056027192
Epoch: 46, step: 540, loss: 0.3517664074897766, mean loss: 0.3426285420620918
Epoch: 46, step: 541, loss: 0.33385568857192993, mean loss: 0.3426284110575001
Epoch: 46, step: 542, loss: 0.315085768699646, mean loss: 0.3426279997707117
Epoch: 46, step: 543, loss: 0.3271232545375824, mean loss: 0.34262776824602476
Epoch: 46, step: 544, loss: 0.3264647126197815, mean loss: 0.34262752689471854
Epoch: 46, step: 545, loss: 0.33479923009872437, mean loss: 0.3426274100021279
Epoch: 46, step: 546, loss: 0.31694987416267395, mean loss: 0.3426270265893695
Epoch: 46, step: 547, loss: 0.3519213795661926, mean loss: 0.3426271653690532
Epoch: 46, step: 548, loss: 0.3464493751525879, mean loss: 0.34262722243995913
Epoch: 46, step: 549, loss: 0.31743910908699036, mean loss: 0.34262684635202423
Epoch: 46, step: 550, loss: 0.328421413898468, mean loss: 0.34262663425150236
Epoch: 46, step: 551, loss: 0.30557239055633545, mean loss: 0.3426260810049111
Epoch: 46, step: 552, loss: 0.355028361082077, mean loss: 0.34262626617713554
Epoch: 46, step: 553, loss: 0.35566943883895874, mean loss: 0.34262646091529825
Epoch: 46, step: 554, loss: 0.3282032907009125, mean loss: 0.3426262455766068
Epoch: 46, step: 555, loss: 0.3317205309867859, mean loss: 0.34262608275614415
Epoch: 46, step: 556, loss: 0.3709900975227356, mean loss: 0.34262650621973484
Epoch: 46, step: 557, loss: 0.3173803687095642, mean loss: 0.3426261293104531
Epoch: 46, step: 558, loss: 0.33029666543006897, mean loss: 0.3426259452419002
Epoch: 46, step: 559, loss: 0.35360416769981384, mean loss: 0.34262610913510544
Epoch: 46, step: 560, loss: 0.33674728870391846, mean loss: 0.34262602137186843
Epoch: 46, step: 561, loss: 0.3404211401939392, mean loss: 0.34262598845631625
Epoch: 46, step: 562, loss: 0.3223062753677368, mean loss: 0.3426256851181598
Epoch: 46, step: 563, loss: 0.33587729930877686, mean loss: 0.3426255843779405
Epoch: 46, step: 564, loss: 0.30568498373031616, mean loss: 0.3426250329351566
Epoch: 46, step: 565, loss: 0.35643571615219116, mean loss: 0.34262523909552706
Epoch: 46, step: 566, loss: 0.32427406311035156, mean loss: 0.3426249651605808
Epoch: 46, step: 567, loss: 0.29167258739471436, mean loss: 0.3426242045865157
Epoch: 46, step: 568, loss: 0.3220536708831787, mean loss: 0.34262389753154426
Epoch: 46, step: 569, loss: 0.34730029106140137, mean loss: 0.3426239673347137
Epoch: 46, step: 570, loss: 0.3801788091659546, mean loss: 0.342624527896574
Epoch: 46, step: 571, loss: 0.33679428696632385, mean loss: 0.3426244408728572
Epoch: 46, step: 572, loss: 0.28287532925605774, mean loss: 0.34262354905513975
Epoch: 46, step: 573, loss: 0.3155459761619568, mean loss: 0.3426231449001964
Epoch: 46, step: 574, loss: 0.3517041504383087, mean loss: 0.3426232804396155
Epoch: 46, step: 575, loss: 0.33853739500045776, mean loss: 0.34262321945625074
Epoch: 46, step: 576, loss: 0.3199639916419983, mean loss: 0.3426228812638683
Epoch: 46, step: 577, loss: 0.32140427827835083, mean loss: 0.3426225645777547
Epoch: 46, step: 578, loss: 0.36863377690315247, mean loss: 0.34262295278742183
Epoch: 46, step: 579, loss: 0.358372300863266, mean loss: 0.3426231878382856
Epoch: 46, step: 580, loss: 0.353121280670166, mean loss: 0.34262334451454607
Epoch: 46, step: 581, loss: 0.3960725963115692, mean loss: 0.34262414219313897
Epoch: 46, step: 582, loss: 0.3032492697238922, mean loss: 0.3426235545698687
Epoch: 46, step: 583, loss: 0.3688221573829651, mean loss: 0.34262394554710746
Epoch: 46, step: 584, loss: 0.32886555790901184, mean loss: 0.34262374022561876
Epoch: 46, step: 585, loss: 0.33618244528770447, mean loss: 0.34262364410123525
Epoch: 46, step: 586, loss: 0.3168978989124298, mean loss: 0.34262326019791806
Epoch: 46, step: 587, loss: 0.321825236082077, mean loss: 0.342622949835235
Epoch: 46, step: 588, loss: 0.3142928183078766, mean loss: 0.34262252707947827
Epoch: 46, step: 589, loss: 0.3304905295372009, mean loss: 0.3426223460427167
Epoch: 46, step: 590, loss: 0.307985782623291, mean loss: 0.3426218291947958
Epoch: 46, step: 591, loss: 0.3374604880809784, mean loss: 0.3426217521782458
Epoch: 46, step: 592, loss: 0.3581847548484802, mean loss: 0.34262198440294506
Epoch: 46, step: 593, loss: 0.3714524209499359, mean loss: 0.34262241459239484
Epoch: 46, step: 594, loss: 0.3182925581932068, mean loss: 0.3426220515631584
Epoch: 46, step: 595, loss: 0.3223337233066559, mean loss: 0.34262174884265323
Epoch: 46, step: 596, loss: 0.321774423122406, mean loss: 0.3426214377860334
Epoch: 46, step: 597, loss: 0.302752822637558, mean loss: 0.34262084292740264
Epoch: 46, step: 598, loss: 0.3293781876564026, mean loss: 0.34262064534365866
Epoch: 46, step: 599, loss: 0.3198401629924774, mean loss: 0.3426203054582094
Epoch: 46, step: 600, loss: 0.33442434668540955, mean loss: 0.34262018317609416
Epoch: 46, step: 601, loss: 0.31984129548072815, mean loss: 0.3426198433245784
Epoch: 46, step: 602, loss: 0.3303085267543793, mean loss: 0.3426196596476039
Epoch: 46, step: 603, loss: 0.3460371196269989, mean loss: 0.3426197106331618
Epoch: 46, step: 604, loss: 0.3232482075691223, mean loss: 0.34261942163134074
Epoch: 46, step: 605, loss: 0.3221288323402405, mean loss: 0.34261911593852723
Epoch: 46, step: 606, loss: 0.34792789816856384, mean loss: 0.3426191951374386
Epoch: 46, step: 607, loss: 0.33808085322380066, mean loss: 0.3426191274333284
Epoch: 46, step: 608, loss: 0.3104836940765381, mean loss: 0.34261864803611575
Epoch: 46, step: 609, loss: 0.3716592490673065, mean loss: 0.3426190812580782
Epoch: 46, step: 610, loss: 0.35200709104537964, mean loss: 0.3426192213044687
Epoch: 46, step: 611, loss: 0.3628866970539093, mean loss: 0.34261952364165693
Epoch: 46, step: 612, loss: 0.35004597902297974, mean loss: 0.34261963442309673
Epoch: 46, step: 613, loss: 0.32819366455078125, mean loss: 0.34261941923216216
Epoch: 46, step: 614, loss: 0.3579210042953491, mean loss: 0.3426196474811674
Epoch: 46, step: 615, loss: 0.312569797039032, mean loss: 0.3426191992435415
Epoch: 46, step: 616, loss: 0.3593004047870636, mean loss: 0.342619448064495
Epoch: 46, step: 617, loss: 0.3281928598880768, mean loss: 0.342619232877177
Epoch: 46, step: 618, loss: 0.33619609475135803, mean loss: 0.3426191370709314
Epoch: 46, step: 619, loss: 0.2955086827278137, mean loss: 0.34261843439128303
Epoch: 46, step: 620, loss: 0.3584545850753784, mean loss: 0.342618670593098
Epoch: 46, step: 621, loss: 0.308531254529953, mean loss: 0.3426181621747574
Epoch: 46, step: 622, loss: 0.3981972932815552, mean loss: 0.3426189911325199
Epoch: 46, step: 623, loss: 0.3800717294216156, mean loss: 0.3426195497284257
Epoch: 46, step: 624, loss: 0.35294824838638306, mean loss: 0.34261970377544587
Epoch: 46, step: 625, loss: 0.34471574425697327, mean loss: 0.34261973503630316
Epoch: 46, step: 626, loss: 0.34993070363998413, mean loss: 0.34261984407224005
Epoch: 46, step: 627, loss: 0.3742445409297943, mean loss: 0.3426203157165886
Epoch: 46, step: 628, loss: 0.3209981620311737, mean loss: 0.34261999325296
Epoch: 46, step: 629, loss: 0.3076728582382202, mean loss: 0.34261947207398463
Epoch: 46, step: 630, loss: 0.30460110306739807, mean loss: 0.3426189051010668
Epoch: 46, step: 631, loss: 0.3398961126804352, mean loss: 0.34261886449631224
Epoch: 46, step: 632, loss: 0.3434063196182251, mean loss: 0.34261887623938336
Epoch: 46, step: 633, loss: 0.3218091130256653, mean loss: 0.342618565914542
Epoch: 46, step: 634, loss: 0.330186665058136, mean loss: 0.34261838052703464
Epoch: 46, step: 635, loss: 0.31853803992271423, mean loss: 0.34261802144053594
Epoch: 46, step: 636, loss: 0.35413166880607605, mean loss: 0.342618193129705
Epoch: 46, step: 637, loss: 0.3259010910987854, mean loss: 0.3426179438513949
Epoch: 46, step: 638, loss: 0.30379629135131836, mean loss: 0.34261736496806877
Epoch: 46, step: 639, loss: 0.2978449761867523, mean loss: 0.3426166973611741
Epoch: 46, step: 640, loss: 0.36527007818222046, mean loss: 0.34261703514363623
Epoch: 46, step: 641, loss: 0.3666536211967468, mean loss: 0.3426173935455993
Epoch: 46, step: 642, loss: 0.3049588203430176, mean loss: 0.3426168320388493
Epoch: 46, step: 643, loss: 0.34098321199417114, mean loss: 0.3426168076811818
Epoch: 46, step: 644, loss: 0.36289840936660767, mean loss: 0.3426171100802288
Epoch: 46, step: 645, loss: 0.29705142974853516, mean loss: 0.3426164307052425
Epoch: 46, step: 646, loss: 0.30968835949897766, mean loss: 0.3426159397617467
Epoch: 46, step: 647, loss: 0.3684737980365753, mean loss: 0.34261632528563557
Epoch: 46, step: 648, loss: 0.321755975484848, mean loss: 0.3426160142759923
Epoch: 46, step: 649, loss: 0.32711920142173767, mean loss: 0.34261578323545716
Epoch: 46, step: 650, loss: 0.3274990916252136, mean loss: 0.34261555786547415
Epoch: 46, step: 651, loss: 0.352059006690979, mean loss: 0.3426156986527725
Epoch: 46, step: 652, loss: 0.2929673194885254, mean loss: 0.3426149584828311
Epoch: 46, step: 653, loss: 0.32203856110572815, mean loss: 0.34261465172953826
Epoch: 46, step: 654, loss: 0.3041088581085205, mean loss: 0.34261407769304963
Epoch: 46, step: 655, loss: 0.3473818898200989, mean loss: 0.3426141487695572
Epoch: 46, step: 656, loss: 0.34459128975868225, mean loss: 0.34261417824349155
Epoch: 46, step: 657, loss: 0.310631662607193, mean loss: 0.3426137014760184
Epoch: 46, step: 658, loss: 0.3128748834133148, mean loss: 0.342613258162242
Epoch: 46, step: 659, loss: 0.301291823387146, mean loss: 0.3426126421966649
Epoch: 46, step: 660, loss: 0.31493380665779114, mean loss: 0.34261222960315607
Epoch: 46, step: 661, loss: 0.31972768902778625, mean loss: 0.3426118884807076
Epoch: 46, step: 662, loss: 0.3644818067550659, mean loss: 0.34261221447409346
Epoch: 46, step: 663, loss: 0.3411445915699005, mean loss: 0.34261219259800674
Epoch: 46, step: 664, loss: 0.35251739621162415, mean loss: 0.3426123402407442
Epoch: 46, step: 665, loss: 0.36057379841804504, mean loss: 0.3426126079625832
Epoch: 46, step: 666, loss: 0.3572947382926941, mean loss: 0.34261282680162763
Epoch: 46, step: 667, loss: 0.34169453382492065, mean loss: 0.3426128131145565
Epoch: 46, step: 668, loss: 0.30704182386398315, mean loss: 0.34261228294018287
Epoch: 46, step: 669, loss: 0.3436776101589203, mean loss: 0.34261229881831234
Epoch: 46, step: 670, loss: 0.3372870981693268, mean loss: 0.34261221945024245
Epoch: 46, step: 671, loss: 0.3069940209388733, mean loss: 0.3426116885959663
Epoch: 46, step: 672, loss: 0.34261903166770935, mean loss: 0.3426116887054059
Epoch: 46, step: 673, loss: 0.35157090425491333, mean loss: 0.34261182222973674
Epoch: 46, step: 674, loss: 0.3229531943798065, mean loss: 0.3426115292502907
Epoch: 46, step: 675, loss: 0.34247732162475586, mean loss: 0.3426115272501771
Epoch: 46, step: 676, loss: 0.3414798378944397, mean loss: 0.3426115103847152
Epoch: 46, step: 677, loss: 0.35053786635398865, mean loss: 0.3426116285087051
Epoch: 46, step: 678, loss: 0.2970985472202301, mean loss: 0.342610950251678
Epoch: 46, step: 679, loss: 0.3365880846977234, mean loss: 0.3426108604974822
Epoch: 46, step: 680, loss: 0.3438502550125122, mean loss: 0.3426108789669631
Epoch: 46, step: 681, loss: 0.322813481092453, mean loss: 0.3426105839501557
Epoch: 46, step: 682, loss: 0.32764774560928345, mean loss: 0.3426103609802965
Epoch: 46, step: 683, loss: 0.33490899205207825, mean loss: 0.3426102462194792
Epoch: 46, step: 684, loss: 0.35277944803237915, mean loss: 0.34261039775208757
Epoch: 46, step: 685, loss: 0.32322758436203003, mean loss: 0.34261010893054994
Epoch: 46, step: 686, loss: 0.32029157876968384, mean loss: 0.34260977636911943
Epoch: 46, step: 687, loss: 0.35378003120422363, mean loss: 0.34260994281110946
Epoch: 46, step: 688, loss: 0.35775816440582275, mean loss: 0.34261016852329035
Epoch: 46, step: 689, loss: 0.2971988618373871, mean loss: 0.34260949189387346
Epoch: 46, step: 690, loss: 0.3518889546394348, mean loss: 0.3426096301560018
Epoch: 46, step: 691, loss: 0.3233562707901001, mean loss: 0.3426093432890943
Epoch: 46, step: 692, loss: 0.34188222885131836, mean loss: 0.3426093324555583
Epoch: 46, step: 693, loss: 0.32434114813804626, mean loss: 0.34260906027545285
Epoch: 46, step: 694, loss: 0.323762983083725, mean loss: 0.34260877948942814
Epoch: 46, step: 695, loss: 0.3425478935241699, mean loss: 0.3426087785823071
Epoch: 46, step: 696, loss: 0.30158719420433044, mean loss: 0.3426081674235881
Epoch: 46, step: 697, loss: 0.34993815422058105, mean loss: 0.34260827662752713
Epoch: 46, step: 698, loss: 0.3682541847229004, mean loss: 0.3426086587008566
Epoch: 46, step: 699, loss: 0.32810816168785095, mean loss: 0.34260844267533647
Epoch: 46, step: 700, loss: 0.3222249746322632, mean loss: 0.34260813901100806
Epoch: 46, step: 701, loss: 0.2748360335826874, mean loss: 0.3426071293857447
Epoch: 46, step: 702, loss: 0.37729695439338684, mean loss: 0.34260764616476075
Epoch: 46, step: 703, loss: 0.2930401563644409, mean loss: 0.34260690776215974
Epoch: 46, step: 704, loss: 0.34254446625709534, mean loss: 0.3426069068319879
Epoch: 46, step: 705, loss: 0.3096424341201782, mean loss: 0.3426064157777244
Epoch: 46, step: 706, loss: 0.3101319968700409, mean loss: 0.3426059320307385
Epoch: 46, step: 707, loss: 0.3489994406700134, mean loss: 0.3426060272686078
Epoch: 46, step: 708, loss: 0.340151309967041, mean loss: 0.34260599070362036
Epoch: 46, step: 709, loss: 0.3134513199329376, mean loss: 0.3426055564278321
Epoch: 46, step: 710, loss: 0.339935839176178, mean loss: 0.34260551666143224
Epoch: 46, step: 711, loss: 0.3098931312561035, mean loss: 0.3426050294059299
Epoch: 46, step: 712, loss: 0.3668108284473419, mean loss: 0.3426053899492822
Epoch: 46, step: 713, loss: 0.3216712474822998, mean loss: 0.34260507814162533
Epoch: 46, step: 714, loss: 0.35495173931121826, mean loss: 0.34260526203863256
Epoch: 46, step: 715, loss: 0.32549598813056946, mean loss: 0.34260500720881565
Epoch: 46, step: 716, loss: 0.34619447588920593, mean loss: 0.3426050606704662
Epoch: 46, step: 717, loss: 0.3334645926952362, mean loss: 0.34260492453409885
Epoch: 46, step: 718, loss: 0.33179500699043274, mean loss: 0.3426047635356695
Epoch: 46, step: 719, loss: 0.3089887797832489, mean loss: 0.34260426288060347
Epoch: 46, step: 720, loss: 0.3552822470664978, mean loss: 0.34260445169561854
Epoch: 46, step: 721, loss: 0.3869069814682007, mean loss: 0.34260511148964606
Epoch: 46, step: 722, loss: 0.3514530658721924, mean loss: 0.3426052432595596
Epoch: 46, step: 723, loss: 0.32303908467292786, mean loss: 0.34260495187100615
Epoch: 46, step: 724, loss: 0.34469708800315857, mean loss: 0.34260498302763
Epoch: 46, step: 725, loss: 0.3275130093097687, mean loss: 0.34260475827746295
Epoch: 46, step: 726, loss: 0.3330462574958801, mean loss: 0.34260461593407593
Epoch: 46, step: 727, loss: 0.3540876507759094, mean loss: 0.3426047869347139
Epoch: 46, step: 728, loss: 0.3182283341884613, mean loss: 0.3426044239359983
Epoch: 46, step: 729, loss: 0.35055556893348694, mean loss: 0.34260454233765714
Epoch: 46, step: 730, loss: 0.32737040519714355, mean loss: 0.34260431548727904
Epoch: 46, step: 731, loss: 0.3299693763256073, mean loss: 0.3426041273441621
Epoch: 46, step: 732, loss: 0.35914677381515503, mean loss: 0.3426043736721171
Epoch: 46, step: 733, loss: 0.32031166553497314, mean loss: 0.34260404172792375
Epoch: 46, step: 734, loss: 0.3033151626586914, mean loss: 0.3426034567150577
Epoch: 46, step: 735, loss: 0.35893484950065613, mean loss: 0.342603699886481
Epoch: 46, step: 736, loss: 0.324203759431839, mean loss: 0.3426034259188442
Epoch: 46, step: 737, loss: 0.31593385338783264, mean loss: 0.3426030288256586
Epoch: 46, step: 738, loss: 0.3722040355205536, mean loss: 0.34260346955949555
Epoch: 46, step: 739, loss: 0.34055593609809875, mean loss: 0.34260343907391605
Epoch: 46, step: 740, loss: 0.31946706771850586, mean loss: 0.3426030946032638
Epoch: 46, step: 741, loss: 0.3675457537174225, mean loss: 0.342603465961676
Epoch: 46, step: 742, loss: 0.34401923418045044, mean loss: 0.3426034870400064
Epoch: 46, step: 743, loss: 0.33437442779541016, mean loss: 0.3426033645254274
Epoch: 46, step: 744, loss: 0.3380809724330902, mean loss: 0.3426032971968667
Epoch: 46, step: 745, loss: 0.3558492064476013, mean loss: 0.3426034943966471
Epoch: 46, step: 746, loss: 0.3402838706970215, mean loss: 0.34260345986353463
Epoch: 46, step: 747, loss: 0.34366241097450256, mean loss: 0.34260347562830434
Epoch: 46, step: 748, loss: 0.3407936990261078, mean loss: 0.34260344868628
Epoch: 46, step: 749, loss: 0.3223120868206024, mean loss: 0.3426031466146174
Epoch: 46, step: 750, loss: 0.30073100328445435, mean loss: 0.34260252328535307
Epoch: 46, step: 751, loss: 0.32356739044189453, mean loss: 0.3426022399232469
Epoch: 46, step: 752, loss: 0.339398056268692, mean loss: 0.34260219222561744
Epoch: 46, step: 753, loss: 0.3697666823863983, mean loss: 0.3426025965914837
Epoch: 46, step: 754, loss: 0.3644821345806122, mean loss: 0.34260292228162476
Epoch: 46, step: 755, loss: 0.33357876539230347, mean loss: 0.3426027879535972
Epoch: 46, step: 756, loss: 0.2880710959434509, mean loss: 0.342601976240583
Epoch: 46, step: 757, loss: 0.33435916900634766, mean loss: 0.34260185354689665
Epoch: 46, step: 758, loss: 0.3355688154697418, mean loss: 0.34260174886210915
Epoch: 46, step: 759, loss: 0.35458609461784363, mean loss: 0.3426019272430593
Epoch: 46, step: 760, loss: 0.34066006541252136, mean loss: 0.34260189833985427
Epoch: 46, step: 761, loss: 0.29659023880958557, mean loss: 0.34260121349986483
Epoch: 46, step: 762, loss: 0.34810763597488403, mean loss: 0.3426012954565302
Epoch: 46, step: 763, loss: 0.3405192494392395, mean loss: 0.3426012644681689
Epoch: 46, step: 764, loss: 0.30639177560806274, mean loss: 0.34260072554827337
Epoch: 46, step: 765, loss: 0.3188093900680542, mean loss: 0.342600371457851
Epoch: 46, step: 766, loss: 0.3353283107280731, mean loss: 0.3426002632281665
Epoch: 46, step: 767, loss: 0.30217885971069336, mean loss: 0.34259966164756883
Epoch: 46, step: 768, loss: 0.32976892590522766, mean loss: 0.34259947069411023
Epoch: 46, step: 769, loss: 0.39752396941185, mean loss: 0.3426002880959425
Epoch: 46, step: 770, loss: 0.3364035189151764, mean loss: 0.34260019587525375
Epoch: 46, step: 771, loss: 0.38454654812812805, mean loss: 0.3426008201140813
Epoch: 46, step: 772, loss: 0.31046897172927856, mean loss: 0.3426003419402285
Epoch: 46, step: 773, loss: 0.3194032311439514, mean loss: 0.34259999673485336
Epoch: 46, step: 774, loss: 0.30612850189208984, mean loss: 0.3425994539961989
Epoch: 46, step: 775, loss: 0.33281564712524414, mean loss: 0.34259930840383473
Epoch: 46, step: 776, loss: 0.34755411744117737, mean loss: 0.3425993821350149
Epoch: 46, step: 777, loss: 0.390918493270874, mean loss: 0.3426001011480076
Epoch: 46, step: 778, loss: 0.3034643530845642, mean loss: 0.3425995187968021
Epoch: 46, step: 779, loss: 0.33431118726730347, mean loss: 0.3425993954658764
Epoch: 46, step: 780, loss: 0.3609464466571808, mean loss: 0.34259966846715895
Epoch: 46, step: 781, loss: 0.3167281746864319, mean loss: 0.3425992835090632
Epoch: 46, step: 782, loss: 0.3045922517776489, mean loss: 0.3425987179871424
Epoch: 46, step: 783, loss: 0.3240371346473694, mean loss: 0.3425984418059833
Epoch: 46, step: 784, loss: 0.32061654329299927, mean loss: 0.342598114738202
Epoch: 46, step: 785, loss: 0.3371608257293701, mean loss: 0.34259803383820187
Epoch: 46, step: 786, loss: 0.33753979206085205, mean loss: 0.34259795857906605
Epoch: 46, step: 787, loss: 0.35598909854888916, mean loss: 0.3425981578164042
Epoch: 46, step: 788, loss: 0.3279069662094116, mean loss: 0.3425979392397656
Epoch: 46, step: 789, loss: 0.2911244332790375, mean loss: 0.3425971734245194
Epoch: 46, step: 790, loss: 0.3495385944843292, mean loss: 0.34259727669642387
Epoch: 46, step: 791, loss: 0.30525243282318115, mean loss: 0.34259672110186495
Epoch: 46, step: 792, loss: 0.34568095207214355, mean loss: 0.34259676698655145
Epoch: 46, step: 793, loss: 0.3738638460636139, mean loss: 0.34259723214587007
Epoch: 46, step: 794, loss: 0.33941152691841125, mean loss: 0.34259718475294204
Epoch: 46, step: 795, loss: 0.3109357953071594, mean loss: 0.34259671374149536
Epoch: 46, step: 796, loss: 0.29848358035087585, mean loss: 0.3425960575011331
Epoch: 46, step: 797, loss: 0.33921149373054504, mean loss: 0.3425960071520841
Epoch: 46, step: 798, loss: 0.3331845700740814, mean loss: 0.34259586714885487
Epoch: 46, step: 799, loss: 0.30631935596466064, mean loss: 0.3425953275125466
Epoch: 46, step: 800, loss: 0.33264386653900146, mean loss: 0.34259517948040125
Epoch: 46, step: 801, loss: 0.351789653301239, mean loss: 0.34259531625001155
Epoch: 46, step: 802, loss: 0.3134615421295166, mean loss: 0.34259488288582574
Epoch: 46, step: 803, loss: 0.30287620425224304, mean loss: 0.34259429208022935
Epoch: 46, step: 804, loss: 0.3501099646091461, mean loss: 0.34259440387235074
Epoch: 46, step: 805, loss: 0.31184691190719604, mean loss: 0.3425939465245601
Epoch: 46, step: 806, loss: 0.32207241654396057, mean loss: 0.3425936412854594
Epoch: 46, step: 807, loss: 0.29774168133735657, mean loss: 0.34259297416325646
Epoch: 46, step: 808, loss: 0.33502107858657837, mean loss: 0.3425928615415443
Epoch: 46, step: 809, loss: 0.3401542007923126, mean loss: 0.3425928252703013
Epoch: 46, step: 810, loss: 0.3344910144805908, mean loss: 0.34259270477040116
Epoch: 46, step: 811, loss: 0.3001669645309448, mean loss: 0.34259207377301526
Epoch: 46, step: 812, loss: 0.35842856764793396, mean loss: 0.3425923093054435
Epoch: 46, step: 813, loss: 0.36890313029289246, mean loss: 0.3425927006142419
Epoch: 46, step: 814, loss: 0.33983543515205383, mean loss: 0.3425926596073045
Epoch: 46, step: 815, loss: 0.2828807234764099, mean loss: 0.34259177156542275
Epoch: 46, step: 816, loss: 0.3217547535896301, mean loss: 0.34259146167981763
Epoch: 46, step: 817, loss: 0.34242579340934753, mean loss: 0.3425914592160558
Epoch: 46, step: 818, loss: 0.2948248088359833, mean loss: 0.34259074885735114
Epoch: 46, step: 819, loss: 0.3518144190311432, mean loss: 0.3425908860245359
Epoch: 46, step: 820, loss: 0.30617526173591614, mean loss: 0.342590344488001
Epoch: 46, step: 821, loss: 0.3421623110771179, mean loss: 0.34259033812281336
Epoch: 46, step: 822, loss: 0.3250904679298401, mean loss: 0.3425900778900864
Epoch: 46, step: 823, loss: 0.35872259736061096, mean loss: 0.3425903177859862
Epoch: 46, step: 824, loss: 0.32587045431137085, mean loss: 0.34259006915978396
Epoch: 46, step: 825, loss: 0.30463001132011414, mean loss: 0.34258950469795735
Epoch: 46, step: 826, loss: 0.3401722013950348, mean loss: 0.3425894687534613
Epoch: 46, step: 827, loss: 0.345231831073761, mean loss: 0.34258950804392585
Epoch: 46, step: 828, loss: 0.3425385355949402, mean loss: 0.342589507286005
Epoch: 46, step: 829, loss: 0.3308362364768982, mean loss: 0.3425893325265735
Epoch: 46, step: 830, loss: 0.32282599806785583, mean loss: 0.34258903866984225
Epoch: 46, step: 831, loss: 0.32707223296165466, mean loss: 0.3425888079572559
Epoch: 46, step: 832, loss: 0.3462895154953003, mean loss: 0.3425888629806369
Epoch: 46, step: 833, loss: 0.3059021532535553, mean loss: 0.3425883175182424
Epoch: 46, step: 834, loss: 0.3178805112838745, mean loss: 0.34258795016508176
Epoch: 46, step: 835, loss: 0.33319786190986633, mean loss: 0.3425878105562763
Epoch: 46, step: 836, loss: 0.3453843891620636, mean loss: 0.34258785213428744
Epoch: 46, step: 837, loss: 0.3527746796607971, mean loss: 0.3425880035842522
Epoch: 46, step: 838, loss: 0.29935914278030396, mean loss: 0.3425873609001494
Epoch: 46, step: 839, loss: 0.3804517388343811, mean loss: 0.3425879238220383
Epoch: 46, step: 840, loss: 0.33288219571113586, mean loss: 0.34258777953112757
Epoch: 46, step: 841, loss: 0.3108418881893158, mean loss: 0.3425873075855482
Epoch: 46, step: 842, loss: 0.3230443298816681, mean loss: 0.3425870170570914
Epoch: 46, step: 843, loss: 0.33893728256225586, mean loss: 0.3425869628004687
Epoch: 46, step: 844, loss: 0.3121008276939392, mean loss: 0.3425865096030805
Epoch: 46, step: 845, loss: 0.3288086950778961, mean loss: 0.3425863047894262
Epoch: 46, step: 846, loss: 0.3285868465900421, mean loss: 0.3425860966840286
Epoch: 46, step: 847, loss: 0.32081812620162964, mean loss: 0.34258577310259086
Epoch: 46, step: 848, loss: 0.315828800201416, mean loss: 0.34258537536541694
Epoch: 46, step: 849, loss: 0.3497176766395569, mean loss: 0.3425854813841058
Epoch: 46, step: 850, loss: 0.3296806812286377, mean loss: 0.34258528956247586
Epoch: 46, step: 851, loss: 0.31283941864967346, mean loss: 0.3425848474156343
Epoch: 46, step: 852, loss: 0.3371742069721222, mean loss: 0.3425847669923032
Epoch: 46, step: 853, loss: 0.34105929732322693, mean loss: 0.3425847443181799
Epoch: 46, step: 854, loss: 0.3192927837371826, mean loss: 0.34258439811861424
Epoch: 46, step: 855, loss: 0.308474600315094, mean loss: 0.3425838911358883
Epoch: 46, step: 856, loss: 0.31816017627716064, mean loss: 0.3425835281253079
Epoch: 46, step: 857, loss: 0.38449281454086304, mean loss: 0.34258415101532924
Epoch: 46, step: 858, loss: 0.33831503987312317, mean loss: 0.34258408756525804
Epoch: 46, step: 859, loss: 0.3733668327331543, mean loss: 0.3425845450699422
Epoch: 46, step: 860, loss: 0.33290672302246094, mean loss: 0.3425844012366651
Epoch: 46, step: 861, loss: 0.3233944773674011, mean loss: 0.3425841160373091
Epoch: 46, step: 862, loss: 0.3149619996547699, mean loss: 0.34258370552537687
Epoch: 46, step: 863, loss: 0.3465661108493805, mean loss: 0.34258376470985735
Epoch: 46, step: 864, loss: 0.33627933263778687, mean loss: 0.34258367101798987
Epoch: 46, step: 865, loss: 0.3219808340072632, mean loss: 0.3425833648382156
Epoch: 46, step: 866, loss: 0.31726783514022827, mean loss: 0.34258298862847436
Epoch: 46, step: 867, loss: 0.3192848563194275, mean loss: 0.3425826424040746
Epoch: 46, step: 868, loss: 0.3516625463962555, mean loss: 0.34258277733495884
Epoch: 46, step: 869, loss: 0.29595261812210083, mean loss: 0.3425820844030598
Epoch: 46, step: 870, loss: 0.34341228008270264, mean loss: 0.34258209673972195
Epoch: 46, step: 871, loss: 0.3041922450065613, mean loss: 0.34258152627711297
Epoch: 46, step: 872, loss: 0.32584068179130554, mean loss: 0.3425812775164775
Epoch: 46, step: 873, loss: 0.3264806270599365, mean loss: 0.3425810382723624
Epoch: 46, step: 874, loss: 0.3236407935619354, mean loss: 0.3425807568380958
Epoch: 46, step: 875, loss: 0.3134874999523163, mean loss: 0.3425803245460173
Epoch: 46, step: 876, loss: 0.3122362792491913, mean loss: 0.342579873675372
Epoch: 46, step: 877, loss: 0.3776368200778961, mean loss: 0.3425803945654853
Epoch: 46, step: 878, loss: 0.3606402575969696, mean loss: 0.3425806629021572
Epoch: 46, step: 879, loss: 0.31955116987228394, mean loss: 0.3425803207309188
Epoch: 46, step: 880, loss: 0.3752214014530182, mean loss: 0.342580805703517
Epoch: 46, step: 881, loss: 0.3766734302043915, mean loss: 0.34258131223524524
Epoch: 46, step: 882, loss: 0.3646162748336792, mean loss: 0.3425816396151998
Epoch: 46, step: 883, loss: 0.3088906407356262, mean loss: 0.34258113906550464
Epoch: 46, step: 884, loss: 0.3145332336425781, mean loss: 0.3425807223618629
Epoch: 46, step: 885, loss: 0.3054674565792084, mean loss: 0.34258017098367566
Epoch: 46, step: 886, loss: 0.3144419193267822, mean loss: 0.3425797529501944
Epoch: 46, step: 887, loss: 0.3322433829307556, mean loss: 0.34257959939109617
Epoch: 46, step: 888, loss: 0.3574616014957428, mean loss: 0.3425798204776932
Epoch: 46, step: 889, loss: 0.3447478413581848, mean loss: 0.3425798526852708
Epoch: 46, step: 890, loss: 0.3681698739528656, mean loss: 0.3425802328385987
Epoch: 46, step: 891, loss: 0.3305167555809021, mean loss: 0.3425800536319129
Epoch: 46, step: 892, loss: 0.32478874921798706, mean loss: 0.34257978934050937
Epoch: 46, step: 893, loss: 0.3218535780906677, mean loss: 0.34257948145537837
Epoch: 46, step: 894, loss: 0.312529593706131, mean loss: 0.3425790350748952
Epoch: 46, step: 895, loss: 0.36111992597579956, mean loss: 0.34257931048919854
Epoch: 46, step: 896, loss: 0.35418900847435, mean loss: 0.34257948294204366
Epoch: 46, step: 897, loss: 0.324990838766098, mean loss: 0.3425792216805812
Epoch: 46, step: 898, loss: 0.31453776359558105, mean loss: 0.34257880515936134
Epoch: 46, step: 899, loss: 0.3374422788619995, mean loss: 0.3425787288637417
Epoch: 46, step: 900, loss: 0.33532199263572693, mean loss: 0.3425786210770914
Epoch: 46, step: 901, loss: 0.3165570795536041, mean loss: 0.3425782345764598
Epoch: 46, step: 902, loss: 0.30320361256599426, mean loss: 0.34257764974983734
Epoch: 46, step: 903, loss: 0.3256329298019409, mean loss: 0.3425773980756461
Epoch: 46, step: 904, loss: 0.35370975732803345, mean loss: 0.34257756341835505
Epoch: 46, step: 905, loss: 0.34067150950431824, mean loss: 0.34257753510922223
Epoch: 46, step: 906, loss: 0.32274749875068665, mean loss: 0.3425772405935258
Epoch: 46, step: 907, loss: 0.3638230562210083, mean loss: 0.34257755613168933
Epoch: 46, step: 908, loss: 0.3339273929595947, mean loss: 0.3425774276632835
Epoch: 46, step: 909, loss: 0.3366503119468689, mean loss: 0.342577339637684
Epoch: 46, step: 910, loss: 0.3217267096042633, mean loss: 0.3425770299825264
Epoch: 46, step: 911, loss: 0.35110893845558167, mean loss: 0.34257715668902033
Epoch: 46, step: 912, loss: 0.3258894681930542, mean loss: 0.3425769088655578
Epoch: 46, step: 913, loss: 0.37324923276901245, mean loss: 0.3425773643635516
Epoch: 46, step: 914, loss: 0.29766130447387695, mean loss: 0.34257669734949003
Epoch: 46, step: 915, loss: 0.30417904257774353, mean loss: 0.34257612714374647
Epoch: 46, step: 916, loss: 0.3497638404369354, mean loss: 0.34257623387981057
Epoch: 46, step: 917, loss: 0.31289610266685486, mean loss: 0.3425757931425112
Epoch: 46, step: 918, loss: 0.3554270565509796, mean loss: 0.342575983975462
Epoch: 46, step: 919, loss: 0.347832590341568, mean loss: 0.3425760620315081
Epoch: 46, step: 920, loss: 0.33954373002052307, mean loss: 0.34257601700467594
Epoch: 46, step: 921, loss: 0.31286725401878357, mean loss: 0.3425755758684097
Epoch: 46, step: 922, loss: 0.3108866214752197, mean loss: 0.34257510533587826
Epoch: 46, step: 923, loss: 0.3345847427845001, mean loss: 0.3425749866929705
Epoch: 46, step: 924, loss: 0.3567410409450531, mean loss: 0.3425751970309748
Epoch: 46, step: 925, loss: 0.3430478572845459, mean loss: 0.34257520404894437
Epoch: 46, step: 926, loss: 0.3122098445892334, mean loss: 0.3425747531965523
Epoch: 46, step: 927, loss: 0.3551943898200989, mean loss: 0.34257494056495447
Epoch: 46, step: 928, loss: 0.3331786096096039, mean loss: 0.34257480105623245
Epoch: 46, step: 929, loss: 0.3451879024505615, mean loss: 0.34257483985276116
Epoch: 46, step: 930, loss: 0.36291196942329407, mean loss: 0.34257514179218024
Epoch: 46, step: 931, loss: 0.3354139029979706, mean loss: 0.34257503547293927
Epoch: 46, step: 932, loss: 0.32287758588790894, mean loss: 0.3425747430393454
Epoch: 46, step: 933, loss: 0.34694740176200867, mean loss: 0.3425748079560401
Epoch: 46, step: 934, loss: 0.3300071954727173, mean loss: 0.34257462137945077
Epoch: 46, step: 935, loss: 0.3244580924510956, mean loss: 0.3425743524286056
Epoch: 46, step: 936, loss: 0.30817344784736633, mean loss: 0.342573841733922
Epoch: 46, step: 937, loss: 0.3338930010795593, mean loss: 0.3425737128654108
Epoch: 46, step: 938, loss: 0.362933486700058, mean loss: 0.3425740151051245
Epoch: 46, step: 939, loss: 0.3144364356994629, mean loss: 0.34257359741051896
Epoch: 46, step: 940, loss: 0.33403322100639343, mean loss: 0.3425734706328688
Epoch: 46, step: 941, loss: 0.31828710436820984, mean loss: 0.3425731101191636
Epoch: 46, step: 942, loss: 0.31107017397880554, mean loss: 0.3425726424875912
Epoch: 46, step: 943, loss: 0.3391038477420807, mean loss: 0.3425725909973474
Epoch: 46, step: 944, loss: 0.3175072968006134, mean loss: 0.34257221893758405
Epoch: 46, step: 945, loss: 0.3224388360977173, mean loss: 0.3425719200896868
Epoch: 46, step: 946, loss: 0.3225460350513458, mean loss: 0.3425716228418348
Epoch: 46, step: 947, loss: 0.3597033619880676, mean loss: 0.3425718771275788
Epoch: 46, step: 948, loss: 0.329774409532547, mean loss: 0.34257168717807984
Epoch: 46, step: 949, loss: 0.3591032326221466, mean loss: 0.3425719325478878
Epoch: 46, step: 950, loss: 0.3006785213947296, mean loss: 0.3425713107532881
Epoch: 46, step: 951, loss: 0.3429063558578491, mean loss: 0.3425713157260544
Epoch: 46, step: 952, loss: 0.3200354278087616, mean loss: 0.3425709812515614
Epoch: 46, step: 953, loss: 0.3503003716468811, mean loss: 0.34257109596838875
Epoch: 46, step: 954, loss: 0.3068205416202545, mean loss: 0.3425705653794167
Epoch: 46, step: 955, loss: 0.3066931664943695, mean loss: 0.3425700329157942
Epoch: 46, step: 956, loss: 0.35797861218452454, mean loss: 0.3425702615941942
Epoch: 46, step: 957, loss: 0.27958884835243225, mean loss: 0.34256932690224023
Epoch: 46, step: 958, loss: 0.3384765088558197, mean loss: 0.3425692661626168
Epoch: 46, step: 959, loss: 0.3008246123790741, mean loss: 0.3425686466586725
Epoch: 46, step: 960, loss: 0.32631587982177734, mean loss: 0.34256840546602074
Epoch: 46, step: 961, loss: 0.3220881223678589, mean loss: 0.3425681015411239
Epoch: 46, step: 962, loss: 0.3754497766494751, mean loss: 0.34256858949392055
Epoch: 46, step: 963, loss: 0.33339983224868774, mean loss: 0.3425684534347224
Epoch: 46, step: 964, loss: 0.3699829578399658, mean loss: 0.3425688602445045
Epoch: 46, step: 965, loss: 0.3161836266517639, mean loss: 0.34256846871410546
Epoch: 46, step: 966, loss: 0.34708160161972046, mean loss: 0.34256853568347684
Epoch: 46, step: 967, loss: 0.3417648673057556, mean loss: 0.3425685237581982
Epoch: 46, step: 968, loss: 0.3185567557811737, mean loss: 0.34256816746350915
Epoch: 46, step: 969, loss: 0.31032219529151917, mean loss: 0.3425676889940286
Epoch: 46, step: 970, loss: 0.33429044485092163, mean loss: 0.34256756617714096
Epoch: 46, step: 971, loss: 0.3208591341972351, mean loss: 0.34256724407446454
Epoch: 46, step: 972, loss: 0.33117806911468506, mean loss: 0.3425670750880859
Epoch: 46, step: 973, loss: 0.3444975018501282, mean loss: 0.3425671037302825
Epoch: 46, step: 974, loss: 0.3224615752696991, mean loss: 0.3425668054242474
Epoch: 46, step: 975, loss: 0.3089316487312317, mean loss: 0.34256630638631425
Epoch: 46, step: 976, loss: 0.32307514548301697, mean loss: 0.34256601720424124
Epoch: 46, step: 977, loss: 0.33940422534942627, mean loss: 0.3425659702947748
Epoch: 46, step: 978, loss: 0.32191768288612366, mean loss: 0.34256566395399757
Epoch: 46, step: 979, loss: 0.32772666215896606, mean loss: 0.34256544380383147
Epoch: 46, step: 980, loss: 0.2981099486351013, mean loss: 0.3425647842756782
Epoch: 46, step: 981, loss: 0.3664953410625458, mean loss: 0.3425651392968453
Epoch: 46, step: 982, loss: 0.37035736441612244, mean loss: 0.34256555160157803
Epoch: 46, step: 983, loss: 0.3316726088523865, mean loss: 0.34256539000439745
Epoch: 46, step: 984, loss: 0.3467390239238739, mean loss: 0.3425654519194818
Epoch: 46, step: 985, loss: 0.3819384276866913, mean loss: 0.3425660360016026
Epoch: 46, step: 986, loss: 0.33709844946861267, mean loss: 0.34256595489337793
Epoch: 46, step: 987, loss: 0.3356736898422241, mean loss: 0.34256585265245565
Epoch: 46, step: 988, loss: 0.29628121852874756, mean loss: 0.34256516606924287
Epoch: 46, step: 989, loss: 0.35759925842285156, mean loss: 0.3425653890806701
Epoch: 46, step: 990, loss: 0.299182653427124, mean loss: 0.3425647455631198
Epoch: 46, step: 991, loss: 0.3531501889228821, mean loss: 0.3425649025799015
Epoch: 46, step: 992, loss: 0.3625740110874176, mean loss: 0.34256519937608804
Epoch: 46, step: 993, loss: 0.33948642015457153, mean loss: 0.34256515370906704
Epoch: 46, step: 994, loss: 0.334725946187973, mean loss: 0.3425650374331282
Epoch: 46, step: 995, loss: 0.33279526233673096, mean loss: 0.3425648925239752
Epoch: 46, step: 996, loss: 0.29333963990211487, mean loss: 0.3425641624064655
Epoch: 46, step: 997, loss: 0.3456919491291046, mean loss: 0.34256420879765415
Epoch: 46, step: 998, loss: 0.299469918012619, mean loss: 0.3425635696345973
Epoch: 46, step: 999, loss: 0.34047043323516846, mean loss: 0.3425635385902155
Epoch: 46, step: 1000, loss: 0.32047563791275024, mean loss: 0.342563210998066
Epoch: 46, step: 1001, loss: 0.3070591688156128, mean loss: 0.3425626844349868
Epoch: 46, step: 1002, loss: 0.3116387128829956, mean loss: 0.3425622258060762
Epoch: 46, step: 1003, loss: 0.3119044005870819, mean loss: 0.3425617711310863
Epoch: 46, step: 1004, loss: 0.30455484986305237, mean loss: 0.3425612074727009
Epoch: 46, step: 1005, loss: 0.30275338888168335, mean loss: 0.3425606171150175
Epoch: 46, step: 1006, loss: 0.32595446705818176, mean loss: 0.3425603708462382
Epoch: 46, step: 1007, loss: 0.3545863926410675, mean loss: 0.34256054918918805
Epoch: 46, step: 1008, loss: 0.3411882221698761, mean loss: 0.3425605288382172
Epoch: 46, step: 1009, loss: 0.36159592866897583, mean loss: 0.34256081112014963
Epoch: 46, step: 1010, loss: 0.3066692054271698, mean loss: 0.34256027888013046
Epoch: 46, step: 1011, loss: 0.3715776801109314, mean loss: 0.3425607091755399
Epoch: 46, step: 1012, loss: 0.35000574588775635, mean loss: 0.34256081957541995
Epoch: 46, step: 1013, loss: 0.3149428963661194, mean loss: 0.3425604100448406
Epoch: 46, step: 1014, loss: 0.30243074893951416, mean loss: 0.3425598149935927
Epoch: 46, step: 1015, loss: 0.33262360095977783, mean loss: 0.34255966765945817
Epoch: 46, step: 1016, loss: 0.37481066584587097, mean loss: 0.3425601458700153
Epoch: 46, step: 1017, loss: 0.3192666471004486, mean loss: 0.34255980048436885
Epoch: 46, step: 1018, loss: 0.30841806530952454, mean loss: 0.34255929425340087
Epoch: 46, step: 1019, loss: 0.3220796585083008, mean loss: 0.34255899059946954
Epoch: 46, step: 1020, loss: 0.3247523307800293, mean loss: 0.3425587265819765
Epoch: 46, step: 1021, loss: 0.33517706394195557, mean loss: 0.342558617136455
Epoch: 46, step: 1022, loss: 0.3611118197441101, mean loss: 0.34255889221470326
Epoch: 46, step: 1023, loss: 0.29213178157806396, mean loss: 0.34255814457043454
Epoch: 46, step: 1024, loss: 0.308345764875412, mean loss: 0.342557637337122
Epoch: 46, step: 1025, loss: 0.3566969037055969, mean loss: 0.34255784696301333
Epoch: 46, step: 1026, loss: 0.3052605390548706, mean loss: 0.34255729400889984
Epoch: 46, step: 1027, loss: 0.30884096026420593, mean loss: 0.3425567941522055
Epoch: 46, step: 1028, loss: 0.31999894976615906, mean loss: 0.34255645972906074
Epoch: 46, step: 1029, loss: 0.32680797576904297, mean loss: 0.3425562262590818
Epoch: 46, step: 1030, loss: 0.3137851059436798, mean loss: 0.3425557997359135
Epoch: 46, step: 1031, loss: 0.3411168158054352, mean loss: 0.34255577840372764
Epoch: 46, step: 1032, loss: 0.31840798258781433, mean loss: 0.34255542043056225
Epoch: 46, step: 1033, loss: 0.34015199542045593, mean loss: 0.34255538480209696
Epoch: 46, step: 1034, loss: 0.33286482095718384, mean loss: 0.3425552411509334
Epoch: 46, step: 1035, loss: 0.3451523184776306, mean loss: 0.3425552796489667
Epoch: 46, step: 1036, loss: 0.31575071811676025, mean loss: 0.34255488231478054
Epoch: 46, step: 1037, loss: 0.44255903363227844, mean loss: 0.3425563646922867
Epoch: 46, step: 1038, loss: 0.3046245872974396, mean loss: 0.34255580243182693
Epoch: 46, step: 1039, loss: 0.3237155079841614, mean loss: 0.3425555231674126
Epoch: 46, step: 1040, loss: 0.3221794664859772, mean loss: 0.3425552211433011
Epoch: 46, step: 1041, loss: 0.325575590133667, mean loss: 0.34255496946644154
Epoch: 46, step: 1042, loss: 0.32402676343917847, mean loss: 0.3425546948402387
Epoch: 46, step: 1043, loss: 0.304429829120636, mean loss: 0.3425541297595231
Epoch: 46, step: 1044, loss: 0.34006261825561523, mean loss: 0.3425540928312819
Epoch: 46, step: 1045, loss: 0.3239597976207733, mean loss: 0.34255381723775574
Epoch: 46, step: 1046, loss: 0.34663069248199463, mean loss: 0.3425538776618675
Epoch: 46, step: 1047, loss: 0.30077502131462097, mean loss: 0.34255325845899304
Epoch: 46, step: 1048, loss: 0.32141533493995667, mean loss: 0.34255294517925866
Epoch: 46, step: 1049, loss: 0.3356432318687439, mean loss: 0.3425528427736904
Epoch: 46, step: 1050, loss: 0.30977386236190796, mean loss: 0.3425523569792419
Epoch: 46, step: 1051, loss: 0.3050033152103424, mean loss: 0.3425518004992821
Epoch: 46, step: 1052, loss: 0.3258656859397888, mean loss: 0.3425515532133245
Epoch: 46, step: 1053, loss: 0.3599996864795685, mean loss: 0.342551811788464
Epoch: 46, step: 1054, loss: 0.3093636929988861, mean loss: 0.3425513199596167
Epoch: 46, step: 1055, loss: 0.3309158980846405, mean loss: 0.34255114753190663
Epoch: 46, step: 1056, loss: 0.32671353220939636, mean loss: 0.34255091283450556
Epoch: 46, step: 1057, loss: 0.31383633613586426, mean loss: 0.34255048731989873
Epoch: 46, step: 1058, loss: 0.3551163077354431, mean loss: 0.34255067352709784
Epoch: 46, step: 1059, loss: 0.32570531964302063, mean loss: 0.34255042390713036
Epoch: 46, step: 1060, loss: 0.355223149061203, mean loss: 0.3425506116929369
Epoch: 46, step: 1061, loss: 0.32054466009140015, mean loss: 0.3425502856112073
Epoch: 46, step: 1062, loss: 0.35366290807724, mean loss: 0.34255045027436415
Epoch: 46, step: 1063, loss: 0.3777833878993988, mean loss: 0.3425509723366215
Epoch: 46, step: 1064, loss: 0.3190474808216095, mean loss: 0.3425506240799943
Epoch: 46, step: 1065, loss: 0.30233022570610046, mean loss: 0.3425500281339523
Epoch: 46, step: 1066, loss: 0.3544321358203888, mean loss: 0.34255020418865123
Epoch: 46, step: 1067, loss: 0.32837599515914917, mean loss: 0.3425499941754789
Epoch: 46, step: 1068, loss: 0.35911598801612854, mean loss: 0.3425502396230637
Epoch: 46, step: 1069, loss: 0.31598344445228577, mean loss: 0.3425498460059248
Epoch: 46, step: 1070, loss: 0.3151654005050659, mean loss: 0.34254944028038214
Epoch: 46, step: 1071, loss: 0.30810442566871643, mean loss: 0.3425489299536278
Epoch: 46, step: 1072, loss: 0.3360459804534912, mean loss: 0.34254883360935323
Epoch: 46, step: 1073, loss: 0.31811651587486267, mean loss: 0.34254847163836544
Epoch: 46, step: 1074, loss: 0.31206509470939636, mean loss: 0.34254802002609075
Epoch: 46, step: 1075, loss: 0.3178406059741974, mean loss: 0.342547653990327
Epoch: 46, step: 1076, loss: 0.32287684082984924, mean loss: 0.34254736257519003
Epoch: 46, step: 1077, loss: 0.3383026719093323, mean loss: 0.34254729969274705
Epoch: 46, step: 1078, loss: 0.37748801708221436, mean loss: 0.34254781730999945
Epoch: 46, step: 1079, loss: 0.3327818214893341, mean loss: 0.3425476726371531
Epoch: 46, step: 1080, loss: 0.32857465744018555, mean loss: 0.3425474656448533
Epoch: 46, step: 1081, loss: 0.3272400498390198, mean loss: 0.34254723888847893
Epoch: 46, step: 1082, loss: 0.3146785497665405, mean loss: 0.34254682606182213
Epoch: 46, step: 1083, loss: 0.31314340233802795, mean loss: 0.342546390507166
Epoch: 46, step: 1084, loss: 0.32324138283729553, mean loss: 0.34254610454518064
Epoch: 46, step: 1085, loss: 0.3647514283657074, mean loss: 0.3425464334642122
Epoch: 46, step: 1086, loss: 0.3216308057308197, mean loss: 0.34254612365354825
Epoch: 46, step: 1087, loss: 0.34149789810180664, mean loss: 0.34254610812704106
Epoch: 46, step: 1088, loss: 0.33676445484161377, mean loss: 0.34254602248941146
Epoch: 46, step: 1089, loss: 0.3454433083534241, mean loss: 0.3425460654032644
Epoch: 46, step: 1090, loss: 0.3084318935871124, mean loss: 0.34254556012041143
Epoch: 46, step: 1091, loss: 0.3213379383087158, mean loss: 0.34254524600787795
Epoch: 46, step: 1092, loss: 0.33351999521255493, mean loss: 0.3425451123341247
Epoch: 46, step: 1093, loss: 0.3172859847545624, mean loss: 0.3425447382245898
Epoch: 46, step: 1094, loss: 0.31434008479118347, mean loss: 0.3425443204954553
Epoch: 46, step: 1095, loss: 0.3414229452610016, mean loss: 0.34254430388740975
Epoch: 46, step: 1096, loss: 0.2976020574569702, mean loss: 0.3425436382834283
Epoch: 46, step: 1097, loss: 0.33409154415130615, mean loss: 0.34254351310801684
Epoch: 46, step: 1098, loss: 0.3531101942062378, mean loss: 0.34254366959811794
Epoch: 46, step: 1099, loss: 0.3127025067806244, mean loss: 0.34254322766394907
Epoch: 46, step: 1100, loss: 0.32983317971229553, mean loss: 0.3425430394366562
Epoch: 46, step: 1101, loss: 0.3699644207954407, mean loss: 0.3425434455229246
Epoch: 46, step: 1102, loss: 0.3310409486293793, mean loss: 0.3425432751836989
Epoch: 46, step: 1103, loss: 0.3212299048900604, mean loss: 0.3425429595609899
Epoch: 46, step: 1104, loss: 0.3178313076496124, mean loss: 0.34254259361966233
Epoch: 46, step: 1105, loss: 0.32532086968421936, mean loss: 0.34254233859635513
Epoch: 46, step: 1106, loss: 0.320492684841156, mean loss: 0.3425420120847715
Epoch: 46, step: 1107, loss: 0.320717453956604, mean loss: 0.34254168891119263
Epoch: 46, step: 1108, loss: 0.32454565167427063, mean loss: 0.34254142243351154
Epoch: 46, step: 1109, loss: 0.3377019464969635, mean loss: 0.3425413507736671
Epoch: 46, step: 1110, loss: 0.3547835350036621, mean loss: 0.34254153204536664
Epoch: 46, step: 1111, loss: 0.30243119597435, mean loss: 0.3425409381349178
Epoch: 46, step: 1112, loss: 0.3529964089393616, mean loss: 0.3425410929459222
Epoch: 46, step: 1113, loss: 0.31980666518211365, mean loss: 0.3425407563290878
Epoch: 46, step: 1114, loss: 0.3433872163295746, mean loss: 0.34254076886199475
Epoch: 46, step: 1115, loss: 0.38040411472320557, mean loss: 0.34254132946824084
Epoch: 46, step: 1116, loss: 0.3630102276802063, mean loss: 0.34254163252709713
Epoch: 46, step: 1117, loss: 0.3501652777194977, mean loss: 0.342541745399757
Epoch: 46, step: 1118, loss: 0.3446292579174042, mean loss: 0.3425417763061798
Epoch: 46, step: 1119, loss: 0.3413064479827881, mean loss: 0.34254175801694137
Epoch: 46, step: 1120, loss: 0.31291839480400085, mean loss: 0.3425413194446827
Epoch: 46, step: 1121, loss: 0.2962160110473633, mean loss: 0.34254063361120035
Epoch: 46, step: 1122, loss: 0.30394914746284485, mean loss: 0.34254006228329315
Epoch: 46, step: 1123, loss: 0.3377271592617035, mean loss: 0.34253999103169397
Epoch: 46, step: 1124, loss: 0.2978458106517792, mean loss: 0.34253932937600134
Epoch: 46, step: 1125, loss: 0.327385812997818, mean loss: 0.34253910504563306
Epoch: 46, step: 1126, loss: 0.3729737401008606, mean loss: 0.342539555588705
Epoch: 46, step: 1127, loss: 0.30408039689064026, mean loss: 0.3425389862619834
Epoch: 46, step: 1128, loss: 0.3221718966960907, mean loss: 0.3425386847640549
Epoch: 46, step: 1129, loss: 0.3339875638484955, mean loss: 0.3425385581820477
Epoch: 46, step: 1130, loss: 0.3718997836112976, mean loss: 0.34253899280902467
Epoch: 46, step: 1131, loss: 0.3276180922985077, mean loss: 0.34253877194188465
Epoch: 46, step: 1132, loss: 0.3179847300052643, mean loss: 0.3425384084852194
Epoch: 46, step: 1133, loss: 0.29841673374176025, mean loss: 0.3425377553919552
Epoch: 46, step: 1134, loss: 0.33816495537757874, mean loss: 0.3425376906663078
Epoch: 46, step: 1135, loss: 0.37997737526893616, mean loss: 0.3425382448357069
Epoch: 46, step: 1136, loss: 0.323611855506897, mean loss: 0.3425379646979154
Epoch: 46, step: 1137, loss: 0.31327956914901733, mean loss: 0.3425375316379772
Epoch: 46, step: 1138, loss: 0.32462260127067566, mean loss: 0.342537266479083
Epoch: 46, step: 1139, loss: 0.3321356475353241, mean loss: 0.342537112526994
Epoch: 46, step: 1140, loss: 0.3390097916126251, mean loss: 0.3425370603206606
Epoch: 46, step: 1141, loss: 0.31699860095977783, mean loss: 0.34253668234269297
Epoch: 46, step: 1142, loss: 0.3515951633453369, mean loss: 0.342536816409338
Epoch: 46, step: 1143, loss: 0.31071215867996216, mean loss: 0.342536345407418
Epoch: 46, step: 1144, loss: 0.3528898060321808, mean loss: 0.3425364986353868
Epoch: 46, step: 1145, loss: 0.3148917257785797, mean loss: 0.34253608950747716
Epoch: 46, step: 1146, loss: 0.3560504913330078, mean loss: 0.342536289510464
Epoch: 46, step: 1147, loss: 0.3316250443458557, mean loss: 0.34253612803462835
Epoch: 46, step: 1148, loss: 0.33631306886672974, mean loss: 0.342536035940757
Epoch: 46, step: 1149, loss: 0.33523643016815186, mean loss: 0.3425359279168754
Epoch: 46, step: 1150, loss: 0.32474687695503235, mean loss: 0.3425356646678786
Epoch: 46, step: 1151, loss: 0.31679248809814453, mean loss: 0.3425352837164081
Epoch: 46, step: 1152, loss: 0.31975966691970825, mean loss: 0.3425349466843292
Epoch: 46, step: 1153, loss: 0.3106248378753662, mean loss: 0.34253447448762603
Epoch: 46, step: 1154, loss: 0.3565654754638672, mean loss: 0.34253468211131055
Epoch: 46, step: 1155, loss: 0.3544994592666626, mean loss: 0.342534859157436
Epoch: 46, step: 1156, loss: 0.35549411177635193, mean loss: 0.3425350509162531
Epoch: 46, step: 1157, loss: 0.36067065596580505, mean loss: 0.3425353192658883
Epoch: 46, step: 1158, loss: 0.33862489461898804, mean loss: 0.342535261404819
Epoch: 46, step: 1159, loss: 0.3422102630138397, mean loss: 0.3425352565960123
Epoch: 46, step: 1160, loss: 0.3395763635635376, mean loss: 0.34253521281569077
Epoch: 46, step: 1161, loss: 0.2978077232837677, mean loss: 0.342534551029381
Epoch: 46, step: 1162, loss: 0.3793700933456421, mean loss: 0.3425350960386626
Epoch: 46, step: 1163, loss: 0.35361453890800476, mean loss: 0.3425352599648458
Epoch: 46, step: 1164, loss: 0.31955021619796753, mean loss: 0.3425349198940685
Epoch: 46, step: 1165, loss: 0.28408950567245483, mean loss: 0.3425340551890201
Epoch: 46, step: 1166, loss: 0.3486565053462982, mean loss: 0.34253414576986896
Epoch: 46, step: 1167, loss: 0.28491365909576416, mean loss: 0.3425332932949211
Epoch: 46, step: 1168, loss: 0.32980433106422424, mean loss: 0.3425331049771629
Epoch: 46, step: 1169, loss: 0.32452088594436646, mean loss: 0.3425328385005668
Epoch: 46, step: 1170, loss: 0.3297194838523865, mean loss: 0.34253264893987967
Epoch: 46, step: 1171, loss: 0.29863667488098145, mean loss: 0.34253199955272573
Epoch: 46, step: 1172, loss: 0.3449070155620575, mean loss: 0.3425320346876579
Epoch: 46, step: 1173, loss: 0.29281744360923767, mean loss: 0.3425312992429542
Epoch: 46, step: 1174, loss: 0.35081037878990173, mean loss: 0.34253142171635687
Epoch: 46, step: 1175, loss: 0.31802111864089966, mean loss: 0.342531059137909
Epoch: 46, step: 1176, loss: 0.3252754509449005, mean loss: 0.34253080388120877
Epoch: 46, step: 1177, loss: 0.31894993782043457, mean loss: 0.34253045506214924
Epoch: 46, step: 1178, loss: 0.3096678555011749, mean loss: 0.3425299689505926
Epoch: 46, step: 1179, loss: 0.32351091504096985, mean loss: 0.34252968762028807
Epoch: 46, step: 1180, loss: 0.33693522214889526, mean loss: 0.34252960486804385
Epoch: 46, step: 1181, loss: 0.31530821323394775, mean loss: 0.3425292022204736
Epoch: 46, step: 1182, loss: 0.3002435266971588, mean loss: 0.34252857675749604
Epoch: 46, step: 1183, loss: 0.3321980834007263, mean loss: 0.3425284239576298
Epoch: 46, step: 1184, loss: 0.32805147767066956, mean loss: 0.3425282098301277
Epoch: 46, step: 1185, loss: 0.30915936827659607, mean loss: 0.3425277162812214
Epoch: 46, step: 1186, loss: 0.3292200267314911, mean loss: 0.34252751945393667
Epoch: 46, step: 1187, loss: 0.29648494720458984, mean loss: 0.3425268384716813
Epoch: 46, step: 1188, loss: 0.3134623169898987, mean loss: 0.3425264086058052
Epoch: 46, step: 1189, loss: 0.3033776581287384, mean loss: 0.3425258296021894
Epoch: 46, step: 1190, loss: 0.36108723282814026, mean loss: 0.3425261041182469
Epoch: 46, step: 1191, loss: 0.35855892300605774, mean loss: 0.3425263412340019
Epoch: 46, step: 1192, loss: 0.3467739522457123, mean loss: 0.3425264040526867
Epoch: 46, step: 1193, loss: 0.3542066514492035, mean loss: 0.34252657679141596
Epoch: 46, step: 1194, loss: 0.33445271849632263, mean loss: 0.3425264573892022
Epoch: 46, step: 1195, loss: 0.35232433676719666, mean loss: 0.3425266022853775
Epoch: 46, step: 1196, loss: 0.3430224657058716, mean loss: 0.34252660961835724
Epoch: 46, step: 1197, loss: 0.3453007638454437, mean loss: 0.34252665064279053
Epoch: 46, step: 1198, loss: 0.3599777817726135, mean loss: 0.3425269087078147
Epoch: 46, step: 1199, loss: 0.3581702709197998, mean loss: 0.34252714003636986
Epoch: 46, step: 1200, loss: 0.3228829503059387, mean loss: 0.34252684954927587
Epoch: 46, step: 1201, loss: 0.3142572045326233, mean loss: 0.3425264315200413
Epoch: 46, step: 1202, loss: 0.29957398772239685, mean loss: 0.34252579638254005
Epoch: 46, step: 1203, loss: 0.3433641493320465, mean loss: 0.34252580877907624
Epoch: 46, step: 1204, loss: 0.3022591769695282, mean loss: 0.3425252133742675
Epoch: 46, step: 1205, loss: 0.3129502832889557, mean loss: 0.342524776069372
Epoch: 46, step: 1206, loss: 0.30632394552230835, mean loss: 0.34252424079959115
Epoch: 46, step: 1207, loss: 0.3223065733909607, mean loss: 0.34252394186317925
Epoch: 46, step: 1208, loss: 0.359708309173584, mean loss: 0.3425241959457619
Epoch: 46, step: 1209, loss: 0.3246724307537079, mean loss: 0.3425239319991494
Epoch: 46, step: 1210, loss: 0.3417581021785736, mean loss: 0.3425239206761684
Epoch: 46, step: 1211, loss: 0.294833242893219, mean loss: 0.3425232155682705
Epoch: 46, step: 1212, loss: 0.3653241991996765, mean loss: 0.3425235526764159
Epoch: 46, step: 1213, loss: 0.32005375623703003, mean loss: 0.34252322046972083
Epoch: 46, step: 1214, loss: 0.33876463770866394, mean loss: 0.34252316490144274
Epoch: 46, step: 1215, loss: 0.3299332857131958, mean loss: 0.3425229787707628
Epoch: 46, step: 1216, loss: 0.32482320070266724, mean loss: 0.3425227170984329
Epoch: 46, step: 1217, loss: 0.34973788261413574, mean loss: 0.34252282376537824
Epoch: 46, step: 1218, loss: 0.338306188583374, mean loss: 0.34252276142877014
Epoch: 46, step: 1219, loss: 0.334646075963974, mean loss: 0.34252264498554585
Epoch: 46, step: 1220, loss: 0.327605664730072, mean loss: 0.34252242446695236
Epoch: 46, step: 1221, loss: 0.33717307448387146, mean loss: 0.342522345388367
Epoch: 46, step: 1222, loss: 0.35435301065444946, mean loss: 0.34252252027661434
Epoch: 46, step: 1223, loss: 0.3211875557899475, mean loss: 0.34252220489457075
Epoch: 46, step: 1224, loss: 0.31649985909461975, mean loss: 0.3425218202274537
Epoch: 46, step: 1225, loss: 0.34838882088661194, mean loss: 0.34252190695325796
Epoch: 46, step: 1226, loss: 0.33778467774391174, mean loss: 0.34252183692873195
Epoch: 46, step: 1227, loss: 0.3363092839717865, mean loss: 0.3425217450977002
Epoch: 46, step: 1228, loss: 0.34561842679977417, mean loss: 0.342521790870714
Epoch: 46, step: 1229, loss: 0.32551416754722595, mean loss: 0.3425215394794685
Epoch: 46, step: 1230, loss: 0.3819862902164459, mean loss: 0.3425221228029588
Epoch: 46, step: 1231, loss: 0.316266268491745, mean loss: 0.3425217347242324
Epoch: 46, step: 1232, loss: 0.32647091150283813, mean loss: 0.3425214974860572
Epoch: 46, step: 1233, loss: 0.3028286397457123, mean loss: 0.34252091081696057
Epoch: 46, step: 1234, loss: 0.3342132866382599, mean loss: 0.34252078803027763
Epoch: 46, step: 1235, loss: 0.33216848969459534, mean loss: 0.34252063502557273
Epoch: 46, step: 1236, loss: 0.29510629177093506, mean loss: 0.342519934262308
Epoch: 46, step: 1237, loss: 0.3463699519634247, mean loss: 0.3425199911630455
Epoch: 46, step: 1238, loss: 0.3447840213775635, mean loss: 0.34252002462343323
Epoch: 46, step: 1239, loss: 0.3382295072078705, mean loss: 0.342519961214273
Epoch: 46, step: 1240, loss: 0.32257089018821716, mean loss: 0.3425196663931539
Epoch: 46, step: 1241, loss: 0.3347586989402771, mean loss: 0.3425195516979236
Epoch: 46, step: 1242, loss: 0.34948429465293884, mean loss: 0.34251965462465234
Epoch: 46, step: 1243, loss: 0.320662260055542, mean loss: 0.34251933161533377
Epoch: 46, step: 1244, loss: 0.33456963300704956, mean loss: 0.3425192141361541
Epoch: 46, step: 1245, loss: 0.32791614532470703, mean loss: 0.34251899833788585
Epoch: 46, step: 1246, loss: 0.3384394645690918, mean loss: 0.34251893805307004
Epoch: 46, step: 1247, loss: 0.337184339761734, mean loss: 0.3425188592228553
Epoch: 46, step: 1248, loss: 0.2874707877635956, mean loss: 0.34251804578069284
Epoch: 46, step: 1249, loss: 0.323364794254303, mean loss: 0.34251776275838697
Epoch: 46, step: 1250, loss: 0.32485058903694153, mean loss: 0.34251750169929984
Epoch: 46, step: 1251, loss: 0.3438064754009247, mean loss: 0.3425175207455452
Epoch: 46, step: 1252, loss: 0.3302602171897888, mean loss: 0.34251733963078607
Epoch: 46, step: 1253, loss: 0.3622344732284546, mean loss: 0.3425176309682014
Epoch: 46, step: 1254, loss: 0.3524737060070038, mean loss: 0.34251777807550265
Epoch: 46, step: 1255, loss: 0.364617258310318, mean loss: 0.3425181046044659
Epoch: 46, step: 1256, loss: 0.29923582077026367, mean loss: 0.3425174651002648
Epoch: 46, step: 1257, loss: 0.38131555914878845, mean loss: 0.34251803834121586
Epoch: 46, step: 1258, loss: 0.3537053167819977, mean loss: 0.34251820363055646
Epoch: 46, step: 1259, loss: 0.3174648582935333, mean loss: 0.3425178334788908
Epoch: 46, step: 1260, loss: 0.33421146869659424, mean loss: 0.342517710757981
Epoch: 46, step: 1261, loss: 0.3373362421989441, mean loss: 0.3425176342064259
Epoch: 46, step: 1262, loss: 0.3290245532989502, mean loss: 0.3425174348611911
Epoch: 46, step: 1263, loss: 0.369448184967041, mean loss: 0.3425178327271364
Epoch: 46, step: 1264, loss: 0.33612900972366333, mean loss: 0.3425177383421846
Epoch: 46, step: 1265, loss: 0.30767586827278137, mean loss: 0.3425172236151929
Epoch: 46, step: 1266, loss: 0.33592528104782104, mean loss: 0.3425171262323419
Epoch: 46, step: 1267, loss: 0.3346361815929413, mean loss: 0.34251700980876687
Epoch: 46, step: 1268, loss: 0.3214820623397827, mean loss: 0.34251669906840276
Epoch: 46, step: 1269, loss: 0.35559359192848206, mean loss: 0.34251689224494514
Epoch: 46, step: 1270, loss: 0.348436564207077, mean loss: 0.3425169796911666
Epoch: 46, step: 1271, loss: 0.3224845230579376, mean loss: 0.34251668377328914
Epoch: 46, step: 1272, loss: 0.3352087140083313, mean loss: 0.34251657582212786
Epoch: 46, step: 1273, loss: 0.32631587982177734, mean loss: 0.3425163365137879
Epoch: 46, step: 1274, loss: 0.31974372267723083, mean loss: 0.34251600013343014
Epoch: 46, step: 1275, loss: 0.33792567253112793, mean loss: 0.34251593232947736
Epoch: 46, step: 1276, loss: 0.343342125415802, mean loss: 0.34251594453303547
Epoch: 46, step: 1277, loss: 0.36335158348083496, mean loss: 0.3425162522881823
Epoch: 46, step: 1278, loss: 0.2922322154045105, mean loss: 0.3425155095731344
Epoch: 46, step: 1279, loss: 0.3330744206905365, mean loss: 0.34251537012658945
Epoch: 46, step: 1280, loss: 0.33037394285202026, mean loss: 0.3425151907982197
Epoch: 46, step: 1281, loss: 0.33375927805900574, mean loss: 0.3425150614756672
Epoch: 46, step: 1282, loss: 0.30396854877471924, mean loss: 0.34251449216211466
Epoch: 46, step: 1283, loss: 0.310199499130249, mean loss: 0.34251401489217564
Epoch: 46, step: 1284, loss: 0.3561352491378784, mean loss: 0.3425142160653468
Epoch: 46, step: 1285, loss: 0.33404529094696045, mean loss: 0.34251409098891616
Epoch: 46, step: 1286, loss: 0.29932475090026855, mean loss: 0.342513453140707
Epoch: 46, step: 1287, loss: 0.32184478640556335, mean loss: 0.34251314789692844
Epoch: 46, step: 1288, loss: 0.30340585112571716, mean loss: 0.34251257035204385
Epoch: 46, step: 1289, loss: 0.33060091733932495, mean loss: 0.3425123944408141
Epoch: 46, step: 1290, loss: 0.326401948928833, mean loss: 0.34251215652535205
Epoch: 46, step: 1291, loss: 0.37061017751693726, mean loss: 0.34251257146452435
Epoch: 46, step: 1292, loss: 0.3411442041397095, mean loss: 0.34251255125737806
Epoch: 46, step: 1293, loss: 0.30425459146499634, mean loss: 0.34251198629740004
Epoch: 46, step: 1294, loss: 0.3708151876926422, mean loss: 0.34251240424806967
Epoch: 46, step: 1295, loss: 0.3456745445728302, mean loss: 0.34251245094240407
Epoch: 46, step: 1296, loss: 0.32080650329589844, mean loss: 0.3425121304222161
Epoch: 46, step: 1297, loss: 0.32746344804763794, mean loss: 0.34251190820960614
Epoch: 46, step: 1298, loss: 0.36398839950561523, mean loss: 0.3425122253321686
Epoch: 46, step: 1299, loss: 0.3672957718372345, mean loss: 0.34251259128141115
Epoch: 46, step: 1300, loss: 0.3537670969963074, mean loss: 0.34251275746089754
Epoch: 46, step: 1301, loss: 0.3244440257549286, mean loss: 0.3425124906692414
Epoch: 46, step: 1302, loss: 0.3459552824497223, mean loss: 0.3425125415026133
Epoch: 46, step: 1303, loss: 0.3375777304172516, mean loss: 0.34251246864041324
Epoch: 46, step: 1304, loss: 0.3459950089454651, mean loss: 0.3425125200591601
Epoch: 46, step: 1305, loss: 0.37031397223472595, mean loss: 0.3425129305338711
Epoch: 46, step: 1306, loss: 0.36564552783966064, mean loss: 0.34251327207020316
Epoch: 46, step: 1307, loss: 0.31562143564224243, mean loss: 0.3425128750372434
Epoch: 46, step: 1308, loss: 0.36276930570602417, mean loss: 0.3425131741001916
Epoch: 46, step: 1309, loss: 0.3347684442996979, mean loss: 0.3425130597598337
Epoch: 46, step: 1310, loss: 0.2994888424873352, mean loss: 0.3425124245754051
Epoch: 46, step: 1311, loss: 0.3709048330783844, mean loss: 0.34251284373816204
Epoch: 46, step: 1312, loss: 0.36878105998039246, mean loss: 0.34251323153532226
Epoch: 46, step: 1313, loss: 0.3461616635322571, mean loss: 0.342513285396257
Epoch: 46, step: 1314, loss: 0.3530910015106201, mean loss: 0.34251344155026153
Epoch: 46, step: 1315, loss: 0.30526202917099, mean loss: 0.34251289163274784
Epoch: 46, step: 1316, loss: 0.316099613904953, mean loss: 0.34251250171707304
Epoch: 46, step: 1317, loss: 0.34990960359573364, mean loss: 0.34251261091228247
Epoch: 46, step: 1318, loss: 0.33945178985595703, mean loss: 0.34251256572944355
Epoch: 46, step: 1319, loss: 0.33076170086860657, mean loss: 0.342512392269582
Epoch: 46, step: 1320, loss: 0.41531145572662354, mean loss: 0.34251346687381046
Epoch: 46, step: 1321, loss: 0.324118971824646, mean loss: 0.34251319535231767
Epoch: 46, step: 1322, loss: 0.30373290181159973, mean loss: 0.3425126229241136
Epoch: 46, step: 1323, loss: 0.3434920012950897, mean loss: 0.3425126373803097
Epoch: 46, step: 1324, loss: 0.3343667984008789, mean loss: 0.34251251714474934
Epoch: 46, step: 1325, loss: 0.33637261390686035, mean loss: 0.3425124265188713
Epoch: 46, step: 1326, loss: 0.3282730281352997, mean loss: 0.3425122163463516
Epoch: 46, step: 1327, loss: 0.3804256021976471, mean loss: 0.3425127759370036
Epoch: 46, step: 1328, loss: 0.35242822766304016, mean loss: 0.3425129222840543
Epoch: 46, step: 1329, loss: 0.30530112981796265, mean loss: 0.3425123730649312
Epoch: 46, step: 1330, loss: 0.2996161878108978, mean loss: 0.3425117399576291
Epoch: 46, step: 1331, loss: 0.323933482170105, mean loss: 0.3425114657640848
Epoch: 46, step: 1332, loss: 0.3217672109603882, mean loss: 0.34251115960745443
Epoch: 46, step: 1333, loss: 0.3621883988380432, mean loss: 0.3425114500121185
Epoch: 46, step: 1334, loss: 0.32242152094841003, mean loss: 0.3425111535211865
Epoch: 46, step: 1335, loss: 0.34686988592147827, mean loss: 0.34251121784722544
Epoch: 46, step: 1336, loss: 0.31160232424736023, mean loss: 0.3425107617014543
Epoch: 46, step: 1337, loss: 0.3672829568386078, mean loss: 0.34251112727795935
Epoch: 46, step: 1338, loss: 0.37718066573143005, mean loss: 0.3425116389072918
Epoch: 46, step: 1339, loss: 0.2844015061855316, mean loss: 0.3425107813703589
Epoch: 46, step: 1340, loss: 0.33227694034576416, mean loss: 0.34251063035079093
Epoch: 46, step: 1341, loss: 0.33650529384613037, mean loss: 0.34251054173206613
Epoch: 46, step: 1342, loss: 0.323220431804657, mean loss: 0.3425102570786223
Epoch: 46, step: 1343, loss: 0.33834514021873474, mean loss: 0.3425101956172119
Epoch: 46, step: 1344, loss: 0.3198332190513611, mean loss: 0.3425098609955329
Epoch: 46, step: 1345, loss: 0.3278313875198364, mean loss: 0.34250964440303655
Epoch: 46, step: 1346, loss: 0.29401063919067383, mean loss: 0.3425089287723802
Epoch: 46, step: 1347, loss: 0.31727102398872375, mean loss: 0.3425085563781055
Epoch: 46, step: 1348, loss: 0.335742324590683, mean loss: 0.34250845654141854
Epoch: 46, step: 1349, loss: 0.2945893704891205, mean loss: 0.3425077494991007
Epoch: 46, step: 1350, loss: 0.3199939429759979, mean loss: 0.34250741731457063
Epoch: 46, step: 1351, loss: 0.3928253650665283, mean loss: 0.34250815972999427
Epoch: 46, step: 1352, loss: 0.40893593430519104, mean loss: 0.3425091398231612
Epoch: 46, step: 1353, loss: 0.3397281765937805, mean loss: 0.3425090987926907
Epoch: 46, step: 1354, loss: 0.340145468711853, mean loss: 0.34250906392008884
Epoch: 46, step: 1355, loss: 0.2989775240421295, mean loss: 0.342508421672525
Epoch: 46, step: 1356, loss: 0.37061095237731934, mean loss: 0.3425088362803163
Epoch: 46, step: 1357, loss: 0.3579731583595276, mean loss: 0.34250906442823287
Epoch: 46, step: 1358, loss: 0.342389851808548, mean loss: 0.34250906266949366
Epoch: 46, step: 1359, loss: 0.3187905550003052, mean loss: 0.3425087127564217
Epoch: 46, step: 1360, loss: 0.3540828824043274, mean loss: 0.34250888350466463
Epoch: 46, step: 1361, loss: 0.3189236521720886, mean loss: 0.3425085355680504
Epoch: 46, step: 1362, loss: 0.3471442759037018, mean loss: 0.34250860395491417
Epoch: 46, step: 1363, loss: 0.3582254946231842, mean loss: 0.34250883580849695
Epoch: 46, step: 1364, loss: 0.30656135082244873, mean loss: 0.3425083055235689
Epoch: 46, step: 1365, loss: 0.3409634530544281, mean loss: 0.3425082827347731
Epoch: 46, step: 1366, loss: 0.3541545867919922, mean loss: 0.34250845453197415
Epoch: 46, step: 1367, loss: 0.3399534821510315, mean loss: 0.3425084168435687
Epoch: 46, step: 1368, loss: 0.3267260789871216, mean loss: 0.3425081840416886
Epoch: 46, step: 1369, loss: 0.3227769434452057, mean loss: 0.3425078929946845
Epoch: 46, step: 1370, loss: 0.33325785398483276, mean loss: 0.3425077565533686
Epoch: 46, step: 1371, loss: 0.33423250913619995, mean loss: 0.34250763449237065
Epoch: 46, step: 1372, loss: 0.34534043073654175, mean loss: 0.342507676275875
Epoch: 46, step: 1373, loss: 0.32328012585639954, mean loss: 0.3425073926753201
Epoch: 46, step: 1374, loss: 0.3198834955692291, mean loss: 0.3425070589846004
Epoch: 46, step: 1375, loss: 0.35653936862945557, mean loss: 0.3425072659508193
Epoch: 46, step: 1376, loss: 0.3141922056674957, mean loss: 0.34250684833072104
Epoch: 46, step: 1377, loss: 0.3359357714653015, mean loss: 0.34250675141504205
Epoch: 46, step: 1378, loss: 0.3345061242580414, mean loss: 0.3425066334169128
Epoch: 46, step: 1379, loss: 0.3428190052509308, mean loss: 0.3425066380238952
Epoch: 46, step: 1380, loss: 0.30703049898147583, mean loss: 0.34250611481559134
Epoch: 46, step: 1381, loss: 0.34116703271865845, mean loss: 0.34250609506686563
Epoch: 46, step: 1382, loss: 0.3097985088825226, mean loss: 0.3425056127038915
Epoch: 46, step: 1383, loss: 0.3117575943470001, mean loss: 0.3425051592468015
Epoch: 46, step: 1384, loss: 0.31775495409965515, mean loss: 0.34250479424797914
Epoch: 46, step: 1385, loss: 0.39215224981307983, mean loss: 0.342505526403348
Epoch: 46, step: 1386, loss: 0.31380611658096313, mean loss: 0.342505103176883
Epoch: 46, step: 1387, loss: 0.34938177466392517, mean loss: 0.34250520458476785
Epoch: 46, step: 1388, loss: 0.3251894414424896, mean loss: 0.34250494923899133
Epoch: 46, step: 1389, loss: 0.394949346780777, mean loss: 0.3425057225954891
Epoch: 46, step: 1390, loss: 0.34499219059944153, mean loss: 0.3425057592609467
Epoch: 46, step: 1391, loss: 0.34820324182510376, mean loss: 0.34250584327478656
Epoch: 46, step: 1392, loss: 0.3893597424030304, mean loss: 0.3425065341620144
Epoch: 46, step: 1393, loss: 0.34390023350715637, mean loss: 0.342506554712596
Epoch: 46, step: 1394, loss: 0.31084245443344116, mean loss: 0.34250608782130776
Epoch: 46, step: 1395, loss: 0.2936209738254547, mean loss: 0.34250536701455464
Epoch: 46, step: 1396, loss: 0.33481305837631226, mean loss: 0.34250525359380535
Epoch: 46, step: 1397, loss: 0.3396664261817932, mean loss: 0.3425052117367765
Epoch: 46, step: 1398, loss: 0.32015079259872437, mean loss: 0.3425048821373908
Epoch: 46, step: 1399, loss: 0.31999436020851135, mean loss: 0.34250455024127835
Epoch: 46, step: 1400, loss: 0.3056235611438751, mean loss: 0.34250400647439155
Epoch: 46, step: 1401, loss: 0.333876371383667, mean loss: 0.3425038792719162
Epoch: 46, step: 1402, loss: 0.31238773465156555, mean loss: 0.3425034352578124
Epoch: 46, step: 1403, loss: 0.29587188363075256, mean loss: 0.342502747760737
Epoch: 46, step: 1404, loss: 0.3294726312160492, mean loss: 0.34250255565829496
Epoch: 46, step: 1405, loss: 0.31188562512397766, mean loss: 0.34250210428087297
Epoch: 46, step: 1406, loss: 0.43780753016471863, mean loss: 0.342503509323197
Epoch: 46, step: 1407, loss: 0.3268641233444214, mean loss: 0.34250327876260644
Epoch: 46, step: 1408, loss: 0.3139771819114685, mean loss: 0.3425028582283996
Epoch: 46, step: 1409, loss: 0.36973488330841064, mean loss: 0.34250325967936934
Epoch: 46, step: 1410, loss: 0.3369559049606323, mean loss: 0.3425031779021936
Epoch: 46, step: 1411, loss: 0.3575834333896637, mean loss: 0.34250340020680303
Epoch: 46, step: 1412, loss: 0.33198460936546326, mean loss: 0.34250324514701497
Epoch: 46, step: 1413, loss: 0.3415686786174774, mean loss: 0.34250323137056915
Epoch: 46, step: 1414, loss: 0.3446737229824066, mean loss: 0.3425032633653157
Epoch: 46, step: 1415, loss: 0.30731201171875, mean loss: 0.3425027446263469
Epoch: 46, step: 1416, loss: 0.3061378598213196, mean loss: 0.34250220859526237
Epoch: 46, step: 1417, loss: 0.3615485727787018, mean loss: 0.34250248934117467
Epoch: 46, step: 1418, loss: 0.3080836534500122, mean loss: 0.3425019820104863
Epoch: 46, step: 1419, loss: 0.32584479451179504, mean loss: 0.3425017364885905
Epoch: 46, step: 1420, loss: 0.30570682883262634, mean loss: 0.34250119415079616
Epoch: 46, step: 1421, loss: 0.3153859078884125, mean loss: 0.3425007944914756
Epoch: 46, step: 1422, loss: 0.32031458616256714, mean loss: 0.3425004674879481
Epoch: 46, step: 1423, loss: 0.3655623197555542, mean loss: 0.3425008073926213
Epoch: 46, step: 1424, loss: 0.35039573907852173, mean loss: 0.3425009237529462
Epoch: 46, step: 1425, loss: 0.3403371274471283, mean loss: 0.3425008918620648
Epoch: 46, step: 1426, loss: 0.30796870589256287, mean loss: 0.34250038292062
Epoch: 46, step: 1427, loss: 0.30749648809432983, mean loss: 0.3424998670346502
Epoch: 46, step: 1428, loss: 0.31980282068252563, mean loss: 0.34249953253143955
Epoch: 46, step: 1429, loss: 0.3074460029602051, mean loss: 0.3424990159291822
Epoch: 46, step: 1430, loss: 0.36408156156539917, mean loss: 0.34249933399779375
Epoch: 46, step: 1431, loss: 0.39263442158699036, mean loss: 0.3425000728431072
Epoch: 46, step: 1432, loss: 0.30769720673561096, mean loss: 0.3424995599576848
Epoch: 46, step: 1433, loss: 0.3412444591522217, mean loss: 0.34249954146169603
Epoch: 46, step: 1434, loss: 0.33298906683921814, mean loss: 0.34249940131116885
Epoch: 46, step: 1435, loss: 0.36776718497276306, mean loss: 0.3424997736628291
Epoch: 46, step: 1436, loss: 0.34139275550842285, mean loss: 0.3424997573498046
Epoch: 46, step: 1437, loss: 0.3094711899757385, mean loss: 0.34249927064785984
Epoch: 46, step: 1438, loss: 0.31917983293533325, mean loss: 0.34249892702264856
Epoch: 46, step: 1439, loss: 0.334771066904068, mean loss: 0.3424988131499013
Epoch: 46, step: 1440, loss: 0.3488936722278595, mean loss: 0.3424989073790191
Epoch: 46, step: 1441, loss: 0.3222101926803589, mean loss: 0.34249860842645524
Epoch: 46, step: 1442, loss: 0.35523784160614014, mean loss: 0.34249879613525597
Epoch: 46, step: 1443, loss: 0.31813687086105347, mean loss: 0.34249843717484346
Valid: 46, mean loss: 0.18459004908800125
Epoch: 47, step: 0, loss: 0.33975672721862793, mean loss: 0.3424983967777556
Epoch: 47, step: 1, loss: 0.3793818950653076, mean loss: 0.34249894022107796
Epoch: 47, step: 2, loss: 0.3183846175670624, mean loss: 0.3424985849246678
Epoch: 47, step: 3, loss: 0.35160261392593384, mean loss: 0.3424987190599371
Epoch: 47, step: 4, loss: 0.381144642829895, mean loss: 0.3424992884457573
Epoch: 47, step: 5, loss: 0.3261111378669739, mean loss: 0.34249904699615097
Epoch: 47, step: 6, loss: 0.3383331298828125, mean loss: 0.3424989856198399
Epoch: 47, step: 7, loss: 0.36311396956443787, mean loss: 0.34249928933520235
Epoch: 47, step: 8, loss: 0.32032012939453125, mean loss: 0.34249896258004314
Epoch: 47, step: 9, loss: 0.32151079177856445, mean loss: 0.3424986533757236
Epoch: 47, step: 10, loss: 0.3111095130443573, mean loss: 0.34249819094786915
Epoch: 47, step: 11, loss: 0.35585781931877136, mean loss: 0.34249838776030833
Epoch: 47, step: 12, loss: 0.37254923582077026, mean loss: 0.3424988304592677
Epoch: 47, step: 13, loss: 0.3097091317176819, mean loss: 0.3424983474195997
Epoch: 47, step: 14, loss: 0.2997511327266693, mean loss: 0.34249771770060244
Epoch: 47, step: 15, loss: 0.34250113368034363, mean loss: 0.3424977177509233
Epoch: 47, step: 16, loss: 0.32977402210235596, mean loss: 0.34249753032077457
Epoch: 47, step: 17, loss: 0.2961348295211792, mean loss: 0.3424968473714065
Epoch: 47, step: 18, loss: 0.3005989193916321, mean loss: 0.34249623019981285
Epoch: 47, step: 19, loss: 0.3301328718662262, mean loss: 0.34249604808576717
Epoch: 47, step: 20, loss: 0.33530521392822266, mean loss: 0.34249594216530643
Epoch: 47, step: 21, loss: 0.3076464831829071, mean loss: 0.3424954288428881
Epoch: 47, step: 22, loss: 0.3390839993953705, mean loss: 0.3424953785942624
Epoch: 47, step: 23, loss: 0.3152281641960144, mean loss: 0.34249497696793824
Epoch: 47, step: 24, loss: 0.32117682695388794, mean loss: 0.34249466297164977
Epoch: 47, step: 25, loss: 0.30266937613487244, mean loss: 0.3424940763912916
Epoch: 47, step: 26, loss: 0.35795897245407104, mean loss: 0.3424943041679476
Epoch: 47, step: 27, loss: 0.2872331738471985, mean loss: 0.34249349025946524
Epoch: 47, step: 28, loss: 0.3615801930427551, mean loss: 0.3424937713720738
Epoch: 47, step: 29, loss: 0.33532482385635376, mean loss: 0.34249366578799895
Epoch: 47, step: 30, loss: 0.32951924204826355, mean loss: 0.3424934747038336
Epoch: 47, step: 31, loss: 0.34309470653533936, mean loss: 0.3424934835584998
Epoch: 47, step: 32, loss: 0.34443360567092896, mean loss: 0.34249351213130597
Epoch: 47, step: 33, loss: 0.31653785705566406, mean loss: 0.3424931298796039
Epoch: 47, step: 34, loss: 0.3205604553222656, mean loss: 0.34249280687952205
Epoch: 47, step: 35, loss: 0.3315944969654083, mean loss: 0.3424926463836762
Epoch: 47, step: 36, loss: 0.3529406487941742, mean loss: 0.3424928002457248
Epoch: 47, step: 37, loss: 0.2991343140602112, mean loss: 0.34249216173828534
Epoch: 47, step: 38, loss: 0.3488122820854187, mean loss: 0.34249225480851886
Epoch: 47, step: 39, loss: 0.3306645452976227, mean loss: 0.3424920806359691
Epoch: 47, step: 40, loss: 0.3324602544307709, mean loss: 0.34249193291142294
Epoch: 47, step: 41, loss: 0.34933164715766907, mean loss: 0.34249203362875835
Epoch: 47, step: 42, loss: 0.32208070158958435, mean loss: 0.3424917330687307
Epoch: 47, step: 43, loss: 0.33410438895225525, mean loss: 0.3424916095656073
Epoch: 47, step: 44, loss: 0.32570961117744446, mean loss: 0.3424913624553576
Epoch: 47, step: 45, loss: 0.32076969742774963, mean loss: 0.3424910426146027
Epoch: 47, step: 46, loss: 0.34703704714775085, mean loss: 0.3424911095512814
Epoch: 47, step: 47, loss: 0.3296204209327698, mean loss: 0.34249092004234954
Epoch: 47, step: 48, loss: 0.33858513832092285, mean loss: 0.34249086253418926
Epoch: 47, step: 49, loss: 0.3661854565143585, mean loss: 0.34249121140479766
Epoch: 47, step: 50, loss: 0.3382395803928375, mean loss: 0.34249114880624626
Epoch: 47, step: 51, loss: 0.3105875849723816, mean loss: 0.34249067908357494
Epoch: 47, step: 52, loss: 0.3370842933654785, mean loss: 0.3424905994854283
Epoch: 47, step: 53, loss: 0.38090336322784424, mean loss: 0.34249116502772303
Epoch: 47, step: 54, loss: 0.3146141767501831, mean loss: 0.34249075460727224
Epoch: 47, step: 55, loss: 0.3559481203556061, mean loss: 0.3424909527311423
Epoch: 47, step: 56, loss: 0.3645160496234894, mean loss: 0.3424912769872614
Epoch: 47, step: 57, loss: 0.33350038528442383, mean loss: 0.34249114462422364
Epoch: 47, step: 58, loss: 0.32770535349845886, mean loss: 0.34249092695244177
Epoch: 47, step: 59, loss: 0.32715466618537903, mean loss: 0.3424907011801422
Epoch: 47, step: 60, loss: 0.2875896990299225, mean loss: 0.34248989296859556
Epoch: 47, step: 61, loss: 0.33798518776893616, mean loss: 0.34248982665466654
Epoch: 47, step: 62, loss: 0.3158492147922516, mean loss: 0.3424894344830238
Epoch: 47, step: 63, loss: 0.38949763774871826, mean loss: 0.3424901264721198
Epoch: 47, step: 64, loss: 0.3099355697631836, mean loss: 0.3424896472564704
Epoch: 47, step: 65, loss: 0.3076113760471344, mean loss: 0.3424891338424037
Epoch: 47, step: 66, loss: 0.3249656558036804, mean loss: 0.3424888758976324
Epoch: 47, step: 67, loss: 0.36300864815711975, mean loss: 0.3424891779432674
Epoch: 47, step: 68, loss: 0.3250090479850769, mean loss: 0.34248892064415265
Epoch: 47, step: 69, loss: 0.3432750701904297, mean loss: 0.34248893221572596
Epoch: 47, step: 70, loss: 0.3236960768699646, mean loss: 0.3424886556020674
Epoch: 47, step: 71, loss: 0.3540341854095459, mean loss: 0.342488825539215
Epoch: 47, step: 72, loss: 0.3596305251121521, mean loss: 0.342489077841942
Epoch: 47, step: 73, loss: 0.31029456853866577, mean loss: 0.3424886039891072
Epoch: 47, step: 74, loss: 0.34283873438835144, mean loss: 0.3424886091424033
Epoch: 47, step: 75, loss: 0.35518449544906616, mean loss: 0.34248879600049686
Epoch: 47, step: 76, loss: 0.3881601095199585, mean loss: 0.3424894681811359
Epoch: 47, step: 77, loss: 0.31001225113868713, mean loss: 0.34248899019542606
Epoch: 47, step: 78, loss: 0.3503493666648865, mean loss: 0.3424891058793631
Epoch: 47, step: 79, loss: 0.31949207186698914, mean loss: 0.34248876742887135
Epoch: 47, step: 80, loss: 0.2884891927242279, mean loss: 0.3424879727214481
Epoch: 47, step: 81, loss: 0.33165064454078674, mean loss: 0.34248781323170296
Epoch: 47, step: 82, loss: 0.3043656349182129, mean loss: 0.34248725220716597
Epoch: 47, step: 83, loss: 0.3428018093109131, mean loss: 0.34248725683627335
Epoch: 47, step: 84, loss: 0.33470970392227173, mean loss: 0.34248714238138667
Epoch: 47, step: 85, loss: 0.28497636318206787, mean loss: 0.34248629606212366
Epoch: 47, step: 86, loss: 0.3494940400123596, mean loss: 0.3424863991854251
Epoch: 47, step: 87, loss: 0.3156338334083557, mean loss: 0.342486004039069
Epoch: 47, step: 88, loss: 0.34760016202926636, mean loss: 0.34248607929486297
Epoch: 47, step: 89, loss: 0.3158385157585144, mean loss: 0.342485687176738
Epoch: 47, step: 90, loss: 0.347053200006485, mean loss: 0.34248575438656786
Epoch: 47, step: 91, loss: 0.33709898591041565, mean loss: 0.3424856751227586
Epoch: 47, step: 92, loss: 0.3458409309387207, mean loss: 0.34248572449307124
Epoch: 47, step: 93, loss: 0.31794866919517517, mean loss: 0.34248536345226466
Epoch: 47, step: 94, loss: 0.3589487373828888, mean loss: 0.342485605692512
Epoch: 47, step: 95, loss: 0.32103782892227173, mean loss: 0.3424852901169607
Epoch: 47, step: 96, loss: 0.3468652069568634, mean loss: 0.34248535456067203
Epoch: 47, step: 97, loss: 0.30110087990760803, mean loss: 0.34248474566100673
Epoch: 47, step: 98, loss: 0.37861496210098267, mean loss: 0.342485277245694
Epoch: 47, step: 99, loss: 0.32119718194007874, mean loss: 0.3424849640380771
Epoch: 47, step: 100, loss: 0.32952243089675903, mean loss: 0.3424847733256473
Epoch: 47, step: 101, loss: 0.3149426579475403, mean loss: 0.34248436811576977
Epoch: 47, step: 102, loss: 0.3294368088245392, mean loss: 0.3424841761580335
Epoch: 47, step: 103, loss: 0.3258053958415985, mean loss: 0.3424839307808147
Epoch: 47, step: 104, loss: 0.34319594502449036, mean loss: 0.3424839412557716
Epoch: 47, step: 105, loss: 0.35201209783554077, mean loss: 0.3424840814293171
Epoch: 47, step: 106, loss: 0.36487284302711487, mean loss: 0.3424844107969022
Epoch: 47, step: 107, loss: 0.39289993047714233, mean loss: 0.34248515246336797
Epoch: 47, step: 108, loss: 0.33569154143333435, mean loss: 0.34248505252352024
Epoch: 47, step: 109, loss: 0.32986578345298767, mean loss: 0.3424848668859747
Epoch: 47, step: 110, loss: 0.3560120463371277, mean loss: 0.3424850658765372
Epoch: 47, step: 111, loss: 0.34963491559028625, mean loss: 0.34248517105232
Epoch: 47, step: 112, loss: 0.33544597029685974, mean loss: 0.3424850675057297
Epoch: 47, step: 113, loss: 0.39268165826797485, mean loss: 0.3424858058863417
Epoch: 47, step: 114, loss: 0.31539595127105713, mean loss: 0.3424854074065068
Epoch: 47, step: 115, loss: 0.3189893364906311, mean loss: 0.3424850617947317
Epoch: 47, step: 116, loss: 0.320300430059433, mean loss: 0.34248473547816577
Epoch: 47, step: 117, loss: 0.32922473549842834, mean loss: 0.34248454043801074
Epoch: 47, step: 118, loss: 0.32176119089126587, mean loss: 0.3424842356245972
Epoch: 47, step: 119, loss: 0.3323911130428314, mean loss: 0.3424840871701261
Epoch: 47, step: 120, loss: 0.37994059920310974, mean loss: 0.3424846380903048
Epoch: 47, step: 121, loss: 0.33515486121177673, mean loss: 0.3424845302836145
Epoch: 47, step: 122, loss: 0.30808025598526, mean loss: 0.342484024271432
Epoch: 47, step: 123, loss: 0.35446351766586304, mean loss: 0.3424842004611807
Epoch: 47, step: 124, loss: 0.32484129071235657, mean loss: 0.3424839409799143
Epoch: 47, step: 125, loss: 0.3138696849346161, mean loss: 0.3424835201448988
Epoch: 47, step: 126, loss: 0.32631242275238037, mean loss: 0.3424832823171557
Epoch: 47, step: 127, loss: 0.35930630564689636, mean loss: 0.3424835297291112
Epoch: 47, step: 128, loss: 0.32951104640960693, mean loss: 0.34248333894888094
Epoch: 47, step: 129, loss: 0.31598544120788574, mean loss: 0.3424829492624528
Epoch: 47, step: 130, loss: 0.3361215889453888, mean loss: 0.34248285571166065
Epoch: 47, step: 131, loss: 0.29678231477737427, mean loss: 0.3424821836448822
Epoch: 47, step: 132, loss: 0.3256657123565674, mean loss: 0.3424819363474706
Epoch: 47, step: 133, loss: 0.28539228439331055, mean loss: 0.3424810968184574
Epoch: 47, step: 134, loss: 0.36886921525001526, mean loss: 0.342481484861903
Epoch: 47, step: 135, loss: 0.30634424090385437, mean loss: 0.34248095346310353
Epoch: 47, step: 136, loss: 0.31106337904930115, mean loss: 0.3424804914739202
Epoch: 47, step: 137, loss: 0.3546803891658783, mean loss: 0.34248067086835143
Epoch: 47, step: 138, loss: 0.3202212452888489, mean loss: 0.34248034355755136
Epoch: 47, step: 139, loss: 0.31992965936660767, mean loss: 0.3424800119688531
Epoch: 47, step: 140, loss: 0.31035295128822327, mean loss: 0.34247953957460114
Epoch: 47, step: 141, loss: 0.4118815064430237, mean loss: 0.3424805600416923
Epoch: 47, step: 142, loss: 0.3521672487258911, mean loss: 0.3424807024699566
Epoch: 47, step: 143, loss: 0.3102198839187622, mean loss: 0.34248022812986145
Epoch: 47, step: 144, loss: 0.31053751707077026, mean loss: 0.3424797584738978
Epoch: 47, step: 145, loss: 0.35185128450393677, mean loss: 0.3424798962620889
Epoch: 47, step: 146, loss: 0.338798850774765, mean loss: 0.3424798421410055
Epoch: 47, step: 147, loss: 0.3293370306491852, mean loss: 0.34247964890983207
Epoch: 47, step: 148, loss: 0.299787700176239, mean loss: 0.34247902124397306
Epoch: 47, step: 149, loss: 0.3562026023864746, mean loss: 0.3424792230079347
Epoch: 47, step: 150, loss: 0.33402547240257263, mean loss: 0.3424790987227996
Epoch: 47, step: 151, loss: 0.34707921743392944, mean loss: 0.34247916635171327
Epoch: 47, step: 152, loss: 0.32604703307151794, mean loss: 0.3424789247772983
Epoch: 47, step: 153, loss: 0.3233560621738434, mean loss: 0.34247864364968367
Epoch: 47, step: 154, loss: 0.35071614384651184, mean loss: 0.3424787647484326
Epoch: 47, step: 155, loss: 0.33229273557662964, mean loss: 0.34247861500673593
Epoch: 47, step: 156, loss: 0.3550252616405487, mean loss: 0.3424787994484358
Epoch: 47, step: 157, loss: 0.3251727223396301, mean loss: 0.3424785450445739
Epoch: 47, step: 158, loss: 0.34018903970718384, mean loss: 0.34247851138874114
Epoch: 47, step: 159, loss: 0.3641051948070526, mean loss: 0.34247882929729967
Epoch: 47, step: 160, loss: 0.33722102642059326, mean loss: 0.34247875200963007
Epoch: 47, step: 161, loss: 0.3603624403476715, mean loss: 0.34247901488907057
Epoch: 47, step: 162, loss: 0.3686428368091583, mean loss: 0.3424793994758313
Epoch: 47, step: 163, loss: 0.3312681019306183, mean loss: 0.3424792346813589
Epoch: 47, step: 164, loss: 0.3057316243648529, mean loss: 0.3424786945374535
Epoch: 47, step: 165, loss: 0.3433862030506134, mean loss: 0.3424787078764974
Epoch: 47, step: 166, loss: 0.2964673638343811, mean loss: 0.34247803158717516
Epoch: 47, step: 167, loss: 0.3143843412399292, mean loss: 0.3424776186632768
Epoch: 47, step: 168, loss: 0.30703112483024597, mean loss: 0.3424770976747877
Epoch: 47, step: 169, loss: 0.3230685293674469, mean loss: 0.3424768124140759
Epoch: 47, step: 170, loss: 0.3782329261302948, mean loss: 0.34247733793787427
Epoch: 47, step: 171, loss: 0.3237001299858093, mean loss: 0.3424770619648003
Epoch: 47, step: 172, loss: 0.3013390004634857, mean loss: 0.3424764573578501
Epoch: 47, step: 173, loss: 0.2935626804828644, mean loss: 0.3424757384816137
Epoch: 47, step: 174, loss: 0.34624239802360535, mean loss: 0.3424757938386606
Epoch: 47, step: 175, loss: 0.3697671890258789, mean loss: 0.3424761949231822
Epoch: 47, step: 176, loss: 0.36897194385528564, mean loss: 0.3424765843088671
Epoch: 47, step: 177, loss: 0.3356025516986847, mean loss: 0.34247648328848956
Epoch: 47, step: 178, loss: 0.3296954929828644, mean loss: 0.34247629546257063
Epoch: 47, step: 179, loss: 0.3252072334289551, mean loss: 0.3424760416849132
Epoch: 47, step: 180, loss: 0.33555546402931213, mean loss: 0.34247593998499615
Epoch: 47, step: 181, loss: 0.29291772842407227, mean loss: 0.3424752117232539
Epoch: 47, step: 182, loss: 0.3332054615020752, mean loss: 0.342475075505561
Epoch: 47, step: 183, loss: 0.3236871361732483, mean loss: 0.34247479942345715
Epoch: 47, step: 184, loss: 0.30978307127952576, mean loss: 0.3424743190371679
Epoch: 47, step: 185, loss: 0.32049083709716797, mean loss: 0.3424739960071926
Epoch: 47, step: 186, loss: 0.35373392701148987, mean loss: 0.3424741614605906
Epoch: 47, step: 187, loss: 0.32969653606414795, mean loss: 0.34247397370895377
Epoch: 47, step: 188, loss: 0.33847329020500183, mean loss: 0.3424739149246479
Epoch: 47, step: 189, loss: 0.34345605969429016, mean loss: 0.3424739293556445
Epoch: 47, step: 190, loss: 0.42586928606033325, mean loss: 0.3424751546947871
Epoch: 47, step: 191, loss: 0.3439004421234131, mean loss: 0.34247517563641844
Epoch: 47, step: 192, loss: 0.327253520488739, mean loss: 0.3424749519891734
Epoch: 47, step: 193, loss: 0.3028809428215027, mean loss: 0.3424743702547376
Epoch: 47, step: 194, loss: 0.36833977699279785, mean loss: 0.3424747502762873
Epoch: 47, step: 195, loss: 0.3259016275405884, mean loss: 0.34247450678306424
Epoch: 47, step: 196, loss: 0.320804625749588, mean loss: 0.3424741884126678
Epoch: 47, step: 197, loss: 0.34652745723724365, mean loss: 0.3424742479617646
Epoch: 47, step: 198, loss: 0.3351852297782898, mean loss: 0.3424741408758319
Epoch: 47, step: 199, loss: 0.30363452434539795, mean loss: 0.34247357027560077
Epoch: 47, step: 200, loss: 0.3070720136165619, mean loss: 0.3424730501922051
Epoch: 47, step: 201, loss: 0.3289835751056671, mean loss: 0.34247285202157063
Epoch: 47, step: 202, loss: 0.3550690710544586, mean loss: 0.34247303706687676
Epoch: 47, step: 203, loss: 0.28117817640304565, mean loss: 0.34247213662527576
Epoch: 47, step: 204, loss: 0.34462299942970276, mean loss: 0.3424721682216914
Epoch: 47, step: 205, loss: 0.32154661417007446, mean loss: 0.3424718608274726
Epoch: 47, step: 206, loss: 0.379390686750412, mean loss: 0.34247240315322985
Epoch: 47, step: 207, loss: 0.29233506321907043, mean loss: 0.3424716666625439
Epoch: 47, step: 208, loss: 0.3062038719654083, mean loss: 0.34247113391587913
Epoch: 47, step: 209, loss: 0.2984285056591034, mean loss: 0.34247048697225185
Epoch: 47, step: 210, loss: 0.37472161650657654, mean loss: 0.34247096070320465
Epoch: 47, step: 211, loss: 0.33899033069610596, mean loss: 0.342470909577617
Epoch: 47, step: 212, loss: 0.3249659538269043, mean loss: 0.3424706524580719
Epoch: 47, step: 213, loss: 0.3055557310581207, mean loss: 0.3424701102454254
Epoch: 47, step: 214, loss: 0.3799784779548645, mean loss: 0.3424706611666202
Epoch: 47, step: 215, loss: 0.3316252827644348, mean loss: 0.3424705018725364
Epoch: 47, step: 216, loss: 0.3368630111217499, mean loss: 0.3424704195123873
Epoch: 47, step: 217, loss: 0.3215494751930237, mean loss: 0.3424701122400506
Epoch: 47, step: 218, loss: 0.3359106183052063, mean loss: 0.34247001590016285
Epoch: 47, step: 219, loss: 0.36140677332878113, mean loss: 0.3424702940219674
Epoch: 47, step: 220, loss: 0.3185601234436035, mean loss: 0.342469942861419
Epoch: 47, step: 221, loss: 0.34188273549079895, mean loss: 0.3424699342374306
Epoch: 47, step: 222, loss: 0.3821410536766052, mean loss: 0.3424705168565644
Epoch: 47, step: 223, loss: 0.36564967036247253, mean loss: 0.34247085726591503
Epoch: 47, step: 224, loss: 0.33372482657432556, mean loss: 0.34247072882348056
Epoch: 47, step: 225, loss: 0.3082713484764099, mean loss: 0.34247022658568654
Epoch: 47, step: 226, loss: 0.3130345940589905, mean loss: 0.34246979431264846
Epoch: 47, step: 227, loss: 0.31087931990623474, mean loss: 0.34246933040178135
Epoch: 47, step: 228, loss: 0.33909350633621216, mean loss: 0.3424692808280253
Epoch: 47, step: 229, loss: 0.3010101914405823, mean loss: 0.3424686720129443
Epoch: 47, step: 230, loss: 0.33101749420166016, mean loss: 0.3424685038580843
Epoch: 47, step: 231, loss: 0.3552844822406769, mean loss: 0.34246869205159947
Epoch: 47, step: 232, loss: 0.33845746517181396, mean loss: 0.3424686331504544
Epoch: 47, step: 233, loss: 0.3393303453922272, mean loss: 0.3424685870682871
Epoch: 47, step: 234, loss: 0.34231114387512207, mean loss: 0.34246858475644776
Epoch: 47, step: 235, loss: 0.2916492521762848, mean loss: 0.3424678385545715
Epoch: 47, step: 236, loss: 0.3448235094547272, mean loss: 0.34246787314338145
Epoch: 47, step: 237, loss: 0.31681501865386963, mean loss: 0.3424674964826689
Epoch: 47, step: 238, loss: 0.32450753450393677, mean loss: 0.34246723278052404
Epoch: 47, step: 239, loss: 0.31677350401878357, mean loss: 0.3424668555307331
Epoch: 47, step: 240, loss: 0.3435530662536621, mean loss: 0.3424668714788563
Epoch: 47, step: 241, loss: 0.3187711834907532, mean loss: 0.34246652357564106
Epoch: 47, step: 242, loss: 0.3192934989929199, mean loss: 0.3424661833512341
Epoch: 47, step: 243, loss: 0.3268486261367798, mean loss: 0.34246595405893293
Epoch: 47, step: 244, loss: 0.395874559879303, mean loss: 0.34246673817658774
Epoch: 47, step: 245, loss: 0.30722469091415405, mean loss: 0.34246622077858935
Epoch: 47, step: 246, loss: 0.3373569846153259, mean loss: 0.3424661457696168
Epoch: 47, step: 247, loss: 0.34172889590263367, mean loss: 0.3424661349461705
Epoch: 47, step: 248, loss: 0.3414609134197235, mean loss: 0.3424661201888922
Epoch: 47, step: 249, loss: 0.34232833981513977, mean loss: 0.3424661181662202
Epoch: 47, step: 250, loss: 0.36297690868377686, mean loss: 0.3424664192685634
Epoch: 47, step: 251, loss: 0.317940354347229, mean loss: 0.3424660592265064
Epoch: 47, step: 252, loss: 0.3155252933502197, mean loss: 0.3424656637425018
Epoch: 47, step: 253, loss: 0.30618005990982056, mean loss: 0.3424651310863286
Epoch: 47, step: 254, loss: 0.33861327171325684, mean loss: 0.3424650745436136
Epoch: 47, step: 255, loss: 0.35354679822921753, mean loss: 0.342465237213505
Epoch: 47, step: 256, loss: 0.34374722838401794, mean loss: 0.34246525603172406
Epoch: 47, step: 257, loss: 0.3221825957298279, mean loss: 0.3424649583089706
Epoch: 47, step: 258, loss: 0.3350007236003876, mean loss: 0.34246484874543914
Epoch: 47, step: 259, loss: 0.3695807456970215, mean loss: 0.3424652467594268
Epoch: 47, step: 260, loss: 0.32321682572364807, mean loss: 0.3424649642303858
Epoch: 47, step: 261, loss: 0.34846028685569763, mean loss: 0.342465052228663
Epoch: 47, step: 262, loss: 0.31806617975234985, mean loss: 0.3424646941116168
Epoch: 47, step: 263, loss: 0.34311363101005554, mean loss: 0.34246470363631737
Epoch: 47, step: 264, loss: 0.33988508582115173, mean loss: 0.34246466577481394
Epoch: 47, step: 265, loss: 0.37362390756607056, mean loss: 0.3424651230977627
Epoch: 47, step: 266, loss: 0.3764762580394745, mean loss: 0.34246562227050714
Epoch: 47, step: 267, loss: 0.3614557683467865, mean loss: 0.34246590097994234
Epoch: 47, step: 268, loss: 0.34630876779556274, mean loss: 0.342465957379062
Epoch: 47, step: 269, loss: 0.34240010380744934, mean loss: 0.3424659564125885
Epoch: 47, step: 270, loss: 0.3456849455833435, mean loss: 0.3424660036540973
Epoch: 47, step: 271, loss: 0.35630497336387634, mean loss: 0.34246620675021866
Epoch: 47, step: 272, loss: 0.3690967559814453, mean loss: 0.3424665975655755
Epoch: 47, step: 273, loss: 0.3501022160053253, mean loss: 0.3424667096200858
Epoch: 47, step: 274, loss: 0.3231378495693207, mean loss: 0.3424664259686462
Epoch: 47, step: 275, loss: 0.3064962327480316, mean loss: 0.34246589811302836
Epoch: 47, step: 276, loss: 0.32480061054229736, mean loss: 0.3424656388821593
Epoch: 47, step: 277, loss: 0.36204788088798523, mean loss: 0.3424659262393337
Epoch: 47, step: 278, loss: 0.3204424977302551, mean loss: 0.342465603064014
Epoch: 47, step: 279, loss: 0.3085949122905731, mean loss: 0.3424651060473624
Epoch: 47, step: 280, loss: 0.32960590720176697, mean loss: 0.3424649173549554
Epoch: 47, step: 281, loss: 0.3576508164405823, mean loss: 0.34246514018546287
Epoch: 47, step: 282, loss: 0.2940898537635803, mean loss: 0.34246443036042107
Epoch: 47, step: 283, loss: 0.34672239422798157, mean loss: 0.3424644928378813
Epoch: 47, step: 284, loss: 0.31823277473449707, mean loss: 0.34246413728907044
Epoch: 47, step: 285, loss: 0.31694912910461426, mean loss: 0.3424637629162063
Epoch: 47, step: 286, loss: 0.3129535913467407, mean loss: 0.3424633299300487
Epoch: 47, step: 287, loss: 0.31466081738471985, mean loss: 0.34246292200539724
Epoch: 47, step: 288, loss: 0.3729158937931061, mean loss: 0.3424633688116209
Epoch: 47, step: 289, loss: 0.3066776692867279, mean loss: 0.34246284377128045
Epoch: 47, step: 290, loss: 0.29375556111335754, mean loss: 0.34246212915864443
Epoch: 47, step: 291, loss: 0.3139016628265381, mean loss: 0.3424617101377182
Epoch: 47, step: 292, loss: 0.3066088855266571, mean loss: 0.3424611841356846
Epoch: 47, step: 293, loss: 0.2980189323425293, mean loss: 0.3424605321264743
Epoch: 47, step: 294, loss: 0.31409016251564026, mean loss: 0.3424601159128451
Epoch: 47, step: 295, loss: 0.34970325231552124, mean loss: 0.3424602221732817
Epoch: 47, step: 296, loss: 0.30043402314186096, mean loss: 0.34245960563695027
Epoch: 47, step: 297, loss: 0.33370283246040344, mean loss: 0.3424594771744737
Epoch: 47, step: 298, loss: 0.33191484212875366, mean loss: 0.3424593224862075
Epoch: 47, step: 299, loss: 0.31877776980400085, mean loss: 0.34245897508636175
Epoch: 47, step: 300, loss: 0.3371445834636688, mean loss: 0.342458897127295
Epoch: 47, step: 301, loss: 0.35042548179626465, mean loss: 0.34245901399079315
Epoch: 47, step: 302, loss: 0.303973913192749, mean loss: 0.3424584494530748
Epoch: 47, step: 303, loss: 0.37774404883384705, mean loss: 0.34245896704973294
Epoch: 47, step: 304, loss: 0.3426353931427002, mean loss: 0.3424589696376503
Epoch: 47, step: 305, loss: 0.3292352259159088, mean loss: 0.34245877566716715
Epoch: 47, step: 306, loss: 0.3290614187717438, mean loss: 0.3424585791529479
Epoch: 47, step: 307, loss: 0.3094712793827057, mean loss: 0.342458095297929
Epoch: 47, step: 308, loss: 0.3299923539161682, mean loss: 0.3424579124541344
Epoch: 47, step: 309, loss: 0.34661439061164856, mean loss: 0.3424579734192281
Epoch: 47, step: 310, loss: 0.32415279746055603, mean loss: 0.3424577049322166
Epoch: 47, step: 311, loss: 0.3200247287750244, mean loss: 0.34245737590645897
Epoch: 47, step: 312, loss: 0.33380788564682007, mean loss: 0.34245724904574615
Epoch: 47, step: 313, loss: 0.3341200351715088, mean loss: 0.3424571267669354
Epoch: 47, step: 314, loss: 0.342425137758255, mean loss: 0.3424571262977714
Epoch: 47, step: 315, loss: 0.35177093744277954, mean loss: 0.34245726289596373
Epoch: 47, step: 316, loss: 0.31211787462234497, mean loss: 0.3424568179390337
Epoch: 47, step: 317, loss: 0.31474339962005615, mean loss: 0.3424564115004933
Epoch: 47, step: 318, loss: 0.3048836290836334, mean loss: 0.3424558604748958
Epoch: 47, step: 319, loss: 0.309763640165329, mean loss: 0.34245538103246737
Epoch: 47, step: 320, loss: 0.3356282711029053, mean loss: 0.3424552809120677
Epoch: 47, step: 321, loss: 0.3381710648536682, mean loss: 0.3424552180844382
Epoch: 47, step: 322, loss: 0.30238696932792664, mean loss: 0.34245463049591834
Epoch: 47, step: 323, loss: 0.29142525792121887, mean loss: 0.34245388217686956
Epoch: 47, step: 324, loss: 0.319611132144928, mean loss: 0.34245354720480453
Epoch: 47, step: 325, loss: 0.31211888790130615, mean loss: 0.3424531023759442
Epoch: 47, step: 326, loss: 0.37497255206108093, mean loss: 0.34245357923568
Epoch: 47, step: 327, loss: 0.3069152235984802, mean loss: 0.3424530581148571
Epoch: 47, step: 328, loss: 0.33194035291671753, mean loss: 0.34245290396283873
Epoch: 47, step: 329, loss: 0.32788485288619995, mean loss: 0.34245269034878734
Epoch: 47, step: 330, loss: 0.3124752938747406, mean loss: 0.3424522507910743
Epoch: 47, step: 331, loss: 0.34663236141204834, mean loss: 0.34245231208301885
Epoch: 47, step: 332, loss: 0.3954141438007355, mean loss: 0.3424530886380799
Epoch: 47, step: 333, loss: 0.30129727721214294, mean loss: 0.34245248519813054
Epoch: 47, step: 334, loss: 0.30922773480415344, mean loss: 0.34245199805313115
Epoch: 47, step: 335, loss: 0.3199046552181244, mean loss: 0.3424516674663205
Epoch: 47, step: 336, loss: 0.3115370571613312, mean loss: 0.3424512142061445
Epoch: 47, step: 337, loss: 0.3483964800834656, mean loss: 0.3424513013724624
Epoch: 47, step: 338, loss: 0.3344094455242157, mean loss: 0.34245118346878906
Epoch: 47, step: 339, loss: 0.33251526951789856, mean loss: 0.3424510377979887
Epoch: 47, step: 340, loss: 0.29691189527511597, mean loss: 0.34245037015673135
Epoch: 47, step: 341, loss: 0.32540977001190186, mean loss: 0.34245012033119043
Epoch: 47, step: 342, loss: 0.32603803277015686, mean loss: 0.34244987972355295
Epoch: 47, step: 343, loss: 0.34177249670028687, mean loss: 0.34244986979299785
Epoch: 47, step: 344, loss: 0.3122634291648865, mean loss: 0.34244942726092
Epoch: 47, step: 345, loss: 0.29854220151901245, mean loss: 0.34244878359208747
Epoch: 47, step: 346, loss: 0.3694188594818115, mean loss: 0.34244917896078775
Epoch: 47, step: 347, loss: 0.3152484893798828, mean loss: 0.342448780217244
Epoch: 47, step: 348, loss: 0.3368133306503296, mean loss: 0.3424486976066108
Epoch: 47, step: 349, loss: 0.34148654341697693, mean loss: 0.3424486835025006
Epoch: 47, step: 350, loss: 0.311224102973938, mean loss: 0.3424482257915912
Epoch: 47, step: 351, loss: 0.33809199929237366, mean loss: 0.3424481619360283
Epoch: 47, step: 352, loss: 0.3453456163406372, mean loss: 0.3424482044076192
Epoch: 47, step: 353, loss: 0.336130827665329, mean loss: 0.34244811180733276
Epoch: 47, step: 354, loss: 0.33355778455734253, mean loss: 0.34244798149457534
Epoch: 47, step: 355, loss: 0.3638079762458801, mean loss: 0.34244829458080234
Epoch: 47, step: 356, loss: 0.31493079662323, mean loss: 0.3424478912462775
Epoch: 47, step: 357, loss: 0.3072366416454315, mean loss: 0.3424473751490477
Epoch: 47, step: 358, loss: 0.32422930002212524, mean loss: 0.34244710812755874
Epoch: 47, step: 359, loss: 0.32603803277015686, mean loss: 0.3424468676240212
Epoch: 47, step: 360, loss: 0.2951696515083313, mean loss: 0.3424461747043519
Epoch: 47, step: 361, loss: 0.33170828223228455, mean loss: 0.342446017326476
Epoch: 47, step: 362, loss: 0.33449748158454895, mean loss: 0.3424459008319832
Epoch: 47, step: 363, loss: 0.3693675696849823, mean loss: 0.34244629539272964
Epoch: 47, step: 364, loss: 0.31827685236930847, mean loss: 0.3424459411734659
Epoch: 47, step: 365, loss: 0.337221622467041, mean loss: 0.3424458646087224
Epoch: 47, step: 366, loss: 0.29366421699523926, mean loss: 0.3424451497021845
Epoch: 47, step: 367, loss: 0.3738633394241333, mean loss: 0.3424456101364087
Epoch: 47, step: 368, loss: 0.3478168845176697, mean loss: 0.3424456888513929
Epoch: 47, step: 369, loss: 0.3336677551269531, mean loss: 0.3424455602143619
Epoch: 47, step: 370, loss: 0.3745344281196594, mean loss: 0.34244603045671457
Epoch: 47, step: 371, loss: 0.3376489281654358, mean loss: 0.3424459601592015
Epoch: 47, step: 372, loss: 0.30574026703834534, mean loss: 0.3424454222759184
Epoch: 47, step: 373, loss: 0.35959380865097046, mean loss: 0.3424456735637818
Epoch: 47, step: 374, loss: 0.3415847718715668, mean loss: 0.34244566094854373
Epoch: 47, step: 375, loss: 0.32706403732299805, mean loss: 0.34244543555695434
Epoch: 47, step: 376, loss: 0.390974760055542, mean loss: 0.34244614666142353
Epoch: 47, step: 377, loss: 0.33352363109588623, mean loss: 0.34244601592093227
Epoch: 47, step: 378, loss: 0.30480507016181946, mean loss: 0.342445464381
Epoch: 47, step: 379, loss: 0.37169918417930603, mean loss: 0.3424458930194919
Epoch: 47, step: 380, loss: 0.3106744885444641, mean loss: 0.3424454274975872
Epoch: 47, step: 381, loss: 0.3177761733531952, mean loss: 0.34244506604331404
Epoch: 47, step: 382, loss: 0.34457260370254517, mean loss: 0.34244509721557026
Epoch: 47, step: 383, loss: 0.4032287299633026, mean loss: 0.3424459877921504
Epoch: 47, step: 384, loss: 0.3085719347000122, mean loss: 0.34244549149084363
Epoch: 47, step: 385, loss: 0.389723002910614, mean loss: 0.3424461841610376
Epoch: 47, step: 386, loss: 0.3090452551841736, mean loss: 0.342445694805987
Epoch: 47, step: 387, loss: 0.2975819706916809, mean loss: 0.34244503751982736
Epoch: 47, step: 388, loss: 0.2846219837665558, mean loss: 0.3424441903824824
Epoch: 47, step: 389, loss: 0.31486883759498596, mean loss: 0.34244378639536316
Epoch: 47, step: 390, loss: 0.304176926612854, mean loss: 0.34244322578269987
Epoch: 47, step: 391, loss: 0.31744495034217834, mean loss: 0.34244285956126064
Epoch: 47, step: 392, loss: 0.3820949196815491, mean loss: 0.34244344045020336
Epoch: 47, step: 393, loss: 0.3596061170101166, mean loss: 0.3424436918737854
Epoch: 47, step: 394, loss: 0.31746727228164673, mean loss: 0.34244332598861205
Epoch: 47, step: 395, loss: 0.3853124976158142, mean loss: 0.3424439539795242
Epoch: 47, step: 396, loss: 0.3052898645401001, mean loss: 0.34244340971687953
Epoch: 47, step: 397, loss: 0.33302733302116394, mean loss: 0.34244327178472156
Epoch: 47, step: 398, loss: 0.3178413510322571, mean loss: 0.3424429114067827
Epoch: 47, step: 399, loss: 0.3347901701927185, mean loss: 0.3424427993082707
Epoch: 47, step: 400, loss: 0.3363867402076721, mean loss: 0.3424427105994995
Epoch: 47, step: 401, loss: 0.32923051714897156, mean loss: 0.34244251707095913
Epoch: 47, step: 402, loss: 0.3829033374786377, mean loss: 0.34244310972113867
Epoch: 47, step: 403, loss: 0.32687142491340637, mean loss: 0.342442881638106
Epoch: 47, step: 404, loss: 0.30436137318611145, mean loss: 0.34244232385525697
Epoch: 47, step: 405, loss: 0.29229113459587097, mean loss: 0.3424415892976031
Epoch: 47, step: 406, loss: 0.34286051988601685, mean loss: 0.34244159543353264
Epoch: 47, step: 407, loss: 0.3575989007949829, mean loss: 0.34244181743402125
Epoch: 47, step: 408, loss: 0.3677983582019806, mean loss: 0.34244218881150956
Epoch: 47, step: 409, loss: 0.3187362253665924, mean loss: 0.3424418416138259
Epoch: 47, step: 410, loss: 0.32421115040779114, mean loss: 0.342441574610923
Epoch: 47, step: 411, loss: 0.3220152258872986, mean loss: 0.3424412754552592
Epoch: 47, step: 412, loss: 0.3430475890636444, mean loss: 0.3424412843349418
Epoch: 47, step: 413, loss: 0.33276042342185974, mean loss: 0.34244114255730035
Epoch: 47, step: 414, loss: 0.33982789516448975, mean loss: 0.34244110428646585
Epoch: 47, step: 415, loss: 0.3630860149860382, mean loss: 0.3424414066253842
Epoch: 47, step: 416, loss: 0.34134700894355774, mean loss: 0.34244139059847223
Epoch: 47, step: 417, loss: 0.34322410821914673, mean loss: 0.3424414020608162
Epoch: 47, step: 418, loss: 0.33819764852523804, mean loss: 0.342441339914968
Epoch: 47, step: 419, loss: 0.3529507517814636, mean loss: 0.34244149381333766
Epoch: 47, step: 420, loss: 0.3872847855091095, mean loss: 0.342442150482665
Epoch: 47, step: 421, loss: 0.31234481930732727, mean loss: 0.3424417097544299
Epoch: 47, step: 422, loss: 0.32759854197502136, mean loss: 0.3424414924026884
Epoch: 47, step: 423, loss: 0.3120346963405609, mean loss: 0.34244104715586504
Epoch: 47, step: 424, loss: 0.366623193025589, mean loss: 0.3424414012499284
Epoch: 47, step: 425, loss: 0.31226634979248047, mean loss: 0.3424409594094818
Epoch: 47, step: 426, loss: 0.304203599691391, mean loss: 0.34244039952428207
Epoch: 47, step: 427, loss: 0.35350537300109863, mean loss: 0.3424405615392387
Epoch: 47, step: 428, loss: 0.28868192434310913, mean loss: 0.3424397744089519
Epoch: 47, step: 429, loss: 0.3465554118156433, mean loss: 0.34243983466895084
Epoch: 47, step: 430, loss: 0.32513856887817383, mean loss: 0.34243958135241925
Epoch: 47, step: 431, loss: 0.3581787049770355, mean loss: 0.34243981179346794
Epoch: 47, step: 432, loss: 0.3092930316925049, mean loss: 0.3424393264890053
Epoch: 47, step: 433, loss: 0.3254362642765045, mean loss: 0.3424390775495568
Epoch: 47, step: 434, loss: 0.34323781728744507, mean loss: 0.34243908924362204
Epoch: 47, step: 435, loss: 0.29179447889328003, mean loss: 0.34243834778469795
Epoch: 47, step: 436, loss: 0.32517459988594055, mean loss: 0.3424380950396881
Epoch: 47, step: 437, loss: 0.3214016556739807, mean loss: 0.3424377870661665
Epoch: 47, step: 438, loss: 0.3773372173309326, mean loss: 0.34243829798642744
Epoch: 47, step: 439, loss: 0.33580517768859863, mean loss: 0.342438200880374
Epoch: 47, step: 440, loss: 0.2894911468029022, mean loss: 0.34243742576942116
Epoch: 47, step: 441, loss: 0.34594056010246277, mean loss: 0.34243747705231287
Epoch: 47, step: 442, loss: 0.3289518356323242, mean loss: 0.3424372796369417
Epoch: 47, step: 443, loss: 0.35473716259002686, mean loss: 0.34243745969144096
Epoch: 47, step: 444, loss: 0.37634965777397156, mean loss: 0.3424379561152268
Epoch: 47, step: 445, loss: 0.3462616503238678, mean loss: 0.3424380120875635
Epoch: 47, step: 446, loss: 0.31635990738868713, mean loss: 0.3424376303543468
Epoch: 47, step: 447, loss: 0.30874377489089966, mean loss: 0.34243713714842927
Epoch: 47, step: 448, loss: 0.32328709959983826, mean loss: 0.34243685683697606
Epoch: 47, step: 449, loss: 0.3414495885372162, mean loss: 0.3424368423859046
Epoch: 47, step: 450, loss: 0.32664918899536133, mean loss: 0.34243661129860253
Epoch: 47, step: 451, loss: 0.31016823649406433, mean loss: 0.34243613898632497
Epoch: 47, step: 452, loss: 0.34157681465148926, mean loss: 0.3424361264085768
Epoch: 47, step: 453, loss: 0.30159667134284973, mean loss: 0.3424355286588759
Epoch: 47, step: 454, loss: 0.3191794157028198, mean loss: 0.34243518827404273
Epoch: 47, step: 455, loss: 0.3270896077156067, mean loss: 0.34243496367389403
Epoch: 47, step: 456, loss: 0.34194669127464294, mean loss: 0.3424349565275728
Epoch: 47, step: 457, loss: 0.34034264087677, mean loss: 0.34243492590503305
Epoch: 47, step: 458, loss: 0.3165534734725952, mean loss: 0.3424345471169634
Epoch: 47, step: 459, loss: 0.31061387062072754, mean loss: 0.3424340814121792
Epoch: 47, step: 460, loss: 0.34240731596946716, mean loss: 0.3424340810204649
Epoch: 47, step: 461, loss: 0.3186003863811493, mean loss: 0.3424337322176749
Epoch: 47, step: 462, loss: 0.33645865321159363, mean loss: 0.3424336447745085
Epoch: 47, step: 463, loss: 0.35126885771751404, mean loss: 0.34243377407283054
Epoch: 47, step: 464, loss: 0.3494337797164917, mean loss: 0.34243387651243723
Epoch: 47, step: 465, loss: 0.32348835468292236, mean loss: 0.3424335992636031
Epoch: 47, step: 466, loss: 0.35045406222343445, mean loss: 0.34243371663336913
Epoch: 47, step: 467, loss: 0.3003111779689789, mean loss: 0.3424331002300288
Epoch: 47, step: 468, loss: 0.4064827561378479, mean loss: 0.3424340374917744
Epoch: 47, step: 469, loss: 0.32834991812705994, mean loss: 0.34243383139678535
Epoch: 47, step: 470, loss: 0.3026328980922699, mean loss: 0.3424332489923998
Epoch: 47, step: 471, loss: 0.3479783535003662, mean loss: 0.34243333013235455
Epoch: 47, step: 472, loss: 0.33814847469329834, mean loss: 0.34243326743418745
Epoch: 47, step: 473, loss: 0.3237564265727997, mean loss: 0.3424329941492256
Epoch: 47, step: 474, loss: 0.3408956825733185, mean loss: 0.3424329716551651
Epoch: 47, step: 475, loss: 0.32746458053588867, mean loss: 0.3424327526397268
Epoch: 47, step: 476, loss: 0.3470735549926758, mean loss: 0.34243282054231444
Epoch: 47, step: 477, loss: 0.3428318202495575, mean loss: 0.3424328263802524
Epoch: 47, step: 478, loss: 0.29834815859794617, mean loss: 0.34243218136777515
Epoch: 47, step: 479, loss: 0.3437628448009491, mean loss: 0.3424322008367199
Epoch: 47, step: 480, loss: 0.3274496793746948, mean loss: 0.34243198163056526
Epoch: 47, step: 481, loss: 0.4023522138595581, mean loss: 0.34243285829819115
Epoch: 47, step: 482, loss: 0.3470246493816376, mean loss: 0.34243292547776544
Epoch: 47, step: 483, loss: 0.2961438298225403, mean loss: 0.3424322482613613
Epoch: 47, step: 484, loss: 0.38821300864219666, mean loss: 0.3424329180309454
Epoch: 47, step: 485, loss: 0.3732312023639679, mean loss: 0.3424333686012753
Epoch: 47, step: 486, loss: 0.3079430162906647, mean loss: 0.34243286402440004
Epoch: 47, step: 487, loss: 0.31950655579566956, mean loss: 0.34243252862870355
Epoch: 47, step: 488, loss: 0.313590943813324, mean loss: 0.34243210670286106
Epoch: 47, step: 489, loss: 0.3267654776573181, mean loss: 0.34243187751784915
Epoch: 47, step: 490, loss: 0.40951213240623474, mean loss: 0.34243285881153235
Epoch: 47, step: 491, loss: 0.39482367038726807, mean loss: 0.3424336252072546
Epoch: 47, step: 492, loss: 0.2993902564048767, mean loss: 0.3424329955592272
Epoch: 47, step: 493, loss: 0.36769407987594604, mean loss: 0.34243336507861394
Epoch: 47, step: 494, loss: 0.3484005033969879, mean loss: 0.3424334523646944
Epoch: 47, step: 495, loss: 0.3581341803073883, mean loss: 0.3424336820283762
Epoch: 47, step: 496, loss: 0.31500646471977234, mean loss: 0.34243328084038077
Epoch: 47, step: 497, loss: 0.3248799741268158, mean loss: 0.34243302408546294
Epoch: 47, step: 498, loss: 0.30146288871765137, mean loss: 0.3424324248177553
Epoch: 47, step: 499, loss: 0.337960422039032, mean loss: 0.34243235940699623
Epoch: 47, step: 500, loss: 0.3208053708076477, mean loss: 0.34243204307958763
Epoch: 47, step: 501, loss: 0.332139253616333, mean loss: 0.3424318925341808
Epoch: 47, step: 502, loss: 0.33226215839385986, mean loss: 0.34243174379079344
Epoch: 47, step: 503, loss: 0.3242546319961548, mean loss: 0.342431477934715
Epoch: 47, step: 504, loss: 0.2944536805152893, mean loss: 0.34243077622793866
Epoch: 47, step: 505, loss: 0.29995444416999817, mean loss: 0.34243015499278995
Epoch: 47, step: 506, loss: 0.31741395592689514, mean loss: 0.3424297891251619
Epoch: 47, step: 507, loss: 0.3479576110839844, mean loss: 0.3424298699696389
Epoch: 47, step: 508, loss: 0.32563355565071106, mean loss: 0.3424296243268889
Epoch: 47, step: 509, loss: 0.29732614755630493, mean loss: 0.3424289647071754
Epoch: 47, step: 510, loss: 0.34497737884521484, mean loss: 0.34242900197613424
Epoch: 47, step: 511, loss: 0.3137175440788269, mean loss: 0.34242858209520566
Epoch: 47, step: 512, loss: 0.3233785033226013, mean loss: 0.3424283035078967
Epoch: 47, step: 513, loss: 0.3509160876274109, mean loss: 0.3424284276309718
Epoch: 47, step: 514, loss: 0.43671754002571106, mean loss: 0.3424298064694608
Epoch: 47, step: 515, loss: 0.328159362077713, mean loss: 0.3424295977884186
Epoch: 47, step: 516, loss: 0.3362007439136505, mean loss: 0.34242950670332867
Epoch: 47, step: 517, loss: 0.3109382092952728, mean loss: 0.3424290462099907
Epoch: 47, step: 518, loss: 0.38323405385017395, mean loss: 0.34242964288783356
Epoch: 47, step: 519, loss: 0.32033807039260864, mean loss: 0.34242931985495506
Epoch: 47, step: 520, loss: 0.29194775223731995, mean loss: 0.3424285817016319
Epoch: 47, step: 521, loss: 0.33966630697250366, mean loss: 0.34242854131159345
Epoch: 47, step: 522, loss: 0.3513107895851135, mean loss: 0.3424286711861131
Epoch: 47, step: 523, loss: 0.34227433800697327, mean loss: 0.3424286689295161
Epoch: 47, step: 524, loss: 0.3387547731399536, mean loss: 0.342428615212092
Epoch: 47, step: 525, loss: 0.36379027366638184, mean loss: 0.3424289275444377
Epoch: 47, step: 526, loss: 0.34554028511047363, mean loss: 0.3424289730354468
Epoch: 47, step: 527, loss: 0.32174915075302124, mean loss: 0.34242867068118216
Epoch: 47, step: 528, loss: 0.3420047163963318, mean loss: 0.3424286644827482
Epoch: 47, step: 529, loss: 0.3141367435455322, mean loss: 0.3424282508460785
Epoch: 47, step: 530, loss: 0.3549128472805023, mean loss: 0.34242843337208667
Epoch: 47, step: 531, loss: 0.3126460909843445, mean loss: 0.3424279979577243
Epoch: 47, step: 532, loss: 0.3080783784389496, mean loss: 0.3424274957776462
Epoch: 47, step: 533, loss: 0.3656892478466034, mean loss: 0.3424278358517971
Epoch: 47, step: 534, loss: 0.31834739446640015, mean loss: 0.34242748381400073
Epoch: 47, step: 535, loss: 0.32303452491760254, mean loss: 0.34242720030778917
Epoch: 47, step: 536, loss: 0.32510286569595337, mean loss: 0.34242694704655663
Epoch: 47, step: 537, loss: 0.32625678181648254, mean loss: 0.34242671066136776
Epoch: 47, step: 538, loss: 0.3534342050552368, mean loss: 0.3424268715731808
Epoch: 47, step: 539, loss: 0.3299546539783478, mean loss: 0.3424266892521424
Epoch: 47, step: 540, loss: 0.32903218269348145, mean loss: 0.34242649345178633
Epoch: 47, step: 541, loss: 0.3472626805305481, mean loss: 0.34242656414594036
Epoch: 47, step: 542, loss: 0.33052799105644226, mean loss: 0.3424263902181643
Epoch: 47, step: 543, loss: 0.3736514151096344, mean loss: 0.3424268466443014
Epoch: 47, step: 544, loss: 0.30937090516090393, mean loss: 0.34242636346213595
Epoch: 47, step: 545, loss: 0.38343536853790283, mean loss: 0.34242696288630464
Epoch: 47, step: 546, loss: 0.34295234084129333, mean loss: 0.34242697056558485
Epoch: 47, step: 547, loss: 0.33772844076156616, mean loss: 0.3424269018896932
Epoch: 47, step: 548, loss: 0.3454698920249939, mean loss: 0.3424269463667988
Epoch: 47, step: 549, loss: 0.35828688740730286, mean loss: 0.3424271781762794
Epoch: 47, step: 550, loss: 0.3534913957118988, mean loss: 0.3424273398889255
Epoch: 47, step: 551, loss: 0.2970850169658661, mean loss: 0.34242667718324116
Epoch: 47, step: 552, loss: 0.3255753815174103, mean loss: 0.3424264308948843
Epoch: 47, step: 553, loss: 0.3088340759277344, mean loss: 0.3424259399364942
Epoch: 47, step: 554, loss: 0.3394849896430969, mean loss: 0.34242589695459785
Epoch: 47, step: 555, loss: 0.36397668719291687, mean loss: 0.3424262119141185
Epoch: 47, step: 556, loss: 0.3061690330505371, mean loss: 0.34242568203207446
Epoch: 47, step: 557, loss: 0.3288508355617523, mean loss: 0.3424254836448171
Epoch: 47, step: 558, loss: 0.31963253021240234, mean loss: 0.34242515054599015
Epoch: 47, step: 559, loss: 0.3132099509239197, mean loss: 0.3424247235979627
Epoch: 47, step: 560, loss: 0.3370363712310791, mean loss: 0.3424246448542668
Epoch: 47, step: 561, loss: 0.31842154264450073, mean loss: 0.3424242940855658
Epoch: 47, step: 562, loss: 0.30603235960006714, mean loss: 0.3424237622807626
Epoch: 47, step: 563, loss: 0.3502086102962494, mean loss: 0.34242387604110885
Epoch: 47, step: 564, loss: 0.316460520029068, mean loss: 0.3424234966429236
Epoch: 47, step: 565, loss: 0.3026401698589325, mean loss: 0.3424229153043085
Epoch: 47, step: 566, loss: 0.327960729598999, mean loss: 0.3424227039769803
Epoch: 47, step: 567, loss: 0.34560465812683105, mean loss: 0.34242275047230664
Epoch: 47, step: 568, loss: 0.3482898771762848, mean loss: 0.34242283620263825
Epoch: 47, step: 569, loss: 0.3270206153392792, mean loss: 0.34242261114900047
Epoch: 47, step: 570, loss: 0.3098946511745453, mean loss: 0.34242213586502535
Epoch: 47, step: 571, loss: 0.34728166460990906, mean loss: 0.3424222068692443
Epoch: 47, step: 572, loss: 0.3036211133003235, mean loss: 0.3424216399416195
Epoch: 47, step: 573, loss: 0.30416467785835266, mean loss: 0.342421080972535
Epoch: 47, step: 574, loss: 0.34532293677330017, mean loss: 0.3424211233706736
Epoch: 47, step: 575, loss: 0.32343634963035583, mean loss: 0.3424208459939314
Epoch: 47, step: 576, loss: 0.330086886882782, mean loss: 0.34242066579144603
Epoch: 47, step: 577, loss: 0.3566534221172333, mean loss: 0.34242087373283525
Epoch: 47, step: 578, loss: 0.30784639716148376, mean loss: 0.34242036860512226
Epoch: 47, step: 579, loss: 0.33936452865600586, mean loss: 0.3424203239604292
Epoch: 47, step: 580, loss: 0.3560371696949005, mean loss: 0.3424205228946099
Epoch: 47, step: 581, loss: 0.30184370279312134, mean loss: 0.34241993009957555
Epoch: 47, step: 582, loss: 0.32376331090927124, mean loss: 0.3424196575452054
Epoch: 47, step: 583, loss: 0.31755802035331726, mean loss: 0.342419294347093
Epoch: 47, step: 584, loss: 0.32781630754470825, mean loss: 0.34241908101843244
Epoch: 47, step: 585, loss: 0.327313095331192, mean loss: 0.34241886034490443
Epoch: 47, step: 586, loss: 0.3152764141559601, mean loss: 0.34241846384433927
Epoch: 47, step: 587, loss: 0.33741307258605957, mean loss: 0.34241839072596747
Epoch: 47, step: 588, loss: 0.28847724199295044, mean loss: 0.34241760276931243
Epoch: 47, step: 589, loss: 0.3209986686706543, mean loss: 0.34241728989230613
Epoch: 47, step: 590, loss: 0.34105417132377625, mean loss: 0.34241726998084715
Epoch: 47, step: 591, loss: 0.3685356080532074, mean loss: 0.342417651493235
Epoch: 47, step: 592, loss: 0.33802253007888794, mean loss: 0.34241758729432736
Epoch: 47, step: 593, loss: 0.3289012610912323, mean loss: 0.3424173898661745
Epoch: 47, step: 594, loss: 0.30639344453811646, mean loss: 0.3424168636849477
Epoch: 47, step: 595, loss: 0.30871278047561646, mean loss: 0.3424163713958146
Epoch: 47, step: 596, loss: 0.33790209889411926, mean loss: 0.3424163054603366
Epoch: 47, step: 597, loss: 0.32922837138175964, mean loss: 0.3424161128401444
Epoch: 47, step: 598, loss: 0.3640405237674713, mean loss: 0.3424164286771305
Epoch: 47, step: 599, loss: 0.3269828259944916, mean loss: 0.34241620326375954
Epoch: 47, step: 600, loss: 0.3455878794193268, mean loss: 0.34241624958656486
Epoch: 47, step: 601, loss: 0.31715184450149536, mean loss: 0.34241588060153366
Epoch: 47, step: 602, loss: 0.3341202735900879, mean loss: 0.3424157594464898
Epoch: 47, step: 603, loss: 0.3456966280937195, mean loss: 0.3424158073619683
Epoch: 47, step: 604, loss: 0.3260991871356964, mean loss: 0.3424155690692073
Epoch: 47, step: 605, loss: 0.31481748819351196, mean loss: 0.3424151660245352
Epoch: 47, step: 606, loss: 0.3329508304595947, mean loss: 0.3424150278086087
Epoch: 47, step: 607, loss: 0.36913129687309265, mean loss: 0.3424154179638319
Epoch: 47, step: 608, loss: 0.35037165880203247, mean loss: 0.3424155341523454
Epoch: 47, step: 609, loss: 0.3294339179992676, mean loss: 0.3424153445788159
Epoch: 47, step: 610, loss: 0.307424396276474, mean loss: 0.3424148336054036
Epoch: 47, step: 611, loss: 0.32025882601737976, mean loss: 0.34241451006557316
Epoch: 47, step: 612, loss: 0.3576362431049347, mean loss: 0.3424147323423074
Epoch: 47, step: 613, loss: 0.3062836527824402, mean loss: 0.3424142047426526
Epoch: 47, step: 614, loss: 0.3378354609012604, mean loss: 0.34241413788308395
Epoch: 47, step: 615, loss: 0.3302167057991028, mean loss: 0.3424139597767805
Epoch: 47, step: 616, loss: 0.31653159856796265, mean loss: 0.3424135818493335
Epoch: 47, step: 617, loss: 0.31596627831459045, mean loss: 0.3424131956783857
Epoch: 47, step: 618, loss: 0.3503749370574951, mean loss: 0.34241331193024926
Epoch: 47, step: 619, loss: 0.36344075202941895, mean loss: 0.3424136189539629
Epoch: 47, step: 620, loss: 0.3458077907562256, mean loss: 0.3424136685118744
Epoch: 47, step: 621, loss: 0.30679431557655334, mean loss: 0.34241314844539844
Epoch: 47, step: 622, loss: 0.3218773305416107, mean loss: 0.34241284861304233
Epoch: 47, step: 623, loss: 0.33807575702667236, mean loss: 0.34241278529044133
Epoch: 47, step: 624, loss: 0.3385453522205353, mean loss: 0.34241272882579427
Epoch: 47, step: 625, loss: 0.36097633838653564, mean loss: 0.34241299985113316
Epoch: 47, step: 626, loss: 0.31626492738723755, mean loss: 0.34241261809958246
Epoch: 47, step: 627, loss: 0.34744739532470703, mean loss: 0.3424126916042721
Epoch: 47, step: 628, loss: 0.3080069422721863, mean loss: 0.3424121893085609
Epoch: 47, step: 629, loss: 0.33415889739990234, mean loss: 0.3424120688190297
Epoch: 47, step: 630, loss: 0.29927265644073486, mean loss: 0.3424114390373923
Epoch: 47, step: 631, loss: 0.3232405483722687, mean loss: 0.3424111591703753
Epoch: 47, step: 632, loss: 0.3556625247001648, mean loss: 0.34241135261814293
Epoch: 47, step: 633, loss: 0.3291811943054199, mean loss: 0.34241115948278467
Epoch: 47, step: 634, loss: 0.333808958530426, mean loss: 0.3424110339087083
Epoch: 47, step: 635, loss: 0.4085286855697632, mean loss: 0.3424119990735405
Epoch: 47, step: 636, loss: 0.3461473882198334, mean loss: 0.3424120536007888
Epoch: 47, step: 637, loss: 0.3225157856941223, mean loss: 0.34241176316976224
Epoch: 47, step: 638, loss: 0.31468936800956726, mean loss: 0.3424113585046162
Epoch: 47, step: 639, loss: 0.3194851577281952, mean loss: 0.34241102385463695
Epoch: 47, step: 640, loss: 0.33344322443008423, mean loss: 0.3424108929550555
Epoch: 47, step: 641, loss: 0.3718448579311371, mean loss: 0.34241132258525514
Epoch: 47, step: 642, loss: 0.35335206985473633, mean loss: 0.34241148227854923
Epoch: 47, step: 643, loss: 0.3465985655784607, mean loss: 0.34241154339314667
Epoch: 47, step: 644, loss: 0.3076575994491577, mean loss: 0.3424110361325692
Epoch: 47, step: 645, loss: 0.31322214007377625, mean loss: 0.3424106101043697
Epoch: 47, step: 646, loss: 0.320634126663208, mean loss: 0.3424102922691009
Epoch: 47, step: 647, loss: 0.3122260570526123, mean loss: 0.34240985172623184
Epoch: 47, step: 648, loss: 0.36833128333091736, mean loss: 0.34241023004740184
Epoch: 47, step: 649, loss: 0.3105805218219757, mean loss: 0.34240976550219876
Epoch: 47, step: 650, loss: 0.32888063788414, mean loss: 0.34240956805145345
Epoch: 47, step: 651, loss: 0.3346485197544098, mean loss: 0.34240945478454893
Epoch: 47, step: 652, loss: 0.3660271465778351, mean loss: 0.34240979946270295
Epoch: 47, step: 653, loss: 0.35427767038345337, mean loss: 0.3424099726606674
Epoch: 47, step: 654, loss: 0.3151688277721405, mean loss: 0.34240957511320325
Epoch: 47, step: 655, loss: 0.33163323998451233, mean loss: 0.34240941784954193
Epoch: 47, step: 656, loss: 0.326480895280838, mean loss: 0.3424091854012009
Epoch: 47, step: 657, loss: 0.3332598805427551, mean loss: 0.3424090518853842
Epoch: 47, step: 658, loss: 0.3333929777145386, mean loss: 0.342408920315723
Epoch: 47, step: 659, loss: 0.33368828892707825, mean loss: 0.3424087930592528
Epoch: 47, step: 660, loss: 0.3899531066417694, mean loss: 0.3424094868431046
Epoch: 47, step: 661, loss: 0.3406692445278168, mean loss: 0.34240946144922874
Epoch: 47, step: 662, loss: 0.335521399974823, mean loss: 0.34240936093907315
Epoch: 47, step: 663, loss: 0.2978537976741791, mean loss: 0.3424087107966103
Epoch: 47, step: 664, loss: 0.2994685769081116, mean loss: 0.3424080842351889
Epoch: 47, step: 665, loss: 0.3163069784641266, mean loss: 0.34240770338618304
Epoch: 47, step: 666, loss: 0.3169917166233063, mean loss: 0.34240733253936373
Epoch: 47, step: 667, loss: 0.2871640920639038, mean loss: 0.34240652649231584
Epoch: 47, step: 668, loss: 0.3295649588108063, mean loss: 0.34240633912538
Epoch: 47, step: 669, loss: 0.306972861289978, mean loss: 0.3424058221351288
Epoch: 47, step: 670, loss: 0.3245296776294708, mean loss: 0.34240556131801003
Epoch: 47, step: 671, loss: 0.354411780834198, mean loss: 0.342405736488998
Epoch: 47, step: 672, loss: 0.3435317277908325, mean loss: 0.34240575291699443
Epoch: 47, step: 673, loss: 0.30795377492904663, mean loss: 0.34240525027659896
Epoch: 47, step: 674, loss: 0.31230926513671875, mean loss: 0.34240481119477967
Epoch: 47, step: 675, loss: 0.3496176302433014, mean loss: 0.34240491642381576
Epoch: 47, step: 676, loss: 0.336503267288208, mean loss: 0.34240483032491525
Epoch: 47, step: 677, loss: 0.3293485939502716, mean loss: 0.34240463985083397
Epoch: 47, step: 678, loss: 0.3081957697868347, mean loss: 0.34240414079368975
Epoch: 47, step: 679, loss: 0.34451764822006226, mean loss: 0.3424041716262075
Epoch: 47, step: 680, loss: 0.34194356203079224, mean loss: 0.34240416490678643
Epoch: 47, step: 681, loss: 0.35928985476493835, mean loss: 0.34240441123340726
Epoch: 47, step: 682, loss: 0.30338937044143677, mean loss: 0.3424038420945064
Epoch: 47, step: 683, loss: 0.3356153070926666, mean loss: 0.34240374306697985
Epoch: 47, step: 684, loss: 0.33746063709259033, mean loss: 0.3424036709606391
Epoch: 47, step: 685, loss: 0.3312455117702484, mean loss: 0.3424035081961149
Epoch: 47, step: 686, loss: 0.33621031045913696, mean loss: 0.3424034178570042
Epoch: 47, step: 687, loss: 0.3232976496219635, mean loss: 0.3424031391685125
Epoch: 47, step: 688, loss: 0.347564160823822, mean loss: 0.342403214449252
Epoch: 47, step: 689, loss: 0.3232917785644531, mean loss: 0.3424029356862209
Epoch: 47, step: 690, loss: 0.35444992780685425, mean loss: 0.3424031114033714
Epoch: 47, step: 691, loss: 0.3160005807876587, mean loss: 0.342402726302283
Epoch: 47, step: 692, loss: 0.29494187235832214, mean loss: 0.3424020340595511
Epoch: 47, step: 693, loss: 0.34714576601982117, mean loss: 0.342402103248489
Epoch: 47, step: 694, loss: 0.30280646681785583, mean loss: 0.34240152574113913
Epoch: 47, step: 695, loss: 0.29377004504203796, mean loss: 0.3424008164552063
Epoch: 47, step: 696, loss: 0.37171700596809387, mean loss: 0.34240124402305455
Epoch: 47, step: 697, loss: 0.3103512227535248, mean loss: 0.3424007765899059
Epoch: 47, step: 698, loss: 0.38084331154823303, mean loss: 0.34240133724641647
Epoch: 47, step: 699, loss: 0.3287351727485657, mean loss: 0.3424011379382188
Epoch: 47, step: 700, loss: 0.36001068353652954, mean loss: 0.34240139475318765
Epoch: 47, step: 701, loss: 0.3311006724834442, mean loss: 0.34240122994755445
Epoch: 47, step: 702, loss: 0.31062012910842896, mean loss: 0.34240076647027046
Epoch: 47, step: 703, loss: 0.29259994626045227, mean loss: 0.3424000402143612
Epoch: 47, step: 704, loss: 0.3215421736240387, mean loss: 0.34239973604411067
Epoch: 47, step: 705, loss: 0.3170008063316345, mean loss: 0.3423993656569419
Epoch: 47, step: 706, loss: 0.3156128525733948, mean loss: 0.3423989750406374
Epoch: 47, step: 707, loss: 0.35035228729248047, mean loss: 0.3423990910187092
Epoch: 47, step: 708, loss: 0.31931498646736145, mean loss: 0.3423987544028679
Epoch: 47, step: 709, loss: 0.35886138677597046, mean loss: 0.34239899445991784
Epoch: 47, step: 710, loss: 0.31775331497192383, mean loss: 0.3423986350834398
Epoch: 47, step: 711, loss: 0.322068989276886, mean loss: 0.3423983386464931
Epoch: 47, step: 712, loss: 0.4045107662677765, mean loss: 0.3423992443263114
Epoch: 47, step: 713, loss: 0.3611100912094116, mean loss: 0.342399517150768
Epoch: 47, step: 714, loss: 0.32603222131729126, mean loss: 0.3423992785013092
Epoch: 47, step: 715, loss: 0.407446950674057, mean loss: 0.34240022693931477
Epoch: 47, step: 716, loss: 0.2726775109767914, mean loss: 0.34239921035090676
Epoch: 47, step: 717, loss: 0.3053218126296997, mean loss: 0.34239866975373356
Epoch: 47, step: 718, loss: 0.36060166358947754, mean loss: 0.3423989351537924
Epoch: 47, step: 719, loss: 0.3456990420818329, mean loss: 0.342398983268724
Epoch: 47, step: 720, loss: 0.3005990982055664, mean loss: 0.3423983738432321
Epoch: 47, step: 721, loss: 0.3415694236755371, mean loss: 0.34239836175764865
Epoch: 47, step: 722, loss: 0.308470219373703, mean loss: 0.3423978671134186
Epoch: 47, step: 723, loss: 0.3264041841030121, mean loss: 0.3423976339421594
Epoch: 47, step: 724, loss: 0.32271409034729004, mean loss: 0.34239734698075525
Epoch: 47, step: 725, loss: 0.3922390639781952, mean loss: 0.3423980735999493
Epoch: 47, step: 726, loss: 0.31190407276153564, mean loss: 0.3423976290485849
Epoch: 47, step: 727, loss: 0.30379247665405273, mean loss: 0.3423970662584456
Epoch: 47, step: 728, loss: 0.3571387231349945, mean loss: 0.3423972811608011
Epoch: 47, step: 729, loss: 0.3039940297603607, mean loss: 0.3423967213303191
Epoch: 47, step: 730, loss: 0.33563438057899475, mean loss: 0.34239662275248633
Epoch: 47, step: 731, loss: 0.35250914096832275, mean loss: 0.3423967701652883
Epoch: 47, step: 732, loss: 0.34308451414108276, mean loss: 0.3423967801905645
Epoch: 47, step: 733, loss: 0.3162226676940918, mean loss: 0.3423963986548586
Epoch: 47, step: 734, loss: 0.3265918493270874, mean loss: 0.34239616827791697
Epoch: 47, step: 735, loss: 0.33308976888656616, mean loss: 0.3423960326240281
Epoch: 47, step: 736, loss: 0.34290313720703125, mean loss: 0.34239604001568447
Epoch: 47, step: 737, loss: 0.3412901759147644, mean loss: 0.3423960238966264
Epoch: 47, step: 738, loss: 0.3242757320404053, mean loss: 0.34239575977938097
Epoch: 47, step: 739, loss: 0.3161410093307495, mean loss: 0.3423953771016984
Epoch: 47, step: 740, loss: 0.3592103123664856, mean loss: 0.34239562218521896
Epoch: 47, step: 741, loss: 0.34772709012031555, mean loss: 0.3423956998920829
Epoch: 47, step: 742, loss: 0.3417765498161316, mean loss: 0.3423956908680186
Epoch: 47, step: 743, loss: 0.32883548736572266, mean loss: 0.3423954932319855
Epoch: 47, step: 744, loss: 0.3148408532142639, mean loss: 0.3423950916369522
Epoch: 47, step: 745, loss: 0.3533601462841034, mean loss: 0.3423952514447851
Epoch: 47, step: 746, loss: 0.34006884694099426, mean loss: 0.3423952175395967
Epoch: 47, step: 747, loss: 0.30130666494369507, mean loss: 0.3423946187207702
Epoch: 47, step: 748, loss: 0.31661057472229004, mean loss: 0.34239424295319076
Epoch: 47, step: 749, loss: 0.3307764232158661, mean loss: 0.3423940736416437
Epoch: 47, step: 750, loss: 0.33540695905685425, mean loss: 0.3423939718168636
Epoch: 47, step: 751, loss: 0.321847528219223, mean loss: 0.34239367239331947
Epoch: 47, step: 752, loss: 0.33505767583847046, mean loss: 0.34239356548732053
Epoch: 47, step: 753, loss: 0.33939823508262634, mean loss: 0.34239352183761046
Epoch: 47, step: 754, loss: 0.30800679326057434, mean loss: 0.34239302074135153
Epoch: 47, step: 755, loss: 0.3419143557548523, mean loss: 0.3423930137661681
Epoch: 47, step: 756, loss: 0.35260552167892456, mean loss: 0.34239316258231256
Epoch: 47, step: 757, loss: 0.3452158570289612, mean loss: 0.3423932037138727
Epoch: 47, step: 758, loss: 0.3451654613018036, mean loss: 0.3423932441098916
Epoch: 47, step: 759, loss: 0.34861934185028076, mean loss: 0.34239333483230433
Epoch: 47, step: 760, loss: 0.2918759882450104, mean loss: 0.34239259873901157
Epoch: 47, step: 761, loss: 0.33276253938674927, mean loss: 0.3423924584205014
Epoch: 47, step: 762, loss: 0.35859906673431396, mean loss: 0.342392694561725
Epoch: 47, step: 763, loss: 0.3619718551635742, mean loss: 0.3423929798391554
Epoch: 47, step: 764, loss: 0.346484512090683, mean loss: 0.34239303945380506
Epoch: 47, step: 765, loss: 0.3217715919017792, mean loss: 0.342392738998527
Epoch: 47, step: 766, loss: 0.3417509198188782, mean loss: 0.3423927296473333
Epoch: 47, step: 767, loss: 0.31881484389305115, mean loss: 0.342392386126648
Epoch: 47, step: 768, loss: 0.3140788972377777, mean loss: 0.342391973616065
Epoch: 47, step: 769, loss: 0.31517472863197327, mean loss: 0.3423915770828766
Epoch: 47, step: 770, loss: 0.31325772404670715, mean loss: 0.342391152632447
Epoch: 47, step: 771, loss: 0.3807636797428131, mean loss: 0.3423917116727604
Epoch: 47, step: 772, loss: 0.35154426097869873, mean loss: 0.34239184501215386
Epoch: 47, step: 773, loss: 0.35378333926200867, mean loss: 0.34239201096731614
Epoch: 47, step: 774, loss: 0.33208832144737244, mean loss: 0.34239186086184986
Epoch: 47, step: 775, loss: 0.3447764217853546, mean loss: 0.3423918955999322
Epoch: 47, step: 776, loss: 0.29259172081947327, mean loss: 0.34239117012575665
Epoch: 47, step: 777, loss: 0.3252018094062805, mean loss: 0.3423909197198959
Epoch: 47, step: 778, loss: 0.32259175181388855, mean loss: 0.34239063129989344
Epoch: 47, step: 779, loss: 0.327217698097229, mean loss: 0.3423904102747623
Epoch: 47, step: 780, loss: 0.3186124861240387, mean loss: 0.342390063905199
Epoch: 47, step: 781, loss: 0.3503771126270294, mean loss: 0.3423901802496815
Epoch: 47, step: 782, loss: 0.3474974036216736, mean loss: 0.34239025464369427
Epoch: 47, step: 783, loss: 0.3030592203140259, mean loss: 0.342389681739273
Epoch: 47, step: 784, loss: 0.3108842372894287, mean loss: 0.34238922283078466
Epoch: 47, step: 785, loss: 0.3162304759025574, mean loss: 0.3423888418078737
Epoch: 47, step: 786, loss: 0.32031434774398804, mean loss: 0.3423885202800307
Epoch: 47, step: 787, loss: 0.37599775195121765, mean loss: 0.3423890098109045
Epoch: 47, step: 788, loss: 0.29570502042770386, mean loss: 0.34238832985125894
Epoch: 47, step: 789, loss: 0.27557846903800964, mean loss: 0.3423873567693047
Epoch: 47, step: 790, loss: 0.3028043210506439, mean loss: 0.3423867802529599
Epoch: 47, step: 791, loss: 0.33362704515457153, mean loss: 0.3423866526716156
Epoch: 47, step: 792, loss: 0.32726162672042847, mean loss: 0.3423864323860685
Epoch: 47, step: 793, loss: 0.30246761441230774, mean loss: 0.34238585100454777
Epoch: 47, step: 794, loss: 0.33607789874076843, mean loss: 0.3423857591362597
Epoch: 47, step: 795, loss: 0.28994423151016235, mean loss: 0.3423849953950325
Epoch: 47, step: 796, loss: 0.35807955265045166, mean loss: 0.34238522396209364
Epoch: 47, step: 797, loss: 0.3081420063972473, mean loss: 0.34238472526961755
Epoch: 47, step: 798, loss: 0.3349614143371582, mean loss: 0.34238461716367247
Epoch: 47, step: 799, loss: 0.296182781457901, mean loss: 0.34238394433446956
Epoch: 47, step: 800, loss: 0.3469375967979431, mean loss: 0.3423840106475433
Epoch: 47, step: 801, loss: 0.3654985725879669, mean loss: 0.34238434725103745
Epoch: 47, step: 802, loss: 0.33557623624801636, mean loss: 0.3423842481100463
Epoch: 47, step: 803, loss: 0.3088948428630829, mean loss: 0.34238376043813856
Epoch: 47, step: 804, loss: 0.3133920133113861, mean loss: 0.34238333826716705
Epoch: 47, step: 805, loss: 0.3166196644306183, mean loss: 0.342382963108099
Epoch: 47, step: 806, loss: 0.34144240617752075, mean loss: 0.3423829494123301
Epoch: 47, step: 807, loss: 0.36513084173202515, mean loss: 0.3423832806472931
Epoch: 47, step: 808, loss: 0.39536812901496887, mean loss: 0.3423840521551978
Epoch: 47, step: 809, loss: 0.38658303022384644, mean loss: 0.3423846957234157
Epoch: 47, step: 810, loss: 0.33538582921028137, mean loss: 0.34238459381647884
Epoch: 47, step: 811, loss: 0.32122695446014404, mean loss: 0.342384285755335
Epoch: 47, step: 812, loss: 0.3336467146873474, mean loss: 0.34238415853570997
Epoch: 47, step: 813, loss: 0.3431955575942993, mean loss: 0.3423841703495631
Epoch: 47, step: 814, loss: 0.37148517370224, mean loss: 0.3423845940497997
Epoch: 47, step: 815, loss: 0.3238801658153534, mean loss: 0.3423843246358425
Epoch: 47, step: 816, loss: 0.30760660767555237, mean loss: 0.3423838182994232
Epoch: 47, step: 817, loss: 0.3371219038963318, mean loss: 0.34238374169117114
Epoch: 47, step: 818, loss: 0.35226520895957947, mean loss: 0.3423838855534343
Epoch: 47, step: 819, loss: 0.3028063476085663, mean loss: 0.34238330936053385
Epoch: 47, step: 820, loss: 0.33238905668258667, mean loss: 0.34238316386048756
Epoch: 47, step: 821, loss: 0.36427783966064453, mean loss: 0.34238348260667767
Epoch: 47, step: 822, loss: 0.33178991079330444, mean loss: 0.342383328386011
Epoch: 47, step: 823, loss: 0.3934350311756134, mean loss: 0.3423840715832216
Epoch: 47, step: 824, loss: 0.31762194633483887, mean loss: 0.3423837111079876
Epoch: 47, step: 825, loss: 0.3452417850494385, mean loss: 0.34238375271386207
Epoch: 47, step: 826, loss: 0.3515208959579468, mean loss: 0.34238388572417205
Epoch: 47, step: 827, loss: 0.30414915084838867, mean loss: 0.34238332914540653
Epoch: 47, step: 828, loss: 0.33345094323158264, mean loss: 0.3423831991195551
Epoch: 47, step: 829, loss: 0.30031147599220276, mean loss: 0.3423825867040099
Epoch: 47, step: 830, loss: 0.33785468339920044, mean loss: 0.3423825207947055
Epoch: 47, step: 831, loss: 0.3235410153865814, mean loss: 0.34238224653698485
Epoch: 47, step: 832, loss: 0.3324565887451172, mean loss: 0.3423821020608085
Epoch: 47, step: 833, loss: 0.34771332144737244, mean loss: 0.34238217965999607
Epoch: 47, step: 834, loss: 0.3957065939903259, mean loss: 0.342382955818451
Epoch: 47, step: 835, loss: 0.3364155888557434, mean loss: 0.34238286896227144
Epoch: 47, step: 836, loss: 0.401862233877182, mean loss: 0.342383734683324
Epoch: 47, step: 837, loss: 0.3206169605255127, mean loss: 0.34238341787294124
Epoch: 47, step: 838, loss: 0.31639495491981506, mean loss: 0.3423830396223561
Epoch: 47, step: 839, loss: 0.3451211750507355, mean loss: 0.34238307947412633
Epoch: 47, step: 840, loss: 0.36821556091308594, mean loss: 0.3423834554435254
Epoch: 47, step: 841, loss: 0.32326439023017883, mean loss: 0.34238317718613615
Epoch: 47, step: 842, loss: 0.31526362895965576, mean loss: 0.3423827824960832
Epoch: 47, step: 843, loss: 0.33504486083984375, mean loss: 0.3423826757036502
Epoch: 47, step: 844, loss: 0.330520898103714, mean loss: 0.34238250307579815
Epoch: 47, step: 845, loss: 0.3578236401081085, mean loss: 0.3423827277918245
Epoch: 47, step: 846, loss: 0.3256256878376007, mean loss: 0.34238248392891313
Epoch: 47, step: 847, loss: 0.32092440128326416, mean loss: 0.3423821716569147
Epoch: 47, step: 848, loss: 0.31662997603416443, mean loss: 0.3423817968996403
Epoch: 47, step: 849, loss: 0.34045618772506714, mean loss: 0.3423817688777367
Epoch: 47, step: 850, loss: 0.32434383034706116, mean loss: 0.3423815063893633
Epoch: 47, step: 851, loss: 0.3482780158519745, mean loss: 0.3423815921942158
Epoch: 47, step: 852, loss: 0.3475967049598694, mean loss: 0.34238166808241255
Epoch: 47, step: 853, loss: 0.3212503492832184, mean loss: 0.3423813605925432
Epoch: 47, step: 854, loss: 0.31050556898117065, mean loss: 0.3423808967625065
Epoch: 47, step: 855, loss: 0.3311968445777893, mean loss: 0.342380734023839
Epoch: 47, step: 856, loss: 0.3306369185447693, mean loss: 0.3423805631425661
Epoch: 47, step: 857, loss: 0.31367939710617065, mean loss: 0.34238014552527374
Epoch: 47, step: 858, loss: 0.36298397183418274, mean loss: 0.34238044531758693
Epoch: 47, step: 859, loss: 0.36437323689460754, mean loss: 0.34238076531513634
Epoch: 47, step: 860, loss: 0.3214160203933716, mean loss: 0.34238046028021774
Epoch: 47, step: 861, loss: 0.321299284696579, mean loss: 0.34238015355570756
Epoch: 47, step: 862, loss: 0.3824858069419861, mean loss: 0.34238073707192856
Epoch: 47, step: 863, loss: 0.3170609772205353, mean loss: 0.34238036868806293
Epoch: 47, step: 864, loss: 0.2937871217727661, mean loss: 0.34237966170238043
Epoch: 47, step: 865, loss: 0.29645049571990967, mean loss: 0.3423789934862722
Epoch: 47, step: 866, loss: 0.3678775429725647, mean loss: 0.3423793644552034
Epoch: 47, step: 867, loss: 0.32765835523605347, mean loss: 0.3423791502878207
Epoch: 47, step: 868, loss: 0.32454222440719604, mean loss: 0.34237889079255784
Epoch: 47, step: 869, loss: 0.3075181543827057, mean loss: 0.3423783836387796
Epoch: 47, step: 870, loss: 0.34794995188713074, mean loss: 0.3423784646927409
Epoch: 47, step: 871, loss: 0.3425115942955017, mean loss: 0.3423784666294532
Epoch: 47, step: 872, loss: 0.35987740755081177, mean loss: 0.34237872119282764
Epoch: 47, step: 873, loss: 0.29739490151405334, mean loss: 0.34237806680657645
Epoch: 47, step: 874, loss: 0.349916934967041, mean loss: 0.34237817647400676
Epoch: 47, step: 875, loss: 0.3355429768562317, mean loss: 0.3423780770442439
Epoch: 47, step: 876, loss: 0.3425941467285156, mean loss: 0.34237808018730426
Epoch: 47, step: 877, loss: 0.306485652923584, mean loss: 0.3423775580852581
Epoch: 47, step: 878, loss: 0.3179211914539337, mean loss: 0.3423772023407655
Epoch: 47, step: 879, loss: 0.3413887619972229, mean loss: 0.3423771879630332
Epoch: 47, step: 880, loss: 0.3447802662849426, mean loss: 0.34237722291740813
Epoch: 47, step: 881, loss: 0.3050302267074585, mean loss: 0.3423766796883724
Epoch: 47, step: 882, loss: 0.36262911558151245, mean loss: 0.3423769742649733
Epoch: 47, step: 883, loss: 0.3434203267097473, mean loss: 0.34237698944056744
Epoch: 47, step: 884, loss: 0.3600844144821167, mean loss: 0.3423772469918749
Epoch: 47, step: 885, loss: 0.375551700592041, mean loss: 0.3423777295013085
Epoch: 47, step: 886, loss: 0.3289404809474945, mean loss: 0.34237753406463406
Epoch: 47, step: 887, loss: 0.32238706946372986, mean loss: 0.342377243319614
Epoch: 47, step: 888, loss: 0.30740422010421753, mean loss: 0.342376734672884
Epoch: 47, step: 889, loss: 0.3181951642036438, mean loss: 0.34237638298187395
Epoch: 47, step: 890, loss: 0.29384464025497437, mean loss: 0.34237567715801487
Epoch: 47, step: 891, loss: 0.29094237089157104, mean loss: 0.3423749291459982
Epoch: 47, step: 892, loss: 0.3015216886997223, mean loss: 0.3423743350121077
Epoch: 47, step: 893, loss: 0.3129362463951111, mean loss: 0.3423739068964534
Epoch: 47, step: 894, loss: 0.3244551122188568, mean loss: 0.3423736463087147
Epoch: 47, step: 895, loss: 0.32406294345855713, mean loss: 0.34237338002544365
Epoch: 47, step: 896, loss: 0.30923205614089966, mean loss: 0.34237289807497634
Epoch: 47, step: 897, loss: 0.3602265417575836, mean loss: 0.34237315770391624
Epoch: 47, step: 898, loss: 0.32368770241737366, mean loss: 0.34237288598266497
Epoch: 47, step: 899, loss: 0.3680861294269562, mean loss: 0.3423732598955815
Epoch: 47, step: 900, loss: 0.31101560592651367, mean loss: 0.3423728039102688
Epoch: 47, step: 901, loss: 0.33579373359680176, mean loss: 0.34237270824253124
Epoch: 47, step: 902, loss: 0.33295589685440063, mean loss: 0.3423725713125551
Epoch: 47, step: 903, loss: 0.3227403163909912, mean loss: 0.3423722858438335
Epoch: 47, step: 904, loss: 0.31872379779815674, mean loss: 0.34237194198086335
Epoch: 47, step: 905, loss: 0.31251463294029236, mean loss: 0.342371507844285
Epoch: 47, step: 906, loss: 0.4357689917087555, mean loss: 0.34237286585931753
Epoch: 47, step: 907, loss: 0.3349769115447998, mean loss: 0.3423727583224687
Epoch: 47, step: 908, loss: 0.34021198749542236, mean loss: 0.3423727269054132
Epoch: 47, step: 909, loss: 0.31969860196113586, mean loss: 0.3423723972342256
Epoch: 47, step: 910, loss: 0.32576096057891846, mean loss: 0.3423721557152059
Epoch: 47, step: 911, loss: 0.3819069266319275, mean loss: 0.34237273051559725
Epoch: 47, step: 912, loss: 0.292606920003891, mean loss: 0.34237200697551334
Epoch: 47, step: 913, loss: 0.32031187415122986, mean loss: 0.34237168625013714
Epoch: 47, step: 914, loss: 0.33082857728004456, mean loss: 0.3423715184309235
Epoch: 47, step: 915, loss: 0.3700568377971649, mean loss: 0.34237192092742513
Epoch: 47, step: 916, loss: 0.30957499146461487, mean loss: 0.34237144412391474
Epoch: 47, step: 917, loss: 0.3502628207206726, mean loss: 0.34237155884750087
Epoch: 47, step: 918, loss: 0.316530704498291, mean loss: 0.3423711831827045
Epoch: 47, step: 919, loss: 0.31318897008895874, mean loss: 0.3423707589486361
Epoch: 47, step: 920, loss: 0.3821404278278351, mean loss: 0.3423713370885841
Epoch: 47, step: 921, loss: 0.37662002444267273, mean loss: 0.34237183496163764
Epoch: 47, step: 922, loss: 0.3744320869445801, mean loss: 0.3423723010146385
Epoch: 47, step: 923, loss: 0.3099287748336792, mean loss: 0.3423718293969187
Epoch: 47, step: 924, loss: 0.29833167791366577, mean loss: 0.34237118921330284
Epoch: 47, step: 925, loss: 0.3185546398162842, mean loss: 0.3423708430123348
Epoch: 47, step: 926, loss: 0.3630572259426117, mean loss: 0.3423711437083582
Epoch: 47, step: 927, loss: 0.3108374774456024, mean loss: 0.34237068534353665
Epoch: 47, step: 928, loss: 0.3504122197628021, mean loss: 0.3423708022314012
Epoch: 47, step: 929, loss: 0.3558170199394226, mean loss: 0.34237099767629364
Epoch: 47, step: 930, loss: 0.33493348956108093, mean loss: 0.3423708895714067
Epoch: 47, step: 931, loss: 0.33538421988487244, mean loss: 0.3423707880209752
Epoch: 47, step: 932, loss: 0.3294093608856201, mean loss: 0.3423705996308772
Epoch: 47, step: 933, loss: 0.33646509051322937, mean loss: 0.342370513797484
Epoch: 47, step: 934, loss: 0.3186355531215668, mean loss: 0.34237016882763277
Epoch: 47, step: 935, loss: 0.3339846432209015, mean loss: 0.3423700469520789
Epoch: 47, step: 936, loss: 0.33330562710762024, mean loss: 0.3423699152113646
Epoch: 47, step: 937, loss: 0.35280919075012207, mean loss: 0.3423700669317893
Epoch: 47, step: 938, loss: 0.34398379921913147, mean loss: 0.34237009038481425
Epoch: 47, step: 939, loss: 0.3486848473548889, mean loss: 0.3423701821584012
Epoch: 47, step: 940, loss: 0.33336764574050903, mean loss: 0.34237005132469606
Epoch: 47, step: 941, loss: 0.346492201089859, mean loss: 0.3423701112309563
Epoch: 47, step: 942, loss: 0.3414875864982605, mean loss: 0.3423700984056125
Epoch: 47, step: 943, loss: 0.32358697056770325, mean loss: 0.34236982544264327
Epoch: 47, step: 944, loss: 0.29763948917388916, mean loss: 0.34236917541523176
Epoch: 47, step: 945, loss: 0.3381386995315552, mean loss: 0.3423691139382666
Epoch: 47, step: 946, loss: 0.284039169549942, mean loss: 0.3423682663041114
Epoch: 47, step: 947, loss: 0.3347178101539612, mean loss: 0.34236815513147495
Epoch: 47, step: 948, loss: 0.3350551128387451, mean loss: 0.34236804886351363
Epoch: 47, step: 949, loss: 0.31213024258613586, mean loss: 0.34236760947547157
Epoch: 47, step: 950, loss: 0.326004296541214, mean loss: 0.3423673717022849
Epoch: 47, step: 951, loss: 0.29462915658950806, mean loss: 0.34236667803452675
Epoch: 47, step: 952, loss: 0.33755719661712646, mean loss: 0.34236660815060443
Epoch: 47, step: 953, loss: 0.36192527413368225, mean loss: 0.3423668923426649
Epoch: 47, step: 954, loss: 0.3065868020057678, mean loss: 0.3423663724570113
Epoch: 47, step: 955, loss: 0.3023108243942261, mean loss: 0.342365790457301
Epoch: 47, step: 956, loss: 0.3927958607673645, mean loss: 0.3423665231862557
Epoch: 47, step: 957, loss: 0.37079668045043945, mean loss: 0.3423669362591826
Epoch: 47, step: 958, loss: 0.3468468487262726, mean loss: 0.34236700134864556
Epoch: 47, step: 959, loss: 0.31029194593429565, mean loss: 0.34236653533110306
Epoch: 47, step: 960, loss: 0.39046838879585266, mean loss: 0.3423672341913722
Epoch: 47, step: 961, loss: 0.3237577974796295, mean loss: 0.3423669638232666
Epoch: 47, step: 962, loss: 0.32809191942214966, mean loss: 0.3423667564306034
Epoch: 47, step: 963, loss: 0.3264068067073822, mean loss: 0.3423665245624356
Epoch: 47, step: 964, loss: 0.4019849896430969, mean loss: 0.34236739069445193
Epoch: 47, step: 965, loss: 0.32605817914009094, mean loss: 0.3423671537590486
Epoch: 47, step: 966, loss: 0.40513136982917786, mean loss: 0.3423680655657758
Epoch: 47, step: 967, loss: 0.33129340410232544, mean loss: 0.34236790468104306
Epoch: 47, step: 968, loss: 0.3541785180568695, mean loss: 0.3423680762546644
Epoch: 47, step: 969, loss: 0.3117802143096924, mean loss: 0.3423676319090712
Epoch: 47, step: 970, loss: 0.3634965121746063, mean loss: 0.3423679388409015
Epoch: 47, step: 971, loss: 0.3370298743247986, mean loss: 0.34236786129783764
Epoch: 47, step: 972, loss: 0.3369365334510803, mean loss: 0.34236778240113586
Epoch: 47, step: 973, loss: 0.31970715522766113, mean loss: 0.34236745323250084
Epoch: 47, step: 974, loss: 0.3742174208164215, mean loss: 0.3423679158789222
Epoch: 47, step: 975, loss: 0.34045708179473877, mean loss: 0.3423678881229219
Epoch: 47, step: 976, loss: 0.30011188983917236, mean loss: 0.3423672743383583
Epoch: 47, step: 977, loss: 0.35257694125175476, mean loss: 0.3423674226355275
Epoch: 47, step: 978, loss: 0.33714550733566284, mean loss: 0.34236734678741065
Epoch: 47, step: 979, loss: 0.3079596757888794, mean loss: 0.3423668470245853
Epoch: 47, step: 980, loss: 0.3068011999130249, mean loss: 0.34236633044994935
Epoch: 47, step: 981, loss: 0.3165602684020996, mean loss: 0.34236595563423333
Epoch: 47, step: 982, loss: 0.2962312698364258, mean loss: 0.34236528556864537
Epoch: 47, step: 983, loss: 0.29840609431266785, mean loss: 0.34236464710946835
Epoch: 47, step: 984, loss: 0.30795860290527344, mean loss: 0.34236414740656207
Epoch: 47, step: 985, loss: 0.3452942371368408, mean loss: 0.3423641899616748
Epoch: 47, step: 986, loss: 0.3430265188217163, mean loss: 0.342364199580858
Epoch: 47, step: 987, loss: 0.357591450214386, mean loss: 0.34236442072717255
Epoch: 47, step: 988, loss: 0.3267921507358551, mean loss: 0.3423641945734047
Epoch: 47, step: 989, loss: 0.3470728099346161, mean loss: 0.3423642629549343
Epoch: 47, step: 990, loss: 0.3303295373916626, mean loss: 0.342364088181476
Epoch: 47, step: 991, loss: 0.38240349292755127, mean loss: 0.3423646696424802
Epoch: 47, step: 992, loss: 0.32310232520103455, mean loss: 0.34236438991455814
Epoch: 47, step: 993, loss: 0.3491460978984833, mean loss: 0.3423644883971463
Epoch: 47, step: 994, loss: 0.30087462067604065, mean loss: 0.34236388589845
Epoch: 47, step: 995, loss: 0.3201808035373688, mean loss: 0.3423635637695821
Epoch: 47, step: 996, loss: 0.3650642931461334, mean loss: 0.34236389341060985
Epoch: 47, step: 997, loss: 0.31961479783058167, mean loss: 0.3423635630720454
Epoch: 47, step: 998, loss: 0.2708578407764435, mean loss: 0.3423625247558374
Epoch: 47, step: 999, loss: 0.32356324791908264, mean loss: 0.3423622517803359
Epoch: 47, step: 1000, loss: 0.30831894278526306, mean loss: 0.34236175746055497
Epoch: 47, step: 1001, loss: 0.33898016810417175, mean loss: 0.34236170835950436
Epoch: 47, step: 1002, loss: 0.3068253993988037, mean loss: 0.3423611923758689
Epoch: 47, step: 1003, loss: 0.4029737114906311, mean loss: 0.3423620724507776
Epoch: 47, step: 1004, loss: 0.31697893142700195, mean loss: 0.342361703900823
Epoch: 47, step: 1005, loss: 0.34127044677734375, mean loss: 0.34236168805656936
Epoch: 47, step: 1006, loss: 0.3437989056110382, mean loss: 0.3423617089236119
Epoch: 47, step: 1007, loss: 0.3474801182746887, mean loss: 0.3423617832370063
Epoch: 47, step: 1008, loss: 0.32464003562927246, mean loss: 0.3423615259414271
Epoch: 47, step: 1009, loss: 0.31133970618247986, mean loss: 0.3423610755534983
Epoch: 47, step: 1010, loss: 0.34228822588920593, mean loss: 0.34236107449585135
Epoch: 47, step: 1011, loss: 0.33803948760032654, mean loss: 0.34236101175504274
Epoch: 47, step: 1012, loss: 0.34429872035980225, mean loss: 0.34236103988629235
Epoch: 47, step: 1013, loss: 0.340946763753891, mean loss: 0.3423610193544243
Epoch: 47, step: 1014, loss: 0.33168599009513855, mean loss: 0.34236086438107444
Epoch: 47, step: 1015, loss: 0.31217435002326965, mean loss: 0.3423604261586373
Epoch: 47, step: 1016, loss: 0.31820303201675415, mean loss: 0.34236007546698977
Epoch: 47, step: 1017, loss: 0.34745413064956665, mean loss: 0.3423601494160532
Epoch: 47, step: 1018, loss: 0.3468588888645172, mean loss: 0.3423602147221262
Epoch: 47, step: 1019, loss: 0.3484102785587311, mean loss: 0.3423603025467667
Epoch: 47, step: 1020, loss: 0.29123350977897644, mean loss: 0.3423595603848429
Epoch: 47, step: 1021, loss: 0.3557644784450531, mean loss: 0.34235975496922466
Epoch: 47, step: 1022, loss: 0.3396326005458832, mean loss: 0.3423597153827123
Epoch: 47, step: 1023, loss: 0.3492741286754608, mean loss: 0.3423598157486952
Epoch: 47, step: 1024, loss: 0.3253260850906372, mean loss: 0.34235956849961824
Epoch: 47, step: 1025, loss: 0.32101237773895264, mean loss: 0.34235925864403194
Epoch: 47, step: 1026, loss: 0.3191850781440735, mean loss: 0.34235892227447684
Epoch: 47, step: 1027, loss: 0.30626606941223145, mean loss: 0.3423583984000449
Epoch: 47, step: 1028, loss: 0.34084904193878174, mean loss: 0.3423583764926112
Epoch: 47, step: 1029, loss: 0.38763824105262756, mean loss: 0.3423590336940475
Epoch: 47, step: 1030, loss: 0.32724761962890625, mean loss: 0.34235881436700266
Epoch: 47, step: 1031, loss: 0.342281311750412, mean loss: 0.3423588132421461
Epoch: 47, step: 1032, loss: 0.3215440809726715, mean loss: 0.3423585111459172
Epoch: 47, step: 1033, loss: 0.3183777630329132, mean loss: 0.34235816310452344
Epoch: 47, step: 1034, loss: 0.3691348135471344, mean loss: 0.3423585517182332
Epoch: 47, step: 1035, loss: 0.3260982036590576, mean loss: 0.34235831573268727
Epoch: 47, step: 1036, loss: 0.3029002249240875, mean loss: 0.3423577430878747
Epoch: 47, step: 1037, loss: 0.33330169320106506, mean loss: 0.34235761166173057
Epoch: 47, step: 1038, loss: 0.3451050817966461, mean loss: 0.34235765153387904
Epoch: 47, step: 1039, loss: 0.3651822507381439, mean loss: 0.3423579827668158
Epoch: 47, step: 1040, loss: 0.3265363276004791, mean loss: 0.3423577531646569
Epoch: 47, step: 1041, loss: 0.3402407169342041, mean loss: 0.3423577224429005
Epoch: 47, step: 1042, loss: 0.3031895160675049, mean loss: 0.3423571540545971
Epoch: 47, step: 1043, loss: 0.3349902927875519, mean loss: 0.3423570471521524
Epoch: 47, step: 1044, loss: 0.34985676407814026, mean loss: 0.342357155980921
Epoch: 47, step: 1045, loss: 0.34687936305999756, mean loss: 0.34235722160194254
Epoch: 47, step: 1046, loss: 0.3024415075778961, mean loss: 0.34235664239982366
Epoch: 47, step: 1047, loss: 0.33144599199295044, mean loss: 0.34235648408172037
Epoch: 47, step: 1048, loss: 0.31416189670562744, mean loss: 0.342356074972395
Epoch: 47, step: 1049, loss: 0.3577173948287964, mean loss: 0.342356297865106
Epoch: 47, step: 1050, loss: 0.30673784017562866, mean loss: 0.342355781048877
Epoch: 47, step: 1051, loss: 0.31943240761756897, mean loss: 0.34235544844044064
Epoch: 47, step: 1052, loss: 0.3180305063724518, mean loss: 0.3423550955009582
Epoch: 47, step: 1053, loss: 0.35099127888679504, mean loss: 0.34235522080468395
Epoch: 47, step: 1054, loss: 0.3529525101184845, mean loss: 0.34235537456016923
Epoch: 47, step: 1055, loss: 0.33348026871681213, mean loss: 0.34235524579361704
Epoch: 47, step: 1056, loss: 0.33071938157081604, mean loss: 0.34235507697440454
Epoch: 47, step: 1057, loss: 0.31243160367012024, mean loss: 0.3423546428352799
Epoch: 47, step: 1058, loss: 0.31321945786476135, mean loss: 0.34235422013902195
Epoch: 47, step: 1059, loss: 0.3706437647342682, mean loss: 0.342354630560688
Epoch: 47, step: 1060, loss: 0.2989446818828583, mean loss: 0.34235400078296485
Epoch: 47, step: 1061, loss: 0.3176674246788025, mean loss: 0.34235364264316936
Epoch: 47, step: 1062, loss: 0.33347100019454956, mean loss: 0.342353513780358
Epoch: 47, step: 1063, loss: 0.2978995442390442, mean loss: 0.3423528688843802
Epoch: 47, step: 1064, loss: 0.3179680109024048, mean loss: 0.34235251513714765
Epoch: 47, step: 1065, loss: 0.32497262954711914, mean loss: 0.3423522630135861
Epoch: 47, step: 1066, loss: 0.29085060954093933, mean loss: 0.342351515909017
Epoch: 47, step: 1067, loss: 0.3256840109825134, mean loss: 0.3423512741267128
Epoch: 47, step: 1068, loss: 0.3126945495605469, mean loss: 0.3423508439263187
Epoch: 47, step: 1069, loss: 0.334591269493103, mean loss: 0.3423507313675785
Epoch: 47, step: 1070, loss: 0.3074771463871002, mean loss: 0.3423502255060925
Epoch: 47, step: 1071, loss: 0.3222057819366455, mean loss: 0.3423499333035458
Epoch: 47, step: 1072, loss: 0.32803937792778015, mean loss: 0.34234972572669925
Epoch: 47, step: 1073, loss: 0.32267290353775024, mean loss: 0.3423494403154523
Epoch: 47, step: 1074, loss: 0.34218546748161316, mean loss: 0.3423494379370696
Epoch: 47, step: 1075, loss: 0.31165167689323425, mean loss: 0.3423489926806145
Epoch: 47, step: 1076, loss: 0.3562397062778473, mean loss: 0.34234919415590054
Epoch: 47, step: 1077, loss: 0.31619948148727417, mean loss: 0.3423488148777311
Epoch: 47, step: 1078, loss: 0.2989703118801117, mean loss: 0.34234818572050896
Epoch: 47, step: 1079, loss: 0.3361891508102417, mean loss: 0.3423480963918133
Epoch: 47, step: 1080, loss: 0.33451735973358154, mean loss: 0.34234798281893103
Epoch: 47, step: 1081, loss: 0.33317604660987854, mean loss: 0.3423478497959258
Epoch: 47, step: 1082, loss: 0.31153544783592224, mean loss: 0.3423474029220304
Epoch: 47, step: 1083, loss: 0.321575790643692, mean loss: 0.3423471016746079
Epoch: 47, step: 1084, loss: 0.34120407700538635, mean loss: 0.34234708509774153
Epoch: 47, step: 1085, loss: 0.31800132989883423, mean loss: 0.34234673202532806
Epoch: 47, step: 1086, loss: 0.31644973158836365, mean loss: 0.34234635646154826
Epoch: 47, step: 1087, loss: 0.3420094847679138, mean loss: 0.34234635157623455
Epoch: 47, step: 1088, loss: 0.3200089633464813, mean loss: 0.3423460276440996
Epoch: 47, step: 1089, loss: 0.4117593467235565, mean loss: 0.34234703424694596
Epoch: 47, step: 1090, loss: 0.34632986783981323, mean loss: 0.34234709200349106
Epoch: 47, step: 1091, loss: 0.3403358459472656, mean loss: 0.34234706283809
Epoch: 47, step: 1092, loss: 0.37212851643562317, mean loss: 0.34234749469745396
Epoch: 47, step: 1093, loss: 0.37633803486824036, mean loss: 0.34234798758542373
Epoch: 47, step: 1094, loss: 0.3657214641571045, mean loss: 0.3423483265132049
Epoch: 47, step: 1095, loss: 0.29748499393463135, mean loss: 0.3423476759805708
Epoch: 47, step: 1096, loss: 0.3224146068096161, mean loss: 0.3423473869489001
Epoch: 47, step: 1097, loss: 0.3000332713127136, mean loss: 0.3423467733985182
Epoch: 47, step: 1098, loss: 0.3160978853702545, mean loss: 0.3423463927978247
Epoch: 47, step: 1099, loss: 0.30209437012672424, mean loss: 0.34234580916450674
Epoch: 47, step: 1100, loss: 0.33680105209350586, mean loss: 0.34234572876958913
Epoch: 47, step: 1101, loss: 0.32026422023773193, mean loss: 0.3423454086085259
Epoch: 47, step: 1102, loss: 0.372003436088562, mean loss: 0.3423458386157388
Epoch: 47, step: 1103, loss: 0.3781895935535431, mean loss: 0.342346358301335
Epoch: 47, step: 1104, loss: 0.3221296966075897, mean loss: 0.3423460651915428
Epoch: 47, step: 1105, loss: 0.31181833148002625, mean loss: 0.3423456225938435
Epoch: 47, step: 1106, loss: 0.3648594617843628, mean loss: 0.34234594899963094
Epoch: 47, step: 1107, loss: 0.3021312952041626, mean loss: 0.34234536597577053
Epoch: 47, step: 1108, loss: 0.34296703338623047, mean loss: 0.34234537498844736
Epoch: 47, step: 1109, loss: 0.30037349462509155, mean loss: 0.34234476650631734
Epoch: 47, step: 1110, loss: 0.32737109065055847, mean loss: 0.3423445494304558
Epoch: 47, step: 1111, loss: 0.30053389072418213, mean loss: 0.3423439433031913
Epoch: 47, step: 1112, loss: 0.39785832166671753, mean loss: 0.34234474808100496
Epoch: 47, step: 1113, loss: 0.3434160649776459, mean loss: 0.3423447636113882
Epoch: 47, step: 1114, loss: 0.3812170624732971, mean loss: 0.34234532711687304
Epoch: 47, step: 1115, loss: 0.37399888038635254, mean loss: 0.3423457859704227
Epoch: 47, step: 1116, loss: 0.3293006420135498, mean loss: 0.3423455968692564
Epoch: 47, step: 1117, loss: 0.35296595096588135, mean loss: 0.34234575081866786
Epoch: 47, step: 1118, loss: 0.34435972571372986, mean loss: 0.34234578001221005
Epoch: 47, step: 1119, loss: 0.3645944893360138, mean loss: 0.3423461025133599
Epoch: 47, step: 1120, loss: 0.366747111082077, mean loss: 0.3423464562075513
Epoch: 47, step: 1121, loss: 0.3418727517127991, mean loss: 0.3423464493412736
Epoch: 47, step: 1122, loss: 0.3421679437160492, mean loss: 0.3423464467538981
Epoch: 47, step: 1123, loss: 0.3090246617794037, mean loss: 0.3423459637734804
Epoch: 47, step: 1124, loss: 0.3204817473888397, mean loss: 0.34234564686862945
Epoch: 47, step: 1125, loss: 0.3262394070625305, mean loss: 0.34234541342456465
Epoch: 47, step: 1126, loss: 0.345512330532074, mean loss: 0.3423454593252402
Epoch: 47, step: 1127, loss: 0.34466552734375, mean loss: 0.3423454929513637
Epoch: 47, step: 1128, loss: 0.30507001280784607, mean loss: 0.3423449527035247
Epoch: 47, step: 1129, loss: 0.34933891892433167, mean loss: 0.34234505406829213
Epoch: 47, step: 1130, loss: 0.35721129179000854, mean loss: 0.3423452695241353
Epoch: 47, step: 1131, loss: 0.2973063886165619, mean loss: 0.34234461678673084
Epoch: 47, step: 1132, loss: 0.37313348054885864, mean loss: 0.3423450629956809
Epoch: 47, step: 1133, loss: 0.37219688296318054, mean loss: 0.3423454956182131
Epoch: 47, step: 1134, loss: 0.3516889810562134, mean loss: 0.34234563102515825
Epoch: 47, step: 1135, loss: 0.3389433026313782, mean loss: 0.34234558171890944
Epoch: 47, step: 1136, loss: 0.3341498374938965, mean loss: 0.3423454629486142
Epoch: 47, step: 1137, loss: 0.3322737216949463, mean loss: 0.34234531699404136
Epoch: 47, step: 1138, loss: 0.33240342140197754, mean loss: 0.34234517292321387
Epoch: 47, step: 1139, loss: 0.32021766901016235, mean loss: 0.34234485227192835
Epoch: 47, step: 1140, loss: 0.31686583161354065, mean loss: 0.3423444830589176
Epoch: 47, step: 1141, loss: 0.30505993962287903, mean loss: 0.34234394278151675
Epoch: 47, step: 1142, loss: 0.35314685106277466, mean loss: 0.3423440993204494
Epoch: 47, step: 1143, loss: 0.32705047726631165, mean loss: 0.3423438777122935
Epoch: 47, step: 1144, loss: 0.2960401773452759, mean loss: 0.34234320677058155
Epoch: 47, step: 1145, loss: 0.3483050763607025, mean loss: 0.342343293156961
Epoch: 47, step: 1146, loss: 0.3224238157272339, mean loss: 0.3423430045316269
Epoch: 47, step: 1147, loss: 0.3302043378353119, mean loss: 0.3423428286497054
Epoch: 47, step: 1148, loss: 0.3096129596233368, mean loss: 0.3423423544206165
Epoch: 47, step: 1149, loss: 0.29203248023986816, mean loss: 0.34234162548216307
Epoch: 47, step: 1150, loss: 0.364688903093338, mean loss: 0.3423419492665936
Epoch: 47, step: 1151, loss: 0.35511723160743713, mean loss: 0.3423421343619622
Epoch: 47, step: 1152, loss: 0.2950262129306793, mean loss: 0.3423414488326098
Epoch: 47, step: 1153, loss: 0.3425842225551605, mean loss: 0.34234145234994806
Epoch: 47, step: 1154, loss: 0.3737976551055908, mean loss: 0.34234190808503284
Epoch: 47, step: 1155, loss: 0.33365222811698914, mean loss: 0.3423417821914311
Epoch: 47, step: 1156, loss: 0.3005059063434601, mean loss: 0.34234117609399034
Epoch: 47, step: 1157, loss: 0.3210470974445343, mean loss: 0.3423408676003988
Epoch: 47, step: 1158, loss: 0.34076157212257385, mean loss: 0.34234084472101134
Epoch: 47, step: 1159, loss: 0.3427133858203888, mean loss: 0.34234085011796767
Epoch: 47, step: 1160, loss: 0.36052611470222473, mean loss: 0.3423411135618041
Epoch: 47, step: 1161, loss: 0.33892112970352173, mean loss: 0.34234106401836123
Epoch: 47, step: 1162, loss: 0.310274213552475, mean loss: 0.34234059949009904
Epoch: 47, step: 1163, loss: 0.3365482687950134, mean loss: 0.3423405155821912
Epoch: 47, step: 1164, loss: 0.3620598018169403, mean loss: 0.34234080123233296
Epoch: 47, step: 1165, loss: 0.3464626967906952, mean loss: 0.3423408609405283
Epoch: 47, step: 1166, loss: 0.32173505425453186, mean loss: 0.34234056245705347
Epoch: 47, step: 1167, loss: 0.3074488043785095, mean loss: 0.3423400570430944
Epoch: 47, step: 1168, loss: 0.32678282260894775, mean loss: 0.34233983169676657
Epoch: 47, step: 1169, loss: 0.36660709977149963, mean loss: 0.3423401832027209
Epoch: 47, step: 1170, loss: 0.34252384305000305, mean loss: 0.3423401858629542
Epoch: 47, step: 1171, loss: 0.3569652736186981, mean loss: 0.3423403976979449
Epoch: 47, step: 1172, loss: 0.315309077501297, mean loss: 0.34234000617232685
Epoch: 47, step: 1173, loss: 0.34361013770103455, mean loss: 0.3423400245688323
Epoch: 47, step: 1174, loss: 0.33156752586364746, mean loss: 0.3423398685428962
Epoch: 47, step: 1175, loss: 0.3345144987106323, mean loss: 0.3423397552040133
Epoch: 47, step: 1176, loss: 0.32704341411590576, mean loss: 0.3423395336623942
Epoch: 47, step: 1177, loss: 0.30302104353904724, mean loss: 0.34233896420883975
Epoch: 47, step: 1178, loss: 0.35214683413505554, mean loss: 0.342339106255126
Epoch: 47, step: 1179, loss: 0.3560168147087097, mean loss: 0.3423393043449831
Epoch: 47, step: 1180, loss: 0.3182545602321625, mean loss: 0.3423389555384238
Epoch: 47, step: 1181, loss: 0.34150680899620056, mean loss: 0.34233894348706184
Epoch: 47, step: 1182, loss: 0.33510181307792664, mean loss: 0.342338838678581
Epoch: 47, step: 1183, loss: 0.34845709800720215, mean loss: 0.3423389272822323
Epoch: 47, step: 1184, loss: 0.3505343794822693, mean loss: 0.34233904596573916
Epoch: 47, step: 1185, loss: 0.3428301513195038, mean loss: 0.34233905307764223
Epoch: 47, step: 1186, loss: 0.30755317211151123, mean loss: 0.342338549335973
Epoch: 47, step: 1187, loss: 0.3497936427593231, mean loss: 0.3423386572931878
Epoch: 47, step: 1188, loss: 0.31937459111213684, mean loss: 0.34233832475533965
Epoch: 47, step: 1189, loss: 0.3353939950466156, mean loss: 0.34233822419740706
Epoch: 47, step: 1190, loss: 0.33209866285324097, mean loss: 0.34233807592475113
Epoch: 47, step: 1191, loss: 0.35139763355255127, mean loss: 0.34233820710861484
Epoch: 47, step: 1192, loss: 0.33538469672203064, mean loss: 0.3423381064221147
Epoch: 47, step: 1193, loss: 0.3359461724758148, mean loss: 0.3423380138685549
Epoch: 47, step: 1194, loss: 0.38320380449295044, mean loss: 0.34233860558612617
Epoch: 47, step: 1195, loss: 0.3763662874698639, mean loss: 0.342339098283941
Epoch: 47, step: 1196, loss: 0.3381325304508209, mean loss: 0.3423390373765663
Epoch: 47, step: 1197, loss: 0.350036084651947, mean loss: 0.34233914882137667
Epoch: 47, step: 1198, loss: 0.3446195423603058, mean loss: 0.34233918183849826
Epoch: 47, step: 1199, loss: 0.32081422209739685, mean loss: 0.34233887018969217
Epoch: 47, step: 1200, loss: 0.35179832577705383, mean loss: 0.3423390071462948
Epoch: 47, step: 1201, loss: 0.318409264087677, mean loss: 0.3423386606899019
Epoch: 47, step: 1202, loss: 0.3767626881599426, mean loss: 0.34233915907601864
Epoch: 47, step: 1203, loss: 0.3005600571632385, mean loss: 0.3423385542129495
Epoch: 47, step: 1204, loss: 0.3396349251270294, mean loss: 0.34233851507132995
Epoch: 47, step: 1205, loss: 0.3555852174758911, mean loss: 0.3423387068468519
Epoch: 47, step: 1206, loss: 0.32041701674461365, mean loss: 0.3423383894861555
Epoch: 47, step: 1207, loss: 0.33057042956352234, mean loss: 0.34233821912365736
Epoch: 47, step: 1208, loss: 0.3335529863834381, mean loss: 0.34233809194336956
Epoch: 47, step: 1209, loss: 0.31760454177856445, mean loss: 0.3423377338908758
Epoch: 47, step: 1210, loss: 0.3316534459590912, mean loss: 0.34233757922320646
Epoch: 47, step: 1211, loss: 0.32944855093955994, mean loss: 0.3423373926420211
Epoch: 47, step: 1212, loss: 0.3188008964061737, mean loss: 0.3423370519333424
Epoch: 47, step: 1213, loss: 0.3636115491390228, mean loss: 0.34233735989340736
Epoch: 47, step: 1214, loss: 0.3451792299747467, mean loss: 0.3423374010304466
Epoch: 47, step: 1215, loss: 0.3428691029548645, mean loss: 0.342337408726902
Epoch: 47, step: 1216, loss: 0.3791066110134125, mean loss: 0.3423379409582443
Epoch: 47, step: 1217, loss: 0.33223962783813477, mean loss: 0.34233779478806337
Epoch: 47, step: 1218, loss: 0.3146968185901642, mean loss: 0.342337394698666
Epoch: 47, step: 1219, loss: 0.34181633591651917, mean loss: 0.34233738715670814
Epoch: 47, step: 1220, loss: 0.374580442905426, mean loss: 0.3423378538454104
Epoch: 47, step: 1221, loss: 0.3106500804424286, mean loss: 0.34233739520055
Epoch: 47, step: 1222, loss: 0.3107159733772278, mean loss: 0.34233693752267846
Epoch: 47, step: 1223, loss: 0.3142063319683075, mean loss: 0.34233653037560563
Epoch: 47, step: 1224, loss: 0.37679383158683777, mean loss: 0.3423370290846096
Epoch: 47, step: 1225, loss: 0.30789804458618164, mean loss: 0.3423365306479219
Epoch: 47, step: 1226, loss: 0.3540029525756836, mean loss: 0.3423366994940313
Epoch: 47, step: 1227, loss: 0.32422488927841187, mean loss: 0.3423364373687242
Epoch: 47, step: 1228, loss: 0.3797202408313751, mean loss: 0.34233697840239374
Epoch: 47, step: 1229, loss: 0.3087082803249359, mean loss: 0.34233649172118624
Epoch: 47, step: 1230, loss: 0.310794472694397, mean loss: 0.3423360352454192
Epoch: 47, step: 1231, loss: 0.3266642987728119, mean loss: 0.34233580844749634
Epoch: 47, step: 1232, loss: 0.3163912296295166, mean loss: 0.3423354329886923
Epoch: 47, step: 1233, loss: 0.29746493697166443, mean loss: 0.34233478365153824
Epoch: 47, step: 1234, loss: 0.30909308791160583, mean loss: 0.34233430260591446
Epoch: 47, step: 1235, loss: 0.3405868709087372, mean loss: 0.3423342773189311
Epoch: 47, step: 1236, loss: 0.3303183317184448, mean loss: 0.3423341034393913
Epoch: 47, step: 1237, loss: 0.3400207459926605, mean loss: 0.3423340699638979
Epoch: 47, step: 1238, loss: 0.32991549372673035, mean loss: 0.3423338902631985
Epoch: 47, step: 1239, loss: 0.35227006673812866, mean loss: 0.34233403404071305
Epoch: 47, step: 1240, loss: 0.3456575572490692, mean loss: 0.34233408213174615
Epoch: 47, step: 1241, loss: 0.33350178599357605, mean loss: 0.3423339543311943
Epoch: 47, step: 1242, loss: 0.3354564905166626, mean loss: 0.3423338548178923
Epoch: 47, step: 1243, loss: 0.28526628017425537, mean loss: 0.342333029091902
Epoch: 47, step: 1244, loss: 0.32767659425735474, mean loss: 0.3423328170270975
Epoch: 47, step: 1245, loss: 0.3276754319667816, mean loss: 0.34233260495161266
Epoch: 47, step: 1246, loss: 0.30538317561149597, mean loss: 0.34233207034365
Epoch: 47, step: 1247, loss: 0.33225011825561523, mean loss: 0.3423319244736331
Epoch: 47, step: 1248, loss: 0.320365846157074, mean loss: 0.3423316066635673
Epoch: 47, step: 1249, loss: 0.3285476267337799, mean loss: 0.34233140723679095
Epoch: 47, step: 1250, loss: 0.3234066367149353, mean loss: 0.3423311334369599
Epoch: 47, step: 1251, loss: 0.3054454028606415, mean loss: 0.34233059978923747
Epoch: 47, step: 1252, loss: 0.33861202001571655, mean loss: 0.3423305459911186
Epoch: 47, step: 1253, loss: 0.3384956419467926, mean loss: 0.3423304905108946
Epoch: 47, step: 1254, loss: 0.356472373008728, mean loss: 0.3423306951010093
Epoch: 47, step: 1255, loss: 0.31802821159362793, mean loss: 0.34233034352292485
Epoch: 47, step: 1256, loss: 0.36796891689300537, mean loss: 0.3423307144245288
Epoch: 47, step: 1257, loss: 0.29467183351516724, mean loss: 0.3423300249751044
Epoch: 47, step: 1258, loss: 0.3306223154067993, mean loss: 0.3423298556098843
Epoch: 47, step: 1259, loss: 0.31950369477272034, mean loss: 0.34232952540850664
Epoch: 47, step: 1260, loss: 0.3414164185523987, mean loss: 0.34232951219976854
Epoch: 47, step: 1261, loss: 0.3721211552619934, mean loss: 0.3423299431507748
Epoch: 47, step: 1262, loss: 0.3494970500469208, mean loss: 0.34233004682505835
Epoch: 47, step: 1263, loss: 0.38952407240867615, mean loss: 0.342330729490475
Epoch: 47, step: 1264, loss: 0.32083308696746826, mean loss: 0.3423304185298263
Epoch: 47, step: 1265, loss: 0.3334788680076599, mean loss: 0.3423302904951325
Epoch: 47, step: 1266, loss: 0.33718153834342957, mean loss: 0.3423302160212459
Epoch: 47, step: 1267, loss: 0.31656330823898315, mean loss: 0.34232984332239463
Epoch: 47, step: 1268, loss: 0.32852035760879517, mean loss: 0.3423296435815075
Epoch: 47, step: 1269, loss: 0.29432398080825806, mean loss: 0.3423289492359555
Epoch: 47, step: 1270, loss: 0.33193135261535645, mean loss: 0.34232879884910267
Epoch: 47, step: 1271, loss: 0.32028284668922424, mean loss: 0.3423284799895111
Epoch: 47, step: 1272, loss: 0.33916398882865906, mean loss: 0.34232843422084763
Epoch: 47, step: 1273, loss: 0.33696261048316956, mean loss: 0.34232835661499683
Epoch: 47, step: 1274, loss: 0.3501228988170624, mean loss: 0.3423284693457462
Epoch: 47, step: 1275, loss: 0.3705861270427704, mean loss: 0.34232887802412315
Epoch: 47, step: 1276, loss: 0.33576396107673645, mean loss: 0.3423287830799197
Epoch: 47, step: 1277, loss: 0.33511844277381897, mean loss: 0.34232867880287826
Epoch: 47, step: 1278, loss: 0.3249547779560089, mean loss: 0.34232842754250764
Epoch: 47, step: 1279, loss: 0.3604797124862671, mean loss: 0.3423286900415668
Epoch: 47, step: 1280, loss: 0.3051060140132904, mean loss: 0.34232815174490266
Epoch: 47, step: 1281, loss: 0.3149421811103821, mean loss: 0.3423277557077279
Epoch: 47, step: 1282, loss: 0.3718741536140442, mean loss: 0.34232818298134515
Epoch: 47, step: 1283, loss: 0.34099963307380676, mean loss: 0.3423281637693208
Epoch: 47, step: 1284, loss: 0.3637148141860962, mean loss: 0.34232847303501307
Epoch: 47, step: 1285, loss: 0.31516990065574646, mean loss: 0.34232808030903367
Epoch: 47, step: 1286, loss: 0.32255735993385315, mean loss: 0.3423277944190709
Epoch: 47, step: 1287, loss: 0.3109438121318817, mean loss: 0.3423273406047629
Epoch: 47, step: 1288, loss: 0.34113121032714844, mean loss: 0.3423273233088958
Epoch: 47, step: 1289, loss: 0.32492297887802124, mean loss: 0.34232707164828635
Epoch: 47, step: 1290, loss: 0.35905930399894714, mean loss: 0.34232731358689666
Epoch: 47, step: 1291, loss: 0.3161640763282776, mean loss: 0.3423269352867628
Epoch: 47, step: 1292, loss: 0.329397052526474, mean loss: 0.3423267483333821
Epoch: 47, step: 1293, loss: 0.32204681634902954, mean loss: 0.34232645510976245
Epoch: 47, step: 1294, loss: 0.3271394968032837, mean loss: 0.3423262355276404
Epoch: 47, step: 1295, loss: 0.35517117381095886, mean loss: 0.34232642124475166
Epoch: 47, step: 1296, loss: 0.39400556683540344, mean loss: 0.34232716843112615
Epoch: 47, step: 1297, loss: 0.32868266105651855, mean loss: 0.3423269711592386
Epoch: 47, step: 1298, loss: 0.3497837781906128, mean loss: 0.3423270789679773
Epoch: 47, step: 1299, loss: 0.32137808203697205, mean loss: 0.3423267760967517
Epoch: 47, step: 1300, loss: 0.34312912821769714, mean loss: 0.34232678769663205
Epoch: 47, step: 1301, loss: 0.32461926341056824, mean loss: 0.34232653169657007
Epoch: 47, step: 1302, loss: 0.3379407227039337, mean loss: 0.3423264682912558
Epoch: 47, step: 1303, loss: 0.32697901129722595, mean loss: 0.34232624641741966
Epoch: 47, step: 1304, loss: 0.34453055262565613, mean loss: 0.3423262782839891
Epoch: 47, step: 1305, loss: 0.3440486192703247, mean loss: 0.3423263031826647
Epoch: 47, step: 1306, loss: 0.3481959104537964, mean loss: 0.3423263880342335
Epoch: 47, step: 1307, loss: 0.365143746137619, mean loss: 0.342326717879239
Epoch: 47, step: 1308, loss: 0.36639201641082764, mean loss: 0.34232706575929356
Epoch: 47, step: 1309, loss: 0.35456228256225586, mean loss: 0.3423272426250139
Epoch: 47, step: 1310, loss: 0.3394148349761963, mean loss: 0.34232720052542226
Epoch: 47, step: 1311, loss: 0.34794294834136963, mean loss: 0.3423272817013086
Epoch: 47, step: 1312, loss: 0.31108665466308594, mean loss: 0.34232683012317244
Epoch: 47, step: 1313, loss: 0.32140639424324036, mean loss: 0.3423265277260767
Epoch: 47, step: 1314, loss: 0.3355367183685303, mean loss: 0.34232642958333415
Epoch: 47, step: 1315, loss: 0.2934563159942627, mean loss: 0.3423257232044953
Epoch: 47, step: 1316, loss: 0.29969051480293274, mean loss: 0.34232510695518686
Epoch: 47, step: 1317, loss: 0.31168869137763977, mean loss: 0.3423246641428321
Epoch: 47, step: 1318, loss: 0.31658145785331726, mean loss: 0.3423242920612808
Epoch: 47, step: 1319, loss: 0.30418235063552856, mean loss: 0.34232374078155847
Epoch: 47, step: 1320, loss: 0.33092954754829407, mean loss: 0.3423235760994091
Epoch: 47, step: 1321, loss: 0.3516102731227875, mean loss: 0.34232371031962916
Epoch: 47, step: 1322, loss: 0.3108941912651062, mean loss: 0.34232325607674996
Epoch: 47, step: 1323, loss: 0.341845840215683, mean loss: 0.3423232491768792
Epoch: 47, step: 1324, loss: 0.31901803612709045, mean loss: 0.3423229123622729
Epoch: 47, step: 1325, loss: 0.35927143692970276, mean loss: 0.3423231573043859
Epoch: 47, step: 1326, loss: 0.32433781027793884, mean loss: 0.3423228973817466
Epoch: 47, step: 1327, loss: 0.31408411264419556, mean loss: 0.3423224892832331
Epoch: 47, step: 1328, loss: 0.31564438343048096, mean loss: 0.34232210374475813
Epoch: 47, step: 1329, loss: 0.3311613202095032, mean loss: 0.34232194245709757
Epoch: 47, step: 1330, loss: 0.31658539175987244, mean loss: 0.3423215705362505
Epoch: 47, step: 1331, loss: 0.3310777246952057, mean loss: 0.3423214080529291
Epoch: 47, step: 1332, loss: 0.3083760738372803, mean loss: 0.3423209175205059
Epoch: 47, step: 1333, loss: 0.34356769919395447, mean loss: 0.3423209355370614
Epoch: 47, step: 1334, loss: 0.319942831993103, mean loss: 0.3423206121680811
Epoch: 47, step: 1335, loss: 0.34459149837493896, mean loss: 0.34232064498245895
Epoch: 47, step: 1336, loss: 0.33842894434928894, mean loss: 0.3423205887480737
Epoch: 47, step: 1337, loss: 0.35043513774871826, mean loss: 0.3423207060001761
Epoch: 47, step: 1338, loss: 0.332101970911026, mean loss: 0.34232055834553005
Epoch: 47, step: 1339, loss: 0.3588024377822876, mean loss: 0.3423207964954468
Epoch: 47, step: 1340, loss: 0.3166802227497101, mean loss: 0.3423204260151083
Epoch: 47, step: 1341, loss: 0.3410699665546417, mean loss: 0.3423204079474958
Epoch: 47, step: 1342, loss: 0.3210710883140564, mean loss: 0.3423201009252069
Epoch: 47, step: 1343, loss: 0.33350130915641785, mean loss: 0.34231997350811494
Epoch: 47, step: 1344, loss: 0.3197087049484253, mean loss: 0.3423196468170517
Epoch: 47, step: 1345, loss: 0.36510515213012695, mean loss: 0.34231997602075775
Epoch: 47, step: 1346, loss: 0.313454270362854, mean loss: 0.34231955897668265
Epoch: 47, step: 1347, loss: 0.33254146575927734, mean loss: 0.34231941770742097
Epoch: 47, step: 1348, loss: 0.341562956571579, mean loss: 0.3423194067785865
Epoch: 47, step: 1349, loss: 0.32611024379730225, mean loss: 0.34231917260303996
Epoch: 47, step: 1350, loss: 0.3212825357913971, mean loss: 0.3423188686888428
Epoch: 47, step: 1351, loss: 0.3183467388153076, mean loss: 0.34231852237087296
Epoch: 47, step: 1352, loss: 0.3134622573852539, mean loss: 0.3423181054993313
Epoch: 47, step: 1353, loss: 0.3507660925388336, mean loss: 0.3423182275412694
Epoch: 47, step: 1354, loss: 0.3372267484664917, mean loss: 0.3423181539894286
Epoch: 47, step: 1355, loss: 0.32076725363731384, mean loss: 0.3423178426682055
Epoch: 47, step: 1356, loss: 0.3325376808643341, mean loss: 0.34231770138742823
Epoch: 47, step: 1357, loss: 0.352446973323822, mean loss: 0.3423178477092139
Epoch: 47, step: 1358, loss: 0.3649880588054657, mean loss: 0.3423181751856479
Epoch: 47, step: 1359, loss: 0.34759894013404846, mean loss: 0.34231825146641504
Epoch: 47, step: 1360, loss: 0.36408963799476624, mean loss: 0.342318565950035
Epoch: 47, step: 1361, loss: 0.3039950430393219, mean loss: 0.34231801238188664
Epoch: 47, step: 1362, loss: 0.3240426182746887, mean loss: 0.3423177484048517
Epoch: 47, step: 1363, loss: 0.3359210193157196, mean loss: 0.3423176560092963
Epoch: 47, step: 1364, loss: 0.29996415972709656, mean loss: 0.3423170442562843
Epoch: 47, step: 1365, loss: 0.30626925826072693, mean loss: 0.34231652359033987
Epoch: 47, step: 1366, loss: 0.33450937271118164, mean loss: 0.3423164108272738
Epoch: 47, step: 1367, loss: 0.38718363642692566, mean loss: 0.3423170588604589
Epoch: 47, step: 1368, loss: 0.30264538526535034, mean loss: 0.3423164858767421
Epoch: 47, step: 1369, loss: 0.30243104696273804, mean loss: 0.34231590981390214
Epoch: 47, step: 1370, loss: 0.32535064220428467, mean loss: 0.34231566478916736
Epoch: 47, step: 1371, loss: 0.3764208257198334, mean loss: 0.34231615735359444
Epoch: 47, step: 1372, loss: 0.2941044270992279, mean loss: 0.34231546106483124
Epoch: 47, step: 1373, loss: 0.3280180096626282, mean loss: 0.3423152545795853
Epoch: 47, step: 1374, loss: 0.3479427695274353, mean loss: 0.34231533585155427
Epoch: 47, step: 1375, loss: 0.33342963457107544, mean loss: 0.34231520752706
Epoch: 47, step: 1376, loss: 0.3519875705242157, mean loss: 0.3423153472102573
Epoch: 47, step: 1377, loss: 0.34919682145118713, mean loss: 0.3423154465874667
Epoch: 47, step: 1378, loss: 0.3592448830604553, mean loss: 0.3423156910664546
Epoch: 47, step: 1379, loss: 0.3317895233631134, mean loss: 0.3423155390596428
Epoch: 47, step: 1380, loss: 0.3314018249511719, mean loss: 0.3423153814586073
Epoch: 47, step: 1381, loss: 0.34682342410087585, mean loss: 0.342315446556696
Epoch: 47, step: 1382, loss: 0.319475919008255, mean loss: 0.3423151167487864
Epoch: 47, step: 1383, loss: 0.3251040577888489, mean loss: 0.34231486822081664
Epoch: 47, step: 1384, loss: 0.3540107011795044, mean loss: 0.342315037106395
Epoch: 47, step: 1385, loss: 0.3584345877170563, mean loss: 0.3423152698662444
Epoch: 47, step: 1386, loss: 0.32830697298049927, mean loss: 0.3423150675949732
Epoch: 47, step: 1387, loss: 0.32118934392929077, mean loss: 0.3423147625568008
Epoch: 47, step: 1388, loss: 0.3171228766441345, mean loss: 0.34231439881182324
Epoch: 47, step: 1389, loss: 0.3140179514884949, mean loss: 0.34231399024606446
Epoch: 47, step: 1390, loss: 0.34952229261398315, mean loss: 0.3423140943235471
Epoch: 47, step: 1391, loss: 0.3668046295642853, mean loss: 0.3423144479264238
Epoch: 47, step: 1392, loss: 0.3949766755104065, mean loss: 0.3423152082710273
Epoch: 47, step: 1393, loss: 0.345246821641922, mean loss: 0.3423152505974598
Epoch: 47, step: 1394, loss: 0.33979272842407227, mean loss: 0.3423152141779837
Epoch: 47, step: 1395, loss: 0.3270799219608307, mean loss: 0.34231499421823236
Epoch: 47, step: 1396, loss: 0.2891820967197418, mean loss: 0.34231422712233256
Epoch: 47, step: 1397, loss: 0.28575578331947327, mean loss: 0.3423134105825612
Epoch: 47, step: 1398, loss: 0.31756898760795593, mean loss: 0.3423130533500699
Epoch: 47, step: 1399, loss: 0.33708685636520386, mean loss: 0.34231297790113263
Epoch: 47, step: 1400, loss: 0.34907716512680054, mean loss: 0.3423130755521342
Epoch: 47, step: 1401, loss: 0.3974305987358093, mean loss: 0.3423138712432441
Epoch: 47, step: 1402, loss: 0.3378024995326996, mean loss: 0.3423138061168317
Epoch: 47, step: 1403, loss: 0.3412872850894928, mean loss: 0.3423137912981311
Epoch: 47, step: 1404, loss: 0.2732085883617401, mean loss: 0.3423127937203889
Epoch: 47, step: 1405, loss: 0.32237815856933594, mean loss: 0.34231250595535223
Epoch: 47, step: 1406, loss: 0.33071261644363403, mean loss: 0.3423123385083726
Epoch: 47, step: 1407, loss: 0.3515491485595703, mean loss: 0.34231247184185104
Epoch: 47, step: 1408, loss: 0.31851649284362793, mean loss: 0.3423121283515296
Epoch: 47, step: 1409, loss: 0.3164258301258087, mean loss: 0.342311754693251
Epoch: 47, step: 1410, loss: 0.35444122552871704, mean loss: 0.34231192977474517
Epoch: 47, step: 1411, loss: 0.370212197303772, mean loss: 0.3423123324922326
Epoch: 47, step: 1412, loss: 0.3178142011165619, mean loss: 0.34231197888689524
Epoch: 47, step: 1413, loss: 0.3232392370700836, mean loss: 0.3423117035954513
Epoch: 47, step: 1414, loss: 0.33213889598846436, mean loss: 0.34231155676567193
Epoch: 47, step: 1415, loss: 0.3344736397266388, mean loss: 0.3423114436382971
Epoch: 47, step: 1416, loss: 0.30309754610061646, mean loss: 0.34231087765868334
Epoch: 47, step: 1417, loss: 0.2929917275905609, mean loss: 0.34231016583883417
Epoch: 47, step: 1418, loss: 0.3247348964214325, mean loss: 0.34230991217985896
Epoch: 47, step: 1419, loss: 0.33851778507232666, mean loss: 0.34230985744993303
Epoch: 47, step: 1420, loss: 0.3645966649055481, mean loss: 0.34231017909994177
Epoch: 47, step: 1421, loss: 0.3692990839481354, mean loss: 0.342310568606434
Epoch: 47, step: 1422, loss: 0.32397693395614624, mean loss: 0.3423103040174592
Epoch: 47, step: 1423, loss: 0.3034849464893341, mean loss: 0.342309743702307
Epoch: 47, step: 1424, loss: 0.35138508677482605, mean loss: 0.34230987467286783
Epoch: 47, step: 1425, loss: 0.3060755431652069, mean loss: 0.34230935176566796
Epoch: 47, step: 1426, loss: 0.30414992570877075, mean loss: 0.34230880108486766
Epoch: 47, step: 1427, loss: 0.342507541179657, mean loss: 0.3423088039528556
Epoch: 47, step: 1428, loss: 0.32135820388793945, mean loss: 0.34230850162230647
Epoch: 47, step: 1429, loss: 0.3356906473636627, mean loss: 0.3423084061238179
Epoch: 47, step: 1430, loss: 0.36310526728630066, mean loss: 0.3423087062271551
Epoch: 47, step: 1431, loss: 0.32132646441459656, mean loss: 0.342308403453103
Epoch: 47, step: 1432, loss: 0.33066603541374207, mean loss: 0.3423082354559884
Epoch: 47, step: 1433, loss: 0.3560349941253662, mean loss: 0.3423084335275977
Epoch: 47, step: 1434, loss: 0.31741800904273987, mean loss: 0.342308074373961
Epoch: 47, step: 1435, loss: 0.3333815038204193, mean loss: 0.3423079455708536
Epoch: 47, step: 1436, loss: 0.311735063791275, mean loss: 0.3423075044355563
Epoch: 47, step: 1437, loss: 0.33230507373809814, mean loss: 0.34230736011283247
Epoch: 47, step: 1438, loss: 0.31147924065589905, mean loss: 0.3423069153075537
Epoch: 47, step: 1439, loss: 0.37150511145591736, mean loss: 0.3423073365893126
Epoch: 47, step: 1440, loss: 0.36086004972457886, mean loss: 0.3423076042704671
Epoch: 47, step: 1441, loss: 0.34345200657844543, mean loss: 0.3423076207818263
Epoch: 47, step: 1442, loss: 0.32601577043533325, mean loss: 0.3423073857275009
Epoch: 47, step: 1443, loss: 0.3105257749557495, mean loss: 0.34230692719779793
Valid: 47, mean loss: 0.18497942884763083
Epoch: 48, step: 0, loss: 0.30221548676490784, mean loss: 0.3423063487862383
Epoch: 48, step: 1, loss: 0.31270450353622437, mean loss: 0.34230592171746066
Epoch: 48, step: 2, loss: 0.30481019616127014, mean loss: 0.34230538077068784
Epoch: 48, step: 3, loss: 0.34711459279060364, mean loss: 0.34230545015166797
Epoch: 48, step: 4, loss: 0.3103159964084625, mean loss: 0.3423049886565983
Epoch: 48, step: 5, loss: 0.3512674570083618, mean loss: 0.3423051179515628
Epoch: 48, step: 6, loss: 0.2931252419948578, mean loss: 0.3423044084797592
Epoch: 48, step: 7, loss: 0.33238255977630615, mean loss: 0.3423042653486469
Epoch: 48, step: 8, loss: 0.3647918403148651, mean loss: 0.3423045897463758
Epoch: 48, step: 9, loss: 0.35222920775413513, mean loss: 0.34230473291330704
Epoch: 48, step: 10, loss: 0.2980099022388458, mean loss: 0.34230409395032685
Epoch: 48, step: 11, loss: 0.3404746353626251, mean loss: 0.3423040675603524
Epoch: 48, step: 12, loss: 0.33547964692115784, mean loss: 0.3423039691193767
Epoch: 48, step: 13, loss: 0.34004083275794983, mean loss: 0.34230393647453405
Epoch: 48, step: 14, loss: 0.3374629318714142, mean loss: 0.34230386664597373
Epoch: 48, step: 15, loss: 0.32793083786964417, mean loss: 0.34230365932672646
Epoch: 48, step: 16, loss: 0.3083604872226715, mean loss: 0.34230316973114444
Epoch: 48, step: 17, loss: 0.3266032636165619, mean loss: 0.3423029432793038
Epoch: 48, step: 18, loss: 0.35942572355270386, mean loss: 0.3423031902507923
Epoch: 48, step: 19, loss: 0.36919066309928894, mean loss: 0.34230357805833933
Epoch: 48, step: 20, loss: 0.32008081674575806, mean loss: 0.3423032575362025
Epoch: 48, step: 21, loss: 0.3587455153465271, mean loss: 0.34230349468187143
Epoch: 48, step: 22, loss: 0.32629430294036865, mean loss: 0.3423032637856179
Epoch: 48, step: 23, loss: 0.3542032241821289, mean loss: 0.342303435413061
Epoch: 48, step: 24, loss: 0.3030184209346771, mean loss: 0.3423028688322387
Epoch: 48, step: 25, loss: 0.3359281122684479, mean loss: 0.3423027768948225
Epoch: 48, step: 26, loss: 0.31482169032096863, mean loss: 0.34230238056538925
Epoch: 48, step: 27, loss: 0.335531622171402, mean loss: 0.3423022829196091
Epoch: 48, step: 28, loss: 0.312282532453537, mean loss: 0.34230184999031094
Epoch: 48, step: 29, loss: 0.3907885253429413, mean loss: 0.34230254922995434
Epoch: 48, step: 30, loss: 0.32887187600135803, mean loss: 0.34230235554532534
Epoch: 48, step: 31, loss: 0.3593862056732178, mean loss: 0.3423026019091078
Epoch: 48, step: 32, loss: 0.40471765398979187, mean loss: 0.34230350197475173
Epoch: 48, step: 33, loss: 0.35712355375289917, mean loss: 0.34230371568645507
Epoch: 48, step: 34, loss: 0.3059900403022766, mean loss: 0.34230319203474147
Epoch: 48, step: 35, loss: 0.3078037202358246, mean loss: 0.34230269455144274
Epoch: 48, step: 36, loss: 0.33051571249961853, mean loss: 0.34230252458529975
Epoch: 48, step: 37, loss: 0.32535216212272644, mean loss: 0.34230228016767233
Epoch: 48, step: 38, loss: 0.3480369746685028, mean loss: 0.342302362858542
Epoch: 48, step: 39, loss: 0.3172060549259186, mean loss: 0.34230200098998836
Epoch: 48, step: 40, loss: 0.3436780273914337, mean loss: 0.34230202083089506
Epoch: 48, step: 41, loss: 0.3314695656299591, mean loss: 0.3423018646401173
Epoch: 48, step: 42, loss: 0.36254826188087463, mean loss: 0.34230215656423585
Epoch: 48, step: 43, loss: 0.29815107583999634, mean loss: 0.3423015199779171
Epoch: 48, step: 44, loss: 0.344469279050827, mean loss: 0.34230155123300415
Epoch: 48, step: 45, loss: 0.3304101228713989, mean loss: 0.3423013797830148
Epoch: 48, step: 46, loss: 0.3310836851596832, mean loss: 0.34230121804921493
Epoch: 48, step: 47, loss: 0.31652864813804626, mean loss: 0.34230084647237075
Epoch: 48, step: 48, loss: 0.3918951749801636, mean loss: 0.3423015614898663
Epoch: 48, step: 49, loss: 0.3314618170261383, mean loss: 0.34230140521201297
Epoch: 48, step: 50, loss: 0.34223634004592896, mean loss: 0.34230140427397443
Epoch: 48, step: 51, loss: 0.3113217055797577, mean loss: 0.3423009576489428
Epoch: 48, step: 52, loss: 0.3489472270011902, mean loss: 0.34230105346483486
Epoch: 48, step: 53, loss: 0.33928006887435913, mean loss: 0.34230100991346113
Epoch: 48, step: 54, loss: 0.32059088349342346, mean loss: 0.34230069693861115
Epoch: 48, step: 55, loss: 0.32886481285095215, mean loss: 0.3423005032486664
Epoch: 48, step: 56, loss: 0.3192029595375061, mean loss: 0.3423001702823023
Epoch: 48, step: 57, loss: 0.30794838070869446, mean loss: 0.34229967508568165
Epoch: 48, step: 58, loss: 0.3487863838672638, mean loss: 0.3422997685931816
Epoch: 48, step: 59, loss: 0.34702643752098083, mean loss: 0.34229983672829273
Epoch: 48, step: 60, loss: 0.3424232602119446, mean loss: 0.34229983850742124
Epoch: 48, step: 61, loss: 0.2926829755306244, mean loss: 0.342299123299087
Epoch: 48, step: 62, loss: 0.31086939573287964, mean loss: 0.34229867025796895
Epoch: 48, step: 63, loss: 0.29378679394721985, mean loss: 0.3422979709977592
Epoch: 48, step: 64, loss: 0.36305853724479675, mean loss: 0.34229827024053777
Epoch: 48, step: 65, loss: 0.3393230438232422, mean loss: 0.34229822735624565
Epoch: 48, step: 66, loss: 0.3631974458694458, mean loss: 0.3422985285888739
Epoch: 48, step: 67, loss: 0.3003047704696655, mean loss: 0.3422979233170647
Epoch: 48, step: 68, loss: 0.36242911219596863, mean loss: 0.34229821347126943
Epoch: 48, step: 69, loss: 0.34489819407463074, mean loss: 0.3422982509446862
Epoch: 48, step: 70, loss: 0.32088568806648254, mean loss: 0.3422979423307191
Epoch: 48, step: 71, loss: 0.31481215357780457, mean loss: 0.34229754619056063
Epoch: 48, step: 72, loss: 0.3661729395389557, mean loss: 0.3422978902907746
Epoch: 48, step: 73, loss: 0.3154585063457489, mean loss: 0.3422975034781043
Epoch: 48, step: 74, loss: 0.3412330746650696, mean loss: 0.3422974881376397
Epoch: 48, step: 75, loss: 0.36117252707481384, mean loss: 0.34229776015929964
Epoch: 48, step: 76, loss: 0.31612563133239746, mean loss: 0.3422973829795042
Epoch: 48, step: 77, loss: 0.32778167724609375, mean loss: 0.34229717378933655
Epoch: 48, step: 78, loss: 0.3634715676307678, mean loss: 0.3422974789354483
Epoch: 48, step: 79, loss: 0.3346702754497528, mean loss: 0.3422973690207105
Epoch: 48, step: 80, loss: 0.33158448338508606, mean loss: 0.3422972146407927
Epoch: 48, step: 81, loss: 0.32616516947746277, mean loss: 0.34229698217047594
Epoch: 48, step: 82, loss: 0.3354478180408478, mean loss: 0.34229688347223935
Epoch: 48, step: 83, loss: 0.33921974897384644, mean loss: 0.34229683913056985
Epoch: 48, step: 84, loss: 0.2954978346824646, mean loss: 0.3422961647641787
Epoch: 48, step: 85, loss: 0.339220255613327, mean loss: 0.34229612044144386
Epoch: 48, step: 86, loss: 0.33819544315338135, mean loss: 0.34229606135302343
Epoch: 48, step: 87, loss: 0.33687132596969604, mean loss: 0.34229598318680754
Epoch: 48, step: 88, loss: 0.34170255064964294, mean loss: 0.3422959746360296
Epoch: 48, step: 89, loss: 0.3028111457824707, mean loss: 0.3422954057067646
Epoch: 48, step: 90, loss: 0.29666924476623535, mean loss: 0.34229474829770534
Epoch: 48, step: 91, loss: 0.3675403296947479, mean loss: 0.34229511204592444
Epoch: 48, step: 92, loss: 0.31579944491386414, mean loss: 0.3422947302914812
Epoch: 48, step: 93, loss: 0.332469642162323, mean loss: 0.34229458873184476
Epoch: 48, step: 94, loss: 0.3419007360935211, mean loss: 0.34229458305730703
Epoch: 48, step: 95, loss: 0.3399121165275574, mean loss: 0.34229454873177495
Epoch: 48, step: 96, loss: 0.3246259391307831, mean loss: 0.34229429417387036
Epoch: 48, step: 97, loss: 0.36981499195098877, mean loss: 0.3422946906685797
Epoch: 48, step: 98, loss: 0.33722782135009766, mean loss: 0.3422946176705056
Epoch: 48, step: 99, loss: 0.3270140290260315, mean loss: 0.34229439752717816
Epoch: 48, step: 100, loss: 0.3152143359184265, mean loss: 0.3422940073976403
Epoch: 48, step: 101, loss: 0.327569842338562, mean loss: 0.34229379527666964
Epoch: 48, step: 102, loss: 0.31053775548934937, mean loss: 0.3422933377957248
Epoch: 48, step: 103, loss: 0.36040550470352173, mean loss: 0.34229359871780196
Epoch: 48, step: 104, loss: 0.33793729543685913, mean loss: 0.3422935359622337
Epoch: 48, step: 105, loss: 0.3450450897216797, mean loss: 0.3422935755997018
Epoch: 48, step: 106, loss: 0.325187623500824, mean loss: 0.34229332918370475
Epoch: 48, step: 107, loss: 0.36751478910446167, mean loss: 0.34229369250061514
Epoch: 48, step: 108, loss: 0.3142186999320984, mean loss: 0.3422932880841912
Epoch: 48, step: 109, loss: 0.3100811541080475, mean loss: 0.34229282407949563
Epoch: 48, step: 110, loss: 0.34498199820518494, mean loss: 0.34229286281556476
Epoch: 48, step: 111, loss: 0.32718315720558167, mean loss: 0.34229264517172964
Epoch: 48, step: 112, loss: 0.3372504413127899, mean loss: 0.3422925725436582
Epoch: 48, step: 113, loss: 0.32000505924224854, mean loss: 0.3422922515182023
Epoch: 48, step: 114, loss: 0.33967283368110657, mean loss: 0.3422922137891079
Epoch: 48, step: 115, loss: 0.35535043478012085, mean loss: 0.3422924018720282
Epoch: 48, step: 116, loss: 0.31730639934539795, mean loss: 0.34229204199355484
Epoch: 48, step: 117, loss: 0.3086124062538147, mean loss: 0.34229155690590196
Epoch: 48, step: 118, loss: 0.32520559430122375, mean loss: 0.3422913108203983
Epoch: 48, step: 119, loss: 0.3439829349517822, mean loss: 0.3422913351841518
Epoch: 48, step: 120, loss: 0.3382333517074585, mean loss: 0.34229127673955806
Epoch: 48, step: 121, loss: 0.3084203004837036, mean loss: 0.34229078892413256
Epoch: 48, step: 122, loss: 0.3126879930496216, mean loss: 0.34229036258588996
Epoch: 48, step: 123, loss: 0.3361928164958954, mean loss: 0.3422902747705479
Epoch: 48, step: 124, loss: 0.3157814145088196, mean loss: 0.34228989300203455
Epoch: 48, step: 125, loss: 0.35307425260543823, mean loss: 0.34229004831122556
Epoch: 48, step: 126, loss: 0.37788885831832886, mean loss: 0.34229056097428245
Epoch: 48, step: 127, loss: 0.306803822517395, mean loss: 0.34229004993254203
Epoch: 48, step: 128, loss: 0.33009883761405945, mean loss: 0.3422898743703768
Epoch: 48, step: 129, loss: 0.3192862570285797, mean loss: 0.34228954310662657
Epoch: 48, step: 130, loss: 0.31126081943511963, mean loss: 0.3422890962837118
Epoch: 48, step: 131, loss: 0.38193780183792114, mean loss: 0.34228966722872584
Epoch: 48, step: 132, loss: 0.30325260758399963, mean loss: 0.342289105099564
Epoch: 48, step: 133, loss: 0.34431344270706177, mean loss: 0.3422891342493726
Epoch: 48, step: 134, loss: 0.36527979373931885, mean loss: 0.34228946530268645
Epoch: 48, step: 135, loss: 0.32297536730766296, mean loss: 0.3422891871939145
Epoch: 48, step: 136, loss: 0.3315545916557312, mean loss: 0.3422890326258784
Epoch: 48, step: 137, loss: 0.35376137495040894, mean loss: 0.34228919781439276
Epoch: 48, step: 138, loss: 0.35286176204681396, mean loss: 0.34228935004494715
Epoch: 48, step: 139, loss: 0.2936760187149048, mean loss: 0.3422886500891312
Epoch: 48, step: 140, loss: 0.3252063989639282, mean loss: 0.34228840413501654
Epoch: 48, step: 141, loss: 0.33463263511657715, mean loss: 0.34228829390711
Epoch: 48, step: 142, loss: 0.30144673585891724, mean loss: 0.3422877058780545
Epoch: 48, step: 143, loss: 0.33359357714653015, mean loss: 0.34228758070342985
Epoch: 48, step: 144, loss: 0.341831237077713, mean loss: 0.34228757413326955
Epoch: 48, step: 145, loss: 0.3048412501811981, mean loss: 0.3422870350114412
Epoch: 48, step: 146, loss: 0.3547383248806, mean loss: 0.3422872142724422
Epoch: 48, step: 147, loss: 0.37666741013526917, mean loss: 0.3422877092363907
Epoch: 48, step: 148, loss: 0.3315665125846863, mean loss: 0.34228755488795554
Epoch: 48, step: 149, loss: 0.37599676847457886, mean loss: 0.3422880401779499
Epoch: 48, step: 150, loss: 0.3262128233909607, mean loss: 0.3422878087566639
Epoch: 48, step: 151, loss: 0.31417474150657654, mean loss: 0.34228740404246305
Epoch: 48, step: 152, loss: 0.3212642967700958, mean loss: 0.3422871013993007
Epoch: 48, step: 153, loss: 0.3223372995853424, mean loss: 0.3422868142112977
Epoch: 48, step: 154, loss: 0.3536139726638794, mean loss: 0.34228697726941815
Epoch: 48, step: 155, loss: 0.37497758865356445, mean loss: 0.3422874478545996
Epoch: 48, step: 156, loss: 0.34096336364746094, mean loss: 0.3422874287945266
Epoch: 48, step: 157, loss: 0.3315028250217438, mean loss: 0.342287273553361
Epoch: 48, step: 158, loss: 0.34417301416397095, mean loss: 0.34228730069764585
Epoch: 48, step: 159, loss: 0.318742573261261, mean loss: 0.34228696178805007
Epoch: 48, step: 160, loss: 0.34816280007362366, mean loss: 0.3422870463653432
Epoch: 48, step: 161, loss: 0.3299661874771118, mean loss: 0.3422868690204532
Epoch: 48, step: 162, loss: 0.29909101128578186, mean loss: 0.3422862472736704
Epoch: 48, step: 163, loss: 0.3079807758331299, mean loss: 0.3422857534992528
Epoch: 48, step: 164, loss: 0.3259035348892212, mean loss: 0.34228551770584476
Epoch: 48, step: 165, loss: 0.332956999540329, mean loss: 0.3422853834400604
Epoch: 48, step: 166, loss: 0.33967432379722595, mean loss: 0.3422853458595016
Epoch: 48, step: 167, loss: 0.3396197557449341, mean loss: 0.34228530749464675
Epoch: 48, step: 168, loss: 0.335668683052063, mean loss: 0.34228521226538344
Epoch: 48, step: 169, loss: 0.34146568179130554, mean loss: 0.3422852004705233
Epoch: 48, step: 170, loss: 0.3502403497695923, mean loss: 0.34228531496110803
Epoch: 48, step: 171, loss: 0.3078266978263855, mean loss: 0.34228481903949826
Epoch: 48, step: 172, loss: 0.34313660860061646, mean loss: 0.3422848312981089
Epoch: 48, step: 173, loss: 0.31411463022232056, mean loss: 0.34228442588980973
Epoch: 48, step: 174, loss: 0.31434616446495056, mean loss: 0.3422840238252304
Epoch: 48, step: 175, loss: 0.3156747817993164, mean loss: 0.3422836408923207
Epoch: 48, step: 176, loss: 0.33198246359825134, mean loss: 0.34228349265047964
Epoch: 48, step: 177, loss: 0.2982492744922638, mean loss: 0.3422828589734303
Epoch: 48, step: 178, loss: 0.30296793580055237, mean loss: 0.34228229321781917
Epoch: 48, step: 179, loss: 0.3209340274333954, mean loss: 0.3422819860131656
Epoch: 48, step: 180, loss: 0.32528170943260193, mean loss: 0.3422817413802302
Epoch: 48, step: 181, loss: 0.3533652424812317, mean loss: 0.342281900868835
Epoch: 48, step: 182, loss: 0.33664774894714355, mean loss: 0.34228181979606825
Epoch: 48, step: 183, loss: 0.30079469084739685, mean loss: 0.342281222824603
Epoch: 48, step: 184, loss: 0.3404555916786194, mean loss: 0.342281196555395
Epoch: 48, step: 185, loss: 0.34873953461647034, mean loss: 0.3422812894837967
Epoch: 48, step: 186, loss: 0.3290213346481323, mean loss: 0.3422810986903344
Epoch: 48, step: 187, loss: 0.36888688802719116, mean loss: 0.3422814815074472
Epoch: 48, step: 188, loss: 0.32953372597694397, mean loss: 0.3422812980891434
Epoch: 48, step: 189, loss: 0.3307447135448456, mean loss: 0.34228113209989786
Epoch: 48, step: 190, loss: 0.3513776659965515, mean loss: 0.3422812629796282
Epoch: 48, step: 191, loss: 0.3316728472709656, mean loss: 0.3422811103493377
Epoch: 48, step: 192, loss: 0.3003147542476654, mean loss: 0.3422805065603139
Epoch: 48, step: 193, loss: 0.3154509663581848, mean loss: 0.34228012055708823
Epoch: 48, step: 194, loss: 0.3105851709842682, mean loss: 0.342279664560576
Epoch: 48, step: 195, loss: 0.30937203764915466, mean loss: 0.3422791911240376
Epoch: 48, step: 196, loss: 0.2984044551849365, mean loss: 0.34227855991461237
Epoch: 48, step: 197, loss: 0.35801705718040466, mean loss: 0.34227878633523195
Epoch: 48, step: 198, loss: 0.32423925399780273, mean loss: 0.3422785268146908
Epoch: 48, step: 199, loss: 0.30173417925834656, mean loss: 0.3422779435434922
Epoch: 48, step: 200, loss: 0.30454492568969727, mean loss: 0.3422774007239066
Epoch: 48, step: 201, loss: 0.3215254247188568, mean loss: 0.3422771021944592
Epoch: 48, step: 202, loss: 0.3462843596935272, mean loss: 0.3422771598403989
Epoch: 48, step: 203, loss: 0.2979627251625061, mean loss: 0.34227652236938966
Epoch: 48, step: 204, loss: 0.3223321735858917, mean loss: 0.3422762354705191
Epoch: 48, step: 205, loss: 0.3209417760372162, mean loss: 0.3422759285793624
Epoch: 48, step: 206, loss: 0.3125317394733429, mean loss: 0.3422755007223865
Epoch: 48, step: 207, loss: 0.37083858251571655, mean loss: 0.34227591158374715
Epoch: 48, step: 208, loss: 0.2940274775028229, mean loss: 0.34227521757137563
Epoch: 48, step: 209, loss: 0.3460768461227417, mean loss: 0.3422752722537575
Epoch: 48, step: 210, loss: 0.3319775462150574, mean loss: 0.34227512413405553
Epoch: 48, step: 211, loss: 0.3771492540836334, mean loss: 0.34227562574687914
Epoch: 48, step: 212, loss: 0.32835984230041504, mean loss: 0.3422754255917774
Epoch: 48, step: 213, loss: 0.3373529314994812, mean loss: 0.3422753547910109
Epoch: 48, step: 214, loss: 0.34303417801856995, mean loss: 0.3422753657050907
Epoch: 48, step: 215, loss: 0.3252755403518677, mean loss: 0.342275121201792
Epoch: 48, step: 216, loss: 0.2962739169597626, mean loss: 0.3422744595900294
Epoch: 48, step: 217, loss: 0.31240811944007874, mean loss: 0.34227403004393203
Epoch: 48, step: 218, loss: 0.33053117990493774, mean loss: 0.3422738611573902
Epoch: 48, step: 219, loss: 0.4327908456325531, mean loss: 0.34227516296065313
Epoch: 48, step: 220, loss: 0.30598801374435425, mean loss: 0.3422746410911924
Epoch: 48, step: 221, loss: 0.3934691846370697, mean loss: 0.3422753773431489
Epoch: 48, step: 222, loss: 0.3385912775993347, mean loss: 0.34227532436120106
Epoch: 48, step: 223, loss: 0.361392080783844, mean loss: 0.34227559928004053
Epoch: 48, step: 224, loss: 0.29848378896713257, mean loss: 0.3422749695173198
Epoch: 48, step: 225, loss: 0.3377051055431366, mean loss: 0.3422749037998132
Epoch: 48, step: 226, loss: 0.3144678473472595, mean loss: 0.342274503922673
Epoch: 48, step: 227, loss: 0.3249574601650238, mean loss: 0.3422742548998982
Epoch: 48, step: 228, loss: 0.32904040813446045, mean loss: 0.3422740645971018
Epoch: 48, step: 229, loss: 0.3015635013580322, mean loss: 0.3422734791873747
Epoch: 48, step: 230, loss: 0.3181155323982239, mean loss: 0.34227313180594465
Epoch: 48, step: 231, loss: 0.3193475306034088, mean loss: 0.34227280214988226
Epoch: 48, step: 232, loss: 0.3591032326221466, mean loss: 0.3422730441576538
Epoch: 48, step: 233, loss: 0.3385530114173889, mean loss: 0.34227299066740646
Epoch: 48, step: 234, loss: 0.3172256350517273, mean loss: 0.3422726305173552
Epoch: 48, step: 235, loss: 0.3460814952850342, mean loss: 0.3422726852833408
Epoch: 48, step: 236, loss: 0.3478209674358368, mean loss: 0.34227276505849435
Epoch: 48, step: 237, loss: 0.37211504578590393, mean loss: 0.34227319413514035
Epoch: 48, step: 238, loss: 0.3306388854980469, mean loss: 0.3422730268577664
Epoch: 48, step: 239, loss: 0.37627580761909485, mean loss: 0.3422735157406276
Epoch: 48, step: 240, loss: 0.3037125766277313, mean loss: 0.34227296132975943
Epoch: 48, step: 241, loss: 0.3288416564464569, mean loss: 0.34227276822361336
Epoch: 48, step: 242, loss: 0.3172338306903839, mean loss: 0.3422724082360131
Epoch: 48, step: 243, loss: 0.3652340769767761, mean loss: 0.3422727383537419
Epoch: 48, step: 244, loss: 0.42824020981788635, mean loss: 0.34227397428213824
Epoch: 48, step: 245, loss: 0.31032034754753113, mean loss: 0.34227351490109315
Epoch: 48, step: 246, loss: 0.3143455982208252, mean loss: 0.3422731134014068
Epoch: 48, step: 247, loss: 0.32484644651412964, mean loss: 0.34227286287428077
Epoch: 48, step: 248, loss: 0.32273101806640625, mean loss: 0.34227258194323024
Epoch: 48, step: 249, loss: 0.33771106600761414, mean loss: 0.34227251636840583
Epoch: 48, step: 250, loss: 0.321397602558136, mean loss: 0.34227221628195453
Epoch: 48, step: 251, loss: 0.34659627079963684, mean loss: 0.342272278441326
Epoch: 48, step: 252, loss: 0.36842966079711914, mean loss: 0.3422726544548724
Epoch: 48, step: 253, loss: 0.3104649484157562, mean loss: 0.34227219722424196
Epoch: 48, step: 254, loss: 0.3202759921550751, mean loss: 0.3422718810368964
Epoch: 48, step: 255, loss: 0.31276649236679077, mean loss: 0.34227145691389915
Epoch: 48, step: 256, loss: 0.30779409408569336, mean loss: 0.34227096132875595
Epoch: 48, step: 257, loss: 0.34469130635261536, mean loss: 0.34227099611882383
Epoch: 48, step: 258, loss: 0.3152424693107605, mean loss: 0.3422706076160453
Epoch: 48, step: 259, loss: 0.29743921756744385, mean loss: 0.3422699632276412
Epoch: 48, step: 260, loss: 0.3301893472671509, mean loss: 0.3422697895882127
Epoch: 48, step: 261, loss: 0.32822924852371216, mean loss: 0.34226958778091304
Epoch: 48, step: 262, loss: 0.3457784056663513, mean loss: 0.3422696382130781
Epoch: 48, step: 263, loss: 0.2996217608451843, mean loss: 0.34226902524485103
Epoch: 48, step: 264, loss: 0.3501596748828888, mean loss: 0.34226913865373093
Epoch: 48, step: 265, loss: 0.35741403698921204, mean loss: 0.342269356321648
Epoch: 48, step: 266, loss: 0.31425485014915466, mean loss: 0.3422689536928926
Epoch: 48, step: 267, loss: 0.3334210216999054, mean loss: 0.34226882653089213
Epoch: 48, step: 268, loss: 0.34605827927589417, mean loss: 0.3422688809919195
Epoch: 48, step: 269, loss: 0.36244750022888184, mean loss: 0.3422691709896091
Epoch: 48, step: 270, loss: 0.30430513620376587, mean loss: 0.3422686253960764
Epoch: 48, step: 271, loss: 0.3193739652633667, mean loss: 0.3422682963741729
Epoch: 48, step: 272, loss: 0.35630106925964355, mean loss: 0.34226849803793497
Epoch: 48, step: 273, loss: 0.2975042164325714, mean loss: 0.3422678547435711
Epoch: 48, step: 274, loss: 0.3037397265434265, mean loss: 0.3422673010750956
Epoch: 48, step: 275, loss: 0.3082060217857361, mean loss: 0.34226681160450745
Epoch: 48, step: 276, loss: 0.39011386036872864, mean loss: 0.3422674991707717
Epoch: 48, step: 277, loss: 0.3189908266067505, mean loss: 0.3422671646877632
Epoch: 48, step: 278, loss: 0.316904217004776, mean loss: 0.34226680023046724
Epoch: 48, step: 279, loss: 0.290335088968277, mean loss: 0.3422660539994168
Epoch: 48, step: 280, loss: 0.3281862735748291, mean loss: 0.34226585168337315
Epoch: 48, step: 281, loss: 0.3453593850135803, mean loss: 0.34226589613452313
Epoch: 48, step: 282, loss: 0.37493184208869934, mean loss: 0.3422663655065463
Epoch: 48, step: 283, loss: 0.32852545380592346, mean loss: 0.34226616806830706
Epoch: 48, step: 284, loss: 0.28367218375205994, mean loss: 0.34226532616442734
Epoch: 48, step: 285, loss: 0.30426132678985596, mean loss: 0.3422647801142625
Epoch: 48, step: 286, loss: 0.29264363646507263, mean loss: 0.3422640671565526
Epoch: 48, step: 287, loss: 0.36224237084388733, mean loss: 0.3422643542011458
Epoch: 48, step: 288, loss: 0.3176593780517578, mean loss: 0.3422640006864528
Epoch: 48, step: 289, loss: 0.3089243471622467, mean loss: 0.34226352168220686
Epoch: 48, step: 290, loss: 0.33507323265075684, mean loss: 0.3422634183779092
Epoch: 48, step: 291, loss: 0.33902662992477417, mean loss: 0.34226337187500055
Epoch: 48, step: 292, loss: 0.31743675470352173, mean loss: 0.3422630151963543
Epoch: 48, step: 293, loss: 0.3041897416114807, mean loss: 0.3422624682137151
Epoch: 48, step: 294, loss: 0.3267945945262909, mean loss: 0.34226224599650007
Epoch: 48, step: 295, loss: 0.31519660353660583, mean loss: 0.34226185716701985
Epoch: 48, step: 296, loss: 0.3197847008705139, mean loss: 0.342261534261127
Epoch: 48, step: 297, loss: 0.3361016809940338, mean loss: 0.3422614457702023
Epoch: 48, step: 298, loss: 0.33605968952178955, mean loss: 0.34226135667858965
Epoch: 48, step: 299, loss: 0.34482496976852417, mean loss: 0.3422613935057615
Epoch: 48, step: 300, loss: 0.30858373641967773, mean loss: 0.34226090972174006
Epoch: 48, step: 301, loss: 0.3416290581226349, mean loss: 0.34226090064523823
Epoch: 48, step: 302, loss: 0.2984386384487152, mean loss: 0.3422602711507012
Epoch: 48, step: 303, loss: 0.32552310824394226, mean loss: 0.3422600307294919
Epoch: 48, step: 304, loss: 0.33325061202049255, mean loss: 0.34225990131543055
Epoch: 48, step: 305, loss: 0.35732781887054443, mean loss: 0.34226011775252374
Epoch: 48, step: 306, loss: 0.34959158301353455, mean loss: 0.3422602230609203
Epoch: 48, step: 307, loss: 0.3261467516422272, mean loss: 0.34225999161203463
Epoch: 48, step: 308, loss: 0.3204001188278198, mean loss: 0.3422596776281392
Epoch: 48, step: 309, loss: 0.3640625774860382, mean loss: 0.34225999078920694
Epoch: 48, step: 310, loss: 0.33136793971061707, mean loss: 0.3422598343459184
Epoch: 48, step: 311, loss: 0.3548990786075592, mean loss: 0.34226001588165694
Epoch: 48, step: 312, loss: 0.32179951667785645, mean loss: 0.342259722014523
Epoch: 48, step: 313, loss: 0.3289129137992859, mean loss: 0.3422595303216465
Epoch: 48, step: 314, loss: 0.3452971875667572, mean loss: 0.3422595739492227
Epoch: 48, step: 315, loss: 0.314956933259964, mean loss: 0.34225918182765247
Epoch: 48, step: 316, loss: 0.3078101873397827, mean loss: 0.3422586870769812
Epoch: 48, step: 317, loss: 0.2988792061805725, mean loss: 0.34225806407711196
Epoch: 48, step: 318, loss: 0.3721407353878021, mean loss: 0.34225849323468993
Epoch: 48, step: 319, loss: 0.3065672814846039, mean loss: 0.3422579806655874
Epoch: 48, step: 320, loss: 0.34642037749290466, mean loss: 0.3422580404417973
Epoch: 48, step: 321, loss: 0.3496248126029968, mean loss: 0.34225814623454454
Epoch: 48, step: 322, loss: 0.34789547324180603, mean loss: 0.3422582271899119
Epoch: 48, step: 323, loss: 0.3554176688194275, mean loss: 0.34225841616460356
Epoch: 48, step: 324, loss: 0.3229202926158905, mean loss: 0.3422581384656282
Epoch: 48, step: 325, loss: 0.32321056723594666, mean loss: 0.34225786494296484
Epoch: 48, step: 326, loss: 0.3141249716281891, mean loss: 0.3422574609610967
Epoch: 48, step: 327, loss: 0.3412017524242401, mean loss: 0.34225744580158296
Epoch: 48, step: 328, loss: 0.3117976486682892, mean loss: 0.3422570084184734
Epoch: 48, step: 329, loss: 0.3474763333797455, mean loss: 0.3422570833635491
Epoch: 48, step: 330, loss: 0.3264692425727844, mean loss: 0.342256856666813
Epoch: 48, step: 331, loss: 0.3597679138183594, mean loss: 0.3422571081035075
Epoch: 48, step: 332, loss: 0.31187373399734497, mean loss: 0.3422566718428412
Epoch: 48, step: 333, loss: 0.33525997400283813, mean loss: 0.3422565713819699
Epoch: 48, step: 334, loss: 0.3482528626918793, mean loss: 0.3422566574774415
Epoch: 48, step: 335, loss: 0.30933764576911926, mean loss: 0.3422561848290997
Epoch: 48, step: 336, loss: 0.3701549768447876, mean loss: 0.3422565853918072
Epoch: 48, step: 337, loss: 0.30177488923072815, mean loss: 0.3422560041757819
Epoch: 48, step: 338, loss: 0.2979487478733063, mean loss: 0.3422553680434033
Epoch: 48, step: 339, loss: 0.3642458915710449, mean loss: 0.3422556837633184
Epoch: 48, step: 340, loss: 0.31063219904899597, mean loss: 0.34225522974863537
Epoch: 48, step: 341, loss: 0.32580772042274475, mean loss: 0.34225499361705175
Epoch: 48, step: 342, loss: 0.3779238164424896, mean loss: 0.34225550569547863
Epoch: 48, step: 343, loss: 0.3326489329338074, mean loss: 0.3422553677809736
Epoch: 48, step: 344, loss: 0.3164551854133606, mean loss: 0.34225499739203397
Epoch: 48, step: 345, loss: 0.3589875102043152, mean loss: 0.3422552376015262
Epoch: 48, step: 346, loss: 0.3077782988548279, mean loss: 0.34225474266277106
Epoch: 48, step: 347, loss: 0.43716859817504883, mean loss: 0.3422561051929966
Epoch: 48, step: 348, loss: 0.36815521121025085, mean loss: 0.34225647698074035
Epoch: 48, step: 349, loss: 0.3377823531627655, mean loss: 0.34225641275456514
Epoch: 48, step: 350, loss: 0.3349989354610443, mean loss: 0.3422563085747668
Epoch: 48, step: 351, loss: 0.34985554218292236, mean loss: 0.3422564176588505
Epoch: 48, step: 352, loss: 0.34016022086143494, mean loss: 0.3422563875691814
Epoch: 48, step: 353, loss: 0.3705609440803528, mean loss: 0.3422567938585695
Epoch: 48, step: 354, loss: 0.3078685998916626, mean loss: 0.34225630025049153
Epoch: 48, step: 355, loss: 0.3176034092903137, mean loss: 0.34225594638801576
Epoch: 48, step: 356, loss: 0.33715593814849854, mean loss: 0.34225587318460765
Epoch: 48, step: 357, loss: 0.36383527517318726, mean loss: 0.34225618292196935
Epoch: 48, step: 358, loss: 0.30928659439086914, mean loss: 0.3422557097037217
Epoch: 48, step: 359, loss: 0.3464188277721405, mean loss: 0.34225576945682296
Epoch: 48, step: 360, loss: 0.3185461163520813, mean loss: 0.3422554291578104
Epoch: 48, step: 361, loss: 0.35320478677749634, mean loss: 0.3422555863090809
Epoch: 48, step: 362, loss: 0.30915552377700806, mean loss: 0.3422551112453919
Epoch: 48, step: 363, loss: 0.3445354402065277, mean loss: 0.342255143973002
Epoch: 48, step: 364, loss: 0.32943180203437805, mean loss: 0.3422549599331906
Epoch: 48, step: 365, loss: 0.31557995080947876, mean loss: 0.3422545771006018
Epoch: 48, step: 366, loss: 0.28418833017349243, mean loss: 0.3422537437613328
Epoch: 48, step: 367, loss: 0.3125542402267456, mean loss: 0.34225331753424415
Epoch: 48, step: 368, loss: 0.37591269612312317, mean loss: 0.3422538005838357
Epoch: 48, step: 369, loss: 0.3342316746711731, mean loss: 0.34225368545904145
Epoch: 48, step: 370, loss: 0.3036312460899353, mean loss: 0.3422531311999055
Epoch: 48, step: 371, loss: 0.36336246132850647, mean loss: 0.3422534341292742
Epoch: 48, step: 372, loss: 0.3155062794685364, mean loss: 0.3422530502998323
Epoch: 48, step: 373, loss: 0.3152918219566345, mean loss: 0.34225266340392285
Epoch: 48, step: 374, loss: 0.3138827681541443, mean loss: 0.34225225629936606
Epoch: 48, step: 375, loss: 0.3365020155906677, mean loss: 0.3422521737852932
Epoch: 48, step: 376, loss: 0.3455377519130707, mean loss: 0.34225222093158786
Epoch: 48, step: 377, loss: 0.3477875292301178, mean loss: 0.3422523003591714
Epoch: 48, step: 378, loss: 0.3432750701904297, mean loss: 0.3422523150349521
Epoch: 48, step: 379, loss: 0.3367752134799957, mean loss: 0.34225223644484776
Epoch: 48, step: 380, loss: 0.3565044105052948, mean loss: 0.3422524409442101
Epoch: 48, step: 381, loss: 0.35588163137435913, mean loss: 0.34225263650179655
Epoch: 48, step: 382, loss: 0.3544919490814209, mean loss: 0.3422528121142878
Epoch: 48, step: 383, loss: 0.3235996961593628, mean loss: 0.3422525444789005
Epoch: 48, step: 384, loss: 0.32553890347480774, mean loss: 0.3422523046745904
Epoch: 48, step: 385, loss: 0.41907671093940735, mean loss: 0.3422534069215166
Epoch: 48, step: 386, loss: 0.33205029368400574, mean loss: 0.3422532605332867
Epoch: 48, step: 387, loss: 0.3003498911857605, mean loss: 0.3422526593371698
Epoch: 48, step: 388, loss: 0.3621522784233093, mean loss: 0.3422529448369343
Epoch: 48, step: 389, loss: 0.33762797713279724, mean loss: 0.342252878483491
Epoch: 48, step: 390, loss: 0.32837697863578796, mean loss: 0.3422526794117172
Epoch: 48, step: 391, loss: 0.3316461145877838, mean loss: 0.34225252724591865
Epoch: 48, step: 392, loss: 0.3412095606327057, mean loss: 0.342252512283339
Epoch: 48, step: 393, loss: 0.31166085600852966, mean loss: 0.342252073416437
Epoch: 48, step: 394, loss: 0.29820945858955383, mean loss: 0.3422514415915869
Epoch: 48, step: 395, loss: 0.3735728859901428, mean loss: 0.34225189091511354
Epoch: 48, step: 396, loss: 0.3438372015953064, mean loss: 0.34225191365695
Epoch: 48, step: 397, loss: 0.32056155800819397, mean loss: 0.34225160250567116
Epoch: 48, step: 398, loss: 0.3136707544326782, mean loss: 0.34225119251516645
Epoch: 48, step: 399, loss: 0.3421509861946106, mean loss: 0.34225119107773355
Epoch: 48, step: 400, loss: 0.3686988353729248, mean loss: 0.34225157045667715
Epoch: 48, step: 401, loss: 0.33196383714675903, mean loss: 0.3422514228861273
Epoch: 48, step: 402, loss: 0.38301122188568115, mean loss: 0.34225200754938484
Epoch: 48, step: 403, loss: 0.3174549341201782, mean loss: 0.3422516518624058
Epoch: 48, step: 404, loss: 0.367156445980072, mean loss: 0.3422520090893966
Epoch: 48, step: 405, loss: 0.31601855158805847, mean loss: 0.342251632809849
Epoch: 48, step: 406, loss: 0.3387799561023712, mean loss: 0.342251583014575
Epoch: 48, step: 407, loss: 0.2905823290348053, mean loss: 0.34225084191798893
Epoch: 48, step: 408, loss: 0.3494410514831543, mean loss: 0.34225094504630843
Epoch: 48, step: 409, loss: 0.34126201272010803, mean loss: 0.3422509308623733
Epoch: 48, step: 410, loss: 0.3136732876300812, mean loss: 0.34225052098839726
Epoch: 48, step: 411, loss: 0.3204997479915619, mean loss: 0.34225020903307346
Epoch: 48, step: 412, loss: 0.32898378372192383, mean loss: 0.3422500187652311
Epoch: 48, step: 413, loss: 0.3507075607776642, mean loss: 0.34225014006205023
Epoch: 48, step: 414, loss: 0.3172077536582947, mean loss: 0.3422497809129917
Epoch: 48, step: 415, loss: 0.35621148347854614, mean loss: 0.3422499811439257
Epoch: 48, step: 416, loss: 0.3290878236293793, mean loss: 0.342249792382327
Epoch: 48, step: 417, loss: 0.3349285423755646, mean loss: 0.34224968738806333
Epoch: 48, step: 418, loss: 0.32001471519470215, mean loss: 0.3422493685202399
Epoch: 48, step: 419, loss: 0.33277782797813416, mean loss: 0.34224923269249163
Epoch: 48, step: 420, loss: 0.3309505879878998, mean loss: 0.34224907066526344
Epoch: 48, step: 421, loss: 0.36408016085624695, mean loss: 0.34224938372761743
Epoch: 48, step: 422, loss: 0.3389001488685608, mean loss: 0.34224933569958477
Epoch: 48, step: 423, loss: 0.33109015226364136, mean loss: 0.342249175679173
Epoch: 48, step: 424, loss: 0.3506041169166565, mean loss: 0.3422492954856063
Epoch: 48, step: 425, loss: 0.283907026052475, mean loss: 0.34224845889336913
Epoch: 48, step: 426, loss: 0.3455938696861267, mean loss: 0.34224850686381314
Epoch: 48, step: 427, loss: 0.30120667815208435, mean loss: 0.34224791836612584
Epoch: 48, step: 428, loss: 0.3169780969619751, mean loss: 0.34224755602802626
Epoch: 48, step: 429, loss: 0.3014754354953766, mean loss: 0.3422469714144429
Epoch: 48, step: 430, loss: 0.39325565099716187, mean loss: 0.34224770279507727
Epoch: 48, step: 431, loss: 0.31170889735221863, mean loss: 0.34224726492507496
Epoch: 48, step: 432, loss: 0.2980749309062958, mean loss: 0.3422466315845628
Epoch: 48, step: 433, loss: 0.3446945250034332, mean loss: 0.3422466666818217
Epoch: 48, step: 434, loss: 0.3442755937576294, mean loss: 0.3422466957716331
Epoch: 48, step: 435, loss: 0.33820971846580505, mean loss: 0.34224663789216264
Epoch: 48, step: 436, loss: 0.2945028245449066, mean loss: 0.3422459533832328
Epoch: 48, step: 437, loss: 0.3726765215396881, mean loss: 0.34224638966377985
Epoch: 48, step: 438, loss: 0.3598560094833374, mean loss: 0.34224664212782796
Epoch: 48, step: 439, loss: 0.3455495536327362, mean loss: 0.34224668948004017
Epoch: 48, step: 440, loss: 0.30120542645454407, mean loss: 0.34224610110014214
Epoch: 48, step: 441, loss: 0.3248826563358307, mean loss: 0.3422458521761412
Epoch: 48, step: 442, loss: 0.3222585916519165, mean loss: 0.3422455656409749
Epoch: 48, step: 443, loss: 0.3060973286628723, mean loss: 0.3422450474312585
Epoch: 48, step: 444, loss: 0.32241150736808777, mean loss: 0.34224476310796387
Epoch: 48, step: 445, loss: 0.3377877473831177, mean loss: 0.342244699215425
Epoch: 48, step: 446, loss: 0.35030505061149597, mean loss: 0.34224481476110935
Epoch: 48, step: 447, loss: 0.33198803663253784, mean loss: 0.34224466773160633
Epoch: 48, step: 448, loss: 0.3357940912246704, mean loss: 0.3422445752648053
Epoch: 48, step: 449, loss: 0.34204256534576416, mean loss: 0.34224457236910394
Epoch: 48, step: 450, loss: 0.3538689613342285, mean loss: 0.34224473899595437
Epoch: 48, step: 451, loss: 0.3561916947364807, mean loss: 0.3422449389121825
Epoch: 48, step: 452, loss: 0.30750399827957153, mean loss: 0.3422444409412711
Epoch: 48, step: 453, loss: 0.32880428433418274, mean loss: 0.342244248295045
Epoch: 48, step: 454, loss: 0.3318632245063782, mean loss: 0.34224409949942836
Epoch: 48, step: 455, loss: 0.330559104681015, mean loss: 0.34224393201584247
Epoch: 48, step: 456, loss: 0.3108034133911133, mean loss: 0.3422434813784731
Epoch: 48, step: 457, loss: 0.3677174746990204, mean loss: 0.3422438464923232
Epoch: 48, step: 458, loss: 0.35129237174987793, mean loss: 0.34224397618123775
Epoch: 48, step: 459, loss: 0.29927584528923035, mean loss: 0.3422433603449296
Epoch: 48, step: 460, loss: 0.3829464912414551, mean loss: 0.34224394370999767
Epoch: 48, step: 461, loss: 0.32370761036872864, mean loss: 0.34224367804752537
Epoch: 48, step: 462, loss: 0.3481948971748352, mean loss: 0.34224376333909295
Epoch: 48, step: 463, loss: 0.2959127426147461, mean loss: 0.34224309934257946
Epoch: 48, step: 464, loss: 0.30262070894241333, mean loss: 0.3422425314994449
Epoch: 48, step: 465, loss: 0.32334381341934204, mean loss: 0.3422422606588063
Epoch: 48, step: 466, loss: 0.35654598474502563, mean loss: 0.3422424656448922
Epoch: 48, step: 467, loss: 0.3205875754356384, mean loss: 0.3422421553139921
Epoch: 48, step: 468, loss: 0.3503163456916809, mean loss: 0.34224227102156835
Epoch: 48, step: 469, loss: 0.3734177350997925, mean loss: 0.34224271777666393
Epoch: 48, step: 470, loss: 0.35301464796066284, mean loss: 0.3422428721399069
Epoch: 48, step: 471, loss: 0.3160635232925415, mean loss: 0.34224249699160864
Epoch: 48, step: 472, loss: 0.33112162351608276, mean loss: 0.34224233763252754
Epoch: 48, step: 473, loss: 0.3211885690689087, mean loss: 0.34224203594209446
Epoch: 48, step: 474, loss: 0.3560333251953125, mean loss: 0.342242233561841
Epoch: 48, step: 475, loss: 0.3962179124355316, mean loss: 0.3422430069853361
Epoch: 48, step: 476, loss: 0.30968862771987915, mean loss: 0.34224254051670544
Epoch: 48, step: 477, loss: 0.3174628019332886, mean loss: 0.3422421854552556
Epoch: 48, step: 478, loss: 0.3582521378993988, mean loss: 0.3422424148537804
Epoch: 48, step: 479, loss: 0.44315069913864136, mean loss: 0.34224386069691837
Epoch: 48, step: 480, loss: 0.3360998332500458, mean loss: 0.34224377266477407
Epoch: 48, step: 481, loss: 0.40318989753723145, mean loss: 0.3422446458934882
Epoch: 48, step: 482, loss: 0.359456330537796, mean loss: 0.34224489249689305
Epoch: 48, step: 483, loss: 0.29409998655319214, mean loss: 0.3422442027022638
Epoch: 48, step: 484, loss: 0.2998344302177429, mean loss: 0.3422435950862848
Epoch: 48, step: 485, loss: 0.3373863399028778, mean loss: 0.3422435254961077
Epoch: 48, step: 486, loss: 0.33725932240486145, mean loss: 0.3422434540881636
Epoch: 48, step: 487, loss: 0.3202931880950928, mean loss: 0.34224313961443875
Epoch: 48, step: 488, loss: 0.3087458908557892, mean loss: 0.3422426597180367
Epoch: 48, step: 489, loss: 0.3570213317871094, mean loss: 0.34224287144079635
Epoch: 48, step: 490, loss: 0.312570720911026, mean loss: 0.3422424463566233
Epoch: 48, step: 491, loss: 0.3507969081401825, mean loss: 0.3422425689063595
Epoch: 48, step: 492, loss: 0.2893139719963074, mean loss: 0.3422418106713203
Epoch: 48, step: 493, loss: 0.33477362990379333, mean loss: 0.3422417036865229
Epoch: 48, step: 494, loss: 0.34840402007102966, mean loss: 0.34224179196300497
Epoch: 48, step: 495, loss: 0.35825860500335693, mean loss: 0.34224202140394355
Epoch: 48, step: 496, loss: 0.30113542079925537, mean loss: 0.34224143256008954
Epoch: 48, step: 497, loss: 0.31933829188346863, mean loss: 0.34224110448186756
Epoch: 48, step: 498, loss: 0.3443930149078369, mean loss: 0.34224113530667205
Epoch: 48, step: 499, loss: 0.333706259727478, mean loss: 0.3422410130515357
Epoch: 48, step: 500, loss: 0.2895384132862091, mean loss: 0.3422402581405626
Epoch: 48, step: 501, loss: 0.3098047971725464, mean loss: 0.3422397935423306
Epoch: 48, step: 502, loss: 0.31007450819015503, mean loss: 0.3422393328206325
Epoch: 48, step: 503, loss: 0.3419531583786011, mean loss: 0.34223932872165175
Epoch: 48, step: 504, loss: 0.30451083183288574, mean loss: 0.3422387883303876
Epoch: 48, step: 505, loss: 0.3854396939277649, mean loss: 0.3422394070949698
Epoch: 48, step: 506, loss: 0.30247029662132263, mean loss: 0.34223883749198963
Epoch: 48, step: 507, loss: 0.3456709384918213, mean loss: 0.3422388866484061
Epoch: 48, step: 508, loss: 0.3699096441268921, mean loss: 0.3422392829583627
Epoch: 48, step: 509, loss: 0.3377628028392792, mean loss: 0.34223921884561714
Epoch: 48, step: 510, loss: 0.3883216977119446, mean loss: 0.34223987883557555
Epoch: 48, step: 511, loss: 0.2956898808479309, mean loss: 0.3422392121593899
Epoch: 48, step: 512, loss: 0.2974465489387512, mean loss: 0.3422385706604537
Epoch: 48, step: 513, loss: 0.35017383098602295, mean loss: 0.3422386843038004
Epoch: 48, step: 514, loss: 0.3556647002696991, mean loss: 0.34223887657922347
Epoch: 48, step: 515, loss: 0.29002413153648376, mean loss: 0.34223812881693555
Epoch: 48, step: 516, loss: 0.30019477009773254, mean loss: 0.3422375267267049
Epoch: 48, step: 517, loss: 0.31563228368759155, mean loss: 0.34223714572651814
Epoch: 48, step: 518, loss: 0.30747950077056885, mean loss: 0.3422366479870478
Epoch: 48, step: 519, loss: 0.31464099884033203, mean loss: 0.3422362528150758
Epoch: 48, step: 520, loss: 0.313831627368927, mean loss: 0.3422358460643212
Epoch: 48, step: 521, loss: 0.35353249311447144, mean loss: 0.3422360078286058
Epoch: 48, step: 522, loss: 0.30873236060142517, mean loss: 0.34223552807422436
Epoch: 48, step: 523, loss: 0.3473484218120575, mean loss: 0.34223560128709074
Epoch: 48, step: 524, loss: 0.3366420269012451, mean loss: 0.342235521192379
Epoch: 48, step: 525, loss: 0.29696738719940186, mean loss: 0.34223487300465893
Epoch: 48, step: 526, loss: 0.3186492919921875, mean loss: 0.342234535291046
Epoch: 48, step: 527, loss: 0.33726757764816284, mean loss: 0.34223446417195036
Epoch: 48, step: 528, loss: 0.3359529972076416, mean loss: 0.34223437423241676
Epoch: 48, step: 529, loss: 0.2954692542552948, mean loss: 0.3422337046479264
Epoch: 48, step: 530, loss: 0.3345215320587158, mean loss: 0.3422335942263725
Epoch: 48, step: 531, loss: 0.3305094540119171, mean loss: 0.3422334263645631
Epoch: 48, step: 532, loss: 0.3211618959903717, mean loss: 0.342233124674673
Epoch: 48, step: 533, loss: 0.3765697479248047, mean loss: 0.34223361627939264
Epoch: 48, step: 534, loss: 0.31143808364868164, mean loss: 0.3422331753795311
Epoch: 48, step: 535, loss: 0.36166805028915405, mean loss: 0.3422334536247909
Epoch: 48, step: 536, loss: 0.3903079628944397, mean loss: 0.3422341418881772
Epoch: 48, step: 537, loss: 0.3197278380393982, mean loss: 0.34223381967910277
Epoch: 48, step: 538, loss: 0.34422767162323, mean loss: 0.3422338482234607
Epoch: 48, step: 539, loss: 0.3046422004699707, mean loss: 0.34223331006209445
Epoch: 48, step: 540, loss: 0.3390384316444397, mean loss: 0.3422332643249261
Epoch: 48, step: 541, loss: 0.3698813021183014, mean loss: 0.3422336601224151
Epoch: 48, step: 542, loss: 0.32919612526893616, mean loss: 0.34223347348531175
Epoch: 48, step: 543, loss: 0.4123396575450897, mean loss: 0.34223447706673726
Epoch: 48, step: 544, loss: 0.32557058334350586, mean loss: 0.3422342385238035
Epoch: 48, step: 545, loss: 0.34540238976478577, mean loss: 0.34223428387510535
Epoch: 48, step: 546, loss: 0.3090328872203827, mean loss: 0.34223380861212344
Epoch: 48, step: 547, loss: 0.3662714958190918, mean loss: 0.34223415269582236
Epoch: 48, step: 548, loss: 0.3395799398422241, mean loss: 0.3422341147030531
Epoch: 48, step: 549, loss: 0.31858766078948975, mean loss: 0.3422337762292918
Epoch: 48, step: 550, loss: 0.30348867177963257, mean loss: 0.3422332216423939
Epoch: 48, step: 551, loss: 0.3426274359226227, mean loss: 0.3422332272849892
Epoch: 48, step: 552, loss: 0.3227485120296478, mean loss: 0.34223294839405305
Epoch: 48, step: 553, loss: 0.33551356196403503, mean loss: 0.34223285221871125
Epoch: 48, step: 554, loss: 0.3647005259990692, mean loss: 0.3422331737964773
Epoch: 48, step: 555, loss: 0.311543732881546, mean loss: 0.3422327345475949
Epoch: 48, step: 556, loss: 0.3231891393661499, mean loss: 0.3422324619861559
Epoch: 48, step: 557, loss: 0.3220979571342468, mean loss: 0.34223217381519766
Epoch: 48, step: 558, loss: 0.3162803649902344, mean loss: 0.3422318023905891
Epoch: 48, step: 559, loss: 0.3229886293411255, mean loss: 0.34223152698451725
Epoch: 48, step: 560, loss: 0.31367433071136475, mean loss: 0.3422311182830693
Epoch: 48, step: 561, loss: 0.3234662711620331, mean loss: 0.34223084973042994
Epoch: 48, step: 562, loss: 0.3407069146633148, mean loss: 0.3422308279209835
Epoch: 48, step: 563, loss: 0.3409024178981781, mean loss: 0.34223080891002094
Epoch: 48, step: 564, loss: 0.317134290933609, mean loss: 0.34223044975725286
Epoch: 48, step: 565, loss: 0.36872196197509766, mean loss: 0.3422308288681636
Epoch: 48, step: 566, loss: 0.3158190846443176, mean loss: 0.3422304509041941
Epoch: 48, step: 567, loss: 0.3003249764442444, mean loss: 0.3422298512265401
Epoch: 48, step: 568, loss: 0.3235998749732971, mean loss: 0.34222958463080944
Epoch: 48, step: 569, loss: 0.34934765100479126, mean loss: 0.342229686489176
Epoch: 48, step: 570, loss: 0.3279707431793213, mean loss: 0.3422294824489472
Epoch: 48, step: 571, loss: 0.309365838766098, mean loss: 0.3422290121890353
Epoch: 48, step: 572, loss: 0.3148803412914276, mean loss: 0.34222862085082395
Epoch: 48, step: 573, loss: 0.3886081874370575, mean loss: 0.34222928449685586
Epoch: 48, step: 574, loss: 0.31772175431251526, mean loss: 0.3422289338231943
Epoch: 48, step: 575, loss: 0.3371250629425049, mean loss: 0.3422288607939063
Epoch: 48, step: 576, loss: 0.29801875352859497, mean loss: 0.3422282282178605
Epoch: 48, step: 577, loss: 0.312004029750824, mean loss: 0.34222779576402634
Epoch: 48, step: 578, loss: 0.3562595546245575, mean loss: 0.3422279965303462
Epoch: 48, step: 579, loss: 0.33518460392951965, mean loss: 0.34222789575496987
Epoch: 48, step: 580, loss: 0.34358587861061096, mean loss: 0.34222791518442425
Epoch: 48, step: 581, loss: 0.33775222301483154, mean loss: 0.34222785114899673
Epoch: 48, step: 582, loss: 0.34455788135528564, mean loss: 0.34222788448514674
Epoch: 48, step: 583, loss: 0.4001079201698303, mean loss: 0.3422287125731015
Epoch: 48, step: 584, loss: 0.3332856297492981, mean loss: 0.3422285846265112
Epoch: 48, step: 585, loss: 0.3676392734050751, mean loss: 0.34222894816607996
Epoch: 48, step: 586, loss: 0.33379143476486206, mean loss: 0.34222882745600686
Epoch: 48, step: 587, loss: 0.3386629819869995, mean loss: 0.34222877644248084
Epoch: 48, step: 588, loss: 0.3612643778324127, mean loss: 0.3422290487647851
Epoch: 48, step: 589, loss: 0.3212065100669861, mean loss: 0.34222874802176345
Epoch: 48, step: 590, loss: 0.3037969470024109, mean loss: 0.3422281982341861
Epoch: 48, step: 591, loss: 0.32302263379096985, mean loss: 0.3422279234921907
Epoch: 48, step: 592, loss: 0.3230392336845398, mean loss: 0.34222764899551944
Epoch: 48, step: 593, loss: 0.3069484531879425, mean loss: 0.3422271443293133
Epoch: 48, step: 594, loss: 0.35558128356933594, mean loss: 0.3422273353565243
Epoch: 48, step: 595, loss: 0.3259172737598419, mean loss: 0.3422271020490116
Epoch: 48, step: 596, loss: 0.34131067991256714, mean loss: 0.34222708894022535
Epoch: 48, step: 597, loss: 0.3452993929386139, mean loss: 0.3422271328867852
Epoch: 48, step: 598, loss: 0.3210853636264801, mean loss: 0.34222683047701763
Epoch: 48, step: 599, loss: 0.31457263231277466, mean loss: 0.3422264349197719
Epoch: 48, step: 600, loss: 0.31187617778778076, mean loss: 0.3422260008051275
Epoch: 48, step: 601, loss: 0.31083911657333374, mean loss: 0.3422255518695176
Epoch: 48, step: 602, loss: 0.33260223269462585, mean loss: 0.3422254142263913
Epoch: 48, step: 603, loss: 0.3220880329608917, mean loss: 0.34222512620388906
Epoch: 48, step: 604, loss: 0.3082888722419739, mean loss: 0.34222464082474
Epoch: 48, step: 605, loss: 0.33766481280326843, mean loss: 0.3422245756079429
Epoch: 48, step: 606, loss: 0.33106735348701477, mean loss: 0.34222441603440606
Epoch: 48, step: 607, loss: 0.30928680300712585, mean loss: 0.3422239449587049
Epoch: 48, step: 608, loss: 0.3488399386405945, mean loss: 0.3422240395796869
Epoch: 48, step: 609, loss: 0.32038643956184387, mean loss: 0.3422237272659656
Epoch: 48, step: 610, loss: 0.33922791481018066, mean loss: 0.3422236844215159
Epoch: 48, step: 611, loss: 0.34724292159080505, mean loss: 0.34222375620283807
Epoch: 48, step: 612, loss: 0.3528367578983307, mean loss: 0.34222390797976615
Epoch: 48, step: 613, loss: 0.3356679081916809, mean loss: 0.34222381422351256
Epoch: 48, step: 614, loss: 0.2959023118019104, mean loss: 0.3422231517969474
Epoch: 48, step: 615, loss: 0.3179233968257904, mean loss: 0.3422228043001654
Epoch: 48, step: 616, loss: 0.33450302481651306, mean loss: 0.3422226939056297
Epoch: 48, step: 617, loss: 0.34495285153388977, mean loss: 0.34222273294692285
Epoch: 48, step: 618, loss: 0.3531976044178009, mean loss: 0.3422228898854976
Epoch: 48, step: 619, loss: 0.3030145764350891, mean loss: 0.34222232922208956
Epoch: 48, step: 620, loss: 0.30341392755508423, mean loss: 0.34222177428519757
Epoch: 48, step: 621, loss: 0.36205825209617615, mean loss: 0.3422220579308894
Epoch: 48, step: 622, loss: 0.3212100863456726, mean loss: 0.34222175748087746
Epoch: 48, step: 623, loss: 0.3072907328605652, mean loss: 0.3422212580095806
Epoch: 48, step: 624, loss: 0.3825555145740509, mean loss: 0.3422218347322962
Epoch: 48, step: 625, loss: 0.36925336718559265, mean loss: 0.3422222212393804
Epoch: 48, step: 626, loss: 0.3567787706851959, mean loss: 0.342222429371459
Epoch: 48, step: 627, loss: 0.3264801502227783, mean loss: 0.34222220428882894
Epoch: 48, step: 628, loss: 0.3030576705932617, mean loss: 0.34222164432351965
Epoch: 48, step: 629, loss: 0.3296473026275635, mean loss: 0.34222146454110425
Epoch: 48, step: 630, loss: 0.34679585695266724, mean loss: 0.34222152994282296
Epoch: 48, step: 631, loss: 0.3474659323692322, mean loss: 0.34222160492284165
Epoch: 48, step: 632, loss: 0.3650294542312622, mean loss: 0.3422219310054681
Epoch: 48, step: 633, loss: 0.30110031366348267, mean loss: 0.3422213431002649
Epoch: 48, step: 634, loss: 0.34026479721069336, mean loss: 0.3422213151284307
Epoch: 48, step: 635, loss: 0.3166138529777527, mean loss: 0.34222094903558814
Epoch: 48, step: 636, loss: 0.3213024437427521, mean loss: 0.34222064998191626
Epoch: 48, step: 637, loss: 0.30871298909187317, mean loss: 0.34222017095888707
Epoch: 48, step: 638, loss: 0.3345397412776947, mean loss: 0.34222006116160497
Epoch: 48, step: 639, loss: 0.3326278626918793, mean loss: 0.3422199240361694
Epoch: 48, step: 640, loss: 0.34972772002220154, mean loss: 0.3422200313624597
Epoch: 48, step: 641, loss: 0.3502660095691681, mean loss: 0.34222014638058884
Epoch: 48, step: 642, loss: 0.34028160572052, mean loss: 0.34222011866933644
Epoch: 48, step: 643, loss: 0.33302807807922363, mean loss: 0.3422199872718782
Epoch: 48, step: 644, loss: 0.31906816363334656, mean loss: 0.3422196563282465
Epoch: 48, step: 645, loss: 0.33183613419532776, mean loss: 0.342219507903161
Epoch: 48, step: 646, loss: 0.3151945173740387, mean loss: 0.34221912160560775
Epoch: 48, step: 647, loss: 0.32259005308151245, mean loss: 0.3422188410300142
Epoch: 48, step: 648, loss: 0.30598685145378113, mean loss: 0.3422183231416253
Epoch: 48, step: 649, loss: 0.334789901971817, mean loss: 0.34221821696368343
Epoch: 48, step: 650, loss: 0.32182982563972473, mean loss: 0.34221792554691566
Epoch: 48, step: 651, loss: 0.31573233008384705, mean loss: 0.342217546986578
Epoch: 48, step: 652, loss: 0.31261157989501953, mean loss: 0.34221712383261405
Epoch: 48, step: 653, loss: 0.3075747489929199, mean loss: 0.34221662870105246
Epoch: 48, step: 654, loss: 0.31200993061065674, mean loss: 0.3422161969732652
Epoch: 48, step: 655, loss: 0.35052287578582764, mean loss: 0.3422163156943779
Epoch: 48, step: 656, loss: 0.34395265579223633, mean loss: 0.3422163405102263
Epoch: 48, step: 657, loss: 0.39029985666275024, mean loss: 0.34221702771211504
Epoch: 48, step: 658, loss: 0.36558598279953003, mean loss: 0.34221736169269396
Epoch: 48, step: 659, loss: 0.34150761365890503, mean loss: 0.342217351549379
Epoch: 48, step: 660, loss: 0.3091830611228943, mean loss: 0.34221687944884843
Epoch: 48, step: 661, loss: 0.29376092553138733, mean loss: 0.3422161869637266
Epoch: 48, step: 662, loss: 0.3745836317539215, mean loss: 0.342216649520994
Epoch: 48, step: 663, loss: 0.34928303956985474, mean loss: 0.34221675050404604
Epoch: 48, step: 664, loss: 0.34514784812927246, mean loss: 0.342216792390632
Epoch: 48, step: 665, loss: 0.3569042384624481, mean loss: 0.34221700227725455
Epoch: 48, step: 666, loss: 0.3076426088809967, mean loss: 0.34221650820912847
Epoch: 48, step: 667, loss: 0.3485735058784485, mean loss: 0.3422165990493352
Epoch: 48, step: 668, loss: 0.3369249403476715, mean loss: 0.34221652343368664
Epoch: 48, step: 669, loss: 0.33497461676597595, mean loss: 0.34221641995126734
Epoch: 48, step: 670, loss: 0.30797263979911804, mean loss: 0.3422159306355742
Epoch: 48, step: 671, loss: 0.33665475249290466, mean loss: 0.3422158511720091
Epoch: 48, step: 672, loss: 0.3322690725326538, mean loss: 0.34221570904471554
Epoch: 48, step: 673, loss: 0.2918963134288788, mean loss: 0.3422149900524083
Epoch: 48, step: 674, loss: 0.34784460067749023, mean loss: 0.3422150704903557
Epoch: 48, step: 675, loss: 0.3029891848564148, mean loss: 0.34221451002448106
Epoch: 48, step: 676, loss: 0.36623936891555786, mean loss: 0.3422148532906928
Epoch: 48, step: 677, loss: 0.29715919494628906, mean loss: 0.34221420954646725
Epoch: 48, step: 678, loss: 0.37799572944641113, mean loss: 0.34221472077676685
Epoch: 48, step: 679, loss: 0.3446936011314392, mean loss: 0.342214756193391
Epoch: 48, step: 680, loss: 0.3417973816394806, mean loss: 0.34221475023030107
Epoch: 48, step: 681, loss: 0.3145306408405304, mean loss: 0.34221435470912226
Epoch: 48, step: 682, loss: 0.3546444773674011, mean loss: 0.34221453229498777
Epoch: 48, step: 683, loss: 0.33823683857917786, mean loss: 0.3422144754675446
Epoch: 48, step: 684, loss: 0.3641441762447357, mean loss: 0.3422147887624112
Epoch: 48, step: 685, loss: 0.3550865352153778, mean loss: 0.3422149726497573
Epoch: 48, step: 686, loss: 0.3448115289211273, mean loss: 0.34221500974394825
Epoch: 48, step: 687, loss: 0.3288533687591553, mean loss: 0.34221481886336275
Epoch: 48, step: 688, loss: 0.31910622119903564, mean loss: 0.34221448874525495
Epoch: 48, step: 689, loss: 0.3078097403049469, mean loss: 0.34221399726289103
Epoch: 48, step: 690, loss: 0.3426826298236847, mean loss: 0.342214003957355
Epoch: 48, step: 691, loss: 0.32705238461494446, mean loss: 0.3422137873751691
Epoch: 48, step: 692, loss: 0.34366992115974426, mean loss: 0.34221380817559455
Epoch: 48, step: 693, loss: 0.32768985629081726, mean loss: 0.34221360070835055
Epoch: 48, step: 694, loss: 0.36206838488578796, mean loss: 0.34221388431976335
Epoch: 48, step: 695, loss: 0.35785168409347534, mean loss: 0.3422141076913748
Epoch: 48, step: 696, loss: 0.3283708691596985, mean loss: 0.3422139099562474
Epoch: 48, step: 697, loss: 0.29135212302207947, mean loss: 0.34221318346307594
Epoch: 48, step: 698, loss: 0.3147677481174469, mean loss: 0.34221279144703065
Epoch: 48, step: 699, loss: 0.341921329498291, mean loss: 0.3422127872840022
Epoch: 48, step: 700, loss: 0.3331102728843689, mean loss: 0.3422126572722272
Epoch: 48, step: 701, loss: 0.3219113051891327, mean loss: 0.342212367310904
Epoch: 48, step: 702, loss: 0.3406479060649872, mean loss: 0.34221234496624575
Epoch: 48, step: 703, loss: 0.29856428503990173, mean loss: 0.3422117215650242
Epoch: 48, step: 704, loss: 0.36702314019203186, mean loss: 0.34221207592780223
Epoch: 48, step: 705, loss: 0.33723723888397217, mean loss: 0.34221200487697184
Epoch: 48, step: 706, loss: 0.3181335926055908, mean loss: 0.3422116609929936
Epoch: 48, step: 707, loss: 0.33597058057785034, mean loss: 0.3422115718601685
Epoch: 48, step: 708, loss: 0.4173414707183838, mean loss: 0.34221264482254915
Epoch: 48, step: 709, loss: 0.32688358426094055, mean loss: 0.3422124259047724
Epoch: 48, step: 710, loss: 0.33671122789382935, mean loss: 0.34221234734204287
Epoch: 48, step: 711, loss: 0.3271966874599457, mean loss: 0.34221213290613683
Epoch: 48, step: 712, loss: 0.30532535910606384, mean loss: 0.34221160614035606
Epoch: 48, step: 713, loss: 0.3101917803287506, mean loss: 0.3422111488841111
Epoch: 48, step: 714, loss: 0.33610230684280396, mean loss: 0.34221106164858706
Epoch: 48, step: 715, loss: 0.2949727475643158, mean loss: 0.342210387085354
Epoch: 48, step: 716, loss: 0.3602393865585327, mean loss: 0.3422106445358313
Epoch: 48, step: 717, loss: 0.3543285131454468, mean loss: 0.34221081757408073
Epoch: 48, step: 718, loss: 0.30397453904151917, mean loss: 0.3422102715833262
Epoch: 48, step: 719, loss: 0.33971649408340454, mean loss: 0.3422102359742118
Epoch: 48, step: 720, loss: 0.30466145277023315, mean loss: 0.3422096998157836
Epoch: 48, step: 721, loss: 0.3237360119819641, mean loss: 0.34220943603407994
Epoch: 48, step: 722, loss: 0.35137805342674255, mean loss: 0.342209566948871
Epoch: 48, step: 723, loss: 0.3342548608779907, mean loss: 0.34220945336862557
Epoch: 48, step: 724, loss: 0.32044002413749695, mean loss: 0.342209142541074
Epoch: 48, step: 725, loss: 0.3674478828907013, mean loss: 0.34220950289888474
Epoch: 48, step: 726, loss: 0.32877740263938904, mean loss: 0.3422093111185872
Epoch: 48, step: 727, loss: 0.33272889256477356, mean loss: 0.34220917576138343
Epoch: 48, step: 728, loss: 0.37091565132141113, mean loss: 0.342209585613835
Epoch: 48, step: 729, loss: 0.33940833806991577, mean loss: 0.34220954562000927
Epoch: 48, step: 730, loss: 0.35924938321113586, mean loss: 0.3422097888968191
Epoch: 48, step: 731, loss: 0.3562578558921814, mean loss: 0.34220998945742376
Epoch: 48, step: 732, loss: 0.30747345089912415, mean loss: 0.3422094935399627
Epoch: 48, step: 733, loss: 0.29979822039604187, mean loss: 0.34220888806251726
Epoch: 48, step: 734, loss: 0.32389965653419495, mean loss: 0.3422086266775682
Epoch: 48, step: 735, loss: 0.31988587975502014, mean loss: 0.34220830799970553
Epoch: 48, step: 736, loss: 0.36889776587486267, mean loss: 0.3422086890109673
Epoch: 48, step: 737, loss: 0.2922067642211914, mean loss: 0.34220797520761553
Epoch: 48, step: 738, loss: 0.3625940680503845, mean loss: 0.342208266225486
Epoch: 48, step: 739, loss: 0.3541921377182007, mean loss: 0.3422084372965688
Epoch: 48, step: 740, loss: 0.360204815864563, mean loss: 0.3422086941931838
Epoch: 48, step: 741, loss: 0.3351222574710846, mean loss: 0.3422085930364087
Epoch: 48, step: 742, loss: 0.35899245738983154, mean loss: 0.34220883261765705
Epoch: 48, step: 743, loss: 0.29322630167007446, mean loss: 0.3422081334265678
Epoch: 48, step: 744, loss: 0.3356439173221588, mean loss: 0.3422080397283491
Epoch: 48, step: 745, loss: 0.32240328192710876, mean loss: 0.34220775703746725
Epoch: 48, step: 746, loss: 0.35206252336502075, mean loss: 0.34220789770128385
Epoch: 48, step: 747, loss: 0.3374828100204468, mean loss: 0.3422078302578399
Epoch: 48, step: 748, loss: 0.3431139290332794, mean loss: 0.34220784319083797
Epoch: 48, step: 749, loss: 0.35869503021240234, mean loss: 0.34220807851365237
Epoch: 48, step: 750, loss: 0.2971215844154358, mean loss: 0.3422074350000418
Epoch: 48, step: 751, loss: 0.3288457989692688, mean loss: 0.342207244293887
Epoch: 48, step: 752, loss: 0.35108721256256104, mean loss: 0.34220737103289034
Epoch: 48, step: 753, loss: 0.3619917929172516, mean loss: 0.34220765340125564
Epoch: 48, step: 754, loss: 0.31367602944374084, mean loss: 0.34220724619638093
Epoch: 48, step: 755, loss: 0.31121453642845154, mean loss: 0.34220680387306973
Epoch: 48, step: 756, loss: 0.32020431756973267, mean loss: 0.34220648986136265
Epoch: 48, step: 757, loss: 0.31619390845298767, mean loss: 0.3422061186242939
Epoch: 48, step: 758, loss: 0.35257822275161743, mean loss: 0.3422062666470726
Epoch: 48, step: 759, loss: 0.31588444113731384, mean loss: 0.34220589100736615
Epoch: 48, step: 760, loss: 0.30603495240211487, mean loss: 0.3422053748179836
Epoch: 48, step: 761, loss: 0.3397369980812073, mean loss: 0.34220533959269694
Epoch: 48, step: 762, loss: 0.38931602239608765, mean loss: 0.34220601188214117
Epoch: 48, step: 763, loss: 0.3300260007381439, mean loss: 0.34220583807069155
Epoch: 48, step: 764, loss: 0.313324511051178, mean loss: 0.34220542593365627
Epoch: 48, step: 765, loss: 0.2949143946170807, mean loss: 0.3422047510994527
Epoch: 48, step: 766, loss: 0.32985982298851013, mean loss: 0.34220457494214296
Epoch: 48, step: 767, loss: 0.3392047882080078, mean loss: 0.34220453213696694
Epoch: 48, step: 768, loss: 0.3055422902107239, mean loss: 0.34220400899600256
Epoch: 48, step: 769, loss: 0.3487894535064697, mean loss: 0.34220410296370485
Epoch: 48, step: 770, loss: 0.31061431765556335, mean loss: 0.34220365221551613
Epoch: 48, step: 771, loss: 0.3250654637813568, mean loss: 0.3422034076776982
Epoch: 48, step: 772, loss: 0.3500021994113922, mean loss: 0.34220351895388756
Epoch: 48, step: 773, loss: 0.34750235080718994, mean loss: 0.34220359455859967
Epoch: 48, step: 774, loss: 0.3284810185432434, mean loss: 0.3422033987651427
Epoch: 48, step: 775, loss: 0.3426264822483063, mean loss: 0.34220340480160377
Epoch: 48, step: 776, loss: 0.335463285446167, mean loss: 0.34220330863645154
Epoch: 48, step: 777, loss: 0.3634367287158966, mean loss: 0.3422036115815233
Epoch: 48, step: 778, loss: 0.33608126640319824, mean loss: 0.3422035242330024
Epoch: 48, step: 779, loss: 0.3089892864227295, mean loss: 0.3422030503666865
Epoch: 48, step: 780, loss: 0.331211656332016, mean loss: 0.34220289355510713
Epoch: 48, step: 781, loss: 0.33422398567199707, mean loss: 0.3422027797235683
Epoch: 48, step: 782, loss: 0.31080567836761475, mean loss: 0.3422023318014432
Epoch: 48, step: 783, loss: 0.2981865406036377, mean loss: 0.3422017038655953
Epoch: 48, step: 784, loss: 0.38562119007110596, mean loss: 0.34220232328563044
Epoch: 48, step: 785, loss: 0.3402385115623474, mean loss: 0.3422022952703986
Epoch: 48, step: 786, loss: 0.339902400970459, mean loss: 0.34220226246116736
Epoch: 48, step: 787, loss: 0.30536264181137085, mean loss: 0.34220173693162886
Epoch: 48, step: 788, loss: 0.3459620177745819, mean loss: 0.3422017905725305
Epoch: 48, step: 789, loss: 0.3041418194770813, mean loss: 0.3422012476497737
Epoch: 48, step: 790, loss: 0.310921311378479, mean loss: 0.34220080145009224
Epoch: 48, step: 791, loss: 0.31483566761016846, mean loss: 0.3422004110995582
Epoch: 48, step: 792, loss: 0.30165496468544006, mean loss: 0.3421998327464248
Epoch: 48, step: 793, loss: 0.37494122982025146, mean loss: 0.34220029977345634
Epoch: 48, step: 794, loss: 0.3139258325099945, mean loss: 0.34219989646897514
Epoch: 48, step: 795, loss: 0.3231215476989746, mean loss: 0.34219962434099016
Epoch: 48, step: 796, loss: 0.3471912443637848, mean loss: 0.34219969553898216
Epoch: 48, step: 797, loss: 0.3290133774280548, mean loss: 0.3421995074585641
Epoch: 48, step: 798, loss: 0.29219850897789, mean loss: 0.3421987942894682
Epoch: 48, step: 799, loss: 0.31860479712486267, mean loss: 0.3421984577707957
Epoch: 48, step: 800, loss: 0.33598238229751587, mean loss: 0.3421983691128368
Epoch: 48, step: 801, loss: 0.30087488889694214, mean loss: 0.3421977797372454
Epoch: 48, step: 802, loss: 0.36422550678253174, mean loss: 0.342198093902931
Epoch: 48, step: 803, loss: 0.3329414427280426, mean loss: 0.34219796188383156
Epoch: 48, step: 804, loss: 0.35071104764938354, mean loss: 0.34219808329641005
Epoch: 48, step: 805, loss: 0.3050719201564789, mean loss: 0.34219755381520495
Epoch: 48, step: 806, loss: 0.32617127895355225, mean loss: 0.3421973252569702
Epoch: 48, step: 807, loss: 0.34741929173469543, mean loss: 0.3421973997288253
Epoch: 48, step: 808, loss: 0.31886157393455505, mean loss: 0.342197066935143
Epoch: 48, step: 809, loss: 0.3228496015071869, mean loss: 0.3421967910236541
Epoch: 48, step: 810, loss: 0.32998737692832947, mean loss: 0.34219661690939635
Epoch: 48, step: 811, loss: 0.3326079249382019, mean loss: 0.342196480170306
Epoch: 48, step: 812, loss: 0.3258364200592041, mean loss: 0.3421962468717661
Epoch: 48, step: 813, loss: 0.33320391178131104, mean loss: 0.34219611864065225
Epoch: 48, step: 814, loss: 0.336343377828598, mean loss: 0.342196035181488
Epoch: 48, step: 815, loss: 0.2923973500728607, mean loss: 0.34219532507018996
Epoch: 48, step: 816, loss: 0.3011215627193451, mean loss: 0.34219473938149697
Epoch: 48, step: 817, loss: 0.30483338236808777, mean loss: 0.3421942066372076
Epoch: 48, step: 818, loss: 0.2989872097969055, mean loss: 0.34219359054736376
Epoch: 48, step: 819, loss: 0.3306736946105957, mean loss: 0.3421934262871696
Epoch: 48, step: 820, loss: 0.3062583804130554, mean loss: 0.3421929139029015
Epoch: 48, step: 821, loss: 0.30958256125450134, mean loss: 0.34219244893081024
Epoch: 48, step: 822, loss: 0.31270328164100647, mean loss: 0.3421920284678846
Epoch: 48, step: 823, loss: 0.35019055008888245, mean loss: 0.3421921425109099
Epoch: 48, step: 824, loss: 0.32381394505500793, mean loss: 0.34219188047806764
Epoch: 48, step: 825, loss: 0.3213655650615692, mean loss: 0.342191583544659
Epoch: 48, step: 826, loss: 0.3311607539653778, mean loss: 0.34219142627367455
Epoch: 48, step: 827, loss: 0.2819240391254425, mean loss: 0.34219056702948936
Epoch: 48, step: 828, loss: 0.32808250188827515, mean loss: 0.34219036589085233
Epoch: 48, step: 829, loss: 0.3555085062980652, mean loss: 0.3421905557648281
Epoch: 48, step: 830, loss: 0.33643850684165955, mean loss: 0.3421904737602243
Epoch: 48, step: 831, loss: 0.32016050815582275, mean loss: 0.34219015969251215
Epoch: 48, step: 832, loss: 0.325387179851532, mean loss: 0.3421899201461462
Epoch: 48, step: 833, loss: 0.3552994430065155, mean loss: 0.34219010703524694
Epoch: 48, step: 834, loss: 0.3119666278362274, mean loss: 0.34218967617606266
Epoch: 48, step: 835, loss: 0.31324446201324463, mean loss: 0.3421892635454223
Epoch: 48, step: 836, loss: 0.35715416073799133, mean loss: 0.34218947687557943
Epoch: 48, step: 837, loss: 0.3011801242828369, mean loss: 0.34218889228038923
Epoch: 48, step: 838, loss: 0.3497025966644287, mean loss: 0.3421889993879769
Epoch: 48, step: 839, loss: 0.3509660065174103, mean loss: 0.34218912450211664
Epoch: 48, step: 840, loss: 0.3378869295120239, mean loss: 0.3421890631762291
Epoch: 48, step: 841, loss: 0.318948894739151, mean loss: 0.3421887319026248
Epoch: 48, step: 842, loss: 0.32397884130477905, mean loss: 0.342188472336085
Epoch: 48, step: 843, loss: 0.3508423864841461, mean loss: 0.3421885956885303
Epoch: 48, step: 844, loss: 0.32780027389526367, mean loss: 0.342188390601058
Epoch: 48, step: 845, loss: 0.3538377583026886, mean loss: 0.3421885566458099
Epoch: 48, step: 846, loss: 0.30113738775253296, mean loss: 0.3421879715295897
Epoch: 48, step: 847, loss: 0.33162686228752136, mean loss: 0.34218782100066664
Epoch: 48, step: 848, loss: 0.3336150348186493, mean loss: 0.3421876988133235
Epoch: 48, step: 849, loss: 0.3707132041454315, mean loss: 0.34218810537963196
Epoch: 48, step: 850, loss: 0.33042892813682556, mean loss: 0.3421879377816495
Epoch: 48, step: 851, loss: 0.3481038808822632, mean loss: 0.3421880220975822
Epoch: 48, step: 852, loss: 0.37469640374183655, mean loss: 0.3421884854109385
Epoch: 48, step: 853, loss: 0.3258347809314728, mean loss: 0.3421882523393015
Epoch: 48, step: 854, loss: 0.32257479429244995, mean loss: 0.3421879728139114
Epoch: 48, step: 855, loss: 0.3403060734272003, mean loss: 0.3421879459940022
Epoch: 48, step: 856, loss: 0.32757604122161865, mean loss: 0.3421877377552533
Epoch: 48, step: 857, loss: 0.308223694562912, mean loss: 0.3421872537301259
Epoch: 48, step: 858, loss: 0.34078341722488403, mean loss: 0.3421872337241903
Epoch: 48, step: 859, loss: 0.34468263387680054, mean loss: 0.34218726928538495
Epoch: 48, step: 860, loss: 0.32793092727661133, mean loss: 0.3421870661254515
Epoch: 48, step: 861, loss: 0.34084177017211914, mean loss: 0.3421870469545912
Epoch: 48, step: 862, loss: 0.3557281792163849, mean loss: 0.34218723991693195
Epoch: 48, step: 863, loss: 0.3166126012802124, mean loss: 0.3421868754812469
Epoch: 48, step: 864, loss: 0.3312092423439026, mean loss: 0.3421867190534552
Epoch: 48, step: 865, loss: 0.3299619257450104, mean loss: 0.34218654485650873
Epoch: 48, step: 866, loss: 0.3442360758781433, mean loss: 0.3421865740608437
Epoch: 48, step: 867, loss: 0.31180912256240845, mean loss: 0.3421861412102951
Epoch: 48, step: 868, loss: 0.3255006670951843, mean loss: 0.3421859034611306
Epoch: 48, step: 869, loss: 0.3378417193889618, mean loss: 0.3421858415622951
Epoch: 48, step: 870, loss: 0.3388024568557739, mean loss: 0.3421857933542574
Epoch: 48, step: 871, loss: 0.37724563479423523, mean loss: 0.34218629289605385
Epoch: 48, step: 872, loss: 0.3082922399044037, mean loss: 0.3421858099715972
Epoch: 48, step: 873, loss: 0.29726284742355347, mean loss: 0.3421851699157093
Epoch: 48, step: 874, loss: 0.320366233587265, mean loss: 0.34218485904708223
Epoch: 48, step: 875, loss: 0.3798668086528778, mean loss: 0.34218539591876407
Epoch: 48, step: 876, loss: 0.2959408164024353, mean loss: 0.34218473706083025
Epoch: 48, step: 877, loss: 0.3076023459434509, mean loss: 0.3421842443639914
Epoch: 48, step: 878, loss: 0.3040730655193329, mean loss: 0.34218370140009513
Epoch: 48, step: 879, loss: 0.32058990001678467, mean loss: 0.34218339376102824
Epoch: 48, step: 880, loss: 0.3241037428379059, mean loss: 0.34218313619045965
Epoch: 48, step: 881, loss: 0.31963369250297546, mean loss: 0.3421828149458563
Epoch: 48, step: 882, loss: 0.3472038507461548, mean loss: 0.3421828864756775
Epoch: 48, step: 883, loss: 0.35391753911972046, mean loss: 0.34218305364549695
Epoch: 48, step: 884, loss: 0.34551408886909485, mean loss: 0.3421831010981691
Epoch: 48, step: 885, loss: 0.3608945608139038, mean loss: 0.34218336765077334
Epoch: 48, step: 886, loss: 0.31110385060310364, mean loss: 0.34218292491630353
Epoch: 48, step: 887, loss: 0.31667056679725647, mean loss: 0.34218256149239873
Epoch: 48, step: 888, loss: 0.3465937077999115, mean loss: 0.3421826243283456
Epoch: 48, step: 889, loss: 0.37380367517471313, mean loss: 0.3421830747578326
Epoch: 48, step: 890, loss: 0.309481680393219, mean loss: 0.3421826089459105
Epoch: 48, step: 891, loss: 0.31824588775634766, mean loss: 0.3421822679864041
Epoch: 48, step: 892, loss: 0.3291507661342621, mean loss: 0.3421820823656954
Epoch: 48, step: 893, loss: 0.2978980839252472, mean loss: 0.34218145159341895
Epoch: 48, step: 894, loss: 0.37740597128868103, mean loss: 0.3421819533171743
Epoch: 48, step: 895, loss: 0.34842443466186523, mean loss: 0.34218204223127735
Epoch: 48, step: 896, loss: 0.2884642481803894, mean loss: 0.3421812771186272
Epoch: 48, step: 897, loss: 0.3177871108055115, mean loss: 0.3421809296728743
Epoch: 48, step: 898, loss: 0.312594473361969, mean loss: 0.342180508279413
Epoch: 48, step: 899, loss: 0.31849199533462524, mean loss: 0.34218017089388136
Epoch: 48, step: 900, loss: 0.3343465328216553, mean loss: 0.3421800593242565
Epoch: 48, step: 901, loss: 0.3162744343280792, mean loss: 0.34217969037183965
Epoch: 48, step: 902, loss: 0.32264357805252075, mean loss: 0.3421794121390928
Epoch: 48, step: 903, loss: 0.32498154044151306, mean loss: 0.34217916721098957
Epoch: 48, step: 904, loss: 0.3212709426879883, mean loss: 0.3421788694451419
Epoch: 48, step: 905, loss: 0.293468713760376, mean loss: 0.34217817574615184
Epoch: 48, step: 906, loss: 0.33831730484962463, mean loss: 0.3421781207628724
Epoch: 48, step: 907, loss: 0.3060453236103058, mean loss: 0.3421776061972621
Epoch: 48, step: 908, loss: 0.3207709491252899, mean loss: 0.3421773013503207
Epoch: 48, step: 909, loss: 0.32245635986328125, mean loss: 0.3421770205132399
Epoch: 48, step: 910, loss: 0.31547248363494873, mean loss: 0.34217664023132544
Epoch: 48, step: 911, loss: 0.34033313393592834, mean loss: 0.342176613979527
Epoch: 48, step: 912, loss: 0.3309572637081146, mean loss: 0.3421764542166182
Epoch: 48, step: 913, loss: 0.2995035946369171, mean loss: 0.34217584656618133
Epoch: 48, step: 914, loss: 0.326652467250824, mean loss: 0.34217562552043945
Epoch: 48, step: 915, loss: 0.3419268727302551, mean loss: 0.3421756219783652
Epoch: 48, step: 916, loss: 0.34637922048568726, mean loss: 0.34217568183395913
Epoch: 48, step: 917, loss: 0.3455847501754761, mean loss: 0.342175730375442
Epoch: 48, step: 918, loss: 0.34593653678894043, mean loss: 0.3421757839245359
Epoch: 48, step: 919, loss: 0.3303001821041107, mean loss: 0.34217561483349734
Epoch: 48, step: 920, loss: 0.3358621597290039, mean loss: 0.34217552494049686
Epoch: 48, step: 921, loss: 0.3320085406303406, mean loss: 0.34217538018177157
Epoch: 48, step: 922, loss: 0.3247598707675934, mean loss: 0.3421751322212189
Epoch: 48, step: 923, loss: 0.30992987751960754, mean loss: 0.3421746731225416
Epoch: 48, step: 924, loss: 0.33503785729408264, mean loss: 0.3421745715120538
Epoch: 48, step: 925, loss: 0.3120265007019043, mean loss: 0.34217414228470094
Epoch: 48, step: 926, loss: 0.35861241817474365, mean loss: 0.34217437631815656
Epoch: 48, step: 927, loss: 0.3414298892021179, mean loss: 0.3421743657189664
Epoch: 48, step: 928, loss: 0.2973262071609497, mean loss: 0.342173727229216
Epoch: 48, step: 929, loss: 0.32240739464759827, mean loss: 0.34217344582588777
Epoch: 48, step: 930, loss: 0.3183324635028839, mean loss: 0.342173106418654
Epoch: 48, step: 931, loss: 0.3281632959842682, mean loss: 0.342172906973713
Epoch: 48, step: 932, loss: 0.3368947505950928, mean loss: 0.3421728318344664
Epoch: 48, step: 933, loss: 0.3088591694831848, mean loss: 0.34217235759162906
Epoch: 48, step: 934, loss: 0.32145237922668457, mean loss: 0.3421720626327217
Epoch: 48, step: 935, loss: 0.3571070730686188, mean loss: 0.34217227523678784
Epoch: 48, step: 936, loss: 0.2889462113380432, mean loss: 0.3421715175596124
Epoch: 48, step: 937, loss: 0.31413695216178894, mean loss: 0.3421711184910658
Epoch: 48, step: 938, loss: 0.3460127115249634, mean loss: 0.3421711731748857
Epoch: 48, step: 939, loss: 0.3706721067428589, mean loss: 0.34217157887057503
Epoch: 48, step: 940, loss: 0.3289603888988495, mean loss: 0.342171390818962
Epoch: 48, step: 941, loss: 0.3441777527332306, mean loss: 0.3421714193776478
Epoch: 48, step: 942, loss: 0.3610621988773346, mean loss: 0.34217168826640304
Epoch: 48, step: 943, loss: 0.3210807144641876, mean loss: 0.34217138806465797
Epoch: 48, step: 944, loss: 0.3473251461982727, mean loss: 0.34217146142045357
Epoch: 48, step: 945, loss: 0.3178924322128296, mean loss: 0.34217111585085
Epoch: 48, step: 946, loss: 0.3144916892051697, mean loss: 0.3421707218881314
Epoch: 48, step: 947, loss: 0.3744017779827118, mean loss: 0.34217118062789936
Epoch: 48, step: 948, loss: 0.320415735244751, mean loss: 0.3421708709903283
Epoch: 48, step: 949, loss: 0.3562881648540497, mean loss: 0.3421710719139266
Epoch: 48, step: 950, loss: 0.29576218128204346, mean loss: 0.34217041141137716
Epoch: 48, step: 951, loss: 0.3334333002567291, mean loss: 0.342170287064469
Epoch: 48, step: 952, loss: 0.30211973190307617, mean loss: 0.34216971707151145
Epoch: 48, step: 953, loss: 0.32895392179489136, mean loss: 0.34216952898914904
Epoch: 48, step: 954, loss: 0.325825572013855, mean loss: 0.34216929639124427
Epoch: 48, step: 955, loss: 0.34971487522125244, mean loss: 0.3421694037741046
Epoch: 48, step: 956, loss: 0.36733707785606384, mean loss: 0.342169761935941
Epoch: 48, step: 957, loss: 0.33114832639694214, mean loss: 0.34216960509183203
Epoch: 48, step: 958, loss: 0.32740893959999084, mean loss: 0.34216939503838906
Epoch: 48, step: 959, loss: 0.33856815099716187, mean loss: 0.34216934379117764
Epoch: 48, step: 960, loss: 0.31928643584251404, mean loss: 0.3421690181624447
Epoch: 48, step: 961, loss: 0.3133643865585327, mean loss: 0.3421686082721353
Epoch: 48, step: 962, loss: 0.30346548557281494, mean loss: 0.3421680575339966
Epoch: 48, step: 963, loss: 0.37177327275276184, mean loss: 0.34216847880463264
Epoch: 48, step: 964, loss: 0.3344346582889557, mean loss: 0.3421683687569568
Epoch: 48, step: 965, loss: 0.354597270488739, mean loss: 0.3421685456103352
Epoch: 48, step: 966, loss: 0.34449875354766846, mean loss: 0.34216857876686757
Epoch: 48, step: 967, loss: 0.3615627586841583, mean loss: 0.3421688547227571
Epoch: 48, step: 968, loss: 0.30724915862083435, mean loss: 0.3421683578644867
Epoch: 48, step: 969, loss: 0.3366532325744629, mean loss: 0.34216827939311006
Epoch: 48, step: 970, loss: 0.32259616255760193, mean loss: 0.342168000917279
Epoch: 48, step: 971, loss: 0.333767831325531, mean loss: 0.3421678813997559
Epoch: 48, step: 972, loss: 0.30837029218673706, mean loss: 0.34216740053485994
Epoch: 48, step: 973, loss: 0.2989267408847809, mean loss: 0.3421667853247235
Epoch: 48, step: 974, loss: 0.3620472848415375, mean loss: 0.34216706817218484
Epoch: 48, step: 975, loss: 0.35832083225250244, mean loss: 0.3421672979946877
Epoch: 48, step: 976, loss: 0.3136462867259979, mean loss: 0.3421668922269108
Epoch: 48, step: 977, loss: 0.335194855928421, mean loss: 0.34216679303732056
Epoch: 48, step: 978, loss: 0.32476919889450073, mean loss: 0.342166545529188
Epoch: 48, step: 979, loss: 0.3372684121131897, mean loss: 0.3421664758465297
Epoch: 48, step: 980, loss: 0.3836113214492798, mean loss: 0.3421670654478499
Epoch: 48, step: 981, loss: 0.30830124020576477, mean loss: 0.3421665836737975
Epoch: 48, step: 982, loss: 0.29287779331207275, mean loss: 0.34216588250315433
Epoch: 48, step: 983, loss: 0.3372354805469513, mean loss: 0.3421658123654231
Epoch: 48, step: 984, loss: 0.34608080983161926, mean loss: 0.3421658680576641
Epoch: 48, step: 985, loss: 0.3361275792121887, mean loss: 0.34216578216206467
Epoch: 48, step: 986, loss: 0.3176349401473999, mean loss: 0.34216543321197984
Epoch: 48, step: 987, loss: 0.33922243118286133, mean loss: 0.3421653913485086
Epoch: 48, step: 988, loss: 0.3716028928756714, mean loss: 0.34216581008368346
Epoch: 48, step: 989, loss: 0.3255772888660431, mean loss: 0.34216557412281157
Epoch: 48, step: 990, loss: 0.3413965702056885, mean loss: 0.34216556318438907
Epoch: 48, step: 991, loss: 0.39849787950515747, mean loss: 0.3421663644519744
Epoch: 48, step: 992, loss: 0.30324652791023254, mean loss: 0.3421658108663611
Epoch: 48, step: 993, loss: 0.3180510997772217, mean loss: 0.34216546786987306
Epoch: 48, step: 994, loss: 0.3594917953014374, mean loss: 0.34216571430802906
Epoch: 48, step: 995, loss: 0.3378811180591583, mean loss: 0.34216565336764887
Epoch: 48, step: 996, loss: 0.3216582238674164, mean loss: 0.34216536169191036
Epoch: 48, step: 997, loss: 0.33526307344436646, mean loss: 0.3421652635225426
Epoch: 48, step: 998, loss: 0.30296608805656433, mean loss: 0.34216470601126464
Epoch: 48, step: 999, loss: 0.35576656460762024, mean loss: 0.34216489946129586
Epoch: 48, step: 1000, loss: 0.3547992706298828, mean loss: 0.34216507914885247
Epoch: 48, step: 1001, loss: 0.3808794319629669, mean loss: 0.34216562974123543
Epoch: 48, step: 1002, loss: 0.3158843517303467, mean loss: 0.34216525597634867
Epoch: 48, step: 1003, loss: 0.3494395613670349, mean loss: 0.34216535942798687
Epoch: 48, step: 1004, loss: 0.318452388048172, mean loss: 0.34216502219842104
Epoch: 48, step: 1005, loss: 0.3655815124511719, mean loss: 0.34216535520690045
Epoch: 48, step: 1006, loss: 0.3480704426765442, mean loss: 0.3421654391826036
Epoch: 48, step: 1007, loss: 0.3369036316871643, mean loss: 0.34216536435598965
Epoch: 48, step: 1008, loss: 0.3491102159023285, mean loss: 0.34216546311527274
Epoch: 48, step: 1009, loss: 0.33603575825691223, mean loss: 0.34216537594902524
Epoch: 48, step: 1010, loss: 0.3557423949241638, mean loss: 0.34216556901557493
Epoch: 48, step: 1011, loss: 0.34224197268486023, mean loss: 0.3421655701020272
Epoch: 48, step: 1012, loss: 0.3354794681072235, mean loss: 0.34216547502770095
Epoch: 48, step: 1013, loss: 0.3158634901046753, mean loss: 0.3421651010268347
Epoch: 48, step: 1014, loss: 0.3385101854801178, mean loss: 0.342165049056531
Epoch: 48, step: 1015, loss: 0.3242241144180298, mean loss: 0.3421647939528079
Epoch: 48, step: 1016, loss: 0.3021281063556671, mean loss: 0.3421642246757302
Epoch: 48, step: 1017, loss: 0.33149558305740356, mean loss: 0.34216407298169327
Epoch: 48, step: 1018, loss: 0.35563769936561584, mean loss: 0.3421642645561965
Epoch: 48, step: 1019, loss: 0.3616870045661926, mean loss: 0.34216454213596115
Epoch: 48, step: 1020, loss: 0.3090134561061859, mean loss: 0.34216407079127187
Epoch: 48, step: 1021, loss: 0.3474317193031311, mean loss: 0.3421641456860384
Epoch: 48, step: 1022, loss: 0.3129024803638458, mean loss: 0.3421637296532621
Epoch: 48, step: 1023, loss: 0.328353613615036, mean loss: 0.3421635333083457
Epoch: 48, step: 1024, loss: 0.3555905818939209, mean loss: 0.34216372420429786
Epoch: 48, step: 1025, loss: 0.29962876439094543, mean loss: 0.3421631194819598
Epoch: 48, step: 1026, loss: 0.3523840606212616, mean loss: 0.3421632647916904
Epoch: 48, step: 1027, loss: 0.3706744909286499, mean loss: 0.34216367012615356
Epoch: 48, step: 1028, loss: 0.34523805975914, mean loss: 0.34216371383309024
Epoch: 48, step: 1029, loss: 0.32256457209587097, mean loss: 0.3421634352066404
Epoch: 48, step: 1030, loss: 0.3055236339569092, mean loss: 0.3421629143331882
Epoch: 48, step: 1031, loss: 0.361325740814209, mean loss: 0.34216318674912244
Epoch: 48, step: 1032, loss: 0.30743277072906494, mean loss: 0.3421626930336342
Epoch: 48, step: 1033, loss: 0.30574455857276917, mean loss: 0.34216217533348836
Epoch: 48, step: 1034, loss: 0.30871912837028503, mean loss: 0.34216169993230616
Epoch: 48, step: 1035, loss: 0.3178572654724121, mean loss: 0.3421613544436717
Epoch: 48, step: 1036, loss: 0.3371935188770294, mean loss: 0.3421612838266684
Epoch: 48, step: 1037, loss: 0.3202369213104248, mean loss: 0.3421609721797243
Epoch: 48, step: 1038, loss: 0.29375511407852173, mean loss: 0.34216028411760574
Epoch: 48, step: 1039, loss: 0.32256215810775757, mean loss: 0.34216000554519826
Epoch: 48, step: 1040, loss: 0.3014663755893707, mean loss: 0.3421594271245203
Epoch: 48, step: 1041, loss: 0.3121754825115204, mean loss: 0.3421590009377418
Epoch: 48, step: 1042, loss: 0.3362790644168854, mean loss: 0.34215891736249454
Epoch: 48, step: 1043, loss: 0.2975916266441345, mean loss: 0.34215828390847897
Epoch: 48, step: 1044, loss: 0.33342957496643066, mean loss: 0.34215815984535886
Epoch: 48, step: 1045, loss: 0.3043472468852997, mean loss: 0.34215762243791464
Epoch: 48, step: 1046, loss: 0.31875601410865784, mean loss: 0.34215728983500204
Epoch: 48, step: 1047, loss: 0.31844562292099, mean loss: 0.34215695283007147
Epoch: 48, step: 1048, loss: 0.38464006781578064, mean loss: 0.34215755661789404
Epoch: 48, step: 1049, loss: 0.30308061838150024, mean loss: 0.3421570012479751
Epoch: 48, step: 1050, loss: 0.3258642852306366, mean loss: 0.34215676969565334
Epoch: 48, step: 1051, loss: 0.33111822605133057, mean loss: 0.34215661281793686
Epoch: 48, step: 1052, loss: 0.3312382400035858, mean loss: 0.3421564576502709
Epoch: 48, step: 1053, loss: 0.3222041726112366, mean loss: 0.34215617410018934
Epoch: 48, step: 1054, loss: 0.3566247522830963, mean loss: 0.34215637971614826
Epoch: 48, step: 1055, loss: 0.33927038311958313, mean loss: 0.3421563387032362
Epoch: 48, step: 1056, loss: 0.3183363974094391, mean loss: 0.34215600020274173
Epoch: 48, step: 1057, loss: 0.33341172337532043, mean loss: 0.34215587594131175
Epoch: 48, step: 1058, loss: 0.39903882145881653, mean loss: 0.34215668427067353
Epoch: 48, step: 1059, loss: 0.3355688154697418, mean loss: 0.3421565906557585
Epoch: 48, step: 1060, loss: 0.3413754105567932, mean loss: 0.34215657955519296
Epoch: 48, step: 1061, loss: 0.35734793543815613, mean loss: 0.34215679542122135
Epoch: 48, step: 1062, loss: 0.33162280917167664, mean loss: 0.34215664573758015
Epoch: 48, step: 1063, loss: 0.322414368391037, mean loss: 0.34215636521187043
Epoch: 48, step: 1064, loss: 0.3670481741428375, mean loss: 0.34215671890425475
Epoch: 48, step: 1065, loss: 0.35219478607177734, mean loss: 0.34215686153500824
Epoch: 48, step: 1066, loss: 0.30083131790161133, mean loss: 0.3421562743492904
Epoch: 48, step: 1067, loss: 0.3672841191291809, mean loss: 0.34215663138033303
Epoch: 48, step: 1068, loss: 0.2989785671234131, mean loss: 0.34215601788998395
Epoch: 48, step: 1069, loss: 0.3282094895839691, mean loss: 0.34215581973522413
Epoch: 48, step: 1070, loss: 0.3095909655094147, mean loss: 0.3421553570545452
Epoch: 48, step: 1071, loss: 0.40790730714797974, mean loss: 0.34215629124342467
Epoch: 48, step: 1072, loss: 0.32348644733428955, mean loss: 0.34215602599026124
Epoch: 48, step: 1073, loss: 0.3344481289386749, mean loss: 0.3421559164813099
Epoch: 48, step: 1074, loss: 0.3154935836791992, mean loss: 0.3421555376850435
Epoch: 48, step: 1075, loss: 0.30155691504478455, mean loss: 0.34215496090174746
Epoch: 48, step: 1076, loss: 0.3241620659828186, mean loss: 0.34215470528091296
Epoch: 48, step: 1077, loss: 0.36422041058540344, mean loss: 0.34215501875875504
Epoch: 48, step: 1078, loss: 0.35733190178871155, mean loss: 0.3421552343670434
Epoch: 48, step: 1079, loss: 0.31853556632995605, mean loss: 0.3421548988222651
Epoch: 48, step: 1080, loss: 0.32525673508644104, mean loss: 0.3421546587676611
Epoch: 48, step: 1081, loss: 0.3367057740688324, mean loss: 0.34215458136213367
Epoch: 48, step: 1082, loss: 0.3090597689151764, mean loss: 0.34215411123197603
Epoch: 48, step: 1083, loss: 0.3271893560886383, mean loss: 0.342153898652353
Epoch: 48, step: 1084, loss: 0.32867297530174255, mean loss: 0.34215370715380405
Epoch: 48, step: 1085, loss: 0.31307655572891235, mean loss: 0.34215329411435086
Epoch: 48, step: 1086, loss: 0.3325042128562927, mean loss: 0.3421531570515906
Epoch: 48, step: 1087, loss: 0.3381844758987427, mean loss: 0.34215310067827875
Epoch: 48, step: 1088, loss: 0.3578847646713257, mean loss: 0.3421533241362409
Epoch: 48, step: 1089, loss: 0.3139125108718872, mean loss: 0.3421529229997211
Epoch: 48, step: 1090, loss: 0.3111156225204468, mean loss: 0.34215248214776195
Epoch: 48, step: 1091, loss: 0.3263229727745056, mean loss: 0.34215225730955146
Epoch: 48, step: 1092, loss: 0.33887606859207153, mean loss: 0.3421522107760848
Epoch: 48, step: 1093, loss: 0.35129842162132263, mean loss: 0.3421523406827809
Epoch: 48, step: 1094, loss: 0.34273549914360046, mean loss: 0.3421523489654582
Epoch: 48, step: 1095, loss: 0.31569918990135193, mean loss: 0.34215197325305247
Epoch: 48, step: 1096, loss: 0.32048898935317993, mean loss: 0.34215166557954624
Epoch: 48, step: 1097, loss: 0.3358038663864136, mean loss: 0.34215157542475017
Epoch: 48, step: 1098, loss: 0.34841981530189514, mean loss: 0.3421516644483385
Epoch: 48, step: 1099, loss: 0.3178289830684662, mean loss: 0.342151319014586
Epoch: 48, step: 1100, loss: 0.32799410820007324, mean loss: 0.342151117954969
Epoch: 48, step: 1101, loss: 0.31665948033332825, mean loss: 0.34215075592983735
Epoch: 48, step: 1102, loss: 0.33159852027893066, mean loss: 0.34215060607205633
Epoch: 48, step: 1103, loss: 0.3177006244659424, mean loss: 0.3421502588500953
Epoch: 48, step: 1104, loss: 0.30872243642807007, mean loss: 0.3421497841377045
Epoch: 48, step: 1105, loss: 0.34224212169647217, mean loss: 0.3421497854489823
Epoch: 48, step: 1106, loss: 0.3208834230899811, mean loss: 0.3421494834514765
Epoch: 48, step: 1107, loss: 0.323772668838501, mean loss: 0.3421492224913144
Epoch: 48, step: 1108, loss: 0.3018558621406555, mean loss: 0.34214865031312397
Epoch: 48, step: 1109, loss: 0.3054824769496918, mean loss: 0.34214812964950514
Epoch: 48, step: 1110, loss: 0.36858034133911133, mean loss: 0.34214850498443394
Epoch: 48, step: 1111, loss: 0.3255712687969208, mean loss: 0.3421482695925762
Epoch: 48, step: 1112, loss: 0.31737735867500305, mean loss: 0.3421479178579519
Epoch: 48, step: 1113, loss: 0.34441035985946655, mean loss: 0.34214794998304776
Epoch: 48, step: 1114, loss: 0.3381921947002411, mean loss: 0.3421478938148838
Epoch: 48, step: 1115, loss: 0.33255839347839355, mean loss: 0.3421477576545451
Epoch: 48, step: 1116, loss: 0.32723990082740784, mean loss: 0.34214754598240965
Epoch: 48, step: 1117, loss: 0.3434394896030426, mean loss: 0.34214756432606463
Epoch: 48, step: 1118, loss: 0.313347190618515, mean loss: 0.3421471554099097
Epoch: 48, step: 1119, loss: 0.34374773502349854, mean loss: 0.34214717813508594
Epoch: 48, step: 1120, loss: 0.3401136100292206, mean loss: 0.3421471492627093
Epoch: 48, step: 1121, loss: 0.3199436366558075, mean loss: 0.3421468340241511
Epoch: 48, step: 1122, loss: 0.32282382249832153, mean loss: 0.34214655968594526
Epoch: 48, step: 1123, loss: 0.32943078875541687, mean loss: 0.3421463791565153
Epoch: 48, step: 1124, loss: 0.3419160544872284, mean loss: 0.34214637588657665
Epoch: 48, step: 1125, loss: 0.3218148946762085, mean loss: 0.3421460872429296
Epoch: 48, step: 1126, loss: 0.33062905073165894, mean loss: 0.3421459237392383
Epoch: 48, step: 1127, loss: 0.3217627704143524, mean loss: 0.3421456343702246
Epoch: 48, step: 1128, loss: 0.31881940364837646, mean loss: 0.34214530322457476
Epoch: 48, step: 1129, loss: 0.3564748167991638, mean loss: 0.3421455066474414
Epoch: 48, step: 1130, loss: 0.32817545533180237, mean loss: 0.3421453083303437
Epoch: 48, step: 1131, loss: 0.33882027864456177, mean loss: 0.34214526112930904
Epoch: 48, step: 1132, loss: 0.33116644620895386, mean loss: 0.34214510527985315
Epoch: 48, step: 1133, loss: 0.2981102466583252, mean loss: 0.3421444801931396
Epoch: 48, step: 1134, loss: 0.3464794456958771, mean loss: 0.3421445417282724
Epoch: 48, step: 1135, loss: 0.3377422094345093, mean loss: 0.34214447923775043
Epoch: 48, step: 1136, loss: 0.3486097455024719, mean loss: 0.34214457101004336
Epoch: 48, step: 1137, loss: 0.3283999264240265, mean loss: 0.3421443759121784
Epoch: 48, step: 1138, loss: 0.30951058864593506, mean loss: 0.34214391269962974
Epoch: 48, step: 1139, loss: 0.30530333518981934, mean loss: 0.34214338978221776
Epoch: 48, step: 1140, loss: 0.307594895362854, mean loss: 0.3421428994057339
Epoch: 48, step: 1141, loss: 0.29868224263191223, mean loss: 0.3421422825400233
Epoch: 48, step: 1142, loss: 0.3370732367038727, mean loss: 0.34214221059274014
Epoch: 48, step: 1143, loss: 0.3362561762332916, mean loss: 0.34214212705075137
Epoch: 48, step: 1144, loss: 0.3095637261867523, mean loss: 0.3421416646637513
Epoch: 48, step: 1145, loss: 0.3504391312599182, mean loss: 0.34214178242847065
Epoch: 48, step: 1146, loss: 0.3743908107280731, mean loss: 0.34214224012767586
Epoch: 48, step: 1147, loss: 0.310410737991333, mean loss: 0.34214178977993054
Epoch: 48, step: 1148, loss: 0.30893808603286743, mean loss: 0.342141318544726
Epoch: 48, step: 1149, loss: 0.31627586483955383, mean loss: 0.3421409514609971
Epoch: 48, step: 1150, loss: 0.31657639145851135, mean loss: 0.3421405886527147
Epoch: 48, step: 1151, loss: 0.33988282084465027, mean loss: 0.3421405566112778
Epoch: 48, step: 1152, loss: 0.35616180300712585, mean loss: 0.3421407555929906
Epoch: 48, step: 1153, loss: 0.3104972541332245, mean loss: 0.34214030653243005
Epoch: 48, step: 1154, loss: 0.32976624369621277, mean loss: 0.3421401309316121
Epoch: 48, step: 1155, loss: 0.35582804679870605, mean loss: 0.3421403251746141
Epoch: 48, step: 1156, loss: 0.3153029978275299, mean loss: 0.3421399443358432
Epoch: 48, step: 1157, loss: 0.3402497470378876, mean loss: 0.3421399175131201
Epoch: 48, step: 1158, loss: 0.32597967982292175, mean loss: 0.3421396881955613
Epoch: 48, step: 1159, loss: 0.32316985726356506, mean loss: 0.34213941901303585
Epoch: 48, step: 1160, loss: 0.30299559235572815, mean loss: 0.3421388635687287
Epoch: 48, step: 1161, loss: 0.3771423101425171, mean loss: 0.34213936025469194
Epoch: 48, step: 1162, loss: 0.3151063919067383, mean loss: 0.34213897667231025
Epoch: 48, step: 1163, loss: 0.33469948172569275, mean loss: 0.34213887111162367
Epoch: 48, step: 1164, loss: 0.3256959617137909, mean loss: 0.3421386378027513
Epoch: 48, step: 1165, loss: 0.3285095691680908, mean loss: 0.34213844442228314
Epoch: 48, step: 1166, loss: 0.3240652084350586, mean loss: 0.34213818798794116
Epoch: 48, step: 1167, loss: 0.32994329929351807, mean loss: 0.3421380149617111
Epoch: 48, step: 1168, loss: 0.3285788297653198, mean loss: 0.3421378225809958
Epoch: 48, step: 1169, loss: 0.3528938293457031, mean loss: 0.342137975187431
Epoch: 48, step: 1170, loss: 0.32670220732688904, mean loss: 0.34213775618756065
Epoch: 48, step: 1171, loss: 0.31544068455696106, mean loss: 0.34213737741973205
Epoch: 48, step: 1172, loss: 0.30354368686676025, mean loss: 0.3421368298749984
Epoch: 48, step: 1173, loss: 0.3328106999397278, mean loss: 0.3421366975631927
Epoch: 48, step: 1174, loss: 0.3430357277393341, mean loss: 0.3421367103177457
Epoch: 48, step: 1175, loss: 0.30949312448501587, mean loss: 0.34213624720933244
Epoch: 48, step: 1176, loss: 0.3155924677848816, mean loss: 0.3421358706430679
Epoch: 48, step: 1177, loss: 0.3645496070384979, mean loss: 0.34213618861350903
Epoch: 48, step: 1178, loss: 0.34249991178512573, mean loss: 0.34213619377336163
Epoch: 48, step: 1179, loss: 0.37768903374671936, mean loss: 0.3421366981261956
Epoch: 48, step: 1180, loss: 0.31021133065223694, mean loss: 0.34213624523913627
Epoch: 48, step: 1181, loss: 0.33717653155326843, mean loss: 0.34213617488259973
Epoch: 48, step: 1182, loss: 0.3839300870895386, mean loss: 0.3421367677460965
Epoch: 48, step: 1183, loss: 0.303898423910141, mean loss: 0.3421362253274652
Epoch: 48, step: 1184, loss: 0.3646555244922638, mean loss: 0.3421365447637414
Epoch: 48, step: 1185, loss: 0.30084654688835144, mean loss: 0.34213595907339733
Epoch: 48, step: 1186, loss: 0.3210119903087616, mean loss: 0.3421356594383846
Epoch: 48, step: 1187, loss: 0.3212307393550873, mean loss: 0.3421353629146955
Epoch: 48, step: 1188, loss: 0.3371189534664154, mean loss: 0.3421352917609608
Epoch: 48, step: 1189, loss: 0.31273114681243896, mean loss: 0.34213487469272236
Epoch: 48, step: 1190, loss: 0.35647881031036377, mean loss: 0.3421350781441445
Epoch: 48, step: 1191, loss: 0.3627186119556427, mean loss: 0.34213537009259865
Epoch: 48, step: 1192, loss: 0.35192158818244934, mean loss: 0.3421355088943587
Epoch: 48, step: 1193, loss: 0.31523892283439636, mean loss: 0.342135127414966
Epoch: 48, step: 1194, loss: 0.3752356767654419, mean loss: 0.34213559687969075
Epoch: 48, step: 1195, loss: 0.32920041680336, mean loss: 0.342135413422777
Epoch: 48, step: 1196, loss: 0.3709869086742401, mean loss: 0.3421358226116075
Epoch: 48, step: 1197, loss: 0.3113921880722046, mean loss: 0.3421353865935315
Epoch: 48, step: 1198, loss: 0.3432592749595642, mean loss: 0.34213540253272345
Epoch: 48, step: 1199, loss: 0.3321291208267212, mean loss: 0.34213526062380434
Epoch: 48, step: 1200, loss: 0.30970627069473267, mean loss: 0.342134800722936
Epoch: 48, step: 1201, loss: 0.30644455552101135, mean loss: 0.3421342945788341
Epoch: 48, step: 1202, loss: 0.31929534673690796, mean loss: 0.3421339706910394
Epoch: 48, step: 1203, loss: 0.3882749676704407, mean loss: 0.34213462502476477
Epoch: 48, step: 1204, loss: 0.33997592329978943, mean loss: 0.3421345944122639
Epoch: 48, step: 1205, loss: 0.36894896626472473, mean loss: 0.34213497466087917
Epoch: 48, step: 1206, loss: 0.38825541734695435, mean loss: 0.34213562867529634
Epoch: 48, step: 1207, loss: 0.32922565937042236, mean loss: 0.3421354456070986
Epoch: 48, step: 1208, loss: 0.32291707396507263, mean loss: 0.3421351730872585
Epoch: 48, step: 1209, loss: 0.3536805510520935, mean loss: 0.34213533680039715
Epoch: 48, step: 1210, loss: 0.3350682854652405, mean loss: 0.3421352365912266
Epoch: 48, step: 1211, loss: 0.3172607123851776, mean loss: 0.34213488388116753
Epoch: 48, step: 1212, loss: 0.2804120182991028, mean loss: 0.3421340086898796
Epoch: 48, step: 1213, loss: 0.3787825107574463, mean loss: 0.3421345283351461
Epoch: 48, step: 1214, loss: 0.35541990399360657, mean loss: 0.3421347167080481
Epoch: 48, step: 1215, loss: 0.32532361149787903, mean loss: 0.3421344783473232
Epoch: 48, step: 1216, loss: 0.30301204323768616, mean loss: 0.3421339236473401
Epoch: 48, step: 1217, loss: 0.44931527972221375, mean loss: 0.3421354433036009
Epoch: 48, step: 1218, loss: 0.3079259395599365, mean loss: 0.34213495827568774
Epoch: 48, step: 1219, loss: 0.3081957995891571, mean loss: 0.34213447708759315
Epoch: 48, step: 1220, loss: 0.34488749504089355, mean loss: 0.3421345161192231
Epoch: 48, step: 1221, loss: 0.33292311429977417, mean loss: 0.3421343855240233
Epoch: 48, step: 1222, loss: 0.3097778558731079, mean loss: 0.34213392679389426
Epoch: 48, step: 1223, loss: 0.28252533078193665, mean loss: 0.34213308171342455
Epoch: 48, step: 1224, loss: 0.3244170844554901, mean loss: 0.3421328305544972
Epoch: 48, step: 1225, loss: 0.32122185826301575, mean loss: 0.3421325341047497
Epoch: 48, step: 1226, loss: 0.337029367685318, mean loss: 0.34213246175943124
Epoch: 48, step: 1227, loss: 0.29439935088157654, mean loss: 0.3421317850779615
Epoch: 48, step: 1228, loss: 0.33148249983787537, mean loss: 0.34213163411206593
Epoch: 48, step: 1229, loss: 0.30993643403053284, mean loss: 0.34213117771445767
Epoch: 48, step: 1230, loss: 0.34128251671791077, mean loss: 0.3421311656840507
Epoch: 48, step: 1231, loss: 0.3556691110134125, mean loss: 0.3421313575918718
Epoch: 48, step: 1232, loss: 0.31080928444862366, mean loss: 0.3421309135905515
Epoch: 48, step: 1233, loss: 0.350023090839386, mean loss: 0.34213102546333307
Epoch: 48, step: 1234, loss: 0.35971391201019287, mean loss: 0.34213127469982146
Epoch: 48, step: 1235, loss: 0.3518664240837097, mean loss: 0.3421314126930939
Epoch: 48, step: 1236, loss: 0.31865358352661133, mean loss: 0.3421310799055396
Epoch: 48, step: 1237, loss: 0.3749515116214752, mean loss: 0.3421315451136433
Epoch: 48, step: 1238, loss: 0.32509633898735046, mean loss: 0.34213130365418665
Epoch: 48, step: 1239, loss: 0.3180731236934662, mean loss: 0.34213096265492426
Epoch: 48, step: 1240, loss: 0.35841506719589233, mean loss: 0.34213119346161625
Epoch: 48, step: 1241, loss: 0.3167020082473755, mean loss: 0.34213083304002123
Epoch: 48, step: 1242, loss: 0.3065420389175415, mean loss: 0.3421303286279438
Epoch: 48, step: 1243, loss: 0.3465147614479065, mean loss: 0.3421303907691199
Epoch: 48, step: 1244, loss: 0.3359772562980652, mean loss: 0.34213030356112534
Epoch: 48, step: 1245, loss: 0.384552925825119, mean loss: 0.3421309048058072
Epoch: 48, step: 1246, loss: 0.332444429397583, mean loss: 0.34213076752388133
Epoch: 48, step: 1247, loss: 0.3532366156578064, mean loss: 0.3421309249196882
Epoch: 48, step: 1248, loss: 0.35189324617385864, mean loss: 0.3421310632726205
Epoch: 48, step: 1249, loss: 0.33227136731147766, mean loss: 0.342130923541661
Epoch: 48, step: 1250, loss: 0.3197095990180969, mean loss: 0.342130605792635
Epoch: 48, step: 1251, loss: 0.3416892886161804, mean loss: 0.3421305995384944
Epoch: 48, step: 1252, loss: 0.3608438968658447, mean loss: 0.3421308647308323
Epoch: 48, step: 1253, loss: 0.3315931260585785, mean loss: 0.3421307153991617
Epoch: 48, step: 1254, loss: 0.3208191692829132, mean loss: 0.3421304133947387
Epoch: 48, step: 1255, loss: 0.3567059636116028, mean loss: 0.34213061994091004
Epoch: 48, step: 1256, loss: 0.31897789239883423, mean loss: 0.342130291854533
Epoch: 48, step: 1257, loss: 0.31222817301750183, mean loss: 0.3421298681317211
Epoch: 48, step: 1258, loss: 0.3691042959690094, mean loss: 0.34213025036277683
Epoch: 48, step: 1259, loss: 0.3491652309894562, mean loss: 0.34213035004792997
Epoch: 48, step: 1260, loss: 0.35526153445243835, mean loss: 0.34213053611320143
Epoch: 48, step: 1261, loss: 0.30311647057533264, mean loss: 0.34212998330245614
Epoch: 48, step: 1262, loss: 0.32607194781303406, mean loss: 0.3421297557709579
Epoch: 48, step: 1263, loss: 0.3584786355495453, mean loss: 0.34212998742024064
Epoch: 48, step: 1264, loss: 0.3332667946815491, mean loss: 0.3421298618383551
Epoch: 48, step: 1265, loss: 0.32235434651374817, mean loss: 0.34212958164459323
Epoch: 48, step: 1266, loss: 0.32219311594963074, mean loss: 0.3421292991743727
Epoch: 48, step: 1267, loss: 0.330987811088562, mean loss: 0.34212914131820826
Epoch: 48, step: 1268, loss: 0.3503320515155792, mean loss: 0.34212925753801526
Epoch: 48, step: 1269, loss: 0.31482210755348206, mean loss: 0.34212887065254893
Epoch: 48, step: 1270, loss: 0.3127322196960449, mean loss: 0.34212845416910453
Epoch: 48, step: 1271, loss: 0.3963753283023834, mean loss: 0.3421292227126007
Epoch: 48, step: 1272, loss: 0.34898653626441956, mean loss: 0.34212931986232875
Epoch: 48, step: 1273, loss: 0.35030874609947205, mean loss: 0.3421294357412033
Epoch: 48, step: 1274, loss: 0.35673007369041443, mean loss: 0.342129642587194
Epoch: 48, step: 1275, loss: 0.3029096722602844, mean loss: 0.34212908696909566
Epoch: 48, step: 1276, loss: 0.3219801187515259, mean loss: 0.3421288015284715
Epoch: 48, step: 1277, loss: 0.32703933119773865, mean loss: 0.3421285877663192
Epoch: 48, step: 1278, loss: 0.29086020588874817, mean loss: 0.3421278614926883
Epoch: 48, step: 1279, loss: 0.2991352677345276, mean loss: 0.34212725246342496
Epoch: 48, step: 1280, loss: 0.32661500573158264, mean loss: 0.34212703272142886
Epoch: 48, step: 1281, loss: 0.3371911644935608, mean loss: 0.342126962802339
Epoch: 48, step: 1282, loss: 0.33372005820274353, mean loss: 0.34212684371593627
Epoch: 48, step: 1283, loss: 0.326692670583725, mean loss: 0.34212662508919917
Epoch: 48, step: 1284, loss: 0.33687353134155273, mean loss: 0.3421265506796103
Epoch: 48, step: 1285, loss: 0.38333767652511597, mean loss: 0.3421271344231419
Epoch: 48, step: 1286, loss: 0.30483025312423706, mean loss: 0.34212660613122137
Epoch: 48, step: 1287, loss: 0.38721591234207153, mean loss: 0.34212724478994955
Epoch: 48, step: 1288, loss: 0.33432695269584656, mean loss: 0.3421271343057908
Epoch: 48, step: 1289, loss: 0.36110448837280273, mean loss: 0.34212740309922535
Epoch: 48, step: 1290, loss: 0.3481364846229553, mean loss: 0.34212748821007793
Epoch: 48, step: 1291, loss: 0.30950304865837097, mean loss: 0.34212702613371465
Epoch: 48, step: 1292, loss: 0.30224546790122986, mean loss: 0.342126461279126
Epoch: 48, step: 1293, loss: 0.32218503952026367, mean loss: 0.3421261788467299
Epoch: 48, step: 1294, loss: 0.31658491492271423, mean loss: 0.3421258171083198
Epoch: 48, step: 1295, loss: 0.34308579564094543, mean loss: 0.3421258307042088
Epoch: 48, step: 1296, loss: 0.34685978293418884, mean loss: 0.3421258977488098
Epoch: 48, step: 1297, loss: 0.2976682484149933, mean loss: 0.34212526812624455
Epoch: 48, step: 1298, loss: 0.3282720148563385, mean loss: 0.3421250719350949
Epoch: 48, step: 1299, loss: 0.3326835632324219, mean loss: 0.34212493822540385
Epoch: 48, step: 1300, loss: 0.3526769280433655, mean loss: 0.34212508765949984
Epoch: 48, step: 1301, loss: 0.2777111530303955, mean loss: 0.3421241754617115
Epoch: 48, step: 1302, loss: 0.34793031215667725, mean loss: 0.3421242576841387
Epoch: 48, step: 1303, loss: 0.3415263593196869, mean loss: 0.34212424921724216
Epoch: 48, step: 1304, loss: 0.3369797170162201, mean loss: 0.3421241763660562
Epoch: 48, step: 1305, loss: 0.33171531558036804, mean loss: 0.34212402896934735
Epoch: 48, step: 1306, loss: 0.32676294445991516, mean loss: 0.3421238114487862
Epoch: 48, step: 1307, loss: 0.3426014482975006, mean loss: 0.3421238182122646
Epoch: 48, step: 1308, loss: 0.31507256627082825, mean loss: 0.3421234351639937
Epoch: 48, step: 1309, loss: 0.3642807602882385, mean loss: 0.3421237489093581
Epoch: 48, step: 1310, loss: 0.3136586844921112, mean loss: 0.3421233458527842
Epoch: 48, step: 1311, loss: 0.3087984323501587, mean loss: 0.3421228739889206
Epoch: 48, step: 1312, loss: 0.3197493553161621, mean loss: 0.34212255719573587
Epoch: 48, step: 1313, loss: 0.3296637535095215, mean loss: 0.3421223807903938
Epoch: 48, step: 1314, loss: 0.33114486932754517, mean loss: 0.34212222536100473
Epoch: 48, step: 1315, loss: 0.36174947023391724, mean loss: 0.3421225032570923
Epoch: 48, step: 1316, loss: 0.3439585566520691, mean loss: 0.3421225292528362
Epoch: 48, step: 1317, loss: 0.32814323902130127, mean loss: 0.3421223313299956
Epoch: 48, step: 1318, loss: 0.33452287316322327, mean loss: 0.3421222237361888
Epoch: 48, step: 1319, loss: 0.28145748376846313, mean loss: 0.3421213648515477
Epoch: 48, step: 1320, loss: 0.3318879306316376, mean loss: 0.34212121996977546
Epoch: 48, step: 1321, loss: 0.352521151304245, mean loss: 0.34212136720667746
Epoch: 48, step: 1322, loss: 0.31622448563575745, mean loss: 0.34212100057708067
Epoch: 48, step: 1323, loss: 0.3271634578704834, mean loss: 0.3421207888218467
Epoch: 48, step: 1324, loss: 0.32821643352508545, mean loss: 0.34212059197946526
Epoch: 48, step: 1325, loss: 0.31206339597702026, mean loss: 0.3421201664691733
Epoch: 48, step: 1326, loss: 0.33411234617233276, mean loss: 0.34212005310657906
Epoch: 48, step: 1327, loss: 0.30899307131767273, mean loss: 0.34211958415157073
Epoch: 48, step: 1328, loss: 0.3421040177345276, mean loss: 0.3421195839312112
Epoch: 48, step: 1329, loss: 0.34560269117355347, mean loss: 0.3421196332376754
Epoch: 48, step: 1330, loss: 0.3485916256904602, mean loss: 0.34211972485315684
Epoch: 48, step: 1331, loss: 0.3136031925678253, mean loss: 0.34211932118784505
Epoch: 48, step: 1332, loss: 0.34506022930145264, mean loss: 0.34211936281723304
Epoch: 48, step: 1333, loss: 0.3124682605266571, mean loss: 0.3421189431034164
Epoch: 48, step: 1334, loss: 0.3393629789352417, mean loss: 0.3421189040930668
Epoch: 48, step: 1335, loss: 0.3276035487651825, mean loss: 0.3421186986328226
Epoch: 48, step: 1336, loss: 0.34174010157585144, mean loss: 0.34211869327397737
Epoch: 48, step: 1337, loss: 0.3144369125366211, mean loss: 0.34211830145825567
Epoch: 48, step: 1338, loss: 0.3257705271244049, mean loss: 0.3421180700705282
Epoch: 48, step: 1339, loss: 0.2909189462661743, mean loss: 0.34211734540422284
Epoch: 48, step: 1340, loss: 0.32484492659568787, mean loss: 0.34211710093592274
Epoch: 48, step: 1341, loss: 0.3466331958770752, mean loss: 0.3421171648543837
Epoch: 48, step: 1342, loss: 0.3246673047542572, mean loss: 0.34211691788162735
Epoch: 48, step: 1343, loss: 0.36054450273513794, mean loss: 0.34211717868870467
Epoch: 48, step: 1344, loss: 0.35312917828559875, mean loss: 0.34211733454020693
Epoch: 48, step: 1345, loss: 0.3175317049026489, mean loss: 0.34211698658768014
Epoch: 48, step: 1346, loss: 0.329023540019989, mean loss: 0.3421168012829551
Epoch: 48, step: 1347, loss: 0.2990919351577759, mean loss: 0.3421161923830665
Epoch: 48, step: 1348, loss: 0.3373183608055115, mean loss: 0.34211612448377865
Epoch: 48, step: 1349, loss: 0.3532111942768097, mean loss: 0.34211628149985224
Epoch: 48, step: 1350, loss: 0.33199286460876465, mean loss: 0.3421161382365194
Epoch: 48, step: 1351, loss: 0.35492661595344543, mean loss: 0.34211631952370547
Epoch: 48, step: 1352, loss: 0.34134337306022644, mean loss: 0.34211630858552583
Epoch: 48, step: 1353, loss: 0.3554094433784485, mean loss: 0.3421164966976985
Epoch: 48, step: 1354, loss: 0.30556008219718933, mean loss: 0.34211597939238625
Epoch: 48, step: 1355, loss: 0.3179096281528473, mean loss: 0.342115636856143
Epoch: 48, step: 1356, loss: 0.36759617924690247, mean loss: 0.34211599741795073
Epoch: 48, step: 1357, loss: 0.3804073929786682, mean loss: 0.34211653925176366
Epoch: 48, step: 1358, loss: 0.3091573715209961, mean loss: 0.34211607287704515
Epoch: 48, step: 1359, loss: 0.3239041566848755, mean loss: 0.3421158151806988
Epoch: 48, step: 1360, loss: 0.3039903938770294, mean loss: 0.342115275718368
Epoch: 48, step: 1361, loss: 0.30960410833358765, mean loss: 0.3421148157024161
Epoch: 48, step: 1362, loss: 0.3040424585342407, mean loss: 0.34211427700617036
Epoch: 48, step: 1363, loss: 0.3249817192554474, mean loss: 0.3421140345963318
Epoch: 48, step: 1364, loss: 0.2958371639251709, mean loss: 0.3421133798306984
Epoch: 48, step: 1365, loss: 0.3304159641265869, mean loss: 0.3421132143277738
Epoch: 48, step: 1366, loss: 0.34223610162734985, mean loss: 0.34211321606644157
Epoch: 48, step: 1367, loss: 0.30202412605285645, mean loss: 0.34211264887501525
Epoch: 48, step: 1368, loss: 0.3716517984867096, mean loss: 0.34211306679708214
Epoch: 48, step: 1369, loss: 0.345723956823349, mean loss: 0.34211311788349774
Epoch: 48, step: 1370, loss: 0.31324875354766846, mean loss: 0.3421127095198978
Epoch: 48, step: 1371, loss: 0.3586154878139496, mean loss: 0.34211294299251244
Epoch: 48, step: 1372, loss: 0.3054314851760864, mean loss: 0.34211242404991055
Epoch: 48, step: 1373, loss: 0.3443065583705902, mean loss: 0.3421124550904889
Epoch: 48, step: 1374, loss: 0.3314554989337921, mean loss: 0.3421123043278853
Epoch: 48, step: 1375, loss: 0.30709129571914673, mean loss: 0.3421118088971388
Epoch: 48, step: 1376, loss: 0.30880898237228394, mean loss: 0.34211133777961666
Epoch: 48, step: 1377, loss: 0.32492244243621826, mean loss: 0.3421110946208199
Epoch: 48, step: 1378, loss: 0.3267548382282257, mean loss: 0.34211087739010604
Epoch: 48, step: 1379, loss: 0.31431272625923157, mean loss: 0.3421104841610118
Epoch: 48, step: 1380, loss: 0.32566508650779724, mean loss: 0.3421102515298085
Epoch: 48, step: 1381, loss: 0.2932138442993164, mean loss: 0.34210955986704744
Epoch: 48, step: 1382, loss: 0.35847389698028564, mean loss: 0.3421097913450461
Epoch: 48, step: 1383, loss: 0.31528788805007935, mean loss: 0.34210941194729666
Epoch: 48, step: 1384, loss: 0.3195565640926361, mean loss: 0.34210909294015557
Epoch: 48, step: 1385, loss: 0.2907998263835907, mean loss: 0.3421083671874248
Epoch: 48, step: 1386, loss: 0.2912556231021881, mean loss: 0.34210764790222864
Epoch: 48, step: 1387, loss: 0.34559884667396545, mean loss: 0.3421076972826922
Epoch: 48, step: 1388, loss: 0.30121809244155884, mean loss: 0.3421071189371972
Epoch: 48, step: 1389, loss: 0.31582555174827576, mean loss: 0.34210674721408907
Epoch: 48, step: 1390, loss: 0.3359076976776123, mean loss: 0.34210665953676933
Epoch: 48, step: 1391, loss: 0.31309306621551514, mean loss: 0.34210624918384275
Epoch: 48, step: 1392, loss: 0.32958534359931946, mean loss: 0.34210607209727767
Epoch: 48, step: 1393, loss: 0.3421424925327301, mean loss: 0.34210607261237447
Epoch: 48, step: 1394, loss: 0.3259531557559967, mean loss: 0.3421058441637505
Epoch: 48, step: 1395, loss: 0.3175210654735565, mean loss: 0.3421054964693073
Epoch: 48, step: 1396, loss: 0.3384065330028534, mean loss: 0.3421054441568228
Epoch: 48, step: 1397, loss: 0.32387635111808777, mean loss: 0.3421051863560444
Epoch: 48, step: 1398, loss: 0.32712772488594055, mean loss: 0.3421049745437172
Epoch: 48, step: 1399, loss: 0.33055025339126587, mean loss: 0.3421048111383383
Epoch: 48, step: 1400, loss: 0.3380906879901886, mean loss: 0.34210475437192833
Epoch: 48, step: 1401, loss: 0.33212876319885254, mean loss: 0.3421046132967357
Epoch: 48, step: 1402, loss: 0.32892587780952454, mean loss: 0.3421044269326618
Epoch: 48, step: 1403, loss: 0.29044461250305176, mean loss: 0.3421036964075412
Epoch: 48, step: 1404, loss: 0.31892454624176025, mean loss: 0.34210336863416047
Epoch: 48, step: 1405, loss: 0.37227776646614075, mean loss: 0.34210379532040486
Epoch: 48, step: 1406, loss: 0.32065367698669434, mean loss: 0.3421034920056191
Epoch: 48, step: 1407, loss: 0.3156895637512207, mean loss: 0.3421031185055024
Epoch: 48, step: 1408, loss: 0.35717979073524475, mean loss: 0.34210333169072643
Epoch: 48, step: 1409, loss: 0.3586540222167969, mean loss: 0.34210356571536554
Epoch: 48, step: 1410, loss: 0.3149579167366028, mean loss: 0.34210318188480154
Epoch: 48, step: 1411, loss: 0.3108440637588501, mean loss: 0.3421027398973839
Epoch: 48, step: 1412, loss: 0.29717206954956055, mean loss: 0.34210210461042245
Epoch: 48, step: 1413, loss: 0.361898273229599, mean loss: 0.3421023845098741
Epoch: 48, step: 1414, loss: 0.28501567244529724, mean loss: 0.34210157736815927
Epoch: 48, step: 1415, loss: 0.33580800890922546, mean loss: 0.3421014883854585
Epoch: 48, step: 1416, loss: 0.3429615795612335, mean loss: 0.34210150054583366
Epoch: 48, step: 1417, loss: 0.3298443853855133, mean loss: 0.34210132725140185
Epoch: 48, step: 1418, loss: 0.3427184224128723, mean loss: 0.34210133597593795
Epoch: 48, step: 1419, loss: 0.31331291794776917, mean loss: 0.34210092896895344
Epoch: 48, step: 1420, loss: 0.3644990026950836, mean loss: 0.3421012456255879
Epoch: 48, step: 1421, loss: 0.32372257113456726, mean loss: 0.3421009857975775
Epoch: 48, step: 1422, loss: 0.3498133420944214, mean loss: 0.3421010948292633
Epoch: 48, step: 1423, loss: 0.31884118914604187, mean loss: 0.3421007660022773
Epoch: 48, step: 1424, loss: 0.3195894658565521, mean loss: 0.3421004477628814
Epoch: 48, step: 1425, loss: 0.3280869126319885, mean loss: 0.34210024965811264
Epoch: 48, step: 1426, loss: 0.3363529443740845, mean loss: 0.3421001684114837
Epoch: 48, step: 1427, loss: 0.36507588624954224, mean loss: 0.342100493202519
Epoch: 48, step: 1428, loss: 0.3674193322658539, mean loss: 0.34210085111149774
Epoch: 48, step: 1429, loss: 0.34208208322525024, mean loss: 0.3421008508461973
Epoch: 48, step: 1430, loss: 0.3499830961227417, mean loss: 0.3421009622670485
Epoch: 48, step: 1431, loss: 0.33532872796058655, mean loss: 0.3421008665383039
Epoch: 48, step: 1432, loss: 0.3737413287162781, mean loss: 0.34210131378492453
Epoch: 48, step: 1433, loss: 0.3448101282119751, mean loss: 0.342101352074219
Epoch: 48, step: 1434, loss: 0.3000245690345764, mean loss: 0.3421007573241513
Epoch: 48, step: 1435, loss: 0.3241989016532898, mean loss: 0.34210050428723615
Epoch: 48, step: 1436, loss: 0.33553487062454224, mean loss: 0.3421004114854487
Epoch: 48, step: 1437, loss: 0.3662149906158447, mean loss: 0.34210075232755655
Epoch: 48, step: 1438, loss: 0.3320709764957428, mean loss: 0.34210061056594426
Epoch: 48, step: 1439, loss: 0.33682408928871155, mean loss: 0.3421005359882464
Epoch: 48, step: 1440, loss: 0.41622334718704224, mean loss: 0.34210158361606713
Epoch: 48, step: 1441, loss: 0.32821592688560486, mean loss: 0.3421013873634633
Epoch: 48, step: 1442, loss: 0.3477652966976166, mean loss: 0.3421014674130617
Epoch: 48, step: 1443, loss: 0.3676891028881073, mean loss: 0.34210182904508546
Valid: 48, mean loss: 0.18598807603120804
Epoch: 49, step: 0, loss: 0.32489123940467834, mean loss: 0.3421015858099336
Epoch: 49, step: 1, loss: 0.3256567418575287, mean loss: 0.3421013534002562
Epoch: 49, step: 2, loss: 0.3378685712814331, mean loss: 0.3421012935805567
Epoch: 49, step: 3, loss: 0.2975945770740509, mean loss: 0.34210066459926064
Epoch: 49, step: 4, loss: 0.33616700768470764, mean loss: 0.3421005807443559
Epoch: 49, step: 5, loss: 0.31124433875083923, mean loss: 0.3421001446876872
Epoch: 49, step: 6, loss: 0.33302515745162964, mean loss: 0.3421000164428808
Epoch: 49, step: 7, loss: 0.37356969714164734, mean loss: 0.34210046115602166
Epoch: 49, step: 8, loss: 0.3126968741416931, mean loss: 0.34210004564571267
Epoch: 49, step: 9, loss: 0.3488335907459259, mean loss: 0.34210014079797646
Epoch: 49, step: 10, loss: 0.32129865884780884, mean loss: 0.3420998468547268
Epoch: 49, step: 11, loss: 0.3303908109664917, mean loss: 0.3420996813980813
Epoch: 49, step: 12, loss: 0.3015395700931549, mean loss: 0.3420991082642048
Epoch: 49, step: 13, loss: 0.3683231770992279, mean loss: 0.34209947881767144
Epoch: 49, step: 14, loss: 0.3105662167072296, mean loss: 0.3420990332501069
Epoch: 49, step: 15, loss: 0.30543240904808044, mean loss: 0.3420985151550382
Epoch: 49, step: 16, loss: 0.33621761202812195, mean loss: 0.3420984320597458
Epoch: 49, step: 17, loss: 0.33295947313308716, mean loss: 0.34209830293098487
Epoch: 49, step: 18, loss: 0.3409439027309418, mean loss: 0.3420982866201378
Epoch: 49, step: 19, loss: 0.33376649022102356, mean loss: 0.3420981688994924
Epoch: 49, step: 20, loss: 0.2998802661895752, mean loss: 0.3420975724076559
Epoch: 49, step: 21, loss: 0.3070469796657562, mean loss: 0.34209707718890514
Epoch: 49, step: 22, loss: 0.3568660616874695, mean loss: 0.3420972858522728
Epoch: 49, step: 23, loss: 0.3124361038208008, mean loss: 0.34209686679064477
Epoch: 49, step: 24, loss: 0.3168756067752838, mean loss: 0.3420965104625339
Epoch: 49, step: 25, loss: 0.3024230897426605, mean loss: 0.3420959499609838
Epoch: 49, step: 26, loss: 0.365055114030838, mean loss: 0.3420962743208452
Epoch: 49, step: 27, loss: 0.3278959393501282, mean loss: 0.3420960737058055
Epoch: 49, step: 28, loss: 0.3187043368816376, mean loss: 0.34209574324402936
Epoch: 49, step: 29, loss: 0.3442133069038391, mean loss: 0.342095773159036
Epoch: 49, step: 30, loss: 0.32820290327072144, mean loss: 0.34209557689602316
Epoch: 49, step: 31, loss: 0.33510738611221313, mean loss: 0.3420954781760313
Epoch: 49, step: 32, loss: 0.38711631298065186, mean loss: 0.34209611416234
Epoch: 49, step: 33, loss: 0.34987354278564453, mean loss: 0.34209622402854456
Epoch: 49, step: 34, loss: 0.31563055515289307, mean loss: 0.342095850172138
Epoch: 49, step: 35, loss: 0.31794777512550354, mean loss: 0.34209550905908787
Epoch: 49, step: 36, loss: 0.3494727909564972, mean loss: 0.3420956132682879
Epoch: 49, step: 37, loss: 0.32117369771003723, mean loss: 0.3420953177359609
Epoch: 49, step: 38, loss: 0.3529263734817505, mean loss: 0.3420954707277788
Epoch: 49, step: 39, loss: 0.32263535261154175, mean loss: 0.3420951958518237
Epoch: 49, step: 40, loss: 0.3941327631473541, mean loss: 0.3420959308768572
Epoch: 49, step: 41, loss: 0.30278217792510986, mean loss: 0.3420953755821744
Epoch: 49, step: 42, loss: 0.33698147535324097, mean loss: 0.342095303350925
Epoch: 49, step: 43, loss: 0.35821831226348877, mean loss: 0.34209553107703955
Epoch: 49, step: 44, loss: 0.3284069001674652, mean loss: 0.3420953377375259
Epoch: 49, step: 45, loss: 0.3265271782875061, mean loss: 0.3420951178544795
Epoch: 49, step: 46, loss: 0.3185807764530182, mean loss: 0.3420947857450858
Epoch: 49, step: 47, loss: 0.30992186069488525, mean loss: 0.34209433135091244
Epoch: 49, step: 48, loss: 0.3893885016441345, mean loss: 0.3420949993004964
Epoch: 49, step: 49, loss: 0.3351541757583618, mean loss: 0.34209490127457287
Epoch: 49, step: 50, loss: 0.3569965064525604, mean loss: 0.34209511172841467
Epoch: 49, step: 51, loss: 0.3284328281879425, mean loss: 0.3420949187801102
Epoch: 49, step: 52, loss: 0.320112943649292, mean loss: 0.34209460833969824
Epoch: 49, step: 53, loss: 0.30792149901390076, mean loss: 0.3420941257368268
Epoch: 49, step: 54, loss: 0.3218592703342438, mean loss: 0.34209383997818194
Epoch: 49, step: 55, loss: 0.3334721028804779, mean loss: 0.3420937182228707
Epoch: 49, step: 56, loss: 0.34011298418045044, mean loss: 0.3420936902515372
Epoch: 49, step: 57, loss: 0.3508550226688385, mean loss: 0.3420938139747052
Epoch: 49, step: 58, loss: 0.35226279497146606, mean loss: 0.3420939575739567
Epoch: 49, step: 59, loss: 0.3104209303855896, mean loss: 0.3420935103158909
Epoch: 49, step: 60, loss: 0.35108959674835205, mean loss: 0.34209363734875636
Epoch: 49, step: 61, loss: 0.30628257989883423, mean loss: 0.3420931316714222
Epoch: 49, step: 62, loss: 0.35934334993362427, mean loss: 0.34209337525320477
Epoch: 49, step: 63, loss: 0.331537127494812, mean loss: 0.34209322619576676
Epoch: 49, step: 64, loss: 0.31305697560310364, mean loss: 0.34209281620084164
Epoch: 49, step: 65, loss: 0.3878510296344757, mean loss: 0.3420934623025252
Epoch: 49, step: 66, loss: 0.3395574986934662, mean loss: 0.34209342649546237
Epoch: 49, step: 67, loss: 0.35540127754211426, mean loss: 0.3420936143957652
Epoch: 49, step: 68, loss: 0.3160979449748993, mean loss: 0.342093247354898
Epoch: 49, step: 69, loss: 0.32483452558517456, mean loss: 0.3420930036771275
Epoch: 49, step: 70, loss: 0.29837894439697266, mean loss: 0.34209238648228263
Epoch: 49, step: 71, loss: 0.3146137595176697, mean loss: 0.34209199851951416
Epoch: 49, step: 72, loss: 0.3300669193267822, mean loss: 0.34209182874330396
Epoch: 49, step: 73, loss: 0.34692448377609253, mean loss: 0.34209189697223286
Epoch: 49, step: 74, loss: 0.3582509756088257, mean loss: 0.3420921251079169
Epoch: 49, step: 75, loss: 0.32935693860054016, mean loss: 0.3420919453136642
Epoch: 49, step: 76, loss: 0.3108821213245392, mean loss: 0.3420915047023109
Epoch: 49, step: 77, loss: 0.33054104447364807, mean loss: 0.3420913416385248
Epoch: 49, step: 78, loss: 0.3097347617149353, mean loss: 0.3420908848504973
Epoch: 49, step: 79, loss: 0.3346026539802551, mean loss: 0.34209077913827657
Epoch: 49, step: 80, loss: 0.3483866751194, mean loss: 0.3420908680169132
Epoch: 49, step: 81, loss: 0.3123134672641754, mean loss: 0.3420904476577733
Epoch: 49, step: 82, loss: 0.3192746639251709, mean loss: 0.34209012557835755
Epoch: 49, step: 83, loss: 0.3400909900665283, mean loss: 0.342090097357924
Epoch: 49, step: 84, loss: 0.3209698796272278, mean loss: 0.34208979922241306
Epoch: 49, step: 85, loss: 0.2995944321155548, mean loss: 0.3420891993612134
Epoch: 49, step: 86, loss: 0.3391807973384857, mean loss: 0.34208915830702286
Epoch: 49, step: 87, loss: 0.3275315761566162, mean loss: 0.3420889528191601
Epoch: 49, step: 88, loss: 0.3539949059486389, mean loss: 0.3420891208755244
Epoch: 49, step: 89, loss: 0.3344048857688904, mean loss: 0.34208901241160117
Epoch: 49, step: 90, loss: 0.3087710738182068, mean loss: 0.3420885421314398
Epoch: 49, step: 91, loss: 0.3557099997997284, mean loss: 0.34208873439456183
Epoch: 49, step: 92, loss: 0.315611869096756, mean loss: 0.3420883606861778
Epoch: 49, step: 93, loss: 0.3225453794002533, mean loss: 0.3420880848501681
Epoch: 49, step: 94, loss: 0.3529176414012909, mean loss: 0.34208823769990276
Epoch: 49, step: 95, loss: 0.3226892948150635, mean loss: 0.3420879639046269
Epoch: 49, step: 96, loss: 0.33843761682510376, mean loss: 0.3420879123846196
Epoch: 49, step: 97, loss: 0.34162676334381104, mean loss: 0.34208790587617915
Epoch: 49, step: 98, loss: 0.34367525577545166, mean loss: 0.34208792827897216
Epoch: 49, step: 99, loss: 0.3592885434627533, mean loss: 0.3420881710335051
Epoch: 49, step: 100, loss: 0.3240601122379303, mean loss: 0.34208791660474297
Epoch: 49, step: 101, loss: 0.2838948369026184, mean loss: 0.3420870953413754
Epoch: 49, step: 102, loss: 0.3369305431842804, mean loss: 0.34208702256936113
Epoch: 49, step: 103, loss: 0.34012430906295776, mean loss: 0.3420869948708922
Epoch: 49, step: 104, loss: 0.3416430354118347, mean loss: 0.3420869886056764
Epoch: 49, step: 105, loss: 0.3358859717845917, mean loss: 0.34208690109732465
Epoch: 49, step: 106, loss: 0.3230867385864258, mean loss: 0.34208663297203346
Epoch: 49, step: 107, loss: 0.365163654088974, mean loss: 0.3420869586242845
Epoch: 49, step: 108, loss: 0.31622353196144104, mean loss: 0.3420865936567171
Epoch: 49, step: 109, loss: 0.3226538300514221, mean loss: 0.34208631943828227
Epoch: 49, step: 110, loss: 0.34055984020233154, mean loss: 0.34208629789822503
Epoch: 49, step: 111, loss: 0.33800187706947327, mean loss: 0.3420862402640202
Epoch: 49, step: 112, loss: 0.31408318877220154, mean loss: 0.3420858451257864
Epoch: 49, step: 113, loss: 0.317365437746048, mean loss: 0.34208549631236207
Epoch: 49, step: 114, loss: 0.3568957448005676, mean loss: 0.3420857052870977
Epoch: 49, step: 115, loss: 0.36306536197662354, mean loss: 0.34208600130889316
Epoch: 49, step: 116, loss: 0.3485425114631653, mean loss: 0.34208609240860893
Epoch: 49, step: 117, loss: 0.376920610666275, mean loss: 0.3420865839078648
Epoch: 49, step: 118, loss: 0.3400132656097412, mean loss: 0.34208655465469656
Epoch: 49, step: 119, loss: 0.32034510374069214, mean loss: 0.3420862479013398
Epoch: 49, step: 120, loss: 0.32406339049339294, mean loss: 0.34208599361775827
Epoch: 49, step: 121, loss: 0.32674089074134827, mean loss: 0.3420857771175343
Epoch: 49, step: 122, loss: 0.35549846291542053, mean loss: 0.3420859663510985
Epoch: 49, step: 123, loss: 0.33559900522232056, mean loss: 0.3420858748307665
Epoch: 49, step: 124, loss: 0.3284742534160614, mean loss: 0.34208568279592766
Epoch: 49, step: 125, loss: 0.36709532141685486, mean loss: 0.3420860356307605
Epoch: 49, step: 126, loss: 0.37865984439849854, mean loss: 0.3420865516050952
Epoch: 49, step: 127, loss: 0.3180343210697174, mean loss: 0.34208621228690583
Epoch: 49, step: 128, loss: 0.3185400664806366, mean loss: 0.34208588011302127
Epoch: 49, step: 129, loss: 0.32746875286102295, mean loss: 0.34208567390689804
Epoch: 49, step: 130, loss: 0.3482190668582916, mean loss: 0.3420857604304207
Epoch: 49, step: 131, loss: 0.2750207781791687, mean loss: 0.3420848143608144
Epoch: 49, step: 132, loss: 0.308289498090744, mean loss: 0.3420843376251252
Epoch: 49, step: 133, loss: 0.31906944513320923, mean loss: 0.34208401296872104
Epoch: 49, step: 134, loss: 0.34260860085487366, mean loss: 0.34208402036864327
Epoch: 49, step: 135, loss: 0.30340903997421265, mean loss: 0.34208347482076207
Epoch: 49, step: 136, loss: 0.38516101241111755, mean loss: 0.3420840824623852
Epoch: 49, step: 137, loss: 0.379300594329834, mean loss: 0.34208460742235175
Epoch: 49, step: 138, loss: 0.30947619676589966, mean loss: 0.34208414746874916
Epoch: 49, step: 139, loss: 0.3263430595397949, mean loss: 0.3420839254380573
Epoch: 49, step: 140, loss: 0.3095666468143463, mean loss: 0.3420834667828445
Epoch: 49, step: 141, loss: 0.30131056904792786, mean loss: 0.3420828916904902
Epoch: 49, step: 142, loss: 0.3288504183292389, mean loss: 0.34208270505212635
Epoch: 49, step: 143, loss: 0.38645318150520325, mean loss: 0.3420833308698478
Epoch: 49, step: 144, loss: 0.3600941598415375, mean loss: 0.3420835848977032
Epoch: 49, step: 145, loss: 0.36150431632995605, mean loss: 0.3420838588072041
Epoch: 49, step: 146, loss: 0.3338513672351837, mean loss: 0.3420837426979905
Epoch: 49, step: 147, loss: 0.3264412581920624, mean loss: 0.342083522083011
Epoch: 49, step: 148, loss: 0.33953696489334106, mean loss: 0.342083486167953
Epoch: 49, step: 149, loss: 0.30315646529197693, mean loss: 0.3420829371732152
Epoch: 49, step: 150, loss: 0.33267176151275635, mean loss: 0.3420828044475935
Epoch: 49, step: 151, loss: 0.3427538275718689, mean loss: 0.3420828139108857
Epoch: 49, step: 152, loss: 0.32867008447647095, mean loss: 0.34208262475676654
Epoch: 49, step: 153, loss: 0.34731581807136536, mean loss: 0.3420826985572646
Epoch: 49, step: 154, loss: 0.37343332171440125, mean loss: 0.34208314066953427
Epoch: 49, step: 155, loss: 0.3152145445346832, mean loss: 0.34208276176897956
Epoch: 49, step: 156, loss: 0.3542385697364807, mean loss: 0.34208293318759064
Epoch: 49, step: 157, loss: 0.31562092900276184, mean loss: 0.34208256003131426
Epoch: 49, step: 158, loss: 0.3572368323802948, mean loss: 0.3420827737276035
Epoch: 49, step: 159, loss: 0.3125045597553253, mean loss: 0.34208235663958425
Epoch: 49, step: 160, loss: 0.37478092312812805, mean loss: 0.34208281772178584
Epoch: 49, step: 161, loss: 0.2848745286464691, mean loss: 0.3420820110395743
Epoch: 49, step: 162, loss: 0.30991172790527344, mean loss: 0.3420815574194847
Epoch: 49, step: 163, loss: 0.34214624762535095, mean loss: 0.34208155833164217
Epoch: 49, step: 164, loss: 0.3327171504497528, mean loss: 0.34208142629165567
Epoch: 49, step: 165, loss: 0.30009493231773376, mean loss: 0.34208083428220903
Epoch: 49, step: 166, loss: 0.30980971455574036, mean loss: 0.3420803792659276
Epoch: 49, step: 167, loss: 0.3601883053779602, mean loss: 0.34208063458043486
Epoch: 49, step: 168, loss: 0.3595867455005646, mean loss: 0.34208088140610876
Epoch: 49, step: 169, loss: 0.33779799938201904, mean loss: 0.34208082102089005
Epoch: 49, step: 170, loss: 0.3000848591327667, mean loss: 0.342080228919689
Epoch: 49, step: 171, loss: 0.3309069275856018, mean loss: 0.34208007138949875
Epoch: 49, step: 172, loss: 0.3027745187282562, mean loss: 0.342079517236012
Epoch: 49, step: 173, loss: 0.3567427694797516, mean loss: 0.3420797239645083
Epoch: 49, step: 174, loss: 0.34232813119888306, mean loss: 0.3420797274666052
Epoch: 49, step: 175, loss: 0.40236133337020874, mean loss: 0.3420805773172495
Epoch: 49, step: 176, loss: 0.32328975200653076, mean loss: 0.34208031240775305
Epoch: 49, step: 177, loss: 0.32343581318855286, mean loss: 0.34208004956483967
Epoch: 49, step: 178, loss: 0.37944185733795166, mean loss: 0.3420805762696789
Epoch: 49, step: 179, loss: 0.3388841152191162, mean loss: 0.3420805312084822
Epoch: 49, step: 180, loss: 0.35902082920074463, mean loss: 0.3420807700161283
Epoch: 49, step: 181, loss: 0.3183193504810333, mean loss: 0.3420804350557469
Epoch: 49, step: 182, loss: 0.34093448519706726, mean loss: 0.34208041890172924
Epoch: 49, step: 183, loss: 0.33016544580459595, mean loss: 0.34208025094327005
Epoch: 49, step: 184, loss: 0.3457227051258087, mean loss: 0.3420803022881085
Epoch: 49, step: 185, loss: 0.2996572256088257, mean loss: 0.34207970429148193
Epoch: 49, step: 186, loss: 0.3599311411380768, mean loss: 0.3420799559221833
Epoch: 49, step: 187, loss: 0.3295104503631592, mean loss: 0.34207977874715007
Epoch: 49, step: 188, loss: 0.30859145522117615, mean loss: 0.3420793067149628
Epoch: 49, step: 189, loss: 0.34187790751457214, mean loss: 0.3420793038761953
Epoch: 49, step: 190, loss: 0.32440048456192017, mean loss: 0.34207905469273
Epoch: 49, step: 191, loss: 0.3177531659603119, mean loss: 0.3420787118234633
Epoch: 49, step: 192, loss: 0.3827580213546753, mean loss: 0.3420792851833349
Epoch: 49, step: 193, loss: 0.3506605625152588, mean loss: 0.34207940613157073
Epoch: 49, step: 194, loss: 0.33734190464019775, mean loss: 0.3420793393601159
Epoch: 49, step: 195, loss: 0.33914634585380554, mean loss: 0.3420792980224016
Epoch: 49, step: 196, loss: 0.2932104170322418, mean loss: 0.34207860927237005
Epoch: 49, step: 197, loss: 0.3842618763446808, mean loss: 0.3420792037880714
Epoch: 49, step: 198, loss: 0.3353171646595001, mean loss: 0.342079108487682
Epoch: 49, step: 199, loss: 0.3246650993824005, mean loss: 0.342078863067857
Epoch: 49, step: 200, loss: 0.3758889138698578, mean loss: 0.34207933955433195
Epoch: 49, step: 201, loss: 0.36049795150756836, mean loss: 0.3420795991249505
Epoch: 49, step: 202, loss: 0.3663214445114136, mean loss: 0.34207994075667286
Epoch: 49, step: 203, loss: 0.3364849388599396, mean loss: 0.34207986190940826
Epoch: 49, step: 204, loss: 0.30973687767982483, mean loss: 0.3420794061240581
Epoch: 49, step: 205, loss: 0.31529223918914795, mean loss: 0.342079028637982
Epoch: 49, step: 206, loss: 0.31390732526779175, mean loss: 0.3420786316465446
Epoch: 49, step: 207, loss: 0.3452190160751343, mean loss: 0.34207867589974944
Epoch: 49, step: 208, loss: 0.35713547468185425, mean loss: 0.3420788880719298
Epoch: 49, step: 209, loss: 0.32003337144851685, mean loss: 0.3420785774229342
Epoch: 49, step: 210, loss: 0.3480556607246399, mean loss: 0.34207866164635214
Epoch: 49, step: 211, loss: 0.3300914466381073, mean loss: 0.34207849273620944
Epoch: 49, step: 212, loss: 0.3210035562515259, mean loss: 0.34207819577645965
Epoch: 49, step: 213, loss: 0.3258321285247803, mean loss: 0.3420779668618866
Epoch: 49, step: 214, loss: 0.3012412488460541, mean loss: 0.34207739146182153
Epoch: 49, step: 215, loss: 0.349884569644928, mean loss: 0.34207750146545934
Epoch: 49, step: 216, loss: 0.3287588357925415, mean loss: 0.3420773138072559
Epoch: 49, step: 217, loss: 0.29094401001930237, mean loss: 0.34207659335605145
Epoch: 49, step: 218, loss: 0.36390674114227295, mean loss: 0.3420769009312228
Epoch: 49, step: 219, loss: 0.2785152196884155, mean loss: 0.34207600539355876
Epoch: 49, step: 220, loss: 0.34960678219795227, mean loss: 0.34207611149520867
Epoch: 49, step: 221, loss: 0.3552896976470947, mean loss: 0.3420762976597407
Epoch: 49, step: 222, loss: 0.3080833852291107, mean loss: 0.34207581874467524
Epoch: 49, step: 223, loss: 0.3637753129005432, mean loss: 0.34207612445746977
Epoch: 49, step: 224, loss: 0.34745222330093384, mean loss: 0.34207620019744023
Epoch: 49, step: 225, loss: 0.35462215542793274, mean loss: 0.3420763769458445
Epoch: 49, step: 226, loss: 0.29822245240211487, mean loss: 0.3420757591370093
Epoch: 49, step: 227, loss: 0.3026397228240967, mean loss: 0.342075203574681
Epoch: 49, step: 228, loss: 0.314582496881485, mean loss: 0.3420748162716354
Epoch: 49, step: 229, loss: 0.3416450023651123, mean loss: 0.3420748102167245
Epoch: 49, step: 230, loss: 0.35374611616134644, mean loss: 0.34207497463141934
Epoch: 49, step: 231, loss: 0.34824544191360474, mean loss: 0.3420750615541004
Epoch: 49, step: 232, loss: 0.3557462692260742, mean loss: 0.3420752541361578
Epoch: 49, step: 233, loss: 0.32277318835258484, mean loss: 0.3420749822377808
Epoch: 49, step: 234, loss: 0.32875868678092957, mean loss: 0.3420747946605463
Epoch: 49, step: 235, loss: 0.3567969501018524, mean loss: 0.3420750020382148
Epoch: 49, step: 236, loss: 0.3905338943004608, mean loss: 0.3420756846251214
Epoch: 49, step: 237, loss: 0.3373135030269623, mean loss: 0.34207561754647253
Epoch: 49, step: 238, loss: 0.3158529996871948, mean loss: 0.34207524818781543
Epoch: 49, step: 239, loss: 0.3394469618797302, mean loss: 0.34207521116761275
Epoch: 49, step: 240, loss: 0.34602367877960205, mean loss: 0.34207526678218253
Epoch: 49, step: 241, loss: 0.34206900000572205, mean loss: 0.3420752666939156
Epoch: 49, step: 242, loss: 0.3357526659965515, mean loss: 0.3420751776419473
Epoch: 49, step: 243, loss: 0.4057007431983948, mean loss: 0.34207607377667343
Epoch: 49, step: 244, loss: 0.353804349899292, mean loss: 0.34207623896133454
Epoch: 49, step: 245, loss: 0.29364168643951416, mean loss: 0.3420755568037542
Epoch: 49, step: 246, loss: 0.30607596039772034, mean loss: 0.34207504978860825
Epoch: 49, step: 247, loss: 0.3234303891658783, mean loss: 0.34207478720254797
Epoch: 49, step: 248, loss: 0.3093169331550598, mean loss: 0.3420743258568111
Epoch: 49, step: 249, loss: 0.3037238121032715, mean loss: 0.34207378575437253
Epoch: 49, step: 250, loss: 0.29943710565567017, mean loss: 0.34207318529695147
Epoch: 49, step: 251, loss: 0.3106231391429901, mean loss: 0.34207274238846014
Epoch: 49, step: 252, loss: 0.3253391683101654, mean loss: 0.3420725067341899
Epoch: 49, step: 253, loss: 0.34681859612464905, mean loss: 0.34207257357110565
Epoch: 49, step: 254, loss: 0.34426450729370117, mean loss: 0.3420726044386293
Epoch: 49, step: 255, loss: 0.31867319345474243, mean loss: 0.3420722749251529
Epoch: 49, step: 256, loss: 0.2969614267349243, mean loss: 0.34207163967740684
Epoch: 49, step: 257, loss: 0.3197923004627228, mean loss: 0.34207132594575934
Epoch: 49, step: 258, loss: 0.3584403693675995, mean loss: 0.34207155644696924
Epoch: 49, step: 259, loss: 0.3163091838359833, mean loss: 0.34207119367840144
Epoch: 49, step: 260, loss: 0.3113461136817932, mean loss: 0.34207076103438666
Epoch: 49, step: 261, loss: 0.32313084602355957, mean loss: 0.3420704943426323
Epoch: 49, step: 262, loss: 0.3836636543273926, mean loss: 0.3420710800050605
Epoch: 49, step: 263, loss: 0.33912116289138794, mean loss: 0.3420710384686325
Epoch: 49, step: 264, loss: 0.3367030620574951, mean loss: 0.34207096288568645
Epoch: 49, step: 265, loss: 0.3365556597709656, mean loss: 0.3420708852294234
Epoch: 49, step: 266, loss: 0.36917829513549805, mean loss: 0.3420712669002893
Epoch: 49, step: 267, loss: 0.3571205139160156, mean loss: 0.3420714787898902
Epoch: 49, step: 268, loss: 0.31726598739624023, mean loss: 0.3420711295397474
Epoch: 49, step: 269, loss: 0.34035810828208923, mean loss: 0.3420711054215195
Epoch: 49, step: 270, loss: 0.32880574464797974, mean loss: 0.34207091865647554
Epoch: 49, step: 271, loss: 0.30322420597076416, mean loss: 0.34207037173536436
Epoch: 49, step: 272, loss: 0.30609965324401855, mean loss: 0.34206986531237527
Epoch: 49, step: 273, loss: 0.3282662332057953, mean loss: 0.34206967097713514
Epoch: 49, step: 274, loss: 0.4007086455821991, mean loss: 0.34207049651773863
Epoch: 49, step: 275, loss: 0.346382200717926, mean loss: 0.3420705572186087
Epoch: 49, step: 276, loss: 0.2958669662475586, mean loss: 0.34206990676612925
Epoch: 49, step: 277, loss: 0.3253612518310547, mean loss: 0.34206967154560197
Epoch: 49, step: 278, loss: 0.372239887714386, mean loss: 0.34207009626885343
Epoch: 49, step: 279, loss: 0.34123486280441284, mean loss: 0.34207008451096355
Epoch: 49, step: 280, loss: 0.3129291534423828, mean loss: 0.3420696742890923
Epoch: 49, step: 281, loss: 0.3361614942550659, mean loss: 0.3420695911198021
Epoch: 49, step: 282, loss: 0.3516201972961426, mean loss: 0.3420697255615338
Epoch: 49, step: 283, loss: 0.3390008211135864, mean loss: 0.34206968236186536
Epoch: 49, step: 284, loss: 0.3401109278202057, mean loss: 0.3420696547896952
Epoch: 49, step: 285, loss: 0.2967569828033447, mean loss: 0.342069016960355
Epoch: 49, step: 286, loss: 0.326842725276947, mean loss: 0.34206880263534506
Epoch: 49, step: 287, loss: 0.3551824986934662, mean loss: 0.3420689872208985
Epoch: 49, step: 288, loss: 0.29963624477386475, mean loss: 0.3420683899551874
Epoch: 49, step: 289, loss: 0.33459216356277466, mean loss: 0.3420682847244018
Epoch: 49, step: 290, loss: 0.3405399024486542, mean loss: 0.3420682632121314
Epoch: 49, step: 291, loss: 0.3556973934173584, mean loss: 0.34206845504202393
Epoch: 49, step: 292, loss: 0.34177279472351074, mean loss: 0.342068450880666
Epoch: 49, step: 293, loss: 0.29421550035476685, mean loss: 0.3420677773697508
Epoch: 49, step: 294, loss: 0.3344326317310333, mean loss: 0.3420676699096779
Epoch: 49, step: 295, loss: 0.30649903416633606, mean loss: 0.34206716930961395
Epoch: 49, step: 296, loss: 0.3488616943359375, mean loss: 0.3420672649357666
Epoch: 49, step: 297, loss: 0.2992118299007416, mean loss: 0.34206666179681544
Epoch: 49, step: 298, loss: 0.35625386238098145, mean loss: 0.3420668614618719
Epoch: 49, step: 299, loss: 0.3017694354057312, mean loss: 0.34206629433979835
Epoch: 49, step: 300, loss: 0.33915385603904724, mean loss: 0.34206625335244595
Epoch: 49, step: 301, loss: 0.31557437777519226, mean loss: 0.3420658805319954
Epoch: 49, step: 302, loss: 0.29158180952072144, mean loss: 0.342065170079118
Epoch: 49, step: 303, loss: 0.31488141417503357, mean loss: 0.3420647875325953
Epoch: 49, step: 304, loss: 0.35176435112953186, mean loss: 0.3420649240288956
Epoch: 49, step: 305, loss: 0.3423217236995697, mean loss: 0.3420649276426367
Epoch: 49, step: 306, loss: 0.3491402864456177, mean loss: 0.34206502720723153
Epoch: 49, step: 307, loss: 0.35016608238220215, mean loss: 0.3420651412038427
Epoch: 49, step: 308, loss: 0.3024364411830902, mean loss: 0.3420645835636538
Epoch: 49, step: 309, loss: 0.34446850419044495, mean loss: 0.3420646173902464
Epoch: 49, step: 310, loss: 0.3227814733982086, mean loss: 0.34206434605271996
Epoch: 49, step: 311, loss: 0.3339272737503052, mean loss: 0.3420642315557269
Epoch: 49, step: 312, loss: 0.332163006067276, mean loss: 0.3420640922372408
Epoch: 49, step: 313, loss: 0.3242679536342621, mean loss: 0.3420638418342775
Epoch: 49, step: 314, loss: 0.32473087310791016, mean loss: 0.3420635979518399
Epoch: 49, step: 315, loss: 0.3255506157875061, mean loss: 0.3420633656102403
Epoch: 49, step: 316, loss: 0.3100045323371887, mean loss: 0.34206291454115256
Epoch: 49, step: 317, loss: 0.3346720039844513, mean loss: 0.3420628105522036
Epoch: 49, step: 318, loss: 0.3333164155483246, mean loss: 0.34206268749353314
Epoch: 49, step: 319, loss: 0.3186204433441162, mean loss: 0.34206235767412646
Epoch: 49, step: 320, loss: 0.30840402841567993, mean loss: 0.3420618841267165
Epoch: 49, step: 321, loss: 0.3340717554092407, mean loss: 0.34206177171318886
Epoch: 49, step: 322, loss: 0.3062158524990082, mean loss: 0.342061267402222
Epoch: 49, step: 323, loss: 0.350005567073822, mean loss: 0.3420613791678336
Epoch: 49, step: 324, loss: 0.3355104923248291, mean loss: 0.342061287006963
Epoch: 49, step: 325, loss: 0.3427381217479706, mean loss: 0.34206129652884953
Epoch: 49, step: 326, loss: 0.39521628618240356, mean loss: 0.34206204431650133
Epoch: 49, step: 327, loss: 0.2923162579536438, mean loss: 0.3420613444995754
Epoch: 49, step: 328, loss: 0.3400372862815857, mean loss: 0.34206131602580153
Epoch: 49, step: 329, loss: 0.33060422539711, mean loss: 0.3420611548535506
Epoch: 49, step: 330, loss: 0.3449912667274475, mean loss: 0.3420611960722245
Epoch: 49, step: 331, loss: 0.304926335811615, mean loss: 0.34206067369347903
Epoch: 49, step: 332, loss: 0.29114842414855957, mean loss: 0.3420599575172838
Epoch: 49, step: 333, loss: 0.3177637755870819, mean loss: 0.3420596157507635
Epoch: 49, step: 334, loss: 0.35566654801368713, mean loss: 0.3420598071523792
Epoch: 49, step: 335, loss: 0.35642850399017334, mean loss: 0.34206000926649666
Epoch: 49, step: 336, loss: 0.35062599182128906, mean loss: 0.34206012975631356
Epoch: 49, step: 337, loss: 0.37755081057548523, mean loss: 0.34206062896413447
Epoch: 49, step: 338, loss: 0.3088345229625702, mean loss: 0.3420601616161353
Epoch: 49, step: 339, loss: 0.32728925347328186, mean loss: 0.3420599538560905
Epoch: 49, step: 340, loss: 0.3240165710449219, mean loss: 0.34205970007065917
Epoch: 49, step: 341, loss: 0.3319908380508423, mean loss: 0.3420595584511759
Epoch: 49, step: 342, loss: 0.3611004650592804, mean loss: 0.3420598262595362
Epoch: 49, step: 343, loss: 0.32904744148254395, mean loss: 0.3420596432442791
Epoch: 49, step: 344, loss: 0.33798879384994507, mean loss: 0.34205958598981867
Epoch: 49, step: 345, loss: 0.35438308119773865, mean loss: 0.3420597593111768
Epoch: 49, step: 346, loss: 0.337860107421875, mean loss: 0.34205970024683513
Epoch: 49, step: 347, loss: 0.32196044921875, mean loss: 0.34205941757285013
Epoch: 49, step: 348, loss: 0.3068755567073822, mean loss: 0.3420589227572835
Epoch: 49, step: 349, loss: 0.3444640636444092, mean loss: 0.34205895658200836
Epoch: 49, step: 350, loss: 0.3300658166408539, mean loss: 0.34205878791872707
Epoch: 49, step: 351, loss: 0.3388752043247223, mean loss: 0.342058743147624
Epoch: 49, step: 352, loss: 0.339110404253006, mean loss: 0.3420587016853774
Epoch: 49, step: 353, loss: 0.3643735349178314, mean loss: 0.34205901549262296
Epoch: 49, step: 354, loss: 0.34527039527893066, mean loss: 0.3420590606527218
Epoch: 49, step: 355, loss: 0.3247511684894562, mean loss: 0.3420588172635306
Epoch: 49, step: 356, loss: 0.35468631982803345, mean loss: 0.34205899483306873
Epoch: 49, step: 357, loss: 0.27516740560531616, mean loss: 0.3420580542083081
Epoch: 49, step: 358, loss: 0.3611930310726166, mean loss: 0.34205832327920543
Epoch: 49, step: 359, loss: 0.3319178521633148, mean loss: 0.3420581806886335
Epoch: 49, step: 360, loss: 0.3428307771682739, mean loss: 0.3420581915523718
Epoch: 49, step: 361, loss: 0.31483662128448486, mean loss: 0.3420578087861204
Epoch: 49, step: 362, loss: 0.3178364932537079, mean loss: 0.3420574682116532
Epoch: 49, step: 363, loss: 0.33687007427215576, mean loss: 0.3420573952730433
Epoch: 49, step: 364, loss: 0.3112070560455322, mean loss: 0.3420569615004694
Epoch: 49, step: 365, loss: 0.3657044470310211, mean loss: 0.3420572939923218
Epoch: 49, step: 366, loss: 0.2999516427516937, mean loss: 0.3420567019805782
Epoch: 49, step: 367, loss: 0.33399128913879395, mean loss: 0.34205658858126375
Epoch: 49, step: 368, loss: 0.3244397044181824, mean loss: 0.342056340892207
Epoch: 49, step: 369, loss: 0.33637097477912903, mean loss: 0.34205626095848213
Epoch: 49, step: 370, loss: 0.31652703881263733, mean loss: 0.3420559020339929
Epoch: 49, step: 371, loss: 0.3399529755115509, mean loss: 0.34205587246861047
Epoch: 49, step: 372, loss: 0.3179113268852234, mean loss: 0.3420555330213304
Epoch: 49, step: 373, loss: 0.321370929479599, mean loss: 0.3420552422213369
Epoch: 49, step: 374, loss: 0.36711323261260986, mean loss: 0.3420555945007986
Epoch: 49, step: 375, loss: 0.3009359836578369, mean loss: 0.34205501642608055
Epoch: 49, step: 376, loss: 0.3125629723072052, mean loss: 0.3420546018218305
Epoch: 49, step: 377, loss: 0.3439052402973175, mean loss: 0.3420546278380601
Epoch: 49, step: 378, loss: 0.3221696615219116, mean loss: 0.3420543482996287
Epoch: 49, step: 379, loss: 0.3558598756790161, mean loss: 0.34205454237193217
Epoch: 49, step: 380, loss: 0.36028560996055603, mean loss: 0.3420547986530178
Epoch: 49, step: 381, loss: 0.33672448992729187, mean loss: 0.3420547237238839
Epoch: 49, step: 382, loss: 0.34347742795944214, mean loss: 0.34205474372281885
Epoch: 49, step: 383, loss: 0.3400837182998657, mean loss: 0.34205471601652954
Epoch: 49, step: 384, loss: 0.2972213327884674, mean loss: 0.34205408581196073
Epoch: 49, step: 385, loss: 0.3369992673397064, mean loss: 0.3420540147594394
Epoch: 49, step: 386, loss: 0.36433184146881104, mean loss: 0.34205432790095314
Epoch: 49, step: 387, loss: 0.3606407642364502, mean loss: 0.3420545891518855
Epoch: 49, step: 388, loss: 0.3590935170650482, mean loss: 0.3420548286476746
Epoch: 49, step: 389, loss: 0.32313835620880127, mean loss: 0.3420545627652295
Epoch: 49, step: 390, loss: 0.29193490743637085, mean loss: 0.34205385831310464
Epoch: 49, step: 391, loss: 0.3361508846282959, mean loss: 0.3420537753455766
Epoch: 49, step: 392, loss: 0.29940667748451233, mean loss: 0.3420531759401337
Epoch: 49, step: 393, loss: 0.3178788423538208, mean loss: 0.34205283617437704
Epoch: 49, step: 394, loss: 0.3780926465988159, mean loss: 0.34205334270008186
Epoch: 49, step: 395, loss: 0.3044552505016327, mean loss: 0.34205281428075146
Epoch: 49, step: 396, loss: 0.30924588441848755, mean loss: 0.34205235320490274
Epoch: 49, step: 397, loss: 0.32186323404312134, mean loss: 0.3420520694665442
Epoch: 49, step: 398, loss: 0.29599273204803467, mean loss: 0.3420514221566234
Epoch: 49, step: 399, loss: 0.2964398264884949, mean loss: 0.34205078114819587
Epoch: 49, step: 400, loss: 0.32890209555625916, mean loss: 0.3420505963640483
Epoch: 49, step: 401, loss: 0.35279202461242676, mean loss: 0.34205074731584917
Epoch: 49, step: 402, loss: 0.31355202198028564, mean loss: 0.34205034682223157
Epoch: 49, step: 403, loss: 0.34373414516448975, mean loss: 0.34205037048437803
Epoch: 49, step: 404, loss: 0.32875150442123413, mean loss: 0.34205018360018496
Epoch: 49, step: 405, loss: 0.31648290157318115, mean loss: 0.3420498243173932
Epoch: 49, step: 406, loss: 0.3501111567020416, mean loss: 0.342049937597221
Epoch: 49, step: 407, loss: 0.3241892457008362, mean loss: 0.3420496866179071
Epoch: 49, step: 408, loss: 0.32039886713027954, mean loss: 0.34204938238381044
Epoch: 49, step: 409, loss: 0.35280659794807434, mean loss: 0.34204953354048023
Epoch: 49, step: 410, loss: 0.32727643847465515, mean loss: 0.3420493259569785
Epoch: 49, step: 411, loss: 0.3210248351097107, mean loss: 0.34204903053641245
Epoch: 49, step: 412, loss: 0.319512277841568, mean loss: 0.342048713871113
Epoch: 49, step: 413, loss: 0.3459216356277466, mean loss: 0.3420487682890104
Epoch: 49, step: 414, loss: 0.36701804399490356, mean loss: 0.34204911912398117
Epoch: 49, step: 415, loss: 0.404477596282959, mean loss: 0.34204999627338206
Epoch: 49, step: 416, loss: 0.3173188269138336, mean loss: 0.34204964879372884
Epoch: 49, step: 417, loss: 0.3318660855293274, mean loss: 0.34204950571390663
Epoch: 49, step: 418, loss: 0.35112836956977844, mean loss: 0.34204963327082766
Epoch: 49, step: 419, loss: 0.3771257996559143, mean loss: 0.34205012607972934
Epoch: 49, step: 420, loss: 0.3263058066368103, mean loss: 0.3420499048801924
Epoch: 49, step: 421, loss: 0.31137505173683167, mean loss: 0.34204947392044155
Epoch: 49, step: 422, loss: 0.33781927824020386, mean loss: 0.3420494144900523
Epoch: 49, step: 423, loss: 0.35626256465911865, mean loss: 0.3420496141690375
Epoch: 49, step: 424, loss: 0.3373161256313324, mean loss: 0.3420495476697113
Epoch: 49, step: 425, loss: 0.3129933476448059, mean loss: 0.3420491394738187
Epoch: 49, step: 426, loss: 0.31336331367492676, mean loss: 0.34204873648678813
Epoch: 49, step: 427, loss: 0.3494877517223358, mean loss: 0.3420488409908232
Epoch: 49, step: 428, loss: 0.337789922952652, mean loss: 0.34204878116195425
Epoch: 49, step: 429, loss: 0.2838490605354309, mean loss: 0.34204796358938905
Epoch: 49, step: 430, loss: 0.35943445563316345, mean loss: 0.34204820782628687
Epoch: 49, step: 431, loss: 0.3151092827320099, mean loss: 0.34204782940681877
Epoch: 49, step: 432, loss: 0.36595654487609863, mean loss: 0.34204816525527104
Epoch: 49, step: 433, loss: 0.3236238956451416, mean loss: 0.3420479064510905
Epoch: 49, step: 434, loss: 0.38497471809387207, mean loss: 0.3420485094319679
Epoch: 49, step: 435, loss: 0.31572994589805603, mean loss: 0.3420481397476841
Epoch: 49, step: 436, loss: 0.3550545871257782, mean loss: 0.3420483224404682
Epoch: 49, step: 437, loss: 0.31730103492736816, mean loss: 0.3420479748369129
Epoch: 49, step: 438, loss: 0.3435138463973999, mean loss: 0.3420479954264425
Epoch: 49, step: 439, loss: 0.3171045184135437, mean loss: 0.3420476450770266
Epoch: 49, step: 440, loss: 0.32234975695610046, mean loss: 0.34204736840963723
Epoch: 49, step: 441, loss: 0.3258315622806549, mean loss: 0.3420471406531535
Epoch: 49, step: 442, loss: 0.29427194595336914, mean loss: 0.34204646964380364
Epoch: 49, step: 443, loss: 0.3348240554332733, mean loss: 0.3420463682054018
Epoch: 49, step: 444, loss: 0.34982338547706604, mean loss: 0.3420464774316384
Epoch: 49, step: 445, loss: 0.3385687470436096, mean loss: 0.3420464285884825
Epoch: 49, step: 446, loss: 0.3262084722518921, mean loss: 0.34204620615464776
Epoch: 49, step: 447, loss: 0.3137260973453522, mean loss: 0.34204580842265503
Epoch: 49, step: 448, loss: 0.3324125409126282, mean loss: 0.3420456731334547
Epoch: 49, step: 449, loss: 0.385101318359375, mean loss: 0.3420462777966183
Epoch: 49, step: 450, loss: 0.310968279838562, mean loss: 0.3420458413507919
Epoch: 49, step: 451, loss: 0.3450927436351776, mean loss: 0.3420458841395556
Epoch: 49, step: 452, loss: 0.3172324299812317, mean loss: 0.3420455356800328
Epoch: 49, step: 453, loss: 0.32858315110206604, mean loss: 0.34204534662814995
Epoch: 49, step: 454, loss: 0.3086972236633301, mean loss: 0.34204487832798613
Epoch: 49, step: 455, loss: 0.30924439430236816, mean loss: 0.3420444177246605
Epoch: 49, step: 456, loss: 0.33741798996925354, mean loss: 0.34204435275860434
Epoch: 49, step: 457, loss: 0.3626915514469147, mean loss: 0.3420446426903409
Epoch: 49, step: 458, loss: 0.29615285992622375, mean loss: 0.34204399827859105
Epoch: 49, step: 459, loss: 0.36606791615486145, mean loss: 0.34204433561736153
Epoch: 49, step: 460, loss: 0.3156442642211914, mean loss: 0.34204396491835154
Epoch: 49, step: 461, loss: 0.30386871099472046, mean loss: 0.342043428884569
Epoch: 49, step: 462, loss: 0.2860223948955536, mean loss: 0.3420426422822018
Epoch: 49, step: 463, loss: 0.3376533091068268, mean loss: 0.34204258065157594
Epoch: 49, step: 464, loss: 0.35477885603904724, mean loss: 0.3420427594791042
Epoch: 49, step: 465, loss: 0.2957206666469574, mean loss: 0.342042109088876
Epoch: 49, step: 466, loss: 0.3178960680961609, mean loss: 0.34204177006860176
Epoch: 49, step: 467, loss: 0.40229982137680054, mean loss: 0.3420426161043665
Epoch: 49, step: 468, loss: 0.31458473205566406, mean loss: 0.34204223059528893
Epoch: 49, step: 469, loss: 0.3064810037612915, mean loss: 0.3420417313221747
Epoch: 49, step: 470, loss: 0.2888341248035431, mean loss: 0.3420409843076083
Epoch: 49, step: 471, loss: 0.31170275807380676, mean loss: 0.3420405583764263
Epoch: 49, step: 472, loss: 0.30958062410354614, mean loss: 0.3420401026640862
Epoch: 49, step: 473, loss: 0.34711846709251404, mean loss: 0.3420401739593891
Epoch: 49, step: 474, loss: 0.3249892294406891, mean loss: 0.3420399345840537
Epoch: 49, step: 475, loss: 0.3454241454601288, mean loss: 0.34203998209375264
Epoch: 49, step: 476, loss: 0.2983832061290741, mean loss: 0.3420393692208431
Epoch: 49, step: 477, loss: 0.3103879988193512, mean loss: 0.34203892489130383
Epoch: 49, step: 478, loss: 0.32133400440216064, mean loss: 0.3420386342347377
Epoch: 49, step: 479, loss: 0.3123149275779724, mean loss: 0.3420382169779201
Epoch: 49, step: 480, loss: 0.2923148572444916, mean loss: 0.3420375189788503
Epoch: 49, step: 481, loss: 0.33944597840309143, mean loss: 0.3420374826002241
Epoch: 49, step: 482, loss: 0.29851141571998596, mean loss: 0.34203687161372964
Epoch: 49, step: 483, loss: 0.33139827847480774, mean loss: 0.34203672227918247
Epoch: 49, step: 484, loss: 0.29409363865852356, mean loss: 0.34203604930879156
Epoch: 49, step: 485, loss: 0.36826464533805847, mean loss: 0.34203641747077507
Epoch: 49, step: 486, loss: 0.33258652687072754, mean loss: 0.34203628482769993
Epoch: 49, step: 487, loss: 0.3172467052936554, mean loss: 0.3420359368744753
Epoch: 49, step: 488, loss: 0.3073805272579193, mean loss: 0.34203545044862627
Epoch: 49, step: 489, loss: 0.3357953429222107, mean loss: 0.3420353628632527
Epoch: 49, step: 490, loss: 0.31329986453056335, mean loss: 0.34203495954103097
Epoch: 49, step: 491, loss: 0.3089193105697632, mean loss: 0.3420344947469459
Epoch: 49, step: 492, loss: 0.3520614206790924, mean loss: 0.3420346354777061
Epoch: 49, step: 493, loss: 0.2938201427459717, mean loss: 0.34203395878307125
Epoch: 49, step: 494, loss: 0.31795534491539, mean loss: 0.3420336208423565
Epoch: 49, step: 495, loss: 0.3731187880039215, mean loss: 0.3420340571131582
Epoch: 49, step: 496, loss: 0.3803222179412842, mean loss: 0.34203459446822854
Epoch: 49, step: 497, loss: 0.3170700669288635, mean loss: 0.342034244108564
Epoch: 49, step: 498, loss: 0.38620659708976746, mean loss: 0.3420348640279097
Epoch: 49, step: 499, loss: 0.3009026348590851, mean loss: 0.3420342867820754
Epoch: 49, step: 500, loss: 0.3154393434524536, mean loss: 0.3420339135563807
Epoch: 49, step: 501, loss: 0.3444870710372925, mean loss: 0.3420339479827957
Epoch: 49, step: 502, loss: 0.3602203130722046, mean loss: 0.3420342031977873
Epoch: 49, step: 503, loss: 0.35765475034713745, mean loss: 0.34203442240277115
Epoch: 49, step: 504, loss: 0.3308393955230713, mean loss: 0.34203426530384073
Epoch: 49, step: 505, loss: 0.3002372086048126, mean loss: 0.342033678777267
Epoch: 49, step: 506, loss: 0.30350592732429504, mean loss: 0.3420331381355391
Epoch: 49, step: 507, loss: 0.3378986716270447, mean loss: 0.34203308011933864
Epoch: 49, step: 508, loss: 0.3935607671737671, mean loss: 0.34203380316272675
Epoch: 49, step: 509, loss: 0.3272278308868408, mean loss: 0.34203359540626116
Epoch: 49, step: 510, loss: 0.3116282522678375, mean loss: 0.34203316876639783
Epoch: 49, step: 511, loss: 0.34034252166748047, mean loss: 0.3420331450440105
Epoch: 49, step: 512, loss: 0.388882040977478, mean loss: 0.3420338023970803
Epoch: 49, step: 513, loss: 0.32382670044898987, mean loss: 0.34203354693051724
Epoch: 49, step: 514, loss: 0.3080384433269501, mean loss: 0.3420330699468408
Epoch: 49, step: 515, loss: 0.34298789501190186, mean loss: 0.34203308334375776
Epoch: 49, step: 516, loss: 0.36037957668304443, mean loss: 0.3420333407553069
Epoch: 49, step: 517, loss: 0.35163986682891846, mean loss: 0.3420334755383424
Epoch: 49, step: 518, loss: 0.35522276163101196, mean loss: 0.3420336605862006
Epoch: 49, step: 519, loss: 0.38981616497039795, mean loss: 0.3420343309732086
Epoch: 49, step: 520, loss: 0.3099767863750458, mean loss: 0.3420338812131935
Epoch: 49, step: 521, loss: 0.3371190130710602, mean loss: 0.34203381225968554
Epoch: 49, step: 522, loss: 0.3451533615589142, mean loss: 0.34203385602502034
Epoch: 49, step: 523, loss: 0.3566420078277588, mean loss: 0.3420340609654216
Epoch: 49, step: 524, loss: 0.29397279024124146, mean loss: 0.34203338671462935
Epoch: 49, step: 525, loss: 0.3160582482814789, mean loss: 0.34203302231494315
Epoch: 49, step: 526, loss: 0.32942789793014526, mean loss: 0.34203284548281787
Epoch: 49, step: 527, loss: 0.3725915253162384, mean loss: 0.34203327417200247
Epoch: 49, step: 528, loss: 0.3237970769405365, mean loss: 0.3420330183510411
Epoch: 49, step: 529, loss: 0.3340787887573242, mean loss: 0.34203290676910925
Epoch: 49, step: 530, loss: 0.3358532190322876, mean loss: 0.3420328200816664
Epoch: 49, step: 531, loss: 0.32098230719566345, mean loss: 0.3420325247933586
Epoch: 49, step: 532, loss: 0.31010350584983826, mean loss: 0.3420320769119331
Epoch: 49, step: 533, loss: 0.35145917534828186, mean loss: 0.3420322091478489
Epoch: 49, step: 534, loss: 0.33078399300575256, mean loss: 0.3420320513689407
Epoch: 49, step: 535, loss: 0.33601871132850647, mean loss: 0.3420319670209067
Epoch: 49, step: 536, loss: 0.3269194960594177, mean loss: 0.34203175504398103
Epoch: 49, step: 537, loss: 0.3697616755962372, mean loss: 0.34203214399565374
Epoch: 49, step: 538, loss: 0.3529365658760071, mean loss: 0.3420322969435727
Epoch: 49, step: 539, loss: 0.3246658146381378, mean loss: 0.34203205336073067
Epoch: 49, step: 540, loss: 0.33842843770980835, mean loss: 0.34203200281701
Epoch: 49, step: 541, loss: 0.3344199061393738, mean loss: 0.342031896052491
Epoch: 49, step: 542, loss: 0.3393665552139282, mean loss: 0.34203185866990726
Epoch: 49, step: 543, loss: 0.3285731375217438, mean loss: 0.34203166990803985
Epoch: 49, step: 544, loss: 0.3346467614173889, mean loss: 0.34203156633433834
Epoch: 49, step: 545, loss: 0.34833088517189026, mean loss: 0.342031654681353
Epoch: 49, step: 546, loss: 0.32926079630851746, mean loss: 0.34203147557446584
Epoch: 49, step: 547, loss: 0.33605989813804626, mean loss: 0.34203139182632497
Epoch: 49, step: 548, loss: 0.32785820960998535, mean loss: 0.3420311930579046
Epoch: 49, step: 549, loss: 0.34531834721565247, mean loss: 0.34203123915716915
Epoch: 49, step: 550, loss: 0.33392956852912903, mean loss: 0.3420311255404046
Epoch: 49, step: 551, loss: 0.3301190137863159, mean loss: 0.342030958488857
Epoch: 49, step: 552, loss: 0.2789415121078491, mean loss: 0.34203007375556416
Epoch: 49, step: 553, loss: 0.3168495297431946, mean loss: 0.3420297206417791
Epoch: 49, step: 554, loss: 0.36728692054748535, mean loss: 0.3420300748255643
Epoch: 49, step: 555, loss: 0.33577677607536316, mean loss: 0.34202998713627286
Epoch: 49, step: 556, loss: 0.3174249529838562, mean loss: 0.3420296421075382
Epoch: 49, step: 557, loss: 0.31328245997428894, mean loss: 0.3420292390004045
Epoch: 49, step: 558, loss: 0.3491910398006439, mean loss: 0.3420293394252913
Epoch: 49, step: 559, loss: 0.3128524720668793, mean loss: 0.3420289303043737
Epoch: 49, step: 560, loss: 0.3498240113258362, mean loss: 0.34202903960623754
Epoch: 49, step: 561, loss: 0.34694164991378784, mean loss: 0.342029108489413
Epoch: 49, step: 562, loss: 0.29406651854515076, mean loss: 0.34202843598152666
Epoch: 49, step: 563, loss: 0.315043181180954, mean loss: 0.34202805761283905
Epoch: 49, step: 564, loss: 0.33241143822669983, mean loss: 0.34202792277710503
Epoch: 49, step: 565, loss: 0.31262168288230896, mean loss: 0.3420275104745912
Epoch: 49, step: 566, loss: 0.3496517837047577, mean loss: 0.3420276173724114
Epoch: 49, step: 567, loss: 0.34365755319595337, mean loss: 0.34202764022496907
Epoch: 49, step: 568, loss: 0.28987208008766174, mean loss: 0.34202690898683186
Epoch: 49, step: 569, loss: 0.3575187921524048, mean loss: 0.3420271261850929
Epoch: 49, step: 570, loss: 0.30733221769332886, mean loss: 0.34202663976468417
Epoch: 49, step: 571, loss: 0.32435014843940735, mean loss: 0.34202639194487533
Epoch: 49, step: 572, loss: 0.30777332186698914, mean loss: 0.34202591173247815
Epoch: 49, step: 573, loss: 0.3388593792915344, mean loss: 0.34202586733976204
Epoch: 49, step: 574, loss: 0.3255690932273865, mean loss: 0.34202563662977464
Epoch: 49, step: 575, loss: 0.3318629264831543, mean loss: 0.3420254941592124
Epoch: 49, step: 576, loss: 0.3139808773994446, mean loss: 0.34202510100854217
Epoch: 49, step: 577, loss: 0.3247115910053253, mean loss: 0.34202485829805346
Epoch: 49, step: 578, loss: 0.30515289306640625, mean loss: 0.34202434141342136
Epoch: 49, step: 579, loss: 0.3326112926006317, mean loss: 0.342024209459726
Epoch: 49, step: 580, loss: 0.3208039402961731, mean loss: 0.3420239119946074
Epoch: 49, step: 581, loss: 0.3466780483722687, mean loss: 0.3420239772352418
Epoch: 49, step: 582, loss: 0.34720781445503235, mean loss: 0.3420240499000846
Epoch: 49, step: 583, loss: 0.3354368507862091, mean loss: 0.34202395756480125
Epoch: 49, step: 584, loss: 0.3141343593597412, mean loss: 0.3420235666311417
Epoch: 49, step: 585, loss: 0.33523282408714294, mean loss: 0.3420234714453809
Epoch: 49, step: 586, loss: 0.3378092050552368, mean loss: 0.342023412374885
Epoch: 49, step: 587, loss: 0.2914174497127533, mean loss: 0.3420227030515689
Epoch: 49, step: 588, loss: 0.334958016872406, mean loss: 0.34202260403010726
Epoch: 49, step: 589, loss: 0.32287129759788513, mean loss: 0.34202233560151374
Epoch: 49, step: 590, loss: 0.308112770318985, mean loss: 0.34202186032483384
Epoch: 49, step: 591, loss: 0.3089810311794281, mean loss: 0.3420213972308558
Epoch: 49, step: 592, loss: 0.35968804359436035, mean loss: 0.3420216448397412
Epoch: 49, step: 593, loss: 0.3265739679336548, mean loss: 0.3420214283341083
Epoch: 49, step: 594, loss: 0.3074387311935425, mean loss: 0.34202094364998137
Epoch: 49, step: 595, loss: 0.3384007215499878, mean loss: 0.3420208929124814
Epoch: 49, step: 596, loss: 0.3139025866985321, mean loss: 0.34202049883926494
Epoch: 49, step: 597, loss: 0.3472015857696533, mean loss: 0.34202057145028786
Epoch: 49, step: 598, loss: 0.33094704151153564, mean loss: 0.34202041626102375
Epoch: 49, step: 599, loss: 0.3670310080051422, mean loss: 0.34202076676542065
Epoch: 49, step: 600, loss: 0.3298289179801941, mean loss: 0.34202059590833883
Epoch: 49, step: 601, loss: 0.3368009626865387, mean loss: 0.34202052276120437
Epoch: 49, step: 602, loss: 0.2984788715839386, mean loss: 0.34201991258377507
Epoch: 49, step: 603, loss: 0.3265497386455536, mean loss: 0.342019695793221
Epoch: 49, step: 604, loss: 0.3016243278980255, mean loss: 0.34201912972256765
Epoch: 49, step: 605, loss: 0.3284081518650055, mean loss: 0.3420189389911159
Epoch: 49, step: 606, loss: 0.3249804973602295, mean loss: 0.3420187002337538
Epoch: 49, step: 607, loss: 0.3635823726654053, mean loss: 0.3420190023983246
Epoch: 49, step: 608, loss: 0.3465439975261688, mean loss: 0.34201906580468805
Epoch: 49, step: 609, loss: 0.2988446056842804, mean loss: 0.34201846083229054
Epoch: 49, step: 610, loss: 0.30109235644340515, mean loss: 0.34201788737250677
Epoch: 49, step: 611, loss: 0.33262255787849426, mean loss: 0.3420177557262578
Epoch: 49, step: 612, loss: 0.3038589060306549, mean loss: 0.34201722105644744
Epoch: 49, step: 613, loss: 0.38619327545166016, mean loss: 0.3420178400287663
Epoch: 49, step: 614, loss: 0.41924285888671875, mean loss: 0.3420189220511403
Epoch: 49, step: 615, loss: 0.3189646005630493, mean loss: 0.3420185990348106
Epoch: 49, step: 616, loss: 0.2901932895183563, mean loss: 0.3420178729155566
Epoch: 49, step: 617, loss: 0.33342114090919495, mean loss: 0.34201775246928756
Epoch: 49, step: 618, loss: 0.3178545832633972, mean loss: 0.342017413931015
Epoch: 49, step: 619, loss: 0.3212452232837677, mean loss: 0.3420171229061516
Epoch: 49, step: 620, loss: 0.30033600330352783, mean loss: 0.34201653894886
Epoch: 49, step: 621, loss: 0.357779860496521, mean loss: 0.3420167597917184
Epoch: 49, step: 622, loss: 0.34359413385391235, mean loss: 0.3420167818902917
Epoch: 49, step: 623, loss: 0.35678526759147644, mean loss: 0.3420169887897832
Epoch: 49, step: 624, loss: 0.2988728880882263, mean loss: 0.3420163843698297
Epoch: 49, step: 625, loss: 0.34821152687072754, mean loss: 0.34201647115841083
Epoch: 49, step: 626, loss: 0.40935003757476807, mean loss: 0.34201741443014805
Epoch: 49, step: 627, loss: 0.31321465969085693, mean loss: 0.34201701093980375
Epoch: 49, step: 628, loss: 0.3379858732223511, mean loss: 0.34201695446942876
Epoch: 49, step: 629, loss: 0.33608007431030273, mean loss: 0.34201687130353964
Epoch: 49, step: 630, loss: 0.33487188816070557, mean loss: 0.34201677121552443
Epoch: 49, step: 631, loss: 0.3260464668273926, mean loss: 0.34201654750419497
Epoch: 49, step: 632, loss: 0.3450150191783905, mean loss: 0.34201658950606745
Epoch: 49, step: 633, loss: 0.33579716086387634, mean loss: 0.3420165023870222
Epoch: 49, step: 634, loss: 0.3302854001522064, mean loss: 0.3420163380651576
Epoch: 49, step: 635, loss: 0.31534603238105774, mean loss: 0.3420159644896073
Epoch: 49, step: 636, loss: 0.3531217873096466, mean loss: 0.34201612004859516
Epoch: 49, step: 637, loss: 0.34975841641426086, mean loss: 0.3420162284932315
Epoch: 49, step: 638, loss: 0.32688871026039124, mean loss: 0.34201601660839037
Epoch: 49, step: 639, loss: 0.347838431596756, mean loss: 0.34201609815938744
Epoch: 49, step: 640, loss: 0.3069867491722107, mean loss: 0.3420156075316442
Epoch: 49, step: 641, loss: 0.37106937170028687, mean loss: 0.3420160144585072
Epoch: 49, step: 642, loss: 0.314350426197052, mean loss: 0.3420156269798554
Epoch: 49, step: 643, loss: 0.3302198648452759, mean loss: 0.34201546177310277
Epoch: 49, step: 644, loss: 0.32601916790008545, mean loss: 0.34201523773851117
Epoch: 49, step: 645, loss: 0.3182717561721802, mean loss: 0.34201490520606714
Epoch: 49, step: 646, loss: 0.3815121352672577, mean loss: 0.342015458365319
Epoch: 49, step: 647, loss: 0.35227298736572266, mean loss: 0.34201560202014225
Epoch: 49, step: 648, loss: 0.3400261402130127, mean loss: 0.3420155741584826
Epoch: 49, step: 649, loss: 0.35389864444732666, mean loss: 0.342015740574054
Epoch: 49, step: 650, loss: 0.31401872634887695, mean loss: 0.3420153484974477
Epoch: 49, step: 651, loss: 0.31312376260757446, mean loss: 0.3420149438987208
Epoch: 49, step: 652, loss: 0.36540091037750244, mean loss: 0.3420152713919846
Epoch: 49, step: 653, loss: 0.34369227290153503, mean loss: 0.34201529487611165
Epoch: 49, step: 654, loss: 0.33000656962394714, mean loss: 0.3420151267125899
Epoch: 49, step: 655, loss: 0.33908799290657043, mean loss: 0.34201508572320705
Epoch: 49, step: 656, loss: 0.34419333934783936, mean loss: 0.34201511622540726
Epoch: 49, step: 657, loss: 0.3358459770679474, mean loss: 0.3420150298398364
Epoch: 49, step: 658, loss: 0.31737905740737915, mean loss: 0.3420146848706782
Epoch: 49, step: 659, loss: 0.31843331456184387, mean loss: 0.34201435467337915
Epoch: 49, step: 660, loss: 0.29739394783973694, mean loss: 0.342013729886468
Epoch: 49, step: 661, loss: 0.34083032608032227, mean loss: 0.3420137133163623
Epoch: 49, step: 662, loss: 0.36068156361579895, mean loss: 0.3420139747012921
Epoch: 49, step: 663, loss: 0.3321506083011627, mean loss: 0.34201383659759005
Epoch: 49, step: 664, loss: 0.31916821002960205, mean loss: 0.3420135167249116
Epoch: 49, step: 665, loss: 0.3159922957420349, mean loss: 0.3420131523942994
Epoch: 49, step: 666, loss: 0.29216092824935913, mean loss: 0.3420124544087185
Epoch: 49, step: 667, loss: 0.3457713723182678, mean loss: 0.3420125070369375
Epoch: 49, step: 668, loss: 0.3624267280101776, mean loss: 0.34201279285032177
Epoch: 49, step: 669, loss: 0.3313104510307312, mean loss: 0.3420126430121421
Epoch: 49, step: 670, loss: 0.31010907888412476, mean loss: 0.3420121963524178
Epoch: 49, step: 671, loss: 0.38322773575782776, mean loss: 0.3420127733745857
Epoch: 49, step: 672, loss: 0.29843807220458984, mean loss: 0.34201216333242956
Epoch: 49, step: 673, loss: 0.3130747377872467, mean loss: 0.34201175821657426
Epoch: 49, step: 674, loss: 0.31916892528533936, mean loss: 0.34201143842778603
Epoch: 49, step: 675, loss: 0.3259575664997101, mean loss: 0.3420112136843667
Epoch: 49, step: 676, loss: 0.343776673078537, mean loss: 0.3420112383992659
Epoch: 49, step: 677, loss: 0.3035958409309387, mean loss: 0.34201070062457223
Epoch: 49, step: 678, loss: 0.3150770664215088, mean loss: 0.34201032358762673
Epoch: 49, step: 679, loss: 0.32886138558387756, mean loss: 0.34201013952163756
Epoch: 49, step: 680, loss: 0.3391498029232025, mean loss: 0.3420100994816499
Epoch: 49, step: 681, loss: 0.322573184967041, mean loss: 0.34200982740076136
Epoch: 49, step: 682, loss: 0.317987322807312, mean loss: 0.3420094911347919
Epoch: 49, step: 683, loss: 0.35176393389701843, mean loss: 0.3420096276751441
Epoch: 49, step: 684, loss: 0.3237326741218567, mean loss: 0.3420093718423093
Epoch: 49, step: 685, loss: 0.3616155982017517, mean loss: 0.34200964627788444
Epoch: 49, step: 686, loss: 0.36650756001472473, mean loss: 0.34200998917941067
Epoch: 49, step: 687, loss: 0.3056408762931824, mean loss: 0.3420094801217867
Epoch: 49, step: 688, loss: 0.33455199003219604, mean loss: 0.34200937574093304
Epoch: 49, step: 689, loss: 0.3001548945903778, mean loss: 0.342008789921137
Epoch: 49, step: 690, loss: 0.3279348909854889, mean loss: 0.3420085929373737
Epoch: 49, step: 691, loss: 0.3235883414745331, mean loss: 0.34200833512397844
Epoch: 49, step: 692, loss: 0.32337281107902527, mean loss: 0.3420080743012371
Epoch: 49, step: 693, loss: 0.33025825023651123, mean loss: 0.34200790985303464
Epoch: 49, step: 694, loss: 0.32416483759880066, mean loss: 0.3420076601284366
Epoch: 49, step: 695, loss: 0.33823665976524353, mean loss: 0.34200760735174224
Epoch: 49, step: 696, loss: 0.32482925057411194, mean loss: 0.3420073669369692
Epoch: 49, step: 697, loss: 0.3072512745857239, mean loss: 0.342006880524839
Epoch: 49, step: 698, loss: 0.32075199484825134, mean loss: 0.3420065830664991
Epoch: 49, step: 699, loss: 0.31052452325820923, mean loss: 0.3420061424868444
Epoch: 49, step: 700, loss: 0.32678765058517456, mean loss: 0.34200592951272146
Epoch: 49, step: 701, loss: 0.35100409388542175, mean loss: 0.3420060554351426
Epoch: 49, step: 702, loss: 0.3395291268825531, mean loss: 0.342006020772909
Epoch: 49, step: 703, loss: 0.302163690328598, mean loss: 0.3420054632256036
Epoch: 49, step: 704, loss: 0.2903602719306946, mean loss: 0.34200474052103336
Epoch: 49, step: 705, loss: 0.30789902806282043, mean loss: 0.342004263264415
Epoch: 49, step: 706, loss: 0.32714003324508667, mean loss: 0.34200405526545025
Epoch: 49, step: 707, loss: 0.37012290954589844, mean loss: 0.3420044487342496
Epoch: 49, step: 708, loss: 0.3132738769054413, mean loss: 0.3420040467112757
Epoch: 49, step: 709, loss: 0.34519529342651367, mean loss: 0.342004091365331
Epoch: 49, step: 710, loss: 0.3342031240463257, mean loss: 0.3420039822105138
Epoch: 49, step: 711, loss: 0.31965646147727966, mean loss: 0.3420036695178299
Epoch: 49, step: 712, loss: 0.2863420248031616, mean loss: 0.3420028906956173
Epoch: 49, step: 713, loss: 0.32666000723838806, mean loss: 0.34200267601976087
Epoch: 49, step: 714, loss: 0.3356921672821045, mean loss: 0.34200258772508557
Epoch: 49, step: 715, loss: 0.32773447036743164, mean loss: 0.34200238809281897
Epoch: 49, step: 716, loss: 0.3095160722732544, mean loss: 0.3420019335671125
Epoch: 49, step: 717, loss: 0.28845474123954773, mean loss: 0.34200118438290106
Epoch: 49, step: 718, loss: 0.3357570767402649, mean loss: 0.3420010970221785
Epoch: 49, step: 719, loss: 0.30698683857917786, mean loss: 0.34200060714783687
Epoch: 49, step: 720, loss: 0.335785835981369, mean loss: 0.34200052019999116
Epoch: 49, step: 721, loss: 0.28467097878456116, mean loss: 0.34199971814143587
Epoch: 49, step: 722, loss: 0.36148062348365784, mean loss: 0.34199999068169723
Epoch: 49, step: 723, loss: 0.3167581558227539, mean loss: 0.34199963755026386
Epoch: 49, step: 724, loss: 0.36839860677719116, mean loss: 0.3420000068647562
Epoch: 49, step: 725, loss: 0.32290318608283997, mean loss: 0.34199973970909764
Epoch: 49, step: 726, loss: 0.3629515469074249, mean loss: 0.34200003281105473
Epoch: 49, step: 727, loss: 0.3131330609321594, mean loss: 0.341999628986816
Epoch: 49, step: 728, loss: 0.3181748390197754, mean loss: 0.34199929570305065
Epoch: 49, step: 729, loss: 0.37470436096191406, mean loss: 0.3419997532061318
Epoch: 49, step: 730, loss: 0.35651230812072754, mean loss: 0.3419999562158387
Epoch: 49, step: 731, loss: 0.34018540382385254, mean loss: 0.3419999308332235
Epoch: 49, step: 732, loss: 0.31264394521713257, mean loss: 0.3419995201968233
Epoch: 49, step: 733, loss: 0.307329386472702, mean loss: 0.34199903523202085
Epoch: 49, step: 734, loss: 0.3520823121070862, mean loss: 0.3419991762746259
Epoch: 49, step: 735, loss: 0.3474165201187134, mean loss: 0.341999252050151
Epoch: 49, step: 736, loss: 0.3033473789691925, mean loss: 0.3419987114115839
Epoch: 49, step: 737, loss: 0.3025365471839905, mean loss: 0.3419981594468844
Epoch: 49, step: 738, loss: 0.32774704694747925, mean loss: 0.3419979601166865
Epoch: 49, step: 739, loss: 0.31750351190567017, mean loss: 0.34199761751782487
Epoch: 49, step: 740, loss: 0.34618839621543884, mean loss: 0.3419976761325737
Epoch: 49, step: 741, loss: 0.32302847504615784, mean loss: 0.3419974108216407
Epoch: 49, step: 742, loss: 0.3084578216075897, mean loss: 0.3419969417299161
Epoch: 49, step: 743, loss: 0.3134942948818207, mean loss: 0.3419965430914987
Epoch: 49, step: 744, loss: 0.3384615480899811, mean loss: 0.3419964936517006
Epoch: 49, step: 745, loss: 0.3360757827758789, mean loss: 0.3419964108468717
Epoch: 49, step: 746, loss: 0.29930996894836426, mean loss: 0.3419958138587468
Epoch: 49, step: 747, loss: 0.3434929847717285, mean loss: 0.3419958347970287
Epoch: 49, step: 748, loss: 0.32654181122779846, mean loss: 0.3419956186719526
Epoch: 49, step: 749, loss: 0.36226966977119446, mean loss: 0.34199590220132214
Epoch: 49, step: 750, loss: 0.31701305508613586, mean loss: 0.34199555282507765
Epoch: 49, step: 751, loss: 0.31562936305999756, mean loss: 0.3419951841084338
Epoch: 49, step: 752, loss: 0.3113267123699188, mean loss: 0.34199475523274353
Epoch: 49, step: 753, loss: 0.33358457684516907, mean loss: 0.3419946376243197
Epoch: 49, step: 754, loss: 0.3846622705459595, mean loss: 0.3419952342826369
Epoch: 49, step: 755, loss: 0.34588372707366943, mean loss: 0.34199528865802553
Epoch: 49, step: 756, loss: 0.3017612099647522, mean loss: 0.34199472604593134
Epoch: 49, step: 757, loss: 0.3025211989879608, mean loss: 0.34199417407670774
Epoch: 49, step: 758, loss: 0.31054675579071045, mean loss: 0.3419937343449272
Epoch: 49, step: 759, loss: 0.3489114046096802, mean loss: 0.3419938310739146
Epoch: 49, step: 760, loss: 0.3116159439086914, mean loss: 0.3419934063093528
Epoch: 49, step: 761, loss: 0.3307039737701416, mean loss: 0.341993248454931
Epoch: 49, step: 762, loss: 0.31025323271751404, mean loss: 0.3419928046565594
Epoch: 49, step: 763, loss: 0.32206639647483826, mean loss: 0.34199252604346964
Epoch: 49, step: 764, loss: 0.31071212887763977, mean loss: 0.34199208868385267
Epoch: 49, step: 765, loss: 0.3072962760925293, mean loss: 0.34199160357699615
Epoch: 49, step: 766, loss: 0.3059340715408325, mean loss: 0.34199109943801936
Epoch: 49, step: 767, loss: 0.3171534240245819, mean loss: 0.34199075217450764
Epoch: 49, step: 768, loss: 0.32070431113243103, mean loss: 0.3419904545661044
Epoch: 49, step: 769, loss: 0.3564278781414032, mean loss: 0.34199065641471293
Epoch: 49, step: 770, loss: 0.32776007056236267, mean loss: 0.3419904574606697
Epoch: 49, step: 771, loss: 0.31689029932022095, mean loss: 0.34199010654692763
Epoch: 49, step: 772, loss: 0.3137684166431427, mean loss: 0.34198971199800476
Epoch: 49, step: 773, loss: 0.32304808497428894, mean loss: 0.341989447191252
Epoch: 49, step: 774, loss: 0.3169856071472168, mean loss: 0.3419890976387497
Epoch: 49, step: 775, loss: 0.3405889868736267, mean loss: 0.34198907806554096
Epoch: 49, step: 776, loss: 0.35266149044036865, mean loss: 0.3419892272611902
Epoch: 49, step: 777, loss: 0.3608737885951996, mean loss: 0.3419894912553934
Epoch: 49, step: 778, loss: 0.35459184646606445, mean loss: 0.34198966742587233
Epoch: 49, step: 779, loss: 0.33178120851516724, mean loss: 0.3419895247220741
Epoch: 49, step: 780, loss: 0.3621768057346344, mean loss: 0.34198980691563846
Epoch: 49, step: 781, loss: 0.34508970379829407, mean loss: 0.3419898502478099
Epoch: 49, step: 782, loss: 0.3700822591781616, mean loss: 0.3419902429344414
Epoch: 49, step: 783, loss: 0.3249902129173279, mean loss: 0.3419900053047235
Epoch: 49, step: 784, loss: 0.3026004433631897, mean loss: 0.34198945471748066
Epoch: 49, step: 785, loss: 0.30985185503959656, mean loss: 0.3419890055044355
Epoch: 49, step: 786, loss: 0.336518257856369, mean loss: 0.3419889290364701
Epoch: 49, step: 787, loss: 0.3352809548377991, mean loss: 0.34198883527634766
Epoch: 49, step: 788, loss: 0.35155656933784485, mean loss: 0.34198896900664416
Epoch: 49, step: 789, loss: 0.2983858585357666, mean loss: 0.3419883595650196
Epoch: 49, step: 790, loss: 0.33056938648223877, mean loss: 0.3419881999640149
Epoch: 49, step: 791, loss: 0.30127719044685364, mean loss: 0.3419876309612543
Epoch: 49, step: 792, loss: 0.3857116103172302, mean loss: 0.3419882420666416
Epoch: 49, step: 793, loss: 0.3487551808357239, mean loss: 0.34198833664300454
Epoch: 49, step: 794, loss: 0.3717789649963379, mean loss: 0.3419887529981687
Epoch: 49, step: 795, loss: 0.34406065940856934, mean loss: 0.34198878195482135
Epoch: 49, step: 796, loss: 0.33308401703834534, mean loss: 0.34198865750490426
Epoch: 49, step: 797, loss: 0.34072145819664, mean loss: 0.34198863979521216
Epoch: 49, step: 798, loss: 0.3273414671421051, mean loss: 0.34198843509711063
Epoch: 49, step: 799, loss: 0.3452889919281006, mean loss: 0.3419884812226184
Epoch: 49, step: 800, loss: 0.3354758620262146, mean loss: 0.34198839020959104
Epoch: 49, step: 801, loss: 0.3132735788822174, mean loss: 0.3419879889293522
Epoch: 49, step: 802, loss: 0.30621805787086487, mean loss: 0.34198748906307325
Epoch: 49, step: 803, loss: 0.359952837228775, mean loss: 0.3419877401160102
Epoch: 49, step: 804, loss: 0.30687421560287476, mean loss: 0.34198724943638703
Epoch: 49, step: 805, loss: 0.31967535614967346, mean loss: 0.3419869376522937
Epoch: 49, step: 806, loss: 0.3181687891483307, mean loss: 0.34198660482459636
Epoch: 49, step: 807, loss: 0.3542620837688446, mean loss: 0.3419867763560779
Epoch: 49, step: 808, loss: 0.3656653165817261, mean loss: 0.3419871072236839
Epoch: 49, step: 809, loss: 0.3233433961868286, mean loss: 0.34198684671295204
Epoch: 49, step: 810, loss: 0.3202875554561615, mean loss: 0.34198654351048086
Epoch: 49, step: 811, loss: 0.31460949778556824, mean loss: 0.34198616097854306
Epoch: 49, step: 812, loss: 0.3474363088607788, mean loss: 0.3419862371308979
Epoch: 49, step: 813, loss: 0.35927334427833557, mean loss: 0.34198647867214627
Epoch: 49, step: 814, loss: 0.3452688455581665, mean loss: 0.3419865245338345
Epoch: 49, step: 815, loss: 0.3171362578868866, mean loss: 0.3419861773272922
Epoch: 49, step: 816, loss: 0.3285180628299713, mean loss: 0.3419859891541753
Epoch: 49, step: 817, loss: 0.3560258746147156, mean loss: 0.34198618531319197
Epoch: 49, step: 818, loss: 0.3132546544075012, mean loss: 0.3419857838946673
Epoch: 49, step: 819, loss: 0.30627498030662537, mean loss: 0.341985284973191
Epoch: 49, step: 820, loss: 0.3227962851524353, mean loss: 0.34198501688428223
Epoch: 49, step: 821, loss: 0.3413108289241791, mean loss: 0.3419850074653552
Epoch: 49, step: 822, loss: 0.3244943916797638, mean loss: 0.34198476311134374
Epoch: 49, step: 823, loss: 0.3361292779445648, mean loss: 0.34198468130797455
Epoch: 49, step: 824, loss: 0.3086925446987152, mean loss: 0.34198421621057984
Epoch: 49, step: 825, loss: 0.3316473364830017, mean loss: 0.341984071804448
Epoch: 49, step: 826, loss: 0.3072147071361542, mean loss: 0.3419835860834714
Epoch: 49, step: 827, loss: 0.3162398636341095, mean loss: 0.34198322645391105
Epoch: 49, step: 828, loss: 0.347649484872818, mean loss: 0.3419833056081811
Epoch: 49, step: 829, loss: 0.30900341272354126, mean loss: 0.34198284490507036
Epoch: 49, step: 830, loss: 0.325300395488739, mean loss: 0.3419826118676555
Epoch: 49, step: 831, loss: 0.31349390745162964, mean loss: 0.34198221391402617
Epoch: 49, step: 832, loss: 0.31270623207092285, mean loss: 0.3419818049687714
Epoch: 49, step: 833, loss: 0.315149188041687, mean loss: 0.341981430159204
Epoch: 49, step: 834, loss: 0.36727508902549744, mean loss: 0.3419817834670062
Epoch: 49, step: 835, loss: 0.31040793657302856, mean loss: 0.3419813424422144
Epoch: 49, step: 836, loss: 0.3338843584060669, mean loss: 0.34198122934478814
Epoch: 49, step: 837, loss: 0.30221158266067505, mean loss: 0.34198067385624603
Epoch: 49, step: 838, loss: 0.31745055317878723, mean loss: 0.34198033123286903
Epoch: 49, step: 839, loss: 0.38560453057289124, mean loss: 0.3419809405434358
Epoch: 49, step: 840, loss: 0.3154204189777374, mean loss: 0.3419805695708872
Epoch: 49, step: 841, loss: 0.384922057390213, mean loss: 0.3419811693290902
Epoch: 49, step: 842, loss: 0.315615177154541, mean loss: 0.3419808010838329
Epoch: 49, step: 843, loss: 0.3462567627429962, mean loss: 0.3419808608039678
Epoch: 49, step: 844, loss: 0.3251708745956421, mean loss: 0.34198062603090307
Epoch: 49, step: 845, loss: 0.30896419286727905, mean loss: 0.34198016492041505
Epoch: 49, step: 846, loss: 0.37989941239356995, mean loss: 0.3419806944966545
Epoch: 49, step: 847, loss: 0.32773447036743164, mean loss: 0.3419804955381588
Epoch: 49, step: 848, loss: 0.30928558111190796, mean loss: 0.3419800389371613
Epoch: 49, step: 849, loss: 0.31551095843315125, mean loss: 0.34197966928824214
Epoch: 49, step: 850, loss: 0.30553632974624634, mean loss: 0.3419791603528093
Epoch: 49, step: 851, loss: 0.3367060720920563, mean loss: 0.34197908671455296
Epoch: 49, step: 852, loss: 0.3322170078754425, mean loss: 0.3419789503898055
Epoch: 49, step: 853, loss: 0.3407588601112366, mean loss: 0.3419789333518181
Epoch: 49, step: 854, loss: 0.3713822662830353, mean loss: 0.3419793439498119
Epoch: 49, step: 855, loss: 0.2982468605041504, mean loss: 0.34197873326328665
Epoch: 49, step: 856, loss: 0.3315926790237427, mean loss: 0.3419785882329955
Epoch: 49, step: 857, loss: 0.3073182702064514, mean loss: 0.341978104244976
Epoch: 49, step: 858, loss: 0.3101942539215088, mean loss: 0.34197766042943
Epoch: 49, step: 859, loss: 0.36876076459884644, mean loss: 0.3419780344115593
Epoch: 49, step: 860, loss: 0.3468327522277832, mean loss: 0.341978102198786
Epoch: 49, step: 861, loss: 0.39246052503585815, mean loss: 0.3419788070833518
Epoch: 49, step: 862, loss: 0.29379796981811523, mean loss: 0.3419781343451502
Epoch: 49, step: 863, loss: 0.3194289803504944, mean loss: 0.34197781950077716
Epoch: 49, step: 864, loss: 0.31955406069755554, mean loss: 0.3419775064116161
Epoch: 49, step: 865, loss: 0.326595276594162, mean loss: 0.3419772916419948
Epoch: 49, step: 866, loss: 0.32582253217697144, mean loss: 0.34197706608931666
Epoch: 49, step: 867, loss: 0.33452528715133667, mean loss: 0.34197696204906564
Epoch: 49, step: 868, loss: 0.3770480155944824, mean loss: 0.34197745169728266
Epoch: 49, step: 869, loss: 0.3193787932395935, mean loss: 0.3419771361881315
Epoch: 49, step: 870, loss: 0.3561927378177643, mean loss: 0.3419773346552128
Epoch: 49, step: 871, loss: 0.35145461559295654, mean loss: 0.3419774669677294
Epoch: 49, step: 872, loss: 0.36243537068367004, mean loss: 0.34197775257696195
Epoch: 49, step: 873, loss: 0.3249886631965637, mean loss: 0.34197751539855376
Epoch: 49, step: 874, loss: 0.3125385046005249, mean loss: 0.341977104417124
Epoch: 49, step: 875, loss: 0.3130711317062378, mean loss: 0.3419767008827719
Epoch: 49, step: 876, loss: 0.3493146300315857, mean loss: 0.3419768033206029
Epoch: 49, step: 877, loss: 0.33938470482826233, mean loss: 0.34197676713529296
Epoch: 49, step: 878, loss: 0.3407706320285797, mean loss: 0.34197675029806107
Epoch: 49, step: 879, loss: 0.36148181557655334, mean loss: 0.3419770225782732
Epoch: 49, step: 880, loss: 0.3368324637413025, mean loss: 0.34197695076400353
Epoch: 49, step: 881, loss: 0.3018433451652527, mean loss: 0.34197639053611334
Epoch: 49, step: 882, loss: 0.3501250445842743, mean loss: 0.34197650428217413
Epoch: 49, step: 883, loss: 0.33244338631629944, mean loss: 0.3419763712124091
Epoch: 49, step: 884, loss: 0.3160855770111084, mean loss: 0.34197600981608295
Epoch: 49, step: 885, loss: 0.354553759098053, mean loss: 0.341976185379988
Epoch: 49, step: 886, loss: 0.3879057466983795, mean loss: 0.34197682646929634
Epoch: 49, step: 887, loss: 0.32829979062080383, mean loss: 0.3419766355665571
Epoch: 49, step: 888, loss: 0.32524120807647705, mean loss: 0.34197640197834456
Epoch: 49, step: 889, loss: 0.3445623219013214, mean loss: 0.34197643807135636
Epoch: 49, step: 890, loss: 0.31806302070617676, mean loss: 0.3419761043041733
Epoch: 49, step: 891, loss: 0.32023677229881287, mean loss: 0.341975800885627
Epoch: 49, step: 892, loss: 0.354708194732666, mean loss: 0.34197597859074286
Epoch: 49, step: 893, loss: 0.3327891230583191, mean loss: 0.34197585037224276
Epoch: 49, step: 894, loss: 0.34363406896591187, mean loss: 0.3419758735152358
Epoch: 49, step: 895, loss: 0.3022511899471283, mean loss: 0.3419753191038646
Epoch: 49, step: 896, loss: 0.3749832510948181, mean loss: 0.3419757797675073
Epoch: 49, step: 897, loss: 0.33017128705978394, mean loss: 0.3419756150245382
Epoch: 49, step: 898, loss: 0.3480461537837982, mean loss: 0.34197569974352166
Epoch: 49, step: 899, loss: 0.3292398452758789, mean loss: 0.34197552200747067
Epoch: 49, step: 900, loss: 0.32268810272216797, mean loss: 0.34197525284438424
Epoch: 49, step: 901, loss: 0.3190633952617645, mean loss: 0.34197493310537974
Epoch: 49, step: 902, loss: 0.34106072783470154, mean loss: 0.34197492034766236
Epoch: 49, step: 903, loss: 0.3650287091732025, mean loss: 0.34197524205836327
Epoch: 49, step: 904, loss: 0.353456050157547, mean loss: 0.3419754022683534
Epoch: 49, step: 905, loss: 0.33003944158554077, mean loss: 0.34197523570921906
Epoch: 49, step: 906, loss: 0.36586514115333557, mean loss: 0.34197556907379273
Epoch: 49, step: 907, loss: 0.3082408308982849, mean loss: 0.34197509833900014
Epoch: 49, step: 908, loss: 0.3518626093864441, mean loss: 0.3419752363074791
Epoch: 49, step: 909, loss: 0.30684730410575867, mean loss: 0.341974746145726
Epoch: 49, step: 910, loss: 0.33571603894233704, mean loss: 0.341974658815334
Epoch: 49, step: 911, loss: 0.31327202916145325, mean loss: 0.34197425832097594
Epoch: 49, step: 912, loss: 0.3445358872413635, mean loss: 0.3419742940634716
Epoch: 49, step: 913, loss: 0.31647029519081116, mean loss: 0.34197393821027117
Epoch: 49, step: 914, loss: 0.34045612812042236, mean loss: 0.3419739170328062
Epoch: 49, step: 915, loss: 0.3390556871891022, mean loss: 0.34197387631635007
Epoch: 49, step: 916, loss: 0.3080931007862091, mean loss: 0.34197340360311734
Epoch: 49, step: 917, loss: 0.30047357082366943, mean loss: 0.34197282459493056
Epoch: 49, step: 918, loss: 0.35434672236442566, mean loss: 0.3419729972338949
Epoch: 49, step: 919, loss: 0.3003556728363037, mean loss: 0.3419724166026599
Epoch: 49, step: 920, loss: 0.3104374408721924, mean loss: 0.3419719766431788
Epoch: 49, step: 921, loss: 0.3455876410007477, mean loss: 0.3419720270863323
Epoch: 49, step: 922, loss: 0.28977468609809875, mean loss: 0.34197129887666156
Epoch: 49, step: 923, loss: 0.35548675060272217, mean loss: 0.3419714874292805
Epoch: 49, step: 924, loss: 0.31000155210494995, mean loss: 0.3419710414263603
Epoch: 49, step: 925, loss: 0.29503124952316284, mean loss: 0.34197038659262374
Epoch: 49, step: 926, loss: 0.33225128054618835, mean loss: 0.3419702510080912
Epoch: 49, step: 927, loss: 0.353117436170578, mean loss: 0.34197040651259936
Epoch: 49, step: 928, loss: 0.30118098855018616, mean loss: 0.3419698375034906
Epoch: 49, step: 929, loss: 0.33546948432922363, mean loss: 0.34196974682535014
Epoch: 49, step: 930, loss: 0.3660142421722412, mean loss: 0.3419700822347737
Epoch: 49, step: 931, loss: 0.353762149810791, mean loss: 0.3419702467262866
Epoch: 49, step: 932, loss: 0.32752078771591187, mean loss: 0.3419700451687393
Epoch: 49, step: 933, loss: 0.3597998321056366, mean loss: 0.3419702938754897
Epoch: 49, step: 934, loss: 0.3358592689037323, mean loss: 0.3419702086343162
Epoch: 49, step: 935, loss: 0.32606804370880127, mean loss: 0.3419699868220509
Epoch: 49, step: 936, loss: 0.3399280905723572, mean loss: 0.34196995834094046
Epoch: 49, step: 937, loss: 0.3026856482028961, mean loss: 0.3419694103967591
Epoch: 49, step: 938, loss: 0.3052336871623993, mean loss: 0.34196889800784447
Epoch: 49, step: 939, loss: 0.37723833322525024, mean loss: 0.34196938993815046
Epoch: 49, step: 940, loss: 0.3432542681694031, mean loss: 0.3419694078590988
Epoch: 49, step: 941, loss: 0.3450919985771179, mean loss: 0.34196945141109075
Epoch: 49, step: 942, loss: 0.3314577341079712, mean loss: 0.34196930480211013
Epoch: 49, step: 943, loss: 0.32041358947753906, mean loss: 0.3419690041645184
Epoch: 49, step: 944, loss: 0.34132784605026245, mean loss: 0.34196899522241003
Epoch: 49, step: 945, loss: 0.3566427528858185, mean loss: 0.34196919987162017
Epoch: 49, step: 946, loss: 0.3093741834163666, mean loss: 0.34196874528790044
Epoch: 49, step: 947, loss: 0.3156648874282837, mean loss: 0.3419683784484234
Epoch: 49, step: 948, loss: 0.29652246832847595, mean loss: 0.3419677446584489
Epoch: 49, step: 949, loss: 0.32647770643234253, mean loss: 0.3419675286369413
Epoch: 49, step: 950, loss: 0.41676434874534607, mean loss: 0.3419685717264599
Epoch: 49, step: 951, loss: 0.3222993016242981, mean loss: 0.3419682974297273
Epoch: 49, step: 952, loss: 0.3327636420726776, mean loss: 0.3419681690684985
Epoch: 49, step: 953, loss: 0.35096827149391174, mean loss: 0.3419682945754351
Epoch: 49, step: 954, loss: 0.34563639760017395, mean loss: 0.34196834572662566
Epoch: 49, step: 955, loss: 0.3002275824546814, mean loss: 0.34196776366555814
Epoch: 49, step: 956, loss: 0.31475532054901123, mean loss: 0.3419673842023769
Epoch: 49, step: 957, loss: 0.36195191740989685, mean loss: 0.34196766287227687
Epoch: 49, step: 958, loss: 0.3021503984928131, mean loss: 0.34196710765698884
Epoch: 49, step: 959, loss: 0.31244364380836487, mean loss: 0.3419666959850628
Epoch: 49, step: 960, loss: 0.29272571206092834, mean loss: 0.3419660093837838
Epoch: 49, step: 961, loss: 0.4148695468902588, mean loss: 0.34196702591432715
Epoch: 49, step: 962, loss: 0.3251204788684845, mean loss: 0.34196679101775795
Epoch: 49, step: 963, loss: 0.31880563497543335, mean loss: 0.3419664680791628
Epoch: 49, step: 964, loss: 0.3539445102214813, mean loss: 0.34196663508801856
Epoch: 49, step: 965, loss: 0.3687548041343689, mean loss: 0.34196700858804707
Epoch: 49, step: 966, loss: 0.31127169728279114, mean loss: 0.34196658061778223
Epoch: 49, step: 967, loss: 0.2998979687690735, mean loss: 0.3419659940831237
Epoch: 49, step: 968, loss: 0.32010698318481445, mean loss: 0.34196568932173094
Epoch: 49, step: 969, loss: 0.30564382672309875, mean loss: 0.3419651829242935
Epoch: 49, step: 970, loss: 0.34079137444496155, mean loss: 0.34196516655934756
Epoch: 49, step: 971, loss: 0.3410882353782654, mean loss: 0.3419651543335615
Epoch: 49, step: 972, loss: 0.30839914083480835, mean loss: 0.3419646863775953
Epoch: 49, step: 973, loss: 0.37113919854164124, mean loss: 0.34196509310437856
Epoch: 49, step: 974, loss: 0.3368794620037079, mean loss: 0.34196502220572805
Epoch: 49, step: 975, loss: 0.3257022202014923, mean loss: 0.34196479548959013
Epoch: 49, step: 976, loss: 0.3012572228908539, mean loss: 0.341964228002205
Epoch: 49, step: 977, loss: 0.3539607524871826, mean loss: 0.34196439523844563
Epoch: 49, step: 978, loss: 0.3206712603569031, mean loss: 0.34196409840796005
Epoch: 49, step: 979, loss: 0.3013324737548828, mean loss: 0.34196353200302176
Epoch: 49, step: 980, loss: 0.3095943033695221, mean loss: 0.34196308078219245
Epoch: 49, step: 981, loss: 0.3494798541069031, mean loss: 0.34196318556310806
Epoch: 49, step: 982, loss: 0.32140424847602844, mean loss: 0.341962898983464
Epoch: 49, step: 983, loss: 0.36409690976142883, mean loss: 0.34196320751441994
Epoch: 49, step: 984, loss: 0.31902068853378296, mean loss: 0.341962887717944
Epoch: 49, step: 985, loss: 0.3928850293159485, mean loss: 0.34196359751334415
Epoch: 49, step: 986, loss: 0.3076210618019104, mean loss: 0.34196311882503017
Epoch: 49, step: 987, loss: 0.32788076996803284, mean loss: 0.3419629225389455
Epoch: 49, step: 988, loss: 0.3282438814640045, mean loss: 0.3419627313194727
Epoch: 49, step: 989, loss: 0.3710416853427887, mean loss: 0.34196313662365724
Epoch: 49, step: 990, loss: 0.3225914537906647, mean loss: 0.34196286662375713
Epoch: 49, step: 991, loss: 0.30786851048469543, mean loss: 0.3419623914278473
Epoch: 49, step: 992, loss: 0.3468174934387207, mean loss: 0.3419624590957174
Epoch: 49, step: 993, loss: 0.3587619662284851, mean loss: 0.34196269323518963
Epoch: 49, step: 994, loss: 0.31212317943573, mean loss: 0.3419622773592604
Epoch: 49, step: 995, loss: 0.3348333537578583, mean loss: 0.34196217800420964
Epoch: 49, step: 996, loss: 0.38090813159942627, mean loss: 0.34196272078226203
Epoch: 49, step: 997, loss: 0.32320621609687805, mean loss: 0.34196245938213543
Epoch: 49, step: 998, loss: 0.3154207766056061, mean loss: 0.34196208948898826
Epoch: 49, step: 999, loss: 0.33445513248443604, mean loss: 0.3419619848711583
Epoch: 49, step: 1000, loss: 0.3144534230232239, mean loss: 0.3419616015139688
Epoch: 49, step: 1001, loss: 0.30451393127441406, mean loss: 0.3419610796534064
Epoch: 49, step: 1002, loss: 0.3398020267486572, mean loss: 0.34196104956585077
Epoch: 49, step: 1003, loss: 0.3230251967906952, mean loss: 0.34196078568830374
Epoch: 49, step: 1004, loss: 0.31819453835487366, mean loss: 0.34196045450218127
Epoch: 49, step: 1005, loss: 0.35129693150520325, mean loss: 0.34196058460553685
Epoch: 49, step: 1006, loss: 0.39936065673828125, mean loss: 0.34196138446162055
Epoch: 49, step: 1007, loss: 0.3143775761127472, mean loss: 0.34196100009329733
Epoch: 49, step: 1008, loss: 0.3568930923938751, mean loss: 0.3419612081625832
Epoch: 49, step: 1009, loss: 0.2728974521160126, mean loss: 0.3419602458161232
Epoch: 49, step: 1010, loss: 0.4020279347896576, mean loss: 0.341961082798148
Epoch: 49, step: 1011, loss: 0.34582623839378357, mean loss: 0.3419611366544014
Epoch: 49, step: 1012, loss: 0.32270124554634094, mean loss: 0.34196086829492717
Epoch: 49, step: 1013, loss: 0.3270137310028076, mean loss: 0.341960660030509
Epoch: 49, step: 1014, loss: 0.2949763536453247, mean loss: 0.3419600053885731
Epoch: 49, step: 1015, loss: 0.3183497190475464, mean loss: 0.34195967642621533
Epoch: 49, step: 1016, loss: 0.3222469389438629, mean loss: 0.3419594017722719
Epoch: 49, step: 1017, loss: 0.3571508824825287, mean loss: 0.3419596134294278
Epoch: 49, step: 1018, loss: 0.3365707993507385, mean loss: 0.3419595383501651
Epoch: 49, step: 1019, loss: 0.3151155114173889, mean loss: 0.34195916435291074
Epoch: 49, step: 1020, loss: 0.3128643035888672, mean loss: 0.341958759002161
Epoch: 49, step: 1021, loss: 0.32673180103302, mean loss: 0.34195854686253646
Epoch: 49, step: 1022, loss: 0.3492620885372162, mean loss: 0.34195864861293246
Epoch: 49, step: 1023, loss: 0.3769978880882263, mean loss: 0.3419591367605986
Epoch: 49, step: 1024, loss: 0.33534443378448486, mean loss: 0.3419590446094308
Epoch: 49, step: 1025, loss: 0.3167072534561157, mean loss: 0.3419586928249841
Epoch: 49, step: 1026, loss: 0.32076847553253174, mean loss: 0.3419583976267158
Epoch: 49, step: 1027, loss: 0.306323766708374, mean loss: 0.3419579012120424
Epoch: 49, step: 1028, loss: 0.31986740231513977, mean loss: 0.34195759348063753
Epoch: 49, step: 1029, loss: 0.33721381425857544, mean loss: 0.3419575273984039
Epoch: 49, step: 1030, loss: 0.32848507165908813, mean loss: 0.34195733972576486
Epoch: 49, step: 1031, loss: 0.33899372816085815, mean loss: 0.34195729844293815
Epoch: 49, step: 1032, loss: 0.3444567322731018, mean loss: 0.34195733325932826
Epoch: 49, step: 1033, loss: 0.32231995463371277, mean loss: 0.3419570597201358
Epoch: 49, step: 1034, loss: 0.3100043535232544, mean loss: 0.3419566146405827
Epoch: 49, step: 1035, loss: 0.3305804431438446, mean loss: 0.341956456180427
Epoch: 49, step: 1036, loss: 0.3134818971157074, mean loss: 0.34195605956015673
Epoch: 49, step: 1037, loss: 0.31679800152778625, mean loss: 0.3419557091400933
Epoch: 49, step: 1038, loss: 0.3464744985103607, mean loss: 0.34195577208026146
Epoch: 49, step: 1039, loss: 0.32088515162467957, mean loss: 0.3419554786012312
Epoch: 49, step: 1040, loss: 0.3590358793735504, mean loss: 0.3419557164997614
Epoch: 49, step: 1041, loss: 0.3599957525730133, mean loss: 0.34195596776074466
Epoch: 49, step: 1042, loss: 0.40300944447517395, mean loss: 0.3419568180995616
Epoch: 49, step: 1043, loss: 0.3570387065410614, mean loss: 0.34195702815371815
Epoch: 49, step: 1044, loss: 0.3543466627597809, mean loss: 0.3419572007088999
Epoch: 49, step: 1045, loss: 0.3262532651424408, mean loss: 0.3419569819972266
Epoch: 49, step: 1046, loss: 0.33305954933166504, mean loss: 0.3419568580827291
Epoch: 49, step: 1047, loss: 0.3175593614578247, mean loss: 0.34195651830365514
Epoch: 49, step: 1048, loss: 0.33079782128334045, mean loss: 0.34195636290086956
Epoch: 49, step: 1049, loss: 0.35463714599609375, mean loss: 0.34195653949869
Epoch: 49, step: 1050, loss: 0.34315699338912964, mean loss: 0.34195655621647364
Epoch: 49, step: 1051, loss: 0.3136212229728699, mean loss: 0.34195616161791575
Epoch: 49, step: 1052, loss: 0.31966671347618103, mean loss: 0.3419558512188273
Epoch: 49, step: 1053, loss: 0.3369315266609192, mean loss: 0.34195578125190684
Epoch: 49, step: 1054, loss: 0.35688865184783936, mean loss: 0.3419559891987478
Epoch: 49, step: 1055, loss: 0.350085973739624, mean loss: 0.34195610241080904
Epoch: 49, step: 1056, loss: 0.3220371901988983, mean loss: 0.3419558250388539
Epoch: 49, step: 1057, loss: 0.3021848499774933, mean loss: 0.34195527123353653
Epoch: 49, step: 1058, loss: 0.2995387613773346, mean loss: 0.3419546805977382
Epoch: 49, step: 1059, loss: 0.3412265479564667, mean loss: 0.3419546704588744
Epoch: 49, step: 1060, loss: 0.29080095887184143, mean loss: 0.3419539581802832
Epoch: 49, step: 1061, loss: 0.313934326171875, mean loss: 0.34195356803252064
Epoch: 49, step: 1062, loss: 0.3727967143058777, mean loss: 0.3419539974891585
Epoch: 49, step: 1063, loss: 0.329902708530426, mean loss: 0.3419538296906489
Epoch: 49, step: 1064, loss: 0.3279300332069397, mean loss: 0.3419536344302587
Epoch: 49, step: 1065, loss: 0.3588108420372009, mean loss: 0.3419538691383928
Epoch: 49, step: 1066, loss: 0.33556604385375977, mean loss: 0.34195378019995687
Epoch: 49, step: 1067, loss: 0.3309037983417511, mean loss: 0.3419536263519136
Epoch: 49, step: 1068, loss: 0.34086373448371887, mean loss: 0.34195361117764467
Epoch: 49, step: 1069, loss: 0.3553514778614044, mean loss: 0.3419537977099127
Epoch: 49, step: 1070, loss: 0.3428639769554138, mean loss: 0.34195381038173867
Epoch: 49, step: 1071, loss: 0.3483937978744507, mean loss: 0.3419539000401935
Epoch: 49, step: 1072, loss: 0.3738287389278412, mean loss: 0.3419543438002192
Epoch: 49, step: 1073, loss: 0.30595728754997253, mean loss: 0.34195384265785184
Epoch: 49, step: 1074, loss: 0.33977243304252625, mean loss: 0.3419538122892141
Epoch: 49, step: 1075, loss: 0.32849717140197754, mean loss: 0.34195362495430925
Epoch: 49, step: 1076, loss: 0.3261742889881134, mean loss: 0.34195340528736
Epoch: 49, step: 1077, loss: 0.3271900415420532, mean loss: 0.3419531997668023
Epoch: 49, step: 1078, loss: 0.3784100115299225, mean loss: 0.34195370727444846
Epoch: 49, step: 1079, loss: 0.32583341002464294, mean loss: 0.3419534828702883
Epoch: 49, step: 1080, loss: 0.3267914652824402, mean loss: 0.3419532718088912
Epoch: 49, step: 1081, loss: 0.30134832859039307, mean loss: 0.34195270657958055
Epoch: 49, step: 1082, loss: 0.35284385085105896, mean loss: 0.3419528581844786
Epoch: 49, step: 1083, loss: 0.3614165484905243, mean loss: 0.3419531291155798
Epoch: 49, step: 1084, loss: 0.3022977411746979, mean loss: 0.3419525771273288
Epoch: 49, step: 1085, loss: 0.33345526456832886, mean loss: 0.3419524588495448
Epoch: 49, step: 1086, loss: 0.33354225754737854, mean loss: 0.34195234178592965
Epoch: 49, step: 1087, loss: 0.3535813093185425, mean loss: 0.34195250365007324
Epoch: 49, step: 1088, loss: 0.35742366313934326, mean loss: 0.34195271899086926
Epoch: 49, step: 1089, loss: 0.3108758330345154, mean loss: 0.3419522864422798
Epoch: 49, step: 1090, loss: 0.29209792613983154, mean loss: 0.34195159254607954
Epoch: 49, step: 1091, loss: 0.3135523498058319, mean loss: 0.3419511972776971
Epoch: 49, step: 1092, loss: 0.3164069950580597, mean loss: 0.34195084175149326
Epoch: 49, step: 1093, loss: 0.341492235660553, mean loss: 0.34195083536866666
Epoch: 49, step: 1094, loss: 0.3046181797981262, mean loss: 0.34195031578431057
Epoch: 49, step: 1095, loss: 0.360617071390152, mean loss: 0.34195057557882713
Epoch: 49, step: 1096, loss: 0.3126412034034729, mean loss: 0.34195016767140257
Epoch: 49, step: 1097, loss: 0.3336547911167145, mean loss: 0.3419500522237371
Epoch: 49, step: 1098, loss: 0.3118896484375, mean loss: 0.3419496338756223
Epoch: 49, step: 1099, loss: 0.41584914922714233, mean loss: 0.34195066231465804
Epoch: 49, step: 1100, loss: 0.33198508620262146, mean loss: 0.3419505236284324
Epoch: 49, step: 1101, loss: 0.35381123423576355, mean loss: 0.3419506886860545
Epoch: 49, step: 1102, loss: 0.3380797207355499, mean loss: 0.3419506348171174
Epoch: 49, step: 1103, loss: 0.3312781751155853, mean loss: 0.34195048629972663
Epoch: 49, step: 1104, loss: 0.34772875905036926, mean loss: 0.3419505667087489
Epoch: 49, step: 1105, loss: 0.36607813835144043, mean loss: 0.34195090245742893
Epoch: 49, step: 1106, loss: 0.3266119062900543, mean loss: 0.34195068900967185
Epoch: 49, step: 1107, loss: 0.35545212030410767, mean loss: 0.3419508768844255
Epoch: 49, step: 1108, loss: 0.3470739722251892, mean loss: 0.341950948172192
Epoch: 49, step: 1109, loss: 0.33593177795410156, mean loss: 0.34195086441672745
Epoch: 49, step: 1110, loss: 0.30620813369750977, mean loss: 0.3419503670712042
Epoch: 49, step: 1111, loss: 0.35691529512405396, mean loss: 0.34195057529917844
Epoch: 49, step: 1112, loss: 0.32538041472435, mean loss: 0.3419503447385671
Epoch: 49, step: 1113, loss: 0.3656492829322815, mean loss: 0.3419506744858635
Epoch: 49, step: 1114, loss: 0.3099606931209564, mean loss: 0.341950229383091
Epoch: 49, step: 1115, loss: 0.3445461094379425, mean loss: 0.3419502655011906
Epoch: 49, step: 1116, loss: 0.3033091127872467, mean loss: 0.3419497278701927
Epoch: 49, step: 1117, loss: 0.31273308396339417, mean loss: 0.3419493213721001
Epoch: 49, step: 1118, loss: 0.3234444558620453, mean loss: 0.3419490639131017
Epoch: 49, step: 1119, loss: 0.335776150226593, mean loss: 0.34194897803028007
Epoch: 49, step: 1120, loss: 0.35786858201026917, mean loss: 0.3419491995142594
Epoch: 49, step: 1121, loss: 0.3593646287918091, mean loss: 0.3419494418057711
Epoch: 49, step: 1122, loss: 0.3210318386554718, mean loss: 0.3419491507944444
Epoch: 49, step: 1123, loss: 0.34698405861854553, mean loss: 0.3419492208404631
Epoch: 49, step: 1124, loss: 0.3316892683506012, mean loss: 0.3419490781052133
Epoch: 49, step: 1125, loss: 0.3718494772911072, mean loss: 0.3419494940702558
Epoch: 49, step: 1126, loss: 0.3311605453491211, mean loss: 0.3419493439798489
Epoch: 49, step: 1127, loss: 0.3140852153301239, mean loss: 0.34194895635355305
Epoch: 49, step: 1128, loss: 0.36750900745391846, mean loss: 0.3419493119221849
Epoch: 49, step: 1129, loss: 0.3427356779575348, mean loss: 0.3419493228612556
Epoch: 49, step: 1130, loss: 0.36121219396591187, mean loss: 0.3419495908216811
Epoch: 49, step: 1131, loss: 0.37553292512893677, mean loss: 0.3419500579835761
Epoch: 49, step: 1132, loss: 0.3463630676269531, mean loss: 0.3419501193700141
Epoch: 49, step: 1133, loss: 0.3043781816959381, mean loss: 0.3419495967390825
Epoch: 49, step: 1134, loss: 0.3540269136428833, mean loss: 0.3419497647339206
Epoch: 49, step: 1135, loss: 0.3086196780204773, mean loss: 0.3419493011206296
Epoch: 49, step: 1136, loss: 0.38510391116142273, mean loss: 0.341949901382269
Epoch: 49, step: 1137, loss: 0.34440305829048157, mean loss: 0.34194993550412767
Epoch: 49, step: 1138, loss: 0.3393438160419464, mean loss: 0.34194989925516095
Epoch: 49, step: 1139, loss: 0.3419683873653412, mean loss: 0.3419498995123117
Epoch: 49, step: 1140, loss: 0.3353288173675537, mean loss: 0.3419498074210959
Epoch: 49, step: 1141, loss: 0.3402647376060486, mean loss: 0.3419497839841461
Epoch: 49, step: 1142, loss: 0.342680424451828, mean loss: 0.3419497941461855
Epoch: 49, step: 1143, loss: 0.30609622597694397, mean loss: 0.34194929548737923
Epoch: 49, step: 1144, loss: 0.3097226321697235, mean loss: 0.341948847278546
Epoch: 49, step: 1145, loss: 0.296750545501709, mean loss: 0.3419482186687469
Epoch: 49, step: 1146, loss: 0.3117298185825348, mean loss: 0.34194779840255374
Epoch: 49, step: 1147, loss: 0.3189564049243927, mean loss: 0.3419474786513093
Epoch: 49, step: 1148, loss: 0.30831870436668396, mean loss: 0.3419470109679176
Epoch: 49, step: 1149, loss: 0.33141764998435974, mean loss: 0.3419468645356173
Epoch: 49, step: 1150, loss: 0.3324219286441803, mean loss: 0.34194673207374443
Epoch: 49, step: 1151, loss: 0.3179236352443695, mean loss: 0.3419463979927405
Epoch: 49, step: 1152, loss: 0.33375048637390137, mean loss: 0.3419462840165815
Epoch: 49, step: 1153, loss: 0.35025638341903687, mean loss: 0.3419463995790819
Epoch: 49, step: 1154, loss: 0.3391343057155609, mean loss: 0.3419463604738843
Epoch: 49, step: 1155, loss: 0.3606707453727722, mean loss: 0.34194662085302685
Epoch: 49, step: 1156, loss: 0.34915199875831604, mean loss: 0.34194672104878987
Epoch: 49, step: 1157, loss: 0.3265836834907532, mean loss: 0.34194650741809823
Epoch: 49, step: 1158, loss: 0.34506502747535706, mean loss: 0.34194655078207037
Epoch: 49, step: 1159, loss: 0.3253742456436157, mean loss: 0.3419463203423193
Epoch: 49, step: 1160, loss: 0.2949092388153076, mean loss: 0.34194566629554973
Epoch: 49, step: 1161, loss: 0.35055798292160034, mean loss: 0.3419457860474425
Epoch: 49, step: 1162, loss: 0.33093684911727905, mean loss: 0.34194563297333236
Epoch: 49, step: 1163, loss: 0.3288513123989105, mean loss: 0.3419454509054712
Epoch: 49, step: 1164, loss: 0.37066778540611267, mean loss: 0.3419458502649698
Epoch: 49, step: 1165, loss: 0.3241313397884369, mean loss: 0.3419456025728801
Epoch: 49, step: 1166, loss: 0.2855396270751953, mean loss: 0.3419448183178365
Epoch: 49, step: 1167, loss: 0.3155234754085541, mean loss: 0.34194445096698134
Epoch: 49, step: 1168, loss: 0.3317130506038666, mean loss: 0.34194430871602044
Epoch: 49, step: 1169, loss: 0.3718424439430237, mean loss: 0.34194472439512436
Epoch: 49, step: 1170, loss: 0.3126443326473236, mean loss: 0.3419443170322182
Epoch: 49, step: 1171, loss: 0.33422523736953735, mean loss: 0.3419442097154617
Epoch: 49, step: 1172, loss: 0.3296491503715515, mean loss: 0.3419440387821894
Epoch: 49, step: 1173, loss: 0.31073635816574097, mean loss: 0.34194360492037074
Epoch: 49, step: 1174, loss: 0.3385700583457947, mean loss: 0.3419435580206116
Epoch: 49, step: 1175, loss: 0.33256545662879944, mean loss: 0.3419434276460719
Epoch: 49, step: 1176, loss: 0.33938372135162354, mean loss: 0.3419433920614821
Epoch: 49, step: 1177, loss: 0.294524222612381, mean loss: 0.3419427328576362
Epoch: 49, step: 1178, loss: 0.32646986842155457, mean loss: 0.3419425177625582
Epoch: 49, step: 1179, loss: 0.28983116149902344, mean loss: 0.34194179334979874
Epoch: 49, step: 1180, loss: 0.3282833695411682, mean loss: 0.3419416034833349
Epoch: 49, step: 1181, loss: 0.321905255317688, mean loss: 0.3419413249608827
Epoch: 49, step: 1182, loss: 0.35404321551322937, mean loss: 0.3419414931852193
Epoch: 49, step: 1183, loss: 0.31199443340301514, mean loss: 0.34194107690693487
Epoch: 49, step: 1184, loss: 0.33609092235565186, mean loss: 0.3419409955881521
Epoch: 49, step: 1185, loss: 0.31936463713645935, mean loss: 0.341940681774824
Epoch: 49, step: 1186, loss: 0.30950987339019775, mean loss: 0.3419402309900585
Epoch: 49, step: 1187, loss: 0.35496339201927185, mean loss: 0.3419404120080868
Epoch: 49, step: 1188, loss: 0.3563652038574219, mean loss: 0.34194061250557584
Epoch: 49, step: 1189, loss: 0.3313292860984802, mean loss: 0.3419404650154248
Epoch: 49, step: 1190, loss: 0.3436011075973511, mean loss: 0.34194048809689565
Epoch: 49, step: 1191, loss: 0.29582464694976807, mean loss: 0.34193984713618586
Epoch: 49, step: 1192, loss: 0.3409888446331024, mean loss: 0.3419398339184552
Epoch: 49, step: 1193, loss: 0.3176313042640686, mean loss: 0.3419394960653676
Epoch: 49, step: 1194, loss: 0.3383537232875824, mean loss: 0.34193944622905154
Epoch: 49, step: 1195, loss: 0.3550049960613251, mean loss: 0.34193962781607945
Epoch: 49, step: 1196, loss: 0.323151558637619, mean loss: 0.34193936670022357
Epoch: 49, step: 1197, loss: 0.30397745966911316, mean loss: 0.3419388391144461
Epoch: 49, step: 1198, loss: 0.3217899203300476, mean loss: 0.3419385590933387
Epoch: 49, step: 1199, loss: 0.37299081683158875, mean loss: 0.34193899063841815
Epoch: 49, step: 1200, loss: 0.33082106709480286, mean loss: 0.3419388361305378
Epoch: 49, step: 1201, loss: 0.325848788022995, mean loss: 0.3419386125272122
Epoch: 49, step: 1202, loss: 0.3242158889770508, mean loss: 0.341938366238026
Epoch: 49, step: 1203, loss: 0.3502335846424103, mean loss: 0.3419384815134346
Epoch: 49, step: 1204, loss: 0.3564089238643646, mean loss: 0.34193868260072285
Epoch: 49, step: 1205, loss: 0.3369863033294678, mean loss: 0.3419386137813561
Epoch: 49, step: 1206, loss: 0.32924672961235046, mean loss: 0.34193843741455415
Epoch: 49, step: 1207, loss: 0.323460191488266, mean loss: 0.3419381806438643
Epoch: 49, step: 1208, loss: 0.3418785035610199, mean loss: 0.3419381798146128
Epoch: 49, step: 1209, loss: 0.3544682264328003, mean loss: 0.34193835392525695
Epoch: 49, step: 1210, loss: 0.313467413187027, mean loss: 0.34193795831420276
Epoch: 49, step: 1211, loss: 0.3019507825374603, mean loss: 0.34193740268981726
Epoch: 49, step: 1212, loss: 0.33363693952560425, mean loss: 0.341937287355949
Epoch: 49, step: 1213, loss: 0.31608349084854126, mean loss: 0.34193692812576276
Epoch: 49, step: 1214, loss: 0.33450156450271606, mean loss: 0.34193682481521237
Epoch: 49, step: 1215, loss: 0.3174493908882141, mean loss: 0.34193648457964954
Epoch: 49, step: 1216, loss: 0.30908527970314026, mean loss: 0.34193602814175095
Epoch: 49, step: 1217, loss: 0.3314935266971588, mean loss: 0.3419358830546161
Epoch: 49, step: 1218, loss: 0.3259814977645874, mean loss: 0.34193566138896425
Epoch: 49, step: 1219, loss: 0.30270135402679443, mean loss: 0.3419351162863278
Epoch: 49, step: 1220, loss: 0.3529459536075592, mean loss: 0.3419352692634916
Epoch: 49, step: 1221, loss: 0.3478449285030365, mean loss: 0.3419353513671794
Epoch: 49, step: 1222, loss: 0.34561625123023987, mean loss: 0.34193540250570403
Epoch: 49, step: 1223, loss: 0.35702890157699585, mean loss: 0.34193561219588287
Epoch: 49, step: 1224, loss: 0.3492204248905182, mean loss: 0.34193571340054374
Epoch: 49, step: 1225, loss: 0.31042003631591797, mean loss: 0.34193527557334963
Epoch: 49, step: 1226, loss: 0.3278537690639496, mean loss: 0.3419350799506816
Epoch: 49, step: 1227, loss: 0.29941049218177795, mean loss: 0.34193448920012914
Epoch: 49, step: 1228, loss: 0.3473607897758484, mean loss: 0.3419345645811193
Epoch: 49, step: 1229, loss: 0.284331351518631, mean loss: 0.34193376438089895
Epoch: 49, step: 1230, loss: 0.35180872678756714, mean loss: 0.3419339015579227
Epoch: 49, step: 1231, loss: 0.35365381836891174, mean loss: 0.341934064361679
Epoch: 49, step: 1232, loss: 0.31089290976524353, mean loss: 0.3419336331686551
Epoch: 49, step: 1233, loss: 0.356506884098053, mean loss: 0.3419338356030339
Epoch: 49, step: 1234, loss: 0.3070937991142273, mean loss: 0.3419333516531445
Epoch: 49, step: 1235, loss: 0.3620052635669708, mean loss: 0.34193363046067743
Epoch: 49, step: 1236, loss: 0.29677632451057434, mean loss: 0.34193300321489034
Epoch: 49, step: 1237, loss: 0.33415260910987854, mean loss: 0.34193289514485525
Epoch: 49, step: 1238, loss: 0.3131598234176636, mean loss: 0.3419324954911053
Epoch: 49, step: 1239, loss: 0.3413272202014923, mean loss: 0.341932487084037
Epoch: 49, step: 1240, loss: 0.3905969560146332, mean loss: 0.3419331630076023
Epoch: 49, step: 1241, loss: 0.3600170910358429, mean loss: 0.34193341418024636
Epoch: 49, step: 1242, loss: 0.3370012044906616, mean loss: 0.34193334567638256
Epoch: 49, step: 1243, loss: 0.3100303113460541, mean loss: 0.34193290257868353
Epoch: 49, step: 1244, loss: 0.35484248399734497, mean loss: 0.34193308187593524
Epoch: 49, step: 1245, loss: 0.35184890031814575, mean loss: 0.3419332195918104
Epoch: 49, step: 1246, loss: 0.3169534504413605, mean loss: 0.3419328726650275
Epoch: 49, step: 1247, loss: 0.30361202359199524, mean loss: 0.34193234046057946
Epoch: 49, step: 1248, loss: 0.3029346764087677, mean loss: 0.3419317988639674
Epoch: 49, step: 1249, loss: 0.33091047406196594, mean loss: 0.3419316458027669
Epoch: 49, step: 1250, loss: 0.3485662341117859, mean loss: 0.3419317379408689
Epoch: 49, step: 1251, loss: 0.3178093135356903, mean loss: 0.3419314029444184
Epoch: 49, step: 1252, loss: 0.3167635202407837, mean loss: 0.3419310534341808
Epoch: 49, step: 1253, loss: 0.3435753583908081, mean loss: 0.34193107626857816
Epoch: 49, step: 1254, loss: 0.3297828137874603, mean loss: 0.341930907568484
Epoch: 49, step: 1255, loss: 0.32505154609680176, mean loss: 0.34193067317197406
Epoch: 49, step: 1256, loss: 0.31574520468711853, mean loss: 0.34193030955056564
Epoch: 49, step: 1257, loss: 0.3395596146583557, mean loss: 0.3419302766306488
Epoch: 49, step: 1258, loss: 0.3009483218193054, mean loss: 0.3419297075553893
Epoch: 49, step: 1259, loss: 0.30279219150543213, mean loss: 0.3419291640995455
Epoch: 49, step: 1260, loss: 0.3517351746559143, mean loss: 0.3419293002619871
Epoch: 49, step: 1261, loss: 0.31877192854881287, mean loss: 0.34192897871221184
Epoch: 49, step: 1262, loss: 0.3136695623397827, mean loss: 0.3419285863238647
Epoch: 49, step: 1263, loss: 0.31182461977005005, mean loss: 0.3419281683293277
Epoch: 49, step: 1264, loss: 0.33264485001564026, mean loss: 0.3419280394319462
Epoch: 49, step: 1265, loss: 0.34463873505592346, mean loss: 0.34192807706899636
Epoch: 49, step: 1266, loss: 0.3144296407699585, mean loss: 0.34192769526823413
Epoch: 49, step: 1267, loss: 0.3600531816482544, mean loss: 0.3419279469272142
Epoch: 49, step: 1268, loss: 0.3690130114555359, mean loss: 0.3419283229780927
Epoch: 49, step: 1269, loss: 0.3419640064239502, mean loss: 0.34192832347351726
Epoch: 49, step: 1270, loss: 0.37282466888427734, mean loss: 0.3419287524285676
Epoch: 49, step: 1271, loss: 0.3333606421947479, mean loss: 0.34192863347329694
Epoch: 49, step: 1272, loss: 0.3060515820980072, mean loss: 0.34192813538153705
Epoch: 49, step: 1273, loss: 0.352272093296051, mean loss: 0.3419282789877833
Epoch: 49, step: 1274, loss: 0.31853753328323364, mean loss: 0.34192795425613015
Epoch: 49, step: 1275, loss: 0.3252488374710083, mean loss: 0.3419277227046421
Epoch: 49, step: 1276, loss: 0.31197041273117065, mean loss: 0.34192730682150557
Epoch: 49, step: 1277, loss: 0.3608725368976593, mean loss: 0.34192756982550476
Epoch: 49, step: 1278, loss: 0.32588014006614685, mean loss: 0.3419273470528282
Epoch: 49, step: 1279, loss: 0.3639698922634125, mean loss: 0.3419276530462927
Epoch: 49, step: 1280, loss: 0.3732296824455261, mean loss: 0.3419280875734024
Epoch: 49, step: 1281, loss: 0.3322010934352875, mean loss: 0.3419279525475252
Epoch: 49, step: 1282, loss: 0.3446231484413147, mean loss: 0.34192798996053614
Epoch: 49, step: 1283, loss: 0.3222145438194275, mean loss: 0.34192771631469854
Epoch: 49, step: 1284, loss: 0.31330549716949463, mean loss: 0.34192731901011997
Epoch: 49, step: 1285, loss: 0.2995956540107727, mean loss: 0.34192673141309327
Epoch: 49, step: 1286, loss: 0.3568398654460907, mean loss: 0.34192693841632793
Epoch: 49, step: 1287, loss: 0.31748804450035095, mean loss: 0.341926599194548
Epoch: 49, step: 1288, loss: 0.3561497926712036, mean loss: 0.34192679661551373
Epoch: 49, step: 1289, loss: 0.3193664252758026, mean loss: 0.34192648347708354
Epoch: 49, step: 1290, loss: 0.2740413248538971, mean loss: 0.3419255412427279
Epoch: 49, step: 1291, loss: 0.3415147364139557, mean loss: 0.3419255355409065
Epoch: 49, step: 1292, loss: 0.33977702260017395, mean loss: 0.34192550572074326
Epoch: 49, step: 1293, loss: 0.32549145817756653, mean loss: 0.34192527762848035
Epoch: 49, step: 1294, loss: 0.3350348174571991, mean loss: 0.34192518199538474
Epoch: 49, step: 1295, loss: 0.2917632758617401, mean loss: 0.34192448580504814
Epoch: 49, step: 1296, loss: 0.3196498453617096, mean loss: 0.34192417666260516
Epoch: 49, step: 1297, loss: 0.3168124258518219, mean loss: 0.34192382814967304
Epoch: 49, step: 1298, loss: 0.36225467920303345, mean loss: 0.34192411030706743
Epoch: 49, step: 1299, loss: 0.3716966509819031, mean loss: 0.3419245234932098
Epoch: 49, step: 1300, loss: 0.3304652273654938, mean loss: 0.34192436446221863
Epoch: 49, step: 1301, loss: 0.38922590017318726, mean loss: 0.34192502089919596
Epoch: 49, step: 1302, loss: 0.34388765692710876, mean loss: 0.3419250481357109
Epoch: 49, step: 1303, loss: 0.33125177025794983, mean loss: 0.3419249000191708
Epoch: 49, step: 1304, loss: 0.36361756920814514, mean loss: 0.34192520105120183
Epoch: 49, step: 1305, loss: 0.3416574001312256, mean loss: 0.3419251973349447
Epoch: 49, step: 1306, loss: 0.3392919600009918, mean loss: 0.3419251607941771
Epoch: 49, step: 1307, loss: 0.34263476729393005, mean loss: 0.34192517064107014
Epoch: 49, step: 1308, loss: 0.3438141942024231, mean loss: 0.3419251968538442
Epoch: 49, step: 1309, loss: 0.32822975516319275, mean loss: 0.34192500681357985
Epoch: 49, step: 1310, loss: 0.3340917229652405, mean loss: 0.3419248981191171
Epoch: 49, step: 1311, loss: 0.353588342666626, mean loss: 0.3419250599585541
Epoch: 49, step: 1312, loss: 0.3125375807285309, mean loss: 0.34192465218989865
Epoch: 49, step: 1313, loss: 0.2868337035179138, mean loss: 0.3419238877810091
Epoch: 49, step: 1314, loss: 0.31930503249168396, mean loss: 0.34192357393972356
Epoch: 49, step: 1315, loss: 0.3394309878349304, mean loss: 0.34192353935505676
Epoch: 49, step: 1316, loss: 0.34184810519218445, mean loss: 0.3419235383084212
Epoch: 49, step: 1317, loss: 0.3118893504142761, mean loss: 0.34192312159521127
Epoch: 49, step: 1318, loss: 0.3351570963859558, mean loss: 0.34192302772042515
Epoch: 49, step: 1319, loss: 0.3326244056224823, mean loss: 0.34192289870907466
Epoch: 49, step: 1320, loss: 0.30346810817718506, mean loss: 0.3419223651853357
Epoch: 49, step: 1321, loss: 0.324084997177124, mean loss: 0.34192211771220926
Epoch: 49, step: 1322, loss: 0.33057892322540283, mean loss: 0.3419219603405131
Epoch: 49, step: 1323, loss: 0.3152930736541748, mean loss: 0.3419215909053482
Epoch: 49, step: 1324, loss: 0.30542057752609253, mean loss: 0.3419210845165165
Epoch: 49, step: 1325, loss: 0.3655794560909271, mean loss: 0.3419214127312105
Epoch: 49, step: 1326, loss: 0.2951652407646179, mean loss: 0.3419207640876751
Epoch: 49, step: 1327, loss: 0.3540489077568054, mean loss: 0.3419209323378231
Epoch: 49, step: 1328, loss: 0.34598249197006226, mean loss: 0.3419209886818563
Epoch: 49, step: 1329, loss: 0.33864516019821167, mean loss: 0.341920943238518
Epoch: 49, step: 1330, loss: 0.3532911241054535, mean loss: 0.34192110096710804
Epoch: 49, step: 1331, loss: 0.3535253703594208, mean loss: 0.34192126194077066
Epoch: 49, step: 1332, loss: 0.3202863931655884, mean loss: 0.3419209618274555
Epoch: 49, step: 1333, loss: 0.30930158495903015, mean loss: 0.3419205093461562
Epoch: 49, step: 1334, loss: 0.3375685214996338, mean loss: 0.34192044897817897
Epoch: 49, step: 1335, loss: 0.3104250431060791, mean loss: 0.3419200121002193
Epoch: 49, step: 1336, loss: 0.3264928460121155, mean loss: 0.3419197981104271
Epoch: 49, step: 1337, loss: 0.3602728247642517, mean loss: 0.3419200526812188
Epoch: 49, step: 1338, loss: 0.33429914712905884, mean loss: 0.3419199469747821
Epoch: 49, step: 1339, loss: 0.352865606546402, mean loss: 0.34192009879540425
Epoch: 49, step: 1340, loss: 0.31843388080596924, mean loss: 0.3419197730368014
Epoch: 49, step: 1341, loss: 0.34520748257637024, mean loss: 0.3419198186373664
Epoch: 49, step: 1342, loss: 0.30944809317588806, mean loss: 0.3419193682604477
Epoch: 49, step: 1343, loss: 0.36396220326423645, mean loss: 0.3419196739863146
Epoch: 49, step: 1344, loss: 0.35709288716316223, mean loss: 0.34191988443018057
Epoch: 49, step: 1345, loss: 0.33369046449661255, mean loss: 0.34191977029437387
Epoch: 49, step: 1346, loss: 0.35476505756378174, mean loss: 0.3419199484462853
Epoch: 49, step: 1347, loss: 0.28817451000213623, mean loss: 0.3419192030585337
Epoch: 49, step: 1348, loss: 0.3119918704032898, mean loss: 0.34191878800642
Epoch: 49, step: 1349, loss: 0.3445848226547241, mean loss: 0.34191882498024534
Epoch: 49, step: 1350, loss: 0.3341083824634552, mean loss: 0.34191871666284873
Epoch: 49, step: 1351, loss: 0.3156469464302063, mean loss: 0.34191835232365986
Epoch: 49, step: 1352, loss: 0.3452705442905426, mean loss: 0.3419183988115042
Epoch: 49, step: 1353, loss: 0.3278834819793701, mean loss: 0.3419182041794583
Epoch: 49, step: 1354, loss: 0.3338768184185028, mean loss: 0.34191809266546236
Epoch: 49, step: 1355, loss: 0.3601110279560089, mean loss: 0.3419183449526724
Epoch: 49, step: 1356, loss: 0.2988113760948181, mean loss: 0.341917747182938
Epoch: 49, step: 1357, loss: 0.3151259124279022, mean loss: 0.34191737566236285
Epoch: 49, step: 1358, loss: 0.30453184247016907, mean loss: 0.34191685724687104
Epoch: 49, step: 1359, loss: 0.3330182135105133, mean loss: 0.34191673385339755
Epoch: 49, step: 1360, loss: 0.34532812237739563, mean loss: 0.3419167811569255
Epoch: 49, step: 1361, loss: 0.2629205286502838, mean loss: 0.34191568578194964
Epoch: 49, step: 1362, loss: 0.3073810935020447, mean loss: 0.34191520692627664
Epoch: 49, step: 1363, loss: 0.3162722885608673, mean loss: 0.3419148513672311
Epoch: 49, step: 1364, loss: 0.35016530752182007, mean loss: 0.3419149657646487
Epoch: 49, step: 1365, loss: 0.3221098482608795, mean loss: 0.34191469115887646
Epoch: 49, step: 1366, loss: 0.32968753576278687, mean loss: 0.3419145216268909
Epoch: 49, step: 1367, loss: 0.3485328257083893, mean loss: 0.3419146133897449
Epoch: 49, step: 1368, loss: 0.3392530679702759, mean loss: 0.34191457648790197
Epoch: 49, step: 1369, loss: 0.3280811607837677, mean loss: 0.3419143846927698
Epoch: 49, step: 1370, loss: 0.3293841481208801, mean loss: 0.34191421096813723
Epoch: 49, step: 1371, loss: 0.36843058466911316, mean loss: 0.34191457859754193
Epoch: 49, step: 1372, loss: 0.28650256991386414, mean loss: 0.34191381036273094
Epoch: 49, step: 1373, loss: 0.322238951921463, mean loss: 0.3419135375933085
Epoch: 49, step: 1374, loss: 0.3317708969116211, mean loss: 0.3419133969791387
Epoch: 49, step: 1375, loss: 0.3749352693557739, mean loss: 0.341913854776959
Epoch: 49, step: 1376, loss: 0.36882370710372925, mean loss: 0.34191422783578546
Epoch: 49, step: 1377, loss: 0.31441569328308105, mean loss: 0.3419138466211772
Epoch: 49, step: 1378, loss: 0.3125641644001007, mean loss: 0.3419134397495861
Epoch: 49, step: 1379, loss: 0.3346875011920929, mean loss: 0.3419133395785403
Epoch: 49, step: 1380, loss: 0.359511137008667, mean loss: 0.3419135835282115
Epoch: 49, step: 1381, loss: 0.3457780182361603, mean loss: 0.3419136370982399
Epoch: 49, step: 1382, loss: 0.3380919098854065, mean loss: 0.34191358412097084
Epoch: 49, step: 1383, loss: 0.34057220816612244, mean loss: 0.3419135655269044
Epoch: 49, step: 1384, loss: 0.32576102018356323, mean loss: 0.34191334162447246
Epoch: 49, step: 1385, loss: 0.3206673860549927, mean loss: 0.3419130471225794
Epoch: 49, step: 1386, loss: 0.3337782323360443, mean loss: 0.3419129343629938
Epoch: 49, step: 1387, loss: 0.32803112268447876, mean loss: 0.34191274194489
Epoch: 49, step: 1388, loss: 0.3376634418964386, mean loss: 0.3419126830454507
Epoch: 49, step: 1389, loss: 0.359255313873291, mean loss: 0.34191292342788115
Epoch: 49, step: 1390, loss: 0.3535427153110504, mean loss: 0.3419130846236604
Epoch: 49, step: 1391, loss: 0.3410886228084564, mean loss: 0.34191307319629144
Epoch: 49, step: 1392, loss: 0.3449692726135254, mean loss: 0.3419131155558448
Epoch: 49, step: 1393, loss: 0.3187901973724365, mean loss: 0.3419127950718783
Epoch: 49, step: 1394, loss: 0.3900579512119293, mean loss: 0.3419134623551611
Epoch: 49, step: 1395, loss: 0.2858346998691559, mean loss: 0.3419126851242807
Epoch: 49, step: 1396, loss: 0.3506958782672882, mean loss: 0.34191280685439784
Epoch: 49, step: 1397, loss: 0.34983959794044495, mean loss: 0.3419129167137416
Epoch: 49, step: 1398, loss: 0.32253026962280273, mean loss: 0.3419126480886
Epoch: 49, step: 1399, loss: 0.29614517092704773, mean loss: 0.3419120138034794
Epoch: 49, step: 1400, loss: 0.33788150548934937, mean loss: 0.3419119579459976
Epoch: 49, step: 1401, loss: 0.3280084729194641, mean loss: 0.34191176526486694
Epoch: 49, step: 1402, loss: 0.329956591129303, mean loss: 0.34191159958665446
Epoch: 49, step: 1403, loss: 0.31330427527427673, mean loss: 0.34191120314369006
Epoch: 49, step: 1404, loss: 0.3272644281387329, mean loss: 0.3419110001701309
Epoch: 49, step: 1405, loss: 0.32157713174819946, mean loss: 0.34191071838929854
Epoch: 49, step: 1406, loss: 0.3274032175540924, mean loss: 0.34191051735135897
Epoch: 49, step: 1407, loss: 0.3306136429309845, mean loss: 0.34191036080689885
Epoch: 49, step: 1408, loss: 0.3300236165523529, mean loss: 0.3419101960907033
Epoch: 49, step: 1409, loss: 0.33705708384513855, mean loss: 0.34191012884141353
Epoch: 49, step: 1410, loss: 0.33846619725227356, mean loss: 0.34191008111971816
Epoch: 49, step: 1411, loss: 0.3108614385128021, mean loss: 0.3419096508924345
Epoch: 49, step: 1412, loss: 0.3478614389896393, mean loss: 0.34190973336258235
Epoch: 49, step: 1413, loss: 0.3331877291202545, mean loss: 0.34190961250898333
Epoch: 49, step: 1414, loss: 0.34092825651168823, mean loss: 0.3419095989113333
Epoch: 49, step: 1415, loss: 0.31314724683761597, mean loss: 0.34190920038625333
Epoch: 49, step: 1416, loss: 0.3255193829536438, mean loss: 0.3419089732955486
Epoch: 49, step: 1417, loss: 0.35851186513900757, mean loss: 0.34190920333533914
Epoch: 49, step: 1418, loss: 0.3049141466617584, mean loss: 0.3419086907609481
Epoch: 49, step: 1419, loss: 0.34533044695854187, mean loss: 0.3419087381694523
Epoch: 49, step: 1420, loss: 0.3512827157974243, mean loss: 0.3419088680443103
Epoch: 49, step: 1421, loss: 0.3297249674797058, mean loss: 0.3419086992407889
Epoch: 49, step: 1422, loss: 0.36194220185279846, mean loss: 0.341908976793853
Epoch: 49, step: 1423, loss: 0.3291148543357849, mean loss: 0.3419087995408403
Epoch: 49, step: 1424, loss: 0.33435866236686707, mean loss: 0.3419086949407769
Epoch: 49, step: 1425, loss: 0.3374066948890686, mean loss: 0.34190863257065623
Epoch: 49, step: 1426, loss: 0.33857959508895874, mean loss: 0.3419085864512447
Epoch: 49, step: 1427, loss: 0.3152585029602051, mean loss: 0.3419082172546985
Epoch: 49, step: 1428, loss: 0.3295274078845978, mean loss: 0.341908045739711
Epoch: 49, step: 1429, loss: 0.38709986209869385, mean loss: 0.34190867178653944
Epoch: 49, step: 1430, loss: 0.3207562565803528, mean loss: 0.34190837876403946
Epoch: 49, step: 1431, loss: 0.32620930671691895, mean loss: 0.341908161289223
Epoch: 49, step: 1432, loss: 0.3184823989868164, mean loss: 0.3419078367832415
Epoch: 49, step: 1433, loss: 0.2974686026573181, mean loss: 0.34190722119612244
Epoch: 49, step: 1434, loss: 0.3093325197696686, mean loss: 0.34190676996672503
Epoch: 49, step: 1435, loss: 0.3307197391986847, mean loss: 0.34190661500453023
Epoch: 49, step: 1436, loss: 0.32515203952789307, mean loss: 0.3419063829241973
Epoch: 49, step: 1437, loss: 0.3180153965950012, mean loss: 0.34190605199660873
Epoch: 49, step: 1438, loss: 0.3110722601413727, mean loss: 0.3419056249062028
Epoch: 49, step: 1439, loss: 0.34736135601997375, mean loss: 0.3419057004745323
Epoch: 49, step: 1440, loss: 0.3375573456287384, mean loss: 0.3419056402455083
Epoch: 49, step: 1441, loss: 0.3772870600223541, mean loss: 0.34190613030644873
Epoch: 49, step: 1442, loss: 0.3271051347255707, mean loss: 0.3419059253036706
Epoch: 49, step: 1443, loss: 0.3852941393852234, mean loss: 0.34190652624846396
Valid: 49, mean loss: 0.18474165350198746
Epoch: 50, step: 0, loss: 0.3200392723083496, mean loss: 0.3419062233821056
Epoch: 50, step: 1, loss: 0.2894798815250397, mean loss: 0.3419054972756008
Epoch: 50, step: 2, loss: 0.33313342928886414, mean loss: 0.34190537578386243
Epoch: 50, step: 3, loss: 0.29927128553390503, mean loss: 0.3419047853167103
Epoch: 50, step: 4, loss: 0.3463020920753479, mean loss: 0.3419048462170186
Epoch: 50, step: 5, loss: 0.3109375536441803, mean loss: 0.3419044173427897
Epoch: 50, step: 6, loss: 0.3561367690563202, mean loss: 0.3419046144476648
Epoch: 50, step: 7, loss: 0.34086859226226807, mean loss: 0.3419046000999168
Epoch: 50, step: 8, loss: 0.3148851990699768, mean loss: 0.341904225916629
Epoch: 50, step: 9, loss: 0.3432644009590149, mean loss: 0.34190424475300957
Epoch: 50, step: 10, loss: 0.36207759380340576, mean loss: 0.3419045241197134
Epoch: 50, step: 11, loss: 0.29580092430114746, mean loss: 0.3419038856718125
Epoch: 50, step: 12, loss: 0.35517576336860657, mean loss: 0.3419040694597412
Epoch: 50, step: 13, loss: 0.33838343620300293, mean loss: 0.3419040207069612
Epoch: 50, step: 14, loss: 0.3207647204399109, mean loss: 0.34190372797968477
Epoch: 50, step: 15, loss: 0.3451712727546692, mean loss: 0.3419037732265106
Epoch: 50, step: 16, loss: 0.3495076596736908, mean loss: 0.34190387851870563
Epoch: 50, step: 17, loss: 0.3057039976119995, mean loss: 0.341903377260281
Epoch: 50, step: 18, loss: 0.32067564129829407, mean loss: 0.34190308332466907
Epoch: 50, step: 19, loss: 0.28681012988090515, mean loss: 0.3419023204756876
Epoch: 50, step: 20, loss: 0.29972386360168457, mean loss: 0.3419017364564013
Epoch: 50, step: 21, loss: 0.31807979941368103, mean loss: 0.3419014066131812
Epoch: 50, step: 22, loss: 0.38290050625801086, mean loss: 0.341901974286909
Epoch: 50, step: 23, loss: 0.33965110778808594, mean loss: 0.3419019431218323
Epoch: 50, step: 24, loss: 0.35027581453323364, mean loss: 0.34190205906328486
Epoch: 50, step: 25, loss: 0.3359808623790741, mean loss: 0.3419019770817729
Epoch: 50, step: 26, loss: 0.3600411117076874, mean loss: 0.3419022282224076
Epoch: 50, step: 27, loss: 0.3328952193260193, mean loss: 0.3419021035199529
Epoch: 50, step: 28, loss: 0.3597446084022522, mean loss: 0.341902350546838
Epoch: 50, step: 29, loss: 0.3297354280948639, mean loss: 0.3419021820998983
Epoch: 50, step: 30, loss: 0.3253297209739685, mean loss: 0.3419019526629374
Epoch: 50, step: 31, loss: 0.3256722390651703, mean loss: 0.3419017279742454
Epoch: 50, step: 32, loss: 0.2986910045146942, mean loss: 0.34190112976119236
Epoch: 50, step: 33, loss: 0.3386535048484802, mean loss: 0.34190108480141007
Epoch: 50, step: 34, loss: 0.3578987419605255, mean loss: 0.34190130626824966
Epoch: 50, step: 35, loss: 0.34226399660110474, mean loss: 0.34190131128915796
Epoch: 50, step: 36, loss: 0.3395445644855499, mean loss: 0.34190127866395476
Epoch: 50, step: 37, loss: 0.3209206759929657, mean loss: 0.34190098822675175
Epoch: 50, step: 38, loss: 0.31587639451026917, mean loss: 0.3419006279699138
Epoch: 50, step: 39, loss: 0.3391169309616089, mean loss: 0.341900589435902
Epoch: 50, step: 40, loss: 0.340915322303772, mean loss: 0.3419005757972878
Epoch: 50, step: 41, loss: 0.3445853888988495, mean loss: 0.34190061296144575
Epoch: 50, step: 42, loss: 0.29103830456733704, mean loss: 0.341899908916647
Epoch: 50, step: 43, loss: 0.37501874566078186, mean loss: 0.3419003673469214
Epoch: 50, step: 44, loss: 0.3205334544181824, mean loss: 0.3419000715906348
Epoch: 50, step: 45, loss: 0.35081008076667786, mean loss: 0.341900194919389
Epoch: 50, step: 46, loss: 0.32801005244255066, mean loss: 0.34190000266029896
Epoch: 50, step: 47, loss: 0.2974720299243927, mean loss: 0.34189938772323863
Epoch: 50, step: 48, loss: 0.34493589401245117, mean loss: 0.34189942975158905
Epoch: 50, step: 49, loss: 0.3533250093460083, mean loss: 0.341899587891099
Epoch: 50, step: 50, loss: 0.3633972406387329, mean loss: 0.3418998854323475
Epoch: 50, step: 51, loss: 0.3212219476699829, mean loss: 0.34189959924043917
Epoch: 50, step: 52, loss: 0.35175657272338867, mean loss: 0.34189973566347326
Epoch: 50, step: 53, loss: 0.3398258686065674, mean loss: 0.34189970696102
Epoch: 50, step: 54, loss: 0.3672623634338379, mean loss: 0.3419000579769563
Epoch: 50, step: 55, loss: 0.30165278911590576, mean loss: 0.34189950096758875
Epoch: 50, step: 56, loss: 0.3308752179145813, mean loss: 0.3418993483971381
Epoch: 50, step: 57, loss: 0.2924974858760834, mean loss: 0.34189866471003744
Epoch: 50, step: 58, loss: 0.31934788823127747, mean loss: 0.341898352627439
Epoch: 50, step: 59, loss: 0.3055771589279175, mean loss: 0.34189784998152567
Epoch: 50, step: 60, loss: 0.3109797537326813, mean loss: 0.34189742211454005
Epoch: 50, step: 61, loss: 0.33321699500083923, mean loss: 0.3418973019901716
Epoch: 50, step: 62, loss: 0.31826260685920715, mean loss: 0.3418969749252126
Epoch: 50, step: 63, loss: 0.3199569880962372, mean loss: 0.3418966713164056
Epoch: 50, step: 64, loss: 0.3484158515930176, mean loss: 0.3418967615285453
Epoch: 50, step: 65, loss: 0.3031875789165497, mean loss: 0.34189622587993307
Epoch: 50, step: 66, loss: 0.3204897344112396, mean loss: 0.3418959296660115
Epoch: 50, step: 67, loss: 0.3497712016105652, mean loss: 0.34189603863916623
Epoch: 50, step: 68, loss: 0.3845692574977875, mean loss: 0.3418966291166719
Epoch: 50, step: 69, loss: 0.3343173861503601, mean loss: 0.3418965242426859
Epoch: 50, step: 70, loss: 0.3381349742412567, mean loss: 0.3418964721948382
Epoch: 50, step: 71, loss: 0.35423922538757324, mean loss: 0.3418966429767896
Epoch: 50, step: 72, loss: 0.3029140830039978, mean loss: 0.34189610359749206
Epoch: 50, step: 73, loss: 0.345325231552124, mean loss: 0.34189615104371
Epoch: 50, step: 74, loss: 0.33074358105659485, mean loss: 0.3418959967362733
Epoch: 50, step: 75, loss: 0.2998507022857666, mean loss: 0.34189541500382475
Epoch: 50, step: 76, loss: 0.29032889008522034, mean loss: 0.34189470154691703
Epoch: 50, step: 77, loss: 0.35118183493614197, mean loss: 0.3418948300387595
Epoch: 50, step: 78, loss: 0.31251686811447144, mean loss: 0.341894423586513
Epoch: 50, step: 79, loss: 0.3173043727874756, mean loss: 0.34189408338105093
Epoch: 50, step: 80, loss: 0.2864283323287964, mean loss: 0.3418933160182439
Epoch: 50, step: 81, loss: 0.3288184702396393, mean loss: 0.3418931351316362
Epoch: 50, step: 82, loss: 0.386478453874588, mean loss: 0.34189375194774435
Epoch: 50, step: 83, loss: 0.3353365659713745, mean loss: 0.34189366123353404
Epoch: 50, step: 84, loss: 0.32014769315719604, mean loss: 0.3418933603970109
Epoch: 50, step: 85, loss: 0.30700963735580444, mean loss: 0.34189287781776956
Epoch: 50, step: 86, loss: 0.3071165978908539, mean loss: 0.3418923967315448
Epoch: 50, step: 87, loss: 0.308596134185791, mean loss: 0.3418919361258766
Epoch: 50, step: 88, loss: 0.35196346044540405, mean loss: 0.3418920754489315
Epoch: 50, step: 89, loss: 0.30243581533432007, mean loss: 0.341891529643701
Epoch: 50, step: 90, loss: 0.319779634475708, mean loss: 0.3418912237702843
Epoch: 50, step: 91, loss: 0.34318217635154724, mean loss: 0.3418912416277593
Epoch: 50, step: 92, loss: 0.33872294425964355, mean loss: 0.3418911978019758
Epoch: 50, step: 93, loss: 0.3375217020511627, mean loss: 0.3418911373613341
Epoch: 50, step: 94, loss: 0.30518999695777893, mean loss: 0.34189062970326084
Epoch: 50, step: 95, loss: 0.32919371128082275, mean loss: 0.3418904540791817
Epoch: 50, step: 96, loss: 0.36810144782066345, mean loss: 0.3418908166252589
Epoch: 50, step: 97, loss: 0.32730668783187866, mean loss: 0.3418906149028213
Epoch: 50, step: 98, loss: 0.29022079706192017, mean loss: 0.34188990023432186
Epoch: 50, step: 99, loss: 0.34887805581092834, mean loss: 0.3418899968893091
Epoch: 50, step: 100, loss: 0.34808966517448425, mean loss: 0.34189008263733867
Epoch: 50, step: 101, loss: 0.3306916356086731, mean loss: 0.34188992775300586
Epoch: 50, step: 102, loss: 0.314274400472641, mean loss: 0.34188954581135367
Epoch: 50, step: 103, loss: 0.341337651014328, mean loss: 0.3418895381783763
Epoch: 50, step: 104, loss: 0.3083847761154175, mean loss: 0.3418890747973921
Epoch: 50, step: 105, loss: 0.3397302031517029, mean loss: 0.3418890449399578
Epoch: 50, step: 106, loss: 0.3573583662509918, mean loss: 0.34188925887942856
Epoch: 50, step: 107, loss: 0.38677793741226196, mean loss: 0.3418898796776602
Epoch: 50, step: 108, loss: 0.3220002055168152, mean loss: 0.341889604612673
Epoch: 50, step: 109, loss: 0.3565055727958679, mean loss: 0.34188980674195224
Epoch: 50, step: 110, loss: 0.29607337713241577, mean loss: 0.3418891731394629
Epoch: 50, step: 111, loss: 0.3043730556964874, mean loss: 0.34188865433044857
Epoch: 50, step: 112, loss: 0.30805572867393494, mean loss: 0.34188818646262875
Epoch: 50, step: 113, loss: 0.28167322278022766, mean loss: 0.3418873537751314
Epoch: 50, step: 114, loss: 0.34076038002967834, mean loss: 0.3418873381908993
Epoch: 50, step: 115, loss: 0.3515413701534271, mean loss: 0.3418874716887692
Epoch: 50, step: 116, loss: 0.33025699853897095, mean loss: 0.34188731086250224
Epoch: 50, step: 117, loss: 0.33211928606033325, mean loss: 0.34188717579205224
Epoch: 50, step: 118, loss: 0.3145703971385956, mean loss: 0.3418867980658855
Epoch: 50, step: 119, loss: 0.3940739333629608, mean loss: 0.34188751968003506
Epoch: 50, step: 120, loss: 0.3326345682144165, mean loss: 0.3418873917372319
Epoch: 50, step: 121, loss: 0.3486824333667755, mean loss: 0.34188748569262073
Epoch: 50, step: 122, loss: 0.3131740689277649, mean loss: 0.3418870886762253
Epoch: 50, step: 123, loss: 0.34337317943573, mean loss: 0.34188710922391014
Epoch: 50, step: 124, loss: 0.3147646188735962, mean loss: 0.341886734215402
Epoch: 50, step: 125, loss: 0.3522392213344574, mean loss: 0.34188687735185525
Epoch: 50, step: 126, loss: 0.36453238129615784, mean loss: 0.34188719045075255
Epoch: 50, step: 127, loss: 0.36822134256362915, mean loss: 0.3418875545442172
Epoch: 50, step: 128, loss: 0.294269323348999, mean loss: 0.3418868961882162
Epoch: 50, step: 129, loss: 0.31838953495025635, mean loss: 0.3418865713249335
Epoch: 50, step: 130, loss: 0.31425121426582336, mean loss: 0.34188618925698117
Epoch: 50, step: 131, loss: 0.3072362244129181, mean loss: 0.34188571021637887
Epoch: 50, step: 132, loss: 0.32656919956207275, mean loss: 0.34188549846640787
Epoch: 50, step: 133, loss: 0.3442630469799042, mean loss: 0.3418855313354392
Epoch: 50, step: 134, loss: 0.300388365983963, mean loss: 0.34188495765512744
Epoch: 50, step: 135, loss: 0.303508996963501, mean loss: 0.34188442713145056
Epoch: 50, step: 136, loss: 0.35715004801750183, mean loss: 0.341884638166203
Epoch: 50, step: 137, loss: 0.3669258654117584, mean loss: 0.3418849843359512
Epoch: 50, step: 138, loss: 0.3130626082420349, mean loss: 0.3418845859011361
Epoch: 50, step: 139, loss: 0.3276912569999695, mean loss: 0.34188438969808244
Epoch: 50, step: 140, loss: 0.32353997230529785, mean loss: 0.34188413611550283
Epoch: 50, step: 141, loss: 0.29611778259277344, mean loss: 0.341883503476738
Epoch: 50, step: 142, loss: 0.3598144054412842, mean loss: 0.3418837513362678
Epoch: 50, step: 143, loss: 0.34461450576782227, mean loss: 0.3418837890830669
Epoch: 50, step: 144, loss: 0.34098413586616516, mean loss: 0.34188377664747055
Epoch: 50, step: 145, loss: 0.3472180962562561, mean loss: 0.34188385038091273
Epoch: 50, step: 146, loss: 0.37214356660842896, mean loss: 0.3418842686389777
Epoch: 50, step: 147, loss: 0.3082866370677948, mean loss: 0.3418838042497538
Epoch: 50, step: 148, loss: 0.3362237513065338, mean loss: 0.3418837260171183
Epoch: 50, step: 149, loss: 0.36739978194236755, mean loss: 0.34188407869239024
Epoch: 50, step: 150, loss: 0.30855792760849, mean loss: 0.34188361807469203
Epoch: 50, step: 151, loss: 0.27157583832740784, mean loss: 0.34188264632851023
Epoch: 50, step: 152, loss: 0.36625802516937256, mean loss: 0.34188298322371624
Epoch: 50, step: 153, loss: 0.3311729431152344, mean loss: 0.3418828352009378
Epoch: 50, step: 154, loss: 0.3235100209712982, mean loss: 0.3418825812749586
Epoch: 50, step: 155, loss: 0.3769122362136841, mean loss: 0.3418830654041937
Epoch: 50, step: 156, loss: 0.3333376944065094, mean loss: 0.3418829473040652
Epoch: 50, step: 157, loss: 0.3195297122001648, mean loss: 0.341882638378513
Epoch: 50, step: 158, loss: 0.3735639750957489, mean loss: 0.34188307621398223
Epoch: 50, step: 159, loss: 0.3233652114868164, mean loss: 0.3418828203009816
Epoch: 50, step: 160, loss: 0.35021454095840454, mean loss: 0.3418829354420197
Epoch: 50, step: 161, loss: 0.30682772397994995, mean loss: 0.3418824509997508
Epoch: 50, step: 162, loss: 0.30247360467910767, mean loss: 0.34188190640035165
Epoch: 50, step: 163, loss: 0.3300020098686218, mean loss: 0.34188174223175216
Epoch: 50, step: 164, loss: 0.3928603231906891, mean loss: 0.34188244669635465
Epoch: 50, step: 165, loss: 0.31999778747558594, mean loss: 0.3418821442800373
Epoch: 50, step: 166, loss: 0.307013601064682, mean loss: 0.34188166245070606
Epoch: 50, step: 167, loss: 0.3387662470340729, mean loss: 0.3418816194010789
Epoch: 50, step: 168, loss: 0.3441343307495117, mean loss: 0.3418816505292049
Epoch: 50, step: 169, loss: 0.3502429127693176, mean loss: 0.34188176606412596
Epoch: 50, step: 170, loss: 0.31214314699172974, mean loss: 0.34188135514512424
Epoch: 50, step: 171, loss: 0.3241226375102997, mean loss: 0.3418811097640703
Epoch: 50, step: 172, loss: 0.32981249690055847, mean loss: 0.34188094300833455
Epoch: 50, step: 173, loss: 0.31556496024131775, mean loss: 0.3418805793973311
Epoch: 50, step: 174, loss: 0.3428446054458618, mean loss: 0.3418805927172074
Epoch: 50, step: 175, loss: 0.32082855701446533, mean loss: 0.34188030184681245
Epoch: 50, step: 176, loss: 0.28992483019828796, mean loss: 0.34187958400175605
Epoch: 50, step: 177, loss: 0.28505221009254456, mean loss: 0.341878798854696
Epoch: 50, step: 178, loss: 0.42488738894462585, mean loss: 0.34187994571483626
Epoch: 50, step: 179, loss: 0.3372839391231537, mean loss: 0.34187988221654125
Epoch: 50, step: 180, loss: 0.32569822669029236, mean loss: 0.3418796586543422
Epoch: 50, step: 181, loss: 0.319818377494812, mean loss: 0.3418793538647376
Epoch: 50, step: 182, loss: 0.3021765351295471, mean loss: 0.3418788053544695
Epoch: 50, step: 183, loss: 0.33576658368110657, mean loss: 0.3418787209128571
Epoch: 50, step: 184, loss: 0.3169499635696411, mean loss: 0.34187837652165254
Epoch: 50, step: 185, loss: 0.31723687052726746, mean loss: 0.34187803610353307
Epoch: 50, step: 186, loss: 0.35104846954345703, mean loss: 0.3418781627897259
Epoch: 50, step: 187, loss: 0.31293201446533203, mean loss: 0.34187776291476973
Epoch: 50, step: 188, loss: 0.322642058134079, mean loss: 0.34187749718786675
Epoch: 50, step: 189, loss: 0.36594635248184204, mean loss: 0.3418778296765433
Epoch: 50, step: 190, loss: 0.3286038637161255, mean loss: 0.34187764631167805
Epoch: 50, step: 191, loss: 0.37407875061035156, mean loss: 0.3418780911274629
Epoch: 50, step: 192, loss: 0.31581631302833557, mean loss: 0.34187773112334513
Epoch: 50, step: 193, loss: 0.33734574913978577, mean loss: 0.3418776685217209
Epoch: 50, step: 194, loss: 0.35044893622398376, mean loss: 0.34187778691757287
Epoch: 50, step: 195, loss: 0.31534209847450256, mean loss: 0.3418774203822886
Epoch: 50, step: 196, loss: 0.30236634612083435, mean loss: 0.3418768746266045
Epoch: 50, step: 197, loss: 0.3362644612789154, mean loss: 0.3418767971049416
Epoch: 50, step: 198, loss: 0.36044877767562866, mean loss: 0.3418770536275534
Epoch: 50, step: 199, loss: 0.35810303688049316, mean loss: 0.34187727774334414
Epoch: 50, step: 200, loss: 0.3367292284965515, mean loss: 0.34187720663867366
Epoch: 50, step: 201, loss: 0.3532555401325226, mean loss: 0.34187736379363476
Epoch: 50, step: 202, loss: 0.3237745761871338, mean loss: 0.3418771137654922
Epoch: 50, step: 203, loss: 0.314409077167511, mean loss: 0.34187673439368127
Epoch: 50, step: 204, loss: 0.30280444025993347, mean loss: 0.341876194758378
Epoch: 50, step: 205, loss: 0.2910197377204895, mean loss: 0.3418754923793343
Epoch: 50, step: 206, loss: 0.3154700994491577, mean loss: 0.34187512769922146
Epoch: 50, step: 207, loss: 0.34317630529403687, mean loss: 0.34187514566930205
Epoch: 50, step: 208, loss: 0.34656354784965515, mean loss: 0.34187521041818936
Epoch: 50, step: 209, loss: 0.3366377353668213, mean loss: 0.3418751380873642
Epoch: 50, step: 210, loss: 0.3137378990650177, mean loss: 0.341874749510504
Epoch: 50, step: 211, loss: 0.3624022603034973, mean loss: 0.34187503299267263
Epoch: 50, step: 212, loss: 0.29965293407440186, mean loss: 0.3418744499192063
Epoch: 50, step: 213, loss: 0.3240283131599426, mean loss: 0.3418742034732599
Epoch: 50, step: 214, loss: 0.3432254195213318, mean loss: 0.3418742221325991
Epoch: 50, step: 215, loss: 0.2930516302585602, mean loss: 0.3418735479364011
Epoch: 50, step: 216, loss: 0.3798525631427765, mean loss: 0.3418740723852903
Epoch: 50, step: 217, loss: 0.3114951252937317, mean loss: 0.34187365289086774
Epoch: 50, step: 218, loss: 0.31968697905540466, mean loss: 0.3418733465254963
Epoch: 50, step: 219, loss: 0.2993568181991577, mean loss: 0.34187275944280743
Epoch: 50, step: 220, loss: 0.297411173582077, mean loss: 0.34187214551057976
Epoch: 50, step: 221, loss: 0.30630287528038025, mean loss: 0.34187165437155803
Epoch: 50, step: 222, loss: 0.35797542333602905, mean loss: 0.34187187672866787
Epoch: 50, step: 223, loss: 0.3331388235092163, mean loss: 0.34187175614635784
Epoch: 50, step: 224, loss: 0.3346940875053406, mean loss: 0.3418716570415095
Epoch: 50, step: 225, loss: 0.3406704068183899, mean loss: 0.34187164045561186
Epoch: 50, step: 226, loss: 0.3406479060649872, mean loss: 0.3418716235595042
Epoch: 50, step: 227, loss: 0.3318788707256317, mean loss: 0.341871485591414
Epoch: 50, step: 228, loss: 0.36907118558883667, mean loss: 0.34187186112745616
Epoch: 50, step: 229, loss: 0.3314874768257141, mean loss: 0.3418717177561418
Epoch: 50, step: 230, loss: 0.33010101318359375, mean loss: 0.341871555246932
Epoch: 50, step: 231, loss: 0.3465847671031952, mean loss: 0.3418716203177827
Epoch: 50, step: 232, loss: 0.32695087790489197, mean loss: 0.3418714143240725
Epoch: 50, step: 233, loss: 0.349611759185791, mean loss: 0.3418715211847299
Epoch: 50, step: 234, loss: 0.320995569229126, mean loss: 0.34187123298217653
Epoch: 50, step: 235, loss: 0.32798826694488525, mean loss: 0.34187104132380175
Epoch: 50, step: 236, loss: 0.3368714153766632, mean loss: 0.3418709723034676
Epoch: 50, step: 237, loss: 0.3529681861400604, mean loss: 0.34187112549949505
Epoch: 50, step: 238, loss: 0.3138648569583893, mean loss: 0.3418707388808429
Epoch: 50, step: 239, loss: 0.3361005485057831, mean loss: 0.34187065922608895
Epoch: 50, step: 240, loss: 0.34658685326576233, mean loss: 0.34187072433002236
Epoch: 50, step: 241, loss: 0.3364424407482147, mean loss: 0.34187064939719913
Epoch: 50, step: 242, loss: 0.3291119337081909, mean loss: 0.34187047327644643
Epoch: 50, step: 243, loss: 0.3469555675983429, mean loss: 0.34187054346989687
Epoch: 50, step: 244, loss: 0.3137165307998657, mean loss: 0.3418701548438679
Epoch: 50, step: 245, loss: 0.3040161728858948, mean loss: 0.3418696323307967
Epoch: 50, step: 246, loss: 0.32828134298324585, mean loss: 0.3418694447690019
Epoch: 50, step: 247, loss: 0.3120744824409485, mean loss: 0.3418690335090316
Epoch: 50, step: 248, loss: 0.33981379866600037, mean loss: 0.3418690051410094
Epoch: 50, step: 249, loss: 0.3744758665561676, mean loss: 0.3418694552012083
Epoch: 50, step: 250, loss: 0.35052210092544556, mean loss: 0.34186957462876244
Epoch: 50, step: 251, loss: 0.3366640508174896, mean loss: 0.34186950278086575
Epoch: 50, step: 252, loss: 0.3299523890018463, mean loss: 0.3418693383002538
Epoch: 50, step: 253, loss: 0.31347090005874634, mean loss: 0.341868946348971
Epoch: 50, step: 254, loss: 0.296875923871994, mean loss: 0.3418683253701224
Epoch: 50, step: 255, loss: 0.31271255016326904, mean loss: 0.341867922977288
Epoch: 50, step: 256, loss: 0.3561279773712158, mean loss: 0.34186811978442044
Epoch: 50, step: 257, loss: 0.35087209939956665, mean loss: 0.3418682440492306
Epoch: 50, step: 258, loss: 0.32695940136909485, mean loss: 0.3418680382936629
Epoch: 50, step: 259, loss: 0.3332158625125885, mean loss: 0.341867918887428
Epoch: 50, step: 260, loss: 0.3109116554260254, mean loss: 0.34186749167467273
Epoch: 50, step: 261, loss: 0.3340873122215271, mean loss: 0.34186738430557645
Epoch: 50, step: 262, loss: 0.3267786502838135, mean loss: 0.34186717607883976
Epoch: 50, step: 263, loss: 0.3325580060482025, mean loss: 0.3418670476127044
Epoch: 50, step: 264, loss: 0.322630912065506, mean loss: 0.3418667821585466
Epoch: 50, step: 265, loss: 0.41571253538131714, mean loss: 0.34186780119855464
Epoch: 50, step: 266, loss: 0.33475178480148315, mean loss: 0.34186770300190794
Epoch: 50, step: 267, loss: 0.31644055247306824, mean loss: 0.3418673521277217
Epoch: 50, step: 268, loss: 0.318620502948761, mean loss: 0.3418670313443636
Epoch: 50, step: 269, loss: 0.32131174206733704, mean loss: 0.3418667477057645
Epoch: 50, step: 270, loss: 0.30635207891464233, mean loss: 0.3418662576522425
Epoch: 50, step: 271, loss: 0.3088240325450897, mean loss: 0.34186580172132974
Epoch: 50, step: 272, loss: 0.3005951941013336, mean loss: 0.341865232259494
Epoch: 50, step: 273, loss: 0.34613245725631714, mean loss: 0.3418652911388852
Epoch: 50, step: 274, loss: 0.30547553300857544, mean loss: 0.3418647890380486
Epoch: 50, step: 275, loss: 0.32299357652664185, mean loss: 0.3418645286592679
Epoch: 50, step: 276, loss: 0.3834925591945648, mean loss: 0.3418651030212108
Epoch: 50, step: 277, loss: 0.31542542576789856, mean loss: 0.34186473822531066
Epoch: 50, step: 278, loss: 0.3720642924308777, mean loss: 0.34186515489157543
Epoch: 50, step: 279, loss: 0.3145497143268585, mean loss: 0.3418647780229142
Epoch: 50, step: 280, loss: 0.2891927659511566, mean loss: 0.34186405132195713
Epoch: 50, step: 281, loss: 0.3128565549850464, mean loss: 0.3418636511191987
Epoch: 50, step: 282, loss: 0.2846145033836365, mean loss: 0.34186286129058047
Epoch: 50, step: 283, loss: 0.28488364815711975, mean loss: 0.3418620751969166
Epoch: 50, step: 284, loss: 0.33694660663604736, mean loss: 0.34186200738331984
Epoch: 50, step: 285, loss: 0.34463924169540405, mean loss: 0.3418620456973986
Epoch: 50, step: 286, loss: 0.30255967378616333, mean loss: 0.3418615034984952
Epoch: 50, step: 287, loss: 0.3467981517314911, mean loss: 0.3418615716014672
Epoch: 50, step: 288, loss: 0.33716240525245667, mean loss: 0.34186150677554394
Epoch: 50, step: 289, loss: 0.31093958020210266, mean loss: 0.34186108020737493
Epoch: 50, step: 290, loss: 0.34706154465675354, mean loss: 0.34186115194682465
Epoch: 50, step: 291, loss: 0.3379087448120117, mean loss: 0.34186109742484794
Epoch: 50, step: 292, loss: 0.3448503315448761, mean loss: 0.3418611386596447
Epoch: 50, step: 293, loss: 0.3568646013736725, mean loss: 0.34186134562108583
Epoch: 50, step: 294, loss: 0.30674201250076294, mean loss: 0.34186086118308157
Epoch: 50, step: 295, loss: 0.35039544105529785, mean loss: 0.3418609789079198
Epoch: 50, step: 296, loss: 0.3281238377094269, mean loss: 0.3418607894222694
Epoch: 50, step: 297, loss: 0.31104379892349243, mean loss: 0.3418603643486053
Epoch: 50, step: 298, loss: 0.33153846859931946, mean loss: 0.3418602219756657
Epoch: 50, step: 299, loss: 0.33147308230400085, mean loss: 0.34186007870477364
Epoch: 50, step: 300, loss: 0.33777913451194763, mean loss: 0.34186002241666463
Epoch: 50, step: 301, loss: 0.3663381040096283, mean loss: 0.3418603600360626
Epoch: 50, step: 302, loss: 0.3468247950077057, mean loss: 0.3418604285081944
Epoch: 50, step: 303, loss: 0.3214726448059082, mean loss: 0.341860147312899
Epoch: 50, step: 304, loss: 0.34731459617614746, mean loss: 0.34186022254148823
Epoch: 50, step: 305, loss: 0.34237393736839294, mean loss: 0.3418602296266236
Epoch: 50, step: 306, loss: 0.3193523585796356, mean loss: 0.34185991920320175
Epoch: 50, step: 307, loss: 0.356428325176239, mean loss: 0.3418601201245618
Epoch: 50, step: 308, loss: 0.3325592279434204, mean loss: 0.34185999185231725
Epoch: 50, step: 309, loss: 0.2932831943035126, mean loss: 0.34185932191992796
Epoch: 50, step: 310, loss: 0.3401895761489868, mean loss: 0.34185929889244565
Epoch: 50, step: 311, loss: 0.3401550352573395, mean loss: 0.3418592753892512
Epoch: 50, step: 312, loss: 0.34169936180114746, mean loss: 0.341859273183942
Epoch: 50, step: 313, loss: 0.29009464383125305, mean loss: 0.3418585593269026
Epoch: 50, step: 314, loss: 0.30600765347480774, mean loss: 0.34185806493393767
Epoch: 50, step: 315, loss: 0.3778700530529022, mean loss: 0.341858561541419
Epoch: 50, step: 316, loss: 0.34510868787765503, mean loss: 0.34185860636023857
Epoch: 50, step: 317, loss: 0.33337581157684326, mean loss: 0.3418584893852147
Epoch: 50, step: 318, loss: 0.2976853847503662, mean loss: 0.34185788026064545
Epoch: 50, step: 319, loss: 0.33271509408950806, mean loss: 0.34185775418802866
Epoch: 50, step: 320, loss: 0.35351938009262085, mean loss: 0.3418579149914636
Epoch: 50, step: 321, loss: 0.3315228521823883, mean loss: 0.34185777248211735
Epoch: 50, step: 322, loss: 0.3137848377227783, mean loss: 0.3418573853920251
Epoch: 50, step: 323, loss: 0.32366055250167847, mean loss: 0.34185713448428573
Epoch: 50, step: 324, loss: 0.3546335697174072, mean loss: 0.3418573106502317
Epoch: 50, step: 325, loss: 0.31624385714530945, mean loss: 0.3418569574878692
Epoch: 50, step: 326, loss: 0.35288241505622864, mean loss: 0.34185710950653214
Epoch: 50, step: 327, loss: 0.33863624930381775, mean loss: 0.34185706509802505
Epoch: 50, step: 328, loss: 0.3286983072757721, mean loss: 0.34185688367048817
Epoch: 50, step: 329, loss: 0.37414100766181946, mean loss: 0.341857328784565
Epoch: 50, step: 330, loss: 0.3244159519672394, mean loss: 0.341857088316671
Epoch: 50, step: 331, loss: 0.3148069977760315, mean loss: 0.3418567153765819
Epoch: 50, step: 332, loss: 0.35625335574150085, mean loss: 0.3418569138605873
Epoch: 50, step: 333, loss: 0.3495343029499054, mean loss: 0.3418570197059714
Epoch: 50, step: 334, loss: 0.3126649260520935, mean loss: 0.3418566172506925
Epoch: 50, step: 335, loss: 0.3203476369380951, mean loss: 0.3418563207223436
Epoch: 50, step: 336, loss: 0.3447662591934204, mean loss: 0.34185636083895266
Epoch: 50, step: 337, loss: 0.368621826171875, mean loss: 0.3418567298243856
Epoch: 50, step: 338, loss: 0.3229132890701294, mean loss: 0.3418564686760274
Epoch: 50, step: 339, loss: 0.31709954142570496, mean loss: 0.34185612738946486
Epoch: 50, step: 340, loss: 0.3889067769050598, mean loss: 0.3418567759971421
Epoch: 50, step: 341, loss: 0.34122467041015625, mean loss: 0.34185676728349224
Epoch: 50, step: 342, loss: 0.32096749544143677, mean loss: 0.3418564793263931
Epoch: 50, step: 343, loss: 0.34206581115722656, mean loss: 0.34185648221197745
Epoch: 50, step: 344, loss: 0.31009936332702637, mean loss: 0.341856044454463
Epoch: 50, step: 345, loss: 0.3333200216293335, mean loss: 0.3418559267908726
Epoch: 50, step: 346, loss: 0.34848299622535706, mean loss: 0.3418560181395078
Epoch: 50, step: 347, loss: 0.34835025668144226, mean loss: 0.34185610765594576
Epoch: 50, step: 348, loss: 0.3254101276397705, mean loss: 0.34185588096805186
Epoch: 50, step: 349, loss: 0.32391971349716187, mean loss: 0.34185563374313843
Epoch: 50, step: 350, loss: 0.3177979588508606, mean loss: 0.3418553021464011
Epoch: 50, step: 351, loss: 0.34628942608833313, mean loss: 0.34185536326289606
Epoch: 50, step: 352, loss: 0.3416915833950043, mean loss: 0.3418553610055136
Epoch: 50, step: 353, loss: 0.30158042907714844, mean loss: 0.3418548059026671
Epoch: 50, step: 354, loss: 0.2955199182033539, mean loss: 0.3418541672852362
Epoch: 50, step: 355, loss: 0.3394893407821655, mean loss: 0.341854134692115
Epoch: 50, step: 356, loss: 0.34087249636650085, mean loss: 0.3418541211629128
Epoch: 50, step: 357, loss: 0.33982178568840027, mean loss: 0.3418540931531072
Epoch: 50, step: 358, loss: 0.33407947421073914, mean loss: 0.34185398600418093
Epoch: 50, step: 359, loss: 0.3255675733089447, mean loss: 0.3418537615497612
Epoch: 50, step: 360, loss: 0.39654186367988586, mean loss: 0.34185451523427673
Epoch: 50, step: 361, loss: 0.37145519256591797, mean loss: 0.3418549231706254
Epoch: 50, step: 362, loss: 0.3025716245174408, mean loss: 0.34185438180245353
Epoch: 50, step: 363, loss: 0.3781895041465759, mean loss: 0.3418548825345293
Epoch: 50, step: 364, loss: 0.3124759793281555, mean loss: 0.34185447767125904
Epoch: 50, step: 365, loss: 0.3122362196445465, mean loss: 0.3418540695151249
Epoch: 50, step: 366, loss: 0.3291943371295929, mean loss: 0.3418538950593477
Epoch: 50, step: 367, loss: 0.29778507351875305, mean loss: 0.3418532877831166
Epoch: 50, step: 368, loss: 0.34305858612060547, mean loss: 0.34185330439211403
Epoch: 50, step: 369, loss: 0.34462714195251465, mean loss: 0.3418533426150376
Epoch: 50, step: 370, loss: 0.35642966628074646, mean loss: 0.3418535434710774
Epoch: 50, step: 371, loss: 0.34728044271469116, mean loss: 0.34185361825059624
Epoch: 50, step: 372, loss: 0.34862399101257324, mean loss: 0.3418537115411142
Epoch: 50, step: 373, loss: 0.36897018551826477, mean loss: 0.3418540851800755
Epoch: 50, step: 374, loss: 0.4159647226333618, mean loss: 0.3418551063393928
Epoch: 50, step: 375, loss: 0.371306836605072, mean loss: 0.3418555121447591
Epoch: 50, step: 376, loss: 0.31521105766296387, mean loss: 0.3418551450249487
Epoch: 50, step: 377, loss: 0.3306839168071747, mean loss: 0.34185499110463924
Epoch: 50, step: 378, loss: 0.3168821632862091, mean loss: 0.341854647026768
Epoch: 50, step: 379, loss: 0.32372596859931946, mean loss: 0.34185439725164496
Epoch: 50, step: 380, loss: 0.3408970832824707, mean loss: 0.3418543840620503
Epoch: 50, step: 381, loss: 0.3246382474899292, mean loss: 0.3418541468663741
Epoch: 50, step: 382, loss: 0.34009718894958496, mean loss: 0.3418541226601837
Epoch: 50, step: 383, loss: 0.358394056558609, mean loss: 0.34185435053318464
Epoch: 50, step: 384, loss: 0.3696230947971344, mean loss: 0.34185473310181813
Epoch: 50, step: 385, loss: 0.3178657293319702, mean loss: 0.34185440261103794
Epoch: 50, step: 386, loss: 0.37272223830223083, mean loss: 0.3418548278639853
Epoch: 50, step: 387, loss: 0.33638209104537964, mean loss: 0.34185475246947356
Epoch: 50, step: 388, loss: 0.31480422616004944, mean loss: 0.34185437981622985
Epoch: 50, step: 389, loss: 0.32501932978630066, mean loss: 0.3418541478965435
Epoch: 50, step: 390, loss: 0.368397980928421, mean loss: 0.3418545135594085
Epoch: 50, step: 391, loss: 0.3108581006526947, mean loss: 0.34185408656452054
Epoch: 50, step: 392, loss: 0.2999820411205292, mean loss: 0.34185350975896844
Epoch: 50, step: 393, loss: 0.3310964107513428, mean loss: 0.3418533615773142
Epoch: 50, step: 394, loss: 0.3422974646091461, mean loss: 0.3418533676948572
Epoch: 50, step: 395, loss: 0.31221234798431396, mean loss: 0.34185295939385285
Epoch: 50, step: 396, loss: 0.36235710978507996, mean loss: 0.3418532418318378
Epoch: 50, step: 397, loss: 0.3396291732788086, mean loss: 0.3418532111964408
Epoch: 50, step: 398, loss: 0.3306193947792053, mean loss: 0.3418530564585461
Epoch: 50, step: 399, loss: 0.352412611246109, mean loss: 0.3418532019069591
Epoch: 50, step: 400, loss: 0.3391619622707367, mean loss: 0.3418531648380532
Epoch: 50, step: 401, loss: 0.3338826894760132, mean loss: 0.34185305505491553
Epoch: 50, step: 402, loss: 0.33462077379226685, mean loss: 0.3418529554408326
Epoch: 50, step: 403, loss: 0.33013054728507996, mean loss: 0.3418527939840512
Epoch: 50, step: 404, loss: 0.3311031758785248, mean loss: 0.34185264592788284
Epoch: 50, step: 405, loss: 0.3396862745285034, mean loss: 0.3418526160905223
Epoch: 50, step: 406, loss: 0.3485907018184662, mean loss: 0.3418527088926726
Epoch: 50, step: 407, loss: 0.3442835807800293, mean loss: 0.34185274237206725
Epoch: 50, step: 408, loss: 0.3082716464996338, mean loss: 0.34185227987987105
Epoch: 50, step: 409, loss: 0.30144211649894714, mean loss: 0.34185172334270836
Epoch: 50, step: 410, loss: 0.32100531458854675, mean loss: 0.3418514362455915
Epoch: 50, step: 411, loss: 0.3215201199054718, mean loss: 0.3418511562461928
Epoch: 50, step: 412, loss: 0.3259288966655731, mean loss: 0.34185093697058677
Epoch: 50, step: 413, loss: 0.32497766613960266, mean loss: 0.34185070460119754
Epoch: 50, step: 414, loss: 0.37128937244415283, mean loss: 0.34185111000872825
Epoch: 50, step: 415, loss: 0.30662328004837036, mean loss: 0.34185062488382517
Epoch: 50, step: 416, loss: 0.32152706384658813, mean loss: 0.341850345010503
Epoch: 50, step: 417, loss: 0.29858842492103577, mean loss: 0.34184974926399264
Epoch: 50, step: 418, loss: 0.3426309823989868, mean loss: 0.34184976002196416
Epoch: 50, step: 419, loss: 0.3493247330188751, mean loss: 0.3418498629546686
Epoch: 50, step: 420, loss: 0.30855029821395874, mean loss: 0.34184940441561323
Epoch: 50, step: 421, loss: 0.3092908263206482, mean loss: 0.34184895608620763
Epoch: 50, step: 422, loss: 0.33541223406791687, mean loss: 0.34184886745420373
Epoch: 50, step: 423, loss: 0.3436063230037689, mean loss: 0.3418488916535807
Epoch: 50, step: 424, loss: 0.31561478972435, mean loss: 0.3418485304267039
Epoch: 50, step: 425, loss: 0.33388063311576843, mean loss: 0.34184842071534277
Epoch: 50, step: 426, loss: 0.3281688392162323, mean loss: 0.34184823236140416
Epoch: 50, step: 427, loss: 0.3363131284713745, mean loss: 0.3418481561496967
Epoch: 50, step: 428, loss: 0.3238483965396881, mean loss: 0.3418479083181197
Epoch: 50, step: 429, loss: 0.3179420530796051, mean loss: 0.34184757917237774
Epoch: 50, step: 430, loss: 0.36082372069358826, mean loss: 0.3418478404401769
Epoch: 50, step: 431, loss: 0.3627040684223175, mean loss: 0.34184812758947725
Epoch: 50, step: 432, loss: 0.34174609184265137, mean loss: 0.34184812618466476
Epoch: 50, step: 433, loss: 0.3099055588245392, mean loss: 0.341847686410353
Epoch: 50, step: 434, loss: 0.30771180987358093, mean loss: 0.3418472164457831
Epoch: 50, step: 435, loss: 0.3583928942680359, mean loss: 0.3418474442347283
Epoch: 50, step: 436, loss: 0.36435022950172424, mean loss: 0.3418477540325623
Epoch: 50, step: 437, loss: 0.4128189980983734, mean loss: 0.3418487310865019
Epoch: 50, step: 438, loss: 0.40305057168006897, mean loss: 0.3418495736344526
Epoch: 50, step: 439, loss: 0.3361804783344269, mean loss: 0.3418494955907398
Epoch: 50, step: 440, loss: 0.35469889640808105, mean loss: 0.3418496724798357
Epoch: 50, step: 441, loss: 0.3087753355503082, mean loss: 0.3418492171738567
Epoch: 50, step: 442, loss: 0.3455375134944916, mean loss: 0.3418492679467642
Epoch: 50, step: 443, loss: 0.3158304989337921, mean loss: 0.3418489097785877
Epoch: 50, step: 444, loss: 0.31938135623931885, mean loss: 0.34184860049985494
Epoch: 50, step: 445, loss: 0.30236220359802246, mean loss: 0.3418480569544856
Epoch: 50, step: 446, loss: 0.35082173347473145, mean loss: 0.34184818047887783
Epoch: 50, step: 447, loss: 0.33703330159187317, mean loss: 0.3418481142020514
Epoch: 50, step: 448, loss: 0.298942506313324, mean loss: 0.3418475236143229
Epoch: 50, step: 449, loss: 0.32832053303718567, mean loss: 0.3418473374203714
Epoch: 50, step: 450, loss: 0.29797276854515076, mean loss: 0.34184673351170014
Epoch: 50, step: 451, loss: 0.3455425798892975, mean loss: 0.34184678438223887
Epoch: 50, step: 452, loss: 0.3741565942764282, mean loss: 0.3418472290962891
Epoch: 50, step: 453, loss: 0.33200696110725403, mean loss: 0.34184709365614835
Epoch: 50, step: 454, loss: 0.3850369453430176, mean loss: 0.3418476881073449
Epoch: 50, step: 455, loss: 0.3521369993686676, mean loss: 0.3418478297241592
Epoch: 50, step: 456, loss: 0.3200473487377167, mean loss: 0.3418475296776257
Epoch: 50, step: 457, loss: 0.32457682490348816, mean loss: 0.34184729197902713
Epoch: 50, step: 458, loss: 0.31885939836502075, mean loss: 0.3418469755984877
Epoch: 50, step: 459, loss: 0.3464464247226715, mean loss: 0.34184703889946655
Epoch: 50, step: 460, loss: 0.3284752368927002, mean loss: 0.3418468548694916
Epoch: 50, step: 461, loss: 0.35188958048820496, mean loss: 0.34184699308101374
Epoch: 50, step: 462, loss: 0.34278297424316406, mean loss: 0.3418470059621384
Epoch: 50, step: 463, loss: 0.33334553241729736, mean loss: 0.34184688896508975
Epoch: 50, step: 464, loss: 0.352396160364151, mean loss: 0.3418470341418791
Epoch: 50, step: 465, loss: 0.3261657655239105, mean loss: 0.34184681834262476
Epoch: 50, step: 466, loss: 0.2994001507759094, mean loss: 0.3418462342168515
Epoch: 50, step: 467, loss: 0.34689420461654663, mean loss: 0.34184630368305946
Epoch: 50, step: 468, loss: 0.3746015429496765, mean loss: 0.3418467544287594
Epoch: 50, step: 469, loss: 0.35067957639694214, mean loss: 0.34184687597577973
Epoch: 50, step: 470, loss: 0.31322965025901794, mean loss: 0.3418464821842299
Epoch: 50, step: 471, loss: 0.3846355676651001, mean loss: 0.3418470709816413
Epoch: 50, step: 472, loss: 0.30921047925949097, mean loss: 0.341846621893373
Epoch: 50, step: 473, loss: 0.30479520559310913, mean loss: 0.34184611206294807
Epoch: 50, step: 474, loss: 0.32447800040245056, mean loss: 0.3418458730796435
Epoch: 50, step: 475, loss: 0.33347636461257935, mean loss: 0.3418457579177129
Epoch: 50, step: 476, loss: 0.33440104126930237, mean loss: 0.3418456554820503
Epoch: 50, step: 477, loss: 0.33399778604507446, mean loss: 0.3418455475006882
Epoch: 50, step: 478, loss: 0.32148098945617676, mean loss: 0.34184526730203324
Epoch: 50, step: 479, loss: 0.30700162053108215, mean loss: 0.3418447878902725
Epoch: 50, step: 480, loss: 0.3015861213207245, mean loss: 0.3418442339811825
Epoch: 50, step: 481, loss: 0.3426203727722168, mean loss: 0.3418442446597383
Epoch: 50, step: 482, loss: 0.3098829686641693, mean loss: 0.3418438049245045
Epoch: 50, step: 483, loss: 0.29489991068840027, mean loss: 0.34184315906167034
Epoch: 50, step: 484, loss: 0.30332615971565247, mean loss: 0.3418426291449152
Epoch: 50, step: 485, loss: 0.3641926646232605, mean loss: 0.3418429366324022
Epoch: 50, step: 486, loss: 0.33891138434410095, mean loss: 0.34184289630122483
Epoch: 50, step: 487, loss: 0.288421630859375, mean loss: 0.3418421613619578
Epoch: 50, step: 488, loss: 0.35737985372543335, mean loss: 0.34184237511771676
Epoch: 50, step: 489, loss: 0.3582380414009094, mean loss: 0.3418426006737256
Epoch: 50, step: 490, loss: 0.3157407343387604, mean loss: 0.3418422415939725
Epoch: 50, step: 491, loss: 0.34069347381591797, mean loss: 0.34184222579075096
Epoch: 50, step: 492, loss: 0.33462148904800415, mean loss: 0.34184212645881057
Epoch: 50, step: 493, loss: 0.337945818901062, mean loss: 0.34184207286006024
Epoch: 50, step: 494, loss: 0.29723161458969116, mean loss: 0.3418414591939447
Epoch: 50, step: 495, loss: 0.3536291718482971, mean loss: 0.3418416213447185
Epoch: 50, step: 496, loss: 0.3916647136211395, mean loss: 0.3418423066975154
Epoch: 50, step: 497, loss: 0.30664706230163574, mean loss: 0.34184182256804285
Epoch: 50, step: 498, loss: 0.3249065577983856, mean loss: 0.34184158961759276
Epoch: 50, step: 499, loss: 0.3221072256565094, mean loss: 0.3418413181682948
Epoch: 50, step: 500, loss: 0.3372798264026642, mean loss: 0.34184125542511706
Epoch: 50, step: 501, loss: 0.3338986337184906, mean loss: 0.34184114617610456
Epoch: 50, step: 502, loss: 0.3473888337612152, mean loss: 0.34184122248227605
Epoch: 50, step: 503, loss: 0.36214885115623474, mean loss: 0.3418415018015525
Epoch: 50, step: 504, loss: 0.30612218379974365, mean loss: 0.34184101051047205
Epoch: 50, step: 505, loss: 0.36097487807273865, mean loss: 0.34184127367812756
Epoch: 50, step: 506, loss: 0.3338760435581207, mean loss: 0.34184116412567567
Epoch: 50, step: 507, loss: 0.31415021419525146, mean loss: 0.3418407832741885
Epoch: 50, step: 508, loss: 0.30590498447418213, mean loss: 0.34184028903277686
Epoch: 50, step: 509, loss: 0.3136376738548279, mean loss: 0.3418399011546971
Epoch: 50, step: 510, loss: 0.34051719307899475, mean loss: 0.34183988296339074
Epoch: 50, step: 511, loss: 0.3149286210536957, mean loss: 0.3418395128558169
Epoch: 50, step: 512, loss: 0.34378525614738464, mean loss: 0.34183953961503866
Epoch: 50, step: 513, loss: 0.3400576412677765, mean loss: 0.3418395151094641
Epoch: 50, step: 514, loss: 0.34451764822006226, mean loss: 0.34183955194000953
Epoch: 50, step: 515, loss: 0.33091476559638977, mean loss: 0.34183940170091026
Epoch: 50, step: 516, loss: 0.3379698395729065, mean loss: 0.34183934848691455
Epoch: 50, step: 517, loss: 0.3210488259792328, mean loss: 0.34183906258077706
Epoch: 50, step: 518, loss: 0.33785316348075867, mean loss: 0.3418390077684295
Epoch: 50, step: 519, loss: 0.36250871419906616, mean loss: 0.3418392920053166
Epoch: 50, step: 520, loss: 0.31972163915634155, mean loss: 0.3418389878613575
Epoch: 50, step: 521, loss: 0.37736138701438904, mean loss: 0.34183947632975986
Epoch: 50, step: 522, loss: 0.3146594166755676, mean loss: 0.3418391025819819
Epoch: 50, step: 523, loss: 0.3205472230911255, mean loss: 0.341838809805464
Epoch: 50, step: 524, loss: 0.2944192588329315, mean loss: 0.3418381577662619
Epoch: 50, step: 525, loss: 0.3141575753688812, mean loss: 0.3418377771515932
Epoch: 50, step: 526, loss: 0.32764968276023865, mean loss: 0.3418375820645637
Epoch: 50, step: 527, loss: 0.36028435826301575, mean loss: 0.34183783570520004
Epoch: 50, step: 528, loss: 0.35836443305015564, mean loss: 0.3418380629405167
Epoch: 50, step: 529, loss: 0.3238983154296875, mean loss: 0.3418378162782383
Epoch: 50, step: 530, loss: 0.3122432827949524, mean loss: 0.3418374093742567
Epoch: 50, step: 531, loss: 0.3044191300868988, mean loss: 0.34183689490635694
Epoch: 50, step: 532, loss: 0.3664461076259613, mean loss: 0.34183723325638676
Epoch: 50, step: 533, loss: 0.3040601909160614, mean loss: 0.34183671387009784
Epoch: 50, step: 534, loss: 0.32185110449790955, mean loss: 0.3418364390971636
Epoch: 50, step: 535, loss: 0.30799591541290283, mean loss: 0.3418359738457931
Epoch: 50, step: 536, loss: 0.30092304944992065, mean loss: 0.341835411368314
Epoch: 50, step: 537, loss: 0.32675984501838684, mean loss: 0.34183520410984736
Epoch: 50, step: 538, loss: 0.31777432560920715, mean loss: 0.34183487332610685
Epoch: 50, step: 539, loss: 0.3050681948661804, mean loss: 0.34183436787273236
Epoch: 50, step: 540, loss: 0.3207234740257263, mean loss: 0.341834077652721
Epoch: 50, step: 541, loss: 0.3237592577934265, mean loss: 0.3418338291742648
Epoch: 50, step: 542, loss: 0.3377608358860016, mean loss: 0.34183377318271524
Epoch: 50, step: 543, loss: 0.3479635715484619, mean loss: 0.3418338574480617
Epoch: 50, step: 544, loss: 0.3311426341533661, mean loss: 0.341833710479565
Epoch: 50, step: 545, loss: 0.3981701135635376, mean loss: 0.3418344849056927
Epoch: 50, step: 546, loss: 0.308075487613678, mean loss: 0.3418340208453563
Epoch: 50, step: 547, loss: 0.30644580721855164, mean loss: 0.34183353439605696
Epoch: 50, step: 548, loss: 0.32088860869407654, mean loss: 0.3418332464893407
Epoch: 50, step: 549, loss: 0.318479061126709, mean loss: 0.34183292546961064
Epoch: 50, step: 550, loss: 0.32729560136795044, mean loss: 0.3418327256465965
Epoch: 50, step: 551, loss: 0.34004825353622437, mean loss: 0.34183270111844455
Epoch: 50, step: 552, loss: 0.3096502125263214, mean loss: 0.34183225876570866
Epoch: 50, step: 553, loss: 0.33395078778266907, mean loss: 0.3418321504352941
Epoch: 50, step: 554, loss: 0.33283090591430664, mean loss: 0.3418320267153501
Epoch: 50, step: 555, loss: 0.3307096064090729, mean loss: 0.3418318738424557
Epoch: 50, step: 556, loss: 0.3481023907661438, mean loss: 0.3418319600268356
Epoch: 50, step: 557, loss: 0.31104475259780884, mean loss: 0.34183153688151235
Epoch: 50, step: 558, loss: 0.36227181553840637, mean loss: 0.3418318178127876
Epoch: 50, step: 559, loss: 0.3555246889591217, mean loss: 0.34183200600507935
Epoch: 50, step: 560, loss: 0.3795798420906067, mean loss: 0.34183252479723564
Epoch: 50, step: 561, loss: 0.33174416422843933, mean loss: 0.3418323861484826
Epoch: 50, step: 562, loss: 0.34656840562820435, mean loss: 0.3418324512367758
Epoch: 50, step: 563, loss: 0.29036906361579895, mean loss: 0.34183174397236454
Epoch: 50, step: 564, loss: 0.34768447279930115, mean loss: 0.3418318244056611
Epoch: 50, step: 565, loss: 0.3318045735359192, mean loss: 0.3418316866043409
Epoch: 50, step: 566, loss: 0.33032941818237305, mean loss: 0.3418315285344957
Epoch: 50, step: 567, loss: 0.3855527341365814, mean loss: 0.3418321293646079
Epoch: 50, step: 568, loss: 0.32923078536987305, mean loss: 0.34183195619548373
Epoch: 50, step: 569, loss: 0.31186410784721375, mean loss: 0.34183154437951085
Epoch: 50, step: 570, loss: 0.3216296434402466, mean loss: 0.34183126677028547
Epoch: 50, step: 571, loss: 0.3760812282562256, mean loss: 0.3418317374178077
Epoch: 50, step: 572, loss: 0.38003841042518616, mean loss: 0.34183226242946047
Epoch: 50, step: 573, loss: 0.3189738988876343, mean loss: 0.34183194832877145
Epoch: 50, step: 574, loss: 0.3443012535572052, mean loss: 0.34183198225945133
Epoch: 50, step: 575, loss: 0.3116910457611084, mean loss: 0.34183156809906196
Epoch: 50, step: 576, loss: 0.37035730481147766, mean loss: 0.3418319600599385
Epoch: 50, step: 577, loss: 0.3254541754722595, mean loss: 0.34183173502236414
Epoch: 50, step: 578, loss: 0.3232194483280182, mean loss: 0.34183147928531504
Epoch: 50, step: 579, loss: 0.3108513355255127, mean loss: 0.34183105361694793
Epoch: 50, step: 580, loss: 0.3636344075202942, mean loss: 0.34183135319175323
Epoch: 50, step: 581, loss: 0.3423798978328705, mean loss: 0.34183136072857057
Epoch: 50, step: 582, loss: 0.3054652214050293, mean loss: 0.3418308610770129
Epoch: 50, step: 583, loss: 0.291887104511261, mean loss: 0.3418301748855894
Epoch: 50, step: 584, loss: 0.3711579144001007, mean loss: 0.34183057782217685
Epoch: 50, step: 585, loss: 0.3428577482700348, mean loss: 0.3418305919343749
Epoch: 50, step: 586, loss: 0.320598840713501, mean loss: 0.34183030023735184
Epoch: 50, step: 587, loss: 0.38019558787345886, mean loss: 0.34183082731994285
Epoch: 50, step: 588, loss: 0.3361869156360626, mean loss: 0.34183074978196754
Epoch: 50, step: 589, loss: 0.3407485783100128, mean loss: 0.3418307349149326
Epoch: 50, step: 590, loss: 0.31803449988365173, mean loss: 0.34183040800315734
Epoch: 50, step: 591, loss: 0.360662043094635, mean loss: 0.34183066670789264
Epoch: 50, step: 592, loss: 0.2668270468711853, mean loss: 0.3418296363393155
Epoch: 50, step: 593, loss: 0.3342001140117645, mean loss: 0.3418295315295465
Epoch: 50, step: 594, loss: 0.30523478984832764, mean loss: 0.34182902881999666
Epoch: 50, step: 595, loss: 0.36182039976119995, mean loss: 0.3418293034418295
Epoch: 50, step: 596, loss: 0.33191612362861633, mean loss: 0.34182916726616547
Epoch: 50, step: 597, loss: 0.29029977321624756, mean loss: 0.34182845942537243
Epoch: 50, step: 598, loss: 0.33222270011901855, mean loss: 0.34182832747631675
Epoch: 50, step: 599, loss: 0.4424814283847809, mean loss: 0.3418297100738567
Epoch: 50, step: 600, loss: 0.3196032643318176, mean loss: 0.34182940476972984
Epoch: 50, step: 601, loss: 0.36310458183288574, mean loss: 0.34182969700314464
Epoch: 50, step: 602, loss: 0.34243887662887573, mean loss: 0.3418297053706518
Epoch: 50, step: 603, loss: 0.33907726407051086, mean loss: 0.3418296675644695
Epoch: 50, step: 604, loss: 0.3150126039981842, mean loss: 0.34182929922350985
Epoch: 50, step: 605, loss: 0.3222880959510803, mean loss: 0.34182903082250893
Epoch: 50, step: 606, loss: 0.31112605333328247, mean loss: 0.3418286091188611
Epoch: 50, step: 607, loss: 0.3208528757095337, mean loss: 0.34182832102231386
Epoch: 50, step: 608, loss: 0.34360799193382263, mean loss: 0.3418283454653211
Epoch: 50, step: 609, loss: 0.3424152433872223, mean loss: 0.3418283535259985
Epoch: 50, step: 610, loss: 0.3246452510356903, mean loss: 0.3418281175300296
Epoch: 50, step: 611, loss: 0.35000964999198914, mean loss: 0.34182822989519557
Epoch: 50, step: 612, loss: 0.3617613613605499, mean loss: 0.3418285036530611
Epoch: 50, step: 613, loss: 0.34112751483917236, mean loss: 0.34182849402594523
Epoch: 50, step: 614, loss: 0.2828945815563202, mean loss: 0.3418276846609453
Epoch: 50, step: 615, loss: 0.35030660033226013, mean loss: 0.3418278011039753
Epoch: 50, step: 616, loss: 0.32717713713645935, mean loss: 0.34182759990557426
Epoch: 50, step: 617, loss: 0.35826393961906433, mean loss: 0.341827825623662
Epoch: 50, step: 618, loss: 0.332941472530365, mean loss: 0.34182770359022163
Epoch: 50, step: 619, loss: 0.3581065535545349, mean loss: 0.3418279271393835
Epoch: 50, step: 620, loss: 0.3070211708545685, mean loss: 0.3418274491624773
Epoch: 50, step: 621, loss: 0.3272913694381714, mean loss: 0.34182724955137456
Epoch: 50, step: 622, loss: 0.3265683948993683, mean loss: 0.3418270400179215
Epoch: 50, step: 623, loss: 0.40182530879974365, mean loss: 0.3418278638983563
Epoch: 50, step: 624, loss: 0.3284744620323181, mean loss: 0.3418276805354745
Epoch: 50, step: 625, loss: 0.3057814836502075, mean loss: 0.34182718557218
Epoch: 50, step: 626, loss: 0.29108381271362305, mean loss: 0.3418264888062435
Epoch: 50, step: 627, loss: 0.33626025915145874, mean loss: 0.341826412376441
Epoch: 50, step: 628, loss: 0.3168259561061859, mean loss: 0.34182606910032476
Epoch: 50, step: 629, loss: 0.30459895730018616, mean loss: 0.341825557949538
Epoch: 50, step: 630, loss: 0.3330375552177429, mean loss: 0.341825437286596
Epoch: 50, step: 631, loss: 0.2963069975376129, mean loss: 0.3418248123080186
Epoch: 50, step: 632, loss: 0.3392171263694763, mean loss: 0.3418247765043865
Epoch: 50, step: 633, loss: 0.31841710209846497, mean loss: 0.34182445512049425
Epoch: 50, step: 634, loss: 0.3247937262058258, mean loss: 0.3418242212943267
Epoch: 50, step: 635, loss: 0.31854280829429626, mean loss: 0.3418239016527621
Epoch: 50, step: 636, loss: 0.32792919874191284, mean loss: 0.3418237108884128
Epoch: 50, step: 637, loss: 0.3190959095954895, mean loss: 0.34182339885621404
Epoch: 50, step: 638, loss: 0.3504366874694824, mean loss: 0.34182351710726927
Epoch: 50, step: 639, loss: 0.3339535593986511, mean loss: 0.34182340906281966
Epoch: 50, step: 640, loss: 0.3129720687866211, mean loss: 0.3418230129762712
Epoch: 50, step: 641, loss: 0.3272130787372589, mean loss: 0.3418228124060749
Epoch: 50, step: 642, loss: 0.37450870871543884, mean loss: 0.34182326112312816
Epoch: 50, step: 643, loss: 0.38862845301628113, mean loss: 0.34182390366323984
Epoch: 50, step: 644, loss: 0.35720258951187134, mean loss: 0.34182411477842756
Epoch: 50, step: 645, loss: 0.30794650316238403, mean loss: 0.34182364972047496
Epoch: 50, step: 646, loss: 0.30743297934532166, mean loss: 0.34182317762594294
Epoch: 50, step: 647, loss: 0.3152795732021332, mean loss: 0.3418228132562358
Epoch: 50, step: 648, loss: 0.33474260568618774, mean loss: 0.3418227160660538
Epoch: 50, step: 649, loss: 0.3248022496700287, mean loss: 0.34182248242890356
Epoch: 50, step: 650, loss: 0.3320504128932953, mean loss: 0.3418223482911493
Epoch: 50, step: 651, loss: 0.35216954350471497, mean loss: 0.34182249032150147
Epoch: 50, step: 652, loss: 0.3013375997543335, mean loss: 0.3418219346149339
Epoch: 50, step: 653, loss: 0.3519788980484009, mean loss: 0.3418220740302499
Epoch: 50, step: 654, loss: 0.3727656304836273, mean loss: 0.3418224987582226
Epoch: 50, step: 655, loss: 0.3319336175918579, mean loss: 0.341822363026352
Epoch: 50, step: 656, loss: 0.37560006976127625, mean loss: 0.3418228266428437
Epoch: 50, step: 657, loss: 0.3632320165634155, mean loss: 0.341823120491013
Epoch: 50, step: 658, loss: 0.2914462685585022, mean loss: 0.34182242906165033
Epoch: 50, step: 659, loss: 0.3223849833011627, mean loss: 0.341822162283641
Epoch: 50, step: 660, loss: 0.3355875611305237, mean loss: 0.3418220767152141
Epoch: 50, step: 661, loss: 0.31989315152168274, mean loss: 0.3418217757500307
Epoch: 50, step: 662, loss: 0.36096346378326416, mean loss: 0.3418220384579625
Epoch: 50, step: 663, loss: 0.3729524314403534, mean loss: 0.3418224656976554
Epoch: 50, step: 664, loss: 0.3069739043712616, mean loss: 0.34182198743564585
Epoch: 50, step: 665, loss: 0.33498045802116394, mean loss: 0.3418218935437152
Epoch: 50, step: 666, loss: 0.3082190155982971, mean loss: 0.3418214323901348
Epoch: 50, step: 667, loss: 0.3979320824146271, mean loss: 0.3418222024215618
Epoch: 50, step: 668, loss: 0.37662237882614136, mean loss: 0.3418226799933194
Epoch: 50, step: 669, loss: 0.3583848476409912, mean loss: 0.34182290727708015
Epoch: 50, step: 670, loss: 0.34523481130599976, mean loss: 0.34182295409823027
Epoch: 50, step: 671, loss: 0.348849892616272, mean loss: 0.34182305052674217
Epoch: 50, step: 672, loss: 0.32707279920578003, mean loss: 0.3418228481163663
Epoch: 50, step: 673, loss: 0.3509455919265747, mean loss: 0.34182297330153266
Epoch: 50, step: 674, loss: 0.3073726296424866, mean loss: 0.3418225005695442
Epoch: 50, step: 675, loss: 0.33069515228271484, mean loss: 0.34182234788075383
Epoch: 50, step: 676, loss: 0.3319057822227478, mean loss: 0.34182221180811556
Epoch: 50, step: 677, loss: 0.3214108347892761, mean loss: 0.34182193173213904
Epoch: 50, step: 678, loss: 0.29551461338996887, mean loss: 0.3418212963321151
Epoch: 50, step: 679, loss: 0.35907140374183655, mean loss: 0.34182153302403895
Epoch: 50, step: 680, loss: 0.31684714555740356, mean loss: 0.3418211903505374
Epoch: 50, step: 681, loss: 0.3356829583644867, mean loss: 0.34182110612902883
Epoch: 50, step: 682, loss: 0.36344751715660095, mean loss: 0.3418214028568121
Epoch: 50, step: 683, loss: 0.3706427216529846, mean loss: 0.3418217982977703
Epoch: 50, step: 684, loss: 0.30248886346817017, mean loss: 0.34182125864029855
Epoch: 50, step: 685, loss: 0.3130543828010559, mean loss: 0.3418208639571517
Epoch: 50, step: 686, loss: 0.35866519808769226, mean loss: 0.3418210950591882
Epoch: 50, step: 687, loss: 0.3316362798213959, mean loss: 0.34182095532678725
Epoch: 50, step: 688, loss: 0.3439868688583374, mean loss: 0.3418209850420191
Epoch: 50, step: 689, loss: 0.30338338017463684, mean loss: 0.341820457704869
Epoch: 50, step: 690, loss: 0.31890448927879333, mean loss: 0.3418201433180664
Epoch: 50, step: 691, loss: 0.3284262418746948, mean loss: 0.34181995956811523
Epoch: 50, step: 692, loss: 0.3198097050189972, mean loss: 0.3418196576151904
Epoch: 50, step: 693, loss: 0.32921820878982544, mean loss: 0.3418194847415818
Epoch: 50, step: 694, loss: 0.3411429822444916, mean loss: 0.34181947546107566
Epoch: 50, step: 695, loss: 0.35278570652008057, mean loss: 0.3418196258977397
Epoch: 50, step: 696, loss: 0.333334743976593, mean loss: 0.3418195095022512
Epoch: 50, step: 697, loss: 0.3301592469215393, mean loss: 0.3418193495491307
Epoch: 50, step: 698, loss: 0.3276751935482025, mean loss: 0.3418191555251249
Epoch: 50, step: 699, loss: 0.33693456649780273, mean loss: 0.34181908852116016
Epoch: 50, step: 700, loss: 0.32478609681129456, mean loss: 0.3418188548756449
Epoch: 50, step: 701, loss: 0.36236897110939026, mean loss: 0.3418191367625099
Epoch: 50, step: 702, loss: 0.32325392961502075, mean loss: 0.3418188821062249
Epoch: 50, step: 703, loss: 0.3212433457374573, mean loss: 0.3418185998784134
Epoch: 50, step: 704, loss: 0.3494613468647003, mean loss: 0.34181870471000225
Epoch: 50, step: 705, loss: 0.29603826999664307, mean loss: 0.3418180767721821
Epoch: 50, step: 706, loss: 0.3985660970211029, mean loss: 0.34181885513393406
Epoch: 50, step: 707, loss: 0.31440454721450806, mean loss: 0.34181847912159086
Epoch: 50, step: 708, loss: 0.37257876992225647, mean loss: 0.3418189010213673
Epoch: 50, step: 709, loss: 0.33039039373397827, mean loss: 0.34181874427322184
Epoch: 50, step: 710, loss: 0.40410345792770386, mean loss: 0.34181959852996846
Epoch: 50, step: 711, loss: 0.3197670578956604, mean loss: 0.3418192960757684
Epoch: 50, step: 712, loss: 0.3170345425605774, mean loss: 0.34181895615348407
Epoch: 50, step: 713, loss: 0.34767770767211914, mean loss: 0.3418190365050149
Epoch: 50, step: 714, loss: 0.31971392035484314, mean loss: 0.3418187333422068
Epoch: 50, step: 715, loss: 0.37115219235420227, mean loss: 0.3418191356333228
Epoch: 50, step: 716, loss: 0.3565097749233246, mean loss: 0.34181933710402634
Epoch: 50, step: 717, loss: 0.32304930686950684, mean loss: 0.3418190796911758
Epoch: 50, step: 718, loss: 0.34790706634521484, mean loss: 0.34181916318089256
Epoch: 50, step: 719, loss: 0.37375548481941223, mean loss: 0.341819601144711
Epoch: 50, step: 720, loss: 0.28353434801101685, mean loss: 0.3418188018515974
Epoch: 50, step: 721, loss: 0.3357190489768982, mean loss: 0.3418187182039619
Epoch: 50, step: 722, loss: 0.3243853747844696, mean loss: 0.3418184791388738
Epoch: 50, step: 723, loss: 0.3614109754562378, mean loss: 0.3418187478089456
Epoch: 50, step: 724, loss: 0.3549618721008301, mean loss: 0.34181892803690983
Epoch: 50, step: 725, loss: 0.2914678454399109, mean loss: 0.3418182375961535
Epoch: 50, step: 726, loss: 0.30973920226097107, mean loss: 0.34181779771743453
Epoch: 50, step: 727, loss: 0.3388272225856781, mean loss: 0.3418177567102064
Epoch: 50, step: 728, loss: 0.2950182557106018, mean loss: 0.3418171149970196
Epoch: 50, step: 729, loss: 0.34768399596214294, mean loss: 0.3418171954423914
Epoch: 50, step: 730, loss: 0.29967671632766724, mean loss: 0.34181661762940224
Epoch: 50, step: 731, loss: 0.3090972304344177, mean loss: 0.34181616900071804
Epoch: 50, step: 732, loss: 0.36108872294425964, mean loss: 0.3418164332508372
Epoch: 50, step: 733, loss: 0.3150663673877716, mean loss: 0.34181606647997775
Epoch: 50, step: 734, loss: 0.32469892501831055, mean loss: 0.341815831789617
Epoch: 50, step: 735, loss: 0.3334813117980957, mean loss: 0.3418157175179269
Epoch: 50, step: 736, loss: 0.34746119379997253, mean loss: 0.3418157949200175
Epoch: 50, step: 737, loss: 0.3052676022052765, mean loss: 0.3418152938342637
Epoch: 50, step: 738, loss: 0.3380955755710602, mean loss: 0.34181524283660447
Epoch: 50, step: 739, loss: 0.3508886396884918, mean loss: 0.34181536723195477
Epoch: 50, step: 740, loss: 0.3405481278896332, mean loss: 0.3418153498584701
Epoch: 50, step: 741, loss: 0.3120799660682678, mean loss: 0.34181494220055303
Epoch: 50, step: 742, loss: 0.3188129961490631, mean loss: 0.3418146268591762
Epoch: 50, step: 743, loss: 0.35082802176475525, mean loss: 0.3418147504251296
Epoch: 50, step: 744, loss: 0.3433326184749603, mean loss: 0.34181477123352016
Epoch: 50, step: 745, loss: 0.32725781202316284, mean loss: 0.3418145716755018
Epoch: 50, step: 746, loss: 0.3220360577106476, mean loss: 0.3418143005401026
Epoch: 50, step: 747, loss: 0.34334784746170044, mean loss: 0.3418143215625696
Epoch: 50, step: 748, loss: 0.3299683928489685, mean loss: 0.34181415917612545
Epoch: 50, step: 749, loss: 0.316377729177475, mean loss: 0.34181381049305487
Epoch: 50, step: 750, loss: 0.3081376850605011, mean loss: 0.34181334886640913
Epoch: 50, step: 751, loss: 0.3035549521446228, mean loss: 0.3418128244339505
Epoch: 50, step: 752, loss: 0.33322492241859436, mean loss: 0.34181270671566594
Epoch: 50, step: 753, loss: 0.3382268249988556, mean loss: 0.3418126575630257
Epoch: 50, step: 754, loss: 0.3552905023097992, mean loss: 0.34181284230491793
Epoch: 50, step: 755, loss: 0.3291229009628296, mean loss: 0.3418126683652647
Epoch: 50, step: 756, loss: 0.33442559838294983, mean loss: 0.3418125671128834
Epoch: 50, step: 757, loss: 0.3363661468029022, mean loss: 0.34181249246143586
Epoch: 50, step: 758, loss: 0.35761305689811707, mean loss: 0.34181270902915795
Epoch: 50, step: 759, loss: 0.3506290018558502, mean loss: 0.3418128298665048
Epoch: 50, step: 760, loss: 0.3181530237197876, mean loss: 0.3418125055863257
Epoch: 50, step: 761, loss: 0.34805235266685486, mean loss: 0.3418125911082012
Epoch: 50, step: 762, loss: 0.32781898975372314, mean loss: 0.34181239931782315
Epoch: 50, step: 763, loss: 0.35674557089805603, mean loss: 0.34181260398274804
Epoch: 50, step: 764, loss: 0.3043608069419861, mean loss: 0.3418120906983371
Epoch: 50, step: 765, loss: 0.35722190141677856, mean loss: 0.3418123018899979
Epoch: 50, step: 766, loss: 0.3446142375469208, mean loss: 0.34181234029003704
Epoch: 50, step: 767, loss: 0.3382551372051239, mean loss: 0.3418122915398577
Epoch: 50, step: 768, loss: 0.30632635951042175, mean loss: 0.34181180522468235
Epoch: 50, step: 769, loss: 0.3281140625476837, mean loss: 0.34181161750722755
Epoch: 50, step: 770, loss: 0.37013810873031616, mean loss: 0.3418120056955657
Epoch: 50, step: 771, loss: 0.3481232225894928, mean loss: 0.3418120921837652
Epoch: 50, step: 772, loss: 0.3067072331905365, mean loss: 0.34181161111735714
Epoch: 50, step: 773, loss: 0.3301311433315277, mean loss: 0.34181145105394023
Epoch: 50, step: 774, loss: 0.3273024260997772, mean loss: 0.3418112522320841
Epoch: 50, step: 775, loss: 0.3045445382595062, mean loss: 0.3418107415612612
Epoch: 50, step: 776, loss: 0.3098790645599365, mean loss: 0.34181030400316753
Epoch: 50, step: 777, loss: 0.35086706280708313, mean loss: 0.3418104281057574
Epoch: 50, step: 778, loss: 0.35054782032966614, mean loss: 0.3418105478305032
Epoch: 50, step: 779, loss: 0.33212754130363464, mean loss: 0.3418104151502274
Epoch: 50, step: 780, loss: 0.3305850923061371, mean loss: 0.34181026133864845
Epoch: 50, step: 781, loss: 0.343164324760437, mean loss: 0.34181027989203727
Epoch: 50, step: 782, loss: 0.31377434730529785, mean loss: 0.3418098957487082
Epoch: 50, step: 783, loss: 0.3588796854019165, mean loss: 0.3418101296327054
Epoch: 50, step: 784, loss: 0.326805055141449, mean loss: 0.341809924041495
Epoch: 50, step: 785, loss: 0.36691004037857056, mean loss: 0.34181026794465913
Epoch: 50, step: 786, loss: 0.32265880703926086, mean loss: 0.34181000554915164
Epoch: 50, step: 787, loss: 0.33714017271995544, mean loss: 0.3418099415683215
Epoch: 50, step: 788, loss: 0.3085878789424896, mean loss: 0.34180948640298664
Epoch: 50, step: 789, loss: 0.28904253244400024, mean loss: 0.3418087634689688
Epoch: 50, step: 790, loss: 0.40894606709480286, mean loss: 0.3418096832714599
Epoch: 50, step: 791, loss: 0.28770431876182556, mean loss: 0.3418089420208501
Epoch: 50, step: 792, loss: 0.3295692801475525, mean loss: 0.3418087743381699
Epoch: 50, step: 793, loss: 0.32960623502731323, mean loss: 0.341808607166357
Epoch: 50, step: 794, loss: 0.3448777496814728, mean loss: 0.34180864921228504
Epoch: 50, step: 795, loss: 0.31852760910987854, mean loss: 0.3418083302764515
Epoch: 50, step: 796, loss: 0.3423910439014435, mean loss: 0.341808338259158
Epoch: 50, step: 797, loss: 0.34617993235588074, mean loss: 0.3418083981456494
Epoch: 50, step: 798, loss: 0.3091195225715637, mean loss: 0.3418079503466991
Epoch: 50, step: 799, loss: 0.3259175419807434, mean loss: 0.34180773266987213
Epoch: 50, step: 800, loss: 0.32070067524909973, mean loss: 0.34180744353605996
Epoch: 50, step: 801, loss: 0.33386465907096863, mean loss: 0.3418073347337742
Epoch: 50, step: 802, loss: 0.34936338663101196, mean loss: 0.34180743823708093
Epoch: 50, step: 803, loss: 0.3137190639972687, mean loss: 0.34180705348591334
Epoch: 50, step: 804, loss: 0.3063763380050659, mean loss: 0.3418065681668875
Epoch: 50, step: 805, loss: 0.337178498506546, mean loss: 0.34180650477388336
Epoch: 50, step: 806, loss: 0.3030368983745575, mean loss: 0.3418059737343063
Epoch: 50, step: 807, loss: 0.3074071705341339, mean loss: 0.34180550256945863
Epoch: 50, step: 808, loss: 0.31270208954811096, mean loss: 0.3418051039417138
Epoch: 50, step: 809, loss: 0.35830825567245483, mean loss: 0.3418053299813211
Epoch: 50, step: 810, loss: 0.3698926270008087, mean loss: 0.34180571468084614
Epoch: 50, step: 811, loss: 0.3739049732685089, mean loss: 0.341806154324447
Epoch: 50, step: 812, loss: 0.3116794526576996, mean loss: 0.34180574170338407
Epoch: 50, step: 813, loss: 0.33964499831199646, mean loss: 0.341805712109835
Epoch: 50, step: 814, loss: 0.34207236766815186, mean loss: 0.34180571576190044
Epoch: 50, step: 815, loss: 0.3429536521434784, mean loss: 0.3418057314836105
Epoch: 50, step: 816, loss: 0.30423811078071594, mean loss: 0.3418052169784856
Epoch: 50, step: 817, loss: 0.28310462832450867, mean loss: 0.3418044130590595
Epoch: 50, step: 818, loss: 0.3145100474357605, mean loss: 0.34180403926092995
Epoch: 50, step: 819, loss: 0.30994102358818054, mean loss: 0.3418036029008139
Epoch: 50, step: 820, loss: 0.3434425890445709, mean loss: 0.341803625346222
Epoch: 50, step: 821, loss: 0.2927754819393158, mean loss: 0.34180295393016374
Epoch: 50, step: 822, loss: 0.329380065202713, mean loss: 0.34180278380720625
Epoch: 50, step: 823, loss: 0.36599719524383545, mean loss: 0.3418031151285723
Epoch: 50, step: 824, loss: 0.36441096663475037, mean loss: 0.3418034247191441
Epoch: 50, step: 825, loss: 0.3092952370643616, mean loss: 0.3418029795600548
Epoch: 50, step: 826, loss: 0.3037581443786621, mean loss: 0.34180245859061636
Epoch: 50, step: 827, loss: 0.32401061058044434, mean loss: 0.3418022149601183
Epoch: 50, step: 828, loss: 0.33375948667526245, mean loss: 0.34180210482950873
Epoch: 50, step: 829, loss: 0.3057420253753662, mean loss: 0.3418016110587371
Epoch: 50, step: 830, loss: 0.322275310754776, mean loss: 0.34180134368871196
Epoch: 50, step: 831, loss: 0.3269701898097992, mean loss: 0.34180114061124073
Epoch: 50, step: 832, loss: 0.31213605403900146, mean loss: 0.34180073442381076
Epoch: 50, step: 833, loss: 0.3763090670108795, mean loss: 0.3418012069206285
Epoch: 50, step: 834, loss: 0.3036338984966278, mean loss: 0.3418006843313436
Epoch: 50, step: 835, loss: 0.3645748198032379, mean loss: 0.3418009961520275
Epoch: 50, step: 836, loss: 0.3532981872558594, mean loss: 0.3418011535680099
Epoch: 50, step: 837, loss: 0.302874892950058, mean loss: 0.3418006206089938
Epoch: 50, step: 838, loss: 0.33276087045669556, mean loss: 0.3418004968429215
Epoch: 50, step: 839, loss: 0.30774232745170593, mean loss: 0.3418000305481599
Epoch: 50, step: 840, loss: 0.3206920027732849, mean loss: 0.34179974155940324
Epoch: 50, step: 841, loss: 0.3567960262298584, mean loss: 0.34179994686983656
Epoch: 50, step: 842, loss: 0.33842504024505615, mean loss: 0.34179990066545524
Epoch: 50, step: 843, loss: 0.3393229842185974, mean loss: 0.3417998667555318
Epoch: 50, step: 844, loss: 0.3264678716659546, mean loss: 0.34179965685759095
Epoch: 50, step: 845, loss: 0.3456191122531891, mean loss: 0.3417997091459489
Epoch: 50, step: 846, loss: 0.32016560435295105, mean loss: 0.3417994129790318
Epoch: 50, step: 847, loss: 0.3162345290184021, mean loss: 0.3417990630052617
Epoch: 50, step: 848, loss: 0.36974409222602844, mean loss: 0.3417994455570998
Epoch: 50, step: 849, loss: 0.29909735918045044, mean loss: 0.3417988609973958
Epoch: 50, step: 850, loss: 0.2908114194869995, mean loss: 0.3417981630269161
Epoch: 50, step: 851, loss: 0.3937815725803375, mean loss: 0.3417988746215275
Epoch: 50, step: 852, loss: 0.3449779748916626, mean loss: 0.34179891813925123
Epoch: 50, step: 853, loss: 0.32706359028816223, mean loss: 0.3417987164346512
Epoch: 50, step: 854, loss: 0.2909037172794342, mean loss: 0.34179801976776797
Epoch: 50, step: 855, loss: 0.3330186903476715, mean loss: 0.3417978995951686
Epoch: 50, step: 856, loss: 0.34452199935913086, mean loss: 0.34179793688248894
Epoch: 50, step: 857, loss: 0.2854929268360138, mean loss: 0.34179716619330985
Epoch: 50, step: 858, loss: 0.29461508989334106, mean loss: 0.34179652038545183
Epoch: 50, step: 859, loss: 0.35421881079673767, mean loss: 0.3417966904140641
Epoch: 50, step: 860, loss: 0.3804948031902313, mean loss: 0.3417972200825983
Epoch: 50, step: 861, loss: 0.3229672312736511, mean loss: 0.3417969623564368
Epoch: 50, step: 862, loss: 0.2852779030799866, mean loss: 0.34179618879034623
Epoch: 50, step: 863, loss: 0.2911233901977539, mean loss: 0.3417954952504553
Epoch: 50, step: 864, loss: 0.3719155192375183, mean loss: 0.3417959074864641
Epoch: 50, step: 865, loss: 0.2921152114868164, mean loss: 0.3417952275437274
Epoch: 50, step: 866, loss: 0.3652183413505554, mean loss: 0.341795548114078
Epoch: 50, step: 867, loss: 0.3142108917236328, mean loss: 0.34179517059373543
Epoch: 50, step: 868, loss: 0.3061453700065613, mean loss: 0.3417946827014612
Epoch: 50, step: 869, loss: 0.34205231070518494, mean loss: 0.341794686227231
Epoch: 50, step: 870, loss: 0.35893577337265015, mean loss: 0.3417949208084896
Epoch: 50, step: 871, loss: 0.29626283049583435, mean loss: 0.34179429769580194
Epoch: 50, step: 872, loss: 0.3286924660205841, mean loss: 0.34179411839795354
Epoch: 50, step: 873, loss: 0.31702134013175964, mean loss: 0.34179377938848005
Epoch: 50, step: 874, loss: 0.44474923610687256, mean loss: 0.34179518828970096
Epoch: 50, step: 875, loss: 0.3222070038318634, mean loss: 0.3417949202374751
Epoch: 50, step: 876, loss: 0.3448108434677124, mean loss: 0.34179496150796007
Epoch: 50, step: 877, loss: 0.3586060702800751, mean loss: 0.3417951915513216
Epoch: 50, step: 878, loss: 0.3133881986141205, mean loss: 0.34179480283509756
Epoch: 50, step: 879, loss: 0.2867175340652466, mean loss: 0.3417940491778894
Epoch: 50, step: 880, loss: 0.3512929081916809, mean loss: 0.3417941791550246
Epoch: 50, step: 881, loss: 0.3187461197376251, mean loss: 0.34179386378243737
Epoch: 50, step: 882, loss: 0.32071855664253235, mean loss: 0.34179357540747823
Epoch: 50, step: 883, loss: 0.37448084354400635, mean loss: 0.34179402266362374
Epoch: 50, step: 884, loss: 0.3308578133583069, mean loss: 0.34179387302677205
Epoch: 50, step: 885, loss: 0.3109438121318817, mean loss: 0.3417934509204741
Epoch: 50, step: 886, loss: 0.3013341724872589, mean loss: 0.34179289734352564
Epoch: 50, step: 887, loss: 0.3330383598804474, mean loss: 0.3417927775627482
Epoch: 50, step: 888, loss: 0.3227185904979706, mean loss: 0.3417925165906858
Epoch: 50, step: 889, loss: 0.3160759210586548, mean loss: 0.34179216474234086
Epoch: 50, step: 890, loss: 0.3177375793457031, mean loss: 0.34179183563772614
Epoch: 50, step: 891, loss: 0.30833786725997925, mean loss: 0.34179137794101
Epoch: 50, step: 892, loss: 0.2999750077724457, mean loss: 0.34179080584285876
Epoch: 50, step: 893, loss: 0.31602028012275696, mean loss: 0.34179045327594876
Epoch: 50, step: 894, loss: 0.3647395074367523, mean loss: 0.34179076723797297
Epoch: 50, step: 895, loss: 0.3401798605918884, mean loss: 0.3417907451997404
Epoch: 50, step: 896, loss: 0.32624563574790955, mean loss: 0.3417905325356167
Epoch: 50, step: 897, loss: 0.32391804456710815, mean loss: 0.34179028803524775
Epoch: 50, step: 898, loss: 0.3179582953453064, mean loss: 0.34178996201173595
Epoch: 50, step: 899, loss: 0.319831907749176, mean loss: 0.3417896616279567
Epoch: 50, step: 900, loss: 0.37879297137260437, mean loss: 0.34179016782225974
Epoch: 50, step: 901, loss: 0.3439410924911499, mean loss: 0.3417901972458688
Epoch: 50, step: 902, loss: 0.3544653356075287, mean loss: 0.3417903706332587
Epoch: 50, step: 903, loss: 0.32062768936157227, mean loss: 0.3417900811459355
Epoch: 50, step: 904, loss: 0.37769803404808044, mean loss: 0.3417905723292048
Epoch: 50, step: 905, loss: 0.31720101833343506, mean loss: 0.34179023597440494
Epoch: 50, step: 906, loss: 0.3282022476196289, mean loss: 0.3417900501100095
Epoch: 50, step: 907, loss: 0.3565111756324768, mean loss: 0.3417902514713588
Epoch: 50, step: 908, loss: 0.31385770440101624, mean loss: 0.3417898694042115
Epoch: 50, step: 909, loss: 0.3483065664768219, mean loss: 0.34178995853972066
Epoch: 50, step: 910, loss: 0.3371029496192932, mean loss: 0.34178989443159846
Epoch: 50, step: 911, loss: 0.32522058486938477, mean loss: 0.3417896678024601
Epoch: 50, step: 912, loss: 0.3337405323982239, mean loss: 0.3417895577107472
Epoch: 50, step: 913, loss: 0.3308606445789337, mean loss: 0.3417894082330393
Epoch: 50, step: 914, loss: 0.3264957368373871, mean loss: 0.34178919906021027
Epoch: 50, step: 915, loss: 0.3292357325553894, mean loss: 0.3417890273677421
Epoch: 50, step: 916, loss: 0.30821460485458374, mean loss: 0.3417885681801043
Epoch: 50, step: 917, loss: 0.3134293258190155, mean loss: 0.34178818032427727
Epoch: 50, step: 918, loss: 0.3280453085899353, mean loss: 0.3417879923721481
Epoch: 50, step: 919, loss: 0.33659666776657104, mean loss: 0.34178792137482034
Epoch: 50, step: 920, loss: 0.3193955719470978, mean loss: 0.3417876151379058
Epoch: 50, step: 921, loss: 0.39205285906791687, mean loss: 0.3417883025540587
Epoch: 50, step: 922, loss: 0.34577399492263794, mean loss: 0.34178835706074423
Epoch: 50, step: 923, loss: 0.33517566323280334, mean loss: 0.3417882666295065
Epoch: 50, step: 924, loss: 0.3112338185310364, mean loss: 0.3417878487909
Epoch: 50, step: 925, loss: 0.3320333659648895, mean loss: 0.3417877153980873
Epoch: 50, step: 926, loss: 0.31521284580230713, mean loss: 0.3417873519910065
Epoch: 50, step: 927, loss: 0.33640727400779724, mean loss: 0.3417872784203088
Epoch: 50, step: 928, loss: 0.3364919126033783, mean loss: 0.34178720600901075
Epoch: 50, step: 929, loss: 0.2834457755088806, mean loss: 0.3417864082320314
Epoch: 50, step: 930, loss: 0.34874409437179565, mean loss: 0.34178650337206967
Epoch: 50, step: 931, loss: 0.3563685417175293, mean loss: 0.3417867027654726
Epoch: 50, step: 932, loss: 0.33024173974990845, mean loss: 0.34178654490290694
Epoch: 50, step: 933, loss: 0.3149069547653198, mean loss: 0.34178617736400385
Epoch: 50, step: 934, loss: 0.32239916920661926, mean loss: 0.34178591227877575
Epoch: 50, step: 935, loss: 0.3140151798725128, mean loss: 0.3417855325651955
Epoch: 50, step: 936, loss: 0.3759714663028717, mean loss: 0.3417859999884387
Epoch: 50, step: 937, loss: 0.33168312907218933, mean loss: 0.34178586185407744
Epoch: 50, step: 938, loss: 0.350586473941803, mean loss: 0.3417859821812912
Epoch: 50, step: 939, loss: 0.32607173919677734, mean loss: 0.34178576732973276
Epoch: 50, step: 940, loss: 0.32295989990234375, mean loss: 0.3417855099382912
Epoch: 50, step: 941, loss: 0.3324083983898163, mean loss: 0.34178538173409184
Epoch: 50, step: 942, loss: 0.34976303577423096, mean loss: 0.3417854908033676
Epoch: 50, step: 943, loss: 0.30934858322143555, mean loss: 0.3417850473369509
Epoch: 50, step: 944, loss: 0.31202414631843567, mean loss: 0.3417846404615525
Epoch: 50, step: 945, loss: 0.33494800329208374, mean loss: 0.3417845469959198
Epoch: 50, step: 946, loss: 0.30987828969955444, mean loss: 0.3417841108022646
Epoch: 50, step: 947, loss: 0.36650413274765015, mean loss: 0.34178444874755287
Epoch: 50, step: 948, loss: 0.30387115478515625, mean loss: 0.3417839304452663
Epoch: 50, step: 949, loss: 0.3301064968109131, mean loss: 0.34178377080844285
Epoch: 50, step: 950, loss: 0.33751875162124634, mean loss: 0.3417837125041246
Epoch: 50, step: 951, loss: 0.31853044033050537, mean loss: 0.3417833946280286
Epoch: 50, step: 952, loss: 0.35978978872299194, mean loss: 0.3417836407750642
Epoch: 50, step: 953, loss: 0.33111757040023804, mean loss: 0.3417834949720954
Epoch: 50, step: 954, loss: 0.35592401027679443, mean loss: 0.34178368826736305
Epoch: 50, step: 955, loss: 0.35567790269851685, mean loss: 0.34178387819319866
Epoch: 50, step: 956, loss: 0.31258639693260193, mean loss: 0.34178347908605566
Epoch: 50, step: 957, loss: 0.34952107071876526, mean loss: 0.34178358485154453
Epoch: 50, step: 958, loss: 0.3291655480861664, mean loss: 0.34178341237738874
Epoch: 50, step: 959, loss: 0.35435402393341064, mean loss: 0.34178358420094745
Epoch: 50, step: 960, loss: 0.32606929540634155, mean loss: 0.34178336941043347
Epoch: 50, step: 961, loss: 0.3240690529346466, mean loss: 0.34178312728588145
Epoch: 50, step: 962, loss: 0.33899256587028503, mean loss: 0.3417830891441785
Epoch: 50, step: 963, loss: 0.3210214078426361, mean loss: 0.3417828053750939
Epoch: 50, step: 964, loss: 0.3057669699192047, mean loss: 0.34178231312011603
Epoch: 50, step: 965, loss: 0.2847557067871094, mean loss: 0.34178153370609404
Epoch: 50, step: 966, loss: 0.341660737991333, mean loss: 0.34178153205513506
Epoch: 50, step: 967, loss: 0.3498692810535431, mean loss: 0.3417816425918314
Epoch: 50, step: 968, loss: 0.3923919200897217, mean loss: 0.3417823342819939
Epoch: 50, step: 969, loss: 0.3147307336330414, mean loss: 0.34178196457308796
Epoch: 50, step: 970, loss: 0.3208976984024048, mean loss: 0.34178167915583013
Epoch: 50, step: 971, loss: 0.3332352638244629, mean loss: 0.3417815623568451
Epoch: 50, step: 972, loss: 0.33443787693977356, mean loss: 0.3417814619962556
Epoch: 50, step: 973, loss: 0.3537904918193817, mean loss: 0.34178162611233265
Epoch: 50, step: 974, loss: 0.3127823770046234, mean loss: 0.341781229812379
Epoch: 50, step: 975, loss: 0.335649698972702, mean loss: 0.3417811460208239
Epoch: 50, step: 976, loss: 0.32516688108444214, mean loss: 0.34178091897865304
Epoch: 50, step: 977, loss: 0.3794589340686798, mean loss: 0.341781433860381
Epoch: 50, step: 978, loss: 0.35134172439575195, mean loss: 0.3417815645029224
Epoch: 50, step: 979, loss: 0.3197459876537323, mean loss: 0.34178126338818
Epoch: 50, step: 980, loss: 0.308053195476532, mean loss: 0.3417808025025961
Epoch: 50, step: 981, loss: 0.29661500453948975, mean loss: 0.34178018533173493
Epoch: 50, step: 982, loss: 0.32416442036628723, mean loss: 0.34177994462330585
Epoch: 50, step: 983, loss: 0.3127646744251251, mean loss: 0.3417795481531731
Epoch: 50, step: 984, loss: 0.33294692635536194, mean loss: 0.34177942746420953
Epoch: 50, step: 985, loss: 0.3098992109298706, mean loss: 0.3417789918588132
Epoch: 50, step: 986, loss: 0.32719483971595764, mean loss: 0.34177879258637217
Epoch: 50, step: 987, loss: 0.3432111442089081, mean loss: 0.3417788121572256
Epoch: 50, step: 988, loss: 0.3143753111362457, mean loss: 0.3417784377361921
Epoch: 50, step: 989, loss: 0.3155435621738434, mean loss: 0.34177807928728426
Epoch: 50, step: 990, loss: 0.3237634003162384, mean loss: 0.34177783315485033
Epoch: 50, step: 991, loss: 0.30272069573402405, mean loss: 0.3417772995290795
Epoch: 50, step: 992, loss: 0.34952861070632935, mean loss: 0.341777405431436
Epoch: 50, step: 993, loss: 0.3382919132709503, mean loss: 0.3417773578115196
Epoch: 50, step: 994, loss: 0.38791635632514954, mean loss: 0.3417779881687641
Epoch: 50, step: 995, loss: 0.32964491844177246, mean loss: 0.3417778224073874
Epoch: 50, step: 996, loss: 0.3083825409412384, mean loss: 0.34177736616899695
Epoch: 50, step: 997, loss: 0.33727020025253296, mean loss: 0.34177730459400973
Epoch: 50, step: 998, loss: 0.2743763327598572, mean loss: 0.34177638380312686
Epoch: 50, step: 999, loss: 0.3995191156864166, mean loss: 0.34177717263826185
Epoch: 50, step: 1000, loss: 0.3114907741546631, mean loss: 0.3417767588953009
Epoch: 50, step: 1001, loss: 0.31441813707351685, mean loss: 0.3417763851538482
Epoch: 50, step: 1002, loss: 0.32423046231269836, mean loss: 0.341776145465272
Epoch: 50, step: 1003, loss: 0.32552579045295715, mean loss: 0.34177592347801705
Epoch: 50, step: 1004, loss: 0.32387834787368774, mean loss: 0.3417756789923179
Epoch: 50, step: 1005, loss: 0.3906014859676361, mean loss: 0.3417763459568697
Epoch: 50, step: 1006, loss: 0.3480530381202698, mean loss: 0.3417764316958313
Epoch: 50, step: 1007, loss: 0.35029178857803345, mean loss: 0.34177654801313107
Epoch: 50, step: 1008, loss: 0.35217714309692383, mean loss: 0.3417766900802961
Epoch: 50, step: 1009, loss: 0.37679755687713623, mean loss: 0.34177716844208816
Epoch: 50, step: 1010, loss: 0.31341519951820374, mean loss: 0.3417767810417122
Epoch: 50, step: 1011, loss: 0.3141966164112091, mean loss: 0.3417764043252637
Epoch: 50, step: 1012, loss: 0.3180253803730011, mean loss: 0.34177607991533715
Epoch: 50, step: 1013, loss: 0.36483755707740784, mean loss: 0.3417763949025959
Epoch: 50, step: 1014, loss: 0.31401365995407104, mean loss: 0.3417760157079644
Epoch: 50, step: 1015, loss: 0.3183384835720062, mean loss: 0.34177569559306964
Epoch: 50, step: 1016, loss: 0.31067776679992676, mean loss: 0.3417752708566178
Epoch: 50, step: 1017, loss: 0.30047059059143066, mean loss: 0.34177470672375065
Epoch: 50, step: 1018, loss: 0.3237920105457306, mean loss: 0.34177446112225135
Epoch: 50, step: 1019, loss: 0.2993077039718628, mean loss: 0.34177388113376256
Epoch: 50, step: 1020, loss: 0.3920811712741852, mean loss: 0.3417745681947169
Epoch: 50, step: 1021, loss: 0.3454952538013458, mean loss: 0.3417746190084834
Epoch: 50, step: 1022, loss: 0.36448389291763306, mean loss: 0.34177492914701785
Epoch: 50, step: 1023, loss: 0.3287281095981598, mean loss: 0.3417747509701967
Epoch: 50, step: 1024, loss: 0.3284800350666046, mean loss: 0.3417745694104029
Epoch: 50, step: 1025, loss: 0.3101387023925781, mean loss: 0.3417741373798807
Epoch: 50, step: 1026, loss: 0.29796165227890015, mean loss: 0.3417735390693518
Epoch: 50, step: 1027, loss: 0.30750104784965515, mean loss: 0.3417730710449456
Epoch: 50, step: 1028, loss: 0.27393651008605957, mean loss: 0.34177214468297207
Epoch: 50, step: 1029, loss: 0.33340486884117126, mean loss: 0.341772030422753
Epoch: 50, step: 1030, loss: 0.3071901202201843, mean loss: 0.34177155819227406
Epoch: 50, step: 1031, loss: 0.33123910427093506, mean loss: 0.341771414369165
Epoch: 50, step: 1032, loss: 0.3346010744571686, mean loss: 0.3417713164578421
Epoch: 50, step: 1033, loss: 0.2899177074432373, mean loss: 0.3417706084040827
Epoch: 50, step: 1034, loss: 0.32579997181892395, mean loss: 0.3417703903302575
Epoch: 50, step: 1035, loss: 0.34941285848617554, mean loss: 0.3417704946842386
Epoch: 50, step: 1036, loss: 0.35220450162887573, mean loss: 0.341770637153304
Epoch: 50, step: 1037, loss: 0.36810103058815, mean loss: 0.34177099667149724
Epoch: 50, step: 1038, loss: 0.28285276889801025, mean loss: 0.34177019220628374
Epoch: 50, step: 1039, loss: 0.32025641202926636, mean loss: 0.34176989846269856
Epoch: 50, step: 1040, loss: 0.32790470123291016, mean loss: 0.3417697091534697
Epoch: 50, step: 1041, loss: 0.3371705114841461, mean loss: 0.3417696463589301
Epoch: 50, step: 1042, loss: 0.2937198877334595, mean loss: 0.34176899032683655
Epoch: 50, step: 1043, loss: 0.33785393834114075, mean loss: 0.34176893687464954
Epoch: 50, step: 1044, loss: 0.33298197388648987, mean loss: 0.3417688169079216
Epoch: 50, step: 1045, loss: 0.33407944440841675, mean loss: 0.3417687119278203
Epoch: 50, step: 1046, loss: 0.2879015803337097, mean loss: 0.34176797651023877
Epoch: 50, step: 1047, loss: 0.3379138708114624, mean loss: 0.3417679238930247
Epoch: 50, step: 1048, loss: 0.333474725484848, mean loss: 0.34176781067375334
Epoch: 50, step: 1049, loss: 0.33561044931411743, mean loss: 0.34176772661421256
Epoch: 50, step: 1050, loss: 0.3387320637702942, mean loss: 0.3417676851722822
Epoch: 50, step: 1051, loss: 0.33623841404914856, mean loss: 0.3417676096894131
Epoch: 50, step: 1052, loss: 0.327429860830307, mean loss: 0.3417674139602435
Epoch: 50, step: 1053, loss: 0.31630218029022217, mean loss: 0.34176706633098547
Epoch: 50, step: 1054, loss: 0.34958192706108093, mean loss: 0.34176717301122206
Epoch: 50, step: 1055, loss: 0.3262692987918854, mean loss: 0.34176696145347635
Epoch: 50, step: 1056, loss: 0.3390883505344391, mean loss: 0.3417669248889034
Epoch: 50, step: 1057, loss: 0.32593879103660583, mean loss: 0.3417667088287618
Epoch: 50, step: 1058, loss: 0.3140219449996948, mean loss: 0.34176633010718727
Epoch: 50, step: 1059, loss: 0.31509289145469666, mean loss: 0.3417659660143856
Epoch: 50, step: 1060, loss: 0.3250252604484558, mean loss: 0.34176573750664524
Epoch: 50, step: 1061, loss: 0.2998100221157074, mean loss: 0.3417651648261916
Epoch: 50, step: 1062, loss: 0.30230236053466797, mean loss: 0.34176462618043196
Epoch: 50, step: 1063, loss: 0.33041220903396606, mean loss: 0.3417644712282433
Epoch: 50, step: 1064, loss: 0.3518257439136505, mean loss: 0.3417646085553802
Epoch: 50, step: 1065, loss: 0.331385999917984, mean loss: 0.34176446689883233
Epoch: 50, step: 1066, loss: 0.3149197995662689, mean loss: 0.3417641005037659
Epoch: 50, step: 1067, loss: 0.3801104426383972, mean loss: 0.3417646238747073
Epoch: 50, step: 1068, loss: 0.31430473923683167, mean loss: 0.34176424909294917
Epoch: 50, step: 1069, loss: 0.3966566324234009, mean loss: 0.3417649982724678
Epoch: 50, step: 1070, loss: 0.3125874102115631, mean loss: 0.34176460005778453
Epoch: 50, step: 1071, loss: 0.3528518080711365, mean loss: 0.34176475137353973
Epoch: 50, step: 1072, loss: 0.3510691225528717, mean loss: 0.34176487835580033
Epoch: 50, step: 1073, loss: 0.3559044301509857, mean loss: 0.3417650713239991
Epoch: 50, step: 1074, loss: 0.3078668713569641, mean loss: 0.3417646087078276
Epoch: 50, step: 1075, loss: 0.34680306911468506, mean loss: 0.3417646774678637
Epoch: 50, step: 1076, loss: 0.3268766701221466, mean loss: 0.34176447429350687
Epoch: 50, step: 1077, loss: 0.3111521601676941, mean loss: 0.3417640565376439
Epoch: 50, step: 1078, loss: 0.32962766289711, mean loss: 0.3417638909186584
Epoch: 50, step: 1079, loss: 0.3588862419128418, mean loss: 0.3417641245751949
Epoch: 50, step: 1080, loss: 0.34104520082473755, mean loss: 0.3417641147646881
Epoch: 50, step: 1081, loss: 0.322513222694397, mean loss: 0.34176385206863624
Epoch: 50, step: 1082, loss: 0.34363651275634766, mean loss: 0.3417638776224576
Epoch: 50, step: 1083, loss: 0.31500187516212463, mean loss: 0.34176351244039244
Epoch: 50, step: 1084, loss: 0.3400156795978546, mean loss: 0.341763488590589
Epoch: 50, step: 1085, loss: 0.32227441668510437, mean loss: 0.34176322265887077
Epoch: 50, step: 1086, loss: 0.34561842679977417, mean loss: 0.3417632752630726
Epoch: 50, step: 1087, loss: 0.3276039958000183, mean loss: 0.34176308206255596
Epoch: 50, step: 1088, loss: 0.3223845064640045, mean loss: 0.3417628176494026
Epoch: 50, step: 1089, loss: 0.3936901390552521, mean loss: 0.34176352616790995
Epoch: 50, step: 1090, loss: 0.30436378717422485, mean loss: 0.34176301587689206
Epoch: 50, step: 1091, loss: 0.36959028244018555, mean loss: 0.3417633955536175
Epoch: 50, step: 1092, loss: 0.35090216994285583, mean loss: 0.3417635202418468
Epoch: 50, step: 1093, loss: 0.3324569761753082, mean loss: 0.34176339326632266
Epoch: 50, step: 1094, loss: 0.33331093192100525, mean loss: 0.3417632779452046
Epoch: 50, step: 1095, loss: 0.314347505569458, mean loss: 0.3417629039033418
Epoch: 50, step: 1096, loss: 0.33628273010253906, mean loss: 0.34176282913665557
Epoch: 50, step: 1097, loss: 0.4154593348503113, mean loss: 0.34176383457344395
Epoch: 50, step: 1098, loss: 0.282929390668869, mean loss: 0.34176303190977997
Epoch: 50, step: 1099, loss: 0.33151909708976746, mean loss: 0.34176289215623534
Epoch: 50, step: 1100, loss: 0.3441934287548065, mean loss: 0.341762925314536
Epoch: 50, step: 1101, loss: 0.33252981305122375, mean loss: 0.34176279935464043
Epoch: 50, step: 1102, loss: 0.3519727885723114, mean loss: 0.34176293863937934
Epoch: 50, step: 1103, loss: 0.3401440680027008, mean loss: 0.34176291655503693
Epoch: 50, step: 1104, loss: 0.37185972929000854, mean loss: 0.3417633271247489
Epoch: 50, step: 1105, loss: 0.3213646113872528, mean loss: 0.3417630488567253
Epoch: 50, step: 1106, loss: 0.3322477340698242, mean loss: 0.34176291905582246
Epoch: 50, step: 1107, loss: 0.32476869225502014, mean loss: 0.34176268723628295
Epoch: 50, step: 1108, loss: 0.3455752432346344, mean loss: 0.3417627392429397
Epoch: 50, step: 1109, loss: 0.326202929019928, mean loss: 0.3417625269961763
Epoch: 50, step: 1110, loss: 0.3153393864631653, mean loss: 0.34176216657085773
Epoch: 50, step: 1111, loss: 0.3238581717014313, mean loss: 0.34176192235442837
Epoch: 50, step: 1112, loss: 0.2951548993587494, mean loss: 0.34176128662784516
Epoch: 50, step: 1113, loss: 0.34447452425956726, mean loss: 0.3417613236362969
Epoch: 50, step: 1114, loss: 0.3403632640838623, mean loss: 0.34176130456708115
Epoch: 50, step: 1115, loss: 0.37296557426452637, mean loss: 0.34176173018044925
Epoch: 50, step: 1116, loss: 0.3072284162044525, mean loss: 0.3417612591667147
Epoch: 50, step: 1117, loss: 0.32545191049575806, mean loss: 0.34176103671999397
Epoch: 50, step: 1118, loss: 0.3063293397426605, mean loss: 0.34176055346603557
Epoch: 50, step: 1119, loss: 0.3578062653541565, mean loss: 0.34176077231098767
Epoch: 50, step: 1120, loss: 0.3167051076889038, mean loss: 0.3417604305853617
Epoch: 50, step: 1121, loss: 0.33861243724823, mean loss: 0.3417603876515446
Epoch: 50, step: 1122, loss: 0.30285778641700745, mean loss: 0.34175985708676637
Epoch: 50, step: 1123, loss: 0.3762491047382355, mean loss: 0.34176032745455387
Epoch: 50, step: 1124, loss: 0.3569751977920532, mean loss: 0.3417605349536379
Epoch: 50, step: 1125, loss: 0.38132786750793457, mean loss: 0.34176107456213356
Epoch: 50, step: 1126, loss: 0.3332255780696869, mean loss: 0.3417609581589466
Epoch: 50, step: 1127, loss: 0.3237133324146271, mean loss: 0.3417607120370594
Epoch: 50, step: 1128, loss: 0.36531880497932434, mean loss: 0.3417610333027652
Epoch: 50, step: 1129, loss: 0.3488544523715973, mean loss: 0.341761130035604
Epoch: 50, step: 1130, loss: 0.34030693769454956, mean loss: 0.34176111020507743
Epoch: 50, step: 1131, loss: 0.3372218608856201, mean loss: 0.3417610483050976
Epoch: 50, step: 1132, loss: 0.34903985261917114, mean loss: 0.34176114756197123
Epoch: 50, step: 1133, loss: 0.362527459859848, mean loss: 0.3417614307363828
Epoch: 50, step: 1134, loss: 0.31764283776283264, mean loss: 0.34176110185395325
Epoch: 50, step: 1135, loss: 0.3207353949546814, mean loss: 0.34176081515019385
Epoch: 50, step: 1136, loss: 0.3150448799133301, mean loss: 0.34176045086020057
Epoch: 50, step: 1137, loss: 0.36173954606056213, mean loss: 0.34176072328507173
Epoch: 50, step: 1138, loss: 0.3338600695133209, mean loss: 0.3417606155572084
Epoch: 50, step: 1139, loss: 0.3073277771472931, mean loss: 0.34176014606118427
Epoch: 50, step: 1140, loss: 0.32374051213264465, mean loss: 0.34175990036458986
Epoch: 50, step: 1141, loss: 0.37246617674827576, mean loss: 0.34176031903706106
Epoch: 50, step: 1142, loss: 0.3752581775188446, mean loss: 0.3417607757658352
Epoch: 50, step: 1143, loss: 0.33140766620635986, mean loss: 0.3417606346076006
Epoch: 50, step: 1144, loss: 0.28626132011413574, mean loss: 0.34175987791914886
Epoch: 50, step: 1145, loss: 0.32181283831596375, mean loss: 0.34175960596103794
Epoch: 50, step: 1146, loss: 0.3589116930961609, mean loss: 0.3417598398095544
Epoch: 50, step: 1147, loss: 0.29317957162857056, mean loss: 0.34175917748381707
Epoch: 50, step: 1148, loss: 0.32899749279022217, mean loss: 0.3417590034980137
Epoch: 50, step: 1149, loss: 0.36057811975479126, mean loss: 0.3417592600640158
Epoch: 50, step: 1150, loss: 0.3695438802242279, mean loss: 0.3417596388539459
Epoch: 50, step: 1151, loss: 0.3308444619178772, mean loss: 0.34175949004850176
Epoch: 50, step: 1152, loss: 0.3490254878997803, mean loss: 0.34175958910372584
Epoch: 50, step: 1153, loss: 0.33138710260391235, mean loss: 0.3417594477005781
Epoch: 50, step: 1154, loss: 0.3890324532985687, mean loss: 0.3417600921420694
Epoch: 50, step: 1155, loss: 0.36414313316345215, mean loss: 0.3417603972710435
Epoch: 50, step: 1156, loss: 0.30542197823524475, mean loss: 0.34175990190701505
Epoch: 50, step: 1157, loss: 0.3357016444206238, mean loss: 0.3417598193221915
Epoch: 50, step: 1158, loss: 0.3539567291736603, mean loss: 0.34175998558549736
Epoch: 50, step: 1159, loss: 0.3221990764141083, mean loss: 0.34175971894278784
Epoch: 50, step: 1160, loss: 0.3545832633972168, mean loss: 0.34175989374335564
Epoch: 50, step: 1161, loss: 0.3454433083534241, mean loss: 0.3417599439521096
Epoch: 50, step: 1162, loss: 0.3290497362613678, mean loss: 0.3417597707011835
Epoch: 50, step: 1163, loss: 0.30832478404045105, mean loss: 0.34175931496012985
Epoch: 50, step: 1164, loss: 0.3333808481693268, mean loss: 0.34175920075762467
Epoch: 50, step: 1165, loss: 0.3635181486606598, mean loss: 0.34175949733843736
Epoch: 50, step: 1166, loss: 0.3369898200035095, mean loss: 0.34175943232722883
Epoch: 50, step: 1167, loss: 0.3207052946090698, mean loss: 0.3417591453610076
Epoch: 50, step: 1168, loss: 0.3511468470096588, mean loss: 0.34175927331288986
Epoch: 50, step: 1169, loss: 0.3101213276386261, mean loss: 0.3417588421019634
Epoch: 50, step: 1170, loss: 0.32309356331825256, mean loss: 0.3417585877061015
Epoch: 50, step: 1171, loss: 0.3125021755695343, mean loss: 0.3417581889652721
Epoch: 50, step: 1172, loss: 0.33843258023262024, mean loss: 0.34175814364057866
Epoch: 50, step: 1173, loss: 0.3498578667640686, mean loss: 0.3417582540301325
Epoch: 50, step: 1174, loss: 0.3146955668926239, mean loss: 0.34175788520305056
Epoch: 50, step: 1175, loss: 0.3511289358139038, mean loss: 0.34175801291579877
Epoch: 50, step: 1176, loss: 0.32293567061424255, mean loss: 0.34175775640023803
Epoch: 50, step: 1177, loss: 0.3219221830368042, mean loss: 0.34175748607979645
Epoch: 50, step: 1178, loss: 0.35291770100593567, mean loss: 0.34175763816983484
Epoch: 50, step: 1179, loss: 0.2837156653404236, mean loss: 0.3417568471917369
Epoch: 50, step: 1180, loss: 0.3833557069301605, mean loss: 0.34175741408043747
Epoch: 50, step: 1181, loss: 0.3347061574459076, mean loss: 0.3417573179907065
Epoch: 50, step: 1182, loss: 0.34521618485450745, mean loss: 0.34175736512515
Epoch: 50, step: 1183, loss: 0.38568058609962463, mean loss: 0.3417579636646269
Epoch: 50, step: 1184, loss: 0.3057321012020111, mean loss: 0.34175747274873863
Epoch: 50, step: 1185, loss: 0.31653913855552673, mean loss: 0.34175712910915895
Epoch: 50, step: 1186, loss: 0.2966553568840027, mean loss: 0.341756514534749
Epoch: 50, step: 1187, loss: 0.3197992146015167, mean loss: 0.3417562153400587
Epoch: 50, step: 1188, loss: 0.340510755777359, mean loss: 0.34175619836940146
Epoch: 50, step: 1189, loss: 0.3046072721481323, mean loss: 0.34175569218427787
Epoch: 50, step: 1190, loss: 0.32672005891799927, mean loss: 0.34175548731401767
Epoch: 50, step: 1191, loss: 0.3514230251312256, mean loss: 0.34175561903869905
Epoch: 50, step: 1192, loss: 0.33710384368896484, mean loss: 0.3417555556569685
Epoch: 50, step: 1193, loss: 0.32697057723999023, mean loss: 0.3417553542102778
Epoch: 50, step: 1194, loss: 0.31630846858024597, mean loss: 0.34175500749884474
Epoch: 50, step: 1195, loss: 0.3295782804489136, mean loss: 0.3417548415943397
Epoch: 50, step: 1196, loss: 0.3363553583621979, mean loss: 0.3417547680288911
Epoch: 50, step: 1197, loss: 0.3547014892101288, mean loss: 0.3417549444195445
Epoch: 50, step: 1198, loss: 0.3133395314216614, mean loss: 0.3417545572833029
Epoch: 50, step: 1199, loss: 0.30105048418045044, mean loss: 0.3417540027318982
Epoch: 50, step: 1200, loss: 0.33214640617370605, mean loss: 0.3417538718399954
Epoch: 50, step: 1201, loss: 0.3053887188434601, mean loss: 0.34175337641544296
Epoch: 50, step: 1202, loss: 0.34608155488967896, mean loss: 0.34175343538004216
Epoch: 50, step: 1203, loss: 0.3456611633300781, mean loss: 0.3417534886159414
Epoch: 50, step: 1204, loss: 0.28314536809921265, mean loss: 0.34175269019457344
Epoch: 50, step: 1205, loss: 0.3268560767173767, mean loss: 0.34175248726002483
Epoch: 50, step: 1206, loss: 0.3121020495891571, mean loss: 0.34175208334162915
Epoch: 50, step: 1207, loss: 0.3156863749027252, mean loss: 0.34175172826168637
Epoch: 50, step: 1208, loss: 0.3033546805381775, mean loss: 0.3417512052052802
Epoch: 50, step: 1209, loss: 0.3161897361278534, mean loss: 0.3417508570038216
Epoch: 50, step: 1210, loss: 0.3347134292125702, mean loss: 0.3417507611404252
Epoch: 50, step: 1211, loss: 0.3446141481399536, mean loss: 0.3417508001447705
Epoch: 50, step: 1212, loss: 0.30839914083480835, mean loss: 0.3417503458429532
Epoch: 50, step: 1213, loss: 0.3106342554092407, mean loss: 0.3417499219988576
Epoch: 50, step: 1214, loss: 0.33275315165519714, mean loss: 0.3417497994520982
Epoch: 50, step: 1215, loss: 0.30999889969825745, mean loss: 0.3417493669728055
Epoch: 50, step: 1216, loss: 0.3387305736541748, mean loss: 0.34174932585435447
Epoch: 50, step: 1217, loss: 0.32919007539749146, mean loss: 0.3417491547893506
Epoch: 50, step: 1218, loss: 0.3093295693397522, mean loss: 0.34174871321992784
Epoch: 50, step: 1219, loss: 0.31212368607521057, mean loss: 0.3417483097191495
Epoch: 50, step: 1220, loss: 0.31637832522392273, mean loss: 0.3417479641778943
Epoch: 50, step: 1221, loss: 0.31066590547561646, mean loss: 0.3417475408434891
Epoch: 50, step: 1222, loss: 0.3504674732685089, mean loss: 0.3417476596064438
Epoch: 50, step: 1223, loss: 0.310743123292923, mean loss: 0.3417472373393879
Epoch: 50, step: 1224, loss: 0.33205631375312805, mean loss: 0.34174710535540986
Epoch: 50, step: 1225, loss: 0.3286827504634857, mean loss: 0.34174692742994894
Epoch: 50, step: 1226, loss: 0.33424657583236694, mean loss: 0.3417468252828968
Epoch: 50, step: 1227, loss: 0.3536302447319031, mean loss: 0.34174698712060786
Epoch: 50, step: 1228, loss: 0.35781165957450867, mean loss: 0.3417472058989169
Epoch: 50, step: 1229, loss: 0.30857035517692566, mean loss: 0.3417467540828918
Epoch: 50, step: 1230, loss: 0.31169891357421875, mean loss: 0.3417463448845899
Epoch: 50, step: 1231, loss: 0.29500460624694824, mean loss: 0.34174570835366824
Epoch: 50, step: 1232, loss: 0.32213854789733887, mean loss: 0.34174544134618584
Epoch: 50, step: 1233, loss: 0.31647419929504395, mean loss: 0.3417450972107438
Epoch: 50, step: 1234, loss: 0.3329455852508545, mean loss: 0.341744977383523
Epoch: 50, step: 1235, loss: 0.33417221903800964, mean loss: 0.3417448742630052
Epoch: 50, step: 1236, loss: 0.34986409544944763, mean loss: 0.3417449848233656
Epoch: 50, step: 1237, loss: 0.3444487154483795, mean loss: 0.3417450216398724
Epoch: 50, step: 1238, loss: 0.342323899269104, mean loss: 0.3417450295223004
Epoch: 50, step: 1239, loss: 0.31986376643180847, mean loss: 0.3417447315748182
Epoch: 50, step: 1240, loss: 0.3070071041584015, mean loss: 0.3417442585743496
Epoch: 50, step: 1241, loss: 0.3577564060688019, mean loss: 0.3417444765987429
Epoch: 50, step: 1242, loss: 0.3142678737640381, mean loss: 0.3417441024772768
Epoch: 50, step: 1243, loss: 0.3212147057056427, mean loss: 0.3417438229527851
Epoch: 50, step: 1244, loss: 0.3248611092567444, mean loss: 0.34174359308398944
Epoch: 50, step: 1245, loss: 0.31834444403648376, mean loss: 0.3417432744941541
Epoch: 50, step: 1246, loss: 0.4032839238643646, mean loss: 0.3417441123860948
Epoch: 50, step: 1247, loss: 0.3427566587924957, mean loss: 0.3417441261719897
Epoch: 50, step: 1248, loss: 0.3277599811553955, mean loss: 0.34174393577940415
Epoch: 50, step: 1249, loss: 0.3414759933948517, mean loss: 0.34174393213144794
Epoch: 50, step: 1250, loss: 0.3227281868457794, mean loss: 0.3417436732412315
Epoch: 50, step: 1251, loss: 0.37419393658638, mean loss: 0.34174411502992813
Epoch: 50, step: 1252, loss: 0.31875404715538025, mean loss: 0.34174380203974564
Epoch: 50, step: 1253, loss: 0.32066240906715393, mean loss: 0.3417435150384527
Epoch: 50, step: 1254, loss: 0.3323398232460022, mean loss: 0.3417433870186883
Epoch: 50, step: 1255, loss: 0.35657986998558044, mean loss: 0.3417435889965113
Epoch: 50, step: 1256, loss: 0.3355092406272888, mean loss: 0.3417435041257928
Epoch: 50, step: 1257, loss: 0.33427637815475464, mean loss: 0.3417434024741555
Epoch: 50, step: 1258, loss: 0.342117577791214, mean loss: 0.3417434075678175
Epoch: 50, step: 1259, loss: 0.3219621479511261, mean loss: 0.341743138288487
Epoch: 50, step: 1260, loss: 0.3276969790458679, mean loss: 0.34174294708282354
Epoch: 50, step: 1261, loss: 0.3197017312049866, mean loss: 0.34174264704721496
Epoch: 50, step: 1262, loss: 0.3421527147293091, mean loss: 0.3417426526291771
Epoch: 50, step: 1263, loss: 0.3087179660797119, mean loss: 0.3417422030935331
Epoch: 50, step: 1264, loss: 0.3355112373828888, mean loss: 0.34174211827810114
Epoch: 50, step: 1265, loss: 0.3439459502696991, mean loss: 0.3417421482760865
Epoch: 50, step: 1266, loss: 0.32971614599227905, mean loss: 0.3417419845835132
Epoch: 50, step: 1267, loss: 0.37560132145881653, mean loss: 0.3417424454554149
Epoch: 50, step: 1268, loss: 0.3467617630958557, mean loss: 0.34174251377426557
Epoch: 50, step: 1269, loss: 0.3539141118526459, mean loss: 0.3417426794418588
Epoch: 50, step: 1270, loss: 0.32809439301490784, mean loss: 0.3417424936775923
Epoch: 50, step: 1271, loss: 0.33134061098098755, mean loss: 0.341742352101445
Epoch: 50, step: 1272, loss: 0.31071898341178894, mean loss: 0.34174192985968693
Epoch: 50, step: 1273, loss: 0.3579632043838501, mean loss: 0.34174215063539704
Epoch: 50, step: 1274, loss: 0.32577815651893616, mean loss: 0.3417419333642964
Epoch: 50, step: 1275, loss: 0.3574824631214142, mean loss: 0.3417421475911155
Epoch: 50, step: 1276, loss: 0.35621702671051025, mean loss: 0.3417423445898922
Epoch: 50, step: 1277, loss: 0.3107115924358368, mean loss: 0.34174192227638134
Epoch: 50, step: 1278, loss: 0.3139151334762573, mean loss: 0.3417415435724142
Epoch: 50, step: 1279, loss: 0.31830447912216187, mean loss: 0.34174122461399764
Epoch: 50, step: 1280, loss: 0.3091440498828888, mean loss: 0.34174078100034605
Epoch: 50, step: 1281, loss: 0.32956573367118835, mean loss: 0.3417406153128671
Epoch: 50, step: 1282, loss: 0.32770371437072754, mean loss: 0.34174042429044094
Epoch: 50, step: 1283, loss: 0.37677842378616333, mean loss: 0.34174090110171274
Epoch: 50, step: 1284, loss: 0.40855398774147034, mean loss: 0.34174181030885215
Epoch: 50, step: 1285, loss: 0.3376999497413635, mean loss: 0.3417417553070754
Epoch: 50, step: 1286, loss: 0.3131984770298004, mean loss: 0.34174136689445445
Epoch: 50, step: 1287, loss: 0.3238242566585541, mean loss: 0.34174112308444143
Epoch: 50, step: 1288, loss: 0.3122212290763855, mean loss: 0.34174072139311334
Epoch: 50, step: 1289, loss: 0.3913904130458832, mean loss: 0.34174139699104034
Epoch: 50, step: 1290, loss: 0.3363061845302582, mean loss: 0.34174132303351545
Epoch: 50, step: 1291, loss: 0.34080901741981506, mean loss: 0.34174131034770455
Epoch: 50, step: 1292, loss: 0.3050098419189453, mean loss: 0.3417408105522352
Epoch: 50, step: 1293, loss: 0.3418106734752655, mean loss: 0.34174081150282876
Epoch: 50, step: 1294, loss: 0.30803367495536804, mean loss: 0.3417403528711321
Epoch: 50, step: 1295, loss: 0.4033634662628174, mean loss: 0.3417411913264683
Epoch: 50, step: 1296, loss: 0.37633016705513, mean loss: 0.3417416619439864
Epoch: 50, step: 1297, loss: 0.3395487070083618, mean loss: 0.34174163210705294
Epoch: 50, step: 1298, loss: 0.31392645835876465, mean loss: 0.34174125366416597
Epoch: 50, step: 1299, loss: 0.31567472219467163, mean loss: 0.3417408990174793
Epoch: 50, step: 1300, loss: 0.3280301094055176, mean loss: 0.34174071247866195
Epoch: 50, step: 1301, loss: 0.34256112575531006, mean loss: 0.3417407236404436
Epoch: 50, step: 1302, loss: 0.32645103335380554, mean loss: 0.3417405156259369
Epoch: 50, step: 1303, loss: 0.3584095537662506, mean loss: 0.3417407424032298
Epoch: 50, step: 1304, loss: 0.3315993845462799, mean loss: 0.3417406044349575
Epoch: 50, step: 1305, loss: 0.3602246642112732, mean loss: 0.3417408558982364
Epoch: 50, step: 1306, loss: 0.3140351176261902, mean loss: 0.34174047898531285
Epoch: 50, step: 1307, loss: 0.3459997773170471, mean loss: 0.34174053692864326
Epoch: 50, step: 1308, loss: 0.34293651580810547, mean loss: 0.3417405531984725
Epoch: 50, step: 1309, loss: 0.32704663276672363, mean loss: 0.34174035330838365
Epoch: 50, step: 1310, loss: 0.3486744165420532, mean loss: 0.34174044763526307
Epoch: 50, step: 1311, loss: 0.3593516945838928, mean loss: 0.34174068720495165
Epoch: 50, step: 1312, loss: 0.3008045256137848, mean loss: 0.34174013034886375
Epoch: 50, step: 1313, loss: 0.3219473958015442, mean loss: 0.3417398611112417
Epoch: 50, step: 1314, loss: 0.3517499566078186, mean loss: 0.34173999727522864
Epoch: 50, step: 1315, loss: 0.3360198736190796, mean loss: 0.34173991946735477
Epoch: 50, step: 1316, loss: 0.3158155083656311, mean loss: 0.34173956683583956
Epoch: 50, step: 1317, loss: 0.3158004581928253, mean loss: 0.3417392140092033
Epoch: 50, step: 1318, loss: 0.344807893037796, mean loss: 0.3417392557491485
Epoch: 50, step: 1319, loss: 0.3828021287918091, mean loss: 0.34173981427571326
Epoch: 50, step: 1320, loss: 0.3355249762535095, mean loss: 0.34173972974424577
Epoch: 50, step: 1321, loss: 0.30672141909599304, mean loss: 0.34173925344721023
Epoch: 50, step: 1322, loss: 0.34361305832862854, mean loss: 0.341739278933179
Epoch: 50, step: 1323, loss: 0.3076603412628174, mean loss: 0.34173881542551254
Epoch: 50, step: 1324, loss: 0.3809818625450134, mean loss: 0.3417393491629776
Epoch: 50, step: 1325, loss: 0.3418976366519928, mean loss: 0.34173935131578737
Epoch: 50, step: 1326, loss: 0.3445282280445099, mean loss: 0.341739389245755
Epoch: 50, step: 1327, loss: 0.32186082005500793, mean loss: 0.3417391188920232
Epoch: 50, step: 1328, loss: 0.34587398171424866, mean loss: 0.3417391751264725
Epoch: 50, step: 1329, loss: 0.3800274431705475, mean loss: 0.34173969584275216
Epoch: 50, step: 1330, loss: 0.35536158084869385, mean loss: 0.34173988109638676
Epoch: 50, step: 1331, loss: 0.3135286867618561, mean loss: 0.3417394974376486
Epoch: 50, step: 1332, loss: 0.2896299362182617, mean loss: 0.3417387887821984
Epoch: 50, step: 1333, loss: 0.3285963237285614, mean loss: 0.3417386100558262
Epoch: 50, step: 1334, loss: 0.3908803164958954, mean loss: 0.34173927833224477
Epoch: 50, step: 1335, loss: 0.3251352608203888, mean loss: 0.34173905253783776
Epoch: 50, step: 1336, loss: 0.32967841625213623, mean loss: 0.34173888853010986
Epoch: 50, step: 1337, loss: 0.3204960525035858, mean loss: 0.3417385996612798
Epoch: 50, step: 1338, loss: 0.31586432456970215, mean loss: 0.34173824781701906
Epoch: 50, step: 1339, loss: 0.3074166774749756, mean loss: 0.3417377811108681
Epoch: 50, step: 1340, loss: 0.3712042570114136, mean loss: 0.34173818179179305
Epoch: 50, step: 1341, loss: 0.39663127064704895, mean loss: 0.34173892821001467
Epoch: 50, step: 1342, loss: 0.308044970035553, mean loss: 0.3417384700568502
Epoch: 50, step: 1343, loss: 0.2998059391975403, mean loss: 0.3417378998875521
Epoch: 50, step: 1344, loss: 0.3580401539802551, mean loss: 0.3417381215512151
Epoch: 50, step: 1345, loss: 0.3534628450870514, mean loss: 0.34173828097148995
Epoch: 50, step: 1346, loss: 0.3582485020160675, mean loss: 0.3417385054567993
Epoch: 50, step: 1347, loss: 0.3063368499279022, mean loss: 0.34173802411596704
Epoch: 50, step: 1348, loss: 0.34064406156539917, mean loss: 0.3417380092420388
Epoch: 50, step: 1349, loss: 0.40405046939849854, mean loss: 0.3417388564542775
Epoch: 50, step: 1350, loss: 0.3541702330112457, mean loss: 0.34173902547137525
Epoch: 50, step: 1351, loss: 0.3038272261619568, mean loss: 0.34173851002924843
Epoch: 50, step: 1352, loss: 0.32739177346229553, mean loss: 0.34173831497620416
Epoch: 50, step: 1353, loss: 0.3027202785015106, mean loss: 0.34173778450829656
Epoch: 50, step: 1354, loss: 0.3123329281806946, mean loss: 0.3417373847413694
Epoch: 50, step: 1355, loss: 0.32173851132392883, mean loss: 0.341737112855005
Epoch: 50, step: 1356, loss: 0.3192416727542877, mean loss: 0.3417368070317645
Epoch: 50, step: 1357, loss: 0.27537769079208374, mean loss: 0.34173590489853306
Epoch: 50, step: 1358, loss: 0.34518754482269287, mean loss: 0.34173595182195404
Epoch: 50, step: 1359, loss: 0.3254798650741577, mean loss: 0.3417357308311065
Epoch: 50, step: 1360, loss: 0.3236222267150879, mean loss: 0.3417354845932343
Epoch: 50, step: 1361, loss: 0.344558447599411, mean loss: 0.3417355229685232
Epoch: 50, step: 1362, loss: 0.35314488410949707, mean loss: 0.34173567806498667
Epoch: 50, step: 1363, loss: 0.34593918919563293, mean loss: 0.341735735205859
Epoch: 50, step: 1364, loss: 0.30226507782936096, mean loss: 0.3417351986646046
Epoch: 50, step: 1365, loss: 0.31944841146469116, mean loss: 0.3417348957150464
Epoch: 50, step: 1366, loss: 0.3133741319179535, mean loss: 0.3417345102057311
Epoch: 50, step: 1367, loss: 0.34500086307525635, mean loss: 0.3417345546048295
Epoch: 50, step: 1368, loss: 0.3791418671607971, mean loss: 0.3417350630705223
Epoch: 50, step: 1369, loss: 0.32497256994247437, mean loss: 0.34173483522638576
Epoch: 50, step: 1370, loss: 0.3306935131549835, mean loss: 0.3417346851492892
Epoch: 50, step: 1371, loss: 0.36037778854370117, mean loss: 0.3417349385487264
Epoch: 50, step: 1372, loss: 0.30726203322410583, mean loss: 0.34173446999497264
Epoch: 50, step: 1373, loss: 0.32608139514923096, mean loss: 0.34173425724216805
Epoch: 50, step: 1374, loss: 0.3602063059806824, mean loss: 0.3417345083063711
Epoch: 50, step: 1375, loss: 0.33506083488464355, mean loss: 0.3417344176018829
Epoch: 50, step: 1376, loss: 0.3663448393344879, mean loss: 0.3417347520871396
Epoch: 50, step: 1377, loss: 0.3337426483631134, mean loss: 0.3417346434663056
Epoch: 50, step: 1378, loss: 0.3455337584018707, mean loss: 0.3417346950994473
Epoch: 50, step: 1379, loss: 0.3215523660182953, mean loss: 0.341734420808484
Epoch: 50, step: 1380, loss: 0.3283536434173584, mean loss: 0.3417342389574981
Epoch: 50, step: 1381, loss: 0.3996414840221405, mean loss: 0.341735025933186
Epoch: 50, step: 1382, loss: 0.3185247480869293, mean loss: 0.34173471050329257
Epoch: 50, step: 1383, loss: 0.3026178777217865, mean loss: 0.3417341789090223
Epoch: 50, step: 1384, loss: 0.3299291431903839, mean loss: 0.3417340184818195
Epoch: 50, step: 1385, loss: 0.3270420432090759, mean loss: 0.34173381882461196
Epoch: 50, step: 1386, loss: 0.31060802936553955, mean loss: 0.34173339584515283
Epoch: 50, step: 1387, loss: 0.31591445207595825, mean loss: 0.3417330449870813
Epoch: 50, step: 1388, loss: 0.3330560326576233, mean loss: 0.34173292707526937
Epoch: 50, step: 1389, loss: 0.3126131594181061, mean loss: 0.3417325313724883
Epoch: 50, step: 1390, loss: 0.3359932601451874, mean loss: 0.34173245338372304
Epoch: 50, step: 1391, loss: 0.32387015223503113, mean loss: 0.3417322106630313
Epoch: 50, step: 1392, loss: 0.3430359959602356, mean loss: 0.3417322283791904
Epoch: 50, step: 1393, loss: 0.3045719861984253, mean loss: 0.3417317234434323
Epoch: 50, step: 1394, loss: 0.3315661549568176, mean loss: 0.3417315853149115
Epoch: 50, step: 1395, loss: 0.33266374468803406, mean loss: 0.3417314621038589
Epoch: 50, step: 1396, loss: 0.31597551703453064, mean loss: 0.34173111214468843
Epoch: 50, step: 1397, loss: 0.30777478218078613, mean loss: 0.3417306507689722
Epoch: 50, step: 1398, loss: 0.3131759762763977, mean loss: 0.34173026279257995
Epoch: 50, step: 1399, loss: 0.3122138977050781, mean loss: 0.34172986175501086
Epoch: 50, step: 1400, loss: 0.3142684996128082, mean loss: 0.34172948864374686
Epoch: 50, step: 1401, loss: 0.36036455631256104, mean loss: 0.34172974183072097
Epoch: 50, step: 1402, loss: 0.33722546696662903, mean loss: 0.3417296806338287
Epoch: 50, step: 1403, loss: 0.386327862739563, mean loss: 0.3417302865544594
Epoch: 50, step: 1404, loss: 0.33732151985168457, mean loss: 0.341730226656807
Epoch: 50, step: 1405, loss: 0.29243043065071106, mean loss: 0.34172955687722373
Epoch: 50, step: 1406, loss: 0.3707084357738495, mean loss: 0.3417299505745473
Epoch: 50, step: 1407, loss: 0.33023157715797424, mean loss: 0.34172979436362705
Epoch: 50, step: 1408, loss: 0.30965444445610046, mean loss: 0.34172935861052744
Epoch: 50, step: 1409, loss: 0.3533989191055298, mean loss: 0.3417295171427988
Epoch: 50, step: 1410, loss: 0.33161234855651855, mean loss: 0.34172937970181055
Epoch: 50, step: 1411, loss: 0.31721773743629456, mean loss: 0.3417290467174837
Epoch: 50, step: 1412, loss: 0.3121981620788574, mean loss: 0.34172864555349586
Epoch: 50, step: 1413, loss: 0.3396008312702179, mean loss: 0.3417286166484739
Epoch: 50, step: 1414, loss: 0.3359081447124481, mean loss: 0.3417285375820889
Epoch: 50, step: 1415, loss: 0.3677304983139038, mean loss: 0.3417288907928139
Epoch: 50, step: 1416, loss: 0.3178921043872833, mean loss: 0.3417285669982229
Epoch: 50, step: 1417, loss: 0.3201959431171417, mean loss: 0.3417282745069316
Epoch: 50, step: 1418, loss: 0.341436505317688, mean loss: 0.3417282705436994
Epoch: 50, step: 1419, loss: 0.330104261636734, mean loss: 0.3417281126517012
Epoch: 50, step: 1420, loss: 0.3378313183784485, mean loss: 0.3417280597212293
Epoch: 50, step: 1421, loss: 0.30817466974258423, mean loss: 0.3417276039690088
Epoch: 50, step: 1422, loss: 0.2945040464401245, mean loss: 0.3417269625450309
Epoch: 50, step: 1423, loss: 0.3492628335952759, mean loss: 0.3417270649012062
Epoch: 50, step: 1424, loss: 0.3450913727283478, mean loss: 0.3417271105963889
Epoch: 50, step: 1425, loss: 0.3056657016277313, mean loss: 0.34172662080461735
Epoch: 50, step: 1426, loss: 0.34914448857307434, mean loss: 0.34172672155390454
Epoch: 50, step: 1427, loss: 0.3701934516429901, mean loss: 0.3417271081830414
Epoch: 50, step: 1428, loss: 0.3519214391708374, mean loss: 0.3417272466384189
Epoch: 50, step: 1429, loss: 0.30122461915016174, mean loss: 0.34172669655519894
Epoch: 50, step: 1430, loss: 0.3732364773750305, mean loss: 0.34172712449697373
Epoch: 50, step: 1431, loss: 0.30932119488716125, mean loss: 0.3417266843903678
Epoch: 50, step: 1432, loss: 0.3351909816265106, mean loss: 0.341726595629856
Epoch: 50, step: 1433, loss: 0.35646945238113403, mean loss: 0.34172679584791765
Epoch: 50, step: 1434, loss: 0.3135363459587097, mean loss: 0.3417264130075579
Epoch: 50, step: 1435, loss: 0.32298216223716736, mean loss: 0.3417261584547472
Epoch: 50, step: 1436, loss: 0.31391265988349915, mean loss: 0.34172578074383325
Epoch: 50, step: 1437, loss: 0.3310512602329254, mean loss: 0.3417256357844303
Epoch: 50, step: 1438, loss: 0.3367389738559723, mean loss: 0.3417255680667545
Epoch: 50, step: 1439, loss: 0.3184587359428406, mean loss: 0.34172525211303206
Epoch: 50, step: 1440, loss: 0.3333859443664551, mean loss: 0.34172513887030387
Epoch: 50, step: 1441, loss: 0.3291897773742676, mean loss: 0.3417249686500288
Epoch: 50, step: 1442, loss: 0.31379327178001404, mean loss: 0.3417245893648711
Epoch: 50, step: 1443, loss: 0.3525845408439636, mean loss: 0.34172473683040094
Valid: 50, mean loss: 0.18598592032988864
Epoch: 51, step: 0, loss: 0.3428782522678375, mean loss: 0.34172475249358836
Epoch: 51, step: 1, loss: 0.301866739988327, mean loss: 0.34172421128276215
Epoch: 51, step: 2, loss: 0.3584465980529785, mean loss: 0.3417244383441057
Epoch: 51, step: 3, loss: 0.34593403339385986, mean loss: 0.34172449550241346
Epoch: 51, step: 4, loss: 0.32931917905807495, mean loss: 0.341724327064058
Epoch: 51, step: 5, loss: 0.30580833554267883, mean loss: 0.34172383940633194
Epoch: 51, step: 6, loss: 0.35623282194137573, mean loss: 0.3417240364027412
Epoch: 51, step: 7, loss: 0.33831751346588135, mean loss: 0.3417239901511399
Epoch: 51, step: 8, loss: 0.3323342204093933, mean loss: 0.3417238626645509
Epoch: 51, step: 9, loss: 0.3302292823791504, mean loss: 0.34172370660269025
Epoch: 51, step: 10, loss: 0.35548135638237, mean loss: 0.34172389338769843
Epoch: 51, step: 11, loss: 0.3283272385597229, mean loss: 0.34172371150631975
Epoch: 51, step: 12, loss: 0.33437255024909973, mean loss: 0.34172361170370413
Epoch: 51, step: 13, loss: 0.28480663895606995, mean loss: 0.34172283898420663
Epoch: 51, step: 14, loss: 0.3425193130970001, mean loss: 0.34172284979719775
Epoch: 51, step: 15, loss: 0.34581074118614197, mean loss: 0.3417229052939584
Epoch: 51, step: 16, loss: 0.3374663293361664, mean loss: 0.3417228475079392
Epoch: 51, step: 17, loss: 0.3777436316013336, mean loss: 0.34172333650883646
Epoch: 51, step: 18, loss: 0.33433765172958374, mean loss: 0.34172323624568157
Epoch: 51, step: 19, loss: 0.36193203926086426, mean loss: 0.34172351058325506
Epoch: 51, step: 20, loss: 0.3024289309978485, mean loss: 0.34172297716060407
Epoch: 51, step: 21, loss: 0.32706379890441895, mean loss: 0.3417227781654332
Epoch: 51, step: 22, loss: 0.30736109614372253, mean loss: 0.3417223117193716
Epoch: 51, step: 23, loss: 0.3571512997150421, mean loss: 0.3417225211588568
Epoch: 51, step: 24, loss: 0.35512152314186096, mean loss: 0.34172270304000063
Epoch: 51, step: 25, loss: 0.3076900839805603, mean loss: 0.3417222410796496
Epoch: 51, step: 26, loss: 0.316199392080307, mean loss: 0.3417218946360151
Epoch: 51, step: 27, loss: 0.28766706585884094, mean loss: 0.34172116091317906
Epoch: 51, step: 28, loss: 0.3244588077068329, mean loss: 0.3417209266027369
Epoch: 51, step: 29, loss: 0.3014458119869232, mean loss: 0.3417203799361433
Epoch: 51, step: 30, loss: 0.368869811296463, mean loss: 0.3417207484387746
Epoch: 51, step: 31, loss: 0.3342069685459137, mean loss: 0.34172064645468353
Epoch: 51, step: 32, loss: 0.31921881437301636, mean loss: 0.34172034104279
Epoch: 51, step: 33, loss: 0.34498754143714905, mean loss: 0.34172038538710436
Epoch: 51, step: 34, loss: 0.3306444585323334, mean loss: 0.34172023506032395
Epoch: 51, step: 35, loss: 0.35860973596572876, mean loss: 0.34172046428807784
Epoch: 51, step: 36, loss: 0.3038325607776642, mean loss: 0.3417199500726965
Epoch: 51, step: 37, loss: 0.35526466369628906, mean loss: 0.34172013389932476
Epoch: 51, step: 38, loss: 0.30930137634277344, mean loss: 0.34171969392324403
Epoch: 51, step: 39, loss: 0.32868775725364685, mean loss: 0.34171951706074105
Epoch: 51, step: 40, loss: 0.32908734679222107, mean loss: 0.34171934562598133
Epoch: 51, step: 41, loss: 0.31832677125930786, mean loss: 0.341719028163039
Epoch: 51, step: 42, loss: 0.31686437129974365, mean loss: 0.341718690862608
Epoch: 51, step: 43, loss: 0.32838067412376404, mean loss: 0.34171850985597546
Epoch: 51, step: 44, loss: 0.32269397377967834, mean loss: 0.34171825168262426
Epoch: 51, step: 45, loss: 0.34201496839523315, mean loss: 0.3417182557091776
Epoch: 51, step: 46, loss: 0.34176990389823914, mean loss: 0.3417182564100527
Epoch: 51, step: 47, loss: 0.31184911727905273, mean loss: 0.34171785108601305
Epoch: 51, step: 48, loss: 0.3548465669155121, mean loss: 0.3417180292401909
Epoch: 51, step: 49, loss: 0.3230189383029938, mean loss: 0.341717775500525
Epoch: 51, step: 50, loss: 0.37010520696640015, mean loss: 0.34171816070211897
Epoch: 51, step: 51, loss: 0.3505009114742279, mean loss: 0.3417182798775257
Epoch: 51, step: 52, loss: 0.315522700548172, mean loss: 0.34171792442778787
Epoch: 51, step: 53, loss: 0.35200005769729614, mean loss: 0.34171806394491544
Epoch: 51, step: 54, loss: 0.35220301151275635, mean loss: 0.3417182062120774
Epoch: 51, step: 55, loss: 0.3296736478805542, mean loss: 0.3417180427852343
Epoch: 51, step: 56, loss: 0.32672491669654846, mean loss: 0.3417178393534479
Epoch: 51, step: 57, loss: 0.30182337760925293, mean loss: 0.34171729805929385
Epoch: 51, step: 58, loss: 0.3606342375278473, mean loss: 0.3417175547237372
Epoch: 51, step: 59, loss: 0.31861791014671326, mean loss: 0.34171724131273407
Epoch: 51, step: 60, loss: 0.3239518702030182, mean loss: 0.3417170002792749
Epoch: 51, step: 61, loss: 0.2956111431121826, mean loss: 0.34171637474190797
Epoch: 51, step: 62, loss: 0.3037009537220001, mean loss: 0.34171585897785545
Epoch: 51, step: 63, loss: 0.3161216080188751, mean loss: 0.3417155117394151
Epoch: 51, step: 64, loss: 0.3101062774658203, mean loss: 0.3417150829012234
Epoch: 51, step: 65, loss: 0.33171817660331726, mean loss: 0.3417149472763923
Epoch: 51, step: 66, loss: 0.34680354595184326, mean loss: 0.3417150163108468
Epoch: 51, step: 67, loss: 0.3171057403087616, mean loss: 0.34171468245372716
Epoch: 51, step: 68, loss: 0.34896719455718994, mean loss: 0.34171478084223533
Epoch: 51, step: 69, loss: 0.34182673692703247, mean loss: 0.3417147823610253
Epoch: 51, step: 70, loss: 0.30364325642585754, mean loss: 0.34171426589184084
Epoch: 51, step: 71, loss: 0.3406772017478943, mean loss: 0.3417142518234684
Epoch: 51, step: 72, loss: 0.33792468905448914, mean loss: 0.34171420041656403
Epoch: 51, step: 73, loss: 0.3568832278251648, mean loss: 0.3417144061875753
Epoch: 51, step: 74, loss: 0.30325594544410706, mean loss: 0.34171388449763457
Epoch: 51, step: 75, loss: 0.3376598656177521, mean loss: 0.3417138295055174
Epoch: 51, step: 76, loss: 0.32950568199157715, mean loss: 0.3417136639061968
Epoch: 51, step: 77, loss: 0.3087773323059082, mean loss: 0.34171321714225117
Epoch: 51, step: 78, loss: 0.292874276638031, mean loss: 0.34171255467679934
Epoch: 51, step: 79, loss: 0.3001810908317566, mean loss: 0.3417119913397063
Epoch: 51, step: 80, loss: 0.3162551522254944, mean loss: 0.3417116460451778
Epoch: 51, step: 81, loss: 0.34317830204963684, mean loss: 0.34171166593851265
Epoch: 51, step: 82, loss: 0.3342932462692261, mean loss: 0.34171156531839153
Epoch: 51, step: 83, loss: 0.381644606590271, mean loss: 0.3417121069449279
Epoch: 51, step: 84, loss: 0.35370534658432007, mean loss: 0.34171226961144496
Epoch: 51, step: 85, loss: 0.3483281135559082, mean loss: 0.3417123593421373
Epoch: 51, step: 86, loss: 0.39491721987724304, mean loss: 0.3417130809498808
Epoch: 51, step: 87, loss: 0.31777969002723694, mean loss: 0.34171275635010157
Epoch: 51, step: 88, loss: 0.39897066354751587, mean loss: 0.3417135329075073
Epoch: 51, step: 89, loss: 0.30511873960494995, mean loss: 0.34171303659924646
Epoch: 51, step: 90, loss: 0.36004137992858887, mean loss: 0.3417132851697127
Epoch: 51, step: 91, loss: 0.31808486580848694, mean loss: 0.341712964723535
Epoch: 51, step: 92, loss: 0.3238508701324463, mean loss: 0.3417127224829422
Epoch: 51, step: 93, loss: 0.3192686438560486, mean loss: 0.34171241810692676
Epoch: 51, step: 94, loss: 0.3977051377296448, mean loss: 0.34171317744350066
Epoch: 51, step: 95, loss: 0.3448260426521301, mean loss: 0.3417132196575664
Epoch: 51, step: 96, loss: 0.33807480335235596, mean loss: 0.3417131703170868
Epoch: 51, step: 97, loss: 0.3313037157058716, mean loss: 0.3417130291566272
Epoch: 51, step: 98, loss: 0.3220197260379791, mean loss: 0.34171276210344087
Epoch: 51, step: 99, loss: 0.3551507890224457, mean loss: 0.3417129443288005
Epoch: 51, step: 100, loss: 0.2992788851261139, mean loss: 0.34171236891271534
Epoch: 51, step: 101, loss: 0.32890453934669495, mean loss: 0.34171219523781005
Epoch: 51, step: 102, loss: 0.32672974467277527, mean loss: 0.34171199207767383
Epoch: 51, step: 103, loss: 0.32549458742141724, mean loss: 0.34171177217469806
Epoch: 51, step: 104, loss: 0.30351245403289795, mean loss: 0.34171125421081866
Epoch: 51, step: 105, loss: 0.33539536595344543, mean loss: 0.34171116857165584
Epoch: 51, step: 106, loss: 0.399555504322052, mean loss: 0.34171195289099726
Epoch: 51, step: 107, loss: 0.32632291316986084, mean loss: 0.34171174423171047
Epoch: 51, step: 108, loss: 0.35294193029403687, mean loss: 0.34171189649922584
Epoch: 51, step: 109, loss: 0.313504695892334, mean loss: 0.34171151404945216
Epoch: 51, step: 110, loss: 0.3265506327152252, mean loss: 0.3417113084921159
Epoch: 51, step: 111, loss: 0.3584275543689728, mean loss: 0.3417115351346382
Epoch: 51, step: 112, loss: 0.3543052077293396, mean loss: 0.34171170588009414
Epoch: 51, step: 113, loss: 0.3519001305103302, mean loss: 0.3417118440132408
Epoch: 51, step: 114, loss: 0.30132681131362915, mean loss: 0.3417112964863939
Epoch: 51, step: 115, loss: 0.311868816614151, mean loss: 0.34171089189745857
Epoch: 51, step: 116, loss: 0.3321802318096161, mean loss: 0.34171076268744127
Epoch: 51, step: 117, loss: 0.3087218403816223, mean loss: 0.34171031545279057
Epoch: 51, step: 118, loss: 0.3275044858455658, mean loss: 0.34171012286531977
Epoch: 51, step: 119, loss: 0.33422210812568665, mean loss: 0.3417100213521868
Epoch: 51, step: 120, loss: 0.3529609739780426, mean loss: 0.34171017387645475
Epoch: 51, step: 121, loss: 0.3615148067474365, mean loss: 0.34171044235560327
Epoch: 51, step: 122, loss: 0.3700370490550995, mean loss: 0.34171082635667016
Epoch: 51, step: 123, loss: 0.3544837236404419, mean loss: 0.3417109995062375
Epoch: 51, step: 124, loss: 0.3215656876564026, mean loss: 0.34171072641982114
Epoch: 51, step: 125, loss: 0.37880828976631165, mean loss: 0.3417112293012546
Epoch: 51, step: 126, loss: 0.3023611605167389, mean loss: 0.34171069589288566
Epoch: 51, step: 127, loss: 0.32374846935272217, mean loss: 0.3417104524099038
Epoch: 51, step: 128, loss: 0.3233271837234497, mean loss: 0.34171020322295614
Epoch: 51, step: 129, loss: 0.33827465772628784, mean loss: 0.3417101566544429
Epoch: 51, step: 130, loss: 0.32414138317108154, mean loss: 0.3417099185145109
Epoch: 51, step: 131, loss: 0.3191079795360565, mean loss: 0.3417096121555462
Epoch: 51, step: 132, loss: 0.3741198778152466, mean loss: 0.34171005145594685
Epoch: 51, step: 133, loss: 0.36317095160484314, mean loss: 0.34171034234076547
Epoch: 51, step: 134, loss: 0.3687305748462677, mean loss: 0.34171070857278957
Epoch: 51, step: 135, loss: 0.32486265897750854, mean loss: 0.34171048021754974
Epoch: 51, step: 136, loss: 0.330613374710083, mean loss: 0.34171032981154403
Epoch: 51, step: 137, loss: 0.3377785086631775, mean loss: 0.3417102765218372
Epoch: 51, step: 138, loss: 0.3275124430656433, mean loss: 0.3417100840949441
Epoch: 51, step: 139, loss: 0.3522651791572571, mean loss: 0.3417102271489268
Epoch: 51, step: 140, loss: 0.3451117277145386, mean loss: 0.3417102732490903
Epoch: 51, step: 141, loss: 0.34665927290916443, mean loss: 0.34171034032143005
Epoch: 51, step: 142, loss: 0.3164491653442383, mean loss: 0.34170999796878015
Epoch: 51, step: 143, loss: 0.3783361613750458, mean loss: 0.34171049433896783
Epoch: 51, step: 144, loss: 0.32422083616256714, mean loss: 0.3417102573164011
Epoch: 51, step: 145, loss: 0.33444952964782715, mean loss: 0.3417101589192244
Epoch: 51, step: 146, loss: 0.29970744252204895, mean loss: 0.3417095897073097
Epoch: 51, step: 147, loss: 0.3357270061969757, mean loss: 0.34170950863370403
Epoch: 51, step: 148, loss: 0.3487500250339508, mean loss: 0.3417096040427049
Epoch: 51, step: 149, loss: 0.33251455426216125, mean loss: 0.341709479438404
Epoch: 51, step: 150, loss: 0.3178717792034149, mean loss: 0.3417091564124506
Epoch: 51, step: 151, loss: 0.29469040036201477, mean loss: 0.34170851926740137
Epoch: 51, step: 152, loss: 0.3461090326309204, mean loss: 0.3417085788973777
Epoch: 51, step: 153, loss: 0.3203981816768646, mean loss: 0.34170829013078213
Epoch: 51, step: 154, loss: 0.36204734444618225, mean loss: 0.3417085657314585
Epoch: 51, step: 155, loss: 0.331868976354599, mean loss: 0.3417084324036892
Epoch: 51, step: 156, loss: 0.3549099564552307, mean loss: 0.34170861128370505
Epoch: 51, step: 157, loss: 0.3483113944530487, mean loss: 0.34170870074988713
Epoch: 51, step: 158, loss: 0.334612101316452, mean loss: 0.341708604593912
Epoch: 51, step: 159, loss: 0.3109778165817261, mean loss: 0.3417081882101386
Epoch: 51, step: 160, loss: 0.3346439599990845, mean loss: 0.34170809249537387
Epoch: 51, step: 161, loss: 0.3384416997432709, mean loss: 0.34170804823890755
Epoch: 51, step: 162, loss: 0.2939130663871765, mean loss: 0.3417074006718495
Epoch: 51, step: 163, loss: 0.3614765703678131, mean loss: 0.34170766851774287
Epoch: 51, step: 164, loss: 0.4307252764701843, mean loss: 0.34170887457131294
Epoch: 51, step: 165, loss: 0.3450964093208313, mean loss: 0.3417089204666489
Epoch: 51, step: 166, loss: 0.33509910106658936, mean loss: 0.34170883091604803
Epoch: 51, step: 167, loss: 0.33665987849235535, mean loss: 0.341708762513181
Epoch: 51, step: 168, loss: 0.3251574635505676, mean loss: 0.3417085382803363
Epoch: 51, step: 169, loss: 0.3256930410861969, mean loss: 0.34170832130933904
Epoch: 51, step: 170, loss: 0.3228242099285126, mean loss: 0.341708065479069
Epoch: 51, step: 171, loss: 0.2945033609867096, mean loss: 0.34170742598757
Epoch: 51, step: 172, loss: 0.34452682733535767, mean loss: 0.34170746418204206
Epoch: 51, step: 173, loss: 0.33775684237480164, mean loss: 0.3417074106636345
Epoch: 51, step: 174, loss: 0.31194478273391724, mean loss: 0.34170700747979393
Epoch: 51, step: 175, loss: 0.30076006054878235, mean loss: 0.34170645279343614
Epoch: 51, step: 176, loss: 0.3203165531158447, mean loss: 0.34170616303984735
Epoch: 51, step: 177, loss: 0.33752259612083435, mean loss: 0.3417061063688425
Epoch: 51, step: 178, loss: 0.30050143599510193, mean loss: 0.3417055482139264
Epoch: 51, step: 179, loss: 0.33322522044181824, mean loss: 0.34170543334169284
Epoch: 51, step: 180, loss: 0.34462153911590576, mean loss: 0.34170547284194036
Epoch: 51, step: 181, loss: 0.3144812285900116, mean loss: 0.3417051040796581
Epoch: 51, step: 182, loss: 0.3025413453578949, mean loss: 0.3417045735994988
Epoch: 51, step: 183, loss: 0.34425970911979675, mean loss: 0.34170460820880044
Epoch: 51, step: 184, loss: 0.30978846549987793, mean loss: 0.3417041759106153
Epoch: 51, step: 185, loss: 0.35654401779174805, mean loss: 0.3417043769107762
Epoch: 51, step: 186, loss: 0.33463695645332336, mean loss: 0.3417042811864808
Epoch: 51, step: 187, loss: 0.3858359456062317, mean loss: 0.34170487891733486
Epoch: 51, step: 188, loss: 0.30109405517578125, mean loss: 0.3417043288811215
Epoch: 51, step: 189, loss: 0.34078890085220337, mean loss: 0.3417043164826597
Epoch: 51, step: 190, loss: 0.3455497920513153, mean loss: 0.34170436856467457
Epoch: 51, step: 191, loss: 0.29321154952049255, mean loss: 0.3417037118007783
Epoch: 51, step: 192, loss: 0.3416063189506531, mean loss: 0.3417037104817533
Epoch: 51, step: 193, loss: 0.31735754013061523, mean loss: 0.34170338075762274
Epoch: 51, step: 194, loss: 0.3297727108001709, mean loss: 0.3417032191808143
Epoch: 51, step: 195, loss: 0.3206816017627716, mean loss: 0.3417029344893541
Epoch: 51, step: 196, loss: 0.32702234387397766, mean loss: 0.341702735675814
Epoch: 51, step: 197, loss: 0.31909677386283875, mean loss: 0.3417024295361941
Epoch: 51, step: 198, loss: 0.35717660188674927, mean loss: 0.3417026390912278
Epoch: 51, step: 199, loss: 0.38046202063560486, mean loss: 0.3417031639731619
Epoch: 51, step: 200, loss: 0.3414852023124695, mean loss: 0.3417031610215516
Epoch: 51, step: 201, loss: 0.31202664971351624, mean loss: 0.34170275915129045
Epoch: 51, step: 202, loss: 0.36875292658805847, mean loss: 0.341703125451444
Epoch: 51, step: 203, loss: 0.3435431122779846, mean loss: 0.34170315036730936
Epoch: 51, step: 204, loss: 0.3290656507015228, mean loss: 0.3417029792410969
Epoch: 51, step: 205, loss: 0.3267611861228943, mean loss: 0.3417027769148529
Epoch: 51, step: 206, loss: 0.34756574034690857, mean loss: 0.3417028563039395
Epoch: 51, step: 207, loss: 0.34630921483039856, mean loss: 0.3417029186767733
Epoch: 51, step: 208, loss: 0.31278297305107117, mean loss: 0.3417025270888131
Epoch: 51, step: 209, loss: 0.3644685745239258, mean loss: 0.3417028353462864
Epoch: 51, step: 210, loss: 0.3184744715690613, mean loss: 0.341702520833203
Epoch: 51, step: 211, loss: 0.3431834876537323, mean loss: 0.34170254088528845
Epoch: 51, step: 212, loss: 0.3703383803367615, mean loss: 0.34170292860533463
Epoch: 51, step: 213, loss: 0.3438916802406311, mean loss: 0.3417029582399258
Epoch: 51, step: 214, loss: 0.3156847059726715, mean loss: 0.3417026059707065
Epoch: 51, step: 215, loss: 0.32615721225738525, mean loss: 0.34170239549962994
Epoch: 51, step: 216, loss: 0.3398926556110382, mean loss: 0.34170237099766154
Epoch: 51, step: 217, loss: 0.32501277327537537, mean loss: 0.3417021450411789
Epoch: 51, step: 218, loss: 0.31217730045318604, mean loss: 0.34170174531676223
Epoch: 51, step: 219, loss: 0.31434375047683716, mean loss: 0.34170137493342473
Epoch: 51, step: 220, loss: 0.31101757287979126, mean loss: 0.34170095952961976
Epoch: 51, step: 221, loss: 0.3085927367210388, mean loss: 0.3417005113095617
Epoch: 51, step: 222, loss: 0.3173825144767761, mean loss: 0.3417001820962888
Epoch: 51, step: 223, loss: 0.3017812669277191, mean loss: 0.3416996416875168
Epoch: 51, step: 224, loss: 0.31338173151016235, mean loss: 0.3416992583344164
Epoch: 51, step: 225, loss: 0.3403882682323456, mean loss: 0.3416992405871563
Epoch: 51, step: 226, loss: 0.31264713406562805, mean loss: 0.3416988473055367
Epoch: 51, step: 227, loss: 0.34302660822868347, mean loss: 0.3416988652793417
Epoch: 51, step: 228, loss: 0.351500540971756, mean loss: 0.34169899796213093
Epoch: 51, step: 229, loss: 0.30058416724205017, mean loss: 0.3416984414086653
Epoch: 51, step: 230, loss: 0.30442747473716736, mean loss: 0.34169793689473404
Epoch: 51, step: 231, loss: 0.3592437207698822, mean loss: 0.34169817439789985
Epoch: 51, step: 232, loss: 0.31968188285827637, mean loss: 0.341697876385101
Epoch: 51, step: 233, loss: 0.3115841746330261, mean loss: 0.3416974687711733
Epoch: 51, step: 234, loss: 0.3305218815803528, mean loss: 0.34169731750237986
Epoch: 51, step: 235, loss: 0.32352063059806824, mean loss: 0.3416970714725084
Epoch: 51, step: 236, loss: 0.3087264895439148, mean loss: 0.3416966252064599
Epoch: 51, step: 237, loss: 0.32212620973587036, mean loss: 0.34169636031899786
Epoch: 51, step: 238, loss: 0.3441019058227539, mean loss: 0.3416963928778477
Epoch: 51, step: 239, loss: 0.34465107321739197, mean loss: 0.3416964328686487
Epoch: 51, step: 240, loss: 0.34438464045524597, mean loss: 0.34169646925232044
Epoch: 51, step: 241, loss: 0.31469371914863586, mean loss: 0.3416961037872783
Epoch: 51, step: 242, loss: 0.3296736776828766, mean loss: 0.3416959410735925
Epoch: 51, step: 243, loss: 0.31547465920448303, mean loss: 0.34169558619483187
Epoch: 51, step: 244, loss: 0.34095898270606995, mean loss: 0.34169557622577706
Epoch: 51, step: 245, loss: 0.34861165285110474, mean loss: 0.3416956698254066
Epoch: 51, step: 246, loss: 0.299614816904068, mean loss: 0.34169510032637535
Epoch: 51, step: 247, loss: 0.29556071758270264, mean loss: 0.3416944759775589
Epoch: 51, step: 248, loss: 0.31898725032806396, mean loss: 0.3416941686788209
Epoch: 51, step: 249, loss: 0.30899104475975037, mean loss: 0.34169372611076504
Epoch: 51, step: 250, loss: 0.35924622416496277, mean loss: 0.3416939636437247
Epoch: 51, step: 251, loss: 0.3119667172431946, mean loss: 0.3416935613588053
Epoch: 51, step: 252, loss: 0.29855650663375854, mean loss: 0.34169297761312245
Epoch: 51, step: 253, loss: 0.32290080189704895, mean loss: 0.34169272331428197
Epoch: 51, step: 254, loss: 0.34153950214385986, mean loss: 0.3416927212408957
Epoch: 51, step: 255, loss: 0.3270673155784607, mean loss: 0.34169252333283534
Epoch: 51, step: 256, loss: 0.3042432963848114, mean loss: 0.34169201658425347
Epoch: 51, step: 257, loss: 0.31138280034065247, mean loss: 0.34169160645710883
Epoch: 51, step: 258, loss: 0.31308525800704956, mean loss: 0.3416912193774443
Epoch: 51, step: 259, loss: 0.32825028896331787, mean loss: 0.3416910375073099
Epoch: 51, step: 260, loss: 0.32338371872901917, mean loss: 0.3416907897930987
Epoch: 51, step: 261, loss: 0.30387088656425476, mean loss: 0.34169027806329016
Epoch: 51, step: 262, loss: 0.3097938597202301, mean loss: 0.341689846488225
Epoch: 51, step: 263, loss: 0.34832248091697693, mean loss: 0.34168993622999083
Epoch: 51, step: 264, loss: 0.3147351145744324, mean loss: 0.34168957152715823
Epoch: 51, step: 265, loss: 0.3018641769886017, mean loss: 0.34168903269080947
Epoch: 51, step: 266, loss: 0.37539249658584595, mean loss: 0.3416894886914575
Epoch: 51, step: 267, loss: 0.3254387676715851, mean loss: 0.34168926882565737
Epoch: 51, step: 268, loss: 0.4714025855064392, mean loss: 0.3416910237715624
Epoch: 51, step: 269, loss: 0.29685044288635254, mean loss: 0.34169041711273074
Epoch: 51, step: 270, loss: 0.3356192409992218, mean loss: 0.3416903349754634
Epoch: 51, step: 271, loss: 0.2849719822406769, mean loss: 0.3416895676402081
Epoch: 51, step: 272, loss: 0.3395921587944031, mean loss: 0.34168953926501905
Epoch: 51, step: 273, loss: 0.3241436779499054, mean loss: 0.34168930189575425
Epoch: 51, step: 274, loss: 0.35473841428756714, mean loss: 0.3416894784283425
Epoch: 51, step: 275, loss: 0.32142505049705505, mean loss: 0.34168920428835425
Epoch: 51, step: 276, loss: 0.2873503267765045, mean loss: 0.34168846919443624
Epoch: 51, step: 277, loss: 0.33544009923934937, mean loss: 0.3416883846679089
Epoch: 51, step: 278, loss: 0.3314814269542694, mean loss: 0.34168824659237473
Epoch: 51, step: 279, loss: 0.3556276261806488, mean loss: 0.34168843515602915
Epoch: 51, step: 280, loss: 0.3451436758041382, mean loss: 0.3416884818958418
Epoch: 51, step: 281, loss: 0.35043230652809143, mean loss: 0.34168860017391217
Epoch: 51, step: 282, loss: 0.3216400742530823, mean loss: 0.34168832898035745
Epoch: 51, step: 283, loss: 0.3013206124305725, mean loss: 0.3416877829393912
Epoch: 51, step: 284, loss: 0.3307792842388153, mean loss: 0.3416876353856748
Epoch: 51, step: 285, loss: 0.33498814702033997, mean loss: 0.34168754476632723
Epoch: 51, step: 286, loss: 0.3621325194835663, mean loss: 0.34168782130762543
Epoch: 51, step: 287, loss: 0.3293069899082184, mean loss: 0.3416876538452086
Epoch: 51, step: 288, loss: 0.29937803745269775, mean loss: 0.34168708157549965
Epoch: 51, step: 289, loss: 0.3166578412055969, mean loss: 0.34168674304058516
Epoch: 51, step: 290, loss: 0.35132595896720886, mean loss: 0.3416868734147777
Epoch: 51, step: 291, loss: 0.3700946867465973, mean loss: 0.34168725763644686
Epoch: 51, step: 292, loss: 0.375577449798584, mean loss: 0.34168771600224696
Epoch: 51, step: 293, loss: 0.3308910131454468, mean loss: 0.3416875699785128
Epoch: 51, step: 294, loss: 0.3627043664455414, mean loss: 0.341687854223586
Epoch: 51, step: 295, loss: 0.30288031697273254, mean loss: 0.3416873293718515
Epoch: 51, step: 296, loss: 0.35786324739456177, mean loss: 0.3416875481397613
Epoch: 51, step: 297, loss: 0.3091047704219818, mean loss: 0.3416871074865775
Epoch: 51, step: 298, loss: 0.30467456579208374, mean loss: 0.34168660693153247
Epoch: 51, step: 299, loss: 0.3076922297477722, mean loss: 0.34168614720015217
Epoch: 51, step: 300, loss: 0.34803688526153564, mean loss: 0.3416862330847699
Epoch: 51, step: 301, loss: 0.3029722273349762, mean loss: 0.3416857095404842
Epoch: 51, step: 302, loss: 0.35792553424835205, mean loss: 0.34168592915486623
Epoch: 51, step: 303, loss: 0.29510220885276794, mean loss: 0.34168529920246316
Epoch: 51, step: 304, loss: 0.3666878938674927, mean loss: 0.341685637308383
Epoch: 51, step: 305, loss: 0.3258204758167267, mean loss: 0.34168542276934993
Epoch: 51, step: 306, loss: 0.32660144567489624, mean loss: 0.34168521879675867
Epoch: 51, step: 307, loss: 0.3281457722187042, mean loss: 0.341685035712507
Epoch: 51, step: 308, loss: 0.35149383544921875, mean loss: 0.3416851683480963
Epoch: 51, step: 309, loss: 0.305398166179657, mean loss: 0.3416846776781911
Epoch: 51, step: 310, loss: 0.33921974897384644, mean loss: 0.34168464434807544
Epoch: 51, step: 311, loss: 0.3088401257991791, mean loss: 0.3416842002391654
Epoch: 51, step: 312, loss: 0.34635815024375916, mean loss: 0.34168426343737524
Epoch: 51, step: 313, loss: 0.32170721888542175, mean loss: 0.3416839933240061
Epoch: 51, step: 314, loss: 0.3334668278694153, mean loss: 0.3416838822196719
Epoch: 51, step: 315, loss: 0.3486642837524414, mean loss: 0.341683976600439
Epoch: 51, step: 316, loss: 0.3057061731815338, mean loss: 0.34168349015753774
Epoch: 51, step: 317, loss: 0.3790222406387329, mean loss: 0.34168399499448754
Epoch: 51, step: 318, loss: 0.3104359209537506, mean loss: 0.34168357251197545
Epoch: 51, step: 319, loss: 0.37858715653419495, mean loss: 0.3416840714517843
Epoch: 51, step: 320, loss: 0.3386286199092865, mean loss: 0.3416840301423604
Epoch: 51, step: 321, loss: 0.363191157579422, mean loss: 0.34168432091281487
Epoch: 51, step: 322, loss: 0.31840062141418457, mean loss: 0.34168400612785
Epoch: 51, step: 323, loss: 0.3895609974861145, mean loss: 0.34168465339411863
Epoch: 51, step: 324, loss: 0.30639564990997314, mean loss: 0.34168417631583603
Epoch: 51, step: 325, loss: 0.31727468967437744, mean loss: 0.341683846324128
Epoch: 51, step: 326, loss: 0.31018537282943726, mean loss: 0.3416834205022046
Epoch: 51, step: 327, loss: 0.3227200508117676, mean loss: 0.34168316414345146
Epoch: 51, step: 328, loss: 0.32616177201271057, mean loss: 0.34168295431835133
Epoch: 51, step: 329, loss: 0.34840667247772217, mean loss: 0.3416830452113429
Epoch: 51, step: 330, loss: 0.32863783836364746, mean loss: 0.3416828688651875
Epoch: 51, step: 331, loss: 0.3075769543647766, mean loss: 0.34168240782492443
Epoch: 51, step: 332, loss: 0.35812821984291077, mean loss: 0.34168263013472366
Epoch: 51, step: 333, loss: 0.33213722705841064, mean loss: 0.3416825011044298
Epoch: 51, step: 334, loss: 0.32593676447868347, mean loss: 0.3416822882638044
Epoch: 51, step: 335, loss: 0.32305803894996643, mean loss: 0.3416820365167199
Epoch: 51, step: 336, loss: 0.32067763805389404, mean loss: 0.3416817526006001
Epoch: 51, step: 337, loss: 0.3142470717430115, mean loss: 0.3416813817714679
Epoch: 51, step: 338, loss: 0.35374173521995544, mean loss: 0.3416815447866666
Epoch: 51, step: 339, loss: 0.34988224506378174, mean loss: 0.34168165563090697
Epoch: 51, step: 340, loss: 0.32878297567367554, mean loss: 0.3416814812890815
Epoch: 51, step: 341, loss: 0.3349568843841553, mean loss: 0.3416813903989549
Epoch: 51, step: 342, loss: 0.31021827459335327, mean loss: 0.34168096514700785
Epoch: 51, step: 343, loss: 0.35370326042175293, mean loss: 0.3416811276368072
Epoch: 51, step: 344, loss: 0.31447136402130127, mean loss: 0.3416807598826327
Epoch: 51, step: 345, loss: 0.35491201281547546, mean loss: 0.34168093870751354
Epoch: 51, step: 346, loss: 0.35579243302345276, mean loss: 0.34168112942657825
Epoch: 51, step: 347, loss: 0.31342053413391113, mean loss: 0.34168074748535093
Epoch: 51, step: 348, loss: 0.3278804123401642, mean loss: 0.34168056097669275
Epoch: 51, step: 349, loss: 0.3036123216152191, mean loss: 0.34168004649931133
Epoch: 51, step: 350, loss: 0.31363770365715027, mean loss: 0.3416796675231259
Epoch: 51, step: 351, loss: 0.32508909702301025, mean loss: 0.3416794433141078
Epoch: 51, step: 352, loss: 0.33377617597579956, mean loss: 0.3416793365088679
Epoch: 51, step: 353, loss: 0.35890939831733704, mean loss: 0.3416795693538341
Epoch: 51, step: 354, loss: 0.32201653718948364, mean loss: 0.3416793036335924
Epoch: 51, step: 355, loss: 0.345233678817749, mean loss: 0.34167935166568947
Epoch: 51, step: 356, loss: 0.36737504601478577, mean loss: 0.34167969890010996
Epoch: 51, step: 357, loss: 0.34485241770744324, mean loss: 0.3416797417735297
Epoch: 51, step: 358, loss: 0.29340165853500366, mean loss: 0.3416790893934473
Epoch: 51, step: 359, loss: 0.34211239218711853, mean loss: 0.341679095248574
Epoch: 51, step: 360, loss: 0.3488236963748932, mean loss: 0.3416791917907147
Epoch: 51, step: 361, loss: 0.3184575140476227, mean loss: 0.3416788780097004
Epoch: 51, step: 362, loss: 0.3657192289829254, mean loss: 0.34167920284858017
Epoch: 51, step: 363, loss: 0.3499550521373749, mean loss: 0.3416793146722923
Epoch: 51, step: 364, loss: 0.35246193408966064, mean loss: 0.34167946036564606
Epoch: 51, step: 365, loss: 0.3195399045944214, mean loss: 0.34167916122288466
Epoch: 51, step: 366, loss: 0.32815027236938477, mean loss: 0.34167897842723466
Epoch: 51, step: 367, loss: 0.33615371584892273, mean loss: 0.34167890377363014
Epoch: 51, step: 368, loss: 0.3416316509246826, mean loss: 0.3416789031351903
Epoch: 51, step: 369, loss: 0.30645492672920227, mean loss: 0.3416784272255461
Epoch: 51, step: 370, loss: 0.4250951409339905, mean loss: 0.34167955424998314
Epoch: 51, step: 371, loss: 0.3215855360031128, mean loss: 0.34167928276789483
Epoch: 51, step: 372, loss: 0.33173614740371704, mean loss: 0.34167914843206165
Epoch: 51, step: 373, loss: 0.37721434235572815, mean loss: 0.3416796285206066
Epoch: 51, step: 374, loss: 0.3370952606201172, mean loss: 0.3416795665855913
Epoch: 51, step: 375, loss: 0.32918408513069153, mean loss: 0.3416793977733587
Epoch: 51, step: 376, loss: 0.2948192358016968, mean loss: 0.34167876470758046
Epoch: 51, step: 377, loss: 0.3531283438205719, mean loss: 0.34167891938563716
Epoch: 51, step: 378, loss: 0.3306095004081726, mean loss: 0.34167876984537293
Epoch: 51, step: 379, loss: 0.31708139181137085, mean loss: 0.34167843755614197
Epoch: 51, step: 380, loss: 0.31935811042785645, mean loss: 0.34167813603196595
Epoch: 51, step: 381, loss: 0.3114776909351349, mean loss: 0.3416777280611841
Epoch: 51, step: 382, loss: 0.3650953471660614, mean loss: 0.34167804440007543
Epoch: 51, step: 383, loss: 0.36634010076522827, mean loss: 0.34167837754505254
Epoch: 51, step: 384, loss: 0.3573378622531891, mean loss: 0.3416785890768132
Epoch: 51, step: 385, loss: 0.3447507321834564, mean loss: 0.3416786305754368
Epoch: 51, step: 386, loss: 0.3208494484424591, mean loss: 0.34167834921786855
Epoch: 51, step: 387, loss: 0.3276725709438324, mean loss: 0.34167816003240453
Epoch: 51, step: 388, loss: 0.31361737847328186, mean loss: 0.34167778100168095
Epoch: 51, step: 389, loss: 0.32145410776138306, mean loss: 0.34167750783430867
Epoch: 51, step: 390, loss: 0.31549569964408875, mean loss: 0.3416771541933525
Epoch: 51, step: 391, loss: 0.31359192728996277, mean loss: 0.3416767748478057
Epoch: 51, step: 392, loss: 0.3436375856399536, mean loss: 0.34167680133200673
Epoch: 51, step: 393, loss: 0.32680439949035645, mean loss: 0.34167660045675563
Epoch: 51, step: 394, loss: 0.3819408118724823, mean loss: 0.34167714428111057
Epoch: 51, step: 395, loss: 0.35794010758399963, mean loss: 0.34167736393215464
Epoch: 51, step: 396, loss: 0.37237581610679626, mean loss: 0.34167777854638426
Epoch: 51, step: 397, loss: 0.3189527094364166, mean loss: 0.34167747162505435
Epoch: 51, step: 398, loss: 0.30215758085250854, mean loss: 0.341676937882624
Epoch: 51, step: 399, loss: 0.3232531249523163, mean loss: 0.3416766890601275
Epoch: 51, step: 400, loss: 0.3082563281059265, mean loss: 0.34167623770809896
Epoch: 51, step: 401, loss: 0.38012924790382385, mean loss: 0.341676757020556
Epoch: 51, step: 402, loss: 0.3364783525466919, mean loss: 0.341676686816436
Epoch: 51, step: 403, loss: 0.32103195786476135, mean loss: 0.3416764080144568
Epoch: 51, step: 404, loss: 0.3203843832015991, mean loss: 0.3416761204747897
Epoch: 51, step: 405, loss: 0.3111397325992584, mean loss: 0.3416757080995314
Epoch: 51, step: 406, loss: 0.306011438369751, mean loss: 0.34167522648186616
Epoch: 51, step: 407, loss: 0.3456207513809204, mean loss: 0.34167527976232986
Epoch: 51, step: 408, loss: 0.34847524762153625, mean loss: 0.34167537158802036
Epoch: 51, step: 409, loss: 0.3564823269844055, mean loss: 0.3416755715361041
Epoch: 51, step: 410, loss: 0.30055564641952515, mean loss: 0.3416750162741351
Epoch: 51, step: 411, loss: 0.33310264348983765, mean loss: 0.34167490051885824
Epoch: 51, step: 412, loss: 0.3291952311992645, mean loss: 0.34167473200447984
Epoch: 51, step: 413, loss: 0.3336741328239441, mean loss: 0.34167462397294807
Epoch: 51, step: 414, loss: 0.3453817367553711, mean loss: 0.3416746740291571
Epoch: 51, step: 415, loss: 0.3440890610218048, mean loss: 0.34167470662957555
Epoch: 51, step: 416, loss: 0.35257333517074585, mean loss: 0.34167485378703416
Epoch: 51, step: 417, loss: 0.29398319125175476, mean loss: 0.3416742098446273
Epoch: 51, step: 418, loss: 0.3191600441932678, mean loss: 0.341673905857945
Epoch: 51, step: 419, loss: 0.3467218577861786, mean loss: 0.34167397401456534
Epoch: 51, step: 420, loss: 0.3359736502170563, mean loss: 0.341673897050766
Epoch: 51, step: 421, loss: 0.35840079188346863, mean loss: 0.34167412288846255
Epoch: 51, step: 422, loss: 0.32830747961997986, mean loss: 0.3416739424215438
Epoch: 51, step: 423, loss: 0.3437809646129608, mean loss: 0.34167397086867607
Epoch: 51, step: 424, loss: 0.3185485303401947, mean loss: 0.3416736586538422
Epoch: 51, step: 425, loss: 0.3676743805408478, mean loss: 0.34167400968289424
Epoch: 51, step: 426, loss: 0.3307345509529114, mean loss: 0.3416738619940723
Epoch: 51, step: 427, loss: 0.3522150218486786, mean loss: 0.341674004303715
Epoch: 51, step: 428, loss: 0.30765828490257263, mean loss: 0.3416735450848444
Epoch: 51, step: 429, loss: 0.33937186002731323, mean loss: 0.341673514012065
Epoch: 51, step: 430, loss: 0.32692477107048035, mean loss: 0.34167331490652414
Epoch: 51, step: 431, loss: 0.32307302951812744, mean loss: 0.34167306380919993
Epoch: 51, step: 432, loss: 0.31185656785964966, mean loss: 0.34167266130240365
Epoch: 51, step: 433, loss: 0.36803120374679565, mean loss: 0.3416730171238681
Epoch: 51, step: 434, loss: 0.3591445982456207, mean loss: 0.34167325297452916
Epoch: 51, step: 435, loss: 0.31254252791404724, mean loss: 0.3416728597411995
Epoch: 51, step: 436, loss: 0.3898881673812866, mean loss: 0.3416735105869985
Epoch: 51, step: 437, loss: 0.3293435275554657, mean loss: 0.34167334415003636
Epoch: 51, step: 438, loss: 0.3023238778114319, mean loss: 0.3416728129962448
Epoch: 51, step: 439, loss: 0.31521886587142944, mean loss: 0.3416724559158074
Epoch: 51, step: 440, loss: 0.2879931330680847, mean loss: 0.34167173135182216
Epoch: 51, step: 441, loss: 0.3120873272418976, mean loss: 0.341671332026658
Epoch: 51, step: 442, loss: 0.33544957637786865, mean loss: 0.34167124804761106
Epoch: 51, step: 443, loss: 0.36678653955459595, mean loss: 0.3416715870403158
Epoch: 51, step: 444, loss: 0.32401353120803833, mean loss: 0.3416713487045867
Epoch: 51, step: 445, loss: 0.35765349864959717, mean loss: 0.34167156441723273
Epoch: 51, step: 446, loss: 0.3034331500530243, mean loss: 0.3416710483165678
Epoch: 51, step: 447, loss: 0.3372923731803894, mean loss: 0.34167098921875516
Epoch: 51, step: 448, loss: 0.3531414866447449, mean loss: 0.3416711440309159
Epoch: 51, step: 449, loss: 0.30588701367378235, mean loss: 0.3416706610750712
Epoch: 51, step: 450, loss: 0.31054767966270447, mean loss: 0.34167024103348387
Epoch: 51, step: 451, loss: 0.35455143451690674, mean loss: 0.3416704148781379
Epoch: 51, step: 452, loss: 0.32350704073905945, mean loss: 0.34167016974845466
Epoch: 51, step: 453, loss: 0.3277494013309479, mean loss: 0.3416699818787629
Epoch: 51, step: 454, loss: 0.34389013051986694, mean loss: 0.34167001184068735
Epoch: 51, step: 455, loss: 0.3324812352657318, mean loss: 0.34166988783560537
Epoch: 51, step: 456, loss: 0.33663493394851685, mean loss: 0.3416698198884267
Epoch: 51, step: 457, loss: 0.29284796118736267, mean loss: 0.34166916104171946
Epoch: 51, step: 458, loss: 0.32821086049079895, mean loss: 0.3416689794255831
Epoch: 51, step: 459, loss: 0.37746432423591614, mean loss: 0.34166946246758906
Epoch: 51, step: 460, loss: 0.31492355465888977, mean loss: 0.3416691015485174
Epoch: 51, step: 461, loss: 0.34831392765045166, mean loss: 0.3416691912150235
Epoch: 51, step: 462, loss: 0.3268507122993469, mean loss: 0.3416689912544406
Epoch: 51, step: 463, loss: 0.33837199211120605, mean loss: 0.3416689467653282
Epoch: 51, step: 464, loss: 0.33224862813949585, mean loss: 0.3416688196509612
Epoch: 51, step: 465, loss: 0.31811854243278503, mean loss: 0.34166850187633946
Epoch: 51, step: 466, loss: 0.31956636905670166, mean loss: 0.3416682036462141
Epoch: 51, step: 467, loss: 0.35040122270584106, mean loss: 0.34166832148163967
Epoch: 51, step: 468, loss: 0.3585110306739807, mean loss: 0.34166854873879016
Epoch: 51, step: 469, loss: 0.2860994338989258, mean loss: 0.34166779895987065
Epoch: 51, step: 470, loss: 0.37808850407600403, mean loss: 0.34166829036788676
Epoch: 51, step: 471, loss: 0.3037984073162079, mean loss: 0.34166777941366566
Epoch: 51, step: 472, loss: 0.31219539046287537, mean loss: 0.34166738176685113
Epoch: 51, step: 473, loss: 0.3152841031551361, mean loss: 0.341667025803676
Epoch: 51, step: 474, loss: 0.3471235930919647, mean loss: 0.3416670994226845
Epoch: 51, step: 475, loss: 0.31219807267189026, mean loss: 0.3416667018373263
Epoch: 51, step: 476, loss: 0.32835695147514343, mean loss: 0.34166652226945265
Epoch: 51, step: 477, loss: 0.35025033354759216, mean loss: 0.3416666380759781
Epoch: 51, step: 478, loss: 0.31056153774261475, mean loss: 0.3416662184342969
Epoch: 51, step: 479, loss: 0.31647631525993347, mean loss: 0.3416658785996526
Epoch: 51, step: 480, loss: 0.3118492662906647, mean loss: 0.34166547635193173
Epoch: 51, step: 481, loss: 0.33995577692985535, mean loss: 0.3416654532871579
Epoch: 51, step: 482, loss: 0.3337918817996979, mean loss: 0.3416653470698351
Epoch: 51, step: 483, loss: 0.3128165602684021, mean loss: 0.3416649578945329
Epoch: 51, step: 484, loss: 0.3602104187011719, mean loss: 0.34166520807274664
Epoch: 51, step: 485, loss: 0.32375290989875793, mean loss: 0.34166496643915467
Epoch: 51, step: 486, loss: 0.311495840549469, mean loss: 0.34166455946871194
Epoch: 51, step: 487, loss: 0.32469677925109863, mean loss: 0.3416643305826679
Epoch: 51, step: 488, loss: 0.30943092703819275, mean loss: 0.3416638957776075
Epoch: 51, step: 489, loss: 0.32940012216567993, mean loss: 0.34166373035049424
Epoch: 51, step: 490, loss: 0.32860174775123596, mean loss: 0.34166355415864696
Epoch: 51, step: 491, loss: 0.32737505435943604, mean loss: 0.34166336142502496
Epoch: 51, step: 492, loss: 0.3415869176387787, mean loss: 0.34166336039390977
Epoch: 51, step: 493, loss: 0.36603376269340515, mean loss: 0.34166368911065825
Epoch: 51, step: 494, loss: 0.34553423523902893, mean loss: 0.3416637413172719
Epoch: 51, step: 495, loss: 0.31798434257507324, mean loss: 0.3416634219296439
Epoch: 51, step: 496, loss: 0.29528331756591797, mean loss: 0.34166279636343405
Epoch: 51, step: 497, loss: 0.3135501444339752, mean loss: 0.34166241719033474
Epoch: 51, step: 498, loss: 0.3497161567211151, mean loss: 0.3416625258147434
Epoch: 51, step: 499, loss: 0.31307336688041687, mean loss: 0.3416621402250944
Epoch: 51, step: 500, loss: 0.31649959087371826, mean loss: 0.3416618008556244
Epoch: 51, step: 501, loss: 0.36447030305862427, mean loss: 0.34166210847170897
Epoch: 51, step: 502, loss: 0.39098361134529114, mean loss: 0.3416627736571227
Epoch: 51, step: 503, loss: 0.3463122844696045, mean loss: 0.34166283636293826
Epoch: 51, step: 504, loss: 0.327323853969574, mean loss: 0.3416626429822805
Epoch: 51, step: 505, loss: 0.30855488777160645, mean loss: 0.3416621964852446
Epoch: 51, step: 506, loss: 0.3130444586277008, mean loss: 0.34166181054658085
Epoch: 51, step: 507, loss: 0.3580068349838257, mean loss: 0.3416620309725227
Epoch: 51, step: 508, loss: 0.3044479191303253, mean loss: 0.34166152911674014
Epoch: 51, step: 509, loss: 0.3066284656524658, mean loss: 0.34166105668014246
Epoch: 51, step: 510, loss: 0.30239659547805786, mean loss: 0.34166052718838597
Epoch: 51, step: 511, loss: 0.3218938112258911, mean loss: 0.34166026063253124
Epoch: 51, step: 512, loss: 0.3346583843231201, mean loss: 0.34166016621290385
Epoch: 51, step: 513, loss: 0.3174026906490326, mean loss: 0.34165983910759407
Epoch: 51, step: 514, loss: 0.38512149453163147, mean loss: 0.34166042516802403
Epoch: 51, step: 515, loss: 0.3281646966934204, mean loss: 0.34166024318678784
Epoch: 51, step: 516, loss: 0.3132762312889099, mean loss: 0.3416598604517668
Epoch: 51, step: 517, loss: 0.341555118560791, mean loss: 0.3416598590394277
Epoch: 51, step: 518, loss: 0.34318506717681885, mean loss: 0.3416598796050485
Epoch: 51, step: 519, loss: 0.3494715690612793, mean loss: 0.3416599849349856
Epoch: 51, step: 520, loss: 0.34444621205329895, mean loss: 0.34166002250293703
Epoch: 51, step: 521, loss: 0.3110096752643585, mean loss: 0.34165960923611344
Epoch: 51, step: 522, loss: 0.35950779914855957, mean loss: 0.3416598498847835
Epoch: 51, step: 523, loss: 0.3421725928783417, mean loss: 0.3416598567980479
Epoch: 51, step: 524, loss: 0.35201069712638855, mean loss: 0.3416599963555494
Epoch: 51, step: 525, loss: 0.2978644371032715, mean loss: 0.3416594058801651
Epoch: 51, step: 526, loss: 0.3000916838645935, mean loss: 0.34165884544924174
Epoch: 51, step: 527, loss: 0.3366539180278778, mean loss: 0.34165877797192656
Epoch: 51, step: 528, loss: 0.3154054880142212, mean loss: 0.34165842402520796
Epoch: 51, step: 529, loss: 0.33423054218292236, mean loss: 0.3416583238838937
Epoch: 51, step: 530, loss: 0.34618324041366577, mean loss: 0.34165838488714995
Epoch: 51, step: 531, loss: 0.3321846127510071, mean loss: 0.34165825716696907
Epoch: 51, step: 532, loss: 0.3505052924156189, mean loss: 0.3416583764362203
Epoch: 51, step: 533, loss: 0.3593200445175171, mean loss: 0.34165861453468727
Epoch: 51, step: 534, loss: 0.29724907875061035, mean loss: 0.3416580158539854
Epoch: 51, step: 535, loss: 0.35220953822135925, mean loss: 0.3416581580961311
Epoch: 51, step: 536, loss: 0.34874510765075684, mean loss: 0.341658253632044
Epoch: 51, step: 537, loss: 0.3116925358772278, mean loss: 0.34165784968340746
Epoch: 51, step: 538, loss: 0.3224424421787262, mean loss: 0.3416575906563055
Epoch: 51, step: 539, loss: 0.33763420581817627, mean loss: 0.34165753642109525
Epoch: 51, step: 540, loss: 0.35050728917121887, mean loss: 0.3416576557141161
Epoch: 51, step: 541, loss: 0.3152954578399658, mean loss: 0.3416573003613828
Epoch: 51, step: 542, loss: 0.3196224570274353, mean loss: 0.3416570033438011
Epoch: 51, step: 543, loss: 0.31005701422691345, mean loss: 0.3416565773990511
Epoch: 51, step: 544, loss: 0.29508906602859497, mean loss: 0.3416559497115048
Epoch: 51, step: 545, loss: 0.3211793899536133, mean loss: 0.3416556737098906
Epoch: 51, step: 546, loss: 0.3487796187400818, mean loss: 0.34165576973157824
Epoch: 51, step: 547, loss: 0.33588695526123047, mean loss: 0.3416556919763692
Epoch: 51, step: 548, loss: 0.28722596168518066, mean loss: 0.3416549583528428
Epoch: 51, step: 549, loss: 0.3487098515033722, mean loss: 0.34165505343995434
Epoch: 51, step: 550, loss: 0.3311336934566498, mean loss: 0.34165491163309425
Epoch: 51, step: 551, loss: 0.31351232528686523, mean loss: 0.34165453233250737
Epoch: 51, step: 552, loss: 0.34787872433662415, mean loss: 0.3416546162198883
Epoch: 51, step: 553, loss: 0.3532843589782715, mean loss: 0.34165477295919067
Epoch: 51, step: 554, loss: 0.34310510754585266, mean loss: 0.3416547925057423
Epoch: 51, step: 555, loss: 0.35526126623153687, mean loss: 0.341654975881399
Epoch: 51, step: 556, loss: 0.3349597156047821, mean loss: 0.34165488564999674
Epoch: 51, step: 557, loss: 0.31341829895973206, mean loss: 0.34165450511326334
Epoch: 51, step: 558, loss: 0.33260777592658997, mean loss: 0.3416543831946187
Epoch: 51, step: 559, loss: 0.35222503542900085, mean loss: 0.3416545256485597
Epoch: 51, step: 560, loss: 0.3518086075782776, mean loss: 0.34165466248680415
Epoch: 51, step: 561, loss: 0.3779929578304291, mean loss: 0.3416551521816448
Epoch: 51, step: 562, loss: 0.3368090093135834, mean loss: 0.3416550868759072
Epoch: 51, step: 563, loss: 0.3142363131046295, mean loss: 0.3416547173904909
Epoch: 51, step: 564, loss: 0.3116241693496704, mean loss: 0.3416543127152084
Epoch: 51, step: 565, loss: 0.31353703141212463, mean loss: 0.34165393382717035
Epoch: 51, step: 566, loss: 0.33513349294662476, mean loss: 0.34165384596363424
Epoch: 51, step: 567, loss: 0.3363502323627472, mean loss: 0.3416537744979198
Epoch: 51, step: 568, loss: 0.3242148458957672, mean loss: 0.3416535395130977
Epoch: 51, step: 569, loss: 0.35707181692123413, mean loss: 0.34165374726739484
Epoch: 51, step: 570, loss: 0.34441474080085754, mean loss: 0.34165378447002953
Epoch: 51, step: 571, loss: 0.33899906277656555, mean loss: 0.3416537486998224
Epoch: 51, step: 572, loss: 0.3110312223434448, mean loss: 0.3416533360918437
Epoch: 51, step: 573, loss: 0.33973437547683716, mean loss: 0.34165331023611306
Epoch: 51, step: 574, loss: 0.30771854519844055, mean loss: 0.3416528530113453
Epoch: 51, step: 575, loss: 0.31321069598197937, mean loss: 0.34165246979715735
Epoch: 51, step: 576, loss: 0.3409099876880646, mean loss: 0.3416524597934912
Epoch: 51, step: 577, loss: 0.3461858034133911, mean loss: 0.34165252087165693
Epoch: 51, step: 578, loss: 0.28150299191474915, mean loss: 0.3416517104823038
Epoch: 51, step: 579, loss: 0.34591999650001526, mean loss: 0.34165176798777397
Epoch: 51, step: 580, loss: 0.3124266266822815, mean loss: 0.3416513742506058
Epoch: 51, step: 581, loss: 0.30357369780540466, mean loss: 0.3416508612541296
Epoch: 51, step: 582, loss: 0.31570565700531006, mean loss: 0.3416505117154947
Epoch: 51, step: 583, loss: 0.34936878085136414, mean loss: 0.3416506156960564
Epoch: 51, step: 584, loss: 0.3289510905742645, mean loss: 0.34165044461029315
Epoch: 51, step: 585, loss: 0.32417044043540955, mean loss: 0.34165020912593136
Epoch: 51, step: 586, loss: 0.31140846014022827, mean loss: 0.3416498017253981
Epoch: 51, step: 587, loss: 0.31918880343437195, mean loss: 0.3416494991470183
Epoch: 51, step: 588, loss: 0.32369109988212585, mean loss: 0.3416492572276662
Epoch: 51, step: 589, loss: 0.33198419213294983, mean loss: 0.34164912703038336
Epoch: 51, step: 590, loss: 0.30671000480651855, mean loss: 0.34164865637473274
Epoch: 51, step: 591, loss: 0.2900119125843048, mean loss: 0.34164796079921966
Epoch: 51, step: 592, loss: 0.3013276159763336, mean loss: 0.34164741766917905
Epoch: 51, step: 593, loss: 0.3488721251487732, mean loss: 0.3416475149873649
Epoch: 51, step: 594, loss: 0.3088938891887665, mean loss: 0.3416470737957298
Epoch: 51, step: 595, loss: 0.3465891480445862, mean loss: 0.34164714036461785
Epoch: 51, step: 596, loss: 0.3206603527069092, mean loss: 0.34164685768001424
Epoch: 51, step: 597, loss: 0.31987911462783813, mean loss: 0.3416465644801671
Epoch: 51, step: 598, loss: 0.3164367079734802, mean loss: 0.3416462249214679
Epoch: 51, step: 599, loss: 0.3421202301979065, mean loss: 0.3416462313058933
Epoch: 51, step: 600, loss: 0.318915456533432, mean loss: 0.34164592514689573
Epoch: 51, step: 601, loss: 0.31889808177948, mean loss: 0.34164561876212934
Epoch: 51, step: 602, loss: 0.3626148998737335, mean loss: 0.3416459011881009
Epoch: 51, step: 603, loss: 0.38779810070991516, mean loss: 0.34164652278328894
Epoch: 51, step: 604, loss: 0.31379130482673645, mean loss: 0.3416461476237857
Epoch: 51, step: 605, loss: 0.29946666955947876, mean loss: 0.3416455795500071
Epoch: 51, step: 606, loss: 0.3661835491657257, mean loss: 0.3416459100232615
Epoch: 51, step: 607, loss: 0.33926230669021606, mean loss: 0.3416458779217244
Epoch: 51, step: 608, loss: 0.3645613491535187, mean loss: 0.34164618653513035
Epoch: 51, step: 609, loss: 0.327750563621521, mean loss: 0.3416459993987752
Epoch: 51, step: 610, loss: 0.30736246705055237, mean loss: 0.34164553769879075
Epoch: 51, step: 611, loss: 0.38654083013534546, mean loss: 0.34164614230033724
Epoch: 51, step: 612, loss: 0.3786683976650238, mean loss: 0.341646640869568
Epoch: 51, step: 613, loss: 0.36878496408462524, mean loss: 0.3416470063294944
Epoch: 51, step: 614, loss: 0.30648040771484375, mean loss: 0.3416465327626727
Epoch: 51, step: 615, loss: 0.3444811701774597, mean loss: 0.3416465709344666
Epoch: 51, step: 616, loss: 0.31316983699798584, mean loss: 0.34164618746624054
Epoch: 51, step: 617, loss: 0.3397301733493805, mean loss: 0.34164616166550643
Epoch: 51, step: 618, loss: 0.36058178544044495, mean loss: 0.3416464166460994
Epoch: 51, step: 619, loss: 0.3409055769443512, mean loss: 0.3416464066703413
Epoch: 51, step: 620, loss: 0.35433685779571533, mean loss: 0.34164657755098665
Epoch: 51, step: 621, loss: 0.2945975661277771, mean loss: 0.3416459440307833
Epoch: 51, step: 622, loss: 0.3209433853626251, mean loss: 0.3416456652722678
Epoch: 51, step: 623, loss: 0.3385806083679199, mean loss: 0.34164562400204507
Epoch: 51, step: 624, loss: 0.327029287815094, mean loss: 0.3416454271993927
Epoch: 51, step: 625, loss: 0.33639639616012573, mean loss: 0.341645356524409
Epoch: 51, step: 626, loss: 0.3003014922142029, mean loss: 0.34164479986212754
Epoch: 51, step: 627, loss: 0.37888363003730774, mean loss: 0.3416453012466355
Epoch: 51, step: 628, loss: 0.35875824093818665, mean loss: 0.3416455316525662
Epoch: 51, step: 629, loss: 0.3537655472755432, mean loss: 0.3416456948323549
Epoch: 51, step: 630, loss: 0.3161773383617401, mean loss: 0.341645351939639
Epoch: 51, step: 631, loss: 0.34579992294311523, mean loss: 0.3416454078738709
Epoch: 51, step: 632, loss: 0.3329929709434509, mean loss: 0.3416452913850933
Epoch: 51, step: 633, loss: 0.31040719151496887, mean loss: 0.3416448708285373
Epoch: 51, step: 634, loss: 0.3114122748374939, mean loss: 0.34164446381449576
Epoch: 51, step: 635, loss: 0.30087709426879883, mean loss: 0.3416439149807647
Epoch: 51, step: 636, loss: 0.3343926668167114, mean loss: 0.3416438173616136
Epoch: 51, step: 637, loss: 0.32408609986305237, mean loss: 0.3416435809959059
Epoch: 51, step: 638, loss: 0.4008691608905792, mean loss: 0.3416443782924596
Epoch: 51, step: 639, loss: 0.31073111295700073, mean loss: 0.34164396214274584
Epoch: 51, step: 640, loss: 0.33831849694252014, mean loss: 0.3416439173764377
Epoch: 51, step: 641, loss: 0.3103308081626892, mean loss: 0.3416434958554349
Epoch: 51, step: 642, loss: 0.3424842357635498, mean loss: 0.34164350717289166
Epoch: 51, step: 643, loss: 0.3258053660392761, mean loss: 0.34164329397370563
Epoch: 51, step: 644, loss: 0.29383584856987, mean loss: 0.34164265044040454
Epoch: 51, step: 645, loss: 0.3306526243686676, mean loss: 0.34164250250628053
Epoch: 51, step: 646, loss: 0.3223100006580353, mean loss: 0.34164224227957946
Epoch: 51, step: 647, loss: 0.3366435766220093, mean loss: 0.3416421749955427
Epoch: 51, step: 648, loss: 0.30149179697036743, mean loss: 0.3416416345626887
Epoch: 51, step: 649, loss: 0.35751277208328247, mean loss: 0.34164184818878934
Epoch: 51, step: 650, loss: 0.3449559807777405, mean loss: 0.3416418927965367
Epoch: 51, step: 651, loss: 0.31327715516090393, mean loss: 0.3416415110163919
Epoch: 51, step: 652, loss: 0.3587929308414459, mean loss: 0.3416417418658182
Epoch: 51, step: 653, loss: 0.31921130418777466, mean loss: 0.34164143996754803
Epoch: 51, step: 654, loss: 0.3271782696247101, mean loss: 0.34164124530583867
Epoch: 51, step: 655, loss: 0.323908269405365, mean loss: 0.3416410066385991
Epoch: 51, step: 656, loss: 0.3044658303260803, mean loss: 0.3416405063064863
Epoch: 51, step: 657, loss: 0.31405285000801086, mean loss: 0.3416401350155884
Epoch: 51, step: 658, loss: 0.3486171364784241, mean loss: 0.34164022891491225
Epoch: 51, step: 659, loss: 0.35270610451698303, mean loss: 0.3416403778419633
Epoch: 51, step: 660, loss: 0.3194308280944824, mean loss: 0.3416400789448535
Epoch: 51, step: 661, loss: 0.3617249131202698, mean loss: 0.3416403492438088
Epoch: 51, step: 662, loss: 0.308005690574646, mean loss: 0.3416398965992576
Epoch: 51, step: 663, loss: 0.33957406878471375, mean loss: 0.34163986879837727
Epoch: 51, step: 664, loss: 0.302109032869339, mean loss: 0.341639336819264
Epoch: 51, step: 665, loss: 0.2984412610530853, mean loss: 0.3416387554967534
Epoch: 51, step: 666, loss: 0.3360532820224762, mean loss: 0.3416386803332719
Epoch: 51, step: 667, loss: 0.3030785024166107, mean loss: 0.34163816143756304
Epoch: 51, step: 668, loss: 0.371355801820755, mean loss: 0.3416385613358363
Epoch: 51, step: 669, loss: 0.3367329239845276, mean loss: 0.3416384953235459
Epoch: 51, step: 670, loss: 0.329562246799469, mean loss: 0.34163833282272477
Epoch: 51, step: 671, loss: 0.33031338453292847, mean loss: 0.34163818043362565
Epoch: 51, step: 672, loss: 0.3135210871696472, mean loss: 0.3416378020936326
Epoch: 51, step: 673, loss: 0.33509010076522827, mean loss: 0.3416377139897906
Epoch: 51, step: 674, loss: 0.32892513275146484, mean loss: 0.3416375429355348
Epoch: 51, step: 675, loss: 0.3463605046272278, mean loss: 0.34163760648453495
Epoch: 51, step: 676, loss: 0.3464592695236206, mean loss: 0.3416376713607212
Epoch: 51, step: 677, loss: 0.317934513092041, mean loss: 0.34163735243552723
Epoch: 51, step: 678, loss: 0.33104822039604187, mean loss: 0.34163720996103025
Epoch: 51, step: 679, loss: 0.3063187003135681, mean loss: 0.3416367347644632
Epoch: 51, step: 680, loss: 0.36283135414123535, mean loss: 0.3416370199258406
Epoch: 51, step: 681, loss: 0.330858439207077, mean loss: 0.3416368749082059
Epoch: 51, step: 682, loss: 0.36807191371917725, mean loss: 0.3416372305668334
Epoch: 51, step: 683, loss: 0.36735019087791443, mean loss: 0.3416375765059184
Epoch: 51, step: 684, loss: 0.2973683178424835, mean loss: 0.3416369809206332
Epoch: 51, step: 685, loss: 0.3525582253932953, mean loss: 0.34163712784979333
Epoch: 51, step: 686, loss: 0.342236191034317, mean loss: 0.3416371359091923
Epoch: 51, step: 687, loss: 0.33518537878990173, mean loss: 0.3416370491126966
Epoch: 51, step: 688, loss: 0.3871155381202698, mean loss: 0.341637660933678
Epoch: 51, step: 689, loss: 0.3328537046909332, mean loss: 0.34163754276492286
Epoch: 51, step: 690, loss: 0.3363190293312073, mean loss: 0.341637471217019
Epoch: 51, step: 691, loss: 0.31020569801330566, mean loss: 0.34163704838322106
Epoch: 51, step: 692, loss: 0.30770206451416016, mean loss: 0.3416365918812924
Epoch: 51, step: 693, loss: 0.33991575241088867, mean loss: 0.3416365687324389
Epoch: 51, step: 694, loss: 0.33771318197250366, mean loss: 0.34163651595547445
Epoch: 51, step: 695, loss: 0.3379175364971161, mean loss: 0.34163646592884733
Epoch: 51, step: 696, loss: 0.3517981767654419, mean loss: 0.3416366026193793
Epoch: 51, step: 697, loss: 0.33543163537979126, mean loss: 0.34163651915421506
Epoch: 51, step: 698, loss: 0.336407333612442, mean loss: 0.3416364488155747
Epoch: 51, step: 699, loss: 0.3188735842704773, mean loss: 0.341636142632634
Epoch: 51, step: 700, loss: 0.323845237493515, mean loss: 0.34163590333066157
Epoch: 51, step: 701, loss: 0.29258981347084045, mean loss: 0.3416352436302088
Epoch: 51, step: 702, loss: 0.3187912702560425, mean loss: 0.34163493636867337
Epoch: 51, step: 703, loss: 0.34758201241493225, mean loss: 0.341635016358398
Epoch: 51, step: 704, loss: 0.3010921776294708, mean loss: 0.34163447105397254
Epoch: 51, step: 705, loss: 0.3434794247150421, mean loss: 0.34163449586841316
Epoch: 51, step: 706, loss: 0.32607194781303406, mean loss: 0.3416342865565269
Epoch: 51, step: 707, loss: 0.3001392185688019, mean loss: 0.34163372846706075
Epoch: 51, step: 708, loss: 0.35449862480163574, mean loss: 0.34163390149163725
Epoch: 51, step: 709, loss: 0.31722450256347656, mean loss: 0.3416335732053456
Epoch: 51, step: 710, loss: 0.3235142230987549, mean loss: 0.3416333295183023
Epoch: 51, step: 711, loss: 0.34692633152008057, mean loss: 0.3416334007029007
Epoch: 51, step: 712, loss: 0.33280855417251587, mean loss: 0.3416332820207789
Epoch: 51, step: 713, loss: 0.35232412815093994, mean loss: 0.34163342579611083
Epoch: 51, step: 714, loss: 0.2960790693759918, mean loss: 0.34163281316877026
Epoch: 51, step: 715, loss: 0.3271879553794861, mean loss: 0.3416326189130173
Epoch: 51, step: 716, loss: 0.3129701316356659, mean loss: 0.3416322334624817
Epoch: 51, step: 717, loss: 0.3354071378707886, mean loss: 0.34163214974908523
Epoch: 51, step: 718, loss: 0.35738059878349304, mean loss: 0.341632361527107
Epoch: 51, step: 719, loss: 0.32965347170829773, mean loss: 0.3416322004425793
Epoch: 51, step: 720, loss: 0.3133031129837036, mean loss: 0.341631819496066
Epoch: 51, step: 721, loss: 0.36625269055366516, mean loss: 0.3416321505730509
Epoch: 51, step: 722, loss: 0.30995169281959534, mean loss: 0.3416317245714944
Epoch: 51, step: 723, loss: 0.2831614315509796, mean loss: 0.3416309383422961
Epoch: 51, step: 724, loss: 0.30452147126197815, mean loss: 0.34163043935122345
Epoch: 51, step: 725, loss: 0.3277508318424225, mean loss: 0.3416302527221054
Epoch: 51, step: 726, loss: 0.3288935720920563, mean loss: 0.3416300814634074
Epoch: 51, step: 727, loss: 0.3620617687702179, mean loss: 0.34163035618625076
Epoch: 51, step: 728, loss: 0.32543760538101196, mean loss: 0.34163013846273815
Epoch: 51, step: 729, loss: 0.29867276549339294, mean loss: 0.3416295608768483
Epoch: 51, step: 730, loss: 0.31242987513542175, mean loss: 0.3416291682760316
Epoch: 51, step: 731, loss: 0.3271637260913849, mean loss: 0.3416289737853063
Epoch: 51, step: 732, loss: 0.3432411849498749, mean loss: 0.3416289954615122
Epoch: 51, step: 733, loss: 0.340173602104187, mean loss: 0.34162897589398744
Epoch: 51, step: 734, loss: 0.36678260564804077, mean loss: 0.34162931407586344
Epoch: 51, step: 735, loss: 0.36107972264289856, mean loss: 0.34162957557638196
Epoch: 51, step: 736, loss: 0.36399519443511963, mean loss: 0.34162987626632774
Epoch: 51, step: 737, loss: 0.32799434661865234, mean loss: 0.34162969294872875
Epoch: 51, step: 738, loss: 0.3425048291683197, mean loss: 0.34162970471400067
Epoch: 51, step: 739, loss: 0.3122875690460205, mean loss: 0.3416293102456248
Epoch: 51, step: 740, loss: 0.37079086899757385, mean loss: 0.34162970228109907
Epoch: 51, step: 741, loss: 0.36996474862098694, mean loss: 0.3416300832001744
Epoch: 51, step: 742, loss: 0.31969138979911804, mean loss: 0.34162978827373025
Epoch: 51, step: 743, loss: 0.3110969364643097, mean loss: 0.34162937781973485
Epoch: 51, step: 744, loss: 0.30892306566238403, mean loss: 0.3416289381537606
Epoch: 51, step: 745, loss: 0.3446674644947052, mean loss: 0.34162897899965844
Epoch: 51, step: 746, loss: 0.3208320140838623, mean loss: 0.341628699436742
Epoch: 51, step: 747, loss: 0.33044055104255676, mean loss: 0.34162854904223194
Epoch: 51, step: 748, loss: 0.3827962875366211, mean loss: 0.3416291024241159
Epoch: 51, step: 749, loss: 0.3330129384994507, mean loss: 0.34162898660612084
Epoch: 51, step: 750, loss: 0.33282628655433655, mean loss: 0.34162886828230804
Epoch: 51, step: 751, loss: 0.3224203586578369, mean loss: 0.3416286100895339
Epoch: 51, step: 752, loss: 0.3379974961280823, mean loss: 0.34162856128227065
Epoch: 51, step: 753, loss: 0.3618972599506378, mean loss: 0.34162883371833974
Epoch: 51, step: 754, loss: 0.3504355847835541, mean loss: 0.3416289520902408
Epoch: 51, step: 755, loss: 0.3582998812198639, mean loss: 0.3416291761618689
Epoch: 51, step: 756, loss: 0.3204362094402313, mean loss: 0.34162889131399427
Epoch: 51, step: 757, loss: 0.3134733736515045, mean loss: 0.3416285128897898
Epoch: 51, step: 758, loss: 0.33645644783973694, mean loss: 0.3416284433755894
Epoch: 51, step: 759, loss: 0.33333420753479004, mean loss: 0.3416283318999182
Epoch: 51, step: 760, loss: 0.3159760534763336, mean loss: 0.34162798713439946
Epoch: 51, step: 761, loss: 0.396123468875885, mean loss: 0.3416287195414868
Epoch: 51, step: 762, loss: 0.33272820711135864, mean loss: 0.3416285999221979
Epoch: 51, step: 763, loss: 0.33280953764915466, mean loss: 0.3416284813991591
Epoch: 51, step: 764, loss: 0.30934208631515503, mean loss: 0.34162804749472436
Epoch: 51, step: 765, loss: 0.3886193335056305, mean loss: 0.34162867901314947
Epoch: 51, step: 766, loss: 0.3522859811782837, mean loss: 0.34162882223528285
Epoch: 51, step: 767, loss: 0.3519640862941742, mean loss: 0.34162896112772034
Epoch: 51, step: 768, loss: 0.3527050316333771, mean loss: 0.3416291099736277
Epoch: 51, step: 769, loss: 0.3132103681564331, mean loss: 0.3416287280731545
Epoch: 51, step: 770, loss: 0.3153427541255951, mean loss: 0.34162837483826974
Epoch: 51, step: 771, loss: 0.3602185547351837, mean loss: 0.3416286246525556
Epoch: 51, step: 772, loss: 0.31191128492355347, mean loss: 0.34162822531719234
Epoch: 51, step: 773, loss: 0.32733604311943054, mean loss: 0.34162803326443364
Epoch: 51, step: 774, loss: 0.29883864521980286, mean loss: 0.3416274582850864
Epoch: 51, step: 775, loss: 0.3841876685619354, mean loss: 0.341628030177189
Epoch: 51, step: 776, loss: 0.3344537019729614, mean loss: 0.3416279337752567
Epoch: 51, step: 777, loss: 0.32148534059524536, mean loss: 0.3416276631215094
Epoch: 51, step: 778, loss: 0.31930825114250183, mean loss: 0.3416273632221237
Epoch: 51, step: 779, loss: 0.29554539918899536, mean loss: 0.3416267440406227
Epoch: 51, step: 780, loss: 0.3034127354621887, mean loss: 0.3416262305840076
Epoch: 51, step: 781, loss: 0.29606130719184875, mean loss: 0.34162561836618865
Epoch: 51, step: 782, loss: 0.3196200132369995, mean loss: 0.3416253226992247
Epoch: 51, step: 783, loss: 0.31747525930404663, mean loss: 0.34162499822371284
Epoch: 51, step: 784, loss: 0.34408774971961975, mean loss: 0.341625031312314
Epoch: 51, step: 785, loss: 0.334170401096344, mean loss: 0.34162493115605685
Epoch: 51, step: 786, loss: 0.31047165393829346, mean loss: 0.3416245126036094
Epoch: 51, step: 787, loss: 0.3242712616920471, mean loss: 0.3416242794612659
Epoch: 51, step: 788, loss: 0.401347815990448, mean loss: 0.34162508184107765
Epoch: 51, step: 789, loss: 0.3239465355873108, mean loss: 0.3416248443347465
Epoch: 51, step: 790, loss: 0.31716594099998474, mean loss: 0.3416245157406263
Epoch: 51, step: 791, loss: 0.3529329299926758, mean loss: 0.3416246676619312
Epoch: 51, step: 792, loss: 0.3558869957923889, mean loss: 0.3416248592646037
Epoch: 51, step: 793, loss: 0.32741421461105347, mean loss: 0.34162466835882094
Epoch: 51, step: 794, loss: 0.38192999362945557, mean loss: 0.3416252098132369
Epoch: 51, step: 795, loss: 0.29401206970214844, mean loss: 0.34162457019555675
Epoch: 51, step: 796, loss: 0.30095794796943665, mean loss: 0.34162402390222074
Epoch: 51, step: 797, loss: 0.35323789715766907, mean loss: 0.3416241799145962
Epoch: 51, step: 798, loss: 0.36885055899620056, mean loss: 0.3416245456491728
Epoch: 51, step: 799, loss: 0.3626176714897156, mean loss: 0.3416248276480691
Epoch: 51, step: 800, loss: 0.29221442341804504, mean loss: 0.34162416393117434
Epoch: 51, step: 801, loss: 0.3136075437068939, mean loss: 0.34162378759637835
Epoch: 51, step: 802, loss: 0.324797123670578, mean loss: 0.3416235615743234
Epoch: 51, step: 803, loss: 0.3414832651615143, mean loss: 0.3416235596898347
Epoch: 51, step: 804, loss: 0.34908556938171387, mean loss: 0.3416236599196523
Epoch: 51, step: 805, loss: 0.34563177824020386, mean loss: 0.34162371375603
Epoch: 51, step: 806, loss: 0.3030923902988434, mean loss: 0.34162319621666243
Epoch: 51, step: 807, loss: 0.309006005525589, mean loss: 0.3416227581197585
Epoch: 51, step: 808, loss: 0.3155197203159332, mean loss: 0.34162240752222983
Epoch: 51, step: 809, loss: 0.3358190357685089, mean loss: 0.34162232957649485
Epoch: 51, step: 810, loss: 0.3475710451602936, mean loss: 0.341622409473286
Epoch: 51, step: 811, loss: 0.3069688677787781, mean loss: 0.3416219440501946
Epoch: 51, step: 812, loss: 0.2985130548477173, mean loss: 0.34162136507321184
Epoch: 51, step: 813, loss: 0.33343786001205444, mean loss: 0.3416212551655449
Epoch: 51, step: 814, loss: 0.3318405747413635, mean loss: 0.3416211238089537
Epoch: 51, step: 815, loss: 0.31150174140930176, mean loss: 0.3416207193047582
Epoch: 51, step: 816, loss: 0.30633237957954407, mean loss: 0.34162024538767777
Epoch: 51, step: 817, loss: 0.35844388604164124, mean loss: 0.3416204713236002
Epoch: 51, step: 818, loss: 0.32698577642440796, mean loss: 0.34162027478713375
Epoch: 51, step: 819, loss: 0.3417772054672241, mean loss: 0.3416202768946042
Epoch: 51, step: 820, loss: 0.34350842237472534, mean loss: 0.34162030225075113
Epoch: 51, step: 821, loss: 0.35979509353637695, mean loss: 0.341620546319068
Epoch: 51, step: 822, loss: 0.3102947473526001, mean loss: 0.34162012565220934
Epoch: 51, step: 823, loss: 0.3274787962436676, mean loss: 0.34161993575414024
Epoch: 51, step: 824, loss: 0.32357707619667053, mean loss: 0.34161969346728854
Epoch: 51, step: 825, loss: 0.3153549134731293, mean loss: 0.3416193407778835
Epoch: 51, step: 826, loss: 0.30058571696281433, mean loss: 0.34161878977650284
Epoch: 51, step: 827, loss: 0.42531824111938477, mean loss: 0.3416199136814784
Epoch: 51, step: 828, loss: 0.30205678939819336, mean loss: 0.3416193824403
Epoch: 51, step: 829, loss: 0.34515681862831116, mean loss: 0.3416194299392417
Epoch: 51, step: 830, loss: 0.3384734094142914, mean loss: 0.3416193876966029
Epoch: 51, step: 831, loss: 0.3339063823223114, mean loss: 0.3416192841329666
Epoch: 51, step: 832, loss: 0.32405972480773926, mean loss: 0.3416190483613952
Epoch: 51, step: 833, loss: 0.34133026003837585, mean loss: 0.3416190444838968
Epoch: 51, step: 834, loss: 0.32895761728286743, mean loss: 0.34161887448393435
Epoch: 51, step: 835, loss: 0.2958272099494934, mean loss: 0.3416182596656672
Epoch: 51, step: 836, loss: 0.28184130787849426, mean loss: 0.34161745708579067
Epoch: 51, step: 837, loss: 0.3186430335044861, mean loss: 0.3416171486297398
Epoch: 51, step: 838, loss: 0.3133004307746887, mean loss: 0.34161676845281547
Epoch: 51, step: 839, loss: 0.3109267055988312, mean loss: 0.3416163564171722
Epoch: 51, step: 840, loss: 0.31717681884765625, mean loss: 0.3416160283036249
Epoch: 51, step: 841, loss: 0.3611915111541748, mean loss: 0.34161629111117064
Epoch: 51, step: 842, loss: 0.3594810664653778, mean loss: 0.34161653094866384
Epoch: 51, step: 843, loss: 0.361354798078537, mean loss: 0.3416167959345291
Epoch: 51, step: 844, loss: 0.36601290106773376, mean loss: 0.34161712344738515
Epoch: 51, step: 845, loss: 0.2903442680835724, mean loss: 0.3416164351287469
Epoch: 51, step: 846, loss: 0.38338544964790344, mean loss: 0.3416169958543986
Epoch: 51, step: 847, loss: 0.3470081686973572, mean loss: 0.3416170682269063
Epoch: 51, step: 848, loss: 0.3552841246128082, mean loss: 0.34161725169456614
Epoch: 51, step: 849, loss: 0.3426366448402405, mean loss: 0.3416172653787977
Epoch: 51, step: 850, loss: 0.31271329522132874, mean loss: 0.34161687738000374
Epoch: 51, step: 851, loss: 0.33037182688713074, mean loss: 0.34161672643162405
Epoch: 51, step: 852, loss: 0.3351834714412689, mean loss: 0.34161664007573067
Epoch: 51, step: 853, loss: 0.2931080758571625, mean loss: 0.34161598893658307
Epoch: 51, step: 854, loss: 0.32900765538215637, mean loss: 0.3416158196949348
Epoch: 51, step: 855, loss: 0.30921030044555664, mean loss: 0.3416153847215221
Epoch: 51, step: 856, loss: 0.3114130198955536, mean loss: 0.34161497932609347
Epoch: 51, step: 857, loss: 0.31746476888656616, mean loss: 0.3416146551708971
Epoch: 51, step: 858, loss: 0.3254988491535187, mean loss: 0.34161443886006376
Epoch: 51, step: 859, loss: 0.3050326704978943, mean loss: 0.3416139478559786
Epoch: 51, step: 860, loss: 0.3401426672935486, mean loss: 0.34161392810857155
Epoch: 51, step: 861, loss: 0.323915034532547, mean loss: 0.3416136905586618
Epoch: 51, step: 862, loss: 0.30748680233955383, mean loss: 0.34161323252266224
Epoch: 51, step: 863, loss: 0.3482946455478668, mean loss: 0.34161332219642915
Epoch: 51, step: 864, loss: 0.34274181723594666, mean loss: 0.3416133373421839
Epoch: 51, step: 865, loss: 0.3376098871231079, mean loss: 0.3416132836118092
Epoch: 51, step: 866, loss: 0.30420422554016113, mean loss: 0.34161278155093133
Epoch: 51, step: 867, loss: 0.36476999521255493, mean loss: 0.3416130923359547
Epoch: 51, step: 868, loss: 0.3493180572986603, mean loss: 0.3416131957402595
Epoch: 51, step: 869, loss: 0.3868124783039093, mean loss: 0.3416138023280492
Epoch: 51, step: 870, loss: 0.3375309705734253, mean loss: 0.3416137475359704
Epoch: 51, step: 871, loss: 0.31933456659317017, mean loss: 0.34161344855077336
Epoch: 51, step: 872, loss: 0.3369673788547516, mean loss: 0.34161338620164905
Epoch: 51, step: 873, loss: 0.3114379048347473, mean loss: 0.3416129812594691
Epoch: 51, step: 874, loss: 0.32600724697113037, mean loss: 0.34161277183993466
Epoch: 51, step: 875, loss: 0.32408657670021057, mean loss: 0.34161253665213087
Epoch: 51, step: 876, loss: 0.3534480035305023, mean loss: 0.3416126954726899
Epoch: 51, step: 877, loss: 0.3319476246833801, mean loss: 0.341612565778495
Epoch: 51, step: 878, loss: 0.3031989634037018, mean loss: 0.3416120503188064
Epoch: 51, step: 879, loss: 0.3083988428115845, mean loss: 0.3416116046475125
Epoch: 51, step: 880, loss: 0.36910733580589294, mean loss: 0.34161197359392187
Epoch: 51, step: 881, loss: 0.3116101622581482, mean loss: 0.3416115710255385
Epoch: 51, step: 882, loss: 0.3441680371761322, mean loss: 0.3416116053280886
Epoch: 51, step: 883, loss: 0.3524608016014099, mean loss: 0.34161175090017254
Epoch: 51, step: 884, loss: 0.3392852246761322, mean loss: 0.34161171968378395
Epoch: 51, step: 885, loss: 0.29231947660446167, mean loss: 0.3416110583092626
Epoch: 51, step: 886, loss: 0.31810352206230164, mean loss: 0.3416107429031061
Epoch: 51, step: 887, loss: 0.3271661102771759, mean loss: 0.34161054909866473
Epoch: 51, step: 888, loss: 0.3213344216346741, mean loss: 0.3416102770563819
Epoch: 51, step: 889, loss: 0.3401520252227783, mean loss: 0.34161025749146073
Epoch: 51, step: 890, loss: 0.32630428671836853, mean loss: 0.3416100521386631
Epoch: 51, step: 891, loss: 0.32243746519088745, mean loss: 0.34160979491279975
Epoch: 51, step: 892, loss: 0.3196932077407837, mean loss: 0.3416095008764531
Epoch: 51, step: 893, loss: 0.37458929419517517, mean loss: 0.3416099433325603
Epoch: 51, step: 894, loss: 0.3662707507610321, mean loss: 0.341610274176916
Epoch: 51, step: 895, loss: 0.3210929334163666, mean loss: 0.34160999892415556
Epoch: 51, step: 896, loss: 0.4181280732154846, mean loss: 0.3416110254474688
Epoch: 51, step: 897, loss: 0.34054893255233765, mean loss: 0.3416110111992209
Epoch: 51, step: 898, loss: 0.3215253949165344, mean loss: 0.34161074174915473
Epoch: 51, step: 899, loss: 0.3673788905143738, mean loss: 0.34161108742618795
Epoch: 51, step: 900, loss: 0.3344622850418091, mean loss: 0.3416109915270346
Epoch: 51, step: 901, loss: 0.3434499502182007, mean loss: 0.3416110161958122
Epoch: 51, step: 902, loss: 0.345655620098114, mean loss: 0.34161107045156897
Epoch: 51, step: 903, loss: 0.2978304326534271, mean loss: 0.3416104831703837
Epoch: 51, step: 904, loss: 0.3454035222530365, mean loss: 0.3416105340501954
Epoch: 51, step: 905, loss: 0.3157251179218292, mean loss: 0.34161018682798044
Epoch: 51, step: 906, loss: 0.34707173705101013, mean loss: 0.3416102600872288
Epoch: 51, step: 907, loss: 0.35847795009613037, mean loss: 0.34161048634125296
Epoch: 51, step: 908, loss: 0.31428492069244385, mean loss: 0.34161011981588646
Epoch: 51, step: 909, loss: 0.3282073140144348, mean loss: 0.34160994004275824
Epoch: 51, step: 910, loss: 0.3122407793998718, mean loss: 0.3416095461166548
Epoch: 51, step: 911, loss: 0.3274998962879181, mean loss: 0.3416093568676362
Epoch: 51, step: 912, loss: 0.3040832579135895, mean loss: 0.3416088535467012
Epoch: 51, step: 913, loss: 0.37069427967071533, mean loss: 0.34160924365139983
Epoch: 51, step: 914, loss: 0.331544429063797, mean loss: 0.3416091086601233
Epoch: 51, step: 915, loss: 0.34261852502822876, mean loss: 0.3416091221984329
Epoch: 51, step: 916, loss: 0.35043880343437195, mean loss: 0.341609240620681
Epoch: 51, step: 917, loss: 0.35872042179107666, mean loss: 0.3416094701099808
Epoch: 51, step: 918, loss: 0.3735159635543823, mean loss: 0.3416098980232011
Epoch: 51, step: 919, loss: 0.3198259770870209, mean loss: 0.34160960587255285
Epoch: 51, step: 920, loss: 0.32127490639686584, mean loss: 0.34160933316150244
Epoch: 51, step: 921, loss: 0.34934940934181213, mean loss: 0.3416094369631839
Epoch: 51, step: 922, loss: 0.3276582658290863, mean loss: 0.3416092498674025
Epoch: 51, step: 923, loss: 0.3339346945285797, mean loss: 0.3416091469471775
Epoch: 51, step: 924, loss: 0.3061928451061249, mean loss: 0.34160867200045913
Epoch: 51, step: 925, loss: 0.31466811895370483, mean loss: 0.34160831072175396
Epoch: 51, step: 926, loss: 0.3724172115325928, mean loss: 0.34160872387030783
Epoch: 51, step: 927, loss: 0.31782424449920654, mean loss: 0.3416084049237948
Epoch: 51, step: 928, loss: 0.30107665061950684, mean loss: 0.34160786140597593
Epoch: 51, step: 929, loss: 0.3165702819824219, mean loss: 0.3416075256645724
Epoch: 51, step: 930, loss: 0.3126509487628937, mean loss: 0.34160713737658177
Epoch: 51, step: 931, loss: 0.3536320924758911, mean loss: 0.34160729862088424
Epoch: 51, step: 932, loss: 0.2988916039466858, mean loss: 0.3416067258478487
Epoch: 51, step: 933, loss: 0.3874363303184509, mean loss: 0.3416073403669357
Epoch: 51, step: 934, loss: 0.33789893984794617, mean loss: 0.34160729064247547
Epoch: 51, step: 935, loss: 0.3463085889816284, mean loss: 0.34160735367946043
Epoch: 51, step: 936, loss: 0.3215753138065338, mean loss: 0.341607085085048
Epoch: 51, step: 937, loss: 0.3224200904369354, mean loss: 0.3416068278246548
Epoch: 51, step: 938, loss: 0.3697099983692169, mean loss: 0.3416072046286255
Epoch: 51, step: 939, loss: 0.326037734746933, mean loss: 0.3416069958778226
Epoch: 51, step: 940, loss: 0.3371826410293579, mean loss: 0.34160693655818936
Epoch: 51, step: 941, loss: 0.3601120114326477, mean loss: 0.34160718466205436
Epoch: 51, step: 942, loss: 0.3398881256580353, mean loss: 0.3416071616143516
Epoch: 51, step: 943, loss: 0.33648309111595154, mean loss: 0.34160709291602886
Epoch: 51, step: 944, loss: 0.3103298842906952, mean loss: 0.3416066735886666
Epoch: 51, step: 945, loss: 0.3581039607524872, mean loss: 0.341606894761574
Epoch: 51, step: 946, loss: 0.30410152673721313, mean loss: 0.3416063919479903
Epoch: 51, step: 947, loss: 0.32037773728370667, mean loss: 0.3416061073510541
Epoch: 51, step: 948, loss: 0.3200747072696686, mean loss: 0.34160581869930284
Epoch: 51, step: 949, loss: 0.3155305087566376, mean loss: 0.34160546913620204
Epoch: 51, step: 950, loss: 0.31016266345977783, mean loss: 0.3416050476226197
Epoch: 51, step: 951, loss: 0.3389822542667389, mean loss: 0.3416050124626465
Epoch: 51, step: 952, loss: 0.3015578091144562, mean loss: 0.34160447561527535
Epoch: 51, step: 953, loss: 0.33951830863952637, mean loss: 0.34160444764982084
Epoch: 51, step: 954, loss: 0.3358249366283417, mean loss: 0.3416043701754442
Epoch: 51, step: 955, loss: 0.3082984983921051, mean loss: 0.34160392371603693
Epoch: 51, step: 956, loss: 0.2972053587436676, mean loss: 0.34160332856898834
Epoch: 51, step: 957, loss: 0.3640708327293396, mean loss: 0.34160362973389224
Epoch: 51, step: 958, loss: 0.3305189609527588, mean loss: 0.34160348115181405
Epoch: 51, step: 959, loss: 0.32404065132141113, mean loss: 0.34160324573776346
Epoch: 51, step: 960, loss: 0.32206952571868896, mean loss: 0.3416029839091994
Epoch: 51, step: 961, loss: 0.3764064311981201, mean loss: 0.3416034504058255
Epoch: 51, step: 962, loss: 0.31397318840026855, mean loss: 0.34160308006172907
Epoch: 51, step: 963, loss: 0.33744871616363525, mean loss: 0.3416030243791763
Epoch: 51, step: 964, loss: 0.3595786988735199, mean loss: 0.3416032653108936
Epoch: 51, step: 965, loss: 0.3107140362262726, mean loss: 0.34160285130165774
Epoch: 51, step: 966, loss: 0.3804064989089966, mean loss: 0.3416033713811046
Epoch: 51, step: 967, loss: 0.3523131012916565, mean loss: 0.34160351492007834
Epoch: 51, step: 968, loss: 0.37765011191368103, mean loss: 0.3416039980342407
Epoch: 51, step: 969, loss: 0.35775381326675415, mean loss: 0.3416042144790799
Epoch: 51, step: 970, loss: 0.3386271297931671, mean loss: 0.34160417457980113
Epoch: 51, step: 971, loss: 0.3682332932949066, mean loss: 0.34160453146195396
Epoch: 51, step: 972, loss: 0.3462478816509247, mean loss: 0.3416045936910732
Epoch: 51, step: 973, loss: 0.3134634494781494, mean loss: 0.341604216554937
Epoch: 51, step: 974, loss: 0.31930848956108093, mean loss: 0.34160391776070237
Epoch: 51, step: 975, loss: 0.3461228609085083, mean loss: 0.341603978320112
Epoch: 51, step: 976, loss: 0.35787713527679443, mean loss: 0.3416041963975561
Epoch: 51, step: 977, loss: 0.38402900099754333, mean loss: 0.34160476492700587
Epoch: 51, step: 978, loss: 0.3180196285247803, mean loss: 0.3416044488698063
Epoch: 51, step: 979, loss: 0.3486379086971283, mean loss: 0.34160454312178723
Epoch: 51, step: 980, loss: 0.3309343457221985, mean loss: 0.3416044001375675
Epoch: 51, step: 981, loss: 0.312350869178772, mean loss: 0.3416040081357054
Epoch: 51, step: 982, loss: 0.330732524394989, mean loss: 0.3416038624580855
Epoch: 51, step: 983, loss: 0.30946797132492065, mean loss: 0.34160343184368963
Epoch: 51, step: 984, loss: 0.32844990491867065, mean loss: 0.34160325559146965
Epoch: 51, step: 985, loss: 0.3477446436882019, mean loss: 0.34160333788261393
Epoch: 51, step: 986, loss: 0.32615476846694946, mean loss: 0.3416031308832515
Epoch: 51, step: 987, loss: 0.31539836525917053, mean loss: 0.3416027797635492
Epoch: 51, step: 988, loss: 0.3398497700691223, mean loss: 0.34160275627515
Epoch: 51, step: 989, loss: 0.3279173970222473, mean loss: 0.34160257290886586
Epoch: 51, step: 990, loss: 0.3394303619861603, mean loss: 0.3416025438044119
Epoch: 51, step: 991, loss: 0.3530378043651581, mean loss: 0.34160269701815005
Epoch: 51, step: 992, loss: 0.3376505672931671, mean loss: 0.3416026440668025
Epoch: 51, step: 993, loss: 0.34083351492881775, mean loss: 0.34160263376200956
Epoch: 51, step: 994, loss: 0.336652010679245, mean loss: 0.3416025674344451
Epoch: 51, step: 995, loss: 0.2934042811393738, mean loss: 0.3416019216910596
Epoch: 51, step: 996, loss: 0.32956087589263916, mean loss: 0.3416017603715998
Epoch: 51, step: 997, loss: 0.30080682039260864, mean loss: 0.34160121383024267
Epoch: 51, step: 998, loss: 0.3054327368736267, mean loss: 0.34160072927741175
Epoch: 51, step: 999, loss: 0.3625268042087555, mean loss: 0.3416010096224486
Epoch: 51, step: 1000, loss: 0.3383428454399109, mean loss: 0.3416009659736552
Epoch: 51, step: 1001, loss: 0.3239530026912689, mean loss: 0.34160072955156584
Epoch: 51, step: 1002, loss: 0.3272920846939087, mean loss: 0.3416005378674411
Epoch: 51, step: 1003, loss: 0.3095797598361969, mean loss: 0.3416001089104961
Epoch: 51, step: 1004, loss: 0.338873028755188, mean loss: 0.3416000723784574
Epoch: 51, step: 1005, loss: 0.31108754873275757, mean loss: 0.3415996636373503
Epoch: 51, step: 1006, loss: 0.34702932834625244, mean loss: 0.3415997363713352
Epoch: 51, step: 1007, loss: 0.33710500597953796, mean loss: 0.3415996761622264
Epoch: 51, step: 1008, loss: 0.3692542016506195, mean loss: 0.34160004660313953
Epoch: 51, step: 1009, loss: 0.32664546370506287, mean loss: 0.3415998462845645
Epoch: 51, step: 1010, loss: 0.3145614266395569, mean loss: 0.3415994841062825
Epoch: 51, step: 1011, loss: 0.33425500988960266, mean loss: 0.3415993857287346
Epoch: 51, step: 1012, loss: 0.3175477683544159, mean loss: 0.34159906356715064
Epoch: 51, step: 1013, loss: 0.32188525795936584, mean loss: 0.3415987995123192
Epoch: 51, step: 1014, loss: 0.3327873945236206, mean loss: 0.34159868149031264
Epoch: 51, step: 1015, loss: 0.3655339777469635, mean loss: 0.34159900208094024
Epoch: 51, step: 1016, loss: 0.31331172585487366, mean loss: 0.3415986232047368
Epoch: 51, step: 1017, loss: 0.2876496911048889, mean loss: 0.3415979006292352
Epoch: 51, step: 1018, loss: 0.36087656021118164, mean loss: 0.3415981588382488
Epoch: 51, step: 1019, loss: 0.3105854094028473, mean loss: 0.34159774347409155
Epoch: 51, step: 1020, loss: 0.33982110023498535, mean loss: 0.3415977196792313
Epoch: 51, step: 1021, loss: 0.3335936963558197, mean loss: 0.34159761248153325
Epoch: 51, step: 1022, loss: 0.3342519700527191, mean loss: 0.3415975141028328
Epoch: 51, step: 1023, loss: 0.3672313690185547, mean loss: 0.3415978574072593
Epoch: 51, step: 1024, loss: 0.3510458171367645, mean loss: 0.3415979839384801
Epoch: 51, step: 1025, loss: 0.37318024039268494, mean loss: 0.34159840689624704
Epoch: 51, step: 1026, loss: 0.3145802915096283, mean loss: 0.34159804506748637
Epoch: 51, step: 1027, loss: 0.3178424537181854, mean loss: 0.3415977269349688
Epoch: 51, step: 1028, loss: 0.3083883225917816, mean loss: 0.34159728220388336
Epoch: 51, step: 1029, loss: 0.3334048092365265, mean loss: 0.3415971724940383
Epoch: 51, step: 1030, loss: 0.3410055935382843, mean loss: 0.34159716457199
Epoch: 51, step: 1031, loss: 0.3353784680366516, mean loss: 0.3415970812962852
Epoch: 51, step: 1032, loss: 0.32436615228652954, mean loss: 0.3415968505568472
Epoch: 51, step: 1033, loss: 0.304250031709671, mean loss: 0.34159635045214637
Epoch: 51, step: 1034, loss: 0.29855191707611084, mean loss: 0.3415957740594071
Epoch: 51, step: 1035, loss: 0.30396053194999695, mean loss: 0.3415952701059777
Epoch: 51, step: 1036, loss: 0.2893833518028259, mean loss: 0.34159457097342316
Epoch: 51, step: 1037, loss: 0.3949219286441803, mean loss: 0.3415952850324691
Epoch: 51, step: 1038, loss: 0.32641470432281494, mean loss: 0.34159508176558495
Epoch: 51, step: 1039, loss: 0.3833141028881073, mean loss: 0.3415956403727983
Epoch: 51, step: 1040, loss: 0.32937994599342346, mean loss: 0.34159547680990915
Epoch: 51, step: 1041, loss: 0.33860230445861816, mean loss: 0.34159543673315645
Epoch: 51, step: 1042, loss: 0.31398388743400574, mean loss: 0.34159506703629755
Epoch: 51, step: 1043, loss: 0.3730979859828949, mean loss: 0.3415954888298781
Epoch: 51, step: 1044, loss: 0.3581762909889221, mean loss: 0.34159571082779155
Epoch: 51, step: 1045, loss: 0.34815067052841187, mean loss: 0.3415957985900047
Epoch: 51, step: 1046, loss: 0.33399641513824463, mean loss: 0.3415956968457055
Epoch: 51, step: 1047, loss: 0.3344872295856476, mean loss: 0.34159560167530895
Epoch: 51, step: 1048, loss: 0.3105202317237854, mean loss: 0.34159518563404734
Epoch: 51, step: 1049, loss: 0.3438868820667267, mean loss: 0.3415952163151788
Epoch: 51, step: 1050, loss: 0.32569482922554016, mean loss: 0.3415950034443429
Epoch: 51, step: 1051, loss: 0.38040393590927124, mean loss: 0.34159552300271906
Epoch: 51, step: 1052, loss: 0.3458552062511444, mean loss: 0.3415955800288814
Epoch: 51, step: 1053, loss: 0.33491119742393494, mean loss: 0.341595490543452
Epoch: 51, step: 1054, loss: 0.3501208424568176, mean loss: 0.34159560467285016
Epoch: 51, step: 1055, loss: 0.31396204233169556, mean loss: 0.34159523474564346
Epoch: 51, step: 1056, loss: 0.366610586643219, mean loss: 0.34159556961869597
Epoch: 51, step: 1057, loss: 0.31501153111457825, mean loss: 0.34159521375086777
Epoch: 51, step: 1058, loss: 0.34985390305519104, mean loss: 0.3415953243045176
Epoch: 51, step: 1059, loss: 0.35484743118286133, mean loss: 0.34159550169939445
Epoch: 51, step: 1060, loss: 0.31124037504196167, mean loss: 0.3415950953661282
Epoch: 51, step: 1061, loss: 0.3164185583591461, mean loss: 0.3415947583578958
Epoch: 51, step: 1062, loss: 0.36449357867240906, mean loss: 0.34159506487295216
Epoch: 51, step: 1063, loss: 0.3174884021282196, mean loss: 0.34159474219448743
Epoch: 51, step: 1064, loss: 0.3444856107234955, mean loss: 0.34159478088953793
Epoch: 51, step: 1065, loss: 0.2961224317550659, mean loss: 0.34159417223809724
Epoch: 51, step: 1066, loss: 0.35847237706184387, mean loss: 0.3415943981513473
Epoch: 51, step: 1067, loss: 0.33730337023735046, mean loss: 0.3415943407170942
Epoch: 51, step: 1068, loss: 0.31237563490867615, mean loss: 0.3415939496378201
Epoch: 51, step: 1069, loss: 0.3083283603191376, mean loss: 0.34159350439878433
Epoch: 51, step: 1070, loss: 0.33216699957847595, mean loss: 0.341593378232622
Epoch: 51, step: 1071, loss: 0.3470202684402466, mean loss: 0.34159345086619725
Epoch: 51, step: 1072, loss: 0.2833237051963806, mean loss: 0.34159267099353546
Epoch: 51, step: 1073, loss: 0.3359484374523163, mean loss: 0.34159259545305604
Epoch: 51, step: 1074, loss: 0.313996285200119, mean loss: 0.3415922261184791
Epoch: 51, step: 1075, loss: 0.33333277702331543, mean loss: 0.3415921155798135
Epoch: 51, step: 1076, loss: 0.34910961985588074, mean loss: 0.3415922161874643
Epoch: 51, step: 1077, loss: 0.3564540445804596, mean loss: 0.3415924150824135
Epoch: 51, step: 1078, loss: 0.3450092077255249, mean loss: 0.34159246080853056
Epoch: 51, step: 1079, loss: 0.3137775957584381, mean loss: 0.34159208857383955
Epoch: 51, step: 1080, loss: 0.32837679982185364, mean loss: 0.3415919117215311
Epoch: 51, step: 1081, loss: 0.3361496925354004, mean loss: 0.34159183889254
Epoch: 51, step: 1082, loss: 0.3396071493625641, mean loss: 0.34159181233333746
Epoch: 51, step: 1083, loss: 0.3038617670536041, mean loss: 0.34159130743496896
Epoch: 51, step: 1084, loss: 0.31867852807044983, mean loss: 0.34159100082335414
Epoch: 51, step: 1085, loss: 0.33508044481277466, mean loss: 0.3415909137023049
Epoch: 51, step: 1086, loss: 0.3386927545070648, mean loss: 0.341590874921087
Epoch: 51, step: 1087, loss: 0.3781529366970062, mean loss: 0.3415913641634701
Epoch: 51, step: 1088, loss: 0.333670973777771, mean loss: 0.34159125818096725
Epoch: 51, step: 1089, loss: 0.3569975793361664, mean loss: 0.3415914643297236
Epoch: 51, step: 1090, loss: 0.2967095673084259, mean loss: 0.3415908637824964
Epoch: 51, step: 1091, loss: 0.36176949739456177, mean loss: 0.34159113378134054
Epoch: 51, step: 1092, loss: 0.3189318776130676, mean loss: 0.34159083059475065
Epoch: 51, step: 1093, loss: 0.34308868646621704, mean loss: 0.3415908506361736
Epoch: 51, step: 1094, loss: 0.3643909692764282, mean loss: 0.3415911556993754
Epoch: 51, step: 1095, loss: 0.3268428444862366, mean loss: 0.3415909583711548
Epoch: 51, step: 1096, loss: 0.3321892023086548, mean loss: 0.3415908325800085
Epoch: 51, step: 1097, loss: 0.33046895265579224, mean loss: 0.34159068377639173
Epoch: 51, step: 1098, loss: 0.35626786947250366, mean loss: 0.3415908801450911
Epoch: 51, step: 1099, loss: 0.3452966511249542, mean loss: 0.3415909297246022
Epoch: 51, step: 1100, loss: 0.3000192642211914, mean loss: 0.3415903735447172
Epoch: 51, step: 1101, loss: 0.2946315407752991, mean loss: 0.3415897452992891
Epoch: 51, step: 1102, loss: 0.3085009753704071, mean loss: 0.3415893026223933
Epoch: 51, step: 1103, loss: 0.334230899810791, mean loss: 0.341589204179588
Epoch: 51, step: 1104, loss: 0.3488818407058716, mean loss: 0.341589301741248
Epoch: 51, step: 1105, loss: 0.33271515369415283, mean loss: 0.3415891830235484
Epoch: 51, step: 1106, loss: 0.33706846833229065, mean loss: 0.3415891225465689
Epoch: 51, step: 1107, loss: 0.309335857629776, mean loss: 0.34158869107630835
Epoch: 51, step: 1108, loss: 0.2824559807777405, mean loss: 0.34158790003500833
Epoch: 51, step: 1109, loss: 0.3202851116657257, mean loss: 0.3415876150631223
Epoch: 51, step: 1110, loss: 0.32532718777656555, mean loss: 0.34158739754687206
Epoch: 51, step: 1111, loss: 0.31987935304641724, mean loss: 0.3415871071615585
Epoch: 51, step: 1112, loss: 0.30433622002601624, mean loss: 0.34158660886859415
Epoch: 51, step: 1113, loss: 0.3176807463169098, mean loss: 0.3415862890919475
Epoch: 51, step: 1114, loss: 0.3072455823421478, mean loss: 0.34158582973980595
Epoch: 51, step: 1115, loss: 0.32442906498908997, mean loss: 0.34158560024857065
Epoch: 51, step: 1116, loss: 0.30787044763565063, mean loss: 0.34158514927610356
Epoch: 51, step: 1117, loss: 0.3939066231250763, mean loss: 0.341585849116582
Epoch: 51, step: 1118, loss: 0.32397982478141785, mean loss: 0.3415856136254389
Epoch: 51, step: 1119, loss: 0.3195037841796875, mean loss: 0.3415853182716664
Epoch: 51, step: 1120, loss: 0.3152761459350586, mean loss: 0.3415849663801083
Epoch: 51, step: 1121, loss: 0.3049887716770172, mean loss: 0.34158447690367916
Epoch: 51, step: 1122, loss: 0.3733173608779907, mean loss: 0.34158490132734165
Epoch: 51, step: 1123, loss: 0.38150060176849365, mean loss: 0.3415854351880901
Epoch: 51, step: 1124, loss: 0.37594518065452576, mean loss: 0.34158589473342926
Epoch: 51, step: 1125, loss: 0.3156411051750183, mean loss: 0.3415855477387849
Epoch: 51, step: 1126, loss: 0.34906119108200073, mean loss: 0.34158564771930333
Epoch: 51, step: 1127, loss: 0.3700024485588074, mean loss: 0.3415860277653211
Epoch: 51, step: 1128, loss: 0.3509398400783539, mean loss: 0.3415861528614429
Epoch: 51, step: 1129, loss: 0.3573604226112366, mean loss: 0.3415863638207302
Epoch: 51, step: 1130, loss: 0.33975252509117126, mean loss: 0.3415863392959729
Epoch: 51, step: 1131, loss: 0.29444167017936707, mean loss: 0.34158570881735517
Epoch: 51, step: 1132, loss: 0.36916545033454895, mean loss: 0.34158607764388627
Epoch: 51, step: 1133, loss: 0.39922034740448, mean loss: 0.3415868483822018
Epoch: 51, step: 1134, loss: 0.31446078419685364, mean loss: 0.34158648563244337
Epoch: 51, step: 1135, loss: 0.3413887023925781, mean loss: 0.3415864829875752
Epoch: 51, step: 1136, loss: 0.3477224111557007, mean loss: 0.34158656503954254
Epoch: 51, step: 1137, loss: 0.3615890443325043, mean loss: 0.3415868325167335
Epoch: 51, step: 1138, loss: 0.3430445194244385, mean loss: 0.34158685200895644
Epoch: 51, step: 1139, loss: 0.34601300954818726, mean loss: 0.34158691119484563
Epoch: 51, step: 1140, loss: 0.2992800176143646, mean loss: 0.34158634548121886
Epoch: 51, step: 1141, loss: 0.34092187881469727, mean loss: 0.3415863365963117
Epoch: 51, step: 1142, loss: 0.35826534032821655, mean loss: 0.3415865596164052
Epoch: 51, step: 1143, loss: 0.3177250921726227, mean loss: 0.3415862405616445
Epoch: 51, step: 1144, loss: 0.3453199863433838, mean loss: 0.3415862904853737
Epoch: 51, step: 1145, loss: 0.29987260699272156, mean loss: 0.34158573274124354
Epoch: 51, step: 1146, loss: 0.32570958137512207, mean loss: 0.3415855204676897
Epoch: 51, step: 1147, loss: 0.3475258946418762, mean loss: 0.3415855998929514
Epoch: 51, step: 1148, loss: 0.36799106001853943, mean loss: 0.34158595294016336
Epoch: 51, step: 1149, loss: 0.33581826090812683, mean loss: 0.34158587582579547
Epoch: 51, step: 1150, loss: 0.322032630443573, mean loss: 0.34158561440129676
Epoch: 51, step: 1151, loss: 0.3284742534160614, mean loss: 0.34158543910634803
Epoch: 51, step: 1152, loss: 0.28252527117729187, mean loss: 0.3415846495002418
Epoch: 51, step: 1153, loss: 0.3152849078178406, mean loss: 0.3415842978900158
Epoch: 51, step: 1154, loss: 0.3387967646121979, mean loss: 0.34158426062302993
Epoch: 51, step: 1155, loss: 0.35632559657096863, mean loss: 0.34158445769971374
Epoch: 51, step: 1156, loss: 0.32839035987854004, mean loss: 0.34158428131038976
Epoch: 51, step: 1157, loss: 0.32955029606819153, mean loss: 0.34158412043253567
Epoch: 51, step: 1158, loss: 0.294450581073761, mean loss: 0.34158349033027563
Epoch: 51, step: 1159, loss: 0.3158529996871948, mean loss: 0.34158314635815323
Epoch: 51, step: 1160, loss: 0.31670188903808594, mean loss: 0.3415828137432569
Epoch: 51, step: 1161, loss: 0.368400514125824, mean loss: 0.34158317223990664
Epoch: 51, step: 1162, loss: 0.3164253532886505, mean loss: 0.34158283593690086
Epoch: 51, step: 1163, loss: 0.32127681374549866, mean loss: 0.34158256449504715
Epoch: 51, step: 1164, loss: 0.3198838531970978, mean loss: 0.34158227444022354
Epoch: 51, step: 1165, loss: 0.3068826496601105, mean loss: 0.3415818106035068
Epoch: 51, step: 1166, loss: 0.3347885310649872, mean loss: 0.3415817197976154
Epoch: 51, step: 1167, loss: 0.3631322979927063, mean loss: 0.3415820078607362
Epoch: 51, step: 1168, loss: 0.3194578289985657, mean loss: 0.34158171213434024
Epoch: 51, step: 1169, loss: 0.2947932183742523, mean loss: 0.3415810867367708
Epoch: 51, step: 1170, loss: 0.31508320569992065, mean loss: 0.34158073255804944
Epoch: 51, step: 1171, loss: 0.3397744596004486, mean loss: 0.3415807084151795
Epoch: 51, step: 1172, loss: 0.3039606213569641, mean loss: 0.34158020558711827
Epoch: 51, step: 1173, loss: 0.3694070279598236, mean loss: 0.34158057751395904
Epoch: 51, step: 1174, loss: 0.3771458566188812, mean loss: 0.3415810528648606
Epoch: 51, step: 1175, loss: 0.316131055355072, mean loss: 0.3415807127152013
Epoch: 51, step: 1176, loss: 0.3250713050365448, mean loss: 0.34158049206314267
Epoch: 51, step: 1177, loss: 0.3348205089569092, mean loss: 0.34158040171560977
Epoch: 51, step: 1178, loss: 0.35406494140625, mean loss: 0.34158056856991514
Epoch: 51, step: 1179, loss: 0.30653131008148193, mean loss: 0.3415801001472367
Epoch: 51, step: 1180, loss: 0.29971227049827576, mean loss: 0.34157954060390694
Epoch: 51, step: 1181, loss: 0.30738699436187744, mean loss: 0.3415790836431414
Epoch: 51, step: 1182, loss: 0.2767011523246765, mean loss: 0.34157821660408705
Epoch: 51, step: 1183, loss: 0.3667704463005066, mean loss: 0.3415785532725761
Epoch: 51, step: 1184, loss: 0.30781441926956177, mean loss: 0.34157810205534744
Epoch: 51, step: 1185, loss: 0.3154965937137604, mean loss: 0.34157775351187103
Epoch: 51, step: 1186, loss: 0.36511796712875366, mean loss: 0.34157806809023583
Epoch: 51, step: 1187, loss: 0.31798508763313293, mean loss: 0.34157775281093744
Epoch: 51, step: 1188, loss: 0.32807618379592896, mean loss: 0.34157757238827613
Epoch: 51, step: 1189, loss: 0.3355070948600769, mean loss: 0.3415774912690318
Epoch: 51, step: 1190, loss: 0.3609362542629242, mean loss: 0.3415777499549808
Epoch: 51, step: 1191, loss: 0.34203606843948364, mean loss: 0.34157775607928575
Epoch: 51, step: 1192, loss: 0.3463957905769348, mean loss: 0.3415778204596657
Epoch: 51, step: 1193, loss: 0.34051641821861267, mean loss: 0.3415778062770013
Epoch: 51, step: 1194, loss: 0.3113594055175781, mean loss: 0.3415774024982127
Epoch: 51, step: 1195, loss: 0.30072543025016785, mean loss: 0.3415768566407535
Epoch: 51, step: 1196, loss: 0.4261743128299713, mean loss: 0.3415779870032044
Epoch: 51, step: 1197, loss: 0.3577040731906891, mean loss: 0.34157820247160703
Epoch: 51, step: 1198, loss: 0.29946649074554443, mean loss: 0.34157763980426703
Epoch: 51, step: 1199, loss: 0.3059595227241516, mean loss: 0.34157716390617127
Epoch: 51, step: 1200, loss: 0.3729325532913208, mean loss: 0.3415775828438342
Epoch: 51, step: 1201, loss: 0.29412052035331726, mean loss: 0.34157694878105876
Epoch: 51, step: 1202, loss: 0.3581984043121338, mean loss: 0.3415771708534936
Epoch: 51, step: 1203, loss: 0.31349191069602966, mean loss: 0.3415767956228908
Epoch: 51, step: 1204, loss: 0.34408730268478394, mean loss: 0.3415768291638474
Epoch: 51, step: 1205, loss: 0.3175114393234253, mean loss: 0.3415765076489531
Epoch: 51, step: 1206, loss: 0.3189459443092346, mean loss: 0.3415762053074568
Epoch: 51, step: 1207, loss: 0.3303043842315674, mean loss: 0.3415760547193486
Epoch: 51, step: 1208, loss: 0.29977181553840637, mean loss: 0.3415754962348633
Epoch: 51, step: 1209, loss: 0.3077958822250366, mean loss: 0.34157504496153107
Epoch: 51, step: 1210, loss: 0.29163554310798645, mean loss: 0.3415743778116833
Epoch: 51, step: 1211, loss: 0.3444336950778961, mean loss: 0.34157441600925287
Epoch: 51, step: 1212, loss: 0.32057803869247437, mean loss: 0.34157413552276106
Epoch: 51, step: 1213, loss: 0.3555808663368225, mean loss: 0.3415743226334348
Epoch: 51, step: 1214, loss: 0.2944841980934143, mean loss: 0.34157369358249184
Epoch: 51, step: 1215, loss: 0.3276948034763336, mean loss: 0.3415735081845476
Epoch: 51, step: 1216, loss: 0.3017215430736542, mean loss: 0.34157297583839796
Epoch: 51, step: 1217, loss: 0.34465616941452026, mean loss: 0.3415730170234261
Epoch: 51, step: 1218, loss: 0.35003194212913513, mean loss: 0.341573130015493
Epoch: 51, step: 1219, loss: 0.31101909279823303, mean loss: 0.3415727218882594
Epoch: 51, step: 1220, loss: 0.33283019065856934, mean loss: 0.3415726051109772
Epoch: 51, step: 1221, loss: 0.3242940306663513, mean loss: 0.3415723743176338
Epoch: 51, step: 1222, loss: 0.3319129943847656, mean loss: 0.341572245297105
Epoch: 51, step: 1223, loss: 0.324142724275589, mean loss: 0.3415720124937575
Epoch: 51, step: 1224, loss: 0.31778883934020996, mean loss: 0.34157169482992933
Epoch: 51, step: 1225, loss: 0.34475648403167725, mean loss: 0.34157173736751717
Epoch: 51, step: 1226, loss: 0.3314930498600006, mean loss: 0.3415716027534809
Epoch: 51, step: 1227, loss: 0.33908945322036743, mean loss: 0.34157156960157453
Epoch: 51, step: 1228, loss: 0.3194532096385956, mean loss: 0.34157127418987787
Epoch: 51, step: 1229, loss: 0.3893798291683197, mean loss: 0.3415719127099914
Epoch: 51, step: 1230, loss: 0.3300635516643524, mean loss: 0.34157175900900916
Epoch: 51, step: 1231, loss: 0.3425768315792084, mean loss: 0.34157177243216974
Epoch: 51, step: 1232, loss: 0.36757323145866394, mean loss: 0.34157211968778933
Epoch: 51, step: 1233, loss: 0.34692326188087463, mean loss: 0.34157219115260135
Epoch: 51, step: 1234, loss: 0.3268175423145294, mean loss: 0.3415719941060484
Epoch: 51, step: 1235, loss: 0.30382755398750305, mean loss: 0.34157149004034165
Epoch: 51, step: 1236, loss: 0.32657429575920105, mean loss: 0.34157128975997303
Epoch: 51, step: 1237, loss: 0.33718615770339966, mean loss: 0.3415712311994103
Epoch: 51, step: 1238, loss: 0.29835376143455505, mean loss: 0.3415706540661522
Epoch: 51, step: 1239, loss: 0.3330810070037842, mean loss: 0.34157054069551146
Epoch: 51, step: 1240, loss: 0.4148581922054291, mean loss: 0.34157151936482455
Epoch: 51, step: 1241, loss: 0.33012208342552185, mean loss: 0.34157136647328357
Epoch: 51, step: 1242, loss: 0.33276671171188354, mean loss: 0.34157124890074414
Epoch: 51, step: 1243, loss: 0.30714139342308044, mean loss: 0.3415707891494425
Epoch: 51, step: 1244, loss: 0.3357788026332855, mean loss: 0.341570711808491
Epoch: 51, step: 1245, loss: 0.3069906532764435, mean loss: 0.3415702500638184
Epoch: 51, step: 1246, loss: 0.35422632098197937, mean loss: 0.3415704190570341
Epoch: 51, step: 1247, loss: 0.30332687497138977, mean loss: 0.34156990840777807
Epoch: 51, step: 1248, loss: 0.3400866985321045, mean loss: 0.34156988860339216
Epoch: 51, step: 1249, loss: 0.3312998116016388, mean loss: 0.34156975147522434
Epoch: 51, step: 1250, loss: 0.29645881056785583, mean loss: 0.34156914915276076
Epoch: 51, step: 1251, loss: 0.3205358386039734, mean loss: 0.3415688683191976
Epoch: 51, step: 1252, loss: 0.3343048691749573, mean loss: 0.3415687713326808
Epoch: 51, step: 1253, loss: 0.30557993054389954, mean loss: 0.3415682908279839
Epoch: 51, step: 1254, loss: 0.36128365993499756, mean loss: 0.3415685540540498
Epoch: 51, step: 1255, loss: 0.3342925012111664, mean loss: 0.34156845691048715
Epoch: 51, step: 1256, loss: 0.37350884079933167, mean loss: 0.3415688833451661
Epoch: 51, step: 1257, loss: 0.2929495871067047, mean loss: 0.3415682342397185
Epoch: 51, step: 1258, loss: 0.3388383090496063, mean loss: 0.34156819779357894
Epoch: 51, step: 1259, loss: 0.3143807649612427, mean loss: 0.34156783482988096
Epoch: 51, step: 1260, loss: 0.34158217906951904, mean loss: 0.34156783502138005
Epoch: 51, step: 1261, loss: 0.30229538679122925, mean loss: 0.34156731073162716
Epoch: 51, step: 1262, loss: 0.3415575325489044, mean loss: 0.3415673106010895
Epoch: 51, step: 1263, loss: 0.3192930519580841, mean loss: 0.34156701324621896
Epoch: 51, step: 1264, loss: 0.3239482045173645, mean loss: 0.3415667780433898
Epoch: 51, step: 1265, loss: 0.3281060755252838, mean loss: 0.34156659835172626
Epoch: 51, step: 1266, loss: 0.37819600105285645, mean loss: 0.34156708732400937
Epoch: 51, step: 1267, loss: 0.3254275321960449, mean loss: 0.34156687187715
Epoch: 51, step: 1268, loss: 0.3305826485157013, mean loss: 0.3415667252507519
Epoch: 51, step: 1269, loss: 0.34074318408966064, mean loss: 0.3415667142575976
Epoch: 51, step: 1270, loss: 0.35219135880470276, mean loss: 0.3415668560802572
Epoch: 51, step: 1271, loss: 0.3517574965953827, mean loss: 0.34156699210781494
Epoch: 51, step: 1272, loss: 0.31983456015586853, mean loss: 0.3415667020210262
Epoch: 51, step: 1273, loss: 0.2907755970954895, mean loss: 0.341566024065062
Epoch: 51, step: 1274, loss: 0.3725026845932007, mean loss: 0.3415664369998386
Epoch: 51, step: 1275, loss: 0.3503921329975128, mean loss: 0.34156655480144027
Epoch: 51, step: 1276, loss: 0.3356814980506897, mean loss: 0.3415664762512774
Epoch: 51, step: 1277, loss: 0.32465940713882446, mean loss: 0.3415662505890005
Epoch: 51, step: 1278, loss: 0.3385329246520996, mean loss: 0.34156621010308913
Epoch: 51, step: 1279, loss: 0.36552804708480835, mean loss: 0.3415665299183283
Epoch: 51, step: 1280, loss: 0.3162749111652374, mean loss: 0.3415661923591858
Epoch: 51, step: 1281, loss: 0.3526545763015747, mean loss: 0.34156634035032296
Epoch: 51, step: 1282, loss: 0.3485765755176544, mean loss: 0.3415664339111911
Epoch: 51, step: 1283, loss: 0.2953304946422577, mean loss: 0.3415658168396122
Epoch: 51, step: 1284, loss: 0.39860278367996216, mean loss: 0.34156657805311885
Epoch: 51, step: 1285, loss: 0.3737463653087616, mean loss: 0.34156700751778263
Epoch: 51, step: 1286, loss: 0.32808107137680054, mean loss: 0.34156682753972095
Epoch: 51, step: 1287, loss: 0.29223597049713135, mean loss: 0.34156616919806393
Epoch: 51, step: 1288, loss: 0.36996904015541077, mean loss: 0.34156654824162225
Epoch: 51, step: 1289, loss: 0.3133804202079773, mean loss: 0.3415661720955733
Epoch: 51, step: 1290, loss: 0.3352731764316559, mean loss: 0.3415660881161823
Epoch: 51, step: 1291, loss: 0.34757453203201294, mean loss: 0.34156616829718894
Epoch: 51, step: 1292, loss: 0.33715444803237915, mean loss: 0.34156610942479926
Epoch: 51, step: 1293, loss: 0.3418215811252594, mean loss: 0.3415661128339068
Epoch: 51, step: 1294, loss: 0.33820056915283203, mean loss: 0.3415660679234639
Epoch: 51, step: 1295, loss: 0.39250537753105164, mean loss: 0.34156674765804634
Epoch: 51, step: 1296, loss: 0.34145593643188477, mean loss: 0.34156674617940014
Epoch: 51, step: 1297, loss: 0.3472099006175995, mean loss: 0.34156682147969153
Epoch: 51, step: 1298, loss: 0.3326003849506378, mean loss: 0.34156670183627547
Epoch: 51, step: 1299, loss: 0.3125942349433899, mean loss: 0.34156631524806436
Epoch: 51, step: 1300, loss: 0.3896179795265198, mean loss: 0.3415669564071047
Epoch: 51, step: 1301, loss: 0.3218745291233063, mean loss: 0.3415666936522241
Epoch: 51, step: 1302, loss: 0.34169355034828186, mean loss: 0.3415666953448428
Epoch: 51, step: 1303, loss: 0.3132697343826294, mean loss: 0.3415663177902588
Epoch: 51, step: 1304, loss: 0.31841400265693665, mean loss: 0.3415660088826665
Epoch: 51, step: 1305, loss: 0.33238551020622253, mean loss: 0.34156588639435864
Epoch: 51, step: 1306, loss: 0.28383690118789673, mean loss: 0.3415651161713435
Epoch: 51, step: 1307, loss: 0.332724392414093, mean loss: 0.34156499821953756
Epoch: 51, step: 1308, loss: 0.34075453877449036, mean loss: 0.34156498740663555
Epoch: 51, step: 1309, loss: 0.35924455523490906, mean loss: 0.3415652232788749
Epoch: 51, step: 1310, loss: 0.30349838733673096, mean loss: 0.3415647154163448
Epoch: 51, step: 1311, loss: 0.30621692538261414, mean loss: 0.3415642438358171
Epoch: 51, step: 1312, loss: 0.33607611060142517, mean loss: 0.3415641706187295
Epoch: 51, step: 1313, loss: 0.3432798981666565, mean loss: 0.3415641935079148
Epoch: 51, step: 1314, loss: 0.3121703267097473, mean loss: 0.341563801375325
Epoch: 51, step: 1315, loss: 0.36565500497817993, mean loss: 0.3415641227627797
Epoch: 51, step: 1316, loss: 0.41236236691474915, mean loss: 0.3415650672304916
Epoch: 51, step: 1317, loss: 0.3588322103023529, mean loss: 0.3415652975757742
Epoch: 51, step: 1318, loss: 0.3059474527835846, mean loss: 0.34156482243677505
Epoch: 51, step: 1319, loss: 0.41106459498405457, mean loss: 0.3415657495454212
Epoch: 51, step: 1320, loss: 0.32641980051994324, mean loss: 0.3415655475051487
Epoch: 51, step: 1321, loss: 0.3181914985179901, mean loss: 0.341565235709815
Epoch: 51, step: 1322, loss: 0.29434680938720703, mean loss: 0.34156460585366066
Epoch: 51, step: 1323, loss: 0.31639981269836426, mean loss: 0.34156427017986446
Epoch: 51, step: 1324, loss: 0.31951722502708435, mean loss: 0.34156397609770844
Epoch: 51, step: 1325, loss: 0.37319979071617126, mean loss: 0.3415643980773619
Epoch: 51, step: 1326, loss: 0.3210128843784332, mean loss: 0.3415641239511838
Epoch: 51, step: 1327, loss: 0.31947389245033264, mean loss: 0.3415638293047625
Epoch: 51, step: 1328, loss: 0.397234171628952, mean loss: 0.34156457184330735
Epoch: 51, step: 1329, loss: 0.3372098505496979, mean loss: 0.3415645137602213
Epoch: 51, step: 1330, loss: 0.34091416001319885, mean loss: 0.34156450508594655
Epoch: 51, step: 1331, loss: 0.29199039936065674, mean loss: 0.3415638438862863
Epoch: 51, step: 1332, loss: 0.35345104336738586, mean loss: 0.34156400243089974
Epoch: 51, step: 1333, loss: 0.324195921421051, mean loss: 0.34156377078853783
Epoch: 51, step: 1334, loss: 0.3475605249404907, mean loss: 0.341563850767654
Epoch: 51, step: 1335, loss: 0.3260380029678345, mean loss: 0.34156364370113224
Epoch: 51, step: 1336, loss: 0.30312538146972656, mean loss: 0.34156313106110037
Epoch: 51, step: 1337, loss: 0.3559722900390625, mean loss: 0.34156332322934047
Epoch: 51, step: 1338, loss: 0.32110872864723206, mean loss: 0.34156305043958035
Epoch: 51, step: 1339, loss: 0.3489445745944977, mean loss: 0.3415631488809032
Epoch: 51, step: 1340, loss: 0.3160347044467926, mean loss: 0.34156280843355463
Epoch: 51, step: 1341, loss: 0.34011733531951904, mean loss: 0.34156278915698146
Epoch: 51, step: 1342, loss: 0.343479186296463, mean loss: 0.3415628147133731
Epoch: 51, step: 1343, loss: 0.29804059863090515, mean loss: 0.3415622343242964
Epoch: 51, step: 1344, loss: 0.31848976016044617, mean loss: 0.3415619266461814
Epoch: 51, step: 1345, loss: 0.3364855647087097, mean loss: 0.3415618589523297
Epoch: 51, step: 1346, loss: 0.3097691535949707, mean loss: 0.34156143499871716
Epoch: 51, step: 1347, loss: 0.34353938698768616, mean loss: 0.3415614613742237
Epoch: 51, step: 1348, loss: 0.3420822322368622, mean loss: 0.34156146831848333
Epoch: 51, step: 1349, loss: 0.3419407308101654, mean loss: 0.3415614733757211
Epoch: 51, step: 1350, loss: 0.321315735578537, mean loss: 0.3415612034145531
Epoch: 51, step: 1351, loss: 0.37247759103775024, mean loss: 0.3415616156550409
Epoch: 51, step: 1352, loss: 0.3273521363735199, mean loss: 0.34156142618773844
Epoch: 51, step: 1353, loss: 0.31790316104888916, mean loss: 0.3415611107357912
Epoch: 51, step: 1354, loss: 0.3214520514011383, mean loss: 0.3415608426114251
Epoch: 51, step: 1355, loss: 0.34434938430786133, mean loss: 0.3415608797919811
Epoch: 51, step: 1356, loss: 0.32844191789627075, mean loss: 0.3415607048748214
Epoch: 51, step: 1357, loss: 0.3468070924282074, mean loss: 0.3415607748247901
Epoch: 51, step: 1358, loss: 0.36017367243766785, mean loss: 0.3415610229868318
Epoch: 51, step: 1359, loss: 0.3077968657016754, mean loss: 0.34156057282207675
Epoch: 51, step: 1360, loss: 0.3328237235546112, mean loss: 0.3415604563385187
Epoch: 51, step: 1361, loss: 0.2985621988773346, mean loss: 0.34155988307428037
Epoch: 51, step: 1362, loss: 0.33419662714004517, mean loss: 0.34155978490669686
Epoch: 51, step: 1363, loss: 0.3553277552127838, mean loss: 0.34155996846005526
Epoch: 51, step: 1364, loss: 0.35788461565971375, mean loss: 0.3415601860959016
Epoch: 51, step: 1365, loss: 0.3258967995643616, mean loss: 0.34155997727859017
Epoch: 51, step: 1366, loss: 0.31024378538131714, mean loss: 0.34155955979059643
Epoch: 51, step: 1367, loss: 0.3681375980377197, mean loss: 0.341559914107749
Epoch: 51, step: 1368, loss: 0.3591701090335846, mean loss: 0.34156014886965597
Epoch: 51, step: 1369, loss: 0.31653162837028503, mean loss: 0.3415598152183309
Epoch: 51, step: 1370, loss: 0.3566645383834839, mean loss: 0.3415600165743686
Epoch: 51, step: 1371, loss: 0.4286428391933441, mean loss: 0.34156117743102077
Epoch: 51, step: 1372, loss: 0.31389835476875305, mean loss: 0.34156080867696953
Epoch: 51, step: 1373, loss: 0.31594303250312805, mean loss: 0.34156046718857774
Epoch: 51, step: 1374, loss: 0.3512510657310486, mean loss: 0.3415605963638339
Epoch: 51, step: 1375, loss: 0.3580448031425476, mean loss: 0.3415608160946627
Epoch: 51, step: 1376, loss: 0.32891327142715454, mean loss: 0.3415606475079381
Epoch: 51, step: 1377, loss: 0.3699157238006592, mean loss: 0.34156102546475464
Epoch: 51, step: 1378, loss: 0.36887601017951965, mean loss: 0.34156138955289717
Epoch: 51, step: 1379, loss: 0.3038577139377594, mean loss: 0.3415608869980398
Epoch: 51, step: 1380, loss: 0.32299286127090454, mean loss: 0.3415606395068605
Epoch: 51, step: 1381, loss: 0.3108922243118286, mean loss: 0.341560230736365
Epoch: 51, step: 1382, loss: 0.3537057340145111, mean loss: 0.34156039261813126
Epoch: 51, step: 1383, loss: 0.3220438063144684, mean loss: 0.3415601324940935
Epoch: 51, step: 1384, loss: 0.3132557272911072, mean loss: 0.34155975524789267
Epoch: 51, step: 1385, loss: 0.36113885045051575, mean loss: 0.34156001619811527
Epoch: 51, step: 1386, loss: 0.31915998458862305, mean loss: 0.3415597176544252
Epoch: 51, step: 1387, loss: 0.35030001401901245, mean loss: 0.3415598341420087
Epoch: 51, step: 1388, loss: 0.3286997079849243, mean loss: 0.34155966274907285
Epoch: 51, step: 1389, loss: 0.30815061926841736, mean loss: 0.34155921749700735
Epoch: 51, step: 1390, loss: 0.3002426028251648, mean loss: 0.34155866686577296
Epoch: 51, step: 1391, loss: 0.31099236011505127, mean loss: 0.3415582595105468
Epoch: 51, step: 1392, loss: 0.36246103048324585, mean loss: 0.3415585380767338
Epoch: 51, step: 1393, loss: 0.3875274658203125, mean loss: 0.341559150685382
Epoch: 51, step: 1394, loss: 0.35961800813674927, mean loss: 0.341559391345005
Epoch: 51, step: 1395, loss: 0.31832772493362427, mean loss: 0.3415590817545678
Epoch: 51, step: 1396, loss: 0.34252989292144775, mean loss: 0.3415590946916444
Epoch: 51, step: 1397, loss: 0.3785969614982605, mean loss: 0.3415595882534739
Epoch: 51, step: 1398, loss: 0.28519564867019653, mean loss: 0.34155883716490354
Epoch: 51, step: 1399, loss: 0.3170560598373413, mean loss: 0.3415585106527596
Epoch: 51, step: 1400, loss: 0.3331579267978668, mean loss: 0.3415583987121392
Epoch: 51, step: 1401, loss: 0.33440980315208435, mean loss: 0.34155830345595556
Epoch: 51, step: 1402, loss: 0.3617851436138153, mean loss: 0.34155857297825704
Epoch: 51, step: 1403, loss: 0.33656665682792664, mean loss: 0.34155850646194547
Epoch: 51, step: 1404, loss: 0.3223758935928345, mean loss: 0.34155825086076663
Epoch: 51, step: 1405, loss: 0.34117403626441956, mean loss: 0.3415582457413183
Epoch: 51, step: 1406, loss: 0.33312591910362244, mean loss: 0.3415581333866976
Epoch: 51, step: 1407, loss: 0.29643481969833374, mean loss: 0.341557532159366
Epoch: 51, step: 1408, loss: 0.34407737851142883, mean loss: 0.3415575657335916
Epoch: 51, step: 1409, loss: 0.35268890857696533, mean loss: 0.34155771404471214
Epoch: 51, step: 1410, loss: 0.35667291283607483, mean loss: 0.3415579154330113
Epoch: 51, step: 1411, loss: 0.3109985291957855, mean loss: 0.3415575082785368
Epoch: 51, step: 1412, loss: 0.3328493535518646, mean loss: 0.34155739225798276
Epoch: 51, step: 1413, loss: 0.33683082461357117, mean loss: 0.34155732928577937
Epoch: 51, step: 1414, loss: 0.3252236545085907, mean loss: 0.3415571116746364
Epoch: 51, step: 1415, loss: 0.30200693011283875, mean loss: 0.3415565847604137
Epoch: 51, step: 1416, loss: 0.2769230306148529, mean loss: 0.3415557236800371
Epoch: 51, step: 1417, loss: 0.36164072155952454, mean loss: 0.34155599125881037
Epoch: 51, step: 1418, loss: 0.337140828371048, mean loss: 0.3415559324393802
Epoch: 51, step: 1419, loss: 0.3235032260417938, mean loss: 0.3415556919418528
Epoch: 51, step: 1420, loss: 0.33251330256462097, mean loss: 0.34155557148106047
Epoch: 51, step: 1421, loss: 0.34259146451950073, mean loss: 0.34155558528082386
Epoch: 51, step: 1422, loss: 0.3266507089138031, mean loss: 0.34155538672651414
Epoch: 51, step: 1423, loss: 0.3673803210258484, mean loss: 0.3415557307470595
Epoch: 51, step: 1424, loss: 0.33020439743995667, mean loss: 0.3415555795350638
Epoch: 51, step: 1425, loss: 0.3211059272289276, mean loss: 0.3415553071272803
Epoch: 51, step: 1426, loss: 0.3303526043891907, mean loss: 0.34155515789917973
Epoch: 51, step: 1427, loss: 0.3610105812549591, mean loss: 0.34155541705603387
Epoch: 51, step: 1428, loss: 0.3323000967502594, mean loss: 0.3415552937717598
Epoch: 51, step: 1429, loss: 0.3817192316055298, mean loss: 0.34155582876307283
Epoch: 51, step: 1430, loss: 0.343481183052063, mean loss: 0.3415558544088176
Epoch: 51, step: 1431, loss: 0.3250785171985626, mean loss: 0.34155563493338986
Epoch: 51, step: 1432, loss: 0.31733328104019165, mean loss: 0.3415553122999083
Epoch: 51, step: 1433, loss: 0.3292364180088043, mean loss: 0.341555148218629
Epoch: 51, step: 1434, loss: 0.3069046437740326, mean loss: 0.34155468669803807
Epoch: 51, step: 1435, loss: 0.34286949038505554, mean loss: 0.3415547042100744
Epoch: 51, step: 1436, loss: 0.3494715094566345, mean loss: 0.3415548096535987
Epoch: 51, step: 1437, loss: 0.3491363525390625, mean loss: 0.3415549106304358
Epoch: 51, step: 1438, loss: 0.3291875720024109, mean loss: 0.34155474591487267
Epoch: 51, step: 1439, loss: 0.3912819027900696, mean loss: 0.3415554082018696
Epoch: 51, step: 1440, loss: 0.3384408950805664, mean loss: 0.34155536672203846
Epoch: 51, step: 1441, loss: 0.3799757659435272, mean loss: 0.3415558784072956
Epoch: 51, step: 1442, loss: 0.30432066321372986, mean loss: 0.3415553825129971
Epoch: 51, step: 1443, loss: 0.330349862575531, mean loss: 0.3415552332811633
Valid: 51, mean loss: 0.1851623331507047
Epoch: 52, step: 0, loss: 0.3515830636024475, mean loss: 0.34155536682709303
Epoch: 52, step: 1, loss: 0.33784714341163635, mean loss: 0.34155531744337464
Epoch: 52, step: 2, loss: 0.3598691523075104, mean loss: 0.3415555613319214
Epoch: 52, step: 3, loss: 0.3186495006084442, mean loss: 0.34155525629196076
Epoch: 52, step: 4, loss: 0.3248234689235687, mean loss: 0.3415550334777521
Epoch: 52, step: 5, loss: 0.3154377341270447, mean loss: 0.34155468568299685
Epoch: 52, step: 6, loss: 0.3054550290107727, mean loss: 0.34155420496315303
Epoch: 52, step: 7, loss: 0.3573871850967407, mean loss: 0.34155441579968404
Epoch: 52, step: 8, loss: 0.30323225259780884, mean loss: 0.34155390549749887
Epoch: 52, step: 9, loss: 0.319965124130249, mean loss: 0.34155361802271433
Epoch: 52, step: 10, loss: 0.3196660578250885, mean loss: 0.3415533265732916
Epoch: 52, step: 11, loss: 0.3226173520088196, mean loss: 0.3415530744298221
Epoch: 52, step: 12, loss: 0.33344197273254395, mean loss: 0.3415529664272429
Epoch: 52, step: 13, loss: 0.3561839461326599, mean loss: 0.34155316124202423
Epoch: 52, step: 14, loss: 0.33125343918800354, mean loss: 0.34155302410073757
Epoch: 52, step: 15, loss: 0.33894556760787964, mean loss: 0.3415529893827932
Epoch: 52, step: 16, loss: 0.32056286931037903, mean loss: 0.3415527099057934
Epoch: 52, step: 17, loss: 0.3447478413581848, mean loss: 0.3415527524474206
Epoch: 52, step: 18, loss: 0.34910205006599426, mean loss: 0.3415528529613224
Epoch: 52, step: 19, loss: 0.410430371761322, mean loss: 0.34155377000769294
Epoch: 52, step: 20, loss: 0.3200491666793823, mean loss: 0.3415534836957552
Epoch: 52, step: 21, loss: 0.3307535648345947, mean loss: 0.3415533399077262
Epoch: 52, step: 22, loss: 0.35623565316200256, mean loss: 0.3415535353826001
Epoch: 52, step: 23, loss: 0.35841330885887146, mean loss: 0.3415537598443835
Epoch: 52, step: 24, loss: 0.3441500961780548, mean loss: 0.34155379441012224
Epoch: 52, step: 25, loss: 0.37093183398246765, mean loss: 0.34155418552282524
Epoch: 52, step: 26, loss: 0.3353519141674042, mean loss: 0.3415541029524817
Epoch: 52, step: 27, loss: 0.30997055768966675, mean loss: 0.3415536824888619
Epoch: 52, step: 28, loss: 0.4304155111312866, mean loss: 0.3415548654677967
Epoch: 52, step: 29, loss: 0.3417589068412781, mean loss: 0.3415548681840747
Epoch: 52, step: 30, loss: 0.3092299997806549, mean loss: 0.34155443786859657
Epoch: 52, step: 31, loss: 0.35091811418533325, mean loss: 0.3415545625181748
Epoch: 52, step: 32, loss: 0.32045847177505493, mean loss: 0.34155428169003427
Epoch: 52, step: 33, loss: 0.3001345694065094, mean loss: 0.3415537303240924
Epoch: 52, step: 34, loss: 0.30474603176116943, mean loss: 0.34155324035832213
Epoch: 52, step: 35, loss: 0.34743162989616394, mean loss: 0.34155331860747734
Epoch: 52, step: 36, loss: 0.31112903356552124, mean loss: 0.3415529136253137
Epoch: 52, step: 37, loss: 0.3295729160308838, mean loss: 0.3415527541599143
Epoch: 52, step: 38, loss: 0.3499196171760559, mean loss: 0.34155286552950204
Epoch: 52, step: 39, loss: 0.36858129501342773, mean loss: 0.3415532252945628
Epoch: 52, step: 40, loss: 0.3634081482887268, mean loss: 0.3415535161931904
Epoch: 52, step: 41, loss: 0.33529868721961975, mean loss: 0.3415534329397767
Epoch: 52, step: 42, loss: 0.3026306629180908, mean loss: 0.34155291487439726
Epoch: 52, step: 43, loss: 0.31339913606643677, mean loss: 0.34155254015019443
Epoch: 52, step: 44, loss: 0.3687254786491394, mean loss: 0.3415529018146894
Epoch: 52, step: 45, loss: 0.3078494668006897, mean loss: 0.34155245323701466
Epoch: 52, step: 46, loss: 0.3371613621711731, mean loss: 0.34155239479433064
Epoch: 52, step: 47, loss: 0.37247925996780396, mean loss: 0.34155280640614355
Epoch: 52, step: 48, loss: 0.3477616310119629, mean loss: 0.34155288903952796
Epoch: 52, step: 49, loss: 0.3109516203403473, mean loss: 0.3415524817719843
Epoch: 52, step: 50, loss: 0.3510780930519104, mean loss: 0.34155260854518166
Epoch: 52, step: 51, loss: 0.30626243352890015, mean loss: 0.3415521388862115
Epoch: 52, step: 52, loss: 0.3453451097011566, mean loss: 0.34155218936425696
Epoch: 52, step: 53, loss: 0.3351065516471863, mean loss: 0.3415521035848298
Epoch: 52, step: 54, loss: 0.34152525663375854, mean loss: 0.34155210322755164
Epoch: 52, step: 55, loss: 0.3032391667366028, mean loss: 0.34155159336733004
Epoch: 52, step: 56, loss: 0.3158952295780182, mean loss: 0.3415512519425674
Epoch: 52, step: 57, loss: 0.32439273595809937, mean loss: 0.3415510236068478
Epoch: 52, step: 58, loss: 0.33466199040412903, mean loss: 0.341550931932753
Epoch: 52, step: 59, loss: 0.32635313272476196, mean loss: 0.34155072969451367
Epoch: 52, step: 60, loss: 0.343622624874115, mean loss: 0.34155075726500933
Epoch: 52, step: 61, loss: 0.3076992928981781, mean loss: 0.34155030681305504
Epoch: 52, step: 62, loss: 0.32236528396606445, mean loss: 0.3415500515267269
Epoch: 52, step: 63, loss: 0.39868712425231934, mean loss: 0.3415508118135154
Epoch: 52, step: 64, loss: 0.29044482111930847, mean loss: 0.34155013178755905
Epoch: 52, step: 65, loss: 0.3735199570655823, mean loss: 0.34155055717842686
Epoch: 52, step: 66, loss: 0.4248920679092407, mean loss: 0.34155166610678467
Epoch: 52, step: 67, loss: 0.321328729391098, mean loss: 0.34155139702731374
Epoch: 52, step: 68, loss: 0.3479602634906769, mean loss: 0.3415514823003617
Epoch: 52, step: 69, loss: 0.3794732987880707, mean loss: 0.3415519868616391
Epoch: 52, step: 70, loss: 0.28985294699668884, mean loss: 0.3415512989993756
Epoch: 52, step: 71, loss: 0.3410360515117645, mean loss: 0.3415512921440338
Epoch: 52, step: 72, loss: 0.35839447379112244, mean loss: 0.3415515162387325
Epoch: 52, step: 73, loss: 0.3382212519645691, mean loss: 0.34155147193091373
Epoch: 52, step: 74, loss: 0.3202509880065918, mean loss: 0.34155118854036354
Epoch: 52, step: 75, loss: 0.2979099750518799, mean loss: 0.34155060792712466
Epoch: 52, step: 76, loss: 0.3364872634410858, mean loss: 0.3415505405640636
Epoch: 52, step: 77, loss: 0.3237079083919525, mean loss: 0.3415503031876943
Epoch: 52, step: 78, loss: 0.3699280321598053, mean loss: 0.3415506807167825
Epoch: 52, step: 79, loss: 0.3386133909225464, mean loss: 0.34155064164044957
Epoch: 52, step: 80, loss: 0.32044801115989685, mean loss: 0.34155036090463453
Epoch: 52, step: 81, loss: 0.32246968150138855, mean loss: 0.3415501070709322
Epoch: 52, step: 82, loss: 0.3612443506717682, mean loss: 0.34155036906350383
Epoch: 52, step: 83, loss: 0.30415666103363037, mean loss: 0.3415498716215304
Epoch: 52, step: 84, loss: 0.3211032450199127, mean loss: 0.3415495996272425
Epoch: 52, step: 85, loss: 0.42118221521377563, mean loss: 0.34155065893784975
Epoch: 52, step: 86, loss: 0.3536602556705475, mean loss: 0.3415508200232735
Epoch: 52, step: 87, loss: 0.34651029109954834, mean loss: 0.3415508859947415
Epoch: 52, step: 88, loss: 0.36159080266952515, mean loss: 0.3415511525645258
Epoch: 52, step: 89, loss: 0.34117391705513, mean loss: 0.34155114754662813
Epoch: 52, step: 90, loss: 0.30440711975097656, mean loss: 0.3415506534721154
Epoch: 52, step: 91, loss: 0.32647505402565, mean loss: 0.34155045294538694
Epoch: 52, step: 92, loss: 0.2942584156990051, mean loss: 0.34154982390297933
Epoch: 52, step: 93, loss: 0.3334331512451172, mean loss: 0.3415497159426609
Epoch: 52, step: 94, loss: 0.330474853515625, mean loss: 0.3415495686372538
Epoch: 52, step: 95, loss: 0.30461984872817993, mean loss: 0.34154907744604407
Epoch: 52, step: 96, loss: 0.3885655701160431, mean loss: 0.34154970279009766
Epoch: 52, step: 97, loss: 0.3224366307258606, mean loss: 0.3415494485795789
Epoch: 52, step: 98, loss: 0.30177170038223267, mean loss: 0.34154891952870314
Epoch: 52, step: 99, loss: 0.36361244320869446, mean loss: 0.3415492129734507
Epoch: 52, step: 100, loss: 0.2857019305229187, mean loss: 0.3415484702147699
Epoch: 52, step: 101, loss: 0.36891627311706543, mean loss: 0.341548834196721
Epoch: 52, step: 102, loss: 0.326978862285614, mean loss: 0.34154864042390365
Epoch: 52, step: 103, loss: 0.3091428577899933, mean loss: 0.3415482094500948
Epoch: 52, step: 104, loss: 0.29460394382476807, mean loss: 0.3415475851331288
Epoch: 52, step: 105, loss: 0.348428338766098, mean loss: 0.3415476766398133
Epoch: 52, step: 106, loss: 0.32554662227630615, mean loss: 0.3415474638456865
Epoch: 52, step: 107, loss: 0.34358319640159607, mean loss: 0.3415474909180382
Epoch: 52, step: 108, loss: 0.35269811749458313, mean loss: 0.34154763920356257
Epoch: 52, step: 109, loss: 0.30645450949668884, mean loss: 0.3415471725271921
Epoch: 52, step: 110, loss: 0.3363015353679657, mean loss: 0.3415471027704512
Epoch: 52, step: 111, loss: 0.33455929160118103, mean loss: 0.3415470098474303
Epoch: 52, step: 112, loss: 0.35316693782806396, mean loss: 0.34154716436569443
Epoch: 52, step: 113, loss: 0.3217425048351288, mean loss: 0.34154690101286433
Epoch: 52, step: 114, loss: 0.33518514037132263, mean loss: 0.34154681641835827
Epoch: 52, step: 115, loss: 0.2993108928203583, mean loss: 0.34154625480031137
Epoch: 52, step: 116, loss: 0.3428093194961548, mean loss: 0.34154627159526774
Epoch: 52, step: 117, loss: 0.34427306056022644, mean loss: 0.3415463078528664
Epoch: 52, step: 118, loss: 0.3046042323112488, mean loss: 0.3415458166475857
Epoch: 52, step: 119, loss: 0.3171750605106354, mean loss: 0.3415454926028546
Epoch: 52, step: 120, loss: 0.3301287293434143, mean loss: 0.3415453408023619
Epoch: 52, step: 121, loss: 0.31398388743400574, mean loss: 0.34154497434240483
Epoch: 52, step: 122, loss: 0.3197951912879944, mean loss: 0.3415446851588671
Epoch: 52, step: 123, loss: 0.3408876061439514, mean loss: 0.34154467642250835
Epoch: 52, step: 124, loss: 0.32758763432502747, mean loss: 0.34154449085562366
Epoch: 52, step: 125, loss: 0.3496209681034088, mean loss: 0.34154459823559613
Epoch: 52, step: 126, loss: 0.3102772831916809, mean loss: 0.34154418252975227
Epoch: 52, step: 127, loss: 0.32508519291877747, mean loss: 0.34154396370676765
Epoch: 52, step: 128, loss: 0.34047839045524597, mean loss: 0.34154394954011313
Epoch: 52, step: 129, loss: 0.3489070236682892, mean loss: 0.34154404742990185
Epoch: 52, step: 130, loss: 0.3134750723838806, mean loss: 0.34154367426653826
Epoch: 52, step: 131, loss: 0.29755645990371704, mean loss: 0.3415430894857039
Epoch: 52, step: 132, loss: 0.33872896432876587, mean loss: 0.34154305207427416
Epoch: 52, step: 133, loss: 0.32872334122657776, mean loss: 0.3415428816492542
Epoch: 52, step: 134, loss: 0.3451041579246521, mean loss: 0.34154292899217165
Epoch: 52, step: 135, loss: 0.32030412554740906, mean loss: 0.34154264665138356
Epoch: 52, step: 136, loss: 0.285683810710907, mean loss: 0.3415419040945748
Epoch: 52, step: 137, loss: 0.34805142879486084, mean loss: 0.34154199062748497
Epoch: 52, step: 138, loss: 0.3173832595348358, mean loss: 0.3415416694830675
Epoch: 52, step: 139, loss: 0.3690505921840668, mean loss: 0.3415420351570546
Epoch: 52, step: 140, loss: 0.320747047662735, mean loss: 0.3415417587345647
Epoch: 52, step: 141, loss: 0.3336033523082733, mean loss: 0.34154165321274593
Epoch: 52, step: 142, loss: 0.35151025652885437, mean loss: 0.3415417857193365
Epoch: 52, step: 143, loss: 0.32879769802093506, mean loss: 0.3415416163221691
Epoch: 52, step: 144, loss: 0.3180903196334839, mean loss: 0.3415413046066096
Epoch: 52, step: 145, loss: 0.3251255452632904, mean loss: 0.34154108641058994
Epoch: 52, step: 146, loss: 0.31873902678489685, mean loss: 0.3415407833327721
Epoch: 52, step: 147, loss: 0.35378870368003845, mean loss: 0.34154094612612035
Epoch: 52, step: 148, loss: 0.30828672647476196, mean loss: 0.34154050413322257
Epoch: 52, step: 149, loss: 0.3077116012573242, mean loss: 0.34154005450799496
Epoch: 52, step: 150, loss: 0.29765385389328003, mean loss: 0.34153947121740613
Epoch: 52, step: 151, loss: 0.3588750660419464, mean loss: 0.34153970162137776
Epoch: 52, step: 152, loss: 0.3274839520454407, mean loss: 0.3415395148116653
Epoch: 52, step: 153, loss: 0.3306340277194977, mean loss: 0.34153936987284
Epoch: 52, step: 154, loss: 0.2913956046104431, mean loss: 0.341538703448518
Epoch: 52, step: 155, loss: 0.31926557421684265, mean loss: 0.3415384074364874
Epoch: 52, step: 156, loss: 0.3659965693950653, mean loss: 0.3415387324834933
Epoch: 52, step: 157, loss: 0.31995612382888794, mean loss: 0.34153844565617153
Epoch: 52, step: 158, loss: 0.3104710578918457, mean loss: 0.34153803278406014
Epoch: 52, step: 159, loss: 0.335985004901886, mean loss: 0.34153795898770833
Epoch: 52, step: 160, loss: 0.32483530044555664, mean loss: 0.3415377370225189
Epoch: 52, step: 161, loss: 0.3372856676578522, mean loss: 0.3415376805166137
Epoch: 52, step: 162, loss: 0.360939085483551, mean loss: 0.3415379383391671
Epoch: 52, step: 163, loss: 0.42413175106048584, mean loss: 0.34153903590219165
Epoch: 52, step: 164, loss: 0.3533746600151062, mean loss: 0.3415391931799628
Epoch: 52, step: 165, loss: 0.3558535873889923, mean loss: 0.34153938339435946
Epoch: 52, step: 166, loss: 0.3275498151779175, mean loss: 0.34153919749882805
Epoch: 52, step: 167, loss: 0.3006364107131958, mean loss: 0.34153865398353644
Epoch: 52, step: 168, loss: 0.3208765983581543, mean loss: 0.341538379430264
Epoch: 52, step: 169, loss: 0.3362780511379242, mean loss: 0.341538309533
Epoch: 52, step: 170, loss: 0.3381844758987427, mean loss: 0.34153826496911216
Epoch: 52, step: 171, loss: 0.34368935227394104, mean loss: 0.3415382935511917
Epoch: 52, step: 172, loss: 0.3341861665248871, mean loss: 0.341538195862787
Epoch: 52, step: 173, loss: 0.3320031464099884, mean loss: 0.34153806917136964
Epoch: 52, step: 174, loss: 0.3145642578601837, mean loss: 0.34153771077732065
Epoch: 52, step: 175, loss: 0.36672675609588623, mean loss: 0.34153804545319916
Epoch: 52, step: 176, loss: 0.35180121660232544, mean loss: 0.3415381818136741
Epoch: 52, step: 177, loss: 0.32090210914611816, mean loss: 0.3415379076384467
Epoch: 52, step: 178, loss: 0.3371875286102295, mean loss: 0.34153784983915847
Epoch: 52, step: 179, loss: 0.34142956137657166, mean loss: 0.34153784840045326
Epoch: 52, step: 180, loss: 0.3220902979373932, mean loss: 0.3415375900264817
Epoch: 52, step: 181, loss: 0.3404383361339569, mean loss: 0.34153757542233804
Epoch: 52, step: 182, loss: 0.32909590005874634, mean loss: 0.34153741013058736
Epoch: 52, step: 183, loss: 0.3271224796772003, mean loss: 0.3415372186260378
Epoch: 52, step: 184, loss: 0.30208396911621094, mean loss: 0.3415366944905641
Epoch: 52, step: 185, loss: 0.3263612985610962, mean loss: 0.3415364928884714
Epoch: 52, step: 186, loss: 0.35860008001327515, mean loss: 0.3415367195717942
Epoch: 52, step: 187, loss: 0.3848220109939575, mean loss: 0.34153729459293536
Epoch: 52, step: 188, loss: 0.3249639868736267, mean loss: 0.34153707442863923
Epoch: 52, step: 189, loss: 0.301079124212265, mean loss: 0.34153653698144065
Epoch: 52, step: 190, loss: 0.310663640499115, mean loss: 0.34153612686844126
Epoch: 52, step: 191, loss: 0.3323286175727844, mean loss: 0.34153600455827526
Epoch: 52, step: 192, loss: 0.3339228332042694, mean loss: 0.3415359034282245
Epoch: 52, step: 193, loss: 0.3602942228317261, mean loss: 0.3415361526022555
Epoch: 52, step: 194, loss: 0.38138002157211304, mean loss: 0.341536681856788
Epoch: 52, step: 195, loss: 0.35304805636405945, mean loss: 0.3415368347627774
Epoch: 52, step: 196, loss: 0.3356512784957886, mean loss: 0.3415367565857665
Epoch: 52, step: 197, loss: 0.3461001217365265, mean loss: 0.3415368171994948
Epoch: 52, step: 198, loss: 0.2952711284160614, mean loss: 0.3415362026752239
Epoch: 52, step: 199, loss: 0.37346526980400085, mean loss: 0.3415366267676042
Epoch: 52, step: 200, loss: 0.3397330641746521, mean loss: 0.34153660281241033
Epoch: 52, step: 201, loss: 0.31069594621658325, mean loss: 0.34153619318753853
Epoch: 52, step: 202, loss: 0.3695579469203949, mean loss: 0.34153656536686583
Epoch: 52, step: 203, loss: 0.3450762629508972, mean loss: 0.3415366123797966
Epoch: 52, step: 204, loss: 0.30999431014060974, mean loss: 0.3415361934523765
Epoch: 52, step: 205, loss: 0.314134418964386, mean loss: 0.34153582952199046
Epoch: 52, step: 206, loss: 0.3185792863368988, mean loss: 0.3415355246339742
Epoch: 52, step: 207, loss: 0.30863961577415466, mean loss: 0.34153508774610686
Epoch: 52, step: 208, loss: 0.3000395894050598, mean loss: 0.34153453665511596
Epoch: 52, step: 209, loss: 0.31857767701148987, mean loss: 0.3415342317750442
Epoch: 52, step: 210, loss: 0.34733930230140686, mean loss: 0.3415343088686381
Epoch: 52, step: 211, loss: 0.3216714859008789, mean loss: 0.34153404508612856
Epoch: 52, step: 212, loss: 0.3208794891834259, mean loss: 0.3415337707928801
Epoch: 52, step: 213, loss: 0.32204094529151917, mean loss: 0.34153351193089104
Epoch: 52, step: 214, loss: 0.32389000058174133, mean loss: 0.34153327763064606
Epoch: 52, step: 215, loss: 0.35992592573165894, mean loss: 0.34153352187594643
Epoch: 52, step: 216, loss: 0.3192906975746155, mean loss: 0.34153322650612633
Epoch: 52, step: 217, loss: 0.359076589345932, mean loss: 0.34153345946714986
Epoch: 52, step: 218, loss: 0.299027681350708, mean loss: 0.34153289503385525
Epoch: 52, step: 219, loss: 0.31914809346199036, mean loss: 0.3415325977905136
Epoch: 52, step: 220, loss: 0.3609844744205475, mean loss: 0.34153285608469663
Epoch: 52, step: 221, loss: 0.304320752620697, mean loss: 0.3415323619656757
Epoch: 52, step: 222, loss: 0.34334293007850647, mean loss: 0.34153238600689295
Epoch: 52, step: 223, loss: 0.3537868857383728, mean loss: 0.34153254872332234
Epoch: 52, step: 224, loss: 0.3239465653896332, mean loss: 0.34153231521803995
Epoch: 52, step: 225, loss: 0.34833088517189026, mean loss: 0.3415324054877103
Epoch: 52, step: 226, loss: 0.32655760645866394, mean loss: 0.3415322066588046
Epoch: 52, step: 227, loss: 0.3683740198612213, mean loss: 0.34153256304806057
Epoch: 52, step: 228, loss: 0.33318406343460083, mean loss: 0.3415324522032365
Epoch: 52, step: 229, loss: 0.33297640085220337, mean loss: 0.3415323386042117
Epoch: 52, step: 230, loss: 0.3630881905555725, mean loss: 0.3415326247982923
Epoch: 52, step: 231, loss: 0.33871108293533325, mean loss: 0.34153258733756653
Epoch: 52, step: 232, loss: 0.3277064561843872, mean loss: 0.3415324037747998
Epoch: 52, step: 233, loss: 0.315264493227005, mean loss: 0.34153205503325623
Epoch: 52, step: 234, loss: 0.39058786630630493, mean loss: 0.3415327063059256
Epoch: 52, step: 235, loss: 0.3638603091239929, mean loss: 0.3415330027267585
Epoch: 52, step: 236, loss: 0.3296106159687042, mean loss: 0.3415328444474786
Epoch: 52, step: 237, loss: 0.3104134202003479, mean loss: 0.34153243131756
Epoch: 52, step: 238, loss: 0.36490917205810547, mean loss: 0.3415327416543681
Epoch: 52, step: 239, loss: 0.3246331512928009, mean loss: 0.3415325173076396
Epoch: 52, step: 240, loss: 0.34136879444122314, mean loss: 0.3415325151342022
Epoch: 52, step: 241, loss: 0.29634395241737366, mean loss: 0.3415319152594814
Epoch: 52, step: 242, loss: 0.3357395827770233, mean loss: 0.34153183836773054
Epoch: 52, step: 243, loss: 0.33075764775276184, mean loss: 0.34153169534496974
Epoch: 52, step: 244, loss: 0.3320358395576477, mean loss: 0.341531569293229
Epoch: 52, step: 245, loss: 0.37107324600219727, mean loss: 0.3415319614359097
Epoch: 52, step: 246, loss: 0.3500666320323944, mean loss: 0.34153207472549085
Epoch: 52, step: 247, loss: 0.3390333950519562, mean loss: 0.34153204155835065
Epoch: 52, step: 248, loss: 0.31882986426353455, mean loss: 0.341531740216682
Epoch: 52, step: 249, loss: 0.344411700963974, mean loss: 0.3415317784438814
Epoch: 52, step: 250, loss: 0.32684189081192017, mean loss: 0.3415315834600399
Epoch: 52, step: 251, loss: 0.35160407423973083, mean loss: 0.34153171715383845
Epoch: 52, step: 252, loss: 0.32180505990982056, mean loss: 0.341531455322203
Epoch: 52, step: 253, loss: 0.3362426459789276, mean loss: 0.34153138512484504
Epoch: 52, step: 254, loss: 0.33568304777145386, mean loss: 0.3415313075020088
Epoch: 52, step: 255, loss: 0.2843899428844452, mean loss: 0.34153054909570413
Epoch: 52, step: 256, loss: 0.2901873290538788, mean loss: 0.34152986765406845
Epoch: 52, step: 257, loss: 0.31738415360450745, mean loss: 0.34152954718962375
Epoch: 52, step: 258, loss: 0.31448692083358765, mean loss: 0.3415291882818191
Epoch: 52, step: 259, loss: 0.3556090295314789, mean loss: 0.341529375145986
Epoch: 52, step: 260, loss: 0.29666197299957275, mean loss: 0.34152877968483664
Epoch: 52, step: 261, loss: 0.318448007106781, mean loss: 0.3415284733706684
Epoch: 52, step: 262, loss: 0.29437875747680664, mean loss: 0.341527847636227
Epoch: 52, step: 263, loss: 0.37311607599258423, mean loss: 0.34152826684511806
Epoch: 52, step: 264, loss: 0.34699636697769165, mean loss: 0.3415283394115737
Epoch: 52, step: 265, loss: 0.32951149344444275, mean loss: 0.34152817993966816
Epoch: 52, step: 266, loss: 0.33815911412239075, mean loss: 0.3415281352304144
Epoch: 52, step: 267, loss: 0.34737521409988403, mean loss: 0.3415282128231591
Epoch: 52, step: 268, loss: 0.37218132615089417, mean loss: 0.34152861959510233
Epoch: 52, step: 269, loss: 0.3299119174480438, mean loss: 0.34152846544156656
Epoch: 52, step: 270, loss: 0.39139729738235474, mean loss: 0.3415291271917482
Epoch: 52, step: 271, loss: 0.3644174635410309, mean loss: 0.3415294309117104
Epoch: 52, step: 272, loss: 0.30419808626174927, mean loss: 0.3415289355448144
Epoch: 52, step: 273, loss: 0.31810182332992554, mean loss: 0.34152862468374096
Epoch: 52, step: 274, loss: 0.3473050892353058, mean loss: 0.34152870133228935
Epoch: 52, step: 275, loss: 0.3473266661167145, mean loss: 0.34152877826510586
Epoch: 52, step: 276, loss: 0.34424132108688354, mean loss: 0.34152881425718207
Epoch: 52, step: 277, loss: 0.3456677496433258, mean loss: 0.3415288691749883
Epoch: 52, step: 278, loss: 0.2819291949272156, mean loss: 0.34152807838227733
Epoch: 52, step: 279, loss: 0.33341702818870544, mean loss: 0.34152797076299335
Epoch: 52, step: 280, loss: 0.30780553817749023, mean loss: 0.34152752333191977
Epoch: 52, step: 281, loss: 0.3285515308380127, mean loss: 0.3415273511680284
Epoch: 52, step: 282, loss: 0.33618035912513733, mean loss: 0.3415272802257291
Epoch: 52, step: 283, loss: 0.33456045389175415, mean loss: 0.34152718779317676
Epoch: 52, step: 284, loss: 0.3085435628890991, mean loss: 0.34152675018786843
Epoch: 52, step: 285, loss: 0.336012065410614, mean loss: 0.34152667702358397
Epoch: 52, step: 286, loss: 0.3320900797843933, mean loss: 0.341526551828264
Epoch: 52, step: 287, loss: 0.30439379811286926, mean loss: 0.3415260591946178
Epoch: 52, step: 288, loss: 0.3683096766471863, mean loss: 0.3415264145233978
Epoch: 52, step: 289, loss: 0.3658754229545593, mean loss: 0.3415267375487956
Epoch: 52, step: 290, loss: 0.27985912561416626, mean loss: 0.3415259194481053
Epoch: 52, step: 291, loss: 0.3183324337005615, mean loss: 0.3415256117605788
Epoch: 52, step: 292, loss: 0.32167020440101624, mean loss: 0.34152534835988946
Epoch: 52, step: 293, loss: 0.3162495791912079, mean loss: 0.34152501305744104
Epoch: 52, step: 294, loss: 0.3389208912849426, mean loss: 0.3415249785122283
Epoch: 52, step: 295, loss: 0.3174624443054199, mean loss: 0.34152465931274023
Epoch: 52, step: 296, loss: 0.34902113676071167, mean loss: 0.3415247587553011
Epoch: 52, step: 297, loss: 0.39310774207115173, mean loss: 0.3415254430067976
Epoch: 52, step: 298, loss: 0.3121105134487152, mean loss: 0.3415250528210951
Epoch: 52, step: 299, loss: 0.41019248962402344, mean loss: 0.34152596367476945
Epoch: 52, step: 300, loss: 0.31379199028015137, mean loss: 0.34152559579651937
Epoch: 52, step: 301, loss: 0.343325674533844, mean loss: 0.3415256196734094
Epoch: 52, step: 302, loss: 0.31507259607315063, mean loss: 0.34152526879567063
Epoch: 52, step: 303, loss: 0.29445087909698486, mean loss: 0.341524644400646
Epoch: 52, step: 304, loss: 0.33058688044548035, mean loss: 0.3415244993239949
Epoch: 52, step: 305, loss: 0.37055328488349915, mean loss: 0.3415248843517897
Epoch: 52, step: 306, loss: 0.3576430380344391, mean loss: 0.34152509813458276
Epoch: 52, step: 307, loss: 0.2905746102333069, mean loss: 0.341524422362819
Epoch: 52, step: 308, loss: 0.34187552332878113, mean loss: 0.34152442701951574
Epoch: 52, step: 309, loss: 0.34950926899909973, mean loss: 0.34152453292208584
Epoch: 52, step: 310, loss: 0.3573983609676361, mean loss: 0.34152474345310146
Epoch: 52, step: 311, loss: 0.319161057472229, mean loss: 0.3415244468524916
Epoch: 52, step: 312, loss: 0.29917654395103455, mean loss: 0.3415238852166658
Epoch: 52, step: 313, loss: 0.26969605684280396, mean loss: 0.3415229326182152
Epoch: 52, step: 314, loss: 0.34832507371902466, mean loss: 0.3415230228286989
Epoch: 52, step: 315, loss: 0.328997403383255, mean loss: 0.34152285671523747
Epoch: 52, step: 316, loss: 0.3545372188091278, mean loss: 0.3415230293080641
Epoch: 52, step: 317, loss: 0.32145968079566956, mean loss: 0.34152276323708153
Epoch: 52, step: 318, loss: 0.3628518283367157, mean loss: 0.3415230460896695
Epoch: 52, step: 319, loss: 0.30856677889823914, mean loss: 0.34152260905026793
Epoch: 52, step: 320, loss: 0.33433011174201965, mean loss: 0.3415225136704418
Epoch: 52, step: 321, loss: 0.3540421426296234, mean loss: 0.3415226796912475
Epoch: 52, step: 322, loss: 0.3514183759689331, mean loss: 0.34152281091475967
Epoch: 52, step: 323, loss: 0.32795432209968567, mean loss: 0.34152263098996233
Epoch: 52, step: 324, loss: 0.35307326912879944, mean loss: 0.3415227841550418
Epoch: 52, step: 325, loss: 0.34481558203697205, mean loss: 0.34152282781799403
Epoch: 52, step: 326, loss: 0.320186585187912, mean loss: 0.3415225449002372
Epoch: 52, step: 327, loss: 0.32496729493141174, mean loss: 0.34152232538117006
Epoch: 52, step: 328, loss: 0.3207048177719116, mean loss: 0.34152204934914004
Epoch: 52, step: 329, loss: 0.3202770948410034, mean loss: 0.3415217676530661
Epoch: 52, step: 330, loss: 0.41216710209846497, mean loss: 0.3415227043578016
Epoch: 52, step: 331, loss: 0.3648533225059509, mean loss: 0.34152301370039173
Epoch: 52, step: 332, loss: 0.34269192814826965, mean loss: 0.3415230291989193
Epoch: 52, step: 333, loss: 0.3537200391292572, mean loss: 0.3415231909157914
Epoch: 52, step: 334, loss: 0.30422326922416687, mean loss: 0.3415226963727251
Epoch: 52, step: 335, loss: 0.31821712851524353, mean loss: 0.34152238737866675
Epoch: 52, step: 336, loss: 0.33690741658210754, mean loss: 0.3415223261924447
Epoch: 52, step: 337, loss: 0.3283516466617584, mean loss: 0.3415221515752102
Epoch: 52, step: 338, loss: 0.3234521448612213, mean loss: 0.34152191200573623
Epoch: 52, step: 339, loss: 0.36951884627342224, mean loss: 0.3415222831800252
Epoch: 52, step: 340, loss: 0.3505091369152069, mean loss: 0.3415224023232425
Epoch: 52, step: 341, loss: 0.3299650251865387, mean loss: 0.34152224910334145
Epoch: 52, step: 342, loss: 0.3343360722064972, mean loss: 0.3415221538351242
Epoch: 52, step: 343, loss: 0.2885105013847351, mean loss: 0.34152145106107007
Epoch: 52, step: 344, loss: 0.31843069195747375, mean loss: 0.3415211449515543
Epoch: 52, step: 345, loss: 0.31084656715393066, mean loss: 0.3415207383102811
Epoch: 52, step: 346, loss: 0.41009700298309326, mean loss: 0.341521647387827
Epoch: 52, step: 347, loss: 0.3571373224258423, mean loss: 0.3415218543934349
Epoch: 52, step: 348, loss: 0.30383002758026123, mean loss: 0.34152135474701717
Epoch: 52, step: 349, loss: 0.3395613431930542, mean loss: 0.3415213287652632
Epoch: 52, step: 350, loss: 0.3287341594696045, mean loss: 0.3415211592618327
Epoch: 52, step: 351, loss: 0.35308581590652466, mean loss: 0.34152131255791757
Epoch: 52, step: 352, loss: 0.32231763005256653, mean loss: 0.3415210580055852
Epoch: 52, step: 353, loss: 0.31412169337272644, mean loss: 0.3415206948210907
Epoch: 52, step: 354, loss: 0.3540290296077728, mean loss: 0.3415208606195715
Epoch: 52, step: 355, loss: 0.31136834621429443, mean loss: 0.34152046095207766
Epoch: 52, step: 356, loss: 0.34289559721946716, mean loss: 0.341520479179081
Epoch: 52, step: 357, loss: 0.30051982402801514, mean loss: 0.34151993573535766
Epoch: 52, step: 358, loss: 0.3372851312160492, mean loss: 0.3415198796058294
Epoch: 52, step: 359, loss: 0.36286765336990356, mean loss: 0.3415201625526771
Epoch: 52, step: 360, loss: 0.3554501533508301, mean loss: 0.341520347180582
Epoch: 52, step: 361, loss: 0.3341469466686249, mean loss: 0.3415202494549291
Epoch: 52, step: 362, loss: 0.31781113147735596, mean loss: 0.3415199352229378
Epoch: 52, step: 363, loss: 0.3359004557132721, mean loss: 0.34151986074539564
Epoch: 52, step: 364, loss: 0.3053336441516876, mean loss: 0.3415193811592083
Epoch: 52, step: 365, loss: 0.322327196598053, mean loss: 0.34151912680311636
Epoch: 52, step: 366, loss: 0.3987372815608978, mean loss: 0.3415198851114426
Epoch: 52, step: 367, loss: 0.3010391891002655, mean loss: 0.34151934863063244
Epoch: 52, step: 368, loss: 0.3323404788970947, mean loss: 0.34151922698691833
Epoch: 52, step: 369, loss: 0.32665637135505676, mean loss: 0.3415190300183314
Epoch: 52, step: 370, loss: 0.28811269998550415, mean loss: 0.34151832226537904
Epoch: 52, step: 371, loss: 0.30810925364494324, mean loss: 0.3415178795265953
Epoch: 52, step: 372, loss: 0.35592973232269287, mean loss: 0.34151807051071686
Epoch: 52, step: 373, loss: 0.31126531958580017, mean loss: 0.3415176696102514
Epoch: 52, step: 374, loss: 0.33955347537994385, mean loss: 0.341517643581678
Epoch: 52, step: 375, loss: 0.31535327434539795, mean loss: 0.34151729686842086
Epoch: 52, step: 376, loss: 0.3730365037918091, mean loss: 0.3415177145349805
Epoch: 52, step: 377, loss: 0.3756730258464813, mean loss: 0.34151816712702604
Epoch: 52, step: 378, loss: 0.30591216683387756, mean loss: 0.34151769531815207
Epoch: 52, step: 379, loss: 0.3563675582408905, mean loss: 0.34151789208847755
Epoch: 52, step: 380, loss: 0.31985530257225037, mean loss: 0.34151760504890477
Epoch: 52, step: 381, loss: 0.31129640340805054, mean loss: 0.3415172046089731
Epoch: 52, step: 382, loss: 0.3349817097187042, mean loss: 0.34151711801286483
Epoch: 52, step: 383, loss: 0.3106565475463867, mean loss: 0.34151670911194176
Epoch: 52, step: 384, loss: 0.3456103205680847, mean loss: 0.34151676335135794
Epoch: 52, step: 385, loss: 0.33518749475479126, mean loss: 0.34151667949110676
Epoch: 52, step: 386, loss: 0.3136730194091797, mean loss: 0.3415163105787506
Epoch: 52, step: 387, loss: 0.38507431745529175, mean loss: 0.3415168876894464
Epoch: 52, step: 388, loss: 0.3249971866607666, mean loss: 0.3415166688187834
Epoch: 52, step: 389, loss: 0.35716286301612854, mean loss: 0.3415168761135474
Epoch: 52, step: 390, loss: 0.37325069308280945, mean loss: 0.3415172965459454
Epoch: 52, step: 391, loss: 0.31501930952072144, mean loss: 0.3415169454862339
Epoch: 52, step: 392, loss: 0.34748172760009766, mean loss: 0.34151702450985727
Epoch: 52, step: 393, loss: 0.2897353768348694, mean loss: 0.34151633849666635
Epoch: 52, step: 394, loss: 0.3362392485141754, mean loss: 0.34151626858569323
Epoch: 52, step: 395, loss: 0.3261186182498932, mean loss: 0.34151606460007594
Epoch: 52, step: 396, loss: 0.31615766882896423, mean loss: 0.3415157286605413
Epoch: 52, step: 397, loss: 0.30862972140312195, mean loss: 0.34151529300350214
Epoch: 52, step: 398, loss: 0.3275880515575409, mean loss: 0.3415151085049601
Epoch: 52, step: 399, loss: 0.3368973433971405, mean loss: 0.3415150473327856
Epoch: 52, step: 400, loss: 0.3431415259838104, mean loss: 0.3415150688786883
Epoch: 52, step: 401, loss: 0.34868869185447693, mean loss: 0.3415151639061486
Epoch: 52, step: 402, loss: 0.31392142176628113, mean loss: 0.34151479838254795
Epoch: 52, step: 403, loss: 0.2926967144012451, mean loss: 0.34151415171688826
Epoch: 52, step: 404, loss: 0.3410502076148987, mean loss: 0.3415141455713635
Epoch: 52, step: 405, loss: 0.3124409019947052, mean loss: 0.3415137604646851
Epoch: 52, step: 406, loss: 0.32929977774620056, mean loss: 0.3415135986793653
Epoch: 52, step: 407, loss: 0.32723721861839294, mean loss: 0.3415134095782201
Epoch: 52, step: 408, loss: 0.31991735100746155, mean loss: 0.3415131235263429
Epoch: 52, step: 409, loss: 0.36004120111465454, mean loss: 0.341513368937845
Epoch: 52, step: 410, loss: 0.32614582777023315, mean loss: 0.3415131653915574
Epoch: 52, step: 411, loss: 0.3606470227241516, mean loss: 0.34151341882013136
Epoch: 52, step: 412, loss: 0.31039950251579285, mean loss: 0.3415130067207379
Epoch: 52, step: 413, loss: 0.3111775815486908, mean loss: 0.34151260493767027
Epoch: 52, step: 414, loss: 0.3491785526275635, mean loss: 0.3415127064693669
Epoch: 52, step: 415, loss: 0.3686465620994568, mean loss: 0.3415130658391437
Epoch: 52, step: 416, loss: 0.3287368714809418, mean loss: 0.34151289662923234
Epoch: 52, step: 417, loss: 0.39299076795578003, mean loss: 0.3415135784011621
Epoch: 52, step: 418, loss: 0.30807915329933167, mean loss: 0.34151313560214874
Epoch: 52, step: 419, loss: 0.32299521565437317, mean loss: 0.341512890357672
Epoch: 52, step: 420, loss: 0.32617703080177307, mean loss: 0.34151268725791495
Epoch: 52, step: 421, loss: 0.32935968041419983, mean loss: 0.3415125263122542
Epoch: 52, step: 422, loss: 0.3081393539905548, mean loss: 0.3415120843478739
Epoch: 52, step: 423, loss: 0.3772891163825989, mean loss: 0.34151255814054304
Epoch: 52, step: 424, loss: 0.31316909193992615, mean loss: 0.3415121827950237
Epoch: 52, step: 425, loss: 0.33534786105155945, mean loss: 0.34151210116351505
Epoch: 52, step: 426, loss: 0.3145151734352112, mean loss: 0.34151174365934067
Epoch: 52, step: 427, loss: 0.3201325833797455, mean loss: 0.34151146055165116
Epoch: 52, step: 428, loss: 0.3489464819431305, mean loss: 0.34151155900658703
Epoch: 52, step: 429, loss: 0.3362220227718353, mean loss: 0.34151148896320355
Epoch: 52, step: 430, loss: 0.31189775466918945, mean loss: 0.34151109682699554
Epoch: 52, step: 431, loss: 0.33327898383140564, mean loss: 0.34151098782126205
Epoch: 52, step: 432, loss: 0.31878992915153503, mean loss: 0.34151068696376985
Epoch: 52, step: 433, loss: 0.33918213844299316, mean loss: 0.34151065613105197
Epoch: 52, step: 434, loss: 0.3332633376121521, mean loss: 0.3415105469283122
Epoch: 52, step: 435, loss: 0.38958102464675903, mean loss: 0.34151118342105247
Epoch: 52, step: 436, loss: 0.35450538992881775, mean loss: 0.34151135547277717
Epoch: 52, step: 437, loss: 0.31217655539512634, mean loss: 0.3415109670661347
Epoch: 52, step: 438, loss: 0.3539249300956726, mean loss: 0.3415111314307067
Epoch: 52, step: 439, loss: 0.38230761885643005, mean loss: 0.3415116715812128
Epoch: 52, step: 440, loss: 0.3495284616947174, mean loss: 0.3415117777230936
Epoch: 52, step: 441, loss: 0.3821590542793274, mean loss: 0.34151231588377884
Epoch: 52, step: 442, loss: 0.335836261510849, mean loss: 0.34151224073510644
Epoch: 52, step: 443, loss: 0.3724021911621094, mean loss: 0.3415126497001865
Epoch: 52, step: 444, loss: 0.31019216775894165, mean loss: 0.34151223504060807
Epoch: 52, step: 445, loss: 0.34357643127441406, mean loss: 0.34151226236864884
Epoch: 52, step: 446, loss: 0.31494033336639404, mean loss: 0.34151191058564756
Epoch: 52, step: 447, loss: 0.30251240730285645, mean loss: 0.3415113942821197
Epoch: 52, step: 448, loss: 0.3359943628311157, mean loss: 0.3415113212446486
Epoch: 52, step: 449, loss: 0.3127511441707611, mean loss: 0.3415109405067806
Epoch: 52, step: 450, loss: 0.32903218269348145, mean loss: 0.3415107753105533
Epoch: 52, step: 451, loss: 0.3256784677505493, mean loss: 0.3415105657221556
Epoch: 52, step: 452, loss: 0.3241395950317383, mean loss: 0.3415103357679494
Epoch: 52, step: 453, loss: 0.3891299068927765, mean loss: 0.3415109661400752
Epoch: 52, step: 454, loss: 0.33218178153038025, mean loss: 0.34151084264505105
Epoch: 52, step: 455, loss: 0.37190505862236023, mean loss: 0.34151124498297303
Epoch: 52, step: 456, loss: 0.3171823024749756, mean loss: 0.3415109229372717
Epoch: 52, step: 457, loss: 0.33710747957229614, mean loss: 0.3415108646490319
Epoch: 52, step: 458, loss: 0.3616178631782532, mean loss: 0.3415111308012091
Epoch: 52, step: 459, loss: 0.32537367939949036, mean loss: 0.34151091719593296
Epoch: 52, step: 460, loss: 0.373000830411911, mean loss: 0.3415113340103609
Epoch: 52, step: 461, loss: 0.33553946018218994, mean loss: 0.3415112549650422
Epoch: 52, step: 462, loss: 0.3361896276473999, mean loss: 0.3415111845274925
Epoch: 52, step: 463, loss: 0.4194973409175873, mean loss: 0.3415122167457844
Epoch: 52, step: 464, loss: 0.34116801619529724, mean loss: 0.3415122121900348
Epoch: 52, step: 465, loss: 0.32541391253471375, mean loss: 0.3415119991199173
Epoch: 52, step: 466, loss: 0.3489159047603607, mean loss: 0.3415120971135066
Epoch: 52, step: 467, loss: 0.3048977255821228, mean loss: 0.34151161251438106
Epoch: 52, step: 468, loss: 0.31877875328063965, mean loss: 0.3415113116440549
Epoch: 52, step: 469, loss: 0.35112884640693665, mean loss: 0.3415114389308381
Epoch: 52, step: 470, loss: 0.30897289514541626, mean loss: 0.3415110082932729
Epoch: 52, step: 471, loss: 0.3265523612499237, mean loss: 0.341510810322825
Epoch: 52, step: 472, loss: 0.3281797170639038, mean loss: 0.341510633894598
Epoch: 52, step: 473, loss: 0.3017091155052185, mean loss: 0.34151010715472363
Epoch: 52, step: 474, loss: 0.3098528981208801, mean loss: 0.3415096882035301
Epoch: 52, step: 475, loss: 0.3299889862537384, mean loss: 0.3415095357406913
Epoch: 52, step: 476, loss: 0.3134138584136963, mean loss: 0.3415091639326145
Epoch: 52, step: 477, loss: 0.3099692761898041, mean loss: 0.3415087465506207
Epoch: 52, step: 478, loss: 0.3276347517967224, mean loss: 0.3415085629520293
Epoch: 52, step: 479, loss: 0.3952740728855133, mean loss: 0.3415092744371809
Epoch: 52, step: 480, loss: 0.3304617702960968, mean loss: 0.3415091282462277
Epoch: 52, step: 481, loss: 0.3345906734466553, mean loss: 0.34150903669594584
Epoch: 52, step: 482, loss: 0.33046531677246094, mean loss: 0.34150889055893663
Epoch: 52, step: 483, loss: 0.32024526596069336, mean loss: 0.3415086091898502
Epoch: 52, step: 484, loss: 0.31607380509376526, mean loss: 0.3415082726304428
Epoch: 52, step: 485, loss: 0.35867881774902344, mean loss: 0.34150849983219367
Epoch: 52, step: 486, loss: 0.38744473457336426, mean loss: 0.34150910765534603
Epoch: 52, step: 487, loss: 0.3433137536048889, mean loss: 0.3415091315339047
Epoch: 52, step: 488, loss: 0.31598779559135437, mean loss: 0.34150879384736066
Epoch: 52, step: 489, loss: 0.33135247230529785, mean loss: 0.34150865946537723
Epoch: 52, step: 490, loss: 0.3077368438243866, mean loss: 0.34150821262411657
Epoch: 52, step: 491, loss: 0.3097895681858063, mean loss: 0.34150779295430395
Epoch: 52, step: 492, loss: 0.3242637813091278, mean loss: 0.34150756480157185
Epoch: 52, step: 493, loss: 0.314982533454895, mean loss: 0.3415072138578108
Epoch: 52, step: 494, loss: 0.32389944791793823, mean loss: 0.34150698089846887
Epoch: 52, step: 495, loss: 0.3189125657081604, mean loss: 0.34150668196727724
Epoch: 52, step: 496, loss: 0.2994047999382019, mean loss: 0.3415061249535572
Epoch: 52, step: 497, loss: 0.3416258692741394, mean loss: 0.3415061265377702
Epoch: 52, step: 498, loss: 0.3143441677093506, mean loss: 0.34150576719080805
Epoch: 52, step: 499, loss: 0.3256951868534088, mean loss: 0.34150555802294624
Epoch: 52, step: 500, loss: 0.37669306993484497, mean loss: 0.3415060235339586
Epoch: 52, step: 501, loss: 0.31892114877700806, mean loss: 0.3415057247527077
Epoch: 52, step: 502, loss: 0.31001606583595276, mean loss: 0.34150530817323504
Epoch: 52, step: 503, loss: 0.326810747385025, mean loss: 0.3415051137801671
Epoch: 52, step: 504, loss: 0.3109701871871948, mean loss: 0.34150470984162
Epoch: 52, step: 505, loss: 0.33778706192970276, mean loss: 0.34150466066248
Epoch: 52, step: 506, loss: 0.31880253553390503, mean loss: 0.3415043603499576
Epoch: 52, step: 507, loss: 0.3188631236553192, mean loss: 0.34150406084685303
Epoch: 52, step: 508, loss: 0.3302628993988037, mean loss: 0.3415039121483405
Epoch: 52, step: 509, loss: 0.3098808825016022, mean loss: 0.3415034938432313
Epoch: 52, step: 510, loss: 0.3431512713432312, mean loss: 0.3415035156395183
Epoch: 52, step: 511, loss: 0.34017303586006165, mean loss: 0.34150349804057945
Epoch: 52, step: 512, loss: 0.32480064034461975, mean loss: 0.34150327710623074
Epoch: 52, step: 513, loss: 0.33017176389694214, mean loss: 0.34150312722245507
Epoch: 52, step: 514, loss: 0.33533012866973877, mean loss: 0.3415030455722751
Epoch: 52, step: 515, loss: 0.28832247853279114, mean loss: 0.3415023421628386
Epoch: 52, step: 516, loss: 0.3361958861351013, mean loss: 0.34150227197626326
Epoch: 52, step: 517, loss: 0.288042813539505, mean loss: 0.3415015648966871
Epoch: 52, step: 518, loss: 0.31855258345603943, mean loss: 0.3415012613668361
Epoch: 52, step: 519, loss: 0.358904093503952, mean loss: 0.3415014915386716
Epoch: 52, step: 520, loss: 0.2984851002693176, mean loss: 0.3415009226065171
Epoch: 52, step: 521, loss: 0.3534029722213745, mean loss: 0.3415010800202139
Epoch: 52, step: 522, loss: 0.33166319131851196, mean loss: 0.34150094990834257
Epoch: 52, step: 523, loss: 0.32901427149772644, mean loss: 0.34150078476685164
Epoch: 52, step: 524, loss: 0.3503597378730774, mean loss: 0.34150090192862415
Epoch: 52, step: 525, loss: 0.33144688606262207, mean loss: 0.3415007689636194
Epoch: 52, step: 526, loss: 0.2855076193809509, mean loss: 0.3415000284604179
Epoch: 52, step: 527, loss: 0.3277047872543335, mean loss: 0.3414998460222936
Epoch: 52, step: 528, loss: 0.32973140478134155, mean loss: 0.3414996903900781
Epoch: 52, step: 529, loss: 0.3182082772254944, mean loss: 0.3414993823759391
Epoch: 52, step: 530, loss: 0.35122475028038025, mean loss: 0.341499510986049
Epoch: 52, step: 531, loss: 0.3019963800907135, mean loss: 0.341498988596061
Epoch: 52, step: 532, loss: 0.3329959213733673, mean loss: 0.34149887615286106
Epoch: 52, step: 533, loss: 0.33085522055625916, mean loss: 0.3414987354047243
Epoch: 52, step: 534, loss: 0.32209667563438416, mean loss: 0.3414984788417769
Epoch: 52, step: 535, loss: 0.30519652366638184, mean loss: 0.3414979988095758
Epoch: 52, step: 536, loss: 0.2920675575733185, mean loss: 0.34149734518390656
Epoch: 52, step: 537, loss: 0.3501197397708893, mean loss: 0.341497459197534
Epoch: 52, step: 538, loss: 0.33004534244537354, mean loss: 0.34149730776858994
Epoch: 52, step: 539, loss: 0.30699577927589417, mean loss: 0.3414968515681286
Epoch: 52, step: 540, loss: 0.40926599502563477, mean loss: 0.3414977476416382
Epoch: 52, step: 541, loss: 0.3027098476886749, mean loss: 0.34149723477769595
Epoch: 52, step: 542, loss: 0.3368186056613922, mean loss: 0.34149717291643383
Epoch: 52, step: 543, loss: 0.31608253717422485, mean loss: 0.3414968368862384
Epoch: 52, step: 544, loss: 0.3284425139427185, mean loss: 0.34149666428535064
Epoch: 52, step: 545, loss: 0.2791895866394043, mean loss: 0.34149584048814774
Epoch: 52, step: 546, loss: 0.3139740526676178, mean loss: 0.3414954766117966
Epoch: 52, step: 547, loss: 0.3352849781513214, mean loss: 0.3414953945014462
Epoch: 52, step: 548, loss: 0.3350808620452881, mean loss: 0.3414953096946393
Epoch: 52, step: 549, loss: 0.33194273710250854, mean loss: 0.3414951834013398
Epoch: 52, step: 550, loss: 0.3577378988265991, mean loss: 0.34149539814129437
Epoch: 52, step: 551, loss: 0.30704131722450256, mean loss: 0.341494942640489
Epoch: 52, step: 552, loss: 0.3128751814365387, mean loss: 0.34149456427741604
Epoch: 52, step: 553, loss: 0.34191668033599854, mean loss: 0.34149456985786153
Epoch: 52, step: 554, loss: 0.31539976596832275, mean loss: 0.3414942248847128
Epoch: 52, step: 555, loss: 0.38467976450920105, mean loss: 0.3414947957897367
Epoch: 52, step: 556, loss: 0.30986475944519043, mean loss: 0.3414943776519041
Epoch: 52, step: 557, loss: 0.3594367206096649, mean loss: 0.341494614840162
Epoch: 52, step: 558, loss: 0.3182043433189392, mean loss: 0.34149430695919486
Epoch: 52, step: 559, loss: 0.33587127923965454, mean loss: 0.3414942326277159
Epoch: 52, step: 560, loss: 0.33780473470687866, mean loss: 0.34149418385644437
Epoch: 52, step: 561, loss: 0.39499181509017944, mean loss: 0.3414948910293622
Epoch: 52, step: 562, loss: 0.34854817390441895, mean loss: 0.34149498426385844
Epoch: 52, step: 563, loss: 0.3312612771987915, mean loss: 0.3414948489904081
Epoch: 52, step: 564, loss: 0.3729327917098999, mean loss: 0.3414952645448834
Epoch: 52, step: 565, loss: 0.2947606146335602, mean loss: 0.34149464680292774
Epoch: 52, step: 566, loss: 0.28528228402137756, mean loss: 0.34149390379370453
Epoch: 52, step: 567, loss: 0.379680871963501, mean loss: 0.34149440853844615
Epoch: 52, step: 568, loss: 0.32674846053123474, mean loss: 0.3414942136331762
Epoch: 52, step: 569, loss: 0.3254196345806122, mean loss: 0.34149400116947043
Epoch: 52, step: 570, loss: 0.30263751745224, mean loss: 0.3414934875956231
Epoch: 52, step: 571, loss: 0.2861427962779999, mean loss: 0.34149275602423373
Epoch: 52, step: 572, loss: 0.3201708495616913, mean loss: 0.3414924742158191
Epoch: 52, step: 573, loss: 0.3609711527824402, mean loss: 0.34149273165916666
Epoch: 52, step: 574, loss: 0.3482898473739624, mean loss: 0.34149282149324295
Epoch: 52, step: 575, loss: 0.3648633062839508, mean loss: 0.34149313036516077
Epoch: 52, step: 576, loss: 0.3439367413520813, mean loss: 0.34149316266029045
Epoch: 52, step: 577, loss: 0.342678040266037, mean loss: 0.34149317831960385
Epoch: 52, step: 578, loss: 0.3384081721305847, mean loss: 0.3414931375487766
Epoch: 52, step: 579, loss: 0.33088040351867676, mean loss: 0.34149299729485116
Epoch: 52, step: 580, loss: 0.3604283630847931, mean loss: 0.3414932475342595
Epoch: 52, step: 581, loss: 0.33178454637527466, mean loss: 0.3414931192310858
Epoch: 52, step: 582, loss: 0.3348936438560486, mean loss: 0.3414930320183441
Epoch: 52, step: 583, loss: 0.32444366812705994, mean loss: 0.3414928067122349
Epoch: 52, step: 584, loss: 0.3411997854709625, mean loss: 0.3414928028400316
Epoch: 52, step: 585, loss: 0.3591534495353699, mean loss: 0.34149303621803057
Epoch: 52, step: 586, loss: 0.33519572019577026, mean loss: 0.3414929530027544
Epoch: 52, step: 587, loss: 0.37650054693222046, mean loss: 0.3414934156011202
Epoch: 52, step: 588, loss: 0.31354209780693054, mean loss: 0.3414930462508844
Epoch: 52, step: 589, loss: 0.3077866733074188, mean loss: 0.3414926008589218
Epoch: 52, step: 590, loss: 0.3461140990257263, mean loss: 0.3414926619260364
Epoch: 52, step: 591, loss: 0.3278849422931671, mean loss: 0.34149248212001587
Epoch: 52, step: 592, loss: 0.3615044951438904, mean loss: 0.3414927465458694
Epoch: 52, step: 593, loss: 0.32834893465042114, mean loss: 0.34149257287429763
Epoch: 52, step: 594, loss: 0.3440302312374115, mean loss: 0.34149260640439505
Epoch: 52, step: 595, loss: 0.3405049741268158, mean loss: 0.3414925933549754
Epoch: 52, step: 596, loss: 0.3339623808860779, mean loss: 0.34149249386085545
Epoch: 52, step: 597, loss: 0.3258291780948639, mean loss: 0.34149228690955974
Epoch: 52, step: 598, loss: 0.33397871255874634, mean loss: 0.34149218763789685
Epoch: 52, step: 599, loss: 0.34368667006492615, mean loss: 0.34149221663169277
Epoch: 52, step: 600, loss: 0.3287660479545593, mean loss: 0.34149204849406806
Epoch: 52, step: 601, loss: 0.34902629256248474, mean loss: 0.34149214803488015
Epoch: 52, step: 602, loss: 0.34792962670326233, mean loss: 0.34149223308434
Epoch: 52, step: 603, loss: 0.3227105736732483, mean loss: 0.3414919849516521
Epoch: 52, step: 604, loss: 0.2917339503765106, mean loss: 0.34149132758525663
Epoch: 52, step: 605, loss: 0.32281506061553955, mean loss: 0.3414910808514736
Epoch: 52, step: 606, loss: 0.2990991175174713, mean loss: 0.34149052081496745
Epoch: 52, step: 607, loss: 0.33011138439178467, mean loss: 0.34149037048818104
Epoch: 52, step: 608, loss: 0.3213227689266205, mean loss: 0.3414901040628067
Epoch: 52, step: 609, loss: 0.3206337094306946, mean loss: 0.3414898285417278
Epoch: 52, step: 610, loss: 0.37487223744392395, mean loss: 0.3414902695304978
Epoch: 52, step: 611, loss: 0.315851092338562, mean loss: 0.341489930835951
Epoch: 52, step: 612, loss: 0.38212886452674866, mean loss: 0.341490467670784
Epoch: 52, step: 613, loss: 0.3461255431175232, mean loss: 0.3414905288986967
Epoch: 52, step: 614, loss: 0.3556056320667267, mean loss: 0.34149071535237974
Epoch: 52, step: 615, loss: 0.30599039793014526, mean loss: 0.34149024641655834
Epoch: 52, step: 616, loss: 0.3727770745754242, mean loss: 0.3414906596895015
Epoch: 52, step: 617, loss: 0.349738746881485, mean loss: 0.34149076863842487
Epoch: 52, step: 618, loss: 0.32101044058799744, mean loss: 0.3414904981174948
Epoch: 52, step: 619, loss: 0.31739377975463867, mean loss: 0.3414901798325268
Epoch: 52, step: 620, loss: 0.3242526054382324, mean loss: 0.3414899521505551
Epoch: 52, step: 621, loss: 0.32378390431404114, mean loss: 0.3414897182838554
Epoch: 52, step: 622, loss: 0.3381585478782654, mean loss: 0.34148967428535576
Epoch: 52, step: 623, loss: 0.30994144082069397, mean loss: 0.3414892575979949
Epoch: 52, step: 624, loss: 0.34142351150512695, mean loss: 0.34148925672963554
Epoch: 52, step: 625, loss: 0.3468124568462372, mean loss: 0.34148932703631746
Epoch: 52, step: 626, loss: 0.28782156109809875, mean loss: 0.3414886182234542
Epoch: 52, step: 627, loss: 0.318060964345932, mean loss: 0.3414883088086162
Epoch: 52, step: 628, loss: 0.34235048294067383, mean loss: 0.34148832019541353
Epoch: 52, step: 629, loss: 0.33069178462028503, mean loss: 0.34148817760665556
Epoch: 52, step: 630, loss: 0.36724576354026794, mean loss: 0.34148851778000616
Epoch: 52, step: 631, loss: 0.33744993805885315, mean loss: 0.3414884644442993
Epoch: 52, step: 632, loss: 0.3088602125644684, mean loss: 0.3414880335433355
Epoch: 52, step: 633, loss: 0.32925453782081604, mean loss: 0.3414878719853243
Epoch: 52, step: 634, loss: 0.38613852858543396, mean loss: 0.34148846164311125
Epoch: 52, step: 635, loss: 0.29635167121887207, mean loss: 0.3414878655732995
Epoch: 52, step: 636, loss: 0.3649686574935913, mean loss: 0.3414881756530872
Epoch: 52, step: 637, loss: 0.3163630962371826, mean loss: 0.34148784386374914
Epoch: 52, step: 638, loss: 0.34129050374031067, mean loss: 0.34148784125780773
Epoch: 52, step: 639, loss: 0.35712459683418274, mean loss: 0.34148804774359337
Epoch: 52, step: 640, loss: 0.34643176198005676, mean loss: 0.3414881130252455
Epoch: 52, step: 641, loss: 0.29462769627571106, mean loss: 0.3414874942425075
Epoch: 52, step: 642, loss: 0.3592158854007721, mean loss: 0.341487728339392
Epoch: 52, step: 643, loss: 0.3778785169124603, mean loss: 0.34148820886002496
Epoch: 52, step: 644, loss: 0.3220408260822296, mean loss: 0.34148795207127003
Epoch: 52, step: 645, loss: 0.3292238116264343, mean loss: 0.34148779013422137
Epoch: 52, step: 646, loss: 0.3020365536212921, mean loss: 0.34148726922266776
Epoch: 52, step: 647, loss: 0.3314206898212433, mean loss: 0.341487136305965
Epoch: 52, step: 648, loss: 0.3454492390155792, mean loss: 0.3414871886199292
Epoch: 52, step: 649, loss: 0.3224037289619446, mean loss: 0.3414869366531535
Epoch: 52, step: 650, loss: 0.37014809250831604, mean loss: 0.3414873150731994
Epoch: 52, step: 651, loss: 0.2853972017765045, mean loss: 0.3414865745118937
Epoch: 52, step: 652, loss: 0.3785114288330078, mean loss: 0.3414870633469278
Epoch: 52, step: 653, loss: 0.37090355157852173, mean loss: 0.34148745172442285
Epoch: 52, step: 654, loss: 0.3377821743488312, mean loss: 0.34148740280534945
Epoch: 52, step: 655, loss: 0.341434121131897, mean loss: 0.3414874021019053
Epoch: 52, step: 656, loss: 0.3096008896827698, mean loss: 0.34148698113006004
Epoch: 52, step: 657, loss: 0.32046812772750854, mean loss: 0.34148670363879446
Epoch: 52, step: 658, loss: 0.3322305679321289, mean loss: 0.3414865814407443
Epoch: 52, step: 659, loss: 0.35965603590011597, mean loss: 0.34148682130786234
Epoch: 52, step: 660, loss: 0.3349801003932953, mean loss: 0.3414867354094226
Epoch: 52, step: 661, loss: 0.302775114774704, mean loss: 0.34148622436492576
Epoch: 52, step: 662, loss: 0.29256919026374817, mean loss: 0.34148557860402357
Epoch: 52, step: 663, loss: 0.3462909758090973, mean loss: 0.34148564203993553
Epoch: 52, step: 664, loss: 0.32714518904685974, mean loss: 0.34148545273452197
Epoch: 52, step: 665, loss: 0.3298575282096863, mean loss: 0.3414852992386732
Epoch: 52, step: 666, loss: 0.33982113003730774, mean loss: 0.34148527727089284
Epoch: 52, step: 667, loss: 0.3246209919452667, mean loss: 0.3414850546576962
Epoch: 52, step: 668, loss: 0.33918115496635437, mean loss: 0.34148502424598914
Epoch: 52, step: 669, loss: 0.31187307834625244, mean loss: 0.3414846333704922
Epoch: 52, step: 670, loss: 0.3345192074775696, mean loss: 0.3414845414285989
Epoch: 52, step: 671, loss: 0.3390306830406189, mean loss: 0.34148450903870464
Epoch: 52, step: 672, loss: 0.31715041399002075, mean loss: 0.34148418784316803
Epoch: 52, step: 673, loss: 0.32767122983932495, mean loss: 0.3414840055227699
Epoch: 52, step: 674, loss: 0.3050987124443054, mean loss: 0.3414835252712873
Epoch: 52, step: 675, loss: 0.3234686851501465, mean loss: 0.34148328749556106
Epoch: 52, step: 676, loss: 0.3329196572303772, mean loss: 0.3414831744667184
Epoch: 52, step: 677, loss: 0.3726649582386017, mean loss: 0.3414835860204994
Epoch: 52, step: 678, loss: 0.3127390742301941, mean loss: 0.34148320664013865
Epoch: 52, step: 679, loss: 0.3492453396320343, mean loss: 0.34148330908619756
Epoch: 52, step: 680, loss: 0.3084372878074646, mean loss: 0.34148287294448687
Epoch: 52, step: 681, loss: 0.33547213673591614, mean loss: 0.3414827936157788
Epoch: 52, step: 682, loss: 0.3109651803970337, mean loss: 0.3414823908546536
Epoch: 52, step: 683, loss: 0.2960669994354248, mean loss: 0.3414817914856067
Epoch: 52, step: 684, loss: 0.32333821058273315, mean loss: 0.3414815520390901
Epoch: 52, step: 685, loss: 0.32187312841415405, mean loss: 0.3414812932640007
Epoch: 52, step: 686, loss: 0.33563292026519775, mean loss: 0.3414812160832287
Epoch: 52, step: 687, loss: 0.32597294449806213, mean loss: 0.3414810114238169
Epoch: 52, step: 688, loss: 0.3208348751068115, mean loss: 0.34148073896467607
Epoch: 52, step: 689, loss: 0.3086119294166565, mean loss: 0.3414803052133294
Epoch: 52, step: 690, loss: 0.32364824414253235, mean loss: 0.3414800698966708
Epoch: 52, step: 691, loss: 0.33461567759513855, mean loss: 0.34147997931350504
Epoch: 52, step: 692, loss: 0.35413113236427307, mean loss: 0.3414801462571064
Epoch: 52, step: 693, loss: 0.3653488755226135, mean loss: 0.34148046122278775
Epoch: 52, step: 694, loss: 0.3610367476940155, mean loss: 0.34148071927916546
Epoch: 52, step: 695, loss: 0.31123217940330505, mean loss: 0.34148032013765967
Epoch: 52, step: 696, loss: 0.32466429471969604, mean loss: 0.34148009824644876
Epoch: 52, step: 697, loss: 0.33964940905570984, mean loss: 0.3414800740904148
Epoch: 52, step: 698, loss: 0.3318944573402405, mean loss: 0.3414799476093989
Epoch: 52, step: 699, loss: 0.33924874663352966, mean loss: 0.3414799181693692
Epoch: 52, step: 700, loss: 0.32594892382621765, mean loss: 0.3414797132452464
Epoch: 52, step: 701, loss: 0.34225666522979736, mean loss: 0.341479723496625
Epoch: 52, step: 702, loss: 0.358513206243515, mean loss: 0.3414799482394407
Epoch: 52, step: 703, loss: 0.296560138463974, mean loss: 0.34147935556726194
Epoch: 52, step: 704, loss: 0.33919647336006165, mean loss: 0.3414793254473009
Epoch: 52, step: 705, loss: 0.34340906143188477, mean loss: 0.34147935090757464
Epoch: 52, step: 706, loss: 0.36062338948249817, mean loss: 0.341479603484111
Epoch: 52, step: 707, loss: 0.3150663673877716, mean loss: 0.34147925500614257
Epoch: 52, step: 708, loss: 0.3446565568447113, mean loss: 0.3414792969247124
Epoch: 52, step: 709, loss: 0.3175656199455261, mean loss: 0.3414789814325229
Epoch: 52, step: 710, loss: 0.312450110912323, mean loss: 0.34147859846084094
Epoch: 52, step: 711, loss: 0.34395667910575867, mean loss: 0.3414786311531977
Epoch: 52, step: 712, loss: 0.3090725839138031, mean loss: 0.3414782036384256
Epoch: 52, step: 713, loss: 0.3513401746749878, mean loss: 0.34147833374015163
Epoch: 52, step: 714, loss: 0.38105303049087524, mean loss: 0.34147885581311377
Epoch: 52, step: 715, loss: 0.3504723906517029, mean loss: 0.34147897445506986
Epoch: 52, step: 716, loss: 0.343928724527359, mean loss: 0.3414790067715407
Epoch: 52, step: 717, loss: 0.32639145851135254, mean loss: 0.3414788077431226
Epoch: 52, step: 718, loss: 0.35097384452819824, mean loss: 0.34147893299589327
Epoch: 52, step: 719, loss: 0.3072566092014313, mean loss: 0.3414784815616938
Epoch: 52, step: 720, loss: 0.34048905968666077, mean loss: 0.34147846851018443
Epoch: 52, step: 721, loss: 0.3186299502849579, mean loss: 0.34147816711830703
Epoch: 52, step: 722, loss: 0.3527538478374481, mean loss: 0.34147831585240523
Epoch: 52, step: 723, loss: 0.29345235228538513, mean loss: 0.34147768236478365
Epoch: 52, step: 724, loss: 0.40464338660240173, mean loss: 0.34147851554252673
Epoch: 52, step: 725, loss: 0.35610637068748474, mean loss: 0.34147870848650996
Epoch: 52, step: 726, loss: 0.3212106227874756, mean loss: 0.3414784411504195
Epoch: 52, step: 727, loss: 0.3353107273578644, mean loss: 0.3414783597993354
Epoch: 52, step: 728, loss: 0.30261924862861633, mean loss: 0.3414778472611029
Epoch: 52, step: 729, loss: 0.3710585832595825, mean loss: 0.3414782374156308
Epoch: 52, step: 730, loss: 0.3048294484615326, mean loss: 0.34147775404353475
Epoch: 52, step: 731, loss: 0.29970473051071167, mean loss: 0.34147720309360685
Epoch: 52, step: 732, loss: 0.3822430670261383, mean loss: 0.3414777407528824
Epoch: 52, step: 733, loss: 0.3508377969264984, mean loss: 0.3414778642006439
Epoch: 52, step: 734, loss: 0.2968730926513672, mean loss: 0.3414772759256937
Epoch: 52, step: 735, loss: 0.3116634786128998, mean loss: 0.34147688272832466
Epoch: 52, step: 736, loss: 0.3160085380077362, mean loss: 0.3414765468451104
Epoch: 52, step: 737, loss: 0.3291454613208771, mean loss: 0.341476384221663
Epoch: 52, step: 738, loss: 0.36336925625801086, mean loss: 0.34147667294298967
Epoch: 52, step: 739, loss: 0.3169882595539093, mean loss: 0.34147634999614435
Epoch: 52, step: 740, loss: 0.3689947724342346, mean loss: 0.34147671289717746
Epoch: 52, step: 741, loss: 0.335600882768631, mean loss: 0.3414766354102972
Epoch: 52, step: 742, loss: 0.33142194151878357, mean loss: 0.34147650281684744
Epoch: 52, step: 743, loss: 0.3734499216079712, mean loss: 0.34147692445176137
Epoch: 52, step: 744, loss: 0.30465036630630493, mean loss: 0.34147643882468415
Epoch: 52, step: 745, loss: 0.33640480041503906, mean loss: 0.3414763719465238
Epoch: 52, step: 746, loss: 0.31673553586006165, mean loss: 0.3414760457009105
Epoch: 52, step: 747, loss: 0.3087153136730194, mean loss: 0.3414756137064484
Epoch: 52, step: 748, loss: 0.35659143328666687, mean loss: 0.3414758130262999
Epoch: 52, step: 749, loss: 0.347636878490448, mean loss: 0.34147589426611985
Epoch: 52, step: 750, loss: 0.3231469988822937, mean loss: 0.3414756525844602
Epoch: 52, step: 751, loss: 0.3255667984485626, mean loss: 0.34147544281581393
Epoch: 52, step: 752, loss: 0.3042142689228058, mean loss: 0.3414749515093452
Epoch: 52, step: 753, loss: 0.36958691477775574, mean loss: 0.34147532217419146
Epoch: 52, step: 754, loss: 0.334426611661911, mean loss: 0.3414752292360098
Epoch: 52, step: 755, loss: 0.3178498446941376, mean loss: 0.34147491773629274
Epoch: 52, step: 756, loss: 0.3398683965206146, mean loss: 0.3414748965546563
Epoch: 52, step: 757, loss: 0.30648916959762573, mean loss: 0.34147443528145854
Epoch: 52, step: 758, loss: 0.31398874521255493, mean loss: 0.34147407289810694
Epoch: 52, step: 759, loss: 0.35502102971076965, mean loss: 0.34147425150475197
Epoch: 52, step: 760, loss: 0.3116466701030731, mean loss: 0.34147385825525095
Epoch: 52, step: 761, loss: 0.31630825996398926, mean loss: 0.3414735264741265
Epoch: 52, step: 762, loss: 0.3515990376472473, mean loss: 0.3414736599662515
Epoch: 52, step: 763, loss: 0.30435842275619507, mean loss: 0.3414731706549979
Epoch: 52, step: 764, loss: 0.3475080728530884, mean loss: 0.3414732502154925
Epoch: 52, step: 765, loss: 0.3363504111766815, mean loss: 0.3414731826799764
Epoch: 52, step: 766, loss: 0.37508758902549744, mean loss: 0.34147362582026175
Epoch: 52, step: 767, loss: 0.398826003074646, mean loss: 0.3414743818893565
Epoch: 52, step: 768, loss: 0.31913310289382935, mean loss: 0.34147408737099966
Epoch: 52, step: 769, loss: 0.32097434997558594, mean loss: 0.3414738171326939
Epoch: 52, step: 770, loss: 0.32469141483306885, mean loss: 0.3414735959011683
Epoch: 52, step: 771, loss: 0.3198186457157135, mean loss: 0.341473310441767
Epoch: 52, step: 772, loss: 0.3057636618614197, mean loss: 0.3414728397170391
Epoch: 52, step: 773, loss: 0.30043908953666687, mean loss: 0.3414722988171132
Epoch: 52, step: 774, loss: 0.32003292441368103, mean loss: 0.34147201621064627
Epoch: 52, step: 775, loss: 0.29865720868110657, mean loss: 0.34147145184800354
Epoch: 52, step: 776, loss: 0.3015507459640503, mean loss: 0.34147092564084763
Epoch: 52, step: 777, loss: 0.30968451499938965, mean loss: 0.3414705066598727
Epoch: 52, step: 778, loss: 0.3386881947517395, mean loss: 0.3414704699863268
Epoch: 52, step: 779, loss: 0.32332104444503784, mean loss: 0.34147023076260213
Epoch: 52, step: 780, loss: 0.31486693024635315, mean loss: 0.34146988011476814
Epoch: 52, step: 781, loss: 0.31221944093704224, mean loss: 0.341469494581103
Epoch: 52, step: 782, loss: 0.36909276247024536, mean loss: 0.3414698586631355
Epoch: 52, step: 783, loss: 0.3748922049999237, mean loss: 0.3414702991727614
Epoch: 52, step: 784, loss: 0.33630889654159546, mean loss: 0.3414702311458924
Epoch: 52, step: 785, loss: 0.35455045104026794, mean loss: 0.34147040353985997
Epoch: 52, step: 786, loss: 0.31451329588890076, mean loss: 0.34147004825672783
Epoch: 52, step: 787, loss: 0.31250306963920593, mean loss: 0.3414696664893888
Epoch: 52, step: 788, loss: 0.3577338755130768, mean loss: 0.3414698808390471
Epoch: 52, step: 789, loss: 0.35109102725982666, mean loss: 0.34147000763662244
Epoch: 52, step: 790, loss: 0.3069919943809509, mean loss: 0.3414695532551301
Epoch: 52, step: 791, loss: 0.298796147108078, mean loss: 0.3414689908749753
Epoch: 52, step: 792, loss: 0.3295896351337433, mean loss: 0.3414688343225347
Epoch: 52, step: 793, loss: 0.30982211232185364, mean loss: 0.34146841727077015
Epoch: 52, step: 794, loss: 0.33429408073425293, mean loss: 0.3414683227260561
Epoch: 52, step: 795, loss: 0.4126985967159271, mean loss: 0.341469261399215
Epoch: 52, step: 796, loss: 0.3626759648323059, mean loss: 0.34146954085765124
Epoch: 52, step: 797, loss: 0.3325081169605255, mean loss: 0.341469422767043
Epoch: 52, step: 798, loss: 0.347348690032959, mean loss: 0.3414695002410144
Epoch: 52, step: 799, loss: 0.33977627754211426, mean loss: 0.3414694779288873
Epoch: 52, step: 800, loss: 0.30364125967025757, mean loss: 0.3414689794611481
Epoch: 52, step: 801, loss: 0.3430679142475128, mean loss: 0.3414690005302585
Epoch: 52, step: 802, loss: 0.31463396549224854, mean loss: 0.34146864693055584
Epoch: 52, step: 803, loss: 0.3557089567184448, mean loss: 0.3414688345696981
Epoch: 52, step: 804, loss: 0.3536747992038727, mean loss: 0.3414689954009294
Epoch: 52, step: 805, loss: 0.36449456214904785, mean loss: 0.3414692987920637
Epoch: 52, step: 806, loss: 0.32602012157440186, mean loss: 0.34146909523218205
Epoch: 52, step: 807, loss: 0.3325294554233551, mean loss: 0.3414689774441588
Epoch: 52, step: 808, loss: 0.3288228511810303, mean loss: 0.3414688108219437
Epoch: 52, step: 809, loss: 0.31757083535194397, mean loss: 0.3414684959523098
Epoch: 52, step: 810, loss: 0.35205087065696716, mean loss: 0.3414686353793735
Epoch: 52, step: 811, loss: 0.29893314838409424, mean loss: 0.3414680749645251
Epoch: 52, step: 812, loss: 0.3537759780883789, mean loss: 0.3414682371218501
Epoch: 52, step: 813, loss: 0.33325356245040894, mean loss: 0.3414681288944691
Epoch: 52, step: 814, loss: 0.3244117498397827, mean loss: 0.34146790418162437
Epoch: 52, step: 815, loss: 0.3719273805618286, mean loss: 0.3414683054711003
Epoch: 52, step: 816, loss: 0.3564109206199646, mean loss: 0.34146850233053183
Epoch: 52, step: 817, loss: 0.3047335147857666, mean loss: 0.34146801837685825
Epoch: 52, step: 818, loss: 0.33039039373397827, mean loss: 0.3414678724400587
Epoch: 52, step: 819, loss: 0.3155319094657898, mean loss: 0.3414675307637799
Epoch: 52, step: 820, loss: 0.33404284715652466, mean loss: 0.34146743295345955
Epoch: 52, step: 821, loss: 0.3666541278362274, mean loss: 0.34146776475025686
Epoch: 52, step: 822, loss: 0.3196617364883423, mean loss: 0.34146747749243833
Epoch: 52, step: 823, loss: 0.3454344570636749, mean loss: 0.34146752975004674
Epoch: 52, step: 824, loss: 0.32204195857048035, mean loss: 0.3414672738574963
Epoch: 52, step: 825, loss: 0.33820056915283203, mean loss: 0.34146723082584596
Epoch: 52, step: 826, loss: 0.31121543049812317, mean loss: 0.3414668323301557
Epoch: 52, step: 827, loss: 0.3057385981082916, mean loss: 0.3414663617016423
Epoch: 52, step: 828, loss: 0.3601762652397156, mean loss: 0.3414666081537352
Epoch: 52, step: 829, loss: 0.3270568251609802, mean loss: 0.3414664183465354
Epoch: 52, step: 830, loss: 0.3464033305644989, mean loss: 0.34146648337521357
Epoch: 52, step: 831, loss: 0.3684995472431183, mean loss: 0.3414668394482361
Epoch: 52, step: 832, loss: 0.3308973014354706, mean loss: 0.3414667002306545
Epoch: 52, step: 833, loss: 0.32656392455101013, mean loss: 0.3414665039400447
Epoch: 52, step: 834, loss: 0.3124760091304779, mean loss: 0.34146612209930066
Epoch: 52, step: 835, loss: 0.40029338002204895, mean loss: 0.34146689691698573
Epoch: 52, step: 836, loss: 0.318055659532547, mean loss: 0.3414665885700989
Epoch: 52, step: 837, loss: 0.34874022006988525, mean loss: 0.3414666843690544
Epoch: 52, step: 838, loss: 0.3460691273212433, mean loss: 0.34146674498573826
Epoch: 52, step: 839, loss: 0.3233475089073181, mean loss: 0.34146650634866
Epoch: 52, step: 840, loss: 0.33514246344566345, mean loss: 0.34146642305975977
Epoch: 52, step: 841, loss: 0.3402875065803528, mean loss: 0.34146640753340024
Epoch: 52, step: 842, loss: 0.3157789409160614, mean loss: 0.34146606923327755
Epoch: 52, step: 843, loss: 0.35288164019584656, mean loss: 0.3414662195726728
Epoch: 52, step: 844, loss: 0.3031065762042999, mean loss: 0.3414657143951694
Epoch: 52, step: 845, loss: 0.34918051958084106, mean loss: 0.3414658159939945
Epoch: 52, step: 846, loss: 0.34262797236442566, mean loss: 0.3414658312986152
Epoch: 52, step: 847, loss: 0.32012155652046204, mean loss: 0.34146555021619346
Epoch: 52, step: 848, loss: 0.32049018144607544, mean loss: 0.34146527399552673
Epoch: 52, step: 849, loss: 0.3774406313896179, mean loss: 0.3414657477419698
Epoch: 52, step: 850, loss: 0.3448309898376465, mean loss: 0.34146579205703975
Epoch: 52, step: 851, loss: 0.35089293122291565, mean loss: 0.3414659161963493
Epoch: 52, step: 852, loss: 0.33056876063346863, mean loss: 0.34146577270132605
Epoch: 52, step: 853, loss: 0.34854358434677124, mean loss: 0.34146586590155315
Epoch: 52, step: 854, loss: 0.3294770419597626, mean loss: 0.34146570803547016
Epoch: 52, step: 855, loss: 0.3214651942253113, mean loss: 0.341465444676761
Epoch: 52, step: 856, loss: 0.33609190583229065, mean loss: 0.34146537392109777
Epoch: 52, step: 857, loss: 0.3415951430797577, mean loss: 0.3414653756298008
Epoch: 52, step: 858, loss: 0.3374459743499756, mean loss: 0.34146532270603447
Epoch: 52, step: 859, loss: 0.30308666825294495, mean loss: 0.3414648173779883
Epoch: 52, step: 860, loss: 0.36623117327690125, mean loss: 0.3414651434699171
Epoch: 52, step: 861, loss: 0.3319379985332489, mean loss: 0.3414650180302207
Epoch: 52, step: 862, loss: 0.3233432173728943, mean loss: 0.34146477943164194
Epoch: 52, step: 863, loss: 0.31924930214881897, mean loss: 0.34146448693799747
Epoch: 52, step: 864, loss: 0.3313148319721222, mean loss: 0.34146435330726577
Epoch: 52, step: 865, loss: 0.29801657795906067, mean loss: 0.34146378127978405
Epoch: 52, step: 866, loss: 0.31192547082901, mean loss: 0.3414633923875393
Epoch: 52, step: 867, loss: 0.366978257894516, mean loss: 0.3414637283039318
Epoch: 52, step: 868, loss: 0.3228739798069, mean loss: 0.3414634835635063
Epoch: 52, step: 869, loss: 0.35478249192237854, mean loss: 0.3414636589105186
Epoch: 52, step: 870, loss: 0.33555155992507935, mean loss: 0.34146358107775376
Epoch: 52, step: 871, loss: 0.3454797863960266, mean loss: 0.3414636339503883
Epoch: 52, step: 872, loss: 0.3724042475223541, mean loss: 0.3414640412727455
Epoch: 52, step: 873, loss: 0.32281923294067383, mean loss: 0.3414637958235955
Epoch: 52, step: 874, loss: 0.3652981221675873, mean loss: 0.34146410958590534
Epoch: 52, step: 875, loss: 0.33057934045791626, mean loss: 0.3414639662973854
Epoch: 52, step: 876, loss: 0.32375368475914, mean loss: 0.3414637331599993
Epoch: 52, step: 877, loss: 0.31641051173210144, mean loss: 0.34146340336480896
Epoch: 52, step: 878, loss: 0.29733580350875854, mean loss: 0.34146282248627147
Epoch: 52, step: 879, loss: 0.29624494910240173, mean loss: 0.3414622272636332
Epoch: 52, step: 880, loss: 0.3140577971935272, mean loss: 0.3414618665318864
Epoch: 52, step: 881, loss: 0.3560296297073364, mean loss: 0.3414620582886743
Epoch: 52, step: 882, loss: 0.31258299946784973, mean loss: 0.34146167815600764
Epoch: 52, step: 883, loss: 0.3123014569282532, mean loss: 0.34146129432747574
Epoch: 52, step: 884, loss: 0.31413865089416504, mean loss: 0.341460934691244
Epoch: 52, step: 885, loss: 0.3675270974636078, mean loss: 0.34146127778444396
Epoch: 52, step: 886, loss: 0.3082951605319977, mean loss: 0.34146084124456566
Epoch: 52, step: 887, loss: 0.31380629539489746, mean loss: 0.341460477254018
Epoch: 52, step: 888, loss: 0.3152799904346466, mean loss: 0.3414601326696462
Epoch: 52, step: 889, loss: 0.34613728523254395, mean loss: 0.3414601942289471
Epoch: 52, step: 890, loss: 0.29002517461776733, mean loss: 0.3414595172653175
Epoch: 52, step: 891, loss: 0.33384430408477783, mean loss: 0.34145941703876864
Epoch: 52, step: 892, loss: 0.32265838980674744, mean loss: 0.3414591695949704
Epoch: 52, step: 893, loss: 0.3344787657260895, mean loss: 0.3414590777257926
Epoch: 52, step: 894, loss: 0.30752813816070557, mean loss: 0.34145863116617314
Epoch: 52, step: 895, loss: 0.3231673240661621, mean loss: 0.3414583904404006
Epoch: 52, step: 896, loss: 0.34220683574676514, mean loss: 0.3414584002903092
Epoch: 52, step: 897, loss: 0.3449278473854065, mean loss: 0.3414584459493398
Epoch: 52, step: 898, loss: 0.33027395606040955, mean loss: 0.341458298759822
Epoch: 52, step: 899, loss: 0.3308248221874237, mean loss: 0.34145815882356134
Epoch: 52, step: 900, loss: 0.38138043880462646, mean loss: 0.34145868419275927
Epoch: 52, step: 901, loss: 0.36033710837364197, mean loss: 0.341458932625766
Epoch: 52, step: 902, loss: 0.3368954658508301, mean loss: 0.34145887257303903
Epoch: 52, step: 903, loss: 0.3349606692790985, mean loss: 0.3414587870613629
Epoch: 52, step: 904, loss: 0.35604968667030334, mean loss: 0.34145897906456857
Epoch: 52, step: 905, loss: 0.31970643997192383, mean loss: 0.34145869282435104
Epoch: 52, step: 906, loss: 0.3337026834487915, mean loss: 0.34145859076488166
Epoch: 52, step: 907, loss: 0.3165656626224518, mean loss: 0.3414582632091137
Epoch: 52, step: 908, loss: 0.33557605743408203, mean loss: 0.34145818580861403
Epoch: 52, step: 909, loss: 0.31712308526039124, mean loss: 0.3414578656014961
Epoch: 52, step: 910, loss: 0.3467894196510315, mean loss: 0.34145793575444616
Epoch: 52, step: 911, loss: 0.3402729630470276, mean loss: 0.3414579201627
Epoch: 52, step: 912, loss: 0.32991480827331543, mean loss: 0.34145776828164726
Epoch: 52, step: 913, loss: 0.39951345324516296, mean loss: 0.341458532152137
Epoch: 52, step: 914, loss: 0.353397935628891, mean loss: 0.3414586892433502
Epoch: 52, step: 915, loss: 0.349983811378479, mean loss: 0.34145880141010637
Epoch: 52, step: 916, loss: 0.3035494089126587, mean loss: 0.3414583026351245
Epoch: 52, step: 917, loss: 0.32432660460472107, mean loss: 0.3414580772358398
Epoch: 52, step: 918, loss: 0.30340832471847534, mean loss: 0.34145757662731013
Epoch: 52, step: 919, loss: 0.343548983335495, mean loss: 0.3414576041429231
Epoch: 52, step: 920, loss: 0.3219064474105835, mean loss: 0.3414573469213213
Epoch: 52, step: 921, loss: 0.34309154748916626, mean loss: 0.34145736842113145
Epoch: 52, step: 922, loss: 0.3334600031375885, mean loss: 0.3414572632078691
Epoch: 52, step: 923, loss: 0.31725576519966125, mean loss: 0.34145694481737804
Epoch: 52, step: 924, loss: 0.30634114146232605, mean loss: 0.34145648284635527
Epoch: 52, step: 925, loss: 0.3262837529182434, mean loss: 0.3414562832419412
Epoch: 52, step: 926, loss: 0.3196748197078705, mean loss: 0.3414559967002911
Epoch: 52, step: 927, loss: 0.3125323951244354, mean loss: 0.34145561620669007
Epoch: 52, step: 928, loss: 0.3250780403614044, mean loss: 0.341455400760463
Epoch: 52, step: 929, loss: 0.30676913261413574, mean loss: 0.34145494447026664
Epoch: 52, step: 930, loss: 0.33139368891716003, mean loss: 0.3414548121184131
Epoch: 52, step: 931, loss: 0.31521672010421753, mean loss: 0.34145446697118853
Epoch: 52, step: 932, loss: 0.31983622908592224, mean loss: 0.34145418259926646
Epoch: 52, step: 933, loss: 0.30597221851348877, mean loss: 0.34145371586642487
Epoch: 52, step: 934, loss: 0.394346684217453, mean loss: 0.34145441161597895
Epoch: 52, step: 935, loss: 0.37440940737724304, mean loss: 0.34145484509745533
Epoch: 52, step: 936, loss: 0.331163227558136, mean loss: 0.34145470972596514
Epoch: 52, step: 937, loss: 0.3370441794395447, mean loss: 0.3414546517125186
Epoch: 52, step: 938, loss: 0.3416436016559601, mean loss: 0.3414546541978191
Epoch: 52, step: 939, loss: 0.3258083462715149, mean loss: 0.34145444840116623
Epoch: 52, step: 940, loss: 0.3460019528865814, mean loss: 0.34145450821392825
Epoch: 52, step: 941, loss: 0.33241933584213257, mean loss: 0.3414543893769906
Epoch: 52, step: 942, loss: 0.349168986082077, mean loss: 0.3414544908434543
Epoch: 52, step: 943, loss: 0.347086638212204, mean loss: 0.34145456491946663
Epoch: 52, step: 944, loss: 0.33449897170066833, mean loss: 0.3414544734382253
Epoch: 52, step: 945, loss: 0.3105371296405792, mean loss: 0.3414540668129814
Epoch: 52, step: 946, loss: 0.3118908107280731, mean loss: 0.3414536780018275
Epoch: 52, step: 947, loss: 0.3312182128429413, mean loss: 0.3414535433884186
Epoch: 52, step: 948, loss: 0.3487384617328644, mean loss: 0.3414536391959642
Epoch: 52, step: 949, loss: 0.3737591803073883, mean loss: 0.34145406405644335
Epoch: 52, step: 950, loss: 0.3485785722732544, mean loss: 0.341454157751892
Epoch: 52, step: 951, loss: 0.32855942845344543, mean loss: 0.3414539881736529
Epoch: 52, step: 952, loss: 0.3201979696750641, mean loss: 0.34145370864
Epoch: 52, step: 953, loss: 0.32432231307029724, mean loss: 0.341453483351402
Epoch: 52, step: 954, loss: 0.35255998373031616, mean loss: 0.3414536294069282
Epoch: 52, step: 955, loss: 0.3432307839393616, mean loss: 0.3414536527770104
Epoch: 52, step: 956, loss: 0.35350990295410156, mean loss: 0.34145381131800817
Epoch: 52, step: 957, loss: 0.3343489170074463, mean loss: 0.3414537178891058
Epoch: 52, step: 958, loss: 0.3596469461917877, mean loss: 0.3414539571257397
Epoch: 52, step: 959, loss: 0.3111010491847992, mean loss: 0.3414535579974531
Epoch: 52, step: 960, loss: 0.34048792719841003, mean loss: 0.3414535452999712
Epoch: 52, step: 961, loss: 0.37320390343666077, mean loss: 0.3414539627931748
Epoch: 52, step: 962, loss: 0.33407604694366455, mean loss: 0.34145386578043535
Epoch: 52, step: 963, loss: 0.35217800736427307, mean loss: 0.3414540067910805
Epoch: 52, step: 964, loss: 0.3417029082775116, mean loss: 0.34145401006381776
Epoch: 52, step: 965, loss: 0.33401361107826233, mean loss: 0.34145391223334226
Epoch: 52, step: 966, loss: 0.3294215202331543, mean loss: 0.3414537540268864
Epoch: 52, step: 967, loss: 0.3010595738887787, mean loss: 0.3414532229158611
Epoch: 52, step: 968, loss: 0.34079790115356445, mean loss: 0.34145321429966846
Epoch: 52, step: 969, loss: 0.33819425106048584, mean loss: 0.3414531714512733
Epoch: 52, step: 970, loss: 0.30659550428390503, mean loss: 0.3414527131535417
Epoch: 52, step: 971, loss: 0.3348543345928192, mean loss: 0.3414526264012598
Epoch: 52, step: 972, loss: 0.3039129376411438, mean loss: 0.3414521328541231
Epoch: 52, step: 973, loss: 0.3050679862499237, mean loss: 0.34145165450558373
Epoch: 52, step: 974, loss: 0.3465796113014221, mean loss: 0.34145172192281414
Epoch: 52, step: 975, loss: 0.31775790452957153, mean loss: 0.34145141042437344
Epoch: 52, step: 976, loss: 0.3063812255859375, mean loss: 0.3414509493688967
Epoch: 52, step: 977, loss: 0.31520357728004456, mean loss: 0.3414506043083954
Epoch: 52, step: 978, loss: 0.3436163663864136, mean loss: 0.34145063278016474
Epoch: 52, step: 979, loss: 0.371755450963974, mean loss: 0.3414510311713172
Epoch: 52, step: 980, loss: 0.3123167157173157, mean loss: 0.3414506481727836
Epoch: 52, step: 981, loss: 0.31595444679260254, mean loss: 0.34145031300515666
Epoch: 52, step: 982, loss: 0.3670544922351837, mean loss: 0.34145064958781274
Epoch: 52, step: 983, loss: 0.30766186118125916, mean loss: 0.34145020541928284
Epoch: 52, step: 984, loss: 0.35400304198265076, mean loss: 0.3414503704296882
Epoch: 52, step: 985, loss: 0.35066527128219604, mean loss: 0.3414504915604405
Epoch: 52, step: 986, loss: 0.3190234899520874, mean loss: 0.3414501967592363
Epoch: 52, step: 987, loss: 0.3639448583126068, mean loss: 0.3414504924459385
Epoch: 52, step: 988, loss: 0.3478437662124634, mean loss: 0.3414505764828191
Epoch: 52, step: 989, loss: 0.3302614986896515, mean loss: 0.34145042940905546
Epoch: 52, step: 990, loss: 0.4016375243663788, mean loss: 0.34145122052217414
Epoch: 52, step: 991, loss: 0.3369755446910858, mean loss: 0.34145116169362744
Epoch: 52, step: 992, loss: 0.3217565715312958, mean loss: 0.34145090283017715
Epoch: 52, step: 993, loss: 0.3153216242790222, mean loss: 0.34145055939442953
Epoch: 52, step: 994, loss: 0.31590116024017334, mean loss: 0.34145022358486427
Epoch: 52, step: 995, loss: 0.3308759331703186, mean loss: 0.3414500846030755
Epoch: 52, step: 996, loss: 0.3264870345592499, mean loss: 0.34144988794078934
Epoch: 52, step: 997, loss: 0.3669731318950653, mean loss: 0.34145022339335557
Epoch: 52, step: 998, loss: 0.3196576237678528, mean loss: 0.34144993697649556
Epoch: 52, step: 999, loss: 0.31170231103897095, mean loss: 0.3414495460130593
Epoch: 52, step: 1000, loss: 0.32107633352279663, mean loss: 0.3414492782580292
Epoch: 52, step: 1001, loss: 0.35498708486557007, mean loss: 0.34144945617637074
Epoch: 52, step: 1002, loss: 0.3387743830680847, mean loss: 0.3414494210201353
Epoch: 52, step: 1003, loss: 0.35633838176727295, mean loss: 0.34144961669064927
Epoch: 52, step: 1004, loss: 0.3554040789604187, mean loss: 0.34144980007758724
Epoch: 52, step: 1005, loss: 0.3285072445869446, mean loss: 0.3414496299911745
Epoch: 52, step: 1006, loss: 0.3514408469200134, mean loss: 0.3414497612904311
Epoch: 52, step: 1007, loss: 0.3203152120113373, mean loss: 0.34144948355508
Epoch: 52, step: 1008, loss: 0.3194894790649414, mean loss: 0.34144919497597054
Epoch: 52, step: 1009, loss: 0.3315831422805786, mean loss: 0.3414490653266671
Epoch: 52, step: 1010, loss: 0.3693525791168213, mean loss: 0.34144943200052336
Epoch: 52, step: 1011, loss: 0.32833853363990784, mean loss: 0.3414492597153938
Epoch: 52, step: 1012, loss: 0.2977660298347473, mean loss: 0.341448685698891
Epoch: 52, step: 1013, loss: 0.3296688199043274, mean loss: 0.341448530908402
Epoch: 52, step: 1014, loss: 0.33286574482917786, mean loss: 0.34144841812985083
Epoch: 52, step: 1015, loss: 0.33989378809928894, mean loss: 0.34144839770214624
Epoch: 52, step: 1016, loss: 0.3249571621417999, mean loss: 0.3414481810115798
Epoch: 52, step: 1017, loss: 0.3511866629123688, mean loss: 0.3414483089710298
Epoch: 52, step: 1018, loss: 0.3053918480873108, mean loss: 0.34144783521091726
Epoch: 52, step: 1019, loss: 0.3518858850002289, mean loss: 0.3414479723587833
Epoch: 52, step: 1020, loss: 0.3247721493244171, mean loss: 0.34144775325430116
Epoch: 52, step: 1021, loss: 0.3493020534515381, mean loss: 0.34144785645099274
Epoch: 52, step: 1022, loss: 0.30591249465942383, mean loss: 0.341447389562346
Epoch: 52, step: 1023, loss: 0.34071993827819824, mean loss: 0.34144738000470354
Epoch: 52, step: 1024, loss: 0.34889236092567444, mean loss: 0.3414474778195436
Epoch: 52, step: 1025, loss: 0.2903537154197693, mean loss: 0.3414468065401154
Epoch: 52, step: 1026, loss: 0.3214004337787628, mean loss: 0.34144654317057244
Epoch: 52, step: 1027, loss: 0.3298124074935913, mean loss: 0.3414463903231333
Epoch: 52, step: 1028, loss: 0.30432814359664917, mean loss: 0.34144590267587016
Epoch: 52, step: 1029, loss: 0.3518078923225403, mean loss: 0.3414460388064785
Epoch: 52, step: 1030, loss: 0.331762433052063, mean loss: 0.34144591158980786
Epoch: 52, step: 1031, loss: 0.32466793060302734, mean loss: 0.3414456911749236
Epoch: 52, step: 1032, loss: 0.3089580535888672, mean loss: 0.3414452643855017
Epoch: 52, step: 1033, loss: 0.32969412207603455, mean loss: 0.34144511001301664
Epoch: 52, step: 1034, loss: 0.34001898765563965, mean loss: 0.341445091278569
Epoch: 52, step: 1035, loss: 0.35796570777893066, mean loss: 0.3414453083010126
Epoch: 52, step: 1036, loss: 0.32648035883903503, mean loss: 0.3414451117171116
Epoch: 52, step: 1037, loss: 0.42089858651161194, mean loss: 0.34144615542720796
Epoch: 52, step: 1038, loss: 0.32774364948272705, mean loss: 0.34144597543185884
Epoch: 52, step: 1039, loss: 0.3927958607673645, mean loss: 0.3414466499522106
Epoch: 52, step: 1040, loss: 0.30801236629486084, mean loss: 0.34144621077287474
Epoch: 52, step: 1041, loss: 0.32589906454086304, mean loss: 0.3414460065544821
Epoch: 52, step: 1042, loss: 0.32666686177253723, mean loss: 0.34144581242666583
Epoch: 52, step: 1043, loss: 0.34075990319252014, mean loss: 0.3414458034171924
Epoch: 52, step: 1044, loss: 0.2989445924758911, mean loss: 0.3414452451676693
Epoch: 52, step: 1045, loss: 0.33668309450149536, mean loss: 0.3414451826180769
Epoch: 52, step: 1046, loss: 0.3318895399570465, mean loss: 0.34144505710888057
Epoch: 52, step: 1047, loss: 0.32728511095046997, mean loss: 0.34144487112660993
Epoch: 52, step: 1048, loss: 0.30343469977378845, mean loss: 0.34144437189271115
Epoch: 52, step: 1049, loss: 0.3433825969696045, mean loss: 0.3414443973494486
Epoch: 52, step: 1050, loss: 0.3394009470939636, mean loss: 0.34144437051103127
Epoch: 52, step: 1051, loss: 0.3230505883693695, mean loss: 0.34144412893259496
Epoch: 52, step: 1052, loss: 0.2928476929664612, mean loss: 0.3414434906899141
Epoch: 52, step: 1053, loss: 0.301842600107193, mean loss: 0.34144297059731626
Epoch: 52, step: 1054, loss: 0.357053279876709, mean loss: 0.3414431756103743
Epoch: 52, step: 1055, loss: 0.3478679656982422, mean loss: 0.3414432599872141
Epoch: 52, step: 1056, loss: 0.3212403655052185, mean loss: 0.3414429946658603
Epoch: 52, step: 1057, loss: 0.36539191007614136, mean loss: 0.3414433091789721
Epoch: 52, step: 1058, loss: 0.3729642927646637, mean loss: 0.34144372312809135
Epoch: 52, step: 1059, loss: 0.3289499878883362, mean loss: 0.3414435590563463
Epoch: 52, step: 1060, loss: 0.3154582381248474, mean loss: 0.3414432178132449
Epoch: 52, step: 1061, loss: 0.41389888525009155, mean loss: 0.341444169299357
Epoch: 52, step: 1062, loss: 0.35560914874076843, mean loss: 0.3414443553110895
Epoch: 52, step: 1063, loss: 0.31481561064720154, mean loss: 0.341444005632228
Epoch: 52, step: 1064, loss: 0.3157540261745453, mean loss: 0.3414436682853151
Epoch: 52, step: 1065, loss: 0.3230787217617035, mean loss: 0.3414434271299388
Epoch: 52, step: 1066, loss: 0.3610115945339203, mean loss: 0.34144368408177916
Epoch: 52, step: 1067, loss: 0.32429930567741394, mean loss: 0.341443458959945
Epoch: 52, step: 1068, loss: 0.3037876486778259, mean loss: 0.3414429645101862
Epoch: 52, step: 1069, loss: 0.34070834517478943, mean loss: 0.3414429548641958
Epoch: 52, step: 1070, loss: 0.33727630972862244, mean loss: 0.3414429001543764
Epoch: 52, step: 1071, loss: 0.3125971555709839, mean loss: 0.341442521402478
Epoch: 52, step: 1072, loss: 0.3137381374835968, mean loss: 0.3414421576417091
Epoch: 52, step: 1073, loss: 0.3351125121116638, mean loss: 0.34144207453405
Epoch: 52, step: 1074, loss: 0.4005361795425415, mean loss: 0.34144285042398353
Epoch: 52, step: 1075, loss: 0.369927316904068, mean loss: 0.34144322441256714
Epoch: 52, step: 1076, loss: 0.32987266778945923, mean loss: 0.3414430724982151
Epoch: 52, step: 1077, loss: 0.4059639871120453, mean loss: 0.3414439196073532
Epoch: 52, step: 1078, loss: 0.2919674217700958, mean loss: 0.3414432700281675
Epoch: 52, step: 1079, loss: 0.3372712731361389, mean loss: 0.34144321525455007
Epoch: 52, step: 1080, loss: 0.3369556963443756, mean loss: 0.34144315633925765
Epoch: 52, step: 1081, loss: 0.2964608669281006, mean loss: 0.3414425657879985
Epoch: 52, step: 1082, loss: 0.28591057658195496, mean loss: 0.34144183674427836
Epoch: 52, step: 1083, loss: 0.2699885964393616, mean loss: 0.3414408986930219
Epoch: 52, step: 1084, loss: 0.33299094438552856, mean loss: 0.3414407877619268
Epoch: 52, step: 1085, loss: 0.31162452697753906, mean loss: 0.3414403963388588
Epoch: 52, step: 1086, loss: 0.3722454905509949, mean loss: 0.34144080073786387
Epoch: 52, step: 1087, loss: 0.3362151086330414, mean loss: 0.34144073213762094
Epoch: 52, step: 1088, loss: 0.2984137237071991, mean loss: 0.34144016730823107
Epoch: 52, step: 1089, loss: 0.3354528844356537, mean loss: 0.34144008871227327
Epoch: 52, step: 1090, loss: 0.35692667961120605, mean loss: 0.3414402920043997
Epoch: 52, step: 1091, loss: 0.33193638920783997, mean loss: 0.34144016724852155
Epoch: 52, step: 1092, loss: 0.3177582919597626, mean loss: 0.34143985638524477
Epoch: 52, step: 1093, loss: 0.30452731251716614, mean loss: 0.3414393718542024
Epoch: 52, step: 1094, loss: 0.3190450072288513, mean loss: 0.3414390778993224
Epoch: 52, step: 1095, loss: 0.30582427978515625, mean loss: 0.341438610415361
Epoch: 52, step: 1096, loss: 0.34314101934432983, mean loss: 0.34143863276108427
Epoch: 52, step: 1097, loss: 0.30509886145591736, mean loss: 0.3414381557735629
Epoch: 52, step: 1098, loss: 0.2925261855125427, mean loss: 0.341437513774662
Epoch: 52, step: 1099, loss: 0.3773423731327057, mean loss: 0.3414379850412573
Epoch: 52, step: 1100, loss: 0.3254355490207672, mean loss: 0.34143777500521505
Epoch: 52, step: 1101, loss: 0.30940285325050354, mean loss: 0.3414373545442391
Epoch: 52, step: 1102, loss: 0.32464247941970825, mean loss: 0.34143713411301857
Epoch: 52, step: 1103, loss: 0.3417743146419525, mean loss: 0.3414371385384245
Epoch: 52, step: 1104, loss: 0.30396732687950134, mean loss: 0.34143664676343655
Epoch: 52, step: 1105, loss: 0.31034567952156067, mean loss: 0.3414362387133638
Epoch: 52, step: 1106, loss: 0.32080331444740295, mean loss: 0.34143596792231107
Epoch: 52, step: 1107, loss: 0.31583794951438904, mean loss: 0.3414356319726758
Epoch: 52, step: 1108, loss: 0.33588844537734985, mean loss: 0.3414355591720853
Epoch: 52, step: 1109, loss: 0.3096776604652405, mean loss: 0.3414351423908219
Epoch: 52, step: 1110, loss: 0.3716070353984833, mean loss: 0.3414355383526194
Epoch: 52, step: 1111, loss: 0.33320164680480957, mean loss: 0.3414354302962999
Epoch: 52, step: 1112, loss: 0.33238887786865234, mean loss: 0.34143531157669743
Epoch: 52, step: 1113, loss: 0.35816311836242676, mean loss: 0.3414355310959592
Epoch: 52, step: 1114, loss: 0.33693569898605347, mean loss: 0.34143547204536917
Epoch: 52, step: 1115, loss: 0.3677981197834015, mean loss: 0.3414358179937149
Epoch: 52, step: 1116, loss: 0.3807486593723297, mean loss: 0.34143633387641786
Epoch: 52, step: 1117, loss: 0.3325967788696289, mean loss: 0.3414362178808925
Epoch: 52, step: 1118, loss: 0.3192594647407532, mean loss: 0.34143592687411967
Epoch: 52, step: 1119, loss: 0.31011372804641724, mean loss: 0.3414355158647922
Epoch: 52, step: 1120, loss: 0.3037658929824829, mean loss: 0.341435021571167
Epoch: 52, step: 1121, loss: 0.32281872630119324, mean loss: 0.34143477729488736
Epoch: 52, step: 1122, loss: 0.3657148480415344, mean loss: 0.3414350958849957
Epoch: 52, step: 1123, loss: 0.30457714200019836, mean loss: 0.34143461226097477
Epoch: 52, step: 1124, loss: 0.3199743330478668, mean loss: 0.34143433067805307
Epoch: 52, step: 1125, loss: 0.337533563375473, mean loss: 0.3414342794962846
Epoch: 52, step: 1126, loss: 0.3398470878601074, mean loss: 0.34143425867109745
Epoch: 52, step: 1127, loss: 0.3751285970211029, mean loss: 0.3414347007611881
Epoch: 52, step: 1128, loss: 0.3979899287223816, mean loss: 0.34143544279023624
Epoch: 52, step: 1129, loss: 0.33850231766700745, mean loss: 0.34143540430687114
Epoch: 52, step: 1130, loss: 0.3121287226676941, mean loss: 0.34143501980062413
Epoch: 52, step: 1131, loss: 0.33838599920272827, mean loss: 0.3414349797977299
Epoch: 52, step: 1132, loss: 0.35718655586242676, mean loss: 0.34143518645437393
Epoch: 52, step: 1133, loss: 0.284630686044693, mean loss: 0.3414344412036535
Epoch: 52, step: 1134, loss: 0.3137246370315552, mean loss: 0.3414340776676582
Epoch: 52, step: 1135, loss: 0.30395954847335815, mean loss: 0.3414335860307828
Epoch: 52, step: 1136, loss: 0.32233381271362305, mean loss: 0.341433335459798
Epoch: 52, step: 1137, loss: 0.3133786916732788, mean loss: 0.34143296741419954
Epoch: 52, step: 1138, loss: 0.34144458174705505, mean loss: 0.3414329675665646
Epoch: 52, step: 1139, loss: 0.3453071415424347, mean loss: 0.34143301839006746
Epoch: 52, step: 1140, loss: 0.3041006326675415, mean loss: 0.34143252865012963
Epoch: 52, step: 1141, loss: 0.3087630867958069, mean loss: 0.3414321000860229
Epoch: 52, step: 1142, loss: 0.3240355849266052, mean loss: 0.3414318718781395
Epoch: 52, step: 1143, loss: 0.2996678650379181, mean loss: 0.3414313240241302
Epoch: 52, step: 1144, loss: 0.3179411292076111, mean loss: 0.34143101588730207
Epoch: 52, step: 1145, loss: 0.3229014277458191, mean loss: 0.34143077282530687
Epoch: 52, step: 1146, loss: 0.32768911123275757, mean loss: 0.3414305925713344
Epoch: 52, step: 1147, loss: 0.33608922362327576, mean loss: 0.34143052250773
Epoch: 52, step: 1148, loss: 0.3256703019142151, mean loss: 0.34143031578106714
Epoch: 52, step: 1149, loss: 0.31205201148986816, mean loss: 0.3414299304311853
Epoch: 52, step: 1150, loss: 0.3739957809448242, mean loss: 0.3414303575859291
Epoch: 52, step: 1151, loss: 0.3682502806186676, mean loss: 0.3414307093687601
Epoch: 52, step: 1152, loss: 0.35192736983299255, mean loss: 0.34143084704613136
Epoch: 52, step: 1153, loss: 0.3559301793575287, mean loss: 0.341431037221262
Epoch: 52, step: 1154, loss: 0.3567032814025879, mean loss: 0.3414312375313781
Epoch: 52, step: 1155, loss: 0.37715402245521545, mean loss: 0.3414317060637862
Epoch: 52, step: 1156, loss: 0.32002317905426025, mean loss: 0.3414314252778067
Epoch: 52, step: 1157, loss: 0.3491796553134918, mean loss: 0.34143152689926926
Epoch: 52, step: 1158, loss: 0.35160595178604126, mean loss: 0.3414316603395999
Epoch: 52, step: 1159, loss: 0.36105379462242126, mean loss: 0.34143191768581593
Epoch: 52, step: 1160, loss: 0.35332190990448, mean loss: 0.3414320736221852
Epoch: 52, step: 1161, loss: 0.3342727720737457, mean loss: 0.34143197972970585
Epoch: 52, step: 1162, loss: 0.30089786648750305, mean loss: 0.34143144814174975
Epoch: 52, step: 1163, loss: 0.3193134665489197, mean loss: 0.34143115807746827
Epoch: 52, step: 1164, loss: 0.3261198103427887, mean loss: 0.341430957280808
Epoch: 52, step: 1165, loss: 0.32986360788345337, mean loss: 0.3414308055858229
Epoch: 52, step: 1166, loss: 0.3338487446308136, mean loss: 0.34143070615547794
Epoch: 52, step: 1167, loss: 0.3089604377746582, mean loss: 0.34143028034939865
Epoch: 52, step: 1168, loss: 0.34017592668533325, mean loss: 0.34143026390036885
Epoch: 52, step: 1169, loss: 0.37503352761268616, mean loss: 0.341430704552677
Epoch: 52, step: 1170, loss: 0.3250572979450226, mean loss: 0.34143048984481816
Epoch: 52, step: 1171, loss: 0.3518904447555542, mean loss: 0.3414306270065663
Epoch: 52, step: 1172, loss: 0.32945552468299866, mean loss: 0.3414304699786972
Epoch: 52, step: 1173, loss: 0.3879600465297699, mean loss: 0.3414310801066318
Epoch: 52, step: 1174, loss: 0.3564266562461853, mean loss: 0.34143127673640167
Epoch: 52, step: 1175, loss: 0.29535967111587524, mean loss: 0.341430672629541
Epoch: 52, step: 1176, loss: 0.3736978769302368, mean loss: 0.3414310957227594
Epoch: 52, step: 1177, loss: 0.35055243968963623, mean loss: 0.3414312153218464
Epoch: 52, step: 1178, loss: 0.30609598755836487, mean loss: 0.3414307520123185
Epoch: 52, step: 1179, loss: 0.3411870300769806, mean loss: 0.3414307488167196
Epoch: 52, step: 1180, loss: 0.335940420627594, mean loss: 0.34143067683035305
Epoch: 52, step: 1181, loss: 0.3304227888584137, mean loss: 0.34143053250246563
Epoch: 52, step: 1182, loss: 0.3469352722167969, mean loss: 0.3414306046758961
Epoch: 52, step: 1183, loss: 0.33898240327835083, mean loss: 0.3414305725775979
Epoch: 52, step: 1184, loss: 0.3541003167629242, mean loss: 0.34143073868807194
Epoch: 52, step: 1185, loss: 0.35492444038391113, mean loss: 0.34143091559896815
Epoch: 52, step: 1186, loss: 0.3260045349597931, mean loss: 0.3414307133520899
Epoch: 52, step: 1187, loss: 0.32904738187789917, mean loss: 0.34143055100310105
Epoch: 52, step: 1188, loss: 0.3310335576534271, mean loss: 0.3414304146973555
Epoch: 52, step: 1189, loss: 0.2813711166381836, mean loss: 0.34142962732356413
Epoch: 52, step: 1190, loss: 0.4073442220687866, mean loss: 0.34143049144861487
Epoch: 52, step: 1191, loss: 0.3544977903366089, mean loss: 0.34143066275562706
Epoch: 52, step: 1192, loss: 0.3537527918815613, mean loss: 0.34143082429164684
Epoch: 52, step: 1193, loss: 0.3271735608577728, mean loss: 0.3414306373895804
Epoch: 52, step: 1194, loss: 0.32864782214164734, mean loss: 0.34143046981862424
Epoch: 52, step: 1195, loss: 0.34860676527023315, mean loss: 0.3414305638920269
Epoch: 52, step: 1196, loss: 0.3412192761898041, mean loss: 0.341430561122312
Epoch: 52, step: 1197, loss: 0.3556986153125763, mean loss: 0.34143074815602975
Epoch: 52, step: 1198, loss: 0.3269626200199127, mean loss: 0.3414305585021158
Epoch: 52, step: 1199, loss: 0.3224067986011505, mean loss: 0.3414303091344577
Epoch: 52, step: 1200, loss: 0.35658809542655945, mean loss: 0.34143050782347306
Epoch: 52, step: 1201, loss: 0.35490670800209045, mean loss: 0.3414306844678587
Epoch: 52, step: 1202, loss: 0.3487485945224762, mean loss: 0.34143078038887237
Epoch: 52, step: 1203, loss: 0.3687610626220703, mean loss: 0.3414311386214817
Epoch: 52, step: 1204, loss: 0.366355836391449, mean loss: 0.34143146531852825
Epoch: 52, step: 1205, loss: 0.33180806040763855, mean loss: 0.34143133918272583
Epoch: 52, step: 1206, loss: 0.34325700998306274, mean loss: 0.34143136311182737
Epoch: 52, step: 1207, loss: 0.33834269642829895, mean loss: 0.34143132262914566
Epoch: 52, step: 1208, loss: 0.3209044337272644, mean loss: 0.34143105358987935
Epoch: 52, step: 1209, loss: 0.2892855107784271, mean loss: 0.34143037014414274
Epoch: 52, step: 1210, loss: 0.3209775984287262, mean loss: 0.3414301020833331
Epoch: 52, step: 1211, loss: 0.32832255959510803, mean loss: 0.3414299302937854
Epoch: 52, step: 1212, loss: 0.3293323218822479, mean loss: 0.3414297717426732
Epoch: 52, step: 1213, loss: 0.29429858922958374, mean loss: 0.3414291540500503
Epoch: 52, step: 1214, loss: 0.3545456528663635, mean loss: 0.3414293259502222
Epoch: 52, step: 1215, loss: 0.3404228091239929, mean loss: 0.34142931275934324
Epoch: 52, step: 1216, loss: 0.3773762285709381, mean loss: 0.34142978385449835
Epoch: 52, step: 1217, loss: 0.321940153837204, mean loss: 0.34142952844037605
Epoch: 52, step: 1218, loss: 0.30511072278022766, mean loss: 0.3414290524839676
Epoch: 52, step: 1219, loss: 0.3256533443927765, mean loss: 0.34142884574669113
Epoch: 52, step: 1220, loss: 0.324631005525589, mean loss: 0.3414286256174767
Epoch: 52, step: 1221, loss: 0.282144695520401, mean loss: 0.34142784873462917
Epoch: 52, step: 1222, loss: 0.29783323407173157, mean loss: 0.34142727745899837
Epoch: 52, step: 1223, loss: 0.34870752692222595, mean loss: 0.3414273728601078
Epoch: 52, step: 1224, loss: 0.3299693167209625, mean loss: 0.34142722271457376
Epoch: 52, step: 1225, loss: 0.3045544922351837, mean loss: 0.3414267395433276
Epoch: 52, step: 1226, loss: 0.3583119213581085, mean loss: 0.34142696079972296
Epoch: 52, step: 1227, loss: 0.30954959988594055, mean loss: 0.34142654309752535
Epoch: 52, step: 1228, loss: 0.3168103098869324, mean loss: 0.3414262205451031
Epoch: 52, step: 1229, loss: 0.3103492259979248, mean loss: 0.34142581334110733
Epoch: 52, step: 1230, loss: 0.3475441038608551, mean loss: 0.34142589350843816
Epoch: 52, step: 1231, loss: 0.34606873989105225, mean loss: 0.3414259543423792
Epoch: 52, step: 1232, loss: 0.33728837966918945, mean loss: 0.3414259001295849
Epoch: 52, step: 1233, loss: 0.3256823420524597, mean loss: 0.34142569385147276
Epoch: 52, step: 1234, loss: 0.34846699237823486, mean loss: 0.34142578610804714
Epoch: 52, step: 1235, loss: 0.34079405665397644, mean loss: 0.3414257778311034
Epoch: 52, step: 1236, loss: 0.33518195152282715, mean loss: 0.3414256960253214
Epoch: 52, step: 1237, loss: 0.3265116810798645, mean loss: 0.341425500626441
Epoch: 52, step: 1238, loss: 0.43515247106552124, mean loss: 0.34142672859256623
Epoch: 52, step: 1239, loss: 0.30713406205177307, mean loss: 0.3414262793122688
Epoch: 52, step: 1240, loss: 0.3355088233947754, mean loss: 0.34142620178661126
Epoch: 52, step: 1241, loss: 0.32234686613082886, mean loss: 0.34142595182806734
Epoch: 52, step: 1242, loss: 0.3275987505912781, mean loss: 0.3414257706801558
Epoch: 52, step: 1243, loss: 0.37167689204216003, mean loss: 0.3414261669899782
Epoch: 52, step: 1244, loss: 0.36412325501441956, mean loss: 0.34142646433304114
Epoch: 52, step: 1245, loss: 0.3330972194671631, mean loss: 0.3414263552172491
Epoch: 52, step: 1246, loss: 0.33777645230293274, mean loss: 0.3414263074029711
Epoch: 52, step: 1247, loss: 0.33260396122932434, mean loss: 0.3414261918304211
Epoch: 52, step: 1248, loss: 0.3136135935783386, mean loss: 0.3414258274907398
Epoch: 52, step: 1249, loss: 0.33246123790740967, mean loss: 0.3414257100578809
Epoch: 52, step: 1250, loss: 0.3106960952281952, mean loss: 0.3414253075163906
Epoch: 52, step: 1251, loss: 0.31105750799179077, mean loss: 0.34142490971969786
Epoch: 52, step: 1252, loss: 0.3418067693710327, mean loss: 0.34142491472172365
Epoch: 52, step: 1253, loss: 0.3383387327194214, mean loss: 0.34142487429598156
Epoch: 52, step: 1254, loss: 0.32088619470596313, mean loss: 0.34142460526437957
Epoch: 52, step: 1255, loss: 0.30192574858665466, mean loss: 0.3414240878844063
Epoch: 52, step: 1256, loss: 0.404084712266922, mean loss: 0.3414249086405054
Epoch: 52, step: 1257, loss: 0.336076557636261, mean loss: 0.34142483858639644
Epoch: 52, step: 1258, loss: 0.32667458057403564, mean loss: 0.34142464538616574
Epoch: 52, step: 1259, loss: 0.3349362313747406, mean loss: 0.34142456040143776
Epoch: 52, step: 1260, loss: 0.32205840945243835, mean loss: 0.3414243067484633
Epoch: 52, step: 1261, loss: 0.3375406563282013, mean loss: 0.3414242558820531
Epoch: 52, step: 1262, loss: 0.2921565771102905, mean loss: 0.3414236106032909
Epoch: 52, step: 1263, loss: 0.3239748179912567, mean loss: 0.34142338207237344
Epoch: 52, step: 1264, loss: 0.3274625539779663, mean loss: 0.34142319922653774
Epoch: 52, step: 1265, loss: 0.3077312111854553, mean loss: 0.3414227579662496
Epoch: 52, step: 1266, loss: 0.3495326638221741, mean loss: 0.3414228641794099
Epoch: 52, step: 1267, loss: 0.31701987981796265, mean loss: 0.34142254458456
Epoch: 52, step: 1268, loss: 0.33356913924217224, mean loss: 0.3414224417334089
Epoch: 52, step: 1269, loss: 0.33774158358573914, mean loss: 0.3414223935281371
Epoch: 52, step: 1270, loss: 0.2982352674007416, mean loss: 0.341421827948099
Epoch: 52, step: 1271, loss: 0.3421637713909149, mean loss: 0.34142183766448775
Epoch: 52, step: 1272, loss: 0.3521016240119934, mean loss: 0.34142197752366127
Epoch: 52, step: 1273, loss: 0.30665910243988037, mean loss: 0.3414215222857801
Epoch: 52, step: 1274, loss: 0.3220076262950897, mean loss: 0.34142126805407114
Epoch: 52, step: 1275, loss: 0.3045676648616791, mean loss: 0.34142078544966076
Epoch: 52, step: 1276, loss: 0.30051496624946594, mean loss: 0.34142024978778424
Epoch: 52, step: 1277, loss: 0.31883949041366577, mean loss: 0.3414199540965162
Epoch: 52, step: 1278, loss: 0.3073718547821045, mean loss: 0.34141950824818756
Epoch: 52, step: 1279, loss: 0.32469791173934937, mean loss: 0.341419289287412
Epoch: 52, step: 1280, loss: 0.37314078211784363, mean loss: 0.34141970465873844
Epoch: 52, step: 1281, loss: 0.3445124626159668, mean loss: 0.3414197451557655
Epoch: 52, step: 1282, loss: 0.35798561573028564, mean loss: 0.3414199620688683
Epoch: 52, step: 1283, loss: 0.3034398853778839, mean loss: 0.34141946476518775
Epoch: 52, step: 1284, loss: 0.3906096816062927, mean loss: 0.3414201088438129
Epoch: 52, step: 1285, loss: 0.3362216651439667, mean loss: 0.34142004077819244
Epoch: 52, step: 1286, loss: 0.33589598536491394, mean loss: 0.34141996845013467
Epoch: 52, step: 1287, loss: 0.3218444287776947, mean loss: 0.3414197121452788
Epoch: 52, step: 1288, loss: 0.35874542593955994, mean loss: 0.3414199389899283
Epoch: 52, step: 1289, loss: 0.3504128158092499, mean loss: 0.3414200567316447
Epoch: 52, step: 1290, loss: 0.3382544219493866, mean loss: 0.34142001528524213
Epoch: 52, step: 1291, loss: 0.3403502106666565, mean loss: 0.34142000127889727
Epoch: 52, step: 1292, loss: 0.3170798122882843, mean loss: 0.3414196826107862
Epoch: 52, step: 1293, loss: 0.30749407410621643, mean loss: 0.3414192384536745
Epoch: 52, step: 1294, loss: 0.3400164842605591, mean loss: 0.3414192200889311
Epoch: 52, step: 1295, loss: 0.3079802393913269, mean loss: 0.3414187823142571
Epoch: 52, step: 1296, loss: 0.34873539209365845, mean loss: 0.34141887810020694
Epoch: 52, step: 1297, loss: 0.3477064073085785, mean loss: 0.3414189604127931
Epoch: 52, step: 1298, loss: 0.3659400939941406, mean loss: 0.3414192814246614
Epoch: 52, step: 1299, loss: 0.2942954897880554, mean loss: 0.34141866452421055
Epoch: 52, step: 1300, loss: 0.3669740855693817, mean loss: 0.34141899906741763
Epoch: 52, step: 1301, loss: 0.3473964333534241, mean loss: 0.3414190773163283
Epoch: 52, step: 1302, loss: 0.33105751872062683, mean loss: 0.34141894167785525
Epoch: 52, step: 1303, loss: 0.3059403598308563, mean loss: 0.3414184772498805
Epoch: 52, step: 1304, loss: 0.35886773467063904, mean loss: 0.34141870566423027
Epoch: 52, step: 1305, loss: 0.3323305547237396, mean loss: 0.3414185867000323
Epoch: 52, step: 1306, loss: 0.37429720163345337, mean loss: 0.3414190170765613
Epoch: 52, step: 1307, loss: 0.38266435265541077, mean loss: 0.34141955696524107
Epoch: 52, step: 1308, loss: 0.34530746936798096, mean loss: 0.34141960785614517
Epoch: 52, step: 1309, loss: 0.32880836725234985, mean loss: 0.3414194427832296
Epoch: 52, step: 1310, loss: 0.3948047459125519, mean loss: 0.34142014155288797
Epoch: 52, step: 1311, loss: 0.3244703710079193, mean loss: 0.34141991969725255
Epoch: 52, step: 1312, loss: 0.3233524262905121, mean loss: 0.34141968321483207
Epoch: 52, step: 1313, loss: 0.3082531988620758, mean loss: 0.34141924910990873
Epoch: 52, step: 1314, loss: 0.3440849184989929, mean loss: 0.34141928399949933
Epoch: 52, step: 1315, loss: 0.361640602350235, mean loss: 0.3414195486625844
Epoch: 52, step: 1316, loss: 0.33969321846961975, mean loss: 0.34141952606811815
Epoch: 52, step: 1317, loss: 0.31501004099845886, mean loss: 0.3414191804213748
Epoch: 52, step: 1318, loss: 0.329868882894516, mean loss: 0.34141902925332046
Epoch: 52, step: 1319, loss: 0.31498444080352783, mean loss: 0.3414186832870807
Epoch: 52, step: 1320, loss: 0.31881776452064514, mean loss: 0.3414183874983808
Epoch: 52, step: 1321, loss: 0.3320501148700714, mean loss: 0.34141826489305915
Epoch: 52, step: 1322, loss: 0.315893292427063, mean loss: 0.3414179308446569
Epoch: 52, step: 1323, loss: 0.31004536151885986, mean loss: 0.34141752027342037
Epoch: 52, step: 1324, loss: 0.3639439344406128, mean loss: 0.34141781507161134
Epoch: 52, step: 1325, loss: 0.3207187056541443, mean loss: 0.3414175441904977
Epoch: 52, step: 1326, loss: 0.3799971342086792, mean loss: 0.34141804905982986
Epoch: 52, step: 1327, loss: 0.29803866147994995, mean loss: 0.34141748138568334
Epoch: 52, step: 1328, loss: 0.31668099761009216, mean loss: 0.3414171576817461
Epoch: 52, step: 1329, loss: 0.3394664227962494, mean loss: 0.3414171321545812
Epoch: 52, step: 1330, loss: 0.30785560607910156, mean loss: 0.34141669297681027
Epoch: 52, step: 1331, loss: 0.30805811285972595, mean loss: 0.34141625646045176
Epoch: 52, step: 1332, loss: 0.35064923763275146, mean loss: 0.34141637727778174
Epoch: 52, step: 1333, loss: 0.35226136445999146, mean loss: 0.3414165191870118
Epoch: 52, step: 1334, loss: 0.33407062292099, mean loss: 0.34141642306547426
Epoch: 52, step: 1335, loss: 0.32433781027793884, mean loss: 0.3414161995936226
Epoch: 52, step: 1336, loss: 0.34063684940338135, mean loss: 0.3414161893960408
Epoch: 52, step: 1337, loss: 0.31666508316993713, mean loss: 0.34141586553889497
Epoch: 52, step: 1338, loss: 0.2973252832889557, mean loss: 0.34141528864091064
Epoch: 52, step: 1339, loss: 0.3222838342189789, mean loss: 0.34141503832094383
Epoch: 52, step: 1340, loss: 0.31050217151641846, mean loss: 0.34141463385579573
Epoch: 52, step: 1341, loss: 0.37576204538345337, mean loss: 0.34141508325278025
Epoch: 52, step: 1342, loss: 0.32949942350387573, mean loss: 0.3414149273519056
Epoch: 52, step: 1343, loss: 0.3243251144886017, mean loss: 0.3414147037569079
Epoch: 52, step: 1344, loss: 0.3166767358779907, mean loss: 0.3414143801013157
Epoch: 52, step: 1345, loss: 0.3588886260986328, mean loss: 0.34141460872007173
Epoch: 52, step: 1346, loss: 0.311105877161026, mean loss: 0.3414142121905819
Epoch: 52, step: 1347, loss: 0.308265745639801, mean loss: 0.3414137785144796
Epoch: 52, step: 1348, loss: 0.33855700492858887, mean loss: 0.3414137411402553
Epoch: 52, step: 1349, loss: 0.324374794960022, mean loss: 0.341413518228272
Epoch: 52, step: 1350, loss: 0.34103989601135254, mean loss: 0.3414135133404239
Epoch: 52, step: 1351, loss: 0.3486647605895996, mean loss: 0.34141360820237115
Epoch: 52, step: 1352, loss: 0.3468568027019501, mean loss: 0.3414136794101589
Epoch: 52, step: 1353, loss: 0.3163616359233856, mean loss: 0.3414133516839941
Epoch: 52, step: 1354, loss: 0.3197369873523712, mean loss: 0.34141306812154454
Epoch: 52, step: 1355, loss: 0.3829730749130249, mean loss: 0.34141361178758495
Epoch: 52, step: 1356, loss: 0.31843191385269165, mean loss: 0.3414133111570933
Epoch: 52, step: 1357, loss: 0.3575042486190796, mean loss: 0.34141352164472455
Epoch: 52, step: 1358, loss: 0.33659303188323975, mean loss: 0.3414134585881002
Epoch: 52, step: 1359, loss: 0.3373517096042633, mean loss: 0.34141340545722715
Epoch: 52, step: 1360, loss: 0.3298906683921814, mean loss: 0.3414132547327302
Epoch: 52, step: 1361, loss: 0.3024495840072632, mean loss: 0.3414127450705886
Epoch: 52, step: 1362, loss: 0.3386636972427368, mean loss: 0.34141270911229077
Epoch: 52, step: 1363, loss: 0.39138731360435486, mean loss: 0.3414133627852423
Epoch: 52, step: 1364, loss: 0.3316194713115692, mean loss: 0.3414132346818131
Epoch: 52, step: 1365, loss: 0.3381097912788391, mean loss: 0.34141319147356497
Epoch: 52, step: 1366, loss: 0.356661856174469, mean loss: 0.34141339091983663
Epoch: 52, step: 1367, loss: 0.33363455533981323, mean loss: 0.34141328917719277
Epoch: 52, step: 1368, loss: 0.3510429263114929, mean loss: 0.3414134151255969
Epoch: 52, step: 1369, loss: 0.33867523074150085, mean loss: 0.341413379312675
Epoch: 52, step: 1370, loss: 0.3271484375, mean loss: 0.34141319274285575
Epoch: 52, step: 1371, loss: 0.3929760456085205, mean loss: 0.34141386711969157
Epoch: 52, step: 1372, loss: 0.3110443651676178, mean loss: 0.34141346993024924
Epoch: 52, step: 1373, loss: 0.3144820034503937, mean loss: 0.3414131177099767
Epoch: 52, step: 1374, loss: 0.30121609568595886, mean loss: 0.34141259200444557
Epoch: 52, step: 1375, loss: 0.3350207209587097, mean loss: 0.3414125084112377
Epoch: 52, step: 1376, loss: 0.283297598361969, mean loss: 0.34141174839148947
Epoch: 52, step: 1377, loss: 0.32771506905555725, mean loss: 0.3414115692703201
Epoch: 52, step: 1378, loss: 0.3861773610115051, mean loss: 0.3414121546966052
Epoch: 52, step: 1379, loss: 0.38636985421180725, mean loss: 0.3414127426248826
Epoch: 52, step: 1380, loss: 0.3149791359901428, mean loss: 0.3414123969474625
Epoch: 52, step: 1381, loss: 0.33107632398605347, mean loss: 0.34141226178239176
Epoch: 52, step: 1382, loss: 0.3205634355545044, mean loss: 0.34141198914536297
Epoch: 52, step: 1383, loss: 0.32061856985092163, mean loss: 0.3414117172364382
Epoch: 52, step: 1384, loss: 0.29206588864326477, mean loss: 0.3414110719651844
Epoch: 52, step: 1385, loss: 0.34054067730903625, mean loss: 0.3414110605836082
Epoch: 52, step: 1386, loss: 0.33853858709335327, mean loss: 0.3414110230226603
Epoch: 52, step: 1387, loss: 0.32579782605171204, mean loss: 0.3414108188645326
Epoch: 52, step: 1388, loss: 0.3397052586078644, mean loss: 0.3414107965629222
Epoch: 52, step: 1389, loss: 0.3457314074039459, mean loss: 0.3414108530577422
Epoch: 52, step: 1390, loss: 0.3362373411655426, mean loss: 0.3414107854115662
Epoch: 52, step: 1391, loss: 0.32610756158828735, mean loss: 0.34141058531711244
Epoch: 52, step: 1392, loss: 0.3895253837108612, mean loss: 0.34141121442497446
Epoch: 52, step: 1393, loss: 0.3740982711315155, mean loss: 0.34141164180732203
Epoch: 52, step: 1394, loss: 0.29746657609939575, mean loss: 0.3414110672343358
Epoch: 52, step: 1395, loss: 0.30347275733947754, mean loss: 0.34141057120497154
Epoch: 52, step: 1396, loss: 0.3160228729248047, mean loss: 0.34141023927455016
Epoch: 52, step: 1397, loss: 0.333810031414032, mean loss: 0.34141013990724295
Epoch: 52, step: 1398, loss: 0.34661734104156494, mean loss: 0.3414102079868007
Epoch: 52, step: 1399, loss: 0.34843572974205017, mean loss: 0.34141029983809446
Epoch: 52, step: 1400, loss: 0.29297834634780884, mean loss: 0.34140966664961653
Epoch: 52, step: 1401, loss: 0.3496575355529785, mean loss: 0.3414097744789917
Epoch: 52, step: 1402, loss: 0.29382580518722534, mean loss: 0.34140915239313463
Epoch: 52, step: 1403, loss: 0.3095971643924713, mean loss: 0.3414087365066628
Epoch: 52, step: 1404, loss: 0.31134745478630066, mean loss: 0.3414083435127716
Epoch: 52, step: 1405, loss: 0.30930644273757935, mean loss: 0.3414079238471668
Epoch: 52, step: 1406, loss: 0.3227960169315338, mean loss: 0.3414076805383634
Epoch: 52, step: 1407, loss: 0.35718998312950134, mean loss: 0.34140788685376017
Epoch: 52, step: 1408, loss: 0.31289684772491455, mean loss: 0.3414075141458222
Epoch: 52, step: 1409, loss: 0.3451937437057495, mean loss: 0.34140756364031305
Epoch: 52, step: 1410, loss: 0.34288254380226135, mean loss: 0.34140758292135154
Epoch: 52, step: 1411, loss: 0.3135392963886261, mean loss: 0.3414072186300243
Epoch: 52, step: 1412, loss: 0.30564385652542114, mean loss: 0.34140675114120583
Epoch: 52, step: 1413, loss: 0.2994459569454193, mean loss: 0.34140620264843186
Epoch: 52, step: 1414, loss: 0.3268266022205353, mean loss: 0.3414060120728933
Epoch: 52, step: 1415, loss: 0.3032098114490509, mean loss: 0.3414055128022588
Epoch: 52, step: 1416, loss: 0.301746129989624, mean loss: 0.3414049944128357
Epoch: 52, step: 1417, loss: 0.28903862833976746, mean loss: 0.3414043099388589
Epoch: 52, step: 1418, loss: 0.34827131032943726, mean loss: 0.34140439969535685
Epoch: 52, step: 1419, loss: 0.32979288697242737, mean loss: 0.34140424792674806
Epoch: 52, step: 1420, loss: 0.31171685457229614, mean loss: 0.3414038599018967
Epoch: 52, step: 1421, loss: 0.32582685351371765, mean loss: 0.3414036563075118
Epoch: 52, step: 1422, loss: 0.3352179229259491, mean loss: 0.34140357545987704
Epoch: 52, step: 1423, loss: 0.29893845319747925, mean loss: 0.3414030204473004
Epoch: 52, step: 1424, loss: 0.3276863694190979, mean loss: 0.34140284117513714
Epoch: 52, step: 1425, loss: 0.34562650322914124, mean loss: 0.34140289637630367
Epoch: 52, step: 1426, loss: 0.3381081521511078, mean loss: 0.34140285331619485
Epoch: 52, step: 1427, loss: 0.3463967740535736, mean loss: 0.341402918582554
Epoch: 52, step: 1428, loss: 0.3186284601688385, mean loss: 0.3414026209433573
Epoch: 52, step: 1429, loss: 0.3076469898223877, mean loss: 0.34140217979707643
Epoch: 52, step: 1430, loss: 0.3173755407333374, mean loss: 0.34140186580134907
Epoch: 52, step: 1431, loss: 0.3414154648780823, mean loss: 0.3414018659790683
Epoch: 52, step: 1432, loss: 0.3191462755203247, mean loss: 0.34140157513615643
Epoch: 52, step: 1433, loss: 0.36053168773651123, mean loss: 0.34140182513109385
Epoch: 52, step: 1434, loss: 0.3478211760520935, mean loss: 0.3414019090189566
Epoch: 52, step: 1435, loss: 0.29897573590278625, mean loss: 0.34140135460239296
Epoch: 52, step: 1436, loss: 0.3290831744670868, mean loss: 0.3414011936330348
Epoch: 52, step: 1437, loss: 0.32152432203292847, mean loss: 0.34140093389292553
Epoch: 52, step: 1438, loss: 0.3498058021068573, mean loss: 0.34140104372172075
Epoch: 52, step: 1439, loss: 0.3561362028121948, mean loss: 0.34140123626770513
Epoch: 52, step: 1440, loss: 0.3366508185863495, mean loss: 0.34140117419427307
Epoch: 52, step: 1441, loss: 0.3665928840637207, mean loss: 0.3414015033685821
Epoch: 52, step: 1442, loss: 0.29970991611480713, mean loss: 0.3414009586012688
Epoch: 52, step: 1443, loss: 0.36297333240509033, mean loss: 0.34140124047517517
Valid: 52, mean loss: 0.18552004297574362
Epoch: 53, step: 0, loss: 0.32485049962997437, mean loss: 0.34140102421890867
Epoch: 53, step: 1, loss: 0.3710826635360718, mean loss: 0.3414014120418281
Epoch: 53, step: 2, loss: 0.3356795310974121, mean loss: 0.34140133728020344
Epoch: 53, step: 3, loss: 0.302231103181839, mean loss: 0.34140082549184114
Epoch: 53, step: 4, loss: 0.3258475661277771, mean loss: 0.34140062227954693
Epoch: 53, step: 5, loss: 0.30952244997024536, mean loss: 0.34140020577830166
Epoch: 53, step: 6, loss: 0.3370988965034485, mean loss: 0.3414001495806864
Epoch: 53, step: 7, loss: 0.33108335733413696, mean loss: 0.3414000147911352
Epoch: 53, step: 8, loss: 0.3225320279598236, mean loss: 0.3413997682829
Epoch: 53, step: 9, loss: 0.3398686647415161, mean loss: 0.3413997482794569
Epoch: 53, step: 10, loss: 0.29918405413627625, mean loss: 0.3413991967503276
Epoch: 53, step: 11, loss: 0.30593961477279663, mean loss: 0.34139873349282895
Epoch: 53, step: 12, loss: 0.36218783259391785, mean loss: 0.3413990050859977
Epoch: 53, step: 13, loss: 0.34698644280433655, mean loss: 0.3413990780805071
Epoch: 53, step: 14, loss: 0.32643452286720276, mean loss: 0.3413988825855143
Epoch: 53, step: 15, loss: 0.3167172968387604, mean loss: 0.3413985601527173
Epoch: 53, step: 16, loss: 0.341751366853714, mean loss: 0.3413985647616175
Epoch: 53, step: 17, loss: 0.32418981194496155, mean loss: 0.34139833995753105
Epoch: 53, step: 18, loss: 0.3293442726135254, mean loss: 0.34139818249299964
Epoch: 53, step: 19, loss: 0.32326987385749817, mean loss: 0.34139794568261406
Epoch: 53, step: 20, loss: 0.3347463309764862, mean loss: 0.34139785879359985
Epoch: 53, step: 21, loss: 0.33263689279556274, mean loss: 0.34139774435195086
Epoch: 53, step: 22, loss: 0.30595120787620544, mean loss: 0.34139728133142344
Epoch: 53, step: 23, loss: 0.30924224853515625, mean loss: 0.3413968613116628
Epoch: 53, step: 24, loss: 0.32387658953666687, mean loss: 0.34139663245902
Epoch: 53, step: 25, loss: 0.34595850110054016, mean loss: 0.3413966920461127
Epoch: 53, step: 26, loss: 0.37580668926239014, mean loss: 0.3413971415033577
Epoch: 53, step: 27, loss: 0.31762832403182983, mean loss: 0.3413968310433594
Epoch: 53, step: 28, loss: 0.347439706325531, mean loss: 0.34139690997225636
Epoch: 53, step: 29, loss: 0.3227290213108063, mean loss: 0.34139666614517944
Epoch: 53, step: 30, loss: 0.3629564642906189, mean loss: 0.341396947740704
Epoch: 53, step: 31, loss: 0.39225882291793823, mean loss: 0.34139761204605873
Epoch: 53, step: 32, loss: 0.31382235884666443, mean loss: 0.3413972518912465
Epoch: 53, step: 33, loss: 0.3843487501144409, mean loss: 0.34139781286476245
Epoch: 53, step: 34, loss: 0.36714139580726624, mean loss: 0.34139814908771676
Epoch: 53, step: 35, loss: 0.3047730326652527, mean loss: 0.3413976707532112
Epoch: 53, step: 36, loss: 0.3384080231189728, mean loss: 0.34139763170806714
Epoch: 53, step: 37, loss: 0.3368551731109619, mean loss: 0.341397572383807
Epoch: 53, step: 38, loss: 0.32785147428512573, mean loss: 0.3413973954748193
Epoch: 53, step: 39, loss: 0.33349940180778503, mean loss: 0.3413972923301493
Epoch: 53, step: 40, loss: 0.331203818321228, mean loss: 0.34139715920915353
Epoch: 53, step: 41, loss: 0.37679895758628845, mean loss: 0.3413976215305469
Epoch: 53, step: 42, loss: 0.2911621332168579, mean loss: 0.3413969655006636
Epoch: 53, step: 43, loss: 0.30795449018478394, mean loss: 0.3413965287779918
Epoch: 53, step: 44, loss: 0.37128379940986633, mean loss: 0.3413969190684267
Epoch: 53, step: 45, loss: 0.3430575132369995, mean loss: 0.3413969407534298
Epoch: 53, step: 46, loss: 0.38390570878982544, mean loss: 0.34139749585036283
Epoch: 53, step: 47, loss: 0.3698337972164154, mean loss: 0.34139786717840365
Epoch: 53, step: 48, loss: 0.37277916073799133, mean loss: 0.3413982769575076
Epoch: 53, step: 49, loss: 0.3393821120262146, mean loss: 0.3413982506306301
Epoch: 53, step: 50, loss: 0.3272843360900879, mean loss: 0.34139806633497
Epoch: 53, step: 51, loss: 0.3492903709411621, mean loss: 0.3413981693891929
Epoch: 53, step: 52, loss: 0.3686649799346924, mean loss: 0.3413985254224963
Epoch: 53, step: 53, loss: 0.3281247913837433, mean loss: 0.3413983521044742
Epoch: 53, step: 54, loss: 0.3372126817703247, mean loss: 0.34139829745198313
Epoch: 53, step: 55, loss: 0.3024158775806427, mean loss: 0.34139778846337043
Epoch: 53, step: 56, loss: 0.3128032088279724, mean loss: 0.34139741511237176
Epoch: 53, step: 57, loss: 0.3306502401828766, mean loss: 0.34139727479150833
Epoch: 53, step: 58, loss: 0.2792678773403168, mean loss: 0.34139646360745995
Epoch: 53, step: 59, loss: 0.37964195013046265, mean loss: 0.3413969629479462
Epoch: 53, step: 60, loss: 0.336228609085083, mean loss: 0.34139689546979723
Epoch: 53, step: 61, loss: 0.31234240531921387, mean loss: 0.34139651613864663
Epoch: 53, step: 62, loss: 0.3116329610347748, mean loss: 0.34139612755512155
Epoch: 53, step: 63, loss: 0.29826751351356506, mean loss: 0.3413955644889818
Epoch: 53, step: 64, loss: 0.35633811354637146, mean loss: 0.341395759569064
Epoch: 53, step: 65, loss: 0.3416275978088379, mean loss: 0.3413957625957519
Epoch: 53, step: 66, loss: 0.37600454688072205, mean loss: 0.3413962144134556
Epoch: 53, step: 67, loss: 0.43328630924224854, mean loss: 0.34139741402304863
Epoch: 53, step: 68, loss: 0.3494679629802704, mean loss: 0.3413975193813202
Epoch: 53, step: 69, loss: 0.32532015442848206, mean loss: 0.3413973094995292
Epoch: 53, step: 70, loss: 0.3247341215610504, mean loss: 0.3413970919729579
Epoch: 53, step: 71, loss: 0.3457559049129486, mean loss: 0.34139714887354977
Epoch: 53, step: 72, loss: 0.2927253544330597, mean loss: 0.3413965135130062
Epoch: 53, step: 73, loss: 0.3164217472076416, mean loss: 0.3413961874972071
Epoch: 53, step: 74, loss: 0.34725555777549744, mean loss: 0.3413962639833021
Epoch: 53, step: 75, loss: 0.3406529724597931, mean loss: 0.3413962542807707
Epoch: 53, step: 76, loss: 0.36280694603919983, mean loss: 0.34139653376088086
Epoch: 53, step: 77, loss: 0.3223022222518921, mean loss: 0.3413962845204226
Epoch: 53, step: 78, loss: 0.32193100452423096, mean loss: 0.3413960304409823
Epoch: 53, step: 79, loss: 0.36301475763320923, mean loss: 0.3413963126255904
Epoch: 53, step: 80, loss: 0.3581087589263916, mean loss: 0.3413965307667192
Epoch: 53, step: 81, loss: 0.2818739712238312, mean loss: 0.34139575385180104
Epoch: 53, step: 82, loss: 0.31315141916275024, mean loss: 0.3413953851989956
Epoch: 53, step: 83, loss: 0.31933853030204773, mean loss: 0.34139509731063156
Epoch: 53, step: 84, loss: 0.3302285373210907, mean loss: 0.34139495156543154
Epoch: 53, step: 85, loss: 0.32808801531791687, mean loss: 0.34139477788644945
Epoch: 53, step: 86, loss: 0.34871336817741394, mean loss: 0.3413948734057109
Epoch: 53, step: 87, loss: 0.36174002289772034, mean loss: 0.34139513893885487
Epoch: 53, step: 88, loss: 0.2920275926589966, mean loss: 0.34139449463055455
Epoch: 53, step: 89, loss: 0.33238106966018677, mean loss: 0.34139437699560676
Epoch: 53, step: 90, loss: 0.32915252447128296, mean loss: 0.34139421722827157
Epoch: 53, step: 91, loss: 0.331397145986557, mean loss: 0.34139408675908123
Epoch: 53, step: 92, loss: 0.3513510823249817, mean loss: 0.3413942167035584
Epoch: 53, step: 93, loss: 0.3459872603416443, mean loss: 0.3413942766446181
Epoch: 53, step: 94, loss: 0.31127819418907166, mean loss: 0.3413938836228052
Epoch: 53, step: 95, loss: 0.33682772517204285, mean loss: 0.3413938240341633
Epoch: 53, step: 96, loss: 0.36655983328819275, mean loss: 0.34139415244780896
Epoch: 53, step: 97, loss: 0.3202088177204132, mean loss: 0.3413938759851347
Epoch: 53, step: 98, loss: 0.31615501642227173, mean loss: 0.34139354662939664
Epoch: 53, step: 99, loss: 0.3439255654811859, mean loss: 0.3413935796706699
Epoch: 53, step: 100, loss: 0.3306998014450073, mean loss: 0.3413934401253275
Epoch: 53, step: 101, loss: 0.315193772315979, mean loss: 0.3413930982448592
Epoch: 53, step: 102, loss: 0.3511587679386139, mean loss: 0.34139322567579405
Epoch: 53, step: 103, loss: 0.33562102913856506, mean loss: 0.34139315035614615
Epoch: 53, step: 104, loss: 0.3353685438632965, mean loss: 0.3413930717439028
Epoch: 53, step: 105, loss: 0.3365814685821533, mean loss: 0.341393008960386
Epoch: 53, step: 106, loss: 0.3642811179161072, mean loss: 0.34139330760871067
Epoch: 53, step: 107, loss: 0.3354785144329071, mean loss: 0.3413932304323905
Epoch: 53, step: 108, loss: 0.3221917748451233, mean loss: 0.3413929798947463
Epoch: 53, step: 109, loss: 0.3299117088317871, mean loss: 0.34139283009083904
Epoch: 53, step: 110, loss: 0.31068217754364014, mean loss: 0.34139242939341663
Epoch: 53, step: 111, loss: 0.3647027611732483, mean loss: 0.3413927335311414
Epoch: 53, step: 112, loss: 0.29403653740882874, mean loss: 0.341392115667013
Epoch: 53, step: 113, loss: 0.3126128315925598, mean loss: 0.3413917401838296
Epoch: 53, step: 114, loss: 0.298127681016922, mean loss: 0.3413911757252185
Epoch: 53, step: 115, loss: 0.36908406019210815, mean loss: 0.3413915370247236
Epoch: 53, step: 116, loss: 0.31458035111427307, mean loss: 0.3413911872329988
Epoch: 53, step: 117, loss: 0.3054933249950409, mean loss: 0.3413907188982012
Epoch: 53, step: 118, loss: 0.34436360001564026, mean loss: 0.341390757682837
Epoch: 53, step: 119, loss: 0.36756786704063416, mean loss: 0.3413910991887254
Epoch: 53, step: 120, loss: 0.33552688360214233, mean loss: 0.3413910226853193
Epoch: 53, step: 121, loss: 0.3158339262008667, mean loss: 0.341390689276802
Epoch: 53, step: 122, loss: 0.3417760729789734, mean loss: 0.341390694304311
Epoch: 53, step: 123, loss: 0.33689188957214355, mean loss: 0.34139063561608396
Epoch: 53, step: 124, loss: 0.32680144906044006, mean loss: 0.3413904452983497
Epoch: 53, step: 125, loss: 0.3795592188835144, mean loss: 0.3413909432082037
Epoch: 53, step: 126, loss: 0.31080812215805054, mean loss: 0.34139054426194754
Epoch: 53, step: 127, loss: 0.33605965971946716, mean loss: 0.341390474722624
Epoch: 53, step: 128, loss: 0.32621538639068604, mean loss: 0.34139027677205813
Epoch: 53, step: 129, loss: 0.3313780725002289, mean loss: 0.3413901461701397
Epoch: 53, step: 130, loss: 0.3331843316555023, mean loss: 0.34139003913265725
Epoch: 53, step: 131, loss: 0.3161584734916687, mean loss: 0.3413897100138317
Epoch: 53, step: 132, loss: 0.3455673158168793, mean loss: 0.3413897645055268
Epoch: 53, step: 133, loss: 0.3083903193473816, mean loss: 0.3413893340742384
Epoch: 53, step: 134, loss: 0.3422737419605255, mean loss: 0.3413893456099433
Epoch: 53, step: 135, loss: 0.3165535032749176, mean loss: 0.34138902166980745
Epoch: 53, step: 136, loss: 0.33109110593795776, mean loss: 0.34138888735325534
Epoch: 53, step: 137, loss: 0.3440069258213043, mean loss: 0.34138892150009853
Epoch: 53, step: 138, loss: 0.2890889644622803, mean loss: 0.3413882393653013
Epoch: 53, step: 139, loss: 0.30019232630729675, mean loss: 0.34138770206468233
Epoch: 53, step: 140, loss: 0.3739168345928192, mean loss: 0.3413881263226679
Epoch: 53, step: 141, loss: 0.33131518959999084, mean loss: 0.34138799494910294
Epoch: 53, step: 142, loss: 0.3084944486618042, mean loss: 0.3413875659494774
Epoch: 53, step: 143, loss: 0.36538806557655334, mean loss: 0.34138787896136674
Epoch: 53, step: 144, loss: 0.36117368936538696, mean loss: 0.3413881370023752
Epoch: 53, step: 145, loss: 0.31445470452308655, mean loss: 0.34138778574865863
Epoch: 53, step: 146, loss: 0.3265177011489868, mean loss: 0.3413875918222303
Epoch: 53, step: 147, loss: 0.35810747742652893, mean loss: 0.34138780986977335
Epoch: 53, step: 148, loss: 0.3524637222290039, mean loss: 0.3413879543111912
Epoch: 53, step: 149, loss: 0.3173203766345978, mean loss: 0.3413876404490374
Epoch: 53, step: 150, loss: 0.37294912338256836, mean loss: 0.3413880520328687
Epoch: 53, step: 151, loss: 0.3332134187221527, mean loss: 0.34138794543131806
Epoch: 53, step: 152, loss: 0.3122464418411255, mean loss: 0.3413875654156228
Epoch: 53, step: 153, loss: 0.37029266357421875, mean loss: 0.3413879423435909
Epoch: 53, step: 154, loss: 0.3671664893627167, mean loss: 0.34138827849635495
Epoch: 53, step: 155, loss: 0.3414701819419861, mean loss: 0.3413882795643636
Epoch: 53, step: 156, loss: 0.34734246134757996, mean loss: 0.34138835720498717
Epoch: 53, step: 157, loss: 0.37184321880340576, mean loss: 0.3413887543214508
Epoch: 53, step: 158, loss: 0.316550076007843, mean loss: 0.3413884304414869
Epoch: 53, step: 159, loss: 0.2997055649757385, mean loss: 0.34138788693153194
Epoch: 53, step: 160, loss: 0.3371255397796631, mean loss: 0.34138783135478895
Epoch: 53, step: 161, loss: 0.3262813985347748, mean loss: 0.341387634384585
Epoch: 53, step: 162, loss: 0.3376512825489044, mean loss: 0.3413875856675652
Epoch: 53, step: 163, loss: 0.30744343996047974, mean loss: 0.3413871430871737
Epoch: 53, step: 164, loss: 0.3473626375198364, mean loss: 0.34138722099758
Epoch: 53, step: 165, loss: 0.3506981432437897, mean loss: 0.3413873423947774
Epoch: 53, step: 166, loss: 0.31448352336883545, mean loss: 0.34138699162333286
Epoch: 53, step: 167, loss: 0.3087143301963806, mean loss: 0.3413865656433925
Epoch: 53, step: 168, loss: 0.3351786136627197, mean loss: 0.34138648470635147
Epoch: 53, step: 169, loss: 0.3275485336780548, mean loss: 0.3413863042944844
Epoch: 53, step: 170, loss: 0.3720129728317261, mean loss: 0.3413867035835414
Epoch: 53, step: 171, loss: 0.3156460225582123, mean loss: 0.3413863679989431
Epoch: 53, step: 172, loss: 0.33246123790740967, mean loss: 0.34138625164238107
Epoch: 53, step: 173, loss: 0.37164103984832764, mean loss: 0.341386646067696
Epoch: 53, step: 174, loss: 0.3503599464893341, mean loss: 0.3413867630492025
Epoch: 53, step: 175, loss: 0.32755717635154724, mean loss: 0.3413865827604882
Epoch: 53, step: 176, loss: 0.2856525778770447, mean loss: 0.3413858561963969
Epoch: 53, step: 177, loss: 0.31830865144729614, mean loss: 0.3413855553594167
Epoch: 53, step: 178, loss: 0.2992061376571655, mean loss: 0.34138500551105466
Epoch: 53, step: 179, loss: 0.3433064818382263, mean loss: 0.3413850305589784
Epoch: 53, step: 180, loss: 0.3315436840057373, mean loss: 0.34138490227111906
Epoch: 53, step: 181, loss: 0.32641521096229553, mean loss: 0.3413847071347514
Epoch: 53, step: 182, loss: 0.35360705852508545, mean loss: 0.3413848664562842
Epoch: 53, step: 183, loss: 0.3384803235530853, mean loss: 0.34138482859530467
Epoch: 53, step: 184, loss: 0.3263198733329773, mean loss: 0.3413846322248097
Epoch: 53, step: 185, loss: 0.2945815622806549, mean loss: 0.34138402215846353
Epoch: 53, step: 186, loss: 0.36551690101623535, mean loss: 0.34138433672042157
Epoch: 53, step: 187, loss: 0.33540821075439453, mean loss: 0.34138425882514045
Epoch: 53, step: 188, loss: 0.3367224335670471, mean loss: 0.34138419806178677
Epoch: 53, step: 189, loss: 0.3149566650390625, mean loss: 0.34138385360344337
Epoch: 53, step: 190, loss: 0.3195033073425293, mean loss: 0.3413835684145657
Epoch: 53, step: 191, loss: 0.34367039799690247, mean loss: 0.34138359822048797
Epoch: 53, step: 192, loss: 0.29922962188720703, mean loss: 0.3413830488040483
Epoch: 53, step: 193, loss: 0.3184720575809479, mean loss: 0.3413827501961289
Epoch: 53, step: 194, loss: 0.3206109404563904, mean loss: 0.3413824794725278
Epoch: 53, step: 195, loss: 0.3483718931674957, mean loss: 0.3413825705659187
Epoch: 53, step: 196, loss: 0.35401803255081177, mean loss: 0.34138273524240326
Epoch: 53, step: 197, loss: 0.31676289439201355, mean loss: 0.3413824143791053
Epoch: 53, step: 198, loss: 0.34051719307899475, mean loss: 0.34138240310307216
Epoch: 53, step: 199, loss: 0.3566865622997284, mean loss: 0.3413826025525743
Epoch: 53, step: 200, loss: 0.3665245473384857, mean loss: 0.34138293020749183
Epoch: 53, step: 201, loss: 0.3158268630504608, mean loss: 0.34138259715998803
Epoch: 53, step: 202, loss: 0.36950960755348206, mean loss: 0.3413829637073314
Epoch: 53, step: 203, loss: 0.3061247766017914, mean loss: 0.34138250423345856
Epoch: 53, step: 204, loss: 0.33419933915138245, mean loss: 0.34138241062587577
Epoch: 53, step: 205, loss: 0.3319122791290283, mean loss: 0.3413822872172451
Epoch: 53, step: 206, loss: 0.3443585932254791, mean loss: 0.3413823260020352
Epoch: 53, step: 207, loss: 0.3264116942882538, mean loss: 0.34138213091952657
Epoch: 53, step: 208, loss: 0.3784698247909546, mean loss: 0.34138261420348004
Epoch: 53, step: 209, loss: 0.32131004333496094, mean loss: 0.3413823526443486
Epoch: 53, step: 210, loss: 0.35111936926841736, mean loss: 0.34138247952258666
Epoch: 53, step: 211, loss: 0.3442803621292114, mean loss: 0.3413825172829667
Epoch: 53, step: 212, loss: 0.33419251441955566, mean loss: 0.34138242359604426
Epoch: 53, step: 213, loss: 0.3381909132003784, mean loss: 0.3413823820106796
Epoch: 53, step: 214, loss: 0.34589487314224243, mean loss: 0.34138244080765057
Epoch: 53, step: 215, loss: 0.3167557120323181, mean loss: 0.3413821199298586
Epoch: 53, step: 216, loss: 0.3570033311843872, mean loss: 0.34138232346620767
Epoch: 53, step: 217, loss: 0.30783817172050476, mean loss: 0.3413818864088559
Epoch: 53, step: 218, loss: 0.34022682905197144, mean loss: 0.34138187135944476
Epoch: 53, step: 219, loss: 0.30086565017700195, mean loss: 0.3413813434745534
Epoch: 53, step: 220, loss: 0.37117889523506165, mean loss: 0.34138173170109515
Epoch: 53, step: 221, loss: 0.3444887101650238, mean loss: 0.3413817721807895
Epoch: 53, step: 222, loss: 0.30780136585235596, mean loss: 0.3413813346795671
Epoch: 53, step: 223, loss: 0.33347436785697937, mean loss: 0.3413812316652513
Epoch: 53, step: 224, loss: 0.35513293743133545, mean loss: 0.3413814108242305
Epoch: 53, step: 225, loss: 0.38133832812309265, mean loss: 0.3413819313812708
Epoch: 53, step: 226, loss: 0.3098681569099426, mean loss: 0.34138152082648937
Epoch: 53, step: 227, loss: 0.3173585832118988, mean loss: 0.3413812078648216
Epoch: 53, step: 228, loss: 0.3323516249656677, mean loss: 0.3413810902323924
Epoch: 53, step: 229, loss: 0.3638207018375397, mean loss: 0.34138138255947614
Epoch: 53, step: 230, loss: 0.31796061992645264, mean loss: 0.34138107745463875
Epoch: 53, step: 231, loss: 0.3688477873802185, mean loss: 0.341381435261813
Epoch: 53, step: 232, loss: 0.3325035572052002, mean loss: 0.3413813196117374
Epoch: 53, step: 233, loss: 0.3019793629646301, mean loss: 0.3413808063381964
Epoch: 53, step: 234, loss: 0.33548814058303833, mean loss: 0.34138072957779475
Epoch: 53, step: 235, loss: 0.33443307876586914, mean loss: 0.34138063907588234
Epoch: 53, step: 236, loss: 0.32820820808410645, mean loss: 0.34138046749059414
Epoch: 53, step: 237, loss: 0.3127068281173706, mean loss: 0.3413800939900161
Epoch: 53, step: 238, loss: 0.3382858633995056, mean loss: 0.3413800536853361
Epoch: 53, step: 239, loss: 0.30868345499038696, mean loss: 0.3413796277931007
Epoch: 53, step: 240, loss: 0.3017692565917969, mean loss: 0.34137911185167336
Epoch: 53, step: 241, loss: 0.32663702964782715, mean loss: 0.3413789198324715
Epoch: 53, step: 242, loss: 0.31506961584091187, mean loss: 0.34137857715185943
Epoch: 53, step: 243, loss: 0.3294598460197449, mean loss: 0.3413784219115352
Epoch: 53, step: 244, loss: 0.35050126910209656, mean loss: 0.34137854073419294
Epoch: 53, step: 245, loss: 0.31523597240448, mean loss: 0.34137820023863
Epoch: 53, step: 246, loss: 0.29378068447113037, mean loss: 0.34137758030979837
Epoch: 53, step: 247, loss: 0.32258597016334534, mean loss: 0.3413773355636386
Epoch: 53, step: 248, loss: 0.3717183470726013, mean loss: 0.3413777307266543
Epoch: 53, step: 249, loss: 0.3321729898452759, mean loss: 0.34137761084516016
Epoch: 53, step: 250, loss: 0.3344708979129791, mean loss: 0.3413775208940911
Epoch: 53, step: 251, loss: 0.2951797544956207, mean loss: 0.3413769192353289
Epoch: 53, step: 252, loss: 0.33717575669288635, mean loss: 0.34137686452200544
Epoch: 53, step: 253, loss: 0.3771589696407318, mean loss: 0.34137733051978003
Epoch: 53, step: 254, loss: 0.32214927673339844, mean loss: 0.34137708011210965
Epoch: 53, step: 255, loss: 0.3823728859424591, mean loss: 0.34137761399508393
Epoch: 53, step: 256, loss: 0.29526951909065247, mean loss: 0.34137701354326266
Epoch: 53, step: 257, loss: 0.33246666193008423, mean loss: 0.3413768975079506
Epoch: 53, step: 258, loss: 0.3274781107902527, mean loss: 0.34137671651295487
Epoch: 53, step: 259, loss: 0.35430672764778137, mean loss: 0.3413768848900141
Epoch: 53, step: 260, loss: 0.32873764634132385, mean loss: 0.34137672030159394
Epoch: 53, step: 261, loss: 0.3339707553386688, mean loss: 0.34137662386222417
Epoch: 53, step: 262, loss: 0.33406153321266174, mean loss: 0.3413765286074465
Epoch: 53, step: 263, loss: 0.30320456624031067, mean loss: 0.34137603155079815
Epoch: 53, step: 264, loss: 0.3399900794029236, mean loss: 0.3413760135038413
Epoch: 53, step: 265, loss: 0.3510228991508484, mean loss: 0.3413761391176027
Epoch: 53, step: 266, loss: 0.31557121872901917, mean loss: 0.34137580311166005
Epoch: 53, step: 267, loss: 0.3282772898674011, mean loss: 0.34137563255810216
Epoch: 53, step: 268, loss: 0.3053297996520996, mean loss: 0.3413751632174307
Epoch: 53, step: 269, loss: 0.3742544651031494, mean loss: 0.34137559132219214
Epoch: 53, step: 270, loss: 0.33321860432624817, mean loss: 0.34137548511557264
Epoch: 53, step: 271, loss: 0.3547888994216919, mean loss: 0.34137565976030865
Epoch: 53, step: 272, loss: 0.30585139989852905, mean loss: 0.341375197234954
Epoch: 53, step: 273, loss: 0.3118152320384979, mean loss: 0.34137481236964146
Epoch: 53, step: 274, loss: 0.30963170528411865, mean loss: 0.34137439908560374
Epoch: 53, step: 275, loss: 0.33773186802864075, mean loss: 0.3413743516617539
Epoch: 53, step: 276, loss: 0.3373282849788666, mean loss: 0.34137429898476707
Epoch: 53, step: 277, loss: 0.3284360468387604, mean loss: 0.3413741305398752
Epoch: 53, step: 278, loss: 0.3513140380382538, mean loss: 0.34137425994721915
Epoch: 53, step: 279, loss: 0.3115614056587219, mean loss: 0.3413738718196572
Epoch: 53, step: 280, loss: 0.3211579918861389, mean loss: 0.34137360863660315
Epoch: 53, step: 281, loss: 0.37807732820510864, mean loss: 0.3413740864625147
Epoch: 53, step: 282, loss: 0.371911883354187, mean loss: 0.3413744840124319
Epoch: 53, step: 283, loss: 0.32725614309310913, mean loss: 0.34137430021815834
Epoch: 53, step: 284, loss: 0.3529262840747833, mean loss: 0.3413744506013269
Epoch: 53, step: 285, loss: 0.3280831575393677, mean loss: 0.3413742775781674
Epoch: 53, step: 286, loss: 0.3034217059612274, mean loss: 0.34137378352628417
Epoch: 53, step: 287, loss: 0.2975744903087616, mean loss: 0.34137321337146487
Epoch: 53, step: 288, loss: 0.3472875654697418, mean loss: 0.3413732903602062
Epoch: 53, step: 289, loss: 0.3022928535938263, mean loss: 0.34137278164607787
Epoch: 53, step: 290, loss: 0.34147363901138306, mean loss: 0.34137278295893164
Epoch: 53, step: 291, loss: 0.3133685886859894, mean loss: 0.3413724184348991
Epoch: 53, step: 292, loss: 0.3320339322090149, mean loss: 0.3413722968795952
Epoch: 53, step: 293, loss: 0.33439916372299194, mean loss: 0.3413722061143184
Epoch: 53, step: 294, loss: 0.3593592643737793, mean loss: 0.3413724402384969
Epoch: 53, step: 295, loss: 0.33028852939605713, mean loss: 0.34137229596933927
Epoch: 53, step: 296, loss: 0.32576560974121094, mean loss: 0.3413720928339838
Epoch: 53, step: 297, loss: 0.33937719464302063, mean loss: 0.34137206686888955
Epoch: 53, step: 298, loss: 0.3330572247505188, mean loss: 0.3413719586463997
Epoch: 53, step: 299, loss: 0.35040155053138733, mean loss: 0.3413720761702424
Epoch: 53, step: 300, loss: 0.34331193566322327, mean loss: 0.3413721014179809
Epoch: 53, step: 301, loss: 0.33884161710739136, mean loss: 0.3413720684835468
Epoch: 53, step: 302, loss: 0.31501030921936035, mean loss: 0.3413717253878318
Epoch: 53, step: 303, loss: 0.3410320281982422, mean loss: 0.34137172096676366
Epoch: 53, step: 304, loss: 0.3204968571662903, mean loss: 0.34137144928952745
Epoch: 53, step: 305, loss: 0.37030714750289917, mean loss: 0.34137182587010234
Epoch: 53, step: 306, loss: 0.34172961115837097, mean loss: 0.3413718305264004
Epoch: 53, step: 307, loss: 0.3363093137741089, mean loss: 0.34137176464252805
Epoch: 53, step: 308, loss: 0.3535730242729187, mean loss: 0.3413719234283277
Epoch: 53, step: 309, loss: 0.3274081349372864, mean loss: 0.3413717417075436
Epoch: 53, step: 310, loss: 0.3563414216041565, mean loss: 0.34137193651617803
Epoch: 53, step: 311, loss: 0.34269410371780396, mean loss: 0.34137195372203927
Epoch: 53, step: 312, loss: 0.2968641221523285, mean loss: 0.34137137453235133
Epoch: 53, step: 313, loss: 0.30534857511520386, mean loss: 0.3413709057662553
Epoch: 53, step: 314, loss: 0.307524174451828, mean loss: 0.34137046532314996
Epoch: 53, step: 315, loss: 0.3169167637825012, mean loss: 0.34137014711445823
Epoch: 53, step: 316, loss: 0.30930349230766296, mean loss: 0.34136972984611635
Epoch: 53, step: 317, loss: 0.37142691016197205, mean loss: 0.3413701209610196
Epoch: 53, step: 318, loss: 0.3120307922363281, mean loss: 0.3413697391920286
Epoch: 53, step: 319, loss: 0.3298666775226593, mean loss: 0.3413695895139244
Epoch: 53, step: 320, loss: 0.3190317451953888, mean loss: 0.34136929885715994
Epoch: 53, step: 321, loss: 0.33415907621383667, mean loss: 0.3413692050400178
Epoch: 53, step: 322, loss: 0.372474730014801, mean loss: 0.3413696097700285
Epoch: 53, step: 323, loss: 0.30489692091941833, mean loss: 0.3413691352112582
Epoch: 53, step: 324, loss: 0.32288888096809387, mean loss: 0.34136889476140664
Epoch: 53, step: 325, loss: 0.3511539399623871, mean loss: 0.3413690220747013
Epoch: 53, step: 326, loss: 0.3096192181110382, mean loss: 0.34136860898314453
Epoch: 53, step: 327, loss: 0.32291048765182495, mean loss: 0.34136836883064214
Epoch: 53, step: 328, loss: 0.34299567341804504, mean loss: 0.3413683900026876
Epoch: 53, step: 329, loss: 0.35084351897239685, mean loss: 0.3413685132772442
Epoch: 53, step: 330, loss: 0.33352115750312805, mean loss: 0.34136841118188266
Epoch: 53, step: 331, loss: 0.3394838869571686, mean loss: 0.3413683866642382
Epoch: 53, step: 332, loss: 0.352018803358078, mean loss: 0.341368525224268
Epoch: 53, step: 333, loss: 0.3203286826610565, mean loss: 0.3413682515032137
Epoch: 53, step: 334, loss: 0.41464143991470337, mean loss: 0.34136920474957966
Epoch: 53, step: 335, loss: 0.3331266939640045, mean loss: 0.3413690975201632
Epoch: 53, step: 336, loss: 0.37201789021492004, mean loss: 0.3413694962347646
Epoch: 53, step: 337, loss: 0.34919795393943787, mean loss: 0.3413695980749845
Epoch: 53, step: 338, loss: 0.3034985363483429, mean loss: 0.34136910541765303
Epoch: 53, step: 339, loss: 0.3483615219593048, mean loss: 0.3413691963794667
Epoch: 53, step: 340, loss: 0.3283018171787262, mean loss: 0.34136902639287586
Epoch: 53, step: 341, loss: 0.279758483171463, mean loss: 0.34136822494448993
Epoch: 53, step: 342, loss: 0.31924518942832947, mean loss: 0.34136793716516617
Epoch: 53, step: 343, loss: 0.3136005699634552, mean loss: 0.3413675759683401
Epoch: 53, step: 344, loss: 0.310822457075119, mean loss: 0.3413671786437971
Epoch: 53, step: 345, loss: 0.358646422624588, mean loss: 0.34136740340567934
Epoch: 53, step: 346, loss: 0.3086501955986023, mean loss: 0.34136697783812764
Epoch: 53, step: 347, loss: 0.3631177842617035, mean loss: 0.34136726075704577
Epoch: 53, step: 348, loss: 0.3644634783267975, mean loss: 0.34136756117220124
Epoch: 53, step: 349, loss: 0.33078476786613464, mean loss: 0.34136742352238325
Epoch: 53, step: 350, loss: 0.2855505645275116, mean loss: 0.3413666975249717
Epoch: 53, step: 351, loss: 0.328878253698349, mean loss: 0.34136653509268633
Epoch: 53, step: 352, loss: 0.3286013603210449, mean loss: 0.3413663690632297
Epoch: 53, step: 353, loss: 0.3060323894023895, mean loss: 0.34136590949998463
Epoch: 53, step: 354, loss: 0.34155529737472534, mean loss: 0.3413659119631822
Epoch: 53, step: 355, loss: 0.3806712329387665, mean loss: 0.3413664231654631
Epoch: 53, step: 356, loss: 0.3352794051170349, mean loss: 0.34136634399915783
Epoch: 53, step: 357, loss: 0.3042598068714142, mean loss: 0.3413658614066604
Epoch: 53, step: 358, loss: 0.3168979287147522, mean loss: 0.34136554319083945
Epoch: 53, step: 359, loss: 0.32254454493522644, mean loss: 0.3413652984189743
Epoch: 53, step: 360, loss: 0.34104153513908386, mean loss: 0.34136529420840533
Epoch: 53, step: 361, loss: 0.3237142860889435, mean loss: 0.34136506465852995
Epoch: 53, step: 362, loss: 0.394320011138916, mean loss: 0.34136575332419716
Epoch: 53, step: 363, loss: 0.3301275372505188, mean loss: 0.341365607175944
Epoch: 53, step: 364, loss: 0.34325847029685974, mean loss: 0.34136563179150925
Epoch: 53, step: 365, loss: 0.29308193922042847, mean loss: 0.3413650038988128
Epoch: 53, step: 366, loss: 0.3205289840698242, mean loss: 0.3413647329457467
Epoch: 53, step: 367, loss: 0.2929622232913971, mean loss: 0.34136410352429475
Epoch: 53, step: 368, loss: 0.32985201478004456, mean loss: 0.3413639538241771
Epoch: 53, step: 369, loss: 0.3161012828350067, mean loss: 0.341363625319444
Epoch: 53, step: 370, loss: 0.32165050506591797, mean loss: 0.3413633689819766
Epoch: 53, step: 371, loss: 0.3137485682964325, mean loss: 0.3413630099005155
Epoch: 53, step: 372, loss: 0.335349440574646, mean loss: 0.3413629317057385
Epoch: 53, step: 373, loss: 0.3437406122684479, mean loss: 0.3413629626224493
Epoch: 53, step: 374, loss: 0.39041709899902344, mean loss: 0.3413636004595301
Epoch: 53, step: 375, loss: 0.33713817596435547, mean loss: 0.3413635455182432
Epoch: 53, step: 376, loss: 0.3742857277393341, mean loss: 0.3413639735849483
Epoch: 53, step: 377, loss: 0.32925182580947876, mean loss: 0.34136381610025485
Epoch: 53, step: 378, loss: 0.3400016725063324, mean loss: 0.34136379838960756
Epoch: 53, step: 379, loss: 0.2829732596874237, mean loss: 0.3413630392032816
Epoch: 53, step: 380, loss: 0.34264472126960754, mean loss: 0.34136305586733146
Epoch: 53, step: 381, loss: 0.30702054500579834, mean loss: 0.34136260936200263
Epoch: 53, step: 382, loss: 0.3103232979774475, mean loss: 0.3413622058085815
Epoch: 53, step: 383, loss: 0.3061257302761078, mean loss: 0.34136174769225286
Epoch: 53, step: 384, loss: 0.32949116826057434, mean loss: 0.3413615933625282
Epoch: 53, step: 385, loss: 0.3241312503814697, mean loss: 0.3413613693532848
Epoch: 53, step: 386, loss: 0.31805679202079773, mean loss: 0.3413610663777218
Epoch: 53, step: 387, loss: 0.30672064423561096, mean loss: 0.3413606160342202
Epoch: 53, step: 388, loss: 0.3210345208644867, mean loss: 0.34136035178784835
Epoch: 53, step: 389, loss: 0.3249298930168152, mean loss: 0.34136013818889394
Epoch: 53, step: 390, loss: 0.3029560148715973, mean loss: 0.34135963893479154
Epoch: 53, step: 391, loss: 0.3220243752002716, mean loss: 0.3413593875793793
Epoch: 53, step: 392, loss: 0.3097931742668152, mean loss: 0.341358977228865
Epoch: 53, step: 393, loss: 0.29091009497642517, mean loss: 0.3413583214183165
Epoch: 53, step: 394, loss: 0.3329729735851288, mean loss: 0.3413582124143539
Epoch: 53, step: 395, loss: 0.3071243166923523, mean loss: 0.34135776740219026
Epoch: 53, step: 396, loss: 0.34599143266677856, mean loss: 0.3413578276352008
Epoch: 53, step: 397, loss: 0.3342345952987671, mean loss: 0.34135773504151384
Epoch: 53, step: 398, loss: 0.3352373242378235, mean loss: 0.3413576554843678
Epoch: 53, step: 399, loss: 0.3419484496116638, mean loss: 0.3413576631638007
Epoch: 53, step: 400, loss: 0.3288857340812683, mean loss: 0.3413575010496353
Epoch: 53, step: 401, loss: 0.3496982157230377, mean loss: 0.3413576094635313
Epoch: 53, step: 402, loss: 0.32177507877349854, mean loss: 0.341357354930085
Epoch: 53, step: 403, loss: 0.3009157180786133, mean loss: 0.34135682927711564
Epoch: 53, step: 404, loss: 0.30295783281326294, mean loss: 0.3413563301804981
Epoch: 53, step: 405, loss: 0.3552446961402893, mean loss: 0.3413565106942359
Epoch: 53, step: 406, loss: 0.30985745787620544, mean loss: 0.3413561012912957
Epoch: 53, step: 407, loss: 0.3333633244037628, mean loss: 0.34135599740805045
Epoch: 53, step: 408, loss: 0.320627897977829, mean loss: 0.34135572800552866
Epoch: 53, step: 409, loss: 0.3139554262161255, mean loss: 0.34135537188921
Epoch: 53, step: 410, loss: 0.3564748167991638, mean loss: 0.3413555683910998
Epoch: 53, step: 411, loss: 0.3289284408092499, mean loss: 0.34135540688237165
Epoch: 53, step: 412, loss: 0.3084864616394043, mean loss: 0.34135497970782824
Epoch: 53, step: 413, loss: 0.34878188371658325, mean loss: 0.3413550762288171
Epoch: 53, step: 414, loss: 0.3243853747844696, mean loss: 0.3413548556912855
Epoch: 53, step: 415, loss: 0.3143675625324249, mean loss: 0.3413545049701081
Epoch: 53, step: 416, loss: 0.2994433343410492, mean loss: 0.3413539603084409
Epoch: 53, step: 417, loss: 0.33766162395477295, mean loss: 0.34135391232486256
Epoch: 53, step: 418, loss: 0.31493547558784485, mean loss: 0.34135356900980834
Epoch: 53, step: 419, loss: 0.34235429763793945, mean loss: 0.3413535820143908
Epoch: 53, step: 420, loss: 0.3494909405708313, mean loss: 0.34135368775891745
Epoch: 53, step: 421, loss: 0.33788397908210754, mean loss: 0.34135364267083007
Epoch: 53, step: 422, loss: 0.36395785212516785, mean loss: 0.34135393640365386
Epoch: 53, step: 423, loss: 0.34764185547828674, mean loss: 0.3413540181116308
Epoch: 53, step: 424, loss: 0.34462037682533264, mean loss: 0.3413540605555763
Epoch: 53, step: 425, loss: 0.33158764243125916, mean loss: 0.34135393364975597
Epoch: 53, step: 426, loss: 0.3361351490020752, mean loss: 0.341353865837224
Epoch: 53, step: 427, loss: 0.3255477249622345, mean loss: 0.3413536604559756
Epoch: 53, step: 428, loss: 0.3366158604621887, mean loss: 0.3413535988949253
Epoch: 53, step: 429, loss: 0.31980010867118835, mean loss: 0.3413533188412595
Epoch: 53, step: 430, loss: 0.31659996509552, mean loss: 0.34135299721458506
Epoch: 53, step: 431, loss: 0.30616360902786255, mean loss: 0.341352539995779
Epoch: 53, step: 432, loss: 0.3332558870315552, mean loss: 0.341352434796624
Epoch: 53, step: 433, loss: 0.34216827154159546, mean loss: 0.34135244539658693
Epoch: 53, step: 434, loss: 0.35031309723854065, mean loss: 0.3413525618185839
Epoch: 53, step: 435, loss: 0.34303992986679077, mean loss: 0.3413525837415655
Epoch: 53, step: 436, loss: 0.3345045745372772, mean loss: 0.34135249477056157
Epoch: 53, step: 437, loss: 0.3188795745372772, mean loss: 0.34135220280070017
Epoch: 53, step: 438, loss: 0.36374345421791077, mean loss: 0.3413524937057347
Epoch: 53, step: 439, loss: 0.3339642882347107, mean loss: 0.34135239772011045
Epoch: 53, step: 440, loss: 0.3281741440296173, mean loss: 0.34135222651392527
Epoch: 53, step: 441, loss: 0.4109777808189392, mean loss: 0.3413531310473301
Epoch: 53, step: 442, loss: 0.2916243076324463, mean loss: 0.3413524850087018
Epoch: 53, step: 443, loss: 0.3603048622608185, mean loss: 0.34135273122021254
Epoch: 53, step: 444, loss: 0.3053363859653473, mean loss: 0.3413522633357113
Epoch: 53, step: 445, loss: 0.3176382780075073, mean loss: 0.3413519552738582
Epoch: 53, step: 446, loss: 0.3212698996067047, mean loss: 0.34135169439679214
Epoch: 53, step: 447, loss: 0.30320239067077637, mean loss: 0.34135119882256865
Epoch: 53, step: 448, loss: 0.3312900960445404, mean loss: 0.34135106812664656
Epoch: 53, step: 449, loss: 0.3279077112674713, mean loss: 0.3413508934967739
Epoch: 53, step: 450, loss: 0.37401387095451355, mean loss: 0.34135131778496036
Epoch: 53, step: 451, loss: 0.38273656368255615, mean loss: 0.34135185536739177
Epoch: 53, step: 452, loss: 0.39322757720947266, mean loss: 0.34135252920933296
Epoch: 53, step: 453, loss: 0.3046947717666626, mean loss: 0.34135205304798616
Epoch: 53, step: 454, loss: 0.33456137776374817, mean loss: 0.34135196484250624
Epoch: 53, step: 455, loss: 0.3251279890537262, mean loss: 0.34135175410868035
Epoch: 53, step: 456, loss: 0.33932292461395264, mean loss: 0.34135172775648076
Epoch: 53, step: 457, loss: 0.34087321162223816, mean loss: 0.3413517215411783
Epoch: 53, step: 458, loss: 0.3395659625530243, mean loss: 0.34135169834679213
Epoch: 53, step: 459, loss: 0.2906360924243927, mean loss: 0.34135103963412167
Epoch: 53, step: 460, loss: 0.3101329207420349, mean loss: 0.34135063416714556
Epoch: 53, step: 461, loss: 0.35183393955230713, mean loss: 0.3413507703245784
Epoch: 53, step: 462, loss: 0.3419741094112396, mean loss: 0.3413507784204169
Epoch: 53, step: 463, loss: 0.3165580630302429, mean loss: 0.34135045642037287
Epoch: 53, step: 464, loss: 0.31982991099357605, mean loss: 0.34135017692188035
Epoch: 53, step: 465, loss: 0.3131323754787445, mean loss: 0.34134981044740775
Epoch: 53, step: 466, loss: 0.30759313702583313, mean loss: 0.3413493720433581
Epoch: 53, step: 467, loss: 0.3006434738636017, mean loss: 0.3413488433953298
Epoch: 53, step: 468, loss: 0.30418139696121216, mean loss: 0.3413483607074889
Epoch: 53, step: 469, loss: 0.3253478705883026, mean loss: 0.34134815291431314
Epoch: 53, step: 470, loss: 0.2822249233722687, mean loss: 0.3413473851100777
Epoch: 53, step: 471, loss: 0.3355998992919922, mean loss: 0.34134731047128203
Epoch: 53, step: 472, loss: 0.35949668288230896, mean loss: 0.34134754616211266
Epoch: 53, step: 473, loss: 0.3532865047454834, mean loss: 0.34134770120144187
Epoch: 53, step: 474, loss: 0.31453341245651245, mean loss: 0.3413473529955808
Epoch: 53, step: 475, loss: 0.3310409486293793, mean loss: 0.34134721916007843
Epoch: 53, step: 476, loss: 0.3255921006202698, mean loss: 0.34134701457206224
Epoch: 53, step: 477, loss: 0.3231911361217499, mean loss: 0.34134677881205117
Epoch: 53, step: 478, loss: 0.3468925952911377, mean loss: 0.3413468508253542
Epoch: 53, step: 479, loss: 0.34015122056007385, mean loss: 0.34134683530010795
Epoch: 53, step: 480, loss: 0.32557186484336853, mean loss: 0.34134663046494435
Epoch: 53, step: 481, loss: 0.3002081513404846, mean loss: 0.3413460962961033
Epoch: 53, step: 482, loss: 0.33744654059410095, mean loss: 0.34134604566238647
Epoch: 53, step: 483, loss: 0.35122352838516235, mean loss: 0.34134617391473304
Epoch: 53, step: 484, loss: 0.32727766036987305, mean loss: 0.34134599124709414
Epoch: 53, step: 485, loss: 0.30449163913726807, mean loss: 0.34134551273100555
Epoch: 53, step: 486, loss: 0.30122804641723633, mean loss: 0.3413449918534778
Epoch: 53, step: 487, loss: 0.3326781988143921, mean loss: 0.3413448793269517
Epoch: 53, step: 488, loss: 0.3631875514984131, mean loss: 0.34134516292067507
Epoch: 53, step: 489, loss: 0.31234678626060486, mean loss: 0.34134478642595073
Epoch: 53, step: 490, loss: 0.357511430978775, mean loss: 0.34134499631967796
Epoch: 53, step: 491, loss: 0.297537237405777, mean loss: 0.3413444275650182
Epoch: 53, step: 492, loss: 0.3434353470802307, mean loss: 0.3413444547110035
Epoch: 53, step: 493, loss: 0.3682217597961426, mean loss: 0.3413448036490904
Epoch: 53, step: 494, loss: 0.34614625573158264, mean loss: 0.34134486598375335
Epoch: 53, step: 495, loss: 0.32054007053375244, mean loss: 0.34134459588982063
Epoch: 53, step: 496, loss: 0.29236236214637756, mean loss: 0.3413439599964072
Epoch: 53, step: 497, loss: 0.36492860317230225, mean loss: 0.3413442661711856
Epoch: 53, step: 498, loss: 0.35521623492240906, mean loss: 0.34134444625412297
Epoch: 53, step: 499, loss: 0.32621437311172485, mean loss: 0.3413442498412927
Epoch: 53, step: 500, loss: 0.35758015513420105, mean loss: 0.34134446060687745
Epoch: 53, step: 501, loss: 0.32480576634407043, mean loss: 0.34134424591344
Epoch: 53, step: 502, loss: 0.32398146390914917, mean loss: 0.3413440205252138
Epoch: 53, step: 503, loss: 0.4014243483543396, mean loss: 0.3413448004245833
Epoch: 53, step: 504, loss: 0.29406386613845825, mean loss: 0.34134418668139127
Epoch: 53, step: 505, loss: 0.37965768575668335, mean loss: 0.34134468401386453
Epoch: 53, step: 506, loss: 0.3081534206867218, mean loss: 0.34134425317671285
Epoch: 53, step: 507, loss: 0.3069339990615845, mean loss: 0.34134380652232404
Epoch: 53, step: 508, loss: 0.3350701332092285, mean loss: 0.34134372508940763
Epoch: 53, step: 509, loss: 0.30835989117622375, mean loss: 0.3413432969614526
Epoch: 53, step: 510, loss: 0.33886846899986267, mean loss: 0.34134326483876837
Epoch: 53, step: 511, loss: 0.2985709309577942, mean loss: 0.34134270967115143
Epoch: 53, step: 512, loss: 0.33257925510406494, mean loss: 0.34134259592652727
Epoch: 53, step: 513, loss: 0.3231073319911957, mean loss: 0.3413423592463111
Epoch: 53, step: 514, loss: 0.3725002408027649, mean loss: 0.3413427636472814
Epoch: 53, step: 515, loss: 0.3321266174316406, mean loss: 0.3413426440316364
Epoch: 53, step: 516, loss: 0.3320589065551758, mean loss: 0.34134252354029354
Epoch: 53, step: 517, loss: 0.33299729228019714, mean loss: 0.3413424152309975
Epoch: 53, step: 518, loss: 0.3056873083114624, mean loss: 0.34134195248415555
Epoch: 53, step: 519, loss: 0.2985609173774719, mean loss: 0.34134139726125273
Epoch: 53, step: 520, loss: 0.299071729183197, mean loss: 0.3413408486821179
Epoch: 53, step: 521, loss: 0.308932900428772, mean loss: 0.3413404280946305
Epoch: 53, step: 522, loss: 0.312000572681427, mean loss: 0.3413400473295223
Epoch: 53, step: 523, loss: 0.35412099957466125, mean loss: 0.3413402131952854
Epoch: 53, step: 524, loss: 0.3088023066520691, mean loss: 0.3413397909376509
Epoch: 53, step: 525, loss: 0.30268386006355286, mean loss: 0.3413392892904387
Epoch: 53, step: 526, loss: 0.35034188628196716, mean loss: 0.3413394061177657
Epoch: 53, step: 527, loss: 0.3523326516151428, mean loss: 0.34133954877602546
Epoch: 53, step: 528, loss: 0.30668944120407104, mean loss: 0.3413390991308408
Epoch: 53, step: 529, loss: 0.28894922137260437, mean loss: 0.34133841929022213
Epoch: 53, step: 530, loss: 0.30564144253730774, mean loss: 0.3413379560721181
Epoch: 53, step: 531, loss: 0.34523269534111023, mean loss: 0.3413380066111411
Epoch: 53, step: 532, loss: 0.3151487112045288, mean loss: 0.34133766677729427
Epoch: 53, step: 533, loss: 0.3334200978279114, mean loss: 0.3413375640397842
Epoch: 53, step: 534, loss: 0.34132835268974304, mean loss: 0.34133756392026027
Epoch: 53, step: 535, loss: 0.32353222370147705, mean loss: 0.3413373328861058
Epoch: 53, step: 536, loss: 0.34945544600486755, mean loss: 0.3413374382217546
Epoch: 53, step: 537, loss: 0.356833279132843, mean loss: 0.34133763928365823
Epoch: 53, step: 538, loss: 0.3729066848754883, mean loss: 0.34133804889357106
Epoch: 53, step: 539, loss: 0.3653571307659149, mean loss: 0.3413383605382912
Epoch: 53, step: 540, loss: 0.323241651058197, mean loss: 0.3413381257386924
Epoch: 53, step: 541, loss: 0.35748395323753357, mean loss: 0.34133833522344076
Epoch: 53, step: 542, loss: 0.32742583751678467, mean loss: 0.34133815471746987
Epoch: 53, step: 543, loss: 0.33576780557632446, mean loss: 0.3413380824466055
Epoch: 53, step: 544, loss: 0.3456670045852661, mean loss: 0.34133813861020995
Epoch: 53, step: 545, loss: 0.2972380518913269, mean loss: 0.34133756646139035
Epoch: 53, step: 546, loss: 0.3515521287918091, mean loss: 0.3413376989820812
Epoch: 53, step: 547, loss: 0.35399240255355835, mean loss: 0.34133786315830816
Epoch: 53, step: 548, loss: 0.33096611499786377, mean loss: 0.34133772860182654
Epoch: 53, step: 549, loss: 0.3713173270225525, mean loss: 0.341338117533074
Epoch: 53, step: 550, loss: 0.32032909989356995, mean loss: 0.3413378449824774
Epoch: 53, step: 551, loss: 0.32188186049461365, mean loss: 0.34133759258269936
Epoch: 53, step: 552, loss: 0.33391836285591125, mean loss: 0.34133749633531363
Epoch: 53, step: 553, loss: 0.3460093140602112, mean loss: 0.3413375569405821
Epoch: 53, step: 554, loss: 0.3595362603664398, mean loss: 0.34133779302064005
Epoch: 53, step: 555, loss: 0.33705756068229675, mean loss: 0.3413377374966631
Epoch: 53, step: 556, loss: 0.31075239181518555, mean loss: 0.34133734074296695
Epoch: 53, step: 557, loss: 0.30393242835998535, mean loss: 0.34133685553201376
Epoch: 53, step: 558, loss: 0.32488152384757996, mean loss: 0.34133664207867054
Epoch: 53, step: 559, loss: 0.3440167009830475, mean loss: 0.3413366768430936
Epoch: 53, step: 560, loss: 0.28610360622406006, mean loss: 0.3413359603958076
Epoch: 53, step: 561, loss: 0.3305518627166748, mean loss: 0.3413358205133566
Epoch: 53, step: 562, loss: 0.34082457423210144, mean loss: 0.3413358138819761
Epoch: 53, step: 563, loss: 0.3269020617008209, mean loss: 0.3413356266640636
Epoch: 53, step: 564, loss: 0.3315233886241913, mean loss: 0.34133549939272956
Epoch: 53, step: 565, loss: 0.35701784491539, mean loss: 0.3413357028006717
Epoch: 53, step: 566, loss: 0.3260537087917328, mean loss: 0.34133550458806183
Epoch: 53, step: 567, loss: 0.33000144362449646, mean loss: 0.3413353575833801
Epoch: 53, step: 568, loss: 0.3160191774368286, mean loss: 0.34133502923251374
Epoch: 53, step: 569, loss: 0.33111920952796936, mean loss: 0.3413348967350467
Epoch: 53, step: 570, loss: 0.37346094846725464, mean loss: 0.3413353133991419
Epoch: 53, step: 571, loss: 0.33283355832099915, mean loss: 0.3413352031356656
Epoch: 53, step: 572, loss: 0.34192031621932983, mean loss: 0.3413352107241889
Epoch: 53, step: 573, loss: 0.30982330441474915, mean loss: 0.3413348020412549
Epoch: 53, step: 574, loss: 0.3114905059337616, mean loss: 0.341334414990843
Epoch: 53, step: 575, loss: 0.3102186620235443, mean loss: 0.34133401145615183
Epoch: 53, step: 576, loss: 0.34877729415893555, mean loss: 0.3413341079855155
Epoch: 53, step: 577, loss: 0.2919650673866272, mean loss: 0.34133346774377515
Epoch: 53, step: 578, loss: 0.32078465819358826, mean loss: 0.3413332012602702
Epoch: 53, step: 579, loss: 0.3040321469306946, mean loss: 0.3413327175345942
Epoch: 53, step: 580, loss: 0.3317457139492035, mean loss: 0.3413325932105038
Epoch: 53, step: 581, loss: 0.3547528088092804, mean loss: 0.34133276724136197
Epoch: 53, step: 582, loss: 0.32472118735313416, mean loss: 0.34133255182827904
Epoch: 53, step: 583, loss: 0.3130021095275879, mean loss: 0.34133218445390406
Epoch: 53, step: 584, loss: 0.3232960104942322, mean loss: 0.3413319505732557
Epoch: 53, step: 585, loss: 0.3261931836605072, mean loss: 0.3413317542667266
Epoch: 53, step: 586, loss: 0.34259775280952454, mean loss: 0.34133177068289566
Epoch: 53, step: 587, loss: 0.36845260858535767, mean loss: 0.3413321223535116
Epoch: 53, step: 588, loss: 0.32374581694602966, mean loss: 0.341331894318276
Epoch: 53, step: 589, loss: 0.30775532126426697, mean loss: 0.34133145894869205
Epoch: 53, step: 590, loss: 0.34936854243278503, mean loss: 0.34133156315993235
Epoch: 53, step: 591, loss: 0.3330061137676239, mean loss: 0.34133145521105274
Epoch: 53, step: 592, loss: 0.3594120442867279, mean loss: 0.341331689643326
Epoch: 53, step: 593, loss: 0.31535622477531433, mean loss: 0.34133135285074157
Epoch: 53, step: 594, loss: 0.31575924158096313, mean loss: 0.3413310212922566
Epoch: 53, step: 595, loss: 0.3327430188655853, mean loss: 0.34133090994485454
Epoch: 53, step: 596, loss: 0.3549192547798157, mean loss: 0.3413310861217119
Epoch: 53, step: 597, loss: 0.37853729724884033, mean loss: 0.341331568504846
Epoch: 53, step: 598, loss: 0.37866437435150146, mean loss: 0.34133205252302085
Epoch: 53, step: 599, loss: 0.32449522614479065, mean loss: 0.34133183423714236
Epoch: 53, step: 600, loss: 0.3151281177997589, mean loss: 0.34133149451592787
Epoch: 53, step: 601, loss: 0.35012927651405334, mean loss: 0.3413316085743457
Epoch: 53, step: 602, loss: 0.34956809878349304, mean loss: 0.341331715354539
Epoch: 53, step: 603, loss: 0.34023967385292053, mean loss: 0.34133170119718703
Epoch: 53, step: 604, loss: 0.3136621117591858, mean loss: 0.3413313424900888
Epoch: 53, step: 605, loss: 0.3741482198238373, mean loss: 0.3413317679208406
Epoch: 53, step: 606, loss: 0.336772084236145, mean loss: 0.3413317088108744
Epoch: 53, step: 607, loss: 0.3457517623901367, mean loss: 0.3413317661099874
Epoch: 53, step: 608, loss: 0.2791367173194885, mean loss: 0.3413309598584637
Epoch: 53, step: 609, loss: 0.3123529851436615, mean loss: 0.34133058421387685
Epoch: 53, step: 610, loss: 0.3727174401283264, mean loss: 0.34133099107977416
Epoch: 53, step: 611, loss: 0.33595919609069824, mean loss: 0.3413309214464263
Epoch: 53, step: 612, loss: 0.3450702428817749, mean loss: 0.3413309699177651
Epoch: 53, step: 613, loss: 0.3460594117641449, mean loss: 0.34133103120988456
Epoch: 53, step: 614, loss: 0.3205290734767914, mean loss: 0.3413307615693576
Epoch: 53, step: 615, loss: 0.3159991204738617, mean loss: 0.34133043321812234
Epoch: 53, step: 616, loss: 0.31469786167144775, mean loss: 0.3413300880085727
Epoch: 53, step: 617, loss: 0.32123836874961853, mean loss: 0.3413298275844734
Epoch: 53, step: 618, loss: 0.3385167717933655, mean loss: 0.3413297911227841
Epoch: 53, step: 619, loss: 0.3269292712211609, mean loss: 0.3413296044714996
Epoch: 53, step: 620, loss: 0.3534564673900604, mean loss: 0.34132976165090834
Epoch: 53, step: 621, loss: 0.34377631545066833, mean loss: 0.3413297933609143
Epoch: 53, step: 622, loss: 0.3003121018409729, mean loss: 0.34132926173378036
Epoch: 53, step: 623, loss: 0.33796316385269165, mean loss: 0.341329218106611
Epoch: 53, step: 624, loss: 0.34351909160614014, mean loss: 0.3413292464886567
Epoch: 53, step: 625, loss: 0.3756530284881592, mean loss: 0.341329691339249
Epoch: 53, step: 626, loss: 0.3388109505176544, mean loss: 0.341329658695736
Epoch: 53, step: 627, loss: 0.40957075357437134, mean loss: 0.3413305431059859
Epoch: 53, step: 628, loss: 0.35288605093955994, mean loss: 0.341330692864385
Epoch: 53, step: 629, loss: 0.3178353011608124, mean loss: 0.34133038837005225
Epoch: 53, step: 630, loss: 0.3123611509799957, mean loss: 0.34133001294092963
Epoch: 53, step: 631, loss: 0.32750916481018066, mean loss: 0.3413298338308766
Epoch: 53, step: 632, loss: 0.2948000431060791, mean loss: 0.3413292308400035
Epoch: 53, step: 633, loss: 0.3038763105869293, mean loss: 0.341328745484792
Epoch: 53, step: 634, loss: 0.30474451184272766, mean loss: 0.3413282713930994
Epoch: 53, step: 635, loss: 0.32681816816329956, mean loss: 0.34132808336045334
Epoch: 53, step: 636, loss: 0.3110961616039276, mean loss: 0.3413276915979353
Epoch: 53, step: 637, loss: 0.3890274465084076, mean loss: 0.34132830971060746
Epoch: 53, step: 638, loss: 0.32675591111183167, mean loss: 0.34132812087803305
Epoch: 53, step: 639, loss: 0.3155342638492584, mean loss: 0.3413277866394876
Epoch: 53, step: 640, loss: 0.31226783990859985, mean loss: 0.3413274100836101
Epoch: 53, step: 641, loss: 0.3431909680366516, mean loss: 0.3413274342310944
Epoch: 53, step: 642, loss: 0.3322679102420807, mean loss: 0.34132731684173273
Epoch: 53, step: 643, loss: 0.33000677824020386, mean loss: 0.34132717015703024
Epoch: 53, step: 644, loss: 0.3057350516319275, mean loss: 0.34132670898182876
Epoch: 53, step: 645, loss: 0.33879297971725464, mean loss: 0.3413266761521459
Epoch: 53, step: 646, loss: 0.29899293184280396, mean loss: 0.3413261276383752
Epoch: 53, step: 647, loss: 0.3199371099472046, mean loss: 0.34132585050676484
Epoch: 53, step: 648, loss: 0.35404667258262634, mean loss: 0.3413260153248169
Epoch: 53, step: 649, loss: 0.3075190782546997, mean loss: 0.3413255773089962
Epoch: 53, step: 650, loss: 0.3446359634399414, mean loss: 0.3413256201990903
Epoch: 53, step: 651, loss: 0.32589229941368103, mean loss: 0.3413254202441672
Epoch: 53, step: 652, loss: 0.30016031861305237, mean loss: 0.3413248869138357
Epoch: 53, step: 653, loss: 0.36304157972335815, mean loss: 0.3413251682691697
Epoch: 53, step: 654, loss: 0.32963669300079346, mean loss: 0.34132501683854966
Epoch: 53, step: 655, loss: 0.34523123502731323, mean loss: 0.34132506744509716
Epoch: 53, step: 656, loss: 0.31664595007896423, mean loss: 0.34132474772185467
Epoch: 53, step: 657, loss: 0.34682777523994446, mean loss: 0.3413248190138293
Epoch: 53, step: 658, loss: 0.33717092871665955, mean loss: 0.3413247652006866
Epoch: 53, step: 659, loss: 0.3294072151184082, mean loss: 0.34132461081227744
Epoch: 53, step: 660, loss: 0.3375300467014313, mean loss: 0.34132456165543534
Epoch: 53, step: 661, loss: 0.33842045068740845, mean loss: 0.3413245240344937
Epoch: 53, step: 662, loss: 0.3619300425052643, mean loss: 0.34132479096264284
Epoch: 53, step: 663, loss: 0.38267987966537476, mean loss: 0.34132532667807763
Epoch: 53, step: 664, loss: 0.2965085208415985, mean loss: 0.34132474612694436
Epoch: 53, step: 665, loss: 0.3054761588573456, mean loss: 0.34132428175497526
Epoch: 53, step: 666, loss: 0.34288591146469116, mean loss: 0.3413243019836014
Epoch: 53, step: 667, loss: 0.32937830686569214, mean loss: 0.341324147242732
Epoch: 53, step: 668, loss: 0.33576661348342896, mean loss: 0.34132407525488523
Epoch: 53, step: 669, loss: 0.3563946485519409, mean loss: 0.341324270464508
Epoch: 53, step: 670, loss: 0.3442939221858978, mean loss: 0.3413243089300044
Epoch: 53, step: 671, loss: 0.30539414286613464, mean loss: 0.34132384353745915
Epoch: 53, step: 672, loss: 0.40387243032455444, mean loss: 0.3413246536998423
Epoch: 53, step: 673, loss: 0.3453766405582428, mean loss: 0.3413247061826397
Epoch: 53, step: 674, loss: 0.3255404829978943, mean loss: 0.3413245017423275
Epoch: 53, step: 675, loss: 0.3488141596317291, mean loss: 0.3413245987485689
Epoch: 53, step: 676, loss: 0.3327827453613281, mean loss: 0.34132448811569727
Epoch: 53, step: 677, loss: 0.3354494273662567, mean loss: 0.34132441202373054
Epoch: 53, step: 678, loss: 0.3771522641181946, mean loss: 0.34132487604896133
Epoch: 53, step: 679, loss: 0.29768866300582886, mean loss: 0.34132431090088794
Epoch: 53, step: 680, loss: 0.31281134486198425, mean loss: 0.34132394162413354
Epoch: 53, step: 681, loss: 0.29656749963760376, mean loss: 0.34132336198259206
Epoch: 53, step: 682, loss: 0.3224993050098419, mean loss: 0.3413231181950252
Epoch: 53, step: 683, loss: 0.31586241722106934, mean loss: 0.3413227884615377
Epoch: 53, step: 684, loss: 0.36175537109375, mean loss: 0.3413230530740276
Epoch: 53, step: 685, loss: 0.331271767616272, mean loss: 0.34132292290637944
Epoch: 53, step: 686, loss: 0.34537798166275024, mean loss: 0.3413229754201229
Epoch: 53, step: 687, loss: 0.2954399585723877, mean loss: 0.34132238123446057
Epoch: 53, step: 688, loss: 0.3516334891319275, mean loss: 0.3413225147617122
Epoch: 53, step: 689, loss: 0.33767956495285034, mean loss: 0.34132246758668683
Epoch: 53, step: 690, loss: 0.3745652139186859, mean loss: 0.34132289806395827
Epoch: 53, step: 691, loss: 0.30463284254074097, mean loss: 0.3413224229518749
Epoch: 53, step: 692, loss: 0.36685997247695923, mean loss: 0.3413227536420598
Epoch: 53, step: 693, loss: 0.3483816683292389, mean loss: 0.34132284504799415
Epoch: 53, step: 694, loss: 0.3305356204509735, mean loss: 0.3413227053659581
Epoch: 53, step: 695, loss: 0.3319772183895111, mean loss: 0.34132258435431756
Epoch: 53, step: 696, loss: 0.3296671211719513, mean loss: 0.34132243343350827
Epoch: 53, step: 697, loss: 0.3656013011932373, mean loss: 0.3413227478044491
Epoch: 53, step: 698, loss: 0.33071327209472656, mean loss: 0.3413226104311701
Epoch: 53, step: 699, loss: 0.3114902377128601, mean loss: 0.3413222241615834
Epoch: 53, step: 700, loss: 0.31981346011161804, mean loss: 0.3413219456696946
Epoch: 53, step: 701, loss: 0.3160191476345062, mean loss: 0.34132161805752853
Epoch: 53, step: 702, loss: 0.37106093764305115, mean loss: 0.3413220031073063
Epoch: 53, step: 703, loss: 0.39727893471717834, mean loss: 0.34132272760018023
Epoch: 53, step: 704, loss: 0.38614246249198914, mean loss: 0.3413233078885769
Epoch: 53, step: 705, loss: 0.3446144759654999, mean loss: 0.34132335049931356
Epoch: 53, step: 706, loss: 0.3319826126098633, mean loss: 0.3413232295663925
Epoch: 53, step: 707, loss: 0.30221015214920044, mean loss: 0.3413227231826869
Epoch: 53, step: 708, loss: 0.2988463044166565, mean loss: 0.3413221732620649
Epoch: 53, step: 709, loss: 0.3824519217014313, mean loss: 0.3413227057411364
Epoch: 53, step: 710, loss: 0.29182347655296326, mean loss: 0.34132206491634726
Epoch: 53, step: 711, loss: 0.3556065559387207, mean loss: 0.34132224984321563
Epoch: 53, step: 712, loss: 0.3695472478866577, mean loss: 0.3413226152390088
Epoch: 53, step: 713, loss: 0.3283787965774536, mean loss: 0.3413224476728091
Epoch: 53, step: 714, loss: 0.3311140239238739, mean loss: 0.3413223155197967
Epoch: 53, step: 715, loss: 0.37001773715019226, mean loss: 0.34132268699118273
Epoch: 53, step: 716, loss: 0.36009153723716736, mean loss: 0.34132292995679064
Epoch: 53, step: 717, loss: 0.32093334197998047, mean loss: 0.3413226660139042
Epoch: 53, step: 718, loss: 0.3429940342903137, mean loss: 0.34132268764945944
Epoch: 53, step: 719, loss: 0.31844577193260193, mean loss: 0.34132239151582255
Epoch: 53, step: 720, loss: 0.33966678380966187, mean loss: 0.34132237008483984
Epoch: 53, step: 721, loss: 0.33891722559928894, mean loss: 0.34132233895189545
Epoch: 53, step: 722, loss: 0.31052452325820923, mean loss: 0.3413219403004723
Epoch: 53, step: 723, loss: 0.3432798385620117, mean loss: 0.34132196564346523
Epoch: 53, step: 724, loss: 0.34990519285202026, mean loss: 0.34132207674313525
Epoch: 53, step: 725, loss: 0.3209366500377655, mean loss: 0.34132181288144187
Epoch: 53, step: 726, loss: 0.31536349654197693, mean loss: 0.34132147689060144
Epoch: 53, step: 727, loss: 0.3642398416996002, mean loss: 0.3413217735300631
Epoch: 53, step: 728, loss: 0.3106798529624939, mean loss: 0.34132137692737136
Epoch: 53, step: 729, loss: 0.30192625522613525, mean loss: 0.3413208670373646
Epoch: 53, step: 730, loss: 0.335978239774704, mean loss: 0.3413207978887778
Epoch: 53, step: 731, loss: 0.32865622639656067, mean loss: 0.34132063397581064
Epoch: 53, step: 732, loss: 0.32268664240837097, mean loss: 0.3413203928059204
Epoch: 53, step: 733, loss: 0.3434135317802429, mean loss: 0.3413204198959597
Epoch: 53, step: 734, loss: 0.34597480297088623, mean loss: 0.3413204801336171
Epoch: 53, step: 735, loss: 0.3534708023071289, mean loss: 0.34132063738270046
Epoch: 53, step: 736, loss: 0.31952351331710815, mean loss: 0.3413203552886645
Epoch: 53, step: 737, loss: 0.3595726788043976, mean loss: 0.3413205915035411
Epoch: 53, step: 738, loss: 0.3302624225616455, mean loss: 0.3413204483946265
Epoch: 53, step: 739, loss: 0.3316706418991089, mean loss: 0.34132032351360236
Epoch: 53, step: 740, loss: 0.3148166537284851, mean loss: 0.3413199805261451
Epoch: 53, step: 741, loss: 0.28349870443344116, mean loss: 0.34131923226313177
Epoch: 53, step: 742, loss: 0.3208363652229309, mean loss: 0.3413189671985308
Epoch: 53, step: 743, loss: 0.3484947383403778, mean loss: 0.3413190600575186
Epoch: 53, step: 744, loss: 0.322020024061203, mean loss: 0.3413188103190971
Epoch: 53, step: 745, loss: 0.31213614344596863, mean loss: 0.34131843268682305
Epoch: 53, step: 746, loss: 0.3042471408843994, mean loss: 0.3413179529796348
Epoch: 53, step: 747, loss: 0.33995798230171204, mean loss: 0.34131793538167055
Epoch: 53, step: 748, loss: 0.3678843677043915, mean loss: 0.34131827914575646
Epoch: 53, step: 749, loss: 0.33154740929603577, mean loss: 0.3413181527143772
Epoch: 53, step: 750, loss: 0.3259446620941162, mean loss: 0.34131795378976737
Epoch: 53, step: 751, loss: 0.33361613750457764, mean loss: 0.3413178541337417
Epoch: 53, step: 752, loss: 0.33100518584251404, mean loss: 0.3413177206968744
Epoch: 53, step: 753, loss: 0.3331153094768524, mean loss: 0.3413176145662528
Epoch: 53, step: 754, loss: 0.3306148946285248, mean loss: 0.3413174760860435
Epoch: 53, step: 755, loss: 0.32917454838752747, mean loss: 0.3413173189733262
Epoch: 53, step: 756, loss: 0.3467041552066803, mean loss: 0.34131738867064704
Epoch: 53, step: 757, loss: 0.3678877055644989, mean loss: 0.34131773244496316
Epoch: 53, step: 758, loss: 0.36148834228515625, mean loss: 0.34131799341467295
Epoch: 53, step: 759, loss: 0.3305775821208954, mean loss: 0.341317854455773
Epoch: 53, step: 760, loss: 0.3424549102783203, mean loss: 0.3413178691667536
Epoch: 53, step: 761, loss: 0.39115315675735474, mean loss: 0.34131851391650897
Epoch: 53, step: 762, loss: 0.34984090924263, mean loss: 0.34131862417455056
Epoch: 53, step: 763, loss: 0.36977246403694153, mean loss: 0.3413189922898458
Epoch: 53, step: 764, loss: 0.292075514793396, mean loss: 0.34131835522142795
Epoch: 53, step: 765, loss: 0.32861384749412537, mean loss: 0.3413181908639061
Epoch: 53, step: 766, loss: 0.3311160206794739, mean loss: 0.3413180588806956
Epoch: 53, step: 767, loss: 0.313603937625885, mean loss: 0.3413177003539006
Epoch: 53, step: 768, loss: 0.3272985517978668, mean loss: 0.3413175189959808
Epoch: 53, step: 769, loss: 0.30288904905319214, mean loss: 0.341317021874691
Epoch: 53, step: 770, loss: 0.34711432456970215, mean loss: 0.341317096869228
Epoch: 53, step: 771, loss: 0.3428328335285187, mean loss: 0.3413171164767083
Epoch: 53, step: 772, loss: 0.340246319770813, mean loss: 0.34131710262512427
Epoch: 53, step: 773, loss: 0.32526877522468567, mean loss: 0.34131689503027524
Epoch: 53, step: 774, loss: 0.3147134780883789, mean loss: 0.34131655090339225
Epoch: 53, step: 775, loss: 0.3401441276073456, mean loss: 0.34131653573777815
Epoch: 53, step: 776, loss: 0.3415742516517639, mean loss: 0.34131653907136045
Epoch: 53, step: 777, loss: 0.30645182728767395, mean loss: 0.3413160880985007
Epoch: 53, step: 778, loss: 0.3402833640575409, mean loss: 0.34131607474045284
Epoch: 53, step: 779, loss: 0.3118079900741577, mean loss: 0.34131569306510273
Epoch: 53, step: 780, loss: 0.3433154225349426, mean loss: 0.3413157189304743
Epoch: 53, step: 781, loss: 0.30684947967529297, mean loss: 0.3413152731348971
Epoch: 53, step: 782, loss: 0.32492101192474365, mean loss: 0.3413150610898708
Epoch: 53, step: 783, loss: 0.3209932744503021, mean loss: 0.34131479824923444
Epoch: 53, step: 784, loss: 0.32401880621910095, mean loss: 0.3413145745469176
Epoch: 53, step: 785, loss: 0.3225158751010895, mean loss: 0.34131433141207906
Epoch: 53, step: 786, loss: 0.37852442264556885, mean loss: 0.34131481266624986
Epoch: 53, step: 787, loss: 0.3405095934867859, mean loss: 0.34131480225213734
Epoch: 53, step: 788, loss: 0.3256939947605133, mean loss: 0.34131460022671745
Epoch: 53, step: 789, loss: 0.40468037128448486, mean loss: 0.3413154197317879
Epoch: 53, step: 790, loss: 0.2944841682910919, mean loss: 0.3413148140743323
Epoch: 53, step: 791, loss: 0.33852484822273254, mean loss: 0.341314777992833
Epoch: 53, step: 792, loss: 0.34361085295677185, mean loss: 0.3413148076866573
Epoch: 53, step: 793, loss: 0.32083186507225037, mean loss: 0.34131454279590107
Epoch: 53, step: 794, loss: 0.3155863285064697, mean loss: 0.3413142100762263
Epoch: 53, step: 795, loss: 0.34059420228004456, mean loss: 0.3413142007651385
Epoch: 53, step: 796, loss: 0.37080496549606323, mean loss: 0.3413145821326039
Epoch: 53, step: 797, loss: 0.33556151390075684, mean loss: 0.3413145077362735
Epoch: 53, step: 798, loss: 0.3718452751636505, mean loss: 0.3413149025425921
Epoch: 53, step: 799, loss: 0.34679463505744934, mean loss: 0.34131497340242395
Epoch: 53, step: 800, loss: 0.31930413842201233, mean loss: 0.341314688778331
Epoch: 53, step: 801, loss: 0.33991360664367676, mean loss: 0.34131467066104576
Epoch: 53, step: 802, loss: 0.3433484435081482, mean loss: 0.3413146969592658
Epoch: 53, step: 803, loss: 0.3213905096054077, mean loss: 0.3413144393277959
Epoch: 53, step: 804, loss: 0.30225715041160583, mean loss: 0.3413139343005914
Epoch: 53, step: 805, loss: 0.33808833360671997, mean loss: 0.34131389259275446
Epoch: 53, step: 806, loss: 0.3362513780593872, mean loss: 0.341313827134001
Epoch: 53, step: 807, loss: 0.3423894941806793, mean loss: 0.3413138410422897
Epoch: 53, step: 808, loss: 0.2947598993778229, mean loss: 0.3413132391113389
Epoch: 53, step: 809, loss: 0.33634358644485474, mean loss: 0.34131317485578994
Epoch: 53, step: 810, loss: 0.3319510519504547, mean loss: 0.3413130538089867
Epoch: 53, step: 811, loss: 0.3108460605144501, mean loss: 0.34131265989357895
Epoch: 53, step: 812, loss: 0.33645567297935486, mean loss: 0.34131259709718725
Epoch: 53, step: 813, loss: 0.31920498609542847, mean loss: 0.3413123112697236
Epoch: 53, step: 814, loss: 0.37987303733825684, mean loss: 0.3413128098116977
Epoch: 53, step: 815, loss: 0.3002769947052002, mean loss: 0.3413122792767762
Epoch: 53, step: 816, loss: 0.32782530784606934, mean loss: 0.3413121049116076
Epoch: 53, step: 817, loss: 0.3501465320587158, mean loss: 0.34131221912527465
Epoch: 53, step: 818, loss: 0.3043762147426605, mean loss: 0.34131174161361505
Epoch: 53, step: 819, loss: 0.3045880198478699, mean loss: 0.3413112668525001
Epoch: 53, step: 820, loss: 0.34388506412506104, mean loss: 0.3413113001258996
Epoch: 53, step: 821, loss: 0.35051825642585754, mean loss: 0.341311419149561
Epoch: 53, step: 822, loss: 0.34021085500717163, mean loss: 0.34131140492211426
Epoch: 53, step: 823, loss: 0.3322085738182068, mean loss: 0.3413112872475822
Epoch: 53, step: 824, loss: 0.34724071621894836, mean loss: 0.3413113638977751
Epoch: 53, step: 825, loss: 0.3160703480243683, mean loss: 0.34131103760940323
Epoch: 53, step: 826, loss: 0.3146139085292816, mean loss: 0.34131069250244633
Epoch: 53, step: 827, loss: 0.3426022529602051, mean loss: 0.3413107091979021
Epoch: 53, step: 828, loss: 0.3395625650882721, mean loss: 0.34131068660067465
Epoch: 53, step: 829, loss: 0.3449832797050476, mean loss: 0.34131073407350504
Epoch: 53, step: 830, loss: 0.3146344721317291, mean loss: 0.3413103892541218
Epoch: 53, step: 831, loss: 0.2920222580432892, mean loss: 0.34130975216023823
Epoch: 53, step: 832, loss: 0.33032870292663574, mean loss: 0.3413096102220332
Epoch: 53, step: 833, loss: 0.3584037721157074, mean loss: 0.341309831173897
Epoch: 53, step: 834, loss: 0.31322047114372253, mean loss: 0.341309468107473
Epoch: 53, step: 835, loss: 0.2907092273235321, mean loss: 0.34130881408719604
Epoch: 53, step: 836, loss: 0.36170536279678345, mean loss: 0.3413090777140842
Epoch: 53, step: 837, loss: 0.3284793794155121, mean loss: 0.3413089118914359
Epoch: 53, step: 838, loss: 0.35795629024505615, mean loss: 0.3413091270544602
Epoch: 53, step: 839, loss: 0.36210963129997253, mean loss: 0.34130939589207904
Epoch: 53, step: 840, loss: 0.3099723756313324, mean loss: 0.3413089908797329
Epoch: 53, step: 841, loss: 0.323382169008255, mean loss: 0.3413087591892183
Epoch: 53, step: 842, loss: 0.3513585329055786, mean loss: 0.3413088890732082
Epoch: 53, step: 843, loss: 0.34422463178634644, mean loss: 0.3413089267559873
Epoch: 53, step: 844, loss: 0.36462512612342834, mean loss: 0.3413092280884164
Epoch: 53, step: 845, loss: 0.3083270490169525, mean loss: 0.34130880184091617
Epoch: 53, step: 846, loss: 0.3028782606124878, mean loss: 0.34130830518754474
Epoch: 53, step: 847, loss: 0.34193241596221924, mean loss: 0.34130831325307553
Epoch: 53, step: 848, loss: 0.3274597227573395, mean loss: 0.3413081342867854
Epoch: 53, step: 849, loss: 0.3236358165740967, mean loss: 0.3413079059091561
Epoch: 53, step: 850, loss: 0.3390618860721588, mean loss: 0.34130787688443703
Epoch: 53, step: 851, loss: 0.30266571044921875, mean loss: 0.34130737752841467
Epoch: 53, step: 852, loss: 0.3438912034034729, mean loss: 0.3413074109176487
Epoch: 53, step: 853, loss: 0.3530583679676056, mean loss: 0.3413075627662654
Epoch: 53, step: 854, loss: 0.33498960733413696, mean loss: 0.3413074811252219
Epoch: 53, step: 855, loss: 0.350629061460495, mean loss: 0.3413076015777512
Epoch: 53, step: 856, loss: 0.3304983973503113, mean loss: 0.34130746190409955
Epoch: 53, step: 857, loss: 0.33528268337249756, mean loss: 0.34130738405452554
Epoch: 53, step: 858, loss: 0.3898783326148987, mean loss: 0.341308011659138
Epoch: 53, step: 859, loss: 0.3080906271934509, mean loss: 0.34130758244960124
Epoch: 53, step: 860, loss: 0.2933163046836853, mean loss: 0.3413069623511716
Epoch: 53, step: 861, loss: 0.3887311816215515, mean loss: 0.3413075751146839
Epoch: 53, step: 862, loss: 0.284288227558136, mean loss: 0.34130683838301445
Epoch: 53, step: 863, loss: 0.2963755428791046, mean loss: 0.34130625784531865
Epoch: 53, step: 864, loss: 0.3505357503890991, mean loss: 0.3413063770940304
Epoch: 53, step: 865, loss: 0.3881582021713257, mean loss: 0.3413069824304096
Epoch: 53, step: 866, loss: 0.31243041157722473, mean loss: 0.34130660934327856
Epoch: 53, step: 867, loss: 0.37711334228515625, mean loss: 0.3413070719625672
Epoch: 53, step: 868, loss: 0.3301650583744049, mean loss: 0.3413069280107631
Epoch: 53, step: 869, loss: 0.30906417965888977, mean loss: 0.3413065114485509
Epoch: 53, step: 870, loss: 0.3391672670841217, mean loss: 0.341306483810806
Epoch: 53, step: 871, loss: 0.32702043652534485, mean loss: 0.3413062992460899
Epoch: 53, step: 872, loss: 0.3712642192840576, mean loss: 0.34130668627431854
Epoch: 53, step: 873, loss: 0.29553768038749695, mean loss: 0.3413060949893292
Epoch: 53, step: 874, loss: 0.4025792181491852, mean loss: 0.3413068865601582
Epoch: 53, step: 875, loss: 0.36103251576423645, mean loss: 0.34130714138691
Epoch: 53, step: 876, loss: 0.3464653789997101, mean loss: 0.3413072080230584
Epoch: 53, step: 877, loss: 0.34037378430366516, mean loss: 0.34130719596487835
Epoch: 53, step: 878, loss: 0.3366895616054535, mean loss: 0.34130713631399723
Epoch: 53, step: 879, loss: 0.3370802104473114, mean loss: 0.3413070817110175
Epoch: 53, step: 880, loss: 0.30574995279312134, mean loss: 0.3413066223937333
Epoch: 53, step: 881, loss: 0.35855233669281006, mean loss: 0.3413068451662848
Epoch: 53, step: 882, loss: 0.33616116642951965, mean loss: 0.3413067786975289
Epoch: 53, step: 883, loss: 0.3634224832057953, mean loss: 0.3413070643710913
Epoch: 53, step: 884, loss: 0.3532918393611908, mean loss: 0.3413072191791437
Epoch: 53, step: 885, loss: 0.3347441852092743, mean loss: 0.34130713440513805
Epoch: 53, step: 886, loss: 0.3127971589565277, mean loss: 0.34130676614960065
Epoch: 53, step: 887, loss: 0.3143121302127838, mean loss: 0.34130641747179213
Epoch: 53, step: 888, loss: 0.3136206865310669, mean loss: 0.34130605987203316
Epoch: 53, step: 889, loss: 0.3154858946800232, mean loss: 0.34130572637296064
Epoch: 53, step: 890, loss: 0.29845115542411804, mean loss: 0.34130517286081374
Epoch: 53, step: 891, loss: 0.3144136369228363, mean loss: 0.34130482553264757
Epoch: 53, step: 892, loss: 0.3089291453361511, mean loss: 0.34130440737726886
Epoch: 53, step: 893, loss: 0.3265649974346161, mean loss: 0.34130421700956365
Epoch: 53, step: 894, loss: 0.35681983828544617, mean loss: 0.34130441739988326
Epoch: 53, step: 895, loss: 0.3476213216781616, mean loss: 0.34130449898411996
Epoch: 53, step: 896, loss: 0.37038907408714294, mean loss: 0.3413048746130846
Epoch: 53, step: 897, loss: 0.33060237765312195, mean loss: 0.3413047363915043
Epoch: 53, step: 898, loss: 0.32426923513412476, mean loss: 0.3413045163827061
Epoch: 53, step: 899, loss: 0.37072432041168213, mean loss: 0.34130489632645067
Epoch: 53, step: 900, loss: 0.33823177218437195, mean loss: 0.3413048566389254
Epoch: 53, step: 901, loss: 0.3292911946773529, mean loss: 0.3413047014918071
Epoch: 53, step: 902, loss: 0.4061861038208008, mean loss: 0.3413055393739318
Epoch: 53, step: 903, loss: 0.3711296617984772, mean loss: 0.3413059245193735
Epoch: 53, step: 904, loss: 0.36215972900390625, mean loss: 0.3413061938196368
Epoch: 53, step: 905, loss: 0.34641024470329285, mean loss: 0.341306259731087
Epoch: 53, step: 906, loss: 0.4124467074871063, mean loss: 0.3413071783954261
Epoch: 53, step: 907, loss: 0.3466982841491699, mean loss: 0.3413072480119777
Epoch: 53, step: 908, loss: 0.32761090993881226, mean loss: 0.3413070711503918
Epoch: 53, step: 909, loss: 0.36293700337409973, mean loss: 0.3413073504553197
Epoch: 53, step: 910, loss: 0.3229956328868866, mean loss: 0.3413071140011848
Epoch: 53, step: 911, loss: 0.33441591262817383, mean loss: 0.34130702501816
Epoch: 53, step: 912, loss: 0.33726540207862854, mean loss: 0.34130697283115063
Epoch: 53, step: 913, loss: 0.3183573782444, mean loss: 0.3413066765008742
Epoch: 53, step: 914, loss: 0.28622397780418396, mean loss: 0.34130596526998475
Epoch: 53, step: 915, loss: 0.31201207637786865, mean loss: 0.34130558703053515
Epoch: 53, step: 916, loss: 0.3429113030433655, mean loss: 0.3413056077630948
Epoch: 53, step: 917, loss: 0.33760544657707214, mean loss: 0.34130555998825707
Epoch: 53, step: 918, loss: 0.33379632234573364, mean loss: 0.34130546303356774
Epoch: 53, step: 919, loss: 0.3564988374710083, mean loss: 0.3413056591986046
Epoch: 53, step: 920, loss: 0.28847891092300415, mean loss: 0.34130497714951324
Epoch: 53, step: 921, loss: 0.33440279960632324, mean loss: 0.3413048880362648
Epoch: 53, step: 922, loss: 0.37213295698165894, mean loss: 0.3413052860489037
Epoch: 53, step: 923, loss: 0.333110511302948, mean loss: 0.34130518024980816
Epoch: 53, step: 924, loss: 0.31973981857299805, mean loss: 0.3413049018326002
Epoch: 53, step: 925, loss: 0.33567866683006287, mean loss: 0.34130482919665556
Epoch: 53, step: 926, loss: 0.3307965397834778, mean loss: 0.3413046935340545
Epoch: 53, step: 927, loss: 0.3524838387966156, mean loss: 0.3413048378555787
Epoch: 53, step: 928, loss: 0.3348999321460724, mean loss: 0.34130475517002457
Epoch: 53, step: 929, loss: 0.3108011484146118, mean loss: 0.34130436138201553
Epoch: 53, step: 930, loss: 0.33884936571121216, mean loss: 0.3413043296895214
Epoch: 53, step: 931, loss: 0.2817865312099457, mean loss: 0.34130356136102713
Epoch: 53, step: 932, loss: 0.3819594979286194, mean loss: 0.3413040861907769
Epoch: 53, step: 933, loss: 0.3385075330734253, mean loss: 0.34130405009038295
Epoch: 53, step: 934, loss: 0.2931250333786011, mean loss: 0.3413034281608296
Epoch: 53, step: 935, loss: 0.38097140192985535, mean loss: 0.3413039402170821
Epoch: 53, step: 936, loss: 0.32659605145454407, mean loss: 0.3413037503619302
Epoch: 53, step: 937, loss: 0.3360002636909485, mean loss: 0.34130368190334404
Epoch: 53, step: 938, loss: 0.34330350160598755, mean loss: 0.3413037077171286
Epoch: 53, step: 939, loss: 0.3182200491428375, mean loss: 0.341303409755819
Epoch: 53, step: 940, loss: 0.32509955763816833, mean loss: 0.34130320060098934
Epoch: 53, step: 941, loss: 0.33180585503578186, mean loss: 0.3413030780134688
Epoch: 53, step: 942, loss: 0.3338501751422882, mean loss: 0.3413029818159487
Epoch: 53, step: 943, loss: 0.3319183588027954, mean loss: 0.3413028606865278
Epoch: 53, step: 944, loss: 0.35415491461753845, mean loss: 0.3413030265687113
Epoch: 53, step: 945, loss: 0.2946329712867737, mean loss: 0.3413024242034556
Epoch: 53, step: 946, loss: 0.3209700286388397, mean loss: 0.3413021617788558
Epoch: 53, step: 947, loss: 0.34439894556999207, mean loss: 0.3413022017476709
Epoch: 53, step: 948, loss: 0.3338562548160553, mean loss: 0.34130210564737623
Epoch: 53, step: 949, loss: 0.310123085975647, mean loss: 0.34130170324398357
Epoch: 53, step: 950, loss: 0.3484765291213989, mean loss: 0.34130179584269393
Epoch: 53, step: 951, loss: 0.3190292418003082, mean loss: 0.3413015083955559
Epoch: 53, step: 952, loss: 0.3182366192340851, mean loss: 0.34130121072646946
Epoch: 53, step: 953, loss: 0.3521254062652588, mean loss: 0.34130135041874343
Epoch: 53, step: 954, loss: 0.33182263374328613, mean loss: 0.34130122809220254
Epoch: 53, step: 955, loss: 0.3555918335914612, mean loss: 0.3413014125156681
Epoch: 53, step: 956, loss: 0.3097544014453888, mean loss: 0.3413010053996765
Epoch: 53, step: 957, loss: 0.3243025839328766, mean loss: 0.3413007860369011
Epoch: 53, step: 958, loss: 0.3196070194244385, mean loss: 0.3413005060848214
Epoch: 53, step: 959, loss: 0.35405412316322327, mean loss: 0.3413006706646113
Epoch: 53, step: 960, loss: 0.3342931866645813, mean loss: 0.34130058023729526
Epoch: 53, step: 961, loss: 0.30416539311408997, mean loss: 0.341300101036491
Epoch: 53, step: 962, loss: 0.35050463676452637, mean loss: 0.3413002198123569
Epoch: 53, step: 963, loss: 0.31799957156181335, mean loss: 0.3412999191433127
Epoch: 53, step: 964, loss: 0.3150709867477417, mean loss: 0.34129958069237404
Epoch: 53, step: 965, loss: 0.3522796928882599, mean loss: 0.3412997223748974
Epoch: 53, step: 966, loss: 0.36483973264694214, mean loss: 0.3413000261208847
Epoch: 53, step: 967, loss: 0.33512192964553833, mean loss: 0.34129994640351086
Epoch: 53, step: 968, loss: 0.3154548704624176, mean loss: 0.34129961292296296
Epoch: 53, step: 969, loss: 0.3158670961856842, mean loss: 0.34129928476992516
Epoch: 53, step: 970, loss: 0.35477215051651, mean loss: 0.341299458606625
Epoch: 53, step: 971, loss: 0.30606895685195923, mean loss: 0.3412990040429669
Epoch: 53, step: 972, loss: 0.3680063486099243, mean loss: 0.341299348631633
Epoch: 53, step: 973, loss: 0.2865263819694519, mean loss: 0.3412986419383878
Epoch: 53, step: 974, loss: 0.3606354892253876, mean loss: 0.3412988914235606
Epoch: 53, step: 975, loss: 0.36501777172088623, mean loss: 0.34129919744203996
Epoch: 53, step: 976, loss: 0.3030938506126404, mean loss: 0.34129870452706457
Epoch: 53, step: 977, loss: 0.3529644012451172, mean loss: 0.3412988550327634
Epoch: 53, step: 978, loss: 0.32114872336387634, mean loss: 0.3412985950679627
Epoch: 53, step: 979, loss: 0.32335948944091797, mean loss: 0.3412983636314673
Epoch: 53, step: 980, loss: 0.31663793325424194, mean loss: 0.34129804548573206
Epoch: 53, step: 981, loss: 0.31534913182258606, mean loss: 0.34129771072151316
Epoch: 53, step: 982, loss: 0.3190860450267792, mean loss: 0.34129742417483583
Epoch: 53, step: 983, loss: 0.33121463656425476, mean loss: 0.34129729410120446
Epoch: 53, step: 984, loss: 0.3351050019264221, mean loss: 0.341297214218183
Epoch: 53, step: 985, loss: 0.3077542185783386, mean loss: 0.341296781505837
Epoch: 53, step: 986, loss: 0.31052884459495544, mean loss: 0.341296384597506
Epoch: 53, step: 987, loss: 0.36695870757102966, mean loss: 0.341296715638824
Epoch: 53, step: 988, loss: 0.32579973340034485, mean loss: 0.3412965157319312
Epoch: 53, step: 989, loss: 0.32636284828186035, mean loss: 0.34129632309413227
Epoch: 53, step: 990, loss: 0.32727113366127014, mean loss: 0.3412961421776374
Epoch: 53, step: 991, loss: 0.36022672057151794, mean loss: 0.34129638636754495
Epoch: 53, step: 992, loss: 0.37694084644317627, mean loss: 0.34129684614774586
Epoch: 53, step: 993, loss: 0.3176215887069702, mean loss: 0.34129654076300475
Epoch: 53, step: 994, loss: 0.3244684636592865, mean loss: 0.3412963237021472
Epoch: 53, step: 995, loss: 0.33919814229011536, mean loss: 0.34129629663861644
Epoch: 53, step: 996, loss: 0.3138252794742584, mean loss: 0.34129594230646765
Epoch: 53, step: 997, loss: 0.34569570422172546, mean loss: 0.34129599905562175
Epoch: 53, step: 998, loss: 0.3077961206436157, mean loss: 0.34129556697195956
Epoch: 53, step: 999, loss: 0.379482239484787, mean loss: 0.3412960594998514
Epoch: 53, step: 1000, loss: 0.3615924119949341, mean loss: 0.3412963212768044
Epoch: 53, step: 1001, loss: 0.3268795311450958, mean loss: 0.3412961353352803
Epoch: 53, step: 1002, loss: 0.2951810359954834, mean loss: 0.34129554057034395
Epoch: 53, step: 1003, loss: 0.3249603807926178, mean loss: 0.34129532989195227
Epoch: 53, step: 1004, loss: 0.32624563574790955, mean loss: 0.341295135795016
Epoch: 53, step: 1005, loss: 0.3158600330352783, mean loss: 0.3412948077609842
Epoch: 53, step: 1006, loss: 0.3599160313606262, mean loss: 0.3412950479139859
Epoch: 53, step: 1007, loss: 0.32820096611976624, mean loss: 0.34129487904524985
Epoch: 53, step: 1008, loss: 0.3448292315006256, mean loss: 0.34129492462568417
Epoch: 53, step: 1009, loss: 0.31660735607147217, mean loss: 0.34129460624895214
Epoch: 53, step: 1010, loss: 0.40944743156433105, mean loss: 0.3412954851525968
Epoch: 53, step: 1011, loss: 0.31466537714004517, mean loss: 0.3412951417332734
Epoch: 53, step: 1012, loss: 0.3520783483982086, mean loss: 0.3412952807906809
Epoch: 53, step: 1013, loss: 0.3284488618373871, mean loss: 0.3412951151287647
Epoch: 53, step: 1014, loss: 0.315566748380661, mean loss: 0.34129478335104607
Epoch: 53, step: 1015, loss: 0.30935436487197876, mean loss: 0.34129437147171354
Epoch: 53, step: 1016, loss: 0.3006516098976135, mean loss: 0.3412938473803446
Epoch: 53, step: 1017, loss: 0.3282407522201538, mean loss: 0.3412936790619028
Epoch: 53, step: 1018, loss: 0.349333256483078, mean loss: 0.34129378273016525
Epoch: 53, step: 1019, loss: 0.35168641805648804, mean loss: 0.34129391673877013
Epoch: 53, step: 1020, loss: 0.30122247338294983, mean loss: 0.34129340004124253
Epoch: 53, step: 1021, loss: 0.31083354353904724, mean loss: 0.3412930072844988
Epoch: 53, step: 1022, loss: 0.36694565415382385, mean loss: 0.3412933380516559
Epoch: 53, step: 1023, loss: 0.3250831663608551, mean loss: 0.3412931290391786
Epoch: 53, step: 1024, loss: 0.3417716920375824, mean loss: 0.3412931352096467
Epoch: 53, step: 1025, loss: 0.31294092535972595, mean loss: 0.34129276964826233
Epoch: 53, step: 1026, loss: 0.33675581216812134, mean loss: 0.3412927111514086
Epoch: 53, step: 1027, loss: 0.313979834318161, mean loss: 0.34129235899982485
Epoch: 53, step: 1028, loss: 0.3483494520187378, mean loss: 0.34129244998747355
Epoch: 53, step: 1029, loss: 0.33833047747612, mean loss: 0.34129241179902414
Epoch: 53, step: 1030, loss: 0.33961236476898193, mean loss: 0.3412923901386058
Epoch: 53, step: 1031, loss: 0.32520508766174316, mean loss: 0.3412921827317872
Epoch: 53, step: 1032, loss: 0.378286749124527, mean loss: 0.341292659681009
Epoch: 53, step: 1033, loss: 0.3405403196811676, mean loss: 0.3412926499816562
Epoch: 53, step: 1034, loss: 0.3299470841884613, mean loss: 0.3412925037137099
Epoch: 53, step: 1035, loss: 0.35306090116500854, mean loss: 0.34129265543088
Epoch: 53, step: 1036, loss: 0.3111168146133423, mean loss: 0.34129226641154475
Epoch: 53, step: 1037, loss: 0.3115842342376709, mean loss: 0.341291883428018
Epoch: 53, step: 1038, loss: 0.28935790061950684, mean loss: 0.34129121392546147
Epoch: 53, step: 1039, loss: 0.32901227474212646, mean loss: 0.34129105563459383
Epoch: 53, step: 1040, loss: 0.2966662347316742, mean loss: 0.3412904803723131
Epoch: 53, step: 1041, loss: 0.33443590998649597, mean loss: 0.34129039201061473
Epoch: 53, step: 1042, loss: 0.30877915024757385, mean loss: 0.34128997291629615
Epoch: 53, step: 1043, loss: 0.33324453234672546, mean loss: 0.3412898692058629
Epoch: 53, step: 1044, loss: 0.2857237756252289, mean loss: 0.34128915293565937
Epoch: 53, step: 1045, loss: 0.3212900459766388, mean loss: 0.34128889514212307
Epoch: 53, step: 1046, loss: 0.3056483566761017, mean loss: 0.3412884357325088
Epoch: 53, step: 1047, loss: 0.365619421005249, mean loss: 0.34128874935696446
Epoch: 53, step: 1048, loss: 0.34587228298187256, mean loss: 0.341288808437585
Epoch: 53, step: 1049, loss: 0.283293217420578, mean loss: 0.34128806089832314
Epoch: 53, step: 1050, loss: 0.3227776885032654, mean loss: 0.3412878223103284
Epoch: 53, step: 1051, loss: 0.31806108355522156, mean loss: 0.3412875229349578
Epoch: 53, step: 1052, loss: 0.3222862184047699, mean loss: 0.34128727802544523
Epoch: 53, step: 1053, loss: 0.3943890929222107, mean loss: 0.34128796245066234
Epoch: 53, step: 1054, loss: 0.29512548446655273, mean loss: 0.34128736747369476
Epoch: 53, step: 1055, loss: 0.311346173286438, mean loss: 0.34128698157388826
Epoch: 53, step: 1056, loss: 0.34495851397514343, mean loss: 0.3412870288941579
Epoch: 53, step: 1057, loss: 0.30138686299324036, mean loss: 0.34128651465049376
Epoch: 53, step: 1058, loss: 0.33263280987739563, mean loss: 0.34128640312074454
Epoch: 53, step: 1059, loss: 0.31002500653266907, mean loss: 0.3412860002261602
Epoch: 53, step: 1060, loss: 0.3456319570541382, mean loss: 0.3412860562358109
Epoch: 53, step: 1061, loss: 0.33936113119125366, mean loss: 0.34128603142815767
Epoch: 53, step: 1062, loss: 0.3472785949707031, mean loss: 0.34128610865689074
Epoch: 53, step: 1063, loss: 0.3368207812309265, mean loss: 0.34128605111104526
Epoch: 53, step: 1064, loss: 0.3267538249492645, mean loss: 0.3412858638328494
Epoch: 53, step: 1065, loss: 0.3724824786186218, mean loss: 0.3412862658614428
Epoch: 53, step: 1066, loss: 0.34797921776771545, mean loss: 0.3412863521119345
Epoch: 53, step: 1067, loss: 0.2692813277244568, mean loss: 0.34128542421213565
Epoch: 53, step: 1068, loss: 0.36436522006988525, mean loss: 0.3412857216283527
Epoch: 53, step: 1069, loss: 0.3180502653121948, mean loss: 0.3412854222100862
Epoch: 53, step: 1070, loss: 0.34698718786239624, mean loss: 0.3412854956836072
Epoch: 53, step: 1071, loss: 0.3326565623283386, mean loss: 0.34128538449174395
Epoch: 53, step: 1072, loss: 0.32709839940071106, mean loss: 0.34128520168155013
Epoch: 53, step: 1073, loss: 0.3261272609233856, mean loss: 0.34128500636236403
Epoch: 53, step: 1074, loss: 0.33856457471847534, mean loss: 0.3412849713084173
Epoch: 53, step: 1075, loss: 0.3231627643108368, mean loss: 0.3412847377988951
Epoch: 53, step: 1076, loss: 0.3155960440635681, mean loss: 0.34128440679741673
Epoch: 53, step: 1077, loss: 0.32000958919525146, mean loss: 0.34128413267272145
Epoch: 53, step: 1078, loss: 0.33791351318359375, mean loss: 0.3412840892430596
Epoch: 53, step: 1079, loss: 0.30557236075401306, mean loss: 0.3412836291115272
Epoch: 53, step: 1080, loss: 0.3407037854194641, mean loss: 0.34128362164056625
Epoch: 53, step: 1081, loss: 0.33556801080703735, mean loss: 0.3412835479990733
Epoch: 53, step: 1082, loss: 0.35356879234313965, mean loss: 0.34128370628348154
Epoch: 53, step: 1083, loss: 0.3304680585861206, mean loss: 0.3412835669353098
Epoch: 53, step: 1084, loss: 0.35635414719581604, mean loss: 0.34128376110128195
Epoch: 53, step: 1085, loss: 0.3220174312591553, mean loss: 0.3412835128814123
Epoch: 53, step: 1086, loss: 0.32079628109931946, mean loss: 0.3412832489353194
Epoch: 53, step: 1087, loss: 0.35919272899627686, mean loss: 0.341283479668121
Epoch: 53, step: 1088, loss: 0.3376726508140564, mean loss: 0.3412834331494102
Epoch: 53, step: 1089, loss: 0.3691198229789734, mean loss: 0.34128379176410484
Epoch: 53, step: 1090, loss: 0.30852726101875305, mean loss: 0.34128336976893914
Epoch: 53, step: 1091, loss: 0.3206945061683655, mean loss: 0.3412831045305644
Epoch: 53, step: 1092, loss: 0.29412445425987244, mean loss: 0.3412824970117203
Epoch: 53, step: 1093, loss: 0.30445653200149536, mean loss: 0.3412820226092648
Epoch: 53, step: 1094, loss: 0.29269832372665405, mean loss: 0.34128139674843183
Epoch: 53, step: 1095, loss: 0.3401636779308319, mean loss: 0.34128138235003413
Epoch: 53, step: 1096, loss: 0.3355855643749237, mean loss: 0.341281308977738
Epoch: 53, step: 1097, loss: 0.33720776438713074, mean loss: 0.34128125650389296
Epoch: 53, step: 1098, loss: 0.3534544110298157, mean loss: 0.3412814133117986
Epoch: 53, step: 1099, loss: 0.296237587928772, mean loss: 0.34128083308939827
Epoch: 53, step: 1100, loss: 0.3296547532081604, mean loss: 0.34128068333246653
Epoch: 53, step: 1101, loss: 0.35935506224632263, mean loss: 0.3412809161477139
Epoch: 53, step: 1102, loss: 0.3128209710121155, mean loss: 0.3412805495611854
Epoch: 53, step: 1103, loss: 0.29275843501091003, mean loss: 0.34127992456615025
Epoch: 53, step: 1104, loss: 0.300003319978714, mean loss: 0.3412793929046411
Epoch: 53, step: 1105, loss: 0.36177709698677063, mean loss: 0.3412796569210259
Epoch: 53, step: 1106, loss: 0.34442245960235596, mean loss: 0.3412796974007163
Epoch: 53, step: 1107, loss: 0.33728763461112976, mean loss: 0.3412796459831121
Epoch: 53, step: 1108, loss: 0.3294404149055481, mean loss: 0.3412794934962678
Epoch: 53, step: 1109, loss: 0.28422513604164124, mean loss: 0.3412787586574247
Epoch: 53, step: 1110, loss: 0.3370491862297058, mean loss: 0.34127870418281103
Epoch: 53, step: 1111, loss: 0.3168703317642212, mean loss: 0.3412783898201762
Epoch: 53, step: 1112, loss: 0.33337461948394775, mean loss: 0.34127828802649557
Epoch: 53, step: 1113, loss: 0.310712605714798, mean loss: 0.3412778943721887
Epoch: 53, step: 1114, loss: 0.33083298802375793, mean loss: 0.3412777598543535
Epoch: 53, step: 1115, loss: 0.330697625875473, mean loss: 0.3412776235967039
Epoch: 53, step: 1116, loss: 0.3715630769729614, mean loss: 0.341278013626883
Epoch: 53, step: 1117, loss: 0.32770606875419617, mean loss: 0.3412778388433044
Epoch: 53, step: 1118, loss: 0.3555811941623688, mean loss: 0.341278023043834
Epoch: 53, step: 1119, loss: 0.318781316280365, mean loss: 0.3412777333319558
Epoch: 53, step: 1120, loss: 0.3104485273361206, mean loss: 0.3412773363195288
Epoch: 53, step: 1121, loss: 0.3732299506664276, mean loss: 0.3412777477936878
Epoch: 53, step: 1122, loss: 0.28722357749938965, mean loss: 0.34127705171268474
Epoch: 53, step: 1123, loss: 0.3433472216129303, mean loss: 0.34127707837089405
Epoch: 53, step: 1124, loss: 0.304992139339447, mean loss: 0.3412766111246827
Epoch: 53, step: 1125, loss: 0.32747071981430054, mean loss: 0.3412764333465876
Epoch: 53, step: 1126, loss: 0.3333824574947357, mean loss: 0.3412763316973795
Epoch: 53, step: 1127, loss: 0.3268858790397644, mean loss: 0.3412761463966757
Epoch: 53, step: 1128, loss: 0.29724928736686707, mean loss: 0.34127557948588355
Epoch: 53, step: 1129, loss: 0.3396085202693939, mean loss: 0.341275558020312
Epoch: 53, step: 1130, loss: 0.31072136759757996, mean loss: 0.3412751646001451
Epoch: 53, step: 1131, loss: 0.3251538872718811, mean loss: 0.34127495702292365
Epoch: 53, step: 1132, loss: 0.3062550723552704, mean loss: 0.3412745061134449
Epoch: 53, step: 1133, loss: 0.3387340009212494, mean loss: 0.3412744734027968
Epoch: 53, step: 1134, loss: 0.3124319612979889, mean loss: 0.3412741020415738
Epoch: 53, step: 1135, loss: 0.3502790331840515, mean loss: 0.34127421798290286
Epoch: 53, step: 1136, loss: 0.3094591796398163, mean loss: 0.3412738083595223
Epoch: 53, step: 1137, loss: 0.36030319333076477, mean loss: 0.34127405336254757
Epoch: 53, step: 1138, loss: 0.34245309233665466, mean loss: 0.34127406854245995
Epoch: 53, step: 1139, loss: 0.3299923241138458, mean loss: 0.34127392329392214
Epoch: 53, step: 1140, loss: 0.3446614444255829, mean loss: 0.3412739669065177
Epoch: 53, step: 1141, loss: 0.31525230407714844, mean loss: 0.3412736318952806
Epoch: 53, step: 1142, loss: 0.34841933846473694, mean loss: 0.3412737238902155
Epoch: 53, step: 1143, loss: 0.3263947665691376, mean loss: 0.3412735323386768
Epoch: 53, step: 1144, loss: 0.2853285074234009, mean loss: 0.3412728121122917
Epoch: 53, step: 1145, loss: 0.3395901918411255, mean loss: 0.34127279045081393
Epoch: 53, step: 1146, loss: 0.31981873512268066, mean loss: 0.3412725142622002
Epoch: 53, step: 1147, loss: 0.33937111496925354, mean loss: 0.34127248978486635
Epoch: 53, step: 1148, loss: 0.3430769443511963, mean loss: 0.34127251301390005
Epoch: 53, step: 1149, loss: 0.3449665606021881, mean loss: 0.3412725605673563
Epoch: 53, step: 1150, loss: 0.31396380066871643, mean loss: 0.3412722090263512
Epoch: 53, step: 1151, loss: 0.37184858322143555, mean loss: 0.34127260262573067
Epoch: 53, step: 1152, loss: 0.333424836397171, mean loss: 0.3412725016053763
Epoch: 53, step: 1153, loss: 0.36046087741851807, mean loss: 0.34127274860452433
Epoch: 53, step: 1154, loss: 0.2833148241043091, mean loss: 0.34127200256046936
Epoch: 53, step: 1155, loss: 0.3762000501155853, mean loss: 0.3412724521543263
Epoch: 53, step: 1156, loss: 0.33899569511413574, mean loss: 0.341272422848285
Epoch: 53, step: 1157, loss: 0.36309319734573364, mean loss: 0.3412727037180816
Epoch: 53, step: 1158, loss: 0.3375850319862366, mean loss: 0.341272656252201
Epoch: 53, step: 1159, loss: 0.3181154727935791, mean loss: 0.3412723581882631
Epoch: 53, step: 1160, loss: 0.3197072446346283, mean loss: 0.341272080619968
Epoch: 53, step: 1161, loss: 0.31055012345314026, mean loss: 0.3412716851974493
Epoch: 53, step: 1162, loss: 0.3647473454475403, mean loss: 0.3412719873489423
Epoch: 53, step: 1163, loss: 0.33508315682411194, mean loss: 0.3412719076945132
Epoch: 53, step: 1164, loss: 0.31097427010536194, mean loss: 0.3412715177484717
Epoch: 53, step: 1165, loss: 0.31159111857414246, mean loss: 0.34127113575151974
Epoch: 53, step: 1166, loss: 0.34461772441864014, mean loss: 0.3412711788227133
Epoch: 53, step: 1167, loss: 0.34218692779541016, mean loss: 0.3412711906084144
Epoch: 53, step: 1168, loss: 0.3587772846221924, mean loss: 0.34127141590917004
Epoch: 53, step: 1169, loss: 0.3210514485836029, mean loss: 0.3412711556846285
Epoch: 53, step: 1170, loss: 0.3074624538421631, mean loss: 0.34127072058299995
Epoch: 53, step: 1171, loss: 0.3420257568359375, mean loss: 0.341270730299826
Epoch: 53, step: 1172, loss: 0.3379015624523163, mean loss: 0.3412706869413826
Epoch: 53, step: 1173, loss: 0.34216246008872986, mean loss: 0.34127069841762825
Epoch: 53, step: 1174, loss: 0.34223389625549316, mean loss: 0.34127071081288013
Epoch: 53, step: 1175, loss: 0.33431169390678406, mean loss: 0.3412706212594634
Epoch: 53, step: 1176, loss: 0.32170817255973816, mean loss: 0.3412703695196559
Epoch: 53, step: 1177, loss: 0.35974955558776855, mean loss: 0.34127060731641395
Epoch: 53, step: 1178, loss: 0.3145364224910736, mean loss: 0.3412702632958142
Epoch: 53, step: 1179, loss: 0.3446659743785858, mean loss: 0.34127030699191113
Epoch: 53, step: 1180, loss: 0.3587460517883301, mean loss: 0.3412705318673476
Epoch: 53, step: 1181, loss: 0.2949821650981903, mean loss: 0.34126993624279134
Epoch: 53, step: 1182, loss: 0.3281421959400177, mean loss: 0.34126976732121506
Epoch: 53, step: 1183, loss: 0.3156885802745819, mean loss: 0.34126943815878974
Epoch: 53, step: 1184, loss: 0.31311655044555664, mean loss: 0.34126907591001904
Epoch: 53, step: 1185, loss: 0.3881728947162628, mean loss: 0.34126967942296077
Epoch: 53, step: 1186, loss: 0.31449130177497864, mean loss: 0.3412693348691496
Epoch: 53, step: 1187, loss: 0.33544713258743286, mean loss: 0.34126925995661384
Epoch: 53, step: 1188, loss: 0.34539932012557983, mean loss: 0.3412693130961793
Epoch: 53, step: 1189, loss: 0.33474043011665344, mean loss: 0.341269229093156
Epoch: 53, step: 1190, loss: 0.32304495573043823, mean loss: 0.34126899461593097
Epoch: 53, step: 1191, loss: 0.31011801958084106, mean loss: 0.3412685938262774
Epoch: 53, step: 1192, loss: 0.33084917068481445, mean loss: 0.3412684597712997
Epoch: 53, step: 1193, loss: 0.3563193380832672, mean loss: 0.34126865341150137
Epoch: 53, step: 1194, loss: 0.3475619852542877, mean loss: 0.34126873437862787
Epoch: 53, step: 1195, loss: 0.3186734616756439, mean loss: 0.34126844368193293
Epoch: 53, step: 1196, loss: 0.317064493894577, mean loss: 0.34126813229300745
Epoch: 53, step: 1197, loss: 0.3008870482444763, mean loss: 0.3412676127885169
Epoch: 53, step: 1198, loss: 0.3510268032550812, mean loss: 0.34126773833933277
Epoch: 53, step: 1199, loss: 0.31906384229660034, mean loss: 0.3412674526925458
Epoch: 53, step: 1200, loss: 0.3504001498222351, mean loss: 0.341267570180577
Epoch: 53, step: 1201, loss: 0.3269558548927307, mean loss: 0.3412673860691806
Epoch: 53, step: 1202, loss: 0.3378126621246338, mean loss: 0.34126734162685807
Epoch: 53, step: 1203, loss: 0.32694295048713684, mean loss: 0.3412671573571357
Epoch: 53, step: 1204, loss: 0.3261198103427887, mean loss: 0.3412669625033722
Epoch: 53, step: 1205, loss: 0.29391518235206604, mean loss: 0.3412663533832488
Epoch: 53, step: 1206, loss: 0.3510189950466156, mean loss: 0.3412664788369035
Epoch: 53, step: 1207, loss: 0.3089773952960968, mean loss: 0.34126606348980365
Epoch: 53, step: 1208, loss: 0.3252745270729065, mean loss: 0.3412658577870674
Epoch: 53, step: 1209, loss: 0.3160382807254791, mean loss: 0.34126553328323345
Epoch: 53, step: 1210, loss: 0.3732469379901886, mean loss: 0.3412659446566652
Epoch: 53, step: 1211, loss: 0.3718082010746002, mean loss: 0.3412663375134312
Epoch: 53, step: 1212, loss: 0.390279620885849, mean loss: 0.34126696794990136
Epoch: 53, step: 1213, loss: 0.317870557308197, mean loss: 0.3412666670159544
Epoch: 53, step: 1214, loss: 0.3272255063056946, mean loss: 0.34126648641527896
Epoch: 53, step: 1215, loss: 0.33616936206817627, mean loss: 0.3412664208557231
Epoch: 53, step: 1216, loss: 0.37699729204177856, mean loss: 0.34126688042267816
Epoch: 53, step: 1217, loss: 0.3156721293926239, mean loss: 0.34126655122973887
Epoch: 53, step: 1218, loss: 0.3411884009838104, mean loss: 0.34126655022460395
Epoch: 53, step: 1219, loss: 0.32660967111587524, mean loss: 0.34126636171653846
Epoch: 53, step: 1220, loss: 0.33128130435943604, mean loss: 0.34126623329631856
Epoch: 53, step: 1221, loss: 0.3257688581943512, mean loss: 0.34126603398342015
Epoch: 53, step: 1222, loss: 0.3017745018005371, mean loss: 0.341265526086408
Epoch: 53, step: 1223, loss: 0.3056993782520294, mean loss: 0.3412650686792904
Epoch: 53, step: 1224, loss: 0.3068828582763672, mean loss: 0.3412646265041756
Epoch: 53, step: 1225, loss: 0.3230989873409271, mean loss: 0.3412643928865522
Epoch: 53, step: 1226, loss: 0.3441234529018402, mean loss: 0.34126442965477216
Epoch: 53, step: 1227, loss: 0.3355214595794678, mean loss: 0.3412643557997043
Epoch: 53, step: 1228, loss: 0.30842530727386475, mean loss: 0.3412639334922684
Epoch: 53, step: 1229, loss: 0.3050145208835602, mean loss: 0.34126346733382845
Epoch: 53, step: 1230, loss: 0.33990150690078735, mean loss: 0.3412634498195809
Epoch: 53, step: 1231, loss: 0.34256309270858765, mean loss: 0.3412634665322357
Epoch: 53, step: 1232, loss: 0.33061835169792175, mean loss: 0.34126332964398476
Epoch: 53, step: 1233, loss: 0.36621934175491333, mean loss: 0.3412636505555928
Epoch: 53, step: 1234, loss: 0.33712491393089294, mean loss: 0.34126359733589007
Epoch: 53, step: 1235, loss: 0.33252930641174316, mean loss: 0.34126348502374465
Epoch: 53, step: 1236, loss: 0.3163721263408661, mean loss: 0.3412631649558682
Epoch: 53, step: 1237, loss: 0.3200669586658478, mean loss: 0.3412628924059609
Epoch: 53, step: 1238, loss: 0.3303224444389343, mean loss: 0.3412627517307997
Epoch: 53, step: 1239, loss: 0.3070102632045746, mean loss: 0.3412623113089444
Epoch: 53, step: 1240, loss: 0.31483811140060425, mean loss: 0.3412619715483603
Epoch: 53, step: 1241, loss: 0.34216204285621643, mean loss: 0.3412619831212678
Epoch: 53, step: 1242, loss: 0.32084545493125916, mean loss: 0.34126172061367294
Epoch: 53, step: 1243, loss: 0.31638434529304504, mean loss: 0.3412614007543935
Epoch: 53, step: 1244, loss: 0.37690284848213196, mean loss: 0.3412618590061611
Epoch: 53, step: 1245, loss: 0.3774634003639221, mean loss: 0.34126232445322013
Epoch: 53, step: 1246, loss: 0.32615095376968384, mean loss: 0.34126213016722157
Epoch: 53, step: 1247, loss: 0.34892770648002625, mean loss: 0.34126222872181544
Epoch: 53, step: 1248, loss: 0.30160820484161377, mean loss: 0.3412617189054865
Epoch: 53, step: 1249, loss: 0.327628493309021, mean loss: 0.34126154363067235
Epoch: 53, step: 1250, loss: 0.3565610349178314, mean loss: 0.34126174032521084
Epoch: 53, step: 1251, loss: 0.30926451086997986, mean loss: 0.34126132896516953
Epoch: 53, step: 1252, loss: 0.32427284121513367, mean loss: 0.3412611105620359
Epoch: 53, step: 1253, loss: 0.3190307021141052, mean loss: 0.34126082477271075
Epoch: 53, step: 1254, loss: 0.3457823395729065, mean loss: 0.3412608828995803
Epoch: 53, step: 1255, loss: 0.32218697667121887, mean loss: 0.34126063769586984
Epoch: 53, step: 1256, loss: 0.372363805770874, mean loss: 0.34126103753605386
Epoch: 53, step: 1257, loss: 0.3081764578819275, mean loss: 0.3412606122297207
Epoch: 53, step: 1258, loss: 0.3336787223815918, mean loss: 0.3412605147648488
Epoch: 53, step: 1259, loss: 0.3424486815929413, mean loss: 0.34126053003848655
Epoch: 53, step: 1260, loss: 0.3321768641471863, mean loss: 0.34126041327134954
Epoch: 53, step: 1261, loss: 0.29679927229881287, mean loss: 0.34125984174731205
Epoch: 53, step: 1262, loss: 0.30081644654273987, mean loss: 0.3412593218759167
Epoch: 53, step: 1263, loss: 0.32483187317848206, mean loss: 0.3412591107153339
Epoch: 53, step: 1264, loss: 0.33110612630844116, mean loss: 0.3412589802092166
Epoch: 53, step: 1265, loss: 0.36997735500335693, mean loss: 0.3412593493494875
Epoch: 53, step: 1266, loss: 0.29348424077033997, mean loss: 0.34125873526564865
Epoch: 53, step: 1267, loss: 0.336353063583374, mean loss: 0.3412586722107427
Epoch: 53, step: 1268, loss: 0.2971087098121643, mean loss: 0.3412581047378002
Epoch: 53, step: 1269, loss: 0.3796485364437103, mean loss: 0.34125859817539445
Epoch: 53, step: 1270, loss: 0.3681145906448364, mean loss: 0.34125894335478946
Epoch: 53, step: 1271, loss: 0.3167847692966461, mean loss: 0.3412586287928896
Epoch: 53, step: 1272, loss: 0.3209114372730255, mean loss: 0.34125836727767184
Epoch: 53, step: 1273, loss: 0.30481287837028503, mean loss: 0.3412578988627821
Epoch: 53, step: 1274, loss: 0.33889034390449524, mean loss: 0.34125786843422223
Epoch: 53, step: 1275, loss: 0.33406245708465576, mean loss: 0.34125777595772433
Epoch: 53, step: 1276, loss: 0.3348263204097748, mean loss: 0.34125769330076244
Epoch: 53, step: 1277, loss: 0.3388333320617676, mean loss: 0.34125766214331177
Epoch: 53, step: 1278, loss: 0.34955859184265137, mean loss: 0.3412577688239829
Epoch: 53, step: 1279, loss: 0.2936791181564331, mean loss: 0.34125715736751516
Epoch: 53, step: 1280, loss: 0.3329913914203644, mean loss: 0.34125705114148674
Epoch: 53, step: 1281, loss: 0.34035414457321167, mean loss: 0.3412570395380919
Epoch: 53, step: 1282, loss: 0.37715092301368713, mean loss: 0.3412575008101278
Epoch: 53, step: 1283, loss: 0.3976054787635803, mean loss: 0.3412582249282777
Epoch: 53, step: 1284, loss: 0.27659136056900024, mean loss: 0.341257393916232
Epoch: 53, step: 1285, loss: 0.3210424780845642, mean loss: 0.3412571341445104
Epoch: 53, step: 1286, loss: 0.29233646392822266, mean loss: 0.34125650549764763
Epoch: 53, step: 1287, loss: 0.2896091043949127, mean loss: 0.34125584181991564
Epoch: 53, step: 1288, loss: 0.38097769021987915, mean loss: 0.34125635224574413
Epoch: 53, step: 1289, loss: 0.3170613944530487, mean loss: 0.34125604134448495
Epoch: 53, step: 1290, loss: 0.3352473974227905, mean loss: 0.3412559641353832
Epoch: 53, step: 1291, loss: 0.32582637667655945, mean loss: 0.34125576587279766
Epoch: 53, step: 1292, loss: 0.32804110646247864, mean loss: 0.34125559607312644
Epoch: 53, step: 1293, loss: 0.39149972796440125, mean loss: 0.34125624166883856
Epoch: 53, step: 1294, loss: 0.30354827642440796, mean loss: 0.3412557571587682
Epoch: 53, step: 1295, loss: 0.29987025260925293, mean loss: 0.34125522540278647
Epoch: 53, step: 1296, loss: 0.3066164553165436, mean loss: 0.3412547803402765
Epoch: 53, step: 1297, loss: 0.3667111098766327, mean loss: 0.34125510741633375
Epoch: 53, step: 1298, loss: 0.37584370374679565, mean loss: 0.341255551822757
Epoch: 53, step: 1299, loss: 0.3305736184120178, mean loss: 0.3412554145792915
Epoch: 53, step: 1300, loss: 0.36941269040107727, mean loss: 0.34125577634455584
Epoch: 53, step: 1301, loss: 0.30079448223114014, mean loss: 0.34125525650368793
Epoch: 53, step: 1302, loss: 0.31874075531959534, mean loss: 0.34125496724434207
Epoch: 53, step: 1303, loss: 0.3109985589981079, mean loss: 0.3412545785243636
Epoch: 53, step: 1304, loss: 0.3267325460910797, mean loss: 0.3412543919545776
Epoch: 53, step: 1305, loss: 0.29850515723228455, mean loss: 0.3412538427468034
Epoch: 53, step: 1306, loss: 0.3100246787071228, mean loss: 0.3412534415447834
Epoch: 53, step: 1307, loss: 0.3461746871471405, mean loss: 0.34125350476736305
Epoch: 53, step: 1308, loss: 0.36063963174819946, mean loss: 0.34125375381512685
Epoch: 53, step: 1309, loss: 0.3302193582057953, mean loss: 0.3412536120613743
Epoch: 53, step: 1310, loss: 0.32377344369888306, mean loss: 0.34125338750465933
Epoch: 53, step: 1311, loss: 0.32664233446121216, mean loss: 0.3412531998080733
Epoch: 53, step: 1312, loss: 0.31136849522590637, mean loss: 0.3412528159079566
Epoch: 53, step: 1313, loss: 0.4097510278224945, mean loss: 0.34125369582743753
Epoch: 53, step: 1314, loss: 0.346729576587677, mean loss: 0.3412537661690147
Epoch: 53, step: 1315, loss: 0.3563380241394043, mean loss: 0.3412539599345317
Epoch: 53, step: 1316, loss: 0.35818615555763245, mean loss: 0.34125417743502146
Epoch: 53, step: 1317, loss: 0.3158271312713623, mean loss: 0.34125385081914267
Epoch: 53, step: 1318, loss: 0.32157784700393677, mean loss: 0.3412535980798867
Epoch: 53, step: 1319, loss: 0.32159146666526794, mean loss: 0.34125334552206654
Epoch: 53, step: 1320, loss: 0.2911789119243622, mean loss: 0.3412527023299789
Epoch: 53, step: 1321, loss: 0.29135242104530334, mean loss: 0.3412520613830618
Epoch: 53, step: 1322, loss: 0.36001911759376526, mean loss: 0.3412523024344549
Epoch: 53, step: 1323, loss: 0.2880510687828064, mean loss: 0.3412516191058271
Epoch: 53, step: 1324, loss: 0.3310263156890869, mean loss: 0.3412514877714138
Epoch: 53, step: 1325, loss: 0.3202892243862152, mean loss: 0.3412512185342977
Epoch: 53, step: 1326, loss: 0.2921515107154846, mean loss: 0.341250587910891
Epoch: 53, step: 1327, loss: 0.35006004571914673, mean loss: 0.3412507010557383
Epoch: 53, step: 1328, loss: 0.3212590217590332, mean loss: 0.34125044429459606
Epoch: 53, step: 1329, loss: 0.32940709590911865, mean loss: 0.341250292187684
Epoch: 53, step: 1330, loss: 0.29882752895355225, mean loss: 0.34124974734914404
Epoch: 53, step: 1331, loss: 0.32954689860343933, mean loss: 0.34124959705056257
Epoch: 53, step: 1332, loss: 0.3332715332508087, mean loss: 0.34124949459035836
Epoch: 53, step: 1333, loss: 0.3657490015029907, mean loss: 0.34124980922713066
Epoch: 53, step: 1334, loss: 0.31889328360557556, mean loss: 0.34124952211544507
Epoch: 53, step: 1335, loss: 0.3813098669052124, mean loss: 0.3412500365802418
Epoch: 53, step: 1336, loss: 0.3519259989261627, mean loss: 0.34125017368181426
Epoch: 53, step: 1337, loss: 0.33185267448425293, mean loss: 0.34125005299991884
Epoch: 53, step: 1338, loss: 0.34355929493904114, mean loss: 0.34125008265462903
Epoch: 53, step: 1339, loss: 0.29948270320892334, mean loss: 0.34124954629522586
Epoch: 53, step: 1340, loss: 0.3360646963119507, mean loss: 0.3412494797143829
Epoch: 53, step: 1341, loss: 0.3634110987186432, mean loss: 0.34124976429741455
Epoch: 53, step: 1342, loss: 0.3333415687084198, mean loss: 0.3412496627475515
Epoch: 53, step: 1343, loss: 0.3247160315513611, mean loss: 0.34124945044040683
Epoch: 53, step: 1344, loss: 0.31021344661712646, mean loss: 0.3412490519144772
Epoch: 53, step: 1345, loss: 0.3728463649749756, mean loss: 0.34124945764283515
Epoch: 53, step: 1346, loss: 0.2803901135921478, mean loss: 0.3412486761825692
Epoch: 53, step: 1347, loss: 0.3239876627922058, mean loss: 0.34124845454654723
Epoch: 53, step: 1348, loss: 0.385489821434021, mean loss: 0.34124902261021983
Epoch: 53, step: 1349, loss: 0.34249478578567505, mean loss: 0.34124903860574096
Epoch: 53, step: 1350, loss: 0.3621620833873749, mean loss: 0.3412493071244778
Epoch: 53, step: 1351, loss: 0.3270280063152313, mean loss: 0.34124912452855555
Epoch: 53, step: 1352, loss: 0.3492305278778076, mean loss: 0.34124922700532706
Epoch: 53, step: 1353, loss: 0.32775092124938965, mean loss: 0.341249053696828
Epoch: 53, step: 1354, loss: 0.3783038854598999, mean loss: 0.34124952944800296
Epoch: 53, step: 1355, loss: 0.3320657014846802, mean loss: 0.34124941153731114
Epoch: 53, step: 1356, loss: 0.3073740005493164, mean loss: 0.341248976618247
Epoch: 53, step: 1357, loss: 0.35540226101875305, mean loss: 0.34124915832686686
Epoch: 53, step: 1358, loss: 0.32135283946990967, mean loss: 0.3412489028888977
Epoch: 53, step: 1359, loss: 0.3481883406639099, mean loss: 0.3412489919794047
Epoch: 53, step: 1360, loss: 0.33019116520881653, mean loss: 0.3412488500176524
Epoch: 53, step: 1361, loss: 0.3351186215877533, mean loss: 0.3412487713180295
Epoch: 53, step: 1362, loss: 0.3134637176990509, mean loss: 0.3412484146192219
Epoch: 53, step: 1363, loss: 0.32739168405532837, mean loss: 0.3412482367316466
Epoch: 53, step: 1364, loss: 0.3364419937133789, mean loss: 0.34124817503167076
Epoch: 53, step: 1365, loss: 0.3314393162727356, mean loss: 0.34124804911240764
Epoch: 53, step: 1366, loss: 0.34649163484573364, mean loss: 0.34124811642502695
Epoch: 53, step: 1367, loss: 0.35287967324256897, mean loss: 0.3412482657389784
Epoch: 53, step: 1368, loss: 0.3246908485889435, mean loss: 0.3412480531946317
Epoch: 53, step: 1369, loss: 0.40121588110923767, mean loss: 0.34124882298010467
Epoch: 53, step: 1370, loss: 0.3323582708835602, mean loss: 0.3412487088567449
Epoch: 53, step: 1371, loss: 0.3802292048931122, mean loss: 0.3412492092225289
Epoch: 53, step: 1372, loss: 0.3367912471294403, mean loss: 0.341249151999474
Epoch: 53, step: 1373, loss: 0.289625346660614, mean loss: 0.34124848935724694
Epoch: 53, step: 1374, loss: 0.3220680356025696, mean loss: 0.3412482431604513
Epoch: 53, step: 1375, loss: 0.33698180317878723, mean loss: 0.34124818839791116
Epoch: 53, step: 1376, loss: 0.3213915228843689, mean loss: 0.34124793352792804
Epoch: 53, step: 1377, loss: 0.30654817819595337, mean loss: 0.341247488145367
Epoch: 53, step: 1378, loss: 0.3347150981426239, mean loss: 0.3412474043011088
Epoch: 53, step: 1379, loss: 0.34549087285995483, mean loss: 0.34124745876599943
Epoch: 53, step: 1380, loss: 0.33447006344795227, mean loss: 0.3412473717792922
Epoch: 53, step: 1381, loss: 0.3680390417575836, mean loss: 0.34124771564137063
Epoch: 53, step: 1382, loss: 0.32870832085609436, mean loss: 0.3412475547045191
Epoch: 53, step: 1383, loss: 0.3518263101577759, mean loss: 0.3412476904758043
Epoch: 53, step: 1384, loss: 0.3249434232711792, mean loss: 0.3412474812240722
Epoch: 53, step: 1385, loss: 0.32262250781059265, mean loss: 0.34124724219107067
Epoch: 53, step: 1386, loss: 0.34151458740234375, mean loss: 0.34124724562213643
Epoch: 53, step: 1387, loss: 0.3338455557823181, mean loss: 0.3412471506312504
Epoch: 53, step: 1388, loss: 0.30569058656692505, mean loss: 0.3412466943156992
Epoch: 53, step: 1389, loss: 0.3287290036678314, mean loss: 0.34124653367184193
Epoch: 53, step: 1390, loss: 0.3234454095363617, mean loss: 0.34124630522678545
Epoch: 53, step: 1391, loss: 0.3715112507343292, mean loss: 0.34124669361733917
Epoch: 53, step: 1392, loss: 0.3124839663505554, mean loss: 0.34124632450951414
Epoch: 53, step: 1393, loss: 0.3022283613681793, mean loss: 0.34124582380418933
Epoch: 53, step: 1394, loss: 0.3410266041755676, mean loss: 0.34124582099104844
Epoch: 53, step: 1395, loss: 0.3506411612033844, mean loss: 0.34124594155541826
Epoch: 53, step: 1396, loss: 0.40005701780319214, mean loss: 0.3412466962305231
Epoch: 53, step: 1397, loss: 0.3162608742713928, mean loss: 0.34124637561173754
Epoch: 53, step: 1398, loss: 0.37595775723457336, mean loss: 0.3412468210234687
Epoch: 53, step: 1399, loss: 0.347867876291275, mean loss: 0.34124690598285984
Epoch: 53, step: 1400, loss: 0.3157559931278229, mean loss: 0.34124657889532495
Epoch: 53, step: 1401, loss: 0.3446229100227356, mean loss: 0.34124662221827934
Epoch: 53, step: 1402, loss: 0.3381963074207306, mean loss: 0.34124658307906336
Epoch: 53, step: 1403, loss: 0.306569367647171, mean loss: 0.34124613813429544
Epoch: 53, step: 1404, loss: 0.3431990444660187, mean loss: 0.34124616319179485
Epoch: 53, step: 1405, loss: 0.3478141725063324, mean loss: 0.3412462474640281
Epoch: 53, step: 1406, loss: 0.32318243384361267, mean loss: 0.34124601569541907
Epoch: 53, step: 1407, loss: 0.33630967140197754, mean loss: 0.3412459523602344
Epoch: 53, step: 1408, loss: 0.3506093919277191, mean loss: 0.3412460724952028
Epoch: 53, step: 1409, loss: 0.30446869134902954, mean loss: 0.3412456006394492
Epoch: 53, step: 1410, loss: 0.3362969756126404, mean loss: 0.34124553714914185
Epoch: 53, step: 1411, loss: 0.3497798442840576, mean loss: 0.3412456466419461
Epoch: 53, step: 1412, loss: 0.3505379259586334, mean loss: 0.3412457658577947
Epoch: 53, step: 1413, loss: 0.33500176668167114, mean loss: 0.34124568575106473
Epoch: 53, step: 1414, loss: 0.30760347843170166, mean loss: 0.34124525414744533
Epoch: 53, step: 1415, loss: 0.3262920081615448, mean loss: 0.34124506231127266
Epoch: 53, step: 1416, loss: 0.38001546263694763, mean loss: 0.34124555969289816
Epoch: 53, step: 1417, loss: 0.34308114647865295, mean loss: 0.3412455832411571
Epoch: 53, step: 1418, loss: 0.39164650440216064, mean loss: 0.34124622981299274
Epoch: 53, step: 1419, loss: 0.3528358042240143, mean loss: 0.3412463784887729
Epoch: 53, step: 1420, loss: 0.36446383595466614, mean loss: 0.3412466763279512
Epoch: 53, step: 1421, loss: 0.3433082103729248, mean loss: 0.3412467027734709
Epoch: 53, step: 1422, loss: 0.2986249625682831, mean loss: 0.34124615602547265
Epoch: 53, step: 1423, loss: 0.32281750440597534, mean loss: 0.3412459196273555
Epoch: 53, step: 1424, loss: 0.35615989565849304, mean loss: 0.34124611093764234
Epoch: 53, step: 1425, loss: 0.32430872321128845, mean loss: 0.3412458936746581
Epoch: 53, step: 1426, loss: 0.34917593002319336, mean loss: 0.3412459953952593
Epoch: 53, step: 1427, loss: 0.3375339210033417, mean loss: 0.34124594778014394
Epoch: 53, step: 1428, loss: 0.32248595356941223, mean loss: 0.34124570714708113
Epoch: 53, step: 1429, loss: 0.3319183886051178, mean loss: 0.3412455875077884
Epoch: 53, step: 1430, loss: 0.34789156913757324, mean loss: 0.34124567275311796
Epoch: 53, step: 1431, loss: 0.3588673174381256, mean loss: 0.3412458987759578
Epoch: 53, step: 1432, loss: 0.3209042251110077, mean loss: 0.3412456378681958
Epoch: 53, step: 1433, loss: 0.35719504952430725, mean loss: 0.3412458424370034
Epoch: 53, step: 1434, loss: 0.33375927805900574, mean loss: 0.341245746414784
Epoch: 53, step: 1435, loss: 0.37422606348991394, mean loss: 0.3412461694128996
Epoch: 53, step: 1436, loss: 0.34431225061416626, mean loss: 0.34124620873726186
Epoch: 53, step: 1437, loss: 0.3165806829929352, mean loss: 0.34124589239090114
Epoch: 53, step: 1438, loss: 0.3303060829639435, mean loss: 0.34124575208476904
Epoch: 53, step: 1439, loss: 0.3264355957508087, mean loss: 0.34124556214278556
Epoch: 53, step: 1440, loss: 0.3255719840526581, mean loss: 0.34124536112989534
Epoch: 53, step: 1441, loss: 0.32968834042549133, mean loss: 0.3412452129135578
Epoch: 53, step: 1442, loss: 0.2963303327560425, mean loss: 0.34124463689714024
Epoch: 53, step: 1443, loss: 0.3118348717689514, mean loss: 0.3412442597328188
Valid: 53, mean loss: 0.18529472251733145
Epoch: 54, step: 0, loss: 0.3174373507499695, mean loss: 0.3412439544260106
Epoch: 54, step: 1, loss: 0.3486962616443634, mean loss: 0.3412440499953663
Epoch: 54, step: 2, loss: 0.32619956135749817, mean loss: 0.34124385706536414
Epoch: 54, step: 3, loss: 0.35536035895347595, mean loss: 0.3412440380925748
Epoch: 54, step: 4, loss: 0.317945271730423, mean loss: 0.34124373931766344
Epoch: 54, step: 5, loss: 0.3567870557308197, mean loss: 0.3412439386369476
Epoch: 54, step: 6, loss: 0.37647736072540283, mean loss: 0.3412443904459584
Epoch: 54, step: 7, loss: 0.33527275919914246, mean loss: 0.3412443138708757
Epoch: 54, step: 8, loss: 0.3191341459751129, mean loss: 0.34124403035266204
Epoch: 54, step: 9, loss: 0.32268717885017395, mean loss: 0.3412437924016003
Epoch: 54, step: 10, loss: 0.3321194052696228, mean loss: 0.3412436754027783
Epoch: 54, step: 11, loss: 0.338072806596756, mean loss: 0.341243634744359
Epoch: 54, step: 12, loss: 0.32521963119506836, mean loss: 0.34124342927944024
Epoch: 54, step: 13, loss: 0.3202858865261078, mean loss: 0.34124316055854326
Epoch: 54, step: 14, loss: 0.304025799036026, mean loss: 0.3412426833578211
Epoch: 54, step: 15, loss: 0.292012095451355, mean loss: 0.34124205213169656
Epoch: 54, step: 16, loss: 0.32496482133865356, mean loss: 0.3412418434305209
Epoch: 54, step: 17, loss: 0.3573557734489441, mean loss: 0.3412420500352599
Epoch: 54, step: 18, loss: 0.3468359112739563, mean loss: 0.34124212175602714
Epoch: 54, step: 19, loss: 0.32952550053596497, mean loss: 0.34124197153523095
Epoch: 54, step: 20, loss: 0.32948917150497437, mean loss: 0.341241820852512
Epoch: 54, step: 21, loss: 0.3235253393650055, mean loss: 0.34124159371230983
Epoch: 54, step: 22, loss: 0.3164046108722687, mean loss: 0.3412412752853705
Epoch: 54, step: 23, loss: 0.2971033453941345, mean loss: 0.3412407094144745
Epoch: 54, step: 24, loss: 0.35088714957237244, mean loss: 0.3412408330851987
Epoch: 54, step: 25, loss: 0.33722028136253357, mean loss: 0.3412407815409854
Epoch: 54, step: 26, loss: 0.36411532759666443, mean loss: 0.34124107479311744
Epoch: 54, step: 27, loss: 0.32448244094848633, mean loss: 0.341240859949855
Epoch: 54, step: 28, loss: 0.3607701361179352, mean loss: 0.3412411103091418
Epoch: 54, step: 29, loss: 0.30082738399505615, mean loss: 0.34124059222429814
Epoch: 54, step: 30, loss: 0.2934846580028534, mean loss: 0.3412399800236723
Epoch: 54, step: 31, loss: 0.30639371275901794, mean loss: 0.3412395333224716
Epoch: 54, step: 32, loss: 0.3427395522594452, mean loss: 0.34123955255126487
Epoch: 54, step: 33, loss: 0.35067617893218994, mean loss: 0.34123967351814577
Epoch: 54, step: 34, loss: 0.30947479605674744, mean loss: 0.3412392663335505
Epoch: 54, step: 35, loss: 0.37227582931518555, mean loss: 0.3412396641769974
Epoch: 54, step: 36, loss: 0.36385947465896606, mean loss: 0.3412399541262428
Epoch: 54, step: 37, loss: 0.31934505701065063, mean loss: 0.3412396734728073
Epoch: 54, step: 38, loss: 0.3224121630191803, mean loss: 0.34123943214087815
Epoch: 54, step: 39, loss: 0.3209345042705536, mean loss: 0.341239171874678
Epoch: 54, step: 40, loss: 0.37034380435943604, mean loss: 0.34123954492968506
Epoch: 54, step: 41, loss: 0.3341599404811859, mean loss: 0.34123945418646623
Epoch: 54, step: 42, loss: 0.3112628161907196, mean loss: 0.34123906996418707
Epoch: 54, step: 43, loss: 0.32177406549453735, mean loss: 0.34123882047681886
Epoch: 54, step: 44, loss: 0.3495262563228607, mean loss: 0.3412389266973985
Epoch: 54, step: 45, loss: 0.35043099522590637, mean loss: 0.3412390445112014
Epoch: 54, step: 46, loss: 0.37858182191848755, mean loss: 0.3412395231236286
Epoch: 54, step: 47, loss: 0.34972327947616577, mean loss: 0.3412396318562795
Epoch: 54, step: 48, loss: 0.3551846742630005, mean loss: 0.3412398105815907
Epoch: 54, step: 49, loss: 0.34138837456703186, mean loss: 0.3412398124856225
Epoch: 54, step: 50, loss: 0.31777188181877136, mean loss: 0.3412395117188281
Epoch: 54, step: 51, loss: 0.34919124841690063, mean loss: 0.34123961362758776
Epoch: 54, step: 52, loss: 0.3094625473022461, mean loss: 0.3412392063807138
Epoch: 54, step: 53, loss: 0.340331494808197, mean loss: 0.34123919474786013
Epoch: 54, step: 54, loss: 0.29953062534332275, mean loss: 0.34123866023504595
Epoch: 54, step: 55, loss: 0.30988866090774536, mean loss: 0.34123825847680156
Epoch: 54, step: 56, loss: 0.2875579297542572, mean loss: 0.34123757055850135
Epoch: 54, step: 57, loss: 0.27447617053985596, mean loss: 0.34123671501604524
Epoch: 54, step: 58, loss: 0.3293013870716095, mean loss: 0.341236562067651
Epoch: 54, step: 59, loss: 0.29312121868133545, mean loss: 0.3412359454888491
Epoch: 54, step: 60, loss: 0.32494619488716125, mean loss: 0.34123573674491225
Epoch: 54, step: 61, loss: 0.29333341121673584, mean loss: 0.3412351229115807
Epoch: 54, step: 62, loss: 0.3342553675174713, mean loss: 0.34123503347225687
Epoch: 54, step: 63, loss: 0.3424358665943146, mean loss: 0.3412350488596623
Epoch: 54, step: 64, loss: 0.36776164174079895, mean loss: 0.34123538876551796
Epoch: 54, step: 65, loss: 0.30796563625335693, mean loss: 0.3412349624597786
Epoch: 54, step: 66, loss: 0.35690009593963623, mean loss: 0.34123516318416747
Epoch: 54, step: 67, loss: 0.3578124940395355, mean loss: 0.3412353755942292
Epoch: 54, step: 68, loss: 0.32713866233825684, mean loss: 0.34123519497134164
Epoch: 54, step: 69, loss: 0.3064662218093872, mean loss: 0.3412347494780023
Epoch: 54, step: 70, loss: 0.332803338766098, mean loss: 0.3412346414480881
Epoch: 54, step: 71, loss: 0.3651106357574463, mean loss: 0.34123494736232435
Epoch: 54, step: 72, loss: 0.3206077814102173, mean loss: 0.3412346830775039
Epoch: 54, step: 73, loss: 0.3793049156665802, mean loss: 0.34123517084473753
Epoch: 54, step: 74, loss: 0.3209936320781708, mean loss: 0.341234911507397
Epoch: 54, step: 75, loss: 0.3682408630847931, mean loss: 0.3412352575068791
Epoch: 54, step: 76, loss: 0.33469533920288086, mean loss: 0.34123517371870565
Epoch: 54, step: 77, loss: 0.33578020334243774, mean loss: 0.3412351038315714
Epoch: 54, step: 78, loss: 0.3522990345954895, mean loss: 0.341235245576889
Epoch: 54, step: 79, loss: 0.3037621080875397, mean loss: 0.3412347654967223
Epoch: 54, step: 80, loss: 0.3484652042388916, mean loss: 0.3412348581269636
Epoch: 54, step: 81, loss: 0.34380778670310974, mean loss: 0.34123489108871735
Epoch: 54, step: 82, loss: 0.34118127822875977, mean loss: 0.34123489040189253
Epoch: 54, step: 83, loss: 0.3820062279701233, mean loss: 0.3412354127095734
Epoch: 54, step: 84, loss: 0.3576359152793884, mean loss: 0.34123562280811903
Epoch: 54, step: 85, loss: 0.3267231285572052, mean loss: 0.3412354368982749
Epoch: 54, step: 86, loss: 0.35561084747314453, mean loss: 0.3412356210496728
Epoch: 54, step: 87, loss: 0.32124683260917664, mean loss: 0.3412353649932519
Epoch: 54, step: 88, loss: 0.35138508677482605, mean loss: 0.3412354950095432
Epoch: 54, step: 89, loss: 0.38908252120018005, mean loss: 0.34123610791434417
Epoch: 54, step: 90, loss: 0.33616045117378235, mean loss: 0.3412360428976695
Epoch: 54, step: 91, loss: 0.3034440279006958, mean loss: 0.34123555880668477
Epoch: 54, step: 92, loss: 0.3419038653373718, mean loss: 0.3412355673671445
Epoch: 54, step: 93, loss: 0.38020822405815125, mean loss: 0.34123606656858796
Epoch: 54, step: 94, loss: 0.3317306339740753, mean loss: 0.3412359448148946
Epoch: 54, step: 95, loss: 0.323943167924881, mean loss: 0.3412357233170863
Epoch: 54, step: 96, loss: 0.3204836845397949, mean loss: 0.34123545751407147
Epoch: 54, step: 97, loss: 0.3390093743801117, mean loss: 0.3412354290015944
Epoch: 54, step: 98, loss: 0.36005493998527527, mean loss: 0.3412356700456032
Epoch: 54, step: 99, loss: 0.33206063508987427, mean loss: 0.3412355525314509
Epoch: 54, step: 100, loss: 0.33171167969703674, mean loss: 0.34123543055093375
Epoch: 54, step: 101, loss: 0.3170536160469055, mean loss: 0.34123512083738444
Epoch: 54, step: 102, loss: 0.3398059606552124, mean loss: 0.3412351025333567
Epoch: 54, step: 103, loss: 0.35168176889419556, mean loss: 0.3412352363277517
Epoch: 54, step: 104, loss: 0.3471238315105438, mean loss: 0.3412353117442446
Epoch: 54, step: 105, loss: 0.33704474568367004, mean loss: 0.34123525807545974
Epoch: 54, step: 106, loss: 0.31894469261169434, mean loss: 0.34123497260275165
Epoch: 54, step: 107, loss: 0.31667864322662354, mean loss: 0.34123465811669335
Epoch: 54, step: 108, loss: 0.33551400899887085, mean loss: 0.34123458485487457
Epoch: 54, step: 109, loss: 0.36513495445251465, mean loss: 0.34123489093239934
Epoch: 54, step: 110, loss: 0.3468635380268097, mean loss: 0.3412349630141427
Epoch: 54, step: 111, loss: 0.3304578363895416, mean loss: 0.34123482500155916
Epoch: 54, step: 112, loss: 0.32335472106933594, mean loss: 0.34123459603071904
Epoch: 54, step: 113, loss: 0.3464926779270172, mean loss: 0.3412346633643328
Epoch: 54, step: 114, loss: 0.34666478633880615, mean loss: 0.34123473290016887
Epoch: 54, step: 115, loss: 0.3162480890750885, mean loss: 0.341234412935975
Epoch: 54, step: 116, loss: 0.3172895908355713, mean loss: 0.34123410631666085
Epoch: 54, step: 117, loss: 0.3493826985359192, mean loss: 0.3412342106600447
Epoch: 54, step: 118, loss: 0.3414478302001953, mean loss: 0.3412342133954252
Epoch: 54, step: 119, loss: 0.31202971935272217, mean loss: 0.34123383943908886
Epoch: 54, step: 120, loss: 0.3068525791168213, mean loss: 0.34123339920117546
Epoch: 54, step: 121, loss: 0.32710427045822144, mean loss: 0.3412332182858032
Epoch: 54, step: 122, loss: 0.35877928137779236, mean loss: 0.3412334429501791
Epoch: 54, step: 123, loss: 0.3534444570541382, mean loss: 0.34123359930119196
Epoch: 54, step: 124, loss: 0.316443532705307, mean loss: 0.3412332818908311
Epoch: 54, step: 125, loss: 0.3363639712333679, mean loss: 0.3412332195453001
Epoch: 54, step: 126, loss: 0.2991781532764435, mean loss: 0.34123268108882254
Epoch: 54, step: 127, loss: 0.29167813062667847, mean loss: 0.3412320466200314
Epoch: 54, step: 128, loss: 0.30337265133857727, mean loss: 0.3412315618956824
Epoch: 54, step: 129, loss: 0.33332353830337524, mean loss: 0.341231460648357
Epoch: 54, step: 130, loss: 0.3570448160171509, mean loss: 0.341231663105952
Epoch: 54, step: 131, loss: 0.32962653040885925, mean loss: 0.3412315145279229
Epoch: 54, step: 132, loss: 0.35800936818122864, mean loss: 0.3412317293284408
Epoch: 54, step: 133, loss: 0.3470699191093445, mean loss: 0.3412318040716207
Epoch: 54, step: 134, loss: 0.35441580414772034, mean loss: 0.341231972857068
Epoch: 54, step: 135, loss: 0.32892194390296936, mean loss: 0.34123181526247365
Epoch: 54, step: 136, loss: 0.3557237386703491, mean loss: 0.3412320007875899
Epoch: 54, step: 137, loss: 0.3528193235397339, mean loss: 0.3412321491262072
Epoch: 54, step: 138, loss: 0.3329905867576599, mean loss: 0.3412320436207042
Epoch: 54, step: 139, loss: 0.3206873834133148, mean loss: 0.3412317806187557
Epoch: 54, step: 140, loss: 0.36005914211273193, mean loss: 0.34123202163366273
Epoch: 54, step: 141, loss: 0.327815979719162, mean loss: 0.34123184989293825
Epoch: 54, step: 142, loss: 0.33301207423210144, mean loss: 0.3412317446717288
Epoch: 54, step: 143, loss: 0.2899290919303894, mean loss: 0.34123108795574386
Epoch: 54, step: 144, loss: 0.34322887659072876, mean loss: 0.34123111352874774
Epoch: 54, step: 145, loss: 0.38725894689559937, mean loss: 0.3412317027076393
Epoch: 54, step: 146, loss: 0.3374868631362915, mean loss: 0.34123165477246564
Epoch: 54, step: 147, loss: 0.3327038586139679, mean loss: 0.3412315456152776
Epoch: 54, step: 148, loss: 0.3198375105857849, mean loss: 0.3412312717716292
Epoch: 54, step: 149, loss: 0.3066859543323517, mean loss: 0.34123082959722584
Epoch: 54, step: 150, loss: 0.3184925317764282, mean loss: 0.34123053855446445
Epoch: 54, step: 151, loss: 0.3014383614063263, mean loss: 0.34123002923415485
Epoch: 54, step: 152, loss: 0.31708166003227234, mean loss: 0.3412297201508541
Epoch: 54, step: 153, loss: 0.3356126546859741, mean loss: 0.3412296482570174
Epoch: 54, step: 154, loss: 0.38057729601860046, mean loss: 0.3412301518682314
Epoch: 54, step: 155, loss: 0.3289070427417755, mean loss: 0.34122999414656646
Epoch: 54, step: 156, loss: 0.3605230450630188, mean loss: 0.341230241072333
Epoch: 54, step: 157, loss: 0.34038597345352173, mean loss: 0.34123023026695226
Epoch: 54, step: 158, loss: 0.3262089192867279, mean loss: 0.3412300380187795
Epoch: 54, step: 159, loss: 0.3491169512271881, mean loss: 0.34123013895705645
Epoch: 54, step: 160, loss: 0.3116984963417053, mean loss: 0.3412297610100836
Epoch: 54, step: 161, loss: 0.3249683082103729, mean loss: 0.3412295528981176
Epoch: 54, step: 162, loss: 0.2998872995376587, mean loss: 0.3412290238120868
Epoch: 54, step: 163, loss: 0.33874091506004333, mean loss: 0.3412289919704084
Epoch: 54, step: 164, loss: 0.30433279275894165, mean loss: 0.34122851979575985
Epoch: 54, step: 165, loss: 0.2856602966785431, mean loss: 0.34122780867724334
Epoch: 54, step: 166, loss: 0.3190612196922302, mean loss: 0.3412275250102612
Epoch: 54, step: 167, loss: 0.30954837799072266, mean loss: 0.3412271196157713
Epoch: 54, step: 168, loss: 0.3251669108867645, mean loss: 0.34122691409771216
Epoch: 54, step: 169, loss: 0.35605546832084656, mean loss: 0.34122710385220023
Epoch: 54, step: 170, loss: 0.3131760060787201, mean loss: 0.3412267448992299
Epoch: 54, step: 171, loss: 0.3232206106185913, mean loss: 0.341226514488544
Epoch: 54, step: 172, loss: 0.3263377845287323, mean loss: 0.3412263239713274
Epoch: 54, step: 173, loss: 0.3191344738006592, mean loss: 0.3412260412861045
Epoch: 54, step: 174, loss: 0.35755643248558044, mean loss: 0.34122625024557013
Epoch: 54, step: 175, loss: 0.31954440474510193, mean loss: 0.34122597281382816
Epoch: 54, step: 176, loss: 0.3636132776737213, mean loss: 0.34122625926866496
Epoch: 54, step: 177, loss: 0.3421768248081207, mean loss: 0.34122627143138906
Epoch: 54, step: 178, loss: 0.3240993916988373, mean loss: 0.34122605229147823
Epoch: 54, step: 179, loss: 0.3781566619873047, mean loss: 0.3412265248157847
Epoch: 54, step: 180, loss: 0.30538415908813477, mean loss: 0.34122606622134366
Epoch: 54, step: 181, loss: 0.34067302942276, mean loss: 0.3412260591454615
Epoch: 54, step: 182, loss: 0.31602466106414795, mean loss: 0.3412257367078909
Epoch: 54, step: 183, loss: 0.3373798429965973, mean loss: 0.34122568750249543
Epoch: 54, step: 184, loss: 0.3318644165992737, mean loss: 0.34122556773341745
Epoch: 54, step: 185, loss: 0.3259155750274658, mean loss: 0.3412253718582773
Epoch: 54, step: 186, loss: 0.3303464949131012, mean loss: 0.34122523267635047
Epoch: 54, step: 187, loss: 0.31385135650634766, mean loss: 0.3412248824655607
Epoch: 54, step: 188, loss: 0.3139355182647705, mean loss: 0.341224533340451
Epoch: 54, step: 189, loss: 0.3107154071331024, mean loss: 0.34122414302847126
Epoch: 54, step: 190, loss: 0.32747918367385864, mean loss: 0.3412239671875236
Epoch: 54, step: 191, loss: 0.3478432893753052, mean loss: 0.34122405186823934
Epoch: 54, step: 192, loss: 0.3265514373779297, mean loss: 0.34122386416448863
Epoch: 54, step: 193, loss: 0.30883169174194336, mean loss: 0.34122344978336516
Epoch: 54, step: 194, loss: 0.3259952664375305, mean loss: 0.34122325497732015
Epoch: 54, step: 195, loss: 0.32984837889671326, mean loss: 0.34122310946644563
Epoch: 54, step: 196, loss: 0.3312593400478363, mean loss: 0.3412229820085072
Epoch: 54, step: 197, loss: 0.33956027030944824, mean loss: 0.3412229607391376
Epoch: 54, step: 198, loss: 0.35133665800094604, mean loss: 0.34122309011166413
Epoch: 54, step: 199, loss: 0.3148115277290344, mean loss: 0.34122275226421245
Epoch: 54, step: 200, loss: 0.3044719099998474, mean loss: 0.3412222821663286
Epoch: 54, step: 201, loss: 0.3756500482559204, mean loss: 0.341222722542983
Epoch: 54, step: 202, loss: 0.3519899249076843, mean loss: 0.34122286026797777
Epoch: 54, step: 203, loss: 0.3470603823661804, mean loss: 0.34122293493569456
Epoch: 54, step: 204, loss: 0.37477126717567444, mean loss: 0.3412233640467604
Epoch: 54, step: 205, loss: 0.3522936701774597, mean loss: 0.34122350564337
Epoch: 54, step: 206, loss: 0.35385510325431824, mean loss: 0.34122366720787395
Epoch: 54, step: 207, loss: 0.3030410706996918, mean loss: 0.34122317883945447
Epoch: 54, step: 208, loss: 0.3140731453895569, mean loss: 0.3412228315857172
Epoch: 54, step: 209, loss: 0.3400132656097412, mean loss: 0.341222816115352
Epoch: 54, step: 210, loss: 0.3429131805896759, mean loss: 0.34122283773486
Epoch: 54, step: 211, loss: 0.34417471289634705, mean loss: 0.3412228754884176
Epoch: 54, step: 212, loss: 0.32571956515312195, mean loss: 0.34122267720847627
Epoch: 54, step: 213, loss: 0.3115406930446625, mean loss: 0.34122229759491746
Epoch: 54, step: 214, loss: 0.3243268132209778, mean loss: 0.34122208151526157
Epoch: 54, step: 215, loss: 0.33401063084602356, mean loss: 0.3412219892877873
Epoch: 54, step: 216, loss: 0.3471522927284241, mean loss: 0.3412220651296586
Epoch: 54, step: 217, loss: 0.34661829471588135, mean loss: 0.34122213414044694
Epoch: 54, step: 218, loss: 0.3556728661060333, mean loss: 0.3412223189442319
Epoch: 54, step: 219, loss: 0.30336397886276245, mean loss: 0.3412218347974714
Epoch: 54, step: 220, loss: 0.3149752616882324, mean loss: 0.34122149915066774
Epoch: 54, step: 221, loss: 0.33242011070251465, mean loss: 0.3412213865980648
Epoch: 54, step: 222, loss: 0.31975752115249634, mean loss: 0.34122111212057216
Epoch: 54, step: 223, loss: 0.34009748697280884, mean loss: 0.34122109775196413
Epoch: 54, step: 224, loss: 0.3368349075317383, mean loss: 0.34122104166329237
Epoch: 54, step: 225, loss: 0.310498982667923, mean loss: 0.3412206488081353
Epoch: 54, step: 226, loss: 0.304295152425766, mean loss: 0.34122017663320103
Epoch: 54, step: 227, loss: 0.33661773800849915, mean loss: 0.34122011778149747
Epoch: 54, step: 228, loss: 0.36019107699394226, mean loss: 0.3412203603613736
Epoch: 54, step: 229, loss: 0.3496440649032593, mean loss: 0.3412204680731162
Epoch: 54, step: 230, loss: 0.31007927656173706, mean loss: 0.3412200698838043
Epoch: 54, step: 231, loss: 0.33931538462638855, mean loss: 0.3412200455297068
Epoch: 54, step: 232, loss: 0.3105500638484955, mean loss: 0.3412196533755854
Epoch: 54, step: 233, loss: 0.33328989148139954, mean loss: 0.3412195519849462
Epoch: 54, step: 234, loss: 0.34465986490249634, mean loss: 0.34121959597253
Epoch: 54, step: 235, loss: 0.29278361797332764, mean loss: 0.3412189766816539
Epoch: 54, step: 236, loss: 0.3343343436717987, mean loss: 0.3412188886575018
Epoch: 54, step: 237, loss: 0.3118252754211426, mean loss: 0.34121851284737525
Epoch: 54, step: 238, loss: 0.3499903976917267, mean loss: 0.3412186249983034
Epoch: 54, step: 239, loss: 0.32460179924964905, mean loss: 0.34121841255039315
Epoch: 54, step: 240, loss: 0.3133814334869385, mean loss: 0.34121805665616217
Epoch: 54, step: 241, loss: 0.34228572249412537, mean loss: 0.34121807030603607
Epoch: 54, step: 242, loss: 0.3698001801967621, mean loss: 0.34121843571737975
Epoch: 54, step: 243, loss: 0.32475242018699646, mean loss: 0.3412182252083599
Epoch: 54, step: 244, loss: 0.34360018372535706, mean loss: 0.34121825566000996
Epoch: 54, step: 245, loss: 0.3037428557872772, mean loss: 0.34121777656973007
Epoch: 54, step: 246, loss: 0.34553080797195435, mean loss: 0.34121783170736736
Epoch: 54, step: 247, loss: 0.34214523434638977, mean loss: 0.34121784356309753
Epoch: 54, step: 248, loss: 0.3535456359386444, mean loss: 0.3412180011571196
Epoch: 54, step: 249, loss: 0.3489856719970703, mean loss: 0.3412181004549341
Epoch: 54, step: 250, loss: 0.3329993486404419, mean loss: 0.341217995392081
Epoch: 54, step: 251, loss: 0.3068382740020752, mean loss: 0.34121755591105896
Epoch: 54, step: 252, loss: 0.2880072593688965, mean loss: 0.34121687572472725
Epoch: 54, step: 253, loss: 0.31601813435554504, mean loss: 0.34121655361375486
Epoch: 54, step: 254, loss: 0.3468155562877655, mean loss: 0.34121662518388274
Epoch: 54, step: 255, loss: 0.3724640905857086, mean loss: 0.34121702460439357
Epoch: 54, step: 256, loss: 0.3541748523712158, mean loss: 0.34121719023562036
Epoch: 54, step: 257, loss: 0.3255179524421692, mean loss: 0.34121698956535174
Epoch: 54, step: 258, loss: 0.34546250104904175, mean loss: 0.341217043831492
Epoch: 54, step: 259, loss: 0.302238792181015, mean loss: 0.34121654561773296
Epoch: 54, step: 260, loss: 0.3184956908226013, mean loss: 0.34121625520712423
Epoch: 54, step: 261, loss: 0.3384961783885956, mean loss: 0.3412162204404275
Epoch: 54, step: 262, loss: 0.32301974296569824, mean loss: 0.34121598786489005
Epoch: 54, step: 263, loss: 0.3628971576690674, mean loss: 0.34121626497595603
Epoch: 54, step: 264, loss: 0.33109453320503235, mean loss: 0.34121613560987213
Epoch: 54, step: 265, loss: 0.32173749804496765, mean loss: 0.3412158866561444
Epoch: 54, step: 266, loss: 0.3043050765991211, mean loss: 0.34121541491030055
Epoch: 54, step: 267, loss: 0.36876246333122253, mean loss: 0.3412157669762535
Epoch: 54, step: 268, loss: 0.3660607933998108, mean loss: 0.3412160845048678
Epoch: 54, step: 269, loss: 0.3044377565383911, mean loss: 0.34121561447025944
Epoch: 54, step: 270, loss: 0.29070860147476196, mean loss: 0.3412149689884775
Epoch: 54, step: 271, loss: 0.32686689496040344, mean loss: 0.3412147856218224
Epoch: 54, step: 272, loss: 0.3462405204772949, mean loss: 0.3412148498492867
Epoch: 54, step: 273, loss: 0.31830689311027527, mean loss: 0.3412145570958459
Epoch: 54, step: 274, loss: 0.3483070135116577, mean loss: 0.3412146477331083
Epoch: 54, step: 275, loss: 0.34904444217681885, mean loss: 0.3412147477918217
Epoch: 54, step: 276, loss: 0.365766316652298, mean loss: 0.34121506153786163
Epoch: 54, step: 277, loss: 0.3211512863636017, mean loss: 0.34121480514489544
Epoch: 54, step: 278, loss: 0.32142022252082825, mean loss: 0.34121455219514624
Epoch: 54, step: 279, loss: 0.35660621523857117, mean loss: 0.34121474887863434
Epoch: 54, step: 280, loss: 0.3376302421092987, mean loss: 0.34121470307433865
Epoch: 54, step: 281, loss: 0.34593015909194946, mean loss: 0.3412147633295971
Epoch: 54, step: 282, loss: 0.36896800994873047, mean loss: 0.3412151179628868
Epoch: 54, step: 283, loss: 0.32023316621780396, mean loss: 0.3412148498571911
Epoch: 54, step: 284, loss: 0.3097682297229767, mean loss: 0.34121444803993684
Epoch: 54, step: 285, loss: 0.30060040950775146, mean loss: 0.34121392909027376
Epoch: 54, step: 286, loss: 0.3075752258300781, mean loss: 0.34121349927409933
Epoch: 54, step: 287, loss: 0.35756972432136536, mean loss: 0.34121370826194874
Epoch: 54, step: 288, loss: 0.2881448268890381, mean loss: 0.3412130301953625
Epoch: 54, step: 289, loss: 0.357919842004776, mean loss: 0.34121324365729755
Epoch: 54, step: 290, loss: 0.3236903250217438, mean loss: 0.341213019770875
Epoch: 54, step: 291, loss: 0.36447271704673767, mean loss: 0.3412133169510415
Epoch: 54, step: 292, loss: 0.33144769072532654, mean loss: 0.34121319218100193
Epoch: 54, step: 293, loss: 0.30352601408958435, mean loss: 0.34121271067879044
Epoch: 54, step: 294, loss: 0.3179236948490143, mean loss: 0.3412124131354368
Epoch: 54, step: 295, loss: 0.37667596340179443, mean loss: 0.34121286621636315
Epoch: 54, step: 296, loss: 0.3111279308795929, mean loss: 0.3412124818573206
Epoch: 54, step: 297, loss: 0.3369867503643036, mean loss: 0.3412124278709204
Epoch: 54, step: 298, loss: 0.3169059157371521, mean loss: 0.34121211734377715
Epoch: 54, step: 299, loss: 0.348506897687912, mean loss: 0.34121221053684203
Epoch: 54, step: 300, loss: 0.3700423240661621, mean loss: 0.3412125788457135
Epoch: 54, step: 301, loss: 0.33338794112205505, mean loss: 0.3412124788861115
Epoch: 54, step: 302, loss: 0.32775062322616577, mean loss: 0.34121230691335175
Epoch: 54, step: 303, loss: 0.29892534017562866, mean loss: 0.3412117667119371
Epoch: 54, step: 304, loss: 0.30941542983055115, mean loss: 0.3412113605298893
Epoch: 54, step: 305, loss: 0.33582931756973267, mean loss: 0.34121129177790344
Epoch: 54, step: 306, loss: 0.3108215630054474, mean loss: 0.34121090357447775
Epoch: 54, step: 307, loss: 0.3056102991104126, mean loss: 0.34121044881227264
Epoch: 54, step: 308, loss: 0.3355323076248169, mean loss: 0.3412103762806103
Epoch: 54, step: 309, loss: 0.3173696994781494, mean loss: 0.341210071747529
Epoch: 54, step: 310, loss: 0.34103691577911377, mean loss: 0.341210069535719
Epoch: 54, step: 311, loss: 0.35198351740837097, mean loss: 0.34121020714873596
Epoch: 54, step: 312, loss: 0.3151443302631378, mean loss: 0.3412098742044285
Epoch: 54, step: 313, loss: 0.3076176047325134, mean loss: 0.34120944512958534
Epoch: 54, step: 314, loss: 0.3584786355495453, mean loss: 0.3412096657065408
Epoch: 54, step: 315, loss: 0.3248332738876343, mean loss: 0.34120945653584883
Epoch: 54, step: 316, loss: 0.3120688796043396, mean loss: 0.34120908433684083
Epoch: 54, step: 317, loss: 0.3469865024089813, mean loss: 0.34120915812816677
Epoch: 54, step: 318, loss: 0.29759499430656433, mean loss: 0.3412086010790088
Epoch: 54, step: 319, loss: 0.3508835732936859, mean loss: 0.3412087246481849
Epoch: 54, step: 320, loss: 0.3391176760196686, mean loss: 0.3412086979415598
Epoch: 54, step: 321, loss: 0.3069228529930115, mean loss: 0.3412082600524062
Epoch: 54, step: 322, loss: 0.34112125635147095, mean loss: 0.34120825894123363
Epoch: 54, step: 323, loss: 0.3380071222782135, mean loss: 0.3412082180582622
Epoch: 54, step: 324, loss: 0.34441831707954407, mean loss: 0.3412082590551718
Epoch: 54, step: 325, loss: 0.31166088581085205, mean loss: 0.34120788170372174
Epoch: 54, step: 326, loss: 0.2840290069580078, mean loss: 0.34120715147787156
Epoch: 54, step: 327, loss: 0.3295770585536957, mean loss: 0.34120700295298234
Epoch: 54, step: 328, loss: 0.35988283157348633, mean loss: 0.34120724145408216
Epoch: 54, step: 329, loss: 0.3483974039554596, mean loss: 0.34120733327543046
Epoch: 54, step: 330, loss: 0.336232453584671, mean loss: 0.34120726974497095
Epoch: 54, step: 331, loss: 0.3042607605457306, mean loss: 0.3412067979348213
Epoch: 54, step: 332, loss: 0.3004976809024811, mean loss: 0.3412062780824795
Epoch: 54, step: 333, loss: 0.3687012195587158, mean loss: 0.3412066291863165
Epoch: 54, step: 334, loss: 0.34869104623794556, mean loss: 0.3412067247593146
Epoch: 54, step: 335, loss: 0.32025808095932007, mean loss: 0.3412064572569676
Epoch: 54, step: 336, loss: 0.38406243920326233, mean loss: 0.3412070044966589
Epoch: 54, step: 337, loss: 0.33317962288856506, mean loss: 0.3412069019941484
Epoch: 54, step: 338, loss: 0.3197297155857086, mean loss: 0.34120662775311655
Epoch: 54, step: 339, loss: 0.3198048770427704, mean loss: 0.3412063544788085
Epoch: 54, step: 340, loss: 0.3375782370567322, mean loss: 0.3412063081527564
Epoch: 54, step: 341, loss: 0.36543384194374084, mean loss: 0.3412066175009751
Epoch: 54, step: 342, loss: 0.3054673373699188, mean loss: 0.34120616117134717
Epoch: 54, step: 343, loss: 0.3495257496833801, mean loss: 0.34120626739694104
Epoch: 54, step: 344, loss: 0.34810584783554077, mean loss: 0.3412063554905614
Epoch: 54, step: 345, loss: 0.35532575845718384, mean loss: 0.341206535764341
Epoch: 54, step: 346, loss: 0.32690882682800293, mean loss: 0.3412063532163163
Epoch: 54, step: 347, loss: 0.38440388441085815, mean loss: 0.3412069047398748
Epoch: 54, step: 348, loss: 0.3547481298446655, mean loss: 0.3412070776249703
Epoch: 54, step: 349, loss: 0.35471048951148987, mean loss: 0.34120725002509145
Epoch: 54, step: 350, loss: 0.31188493967056274, mean loss: 0.341206875667458
Epoch: 54, step: 351, loss: 0.3228246569633484, mean loss: 0.34120664098485787
Epoch: 54, step: 352, loss: 0.32096418738365173, mean loss: 0.3412063825562605
Epoch: 54, step: 353, loss: 0.3210894465446472, mean loss: 0.34120612573338277
Epoch: 54, step: 354, loss: 0.3300109803676605, mean loss: 0.3412059828123762
Epoch: 54, step: 355, loss: 0.3133947253227234, mean loss: 0.34120562776900326
Epoch: 54, step: 356, loss: 0.37514427304267883, mean loss: 0.3412060610301483
Epoch: 54, step: 357, loss: 0.3351724445819855, mean loss: 0.34120598400591295
Epoch: 54, step: 358, loss: 0.37866437435150146, mean loss: 0.34120646218795603
Epoch: 54, step: 359, loss: 0.32313716411590576, mean loss: 0.34120623152391816
Epoch: 54, step: 360, loss: 0.3596561551094055, mean loss: 0.34120646704383323
Epoch: 54, step: 361, loss: 0.3331274390220642, mean loss: 0.3412063639134492
Epoch: 54, step: 362, loss: 0.32189902663230896, mean loss: 0.34120611745463203
Epoch: 54, step: 363, loss: 0.3102574348449707, mean loss: 0.34120572239868857
Epoch: 54, step: 364, loss: 0.3151930570602417, mean loss: 0.34120539035460773
Epoch: 54, step: 365, loss: 0.2818812131881714, mean loss: 0.3412046331084669
Epoch: 54, step: 366, loss: 0.30466654896736145, mean loss: 0.34120416672239356
Epoch: 54, step: 367, loss: 0.32369375228881836, mean loss: 0.341203943215623
Epoch: 54, step: 368, loss: 0.363203763961792, mean loss: 0.34120422402257616
Epoch: 54, step: 369, loss: 0.2929132282733917, mean loss: 0.3412036076414495
Epoch: 54, step: 370, loss: 0.3374688923358917, mean loss: 0.3412035599725496
Epoch: 54, step: 371, loss: 0.4259378910064697, mean loss: 0.3412046414849179
Epoch: 54, step: 372, loss: 0.344628244638443, mean loss: 0.34120468518175073
Epoch: 54, step: 373, loss: 0.3227975070476532, mean loss: 0.34120445024648416
Epoch: 54, step: 374, loss: 0.31113019585609436, mean loss: 0.34120406640640055
Epoch: 54, step: 375, loss: 0.321259468793869, mean loss: 0.3412038118551752
Epoch: 54, step: 376, loss: 0.31411507725715637, mean loss: 0.3412034661283415
Epoch: 54, step: 377, loss: 0.3222598433494568, mean loss: 0.34120322435864525
Epoch: 54, step: 378, loss: 0.307097464799881, mean loss: 0.3412027890863645
Epoch: 54, step: 379, loss: 0.3309473991394043, mean loss: 0.3412026582043651
Epoch: 54, step: 380, loss: 0.3210386037826538, mean loss: 0.3412024008686526
Epoch: 54, step: 381, loss: 0.3578667938709259, mean loss: 0.34120261353861614
Epoch: 54, step: 382, loss: 0.32724303007125854, mean loss: 0.34120243538953987
Epoch: 54, step: 383, loss: 0.31639158725738525, mean loss: 0.34120211876309614
Epoch: 54, step: 384, loss: 0.34729012846946716, mean loss: 0.3412021964549289
Epoch: 54, step: 385, loss: 0.33981096744537354, mean loss: 0.34120217870105574
Epoch: 54, step: 386, loss: 0.34823372960090637, mean loss: 0.34120226843155227
Epoch: 54, step: 387, loss: 0.30384936928749084, mean loss: 0.34120179177263815
Epoch: 54, step: 388, loss: 0.31160715222358704, mean loss: 0.34120141412139654
Epoch: 54, step: 389, loss: 0.33864569664001465, mean loss: 0.34120138150881607
Epoch: 54, step: 390, loss: 0.3376214802265167, mean loss: 0.34120133582758183
Epoch: 54, step: 391, loss: 0.3315988779067993, mean loss: 0.34120121329723885
Epoch: 54, step: 392, loss: 0.3085656464099884, mean loss: 0.34120079686259136
Epoch: 54, step: 393, loss: 0.3034615218639374, mean loss: 0.34120031531002026
Epoch: 54, step: 394, loss: 0.32649558782577515, mean loss: 0.3412001276803169
Epoch: 54, step: 395, loss: 0.3123328387737274, mean loss: 0.3411997593435524
Epoch: 54, step: 396, loss: 0.31148603558540344, mean loss: 0.3411993802114054
Epoch: 54, step: 397, loss: 0.32718658447265625, mean loss: 0.34119920141747195
Epoch: 54, step: 398, loss: 0.3309025466442108, mean loss: 0.34119907004069655
Epoch: 54, step: 399, loss: 0.30833497643470764, mean loss: 0.3411986507274679
Epoch: 54, step: 400, loss: 0.3598611056804657, mean loss: 0.34119888883883925
Epoch: 54, step: 401, loss: 0.31420639157295227, mean loss: 0.3411985444501426
Epoch: 54, step: 402, loss: 0.3059846758842468, mean loss: 0.3411980951733138
Epoch: 54, step: 403, loss: 0.3469487130641937, mean loss: 0.3411981685417482
Epoch: 54, step: 404, loss: 0.30460408329963684, mean loss: 0.3411977016673113
Epoch: 54, step: 405, loss: 0.31838348507881165, mean loss: 0.34119741060282466
Epoch: 54, step: 406, loss: 0.3053458333015442, mean loss: 0.341196953213119
Epoch: 54, step: 407, loss: 0.33676910400390625, mean loss: 0.3411968967239221
Epoch: 54, step: 408, loss: 0.37383437156677246, mean loss: 0.34119731309790746
Epoch: 54, step: 409, loss: 0.3011602461338043, mean loss: 0.34119680232982436
Epoch: 54, step: 410, loss: 0.3109395205974579, mean loss: 0.3411964163311035
Epoch: 54, step: 411, loss: 0.3048427402973175, mean loss: 0.3411959525652715
Epoch: 54, step: 412, loss: 0.32005593180656433, mean loss: 0.34119568288431174
Epoch: 54, step: 413, loss: 0.31099003553390503, mean loss: 0.3411952975590489
Epoch: 54, step: 414, loss: 0.3310394287109375, mean loss: 0.3411951680050332
Epoch: 54, step: 415, loss: 0.3013768196105957, mean loss: 0.3411946600661058
Epoch: 54, step: 416, loss: 0.3220268487930298, mean loss: 0.34119441555688595
Epoch: 54, step: 417, loss: 0.3539603054523468, mean loss: 0.3411945783995767
Epoch: 54, step: 418, loss: 0.3383715748786926, mean loss: 0.34119454238958213
Epoch: 54, step: 419, loss: 0.32694581151008606, mean loss: 0.34119436063629266
Epoch: 54, step: 420, loss: 0.34232622385025024, mean loss: 0.3411943750738759
Epoch: 54, step: 421, loss: 0.33863988518714905, mean loss: 0.34119434249026553
Epoch: 54, step: 422, loss: 0.32043105363845825, mean loss: 0.34119407764901943
Epoch: 54, step: 423, loss: 0.3260577321052551, mean loss: 0.3411938845833875
Epoch: 54, step: 424, loss: 0.3483063578605652, mean loss: 0.3411939753025528
Epoch: 54, step: 425, loss: 0.30535608530044556, mean loss: 0.3411935181982697
Epoch: 54, step: 426, loss: 0.33212459087371826, mean loss: 0.34119340252760244
Epoch: 54, step: 427, loss: 0.35531941056251526, mean loss: 0.34119358269708405
Epoch: 54, step: 428, loss: 0.32099106907844543, mean loss: 0.34119332502839433
Epoch: 54, step: 429, loss: 0.3738655149936676, mean loss: 0.34119374173362055
Epoch: 54, step: 430, loss: 0.3247184157371521, mean loss: 0.34119353160791754
Epoch: 54, step: 431, loss: 0.32639575004577637, mean loss: 0.34119334287996167
Epoch: 54, step: 432, loss: 0.3036292493343353, mean loss: 0.34119286380111175
Epoch: 54, step: 433, loss: 0.3212081491947174, mean loss: 0.3411926089265472
Epoch: 54, step: 434, loss: 0.3221853971481323, mean loss: 0.3411923665216323
Epoch: 54, step: 435, loss: 0.30277901887893677, mean loss: 0.34119187663044676
Epoch: 54, step: 436, loss: 0.35843512415885925, mean loss: 0.341192096533365
Epoch: 54, step: 437, loss: 0.30453741550445557, mean loss: 0.34119162908264156
Epoch: 54, step: 438, loss: 0.3252495527267456, mean loss: 0.34119142577872835
Epoch: 54, step: 439, loss: 0.3260357081890106, mean loss: 0.34119123250544753
Epoch: 54, step: 440, loss: 0.33353546261787415, mean loss: 0.34119113487649094
Epoch: 54, step: 441, loss: 0.37955981492996216, mean loss: 0.3411916241605846
Epoch: 54, step: 442, loss: 0.3296249210834503, mean loss: 0.3411914766618524
Epoch: 54, step: 443, loss: 0.32677358388900757, mean loss: 0.3411912928070606
Epoch: 54, step: 444, loss: 0.34697872400283813, mean loss: 0.34119136660656835
Epoch: 54, step: 445, loss: 0.3330748975276947, mean loss: 0.34119126310921966
Epoch: 54, step: 446, loss: 0.3239761292934418, mean loss: 0.34119104359283015
Epoch: 54, step: 447, loss: 0.3523060381412506, mean loss: 0.3411911853223332
Epoch: 54, step: 448, loss: 0.34652280807495117, mean loss: 0.341191253306047
Epoch: 54, step: 449, loss: 0.3338225185871124, mean loss: 0.34119115934824323
Epoch: 54, step: 450, loss: 0.2935805916786194, mean loss: 0.3411905522796614
Epoch: 54, step: 451, loss: 0.34894901514053345, mean loss: 0.34119065120431663
Epoch: 54, step: 452, loss: 0.3161107897758484, mean loss: 0.34119033142641014
Epoch: 54, step: 453, loss: 0.3174538314342499, mean loss: 0.34119002878073895
Epoch: 54, step: 454, loss: 0.34657663106918335, mean loss: 0.34119009746024437
Epoch: 54, step: 455, loss: 0.3414154052734375, mean loss: 0.341190100332896
Epoch: 54, step: 456, loss: 0.3267919421195984, mean loss: 0.3411899167601879
Epoch: 54, step: 457, loss: 0.32380735874176025, mean loss: 0.3411896951399974
Epoch: 54, step: 458, loss: 0.2886873781681061, mean loss: 0.3411890257664146
Epoch: 54, step: 459, loss: 0.32667064666748047, mean loss: 0.34118884066800187
Epoch: 54, step: 460, loss: 0.3247057795524597, mean loss: 0.34118863052405046
Epoch: 54, step: 461, loss: 0.3098647892475128, mean loss: 0.34118823117881886
Epoch: 54, step: 462, loss: 0.34983187913894653, mean loss: 0.3411883413746138
Epoch: 54, step: 463, loss: 0.337027907371521, mean loss: 0.3411882883349146
Epoch: 54, step: 464, loss: 0.32197055220603943, mean loss: 0.3411880433388522
Epoch: 54, step: 465, loss: 0.3148826062679291, mean loss: 0.34118770798996934
Epoch: 54, step: 466, loss: 0.419772207736969, mean loss: 0.3411887097938237
Epoch: 54, step: 467, loss: 0.3379480540752411, mean loss: 0.3411886684821145
Epoch: 54, step: 468, loss: 0.30076441168785095, mean loss: 0.34118815316237716
Epoch: 54, step: 469, loss: 0.35414424538612366, mean loss: 0.3411883183217508
Epoch: 54, step: 470, loss: 0.3314361274242401, mean loss: 0.34118819400608674
Epoch: 54, step: 471, loss: 0.36007893085479736, mean loss: 0.34118843481193073
Epoch: 54, step: 472, loss: 0.33955129981040955, mean loss: 0.3411884139431497
Epoch: 54, step: 473, loss: 0.31279700994491577, mean loss: 0.341188052038701
Epoch: 54, step: 474, loss: 0.34267157316207886, mean loss: 0.34118807094886305
Epoch: 54, step: 475, loss: 0.34715986251831055, mean loss: 0.34118814706918593
Epoch: 54, step: 476, loss: 0.3019866645336151, mean loss: 0.34118764738807067
Epoch: 54, step: 477, loss: 0.35894331336021423, mean loss: 0.34118787370751863
Epoch: 54, step: 478, loss: 0.30403390526771545, mean loss: 0.3411874001370841
Epoch: 54, step: 479, loss: 0.31575891375541687, mean loss: 0.34118707602565373
Epoch: 54, step: 480, loss: 0.3327958285808563, mean loss: 0.34118696907219587
Epoch: 54, step: 481, loss: 0.35287943482398987, mean loss: 0.3411871181005391
Epoch: 54, step: 482, loss: 0.2932141125202179, mean loss: 0.3411865066600978
Epoch: 54, step: 483, loss: 0.3126644492149353, mean loss: 0.3411861431365515
Epoch: 54, step: 484, loss: 0.3440733551979065, mean loss: 0.3411861799346048
Epoch: 54, step: 485, loss: 0.3482602834701538, mean loss: 0.3411862700942176
Epoch: 54, step: 486, loss: 0.3896520137786865, mean loss: 0.3411868877833664
Epoch: 54, step: 487, loss: 0.31123217940330505, mean loss: 0.3411865060196483
Epoch: 54, step: 488, loss: 0.3319239616394043, mean loss: 0.34118638797282
Epoch: 54, step: 489, loss: 0.34794068336486816, mean loss: 0.3411864740520823
Epoch: 54, step: 490, loss: 0.438502699136734, mean loss: 0.34118771427058286
Epoch: 54, step: 491, loss: 0.32511743903160095, mean loss: 0.34118750947021537
Epoch: 54, step: 492, loss: 0.3619998097419739, mean loss: 0.34118777469979994
Epoch: 54, step: 493, loss: 0.3490755259990692, mean loss: 0.34118787521912325
Epoch: 54, step: 494, loss: 0.31191930174827576, mean loss: 0.3411875022332626
Epoch: 54, step: 495, loss: 0.33695852756500244, mean loss: 0.3411874483417514
Epoch: 54, step: 496, loss: 0.3609839379787445, mean loss: 0.3411877006131013
Epoch: 54, step: 497, loss: 0.30533093214035034, mean loss: 0.34118724368764225
Epoch: 54, step: 498, loss: 0.3673570156097412, mean loss: 0.34118757716673653
Epoch: 54, step: 499, loss: 0.27983230352401733, mean loss: 0.34118679533186164
Epoch: 54, step: 500, loss: 0.3354056775569916, mean loss: 0.34118672166546543
Epoch: 54, step: 501, loss: 0.33353230357170105, mean loss: 0.3411866241296198
Epoch: 54, step: 502, loss: 0.3376109004020691, mean loss: 0.3411865785668103
Epoch: 54, step: 503, loss: 0.328126460313797, mean loss: 0.34118641215347884
Epoch: 54, step: 504, loss: 0.3360520303249359, mean loss: 0.3411863467315063
Epoch: 54, step: 505, loss: 0.3197941184043884, mean loss: 0.34118607415654223
Epoch: 54, step: 506, loss: 0.32408198714256287, mean loss: 0.3411858562228876
Epoch: 54, step: 507, loss: 0.34499242901802063, mean loss: 0.3411859047241464
Epoch: 54, step: 508, loss: 0.3606204688549042, mean loss: 0.34118615234552796
Epoch: 54, step: 509, loss: 0.37397199869155884, mean loss: 0.3411865700741209
Epoch: 54, step: 510, loss: 0.3712086081504822, mean loss: 0.3411869525838114
Epoch: 54, step: 511, loss: 0.35091787576675415, mean loss: 0.34118707656356856
Epoch: 54, step: 512, loss: 0.317949116230011, mean loss: 0.34118678049710915
Epoch: 54, step: 513, loss: 0.3530840575695038, mean loss: 0.341186932074088
Epoch: 54, step: 514, loss: 0.3293089270591736, mean loss: 0.3411867807445723
Epoch: 54, step: 515, loss: 0.30854740738868713, mean loss: 0.34118636491399906
Epoch: 54, step: 516, loss: 0.3791182339191437, mean loss: 0.3411868481656139
Epoch: 54, step: 517, loss: 0.31220173835754395, mean loss: 0.34118647890032217
Epoch: 54, step: 518, loss: 0.3283885419368744, mean loss: 0.34118631585889325
Epoch: 54, step: 519, loss: 0.34890851378440857, mean loss: 0.34118641423585416
Epoch: 54, step: 520, loss: 0.3668745458126068, mean loss: 0.34118674148570544
Epoch: 54, step: 521, loss: 0.3500337302684784, mean loss: 0.3411868541890709
Epoch: 54, step: 522, loss: 0.3151339590549469, mean loss: 0.3411865223008286
Epoch: 54, step: 523, loss: 0.34870436787605286, mean loss: 0.341186618069562
Epoch: 54, step: 524, loss: 0.3579050898551941, mean loss: 0.3411868310410119
Epoch: 54, step: 525, loss: 0.30313828587532043, mean loss: 0.34118634635851763
Epoch: 54, step: 526, loss: 0.32563626766204834, mean loss: 0.3411861482759132
Epoch: 54, step: 527, loss: 0.3151630759239197, mean loss: 0.34118581678869786
Epoch: 54, step: 528, loss: 0.3615131080150604, mean loss: 0.34118607571859055
Epoch: 54, step: 529, loss: 0.3247493803501129, mean loss: 0.34118586634993886
Epoch: 54, step: 530, loss: 0.3160198926925659, mean loss: 0.34118554579287186
Epoch: 54, step: 531, loss: 0.3356230556964874, mean loss: 0.34118547494034607
Epoch: 54, step: 532, loss: 0.3457487225532532, mean loss: 0.341185533064225
Epoch: 54, step: 533, loss: 0.36705756187438965, mean loss: 0.3411858626022305
Epoch: 54, step: 534, loss: 0.3165263831615448, mean loss: 0.34118554851274696
Epoch: 54, step: 535, loss: 0.3260173499584198, mean loss: 0.3411853553168208
Epoch: 54, step: 536, loss: 0.31140846014022827, mean loss: 0.3411849760561229
Epoch: 54, step: 537, loss: 0.3035889267921448, mean loss: 0.34118449721095817
Epoch: 54, step: 538, loss: 0.34631937742233276, mean loss: 0.34118456261094815
Epoch: 54, step: 539, loss: 0.3351665139198303, mean loss: 0.3411844859635299
Epoch: 54, step: 540, loss: 0.3014053404331207, mean loss: 0.3411839793325388
Epoch: 54, step: 541, loss: 0.30790308117866516, mean loss: 0.34118355546924434
Epoch: 54, step: 542, loss: 0.3435782492160797, mean loss: 0.3411835859675154
Epoch: 54, step: 543, loss: 0.31384050846099854, mean loss: 0.34118323773677794
Epoch: 54, step: 544, loss: 0.3557429611682892, mean loss: 0.34118342316135775
Epoch: 54, step: 545, loss: 0.2976790964603424, mean loss: 0.3411828691213855
Epoch: 54, step: 546, loss: 0.3563030958175659, mean loss: 0.34118306167932005
Epoch: 54, step: 547, loss: 0.3431854248046875, mean loss: 0.3411830871793344
Epoch: 54, step: 548, loss: 0.36584222316741943, mean loss: 0.341183401208446
Epoch: 54, step: 549, loss: 0.32804298400878906, mean loss: 0.3411832338700205
Epoch: 54, step: 550, loss: 0.3359401822090149, mean loss: 0.34118316710251806
Epoch: 54, step: 551, loss: 0.3246082067489624, mean loss: 0.34118295603181265
Epoch: 54, step: 552, loss: 0.36847731471061707, mean loss: 0.3411833036022475
Epoch: 54, step: 553, loss: 0.32832279801368713, mean loss: 0.3411831398367364
Epoch: 54, step: 554, loss: 0.30045050382614136, mean loss: 0.34118262115448345
Epoch: 54, step: 555, loss: 0.33387520909309387, mean loss: 0.34118252810436295
Epoch: 54, step: 556, loss: 0.33414193987846375, mean loss: 0.34118243845302876
Epoch: 54, step: 557, loss: 0.32151827216148376, mean loss: 0.34118218806254447
Epoch: 54, step: 558, loss: 0.33025726675987244, mean loss: 0.34118204895359555
Epoch: 54, step: 559, loss: 0.33790841698646545, mean loss: 0.3411820072703934
Epoch: 54, step: 560, loss: 0.35898861289024353, mean loss: 0.34118223399926795
Epoch: 54, step: 561, loss: 0.3279099762439728, mean loss: 0.3411820650077256
Epoch: 54, step: 562, loss: 0.3394376337528229, mean loss: 0.34118204279670616
Epoch: 54, step: 563, loss: 0.30688056349754333, mean loss: 0.34118160605772857
Epoch: 54, step: 564, loss: 0.33009812235832214, mean loss: 0.34118146494055795
Epoch: 54, step: 565, loss: 0.3435409665107727, mean loss: 0.34118149498182976
Epoch: 54, step: 566, loss: 0.32871201634407043, mean loss: 0.34118133622193214
Epoch: 54, step: 567, loss: 0.290375292301178, mean loss: 0.3411806893737461
Epoch: 54, step: 568, loss: 0.35409680008888245, mean loss: 0.34118085381592217
Epoch: 54, step: 569, loss: 0.3363001346588135, mean loss: 0.3411807916775681
Epoch: 54, step: 570, loss: 0.32187649607658386, mean loss: 0.34118054591012187
Epoch: 54, step: 571, loss: 0.32451722025871277, mean loss: 0.3411803337681749
Epoch: 54, step: 572, loss: 0.2963806092739105, mean loss: 0.3411797634270567
Epoch: 54, step: 573, loss: 0.34518593549728394, mean loss: 0.34117981442861073
Epoch: 54, step: 574, loss: 0.34184780716896057, mean loss: 0.34117982293254756
Epoch: 54, step: 575, loss: 0.36628150939941406, mean loss: 0.3411801424875744
Epoch: 54, step: 576, loss: 0.3417249023914337, mean loss: 0.3411801494225088
Epoch: 54, step: 577, loss: 0.3320577144622803, mean loss: 0.3411800332930315
Epoch: 54, step: 578, loss: 0.34160366654396057, mean loss: 0.341180038685855
Epoch: 54, step: 579, loss: 0.2954491376876831, mean loss: 0.341179456541894
Epoch: 54, step: 580, loss: 0.30285292863845825, mean loss: 0.34117896866012787
Epoch: 54, step: 581, loss: 0.3309982419013977, mean loss: 0.3411788390650929
Epoch: 54, step: 582, loss: 0.3262673616409302, mean loss: 0.3411786492526281
Epoch: 54, step: 583, loss: 0.3207298219203949, mean loss: 0.3411783889569645
Epoch: 54, step: 584, loss: 0.39133667945861816, mean loss: 0.3411790274199487
Epoch: 54, step: 585, loss: 0.35000476241111755, mean loss: 0.34117913976096587
Epoch: 54, step: 586, loss: 0.3093574047088623, mean loss: 0.34117873471361465
Epoch: 54, step: 587, loss: 0.3654230535030365, mean loss: 0.34117904330684806
Epoch: 54, step: 588, loss: 0.3263370394706726, mean loss: 0.34117885439316087
Epoch: 54, step: 589, loss: 0.3268692195415497, mean loss: 0.3411786722579516
Epoch: 54, step: 590, loss: 0.3349479138851166, mean loss: 0.3411785929529206
Epoch: 54, step: 591, loss: 0.31451335549354553, mean loss: 0.3411782535623613
Epoch: 54, step: 592, loss: 0.33131229877471924, mean loss: 0.34117812799178276
Epoch: 54, step: 593, loss: 0.3006771504878998, mean loss: 0.34117761251542406
Epoch: 54, step: 594, loss: 0.31767842173576355, mean loss: 0.34117731343318275
Epoch: 54, step: 595, loss: 0.313783198595047, mean loss: 0.3411769647833477
Epoch: 54, step: 596, loss: 0.3162483870983124, mean loss: 0.34117664751688614
Epoch: 54, step: 597, loss: 0.29961463809013367, mean loss: 0.34117611856316826
Epoch: 54, step: 598, loss: 0.3106180727481842, mean loss: 0.34117572966026255
Epoch: 54, step: 599, loss: 0.316782146692276, mean loss: 0.34117541921454164
Epoch: 54, step: 600, loss: 0.309453547000885, mean loss: 0.34117501551024887
Epoch: 54, step: 601, loss: 0.315927118062973, mean loss: 0.3411746942002455
Epoch: 54, step: 602, loss: 0.3716246485710144, mean loss: 0.34117508170777766
Epoch: 54, step: 603, loss: 0.2978622615337372, mean loss: 0.34117453051383295
Epoch: 54, step: 604, loss: 0.3387889564037323, mean loss: 0.3411745001556788
Epoch: 54, step: 605, loss: 0.30314451456069946, mean loss: 0.341174016202794
Epoch: 54, step: 606, loss: 0.30921146273612976, mean loss: 0.3411736094665601
Epoch: 54, step: 607, loss: 0.36430981755256653, mean loss: 0.3411739038802841
Epoch: 54, step: 608, loss: 0.3236176371574402, mean loss: 0.3411736804754776
Epoch: 54, step: 609, loss: 0.33019185066223145, mean loss: 0.34117354073265044
Epoch: 54, step: 610, loss: 0.3434503376483917, mean loss: 0.34117356970432405
Epoch: 54, step: 611, loss: 0.32596269249916077, mean loss: 0.34117337615216337
Epoch: 54, step: 612, loss: 0.36025118827819824, mean loss: 0.34117361890639264
Epoch: 54, step: 613, loss: 0.3229600489139557, mean loss: 0.3411733871520983
Epoch: 54, step: 614, loss: 0.3367612957954407, mean loss: 0.3411733310121922
Epoch: 54, step: 615, loss: 0.34380024671554565, mean loss: 0.3411733644369136
Epoch: 54, step: 616, loss: 0.3383226990699768, mean loss: 0.34117332816567614
Epoch: 54, step: 617, loss: 0.30846166610717773, mean loss: 0.3411729119549977
Epoch: 54, step: 618, loss: 0.3202369809150696, mean loss: 0.3411726455776068
Epoch: 54, step: 619, loss: 0.31854042410850525, mean loss: 0.34117235762120357
Epoch: 54, step: 620, loss: 0.3763856291770935, mean loss: 0.34117280564430313
Epoch: 54, step: 621, loss: 0.3193788230419159, mean loss: 0.3411725283601152
Epoch: 54, step: 622, loss: 0.30153411626815796, mean loss: 0.3411720240482016
Epoch: 54, step: 623, loss: 0.3454184830188751, mean loss: 0.3411720780743972
Epoch: 54, step: 624, loss: 0.35260576009750366, mean loss: 0.34117222353923893
Epoch: 54, step: 625, loss: 0.34094929695129395, mean loss: 0.34117222070309494
Epoch: 54, step: 626, loss: 0.33054301142692566, mean loss: 0.34117208547658606
Epoch: 54, step: 627, loss: 0.38132941722869873, mean loss: 0.34117259635811564
Epoch: 54, step: 628, loss: 0.36107513308525085, mean loss: 0.3411728495549444
Epoch: 54, step: 629, loss: 0.31746646761894226, mean loss: 0.3411725479700535
Epoch: 54, step: 630, loss: 0.3678593337535858, mean loss: 0.3411728874663551
Epoch: 54, step: 631, loss: 0.34182214736938477, mean loss: 0.34117289572581855
Epoch: 54, step: 632, loss: 0.359176903963089, mean loss: 0.3411731247582224
Epoch: 54, step: 633, loss: 0.35732248425483704, mean loss: 0.3411733301946745
Epoch: 54, step: 634, loss: 0.32660138607025146, mean loss: 0.3411731448269254
Epoch: 54, step: 635, loss: 0.33428606390953064, mean loss: 0.34117305721840613
Epoch: 54, step: 636, loss: 0.30328142642974854, mean loss: 0.34117257521630995
Epoch: 54, step: 637, loss: 0.34699857234954834, mean loss: 0.3411726493252108
Epoch: 54, step: 638, loss: 0.3024679720401764, mean loss: 0.3411721569932476
Epoch: 54, step: 639, loss: 0.3291735351085663, mean loss: 0.3411720043700935
Epoch: 54, step: 640, loss: 0.31269562244415283, mean loss: 0.34117164215350004
Epoch: 54, step: 641, loss: 0.30457523465156555, mean loss: 0.3411711766569534
Epoch: 54, step: 642, loss: 0.3178410232067108, mean loss: 0.34117087990739603
Epoch: 54, step: 643, loss: 0.34383028745651245, mean loss: 0.3411709137334905
Epoch: 54, step: 644, loss: 0.31674376130104065, mean loss: 0.34117060303847985
Epoch: 54, step: 645, loss: 0.36437278985977173, mean loss: 0.34117089814909546
Epoch: 54, step: 646, loss: 0.34913167357444763, mean loss: 0.34117099940159695
Epoch: 54, step: 647, loss: 0.3905411958694458, mean loss: 0.3411716273294112
Epoch: 54, step: 648, loss: 0.3438847064971924, mean loss: 0.34117166183598246
Epoch: 54, step: 649, loss: 0.32166728377342224, mean loss: 0.34117141377073607
Epoch: 54, step: 650, loss: 0.37104564905166626, mean loss: 0.3411717937195486
Epoch: 54, step: 651, loss: 0.32264813780784607, mean loss: 0.3411715581335498
Epoch: 54, step: 652, loss: 0.3085048794746399, mean loss: 0.3411711426802354
Epoch: 54, step: 653, loss: 0.29823294281959534, mean loss: 0.3411705966011325
Epoch: 54, step: 654, loss: 0.3021811544895172, mean loss: 0.34117010074781623
Epoch: 54, step: 655, loss: 0.3190518915653229, mean loss: 0.34116981946018293
Epoch: 54, step: 656, loss: 0.3375801742076874, mean loss: 0.3411697738095623
Epoch: 54, step: 657, loss: 0.32202091813087463, mean loss: 0.3411695302907832
Epoch: 54, step: 658, loss: 0.29551517963409424, mean loss: 0.3411689497051577
Epoch: 54, step: 659, loss: 0.34663042426109314, mean loss: 0.3411690191577565
Epoch: 54, step: 660, loss: 0.3226819336414337, mean loss: 0.3411687840637738
Epoch: 54, step: 661, loss: 0.3448869585990906, mean loss: 0.3411688313459343
Epoch: 54, step: 662, loss: 0.35768941044807434, mean loss: 0.34116904142718024
Epoch: 54, step: 663, loss: 0.3162408173084259, mean loss: 0.34116872443552054
Epoch: 54, step: 664, loss: 0.35629647970199585, mean loss: 0.34116891680025735
Epoch: 54, step: 665, loss: 0.35252049565315247, mean loss: 0.34116906114524925
Epoch: 54, step: 666, loss: 0.3698793053627014, mean loss: 0.34116942621581137
Epoch: 54, step: 667, loss: 0.3329883813858032, mean loss: 0.3411693221895051
Epoch: 54, step: 668, loss: 0.33520346879959106, mean loss: 0.3411692463314926
Epoch: 54, step: 669, loss: 0.35037803649902344, mean loss: 0.3411693634231459
Epoch: 54, step: 670, loss: 0.33344483375549316, mean loss: 0.34116926520541774
Epoch: 54, step: 671, loss: 0.29880276322364807, mean loss: 0.34116872652036556
Epoch: 54, step: 672, loss: 0.34116822481155396, mean loss: 0.3411687265139865
Epoch: 54, step: 673, loss: 0.33355748653411865, mean loss: 0.34116862974043305
Epoch: 54, step: 674, loss: 0.3180904984474182, mean loss: 0.34116833631592103
Epoch: 54, step: 675, loss: 0.30123889446258545, mean loss: 0.3411678286436196
Epoch: 54, step: 676, loss: 0.31565743684768677, mean loss: 0.34116750430263076
Epoch: 54, step: 677, loss: 0.3077887296676636, mean loss: 0.341167079927842
Epoch: 54, step: 678, loss: 0.32229575514793396, mean loss: 0.3411668400025381
Epoch: 54, step: 679, loss: 0.314260870218277, mean loss: 0.3411664979311159
Epoch: 54, step: 680, loss: 0.3255097568035126, mean loss: 0.34116629888028605
Epoch: 54, step: 681, loss: 0.2997288405895233, mean loss: 0.341165772074897
Epoch: 54, step: 682, loss: 0.3206019699573517, mean loss: 0.3411655106451545
Epoch: 54, step: 683, loss: 0.32047852873802185, mean loss: 0.341165247652758
Epoch: 54, step: 684, loss: 0.343260258436203, mean loss: 0.34116527428616955
Epoch: 54, step: 685, loss: 0.3251788318157196, mean loss: 0.3411650710566245
Epoch: 54, step: 686, loss: 0.31751033663749695, mean loss: 0.3411647703468319
Epoch: 54, step: 687, loss: 0.3087368309497833, mean loss: 0.34116435811328927
Epoch: 54, step: 688, loss: 0.29500895738601685, mean loss: 0.3411637713796628
Epoch: 54, step: 689, loss: 0.354910284280777, mean loss: 0.34116394612495177
Epoch: 54, step: 690, loss: 0.30392202734947205, mean loss: 0.341163472712736
Epoch: 54, step: 691, loss: 0.3000878393650055, mean loss: 0.34116295057370427
Epoch: 54, step: 692, loss: 0.3589496314525604, mean loss: 0.34116317666887364
Epoch: 54, step: 693, loss: 0.2905504107475281, mean loss: 0.3411625333135168
Epoch: 54, step: 694, loss: 0.3347446024417877, mean loss: 0.34116245173414356
Epoch: 54, step: 695, loss: 0.3292210102081299, mean loss: 0.34116229994644875
Epoch: 54, step: 696, loss: 0.3031460642814636, mean loss: 0.3411618167281189
Epoch: 54, step: 697, loss: 0.3140541613101959, mean loss: 0.3411614721713985
Epoch: 54, step: 698, loss: 0.3642997741699219, mean loss: 0.3411617662712015
Epoch: 54, step: 699, loss: 0.31367096304893494, mean loss: 0.3411614168532949
Epoch: 54, step: 700, loss: 0.3326331079006195, mean loss: 0.34116130845682635
Epoch: 54, step: 701, loss: 0.3109215795993805, mean loss: 0.34116092410886556
Epoch: 54, step: 702, loss: 0.304645299911499, mean loss: 0.34116045999996486
Epoch: 54, step: 703, loss: 0.32576677203178406, mean loss: 0.3411602643506516
Epoch: 54, step: 704, loss: 0.29416733980178833, mean loss: 0.34115966709178924
Epoch: 54, step: 705, loss: 0.3175622522830963, mean loss: 0.34115936718310863
Epoch: 54, step: 706, loss: 0.3353298604488373, mean loss: 0.34115929309459225
Epoch: 54, step: 707, loss: 0.31165969371795654, mean loss: 0.3411589181822927
Epoch: 54, step: 708, loss: 0.3382617235183716, mean loss: 0.34115888136212796
Epoch: 54, step: 709, loss: 0.3406223952770233, mean loss: 0.34115887454406524
Epoch: 54, step: 710, loss: 0.3275080919265747, mean loss: 0.34115870106200824
Epoch: 54, step: 711, loss: 0.2961856424808502, mean loss: 0.3411581295255785
Epoch: 54, step: 712, loss: 0.3451516330242157, mean loss: 0.3411581802760455
Epoch: 54, step: 713, loss: 0.30924463272094727, mean loss: 0.34115777471564956
Epoch: 54, step: 714, loss: 0.3454098403453827, mean loss: 0.34115782875061706
Epoch: 54, step: 715, loss: 0.3262186050415039, mean loss: 0.3411576389063672
Epoch: 54, step: 716, loss: 0.3828166127204895, mean loss: 0.34115816829238393
Epoch: 54, step: 717, loss: 0.3265422582626343, mean loss: 0.3411579825614511
Epoch: 54, step: 718, loss: 0.3030376434326172, mean loss: 0.34115749815533725
Epoch: 54, step: 719, loss: 0.3497447669506073, mean loss: 0.3411576072748452
Epoch: 54, step: 720, loss: 0.32420647144317627, mean loss: 0.34115739187736077
Epoch: 54, step: 721, loss: 0.276474267244339, mean loss: 0.34115656996162425
Epoch: 54, step: 722, loss: 0.3398929536342621, mean loss: 0.34115655390530425
Epoch: 54, step: 723, loss: 0.297009140253067, mean loss: 0.34115599294706217
Epoch: 54, step: 724, loss: 0.3256821930408478, mean loss: 0.3411557963320267
Epoch: 54, step: 725, loss: 0.2920842170715332, mean loss: 0.34115517282081653
Epoch: 54, step: 726, loss: 0.31540483236312866, mean loss: 0.3411548456370947
Epoch: 54, step: 727, loss: 0.327886164188385, mean loss: 0.3411546770474239
Epoch: 54, step: 728, loss: 0.3290746212005615, mean loss: 0.3411545235621835
Epoch: 54, step: 729, loss: 0.35835760831832886, mean loss: 0.3411547421361773
Epoch: 54, step: 730, loss: 0.34931686520576477, mean loss: 0.34115484583880945
Epoch: 54, step: 731, loss: 0.39997076988220215, mean loss: 0.34115559310622884
Epoch: 54, step: 732, loss: 0.3137679100036621, mean loss: 0.34115524514496515
Epoch: 54, step: 733, loss: 0.3157045543193817, mean loss: 0.3411549217973495
Epoch: 54, step: 734, loss: 0.3704421818256378, mean loss: 0.3411552938833353
Epoch: 54, step: 735, loss: 0.35760051012039185, mean loss: 0.3411555028122945
Epoch: 54, step: 736, loss: 0.3223811388015747, mean loss: 0.34115526429560716
Epoch: 54, step: 737, loss: 0.29447638988494873, mean loss: 0.34115467127690136
Epoch: 54, step: 738, loss: 0.3505682647228241, mean loss: 0.3411547908677474
Epoch: 54, step: 739, loss: 0.3510461151599884, mean loss: 0.3411549165261179
Epoch: 54, step: 740, loss: 0.31696221232414246, mean loss: 0.3411546091883865
Epoch: 54, step: 741, loss: 0.3248368501663208, mean loss: 0.34115440189451446
Epoch: 54, step: 742, loss: 0.3466006815433502, mean loss: 0.3411544710808564
Epoch: 54, step: 743, loss: 0.3186827003955841, mean loss: 0.34115418561628974
Epoch: 54, step: 744, loss: 0.3448192775249481, mean loss: 0.34115423217428453
Epoch: 54, step: 745, loss: 0.3179429769515991, mean loss: 0.3411539373233506
Epoch: 54, step: 746, loss: 0.28264206647872925, mean loss: 0.34115319406063394
Epoch: 54, step: 747, loss: 0.33521461486816406, mean loss: 0.3411531186251988
Epoch: 54, step: 748, loss: 0.351127952337265, mean loss: 0.34115324532997765
Epoch: 54, step: 749, loss: 0.3619047999382019, mean loss: 0.34115350892211505
Epoch: 54, step: 750, loss: 0.3518962264060974, mean loss: 0.34115364537742876
Epoch: 54, step: 751, loss: 0.36199334263801575, mean loss: 0.34115391008245444
Epoch: 54, step: 752, loss: 0.32377204298973083, mean loss: 0.3411536893014577
Epoch: 54, step: 753, loss: 0.32872945070266724, mean loss: 0.3411535314932702
Epoch: 54, step: 754, loss: 0.30349501967430115, mean loss: 0.34115305317454164
Epoch: 54, step: 755, loss: 0.3068716824054718, mean loss: 0.3411526177560235
Epoch: 54, step: 756, loss: 0.3167600929737091, mean loss: 0.3411523079427968
Epoch: 54, step: 757, loss: 0.3393852710723877, mean loss: 0.34115228549967347
Epoch: 54, step: 758, loss: 0.3673849403858185, mean loss: 0.3411526186762136
Epoch: 54, step: 759, loss: 0.3103986382484436, mean loss: 0.3411522280800387
Epoch: 54, step: 760, loss: 0.3235848546028137, mean loss: 0.3411520049654486
Epoch: 54, step: 761, loss: 0.30206960439682007, mean loss: 0.34115150860536114
Epoch: 54, step: 762, loss: 0.3423689007759094, mean loss: 0.341151524066469
Epoch: 54, step: 763, loss: 0.3437849283218384, mean loss: 0.3411515575107699
Epoch: 54, step: 764, loss: 0.3157118558883667, mean loss: 0.34115123443001627
Epoch: 54, step: 765, loss: 0.33582931756973267, mean loss: 0.3411511668432537
Epoch: 54, step: 766, loss: 0.29236212372779846, mean loss: 0.3411505472447736
Epoch: 54, step: 767, loss: 0.3318396210670471, mean loss: 0.34115042900178144
Epoch: 54, step: 768, loss: 0.3635680675506592, mean loss: 0.3411507136882828
Epoch: 54, step: 769, loss: 0.3197755515575409, mean loss: 0.3411504422438649
Epoch: 54, step: 770, loss: 0.34724658727645874, mean loss: 0.34115051965817955
Epoch: 54, step: 771, loss: 0.33483654260635376, mean loss: 0.34115043947865686
Epoch: 54, step: 772, loss: 0.3465370535850525, mean loss: 0.34115050788097445
Epoch: 54, step: 773, loss: 0.35664644837379456, mean loss: 0.341150704654822
Epoch: 54, step: 774, loss: 0.3226913809776306, mean loss: 0.34115047025368833
Epoch: 54, step: 775, loss: 0.3175473213195801, mean loss: 0.341150170538774
Epoch: 54, step: 776, loss: 0.37081488966941833, mean loss: 0.34115054721927035
Epoch: 54, step: 777, loss: 0.34457287192344666, mean loss: 0.3411505906751546
Epoch: 54, step: 778, loss: 0.2970491051673889, mean loss: 0.34115003069184546
Epoch: 54, step: 779, loss: 0.3089536130428314, mean loss: 0.34114962187959436
Epoch: 54, step: 780, loss: 0.3211761713027954, mean loss: 0.3411493682710189
Epoch: 54, step: 781, loss: 0.3923376500606537, mean loss: 0.3411500182149203
Epoch: 54, step: 782, loss: 0.33787354826927185, mean loss: 0.34114997661370716
Epoch: 54, step: 783, loss: 0.34585869312286377, mean loss: 0.34115003639934083
Epoch: 54, step: 784, loss: 0.2885858118534088, mean loss: 0.341149369010347
Epoch: 54, step: 785, loss: 0.36102139949798584, mean loss: 0.3411496213151448
Epoch: 54, step: 786, loss: 0.32873156666755676, mean loss: 0.341149463651589
Epoch: 54, step: 787, loss: 0.35833972692489624, mean loss: 0.34114968190184636
Epoch: 54, step: 788, loss: 0.3499191105365753, mean loss: 0.34114979323846334
Epoch: 54, step: 789, loss: 0.3040064573287964, mean loss: 0.3411493216728651
Epoch: 54, step: 790, loss: 0.3257827162742615, mean loss: 0.3411491265834825
Epoch: 54, step: 791, loss: 0.44357937574386597, mean loss: 0.3411504269878239
Epoch: 54, step: 792, loss: 0.3620467782020569, mean loss: 0.3411506922743099
Epoch: 54, step: 793, loss: 0.3537180721759796, mean loss: 0.341150851819567
Epoch: 54, step: 794, loss: 0.3448154926300049, mean loss: 0.34115089834228235
Epoch: 54, step: 795, loss: 0.3149200975894928, mean loss: 0.3411505653457766
Epoch: 54, step: 796, loss: 0.3459373414516449, mean loss: 0.34115062611248737
Epoch: 54, step: 797, loss: 0.3018830418586731, mean loss: 0.3411501276284158
Epoch: 54, step: 798, loss: 0.2902141809463501, mean loss: 0.3411494810280136
Epoch: 54, step: 799, loss: 0.3187490701675415, mean loss: 0.3411491966722344
Epoch: 54, step: 800, loss: 0.3022800385951996, mean loss: 0.3411487032647922
Epoch: 54, step: 801, loss: 0.32033589482307434, mean loss: 0.3411484390690974
Epoch: 54, step: 802, loss: 0.3319282531738281, mean loss: 0.3411483220304717
Epoch: 54, step: 803, loss: 0.3048054873943329, mean loss: 0.3411478607099
Epoch: 54, step: 804, loss: 0.30928149819374084, mean loss: 0.34114745621690656
Epoch: 54, step: 805, loss: 0.3477794826030731, mean loss: 0.3411475403989074
Epoch: 54, step: 806, loss: 0.33327680826187134, mean loss: 0.341147440494967
Epoch: 54, step: 807, loss: 0.34607255458831787, mean loss: 0.34114750300910807
Epoch: 54, step: 808, loss: 0.3500388264656067, mean loss: 0.34114761586464476
Epoch: 54, step: 809, loss: 0.32183676958084106, mean loss: 0.3411473707595971
Epoch: 54, step: 810, loss: 0.30635592341423035, mean loss: 0.34114692917091693
Epoch: 54, step: 811, loss: 0.2952270209789276, mean loss: 0.34114634634220964
Epoch: 54, step: 812, loss: 0.2897811532020569, mean loss: 0.34114569440865117
Epoch: 54, step: 813, loss: 0.31103402376174927, mean loss: 0.34114531223235156
Epoch: 54, step: 814, loss: 0.29736390709877014, mean loss: 0.3411447565672993
Epoch: 54, step: 815, loss: 0.3206859529018402, mean loss: 0.34114449691145016
Epoch: 54, step: 816, loss: 0.3679085373878479, mean loss: 0.34114483658680805
Epoch: 54, step: 817, loss: 0.33984506130218506, mean loss: 0.3411448200909418
Epoch: 54, step: 818, loss: 0.2968222200870514, mean loss: 0.34114425758570666
Epoch: 54, step: 819, loss: 0.3107157051563263, mean loss: 0.3411438714169617
Epoch: 54, step: 820, loss: 0.34117910265922546, mean loss: 0.3411438718640757
Epoch: 54, step: 821, loss: 0.4275122582912445, mean loss: 0.34114496793740784
Epoch: 54, step: 822, loss: 0.3172423243522644, mean loss: 0.34114466460051796
Epoch: 54, step: 823, loss: 0.32786762714385986, mean loss: 0.34114449611019493
Epoch: 54, step: 824, loss: 0.34335777163505554, mean loss: 0.34114452419709135
Epoch: 54, step: 825, loss: 0.40119293332099915, mean loss: 0.3411452862133996
Epoch: 54, step: 826, loss: 0.3399902582168579, mean loss: 0.34114527155624197
Epoch: 54, step: 827, loss: 0.3818221092224121, mean loss: 0.34114578773356374
Epoch: 54, step: 828, loss: 0.3292156457901001, mean loss: 0.3411456363454292
Epoch: 54, step: 829, loss: 0.34127727150917053, mean loss: 0.34114563801579906
Epoch: 54, step: 830, loss: 0.36147812008857727, mean loss: 0.34114589601930223
Epoch: 54, step: 831, loss: 0.3528374433517456, mean loss: 0.3411460443741308
Epoch: 54, step: 832, loss: 0.3558829426765442, mean loss: 0.34114623136924943
Epoch: 54, step: 833, loss: 0.3754780888557434, mean loss: 0.3411466669974373
Epoch: 54, step: 834, loss: 0.34432485699653625, mean loss: 0.3411467073241683
Epoch: 54, step: 835, loss: 0.3694993555545807, mean loss: 0.34114706707456455
Epoch: 54, step: 836, loss: 0.36634278297424316, mean loss: 0.3411473867644114
Epoch: 54, step: 837, loss: 0.32050976157188416, mean loss: 0.34114712491213656
Epoch: 54, step: 838, loss: 0.32943421602249146, mean loss: 0.34114697629945
Epoch: 54, step: 839, loss: 0.3810734748840332, mean loss: 0.3411474828780455
Epoch: 54, step: 840, loss: 0.3091859817504883, mean loss: 0.3411470773627236
Epoch: 54, step: 841, loss: 0.38169392943382263, mean loss: 0.34114759179917303
Epoch: 54, step: 842, loss: 0.3652293086051941, mean loss: 0.3411478973310474
Epoch: 54, step: 843, loss: 0.30240902304649353, mean loss: 0.3411474058457101
Epoch: 54, step: 844, loss: 0.30069515109062195, mean loss: 0.34114689262899434
Epoch: 54, step: 845, loss: 0.31210631132125854, mean loss: 0.3411465241965604
Epoch: 54, step: 846, loss: 0.32321614027023315, mean loss: 0.3411462967200126
Epoch: 54, step: 847, loss: 0.3658660054206848, mean loss: 0.34114661032638505
Epoch: 54, step: 848, loss: 0.3030528724193573, mean loss: 0.34114612705663677
Epoch: 54, step: 849, loss: 0.3496357202529907, mean loss: 0.34114623475705536
Epoch: 54, step: 850, loss: 0.31619852781295776, mean loss: 0.3411459182702305
Epoch: 54, step: 851, loss: 0.3659934103488922, mean loss: 0.34114623348172995
Epoch: 54, step: 852, loss: 0.3092726171016693, mean loss: 0.3411458291430173
Epoch: 54, step: 853, loss: 0.310957133769989, mean loss: 0.3411454461835428
Epoch: 54, step: 854, loss: 0.3407559394836426, mean loss: 0.3411454412425082
Epoch: 54, step: 855, loss: 0.33024361729621887, mean loss: 0.34114530295064766
Epoch: 54, step: 856, loss: 0.32393744587898254, mean loss: 0.3411450846682396
Epoch: 54, step: 857, loss: 0.3178965747356415, mean loss: 0.3411447897636308
Epoch: 54, step: 858, loss: 0.33715641498565674, mean loss: 0.34114473917220844
Epoch: 54, step: 859, loss: 0.378268837928772, mean loss: 0.3411452100750797
Epoch: 54, step: 860, loss: 0.31827351450920105, mean loss: 0.3411449199613569
Epoch: 54, step: 861, loss: 0.35594555735588074, mean loss: 0.3411451076961725
Epoch: 54, step: 862, loss: 0.31506189703941345, mean loss: 0.34114477685470246
Epoch: 54, step: 863, loss: 0.347443550825119, mean loss: 0.3411448567478274
Epoch: 54, step: 864, loss: 0.32661065459251404, mean loss: 0.34114467239955487
Epoch: 54, step: 865, loss: 0.33214837312698364, mean loss: 0.34114455829413803
Epoch: 54, step: 866, loss: 0.3139175772666931, mean loss: 0.3411442129625166
Epoch: 54, step: 867, loss: 0.3602963387966156, mean loss: 0.3411444558741628
Epoch: 54, step: 868, loss: 0.33834657073020935, mean loss: 0.341144420388271
Epoch: 54, step: 869, loss: 0.32686522603034973, mean loss: 0.3411442392859404
Epoch: 54, step: 870, loss: 0.29842689633369446, mean loss: 0.3411436975108196
Epoch: 54, step: 871, loss: 0.3243959844112396, mean loss: 0.34114348510577314
Epoch: 54, step: 872, loss: 0.3099154233932495, mean loss: 0.3411430890568478
Epoch: 54, step: 873, loss: 0.29327869415283203, mean loss: 0.3411424820258408
Epoch: 54, step: 874, loss: 0.331459641456604, mean loss: 0.34114235922663
Epoch: 54, step: 875, loss: 0.3546988070011139, mean loss: 0.34114253114931775
Epoch: 54, step: 876, loss: 0.33414286375045776, mean loss: 0.34114244238075603
Epoch: 54, step: 877, loss: 0.3430345058441162, mean loss: 0.34114246637527074
Epoch: 54, step: 878, loss: 0.3842802941799164, mean loss: 0.34114301342780773
Epoch: 54, step: 879, loss: 0.34306782484054565, mean loss: 0.34114303783700184
Epoch: 54, step: 880, loss: 0.3394097089767456, mean loss: 0.34114301585634244
Epoch: 54, step: 881, loss: 0.31190577149391174, mean loss: 0.3411426450982156
Epoch: 54, step: 882, loss: 0.3092503249645233, mean loss: 0.3411422406761442
Epoch: 54, step: 883, loss: 0.3394598960876465, mean loss: 0.3411422193428372
Epoch: 54, step: 884, loss: 0.32468122243881226, mean loss: 0.3411420106085211
Epoch: 54, step: 885, loss: 0.32374536991119385, mean loss: 0.3411417900125345
Epoch: 54, step: 886, loss: 0.32928311824798584, mean loss: 0.3411416396419961
Epoch: 54, step: 887, loss: 0.3526209592819214, mean loss: 0.34114178520042127
Epoch: 54, step: 888, loss: 0.34024524688720703, mean loss: 0.3411417738324087
Epoch: 54, step: 889, loss: 0.3460792303085327, mean loss: 0.3411418364380496
Epoch: 54, step: 890, loss: 0.3365591764450073, mean loss: 0.3411417783318709
Epoch: 54, step: 891, loss: 0.2993984818458557, mean loss: 0.3411412490513454
Epoch: 54, step: 892, loss: 0.3292834758758545, mean loss: 0.34114109870364
Epoch: 54, step: 893, loss: 0.310030996799469, mean loss: 0.34114070425579035
Epoch: 54, step: 894, loss: 0.3544814884662628, mean loss: 0.34114087340267846
Epoch: 54, step: 895, loss: 0.3145381808280945, mean loss: 0.3411405361132402
Epoch: 54, step: 896, loss: 0.3296746611595154, mean loss: 0.3411403907418843
Epoch: 54, step: 897, loss: 0.3326781988143921, mean loss: 0.34114028345441405
Epoch: 54, step: 898, loss: 0.3439018726348877, mean loss: 0.3411403184666382
Epoch: 54, step: 899, loss: 0.347317099571228, mean loss: 0.3411403967766578
Epoch: 54, step: 900, loss: 0.35984569787979126, mean loss: 0.3411406339218472
Epoch: 54, step: 901, loss: 0.32850703597068787, mean loss: 0.34114047375554035
Epoch: 54, step: 902, loss: 0.3075058162212372, mean loss: 0.3411400473472754
Epoch: 54, step: 903, loss: 0.32880863547325134, mean loss: 0.34113989101598896
Epoch: 54, step: 904, loss: 0.3567640483379364, mean loss: 0.34114008908849464
Epoch: 54, step: 905, loss: 0.34251827001571655, mean loss: 0.3411401065599194
Epoch: 54, step: 906, loss: 0.3701254427433014, mean loss: 0.34114047400710296
Epoch: 54, step: 907, loss: 0.3235352635383606, mean loss: 0.3411402508286324
Epoch: 54, step: 908, loss: 0.33728423714637756, mean loss: 0.3411402019471761
Epoch: 54, step: 909, loss: 0.33063799142837524, mean loss: 0.34114006881568865
Epoch: 54, step: 910, loss: 0.424673467874527, mean loss: 0.3411411277151152
Epoch: 54, step: 911, loss: 0.33350297808647156, mean loss: 0.3411410308924092
Epoch: 54, step: 912, loss: 0.35984495282173157, mean loss: 0.3411412679840434
Epoch: 54, step: 913, loss: 0.3488132357597351, mean loss: 0.3411413652329694
Epoch: 54, step: 914, loss: 0.3407835364341736, mean loss: 0.3411413606972328
Epoch: 54, step: 915, loss: 0.3408472537994385, mean loss: 0.3411413569692642
Epoch: 54, step: 916, loss: 0.29482030868530273, mean loss: 0.3411407698316438
Epoch: 54, step: 917, loss: 0.3169730305671692, mean loss: 0.3411404634998662
Epoch: 54, step: 918, loss: 0.32155531644821167, mean loss: 0.3411402152566689
Epoch: 54, step: 919, loss: 0.33320480585098267, mean loss: 0.3411401146760386
Epoch: 54, step: 920, loss: 0.35293394327163696, mean loss: 0.34114026415990484
Epoch: 54, step: 921, loss: 0.33288735151290894, mean loss: 0.3411401595576
Epoch: 54, step: 922, loss: 0.331394225358963, mean loss: 0.341140036033421
Epoch: 54, step: 923, loss: 0.3403802216053009, mean loss: 0.34114002640332686
Epoch: 54, step: 924, loss: 0.3240481913089752, mean loss: 0.34113980977951863
Epoch: 54, step: 925, loss: 0.304442822933197, mean loss: 0.3411393446837435
Epoch: 54, step: 926, loss: 0.31640738248825073, mean loss: 0.34113903123606476
Epoch: 54, step: 927, loss: 0.33496272563934326, mean loss: 0.3411389529598608
Epoch: 54, step: 928, loss: 0.33422714471817017, mean loss: 0.3411388653632796
Epoch: 54, step: 929, loss: 0.31587710976600647, mean loss: 0.3411385452132834
Epoch: 54, step: 930, loss: 0.37229496240615845, mean loss: 0.3411389400631344
Epoch: 54, step: 931, loss: 0.3229507505893707, mean loss: 0.3411387095644591
Epoch: 54, step: 932, loss: 0.35924094915390015, mean loss: 0.34113893897098546
Epoch: 54, step: 933, loss: 0.2955199182033539, mean loss: 0.34113836085641486
Epoch: 54, step: 934, loss: 0.3176743984222412, mean loss: 0.3411380635092461
Epoch: 54, step: 935, loss: 0.35266223549842834, mean loss: 0.34113820954751645
Epoch: 54, step: 936, loss: 0.3417384624481201, mean loss: 0.3411382171540312
Epoch: 54, step: 937, loss: 0.3103175163269043, mean loss: 0.3411378265934104
Epoch: 54, step: 938, loss: 0.32214006781578064, mean loss: 0.3411375858564304
Epoch: 54, step: 939, loss: 0.30876073241233826, mean loss: 0.3411371755866062
Epoch: 54, step: 940, loss: 0.3820037543773651, mean loss: 0.34113769342913436
Epoch: 54, step: 941, loss: 0.3791397511959076, mean loss: 0.3411381749676651
Epoch: 54, step: 942, loss: 0.35523197054862976, mean loss: 0.3411383535532475
Epoch: 54, step: 943, loss: 0.3454195559024811, mean loss: 0.34113840780061633
Epoch: 54, step: 944, loss: 0.34992536902427673, mean loss: 0.3411385191393123
Epoch: 54, step: 945, loss: 0.30726927518844604, mean loss: 0.34113808999098927
Epoch: 54, step: 946, loss: 0.36111173033714294, mean loss: 0.3411383430685503
Epoch: 54, step: 947, loss: 0.3320574462413788, mean loss: 0.34113822800979976
Epoch: 54, step: 948, loss: 0.35916149616241455, mean loss: 0.3411384563692315
Epoch: 54, step: 949, loss: 0.3537130653858185, mean loss: 0.3411386156907354
Epoch: 54, step: 950, loss: 0.3644056022167206, mean loss: 0.3411389104819542
Epoch: 54, step: 951, loss: 0.31055745482444763, mean loss: 0.3411385230217923
Epoch: 54, step: 952, loss: 0.31191200017929077, mean loss: 0.3411381527330158
Epoch: 54, step: 953, loss: 0.3379724323749542, mean loss: 0.3411381126250675
Epoch: 54, step: 954, loss: 0.4050951600074768, mean loss: 0.34113892291566794
Epoch: 54, step: 955, loss: 0.36669033765792847, mean loss: 0.3411392466299377
Epoch: 54, step: 956, loss: 0.3371478021144867, mean loss: 0.34113919606243726
Epoch: 54, step: 957, loss: 0.3394945561885834, mean loss: 0.34113917522680404
Epoch: 54, step: 958, loss: 0.32404565811157227, mean loss: 0.3411389586749941
Epoch: 54, step: 959, loss: 0.35184603929519653, mean loss: 0.34113909431754785
Epoch: 54, step: 960, loss: 0.3364102244377136, mean loss: 0.3411390344106616
Epoch: 54, step: 961, loss: 0.3058605492115021, mean loss: 0.3411385874968153
Epoch: 54, step: 962, loss: 0.3598995506763458, mean loss: 0.3411388251608746
Epoch: 54, step: 963, loss: 0.34051206707954407, mean loss: 0.3411388172211979
Epoch: 54, step: 964, loss: 0.3814184069633484, mean loss: 0.34113932747049475
Epoch: 54, step: 965, loss: 0.31886494159698486, mean loss: 0.34113904530908673
Epoch: 54, step: 966, loss: 0.3505382239818573, mean loss: 0.3411391643719381
Epoch: 54, step: 967, loss: 0.3134996294975281, mean loss: 0.3411388142562247
Epoch: 54, step: 968, loss: 0.36817556619644165, mean loss: 0.34113915673202355
Epoch: 54, step: 969, loss: 0.322052538394928, mean loss: 0.3411389149640006
Epoch: 54, step: 970, loss: 0.3629782795906067, mean loss: 0.3411391915972435
Epoch: 54, step: 971, loss: 0.32839301228523254, mean loss: 0.3411390301469305
Epoch: 54, step: 972, loss: 0.3777196705341339, mean loss: 0.3411394934921329
Epoch: 54, step: 973, loss: 0.2850227653980255, mean loss: 0.34113878270393666
Epoch: 54, step: 974, loss: 0.3957746624946594, mean loss: 0.34113947472658096
Epoch: 54, step: 975, loss: 0.31115686893463135, mean loss: 0.3411390949691867
Epoch: 54, step: 976, loss: 0.32625046372413635, mean loss: 0.34113890639330935
Epoch: 54, step: 977, loss: 0.32827356457710266, mean loss: 0.3411387434460006
Epoch: 54, step: 978, loss: 0.3027852773666382, mean loss: 0.3411382576823874
Epoch: 54, step: 979, loss: 0.3327973783016205, mean loss: 0.3411381520427985
Epoch: 54, step: 980, loss: 0.31608685851097107, mean loss: 0.34113783476512166
Epoch: 54, step: 981, loss: 0.3457950949668884, mean loss: 0.34113789374914105
Epoch: 54, step: 982, loss: 0.39718762040138245, mean loss: 0.3411386036077595
Epoch: 54, step: 983, loss: 0.30940067768096924, mean loss: 0.341138201658343
Epoch: 54, step: 984, loss: 0.38369882106781006, mean loss: 0.3411387406664535
Epoch: 54, step: 985, loss: 0.33494752645492554, mean loss: 0.34113866225893835
Epoch: 54, step: 986, loss: 0.31726697087287903, mean loss: 0.3411383599440391
Epoch: 54, step: 987, loss: 0.30597177147865295, mean loss: 0.34113791459440557
Epoch: 54, step: 988, loss: 0.3050527572631836, mean loss: 0.3411374576178041
Epoch: 54, step: 989, loss: 0.3370699882507324, mean loss: 0.3411374061086816
Epoch: 54, step: 990, loss: 0.3790004551410675, mean loss: 0.3411378855880721
Epoch: 54, step: 991, loss: 0.3299236595630646, mean loss: 0.341137743578321
Epoch: 54, step: 992, loss: 0.3689673840999603, mean loss: 0.34113809599054
Epoch: 54, step: 993, loss: 0.3282102048397064, mean loss: 0.34113793228418127
Epoch: 54, step: 994, loss: 0.38056209683418274, mean loss: 0.34113843150749806
Epoch: 54, step: 995, loss: 0.36739999055862427, mean loss: 0.3411387640501594
Epoch: 54, step: 996, loss: 0.3568030893802643, mean loss: 0.3411389624005492
Epoch: 54, step: 997, loss: 0.31613844633102417, mean loss: 0.34113864583413406
Epoch: 54, step: 998, loss: 0.357059121131897, mean loss: 0.34113884742293177
Epoch: 54, step: 999, loss: 0.34667903184890747, mean loss: 0.34113891757316
Epoch: 54, step: 1000, loss: 0.30155521631240845, mean loss: 0.3411384163677298
Epoch: 54, step: 1001, loss: 0.30859407782554626, mean loss: 0.3411380042993241
Epoch: 54, step: 1002, loss: 0.2956889867782593, mean loss: 0.3411374288423353
Epoch: 54, step: 1003, loss: 0.28366926312446594, mean loss: 0.34113670121298967
Epoch: 54, step: 1004, loss: 0.3216725289821625, mean loss: 0.34113645477179205
Epoch: 54, step: 1005, loss: 0.3636535704135895, mean loss: 0.34113673986352994
Epoch: 54, step: 1006, loss: 0.327432781457901, mean loss: 0.3411365663583655
Epoch: 54, step: 1007, loss: 0.3278270959854126, mean loss: 0.34113639784992866
Epoch: 54, step: 1008, loss: 0.35290035605430603, mean loss: 0.34113654678907157
Epoch: 54, step: 1009, loss: 0.3732381761074066, mean loss: 0.34113695321083387
Epoch: 54, step: 1010, loss: 0.3231530785560608, mean loss: 0.34113672552938434
Epoch: 54, step: 1011, loss: 0.3496306836605072, mean loss: 0.3411368330641761
Epoch: 54, step: 1012, loss: 0.31147176027297974, mean loss: 0.34113645750463245
Epoch: 54, step: 1013, loss: 0.3421729803085327, mean loss: 0.34113647062683533
Epoch: 54, step: 1014, loss: 0.33118128776550293, mean loss: 0.34113634459750464
Epoch: 54, step: 1015, loss: 0.3392674922943115, mean loss: 0.34113632093875057
Epoch: 54, step: 1016, loss: 0.32808929681777954, mean loss: 0.3411361557719115
Epoch: 54, step: 1017, loss: 0.33616259694099426, mean loss: 0.34113609281068874
Epoch: 54, step: 1018, loss: 0.36446020007133484, mean loss: 0.3411363880712402
Epoch: 54, step: 1019, loss: 0.33012789487838745, mean loss: 0.34113624871616915
Epoch: 54, step: 1020, loss: 0.35074156522750854, mean loss: 0.3411363703070715
Epoch: 54, step: 1021, loss: 0.34233036637306213, mean loss: 0.3411363854213284
Epoch: 54, step: 1022, loss: 0.3594329357147217, mean loss: 0.34113661702616255
Epoch: 54, step: 1023, loss: 0.3075093924999237, mean loss: 0.3411361913650926
Epoch: 54, step: 1024, loss: 0.39010515809059143, mean loss: 0.34113681121758466
Epoch: 54, step: 1025, loss: 0.32215020060539246, mean loss: 0.3411365708868258
Epoch: 54, step: 1026, loss: 0.35359427332878113, mean loss: 0.3411367285732737
Epoch: 54, step: 1027, loss: 0.3207390010356903, mean loss: 0.34113647038726364
Epoch: 54, step: 1028, loss: 0.3536735773086548, mean loss: 0.3411366290747761
Epoch: 54, step: 1029, loss: 0.32714518904685974, mean loss: 0.3411364519813904
Epoch: 54, step: 1030, loss: 0.3178306818008423, mean loss: 0.3411361569977791
Epoch: 54, step: 1031, loss: 0.41442009806632996, mean loss: 0.34113708454867353
Epoch: 54, step: 1032, loss: 0.29093071818351746, mean loss: 0.34113644909744184
Epoch: 54, step: 1033, loss: 0.3767503798007965, mean loss: 0.341136899849634
Epoch: 54, step: 1034, loss: 0.354056715965271, mean loss: 0.3411370633688417
Epoch: 54, step: 1035, loss: 0.2951188087463379, mean loss: 0.34113648094775856
Epoch: 54, step: 1036, loss: 0.3132188320159912, mean loss: 0.34113612761794027
Epoch: 54, step: 1037, loss: 0.31698331236839294, mean loss: 0.34113582194027237
Epoch: 54, step: 1038, loss: 0.3119467496871948, mean loss: 0.3411354525284866
Epoch: 54, step: 1039, loss: 0.3286574184894562, mean loss: 0.341135294610672
Epoch: 54, step: 1040, loss: 0.33142971992492676, mean loss: 0.34113517178172775
Epoch: 54, step: 1041, loss: 0.3485542833805084, mean loss: 0.34113526567313984
Epoch: 54, step: 1042, loss: 0.32573845982551575, mean loss: 0.3411350708237258
Epoch: 54, step: 1043, loss: 0.39214614033699036, mean loss: 0.34113571637003703
Epoch: 54, step: 1044, loss: 0.3382970094680786, mean loss: 0.34113568044658754
Epoch: 54, step: 1045, loss: 0.371832937002182, mean loss: 0.3411360689112753
Epoch: 54, step: 1046, loss: 0.38255712389945984, mean loss: 0.34113659307582217
Epoch: 54, step: 1047, loss: 0.3697042167186737, mean loss: 0.3411369545814868
Epoch: 54, step: 1048, loss: 0.33806949853897095, mean loss: 0.34113691576521293
Epoch: 54, step: 1049, loss: 0.31275612115859985, mean loss: 0.34113655663284376
Epoch: 54, step: 1050, loss: 0.30384165048599243, mean loss: 0.34113608470671536
Epoch: 54, step: 1051, loss: 0.31331005692481995, mean loss: 0.34113573260331176
Epoch: 54, step: 1052, loss: 0.3469221591949463, mean loss: 0.3411358058223401
Epoch: 54, step: 1053, loss: 0.34676939249038696, mean loss: 0.3411358771064938
Epoch: 54, step: 1054, loss: 0.3095150887966156, mean loss: 0.3411354770003543
Epoch: 54, step: 1055, loss: 0.3101996183395386, mean loss: 0.3411350855657625
Epoch: 54, step: 1056, loss: 0.3453075885772705, mean loss: 0.3411351383602029
Epoch: 54, step: 1057, loss: 0.2987900674343109, mean loss: 0.34113460257723704
Epoch: 54, step: 1058, loss: 0.3573119044303894, mean loss: 0.34113480726252654
Epoch: 54, step: 1059, loss: 0.36619970202445984, mean loss: 0.3411351243951593
Epoch: 54, step: 1060, loss: 0.3524433970451355, mean loss: 0.34113526747084094
Epoch: 54, step: 1061, loss: 0.32167038321495056, mean loss: 0.3411350211983612
Epoch: 54, step: 1062, loss: 0.3166542053222656, mean loss: 0.34113471146752106
Epoch: 54, step: 1063, loss: 0.3259786069393158, mean loss: 0.34113451971518644
Epoch: 54, step: 1064, loss: 0.40536215901374817, mean loss: 0.3411353323015568
Epoch: 54, step: 1065, loss: 0.3364323079586029, mean loss: 0.3411352728012362
Epoch: 54, step: 1066, loss: 0.27468398213386536, mean loss: 0.3411344321032532
Epoch: 54, step: 1067, loss: 0.3501855134963989, mean loss: 0.34113454661012776
Epoch: 54, step: 1068, loss: 0.3186592757701874, mean loss: 0.34113426227499155
Epoch: 54, step: 1069, loss: 0.3903045654296875, mean loss: 0.3411348843216878
Epoch: 54, step: 1070, loss: 0.3461185395717621, mean loss: 0.34113494736842265
Epoch: 54, step: 1071, loss: 0.3349388539791107, mean loss: 0.3411348689844864
Epoch: 54, step: 1072, loss: 0.3106897175312042, mean loss: 0.34113448384170847
Epoch: 54, step: 1073, loss: 0.3136885464191437, mean loss: 0.34113413664452413
Epoch: 54, step: 1074, loss: 0.347909152507782, mean loss: 0.34113422234889046
Epoch: 54, step: 1075, loss: 0.38714760541915894, mean loss: 0.3411348044136462
Epoch: 54, step: 1076, loss: 0.28796520829200745, mean loss: 0.3411341318320095
Epoch: 54, step: 1077, loss: 0.2991291582584381, mean loss: 0.34113360048668134
Epoch: 54, step: 1078, loss: 0.3104326128959656, mean loss: 0.3411332121369553
Epoch: 54, step: 1079, loss: 0.32632899284362793, mean loss: 0.34113302487451735
Epoch: 54, step: 1080, loss: 0.30250629782676697, mean loss: 0.34113253628113477
Epoch: 54, step: 1081, loss: 0.33304837346076965, mean loss: 0.3411324340250339
Epoch: 54, step: 1082, loss: 0.34036293625831604, mean loss: 0.34113242429182494
Epoch: 54, step: 1083, loss: 0.3232242166996002, mean loss: 0.34113219777768894
Epoch: 54, step: 1084, loss: 0.3334702253341675, mean loss: 0.34113210086552687
Epoch: 54, step: 1085, loss: 0.3261684477329254, mean loss: 0.341131911600733
Epoch: 54, step: 1086, loss: 0.28417572379112244, mean loss: 0.3411311912108185
Epoch: 54, step: 1087, loss: 0.31519049406051636, mean loss: 0.3411308631133639
Epoch: 54, step: 1088, loss: 0.35489845275878906, mean loss: 0.341131037243379
Epoch: 54, step: 1089, loss: 0.3467932343482971, mean loss: 0.34113110885693104
Epoch: 54, step: 1090, loss: 0.30283123254776, mean loss: 0.3411306244591885
Epoch: 54, step: 1091, loss: 0.3542616665363312, mean loss: 0.34113079053196227
Epoch: 54, step: 1092, loss: 0.29094818234443665, mean loss: 0.34113015586340456
Epoch: 54, step: 1093, loss: 0.3014884293079376, mean loss: 0.34112965451363153
Epoch: 54, step: 1094, loss: 0.3658618628978729, mean loss: 0.34112996729845
Epoch: 54, step: 1095, loss: 0.2898466885089874, mean loss: 0.3411293187341189
Epoch: 54, step: 1096, loss: 0.32335031032562256, mean loss: 0.3411290938911458
Epoch: 54, step: 1097, loss: 0.35530227422714233, mean loss: 0.34112927313059666
Epoch: 54, step: 1098, loss: 0.3097907304763794, mean loss: 0.34112887681643095
Epoch: 54, step: 1099, loss: 0.34189027547836304, mean loss: 0.3411288864451256
Epoch: 54, step: 1100, loss: 0.3489496111869812, mean loss: 0.34112898534524505
Epoch: 54, step: 1101, loss: 0.3017899990081787, mean loss: 0.3411284878745663
Epoch: 54, step: 1102, loss: 0.35131627321243286, mean loss: 0.3411286167050439
Epoch: 54, step: 1103, loss: 0.3373144268989563, mean loss: 0.3411285684730029
Epoch: 54, step: 1104, loss: 0.32607555389404297, mean loss: 0.34112837812368285
Epoch: 54, step: 1105, loss: 0.3363855183124542, mean loss: 0.34112831814973416
Epoch: 54, step: 1106, loss: 0.3169776499271393, mean loss: 0.3411280127659194
Epoch: 54, step: 1107, loss: 0.3281816840171814, mean loss: 0.34112784906240484
Epoch: 54, step: 1108, loss: 0.3366086184978485, mean loss: 0.34112779191843867
Epoch: 54, step: 1109, loss: 0.3399713933467865, mean loss: 0.34112777729639976
Epoch: 54, step: 1110, loss: 0.3240763545036316, mean loss: 0.34112756169304154
Epoch: 54, step: 1111, loss: 0.30388784408569336, mean loss: 0.34112709082871817
Epoch: 54, step: 1112, loss: 0.36174529790878296, mean loss: 0.3411273515249854
Epoch: 54, step: 1113, loss: 0.3680969476699829, mean loss: 0.3411276925237987
Epoch: 54, step: 1114, loss: 0.31225186586380005, mean loss: 0.34112732742755947
Epoch: 54, step: 1115, loss: 0.3231279253959656, mean loss: 0.3411270998520521
Epoch: 54, step: 1116, loss: 0.35643190145492554, mean loss: 0.34112729335592223
Epoch: 54, step: 1117, loss: 0.3298254907131195, mean loss: 0.34112715046515124
Epoch: 54, step: 1118, loss: 0.3153988718986511, mean loss: 0.3411268251819024
Epoch: 54, step: 1119, loss: 0.34418749809265137, mean loss: 0.3411268638775749
Epoch: 54, step: 1120, loss: 0.32740649580955505, mean loss: 0.3411266904150154
Epoch: 54, step: 1121, loss: 0.3474556803703308, mean loss: 0.3411267704295538
Epoch: 54, step: 1122, loss: 0.34773004055023193, mean loss: 0.341126853910636
Epoch: 54, step: 1123, loss: 0.33674097061157227, mean loss: 0.3411267984633124
Epoch: 54, step: 1124, loss: 0.3148208558559418, mean loss: 0.3411264659018706
Epoch: 54, step: 1125, loss: 0.3525005280971527, mean loss: 0.3411266096916888
Epoch: 54, step: 1126, loss: 0.32140782475471497, mean loss: 0.34112636041182665
Epoch: 54, step: 1127, loss: 0.3752007782459259, mean loss: 0.3411267911665019
Epoch: 54, step: 1128, loss: 0.3192327320575714, mean loss: 0.34112651439437486
Epoch: 54, step: 1129, loss: 0.32979610562324524, mean loss: 0.341126371163662
Epoch: 54, step: 1130, loss: 0.3327926695346832, mean loss: 0.34112626581645344
Epoch: 54, step: 1131, loss: 0.33687064051628113, mean loss: 0.3411262120213215
Epoch: 54, step: 1132, loss: 0.3182891607284546, mean loss: 0.3411259233430258
Epoch: 54, step: 1133, loss: 0.3225359320640564, mean loss: 0.3411256883538806
Epoch: 54, step: 1134, loss: 0.30713364481925964, mean loss: 0.3411252586785695
Epoch: 54, step: 1135, loss: 0.34358447790145874, mean loss: 0.3411252897638565
Epoch: 54, step: 1136, loss: 0.3913624584674835, mean loss: 0.34112592476908576
Epoch: 54, step: 1137, loss: 0.34141451120376587, mean loss: 0.34112592841681477
Epoch: 54, step: 1138, loss: 0.33263465762138367, mean loss: 0.34112582108861156
Epoch: 54, step: 1139, loss: 0.3618990480899811, mean loss: 0.3411260836553111
Epoch: 54, step: 1140, loss: 0.3313388526439667, mean loss: 0.34112595994952083
Epoch: 54, step: 1141, loss: 0.3324326276779175, mean loss: 0.34112585007146184
Epoch: 54, step: 1142, loss: 0.33586636185646057, mean loss: 0.3411257835957959
Epoch: 54, step: 1143, loss: 0.327542781829834, mean loss: 0.34112561191983826
Epoch: 54, step: 1144, loss: 0.32514992356300354, mean loss: 0.3411254100051967
Epoch: 54, step: 1145, loss: 0.31907135248184204, mean loss: 0.34112513127036287
Epoch: 54, step: 1146, loss: 0.2955424189567566, mean loss: 0.34112455517096935
Epoch: 54, step: 1147, loss: 0.3153687119483948, mean loss: 0.34112422965856826
Epoch: 54, step: 1148, loss: 0.36902672052383423, mean loss: 0.34112458229668347
Epoch: 54, step: 1149, loss: 0.323458731174469, mean loss: 0.341124359034404
Epoch: 54, step: 1150, loss: 0.3067445158958435, mean loss: 0.3411239245449992
Epoch: 54, step: 1151, loss: 0.3188064694404602, mean loss: 0.3411236425025477
Epoch: 54, step: 1152, loss: 0.33275172114372253, mean loss: 0.3411235367016231
Epoch: 54, step: 1153, loss: 0.4017755389213562, mean loss: 0.3411243031871813
Epoch: 54, step: 1154, loss: 0.3224877119064331, mean loss: 0.3411240676715012
Epoch: 54, step: 1155, loss: 0.32454776763916016, mean loss: 0.34112385819493
Epoch: 54, step: 1156, loss: 0.36505720019340515, mean loss: 0.34112416063944745
Epoch: 54, step: 1157, loss: 0.33339840173721313, mean loss: 0.3411240630106292
Epoch: 54, step: 1158, loss: 0.34307044744491577, mean loss: 0.34112408760637614
Epoch: 54, step: 1159, loss: 0.34173014760017395, mean loss: 0.34112409526483745
Epoch: 54, step: 1160, loss: 0.3173377513885498, mean loss: 0.3411237946931216
Epoch: 54, step: 1161, loss: 0.36127007007598877, mean loss: 0.34112404926457124
Epoch: 54, step: 1162, loss: 0.331329882144928, mean loss: 0.3411239255055255
Epoch: 54, step: 1163, loss: 0.30099043250083923, mean loss: 0.34112341838532073
Epoch: 54, step: 1164, loss: 0.30875831842422485, mean loss: 0.34112300943041796
Epoch: 54, step: 1165, loss: 0.39421066641807556, mean loss: 0.34112368022035233
Epoch: 54, step: 1166, loss: 0.31355512142181396, mean loss: 0.3411233318817905
Epoch: 54, step: 1167, loss: 0.29222992062568665, mean loss: 0.34112271410392664
Epoch: 54, step: 1168, loss: 0.35399922728538513, mean loss: 0.34112287679914655
Epoch: 54, step: 1169, loss: 0.34339335560798645, mean loss: 0.34112290548636776
Epoch: 54, step: 1170, loss: 0.34038814902305603, mean loss: 0.3411228962029273
Epoch: 54, step: 1171, loss: 0.3270193636417389, mean loss: 0.34112271801102656
Epoch: 54, step: 1172, loss: 0.3225483298301697, mean loss: 0.341122483334806
Epoch: 54, step: 1173, loss: 0.3311466872692108, mean loss: 0.3411223572982164
Epoch: 54, step: 1174, loss: 0.3401870131492615, mean loss: 0.34112234548100434
Epoch: 54, step: 1175, loss: 0.353945255279541, mean loss: 0.3411225074846151
Epoch: 54, step: 1176, loss: 0.3302885890007019, mean loss: 0.3411223706114898
Epoch: 54, step: 1177, loss: 0.33183908462524414, mean loss: 0.341122253330165
Epoch: 54, step: 1178, loss: 0.33319446444511414, mean loss: 0.34112215317491407
Epoch: 54, step: 1179, loss: 0.31643611192703247, mean loss: 0.34112184130921536
Epoch: 54, step: 1180, loss: 0.31822115182876587, mean loss: 0.3411215520020223
Epoch: 54, step: 1181, loss: 0.34133151173591614, mean loss: 0.34112155465443567
Epoch: 54, step: 1182, loss: 0.28181397914886475, mean loss: 0.3411208054335574
Epoch: 54, step: 1183, loss: 0.29392698407173157, mean loss: 0.34112020925087216
Epoch: 54, step: 1184, loss: 0.31983625888824463, mean loss: 0.3411199403817275
Epoch: 54, step: 1185, loss: 0.3207012712955475, mean loss: 0.3411196824464923
Epoch: 54, step: 1186, loss: 0.32584676146507263, mean loss: 0.3411194895164495
Epoch: 54, step: 1187, loss: 0.3154231905937195, mean loss: 0.3411191649206872
Epoch: 54, step: 1188, loss: 0.3403325080871582, mean loss: 0.3411191549837601
Epoch: 54, step: 1189, loss: 0.32986223697662354, mean loss: 0.3411190127899142
Epoch: 54, step: 1190, loss: 0.3375893831253052, mean loss: 0.34111896820530613
Epoch: 54, step: 1191, loss: 0.347540944814682, mean loss: 0.34111904932364445
Epoch: 54, step: 1192, loss: 0.31667765974998474, mean loss: 0.3411187405994017
Epoch: 54, step: 1193, loss: 0.3083671033382416, mean loss: 0.34111832691192845
Epoch: 54, step: 1194, loss: 0.3395419120788574, mean loss: 0.3411183070004099
Epoch: 54, step: 1195, loss: 0.3259516656398773, mean loss: 0.3411181154346877
Epoch: 54, step: 1196, loss: 0.3254234790802002, mean loss: 0.3411179172025081
Epoch: 54, step: 1197, loss: 0.37154433131217957, mean loss: 0.3411183015005619
Epoch: 54, step: 1198, loss: 0.35380053520202637, mean loss: 0.3411184616803371
Epoch: 54, step: 1199, loss: 0.30063197016716003, mean loss: 0.3411179503323085
Epoch: 54, step: 1200, loss: 0.35779014229774475, mean loss: 0.34111816090093283
Epoch: 54, step: 1201, loss: 0.3347588777542114, mean loss: 0.3411180805846436
Epoch: 54, step: 1202, loss: 0.33047860860824585, mean loss: 0.34111794621224717
Epoch: 54, step: 1203, loss: 0.3256487250328064, mean loss: 0.3411177508444626
Epoch: 54, step: 1204, loss: 0.33118411898612976, mean loss: 0.34111762538972146
Epoch: 54, step: 1205, loss: 0.30358633399009705, mean loss: 0.34111715140205506
Epoch: 54, step: 1206, loss: 0.32807257771492004, mean loss: 0.3411169866624811
Epoch: 54, step: 1207, loss: 0.36409667134284973, mean loss: 0.3411172768686424
Epoch: 54, step: 1208, loss: 0.34415826201438904, mean loss: 0.3411173152721929
Epoch: 54, step: 1209, loss: 0.3223871886730194, mean loss: 0.341117078738884
Epoch: 54, step: 1210, loss: 0.326265811920166, mean loss: 0.34111689119210464
Epoch: 54, step: 1211, loss: 0.33350178599357605, mean loss: 0.34111679502721604
Epoch: 54, step: 1212, loss: 0.34144699573516846, mean loss: 0.34111679919699606
Epoch: 54, step: 1213, loss: 0.30669280886650085, mean loss: 0.341116364495767
Epoch: 54, step: 1214, loss: 0.337715208530426, mean loss: 0.341116321546998
Epoch: 54, step: 1215, loss: 0.34588003158569336, mean loss: 0.3411163817009282
Epoch: 54, step: 1216, loss: 0.3035127818584442, mean loss: 0.34111590686603316
Epoch: 54, step: 1217, loss: 0.33823809027671814, mean loss: 0.34111587052721215
Epoch: 54, step: 1218, loss: 0.31789085268974304, mean loss: 0.3411155772635233
Epoch: 54, step: 1219, loss: 0.3578716516494751, mean loss: 0.34111578884080485
Epoch: 54, step: 1220, loss: 0.31825605034828186, mean loss: 0.3411155001968096
Epoch: 54, step: 1221, loss: 0.33827266097068787, mean loss: 0.34111546430146844
Epoch: 54, step: 1222, loss: 0.3853365182876587, mean loss: 0.3411160226551596
Epoch: 54, step: 1223, loss: 0.37203994393348694, mean loss: 0.3411164131087111
Epoch: 54, step: 1224, loss: 0.31939709186553955, mean loss: 0.34111613887831954
Epoch: 54, step: 1225, loss: 0.32937943935394287, mean loss: 0.3411159906914111
Epoch: 54, step: 1226, loss: 0.3213929533958435, mean loss: 0.34111574167259495
Epoch: 54, step: 1227, loss: 0.3125712275505066, mean loss: 0.34111538128026475
Epoch: 54, step: 1228, loss: 0.3391210734844208, mean loss: 0.34111535610120036
Epoch: 54, step: 1229, loss: 0.32724419236183167, mean loss: 0.3411151809735113
Epoch: 54, step: 1230, loss: 0.3740094006061554, mean loss: 0.341115596267862
Epoch: 54, step: 1231, loss: 0.3800988793373108, mean loss: 0.3411160884313186
Epoch: 54, step: 1232, loss: 0.3272375762462616, mean loss: 0.3411159132174895
Epoch: 54, step: 1233, loss: 0.37077876925468445, mean loss: 0.34111628770121677
Epoch: 54, step: 1234, loss: 0.31715166568756104, mean loss: 0.34111598515962516
Epoch: 54, step: 1235, loss: 0.30641424655914307, mean loss: 0.3411155470727368
Epoch: 54, step: 1236, loss: 0.29576578736305237, mean loss: 0.34111497456873224
Epoch: 54, step: 1237, loss: 0.3290177881717682, mean loss: 0.34111482185347486
Epoch: 54, step: 1238, loss: 0.3244362771511078, mean loss: 0.3411146113056657
Epoch: 54, step: 1239, loss: 0.3521144986152649, mean loss: 0.34111475016507936
Epoch: 54, step: 1240, loss: 0.3072545826435089, mean loss: 0.3411143227294592
Epoch: 54, step: 1241, loss: 0.35583069920539856, mean loss: 0.3411145085000729
Epoch: 54, step: 1242, loss: 0.28743085265159607, mean loss: 0.3411138308387057
Epoch: 54, step: 1243, loss: 0.30766502022743225, mean loss: 0.34111340861186135
Epoch: 54, step: 1244, loss: 0.30338212847709656, mean loss: 0.3411129323330952
Epoch: 54, step: 1245, loss: 0.3075127601623535, mean loss: 0.34111250820631006
Epoch: 54, step: 1246, loss: 0.3197905421257019, mean loss: 0.34111223906772553
Epoch: 54, step: 1247, loss: 0.3502752184867859, mean loss: 0.3411123547268619
Epoch: 54, step: 1248, loss: 0.30781763792037964, mean loss: 0.34111193447167976
Epoch: 54, step: 1249, loss: 0.34082701802253723, mean loss: 0.3411119308754304
Epoch: 54, step: 1250, loss: 0.3462580740451813, mean loss: 0.34111199582984203
Epoch: 54, step: 1251, loss: 0.2996380031108856, mean loss: 0.34111147235338524
Epoch: 54, step: 1252, loss: 0.3394750952720642, mean loss: 0.3411114516996211
Epoch: 54, step: 1253, loss: 0.3322945237159729, mean loss: 0.34111134041692537
Epoch: 54, step: 1254, loss: 0.30869951844215393, mean loss: 0.34111093133686865
Epoch: 54, step: 1255, loss: 0.3385940194129944, mean loss: 0.3411108995705126
Epoch: 54, step: 1256, loss: 0.32639074325561523, mean loss: 0.34111071378736274
Epoch: 54, step: 1257, loss: 0.3529141843318939, mean loss: 0.3411108627571301
Epoch: 54, step: 1258, loss: 0.3109923005104065, mean loss: 0.3411104826402342
Epoch: 54, step: 1259, loss: 0.3003361225128174, mean loss: 0.3411099680463611
Epoch: 54, step: 1260, loss: 0.3342013657093048, mean loss: 0.3411098808572659
Epoch: 54, step: 1261, loss: 0.3132433295249939, mean loss: 0.34110952917560644
Epoch: 54, step: 1262, loss: 0.30654579401016235, mean loss: 0.3411090929796024
Epoch: 54, step: 1263, loss: 0.3103635013103485, mean loss: 0.34110870497365
Epoch: 54, step: 1264, loss: 0.3468092381954193, mean loss: 0.3411087769128383
Epoch: 54, step: 1265, loss: 0.34274977445602417, mean loss: 0.34110879762152235
Epoch: 54, step: 1266, loss: 0.33173149824142456, mean loss: 0.34110867928552574
Epoch: 54, step: 1267, loss: 0.3548371195793152, mean loss: 0.3411088525281724
Epoch: 54, step: 1268, loss: 0.3487849533557892, mean loss: 0.34110894939360026
Epoch: 54, step: 1269, loss: 0.3424883186817169, mean loss: 0.3411089667997695
Epoch: 54, step: 1270, loss: 0.34790945053100586, mean loss: 0.34110905261353824
Epoch: 54, step: 1271, loss: 0.3420610725879669, mean loss: 0.34110906462671176
Epoch: 54, step: 1272, loss: 0.3425271511077881, mean loss: 0.34110908252077327
Epoch: 54, step: 1273, loss: 0.3300669491291046, mean loss: 0.3411089431878598
Epoch: 54, step: 1274, loss: 0.31960710883140564, mean loss: 0.34110867187476146
Epoch: 54, step: 1275, loss: 0.33858978748321533, mean loss: 0.3411086400915334
Epoch: 54, step: 1276, loss: 0.3651600778102875, mean loss: 0.3411089435682184
Epoch: 54, step: 1277, loss: 0.3073238432407379, mean loss: 0.34110851727932034
Epoch: 54, step: 1278, loss: 0.3287454843521118, mean loss: 0.34110836128874655
Epoch: 54, step: 1279, loss: 0.29348474740982056, mean loss: 0.34110776040535756
Epoch: 54, step: 1280, loss: 0.29207929968833923, mean loss: 0.34110714180434165
Epoch: 54, step: 1281, loss: 0.29890310764312744, mean loss: 0.3411066093150767
Epoch: 54, step: 1282, loss: 0.3428471088409424, mean loss: 0.34110663127472196
Epoch: 54, step: 1283, loss: 0.304050087928772, mean loss: 0.34110616374326413
Epoch: 54, step: 1284, loss: 0.3184336721897125, mean loss: 0.34110587769474654
Epoch: 54, step: 1285, loss: 0.32421350479125977, mean loss: 0.3411056645740468
Epoch: 54, step: 1286, loss: 0.32274097204208374, mean loss: 0.34110543288091716
Epoch: 54, step: 1287, loss: 0.3783377408981323, mean loss: 0.34110590260624035
Epoch: 54, step: 1288, loss: 0.3026469051837921, mean loss: 0.34110541741104167
Epoch: 54, step: 1289, loss: 0.3502010703086853, mean loss: 0.34110553215952016
Epoch: 54, step: 1290, loss: 0.29933619499206543, mean loss: 0.3411050052146734
Epoch: 54, step: 1291, loss: 0.2895612120628357, mean loss: 0.34110435496749736
Epoch: 54, step: 1292, loss: 0.3524203896522522, mean loss: 0.3411044977223534
Epoch: 54, step: 1293, loss: 0.3024680018424988, mean loss: 0.3411040103185956
Epoch: 54, step: 1294, loss: 0.3011937439441681, mean loss: 0.3411035068524305
Epoch: 54, step: 1295, loss: 0.3249876797199249, mean loss: 0.3411033035545809
Epoch: 54, step: 1296, loss: 0.34581518173217773, mean loss: 0.34110336299320665
Epoch: 54, step: 1297, loss: 0.3212927579879761, mean loss: 0.3411031130927979
Epoch: 54, step: 1298, loss: 0.3665233850479126, mean loss: 0.34110343375217295
Epoch: 54, step: 1299, loss: 0.31426888704299927, mean loss: 0.34110309525695737
Epoch: 54, step: 1300, loss: 0.30792665481567383, mean loss: 0.3411026767693703
Epoch: 54, step: 1301, loss: 0.29996320605278015, mean loss: 0.3411021578426729
Epoch: 54, step: 1302, loss: 0.3047986328601837, mean loss: 0.3411016999215969
Epoch: 54, step: 1303, loss: 0.38017311692237854, mean loss: 0.3411021927497629
Epoch: 54, step: 1304, loss: 0.31627604365348816, mean loss: 0.3411018796085425
Epoch: 54, step: 1305, loss: 0.3586253225803375, mean loss: 0.3411021006352947
Epoch: 54, step: 1306, loss: 0.3419943153858185, mean loss: 0.341102111888839
Epoch: 54, step: 1307, loss: 0.383932888507843, mean loss: 0.3411026521085128
Epoch: 54, step: 1308, loss: 0.34662654995918274, mean loss: 0.3411027217799242
Epoch: 54, step: 1309, loss: 0.3464004099369049, mean loss: 0.34110278859737186
Epoch: 54, step: 1310, loss: 0.34913167357444763, mean loss: 0.34110288986094567
Epoch: 54, step: 1311, loss: 0.33853235840797424, mean loss: 0.34110285744076285
Epoch: 54, step: 1312, loss: 0.3068266808986664, mean loss: 0.34110242514654115
Epoch: 54, step: 1313, loss: 0.3010431230068207, mean loss: 0.3411019199213912
Epoch: 54, step: 1314, loss: 0.32119548320770264, mean loss: 0.3411016688659535
Epoch: 54, step: 1315, loss: 0.3316062092781067, mean loss: 0.3411015491128941
Epoch: 54, step: 1316, loss: 0.302249938249588, mean loss: 0.34110105913760164
Epoch: 54, step: 1317, loss: 0.32010331749916077, mean loss: 0.34110079432889434
Epoch: 54, step: 1318, loss: 0.30005696415901184, mean loss: 0.3411002767195852
Epoch: 54, step: 1319, loss: 0.35799461603164673, mean loss: 0.34110048977370283
Epoch: 54, step: 1320, loss: 0.3306674659252167, mean loss: 0.3411003582047425
Epoch: 54, step: 1321, loss: 0.3639604449272156, mean loss: 0.3411006464854901
Epoch: 54, step: 1322, loss: 0.34767916798591614, mean loss: 0.3411007294439322
Epoch: 54, step: 1323, loss: 0.3280446529388428, mean loss: 0.34110056480236217
Epoch: 54, step: 1324, loss: 0.32764264941215515, mean loss: 0.341100395095607
Epoch: 54, step: 1325, loss: 0.34968963265419006, mean loss: 0.34110050340608544
Epoch: 54, step: 1326, loss: 0.3634895086288452, mean loss: 0.34110078572838376
Epoch: 54, step: 1327, loss: 0.3646349012851715, mean loss: 0.3411010824866249
Epoch: 54, step: 1328, loss: 0.322459876537323, mean loss: 0.3411008474294917
Epoch: 54, step: 1329, loss: 0.32638323307037354, mean loss: 0.34110066184940496
Epoch: 54, step: 1330, loss: 0.32135719060897827, mean loss: 0.3411004128994858
Epoch: 54, step: 1331, loss: 0.32630330324172974, mean loss: 0.3411002263217174
Epoch: 54, step: 1332, loss: 0.3117768168449402, mean loss: 0.34109985658550235
Epoch: 54, step: 1333, loss: 0.38202497363090515, mean loss: 0.34110037260009124
Epoch: 54, step: 1334, loss: 0.3165958821773529, mean loss: 0.34110006363298173
Epoch: 54, step: 1335, loss: 0.3055534362792969, mean loss: 0.3410996154457294
Epoch: 54, step: 1336, loss: 0.3098887801170349, mean loss: 0.3410992219309799
Epoch: 54, step: 1337, loss: 0.3268478512763977, mean loss: 0.34109904224806575
Epoch: 54, step: 1338, loss: 0.3757915496826172, mean loss: 0.3410994796496598
Epoch: 54, step: 1339, loss: 0.29975226521492004, mean loss: 0.3410989583523877
Epoch: 54, step: 1340, loss: 0.33041706681251526, mean loss: 0.3410988236789691
Epoch: 54, step: 1341, loss: 0.3719688653945923, mean loss: 0.3410992128723642
Epoch: 54, step: 1342, loss: 0.35335060954093933, mean loss: 0.34109936732964014
Epoch: 54, step: 1343, loss: 0.3364817500114441, mean loss: 0.3410993091145958
Epoch: 54, step: 1344, loss: 0.31926336884498596, mean loss: 0.3410990338288547
Epoch: 54, step: 1345, loss: 0.33871203660964966, mean loss: 0.34109900373635554
Epoch: 54, step: 1346, loss: 0.3189144730567932, mean loss: 0.34109872406298614
Epoch: 54, step: 1347, loss: 0.34503045678138733, mean loss: 0.34109877362847346
Epoch: 54, step: 1348, loss: 0.32971706986427307, mean loss: 0.3410986301465477
Epoch: 54, step: 1349, loss: 0.3117921054363251, mean loss: 0.34109826070242205
Epoch: 54, step: 1350, loss: 0.3489646017551422, mean loss: 0.3410983598658979
Epoch: 54, step: 1351, loss: 0.31620997190475464, mean loss: 0.34109804612563016
Epoch: 54, step: 1352, loss: 0.33504384756088257, mean loss: 0.34109796980803425
Epoch: 54, step: 1353, loss: 0.3557192087173462, mean loss: 0.34109815411710914
Epoch: 54, step: 1354, loss: 0.32395198941230774, mean loss: 0.3410979379826257
Epoch: 54, step: 1355, loss: 0.3093862533569336, mean loss: 0.34109753824879036
Epoch: 54, step: 1356, loss: 0.30235710740089417, mean loss: 0.34109704992198
Epoch: 54, step: 1357, loss: 0.36708593368530273, mean loss: 0.3410973775101989
Epoch: 54, step: 1358, loss: 0.3218648135662079, mean loss: 0.3410971350880152
Epoch: 54, step: 1359, loss: 0.3236350119113922, mean loss: 0.3410969149846173
Epoch: 54, step: 1360, loss: 0.3097235858440399, mean loss: 0.3410965195407621
Epoch: 54, step: 1361, loss: 0.3583988845348358, mean loss: 0.34109673762497134
Epoch: 54, step: 1362, loss: 0.34565356373786926, mean loss: 0.34109679505985346
Epoch: 54, step: 1363, loss: 0.33508437871932983, mean loss: 0.34109671927946095
Epoch: 54, step: 1364, loss: 0.3233930468559265, mean loss: 0.34109649614548954
Epoch: 54, step: 1365, loss: 0.3509896695613861, mean loss: 0.3410966208357345
Epoch: 54, step: 1366, loss: 0.3474856913089752, mean loss: 0.3410967013604244
Epoch: 54, step: 1367, loss: 0.3263302445411682, mean loss: 0.34109651525363854
Epoch: 54, step: 1368, loss: 0.3364616930484772, mean loss: 0.34109645684010015
Epoch: 54, step: 1369, loss: 0.33149954676628113, mean loss: 0.3410963358899568
Epoch: 54, step: 1370, loss: 0.3647027015686035, mean loss: 0.34109663339793667
Epoch: 54, step: 1371, loss: 0.3256646394729614, mean loss: 0.34109643891296004
Epoch: 54, step: 1372, loss: 0.2979923188686371, mean loss: 0.3410958956909907
Epoch: 54, step: 1373, loss: 0.3346043527126312, mean loss: 0.34109581388200544
Epoch: 54, step: 1374, loss: 0.32493627071380615, mean loss: 0.34109561023563467
Epoch: 54, step: 1375, loss: 0.2932605445384979, mean loss: 0.34109500741446197
Epoch: 54, step: 1376, loss: 0.3137766420841217, mean loss: 0.34109466315066184
Epoch: 54, step: 1377, loss: 0.32973337173461914, mean loss: 0.3410945199784031
Epoch: 54, step: 1378, loss: 0.3594924807548523, mean loss: 0.34109475182215304
Epoch: 54, step: 1379, loss: 0.3914830982685089, mean loss: 0.34109538678795837
Epoch: 54, step: 1380, loss: 0.3277396857738495, mean loss: 0.34109521848899277
Epoch: 54, step: 1381, loss: 0.35274451971054077, mean loss: 0.3410953652832822
Epoch: 54, step: 1382, loss: 0.3592578172683716, mean loss: 0.34109559414770824
Epoch: 54, step: 1383, loss: 0.37425696849823, mean loss: 0.3410960120077681
Epoch: 54, step: 1384, loss: 0.3315955102443695, mean loss: 0.3410958922952927
Epoch: 54, step: 1385, loss: 0.2967049479484558, mean loss: 0.34109533294769123
Epoch: 54, step: 1386, loss: 0.3161565661430359, mean loss: 0.3410950187109965
Epoch: 54, step: 1387, loss: 0.30542951822280884, mean loss: 0.34109456931957866
Epoch: 54, step: 1388, loss: 0.30607569217681885, mean loss: 0.3410941280812854
Epoch: 54, step: 1389, loss: 0.3126422166824341, mean loss: 0.3410937695913603
Epoch: 54, step: 1390, loss: 0.3497733175754547, mean loss: 0.3410938789510184
Epoch: 54, step: 1391, loss: 0.32279160618782043, mean loss: 0.34109364835086764
Epoch: 54, step: 1392, loss: 0.35732388496398926, mean loss: 0.3410938528417471
Epoch: 54, step: 1393, loss: 0.3522461950778961, mean loss: 0.3410939933525476
Epoch: 54, step: 1394, loss: 0.29549509286880493, mean loss: 0.3410934188492594
Epoch: 54, step: 1395, loss: 0.3518274128437042, mean loss: 0.3410935540857911
Epoch: 54, step: 1396, loss: 0.32815882563591003, mean loss: 0.3410933911244762
Epoch: 54, step: 1397, loss: 0.34428897500038147, mean loss: 0.3410934313843078
Epoch: 54, step: 1398, loss: 0.3571203351020813, mean loss: 0.3410936332980554
Epoch: 54, step: 1399, loss: 0.3359498083591461, mean loss: 0.3410935684947781
Epoch: 54, step: 1400, loss: 0.35127267241477966, mean loss: 0.3410936967322262
Epoch: 54, step: 1401, loss: 0.3439825773239136, mean loss: 0.34109373312619673
Epoch: 54, step: 1402, loss: 0.34325748682022095, mean loss: 0.3410937603847121
Epoch: 54, step: 1403, loss: 0.3452565670013428, mean loss: 0.3410938128262165
Epoch: 54, step: 1404, loss: 0.3562124967575073, mean loss: 0.3410940032834283
Epoch: 54, step: 1405, loss: 0.31940758228302, mean loss: 0.34109373009276794
Epoch: 54, step: 1406, loss: 0.32301250100135803, mean loss: 0.34109350232071234
Epoch: 54, step: 1407, loss: 0.33009040355682373, mean loss: 0.3410933637147116
Epoch: 54, step: 1408, loss: 0.39674413204193115, mean loss: 0.34109406473843557
Epoch: 54, step: 1409, loss: 0.3368246555328369, mean loss: 0.3410940109580561
Epoch: 54, step: 1410, loss: 0.34360960125923157, mean loss: 0.3410940426457417
Epoch: 54, step: 1411, loss: 0.3482016921043396, mean loss: 0.3410941321762685
Epoch: 54, step: 1412, loss: 0.326601505279541, mean loss: 0.3410939496241908
Epoch: 54, step: 1413, loss: 0.33395716547966003, mean loss: 0.3410938597289377
Epoch: 54, step: 1414, loss: 0.34613725543022156, mean loss: 0.3410939232549759
Epoch: 54, step: 1415, loss: 0.3381251096725464, mean loss: 0.3410938858606089
Epoch: 54, step: 1416, loss: 0.3322089612483978, mean loss: 0.34109377394992896
Epoch: 54, step: 1417, loss: 0.34901124238967896, mean loss: 0.341093873673692
Epoch: 54, step: 1418, loss: 0.31981804966926575, mean loss: 0.34109360569933583
Epoch: 54, step: 1419, loss: 0.38252365589141846, mean loss: 0.341094127514669
Epoch: 54, step: 1420, loss: 0.30683714151382446, mean loss: 0.3410936960501804
Epoch: 54, step: 1421, loss: 0.3247452974319458, mean loss: 0.34109349014576695
Epoch: 54, step: 1422, loss: 0.33259955048561096, mean loss: 0.3410933831678496
Epoch: 54, step: 1423, loss: 0.37899190187454224, mean loss: 0.34109386047916834
Epoch: 54, step: 1424, loss: 0.3208785057067871, mean loss: 0.34109360588092935
Epoch: 54, step: 1425, loss: 0.3224552571773529, mean loss: 0.34109337114693394
Epoch: 54, step: 1426, loss: 0.3203967809677124, mean loss: 0.34109311049443747
Epoch: 54, step: 1427, loss: 0.3376842439174652, mean loss: 0.3410930675637718
Epoch: 54, step: 1428, loss: 0.3444487452507019, mean loss: 0.3410931098240537
Epoch: 54, step: 1429, loss: 0.3878060579299927, mean loss: 0.3410936981038828
Epoch: 54, step: 1430, loss: 0.3048650324344635, mean loss: 0.34109324186368145
Epoch: 54, step: 1431, loss: 0.3265964388847351, mean loss: 0.3410930593026929
Epoch: 54, step: 1432, loss: 0.3588015139102936, mean loss: 0.34109328230581104
Epoch: 54, step: 1433, loss: 0.3413445055484772, mean loss: 0.3410932854694333
Epoch: 54, step: 1434, loss: 0.32506680488586426, mean loss: 0.3410930836525492
Epoch: 54, step: 1435, loss: 0.33022651076316833, mean loss: 0.34109294681462937
Epoch: 54, step: 1436, loss: 0.34166470170021057, mean loss: 0.3410929540143937
Epoch: 54, step: 1437, loss: 0.33178073167800903, mean loss: 0.3410928367526724
Epoch: 54, step: 1438, loss: 0.304563969373703, mean loss: 0.3410923767782673
Epoch: 54, step: 1439, loss: 0.3534080386161804, mean loss: 0.34109253185610855
Epoch: 54, step: 1440, loss: 0.32705432176589966, mean loss: 0.3410923550903016
Epoch: 54, step: 1441, loss: 0.28387635946273804, mean loss: 0.3410916346491469
Epoch: 54, step: 1442, loss: 0.2961004078388214, mean loss: 0.3410910681445723
Epoch: 54, step: 1443, loss: 0.31530243158340454, mean loss: 0.34109074343245244
Valid: 54, mean loss: 0.18479694177707034
Epoch: 55, step: 0, loss: 0.2793286144733429, mean loss: 0.3410899657775632
Epoch: 55, step: 1, loss: 0.32890447974205017, mean loss: 0.34108981235047703
Epoch: 55, step: 2, loss: 0.329369455575943, mean loss: 0.3410896647816774
Epoch: 55, step: 3, loss: 0.34773334860801697, mean loss: 0.3410897484299931
Epoch: 55, step: 4, loss: 0.3251136541366577, mean loss: 0.34108954728307095
Epoch: 55, step: 5, loss: 0.2967257499694824, mean loss: 0.34108898872797166
Epoch: 55, step: 6, loss: 0.30424171686172485, mean loss: 0.3410885248142916
Epoch: 55, step: 7, loss: 0.3443650007247925, mean loss: 0.34108856606518434
Epoch: 55, step: 8, loss: 0.3068220317363739, mean loss: 0.3410881346543101
Epoch: 55, step: 9, loss: 0.33122071623802185, mean loss: 0.3410880104264564
Epoch: 55, step: 10, loss: 0.2766696810722351, mean loss: 0.34108719942912097
Epoch: 55, step: 11, loss: 0.3349151909351349, mean loss: 0.3410871217273321
Epoch: 55, step: 12, loss: 0.3468056619167328, mean loss: 0.3410871937193277
Epoch: 55, step: 13, loss: 0.37334099411964417, mean loss: 0.34108759976460307
Epoch: 55, step: 14, loss: 0.32658419013023376, mean loss: 0.3410874171824965
Epoch: 55, step: 15, loss: 0.3318292200565338, mean loss: 0.34108730063336107
Epoch: 55, step: 16, loss: 0.32322627305984497, mean loss: 0.3410870757881684
Epoch: 55, step: 17, loss: 0.34439313411712646, mean loss: 0.34108711740626463
Epoch: 55, step: 18, loss: 0.34538719058036804, mean loss: 0.3410871715367695
Epoch: 55, step: 19, loss: 0.3471226394176483, mean loss: 0.3410872475119442
Epoch: 55, step: 20, loss: 0.31356295943260193, mean loss: 0.341086901037352
Epoch: 55, step: 21, loss: 0.34301361441612244, mean loss: 0.3410869252904345
Epoch: 55, step: 22, loss: 0.3273088335990906, mean loss: 0.34108675185675635
Epoch: 55, step: 23, loss: 0.3282914459705353, mean loss: 0.34108659079606096
Epoch: 55, step: 24, loss: 0.3595743477344513, mean loss: 0.341086823507458
Epoch: 55, step: 25, loss: 0.32065510749816895, mean loss: 0.34108656633005435
Epoch: 55, step: 26, loss: 0.32531535625457764, mean loss: 0.34108636781771184
Epoch: 55, step: 27, loss: 0.3455944359302521, mean loss: 0.34108642456008564
Epoch: 55, step: 28, loss: 0.32574838399887085, mean loss: 0.34108623150491113
Epoch: 55, step: 29, loss: 0.32092052698135376, mean loss: 0.3410859776886176
Epoch: 55, step: 30, loss: 0.31581249833106995, mean loss: 0.3410856595871543
Epoch: 55, step: 31, loss: 0.3373943269252777, mean loss: 0.34108561312724567
Epoch: 55, step: 32, loss: 0.3386741280555725, mean loss: 0.3410855827761567
Epoch: 55, step: 33, loss: 0.32661348581314087, mean loss: 0.3410854006318095
Epoch: 55, step: 34, loss: 0.3810141384601593, mean loss: 0.3410859031645365
Epoch: 55, step: 35, loss: 0.3092040419578552, mean loss: 0.3410855019127593
Epoch: 55, step: 36, loss: 0.34853339195251465, mean loss: 0.3410855956476101
Epoch: 55, step: 37, loss: 0.3427340090274811, mean loss: 0.34108561639332957
Epoch: 55, step: 38, loss: 0.2981005012989044, mean loss: 0.341085075421066
Epoch: 55, step: 39, loss: 0.33133065700531006, mean loss: 0.3410849526622135
Epoch: 55, step: 40, loss: 0.3897247612476349, mean loss: 0.3410855647839913
Epoch: 55, step: 41, loss: 0.30836221575737, mean loss: 0.34108515297269754
Epoch: 55, step: 42, loss: 0.32189130783081055, mean loss: 0.34108491142826625
Epoch: 55, step: 43, loss: 0.29764068126678467, mean loss: 0.3410843647123929
Epoch: 55, step: 44, loss: 0.329077810049057, mean loss: 0.34108421362002944
Epoch: 55, step: 45, loss: 0.3521527647972107, mean loss: 0.3410843529066574
Epoch: 55, step: 46, loss: 0.3445565104484558, mean loss: 0.3410843965997318
Epoch: 55, step: 47, loss: 0.34520745277404785, mean loss: 0.3410844484829574
Epoch: 55, step: 48, loss: 0.34312888979911804, mean loss: 0.341084474209232
Epoch: 55, step: 49, loss: 0.3088493347167969, mean loss: 0.3410840685827126
Epoch: 55, step: 50, loss: 0.3315941095352173, mean loss: 0.3410839491685987
Epoch: 55, step: 51, loss: 0.32604047656059265, mean loss: 0.341083759875859
Epoch: 55, step: 52, loss: 0.3222901225090027, mean loss: 0.3410835233975913
Epoch: 55, step: 53, loss: 0.32954975962638855, mean loss: 0.34108337827133905
Epoch: 55, step: 54, loss: 0.4198639392852783, mean loss: 0.34108436953350973
Epoch: 55, step: 55, loss: 0.3625241219997406, mean loss: 0.3410846392973688
Epoch: 55, step: 56, loss: 0.3195981979370117, mean loss: 0.3410843689494523
Epoch: 55, step: 57, loss: 0.34755080938339233, mean loss: 0.3410844503108408
Epoch: 55, step: 58, loss: 0.37422704696655273, mean loss: 0.3410848673089995
Epoch: 55, step: 59, loss: 0.31137967109680176, mean loss: 0.341084493564709
Epoch: 55, step: 60, loss: 0.3214700222015381, mean loss: 0.34108424678281946
Epoch: 55, step: 61, loss: 0.3154870271682739, mean loss: 0.34108392473229715
Epoch: 55, step: 62, loss: 0.31417572498321533, mean loss: 0.34108358619198353
Epoch: 55, step: 63, loss: 0.32611480355262756, mean loss: 0.3410833978675077
Epoch: 55, step: 64, loss: 0.3030996024608612, mean loss: 0.3410829199937528
Epoch: 55, step: 65, loss: 0.3265567123889923, mean loss: 0.3410827372419776
Epoch: 55, step: 66, loss: 0.31311556696891785, mean loss: 0.3410823853961377
Epoch: 55, step: 67, loss: 0.3272172510623932, mean loss: 0.34108221096560315
Epoch: 55, step: 68, loss: 0.32793107628822327, mean loss: 0.34108204551963356
Epoch: 55, step: 69, loss: 0.31290048360824585, mean loss: 0.34108169098998314
Epoch: 55, step: 70, loss: 0.371201753616333, mean loss: 0.34108206990159107
Epoch: 55, step: 71, loss: 0.36293354630470276, mean loss: 0.34108234479059124
Epoch: 55, step: 72, loss: 0.3495614528656006, mean loss: 0.3410824514554306
Epoch: 55, step: 73, loss: 0.3099069893360138, mean loss: 0.34108205928165497
Epoch: 55, step: 74, loss: 0.3512877821922302, mean loss: 0.3410821876636024
Epoch: 55, step: 75, loss: 0.3165808916091919, mean loss: 0.34108187945569185
Epoch: 55, step: 76, loss: 0.3334643840789795, mean loss: 0.34108178363452407
Epoch: 55, step: 77, loss: 0.33839574456214905, mean loss: 0.34108174984701906
Epoch: 55, step: 78, loss: 0.36705243587493896, mean loss: 0.3410820765264242
Epoch: 55, step: 79, loss: 0.3438418507575989, mean loss: 0.3410821112405655
Epoch: 55, step: 80, loss: 0.2777363657951355, mean loss: 0.3410813144487585
Epoch: 55, step: 81, loss: 0.34100478887557983, mean loss: 0.3410813134861969
Epoch: 55, step: 82, loss: 0.37231242656707764, mean loss: 0.34108170631556284
Epoch: 55, step: 83, loss: 0.330507755279541, mean loss: 0.3410815733165812
Epoch: 55, step: 84, loss: 0.3260282874107361, mean loss: 0.34108138397898097
Epoch: 55, step: 85, loss: 0.30234038829803467, mean loss: 0.3410808967076344
Epoch: 55, step: 86, loss: 0.33116400241851807, mean loss: 0.34108077197780823
Epoch: 55, step: 87, loss: 0.3579612672328949, mean loss: 0.34108098428971717
Epoch: 55, step: 88, loss: 0.372102826833725, mean loss: 0.34108137445740316
Epoch: 55, step: 89, loss: 0.30268800258636475, mean loss: 0.3410808915826469
Epoch: 55, step: 90, loss: 0.3335520029067993, mean loss: 0.3410807968927464
Epoch: 55, step: 91, loss: 0.3185339868068695, mean loss: 0.3410805133278746
Epoch: 55, step: 92, loss: 0.32403215765953064, mean loss: 0.3410802989182099
Epoch: 55, step: 93, loss: 0.347293496131897, mean loss: 0.34108037705787353
Epoch: 55, step: 94, loss: 0.3367604613304138, mean loss: 0.34108032272956157
Epoch: 55, step: 95, loss: 0.317790150642395, mean loss: 0.3410800298303704
Epoch: 55, step: 96, loss: 0.2985162138938904, mean loss: 0.3410794945509215
Epoch: 55, step: 97, loss: 0.31329017877578735, mean loss: 0.3410791450789054
Epoch: 55, step: 98, loss: 0.33668237924575806, mean loss: 0.3410790897868892
Epoch: 55, step: 99, loss: 0.30534303188323975, mean loss: 0.3410786403897828
Epoch: 55, step: 100, loss: 0.3068285584449768, mean loss: 0.3410782096849131
Epoch: 55, step: 101, loss: 0.30381160974502563, mean loss: 0.3410777410523342
Epoch: 55, step: 102, loss: 0.30962857604026794, mean loss: 0.3410773455797663
Epoch: 55, step: 103, loss: 0.28926077485084534, mean loss: 0.34107669399570706
Epoch: 55, step: 104, loss: 0.3398139774799347, mean loss: 0.3410766781174736
Epoch: 55, step: 105, loss: 0.3259819746017456, mean loss: 0.34107648830906484
Epoch: 55, step: 106, loss: 0.33616065979003906, mean loss: 0.34107642649573705
Epoch: 55, step: 107, loss: 0.33556702733039856, mean loss: 0.3410763572195178
Epoch: 55, step: 108, loss: 0.32029902935028076, mean loss: 0.34107609596478217
Epoch: 55, step: 109, loss: 0.2993946075439453, mean loss: 0.341075571867103
Epoch: 55, step: 110, loss: 0.2987406551837921, mean loss: 0.3410750395599941
Epoch: 55, step: 111, loss: 0.3312297463417053, mean loss: 0.3410749157696554
Epoch: 55, step: 112, loss: 0.30504128336906433, mean loss: 0.34107446270448244
Epoch: 55, step: 113, loss: 0.3200501501560211, mean loss: 0.34107419836077346
Epoch: 55, step: 114, loss: 0.30383116006851196, mean loss: 0.3410737301010351
Epoch: 55, step: 115, loss: 0.3098263740539551, mean loss: 0.34107333723043504
Epoch: 55, step: 116, loss: 0.34630265831947327, mean loss: 0.3410734029774595
Epoch: 55, step: 117, loss: 0.31997793912887573, mean loss: 0.3410731377524872
Epoch: 55, step: 118, loss: 0.30791476368904114, mean loss: 0.34107272087052914
Epoch: 55, step: 119, loss: 0.34803834557533264, mean loss: 0.34107280844438764
Epoch: 55, step: 120, loss: 0.32049280405044556, mean loss: 0.3410725497098433
Epoch: 55, step: 121, loss: 0.29590922594070435, mean loss: 0.34107198191768606
Epoch: 55, step: 122, loss: 0.33647581934928894, mean loss: 0.34107192413557363
Epoch: 55, step: 123, loss: 0.33046892285346985, mean loss: 0.34107179083826294
Epoch: 55, step: 124, loss: 0.33832859992980957, mean loss: 0.3410717563522373
Epoch: 55, step: 125, loss: 0.35821446776390076, mean loss: 0.3410719718591316
Epoch: 55, step: 126, loss: 0.34142616391181946, mean loss: 0.34107197631174513
Epoch: 55, step: 127, loss: 0.3355681300163269, mean loss: 0.3410719071227486
Epoch: 55, step: 128, loss: 0.3453803062438965, mean loss: 0.3410719612830664
Epoch: 55, step: 129, loss: 0.3502591550350189, mean loss: 0.341072076772617
Epoch: 55, step: 130, loss: 0.2955077588558197, mean loss: 0.34107150400397906
Epoch: 55, step: 131, loss: 0.3260060250759125, mean loss: 0.34107131462497003
Epoch: 55, step: 132, loss: 0.31677258014678955, mean loss: 0.3410710091841384
Epoch: 55, step: 133, loss: 0.3305913209915161, mean loss: 0.34107087745363845
Epoch: 55, step: 134, loss: 0.30230122804641724, mean loss: 0.34107039012223994
Epoch: 55, step: 135, loss: 0.35162562131881714, mean loss: 0.34107052279898586
Epoch: 55, step: 136, loss: 0.36485493183135986, mean loss: 0.34107082175959313
Epoch: 55, step: 137, loss: 0.3184264898300171, mean loss: 0.34107053713288144
Epoch: 55, step: 138, loss: 0.32042694091796875, mean loss: 0.3410702776575711
Epoch: 55, step: 139, loss: 0.3472304940223694, mean loss: 0.34107035508613276
Epoch: 55, step: 140, loss: 0.34066450595855713, mean loss: 0.34107034998502633
Epoch: 55, step: 141, loss: 0.3745049238204956, mean loss: 0.34107077021797466
Epoch: 55, step: 142, loss: 0.3210015594959259, mean loss: 0.3410705179749632
Epoch: 55, step: 143, loss: 0.30537405610084534, mean loss: 0.3410700693240422
Epoch: 55, step: 144, loss: 0.30969905853271484, mean loss: 0.34106967504250146
Epoch: 55, step: 145, loss: 0.3408617377281189, mean loss: 0.34106967242910735
Epoch: 55, step: 146, loss: 0.34937745332717896, mean loss: 0.34106977684150064
Epoch: 55, step: 147, loss: 0.3628885746002197, mean loss: 0.3410700510572376
Epoch: 55, step: 148, loss: 0.30394643545150757, mean loss: 0.3410695844984571
Epoch: 55, step: 149, loss: 0.34648433327674866, mean loss: 0.3410696525485863
Epoch: 55, step: 150, loss: 0.3055516481399536, mean loss: 0.341069206179879
Epoch: 55, step: 151, loss: 0.34706199169158936, mean loss: 0.34106928149262106
Epoch: 55, step: 152, loss: 0.331438809633255, mean loss: 0.34106916046574187
Epoch: 55, step: 153, loss: 0.40410125255584717, mean loss: 0.34106995258492767
Epoch: 55, step: 154, loss: 0.36036473512649536, mean loss: 0.3410701950578468
Epoch: 55, step: 155, loss: 0.34963494539260864, mean loss: 0.34107030268766403
Epoch: 55, step: 156, loss: 0.3096161186695099, mean loss: 0.34106990742038806
Epoch: 55, step: 157, loss: 0.308287113904953, mean loss: 0.3410694954623907
Epoch: 55, step: 158, loss: 0.349838525056839, mean loss: 0.34106960565515
Epoch: 55, step: 159, loss: 0.4000277519226074, mean loss: 0.3410703465215268
Epoch: 55, step: 160, loss: 0.3296356797218323, mean loss: 0.34107020283563694
Epoch: 55, step: 161, loss: 0.3166640102863312, mean loss: 0.34106989615582806
Epoch: 55, step: 162, loss: 0.32638970017433167, mean loss: 0.34106971169185984
Epoch: 55, step: 163, loss: 0.3019774854183197, mean loss: 0.34106922048475447
Epoch: 55, step: 164, loss: 0.31454187631607056, mean loss: 0.34106888716385014
Epoch: 55, step: 165, loss: 0.3403399586677551, mean loss: 0.3410688780048461
Epoch: 55, step: 166, loss: 0.3144848942756653, mean loss: 0.34106854398064956
Epoch: 55, step: 167, loss: 0.31491073966026306, mean loss: 0.3410682153154699
Epoch: 55, step: 168, loss: 0.3511148691177368, mean loss: 0.3410683415471577
Epoch: 55, step: 169, loss: 0.3309778869152069, mean loss: 0.3410682147667251
Epoch: 55, step: 170, loss: 0.33483532071113586, mean loss: 0.34106813645518164
Epoch: 55, step: 171, loss: 0.28998517990112305, mean loss: 0.34106749464499275
Epoch: 55, step: 172, loss: 0.297072172164917, mean loss: 0.34106694189132747
Epoch: 55, step: 173, loss: 0.3242264986038208, mean loss: 0.3410667303120214
Epoch: 55, step: 174, loss: 0.34548476338386536, mean loss: 0.341066785818436
Epoch: 55, step: 175, loss: 0.32095247507095337, mean loss: 0.3410665331133912
Epoch: 55, step: 176, loss: 0.3503073453903198, mean loss: 0.3410666492083731
Epoch: 55, step: 177, loss: 0.3420538008213043, mean loss: 0.34106666161008686
Epoch: 55, step: 178, loss: 0.3287554681301117, mean loss: 0.34106650694490914
Epoch: 55, step: 179, loss: 0.322568416595459, mean loss: 0.3410662745568394
Epoch: 55, step: 180, loss: 0.3192531168460846, mean loss: 0.3410660005256374
Epoch: 55, step: 181, loss: 0.3217517137527466, mean loss: 0.34106575788994015
Epoch: 55, step: 182, loss: 0.3476116955280304, mean loss: 0.3410658401222384
Epoch: 55, step: 183, loss: 0.32443517446517944, mean loss: 0.34106563120477623
Epoch: 55, step: 184, loss: 0.34616774320602417, mean loss: 0.34106569529763475
Epoch: 55, step: 185, loss: 0.31401240825653076, mean loss: 0.34106535545783573
Epoch: 55, step: 186, loss: 0.30828559398651123, mean loss: 0.341064943687998
Epoch: 55, step: 187, loss: 0.32971417903900146, mean loss: 0.34106480110478216
Epoch: 55, step: 188, loss: 0.321537047624588, mean loss: 0.34106455580898043
Epoch: 55, step: 189, loss: 0.3554464876651764, mean loss: 0.34106473646382096
Epoch: 55, step: 190, loss: 0.3592652380466461, mean loss: 0.3410649650817454
Epoch: 55, step: 191, loss: 0.30110689997673035, mean loss: 0.3410644631716677
Epoch: 55, step: 192, loss: 0.33521708846092224, mean loss: 0.3410643897241816
Epoch: 55, step: 193, loss: 0.314323753118515, mean loss: 0.34106405384560995
Epoch: 55, step: 194, loss: 0.35466521978378296, mean loss: 0.34106422468233594
Epoch: 55, step: 195, loss: 0.32321733236312866, mean loss: 0.3410640005202037
Epoch: 55, step: 196, loss: 0.3184913396835327, mean loss: 0.34106371700461235
Epoch: 55, step: 197, loss: 0.3287699520587921, mean loss: 0.3410635625952458
Epoch: 55, step: 198, loss: 0.2988365590572357, mean loss: 0.34106303223184586
Epoch: 55, step: 199, loss: 0.29858076572418213, mean loss: 0.34106249866909144
Epoch: 55, step: 200, loss: 0.31527695059776306, mean loss: 0.34106217481548406
Epoch: 55, step: 201, loss: 0.3384416103363037, mean loss: 0.34106214190291617
Epoch: 55, step: 202, loss: 0.3185710906982422, mean loss: 0.34106185943363965
Epoch: 55, step: 203, loss: 0.34124135971069336, mean loss: 0.3410618616879886
Epoch: 55, step: 204, loss: 0.3203077018260956, mean loss: 0.3410616010391991
Epoch: 55, step: 205, loss: 0.32083600759506226, mean loss: 0.3410613470317964
Epoch: 55, step: 206, loss: 0.4365723133087158, mean loss: 0.34106254651144874
Epoch: 55, step: 207, loss: 0.3623090088367462, mean loss: 0.3410628133329478
Epoch: 55, step: 208, loss: 0.30985352396965027, mean loss: 0.3410624213992382
Epoch: 55, step: 209, loss: 0.2928309142589569, mean loss: 0.34106181570405875
Epoch: 55, step: 210, loss: 0.32752886414527893, mean loss: 0.3410616457582894
Epoch: 55, step: 211, loss: 0.2852671146392822, mean loss: 0.34106094510363905
Epoch: 55, step: 212, loss: 0.29569554328918457, mean loss: 0.34106037542270506
Epoch: 55, step: 213, loss: 0.31643983721733093, mean loss: 0.3410600662515193
Epoch: 55, step: 214, loss: 0.3890669345855713, mean loss: 0.3410606690878141
Epoch: 55, step: 215, loss: 0.289958119392395, mean loss: 0.34106002738620056
Epoch: 55, step: 216, loss: 0.3496074378490448, mean loss: 0.34106013471583957
Epoch: 55, step: 217, loss: 0.33436325192451477, mean loss: 0.3410600506242904
Epoch: 55, step: 218, loss: 0.31755247712135315, mean loss: 0.34105975544763695
Epoch: 55, step: 219, loss: 0.3192547559738159, mean loss: 0.341059481653068
Epoch: 55, step: 220, loss: 0.3795712888240814, mean loss: 0.3410599652206672
Epoch: 55, step: 221, loss: 0.4000665545463562, mean loss: 0.3410607061185518
Epoch: 55, step: 222, loss: 0.33437207341194153, mean loss: 0.3410606221358703
Epoch: 55, step: 223, loss: 0.3762977719306946, mean loss: 0.3410610645690705
Epoch: 55, step: 224, loss: 0.3365393579006195, mean loss: 0.3410610077958058
Epoch: 55, step: 225, loss: 0.32539865374565125, mean loss: 0.3410608111462057
Epoch: 55, step: 226, loss: 0.3899240791797638, mean loss: 0.34106142464411565
Epoch: 55, step: 227, loss: 0.32875069975852966, mean loss: 0.34106127007997233
Epoch: 55, step: 228, loss: 0.3170267641544342, mean loss: 0.341060968324697
Epoch: 55, step: 229, loss: 0.32747629284858704, mean loss: 0.3410607977700771
Epoch: 55, step: 230, loss: 0.3190169334411621, mean loss: 0.34106052101442647
Epoch: 55, step: 231, loss: 0.3253425657749176, mean loss: 0.3410603236815881
Epoch: 55, step: 232, loss: 0.3362017273902893, mean loss: 0.34106026268455986
Epoch: 55, step: 233, loss: 0.3431645929813385, mean loss: 0.3410602891029481
Epoch: 55, step: 234, loss: 0.34645596146583557, mean loss: 0.34106035684097286
Epoch: 55, step: 235, loss: 0.3465132713317871, mean loss: 0.3410604252967639
Epoch: 55, step: 236, loss: 0.34386494755744934, mean loss: 0.3410604605042442
Epoch: 55, step: 237, loss: 0.34627220034599304, mean loss: 0.3410605259306903
Epoch: 55, step: 238, loss: 0.32480835914611816, mean loss: 0.3410603219089629
Epoch: 55, step: 239, loss: 0.3011963665485382, mean loss: 0.3410598214827093
Epoch: 55, step: 240, loss: 0.3699672222137451, mean loss: 0.34106018436292335
Epoch: 55, step: 241, loss: 0.3352793753147125, mean loss: 0.3410601117962159
Epoch: 55, step: 242, loss: 0.32218119502067566, mean loss: 0.34105987481145794
Epoch: 55, step: 243, loss: 0.30648812651634216, mean loss: 0.34105944084193224
Epoch: 55, step: 244, loss: 0.3652040958404541, mean loss: 0.34105974391925603
Epoch: 55, step: 245, loss: 0.2989172637462616, mean loss: 0.3410592149297226
Epoch: 55, step: 246, loss: 0.33603695034980774, mean loss: 0.34105915188900837
Epoch: 55, step: 247, loss: 0.33085179328918457, mean loss: 0.34105902376531255
Epoch: 55, step: 248, loss: 0.33203595876693726, mean loss: 0.3410589105083996
Epoch: 55, step: 249, loss: 0.33095934987068176, mean loss: 0.341058783740976
Epoch: 55, step: 250, loss: 0.3031672537326813, mean loss: 0.34105830814094573
Epoch: 55, step: 251, loss: 0.3447118401527405, mean loss: 0.34105835399811024
Epoch: 55, step: 252, loss: 0.34951251745224, mean loss: 0.3410584601088812
Epoch: 55, step: 253, loss: 0.36643287539482117, mean loss: 0.34105877858687006
Epoch: 55, step: 254, loss: 0.3422575294971466, mean loss: 0.34105879363237884
Epoch: 55, step: 255, loss: 0.34771662950515747, mean loss: 0.34105887719375083
Epoch: 55, step: 256, loss: 0.355608731508255, mean loss: 0.3410590598042195
Epoch: 55, step: 257, loss: 0.3422553241252899, mean loss: 0.34105907481795383
Epoch: 55, step: 258, loss: 0.3215923309326172, mean loss: 0.3410588305033429
Epoch: 55, step: 259, loss: 0.3458132743835449, mean loss: 0.3410588901725683
Epoch: 55, step: 260, loss: 0.3448147773742676, mean loss: 0.3410589373091153
Epoch: 55, step: 261, loss: 0.36303630471229553, mean loss: 0.3410592131225663
Epoch: 55, step: 262, loss: 0.3178861141204834, mean loss: 0.34105892230647
Epoch: 55, step: 263, loss: 0.3166590631008148, mean loss: 0.3410586160987093
Epoch: 55, step: 264, loss: 0.3450239896774292, mean loss: 0.34105866586182126
Epoch: 55, step: 265, loss: 0.33219343423843384, mean loss: 0.34105855460976164
Epoch: 55, step: 266, loss: 0.30903661251068115, mean loss: 0.34105815276326096
Epoch: 55, step: 267, loss: 0.3640233874320984, mean loss: 0.3410584409526329
Epoch: 55, step: 268, loss: 0.3536860942840576, mean loss: 0.3410585994143193
Epoch: 55, step: 269, loss: 0.3431262969970703, mean loss: 0.34105862536108283
Epoch: 55, step: 270, loss: 0.35321342945098877, mean loss: 0.34105877788525857
Epoch: 55, step: 271, loss: 0.3339952528476715, mean loss: 0.34105868924994964
Epoch: 55, step: 272, loss: 0.3204587399959564, mean loss: 0.3410584307586235
Epoch: 55, step: 273, loss: 0.3195340931415558, mean loss: 0.3410581606713194
Epoch: 55, step: 274, loss: 0.3005126118659973, mean loss: 0.34105765191231563
Epoch: 55, step: 275, loss: 0.3361220955848694, mean loss: 0.34105758998252833
Epoch: 55, step: 276, loss: 0.342777818441391, mean loss: 0.34105761156713577
Epoch: 55, step: 277, loss: 0.348111093044281, mean loss: 0.3410577000697516
Epoch: 55, step: 278, loss: 0.36084505915641785, mean loss: 0.3410579483458791
Epoch: 55, step: 279, loss: 0.3871351182460785, mean loss: 0.34105852647850016
Epoch: 55, step: 280, loss: 0.36062729358673096, mean loss: 0.3410587720057471
Epoch: 55, step: 281, loss: 0.3802671432495117, mean loss: 0.34105926394285335
Epoch: 55, step: 282, loss: 0.31926223635673523, mean loss: 0.34105899046472093
Epoch: 55, step: 283, loss: 0.34974563121795654, mean loss: 0.3410590994509795
Epoch: 55, step: 284, loss: 0.337103009223938, mean loss: 0.3410590498168257
Epoch: 55, step: 285, loss: 0.3558090925216675, mean loss: 0.3410592348724389
Epoch: 55, step: 286, loss: 0.3238762617111206, mean loss: 0.34105901929572463
Epoch: 55, step: 287, loss: 0.2979629933834076, mean loss: 0.34105847862194144
Epoch: 55, step: 288, loss: 0.3314831852912903, mean loss: 0.3410583584938087
Epoch: 55, step: 289, loss: 0.3448599874973297, mean loss: 0.3410584061870593
Epoch: 55, step: 290, loss: 0.3490159213542938, mean loss: 0.34105850601663323
Epoch: 55, step: 291, loss: 0.3412898778915405, mean loss: 0.341058508919231
Epoch: 55, step: 292, loss: 0.34162941575050354, mean loss: 0.3410585160812602
Epoch: 55, step: 293, loss: 0.3060860335826874, mean loss: 0.341058077356789
Epoch: 55, step: 294, loss: 0.30922505259513855, mean loss: 0.34105767802134695
Epoch: 55, step: 295, loss: 0.36181628704071045, mean loss: 0.34105793842840476
Epoch: 55, step: 296, loss: 0.4271402657032013, mean loss: 0.3410590182774617
Epoch: 55, step: 297, loss: 0.3290494680404663, mean loss: 0.341058867627041
Epoch: 55, step: 298, loss: 0.36024266481399536, mean loss: 0.34105910826976343
Epoch: 55, step: 299, loss: 0.32710176706314087, mean loss: 0.34105893319021996
Epoch: 55, step: 300, loss: 0.3448514938354492, mean loss: 0.34105898076313856
Epoch: 55, step: 301, loss: 0.316072016954422, mean loss: 0.3410586673369349
Epoch: 55, step: 302, loss: 0.3467162251472473, mean loss: 0.3410587383021245
Epoch: 55, step: 303, loss: 0.31160828471183777, mean loss: 0.34105836889700697
Epoch: 55, step: 304, loss: 0.34387221932411194, mean loss: 0.341058404191462
Epoch: 55, step: 305, loss: 0.3394811451435089, mean loss: 0.34105838440796543
Epoch: 55, step: 306, loss: 0.3222973048686981, mean loss: 0.3410581490914536
Epoch: 55, step: 307, loss: 0.3413097560405731, mean loss: 0.34105815224727026
Epoch: 55, step: 308, loss: 0.30016547441482544, mean loss: 0.34105763935136246
Epoch: 55, step: 309, loss: 0.3156348466873169, mean loss: 0.3410573204902981
Epoch: 55, step: 310, loss: 0.3165353536605835, mean loss: 0.3410570129315464
Epoch: 55, step: 311, loss: 0.3314893841743469, mean loss: 0.3410568929341958
Epoch: 55, step: 312, loss: 0.3028993308544159, mean loss: 0.34105641436745326
Epoch: 55, step: 313, loss: 0.30300700664520264, mean loss: 0.3410559371631524
Epoch: 55, step: 314, loss: 0.37437114119529724, mean loss: 0.3410563549872451
Epoch: 55, step: 315, loss: 0.329026997089386, mean loss: 0.3410562041224175
Epoch: 55, step: 316, loss: 0.29766222834587097, mean loss: 0.3410556599086174
Epoch: 55, step: 317, loss: 0.32996559143066406, mean loss: 0.34105552082727003
Epoch: 55, step: 318, loss: 0.3099095821380615, mean loss: 0.3410551302287086
Epoch: 55, step: 319, loss: 0.3091132342815399, mean loss: 0.34105472965313866
Epoch: 55, step: 320, loss: 0.37890687584877014, mean loss: 0.34105520434177056
Epoch: 55, step: 321, loss: 0.3405616581439972, mean loss: 0.34105519815248264
Epoch: 55, step: 322, loss: 0.30885544419288635, mean loss: 0.34105479435836955
Epoch: 55, step: 323, loss: 0.2682681679725647, mean loss: 0.34105388160472805
Epoch: 55, step: 324, loss: 0.37295064330101013, mean loss: 0.34105428158919976
Epoch: 55, step: 325, loss: 0.3606358766555786, mean loss: 0.34105452713875795
Epoch: 55, step: 326, loss: 0.34298548102378845, mean loss: 0.3410545513522567
Epoch: 55, step: 327, loss: 0.37634187936782837, mean loss: 0.341054993837686
Epoch: 55, step: 328, loss: 0.297085165977478, mean loss: 0.3410544424849686
Epoch: 55, step: 329, loss: 0.31682270765304565, mean loss: 0.34105413863876377
Epoch: 55, step: 330, loss: 0.29239359498023987, mean loss: 0.3410535284828578
Epoch: 55, step: 331, loss: 0.3123069405555725, mean loss: 0.34105316803311453
Epoch: 55, step: 332, loss: 0.3090486526489258, mean loss: 0.34105276673767254
Epoch: 55, step: 333, loss: 0.3545173704624176, mean loss: 0.34105293556436117
Epoch: 55, step: 334, loss: 0.2902860641479492, mean loss: 0.3410522990290792
Epoch: 55, step: 335, loss: 0.3396221101284027, mean loss: 0.3410522810970252
Epoch: 55, step: 336, loss: 0.31954556703567505, mean loss: 0.3410520114440284
Epoch: 55, step: 337, loss: 0.2994028925895691, mean loss: 0.341051489250407
Epoch: 55, step: 338, loss: 0.3230491578578949, mean loss: 0.341051263541316
Epoch: 55, step: 339, loss: 0.32533591985702515, mean loss: 0.34105106650842126
Epoch: 55, step: 340, loss: 0.30223745107650757, mean loss: 0.3410505798844392
Epoch: 55, step: 341, loss: 0.32555195689201355, mean loss: 0.341050385573577
Epoch: 55, step: 342, loss: 0.33407363295555115, mean loss: 0.3410502981050437
Epoch: 55, step: 343, loss: 0.33126112818717957, mean loss: 0.34105017537837606
Epoch: 55, step: 344, loss: 0.3180568218231201, mean loss: 0.34104988711468204
Epoch: 55, step: 345, loss: 0.3711084723472595, mean loss: 0.34105026394923854
Epoch: 55, step: 346, loss: 0.41157180070877075, mean loss: 0.3410511480433722
Epoch: 55, step: 347, loss: 0.31618374586105347, mean loss: 0.34105083629677985
Epoch: 55, step: 348, loss: 0.30302295088768005, mean loss: 0.34105035957166846
Epoch: 55, step: 349, loss: 0.32826757431030273, mean loss: 0.34105019932614683
Epoch: 55, step: 350, loss: 0.3334046006202698, mean loss: 0.3410501034818086
Epoch: 55, step: 351, loss: 0.33964651823043823, mean loss: 0.3410500858868473
Epoch: 55, step: 352, loss: 0.33334919810295105, mean loss: 0.3410499893518319
Epoch: 55, step: 353, loss: 0.3307947814464569, mean loss: 0.34104986079857014
Epoch: 55, step: 354, loss: 0.3314615488052368, mean loss: 0.3410497406066304
Epoch: 55, step: 355, loss: 0.34227973222732544, mean loss: 0.3410497560246962
Epoch: 55, step: 356, loss: 0.3178504407405853, mean loss: 0.34104946522264445
Epoch: 55, step: 357, loss: 0.31872785091400146, mean loss: 0.34104918542602997
Epoch: 55, step: 358, loss: 0.3189425766468048, mean loss: 0.3410489083279367
Epoch: 55, step: 359, loss: 0.3283035457134247, mean loss: 0.341048748571574
Epoch: 55, step: 360, loss: 0.34209540486335754, mean loss: 0.34104876169069126
Epoch: 55, step: 361, loss: 0.38195714354515076, mean loss: 0.3410492744427137
Epoch: 55, step: 362, loss: 0.3419857919216156, mean loss: 0.34104928618102237
Epoch: 55, step: 363, loss: 0.33922410011291504, mean loss: 0.3410492633044297
Epoch: 55, step: 364, loss: 0.2809382379055023, mean loss: 0.3410485098918158
Epoch: 55, step: 365, loss: 0.3489813208580017, mean loss: 0.3410486093179177
Epoch: 55, step: 366, loss: 0.32109928131103516, mean loss: 0.34104835928560656
Epoch: 55, step: 367, loss: 0.3130568265914917, mean loss: 0.3410480084617647
Epoch: 55, step: 368, loss: 0.3135188817977905, mean loss: 0.3410476634376804
Epoch: 55, step: 369, loss: 0.3226237893104553, mean loss: 0.34104743253312936
Epoch: 55, step: 370, loss: 0.3186165690422058, mean loss: 0.34104715141290914
Epoch: 55, step: 371, loss: 0.3715622127056122, mean loss: 0.3410475338455
Epoch: 55, step: 372, loss: 0.31479611992836, mean loss: 0.3410472048515542
Epoch: 55, step: 373, loss: 0.3306504487991333, mean loss: 0.34104707455659405
Epoch: 55, step: 374, loss: 0.3156321048736572, mean loss: 0.34104675605330836
Epoch: 55, step: 375, loss: 0.3399908244609833, mean loss: 0.3410467428204196
Epoch: 55, step: 376, loss: 0.3153315782546997, mean loss: 0.34104642056313467
Epoch: 55, step: 377, loss: 0.3063948154449463, mean loss: 0.3410459863216108
Epoch: 55, step: 378, loss: 0.3638494312763214, mean loss: 0.3410462720826474
Epoch: 55, step: 379, loss: 0.32033640146255493, mean loss: 0.34104601256045913
Epoch: 55, step: 380, loss: 0.32814785838127136, mean loss: 0.3410458509314798
Epoch: 55, step: 381, loss: 0.3231322467327118, mean loss: 0.3410456264558501
Epoch: 55, step: 382, loss: 0.35004475712776184, mean loss: 0.34104573922267184
Epoch: 55, step: 383, loss: 0.3547663986682892, mean loss: 0.3410459111521421
Epoch: 55, step: 384, loss: 0.3558098375797272, mean loss: 0.34104609615216
Epoch: 55, step: 385, loss: 0.3388671576976776, mean loss: 0.34104606884921973
Epoch: 55, step: 386, loss: 0.35959842801094055, mean loss: 0.34104630131453184
Epoch: 55, step: 387, loss: 0.3223085105419159, mean loss: 0.3410460665286611
Epoch: 55, step: 388, loss: 0.3286338746547699, mean loss: 0.3410459110049498
Epoch: 55, step: 389, loss: 0.34181100130081177, mean loss: 0.3410459205913462
Epoch: 55, step: 390, loss: 0.3030669689178467, mean loss: 0.3410454447302284
Epoch: 55, step: 391, loss: 0.31461453437805176, mean loss: 0.3410451135656122
Epoch: 55, step: 392, loss: 0.35191264748573303, mean loss: 0.34104524972806594
Epoch: 55, step: 393, loss: 0.3206596374511719, mean loss: 0.3410449943140749
Epoch: 55, step: 394, loss: 0.30348101258277893, mean loss: 0.3410445236759526
Epoch: 55, step: 395, loss: 0.3365277647972107, mean loss: 0.3410444670863105
Epoch: 55, step: 396, loss: 0.3288165032863617, mean loss: 0.341044313886318
Epoch: 55, step: 397, loss: 0.3331059217453003, mean loss: 0.3410442144301535
Epoch: 55, step: 398, loss: 0.31704065203666687, mean loss: 0.3410439137052334
Epoch: 55, step: 399, loss: 0.30092790722846985, mean loss: 0.34104341112434544
Epoch: 55, step: 400, loss: 0.3696087896823883, mean loss: 0.341043768992307
Epoch: 55, step: 401, loss: 0.3492237627506256, mean loss: 0.34104387147024234
Epoch: 55, step: 402, loss: 0.318543016910553, mean loss: 0.3410435895858912
Epoch: 55, step: 403, loss: 0.3287613093852997, mean loss: 0.3410434357188813
Epoch: 55, step: 404, loss: 0.31498536467552185, mean loss: 0.3410431092789058
Epoch: 55, step: 405, loss: 0.32795006036758423, mean loss: 0.3410429452590512
Epoch: 55, step: 406, loss: 0.3368876278400421, mean loss: 0.34104289320501663
Epoch: 55, step: 407, loss: 0.30925318598747253, mean loss: 0.34104249497748723
Epoch: 55, step: 408, loss: 0.3013727366924286, mean loss: 0.34104199804331187
Epoch: 55, step: 409, loss: 0.3150325119495392, mean loss: 0.34104167223238746
Epoch: 55, step: 410, loss: 0.30064043402671814, mean loss: 0.3410411661478062
Epoch: 55, step: 411, loss: 0.372458279132843, mean loss: 0.34104155968815325
Epoch: 55, step: 412, loss: 0.3509703576564789, mean loss: 0.3410416840577494
Epoch: 55, step: 413, loss: 0.3558706045150757, mean loss: 0.34104186980468
Epoch: 55, step: 414, loss: 0.35829493403434753, mean loss: 0.3410420859137077
Epoch: 55, step: 415, loss: 0.35310447216033936, mean loss: 0.3410422370032694
Epoch: 55, step: 416, loss: 0.3390633463859558, mean loss: 0.34104221221663394
Epoch: 55, step: 417, loss: 0.3169529438018799, mean loss: 0.3410419104897819
Epoch: 55, step: 418, loss: 0.3278614580631256, mean loss: 0.34104174540188714
Epoch: 55, step: 419, loss: 0.3353433907032013, mean loss: 0.34104167402970903
Epoch: 55, step: 420, loss: 0.3457542359828949, mean loss: 0.34104173305404434
Epoch: 55, step: 421, loss: 0.3291136920452118, mean loss: 0.3410415836584755
Epoch: 55, step: 422, loss: 0.3681216835975647, mean loss: 0.3410419228253397
Epoch: 55, step: 423, loss: 0.3321096897125244, mean loss: 0.3410418109542772
Epoch: 55, step: 424, loss: 0.34407418966293335, mean loss: 0.34104184893259404
Epoch: 55, step: 425, loss: 0.32384833693504333, mean loss: 0.3410416335991772
Epoch: 55, step: 426, loss: 0.36587902903556824, mean loss: 0.34104194466152693
Epoch: 55, step: 427, loss: 0.34308359026908875, mean loss: 0.3410419702306784
Epoch: 55, step: 428, loss: 0.3396339416503906, mean loss: 0.3410419525970376
Epoch: 55, step: 429, loss: 0.35277897119522095, mean loss: 0.34104209958537324
Epoch: 55, step: 430, loss: 0.2979484796524048, mean loss: 0.34104155990997864
Epoch: 55, step: 431, loss: 0.3092152774333954, mean loss: 0.3410411613441008
Epoch: 55, step: 432, loss: 0.28830844163894653, mean loss: 0.3410405009716701
Epoch: 55, step: 433, loss: 0.32891541719436646, mean loss: 0.34104034913101366
Epoch: 55, step: 434, loss: 0.31964096426963806, mean loss: 0.3410400811529927
Epoch: 55, step: 435, loss: 0.32941779494285583, mean loss: 0.3410399356124421
Epoch: 55, step: 436, loss: 0.35176825523376465, mean loss: 0.34104006995657754
Epoch: 55, step: 437, loss: 0.32329362630844116, mean loss: 0.3410398477315826
Epoch: 55, step: 438, loss: 0.33336248993873596, mean loss: 0.34103975159516975
Epoch: 55, step: 439, loss: 0.3412104845046997, mean loss: 0.34103975373307244
Epoch: 55, step: 440, loss: 0.2895638942718506, mean loss: 0.34103910916489194
Epoch: 55, step: 441, loss: 0.3195776045322418, mean loss: 0.3410388404325207
Epoch: 55, step: 442, loss: 0.3447696566581726, mean loss: 0.3410388871477233
Epoch: 55, step: 443, loss: 0.3134233355522156, mean loss: 0.34103854136549855
Epoch: 55, step: 444, loss: 0.3697422444820404, mean loss: 0.3410389007682797
Epoch: 55, step: 445, loss: 0.3313208818435669, mean loss: 0.34103877908923075
Epoch: 55, step: 446, loss: 0.30297133326530457, mean loss: 0.34103830245375144
Epoch: 55, step: 447, loss: 0.29100003838539124, mean loss: 0.3410376759417057
Epoch: 55, step: 448, loss: 0.3526744544506073, mean loss: 0.34103782164001806
Epoch: 55, step: 449, loss: 0.3594071865081787, mean loss: 0.34103805163081397
Epoch: 55, step: 450, loss: 0.3341677784919739, mean loss: 0.34103796561369715
Epoch: 55, step: 451, loss: 0.3404849171638489, mean loss: 0.3410379586895128
Epoch: 55, step: 452, loss: 0.34539175033569336, mean loss: 0.3410380131984413
Epoch: 55, step: 453, loss: 0.32423850893974304, mean loss: 0.3410378028733761
Epoch: 55, step: 454, loss: 0.3285205364227295, mean loss: 0.341037646162685
Epoch: 55, step: 455, loss: 0.3664606213569641, mean loss: 0.3410379644432098
Epoch: 55, step: 456, loss: 0.3555009961128235, mean loss: 0.34103814550949507
Epoch: 55, step: 457, loss: 0.3176320493221283, mean loss: 0.34103785248643254
Epoch: 55, step: 458, loss: 0.36602261662483215, mean loss: 0.341038165269068
Epoch: 55, step: 459, loss: 0.3115389347076416, mean loss: 0.3410377959747445
Epoch: 55, step: 460, loss: 0.34023404121398926, mean loss: 0.3410377859128429
Epoch: 55, step: 461, loss: 0.3283289968967438, mean loss: 0.3410376268183158
Epoch: 55, step: 462, loss: 0.32408228516578674, mean loss: 0.3410374145661263
Epoch: 55, step: 463, loss: 0.34761402010917664, mean loss: 0.34103749689306967
Epoch: 55, step: 464, loss: 0.3383444845676422, mean loss: 0.3410374631819559
Epoch: 55, step: 465, loss: 0.3171067237854004, mean loss: 0.34103716362083886
Epoch: 55, step: 466, loss: 0.3240720331668854, mean loss: 0.3410369512567439
Epoch: 55, step: 467, loss: 0.3187066912651062, mean loss: 0.34103667173716656
Epoch: 55, step: 468, loss: 0.3687068819999695, mean loss: 0.34103701809536685
Epoch: 55, step: 469, loss: 0.3457023501396179, mean loss: 0.3410370764923132
Epoch: 55, step: 470, loss: 0.33670786023139954, mean loss: 0.34103702230327737
Epoch: 55, step: 471, loss: 0.3701377511024475, mean loss: 0.341037386554126
Epoch: 55, step: 472, loss: 0.3110722303390503, mean loss: 0.3410370114880224
Epoch: 55, step: 473, loss: 0.3189696967601776, mean loss: 0.3410367352806135
Epoch: 55, step: 474, loss: 0.32304203510284424, mean loss: 0.34103651005124774
Epoch: 55, step: 475, loss: 0.3527072072029114, mean loss: 0.34103665612485784
Epoch: 55, step: 476, loss: 0.31275057792663574, mean loss: 0.3410363020930644
Epoch: 55, step: 477, loss: 0.30044475197792053, mean loss: 0.34103579405093426
Epoch: 55, step: 478, loss: 0.3100926876068115, mean loss: 0.3410354067731655
Epoch: 55, step: 479, loss: 0.34199509024620056, mean loss: 0.3410354187842228
Epoch: 55, step: 480, loss: 0.3475598692893982, mean loss: 0.34103550044090425
Epoch: 55, step: 481, loss: 0.36774519085884094, mean loss: 0.34103583472152826
Epoch: 55, step: 482, loss: 0.3383985161781311, mean loss: 0.34103580171502607
Epoch: 55, step: 483, loss: 0.31682413816452026, mean loss: 0.3410354987056204
Epoch: 55, step: 484, loss: 0.3157980144023895, mean loss: 0.3410351828620023
Epoch: 55, step: 485, loss: 0.2920864522457123, mean loss: 0.34103457028308937
Epoch: 55, step: 486, loss: 0.334708034992218, mean loss: 0.3410344911093588
Epoch: 55, step: 487, loss: 0.3276712894439697, mean loss: 0.34103432387702076
Epoch: 55, step: 488, loss: 0.31462588906288147, mean loss: 0.34103399339566304
Epoch: 55, step: 489, loss: 0.373078852891922, mean loss: 0.3410343944075451
Epoch: 55, step: 490, loss: 0.3460628390312195, mean loss: 0.3410344573331076
Epoch: 55, step: 491, loss: 0.36529549956321716, mean loss: 0.34103476093009216
Epoch: 55, step: 492, loss: 0.30939027667045593, mean loss: 0.3410343649434034
Epoch: 55, step: 493, loss: 0.317496657371521, mean loss: 0.34103407040543043
Epoch: 55, step: 494, loss: 0.3470134735107422, mean loss: 0.34103414522746767
Epoch: 55, step: 495, loss: 0.3627628982067108, mean loss: 0.34103441712236954
Epoch: 55, step: 496, loss: 0.33656513690948486, mean loss: 0.3410343611983457
Epoch: 55, step: 497, loss: 0.32251283526420593, mean loss: 0.34103412944172096
Epoch: 55, step: 498, loss: 0.31514546275138855, mean loss: 0.3410338055054018
Epoch: 55, step: 499, loss: 0.3142872750759125, mean loss: 0.3410334708391051
Epoch: 55, step: 500, loss: 0.3559756278991699, mean loss: 0.34103365780069295
Epoch: 55, step: 501, loss: 0.329306960105896, mean loss: 0.34103351107391316
Epoch: 55, step: 502, loss: 0.30317673087120056, mean loss: 0.3410330374082574
Epoch: 55, step: 503, loss: 0.34552833437919617, mean loss: 0.34103309365290196
Epoch: 55, step: 504, loss: 0.34533610939979553, mean loss: 0.3410331474910721
Epoch: 55, step: 505, loss: 0.31903162598609924, mean loss: 0.3410328722174252
Epoch: 55, step: 506, loss: 0.3258717656135559, mean loss: 0.3410326825305033
Epoch: 55, step: 507, loss: 0.32916194200515747, mean loss: 0.3410325340125806
Epoch: 55, step: 508, loss: 0.31778374314308167, mean loss: 0.34103224314454933
Epoch: 55, step: 509, loss: 0.30780941247940063, mean loss: 0.34103182749547306
Epoch: 55, step: 510, loss: 0.3121880888938904, mean loss: 0.34103146663750056
Epoch: 55, step: 511, loss: 0.33699658513069153, mean loss: 0.34103141615857463
Epoch: 55, step: 512, loss: 0.30875566601753235, mean loss: 0.3410310123735279
Epoch: 55, step: 513, loss: 0.3681945502758026, mean loss: 0.34103135219810693
Epoch: 55, step: 514, loss: 0.3436145782470703, mean loss: 0.3410313845146898
Epoch: 55, step: 515, loss: 0.32177644968032837, mean loss: 0.34103114363530085
Epoch: 55, step: 516, loss: 0.3531615138053894, mean loss: 0.3410312953844304
Epoch: 55, step: 517, loss: 0.3554629385471344, mean loss: 0.3410314759198849
Epoch: 55, step: 518, loss: 0.40416911244392395, mean loss: 0.3410322657425813
Epoch: 55, step: 519, loss: 0.3403891324996948, mean loss: 0.3410322576973818
Epoch: 55, step: 520, loss: 0.32151028513908386, mean loss: 0.34103201349262385
Epoch: 55, step: 521, loss: 0.378752201795578, mean loss: 0.3410324853370649
Epoch: 55, step: 522, loss: 0.32398340106010437, mean loss: 0.34103227207155973
Epoch: 55, step: 523, loss: 0.3860585391521454, mean loss: 0.34103283529415407
Epoch: 55, step: 524, loss: 0.3353857100009918, mean loss: 0.34103276465652455
Epoch: 55, step: 525, loss: 0.3312617540359497, mean loss: 0.3410326424363932
Epoch: 55, step: 526, loss: 0.30114132165908813, mean loss: 0.3410321434643145
Epoch: 55, step: 527, loss: 0.3381092846393585, mean loss: 0.3410321069048155
Epoch: 55, step: 528, loss: 0.3050215244293213, mean loss: 0.3410316564853922
Epoch: 55, step: 529, loss: 0.30816343426704407, mean loss: 0.34103124537567087
Epoch: 55, step: 530, loss: 0.3341251611709595, mean loss: 0.3410311589967112
Epoch: 55, step: 531, loss: 0.32884860038757324, mean loss: 0.34103100662330454
Epoch: 55, step: 532, loss: 0.31812983751296997, mean loss: 0.34103072019041136
Epoch: 55, step: 533, loss: 0.3396933078765869, mean loss: 0.34103070346313924
Epoch: 55, step: 534, loss: 0.36510002613067627, mean loss: 0.34103100449900525
Epoch: 55, step: 535, loss: 0.3128717541694641, mean loss: 0.3410306523146748
Epoch: 55, step: 536, loss: 0.3206756114959717, mean loss: 0.34103039773983057
Epoch: 55, step: 537, loss: 0.3441227376461029, mean loss: 0.3410304364143835
Epoch: 55, step: 538, loss: 0.32871678471565247, mean loss: 0.3410302824148125
Epoch: 55, step: 539, loss: 0.34897640347480774, mean loss: 0.3410303817910138
Epoch: 55, step: 540, loss: 0.3501998484134674, mean loss: 0.3410304964652503
Epoch: 55, step: 541, loss: 0.3585014045238495, mean loss: 0.34103071495538384
Epoch: 55, step: 542, loss: 0.38466134667396545, mean loss: 0.34103126059063665
Epoch: 55, step: 543, loss: 0.3222714960575104, mean loss: 0.34103102598800883
Epoch: 55, step: 544, loss: 0.32323694229125977, mean loss: 0.3410308034646086
Epoch: 55, step: 545, loss: 0.35695967078208923, mean loss: 0.34103100266010816
Epoch: 55, step: 546, loss: 0.3212316930294037, mean loss: 0.34103075506660546
Epoch: 55, step: 547, loss: 0.32939350605010986, mean loss: 0.34103060954278325
Epoch: 55, step: 548, loss: 0.3478899896144867, mean loss: 0.3410306953182721
Epoch: 55, step: 549, loss: 0.33570876717567444, mean loss: 0.34103062876921447
Epoch: 55, step: 550, loss: 0.29033803939819336, mean loss: 0.34102999488206326
Epoch: 55, step: 551, loss: 0.2991701364517212, mean loss: 0.3410294714506319
Epoch: 55, step: 552, loss: 0.3458491563796997, mean loss: 0.34102953171703343
Epoch: 55, step: 553, loss: 0.36236006021499634, mean loss: 0.3410297984353231
Epoch: 55, step: 554, loss: 0.32936930656433105, mean loss: 0.3410296526336117
Epoch: 55, step: 555, loss: 0.32333463430404663, mean loss: 0.3410294313795063
Epoch: 55, step: 556, loss: 0.35649365186691284, mean loss: 0.3410296247378529
Epoch: 55, step: 557, loss: 0.3824978172779083, mean loss: 0.3410301432328458
Epoch: 55, step: 558, loss: 0.30325978994369507, mean loss: 0.3410296709794632
Epoch: 55, step: 559, loss: 0.3454515337944031, mean loss: 0.34102972626657013
Epoch: 55, step: 560, loss: 0.3720439076423645, mean loss: 0.34103011403593253
Epoch: 55, step: 561, loss: 0.38339322805404663, mean loss: 0.34103064369403085
Epoch: 55, step: 562, loss: 0.33232226967811584, mean loss: 0.34103053481621914
Epoch: 55, step: 563, loss: 0.3438480794429779, mean loss: 0.34103057004257226
Epoch: 55, step: 564, loss: 0.31468331813812256, mean loss: 0.3410302406401605
Epoch: 55, step: 565, loss: 0.30572590231895447, mean loss: 0.34102979925868976
Epoch: 55, step: 566, loss: 0.35730108618736267, mean loss: 0.3410300026828328
Epoch: 55, step: 567, loss: 0.3509814441204071, mean loss: 0.3410301270945125
Epoch: 55, step: 568, loss: 0.3300919830799103, mean loss: 0.3410299903489098
Epoch: 55, step: 569, loss: 0.35704928636550903, mean loss: 0.3410301906151433
Epoch: 55, step: 570, loss: 0.3352610468864441, mean loss: 0.3410301184927329
Epoch: 55, step: 571, loss: 0.2998138666152954, mean loss: 0.341029603238059
Epoch: 55, step: 572, loss: 0.299988329410553, mean loss: 0.3410290901772433
Epoch: 55, step: 573, loss: 0.30698075890541077, mean loss: 0.3410286645411797
Epoch: 55, step: 574, loss: 0.30423879623413086, mean loss: 0.34102820463908196
Epoch: 55, step: 575, loss: 0.3301689922809601, mean loss: 0.34102806889214016
Epoch: 55, step: 576, loss: 0.33158937096595764, mean loss: 0.3410279509039915
Epoch: 55, step: 577, loss: 0.3258053958415985, mean loss: 0.34102776061729606
Epoch: 55, step: 578, loss: 0.33730801939964294, mean loss: 0.34102771411994964
Epoch: 55, step: 579, loss: 0.3684905767440796, mean loss: 0.34102805740573244
Epoch: 55, step: 580, loss: 0.34145429730415344, mean loss: 0.3410280627336646
Epoch: 55, step: 581, loss: 0.3198353052139282, mean loss: 0.34102779783081816
Epoch: 55, step: 582, loss: 0.3684858977794647, mean loss: 0.34102814104419704
Epoch: 55, step: 583, loss: 0.31821954250335693, mean loss: 0.34102785595096996
Epoch: 55, step: 584, loss: 0.30795571208000183, mean loss: 0.34102744257500756
Epoch: 55, step: 585, loss: 0.3234599530696869, mean loss: 0.34102722299785704
Epoch: 55, step: 586, loss: 0.32150182127952576, mean loss: 0.3410269789516896
Epoch: 55, step: 587, loss: 0.3157826066017151, mean loss: 0.3410266634285875
Epoch: 55, step: 588, loss: 0.29176217317581177, mean loss: 0.34102604769172973
Epoch: 55, step: 589, loss: 0.3335127532482147, mean loss: 0.34102595378728723
Epoch: 55, step: 590, loss: 0.28660839796066284, mean loss: 0.3410252736613567
Epoch: 55, step: 591, loss: 0.316794753074646, mean loss: 0.3410249708252748
Epoch: 55, step: 592, loss: 0.337797075510025, mean loss: 0.3410249304831389
Epoch: 55, step: 593, loss: 0.38179850578308105, mean loss: 0.3410254400636536
Epoch: 55, step: 594, loss: 0.3654921352863312, mean loss: 0.34102574584001083
Epoch: 55, step: 595, loss: 0.38540327548980713, mean loss: 0.3410263004482098
Epoch: 55, step: 596, loss: 0.3205341100692749, mean loss: 0.3410260443502509
Epoch: 55, step: 597, loss: 0.33397209644317627, mean loss: 0.34102595619573683
Epoch: 55, step: 598, loss: 0.33159148693084717, mean loss: 0.341025838292873
Epoch: 55, step: 599, loss: 0.33135369420051575, mean loss: 0.34102571742128973
Epoch: 55, step: 600, loss: 0.32944273948669434, mean loss: 0.34102557267206224
Epoch: 55, step: 601, loss: 0.3234286904335022, mean loss: 0.3410253527715069
Epoch: 55, step: 602, loss: 0.34768179059028625, mean loss: 0.34102543595306495
Epoch: 55, step: 603, loss: 0.32176029682159424, mean loss: 0.3410251952110484
Epoch: 55, step: 604, loss: 0.36354056000709534, mean loss: 0.34102547656518517
Epoch: 55, step: 605, loss: 0.3338823914527893, mean loss: 0.34102538730563065
Epoch: 55, step: 606, loss: 0.3835880160331726, mean loss: 0.3410259191589892
Epoch: 55, step: 607, loss: 0.3011631369590759, mean loss: 0.3410254210485504
Epoch: 55, step: 608, loss: 0.3573361039161682, mean loss: 0.3410256248582052
Epoch: 55, step: 609, loss: 0.3196648061275482, mean loss: 0.3410253579480624
Epoch: 55, step: 610, loss: 0.303832083940506, mean loss: 0.3410248932122224
Epoch: 55, step: 611, loss: 0.389628142118454, mean loss: 0.34102550050991465
Epoch: 55, step: 612, loss: 0.3327155113220215, mean loss: 0.3410253966778805
Epoch: 55, step: 613, loss: 0.31614384055137634, mean loss: 0.341025085790556
Epoch: 55, step: 614, loss: 0.346542090177536, mean loss: 0.3410251547229529
Epoch: 55, step: 615, loss: 0.30508697032928467, mean loss: 0.3410247056977094
Epoch: 55, step: 616, loss: 0.30652308464050293, mean loss: 0.34102427462681645
Epoch: 55, step: 617, loss: 0.324298232793808, mean loss: 0.34102406565055726
Epoch: 55, step: 618, loss: 0.3390880227088928, mean loss: 0.3410240414618125
Epoch: 55, step: 619, loss: 0.33499976992607117, mean loss: 0.3410239661960512
Epoch: 55, step: 620, loss: 0.3070983290672302, mean loss: 0.34102354234281185
Epoch: 55, step: 621, loss: 0.3177773654460907, mean loss: 0.34102325191807364
Epoch: 55, step: 622, loss: 0.39545944333076477, mean loss: 0.34102393200491965
Epoch: 55, step: 623, loss: 0.39393386244773865, mean loss: 0.34102459301549437
Epoch: 55, step: 624, loss: 0.35652855038642883, mean loss: 0.3410247867060106
Epoch: 55, step: 625, loss: 0.3327063024044037, mean loss: 0.3410246827847116
Epoch: 55, step: 626, loss: 0.30256518721580505, mean loss: 0.34102420232328806
Epoch: 55, step: 627, loss: 0.3184086084365845, mean loss: 0.3410239197978797
Epoch: 55, step: 628, loss: 0.360324889421463, mean loss: 0.3410241609123174
Epoch: 55, step: 629, loss: 0.33639171719551086, mean loss: 0.3410241030429393
Epoch: 55, step: 630, loss: 0.30369332432746887, mean loss: 0.34102363670549546
Epoch: 55, step: 631, loss: 0.34711235761642456, mean loss: 0.3410237127650681
Epoch: 55, step: 632, loss: 0.33039477467536926, mean loss: 0.3410235799913046
Epoch: 55, step: 633, loss: 0.3322060704231262, mean loss: 0.34102346984678256
Epoch: 55, step: 634, loss: 0.31699615716934204, mean loss: 0.3410231697117169
Epoch: 55, step: 635, loss: 0.29391682147979736, mean loss: 0.3410225812942562
Epoch: 55, step: 636, loss: 0.31370118260383606, mean loss: 0.34102224001993053
Epoch: 55, step: 637, loss: 0.3335745632648468, mean loss: 0.34102214699141675
Epoch: 55, step: 638, loss: 0.32517746090888977, mean loss: 0.3410219490788013
Epoch: 55, step: 639, loss: 0.35421738028526306, mean loss: 0.3410221138980769
Epoch: 55, step: 640, loss: 0.31859833002090454, mean loss: 0.3410218338143423
Epoch: 55, step: 641, loss: 0.3265824615955353, mean loss: 0.34102165346196267
Epoch: 55, step: 642, loss: 0.3060053586959839, mean loss: 0.34102121610269853
Epoch: 55, step: 643, loss: 0.3235248327255249, mean loss: 0.3410209975727303
Epoch: 55, step: 644, loss: 0.36786267161369324, mean loss: 0.3410213328212664
Epoch: 55, step: 645, loss: 0.2900879681110382, mean loss: 0.34102069667902485
Epoch: 55, step: 646, loss: 0.32674330472946167, mean loss: 0.34102051836096686
Epoch: 55, step: 647, loss: 0.3133656084537506, mean loss: 0.3410201729681769
Epoch: 55, step: 648, loss: 0.31643927097320557, mean loss: 0.34101986597168643
Epoch: 55, step: 649, loss: 0.35554829239845276, mean loss: 0.34102004741825104
Epoch: 55, step: 650, loss: 0.39357343316078186, mean loss: 0.34102070375307564
Epoch: 55, step: 651, loss: 0.329045832157135, mean loss: 0.34102055420177685
Epoch: 55, step: 652, loss: 0.34773820638656616, mean loss: 0.3410206380958758
Epoch: 55, step: 653, loss: 0.31123942136764526, mean loss: 0.3410202661746938
Epoch: 55, step: 654, loss: 0.3063538670539856, mean loss: 0.3410198332505711
Epoch: 55, step: 655, loss: 0.3220955431461334, mean loss: 0.34101959692145745
Epoch: 55, step: 656, loss: 0.3243009150028229, mean loss: 0.3410193881388867
Epoch: 55, step: 657, loss: 0.3673913776874542, mean loss: 0.3410197174676605
Epoch: 55, step: 658, loss: 0.31523099541664124, mean loss: 0.3410193954266504
Epoch: 55, step: 659, loss: 0.3037475049495697, mean loss: 0.3410189299934526
Epoch: 55, step: 660, loss: 0.32180526852607727, mean loss: 0.3410186900656112
Epoch: 55, step: 661, loss: 0.3570832312107086, mean loss: 0.34101889066675933
Epoch: 55, step: 662, loss: 0.31912991404533386, mean loss: 0.34101861733813
Epoch: 55, step: 663, loss: 0.345844030380249, mean loss: 0.3410186775925259
Epoch: 55, step: 664, loss: 0.34344133734703064, mean loss: 0.34101870784363103
Epoch: 55, step: 665, loss: 0.3113124370574951, mean loss: 0.3410183369139956
Epoch: 55, step: 666, loss: 0.3477006256580353, mean loss: 0.3410184203518662
Epoch: 55, step: 667, loss: 0.3339567482471466, mean loss: 0.3410183321779562
Epoch: 55, step: 668, loss: 0.3135369122028351, mean loss: 0.3410179890419453
Epoch: 55, step: 669, loss: 0.31770598888397217, mean loss: 0.34101769796939996
Epoch: 55, step: 670, loss: 0.30661681294441223, mean loss: 0.341017268446919
Epoch: 55, step: 671, loss: 0.3345746099948883, mean loss: 0.3410171880061952
Epoch: 55, step: 672, loss: 0.33617204427719116, mean loss: 0.3410171275122228
Epoch: 55, step: 673, loss: 0.37573176622390747, mean loss: 0.34101756093593383
Epoch: 55, step: 674, loss: 0.3449973464012146, mean loss: 0.3410176106242473
Epoch: 55, step: 675, loss: 0.3546386957168579, mean loss: 0.34101778068373956
Epoch: 55, step: 676, loss: 0.3595944046974182, mean loss: 0.3410180126103287
Epoch: 55, step: 677, loss: 0.31080329418182373, mean loss: 0.34101763538844515
Epoch: 55, step: 678, loss: 0.28323376178741455, mean loss: 0.3410169139827647
Epoch: 55, step: 679, loss: 0.3076750934123993, mean loss: 0.3410164977303231
Epoch: 55, step: 680, loss: 0.32495811581611633, mean loss: 0.34101629725365096
Epoch: 55, step: 681, loss: 0.3595103919506073, mean loss: 0.34101652813546035
Epoch: 55, step: 682, loss: 0.32198697328567505, mean loss: 0.3410162905718878
Epoch: 55, step: 683, loss: 0.42422962188720703, mean loss: 0.3410173293880682
Epoch: 55, step: 684, loss: 0.33566176891326904, mean loss: 0.34101726253131176
Epoch: 55, step: 685, loss: 0.31716880202293396, mean loss: 0.34101696482002286
Epoch: 55, step: 686, loss: 0.34753313660621643, mean loss: 0.34101704616337347
Epoch: 55, step: 687, loss: 0.34417781233787537, mean loss: 0.34101708561968463
Epoch: 55, step: 688, loss: 0.32287079095840454, mean loss: 0.3410168590996349
Epoch: 55, step: 689, loss: 0.3175031542778015, mean loss: 0.3410165655819115
Epoch: 55, step: 690, loss: 0.358288437128067, mean loss: 0.34101678118116185
Epoch: 55, step: 691, loss: 0.35498109459877014, mean loss: 0.3410169554910457
Epoch: 55, step: 692, loss: 0.3337615728378296, mean loss: 0.3410168649266847
Epoch: 55, step: 693, loss: 0.33435148000717163, mean loss: 0.34101678172793143
Epoch: 55, step: 694, loss: 0.3239218294620514, mean loss: 0.3410165683477621
Epoch: 55, step: 695, loss: 0.3587772846221924, mean loss: 0.34101679003526864
Epoch: 55, step: 696, loss: 0.3409014344215393, mean loss: 0.3410167885954292
Epoch: 55, step: 697, loss: 0.353346049785614, mean loss: 0.34101694248420816
Epoch: 55, step: 698, loss: 0.32606467604637146, mean loss: 0.34101675585848346
Epoch: 55, step: 699, loss: 0.3180164396762848, mean loss: 0.3410164687851412
Epoch: 55, step: 700, loss: 0.31461936235427856, mean loss: 0.3410161393196274
Epoch: 55, step: 701, loss: 0.32722318172454834, mean loss: 0.34101596717018534
Epoch: 55, step: 702, loss: 0.31491225957870483, mean loss: 0.34101564137475093
Epoch: 55, step: 703, loss: 0.32739952206611633, mean loss: 0.3410154714366636
Epoch: 55, step: 704, loss: 0.3420661985874176, mean loss: 0.341015484550263
Epoch: 55, step: 705, loss: 0.34055185317993164, mean loss: 0.34101547876398425
Epoch: 55, step: 706, loss: 0.3211866021156311, mean loss: 0.34101523129588174
Epoch: 55, step: 707, loss: 0.337832510471344, mean loss: 0.34101519157542415
Epoch: 55, step: 708, loss: 0.3284507095813751, mean loss: 0.3410150347722444
Epoch: 55, step: 709, loss: 0.30321013927459717, mean loss: 0.34101456297771676
Epoch: 55, step: 710, loss: 0.3275739550590515, mean loss: 0.34101439524478044
Epoch: 55, step: 711, loss: 0.34843385219573975, mean loss: 0.3410144878352181
Epoch: 55, step: 712, loss: 0.3030671179294586, mean loss: 0.3410140142803792
Epoch: 55, step: 713, loss: 0.30746278166770935, mean loss: 0.3410135955912758
Epoch: 55, step: 714, loss: 0.31276997923851013, mean loss: 0.34101324314083153
Epoch: 55, step: 715, loss: 0.30699965357780457, mean loss: 0.34101281869252414
Epoch: 55, step: 716, loss: 0.34014177322387695, mean loss: 0.34101280782306975
Epoch: 55, step: 717, loss: 0.3460807204246521, mean loss: 0.3410128710628886
Epoch: 55, step: 718, loss: 0.34942564368247986, mean loss: 0.34101297604014835
Epoch: 55, step: 719, loss: 0.33667120337486267, mean loss: 0.3410129218628004
Epoch: 55, step: 720, loss: 0.3211899399757385, mean loss: 0.34101267451148354
Epoch: 55, step: 721, loss: 0.3481200635433197, mean loss: 0.34101276319643065
Epoch: 55, step: 722, loss: 0.3114769756793976, mean loss: 0.3410123946578494
Epoch: 55, step: 723, loss: 0.3323472738265991, mean loss: 0.3410122865384539
Epoch: 55, step: 724, loss: 0.34629544615745544, mean loss: 0.3410123524584691
Epoch: 55, step: 725, loss: 0.3596187233924866, mean loss: 0.3410125846144212
Epoch: 55, step: 726, loss: 0.3579404354095459, mean loss: 0.3410127958244577
Epoch: 55, step: 727, loss: 0.34354904294013977, mean loss: 0.34101282746900424
Epoch: 55, step: 728, loss: 0.3402969241142273, mean loss: 0.34101281853684845
Epoch: 55, step: 729, loss: 0.32394686341285706, mean loss: 0.34101260561164415
Epoch: 55, step: 730, loss: 0.3009733557701111, mean loss: 0.34101210606391746
Epoch: 55, step: 731, loss: 0.3124699294567108, mean loss: 0.341011749963301
Epoch: 55, step: 732, loss: 0.3549043536186218, mean loss: 0.34101192328936064
Epoch: 55, step: 733, loss: 0.31540095806121826, mean loss: 0.3410116037673751
Epoch: 55, step: 734, loss: 0.34285011887550354, mean loss: 0.3410116267043735
Epoch: 55, step: 735, loss: 0.3684654235839844, mean loss: 0.3410119692089506
Epoch: 55, step: 736, loss: 0.2848677337169647, mean loss: 0.3410112687805976
Epoch: 55, step: 737, loss: 0.3621864318847656, mean loss: 0.341011532948405
Epoch: 55, step: 738, loss: 0.28913643956184387, mean loss: 0.3410108857959532
Epoch: 55, step: 739, loss: 0.31939515471458435, mean loss: 0.3410106161386293
Epoch: 55, step: 740, loss: 0.3441872298717499, mean loss: 0.3410106557665498
Epoch: 55, step: 741, loss: 0.31229448318481445, mean loss: 0.3410102975398017
Epoch: 55, step: 742, loss: 0.41166311502456665, mean loss: 0.34101117890424026
Epoch: 55, step: 743, loss: 0.3557104766368866, mean loss: 0.341011362269563
Epoch: 55, step: 744, loss: 0.3277747631072998, mean loss: 0.3410111971526272
Epoch: 55, step: 745, loss: 0.3474862575531006, mean loss: 0.34101127792328306
Epoch: 55, step: 746, loss: 0.35927829146385193, mean loss: 0.3410115057852904
Epoch: 55, step: 747, loss: 0.28899145126342773, mean loss: 0.3410108568972737
Epoch: 55, step: 748, loss: 0.33468955755233765, mean loss: 0.34101077804760177
Epoch: 55, step: 749, loss: 0.3483351767063141, mean loss: 0.3410108694084432
Epoch: 55, step: 750, loss: 0.3305482864379883, mean loss: 0.34101073890510697
Epoch: 55, step: 751, loss: 0.336811363697052, mean loss: 0.34101068652553296
Epoch: 55, step: 752, loss: 0.33779993653297424, mean loss: 0.34101064647776136
Epoch: 55, step: 753, loss: 0.3302823305130005, mean loss: 0.3410105126648549
Epoch: 55, step: 754, loss: 0.3058894872665405, mean loss: 0.34101007461028177
Epoch: 55, step: 755, loss: 0.3538094162940979, mean loss: 0.3410102342508436
Epoch: 55, step: 756, loss: 0.3318364918231964, mean loss: 0.34101011983221446
Epoch: 55, step: 757, loss: 0.33961784839630127, mean loss: 0.3410101024674581
Epoch: 55, step: 758, loss: 0.3552015423774719, mean loss: 0.34101027946442625
Epoch: 55, step: 759, loss: 0.3638053834438324, mean loss: 0.34101056376355293
Epoch: 55, step: 760, loss: 0.31953611969947815, mean loss: 0.34101029593895527
Epoch: 55, step: 761, loss: 0.33141595125198364, mean loss: 0.34101017628186653
Epoch: 55, step: 762, loss: 0.33227747678756714, mean loss: 0.3410100673722536
Epoch: 55, step: 763, loss: 0.3633362650871277, mean loss: 0.34101034580931977
Epoch: 55, step: 764, loss: 0.323935329914093, mean loss: 0.341010132864057
Epoch: 55, step: 765, loss: 0.36423271894454956, mean loss: 0.34101042247304214
Epoch: 55, step: 766, loss: 0.3423529863357544, mean loss: 0.34101043921595386
Epoch: 55, step: 767, loss: 0.33833399415016174, mean loss: 0.3410104058388268
Epoch: 55, step: 768, loss: 0.3169030249118805, mean loss: 0.34101010520680836
Epoch: 55, step: 769, loss: 0.35016611218452454, mean loss: 0.3410102193857207
Epoch: 55, step: 770, loss: 0.32744982838630676, mean loss: 0.3410100502845622
Epoch: 55, step: 771, loss: 0.36775684356689453, mean loss: 0.3410103838189956
Epoch: 55, step: 772, loss: 0.3135790526866913, mean loss: 0.34101004175259164
Epoch: 55, step: 773, loss: 0.3447549343109131, mean loss: 0.3410100884505062
Epoch: 55, step: 774, loss: 0.30497920513153076, mean loss: 0.34100963915961124
Epoch: 55, step: 775, loss: 0.31350040435791016, mean loss: 0.3410092961345875
Epoch: 55, step: 776, loss: 0.3136521577835083, mean loss: 0.3410089550103765
Epoch: 55, step: 777, loss: 0.32422927021980286, mean loss: 0.34100874578215645
Epoch: 55, step: 778, loss: 0.28550755977630615, mean loss: 0.34100805373878923
Epoch: 55, step: 779, loss: 0.31175166368484497, mean loss: 0.3410076889458958
Epoch: 55, step: 780, loss: 0.33173108100891113, mean loss: 0.34100757327890985
Epoch: 55, step: 781, loss: 0.31269222497940063, mean loss: 0.3410072202285084
Epoch: 55, step: 782, loss: 0.318889856338501, mean loss: 0.34100694446121926
Epoch: 55, step: 783, loss: 0.3086484670639038, mean loss: 0.3410065410090548
Epoch: 55, step: 784, loss: 0.3503381013870239, mean loss: 0.34100665735542196
Epoch: 55, step: 785, loss: 0.3636329770088196, mean loss: 0.3410069394580035
Epoch: 55, step: 786, loss: 0.32813504338264465, mean loss: 0.34100677897455345
Epoch: 55, step: 787, loss: 0.3315926790237427, mean loss: 0.3410066616034689
Epoch: 55, step: 788, loss: 0.35735008120536804, mean loss: 0.3410068653638898
Epoch: 55, step: 789, loss: 0.3186419606208801, mean loss: 0.34100658653450766
Epoch: 55, step: 790, loss: 0.31439951062202454, mean loss: 0.34100625482095326
Epoch: 55, step: 791, loss: 0.31292611360549927, mean loss: 0.34100590474688436
Epoch: 55, step: 792, loss: 0.30239495635032654, mean loss: 0.34100542339163775
Epoch: 55, step: 793, loss: 0.332028329372406, mean loss: 0.34100531147733326
Epoch: 55, step: 794, loss: 0.3332764208316803, mean loss: 0.3410052151251467
Epoch: 55, step: 795, loss: 0.3341461420059204, mean loss: 0.3410051296176031
Epoch: 55, step: 796, loss: 0.3383680582046509, mean loss: 0.34100509674338175
Epoch: 55, step: 797, loss: 0.39313995838165283, mean loss: 0.34100574665813455
Epoch: 55, step: 798, loss: 0.3577311933040619, mean loss: 0.3410059551554562
Epoch: 55, step: 799, loss: 0.3184332251548767, mean loss: 0.3410056737701408
Epoch: 55, step: 800, loss: 0.3159383237361908, mean loss: 0.3410053612914877
Epoch: 55, step: 801, loss: 0.34095969796180725, mean loss: 0.3410053607222756
Epoch: 55, step: 802, loss: 0.31346678733825684, mean loss: 0.3410050174469882
Epoch: 55, step: 803, loss: 0.359113484621048, mean loss: 0.34100524317080116
Epoch: 55, step: 804, loss: 0.29823002219200134, mean loss: 0.34100470998013765
Epoch: 55, step: 805, loss: 0.3516952097415924, mean loss: 0.34100484323493985
Epoch: 55, step: 806, loss: 0.3695116639137268, mean loss: 0.34100519856195793
Epoch: 55, step: 807, loss: 0.3208131492137909, mean loss: 0.3410049468786385
Epoch: 55, step: 808, loss: 0.32089754939079285, mean loss: 0.34100469625358415
Epoch: 55, step: 809, loss: 0.3295444846153259, mean loss: 0.34100455341160935
Epoch: 55, step: 810, loss: 0.32553479075431824, mean loss: 0.34100436059633027
Epoch: 55, step: 811, loss: 0.3434576988220215, mean loss: 0.34100439117438175
Epoch: 55, step: 812, loss: 0.3183577358722687, mean loss: 0.3410041089132759
Epoch: 55, step: 813, loss: 0.32205477356910706, mean loss: 0.3410038727373986
Epoch: 55, step: 814, loss: 0.33910003304481506, mean loss: 0.3410038490091043
Epoch: 55, step: 815, loss: 0.34024742245674133, mean loss: 0.3410038395815836
Epoch: 55, step: 816, loss: 0.36125582456588745, mean loss: 0.3410040919836548
Epoch: 55, step: 817, loss: 0.30602920055389404, mean loss: 0.3410036560942828
Epoch: 55, step: 818, loss: 0.34429365396499634, mean loss: 0.34100369709676126
Epoch: 55, step: 819, loss: 0.3502047061920166, mean loss: 0.34100381176536915
Epoch: 55, step: 820, loss: 0.3177504539489746, mean loss: 0.34100352197140077
Epoch: 55, step: 821, loss: 0.317562073469162, mean loss: 0.34100322983700104
Epoch: 55, step: 822, loss: 0.3219471275806427, mean loss: 0.34100299235706816
Epoch: 55, step: 823, loss: 0.30374500155448914, mean loss: 0.3410025280483248
Epoch: 55, step: 824, loss: 0.31542909145355225, mean loss: 0.3410022093563615
Epoch: 55, step: 825, loss: 0.31021547317504883, mean loss: 0.3410018257018967
Epoch: 55, step: 826, loss: 0.32976552844047546, mean loss: 0.341001685680497
Epoch: 55, step: 827, loss: 0.32483795285224915, mean loss: 0.3410014842582456
Epoch: 55, step: 828, loss: 0.38875165581703186, mean loss: 0.3410020792833744
Epoch: 55, step: 829, loss: 0.33343735337257385, mean loss: 0.3410019850188771
Epoch: 55, step: 830, loss: 0.3493112027645111, mean loss: 0.341002088559241
Epoch: 55, step: 831, loss: 0.3162464499473572, mean loss: 0.3410017800854508
Epoch: 55, step: 832, loss: 0.3200884759426117, mean loss: 0.3410015194932718
Epoch: 55, step: 833, loss: 0.32359135150909424, mean loss: 0.34100130255495115
Epoch: 55, step: 834, loss: 0.38374948501586914, mean loss: 0.34100183520939586
Epoch: 55, step: 835, loss: 0.32986485958099365, mean loss: 0.34100169644125855
Epoch: 55, step: 836, loss: 0.29862478375434875, mean loss: 0.3410011684260987
Epoch: 55, step: 837, loss: 0.31481897830963135, mean loss: 0.3410008422007988
Epoch: 55, step: 838, loss: 0.29875633120536804, mean loss: 0.341000315848477
Epoch: 55, step: 839, loss: 0.3460030257701874, mean loss: 0.3410003781797743
Epoch: 55, step: 840, loss: 0.33838629722595215, mean loss: 0.3410003456100212
Epoch: 55, step: 841, loss: 0.3443666398525238, mean loss: 0.3410003875513414
Epoch: 55, step: 842, loss: 0.3378990888595581, mean loss: 0.3410003489121341
Epoch: 55, step: 843, loss: 0.29045569896698, mean loss: 0.34099971918211885
Epoch: 55, step: 844, loss: 0.3181707561016083, mean loss: 0.3409994347622213
Epoch: 55, step: 845, loss: 0.34663084149360657, mean loss: 0.34099950492152575
Epoch: 55, step: 846, loss: 0.33218640089035034, mean loss: 0.34099939512417404
Epoch: 55, step: 847, loss: 0.32616353034973145, mean loss: 0.34099921029504193
Epoch: 55, step: 848, loss: 0.3719647526741028, mean loss: 0.3409995960671629
Epoch: 55, step: 849, loss: 0.3140360414981842, mean loss: 0.3409992601564295
Epoch: 55, step: 850, loss: 0.3284754455089569, mean loss: 0.34099910413726137
Epoch: 55, step: 851, loss: 0.3362607955932617, mean loss: 0.34099904510910034
Epoch: 55, step: 852, loss: 0.3512154221534729, mean loss: 0.34099917237950317
Epoch: 55, step: 853, loss: 0.31513702869415283, mean loss: 0.34099885020615084
Epoch: 55, step: 854, loss: 0.3176525831222534, mean loss: 0.34099855937753565
Epoch: 55, step: 855, loss: 0.3470785915851593, mean loss: 0.34099863511663836
Epoch: 55, step: 856, loss: 0.297786146402359, mean loss: 0.34099809682436644
Epoch: 55, step: 857, loss: 0.29978659749031067, mean loss: 0.3409975834645501
Epoch: 55, step: 858, loss: 0.3888750374317169, mean loss: 0.3409981798528206
Epoch: 55, step: 859, loss: 0.32449451088905334, mean loss: 0.34099797427647577
Epoch: 55, step: 860, loss: 0.35611259937286377, mean loss: 0.3409981625479858
Epoch: 55, step: 861, loss: 0.3335403800010681, mean loss: 0.34099806965315826
Epoch: 55, step: 862, loss: 0.310160368680954, mean loss: 0.34099768554069393
Epoch: 55, step: 863, loss: 0.3050464689731598, mean loss: 0.34099723774017865
Epoch: 55, step: 864, loss: 0.3519097566604614, mean loss: 0.3409973736624421
Epoch: 55, step: 865, loss: 0.33704960346221924, mean loss: 0.34099732449110215
Epoch: 55, step: 866, loss: 0.33978256583213806, mean loss: 0.3409973093608985
Epoch: 55, step: 867, loss: 0.3533746004104614, mean loss: 0.34099746352205645
Epoch: 55, step: 868, loss: 0.4042791724205017, mean loss: 0.3409982516961388
Epoch: 55, step: 869, loss: 0.3134276568889618, mean loss: 0.3409979083084839
Epoch: 55, step: 870, loss: 0.3497048318386078, mean loss: 0.34099801675056995
Epoch: 55, step: 871, loss: 0.32588842511177063, mean loss: 0.3409978285675425
Epoch: 55, step: 872, loss: 0.35097596049308777, mean loss: 0.3409979528390472
Epoch: 55, step: 873, loss: 0.30984169244766235, mean loss: 0.3409975648117925
Epoch: 55, step: 874, loss: 0.31650739908218384, mean loss: 0.34099725980941714
Epoch: 55, step: 875, loss: 0.3083757162094116, mean loss: 0.3409968535433068
Epoch: 55, step: 876, loss: 0.31539395451545715, mean loss: 0.3409965346908088
Epoch: 55, step: 877, loss: 0.32618409395217896, mean loss: 0.34099635022244423
Epoch: 55, step: 878, loss: 0.325589656829834, mean loss: 0.3409961583558781
Epoch: 55, step: 879, loss: 0.33166006207466125, mean loss: 0.34099604209066914
Epoch: 55, step: 880, loss: 0.37416768074035645, mean loss: 0.34099645518189653
Epoch: 55, step: 881, loss: 0.3148241937160492, mean loss: 0.3409961292589872
Epoch: 55, step: 882, loss: 0.3519658148288727, mean loss: 0.3409962658626704
Epoch: 55, step: 883, loss: 0.3270019292831421, mean loss: 0.34099609159567773
Epoch: 55, step: 884, loss: 0.31806790828704834, mean loss: 0.3409958060819076
Epoch: 55, step: 885, loss: 0.29612118005752563, mean loss: 0.34099524728647485
Epoch: 55, step: 886, loss: 0.3539257049560547, mean loss: 0.34099540829930897
Epoch: 55, step: 887, loss: 0.33673399686813354, mean loss: 0.34099535523596
Epoch: 55, step: 888, loss: 0.3400615155696869, mean loss: 0.3409953436078776
Epoch: 55, step: 889, loss: 0.3509436845779419, mean loss: 0.340995467482127
Epoch: 55, step: 890, loss: 0.34657150506973267, mean loss: 0.3409955369126855
Epoch: 55, step: 891, loss: 0.3051632046699524, mean loss: 0.34099509074857254
Epoch: 55, step: 892, loss: 0.31585609912872314, mean loss: 0.3409947777358396
Epoch: 55, step: 893, loss: 0.2895941138267517, mean loss: 0.34099413773952625
Epoch: 55, step: 894, loss: 0.31747153401374817, mean loss: 0.3409938448601921
Epoch: 55, step: 895, loss: 0.3194243013858795, mean loss: 0.3409935763017047
Epoch: 55, step: 896, loss: 0.3498309552669525, mean loss: 0.34099368633294297
Epoch: 55, step: 897, loss: 0.3220252990722656, mean loss: 0.3409934501668624
Epoch: 55, step: 898, loss: 0.3300668001174927, mean loss: 0.34099331412619893
Epoch: 55, step: 899, loss: 0.3397424519062042, mean loss: 0.3409932985527151
Epoch: 55, step: 900, loss: 0.30201390385627747, mean loss: 0.34099281325752834
Epoch: 55, step: 901, loss: 0.3694199323654175, mean loss: 0.3409931671720114
Epoch: 55, step: 902, loss: 0.30593806505203247, mean loss: 0.3409927307453077
Epoch: 55, step: 903, loss: 0.3431623578071594, mean loss: 0.34099275775625165
Epoch: 55, step: 904, loss: 0.3149455487728119, mean loss: 0.34099243348349745
Epoch: 55, step: 905, loss: 0.3378415107727051, mean loss: 0.3409923942568123
Epoch: 55, step: 906, loss: 0.40092933177948, mean loss: 0.3409931404185951
Epoch: 55, step: 907, loss: 0.3258051574230194, mean loss: 0.3409929513440134
Epoch: 55, step: 908, loss: 0.35464656352996826, mean loss: 0.3409931213151594
Epoch: 55, step: 909, loss: 0.3592952489852905, mean loss: 0.34099334915192864
Epoch: 55, step: 910, loss: 0.3457000255584717, mean loss: 0.34099340774296333
Epoch: 55, step: 911, loss: 0.29011911153793335, mean loss: 0.34099277444245785
Epoch: 55, step: 912, loss: 0.3298802375793457, mean loss: 0.34099263611154945
Epoch: 55, step: 913, loss: 0.29597076773643494, mean loss: 0.3409920756780048
Epoch: 55, step: 914, loss: 0.30345022678375244, mean loss: 0.34099160836178033
Epoch: 55, step: 915, loss: 0.34962964057922363, mean loss: 0.3409917158855831
Epoch: 55, step: 916, loss: 0.3546972870826721, mean loss: 0.3409918864865664
Epoch: 55, step: 917, loss: 0.31306323409080505, mean loss: 0.34099153884718786
Epoch: 55, step: 918, loss: 0.3073418438434601, mean loss: 0.3409911200008616
Epoch: 55, step: 919, loss: 0.36594390869140625, mean loss: 0.3409914305907134
Epoch: 55, step: 920, loss: 0.31932076811790466, mean loss: 0.34099116085717174
Epoch: 55, step: 921, loss: 0.3088529706001282, mean loss: 0.3409907608398675
Epoch: 55, step: 922, loss: 0.38340359926223755, mean loss: 0.34099128873698886
Epoch: 55, step: 923, loss: 0.3796834349632263, mean loss: 0.34099177031801825
Epoch: 55, step: 924, loss: 0.3555662930011749, mean loss: 0.34099195171726754
Epoch: 55, step: 925, loss: 0.31945422291755676, mean loss: 0.34099168365502674
Epoch: 55, step: 926, loss: 0.31697526574134827, mean loss: 0.34099138474631935
Epoch: 55, step: 927, loss: 0.3687867224216461, mean loss: 0.3409917306832148
Epoch: 55, step: 928, loss: 0.34451383352279663, mean loss: 0.3409917745182699
Epoch: 55, step: 929, loss: 0.34449729323387146, mean loss: 0.34099181814638085
Epoch: 55, step: 930, loss: 0.3237084746360779, mean loss: 0.34099160304832965
Epoch: 55, step: 931, loss: 0.32754361629486084, mean loss: 0.3409914356848944
Epoch: 55, step: 932, loss: 0.339721143245697, mean loss: 0.3409914198759956
Epoch: 55, step: 933, loss: 0.33322617411613464, mean loss: 0.34099132323804654
Epoch: 55, step: 934, loss: 0.3701646029949188, mean loss: 0.3409916862929872
Epoch: 55, step: 935, loss: 0.32219433784484863, mean loss: 0.3409914523671018
Epoch: 55, step: 936, loss: 0.33055469393730164, mean loss: 0.3409913224872105
Epoch: 55, step: 937, loss: 0.3182964026927948, mean loss: 0.34099104006455444
Epoch: 55, step: 938, loss: 0.33494001626968384, mean loss: 0.3409909647646653
Epoch: 55, step: 939, loss: 0.3196527361869812, mean loss: 0.3409906992317064
Epoch: 55, step: 940, loss: 0.30997800827026367, mean loss: 0.3409903133145207
Epoch: 55, step: 941, loss: 0.33507755398750305, mean loss: 0.340990239737963
Epoch: 55, step: 942, loss: 0.3455440104007721, mean loss: 0.3409902964029788
Epoch: 55, step: 943, loss: 0.3496967852115631, mean loss: 0.3409904047411502
Epoch: 55, step: 944, loss: 0.32518893480300903, mean loss: 0.34099020811986064
Epoch: 55, step: 945, loss: 0.34062787890434265, mean loss: 0.3409902036113718
Epoch: 55, step: 946, loss: 0.2978830635547638, mean loss: 0.340989667232758
Epoch: 55, step: 947, loss: 0.3171570599079132, mean loss: 0.3409893706892665
Epoch: 55, step: 948, loss: 0.37756621837615967, mean loss: 0.3409898258006613
Epoch: 55, step: 949, loss: 0.34208858013153076, mean loss: 0.3409898394718611
Epoch: 55, step: 950, loss: 0.2882882356643677, mean loss: 0.3409891837427573
Epoch: 55, step: 951, loss: 0.3350312411785126, mean loss: 0.34098910961317774
Epoch: 55, step: 952, loss: 0.3404531478881836, mean loss: 0.3409891029447477
Epoch: 55, step: 953, loss: 0.37842872738838196, mean loss: 0.3409895687623559
Epoch: 55, step: 954, loss: 0.32798144221305847, mean loss: 0.3409894069194129
Epoch: 55, step: 955, loss: 0.32817888259887695, mean loss: 0.3409892475369564
Epoch: 55, step: 956, loss: 0.3709700107574463, mean loss: 0.34098962053872583
Epoch: 55, step: 957, loss: 0.34325066208839417, mean loss: 0.34098964866883047
Epoch: 55, step: 958, loss: 0.3150849938392639, mean loss: 0.3409893263874531
Epoch: 55, step: 959, loss: 0.3660711646080017, mean loss: 0.34098963842823715
Epoch: 55, step: 960, loss: 0.2852049469947815, mean loss: 0.34098894442478567
Epoch: 55, step: 961, loss: 0.3201602101325989, mean loss: 0.34098868530291393
Epoch: 55, step: 962, loss: 0.319050669670105, mean loss: 0.3409884123843163
Epoch: 55, step: 963, loss: 0.2855495512485504, mean loss: 0.3409877227089937
Epoch: 55, step: 964, loss: 0.34324508905410767, mean loss: 0.3409877507909287
Epoch: 55, step: 965, loss: 0.33293622732162476, mean loss: 0.340987650630161
Epoch: 55, step: 966, loss: 0.2939355969429016, mean loss: 0.3409870653109715
Epoch: 55, step: 967, loss: 0.3018747866153717, mean loss: 0.340986578767225
Epoch: 55, step: 968, loss: 0.2932068109512329, mean loss: 0.3409859844101884
Epoch: 55, step: 969, loss: 0.29926472902297974, mean loss: 0.34098546542455105
Epoch: 55, step: 970, loss: 0.3155282139778137, mean loss: 0.34098514875662245
Epoch: 55, step: 971, loss: 0.3159770965576172, mean loss: 0.34098483768024423
Epoch: 55, step: 972, loss: 0.33964619040489197, mean loss: 0.3409848210289528
Epoch: 55, step: 973, loss: 0.33044442534446716, mean loss: 0.3409846899197197
Epoch: 55, step: 974, loss: 0.3014492690563202, mean loss: 0.340984198155047
Epoch: 55, step: 975, loss: 0.39141520857810974, mean loss: 0.3409848254376285
Epoch: 55, step: 976, loss: 0.34183940291404724, mean loss: 0.3409848360670982
Epoch: 55, step: 977, loss: 0.3671000003814697, mean loss: 0.3409851608906549
Epoch: 55, step: 978, loss: 0.35246264934539795, mean loss: 0.340985303647262
Epoch: 55, step: 979, loss: 0.32641980051994324, mean loss: 0.34098512248428775
Epoch: 55, step: 980, loss: 0.3356108069419861, mean loss: 0.3409850556403985
Epoch: 55, step: 981, loss: 0.3618321120738983, mean loss: 0.3409853149256953
Epoch: 55, step: 982, loss: 0.34091028571128845, mean loss: 0.3409853139925309
Epoch: 55, step: 983, loss: 0.3141118884086609, mean loss: 0.3409849797625724
Epoch: 55, step: 984, loss: 0.3155301511287689, mean loss: 0.3409846631799142
Epoch: 55, step: 985, loss: 0.36586886644363403, mean loss: 0.34098497266183425
Epoch: 55, step: 986, loss: 0.3100890517234802, mean loss: 0.3409845884176647
Epoch: 55, step: 987, loss: 0.33386296033859253, mean loss: 0.34098449984901386
Epoch: 55, step: 988, loss: 0.37629273533821106, mean loss: 0.3409849389570178
Epoch: 55, step: 989, loss: 0.3233519196510315, mean loss: 0.34098471966813204
Epoch: 55, step: 990, loss: 0.316026896238327, mean loss: 0.3409844092899073
Epoch: 55, step: 991, loss: 0.297421395778656, mean loss: 0.3409838675422389
Epoch: 55, step: 992, loss: 0.3265463411808014, mean loss: 0.34098368800004597
Epoch: 55, step: 993, loss: 0.3680248558521271, mean loss: 0.3409840242744242
Epoch: 55, step: 994, loss: 0.36023661494255066, mean loss: 0.3409842636898401
Epoch: 55, step: 995, loss: 0.30409562587738037, mean loss: 0.340983804967225
Epoch: 55, step: 996, loss: 0.30995601415634155, mean loss: 0.34098341913101116
Epoch: 55, step: 997, loss: 0.28695565462112427, mean loss: 0.3409827472943016
Epoch: 55, step: 998, loss: 0.34900709986686707, mean loss: 0.3409828470761016
Epoch: 55, step: 999, loss: 0.29151850938796997, mean loss: 0.3409822320010247
Epoch: 55, step: 1000, loss: 0.3111191987991333, mean loss: 0.3409818606672536
Epoch: 55, step: 1001, loss: 0.33324679732322693, mean loss: 0.34098176448631623
Epoch: 55, step: 1002, loss: 0.3080289959907532, mean loss: 0.3409813547432266
Epoch: 55, step: 1003, loss: 0.3332405984401703, mean loss: 0.34098125849389427
Epoch: 55, step: 1004, loss: 0.33694037795066833, mean loss: 0.34098120824980915
Epoch: 55, step: 1005, loss: 0.3405841290950775, mean loss: 0.3409812033126103
Epoch: 55, step: 1006, loss: 0.3250979781150818, mean loss: 0.3409810058263781
Epoch: 55, step: 1007, loss: 0.32818207144737244, mean loss: 0.3409808466910722
Epoch: 55, step: 1008, loss: 0.32961559295654297, mean loss: 0.34098070538316416
Epoch: 55, step: 1009, loss: 0.29282012581825256, mean loss: 0.34098010659440914
Epoch: 55, step: 1010, loss: 0.31636956334114075, mean loss: 0.34097980061110356
Epoch: 55, step: 1011, loss: 0.3424678146839142, mean loss: 0.340979819111378
Epoch: 55, step: 1012, loss: 0.3333921432495117, mean loss: 0.34097972477601984
Epoch: 55, step: 1013, loss: 0.3357044756412506, mean loss: 0.34097965919120327
Epoch: 55, step: 1014, loss: 0.32892873883247375, mean loss: 0.34097950936935506
Epoch: 55, step: 1015, loss: 0.3313552737236023, mean loss: 0.3409793897185066
Epoch: 55, step: 1016, loss: 0.3120054602622986, mean loss: 0.34097902951201636
Epoch: 55, step: 1017, loss: 0.3754536211490631, mean loss: 0.3409794580979041
Epoch: 55, step: 1018, loss: 0.34937795996665955, mean loss: 0.34097956250623673
Epoch: 55, step: 1019, loss: 0.32348504662513733, mean loss: 0.3409793450209573
Epoch: 55, step: 1020, loss: 0.33546581864356995, mean loss: 0.34097927647971116
Epoch: 55, step: 1021, loss: 0.3003706634044647, mean loss: 0.34097877166117013
Epoch: 55, step: 1022, loss: 0.34252581000328064, mean loss: 0.34097879089265504
Epoch: 55, step: 1023, loss: 0.36039766669273376, mean loss: 0.3409790322888536
Epoch: 55, step: 1024, loss: 0.3569929003715515, mean loss: 0.34097923135489977
Epoch: 55, step: 1025, loss: 0.3382093608379364, mean loss: 0.3409791969234735
Epoch: 55, step: 1026, loss: 0.3269208073616028, mean loss: 0.3409790221700388
Epoch: 55, step: 1027, loss: 0.33741268515586853, mean loss: 0.3409789778390795
Epoch: 55, step: 1028, loss: 0.31642743945121765, mean loss: 0.3409786726576802
Epoch: 55, step: 1029, loss: 0.32437825202941895, mean loss: 0.3409784663131106
Epoch: 55, step: 1030, loss: 0.3203386962413788, mean loss: 0.34097820976228993
Epoch: 55, step: 1031, loss: 0.3605513572692871, mean loss: 0.34097845305204666
Epoch: 55, step: 1032, loss: 0.3299868702888489, mean loss: 0.3409783164308795
Epoch: 55, step: 1033, loss: 0.33576700091362, mean loss: 0.34097825165702716
Epoch: 55, step: 1034, loss: 0.3381817042827606, mean loss: 0.34097821689787766
Epoch: 55, step: 1035, loss: 0.2995091676712036, mean loss: 0.3409777014726859
Epoch: 55, step: 1036, loss: 0.3192775249481201, mean loss: 0.3409774317612062
Epoch: 55, step: 1037, loss: 0.3525574207305908, mean loss: 0.34097757568709264
Epoch: 55, step: 1038, loss: 0.3263699412345886, mean loss: 0.3409773941333267
Epoch: 55, step: 1039, loss: 0.3043660521507263, mean loss: 0.34097693910794785
Epoch: 55, step: 1040, loss: 0.3199930489063263, mean loss: 0.34097667831215606
Epoch: 55, step: 1041, loss: 0.3295087516307831, mean loss: 0.34097653578616016
Epoch: 55, step: 1042, loss: 0.3451358377933502, mean loss: 0.3409765874782672
Epoch: 55, step: 1043, loss: 0.3549853265285492, mean loss: 0.34097676157772844
Epoch: 55, step: 1044, loss: 0.37195536494255066, mean loss: 0.34097714657248845
Epoch: 55, step: 1045, loss: 0.2951778173446655, mean loss: 0.34097657739632425
Epoch: 55, step: 1046, loss: 0.3378258943557739, mean loss: 0.3409765382413534
Epoch: 55, step: 1047, loss: 0.31985726952552795, mean loss: 0.3409762757858591
Epoch: 55, step: 1048, loss: 0.3011932671070099, mean loss: 0.3409757813966076
Epoch: 55, step: 1049, loss: 0.3157755732536316, mean loss: 0.3409754682338371
Epoch: 55, step: 1050, loss: 0.3316379487514496, mean loss: 0.34097535219800457
Epoch: 55, step: 1051, loss: 0.3194970190525055, mean loss: 0.3409750852935764
Epoch: 55, step: 1052, loss: 0.3008231520652771, mean loss: 0.34097458634444777
Epoch: 55, step: 1053, loss: 0.31441277265548706, mean loss: 0.3409742562774238
Epoch: 55, step: 1054, loss: 0.3210905194282532, mean loss: 0.34097400919774873
Epoch: 55, step: 1055, loss: 0.38625696301460266, mean loss: 0.34097457188667235
Epoch: 55, step: 1056, loss: 0.35106921195983887, mean loss: 0.3409746973217665
Epoch: 55, step: 1057, loss: 0.36056846380233765, mean loss: 0.34097494078913
Epoch: 55, step: 1058, loss: 0.3418170213699341, mean loss: 0.3409749512524879
Epoch: 55, step: 1059, loss: 0.3523120880126953, mean loss: 0.3409750921214834
Epoch: 55, step: 1060, loss: 0.32976797223091125, mean loss: 0.3409749528697359
Epoch: 55, step: 1061, loss: 0.3461962044239044, mean loss: 0.34097501774450983
Epoch: 55, step: 1062, loss: 0.3409344553947449, mean loss: 0.34097501724052326
Epoch: 55, step: 1063, loss: 0.32407912611961365, mean loss: 0.3409748073119521
Epoch: 55, step: 1064, loss: 0.35380834341049194, mean loss: 0.3409749667644725
Epoch: 55, step: 1065, loss: 0.309552401304245, mean loss: 0.34097457635414696
Epoch: 55, step: 1066, loss: 0.3767896592617035, mean loss: 0.34097502133386925
Epoch: 55, step: 1067, loss: 0.30883461236953735, mean loss: 0.3409746220146047
Epoch: 55, step: 1068, loss: 0.3184252679347992, mean loss: 0.340974341860123
Epoch: 55, step: 1069, loss: 0.3310190737247467, mean loss: 0.34097421817683143
Epoch: 55, step: 1070, loss: 0.2921164929866791, mean loss: 0.3409736111807053
Epoch: 55, step: 1071, loss: 0.3383858799934387, mean loss: 0.3409735790317813
Epoch: 55, step: 1072, loss: 0.3461589217185974, mean loss: 0.34097364345157793
Epoch: 55, step: 1073, loss: 0.3968544900417328, mean loss: 0.34097433767532864
Epoch: 55, step: 1074, loss: 0.33908364176750183, mean loss: 0.34097431418696406
Epoch: 55, step: 1075, loss: 0.3070613443851471, mean loss: 0.34097389288690194
Epoch: 55, step: 1076, loss: 0.38771650195121765, mean loss: 0.3409744735620708
Epoch: 55, step: 1077, loss: 0.3489874005317688, mean loss: 0.34097457310400936
Epoch: 55, step: 1078, loss: 0.3243461847305298, mean loss: 0.3409743665376126
Epoch: 55, step: 1079, loss: 0.3391392230987549, mean loss: 0.3409743437407997
Epoch: 55, step: 1080, loss: 0.3770524561405182, mean loss: 0.3409747919105417
Epoch: 55, step: 1081, loss: 0.3184325397014618, mean loss: 0.340974511889521
Epoch: 55, step: 1082, loss: 0.29666754603385925, mean loss: 0.34097396151294057
Epoch: 55, step: 1083, loss: 0.33258917927742004, mean loss: 0.3409738573593304
Epoch: 55, step: 1084, loss: 0.3352222740650177, mean loss: 0.34097378591552824
Epoch: 55, step: 1085, loss: 0.3118576407432556, mean loss: 0.3409734242512402
Epoch: 55, step: 1086, loss: 0.33356544375419617, mean loss: 0.3409733322346392
Epoch: 55, step: 1087, loss: 0.34836816787719727, mean loss: 0.34097342408682335
Epoch: 55, step: 1088, loss: 0.3238816559314728, mean loss: 0.34097321179045703
Epoch: 55, step: 1089, loss: 0.34168562293052673, mean loss: 0.3409732206391856
Epoch: 55, step: 1090, loss: 0.30637815594673157, mean loss: 0.3409727909455451
Epoch: 55, step: 1091, loss: 0.37137922644615173, mean loss: 0.3409731686089431
Epoch: 55, step: 1092, loss: 0.3525503873825073, mean loss: 0.34097331240210416
Epoch: 55, step: 1093, loss: 0.30742040276527405, mean loss: 0.34097289566824873
Epoch: 55, step: 1094, loss: 0.32923921942710876, mean loss: 0.3409727499354506
Epoch: 55, step: 1095, loss: 0.32384979724884033, mean loss: 0.3409725372702327
Epoch: 55, step: 1096, loss: 0.3185247480869293, mean loss: 0.3409722584745848
Epoch: 55, step: 1097, loss: 0.38714689016342163, mean loss: 0.3409728319442647
Epoch: 55, step: 1098, loss: 0.31525593996047974, mean loss: 0.34097251255515176
Epoch: 55, step: 1099, loss: 0.3322763442993164, mean loss: 0.34097240455504924
Epoch: 55, step: 1100, loss: 0.31872281432151794, mean loss: 0.3409721282347075
Epoch: 55, step: 1101, loss: 0.3104923963546753, mean loss: 0.34097174970794614
Epoch: 55, step: 1102, loss: 0.32171615958213806, mean loss: 0.3409715105763921
Epoch: 55, step: 1103, loss: 0.31286776065826416, mean loss: 0.3409711615655392
Epoch: 55, step: 1104, loss: 0.3384843170642853, mean loss: 0.3409711306826519
Epoch: 55, step: 1105, loss: 0.36954957246780396, mean loss: 0.34097148557972595
Epoch: 55, step: 1106, loss: 0.3468603193759918, mean loss: 0.34097155870841317
Epoch: 55, step: 1107, loss: 0.3358280658721924, mean loss: 0.3409714948363086
Epoch: 55, step: 1108, loss: 0.37193629145622253, mean loss: 0.3409718793536455
Epoch: 55, step: 1109, loss: 0.3519008457660675, mean loss: 0.3409720150666271
Epoch: 55, step: 1110, loss: 0.36247581243515015, mean loss: 0.3409722820917152
Epoch: 55, step: 1111, loss: 0.3462388813495636, mean loss: 0.34097234748931193
Epoch: 55, step: 1112, loss: 0.35586318373680115, mean loss: 0.34097253239284525
Epoch: 55, step: 1113, loss: 0.3319115936756134, mean loss: 0.34097241988212035
Epoch: 55, step: 1114, loss: 0.33100011944770813, mean loss: 0.3409722960564491
Epoch: 55, step: 1115, loss: 0.3708178400993347, mean loss: 0.34097266664282094
Epoch: 55, step: 1116, loss: 0.3187652826309204, mean loss: 0.34097239090143483
Epoch: 55, step: 1117, loss: 0.36547428369522095, mean loss: 0.3409726951291633
Epoch: 55, step: 1118, loss: 0.3058468699455261, mean loss: 0.3409722589948037
Epoch: 55, step: 1119, loss: 0.27021387219429016, mean loss: 0.34097138044517866
Epoch: 55, step: 1120, loss: 0.322768896818161, mean loss: 0.3409711544424766
Epoch: 55, step: 1121, loss: 0.3278068006038666, mean loss: 0.3409709909954075
Epoch: 55, step: 1122, loss: 0.3227999210357666, mean loss: 0.340970765388341
Epoch: 55, step: 1123, loss: 0.3220013678073883, mean loss: 0.34097052987237975
Epoch: 55, step: 1124, loss: 0.323604941368103, mean loss: 0.34097031427130575
Epoch: 55, step: 1125, loss: 0.31058087944984436, mean loss: 0.3409699369783946
Epoch: 55, step: 1126, loss: 0.327390193939209, mean loss: 0.34096976838436827
Epoch: 55, step: 1127, loss: 0.3713243305683136, mean loss: 0.34097014523496894
Epoch: 55, step: 1128, loss: 0.39436212182044983, mean loss: 0.340970808085862
Epoch: 55, step: 1129, loss: 0.31793510913848877, mean loss: 0.3409705221057385
Epoch: 55, step: 1130, loss: 0.330987811088562, mean loss: 0.34097039817542085
Epoch: 55, step: 1131, loss: 0.36076951026916504, mean loss: 0.3409706439683508
Epoch: 55, step: 1132, loss: 0.37097853422164917, mean loss: 0.34097101649190986
Epoch: 55, step: 1133, loss: 0.3081238865852356, mean loss: 0.34097060872656104
Epoch: 55, step: 1134, loss: 0.3444289267063141, mean loss: 0.340970651657701
Epoch: 55, step: 1135, loss: 0.30623605847358704, mean loss: 0.34097022047202663
Epoch: 55, step: 1136, loss: 0.383968710899353, mean loss: 0.3409707542368196
Epoch: 55, step: 1137, loss: 0.3195120394229889, mean loss: 0.34097048786085676
Epoch: 55, step: 1138, loss: 0.3257569670677185, mean loss: 0.3409702990114322
Epoch: 55, step: 1139, loss: 0.3024716079235077, mean loss: 0.34096982112301255
Epoch: 55, step: 1140, loss: 0.3474177122116089, mean loss: 0.34096990116038906
Epoch: 55, step: 1141, loss: 0.2810899019241333, mean loss: 0.3409691578819298
Epoch: 55, step: 1142, loss: 0.33572569489479065, mean loss: 0.34096909279667986
Epoch: 55, step: 1143, loss: 0.31735238432884216, mean loss: 0.3409687996544766
Epoch: 55, step: 1144, loss: 0.33762019872665405, mean loss: 0.34096875809051047
Epoch: 55, step: 1145, loss: 0.3890995383262634, mean loss: 0.3409693554986012
Epoch: 55, step: 1146, loss: 0.3224942088127136, mean loss: 0.34096912618453107
Epoch: 55, step: 1147, loss: 0.30132734775543213, mean loss: 0.3409686341557054
Epoch: 55, step: 1148, loss: 0.3479240834712982, mean loss: 0.3409687204848061
Epoch: 55, step: 1149, loss: 0.3574201464653015, mean loss: 0.34096892467279144
Epoch: 55, step: 1150, loss: 0.3029067814350128, mean loss: 0.34096845226779166
Epoch: 55, step: 1151, loss: 0.3121819794178009, mean loss: 0.3409680949914072
Epoch: 55, step: 1152, loss: 0.33008962869644165, mean loss: 0.34096795997761475
Epoch: 55, step: 1153, loss: 0.3080233335494995, mean loss: 0.3409675511034565
Epoch: 55, step: 1154, loss: 0.36249473690986633, mean loss: 0.340967818272998
Epoch: 55, step: 1155, loss: 0.31391870975494385, mean loss: 0.3409674825761588
Epoch: 55, step: 1156, loss: 0.30129992961883545, mean loss: 0.34096699028241545
Epoch: 55, step: 1157, loss: 0.3409349024295807, mean loss: 0.34096698988419444
Epoch: 55, step: 1158, loss: 0.36261186003685, mean loss: 0.34096725850095755
Epoch: 55, step: 1159, loss: 0.3337472677230835, mean loss: 0.34096716890067486
Epoch: 55, step: 1160, loss: 0.35088154673576355, mean loss: 0.3409672919368476
Epoch: 55, step: 1161, loss: 0.3268812298774719, mean loss: 0.3409671171327715
Epoch: 55, step: 1162, loss: 0.3623802661895752, mean loss: 0.3409673828606429
Epoch: 55, step: 1163, loss: 0.343914270401001, mean loss: 0.3409674194297824
Epoch: 55, step: 1164, loss: 0.3127356767654419, mean loss: 0.3409670690948235
Epoch: 55, step: 1165, loss: 0.3418658971786499, mean loss: 0.34096708024847405
Epoch: 55, step: 1166, loss: 0.3655335307121277, mean loss: 0.34096738509231317
Epoch: 55, step: 1167, loss: 0.32613876461982727, mean loss: 0.34096720108699635
Epoch: 55, step: 1168, loss: 0.33362844586372375, mean loss: 0.3409671100230146
Epoch: 55, step: 1169, loss: 0.31633031368255615, mean loss: 0.3409668043176375
Epoch: 55, step: 1170, loss: 0.3422226309776306, mean loss: 0.34096681990035344
Epoch: 55, step: 1171, loss: 0.36350834369659424, mean loss: 0.3409670995996263
Epoch: 55, step: 1172, loss: 0.3161366581916809, mean loss: 0.34096679150287584
Epoch: 55, step: 1173, loss: 0.35776910185813904, mean loss: 0.34096699998378455
Epoch: 55, step: 1174, loss: 0.31218191981315613, mean loss: 0.3409666428266387
Epoch: 55, step: 1175, loss: 0.3771131634712219, mean loss: 0.34096709131689434
Epoch: 55, step: 1176, loss: 0.36095139384269714, mean loss: 0.34096733927032347
Epoch: 55, step: 1177, loss: 0.3134390711784363, mean loss: 0.34096699772006056
Epoch: 55, step: 1178, loss: 0.32953277230262756, mean loss: 0.3409668558544615
Epoch: 55, step: 1179, loss: 0.2992366552352905, mean loss: 0.34096633811003696
Epoch: 55, step: 1180, loss: 0.37314698100090027, mean loss: 0.3409667373686428
Epoch: 55, step: 1181, loss: 0.3357922434806824, mean loss: 0.3409666731705598
Epoch: 55, step: 1182, loss: 0.3286334276199341, mean loss: 0.3409665201583202
Epoch: 55, step: 1183, loss: 0.3514293432235718, mean loss: 0.3409666499635788
Epoch: 55, step: 1184, loss: 0.33739152550697327, mean loss: 0.3409666056099474
Epoch: 55, step: 1185, loss: 0.3601358234882355, mean loss: 0.34096684342373146
Epoch: 55, step: 1186, loss: 0.3477932810783386, mean loss: 0.3409669281116327
Epoch: 55, step: 1187, loss: 0.33849507570266724, mean loss: 0.34096689744653236
Epoch: 55, step: 1188, loss: 0.3164568245410919, mean loss: 0.3409665933852873
Epoch: 55, step: 1189, loss: 0.337928831577301, mean loss: 0.34096655570061035
Epoch: 55, step: 1190, loss: 0.31101328134536743, mean loss: 0.34096618412260793
Epoch: 55, step: 1191, loss: 0.34326431155204773, mean loss: 0.34096621263111077
Epoch: 55, step: 1192, loss: 0.31407061219215393, mean loss: 0.34096587899261027
Epoch: 55, step: 1193, loss: 0.3228202164173126, mean loss: 0.34096565389941835
Epoch: 55, step: 1194, loss: 0.32818734645843506, mean loss: 0.34096549538912324
Epoch: 55, step: 1195, loss: 0.33953866362571716, mean loss: 0.3409654776900094
Epoch: 55, step: 1196, loss: 0.34233197569847107, mean loss: 0.3409654946405038
Epoch: 55, step: 1197, loss: 0.32024121284484863, mean loss: 0.34096523757282915
Epoch: 55, step: 1198, loss: 0.3249398469924927, mean loss: 0.34096503879350193
Epoch: 55, step: 1199, loss: 0.35859882831573486, mean loss: 0.3409652575207349
Epoch: 55, step: 1200, loss: 0.3403412401676178, mean loss: 0.3409652497806008
Epoch: 55, step: 1201, loss: 0.3525140583515167, mean loss: 0.34096539302696743
Epoch: 55, step: 1202, loss: 0.30575817823410034, mean loss: 0.34096495633750173
Epoch: 55, step: 1203, loss: 0.34675318002700806, mean loss: 0.34096502813031393
Epoch: 55, step: 1204, loss: 0.3159197270870209, mean loss: 0.34096471749092117
Epoch: 55, step: 1205, loss: 0.3359128534793854, mean loss: 0.3409646548329199
Epoch: 55, step: 1206, loss: 0.3366098701953888, mean loss: 0.340964600821427
Epoch: 55, step: 1207, loss: 0.3153606653213501, mean loss: 0.3409642832650508
Epoch: 55, step: 1208, loss: 0.2994450032711029, mean loss: 0.34096376832278447
Epoch: 55, step: 1209, loss: 0.36255961656570435, mean loss: 0.3409640361616564
Epoch: 55, step: 1210, loss: 0.3315531611442566, mean loss: 0.34096391944631094
Epoch: 55, step: 1211, loss: 0.31020310521125793, mean loss: 0.3409635379499542
Epoch: 55, step: 1212, loss: 0.3260466754436493, mean loss: 0.3409633529529616
Epoch: 55, step: 1213, loss: 0.3259813189506531, mean loss: 0.34096316715002484
Epoch: 55, step: 1214, loss: 0.3414877653121948, mean loss: 0.34096317365586176
Epoch: 55, step: 1215, loss: 0.32036808133125305, mean loss: 0.3409629182477026
Epoch: 55, step: 1216, loss: 0.39245930314064026, mean loss: 0.34096355686750357
Epoch: 55, step: 1217, loss: 0.33410143852233887, mean loss: 0.3409634717696794
Epoch: 55, step: 1218, loss: 0.330472856760025, mean loss: 0.34096334167611414
Epoch: 55, step: 1219, loss: 0.3650185763835907, mean loss: 0.340963639980116
Epoch: 55, step: 1220, loss: 0.4108676612377167, mean loss: 0.34096450683470925
Epoch: 55, step: 1221, loss: 0.3226611614227295, mean loss: 0.3409642798643289
Epoch: 55, step: 1222, loss: 0.34168028831481934, mean loss: 0.34096428874307166
Epoch: 55, step: 1223, loss: 0.3271588683128357, mean loss: 0.3409641175533932
Epoch: 55, step: 1224, loss: 0.3354400098323822, mean loss: 0.34096404905432043
Epoch: 55, step: 1225, loss: 0.3112047612667084, mean loss: 0.3409636800429896
Epoch: 55, step: 1226, loss: 0.3309795558452606, mean loss: 0.3409635562426722
Epoch: 55, step: 1227, loss: 0.32388100028038025, mean loss: 0.3409633444264342
Epoch: 55, step: 1228, loss: 0.3349750339984894, mean loss: 0.3409632701749193
Epoch: 55, step: 1229, loss: 0.34820443391799927, mean loss: 0.3409633599599626
Epoch: 55, step: 1230, loss: 0.3133770823478699, mean loss: 0.34096301791488426
Epoch: 55, step: 1231, loss: 0.33971720933914185, mean loss: 0.3409630024681678
Epoch: 55, step: 1232, loss: 0.31841805577278137, mean loss: 0.3409627229379991
Epoch: 55, step: 1233, loss: 0.34144723415374756, mean loss: 0.3409627289452798
Epoch: 55, step: 1234, loss: 0.3278534710407257, mean loss: 0.34096256641031103
Epoch: 55, step: 1235, loss: 0.31421682238578796, mean loss: 0.34096223480765253
Epoch: 55, step: 1236, loss: 0.3180045783519745, mean loss: 0.34096195017449665
Epoch: 55, step: 1237, loss: 0.33855706453323364, mean loss: 0.3409619203586614
Epoch: 55, step: 1238, loss: 0.35890668630599976, mean loss: 0.3409621428355821
Epoch: 55, step: 1239, loss: 0.3049304783344269, mean loss: 0.34096169612513705
Epoch: 55, step: 1240, loss: 0.2911747395992279, mean loss: 0.34096107888810145
Epoch: 55, step: 1241, loss: 0.30647847056388855, mean loss: 0.34096065139301923
Epoch: 55, step: 1242, loss: 0.3558306097984314, mean loss: 0.34096083573972596
Epoch: 55, step: 1243, loss: 0.3291654586791992, mean loss: 0.3409606895112094
Epoch: 55, step: 1244, loss: 0.32145214080810547, mean loss: 0.34096044766469974
Epoch: 55, step: 1245, loss: 0.3010331690311432, mean loss: 0.34095995269434504
Epoch: 55, step: 1246, loss: 0.3176189959049225, mean loss: 0.3409596633448367
Epoch: 55, step: 1247, loss: 0.30318811535835266, mean loss: 0.3409591951102457
Epoch: 55, step: 1248, loss: 0.3406330943107605, mean loss: 0.3409591910677907
Epoch: 55, step: 1249, loss: 0.31353092193603516, mean loss: 0.34095885106197527
Epoch: 55, step: 1250, loss: 0.32201799750328064, mean loss: 0.3409586162706183
Epoch: 55, step: 1251, loss: 0.3161024749279022, mean loss: 0.34095830815700584
Epoch: 55, step: 1252, loss: 0.32327064871788025, mean loss: 0.34095808890571433
Epoch: 55, step: 1253, loss: 0.35230767726898193, mean loss: 0.3409582295903012
Epoch: 55, step: 1254, loss: 0.3554735779762268, mean loss: 0.3409584095140494
Epoch: 55, step: 1255, loss: 0.3218108117580414, mean loss: 0.3409581721745958
Epoch: 55, step: 1256, loss: 0.2935871481895447, mean loss: 0.34095758500571266
Epoch: 55, step: 1257, loss: 0.320270836353302, mean loss: 0.34095732859444006
Epoch: 55, step: 1258, loss: 0.3223162889480591, mean loss: 0.3409570975424978
Epoch: 55, step: 1259, loss: 0.3511652946472168, mean loss: 0.34095722406948226
Epoch: 55, step: 1260, loss: 0.3393456041812897, mean loss: 0.3409572040942726
Epoch: 55, step: 1261, loss: 0.34950870275497437, mean loss: 0.3409573100844397
Epoch: 55, step: 1262, loss: 0.33612093329429626, mean loss: 0.34095725014149275
Epoch: 55, step: 1263, loss: 0.3472910225391388, mean loss: 0.3409573286424644
Epoch: 55, step: 1264, loss: 0.3392890691757202, mean loss: 0.34095730796626106
Epoch: 55, step: 1265, loss: 0.32013124227523804, mean loss: 0.3409570498537547
Epoch: 55, step: 1266, loss: 0.3368659019470215, mean loss: 0.34095699914982586
Epoch: 55, step: 1267, loss: 0.3497921824455261, mean loss: 0.3409571086479333
Epoch: 55, step: 1268, loss: 0.32161960005760193, mean loss: 0.3409568689931032
Epoch: 55, step: 1269, loss: 0.3100520372390747, mean loss: 0.3409564859861413
Epoch: 55, step: 1270, loss: 0.3244812786579132, mean loss: 0.3409562818096244
Epoch: 55, step: 1271, loss: 0.3298760652542114, mean loss: 0.34095614449469164
Epoch: 55, step: 1272, loss: 0.3457334339618683, mean loss: 0.34095620369796165
Epoch: 55, step: 1273, loss: 0.36243537068367004, mean loss: 0.34095646987843337
Epoch: 55, step: 1274, loss: 0.3348986804485321, mean loss: 0.3409563948082378
Epoch: 55, step: 1275, loss: 0.3573998510837555, mean loss: 0.34095659857863875
Epoch: 55, step: 1276, loss: 0.3618526756763458, mean loss: 0.340956857523545
Epoch: 55, step: 1277, loss: 0.317634254693985, mean loss: 0.34095656851262984
Epoch: 55, step: 1278, loss: 0.30464720726013184, mean loss: 0.34095611857692737
Epoch: 55, step: 1279, loss: 0.33559510111808777, mean loss: 0.34095605214548425
Epoch: 55, step: 1280, loss: 0.3357211649417877, mean loss: 0.3409559872777973
Epoch: 55, step: 1281, loss: 0.3183024823665619, mean loss: 0.3409557065721777
Epoch: 55, step: 1282, loss: 0.34982678294181824, mean loss: 0.34095581649468826
Epoch: 55, step: 1283, loss: 0.3284699618816376, mean loss: 0.3409556617829687
Epoch: 55, step: 1284, loss: 0.37218940258026123, mean loss: 0.3409560487941923
Epoch: 55, step: 1285, loss: 0.3182748258113861, mean loss: 0.3409557677590402
Epoch: 55, step: 1286, loss: 0.33086922764778137, mean loss: 0.34095564278177537
Epoch: 55, step: 1287, loss: 0.3058883845806122, mean loss: 0.3409552082863325
Epoch: 55, step: 1288, loss: 0.3259057402610779, mean loss: 0.34095502182053533
Epoch: 55, step: 1289, loss: 0.3134861886501312, mean loss: 0.3409546814806373
Epoch: 55, step: 1290, loss: 0.33701035380363464, mean loss: 0.3409546326108714
Epoch: 55, step: 1291, loss: 0.33542317152023315, mean loss: 0.34095456407755426
Epoch: 55, step: 1292, loss: 0.3049659729003906, mean loss: 0.3409541181941008
Epoch: 55, step: 1293, loss: 0.3125224709510803, mean loss: 0.3409537659423571
Epoch: 55, step: 1294, loss: 0.35947203636169434, mean loss: 0.34095399537022575
Epoch: 55, step: 1295, loss: 0.3381907343864441, mean loss: 0.340953961135861
Epoch: 55, step: 1296, loss: 0.31804993748664856, mean loss: 0.3409536773787386
Epoch: 55, step: 1297, loss: 0.3196856379508972, mean loss: 0.34095341389302997
Epoch: 55, step: 1298, loss: 0.329152375459671, mean loss: 0.34095326769401324
Epoch: 55, step: 1299, loss: 0.32561495900154114, mean loss: 0.3409530776753228
Epoch: 55, step: 1300, loss: 0.3011765778064728, mean loss: 0.3409525849101208
Epoch: 55, step: 1301, loss: 0.3881421387195587, mean loss: 0.3409531695035874
Epoch: 55, step: 1302, loss: 0.3791598677635193, mean loss: 0.34095364280981066
Epoch: 55, step: 1303, loss: 0.3410766124725342, mean loss: 0.3409536443331453
Epoch: 55, step: 1304, loss: 0.35143741965293884, mean loss: 0.34095377420338774
Epoch: 55, step: 1305, loss: 0.3750119209289551, mean loss: 0.34095419610149647
Epoch: 55, step: 1306, loss: 0.3236011862754822, mean loss: 0.3409539811423152
Epoch: 55, step: 1307, loss: 0.36927270889282227, mean loss: 0.3409543319342059
Epoch: 55, step: 1308, loss: 0.31635457277297974, mean loss: 0.34095402721397944
Epoch: 55, step: 1309, loss: 0.3524061143398285, mean loss: 0.3409541690706266
Epoch: 55, step: 1310, loss: 0.2932029068470001, mean loss: 0.3409535775845528
Epoch: 55, step: 1311, loss: 0.3458007574081421, mean loss: 0.34095363762493114
Epoch: 55, step: 1312, loss: 0.34275728464126587, mean loss: 0.34095365996582044
Epoch: 55, step: 1313, loss: 0.34642916917800903, mean loss: 0.3409537277874224
Epoch: 55, step: 1314, loss: 0.29834190011024475, mean loss: 0.3409531999887269
Epoch: 55, step: 1315, loss: 0.33458784222602844, mean loss: 0.34095312114709786
Epoch: 55, step: 1316, loss: 0.30608171224594116, mean loss: 0.3409526892334907
Epoch: 55, step: 1317, loss: 0.36330878734588623, mean loss: 0.34095296613034365
Epoch: 55, step: 1318, loss: 0.30287715792655945, mean loss: 0.3409524945390655
Epoch: 55, step: 1319, loss: 0.3170621395111084, mean loss: 0.3409521986466327
Epoch: 55, step: 1320, loss: 0.3026323914527893, mean loss: 0.34095172404504
Epoch: 55, step: 1321, loss: 0.3483816683292389, mean loss: 0.3409518160658505
Epoch: 55, step: 1322, loss: 0.3554660677909851, mean loss: 0.3409519958244887
Epoch: 55, step: 1323, loss: 0.3420887589454651, mean loss: 0.34095200990309665
Epoch: 55, step: 1324, loss: 0.29931119084358215, mean loss: 0.34095149419538645
Epoch: 55, step: 1325, loss: 0.31621530652046204, mean loss: 0.3409511878497139
Epoch: 55, step: 1326, loss: 0.2870565354824066, mean loss: 0.34095052039888146
Epoch: 55, step: 1327, loss: 0.3756633996963501, mean loss: 0.3409509502903871
Epoch: 55, step: 1328, loss: 0.3402816355228424, mean loss: 0.3409509420015567
Epoch: 55, step: 1329, loss: 0.35677433013916016, mean loss: 0.34095113795682774
Epoch: 55, step: 1330, loss: 0.3070507347583771, mean loss: 0.34095071814279204
Epoch: 55, step: 1331, loss: 0.30900585651397705, mean loss: 0.3409503225505884
Epoch: 55, step: 1332, loss: 0.38771960139274597, mean loss: 0.3409509017151871
Epoch: 55, step: 1333, loss: 0.3445087969303131, mean loss: 0.3409509457736265
Epoch: 55, step: 1334, loss: 0.31807219982147217, mean loss: 0.34095066246304573
Epoch: 55, step: 1335, loss: 0.33780401945114136, mean loss: 0.34095062349822564
Epoch: 55, step: 1336, loss: 0.3267063498497009, mean loss: 0.34095044711384226
Epoch: 55, step: 1337, loss: 0.306357204914093, mean loss: 0.3409500187569959
Epoch: 55, step: 1338, loss: 0.3187353014945984, mean loss: 0.34094974368279657
Epoch: 55, step: 1339, loss: 0.35782554745674133, mean loss: 0.3409499526452009
Epoch: 55, step: 1340, loss: 0.3298177719116211, mean loss: 0.34094981480415465
Epoch: 55, step: 1341, loss: 0.33894240856170654, mean loss: 0.34094978994832836
Epoch: 55, step: 1342, loss: 0.3508825898170471, mean loss: 0.3409499129353381
Epoch: 55, step: 1343, loss: 0.36113521456718445, mean loss: 0.3409501628647823
Epoch: 55, step: 1344, loss: 0.3269732892513275, mean loss: 0.34094998980871083
Epoch: 55, step: 1345, loss: 0.3146556615829468, mean loss: 0.3409496642468627
Epoch: 55, step: 1346, loss: 0.31564047932624817, mean loss: 0.34094935088639466
Epoch: 55, step: 1347, loss: 0.32059162855148315, mean loss: 0.34094909883456304
Epoch: 55, step: 1348, loss: 0.2767926752567291, mean loss: 0.3409483045146683
Epoch: 55, step: 1349, loss: 0.3338015675544739, mean loss: 0.340948216032101
Epoch: 55, step: 1350, loss: 0.3161572813987732, mean loss: 0.340947909103443
Epoch: 55, step: 1351, loss: 0.3334444761276245, mean loss: 0.34094781620698167
Epoch: 55, step: 1352, loss: 0.3528260886669159, mean loss: 0.3409479632644447
Epoch: 55, step: 1353, loss: 0.3014954924583435, mean loss: 0.340947474834123
Epoch: 55, step: 1354, loss: 0.3753111958503723, mean loss: 0.34094790025932903
Epoch: 55, step: 1355, loss: 0.3611361086368561, mean loss: 0.34094815018762925
Epoch: 55, step: 1356, loss: 0.36329343914985657, mean loss: 0.34094842681697873
Epoch: 55, step: 1357, loss: 0.40196338295936584, mean loss: 0.3409491821582368
Epoch: 55, step: 1358, loss: 0.3273639976978302, mean loss: 0.3409490139810563
Epoch: 55, step: 1359, loss: 0.31338921189308167, mean loss: 0.3409486728099485
Epoch: 55, step: 1360, loss: 0.35117894411087036, mean loss: 0.3409487994519968
Epoch: 55, step: 1361, loss: 0.35904431343078613, mean loss: 0.34094902345627964
Epoch: 55, step: 1362, loss: 0.32072874903678894, mean loss: 0.3409487731526957
Epoch: 55, step: 1363, loss: 0.3182021677494049, mean loss: 0.34094849157954504
Epoch: 55, step: 1364, loss: 0.2982308864593506, mean loss: 0.3409479627981485
Epoch: 55, step: 1365, loss: 0.33591797947883606, mean loss: 0.34094790053509155
Epoch: 55, step: 1366, loss: 0.3175205588340759, mean loss: 0.34094761054608713
Epoch: 55, step: 1367, loss: 0.35532498359680176, mean loss: 0.3409477885103027
Epoch: 55, step: 1368, loss: 0.3718174695968628, mean loss: 0.3409481706128301
Epoch: 55, step: 1369, loss: 0.3080386519432068, mean loss: 0.3409477632663928
Epoch: 55, step: 1370, loss: 0.30795103311538696, mean loss: 0.34094735484552724
Epoch: 55, step: 1371, loss: 0.32428207993507385, mean loss: 0.3409471485717017
Epoch: 55, step: 1372, loss: 0.3060365617275238, mean loss: 0.34094671647254904
Epoch: 55, step: 1373, loss: 0.3509068787097931, mean loss: 0.340946839751038
Epoch: 55, step: 1374, loss: 0.3604350686073303, mean loss: 0.3409470809569153
Epoch: 55, step: 1375, loss: 0.35232800245285034, mean loss: 0.34094722181687737
Epoch: 55, step: 1376, loss: 0.2921849489212036, mean loss: 0.34094661830099315
Epoch: 55, step: 1377, loss: 0.3214659094810486, mean loss: 0.3409463771971438
Epoch: 55, step: 1378, loss: 0.2989480495452881, mean loss: 0.340945857409428
Epoch: 55, step: 1379, loss: 0.3003818690776825, mean loss: 0.3409453553798695
Epoch: 55, step: 1380, loss: 0.3270953297615051, mean loss: 0.3409451839707827
Epoch: 55, step: 1381, loss: 0.30523285269737244, mean loss: 0.3409447419974247
Epoch: 55, step: 1382, loss: 0.31611543893814087, mean loss: 0.340944434715479
Epoch: 55, step: 1383, loss: 0.3147335350513458, mean loss: 0.3409441103392146
Epoch: 55, step: 1384, loss: 0.3421350419521332, mean loss: 0.3409441250775552
Epoch: 55, step: 1385, loss: 0.3304455578327179, mean loss: 0.34094399515444007
Epoch: 55, step: 1386, loss: 0.3268324136734009, mean loss: 0.3409438205212835
Epoch: 55, step: 1387, loss: 0.3225184381008148, mean loss: 0.34094359250694806
Epoch: 55, step: 1388, loss: 0.37919896841049194, mean loss: 0.3409440659118399
Epoch: 55, step: 1389, loss: 0.2974781095981598, mean loss: 0.3409435280334051
Epoch: 55, step: 1390, loss: 0.3698666989803314, mean loss: 0.34094388594471603
Epoch: 55, step: 1391, loss: 0.3419880270957947, mean loss: 0.3409438988653361
Epoch: 55, step: 1392, loss: 0.32973238825798035, mean loss: 0.34094376013133776
Epoch: 55, step: 1393, loss: 0.3518506586551666, mean loss: 0.34094389509432094
Epoch: 55, step: 1394, loss: 0.3277990221977234, mean loss: 0.34094373244044607
Epoch: 55, step: 1395, loss: 0.37615150213241577, mean loss: 0.340944168093902
Epoch: 55, step: 1396, loss: 0.32836684584617615, mean loss: 0.3409440124667165
Epoch: 55, step: 1397, loss: 0.3337526321411133, mean loss: 0.3409439234843076
Epoch: 55, step: 1398, loss: 0.338236004114151, mean loss: 0.34094388997833286
Epoch: 55, step: 1399, loss: 0.3466629087924957, mean loss: 0.3409439607407532
Epoch: 55, step: 1400, loss: 0.37735849618911743, mean loss: 0.3409444112985965
Epoch: 55, step: 1401, loss: 0.3447217345237732, mean loss: 0.34094445803492107
Epoch: 55, step: 1402, loss: 0.35462498664855957, mean loss: 0.3409446273002121
Epoch: 55, step: 1403, loss: 0.3357880413532257, mean loss: 0.3409445635000296
Epoch: 55, step: 1404, loss: 0.30147475004196167, mean loss: 0.3409440751633336
Epoch: 55, step: 1405, loss: 0.35373392701148987, mean loss: 0.3409442334026606
Epoch: 55, step: 1406, loss: 0.3539195656776428, mean loss: 0.3409443939348129
Epoch: 55, step: 1407, loss: 0.33148884773254395, mean loss: 0.3409442769512651
Epoch: 55, step: 1408, loss: 0.33767762780189514, mean loss: 0.34094423653694417
Epoch: 55, step: 1409, loss: 0.3031116724014282, mean loss: 0.34094376848592184
Epoch: 55, step: 1410, loss: 0.2903129458427429, mean loss: 0.3409431421071483
Epoch: 55, step: 1411, loss: 0.3405146896839142, mean loss: 0.34094313680661853
Epoch: 55, step: 1412, loss: 0.36781176924705505, mean loss: 0.3409434692034421
Epoch: 55, step: 1413, loss: 0.3446086645126343, mean loss: 0.3409435145456905
Epoch: 55, step: 1414, loss: 0.2972090244293213, mean loss: 0.3409429735116073
Epoch: 55, step: 1415, loss: 0.3439100980758667, mean loss: 0.34094301021709206
Epoch: 55, step: 1416, loss: 0.35720229148864746, mean loss: 0.340943211353716
Epoch: 55, step: 1417, loss: 0.29745352268218994, mean loss: 0.34094267336800793
Epoch: 55, step: 1418, loss: 0.34979090094566345, mean loss: 0.340942782822944
Epoch: 55, step: 1419, loss: 0.32175159454345703, mean loss: 0.3409425454257609
Epoch: 55, step: 1420, loss: 0.3418872654438019, mean loss: 0.3409425571119105
Epoch: 55, step: 1421, loss: 0.33153393864631653, mean loss: 0.3409424407291087
Epoch: 55, step: 1422, loss: 0.35307568311691284, mean loss: 0.34094259081312817
Epoch: 55, step: 1423, loss: 0.29544976353645325, mean loss: 0.3409420280895213
Epoch: 55, step: 1424, loss: 0.33850008249282837, mean loss: 0.34094199788424456
Epoch: 55, step: 1425, loss: 0.3251650333404541, mean loss: 0.3409418027358817
Epoch: 55, step: 1426, loss: 0.3359992802143097, mean loss: 0.3409417416016093
Epoch: 55, step: 1427, loss: 0.3195357322692871, mean loss: 0.3409414768330395
Epoch: 55, step: 1428, loss: 0.3166578412055969, mean loss: 0.3409411764751423
Epoch: 55, step: 1429, loss: 0.34206265211105347, mean loss: 0.3409411903462077
Epoch: 55, step: 1430, loss: 0.3270396888256073, mean loss: 0.34094101840644786
Epoch: 55, step: 1431, loss: 0.38480982184410095, mean loss: 0.3409415609879973
Epoch: 55, step: 1432, loss: 0.3785776197910309, mean loss: 0.34094202647547217
Epoch: 55, step: 1433, loss: 0.31588026881217957, mean loss: 0.3409417165123576
Epoch: 55, step: 1434, loss: 0.33845648169517517, mean loss: 0.3409416857754234
Epoch: 55, step: 1435, loss: 0.3457004427909851, mean loss: 0.3409417446301406
Epoch: 55, step: 1436, loss: 0.3481822609901428, mean loss: 0.34094183417732093
Epoch: 55, step: 1437, loss: 0.32400035858154297, mean loss: 0.34094162465599226
Epoch: 55, step: 1438, loss: 0.37423768639564514, mean loss: 0.34094203643528387
Epoch: 55, step: 1439, loss: 0.3329443633556366, mean loss: 0.3409419375276277
Epoch: 55, step: 1440, loss: 0.29996758699417114, mean loss: 0.3409414308018819
Epoch: 55, step: 1441, loss: 0.3571842610836029, mean loss: 0.34094163167287544
Epoch: 55, step: 1442, loss: 0.3368464410305023, mean loss: 0.3409415810293099
Epoch: 55, step: 1443, loss: 0.30831971764564514, mean loss: 0.34094117761291465
Valid: 55, mean loss: 0.18533906588951748
Epoch: 56, step: 0, loss: 0.3664715588092804, mean loss: 0.3409414933289994
Epoch: 56, step: 1, loss: 0.35077330470085144, mean loss: 0.3409416149105216
Epoch: 56, step: 2, loss: 0.3249666094779968, mean loss: 0.3409414173638656
Epoch: 56, step: 3, loss: 0.3326941132545471, mean loss: 0.34094131537909894
Epoch: 56, step: 4, loss: 0.3314184546470642, mean loss: 0.34094119762247116
Epoch: 56, step: 5, loss: 0.3222370445728302, mean loss: 0.34094096633580057
Epoch: 56, step: 6, loss: 0.3076043128967285, mean loss: 0.34094055411567914
Epoch: 56, step: 7, loss: 0.34268897771835327, mean loss: 0.3409405757353201
Epoch: 56, step: 8, loss: 0.2964934706687927, mean loss: 0.3409400261439229
Epoch: 56, step: 9, loss: 0.3256025016307831, mean loss: 0.3409398364967617
Epoch: 56, step: 10, loss: 0.3592248260974884, mean loss: 0.3409400625862776
Epoch: 56, step: 11, loss: 0.3465554416179657, mean loss: 0.3409401320182356
Epoch: 56, step: 12, loss: 0.27859851717948914, mean loss: 0.34093936119816515
Epoch: 56, step: 13, loss: 0.3848575949668884, mean loss: 0.3409399042164615
Epoch: 56, step: 14, loss: 0.30937525629997253, mean loss: 0.3409395139464542
Epoch: 56, step: 15, loss: 0.3250106871128082, mean loss: 0.3409393170025023
Epoch: 56, step: 16, loss: 0.3276885151863098, mean loss: 0.3409391531716667
Epoch: 56, step: 17, loss: 0.35292062163352966, mean loss: 0.34093930130683225
Epoch: 56, step: 18, loss: 0.3208296000957489, mean loss: 0.34093905267978813
Epoch: 56, step: 19, loss: 0.34377825260162354, mean loss: 0.34093908778190873
Epoch: 56, step: 20, loss: 0.3245646357536316, mean loss: 0.34093888534076355
Epoch: 56, step: 21, loss: 0.31602743268013, mean loss: 0.34093857735850874
Epoch: 56, step: 22, loss: 0.36009323596954346, mean loss: 0.3409388141661368
Epoch: 56, step: 23, loss: 0.3888316750526428, mean loss: 0.3409394062547147
Epoch: 56, step: 24, loss: 0.36004912853240967, mean loss: 0.3409396425009568
Epoch: 56, step: 25, loss: 0.3222343623638153, mean loss: 0.3409394112575381
Epoch: 56, step: 26, loss: 0.3490758240222931, mean loss: 0.34093951184243343
Epoch: 56, step: 27, loss: 0.32417067885398865, mean loss: 0.34093930454340526
Epoch: 56, step: 28, loss: 0.33078399300575256, mean loss: 0.3409391790033519
Epoch: 56, step: 29, loss: 0.31698447465896606, mean loss: 0.34093888287874013
Epoch: 56, step: 30, loss: 0.318922758102417, mean loss: 0.3409386107219347
Epoch: 56, step: 31, loss: 0.3313465714454651, mean loss: 0.34093849214945554
Epoch: 56, step: 32, loss: 0.32322990894317627, mean loss: 0.3409382732466136
Epoch: 56, step: 33, loss: 0.35786762833595276, mean loss: 0.34093848251451997
Epoch: 56, step: 34, loss: 0.32672470808029175, mean loss: 0.3409383068167433
Epoch: 56, step: 35, loss: 0.3347580134868622, mean loss: 0.3409382304225118
Epoch: 56, step: 36, loss: 0.34972959756851196, mean loss: 0.3409383390907254
Epoch: 56, step: 37, loss: 0.38748881220817566, mean loss: 0.3409389144840793
Epoch: 56, step: 38, loss: 0.2991342842578888, mean loss: 0.34093839775873874
Epoch: 56, step: 39, loss: 0.33132264018058777, mean loss: 0.3409382789048183
Epoch: 56, step: 40, loss: 0.29960164427757263, mean loss: 0.3409377679767591
Epoch: 56, step: 41, loss: 0.3563717007637024, mean loss: 0.34093795874051935
Epoch: 56, step: 42, loss: 0.3638345003128052, mean loss: 0.34093824173879606
Epoch: 56, step: 43, loss: 0.28246793150901794, mean loss: 0.34093751906229647
Epoch: 56, step: 44, loss: 0.34634560346603394, mean loss: 0.3409375859038642
Epoch: 56, step: 45, loss: 0.289957731962204, mean loss: 0.3409369558228613
Epoch: 56, step: 46, loss: 0.2782972753047943, mean loss: 0.34093618164282996
Epoch: 56, step: 47, loss: 0.3398366868495941, mean loss: 0.3409361680540571
Epoch: 56, step: 48, loss: 0.3416025638580322, mean loss: 0.34093617629001177
Epoch: 56, step: 49, loss: 0.3044582009315491, mean loss: 0.34093572546598433
Epoch: 56, step: 50, loss: 0.32933494448661804, mean loss: 0.3409355820960161
Epoch: 56, step: 51, loss: 0.32980480790138245, mean loss: 0.3409354445363963
Epoch: 56, step: 52, loss: 0.32497915625572205, mean loss: 0.3409352473431207
Epoch: 56, step: 53, loss: 0.3213580846786499, mean loss: 0.3409350054048293
Epoch: 56, step: 54, loss: 0.31237170100212097, mean loss: 0.3409346524184552
Epoch: 56, step: 55, loss: 0.37203165888786316, mean loss: 0.3409350367116642
Epoch: 56, step: 56, loss: 0.3017585575580597, mean loss: 0.3409345525792492
Epoch: 56, step: 57, loss: 0.33007749915122986, mean loss: 0.34093441841235483
Epoch: 56, step: 58, loss: 0.3672696650028229, mean loss: 0.3409347438482209
Epoch: 56, step: 59, loss: 0.3371056616306305, mean loss: 0.34093469653120473
Epoch: 56, step: 60, loss: 0.3163948059082031, mean loss: 0.3409343932888121
Epoch: 56, step: 61, loss: 0.29644572734832764, mean loss: 0.34093384354378653
Epoch: 56, step: 62, loss: 0.3261249363422394, mean loss: 0.34093366055285396
Epoch: 56, step: 63, loss: 0.35697734355926514, mean loss: 0.34093385879923355
Epoch: 56, step: 64, loss: 0.3112685978412628, mean loss: 0.3409334922401391
Epoch: 56, step: 65, loss: 0.32195931673049927, mean loss: 0.34093325778844613
Epoch: 56, step: 66, loss: 0.3304983377456665, mean loss: 0.34093312885243837
Epoch: 56, step: 67, loss: 0.33879896998405457, mean loss: 0.34093310248266046
Epoch: 56, step: 68, loss: 0.33706533908843994, mean loss: 0.34093305469296536
Epoch: 56, step: 69, loss: 0.3140648305416107, mean loss: 0.3409327227159946
Epoch: 56, step: 70, loss: 0.31381720304489136, mean loss: 0.3409323876876426
Epoch: 56, step: 71, loss: 0.30377504229545593, mean loss: 0.3409319285922414
Epoch: 56, step: 72, loss: 0.3420892357826233, mean loss: 0.34093194289110584
Epoch: 56, step: 73, loss: 0.33896246552467346, mean loss: 0.3409319185579451
Epoch: 56, step: 74, loss: 0.2919423580169678, mean loss: 0.3409313132927387
Epoch: 56, step: 75, loss: 0.33174440264701843, mean loss: 0.34093119979001263
Epoch: 56, step: 76, loss: 0.33752188086509705, mean loss: 0.34093115766897475
Epoch: 56, step: 77, loss: 0.32754284143447876, mean loss: 0.3409309922626809
Epoch: 56, step: 78, loss: 0.29370203614234924, mean loss: 0.34093040877854863
Epoch: 56, step: 79, loss: 0.3286173641681671, mean loss: 0.34093025666048415
Epoch: 56, step: 80, loss: 0.3559461534023285, mean loss: 0.3409304421678872
Epoch: 56, step: 81, loss: 0.35196343064308167, mean loss: 0.3409305784684885
Epoch: 56, step: 82, loss: 0.3313540816307068, mean loss: 0.34093046016272255
Epoch: 56, step: 83, loss: 0.3664816915988922, mean loss: 0.3409307758126637
Epoch: 56, step: 84, loss: 0.30993959307670593, mean loss: 0.3409303929644168
Epoch: 56, step: 85, loss: 0.3296830952167511, mean loss: 0.3409302540231228
Epoch: 56, step: 86, loss: 0.3479929268360138, mean loss: 0.3409303412693929
Epoch: 56, step: 87, loss: 0.4768056273460388, mean loss: 0.34093201973670784
Epoch: 56, step: 88, loss: 0.2946116626262665, mean loss: 0.34093144754843674
Epoch: 56, step: 89, loss: 0.29698678851127625, mean loss: 0.34093090471350534
Epoch: 56, step: 90, loss: 0.32825836539268494, mean loss: 0.340930748175437
Epoch: 56, step: 91, loss: 0.3203895390033722, mean loss: 0.3409304944424318
Epoch: 56, step: 92, loss: 0.31059467792510986, mean loss: 0.3409301197272556
Epoch: 56, step: 93, loss: 0.3358040452003479, mean loss: 0.34093005640955354
Epoch: 56, step: 94, loss: 0.36216551065444946, mean loss: 0.3409303187084239
Epoch: 56, step: 95, loss: 0.3003166615962982, mean loss: 0.34092981705752085
Epoch: 56, step: 96, loss: 0.3592320680618286, mean loss: 0.3409300431200819
Epoch: 56, step: 97, loss: 0.3333827257156372, mean loss: 0.34092994989959075
Epoch: 56, step: 98, loss: 0.400251179933548, mean loss: 0.3409306825951435
Epoch: 56, step: 99, loss: 0.3544272780418396, mean loss: 0.34093084929386697
Epoch: 56, step: 100, loss: 0.33700060844421387, mean loss: 0.34093080075139987
Epoch: 56, step: 101, loss: 0.33609211444854736, mean loss: 0.34093074098944665
Epoch: 56, step: 102, loss: 0.3188736140727997, mean loss: 0.3409304685682514
Epoch: 56, step: 103, loss: 0.33617424964904785, mean loss: 0.3409304098262926
Epoch: 56, step: 104, loss: 0.31024134159088135, mean loss: 0.340930030803849
Epoch: 56, step: 105, loss: 0.3134448826313019, mean loss: 0.34092969135531037
Epoch: 56, step: 106, loss: 0.3633972406387329, mean loss: 0.34092996883180543
Epoch: 56, step: 107, loss: 0.39142248034477234, mean loss: 0.3409305924117036
Epoch: 56, step: 108, loss: 0.3183707296848297, mean loss: 0.3409303138020099
Epoch: 56, step: 109, loss: 0.32255229353904724, mean loss: 0.34093008684001885
Epoch: 56, step: 110, loss: 0.3521430492401123, mean loss: 0.34093022531439243
Epoch: 56, step: 111, loss: 0.34106677770614624, mean loss: 0.34093022700072406
Epoch: 56, step: 112, loss: 0.32092079520225525, mean loss: 0.3409299799005376
Epoch: 56, step: 113, loss: 0.36015576124191284, mean loss: 0.3409302173203472
Epoch: 56, step: 114, loss: 0.32859981060028076, mean loss: 0.34093006505362716
Epoch: 56, step: 115, loss: 0.33291691541671753, mean loss: 0.34092996610142123
Epoch: 56, step: 116, loss: 0.328530490398407, mean loss: 0.3409298129855582
Epoch: 56, step: 117, loss: 0.3603011667728424, mean loss: 0.3409300521912309
Epoch: 56, step: 118, loss: 0.3639101982116699, mean loss: 0.34093033595629296
Epoch: 56, step: 119, loss: 0.3202363848686218, mean loss: 0.34093008042494
Epoch: 56, step: 120, loss: 0.36748379468917847, mean loss: 0.3409304083092922
Epoch: 56, step: 121, loss: 0.3357933461666107, mean loss: 0.3409303448778085
Epoch: 56, step: 122, loss: 0.3441876471042633, mean loss: 0.34093038509787127
Epoch: 56, step: 123, loss: 0.31073442101478577, mean loss: 0.34093001225295494
Epoch: 56, step: 124, loss: 0.32575473189353943, mean loss: 0.34092982487836876
Epoch: 56, step: 125, loss: 0.3561200201511383, mean loss: 0.34093001243479887
Epoch: 56, step: 126, loss: 0.3431817889213562, mean loss: 0.34093004023759776
Epoch: 56, step: 127, loss: 0.2939437925815582, mean loss: 0.340929460103169
Epoch: 56, step: 128, loss: 0.36033445596694946, mean loss: 0.3409296996917243
Epoch: 56, step: 129, loss: 0.3526988625526428, mean loss: 0.3409298450007949
Epoch: 56, step: 130, loss: 0.4036605656147003, mean loss: 0.3409306195019445
Epoch: 56, step: 131, loss: 0.31396931409835815, mean loss: 0.34093028662988406
Epoch: 56, step: 132, loss: 0.3511495590209961, mean loss: 0.34093041279841363
Epoch: 56, step: 133, loss: 0.29054638743400574, mean loss: 0.34092979075805013
Epoch: 56, step: 134, loss: 0.33823126554489136, mean loss: 0.34092975744251275
Epoch: 56, step: 135, loss: 0.34811267256736755, mean loss: 0.3409298461204773
Epoch: 56, step: 136, loss: 0.3600391149520874, mean loss: 0.3409300820344639
Epoch: 56, step: 137, loss: 0.3092852532863617, mean loss: 0.3409296913672119
Epoch: 56, step: 138, loss: 0.29128047823905945, mean loss: 0.34092907843666453
Epoch: 56, step: 139, loss: 0.35132211446762085, mean loss: 0.3409292067394154
Epoch: 56, step: 140, loss: 0.363100528717041, mean loss: 0.34092948044254456
Epoch: 56, step: 141, loss: 0.35304102301597595, mean loss: 0.3409296299566864
Epoch: 56, step: 142, loss: 0.3228423595428467, mean loss: 0.3409294066763475
Epoch: 56, step: 143, loss: 0.3223807215690613, mean loss: 0.34092917770284975
Epoch: 56, step: 144, loss: 0.3312043249607086, mean loss: 0.34092905765627785
Epoch: 56, step: 145, loss: 0.3624597191810608, mean loss: 0.34092932343410187
Epoch: 56, step: 146, loss: 0.3366093933582306, mean loss: 0.3409292701088735
Epoch: 56, step: 147, loss: 0.359112024307251, mean loss: 0.34092949455406923
Epoch: 56, step: 148, loss: 0.3226220905780792, mean loss: 0.34092926857300476
Epoch: 56, step: 149, loss: 0.29455068707466125, mean loss: 0.34092869609687104
Epoch: 56, step: 150, loss: 0.33401253819465637, mean loss: 0.3409286107280146
Epoch: 56, step: 151, loss: 0.33845189213752747, mean loss: 0.34092858015728056
Epoch: 56, step: 152, loss: 0.30823323130607605, mean loss: 0.3409281765956966
Epoch: 56, step: 153, loss: 0.3645959198474884, mean loss: 0.34092846872514004
Epoch: 56, step: 154, loss: 0.36347445845603943, mean loss: 0.34092874700541664
Epoch: 56, step: 155, loss: 0.32748812437057495, mean loss: 0.34092858111276503
Epoch: 56, step: 156, loss: 0.32563111186027527, mean loss: 0.34092839230407035
Epoch: 56, step: 157, loss: 0.2944487929344177, mean loss: 0.3409278186376665
Epoch: 56, step: 158, loss: 0.3720800578594208, mean loss: 0.3409282031240373
Epoch: 56, step: 159, loss: 0.3498336374759674, mean loss: 0.34092831303510507
Epoch: 56, step: 160, loss: 0.334455281496048, mean loss: 0.3409282331457926
Epoch: 56, step: 161, loss: 0.31532400846481323, mean loss: 0.3409279171456855
Epoch: 56, step: 162, loss: 0.29228851199150085, mean loss: 0.34092731685929756
Epoch: 56, step: 163, loss: 0.2953055202960968, mean loss: 0.34092675382187143
Epoch: 56, step: 164, loss: 0.3564704656600952, mean loss: 0.34092694565086895
Epoch: 56, step: 165, loss: 0.34295985102653503, mean loss: 0.3409269707391742
Epoch: 56, step: 166, loss: 0.3461766839027405, mean loss: 0.340927035525653
Epoch: 56, step: 167, loss: 0.3257288932800293, mean loss: 0.340926847968364
Epoch: 56, step: 168, loss: 0.35284218192100525, mean loss: 0.3409269950113459
Epoch: 56, step: 169, loss: 0.31875941157341003, mean loss: 0.3409267214523035
Epoch: 56, step: 170, loss: 0.3160598576068878, mean loss: 0.34092641458658074
Epoch: 56, step: 171, loss: 0.33055058121681213, mean loss: 0.34092628654677903
Epoch: 56, step: 172, loss: 0.3038221299648285, mean loss: 0.3409258286799209
Epoch: 56, step: 173, loss: 0.34240996837615967, mean loss: 0.3409258469940414
Epoch: 56, step: 174, loss: 0.33222222328186035, mean loss: 0.3409257395936081
Epoch: 56, step: 175, loss: 0.4101020395755768, mean loss: 0.3409265932004687
Epoch: 56, step: 176, loss: 0.33332014083862305, mean loss: 0.34092649934115843
Epoch: 56, step: 177, loss: 0.3547479510307312, mean loss: 0.3409266698879328
Epoch: 56, step: 178, loss: 0.3263860046863556, mean loss: 0.3409264904687948
Epoch: 56, step: 179, loss: 0.35624489188194275, mean loss: 0.3409266794821877
Epoch: 56, step: 180, loss: 0.31254494190216064, mean loss: 0.3409263292849197
Epoch: 56, step: 181, loss: 0.30417877435684204, mean loss: 0.3409258758688976
Epoch: 56, step: 182, loss: 0.317320317029953, mean loss: 0.3409255846112466
Epoch: 56, step: 183, loss: 0.31052377820014954, mean loss: 0.34092520950258987
Epoch: 56, step: 184, loss: 0.3116984963417053, mean loss: 0.34092484889711466
Epoch: 56, step: 185, loss: 0.3531356453895569, mean loss: 0.34092499955469013
Epoch: 56, step: 186, loss: 0.32109177112579346, mean loss: 0.3409247548540889
Epoch: 56, step: 187, loss: 0.33924439549446106, mean loss: 0.34092473412222096
Epoch: 56, step: 188, loss: 0.29002857208251953, mean loss: 0.3409241061854137
Epoch: 56, step: 189, loss: 0.30033206939697266, mean loss: 0.3409236053830253
Epoch: 56, step: 190, loss: 0.29414764046669006, mean loss: 0.34092302829382765
Epoch: 56, step: 191, loss: 0.3107660710811615, mean loss: 0.3409226562429343
Epoch: 56, step: 192, loss: 0.2911040484905243, mean loss: 0.3409220416308989
Epoch: 56, step: 193, loss: 0.3724842071533203, mean loss: 0.3409224310084498
Epoch: 56, step: 194, loss: 0.32744985818862915, mean loss: 0.34092226480145466
Epoch: 56, step: 195, loss: 0.3484412133693695, mean loss: 0.3409223575592707
Epoch: 56, step: 196, loss: 0.3918161392211914, mean loss: 0.3409229854047409
Epoch: 56, step: 197, loss: 0.33481717109680176, mean loss: 0.34092291008197184
Epoch: 56, step: 198, loss: 0.35460084676742554, mean loss: 0.34092307881415157
Epoch: 56, step: 199, loss: 0.3008061647415161, mean loss: 0.3409225839346234
Epoch: 56, step: 200, loss: 0.3467724323272705, mean loss: 0.3409226560970658
Epoch: 56, step: 201, loss: 0.3691665530204773, mean loss: 0.34092300450326474
Epoch: 56, step: 202, loss: 0.3179483115673065, mean loss: 0.3409227210995007
Epoch: 56, step: 203, loss: 0.3237874209880829, mean loss: 0.34092250973003174
Epoch: 56, step: 204, loss: 0.33821192383766174, mean loss: 0.3409224762944905
Epoch: 56, step: 205, loss: 0.35228869318962097, mean loss: 0.34092261649699324
Epoch: 56, step: 206, loss: 0.3475247025489807, mean loss: 0.3409226979328464
Epoch: 56, step: 207, loss: 0.35168665647506714, mean loss: 0.3409228307032054
Epoch: 56, step: 208, loss: 0.3345721364021301, mean loss: 0.3409227523701685
Epoch: 56, step: 209, loss: 0.3485129475593567, mean loss: 0.340922845990752
Epoch: 56, step: 210, loss: 0.3152011036872864, mean loss: 0.34092252873213585
Epoch: 56, step: 211, loss: 0.358313649892807, mean loss: 0.3409227432360724
Epoch: 56, step: 212, loss: 0.32974863052368164, mean loss: 0.34092260541507863
Epoch: 56, step: 213, loss: 0.33663320541381836, mean loss: 0.3409225525104682
Epoch: 56, step: 214, loss: 0.35735511779785156, mean loss: 0.34092275518397536
Epoch: 56, step: 215, loss: 0.3367333710193634, mean loss: 0.34092270351421505
Epoch: 56, step: 216, loss: 0.34206441044807434, mean loss: 0.3409227175952813
Epoch: 56, step: 217, loss: 0.35177022218704224, mean loss: 0.34092285137965506
Epoch: 56, step: 218, loss: 0.34171992540359497, mean loss: 0.34092286121000204
Epoch: 56, step: 219, loss: 0.3530648946762085, mean loss: 0.34092301095635724
Epoch: 56, step: 220, loss: 0.3480885922908783, mean loss: 0.3409230993275891
Epoch: 56, step: 221, loss: 0.32245513796806335, mean loss: 0.34092287156988293
Epoch: 56, step: 222, loss: 0.31157684326171875, mean loss: 0.3409225096619531
Epoch: 56, step: 223, loss: 0.30500879883766174, mean loss: 0.34092206676398024
Epoch: 56, step: 224, loss: 0.3264188766479492, mean loss: 0.3409218879087703
Epoch: 56, step: 225, loss: 0.31407812237739563, mean loss: 0.34092155687207615
Epoch: 56, step: 226, loss: 0.3254067003726959, mean loss: 0.34092136554558494
Epoch: 56, step: 227, loss: 0.35577619075775146, mean loss: 0.340921548730427
Epoch: 56, step: 228, loss: 0.3316880762577057, mean loss: 0.340921434867671
Epoch: 56, step: 229, loss: 0.3802788555622101, mean loss: 0.3409219201985302
Epoch: 56, step: 230, loss: 0.34703582525253296, mean loss: 0.3409219955904169
Epoch: 56, step: 231, loss: 0.3478943109512329, mean loss: 0.3409220815664868
Epoch: 56, step: 232, loss: 0.3210071623325348, mean loss: 0.340921835997363
Epoch: 56, step: 233, loss: 0.3185243010520935, mean loss: 0.3409215598187279
Epoch: 56, step: 234, loss: 0.29895442724227905, mean loss: 0.34092104233845594
Epoch: 56, step: 235, loss: 0.3280775845050812, mean loss: 0.3409208839727613
Epoch: 56, step: 236, loss: 0.3385534882545471, mean loss: 0.340920854782052
Epoch: 56, step: 237, loss: 0.33019572496414185, mean loss: 0.34092072253956945
Epoch: 56, step: 238, loss: 0.3176969289779663, mean loss: 0.34092043619019197
Epoch: 56, step: 239, loss: 0.36433836817741394, mean loss: 0.3409207249297361
Epoch: 56, step: 240, loss: 0.3005242645740509, mean loss: 0.34092022685365747
Epoch: 56, step: 241, loss: 0.34325075149536133, mean loss: 0.3409202555879637
Epoch: 56, step: 242, loss: 0.3591826856136322, mean loss: 0.34092048075262305
Epoch: 56, step: 243, loss: 0.30062180757522583, mean loss: 0.34091998390060874
Epoch: 56, step: 244, loss: 0.3206927478313446, mean loss: 0.3409197345172349
Epoch: 56, step: 245, loss: 0.32951924204826355, mean loss: 0.34091959396129273
Epoch: 56, step: 246, loss: 0.3323153257369995, mean loss: 0.3409194878811282
Epoch: 56, step: 247, loss: 0.34531188011169434, mean loss: 0.34091954203331565
Epoch: 56, step: 248, loss: 0.35883989930152893, mean loss: 0.3409197629640822
Epoch: 56, step: 249, loss: 0.35636386275291443, mean loss: 0.3409199533640106
Epoch: 56, step: 250, loss: 0.31475403904914856, mean loss: 0.3409196307860125
Epoch: 56, step: 251, loss: 0.331016480922699, mean loss: 0.3409195086997427
Epoch: 56, step: 252, loss: 0.29131245613098145, mean loss: 0.34091889715034407
Epoch: 56, step: 253, loss: 0.3268773853778839, mean loss: 0.340918724050517
Epoch: 56, step: 254, loss: 0.33234789967536926, mean loss: 0.3409186183930955
Epoch: 56, step: 255, loss: 0.31214210391044617, mean loss: 0.34091826365302547
Epoch: 56, step: 256, loss: 0.3378111720085144, mean loss: 0.34091822535108585
Epoch: 56, step: 257, loss: 0.34122681617736816, mean loss: 0.3409182291551196
Epoch: 56, step: 258, loss: 0.3002171218395233, mean loss: 0.34091772743418575
Epoch: 56, step: 259, loss: 0.3237482011318207, mean loss: 0.3409175157887257
Epoch: 56, step: 260, loss: 0.294972687959671, mean loss: 0.34091694944261997
Epoch: 56, step: 261, loss: 0.31979402899742126, mean loss: 0.3409166890708471
Epoch: 56, step: 262, loss: 0.30416494607925415, mean loss: 0.34091623605590765
Epoch: 56, step: 263, loss: 0.3011069595813751, mean loss: 0.3409157453587812
Epoch: 56, step: 264, loss: 0.3659956455230713, mean loss: 0.3409160544948505
Epoch: 56, step: 265, loss: 0.2918986976146698, mean loss: 0.3409154503119727
Epoch: 56, step: 266, loss: 0.35171273350715637, mean loss: 0.3409155833965297
Epoch: 56, step: 267, loss: 0.357555627822876, mean loss: 0.34091578849494253
Epoch: 56, step: 268, loss: 0.3287466764450073, mean loss: 0.3409156385052706
Epoch: 56, step: 269, loss: 0.357176810503006, mean loss: 0.3409158389289154
Epoch: 56, step: 270, loss: 0.29740476608276367, mean loss: 0.34091530264897646
Epoch: 56, step: 271, loss: 0.31926438212394714, mean loss: 0.3409150358017012
Epoch: 56, step: 272, loss: 0.3259469270706177, mean loss: 0.34091485132225613
Epoch: 56, step: 273, loss: 0.3582701086997986, mean loss: 0.34091506522027404
Epoch: 56, step: 274, loss: 0.3475702106952667, mean loss: 0.3409151472418108
Epoch: 56, step: 275, loss: 0.30745360255241394, mean loss: 0.34091473484909834
Epoch: 56, step: 276, loss: 0.3457394242286682, mean loss: 0.3409147943096593
Epoch: 56, step: 277, loss: 0.3282696306705475, mean loss: 0.34091463846972886
Epoch: 56, step: 278, loss: 0.35745173692703247, mean loss: 0.34091484227163976
Epoch: 56, step: 279, loss: 0.34864044189453125, mean loss: 0.3409149374801533
Epoch: 56, step: 280, loss: 0.3628024160861969, mean loss: 0.34091520721308327
Epoch: 56, step: 281, loss: 0.32154861092567444, mean loss: 0.3409149685494857
Epoch: 56, step: 282, loss: 0.31144365668296814, mean loss: 0.3409146053652415
Epoch: 56, step: 283, loss: 0.31260859966278076, mean loss: 0.3409142565457302
Epoch: 56, step: 284, loss: 0.33266276121139526, mean loss: 0.34091415486246446
Epoch: 56, step: 285, loss: 0.30316221714019775, mean loss: 0.3409136896506626
Epoch: 56, step: 286, loss: 0.4248518943786621, mean loss: 0.34091472399656997
Epoch: 56, step: 287, loss: 0.3017773926258087, mean loss: 0.3409142417246436
Epoch: 56, step: 288, loss: 0.3538905084133148, mean loss: 0.34091440162343584
Epoch: 56, step: 289, loss: 0.2987464368343353, mean loss: 0.34091388201916756
Epoch: 56, step: 290, loss: 0.31590890884399414, mean loss: 0.34091357390539545
Epoch: 56, step: 291, loss: 0.3421836793422699, mean loss: 0.3409135895555684
Epoch: 56, step: 292, loss: 0.29700812697410583, mean loss: 0.3409130485614141
Epoch: 56, step: 293, loss: 0.3524513244628906, mean loss: 0.3409131907319444
Epoch: 56, step: 294, loss: 0.3059752881526947, mean loss: 0.34091276024484407
Epoch: 56, step: 295, loss: 0.33406123518943787, mean loss: 0.3409126758248705
Epoch: 56, step: 296, loss: 0.3333313465118408, mean loss: 0.34091258241388106
Epoch: 56, step: 297, loss: 0.3655964434146881, mean loss: 0.34091288654464424
Epoch: 56, step: 298, loss: 0.32411330938339233, mean loss: 0.34091267955898374
Epoch: 56, step: 299, loss: 0.31787386536598206, mean loss: 0.3409123957038978
Epoch: 56, step: 300, loss: 0.39890116453170776, mean loss: 0.3409131101592521
Epoch: 56, step: 301, loss: 0.32338857650756836, mean loss: 0.3409128942494666
Epoch: 56, step: 302, loss: 0.31366756558418274, mean loss: 0.3409125585794447
Epoch: 56, step: 303, loss: 0.3029714524745941, mean loss: 0.3409120911402309
Epoch: 56, step: 304, loss: 0.3121299147605896, mean loss: 0.3409117365445555
Epoch: 56, step: 305, loss: 0.308795303106308, mean loss: 0.34091134087579317
Epoch: 56, step: 306, loss: 0.3131847679615021, mean loss: 0.34091099929354196
Epoch: 56, step: 307, loss: 0.343729168176651, mean loss: 0.3409110340120272
Epoch: 56, step: 308, loss: 0.3518775999546051, mean loss: 0.3409111691131808
Epoch: 56, step: 309, loss: 0.3489101827144623, mean loss: 0.34091126765475327
Epoch: 56, step: 310, loss: 0.33406591415405273, mean loss: 0.3409111833264071
Epoch: 56, step: 311, loss: 0.293085515499115, mean loss: 0.34091059416621405
Epoch: 56, step: 312, loss: 0.3274849057197571, mean loss: 0.340910428778377
Epoch: 56, step: 313, loss: 0.33301833271980286, mean loss: 0.3409103315587355
Epoch: 56, step: 314, loss: 0.32355761528015137, mean loss: 0.34091011780005065
Epoch: 56, step: 315, loss: 0.31636756658554077, mean loss: 0.3409098154774193
Epoch: 56, step: 316, loss: 0.2998661696910858, mean loss: 0.34090930989550006
Epoch: 56, step: 317, loss: 0.3389299213886261, mean loss: 0.3409092855133894
Epoch: 56, step: 318, loss: 0.3424097001552582, mean loss: 0.3409093039952716
Epoch: 56, step: 319, loss: 0.3284318149089813, mean loss: 0.34090915030132835
Epoch: 56, step: 320, loss: 0.33944982290267944, mean loss: 0.34090913232599546
Epoch: 56, step: 321, loss: 0.32315751910209656, mean loss: 0.34090891367237014
Epoch: 56, step: 322, loss: 0.32856354117393494, mean loss: 0.3409087616114183
Epoch: 56, step: 323, loss: 0.34065714478492737, mean loss: 0.3409087585122309
Epoch: 56, step: 324, loss: 0.3319823443889618, mean loss: 0.3409086485661283
Epoch: 56, step: 325, loss: 0.3491995334625244, mean loss: 0.3409087506831981
Epoch: 56, step: 326, loss: 0.35028398036956787, mean loss: 0.3409088661544903
Epoch: 56, step: 327, loss: 0.38005372881889343, mean loss: 0.34090934828158
Epoch: 56, step: 328, loss: 0.33839139342308044, mean loss: 0.34090931726961027
Epoch: 56, step: 329, loss: 0.34225401282310486, mean loss: 0.3409093338311241
Epoch: 56, step: 330, loss: 0.3368709981441498, mean loss: 0.34090928409486343
Epoch: 56, step: 331, loss: 0.3184729516506195, mean loss: 0.3409090077717386
Epoch: 56, step: 332, loss: 0.2884086072444916, mean loss: 0.34090836119119344
Epoch: 56, step: 333, loss: 0.320911705493927, mean loss: 0.34090811492089496
Epoch: 56, step: 334, loss: 0.31218016147613525, mean loss: 0.3409077611240077
Epoch: 56, step: 335, loss: 0.32865241169929504, mean loss: 0.34090761019605914
Epoch: 56, step: 336, loss: 0.3136257827281952, mean loss: 0.34090727421709993
Epoch: 56, step: 337, loss: 0.333855003118515, mean loss: 0.34090718736860975
Epoch: 56, step: 338, loss: 0.31841346621513367, mean loss: 0.3409069103625736
Epoch: 56, step: 339, loss: 0.31445184350013733, mean loss: 0.3409065845773061
Epoch: 56, step: 340, loss: 0.3395423889160156, mean loss: 0.34090656777790135
Epoch: 56, step: 341, loss: 0.2924189865589142, mean loss: 0.3409059706843218
Epoch: 56, step: 342, loss: 0.32962939143180847, mean loss: 0.340905831822164
Epoch: 56, step: 343, loss: 0.3268749415874481, mean loss: 0.34090565904497167
Epoch: 56, step: 344, loss: 0.31431838870048523, mean loss: 0.34090533165182135
Epoch: 56, step: 345, loss: 0.3039678633213043, mean loss: 0.3409048768129058
Epoch: 56, step: 346, loss: 0.40005752444267273, mean loss: 0.3409056051951155
Epoch: 56, step: 347, loss: 0.2966039776802063, mean loss: 0.3409050596891864
Epoch: 56, step: 348, loss: 0.3209664523601532, mean loss: 0.3409048141791408
Epoch: 56, step: 349, loss: 0.31185370683670044, mean loss: 0.34090445646855716
Epoch: 56, step: 350, loss: 0.3057333528995514, mean loss: 0.3409040234068867
Epoch: 56, step: 351, loss: 0.30610570311546326, mean loss: 0.34090359494057104
Epoch: 56, step: 352, loss: 0.30831971764564514, mean loss: 0.3409031937452881
Epoch: 56, step: 353, loss: 0.3285117447376251, mean loss: 0.34090304117505726
Epoch: 56, step: 354, loss: 0.30678361654281616, mean loss: 0.34090262108339603
Epoch: 56, step: 355, loss: 0.34026017785072327, mean loss: 0.3409026131734818
Epoch: 56, step: 356, loss: 0.3529229164123535, mean loss: 0.3409027611684983
Epoch: 56, step: 357, loss: 0.34616124629974365, mean loss: 0.3409028259106265
Epoch: 56, step: 358, loss: 0.32851219177246094, mean loss: 0.3409026733598202
Epoch: 56, step: 359, loss: 0.36627286672592163, mean loss: 0.34090298570830546
Epoch: 56, step: 360, loss: 0.3123178780078888, mean loss: 0.3409026337833107
Epoch: 56, step: 361, loss: 0.32234251499176025, mean loss: 0.3409024052835841
Epoch: 56, step: 362, loss: 0.3607640266418457, mean loss: 0.34090264980352647
Epoch: 56, step: 363, loss: 0.3017198145389557, mean loss: 0.3409021674226324
Epoch: 56, step: 364, loss: 0.4309021234512329, mean loss: 0.34090327540076865
Epoch: 56, step: 365, loss: 0.32569560408592224, mean loss: 0.3409030881833451
Epoch: 56, step: 366, loss: 0.3425474762916565, mean loss: 0.3409031084267018
Epoch: 56, step: 367, loss: 0.34305235743522644, mean loss: 0.3409031348848588
Epoch: 56, step: 368, loss: 0.2894851863384247, mean loss: 0.34090250191613247
Epoch: 56, step: 369, loss: 0.38645726442337036, mean loss: 0.340903062700564
Epoch: 56, step: 370, loss: 0.3421326279640198, mean loss: 0.3409030778364692
Epoch: 56, step: 371, loss: 0.3139212429523468, mean loss: 0.3409027456951171
Epoch: 56, step: 372, loss: 0.29217329621315, mean loss: 0.3409021458520716
Epoch: 56, step: 373, loss: 0.3645230829715729, mean loss: 0.340902436614241
Epoch: 56, step: 374, loss: 0.3140468895435333, mean loss: 0.3409021060396762
Epoch: 56, step: 375, loss: 0.3227463960647583, mean loss: 0.34090188255727866
Epoch: 56, step: 376, loss: 0.3150534927845001, mean loss: 0.34090156438800734
Epoch: 56, step: 377, loss: 0.3407142162322998, mean loss: 0.3409015620819568
Epoch: 56, step: 378, loss: 0.3338352143764496, mean loss: 0.34090147510403
Epoch: 56, step: 379, loss: 0.31942546367645264, mean loss: 0.3409012107643689
Epoch: 56, step: 380, loss: 0.3380744159221649, mean loss: 0.34090117597090663
Epoch: 56, step: 381, loss: 0.3551601469516754, mean loss: 0.3409013514745743
Epoch: 56, step: 382, loss: 0.3208964765071869, mean loss: 0.34090110525163725
Epoch: 56, step: 383, loss: 0.3194071650505066, mean loss: 0.34090084070432286
Epoch: 56, step: 384, loss: 0.354638934135437, mean loss: 0.34090100979063076
Epoch: 56, step: 385, loss: 0.3127453625202179, mean loss: 0.34090066325958746
Epoch: 56, step: 386, loss: 0.3738344609737396, mean loss: 0.3409010685936475
Epoch: 56, step: 387, loss: 0.3857186436653137, mean loss: 0.3409016201809939
Epoch: 56, step: 388, loss: 0.31798720359802246, mean loss: 0.340901338167818
Epoch: 56, step: 389, loss: 0.32323160767555237, mean loss: 0.3409011207049178
Epoch: 56, step: 390, loss: 0.3220753073692322, mean loss: 0.34090088901685756
Epoch: 56, step: 391, loss: 0.3308422565460205, mean loss: 0.34090076522744545
Epoch: 56, step: 392, loss: 0.3327697515487671, mean loss: 0.340900665162052
Epoch: 56, step: 393, loss: 0.32924747467041016, mean loss: 0.34090052175228935
Epoch: 56, step: 394, loss: 0.34052789211273193, mean loss: 0.34090051716658637
Epoch: 56, step: 395, loss: 0.3640316128730774, mean loss: 0.34090080182196053
Epoch: 56, step: 396, loss: 0.31395015120506287, mean loss: 0.3409004701665463
Epoch: 56, step: 397, loss: 0.31382450461387634, mean loss: 0.34090013697310345
Epoch: 56, step: 398, loss: 0.2943984866142273, mean loss: 0.3408995647366569
Epoch: 56, step: 399, loss: 0.3613031208515167, mean loss: 0.34089981581408496
Epoch: 56, step: 400, loss: 0.30367881059646606, mean loss: 0.3408993577939629
Epoch: 56, step: 401, loss: 0.31947246193885803, mean loss: 0.3408990941302431
Epoch: 56, step: 402, loss: 0.34273168444633484, mean loss: 0.3408991166804826
Epoch: 56, step: 403, loss: 0.331563264131546, mean loss: 0.34089900180313176
Epoch: 56, step: 404, loss: 0.33525118231773376, mean loss: 0.34089893230775853
Epoch: 56, step: 405, loss: 0.3197944164276123, mean loss: 0.340898672623793
Epoch: 56, step: 406, loss: 0.3404650390148163, mean loss: 0.340898667288143
Epoch: 56, step: 407, loss: 0.31720206141471863, mean loss: 0.3408983757165578
Epoch: 56, step: 408, loss: 0.2884010672569275, mean loss: 0.3408977297786884
Epoch: 56, step: 409, loss: 0.3368076682090759, mean loss: 0.3408976794543341
Epoch: 56, step: 410, loss: 0.3690427839756012, mean loss: 0.34089802574906825
Epoch: 56, step: 411, loss: 0.34332165122032166, mean loss: 0.3408980555687625
Epoch: 56, step: 412, loss: 0.3567151725292206, mean loss: 0.34089825017630165
Epoch: 56, step: 413, loss: 0.3474477231502533, mean loss: 0.3408983307574303
Epoch: 56, step: 414, loss: 0.32559865713119507, mean loss: 0.34089814252094086
Epoch: 56, step: 415, loss: 0.3484515845775604, mean loss: 0.34089823545206854
Epoch: 56, step: 416, loss: 0.33586105704307556, mean loss: 0.34089817347967144
Epoch: 56, step: 417, loss: 0.36927589774131775, mean loss: 0.3408985226064678
Epoch: 56, step: 418, loss: 0.36386415362358093, mean loss: 0.34089880514563364
Epoch: 56, step: 419, loss: 0.33233654499053955, mean loss: 0.34089869980804993
Epoch: 56, step: 420, loss: 0.25902673602104187, mean loss: 0.3408976925869909
Epoch: 56, step: 421, loss: 0.31509220600128174, mean loss: 0.3408973751216637
Epoch: 56, step: 422, loss: 0.34312495589256287, mean loss: 0.3408974025255631
Epoch: 56, step: 423, loss: 0.3332783877849579, mean loss: 0.34089730879691016
Epoch: 56, step: 424, loss: 0.30996495485305786, mean loss: 0.34089692827366663
Epoch: 56, step: 425, loss: 0.3812348544597626, mean loss: 0.3408974244961563
Epoch: 56, step: 426, loss: 0.3094945549964905, mean loss: 0.3408970381942348
Epoch: 56, step: 427, loss: 0.31460240483283997, mean loss: 0.34089671473518146
Epoch: 56, step: 428, loss: 0.3863060772418976, mean loss: 0.3408972733240207
Epoch: 56, step: 429, loss: 0.4131048023700714, mean loss: 0.3408981615510614
Epoch: 56, step: 430, loss: 0.3294055163860321, mean loss: 0.34089802018141796
Epoch: 56, step: 431, loss: 0.3483244776725769, mean loss: 0.3408981115322531
Epoch: 56, step: 432, loss: 0.3383510708808899, mean loss: 0.3408980802021837
Epoch: 56, step: 433, loss: 0.37289872765541077, mean loss: 0.3408984738237667
Epoch: 56, step: 434, loss: 0.36193522810935974, mean loss: 0.34089873258161474
Epoch: 56, step: 435, loss: 0.33280834555625916, mean loss: 0.3408986330688592
Epoch: 56, step: 436, loss: 0.3288952112197876, mean loss: 0.34089848542711004
Epoch: 56, step: 437, loss: 0.3319939076900482, mean loss: 0.34089837590240296
Epoch: 56, step: 438, loss: 0.3289954960346222, mean loss: 0.3408982295009188
Epoch: 56, step: 439, loss: 0.3265344798564911, mean loss: 0.34089805283372354
Epoch: 56, step: 440, loss: 0.318429559469223, mean loss: 0.3408977764854871
Epoch: 56, step: 441, loss: 0.36211687326431274, mean loss: 0.34089803746372704
Epoch: 56, step: 442, loss: 0.341096431016922, mean loss: 0.34089803990378204
Epoch: 56, step: 443, loss: 0.3195456564426422, mean loss: 0.3408977772926803
Epoch: 56, step: 444, loss: 0.33395737409591675, mean loss: 0.34089769193431657
Epoch: 56, step: 445, loss: 0.3237324655056, mean loss: 0.3408974808258867
Epoch: 56, step: 446, loss: 0.3276469111442566, mean loss: 0.3408973178642987
Epoch: 56, step: 447, loss: 0.354402631521225, mean loss: 0.34089748395680236
Epoch: 56, step: 448, loss: 0.3127252757549286, mean loss: 0.34089713749057676
Epoch: 56, step: 449, loss: 0.34139055013656616, mean loss: 0.3408971435585681
Epoch: 56, step: 450, loss: 0.34642159938812256, mean loss: 0.34089721149751945
Epoch: 56, step: 451, loss: 0.3286300003528595, mean loss: 0.3408970606390027
Epoch: 56, step: 452, loss: 0.3493283689022064, mean loss: 0.3408971643234508
Epoch: 56, step: 453, loss: 0.32701408863067627, mean loss: 0.3408969935977112
Epoch: 56, step: 454, loss: 0.34664589166641235, mean loss: 0.3408970642933428
Epoch: 56, step: 455, loss: 0.31917646527290344, mean loss: 0.3408967971930105
Epoch: 56, step: 456, loss: 0.3022030293941498, mean loss: 0.3408963213778115
Epoch: 56, step: 457, loss: 0.33272647857666016, mean loss: 0.34089622091492566
Epoch: 56, step: 458, loss: 0.3162693977355957, mean loss: 0.34089591808764214
Epoch: 56, step: 459, loss: 0.3020652234554291, mean loss: 0.34089544060627586
Epoch: 56, step: 460, loss: 0.3242315948009491, mean loss: 0.3408952357019315
Epoch: 56, step: 461, loss: 0.33832162618637085, mean loss: 0.3408952040563382
Epoch: 56, step: 462, loss: 0.3023143708705902, mean loss: 0.34089472966489154
Epoch: 56, step: 463, loss: 0.3443107604980469, mean loss: 0.34089477166802495
Epoch: 56, step: 464, loss: 0.3769484758377075, mean loss: 0.3408952149748917
Epoch: 56, step: 465, loss: 0.29881998896598816, mean loss: 0.3408946976353367
Epoch: 56, step: 466, loss: 0.32272326946258545, mean loss: 0.3408944742097281
Epoch: 56, step: 467, loss: 0.29637378454208374, mean loss: 0.34089392681522573
Epoch: 56, step: 468, loss: 0.3441435992717743, mean loss: 0.3408939667703787
Epoch: 56, step: 469, loss: 0.3070317208766937, mean loss: 0.34089355043470243
Epoch: 56, step: 470, loss: 0.33461856842041016, mean loss: 0.34089347328486513
Epoch: 56, step: 471, loss: 0.3336343467235565, mean loss: 0.34089338403623526
Epoch: 56, step: 472, loss: 0.31221580505371094, mean loss: 0.34089303145894595
Epoch: 56, step: 473, loss: 0.3514036238193512, mean loss: 0.3408931606801262
Epoch: 56, step: 474, loss: 0.36743634939193726, mean loss: 0.34089348700807115
Epoch: 56, step: 475, loss: 0.33508095145225525, mean loss: 0.3408934155483274
Epoch: 56, step: 476, loss: 0.3008722960948944, mean loss: 0.3408929235317619
Epoch: 56, step: 477, loss: 0.3149643540382385, mean loss: 0.3408926047718409
Epoch: 56, step: 478, loss: 0.3614032566547394, mean loss: 0.3408928569220184
Epoch: 56, step: 479, loss: 0.3446216285228729, mean loss: 0.3408929027615591
Epoch: 56, step: 480, loss: 0.3087347149848938, mean loss: 0.34089250743071176
Epoch: 56, step: 481, loss: 0.3495340645313263, mean loss: 0.3408926136628203
Epoch: 56, step: 482, loss: 0.31143006682395935, mean loss: 0.3408922514792507
Epoch: 56, step: 483, loss: 0.4028998613357544, mean loss: 0.34089301373044134
Epoch: 56, step: 484, loss: 0.3485287129878998, mean loss: 0.34089310759390934
Epoch: 56, step: 485, loss: 0.34642332792282104, mean loss: 0.3408931755744911
Epoch: 56, step: 486, loss: 0.2910049259662628, mean loss: 0.34089256232757825
Epoch: 56, step: 487, loss: 0.32506468892097473, mean loss: 0.34089236776723053
Epoch: 56, step: 488, loss: 0.30132830142974854, mean loss: 0.34089188144138716
Epoch: 56, step: 489, loss: 0.3371412456035614, mean loss: 0.3408918353387267
Epoch: 56, step: 490, loss: 0.3107759356498718, mean loss: 0.3408914651598847
Epoch: 56, step: 491, loss: 0.2945944666862488, mean loss: 0.34089089609308604
Epoch: 56, step: 492, loss: 0.31705808639526367, mean loss: 0.34089060315197833
Epoch: 56, step: 493, loss: 0.359042763710022, mean loss: 0.3408908262666144
Epoch: 56, step: 494, loss: 0.3419288992881775, mean loss: 0.3408908390257808
Epoch: 56, step: 495, loss: 0.3191128373146057, mean loss: 0.34089057135122686
Epoch: 56, step: 496, loss: 0.3624562919139862, mean loss: 0.34089083641336426
Epoch: 56, step: 497, loss: 0.3569257855415344, mean loss: 0.34089103349491495
Epoch: 56, step: 498, loss: 0.3556254506111145, mean loss: 0.34089121458972604
Epoch: 56, step: 499, loss: 0.3279363512992859, mean loss: 0.34089105536865416
Epoch: 56, step: 500, loss: 0.3128476142883301, mean loss: 0.34089071070643967
Epoch: 56, step: 501, loss: 0.3427871763706207, mean loss: 0.3408907340142791
Epoch: 56, step: 502, loss: 0.3055848479270935, mean loss: 0.34089030010512567
Epoch: 56, step: 503, loss: 0.34062838554382324, mean loss: 0.3408902968862367
Epoch: 56, step: 504, loss: 0.31156694889068604, mean loss: 0.3408899365113028
Epoch: 56, step: 505, loss: 0.29581156373023987, mean loss: 0.3408893825187652
Epoch: 56, step: 506, loss: 0.3258865475654602, mean loss: 0.34088919814306684
Epoch: 56, step: 507, loss: 0.33521565794944763, mean loss: 0.34088912841957236
Epoch: 56, step: 508, loss: 0.344513863325119, mean loss: 0.34088917296426047
Epoch: 56, step: 509, loss: 0.3659132421016693, mean loss: 0.34088948048348205
Epoch: 56, step: 510, loss: 0.3251669108867645, mean loss: 0.3408892872721813
Epoch: 56, step: 511, loss: 0.3762674629688263, mean loss: 0.34088972202168605
Epoch: 56, step: 512, loss: 0.33393144607543945, mean loss: 0.3408896365150202
Epoch: 56, step: 513, loss: 0.3393453359603882, mean loss: 0.34088961753814
Epoch: 56, step: 514, loss: 0.3333222568035126, mean loss: 0.3408895245490306
Epoch: 56, step: 515, loss: 0.2960997223854065, mean loss: 0.34088897417053265
Epoch: 56, step: 516, loss: 0.32106906175613403, mean loss: 0.3408887306258181
Epoch: 56, step: 517, loss: 0.2994854748249054, mean loss: 0.3408882218738115
Epoch: 56, step: 518, loss: 0.3196171522140503, mean loss: 0.34088796050387354
Epoch: 56, step: 519, loss: 0.3615119755268097, mean loss: 0.340888213919963
Epoch: 56, step: 520, loss: 0.3252176344394684, mean loss: 0.3408880213712196
Epoch: 56, step: 521, loss: 0.3253309726715088, mean loss: 0.34088783021980906
Epoch: 56, step: 522, loss: 0.3506394922733307, mean loss: 0.3408879500382328
Epoch: 56, step: 523, loss: 0.32709017395973206, mean loss: 0.34088778050739194
Epoch: 56, step: 524, loss: 0.4150684177875519, mean loss: 0.3408886919405989
Epoch: 56, step: 525, loss: 0.3095480799674988, mean loss: 0.34088830687349025
Epoch: 56, step: 526, loss: 0.35537347197532654, mean loss: 0.34088848484359874
Epoch: 56, step: 527, loss: 0.29244381189346313, mean loss: 0.3408878896416999
Epoch: 56, step: 528, loss: 0.30546578764915466, mean loss: 0.34088745444331686
Epoch: 56, step: 529, loss: 0.34420114755630493, mean loss: 0.3408874951550783
Epoch: 56, step: 530, loss: 0.36849868297576904, mean loss: 0.3408878343796968
Epoch: 56, step: 531, loss: 0.2938551604747772, mean loss: 0.34088725655432567
Epoch: 56, step: 532, loss: 0.3199639618396759, mean loss: 0.34088699950191936
Epoch: 56, step: 533, loss: 0.3175967037677765, mean loss: 0.34088671337331994
Epoch: 56, step: 534, loss: 0.329293817281723, mean loss: 0.3408865709526994
Epoch: 56, step: 535, loss: 0.32923632860183716, mean loss: 0.34088642782932904
Epoch: 56, step: 536, loss: 0.33397090435028076, mean loss: 0.34088634287308184
Epoch: 56, step: 537, loss: 0.3002249002456665, mean loss: 0.3408858433590327
Epoch: 56, step: 538, loss: 0.37250572443008423, mean loss: 0.3408862317953443
Epoch: 56, step: 539, loss: 0.30427679419517517, mean loss: 0.34088578207005316
Epoch: 56, step: 540, loss: 0.3168453872203827, mean loss: 0.34088548675164704
Epoch: 56, step: 541, loss: 0.3236062824726105, mean loss: 0.34088527449205586
Epoch: 56, step: 542, loss: 0.34587743878364563, mean loss: 0.340885335815582
Epoch: 56, step: 543, loss: 0.31174054741859436, mean loss: 0.34088497780668364
Epoch: 56, step: 544, loss: 0.35988685488700867, mean loss: 0.34088521121916976
Epoch: 56, step: 545, loss: 0.35301321744918823, mean loss: 0.34088536019357374
Epoch: 56, step: 546, loss: 0.3137855529785156, mean loss: 0.34088502731709247
Epoch: 56, step: 547, loss: 0.3179375231266022, mean loss: 0.34088474544827474
Epoch: 56, step: 548, loss: 0.34267428517341614, mean loss: 0.34088476742928175
Epoch: 56, step: 549, loss: 0.3767588436603546, mean loss: 0.3408852080669636
Epoch: 56, step: 550, loss: 0.3669280707836151, mean loss: 0.34088552794490645
Epoch: 56, step: 551, loss: 0.3347461521625519, mean loss: 0.34088545253742164
Epoch: 56, step: 552, loss: 0.34968137741088867, mean loss: 0.3408855605729041
Epoch: 56, step: 553, loss: 0.3472902476787567, mean loss: 0.3408856392371688
Epoch: 56, step: 554, loss: 0.311951220035553, mean loss: 0.34088528386042377
Epoch: 56, step: 555, loss: 0.31924349069595337, mean loss: 0.3408850180560371
Epoch: 56, step: 556, loss: 0.3201276361942291, mean loss: 0.3408847631171164
Epoch: 56, step: 557, loss: 0.3360663056373596, mean loss: 0.34088470393830134
Epoch: 56, step: 558, loss: 0.3110641837120056, mean loss: 0.3408843376963276
Epoch: 56, step: 559, loss: 0.30549484491348267, mean loss: 0.3408839030641211
Epoch: 56, step: 560, loss: 0.35937124490737915, mean loss: 0.34088413011161073
Epoch: 56, step: 561, loss: 0.35260698199272156, mean loss: 0.3408842740810048
Epoch: 56, step: 562, loss: 0.3221830427646637, mean loss: 0.34088404441232834
Epoch: 56, step: 563, loss: 0.3324127495288849, mean loss: 0.34088394037815234
Epoch: 56, step: 564, loss: 0.307598739862442, mean loss: 0.3408835316146834
Epoch: 56, step: 565, loss: 0.32375791668891907, mean loss: 0.3408833213038038
Epoch: 56, step: 566, loss: 0.3482145071029663, mean loss: 0.340883411333225
Epoch: 56, step: 567, loss: 0.3427388668060303, mean loss: 0.34088343411856087
Epoch: 56, step: 568, loss: 0.3057924211025238, mean loss: 0.3408830031997317
Epoch: 56, step: 569, loss: 0.36008015275001526, mean loss: 0.34088323893848393
Epoch: 56, step: 570, loss: 0.30472439527511597, mean loss: 0.3408827949175634
Epoch: 56, step: 571, loss: 0.33454421162605286, mean loss: 0.3408827170824132
Epoch: 56, step: 572, loss: 0.2999425530433655, mean loss: 0.340882214360505
Epoch: 56, step: 573, loss: 0.30731382966041565, mean loss: 0.340881802164912
Epoch: 56, step: 574, loss: 0.29892751574516296, mean loss: 0.34088128700281006
Epoch: 56, step: 575, loss: 0.316698282957077, mean loss: 0.340880990060226
Epoch: 56, step: 576, loss: 0.2890341281890869, mean loss: 0.34088035344154655
Epoch: 56, step: 577, loss: 0.3490966856479645, mean loss: 0.34088045432723457
Epoch: 56, step: 578, loss: 0.32407012581825256, mean loss: 0.34088024792117744
Epoch: 56, step: 579, loss: 0.4060501456260681, mean loss: 0.3408810481016414
Epoch: 56, step: 580, loss: 0.3426803648471832, mean loss: 0.34088107019405645
Epoch: 56, step: 581, loss: 0.2950652837753296, mean loss: 0.3408805076644489
Epoch: 56, step: 582, loss: 0.34812137484550476, mean loss: 0.34088059656725905
Epoch: 56, step: 583, loss: 0.3352205753326416, mean loss: 0.340880527074807
Epoch: 56, step: 584, loss: 0.3277676999568939, mean loss: 0.3408803660804778
Epoch: 56, step: 585, loss: 0.34645190834999084, mean loss: 0.34088043448492555
Epoch: 56, step: 586, loss: 0.3136139512062073, mean loss: 0.34088009972558214
Epoch: 56, step: 587, loss: 0.3241853713989258, mean loss: 0.3408798947615748
Epoch: 56, step: 588, loss: 0.29711201786994934, mean loss: 0.340879357422534
Epoch: 56, step: 589, loss: 0.31831812858581543, mean loss: 0.3408790804413073
Epoch: 56, step: 590, loss: 0.28070393204689026, mean loss: 0.34087834168802766
Epoch: 56, step: 591, loss: 0.4159574806690216, mean loss: 0.34087926340206937
Epoch: 56, step: 592, loss: 0.3543780446052551, mean loss: 0.34087942911871993
Epoch: 56, step: 593, loss: 0.37078922986984253, mean loss: 0.3408797962993621
Epoch: 56, step: 594, loss: 0.34247201681137085, mean loss: 0.3408798158456432
Epoch: 56, step: 595, loss: 0.31593847274780273, mean loss: 0.3408795096666216
Epoch: 56, step: 596, loss: 0.3109605014324188, mean loss: 0.34087914238647243
Epoch: 56, step: 597, loss: 0.32543227076530457, mean loss: 0.34087895276589325
Epoch: 56, step: 598, loss: 0.3176758289337158, mean loss: 0.3408786679356779
Epoch: 56, step: 599, loss: 0.36938247084617615, mean loss: 0.3408790178301455
Epoch: 56, step: 600, loss: 0.3132982552051544, mean loss: 0.3408786792704865
Epoch: 56, step: 601, loss: 0.3298640847206116, mean loss: 0.34087854406568263
Epoch: 56, step: 602, loss: 0.35058826208114624, mean loss: 0.34087866325158633
Epoch: 56, step: 603, loss: 0.31102046370506287, mean loss: 0.340878296749407
Epoch: 56, step: 604, loss: 0.297291100025177, mean loss: 0.34087776173367434
Epoch: 56, step: 605, loss: 0.2972085773944855, mean loss: 0.34087722571815526
Epoch: 56, step: 606, loss: 0.3418125808238983, mean loss: 0.3408772371989902
Epoch: 56, step: 607, loss: 0.3304942846298218, mean loss: 0.34087710975701546
Epoch: 56, step: 608, loss: 0.38360631465911865, mean loss: 0.34087763421548517
Epoch: 56, step: 609, loss: 0.32937803864479065, mean loss: 0.34087749307112536
Epoch: 56, step: 610, loss: 0.3083319365978241, mean loss: 0.34087709361661206
Epoch: 56, step: 611, loss: 0.38495805859565735, mean loss: 0.34087763464666976
Epoch: 56, step: 612, loss: 0.32829755544662476, mean loss: 0.34087748024629666
Epoch: 56, step: 613, loss: 0.30617162585258484, mean loss: 0.34087705429261106
Epoch: 56, step: 614, loss: 0.3292604982852936, mean loss: 0.3408769117214454
Epoch: 56, step: 615, loss: 0.348965048789978, mean loss: 0.3408770109867506
Epoch: 56, step: 616, loss: 0.35278311371803284, mean loss: 0.34087715710796573
Epoch: 56, step: 617, loss: 0.3210600018501282, mean loss: 0.3408769138989716
Epoch: 56, step: 618, loss: 0.35420888662338257, mean loss: 0.34087707751558766
Epoch: 56, step: 619, loss: 0.32354581356048584, mean loss: 0.34087686482028606
Epoch: 56, step: 620, loss: 0.3140568435192108, mean loss: 0.34087653567969206
Epoch: 56, step: 621, loss: 0.313583642244339, mean loss: 0.3408762007400284
Epoch: 56, step: 622, loss: 0.35719016194343567, mean loss: 0.34087640094326577
Epoch: 56, step: 623, loss: 0.31984657049179077, mean loss: 0.34087614287053786
Epoch: 56, step: 624, loss: 0.3396168649196625, mean loss: 0.3408761274171889
Epoch: 56, step: 625, loss: 0.35576125979423523, mean loss: 0.3408763100792625
Epoch: 56, step: 626, loss: 0.28850412368774414, mean loss: 0.3408756674047783
Epoch: 56, step: 627, loss: 0.34092316031455994, mean loss: 0.34087566798757063
Epoch: 56, step: 628, loss: 0.3213061988353729, mean loss: 0.34087542785075947
Epoch: 56, step: 629, loss: 0.33746328949928284, mean loss: 0.3408753859809488
Epoch: 56, step: 630, loss: 0.3623594641685486, mean loss: 0.3408756496054434
Epoch: 56, step: 631, loss: 0.32283881306648254, mean loss: 0.3408754282837032
Epoch: 56, step: 632, loss: 0.3689900040626526, mean loss: 0.3408757732605217
Epoch: 56, step: 633, loss: 0.3739627003669739, mean loss: 0.34087617924505026
Epoch: 56, step: 634, loss: 0.2977673411369324, mean loss: 0.3408756502957612
Epoch: 56, step: 635, loss: 0.29870250821113586, mean loss: 0.34087513283389514
Epoch: 56, step: 636, loss: 0.33222097158432007, mean loss: 0.3408750266491704
Epoch: 56, step: 637, loss: 0.381645530462265, mean loss: 0.3408755268884751
Epoch: 56, step: 638, loss: 0.3267858922481537, mean loss: 0.34087535401588587
Epoch: 56, step: 639, loss: 0.3152901232242584, mean loss: 0.34087504010208053
Epoch: 56, step: 640, loss: 0.3176882266998291, mean loss: 0.3408747556187556
Epoch: 56, step: 641, loss: 0.31487536430358887, mean loss: 0.34087443663130296
Epoch: 56, step: 642, loss: 0.32870832085609436, mean loss: 0.34087428736662906
Epoch: 56, step: 643, loss: 0.288318932056427, mean loss: 0.3408736425789357
Epoch: 56, step: 644, loss: 0.33119067549705505, mean loss: 0.3408735237826423
Epoch: 56, step: 645, loss: 0.33731982111930847, mean loss: 0.34087348018427815
Epoch: 56, step: 646, loss: 0.3592258393764496, mean loss: 0.3408737053362109
Epoch: 56, step: 647, loss: 0.2926962077617645, mean loss: 0.3408731142882968
Epoch: 56, step: 648, loss: 0.32958415150642395, mean loss: 0.3408729757955069
Epoch: 56, step: 649, loss: 0.35602712631225586, mean loss: 0.34087316170406884
Epoch: 56, step: 650, loss: 0.3048384189605713, mean loss: 0.34087271964134735
Epoch: 56, step: 651, loss: 0.32946857810020447, mean loss: 0.34087257974069546
Epoch: 56, step: 652, loss: 0.3225894570350647, mean loss: 0.3408723554546851
Epoch: 56, step: 653, loss: 0.3123025894165039, mean loss: 0.3408720049828134
Epoch: 56, step: 654, loss: 0.36063113808631897, mean loss: 0.340872247369657
Epoch: 56, step: 655, loss: 0.3356146216392517, mean loss: 0.3408721828747388
Epoch: 56, step: 656, loss: 0.31612858176231384, mean loss: 0.34087187935047986
Epoch: 56, step: 657, loss: 0.32426393032073975, mean loss: 0.340871675626957
Epoch: 56, step: 658, loss: 0.3623855412006378, mean loss: 0.3408719395262931
Epoch: 56, step: 659, loss: 0.3555622398853302, mean loss: 0.3408721197223134
Epoch: 56, step: 660, loss: 0.32031309604644775, mean loss: 0.3408718675417102
Epoch: 56, step: 661, loss: 0.3077431619167328, mean loss: 0.3408714611841602
Epoch: 56, step: 662, loss: 0.33821913599967957, mean loss: 0.34087142865107073
Epoch: 56, step: 663, loss: 0.40324968099594116, mean loss: 0.3408721937655387
Epoch: 56, step: 664, loss: 0.3339090347290039, mean loss: 0.34087210835839477
Epoch: 56, step: 665, loss: 0.32985103130340576, mean loss: 0.3408719731802143
Epoch: 56, step: 666, loss: 0.3575803339481354, mean loss: 0.34087217811282605
Epoch: 56, step: 667, loss: 0.3406324088573456, mean loss: 0.34087217517202667
Epoch: 56, step: 668, loss: 0.3188059628009796, mean loss: 0.3408719045305395
Epoch: 56, step: 669, loss: 0.36142176389694214, mean loss: 0.3408721565709075
Epoch: 56, step: 670, loss: 0.28785738348960876, mean loss: 0.34087150636212504
Epoch: 56, step: 671, loss: 0.31228533387184143, mean loss: 0.3408711557664067
Epoch: 56, step: 672, loss: 0.3262128531932831, mean loss: 0.340870975991549
Epoch: 56, step: 673, loss: 0.3451100289821625, mean loss: 0.340871027980229
Epoch: 56, step: 674, loss: 0.3445877134799957, mean loss: 0.34087107356192
Epoch: 56, step: 675, loss: 0.3329698145389557, mean loss: 0.340870976661515
Epoch: 56, step: 676, loss: 0.3384038805961609, mean loss: 0.3408709464056184
Epoch: 56, step: 677, loss: 0.3489375710487366, mean loss: 0.3408710453316276
Epoch: 56, step: 678, loss: 0.35604989528656006, mean loss: 0.3408712314769737
Epoch: 56, step: 679, loss: 0.3443630039691925, mean loss: 0.34087127429769
Epoch: 56, step: 680, loss: 0.3324723541736603, mean loss: 0.34087117130032507
Epoch: 56, step: 681, loss: 0.32666099071502686, mean loss: 0.3408709970406362
Epoch: 56, step: 682, loss: 0.38036978244781494, mean loss: 0.34087148140898094
Epoch: 56, step: 683, loss: 0.3093603551387787, mean loss: 0.3408710949969749
Epoch: 56, step: 684, loss: 0.3404051959514618, mean loss: 0.34087108928385706
Epoch: 56, step: 685, loss: 0.3185727596282959, mean loss: 0.3408708158524695
Epoch: 56, step: 686, loss: 0.2935497462749481, mean loss: 0.34087023558895857
Epoch: 56, step: 687, loss: 0.32881876826286316, mean loss: 0.3408700878124807
Epoch: 56, step: 688, loss: 0.32921257615089417, mean loss: 0.3408699448684852
Epoch: 56, step: 689, loss: 0.3092311918735504, mean loss: 0.3408695569199726
Epoch: 56, step: 690, loss: 0.3441493809223175, mean loss: 0.34086959713607223
Epoch: 56, step: 691, loss: 0.37143129110336304, mean loss: 0.3408699718686973
Epoch: 56, step: 692, loss: 0.3286776840686798, mean loss: 0.3408698223746281
Epoch: 56, step: 693, loss: 0.31199684739112854, mean loss: 0.3408694683569354
Epoch: 56, step: 694, loss: 0.31752249598503113, mean loss: 0.3408691820982469
Epoch: 56, step: 695, loss: 0.32385510206222534, mean loss: 0.3408689734901052
Epoch: 56, step: 696, loss: 0.39478832483291626, mean loss: 0.3408696345824329
Epoch: 56, step: 697, loss: 0.30694955587387085, mean loss: 0.3408692187015238
Epoch: 56, step: 698, loss: 0.32349497079849243, mean loss: 0.3408690056852309
Epoch: 56, step: 699, loss: 0.36606407165527344, mean loss: 0.34086931458457337
Epoch: 56, step: 700, loss: 0.327769011259079, mean loss: 0.3408691539727506
Epoch: 56, step: 701, loss: 0.3186612129211426, mean loss: 0.3408688817031646
Epoch: 56, step: 702, loss: 0.35700055956840515, mean loss: 0.34086907947527667
Epoch: 56, step: 703, loss: 0.3384559750556946, mean loss: 0.34086904989131706
Epoch: 56, step: 704, loss: 0.32638809084892273, mean loss: 0.3408688723611396
Epoch: 56, step: 705, loss: 0.35079848766326904, mean loss: 0.34086899409235577
Epoch: 56, step: 706, loss: 0.30601489543914795, mean loss: 0.34086856680693994
Epoch: 56, step: 707, loss: 0.3424549102783203, mean loss: 0.3408685862540967
Epoch: 56, step: 708, loss: 0.31321197748184204, mean loss: 0.3408682472128849
Epoch: 56, step: 709, loss: 0.32707399129867554, mean loss: 0.3408680781117508
Epoch: 56, step: 710, loss: 0.36307594180107117, mean loss: 0.3408683503503495
Epoch: 56, step: 711, loss: 0.31005001068115234, mean loss: 0.3408679725635045
Epoch: 56, step: 712, loss: 0.37380874156951904, mean loss: 0.34086837636321526
Epoch: 56, step: 713, loss: 0.3496687710285187, mean loss: 0.3408684842402736
Epoch: 56, step: 714, loss: 0.3714185953140259, mean loss: 0.3408688587252645
Epoch: 56, step: 715, loss: 0.36319032311439514, mean loss: 0.3408691323396846
Epoch: 56, step: 716, loss: 0.3214523494243622, mean loss: 0.34086889433349543
Epoch: 56, step: 717, loss: 0.29656267166137695, mean loss: 0.3408683512452815
Epoch: 56, step: 718, loss: 0.35139966011047363, mean loss: 0.34086848033233225
Epoch: 56, step: 719, loss: 0.315312922000885, mean loss: 0.3408681670900503
Epoch: 56, step: 720, loss: 0.334069162607193, mean loss: 0.34086808375359773
Epoch: 56, step: 721, loss: 0.3369815945625305, mean loss: 0.34086803611688077
Epoch: 56, step: 722, loss: 0.3839859962463379, mean loss: 0.3408685646074507
Epoch: 56, step: 723, loss: 0.34637829661369324, mean loss: 0.3408686321386073
Epoch: 56, step: 724, loss: 0.3504728376865387, mean loss: 0.3408687498530731
Epoch: 56, step: 725, loss: 0.3258586525917053, mean loss: 0.3408685658832574
Epoch: 56, step: 726, loss: 0.32289448380470276, mean loss: 0.3408683455883465
Epoch: 56, step: 727, loss: 0.30198201537132263, mean loss: 0.3408678689934571
Epoch: 56, step: 728, loss: 0.31645917892456055, mean loss: 0.3408675698416908
Epoch: 56, step: 729, loss: 0.31281694769859314, mean loss: 0.34086722605878833
Epoch: 56, step: 730, loss: 0.31547796726226807, mean loss: 0.3408669148968446
Epoch: 56, step: 731, loss: 0.3055400550365448, mean loss: 0.3408664819484175
Epoch: 56, step: 732, loss: 0.2903343141078949, mean loss: 0.34086586265888674
Epoch: 56, step: 733, loss: 0.3100859820842743, mean loss: 0.3408654854452225
Epoch: 56, step: 734, loss: 0.35307347774505615, mean loss: 0.3408656350548047
Epoch: 56, step: 735, loss: 0.34223076701164246, mean loss: 0.340865651784363
Epoch: 56, step: 736, loss: 0.3304730951786041, mean loss: 0.34086552442616147
Epoch: 56, step: 737, loss: 0.33926868438720703, mean loss: 0.340865504857523
Epoch: 56, step: 738, loss: 0.3512309789657593, mean loss: 0.340865631880722
Epoch: 56, step: 739, loss: 0.3245810568332672, mean loss: 0.34086543232463345
Epoch: 56, step: 740, loss: 0.3662370443344116, mean loss: 0.34086574323220054
Epoch: 56, step: 741, loss: 0.3353302478790283, mean loss: 0.3408656754002353
Epoch: 56, step: 742, loss: 0.3426692485809326, mean loss: 0.3408656975009519
Epoch: 56, step: 743, loss: 0.32221412658691406, mean loss: 0.3408654689501859
Epoch: 56, step: 744, loss: 0.32800042629241943, mean loss: 0.3408653113077364
Epoch: 56, step: 745, loss: 0.3339536488056183, mean loss: 0.34086522661636887
Epoch: 56, step: 746, loss: 0.32751187682151794, mean loss: 0.34086506299443314
Epoch: 56, step: 747, loss: 0.35186323523521423, mean loss: 0.3408651977561378
Epoch: 56, step: 748, loss: 0.37501072883605957, mean loss: 0.34086561613961935
Epoch: 56, step: 749, loss: 0.3567854166030884, mean loss: 0.34086581120174675
Epoch: 56, step: 750, loss: 0.34072986245155334, mean loss: 0.34086580953601436
Epoch: 56, step: 751, loss: 0.30310511589050293, mean loss: 0.34086534687313397
Epoch: 56, step: 752, loss: 0.3497212827205658, mean loss: 0.34086545537915414
Epoch: 56, step: 753, loss: 0.351166695356369, mean loss: 0.3408655815919991
Epoch: 56, step: 754, loss: 0.34792688488960266, mean loss: 0.3408656681074342
Epoch: 56, step: 755, loss: 0.3344269394874573, mean loss: 0.34086558922078114
Epoch: 56, step: 756, loss: 0.34004732966423035, mean loss: 0.3408655791956705
Epoch: 56, step: 757, loss: 0.35439327359199524, mean loss: 0.3408657449315554
Epoch: 56, step: 758, loss: 0.3416663408279419, mean loss: 0.340865754740015
Epoch: 56, step: 759, loss: 0.35806259512901306, mean loss: 0.3408659654236422
Epoch: 56, step: 760, loss: 0.2997913658618927, mean loss: 0.34086546221262154
Epoch: 56, step: 761, loss: 0.3906272053718567, mean loss: 0.3408660718436602
Epoch: 56, step: 762, loss: 0.3189586102962494, mean loss: 0.34086580345867057
Epoch: 56, step: 763, loss: 0.35704490542411804, mean loss: 0.34086600166396736
Epoch: 56, step: 764, loss: 0.3095640540122986, mean loss: 0.34086561819794853
Epoch: 56, step: 765, loss: 0.35710665583610535, mean loss: 0.34086581715712577
Epoch: 56, step: 766, loss: 0.3438097834587097, mean loss: 0.34086585322144325
Epoch: 56, step: 767, loss: 0.3186311423778534, mean loss: 0.3408655808440564
Epoch: 56, step: 768, loss: 0.34648755192756653, mean loss: 0.34086564971290945
Epoch: 56, step: 769, loss: 0.28192153573036194, mean loss: 0.34086492765942705
Epoch: 56, step: 770, loss: 0.28266188502311707, mean loss: 0.34086421469265255
Epoch: 56, step: 771, loss: 0.35615941882133484, mean loss: 0.3408644020512214
Epoch: 56, step: 772, loss: 0.3529622256755829, mean loss: 0.3408645502416697
Epoch: 56, step: 773, loss: 0.33735063672065735, mean loss: 0.3408645071990483
Epoch: 56, step: 774, loss: 0.32362839579582214, mean loss: 0.34086429607309865
Epoch: 56, step: 775, loss: 0.34140121936798096, mean loss: 0.3408643026498171
Epoch: 56, step: 776, loss: 0.29194048047065735, mean loss: 0.3408637033942693
Epoch: 56, step: 777, loss: 0.33966299891471863, mean loss: 0.34086368868732336
Epoch: 56, step: 778, loss: 0.3322902023792267, mean loss: 0.34086358367542635
Epoch: 56, step: 779, loss: 0.3405878245830536, mean loss: 0.34086358029784697
Epoch: 56, step: 780, loss: 0.30562731623649597, mean loss: 0.3408631487188885
Epoch: 56, step: 781, loss: 0.30758029222488403, mean loss: 0.340862741070547
Epoch: 56, step: 782, loss: 0.36238160729408264, mean loss: 0.3408630046303376
Epoch: 56, step: 783, loss: 0.36563748121261597, mean loss: 0.3408633080606308
Epoch: 56, step: 784, loss: 0.3750133216381073, mean loss: 0.3408637263145418
Epoch: 56, step: 785, loss: 0.3194511830806732, mean loss: 0.3408634640666149
Epoch: 56, step: 786, loss: 0.3757079839706421, mean loss: 0.34086389081607177
Epoch: 56, step: 787, loss: 0.32881850004196167, mean loss: 0.3408637432949973
Epoch: 56, step: 788, loss: 0.346727579832077, mean loss: 0.3408638151090952
Epoch: 56, step: 789, loss: 0.3441876769065857, mean loss: 0.3408638558157574
Epoch: 56, step: 790, loss: 0.3409029245376587, mean loss: 0.3408638562942183
Epoch: 56, step: 791, loss: 0.3078945577144623, mean loss: 0.3408634525357856
Epoch: 56, step: 792, loss: 0.32435718178749084, mean loss: 0.34086325039425763
Epoch: 56, step: 793, loss: 0.34744665026664734, mean loss: 0.3408633310158731
Epoch: 56, step: 794, loss: 0.33457526564598083, mean loss: 0.3408632540119253
Epoch: 56, step: 795, loss: 0.3447531759738922, mean loss: 0.3408633016475114
Epoch: 56, step: 796, loss: 0.3523997962474823, mean loss: 0.3408634429205132
Epoch: 56, step: 797, loss: 0.3228676915168762, mean loss: 0.34086322255178103
Epoch: 56, step: 798, loss: 0.32597821950912476, mean loss: 0.3408630402782539
Epoch: 56, step: 799, loss: 0.3660129904747009, mean loss: 0.34086334824688386
Epoch: 56, step: 800, loss: 0.34407636523246765, mean loss: 0.3408633875907519
Epoch: 56, step: 801, loss: 0.42222195863723755, mean loss: 0.34086438382628503
Epoch: 56, step: 802, loss: 0.40309134125709534, mean loss: 0.34086514578591903
Epoch: 56, step: 803, loss: 0.2972632944583893, mean loss: 0.3408646118944153
Epoch: 56, step: 804, loss: 0.3370196521282196, mean loss: 0.34086456481462046
Epoch: 56, step: 805, loss: 0.34107986092567444, mean loss: 0.3408645674507918
Epoch: 56, step: 806, loss: 0.3206760883331299, mean loss: 0.3408643202580414
Epoch: 56, step: 807, loss: 0.31360703706741333, mean loss: 0.3408639865171854
Epoch: 56, step: 808, loss: 0.32297247648239136, mean loss: 0.34086376745445923
Epoch: 56, step: 809, loss: 0.3837810456752777, mean loss: 0.3408642929249666
Epoch: 56, step: 810, loss: 0.3511119782924652, mean loss: 0.3408644183940253
Epoch: 56, step: 811, loss: 0.4157325327396393, mean loss: 0.34086533504168615
Epoch: 56, step: 812, loss: 0.30812206864356995, mean loss: 0.34086493415445474
Epoch: 56, step: 813, loss: 0.30465760827064514, mean loss: 0.3408644908609622
Epoch: 56, step: 814, loss: 0.30950894951820374, mean loss: 0.34086410697353287
Epoch: 56, step: 815, loss: 0.319858193397522, mean loss: 0.3408638498002521
Epoch: 56, step: 816, loss: 0.335107684135437, mean loss: 0.34086377932895934
Epoch: 56, step: 817, loss: 0.3092219829559326, mean loss: 0.3408633919511237
Epoch: 56, step: 818, loss: 0.31360289454460144, mean loss: 0.3408630582158617
Epoch: 56, step: 819, loss: 0.3673115372657776, mean loss: 0.34086338200606603
Epoch: 56, step: 820, loss: 0.30873608589172363, mean loss: 0.34086298869889686
Epoch: 56, step: 821, loss: 0.2953992486000061, mean loss: 0.34086243213179723
Epoch: 56, step: 822, loss: 0.3441390097141266, mean loss: 0.34086247224316846
Epoch: 56, step: 823, loss: 0.3449838161468506, mean loss: 0.34086252269542466
Epoch: 56, step: 824, loss: 0.32588425278663635, mean loss: 0.3408623393381806
Epoch: 56, step: 825, loss: 0.3129347264766693, mean loss: 0.3408619974650889
Epoch: 56, step: 826, loss: 0.31804636120796204, mean loss: 0.3408617181731686
Epoch: 56, step: 827, loss: 0.33314716815948486, mean loss: 0.3408616237385849
Epoch: 56, step: 828, loss: 0.2892664074897766, mean loss: 0.34086099216407734
Epoch: 56, step: 829, loss: 0.3378433287143707, mean loss: 0.34086095522545945
Epoch: 56, step: 830, loss: 0.3169962167739868, mean loss: 0.34086066310552005
Epoch: 56, step: 831, loss: 0.32703498005867004, mean loss: 0.3408604938722278
Epoch: 56, step: 832, loss: 0.3012683689594269, mean loss: 0.34086000925070054
Epoch: 56, step: 833, loss: 0.3641855716705322, mean loss: 0.34086029476028973
Epoch: 56, step: 834, loss: 0.35265278816223145, mean loss: 0.340860439101021
Epoch: 56, step: 835, loss: 0.32540374994277954, mean loss: 0.3408602499126592
Epoch: 56, step: 836, loss: 0.32668909430503845, mean loss: 0.3408600764612252
Epoch: 56, step: 837, loss: 0.33144500851631165, mean loss: 0.34085996122453643
Epoch: 56, step: 838, loss: 0.3964161276817322, mean loss: 0.3408606412016053
Epoch: 56, step: 839, loss: 0.35952067375183105, mean loss: 0.34086086958739487
Epoch: 56, step: 840, loss: 0.34800899028778076, mean loss: 0.34086095707433817
Epoch: 56, step: 841, loss: 0.3599168360233307, mean loss: 0.3408611902993027
Epoch: 56, step: 842, loss: 0.34724491834640503, mean loss: 0.3408612684288148
Epoch: 56, step: 843, loss: 0.3214276134967804, mean loss: 0.34086103058607076
Epoch: 56, step: 844, loss: 0.310321569442749, mean loss: 0.3408606568272297
Epoch: 56, step: 845, loss: 0.32638588547706604, mean loss: 0.3408604796791285
Epoch: 56, step: 846, loss: 0.33445534110069275, mean loss: 0.34086040129141354
Epoch: 56, step: 847, loss: 0.36807557940483093, mean loss: 0.340860734353609
Epoch: 56, step: 848, loss: 0.3388039171695709, mean loss: 0.34086070918237327
Epoch: 56, step: 849, loss: 0.36815065145492554, mean loss: 0.340861043151366
Epoch: 56, step: 850, loss: 0.38493070006370544, mean loss: 0.34086158246063497
Epoch: 56, step: 851, loss: 0.3375420868396759, mean loss: 0.34086154183828904
Epoch: 56, step: 852, loss: 0.36261239647865295, mean loss: 0.34086180801123517
Epoch: 56, step: 853, loss: 0.3450990915298462, mean loss: 0.34086185986374645
Epoch: 56, step: 854, loss: 0.2997457683086395, mean loss: 0.3408613567238212
Epoch: 56, step: 855, loss: 0.32736387848854065, mean loss: 0.3408611915564419
Epoch: 56, step: 856, loss: 0.308838427066803, mean loss: 0.3408607997016617
Epoch: 56, step: 857, loss: 0.3134955167770386, mean loss: 0.34086046484344823
Epoch: 56, step: 858, loss: 0.35758790373802185, mean loss: 0.34086066952804
Epoch: 56, step: 859, loss: 0.3282192349433899, mean loss: 0.3408605148435583
Epoch: 56, step: 860, loss: 0.34917670488357544, mean loss: 0.3408606166017723
Epoch: 56, step: 861, loss: 0.29422059655189514, mean loss: 0.340860045914108
Epoch: 56, step: 862, loss: 0.35791993141174316, mean loss: 0.34086025465645137
Epoch: 56, step: 863, loss: 0.3287394940853119, mean loss: 0.3408601063503559
Epoch: 56, step: 864, loss: 0.33984023332595825, mean loss: 0.34086009387163935
Epoch: 56, step: 865, loss: 0.3349340856075287, mean loss: 0.3408600213645029
Epoch: 56, step: 866, loss: 0.33269748091697693, mean loss: 0.34085992149370176
Epoch: 56, step: 867, loss: 0.30486395955085754, mean loss: 0.3408594810791525
Epoch: 56, step: 868, loss: 0.35948488116264343, mean loss: 0.34085970896018075
Epoch: 56, step: 869, loss: 0.3190328776836395, mean loss: 0.34085944191303663
Epoch: 56, step: 870, loss: 0.3183175027370453, mean loss: 0.3408591661200572
Epoch: 56, step: 871, loss: 0.31373655796051025, mean loss: 0.34085883428820635
Epoch: 56, step: 872, loss: 0.3291572332382202, mean loss: 0.34085869112658984
Epoch: 56, step: 873, loss: 0.3265097737312317, mean loss: 0.34085851557889607
Epoch: 56, step: 874, loss: 0.33889374136924744, mean loss: 0.3408584915417264
Epoch: 56, step: 875, loss: 0.31727349758148193, mean loss: 0.34085820300497627
Epoch: 56, step: 876, loss: 0.30327272415161133, mean loss: 0.34085774319314555
Epoch: 56, step: 877, loss: 0.3264550268650055, mean loss: 0.34085756699588676
Epoch: 56, step: 878, loss: 0.3090309202671051, mean loss: 0.34085717764576834
Epoch: 56, step: 879, loss: 0.3384450674057007, mean loss: 0.34085714813766693
Epoch: 56, step: 880, loss: 0.3018782436847687, mean loss: 0.340856671302332
Epoch: 56, step: 881, loss: 0.3324393928050995, mean loss: 0.3408565683336424
Epoch: 56, step: 882, loss: 0.3609978258609772, mean loss: 0.34085681471892293
Epoch: 56, step: 883, loss: 0.3501749336719513, mean loss: 0.34085692870481804
Epoch: 56, step: 884, loss: 0.33090731501579285, mean loss: 0.3408568069955165
Epoch: 56, step: 885, loss: 0.3136866092681885, mean loss: 0.3408564746383578
Epoch: 56, step: 886, loss: 0.28413528203964233, mean loss: 0.34085578080962664
Epoch: 56, step: 887, loss: 0.35407042503356934, mean loss: 0.34085594245269624
Epoch: 56, step: 888, loss: 0.34061628580093384, mean loss: 0.34085593952122395
Epoch: 56, step: 889, loss: 0.33730801939964294, mean loss: 0.34085589612371286
Epoch: 56, step: 890, loss: 0.3782791495323181, mean loss: 0.3408563538725161
Epoch: 56, step: 891, loss: 0.3005141317844391, mean loss: 0.3408558604258934
Epoch: 56, step: 892, loss: 0.3354034125804901, mean loss: 0.3408557937349942
Epoch: 56, step: 893, loss: 0.3809569478034973, mean loss: 0.3408562842209903
Epoch: 56, step: 894, loss: 0.35743045806884766, mean loss: 0.34085648694086024
Epoch: 56, step: 895, loss: 0.3209434151649475, mean loss: 0.34085624338567705
Epoch: 56, step: 896, loss: 0.3214867115020752, mean loss: 0.34085600648138425
Epoch: 56, step: 897, loss: 0.3221378028392792, mean loss: 0.34085577754613755
Epoch: 56, step: 898, loss: 0.33256959915161133, mean loss: 0.34085567620227303
Epoch: 56, step: 899, loss: 0.32100436091423035, mean loss: 0.3408554334143066
Epoch: 56, step: 900, loss: 0.35401082038879395, mean loss: 0.34085559430694984
Epoch: 56, step: 901, loss: 0.3219113051891327, mean loss: 0.34085536261787225
Epoch: 56, step: 902, loss: 0.29581311345100403, mean loss: 0.3408548117568994
Epoch: 56, step: 903, loss: 0.3504919707775116, mean loss: 0.3408549296166859
Epoch: 56, step: 904, loss: 0.3504881262779236, mean loss: 0.340855047426573
Epoch: 56, step: 905, loss: 0.30788105726242065, mean loss: 0.3408546441736665
Epoch: 56, step: 906, loss: 0.35592806339263916, mean loss: 0.34085482851064686
Epoch: 56, step: 907, loss: 0.30775007605552673, mean loss: 0.34085442366849483
Epoch: 56, step: 908, loss: 0.33644068241119385, mean loss: 0.34085436969296184
Epoch: 56, step: 909, loss: 0.3140849769115448, mean loss: 0.34085404233472105
Epoch: 56, step: 910, loss: 0.31618064641952515, mean loss: 0.3408537406117505
Epoch: 56, step: 911, loss: 0.3364716172218323, mean loss: 0.3408536870248376
Epoch: 56, step: 912, loss: 0.32250750064849854, mean loss: 0.3408534626807509
Epoch: 56, step: 913, loss: 0.3230014443397522, mean loss: 0.34085324438220677
Epoch: 56, step: 914, loss: 0.35104233026504517, mean loss: 0.34085336897514484
Epoch: 56, step: 915, loss: 0.4033684730529785, mean loss: 0.34085413340537324
Epoch: 56, step: 916, loss: 0.3278655409812927, mean loss: 0.3408539745837347
Epoch: 56, step: 917, loss: 0.3420010507106781, mean loss: 0.34085398860975663
Epoch: 56, step: 918, loss: 0.332032173871994, mean loss: 0.340853880741193
Epoch: 56, step: 919, loss: 0.3413390815258026, mean loss: 0.3408538866739034
Epoch: 56, step: 920, loss: 0.29239121079444885, mean loss: 0.3408532941119925
Epoch: 56, step: 921, loss: 0.3299250304698944, mean loss: 0.34085316049176845
Epoch: 56, step: 922, loss: 0.32161545753479004, mean loss: 0.340852925274644
Epoch: 56, step: 923, loss: 0.3804219365119934, mean loss: 0.3408534090743608
Epoch: 56, step: 924, loss: 0.30472278594970703, mean loss: 0.34085296732029696
Epoch: 56, step: 925, loss: 0.3380547761917114, mean loss: 0.3408529331083991
Epoch: 56, step: 926, loss: 0.2988881468772888, mean loss: 0.3408524200350019
Epoch: 56, step: 927, loss: 0.34864920377731323, mean loss: 0.34085251535952926
Epoch: 56, step: 928, loss: 0.3676612973213196, mean loss: 0.34085284312329833
Epoch: 56, step: 929, loss: 0.32045215368270874, mean loss: 0.3408525937078224
Epoch: 56, step: 930, loss: 0.36840739846229553, mean loss: 0.34085293058421773
Epoch: 56, step: 931, loss: 0.32786545157432556, mean loss: 0.3408527718053164
Epoch: 56, step: 932, loss: 0.3345531225204468, mean loss: 0.34085269478966446
Epoch: 56, step: 933, loss: 0.3526023328304291, mean loss: 0.3408528384317833
Epoch: 56, step: 934, loss: 0.3456480801105499, mean loss: 0.3408528970540364
Epoch: 56, step: 935, loss: 0.3629815876483917, mean loss: 0.34085316757592626
Epoch: 56, step: 936, loss: 0.34650498628616333, mean loss: 0.34085323666821987
Epoch: 56, step: 937, loss: 0.28985580801963806, mean loss: 0.3408526132430145
Epoch: 56, step: 938, loss: 0.3391181230545044, mean loss: 0.3408525920397556
Epoch: 56, step: 939, loss: 0.3504689037799835, mean loss: 0.34085270959283054
Epoch: 56, step: 940, loss: 0.3252965211868286, mean loss: 0.3408525194310017
Epoch: 56, step: 941, loss: 0.3400976061820984, mean loss: 0.34085251020291024
Epoch: 56, step: 942, loss: 0.3150845170021057, mean loss: 0.34085219521772314
Epoch: 56, step: 943, loss: 0.34255653619766235, mean loss: 0.34085221605114996
Epoch: 56, step: 944, loss: 0.3555958569049835, mean loss: 0.34085239627142955
Epoch: 56, step: 945, loss: 0.31974831223487854, mean loss: 0.3408521383068282
Epoch: 56, step: 946, loss: 0.3200686275959015, mean loss: 0.3408518842638424
Epoch: 56, step: 947, loss: 0.3340509831905365, mean loss: 0.34085180113543734
Epoch: 56, step: 948, loss: 0.33076050877571106, mean loss: 0.34085167778960773
Epoch: 56, step: 949, loss: 0.36021363735198975, mean loss: 0.34085191444787605
Epoch: 56, step: 950, loss: 0.31963372230529785, mean loss: 0.34085165510433096
Epoch: 56, step: 951, loss: 0.3537321090698242, mean loss: 0.3408518125362998
Epoch: 56, step: 952, loss: 0.322007417678833, mean loss: 0.3408515822125913
Epoch: 56, step: 953, loss: 0.34889984130859375, mean loss: 0.3408516805804211
Epoch: 56, step: 954, loss: 0.2843399941921234, mean loss: 0.3408509898889388
Epoch: 56, step: 955, loss: 0.35232609510421753, mean loss: 0.34085113013710816
Epoch: 56, step: 956, loss: 0.29724204540252686, mean loss: 0.3408505971555419
Epoch: 56, step: 957, loss: 0.37127187848091125, mean loss: 0.3408509689538519
Epoch: 56, step: 958, loss: 0.313445508480072, mean loss: 0.3408506340179479
Epoch: 56, step: 959, loss: 0.3381394147872925, mean loss: 0.3408506008831802
Epoch: 56, step: 960, loss: 0.3105970621109009, mean loss: 0.34085023114851754
Epoch: 56, step: 961, loss: 0.2949029505252838, mean loss: 0.3408496696243
Epoch: 56, step: 962, loss: 0.31995755434036255, mean loss: 0.3408494143037422
Epoch: 56, step: 963, loss: 0.3258295953273773, mean loss: 0.34084923075020335
Epoch: 56, step: 964, loss: 0.33990907669067383, mean loss: 0.34084921926095063
Epoch: 56, step: 965, loss: 0.3575564920902252, mean loss: 0.3408494234314606
Epoch: 56, step: 966, loss: 0.32340970635414124, mean loss: 0.34084921031275156
Epoch: 56, step: 967, loss: 0.4126517176628113, mean loss: 0.340850087750763
Epoch: 56, step: 968, loss: 0.3209478557109833, mean loss: 0.3408498445453075
Epoch: 56, step: 969, loss: 0.3128215968608856, mean loss: 0.3408495020440527
Epoch: 56, step: 970, loss: 0.3554333448410034, mean loss: 0.34084968025438805
Epoch: 56, step: 971, loss: 0.3160223960876465, mean loss: 0.3408493768758729
Epoch: 56, step: 972, loss: 0.3444124460220337, mean loss: 0.3408494204144819
Epoch: 56, step: 973, loss: 0.33026161789894104, mean loss: 0.34084929103934425
Epoch: 56, step: 974, loss: 0.32210931181907654, mean loss: 0.340849062053418
Epoch: 56, step: 975, loss: 0.31274810433387756, mean loss: 0.34084871868883193
Epoch: 56, step: 976, loss: 0.35336148738861084, mean loss: 0.34084887158003196
Epoch: 56, step: 977, loss: 0.30982884764671326, mean loss: 0.340848492556744
Epoch: 56, step: 978, loss: 0.34363049268722534, mean loss: 0.34084852654865694
Epoch: 56, step: 979, loss: 0.2924592196941376, mean loss: 0.3408479353103639
Epoch: 56, step: 980, loss: 0.3583528697490692, mean loss: 0.34084814918945777
Epoch: 56, step: 981, loss: 0.33735576272010803, mean loss: 0.34084810651924213
Epoch: 56, step: 982, loss: 0.2994954586029053, mean loss: 0.34084760127594776
Epoch: 56, step: 983, loss: 0.3325779438018799, mean loss: 0.3408475002391787
Epoch: 56, step: 984, loss: 0.3048463463783264, mean loss: 0.3408470603907522
Epoch: 56, step: 985, loss: 0.33127525448799133, mean loss: 0.34084694344749134
Epoch: 56, step: 986, loss: 0.35093721747398376, mean loss: 0.34084706672361537
Epoch: 56, step: 987, loss: 0.319318950176239, mean loss: 0.3408468037109028
Epoch: 56, step: 988, loss: 0.35892799496650696, mean loss: 0.3408470246092359
Epoch: 56, step: 989, loss: 0.30633074045181274, mean loss: 0.3408466029281432
Epoch: 56, step: 990, loss: 0.2899659276008606, mean loss: 0.3408459813329404
Epoch: 56, step: 991, loss: 0.33060193061828613, mean loss: 0.34084585618572194
Epoch: 56, step: 992, loss: 0.3684931993484497, mean loss: 0.34084619393744947
Epoch: 56, step: 993, loss: 0.37092325091362, mean loss: 0.34084656136710784
Epoch: 56, step: 994, loss: 0.32794979214668274, mean loss: 0.3408464038185277
Epoch: 56, step: 995, loss: 0.3072393238544464, mean loss: 0.3408459932751614
Epoch: 56, step: 996, loss: 0.30167585611343384, mean loss: 0.3408455147794533
Epoch: 56, step: 997, loss: 0.3046562969684601, mean loss: 0.34084507270354736
Epoch: 56, step: 998, loss: 0.3477093279361725, mean loss: 0.3408451565540688
Epoch: 56, step: 999, loss: 0.324591726064682, mean loss: 0.3408449580122129
Epoch: 56, step: 1000, loss: 0.3454175591468811, mean loss: 0.34084501386759836
Epoch: 56, step: 1001, loss: 0.33763524889945984, mean loss: 0.34084497466005226
Epoch: 56, step: 1002, loss: 0.3388572037220001, mean loss: 0.3408449503795615
Epoch: 56, step: 1003, loss: 0.344062477350235, mean loss: 0.34084498968096094
Epoch: 56, step: 1004, loss: 0.2996218502521515, mean loss: 0.3408444861553355
Epoch: 56, step: 1005, loss: 0.34226006269454956, mean loss: 0.34084450344587586
Epoch: 56, step: 1006, loss: 0.3173167407512665, mean loss: 0.340844216069849
Epoch: 56, step: 1007, loss: 0.3308490812778473, mean loss: 0.34084409398739357
Epoch: 56, step: 1008, loss: 0.33236995339393616, mean loss: 0.34084399048391145
Epoch: 56, step: 1009, loss: 0.35293737053871155, mean loss: 0.34084413819112075
Epoch: 56, step: 1010, loss: 0.36958250403404236, mean loss: 0.34084448919406235
Epoch: 56, step: 1011, loss: 0.3266926407814026, mean loss: 0.3408443163491699
Epoch: 56, step: 1012, loss: 0.37664321064949036, mean loss: 0.3408447535768932
Epoch: 56, step: 1013, loss: 0.3193250000476837, mean loss: 0.3408444907498392
Epoch: 56, step: 1014, loss: 0.2901258170604706, mean loss: 0.3408438713153848
Epoch: 56, step: 1015, loss: 0.33123505115509033, mean loss: 0.34084375396291583
Epoch: 56, step: 1016, loss: 0.2875228226184845, mean loss: 0.340843102762621
Epoch: 56, step: 1017, loss: 0.3758670687675476, mean loss: 0.3408435304996817
Epoch: 56, step: 1018, loss: 0.32538262009620667, mean loss: 0.34084334168258407
Epoch: 56, step: 1019, loss: 0.30738565325737, mean loss: 0.34084293308397595
Epoch: 56, step: 1020, loss: 0.31767043471336365, mean loss: 0.34084265009565856
Epoch: 56, step: 1021, loss: 0.3149130046367645, mean loss: 0.3408423334402418
Epoch: 56, step: 1022, loss: 0.3000184893608093, mean loss: 0.34084183490147396
Epoch: 56, step: 1023, loss: 0.3661530911922455, mean loss: 0.3408421439975111
Epoch: 56, step: 1024, loss: 0.3373829424381256, mean loss: 0.3408421017549442
Epoch: 56, step: 1025, loss: 0.3876350522041321, mean loss: 0.34084267316721006
Epoch: 56, step: 1026, loss: 0.3404971957206726, mean loss: 0.3408426689484626
Epoch: 56, step: 1027, loss: 0.3017512559890747, mean loss: 0.3408421915952051
Epoch: 56, step: 1028, loss: 0.3353387713432312, mean loss: 0.34084212439263284
Epoch: 56, step: 1029, loss: 0.3487386703491211, mean loss: 0.3408422208166194
Epoch: 56, step: 1030, loss: 0.3553454279899597, mean loss: 0.34084239791176774
Epoch: 56, step: 1031, loss: 0.3096467852592468, mean loss: 0.34084201699435235
Epoch: 56, step: 1032, loss: 0.30946579575538635, mean loss: 0.3408416338762743
Epoch: 56, step: 1033, loss: 0.28608453273773193, mean loss: 0.34084096527507357
Epoch: 56, step: 1034, loss: 0.3398967981338501, mean loss: 0.3408409537466405
Epoch: 56, step: 1035, loss: 0.30750933289527893, mean loss: 0.3408405467671429
Epoch: 56, step: 1036, loss: 0.3753339350223541, mean loss: 0.34084096792669233
Epoch: 56, step: 1037, loss: 0.306521475315094, mean loss: 0.34084054889550125
Epoch: 56, step: 1038, loss: 0.3126799762248993, mean loss: 0.34084020506715956
Epoch: 56, step: 1039, loss: 0.356932669878006, mean loss: 0.3408404015467553
Epoch: 56, step: 1040, loss: 0.31530213356018066, mean loss: 0.340840089743227
Epoch: 56, step: 1041, loss: 0.32655102014541626, mean loss: 0.3408399152862935
Epoch: 56, step: 1042, loss: 0.338361531496048, mean loss: 0.34083988502778334
Epoch: 56, step: 1043, loss: 0.28764280676841736, mean loss: 0.3408392355542489
Epoch: 56, step: 1044, loss: 0.2997799813747406, mean loss: 0.3408387342753396
Epoch: 56, step: 1045, loss: 0.27960529923439026, mean loss: 0.3408379867056285
Epoch: 56, step: 1046, loss: 0.30721887946128845, mean loss: 0.34083757627104405
Epoch: 56, step: 1047, loss: 0.33956995606422424, mean loss: 0.3408375607956533
Epoch: 56, step: 1048, loss: 0.3547946810722351, mean loss: 0.3408377311852163
Epoch: 56, step: 1049, loss: 0.30401811003685, mean loss: 0.3408372816940286
Epoch: 56, step: 1050, loss: 0.31843069195747375, mean loss: 0.3408370081593923
Epoch: 56, step: 1051, loss: 0.32168397307395935, mean loss: 0.3408367743462778
Epoch: 56, step: 1052, loss: 0.3406001627445221, mean loss: 0.3408367714578468
Epoch: 56, step: 1053, loss: 0.34872326254844666, mean loss: 0.34083686773084043
Epoch: 56, step: 1054, loss: 0.335706889629364, mean loss: 0.340836805108273
Epoch: 56, step: 1055, loss: 0.3589320182800293, mean loss: 0.3408370259971057
Epoch: 56, step: 1056, loss: 0.36321425437927246, mean loss: 0.3408372991532974
Epoch: 56, step: 1057, loss: 0.3208102583885193, mean loss: 0.34083705468855335
Epoch: 56, step: 1058, loss: 0.2892032563686371, mean loss: 0.34083642441624495
Epoch: 56, step: 1059, loss: 0.3630620539188385, mean loss: 0.34083669571195196
Epoch: 56, step: 1060, loss: 0.3271230161190033, mean loss: 0.34083652831885347
Epoch: 56, step: 1061, loss: 0.3363197147846222, mean loss: 0.34083647318600757
Epoch: 56, step: 1062, loss: 0.3566693067550659, mean loss: 0.3408366664413882
Epoch: 56, step: 1063, loss: 0.32764554023742676, mean loss: 0.34083650543262195
Epoch: 56, step: 1064, loss: 0.3467141091823578, mean loss: 0.340836577172833
Epoch: 56, step: 1065, loss: 0.33498191833496094, mean loss: 0.3408365057135527
Epoch: 56, step: 1066, loss: 0.3428264856338501, mean loss: 0.34083653000203834
Epoch: 56, step: 1067, loss: 0.30064529180526733, mean loss: 0.3408360394581947
Epoch: 56, step: 1068, loss: 0.3104540705680847, mean loss: 0.34083566864339615
Epoch: 56, step: 1069, loss: 0.29528939723968506, mean loss: 0.3408351127536385
Epoch: 56, step: 1070, loss: 0.3271673917770386, mean loss: 0.34083494594188557
Epoch: 56, step: 1071, loss: 0.3249959945678711, mean loss: 0.3408347526330668
Epoch: 56, step: 1072, loss: 0.3132944703102112, mean loss: 0.34083441651773033
Epoch: 56, step: 1073, loss: 0.3595972955226898, mean loss: 0.3408346455064658
Epoch: 56, step: 1074, loss: 0.3215992748737335, mean loss: 0.34083441075414234
Epoch: 56, step: 1075, loss: 0.36086273193359375, mean loss: 0.34083465518081035
Epoch: 56, step: 1076, loss: 0.3148086369037628, mean loss: 0.3408343375618128
Epoch: 56, step: 1077, loss: 0.3614685833454132, mean loss: 0.34083458937706973
Epoch: 56, step: 1078, loss: 0.3215053677558899, mean loss: 0.3408343534908852
Epoch: 56, step: 1079, loss: 0.3307797908782959, mean loss: 0.3408342307904726
Epoch: 56, step: 1080, loss: 0.3078407645225525, mean loss: 0.34083382816107155
Epoch: 56, step: 1081, loss: 0.3299427926540375, mean loss: 0.34083369525604257
Epoch: 56, step: 1082, loss: 0.3289357125759125, mean loss: 0.3408335500648497
Epoch: 56, step: 1083, loss: 0.33068645000457764, mean loss: 0.3408334262412047
Epoch: 56, step: 1084, loss: 0.30245158076286316, mean loss: 0.3408329578786197
Epoch: 56, step: 1085, loss: 0.32446983456611633, mean loss: 0.3408327582065842
Epoch: 56, step: 1086, loss: 0.33170652389526367, mean loss: 0.3408326468444982
Epoch: 56, step: 1087, loss: 0.33822891116142273, mean loss: 0.3408326150730261
Epoch: 56, step: 1088, loss: 0.31799080967903137, mean loss: 0.34083233635467053
Epoch: 56, step: 1089, loss: 0.3302459418773651, mean loss: 0.3408322071798349
Epoch: 56, step: 1090, loss: 0.3326835632324219, mean loss: 0.340832107751564
Epoch: 56, step: 1091, loss: 0.3323540687561035, mean loss: 0.3408320043053368
Epoch: 56, step: 1092, loss: 0.3332313299179077, mean loss: 0.34083191156555387
Epoch: 56, step: 1093, loss: 0.36975380778312683, mean loss: 0.3408322644523522
Epoch: 56, step: 1094, loss: 0.29479676485061646, mean loss: 0.3408317027629758
Epoch: 56, step: 1095, loss: 0.3231619596481323, mean loss: 0.3408314871731379
Epoch: 56, step: 1096, loss: 0.3899737000465393, mean loss: 0.3408320867535831
Epoch: 56, step: 1097, loss: 0.3481927216053009, mean loss: 0.3408321765590399
Epoch: 56, step: 1098, loss: 0.39816686511039734, mean loss: 0.3408328760781955
Epoch: 56, step: 1099, loss: 0.33635184168815613, mean loss: 0.3408328214074329
Epoch: 56, step: 1100, loss: 0.3316800892353058, mean loss: 0.34083270974108537
Epoch: 56, step: 1101, loss: 0.3198751211166382, mean loss: 0.34083245405472
Epoch: 56, step: 1102, loss: 0.3188064694404602, mean loss: 0.34083218533700904
Epoch: 56, step: 1103, loss: 0.3142063617706299, mean loss: 0.3408318605050799
Epoch: 56, step: 1104, loss: 0.3285643458366394, mean loss: 0.34083171084466357
Epoch: 56, step: 1105, loss: 0.3826167583465576, mean loss: 0.34083222060491125
Epoch: 56, step: 1106, loss: 0.35635361075401306, mean loss: 0.340832409957123
Epoch: 56, step: 1107, loss: 0.32178938388824463, mean loss: 0.34083217764577195
Epoch: 56, step: 1108, loss: 0.3208496570587158, mean loss: 0.3408319338762309
Epoch: 56, step: 1109, loss: 0.32577410340309143, mean loss: 0.34083175018590867
Epoch: 56, step: 1110, loss: 0.30929139256477356, mean loss: 0.3408313654300975
Epoch: 56, step: 1111, loss: 0.3259226679801941, mean loss: 0.34083118356348474
Epoch: 56, step: 1112, loss: 0.36332911252975464, mean loss: 0.3408314580054498
Epoch: 56, step: 1113, loss: 0.3336707353591919, mean loss: 0.3408313706561287
Epoch: 56, step: 1114, loss: 0.337465763092041, mean loss: 0.34083132960162005
Epoch: 56, step: 1115, loss: 0.313790887594223, mean loss: 0.3408309997596829
Epoch: 56, step: 1116, loss: 0.3065037429332733, mean loss: 0.3408305810375787
Epoch: 56, step: 1117, loss: 0.3149492144584656, mean loss: 0.34083026534185795
Epoch: 56, step: 1118, loss: 0.32793694734573364, mean loss: 0.34083010807366826
Epoch: 56, step: 1119, loss: 0.35737913846969604, mean loss: 0.3408303099304988
Epoch: 56, step: 1120, loss: 0.31627532839775085, mean loss: 0.34083001042471683
Epoch: 56, step: 1121, loss: 0.33207157254219055, mean loss: 0.34082990359625975
Epoch: 56, step: 1122, loss: 0.3305618464946747, mean loss: 0.34082977835619604
Epoch: 56, step: 1123, loss: 0.35048940777778625, mean loss: 0.34082989617379644
Epoch: 56, step: 1124, loss: 0.31795865297317505, mean loss: 0.34082961721877564
Epoch: 56, step: 1125, loss: 0.35856619477272034, mean loss: 0.34082983354488317
Epoch: 56, step: 1126, loss: 0.3512875437736511, mean loss: 0.3408299610919338
Epoch: 56, step: 1127, loss: 0.35690784454345703, mean loss: 0.340830157182814
Epoch: 56, step: 1128, loss: 0.29645583033561707, mean loss: 0.3408296159862869
Epoch: 56, step: 1129, loss: 0.30087900161743164, mean loss: 0.34082912874802107
Epoch: 56, step: 1130, loss: 0.3409128785133362, mean loss: 0.340829129769422
Epoch: 56, step: 1131, loss: 0.34347257018089294, mean loss: 0.3408291620080728
Epoch: 56, step: 1132, loss: 0.3107365667819977, mean loss: 0.3408287950117775
Epoch: 56, step: 1133, loss: 0.34121689200401306, mean loss: 0.3408287997447831
Epoch: 56, step: 1134, loss: 0.2911504805088043, mean loss: 0.34082819390423336
Epoch: 56, step: 1135, loss: 0.34471091628074646, mean loss: 0.3408282412545062
Epoch: 56, step: 1136, loss: 0.3151778280735016, mean loss: 0.3408279284484041
Epoch: 56, step: 1137, loss: 0.3371814489364624, mean loss: 0.34082788398022634
Epoch: 56, step: 1138, loss: 0.30392351746559143, mean loss: 0.34082743394344095
Epoch: 56, step: 1139, loss: 0.3215055465698242, mean loss: 0.3408271983221618
Epoch: 56, step: 1140, loss: 0.3241269886493683, mean loss: 0.3408269946734858
Epoch: 56, step: 1141, loss: 0.32552504539489746, mean loss: 0.3408268080780016
Epoch: 56, step: 1142, loss: 0.29751384258270264, mean loss: 0.3408262799161923
Epoch: 56, step: 1143, loss: 0.29552415013313293, mean loss: 0.3408257275050887
Epoch: 56, step: 1144, loss: 0.32207027077674866, mean loss: 0.3408254988051079
Epoch: 56, step: 1145, loss: 0.31143710017204285, mean loss: 0.340825140453704
Epoch: 56, step: 1146, loss: 0.390553742647171, mean loss: 0.34082574681873057
Epoch: 56, step: 1147, loss: 0.33248674869537354, mean loss: 0.34082564513851155
Epoch: 56, step: 1148, loss: 0.32821378111839294, mean loss: 0.3408254913596714
Epoch: 56, step: 1149, loss: 0.344368040561676, mean loss: 0.34082553455411624
Epoch: 56, step: 1150, loss: 0.34944838285446167, mean loss: 0.34082563969157037
Epoch: 56, step: 1151, loss: 0.3233245611190796, mean loss: 0.34082542630541923
Epoch: 56, step: 1152, loss: 0.32506072521209717, mean loss: 0.34082523409281584
Epoch: 56, step: 1153, loss: 0.3521004319190979, mean loss: 0.34082537156505155
Epoch: 56, step: 1154, loss: 0.3089573383331299, mean loss: 0.34082498302052855
Epoch: 56, step: 1155, loss: 0.30978071689605713, mean loss: 0.34082460452423347
Epoch: 56, step: 1156, loss: 0.3580460846424103, mean loss: 0.3408248144885124
Epoch: 56, step: 1157, loss: 0.30298399925231934, mean loss: 0.34082435313893256
Epoch: 56, step: 1158, loss: 0.33440402150154114, mean loss: 0.3408242748641604
Epoch: 56, step: 1159, loss: 0.3436576724052429, mean loss: 0.34082430940767866
Epoch: 56, step: 1160, loss: 0.3000144958496094, mean loss: 0.3408238118787112
Epoch: 56, step: 1161, loss: 0.33148670196533203, mean loss: 0.3408236980476099
Epoch: 56, step: 1162, loss: 0.33850231766700745, mean loss: 0.34082366974741146
Epoch: 56, step: 1163, loss: 0.3471912741661072, mean loss: 0.340823747374617
Epoch: 56, step: 1164, loss: 0.31024307012557983, mean loss: 0.3408233745713737
Epoch: 56, step: 1165, loss: 0.3114219009876251, mean loss: 0.3408230161479483
Epoch: 56, step: 1166, loss: 0.34450027346611023, mean loss: 0.3408230609756027
Epoch: 56, step: 1167, loss: 0.3448644280433655, mean loss: 0.3408231102413413
Epoch: 56, step: 1168, loss: 0.31934747099876404, mean loss: 0.34082284844865735
Epoch: 56, step: 1169, loss: 0.332322359085083, mean loss: 0.34082274482711794
Epoch: 56, step: 1170, loss: 0.31000351905822754, mean loss: 0.3408223691432541
Epoch: 56, step: 1171, loss: 0.3127301037311554, mean loss: 0.34082202670499023
Epoch: 56, step: 1172, loss: 0.32264095544815063, mean loss: 0.3408218050846085
Epoch: 56, step: 1173, loss: 0.3850220739841461, mean loss: 0.3408223438626004
Epoch: 56, step: 1174, loss: 0.3224743902683258, mean loss: 0.3408221202134385
Epoch: 56, step: 1175, loss: 0.3358049988746643, mean loss: 0.3408220590588634
Epoch: 56, step: 1176, loss: 0.3364689350128174, mean loss: 0.340822005998515
Epoch: 56, step: 1177, loss: 0.2962574064731598, mean loss: 0.3408214628060096
Epoch: 56, step: 1178, loss: 0.29428133368492126, mean loss: 0.34082089554092765
Epoch: 56, step: 1179, loss: 0.32497790455818176, mean loss: 0.3408207024373371
Epoch: 56, step: 1180, loss: 0.32342293858528137, mean loss: 0.34082049038585494
Epoch: 56, step: 1181, loss: 0.3276149332523346, mean loss: 0.340820329432766
Epoch: 56, step: 1182, loss: 0.3356078267097473, mean loss: 0.3408202659020736
Epoch: 56, step: 1183, loss: 0.3126436769962311, mean loss: 0.34081992248615967
Epoch: 56, step: 1184, loss: 0.3268081247806549, mean loss: 0.3408197517126255
Epoch: 56, step: 1185, loss: 0.38119909167289734, mean loss: 0.34082024384352083
Epoch: 56, step: 1186, loss: 0.3277408182621002, mean loss: 0.3408200844374736
Epoch: 56, step: 1187, loss: 0.3706628084182739, mean loss: 0.3408204481424897
Epoch: 56, step: 1188, loss: 0.35243600606918335, mean loss: 0.340820589704138
Epoch: 56, step: 1189, loss: 0.29057854413986206, mean loss: 0.34081997739949027
Epoch: 56, step: 1190, loss: 0.34978678822517395, mean loss: 0.34082008667754554
Epoch: 56, step: 1191, loss: 0.31463125348091125, mean loss: 0.34081976751949256
Epoch: 56, step: 1192, loss: 0.3407427668571472, mean loss: 0.3408197665811124
Epoch: 56, step: 1193, loss: 0.3336310386657715, mean loss: 0.3408196789756636
Epoch: 56, step: 1194, loss: 0.3536556661128998, mean loss: 0.34081983539954325
Epoch: 56, step: 1195, loss: 0.3559305965900421, mean loss: 0.34082001954238006
Epoch: 56, step: 1196, loss: 0.3386547863483429, mean loss: 0.34081999315672556
Epoch: 56, step: 1197, loss: 0.34343910217285156, mean loss: 0.3408200250729476
Epoch: 56, step: 1198, loss: 0.33735036849975586, mean loss: 0.3408199827925463
Epoch: 56, step: 1199, loss: 0.3269631862640381, mean loss: 0.34081981393901095
Epoch: 56, step: 1200, loss: 0.3417806029319763, mean loss: 0.3408198256466694
Epoch: 56, step: 1201, loss: 0.3303237855434418, mean loss: 0.3408196977491223
Epoch: 56, step: 1202, loss: 0.386338472366333, mean loss: 0.34082025240293706
Epoch: 56, step: 1203, loss: 0.3232225179672241, mean loss: 0.3408200379742385
Epoch: 56, step: 1204, loss: 0.3500356376171112, mean loss: 0.3408201502651113
Epoch: 56, step: 1205, loss: 0.32566937804222107, mean loss: 0.34081996565718853
Epoch: 56, step: 1206, loss: 0.3349362313747406, mean loss: 0.34081989396640516
Epoch: 56, step: 1207, loss: 0.3388383686542511, mean loss: 0.3408198698226617
Epoch: 56, step: 1208, loss: 0.35290998220443726, mean loss: 0.34082001713191545
Epoch: 56, step: 1209, loss: 0.34995555877685547, mean loss: 0.3408201284405107
Epoch: 56, step: 1210, loss: 0.33221369981765747, mean loss: 0.3408200235799731
Epoch: 56, step: 1211, loss: 0.33901673555374146, mean loss: 0.34082000160901904
Epoch: 56, step: 1212, loss: 0.33448848128318787, mean loss: 0.340819924467794
Epoch: 56, step: 1213, loss: 0.2912655472755432, mean loss: 0.3408193207204172
Epoch: 56, step: 1214, loss: 0.35849666595458984, mean loss: 0.34081953609030763
Epoch: 56, step: 1215, loss: 0.33033499121665955, mean loss: 0.3408194083546245
Epoch: 56, step: 1216, loss: 0.3282477855682373, mean loss: 0.34081925519344486
Epoch: 56, step: 1217, loss: 0.3209637999534607, mean loss: 0.3408190132956446
Epoch: 56, step: 1218, loss: 0.3480243980884552, mean loss: 0.34081910107733865
Epoch: 56, step: 1219, loss: 0.36511409282684326, mean loss: 0.3408193970545297
Epoch: 56, step: 1220, loss: 0.33387988805770874, mean loss: 0.34081931251400466
Epoch: 56, step: 1221, loss: 0.3114679455757141, mean loss: 0.3408189549455163
Epoch: 56, step: 1222, loss: 0.4102114140987396, mean loss: 0.34081980029811965
Epoch: 56, step: 1223, loss: 0.33740943670272827, mean loss: 0.3408197587529048
Epoch: 56, step: 1224, loss: 0.3388270437717438, mean loss: 0.3408197344778499
Epoch: 56, step: 1225, loss: 0.3416562080383301, mean loss: 0.34081974466756315
Epoch: 56, step: 1226, loss: 0.33467403054237366, mean loss: 0.3408196698029114
Epoch: 56, step: 1227, loss: 0.33342596888542175, mean loss: 0.3408195797368767
Epoch: 56, step: 1228, loss: 0.3145119845867157, mean loss: 0.34081925927599516
Epoch: 56, step: 1229, loss: 0.3465879559516907, mean loss: 0.3408193295454019
Epoch: 56, step: 1230, loss: 0.34153953194618225, mean loss: 0.3408193383181944
Epoch: 56, step: 1231, loss: 0.3336860239505768, mean loss: 0.3408192514282805
Epoch: 56, step: 1232, loss: 0.34722593426704407, mean loss: 0.3408193294662458
Epoch: 56, step: 1233, loss: 0.28651413321495056, mean loss: 0.3408186679982898
Epoch: 56, step: 1234, loss: 0.31847241520881653, mean loss: 0.3408183958116275
Epoch: 56, step: 1235, loss: 0.3299613296985626, mean loss: 0.3408182635696529
Epoch: 56, step: 1236, loss: 0.29085686802864075, mean loss: 0.3408176550338794
Epoch: 56, step: 1237, loss: 0.3792817294597626, mean loss: 0.34081812352520025
Epoch: 56, step: 1238, loss: 0.3234286606311798, mean loss: 0.3408179117246218
Epoch: 56, step: 1239, loss: 0.3010839819908142, mean loss: 0.34081742777828866
Epoch: 56, step: 1240, loss: 0.33647969365119934, mean loss: 0.34081737494674214
Epoch: 56, step: 1241, loss: 0.3002089262008667, mean loss: 0.34081688036109986
Epoch: 56, step: 1242, loss: 0.32699888944625854, mean loss: 0.3408167120686167
Epoch: 56, step: 1243, loss: 0.3391202390193939, mean loss: 0.34081669140713367
Epoch: 56, step: 1244, loss: 0.34990739822387695, mean loss: 0.34081680212224186
Epoch: 56, step: 1245, loss: 0.3425202965736389, mean loss: 0.34081682286873377
Epoch: 56, step: 1246, loss: 0.30872923135757446, mean loss: 0.34081643208562906
Epoch: 56, step: 1247, loss: 0.34534409642219543, mean loss: 0.3408164872257345
Epoch: 56, step: 1248, loss: 0.3276820480823517, mean loss: 0.34081632727007405
Epoch: 56, step: 1249, loss: 0.3518828749656677, mean loss: 0.34081646204060884
Epoch: 56, step: 1250, loss: 0.3732612133026123, mean loss: 0.34081685715418447
Epoch: 56, step: 1251, loss: 0.3079439401626587, mean loss: 0.3408164568312633
Epoch: 56, step: 1252, loss: 0.3600423038005829, mean loss: 0.3408166909587518
Epoch: 56, step: 1253, loss: 0.3595181405544281, mean loss: 0.34081691869748865
Epoch: 56, step: 1254, loss: 0.30232226848602295, mean loss: 0.34081644993081817
Epoch: 56, step: 1255, loss: 0.2900976538658142, mean loss: 0.34081583231274626
Epoch: 56, step: 1256, loss: 0.30387356877326965, mean loss: 0.3408153824611427
Epoch: 56, step: 1257, loss: 0.3410436511039734, mean loss: 0.3408153852407711
Epoch: 56, step: 1258, loss: 0.3260854482650757, mean loss: 0.3408152058764398
Epoch: 56, step: 1259, loss: 0.34879302978515625, mean loss: 0.3408153030200752
Epoch: 56, step: 1260, loss: 0.32309699058532715, mean loss: 0.34081508727197857
Epoch: 56, step: 1261, loss: 0.3541531264781952, mean loss: 0.3408152496814373
Epoch: 56, step: 1262, loss: 0.34201210737228394, mean loss: 0.340815264254692
Epoch: 56, step: 1263, loss: 0.3185424208641052, mean loss: 0.3408149930579821
Epoch: 56, step: 1264, loss: 0.3281960189342499, mean loss: 0.3408148394097686
Epoch: 56, step: 1265, loss: 0.32958468794822693, mean loss: 0.340814702673479
Epoch: 56, step: 1266, loss: 0.34222930669784546, mean loss: 0.3408147198972316
Epoch: 56, step: 1267, loss: 0.3440411686897278, mean loss: 0.3408147591809309
Epoch: 56, step: 1268, loss: 0.32024165987968445, mean loss: 0.34081450869575075
Epoch: 56, step: 1269, loss: 0.334069162607193, mean loss: 0.3408144265696387
Epoch: 56, step: 1270, loss: 0.3277595639228821, mean loss: 0.3408142676256727
Epoch: 56, step: 1271, loss: 0.3215341567993164, mean loss: 0.3408140328916848
Epoch: 56, step: 1272, loss: 0.334628164768219, mean loss: 0.34081395758009414
Epoch: 56, step: 1273, loss: 0.32228246331214905, mean loss: 0.3408137319659537
Epoch: 56, step: 1274, loss: 0.3316526710987091, mean loss: 0.3408136204347582
Epoch: 56, step: 1275, loss: 0.29111796617507935, mean loss: 0.34081301542314074
Epoch: 56, step: 1276, loss: 0.3387783467769623, mean loss: 0.34081299065270154
Epoch: 56, step: 1277, loss: 0.36604931950569153, mean loss: 0.3408132978807804
Epoch: 56, step: 1278, loss: 0.3317033052444458, mean loss: 0.3408131869767151
Epoch: 56, step: 1279, loss: 0.3269908130168915, mean loss: 0.3408130187066776
Epoch: 56, step: 1280, loss: 0.32118192315101624, mean loss: 0.3408127797256616
Epoch: 56, step: 1281, loss: 0.352988064289093, mean loss: 0.34081292794084633
Epoch: 56, step: 1282, loss: 0.31877633929252625, mean loss: 0.3408126596828619
Epoch: 56, step: 1283, loss: 0.3820941150188446, mean loss: 0.340813162208247
Epoch: 56, step: 1284, loss: 0.3328271806240082, mean loss: 0.34081306499487146
Epoch: 56, step: 1285, loss: 0.3191753327846527, mean loss: 0.3408128016019048
Epoch: 56, step: 1286, loss: 0.32625845074653625, mean loss: 0.34081262443606564
Epoch: 56, step: 1287, loss: 0.3116338551044464, mean loss: 0.34081226925579816
Epoch: 56, step: 1288, loss: 0.3590236008167267, mean loss: 0.3408124909315928
Epoch: 56, step: 1289, loss: 0.3557896018028259, mean loss: 0.3408126732369081
Epoch: 56, step: 1290, loss: 0.34971460700035095, mean loss: 0.3408127815922579
Epoch: 56, step: 1291, loss: 0.327717661857605, mean loss: 0.3408126221989119
Epoch: 56, step: 1292, loss: 0.3620736598968506, mean loss: 0.34081288098437995
Epoch: 56, step: 1293, loss: 0.30626699328422546, mean loss: 0.34081246050326186
Epoch: 56, step: 1294, loss: 0.38862645626068115, mean loss: 0.3408130424723189
Epoch: 56, step: 1295, loss: 0.31356337666511536, mean loss: 0.34081271080647413
Epoch: 56, step: 1296, loss: 0.3326340317726135, mean loss: 0.34081261126193313
Epoch: 56, step: 1297, loss: 0.3662773072719574, mean loss: 0.34081292119470025
Epoch: 56, step: 1298, loss: 0.34086254239082336, mean loss: 0.34081292179863626
Epoch: 56, step: 1299, loss: 0.3105788230895996, mean loss: 0.34081255382606057
Epoch: 56, step: 1300, loss: 0.33117976784706116, mean loss: 0.34081243658896476
Epoch: 56, step: 1301, loss: 0.32989269495010376, mean loss: 0.3408123036904223
Epoch: 56, step: 1302, loss: 0.34463948011398315, mean loss: 0.3408123502684454
Epoch: 56, step: 1303, loss: 0.3005508482456207, mean loss: 0.3408118602784004
Epoch: 56, step: 1304, loss: 0.34965869784355164, mean loss: 0.3408119679447656
Epoch: 56, step: 1305, loss: 0.3430027663707733, mean loss: 0.34081199460654515
Epoch: 56, step: 1306, loss: 0.3734230101108551, mean loss: 0.34081239147424186
Epoch: 56, step: 1307, loss: 0.33312880992889404, mean loss: 0.3408122979681626
Epoch: 56, step: 1308, loss: 0.3397165536880493, mean loss: 0.3408122846335602
Epoch: 56, step: 1309, loss: 0.3234306275844574, mean loss: 0.3408120731109734
Epoch: 56, step: 1310, loss: 0.3985130488872528, mean loss: 0.34081277528287207
Epoch: 56, step: 1311, loss: 0.3471089005470276, mean loss: 0.34081285190044003
Epoch: 56, step: 1312, loss: 0.377817302942276, mean loss: 0.3408133022022403
Epoch: 56, step: 1313, loss: 0.3589441776275635, mean loss: 0.3408135228315502
Epoch: 56, step: 1314, loss: 0.34229910373687744, mean loss: 0.3408135409089289
Epoch: 56, step: 1315, loss: 0.29779183864593506, mean loss: 0.3408130174031822
Epoch: 56, step: 1316, loss: 0.3820602297782898, mean loss: 0.34081351931009957
Epoch: 56, step: 1317, loss: 0.3564019501209259, mean loss: 0.3408137089919132
Epoch: 56, step: 1318, loss: 0.34392258524894714, mean loss: 0.3408137468206157
Epoch: 56, step: 1319, loss: 0.33898359537124634, mean loss: 0.340813724551665
Epoch: 56, step: 1320, loss: 0.3488767147064209, mean loss: 0.3408138226594724
Epoch: 56, step: 1321, loss: 0.33697155117988586, mean loss: 0.34081377590854794
Epoch: 56, step: 1322, loss: 0.304263174533844, mean loss: 0.3408133311836964
Epoch: 56, step: 1323, loss: 0.34793636202812195, mean loss: 0.34081341785122504
Epoch: 56, step: 1324, loss: 0.32230472564697266, mean loss: 0.3408131926545174
Epoch: 56, step: 1325, loss: 0.3357795774936676, mean loss: 0.3408131314108727
Epoch: 56, step: 1326, loss: 0.3181565999984741, mean loss: 0.34081285575378845
Epoch: 56, step: 1327, loss: 0.34191375970840454, mean loss: 0.3408128691480842
Epoch: 56, step: 1328, loss: 0.3264314830303192, mean loss: 0.3408126941771485
Epoch: 56, step: 1329, loss: 0.3035750687122345, mean loss: 0.34081224113160424
Epoch: 56, step: 1330, loss: 0.3050090968608856, mean loss: 0.3408118055437428
Epoch: 56, step: 1331, loss: 0.3912551999092102, mean loss: 0.3408124192402045
Epoch: 56, step: 1332, loss: 0.3046483099460602, mean loss: 0.34081197927147944
Epoch: 56, step: 1333, loss: 0.34176576137542725, mean loss: 0.3408119908749504
Epoch: 56, step: 1334, loss: 0.3670305609703064, mean loss: 0.34081230983953753
Epoch: 56, step: 1335, loss: 0.34360945224761963, mean loss: 0.340812343868034
Epoch: 56, step: 1336, loss: 0.33750659227371216, mean loss: 0.3408123036525671
Epoch: 56, step: 1337, loss: 0.35948994755744934, mean loss: 0.34081253086898405
Epoch: 56, step: 1338, loss: 0.33661437034606934, mean loss: 0.3408124797983355
Epoch: 56, step: 1339, loss: 0.3002814054489136, mean loss: 0.34081198674356505
Epoch: 56, step: 1340, loss: 0.3024965226650238, mean loss: 0.3408115206470493
Epoch: 56, step: 1341, loss: 0.35537540912628174, mean loss: 0.3408116978103765
Epoch: 56, step: 1342, loss: 0.2983737885951996, mean loss: 0.34081118157807005
Epoch: 56, step: 1343, loss: 0.3049655556678772, mean loss: 0.34081074554233254
Epoch: 56, step: 1344, loss: 0.3270009756088257, mean loss: 0.34081057755865757
Epoch: 56, step: 1345, loss: 0.3461887240409851, mean loss: 0.34081064297827174
Epoch: 56, step: 1346, loss: 0.3207690715789795, mean loss: 0.3408103991961574
Epoch: 56, step: 1347, loss: 0.346844881772995, mean loss: 0.34081047259763864
Epoch: 56, step: 1348, loss: 0.3277091085910797, mean loss: 0.340810313238851
Epoch: 56, step: 1349, loss: 0.29093724489212036, mean loss: 0.34080970661384374
Epoch: 56, step: 1350, loss: 0.32119008898735046, mean loss: 0.34080946797591116
Epoch: 56, step: 1351, loss: 0.3638191223144531, mean loss: 0.34080974784423773
Epoch: 56, step: 1352, loss: 0.35914039611816406, mean loss: 0.3408099707987152
Epoch: 56, step: 1353, loss: 0.3478718400001526, mean loss: 0.3408100566907243
Epoch: 56, step: 1354, loss: 0.3243904709815979, mean loss: 0.34080985698523397
Epoch: 56, step: 1355, loss: 0.402736097574234, mean loss: 0.34081061016257025
Epoch: 56, step: 1356, loss: 0.3437505066394806, mean loss: 0.34081064591859944
Epoch: 56, step: 1357, loss: 0.32519978284835815, mean loss: 0.34081045605623816
Epoch: 56, step: 1358, loss: 0.31659257411956787, mean loss: 0.340810161517217
Epoch: 56, step: 1359, loss: 0.3140348196029663, mean loss: 0.3408098358782075
Epoch: 56, step: 1360, loss: 0.321029394865036, mean loss: 0.34080959531340344
Epoch: 56, step: 1361, loss: 0.35699617862701416, mean loss: 0.3408097921682099
Epoch: 56, step: 1362, loss: 0.3104773163795471, mean loss: 0.3408094232811559
Epoch: 56, step: 1363, loss: 0.32139015197753906, mean loss: 0.3408091871174245
Epoch: 56, step: 1364, loss: 0.33236515522003174, mean loss: 0.3408090844282042
Epoch: 56, step: 1365, loss: 0.3114621341228485, mean loss: 0.34080872753959535
Epoch: 56, step: 1366, loss: 0.3223608732223511, mean loss: 0.3408085031977496
Epoch: 56, step: 1367, loss: 0.3117590546607971, mean loss: 0.3408081499356553
Epoch: 56, step: 1368, loss: 0.29593905806541443, mean loss: 0.34080760430200613
Epoch: 56, step: 1369, loss: 0.35404348373413086, mean loss: 0.3408077652558626
Epoch: 56, step: 1370, loss: 0.3361453115940094, mean loss: 0.34080770855915604
Epoch: 56, step: 1371, loss: 0.33897337317466736, mean loss: 0.34080768625340935
Epoch: 56, step: 1372, loss: 0.318029522895813, mean loss: 0.34080740927147474
Epoch: 56, step: 1373, loss: 0.3091566860675812, mean loss: 0.3408070244040995
Epoch: 56, step: 1374, loss: 0.3336217403411865, mean loss: 0.3408069370333379
Epoch: 56, step: 1375, loss: 0.35422834753990173, mean loss: 0.34080710023142285
Epoch: 56, step: 1376, loss: 0.3077869713306427, mean loss: 0.3408066987269555
Epoch: 56, step: 1377, loss: 0.33017104864120483, mean loss: 0.34080656940556153
Epoch: 56, step: 1378, loss: 0.3431917428970337, mean loss: 0.34080659840709954
Epoch: 56, step: 1379, loss: 0.3650079667568207, mean loss: 0.34080689267012604
Epoch: 56, step: 1380, loss: 0.3262755572795868, mean loss: 0.3408067159866147
Epoch: 56, step: 1381, loss: 0.3447614908218384, mean loss: 0.340806764071322
Epoch: 56, step: 1382, loss: 0.32927677035331726, mean loss: 0.3408066238839143
Epoch: 56, step: 1383, loss: 0.325351744890213, mean loss: 0.3408064359780808
Epoch: 56, step: 1384, loss: 0.33913928270339966, mean loss: 0.3408064157084936
Epoch: 56, step: 1385, loss: 0.31377944350242615, mean loss: 0.34080608711308685
Epoch: 56, step: 1386, loss: 0.36461350321769714, mean loss: 0.34080637656143525
Epoch: 56, step: 1387, loss: 0.3361397385597229, mean loss: 0.3408063198255747
Epoch: 56, step: 1388, loss: 0.3037015497684479, mean loss: 0.34080586872020396
Epoch: 56, step: 1389, loss: 0.32521119713783264, mean loss: 0.3408056791285539
Epoch: 56, step: 1390, loss: 0.3306122422218323, mean loss: 0.34080555520372374
Epoch: 56, step: 1391, loss: 0.3322085440158844, mean loss: 0.3408054506884156
Epoch: 56, step: 1392, loss: 0.3166080415248871, mean loss: 0.34080515652002674
Epoch: 56, step: 1393, loss: 0.37887507677078247, mean loss: 0.3408056193311849
Epoch: 56, step: 1394, loss: 0.3274986743927002, mean loss: 0.34080545756232145
Epoch: 56, step: 1395, loss: 0.32021668553352356, mean loss: 0.34080520727333496
Epoch: 56, step: 1396, loss: 0.34940531849861145, mean loss: 0.34080531181997586
Epoch: 56, step: 1397, loss: 0.36763811111450195, mean loss: 0.3408056380070281
Epoch: 56, step: 1398, loss: 0.3231298625469208, mean loss: 0.3408054231379441
Epoch: 56, step: 1399, loss: 0.34338125586509705, mean loss: 0.34080545444972965
Epoch: 56, step: 1400, loss: 0.3006426990032196, mean loss: 0.34080496623778717
Epoch: 56, step: 1401, loss: 0.3624139726161957, mean loss: 0.3408052289101716
Epoch: 56, step: 1402, loss: 0.3034358620643616, mean loss: 0.3408047746652515
Epoch: 56, step: 1403, loss: 0.3157677948474884, mean loss: 0.3408044703308831
Epoch: 56, step: 1404, loss: 0.3076154589653015, mean loss: 0.3408040669102585
Epoch: 56, step: 1405, loss: 0.30616724491119385, mean loss: 0.34080364589625584
Epoch: 56, step: 1406, loss: 0.3215233087539673, mean loss: 0.34080341154469646
Epoch: 56, step: 1407, loss: 0.34250637888908386, mean loss: 0.34080343224393
Epoch: 56, step: 1408, loss: 0.3402698040008545, mean loss: 0.3408034257578624
Epoch: 56, step: 1409, loss: 0.317248672246933, mean loss: 0.3408031394614199
Epoch: 56, step: 1410, loss: 0.32561078667640686, mean loss: 0.34080295480808914
Epoch: 56, step: 1411, loss: 0.30497536063194275, mean loss: 0.34080251935189076
Epoch: 56, step: 1412, loss: 0.3597777187824249, mean loss: 0.34080274997769666
Epoch: 56, step: 1413, loss: 0.3228328824043274, mean loss: 0.34080253157341395
Epoch: 56, step: 1414, loss: 0.38746199011802673, mean loss: 0.3408030986617177
Epoch: 56, step: 1415, loss: 0.37682703137397766, mean loss: 0.3408035364829709
Epoch: 56, step: 1416, loss: 0.37244701385498047, mean loss: 0.34080392106115265
Epoch: 56, step: 1417, loss: 0.3363511562347412, mean loss: 0.3408038669452485
Epoch: 56, step: 1418, loss: 0.37060725688934326, mean loss: 0.34080422915117126
Epoch: 56, step: 1419, loss: 0.363493412733078, mean loss: 0.34080450489352193
Epoch: 56, step: 1420, loss: 0.37318044900894165, mean loss: 0.34080489835459155
Epoch: 56, step: 1421, loss: 0.42398205399513245, mean loss: 0.34080590918457043
Epoch: 56, step: 1422, loss: 0.3047454059123993, mean loss: 0.34080547095613495
Epoch: 56, step: 1423, loss: 0.32164934277534485, mean loss: 0.3408052381624326
Epoch: 56, step: 1424, loss: 0.30859652161598206, mean loss: 0.3408048467526871
Epoch: 56, step: 1425, loss: 0.3915151059627533, mean loss: 0.34080546299110254
Epoch: 56, step: 1426, loss: 0.3250046670436859, mean loss: 0.34080527097987473
Epoch: 56, step: 1427, loss: 0.30299970507621765, mean loss: 0.34080481157232717
Epoch: 56, step: 1428, loss: 0.3266482651233673, mean loss: 0.34080463954619555
Epoch: 56, step: 1429, loss: 0.3372904658317566, mean loss: 0.34080459684352327
Epoch: 56, step: 1430, loss: 0.3854947090148926, mean loss: 0.34080513989124395
Epoch: 56, step: 1431, loss: 0.3189740478992462, mean loss: 0.34080487461599374
Epoch: 56, step: 1432, loss: 0.297734797000885, mean loss: 0.3408043512666904
Epoch: 56, step: 1433, loss: 0.32594582438468933, mean loss: 0.3408041707212715
Epoch: 56, step: 1434, loss: 0.40331998467445374, mean loss: 0.3408049303394194
Epoch: 56, step: 1435, loss: 0.3268603980541229, mean loss: 0.34080476090403317
Epoch: 56, step: 1436, loss: 0.33913037180900574, mean loss: 0.3408047405593339
Epoch: 56, step: 1437, loss: 0.3363437354564667, mean loss: 0.3408046863564579
Epoch: 56, step: 1438, loss: 0.30747583508491516, mean loss: 0.3408042814034031
Epoch: 56, step: 1439, loss: 0.33822494745254517, mean loss: 0.340804250064295
Epoch: 56, step: 1440, loss: 0.33074378967285156, mean loss: 0.3408041278304041
Epoch: 56, step: 1441, loss: 0.32759639620780945, mean loss: 0.3408039673593373
Epoch: 56, step: 1442, loss: 0.33711934089660645, mean loss: 0.34080392259247105
Epoch: 56, step: 1443, loss: 0.35692065954208374, mean loss: 0.3408041184025618
Valid: 56, mean loss: 0.1852300763130188
Epoch: 57, step: 0, loss: 0.33769458532333374, mean loss: 0.3408040806237882
Epoch: 57, step: 1, loss: 0.33377549052238464, mean loss: 0.34080399523209703
Epoch: 57, step: 2, loss: 0.3425164222717285, mean loss: 0.34080401603644933
Epoch: 57, step: 3, loss: 0.3164491653442383, mean loss: 0.34080372015187976
Epoch: 57, step: 4, loss: 0.334047794342041, mean loss: 0.3408036380758309
Epoch: 57, step: 5, loss: 0.29043081402778625, mean loss: 0.34080302611645524
Epoch: 57, step: 6, loss: 0.3074764311313629, mean loss: 0.34080262124984545
Epoch: 57, step: 7, loss: 0.3781524896621704, mean loss: 0.3408030749874956
Epoch: 57, step: 8, loss: 0.3282495141029358, mean loss: 0.3408029224848427
Epoch: 57, step: 9, loss: 0.3725242018699646, mean loss: 0.3408033078353053
Epoch: 57, step: 10, loss: 0.3226017951965332, mean loss: 0.3408030867258089
Epoch: 57, step: 11, loss: 0.3157753348350525, mean loss: 0.34080278269578107
Epoch: 57, step: 12, loss: 0.3007289171218872, mean loss: 0.3408022958957474
Epoch: 57, step: 13, loss: 0.32126420736312866, mean loss: 0.34080205855835843
Epoch: 57, step: 14, loss: 0.31697940826416016, mean loss: 0.3408017691781088
Epoch: 57, step: 15, loss: 0.330183207988739, mean loss: 0.34080164019310816
Epoch: 57, step: 16, loss: 0.3630176782608032, mean loss: 0.3408019100508436
Epoch: 57, step: 17, loss: 0.3025816082954407, mean loss: 0.3408014457953015
Epoch: 57, step: 18, loss: 0.3090086579322815, mean loss: 0.3408010596183746
Epoch: 57, step: 19, loss: 0.3742201626300812, mean loss: 0.340801465544706
Epoch: 57, step: 20, loss: 0.31625834107398987, mean loss: 0.34080116743438676
Epoch: 57, step: 21, loss: 0.3262578845024109, mean loss: 0.34080099078817117
Epoch: 57, step: 22, loss: 0.32704153656959534, mean loss: 0.3408008236645577
Epoch: 57, step: 23, loss: 0.33749642968177795, mean loss: 0.3408007835295679
Epoch: 57, step: 24, loss: 0.3388451337814331, mean loss: 0.34080075977664076
Epoch: 57, step: 25, loss: 0.34046486020088196, mean loss: 0.34080075569692186
Epoch: 57, step: 26, loss: 0.35069650411605835, mean loss: 0.34080087588576524
Epoch: 57, step: 27, loss: 0.3568999767303467, mean loss: 0.3408010714150701
Epoch: 57, step: 28, loss: 0.34344208240509033, mean loss: 0.3408011034906982
Epoch: 57, step: 29, loss: 0.3063008785247803, mean loss: 0.34080068448337514
Epoch: 57, step: 30, loss: 0.36891549825668335, mean loss: 0.34080102593534534
Epoch: 57, step: 31, loss: 0.30455467104911804, mean loss: 0.34080058573186117
Epoch: 57, step: 32, loss: 0.35184839367866516, mean loss: 0.34080071990326966
Epoch: 57, step: 33, loss: 0.2968110740184784, mean loss: 0.3408001856723075
Epoch: 57, step: 34, loss: 0.32557985186576843, mean loss: 0.3408000008316555
Epoch: 57, step: 35, loss: 0.348458856344223, mean loss: 0.34080009384214216
Epoch: 57, step: 36, loss: 0.35267797112464905, mean loss: 0.34080023808741855
Epoch: 57, step: 37, loss: 0.35328617691993713, mean loss: 0.3408003897151701
Epoch: 57, step: 38, loss: 0.3205853998661041, mean loss: 0.3408001442297262
Epoch: 57, step: 39, loss: 0.30755943059921265, mean loss: 0.34079974056826956
Epoch: 57, step: 40, loss: 0.34946316480636597, mean loss: 0.3407998457720272
Epoch: 57, step: 41, loss: 0.31348705291748047, mean loss: 0.34079951410484016
Epoch: 57, step: 42, loss: 0.3219760060310364, mean loss: 0.3407992855282828
Epoch: 57, step: 43, loss: 0.34335818886756897, mean loss: 0.34079931660103563
Epoch: 57, step: 44, loss: 0.3271329998970032, mean loss: 0.34079915065302274
Epoch: 57, step: 45, loss: 0.34030672907829285, mean loss: 0.34079914467369476
Epoch: 57, step: 46, loss: 0.32314532995224, mean loss: 0.34079893031130365
Epoch: 57, step: 47, loss: 0.3288343846797943, mean loss: 0.3407987850329313
Epoch: 57, step: 48, loss: 0.3467715084552765, mean loss: 0.3407988575552843
Epoch: 57, step: 49, loss: 0.33328336477279663, mean loss: 0.34079876630133465
Epoch: 57, step: 50, loss: 0.3039538860321045, mean loss: 0.3407983189321307
Epoch: 57, step: 51, loss: 0.3667928874492645, mean loss: 0.3407986345534094
Epoch: 57, step: 52, loss: 0.34113073348999023, mean loss: 0.3407986385856448
Epoch: 57, step: 53, loss: 0.3460122346878052, mean loss: 0.34079870188663436
Epoch: 57, step: 54, loss: 0.33281564712524414, mean loss: 0.34079860496137954
Epoch: 57, step: 55, loss: 0.3021174669265747, mean loss: 0.3407981353249117
Epoch: 57, step: 56, loss: 0.32137927412986755, mean loss: 0.3407978995589772
Epoch: 57, step: 57, loss: 0.32694000005722046, mean loss: 0.34079773131116253
Epoch: 57, step: 58, loss: 0.37418919801712036, mean loss: 0.3407981367097652
Epoch: 57, step: 59, loss: 0.33651551604270935, mean loss: 0.3407980847160217
Epoch: 57, step: 60, loss: 0.32493650913238525, mean loss: 0.3407978921487259
Epoch: 57, step: 61, loss: 0.2933180034160614, mean loss: 0.3407973157266216
Epoch: 57, step: 62, loss: 0.31575217843055725, mean loss: 0.34079701167377174
Epoch: 57, step: 63, loss: 0.35168755054473877, mean loss: 0.3407971438854319
Epoch: 57, step: 64, loss: 0.3067096173763275, mean loss: 0.3407967300662617
Epoch: 57, step: 65, loss: 0.33037880063056946, mean loss: 0.34079660359517333
Epoch: 57, step: 66, loss: 0.3316127359867096, mean loss: 0.3407964921066439
Epoch: 57, step: 67, loss: 0.4221274256706238, mean loss: 0.34079747942010374
Epoch: 57, step: 68, loss: 0.33199766278266907, mean loss: 0.3407973725963952
Epoch: 57, step: 69, loss: 0.33118918538093567, mean loss: 0.34079725596104093
Epoch: 57, step: 70, loss: 0.343255877494812, mean loss: 0.3407972858062871
Epoch: 57, step: 71, loss: 0.2914891839027405, mean loss: 0.34079668726171436
Epoch: 57, step: 72, loss: 0.41826415061950684, mean loss: 0.3407976276176624
Epoch: 57, step: 73, loss: 0.29778653383255005, mean loss: 0.3407971055243194
Epoch: 57, step: 74, loss: 0.3618357479572296, mean loss: 0.3407973609003367
Epoch: 57, step: 75, loss: 0.3197048008441925, mean loss: 0.34079710487295206
Epoch: 57, step: 76, loss: 0.3340931832790375, mean loss: 0.34079702349986724
Epoch: 57, step: 77, loss: 0.3762810230255127, mean loss: 0.34079745420410734
Epoch: 57, step: 78, loss: 0.3398509621620178, mean loss: 0.340797442715741
Epoch: 57, step: 79, loss: 0.3178710341453552, mean loss: 0.34079716444210195
Epoch: 57, step: 80, loss: 0.3613462448120117, mean loss: 0.340797413857441
Epoch: 57, step: 81, loss: 0.34892764687538147, mean loss: 0.3407975125372931
Epoch: 57, step: 82, loss: 0.3359118700027466, mean loss: 0.34079745323903804
Epoch: 57, step: 83, loss: 0.32799413800239563, mean loss: 0.34079729784391183
Epoch: 57, step: 84, loss: 0.30834725499153137, mean loss: 0.3407969039992545
Epoch: 57, step: 85, loss: 0.33520936965942383, mean loss: 0.34079683618443374
Epoch: 57, step: 86, loss: 0.3477502465248108, mean loss: 0.3407969205756024
Epoch: 57, step: 87, loss: 0.33514291048049927, mean loss: 0.34079685195564396
Epoch: 57, step: 88, loss: 0.3440420925617218, mean loss: 0.34079689134106583
Epoch: 57, step: 89, loss: 0.30182522535324097, mean loss: 0.3407964183724745
Epoch: 57, step: 90, loss: 0.3723387122154236, mean loss: 0.3407968011719483
Epoch: 57, step: 91, loss: 0.34112873673439026, mean loss: 0.34079680520029254
Epoch: 57, step: 92, loss: 0.3271425664424896, mean loss: 0.34079663949552247
Epoch: 57, step: 93, loss: 0.3201562166213989, mean loss: 0.3407963890110333
Epoch: 57, step: 94, loss: 0.31627270579338074, mean loss: 0.34079609140435374
Epoch: 57, step: 95, loss: 0.31392961740493774, mean loss: 0.34079576537073886
Epoch: 57, step: 96, loss: 0.33255377411842346, mean loss: 0.3407956653526422
Epoch: 57, step: 97, loss: 0.33029696345329285, mean loss: 0.3407955379504883
Epoch: 57, step: 98, loss: 0.3276539444923401, mean loss: 0.34079537847867813
Epoch: 57, step: 99, loss: 0.3278963565826416, mean loss: 0.340795221952347
Epoch: 57, step: 100, loss: 0.2984135150909424, mean loss: 0.3407947076674162
Epoch: 57, step: 101, loss: 0.3294134736061096, mean loss: 0.34079456956240395
Epoch: 57, step: 102, loss: 0.3465251922607422, mean loss: 0.3407946390995131
Epoch: 57, step: 103, loss: 0.3433677554130554, mean loss: 0.3407946703221058
Epoch: 57, step: 104, loss: 0.33186042308807373, mean loss: 0.3407945619138785
Epoch: 57, step: 105, loss: 0.29805049300193787, mean loss: 0.3407940432632984
Epoch: 57, step: 106, loss: 0.3390302360057831, mean loss: 0.3407940218617664
Epoch: 57, step: 107, loss: 0.37507879734039307, mean loss: 0.34079443785836266
Epoch: 57, step: 108, loss: 0.3654993772506714, mean loss: 0.34079473761374557
Epoch: 57, step: 109, loss: 0.3547407388687134, mean loss: 0.34079490682437014
Epoch: 57, step: 110, loss: 0.30369043350219727, mean loss: 0.3407944566311705
Epoch: 57, step: 111, loss: 0.32972827553749084, mean loss: 0.340794322365445
Epoch: 57, step: 112, loss: 0.32233572006225586, mean loss: 0.34079409841035707
Epoch: 57, step: 113, loss: 0.3246625065803528, mean loss: 0.3407939026908668
Epoch: 57, step: 114, loss: 0.3268889784812927, mean loss: 0.34079373398887575
Epoch: 57, step: 115, loss: 0.3047831952571869, mean loss: 0.34079329709502526
Epoch: 57, step: 116, loss: 0.3041979670524597, mean loss: 0.3407928531116459
Epoch: 57, step: 117, loss: 0.32380810379981995, mean loss: 0.3407926470510666
Epoch: 57, step: 118, loss: 0.3536873459815979, mean loss: 0.3407928034888713
Epoch: 57, step: 119, loss: 0.3619879186153412, mean loss: 0.34079306062376635
Epoch: 57, step: 120, loss: 0.29385998845100403, mean loss: 0.34079249124803485
Epoch: 57, step: 121, loss: 0.31584468483924866, mean loss: 0.3407921885935837
Epoch: 57, step: 122, loss: 0.3638685941696167, mean loss: 0.3407924685417291
Epoch: 57, step: 123, loss: 0.3554348051548004, mean loss: 0.34079264617100674
Epoch: 57, step: 124, loss: 0.30533668398857117, mean loss: 0.3407922160524598
Epoch: 57, step: 125, loss: 0.38086551427841187, mean loss: 0.34079270217830865
Epoch: 57, step: 126, loss: 0.3483434319496155, mean loss: 0.3407927937744725
Epoch: 57, step: 127, loss: 0.3301767110824585, mean loss: 0.3407926649947805
Epoch: 57, step: 128, loss: 0.3458588421344757, mean loss: 0.34079272644991765
Epoch: 57, step: 129, loss: 0.2999073266983032, mean loss: 0.3407922304965982
Epoch: 57, step: 130, loss: 0.35501018166542053, mean loss: 0.3407924029629208
Epoch: 57, step: 131, loss: 0.31924378871917725, mean loss: 0.34079214157749815
Epoch: 57, step: 132, loss: 0.3189510405063629, mean loss: 0.34079187664741395
Epoch: 57, step: 133, loss: 0.35985827445983887, mean loss: 0.34079210791785636
Epoch: 57, step: 134, loss: 0.34745368361473083, mean loss: 0.3407921887200554
Epoch: 57, step: 135, loss: 0.2821682393550873, mean loss: 0.34079147764406
Epoch: 57, step: 136, loss: 0.29517409205436707, mean loss: 0.34079092433718156
Epoch: 57, step: 137, loss: 0.4013669192790985, mean loss: 0.3407916590725834
Epoch: 57, step: 138, loss: 0.3178689777851105, mean loss: 0.3407913810432884
Epoch: 57, step: 139, loss: 0.3323080241680145, mean loss: 0.34079127814986615
Epoch: 57, step: 140, loss: 0.37236809730529785, mean loss: 0.3407916611359443
Epoch: 57, step: 141, loss: 0.32727718353271484, mean loss: 0.34079149722475444
Epoch: 57, step: 142, loss: 0.3408737778663635, mean loss: 0.3407914982226883
Epoch: 57, step: 143, loss: 0.36703261733055115, mean loss: 0.34079181648202833
Epoch: 57, step: 144, loss: 0.3239510655403137, mean loss: 0.3407916122353552
Epoch: 57, step: 145, loss: 0.3267844021320343, mean loss: 0.34079144235626985
Epoch: 57, step: 146, loss: 0.311029851436615, mean loss: 0.340791081412835
Epoch: 57, step: 147, loss: 0.35790351033210754, mean loss: 0.34079128894690064
Epoch: 57, step: 148, loss: 0.3382027745246887, mean loss: 0.3407912575546062
Epoch: 57, step: 149, loss: 0.3190345764160156, mean loss: 0.3407909937029346
Epoch: 57, step: 150, loss: 0.3267686367034912, mean loss: 0.34079082365046004
Epoch: 57, step: 151, loss: 0.31038981676101685, mean loss: 0.34079045497465493
Epoch: 57, step: 152, loss: 0.32278338074684143, mean loss: 0.3407902366038587
Epoch: 57, step: 153, loss: 0.31163451075553894, mean loss: 0.3407898830382667
Epoch: 57, step: 154, loss: 0.31689897179603577, mean loss: 0.3407895933215302
Epoch: 57, step: 155, loss: 0.3401629328727722, mean loss: 0.3407895857223299
Epoch: 57, step: 156, loss: 0.3370150029659271, mean loss: 0.3407895399503933
Epoch: 57, step: 157, loss: 0.40221959352493286, mean loss: 0.340790284864098
Epoch: 57, step: 158, loss: 0.3358196020126343, mean loss: 0.34079022458928687
Epoch: 57, step: 159, loss: 0.33766448497772217, mean loss: 0.3407901866868324
Epoch: 57, step: 160, loss: 0.3063787817955017, mean loss: 0.340789769422104
Epoch: 57, step: 161, loss: 0.33971601724624634, mean loss: 0.34078975640219156
Epoch: 57, step: 162, loss: 0.3018563687801361, mean loss: 0.34078928431639627
Epoch: 57, step: 163, loss: 0.33626094460487366, mean loss: 0.34078922940879475
Epoch: 57, step: 164, loss: 0.3190612196922302, mean loss: 0.34078896595275804
Epoch: 57, step: 165, loss: 0.3293912708759308, mean loss: 0.3407888277553252
Epoch: 57, step: 166, loss: 0.32001450657844543, mean loss: 0.3407885758690424
Epoch: 57, step: 167, loss: 0.31732144951820374, mean loss: 0.3407882913362528
Epoch: 57, step: 168, loss: 0.340419203042984, mean loss: 0.34078828686120777
Epoch: 57, step: 169, loss: 0.33515533804893494, mean loss: 0.340788218564828
Epoch: 57, step: 170, loss: 0.3405177593231201, mean loss: 0.34078821528569947
Epoch: 57, step: 171, loss: 0.40300899744033813, mean loss: 0.34078896965987693
Epoch: 57, step: 172, loss: 0.49083808064460754, mean loss: 0.34079078885594616
Epoch: 57, step: 173, loss: 0.31138721108436584, mean loss: 0.34079043237116435
Epoch: 57, step: 174, loss: 0.3118199408054352, mean loss: 0.3407900811413162
Epoch: 57, step: 175, loss: 0.35718387365341187, mean loss: 0.3407902798924984
Epoch: 57, step: 176, loss: 0.3164207637310028, mean loss: 0.340789984450707
Epoch: 57, step: 177, loss: 0.341467946767807, mean loss: 0.34078999266982685
Epoch: 57, step: 178, loss: 0.33631861209869385, mean loss: 0.34078993846273276
Epoch: 57, step: 179, loss: 0.3401300013065338, mean loss: 0.3407899304623308
Epoch: 57, step: 180, loss: 0.32306522130966187, mean loss: 0.34078971558872156
Epoch: 57, step: 181, loss: 0.32263267040252686, mean loss: 0.3407894954766451
Epoch: 57, step: 182, loss: 0.3393861651420593, mean loss: 0.3407894784647246
Epoch: 57, step: 183, loss: 0.31913527846336365, mean loss: 0.3407892159641185
Epoch: 57, step: 184, loss: 0.32113054394721985, mean loss: 0.3407889776569649
Epoch: 57, step: 185, loss: 0.2994788885116577, mean loss: 0.3407884768921924
Epoch: 57, step: 186, loss: 0.2984361946582794, mean loss: 0.34078796350008095
Epoch: 57, step: 187, loss: 0.3704068064689636, mean loss: 0.34078832253376706
Epoch: 57, step: 188, loss: 0.308824747800827, mean loss: 0.34078793508240846
Epoch: 57, step: 189, loss: 0.351585328578949, mean loss: 0.34078806596307826
Epoch: 57, step: 190, loss: 0.3619965612888336, mean loss: 0.3407883230388649
Epoch: 57, step: 191, loss: 0.3309789001941681, mean loss: 0.3407882041367698
Epoch: 57, step: 192, loss: 0.3435346484184265, mean loss: 0.3407882374266
Epoch: 57, step: 193, loss: 0.36758720874786377, mean loss: 0.3407885622547414
Epoch: 57, step: 194, loss: 0.3277970850467682, mean loss: 0.3407884047880165
Epoch: 57, step: 195, loss: 0.39205336570739746, mean loss: 0.3407890261513555
Epoch: 57, step: 196, loss: 0.29685577750205994, mean loss: 0.34078849365940167
Epoch: 57, step: 197, loss: 0.3786473572254181, mean loss: 0.34078895252134583
Epoch: 57, step: 198, loss: 0.31945040822029114, mean loss: 0.34078869389426814
Epoch: 57, step: 199, loss: 0.3677029311656952, mean loss: 0.3407890200958155
Epoch: 57, step: 200, loss: 0.32336732745170593, mean loss: 0.3407888089468179
Epoch: 57, step: 201, loss: 0.3128487169742584, mean loss: 0.3407884703200821
Epoch: 57, step: 202, loss: 0.3478173315525055, mean loss: 0.3407885555070418
Epoch: 57, step: 203, loss: 0.3313072919845581, mean loss: 0.3407884405993493
Epoch: 57, step: 204, loss: 0.345319539308548, mean loss: 0.34078849551310486
Epoch: 57, step: 205, loss: 0.33180490136146545, mean loss: 0.34078838663953004
Epoch: 57, step: 206, loss: 0.30095723271369934, mean loss: 0.34078790392543046
Epoch: 57, step: 207, loss: 0.3144020736217499, mean loss: 0.34078758415919963
Epoch: 57, step: 208, loss: 0.36880359053611755, mean loss: 0.3407879236771944
Epoch: 57, step: 209, loss: 0.3493499457836151, mean loss: 0.3407880274366421
Epoch: 57, step: 210, loss: 0.3619842529296875, mean loss: 0.3407882843014307
Epoch: 57, step: 211, loss: 0.32924431562423706, mean loss: 0.3407881444084511
Epoch: 57, step: 212, loss: 0.31386464834213257, mean loss: 0.3407878181460929
Epoch: 57, step: 213, loss: 0.32980218529701233, mean loss: 0.3407876850224065
Epoch: 57, step: 214, loss: 0.32222065329551697, mean loss: 0.34078746003020155
Epoch: 57, step: 215, loss: 0.33740565180778503, mean loss: 0.3407874190505081
Epoch: 57, step: 216, loss: 0.3121482729911804, mean loss: 0.34078707201450614
Epoch: 57, step: 217, loss: 0.3353976309299469, mean loss: 0.3407870067085288
Epoch: 57, step: 218, loss: 0.3205832839012146, mean loss: 0.3407867618950398
Epoch: 57, step: 219, loss: 0.3210337460041046, mean loss: 0.34078652254577785
Epoch: 57, step: 220, loss: 0.3505239188671112, mean loss: 0.3407866405333497
Epoch: 57, step: 221, loss: 0.33608177304267883, mean loss: 0.34078658352538305
Epoch: 57, step: 222, loss: 0.32069340348243713, mean loss: 0.3407863400631683
Epoch: 57, step: 223, loss: 0.3704858124256134, mean loss: 0.34078669991719296
Epoch: 57, step: 224, loss: 0.3404477536678314, mean loss: 0.3407866958103963
Epoch: 57, step: 225, loss: 0.33788183331489563, mean loss: 0.3407866606144468
Epoch: 57, step: 226, loss: 0.3200613558292389, mean loss: 0.3407864095051624
Epoch: 57, step: 227, loss: 0.3439611494541168, mean loss: 0.34078644797007407
Epoch: 57, step: 228, loss: 0.36723294854164124, mean loss: 0.34078676839001387
Epoch: 57, step: 229, loss: 0.31495746970176697, mean loss: 0.3407864554517468
Epoch: 57, step: 230, loss: 0.31640833616256714, mean loss: 0.3407861600990131
Epoch: 57, step: 231, loss: 0.3432556688785553, mean loss: 0.3407861900179467
Epoch: 57, step: 232, loss: 0.3265262246131897, mean loss: 0.34078601725573876
Epoch: 57, step: 233, loss: 0.3678740859031677, mean loss: 0.3407863454288948
Epoch: 57, step: 234, loss: 0.344320684671402, mean loss: 0.3407863882470531
Epoch: 57, step: 235, loss: 0.3339740037918091, mean loss: 0.34078630571671226
Epoch: 57, step: 236, loss: 0.33460092544555664, mean loss: 0.34078623078327874
Epoch: 57, step: 237, loss: 0.3201330006122589, mean loss: 0.3407859805806018
Epoch: 57, step: 238, loss: 0.30300164222717285, mean loss: 0.34078552284938984
Epoch: 57, step: 239, loss: 0.3706395626068115, mean loss: 0.34078588450611996
Epoch: 57, step: 240, loss: 0.36831051111221313, mean loss: 0.34078621793991815
Epoch: 57, step: 241, loss: 0.34162771701812744, mean loss: 0.3407862281337289
Epoch: 57, step: 242, loss: 0.3562038540840149, mean loss: 0.3407864148985888
Epoch: 57, step: 243, loss: 0.304129958152771, mean loss: 0.34078597085778123
Epoch: 57, step: 244, loss: 0.3422640562057495, mean loss: 0.34078598876246485
Epoch: 57, step: 245, loss: 0.323427677154541, mean loss: 0.3407857784963165
Epoch: 57, step: 246, loss: 0.354095458984375, mean loss: 0.3407859397182957
Epoch: 57, step: 247, loss: 0.3056514859199524, mean loss: 0.3407855141350092
Epoch: 57, step: 248, loss: 0.30371400713920593, mean loss: 0.34078506509365597
Epoch: 57, step: 249, loss: 0.32642000913619995, mean loss: 0.34078489109409255
Epoch: 57, step: 250, loss: 0.32215428352355957, mean loss: 0.3407846654299303
Epoch: 57, step: 251, loss: 0.3035464584827423, mean loss: 0.340784214385757
Epoch: 57, step: 252, loss: 0.33027002215385437, mean loss: 0.34078408703516494
Epoch: 57, step: 253, loss: 0.3534858524799347, mean loss: 0.3407842408803412
Epoch: 57, step: 254, loss: 0.31445589661598206, mean loss: 0.34078392199241
Epoch: 57, step: 255, loss: 0.31084877252578735, mean loss: 0.34078355942337907
Epoch: 57, step: 256, loss: 0.3452431857585907, mean loss: 0.3407836134368997
Epoch: 57, step: 257, loss: 0.313381165266037, mean loss: 0.3407832815515211
Epoch: 57, step: 258, loss: 0.3249645531177521, mean loss: 0.34078308996494977
Epoch: 57, step: 259, loss: 0.32219335436820984, mean loss: 0.340782864820395
Epoch: 57, step: 260, loss: 0.33803898096084595, mean loss: 0.34078283158899025
Epoch: 57, step: 261, loss: 0.339544415473938, mean loss: 0.3407828165906117
Epoch: 57, step: 262, loss: 0.3299593925476074, mean loss: 0.3407826855104014
Epoch: 57, step: 263, loss: 0.3025500178337097, mean loss: 0.34078222248821866
Epoch: 57, step: 264, loss: 0.32672247290611267, mean loss: 0.3407820522176752
Epoch: 57, step: 265, loss: 0.317678302526474, mean loss: 0.3407817724231916
Epoch: 57, step: 266, loss: 0.3262665569782257, mean loss: 0.34078159664098817
Epoch: 57, step: 267, loss: 0.31625616550445557, mean loss: 0.340781299636639
Epoch: 57, step: 268, loss: 0.33350297808647156, mean loss: 0.34078121149682344
Epoch: 57, step: 269, loss: 0.3474968671798706, mean loss: 0.3407812928218214
Epoch: 57, step: 270, loss: 0.3077855706214905, mean loss: 0.3407808932562878
Epoch: 57, step: 271, loss: 0.33003175258636475, mean loss: 0.3407807630898956
Epoch: 57, step: 272, loss: 0.3147924244403839, mean loss: 0.34078044838870947
Epoch: 57, step: 273, loss: 0.3040372431278229, mean loss: 0.3407800034587579
Epoch: 57, step: 274, loss: 0.3329419195652008, mean loss: 0.3407799085471672
Epoch: 57, step: 275, loss: 0.32402145862579346, mean loss: 0.3407797056210566
Epoch: 57, step: 276, loss: 0.3991779685020447, mean loss: 0.34078041275023113
Epoch: 57, step: 277, loss: 0.33386707305908203, mean loss: 0.34078032903943645
Epoch: 57, step: 278, loss: 0.3165540397167206, mean loss: 0.34078003569678783
Epoch: 57, step: 279, loss: 0.32490670680999756, mean loss: 0.34077984349781354
Epoch: 57, step: 280, loss: 0.3598553240299225, mean loss: 0.3407800744665931
Epoch: 57, step: 281, loss: 0.31148725748062134, mean loss: 0.3407797197890657
Epoch: 57, step: 282, loss: 0.3297918736934662, mean loss: 0.34077958674979875
Epoch: 57, step: 283, loss: 0.28676337003707886, mean loss: 0.34077893273710125
Epoch: 57, step: 284, loss: 0.32294195890426636, mean loss: 0.3407787167748062
Epoch: 57, step: 285, loss: 0.35210078954696655, mean loss: 0.3407788538558626
Epoch: 57, step: 286, loss: 0.3279755115509033, mean loss: 0.3407786988423351
Epoch: 57, step: 287, loss: 0.3095201849937439, mean loss: 0.34077832039163714
Epoch: 57, step: 288, loss: 0.29608896374702454, mean loss: 0.34077777933861286
Epoch: 57, step: 289, loss: 0.3554563522338867, mean loss: 0.34077795704960945
Epoch: 57, step: 290, loss: 0.35977602005004883, mean loss: 0.3407781870531567
Epoch: 57, step: 291, loss: 0.3386991620063782, mean loss: 0.34077816188336196
Epoch: 57, step: 292, loss: 0.33486637473106384, mean loss: 0.3407780903129554
Epoch: 57, step: 293, loss: 0.29923754930496216, mean loss: 0.34077758741301345
Epoch: 57, step: 294, loss: 0.34338507056236267, mean loss: 0.3407776189794596
Epoch: 57, step: 295, loss: 0.3845583200454712, mean loss: 0.34077814898649395
Epoch: 57, step: 296, loss: 0.3263966739177704, mean loss: 0.340777974887165
Epoch: 57, step: 297, loss: 0.3759981095790863, mean loss: 0.3407784012500768
Epoch: 57, step: 298, loss: 0.32595953345298767, mean loss: 0.3407782218601002
Epoch: 57, step: 299, loss: 0.320639044046402, mean loss: 0.340777978068
Epoch: 57, step: 300, loss: 0.2962042987346649, mean loss: 0.34077743849386966
Epoch: 57, step: 301, loss: 0.41414952278137207, mean loss: 0.3407783266682346
Epoch: 57, step: 302, loss: 0.3138457238674164, mean loss: 0.3407780006510843
Epoch: 57, step: 303, loss: 0.32797467708587646, mean loss: 0.3407778456696825
Epoch: 57, step: 304, loss: 0.34787675738334656, mean loss: 0.34077793159939956
Epoch: 57, step: 305, loss: 0.35501545667648315, mean loss: 0.34077810393732144
Epoch: 57, step: 306, loss: 0.3470505177974701, mean loss: 0.3407781798607477
Epoch: 57, step: 307, loss: 0.3090003728866577, mean loss: 0.3407777952160424
Epoch: 57, step: 308, loss: 0.3102128505706787, mean loss: 0.3407774252565347
Epoch: 57, step: 309, loss: 0.3259449601173401, mean loss: 0.3407772457258617
Epoch: 57, step: 310, loss: 0.29436245560646057, mean loss: 0.34077668393268923
Epoch: 57, step: 311, loss: 0.3478659987449646, mean loss: 0.34077676973896875
Epoch: 57, step: 312, loss: 0.3445427119731903, mean loss: 0.3407768153199014
Epoch: 57, step: 313, loss: 0.3584398627281189, mean loss: 0.34077702910130836
Epoch: 57, step: 314, loss: 0.3259342908859253, mean loss: 0.3407768494571631
Epoch: 57, step: 315, loss: 0.2995917797088623, mean loss: 0.3407763509934026
Epoch: 57, step: 316, loss: 0.3514864444732666, mean loss: 0.34077648061631916
Epoch: 57, step: 317, loss: 0.33440101146698, mean loss: 0.34077640345575044
Epoch: 57, step: 318, loss: 0.3462037742137909, mean loss: 0.3407764691409473
Epoch: 57, step: 319, loss: 0.3465455174446106, mean loss: 0.34077653896047944
Epoch: 57, step: 320, loss: 0.3420015573501587, mean loss: 0.34077655378600546
Epoch: 57, step: 321, loss: 0.3008265793323517, mean loss: 0.3407760703057386
Epoch: 57, step: 322, loss: 0.3324597477912903, mean loss: 0.34077596966164
Epoch: 57, step: 323, loss: 0.3420439660549164, mean loss: 0.34077598500674106
Epoch: 57, step: 324, loss: 0.35140517354011536, mean loss: 0.34077611363802074
Epoch: 57, step: 325, loss: 0.34210526943206787, mean loss: 0.34077612972287435
Epoch: 57, step: 326, loss: 0.34368160367012024, mean loss: 0.3407761648832053
Epoch: 57, step: 327, loss: 0.29625385999679565, mean loss: 0.3407756261070679
Epoch: 57, step: 328, loss: 0.30995386838912964, mean loss: 0.3407752531293737
Epoch: 57, step: 329, loss: 0.3349817991256714, mean loss: 0.3407751830229577
Epoch: 57, step: 330, loss: 0.32304611802101135, mean loss: 0.3407749684866612
Epoch: 57, step: 331, loss: 0.3128952383995056, mean loss: 0.3407746311230348
Epoch: 57, step: 332, loss: 0.32059741020202637, mean loss: 0.34077438696794327
Epoch: 57, step: 333, loss: 0.30210813879966736, mean loss: 0.34077391909146193
Epoch: 57, step: 334, loss: 0.31653571128845215, mean loss: 0.34077362580336973
Epoch: 57, step: 335, loss: 0.30656197667121887, mean loss: 0.3407732118392691
Epoch: 57, step: 336, loss: 0.33921679854393005, mean loss: 0.340773193006753
Epoch: 57, step: 337, loss: 0.32478097081184387, mean loss: 0.3407729995040766
Epoch: 57, step: 338, loss: 0.3629860281944275, mean loss: 0.34077326827401005
Epoch: 57, step: 339, loss: 0.3188255727291107, mean loss: 0.34077300271772865
Epoch: 57, step: 340, loss: 0.3276815116405487, mean loss: 0.3407728443190659
Epoch: 57, step: 341, loss: 0.3378585875034332, mean loss: 0.3407728090588503
Epoch: 57, step: 342, loss: 0.29619213938713074, mean loss: 0.3407722696743338
Epoch: 57, step: 343, loss: 0.3535301089286804, mean loss: 0.34077242403042024
Epoch: 57, step: 344, loss: 0.31611549854278564, mean loss: 0.3407721257118415
Epoch: 57, step: 345, loss: 0.3159499764442444, mean loss: 0.34077182539789097
Epoch: 57, step: 346, loss: 0.31625252962112427, mean loss: 0.3407715287516412
Epoch: 57, step: 347, loss: 0.31695058941841125, mean loss: 0.34077124055793073
Epoch: 57, step: 348, loss: 0.34770467877388, mean loss: 0.340771324439976
Epoch: 57, step: 349, loss: 0.3063928484916687, mean loss: 0.34077090852771164
Epoch: 57, step: 350, loss: 0.29590144753456116, mean loss: 0.34077036570163105
Epoch: 57, step: 351, loss: 0.3349277675151825, mean loss: 0.3407702950193399
Epoch: 57, step: 352, loss: 0.3387387990951538, mean loss: 0.3407702704431078
Epoch: 57, step: 353, loss: 0.30841949582099915, mean loss: 0.3407698790809992
Epoch: 57, step: 354, loss: 0.32639065384864807, mean loss: 0.340769705131043
Epoch: 57, step: 355, loss: 0.3033381700515747, mean loss: 0.34076925231560845
Epoch: 57, step: 356, loss: 0.3378657102584839, mean loss: 0.3407692171914077
Epoch: 57, step: 357, loss: 0.325374573469162, mean loss: 0.34076903096437694
Epoch: 57, step: 358, loss: 0.3244752287864685, mean loss: 0.340768833862726
Epoch: 57, step: 359, loss: 0.33232009410858154, mean loss: 0.3407687316618774
Epoch: 57, step: 360, loss: 0.33750155568122864, mean loss: 0.3407686921407028
Epoch: 57, step: 361, loss: 0.33963891863822937, mean loss: 0.34076867847463893
Epoch: 57, step: 362, loss: 0.3293183147907257, mean loss: 0.34076853996943535
Epoch: 57, step: 363, loss: 0.30655980110168457, mean loss: 0.34076812618074187
Epoch: 57, step: 364, loss: 0.33545103669166565, mean loss: 0.3407680618660383
Epoch: 57, step: 365, loss: 0.3224138915538788, mean loss: 0.34076783985947867
Epoch: 57, step: 366, loss: 0.3277830481529236, mean loss: 0.34076768280121794
Epoch: 57, step: 367, loss: 0.33633026480674744, mean loss: 0.34076762912883424
Epoch: 57, step: 368, loss: 0.3125181198120117, mean loss: 0.3407672874436096
Epoch: 57, step: 369, loss: 0.3593394160270691, mean loss: 0.3407675120756591
Epoch: 57, step: 370, loss: 0.3278893530368805, mean loss: 0.3407673563147157
Epoch: 57, step: 371, loss: 0.35056304931640625, mean loss: 0.3407674747918928
Epoch: 57, step: 372, loss: 0.3396245837211609, mean loss: 0.3407674609689943
Epoch: 57, step: 373, loss: 0.3255976736545563, mean loss: 0.3407672774975336
Epoch: 57, step: 374, loss: 0.31598496437072754, mean loss: 0.3407669777707079
Epoch: 57, step: 375, loss: 0.35135310888290405, mean loss: 0.3407671058019003
Epoch: 57, step: 376, loss: 0.2977887988090515, mean loss: 0.34076658601829996
Epoch: 57, step: 377, loss: 0.34190624952316284, mean loss: 0.34076659980132856
Epoch: 57, step: 378, loss: 0.32299262285232544, mean loss: 0.34076638484641486
Epoch: 57, step: 379, loss: 0.3203794062137604, mean loss: 0.34076613829336444
Epoch: 57, step: 380, loss: 0.3231765329837799, mean loss: 0.34076592557334956
Epoch: 57, step: 381, loss: 0.32423362135887146, mean loss: 0.34076572564223073
Epoch: 57, step: 382, loss: 0.3981688618659973, mean loss: 0.3407664198306699
Epoch: 57, step: 383, loss: 0.33946460485458374, mean loss: 0.34076640408773257
Epoch: 57, step: 384, loss: 0.2877933382987976, mean loss: 0.34076576348857923
Epoch: 57, step: 385, loss: 0.32351866364479065, mean loss: 0.34076555492326804
Epoch: 57, step: 386, loss: 0.32668060064315796, mean loss: 0.3407653845991338
Epoch: 57, step: 387, loss: 0.31696435809135437, mean loss: 0.34076509678561795
Epoch: 57, step: 388, loss: 0.3090832829475403, mean loss: 0.3407647136784455
Epoch: 57, step: 389, loss: 0.36798587441444397, mean loss: 0.34076504284191667
Epoch: 57, step: 390, loss: 0.34883323311805725, mean loss: 0.3407651404028337
Epoch: 57, step: 391, loss: 0.3128140866756439, mean loss: 0.34076480242153107
Epoch: 57, step: 392, loss: 0.3633531630039215, mean loss: 0.3407650755543902
Epoch: 57, step: 393, loss: 0.3668442964553833, mean loss: 0.3407653908940543
Epoch: 57, step: 394, loss: 0.3648301362991333, mean loss: 0.340765681871956
Epoch: 57, step: 395, loss: 0.3452885150909424, mean loss: 0.3407657365589508
Epoch: 57, step: 396, loss: 0.34518587589263916, mean loss: 0.3407657900035954
Epoch: 57, step: 397, loss: 0.3020828366279602, mean loss: 0.34076532228718576
Epoch: 57, step: 398, loss: 0.3459630608558655, mean loss: 0.3407653851323932
Epoch: 57, step: 399, loss: 0.3082076609134674, mean loss: 0.3407649914857784
Epoch: 57, step: 400, loss: 0.36074668169021606, mean loss: 0.34076523307605516
Epoch: 57, step: 401, loss: 0.3418314456939697, mean loss: 0.34076524596703106
Epoch: 57, step: 402, loss: 0.3013741075992584, mean loss: 0.3407647697167334
Epoch: 57, step: 403, loss: 0.30386194586753845, mean loss: 0.34076432355627484
Epoch: 57, step: 404, loss: 0.31026118993759155, mean loss: 0.34076395477345206
Epoch: 57, step: 405, loss: 0.3332166075706482, mean loss: 0.34076386352714305
Epoch: 57, step: 406, loss: 0.32290440797805786, mean loss: 0.340763647611583
Epoch: 57, step: 407, loss: 0.3117576241493225, mean loss: 0.3407632969415378
Epoch: 57, step: 408, loss: 0.36512288451194763, mean loss: 0.3407635914346598
Epoch: 57, step: 409, loss: 0.324870228767395, mean loss: 0.3407633992955526
Epoch: 57, step: 410, loss: 0.3455032408237457, mean loss: 0.3407634565960704
Epoch: 57, step: 411, loss: 0.3172658085823059, mean loss: 0.3407631725335944
Epoch: 57, step: 412, loss: 0.30859294533729553, mean loss: 0.34076278363322815
Epoch: 57, step: 413, loss: 0.3851945996284485, mean loss: 0.340763320755348
Epoch: 57, step: 414, loss: 0.3209907114505768, mean loss: 0.3407630817334399
Epoch: 57, step: 415, loss: 0.335323303937912, mean loss: 0.3407630159752827
Epoch: 57, step: 416, loss: 0.31639599800109863, mean loss: 0.3407627214208194
Epoch: 57, step: 417, loss: 0.29433444142341614, mean loss: 0.34076216019121813
Epoch: 57, step: 418, loss: 0.40008074045181274, mean loss: 0.3407628772313654
Epoch: 57, step: 419, loss: 0.34282374382019043, mean loss: 0.34076290214272054
Epoch: 57, step: 420, loss: 0.3196464478969574, mean loss: 0.3407626468942074
Epoch: 57, step: 421, loss: 0.3327008783817291, mean loss: 0.34076254944747086
Epoch: 57, step: 422, loss: 0.3641306459903717, mean loss: 0.34076283190624135
Epoch: 57, step: 423, loss: 0.36781200766563416, mean loss: 0.34076315885561714
Epoch: 57, step: 424, loss: 0.3401027023792267, mean loss: 0.34076315087263
Epoch: 57, step: 425, loss: 0.3241203725337982, mean loss: 0.3407629497125466
Epoch: 57, step: 426, loss: 0.33708110451698303, mean loss: 0.3407629052108823
Epoch: 57, step: 427, loss: 0.3535352647304535, mean loss: 0.34076305958575565
Epoch: 57, step: 428, loss: 0.3301859498023987, mean loss: 0.3407629317456142
Epoch: 57, step: 429, loss: 0.3720453977584839, mean loss: 0.3407633098362861
Epoch: 57, step: 430, loss: 0.33909204602241516, mean loss: 0.3407632896370595
Epoch: 57, step: 431, loss: 0.3597052991390228, mean loss: 0.3407635185711845
Epoch: 57, step: 432, loss: 0.33951902389526367, mean loss: 0.340763503530338
Epoch: 57, step: 433, loss: 0.3659793436527252, mean loss: 0.340763808282944
Epoch: 57, step: 434, loss: 0.3500290513038635, mean loss: 0.34076392025909935
Epoch: 57, step: 435, loss: 0.32754936814308167, mean loss: 0.3407637605550469
Epoch: 57, step: 436, loss: 0.31981661915779114, mean loss: 0.34076350740209027
Epoch: 57, step: 437, loss: 0.322647362947464, mean loss: 0.34076328846529025
Epoch: 57, step: 438, loss: 0.3961988687515259, mean loss: 0.3407639584059562
Epoch: 57, step: 439, loss: 0.36902371048927307, mean loss: 0.3407642999217884
Epoch: 57, step: 440, loss: 0.31088149547576904, mean loss: 0.3407639387959205
Epoch: 57, step: 441, loss: 0.3598202168941498, mean loss: 0.3407641690832691
Epoch: 57, step: 442, loss: 0.31640851497650146, mean loss: 0.3407638747586796
Epoch: 57, step: 443, loss: 0.3841688632965088, mean loss: 0.34076439927758595
Epoch: 57, step: 444, loss: 0.2897650897502899, mean loss: 0.3407637829940732
Epoch: 57, step: 445, loss: 0.323467880487442, mean loss: 0.34076357399024854
Epoch: 57, step: 446, loss: 0.3169946074485779, mean loss: 0.3407632867693369
Epoch: 57, step: 447, loss: 0.3548226058483124, mean loss: 0.3407634566581556
Epoch: 57, step: 448, loss: 0.3670945167541504, mean loss: 0.34076377483136266
Epoch: 57, step: 449, loss: 0.31880468130111694, mean loss: 0.3407635094903258
Epoch: 57, step: 450, loss: 0.32895970344543457, mean loss: 0.3407633668616565
Epoch: 57, step: 451, loss: 0.3415793478488922, mean loss: 0.3407633767212624
Epoch: 57, step: 452, loss: 0.32904496788978577, mean loss: 0.34076323512789314
Epoch: 57, step: 453, loss: 0.31731998920440674, mean loss: 0.3407629518669047
Epoch: 57, step: 454, loss: 0.33867496252059937, mean loss: 0.34076292663836844
Epoch: 57, step: 455, loss: 0.32329046726226807, mean loss: 0.3407627155265399
Epoch: 57, step: 456, loss: 0.35732802748680115, mean loss: 0.340762915675298
Epoch: 57, step: 457, loss: 0.35832318663597107, mean loss: 0.3407631278429871
Epoch: 57, step: 458, loss: 0.3148914873600006, mean loss: 0.34076281525898044
Epoch: 57, step: 459, loss: 0.2923455238342285, mean loss: 0.34076223028300634
Epoch: 57, step: 460, loss: 0.34281519055366516, mean loss: 0.3407622550864988
Epoch: 57, step: 461, loss: 0.3007536232471466, mean loss: 0.3407617717153276
Epoch: 57, step: 462, loss: 0.3320484757423401, mean loss: 0.34076166644541456
Epoch: 57, step: 463, loss: 0.3365567922592163, mean loss: 0.3407616156447309
Epoch: 57, step: 464, loss: 0.3405472934246063, mean loss: 0.34076161305545394
Epoch: 57, step: 465, loss: 0.33426427841186523, mean loss: 0.3407615345605806
Epoch: 57, step: 466, loss: 0.3179411292076111, mean loss: 0.34076125886858
Epoch: 57, step: 467, loss: 0.32749107480049133, mean loss: 0.3407610985541885
Epoch: 57, step: 468, loss: 0.3106108605861664, mean loss: 0.3407607343197035
Epoch: 57, step: 469, loss: 0.32358723878860474, mean loss: 0.34076052685521374
Epoch: 57, step: 470, loss: 0.32021254301071167, mean loss: 0.3407602786282015
Epoch: 57, step: 471, loss: 0.2632525861263275, mean loss: 0.34075934231879706
Epoch: 57, step: 472, loss: 0.3417768180370331, mean loss: 0.3407593546099716
Epoch: 57, step: 473, loss: 0.3202160894870758, mean loss: 0.34075910644895685
Epoch: 57, step: 474, loss: 0.3479491174221039, mean loss: 0.34075919330267046
Epoch: 57, step: 475, loss: 0.32140785455703735, mean loss: 0.3407589595456794
Epoch: 57, step: 476, loss: 0.35837772488594055, mean loss: 0.3407591723712558
Epoch: 57, step: 477, loss: 0.36452943086624146, mean loss: 0.3407594595002208
Epoch: 57, step: 478, loss: 0.34347182512283325, mean loss: 0.3407594922634037
Epoch: 57, step: 479, loss: 0.34378358721733093, mean loss: 0.34075952879158355
Epoch: 57, step: 480, loss: 0.34346291422843933, mean loss: 0.34075956144550423
Epoch: 57, step: 481, loss: 0.36154904961586, mean loss: 0.34075981255660664
Epoch: 57, step: 482, loss: 0.3590030074119568, mean loss: 0.34076003290899826
Epoch: 57, step: 483, loss: 0.3455304801464081, mean loss: 0.34076009052866246
Epoch: 57, step: 484, loss: 0.3548598885536194, mean loss: 0.3407602608304757
Epoch: 57, step: 485, loss: 0.34289324283599854, mean loss: 0.3407602865929948
Epoch: 57, step: 486, loss: 0.3420184552669525, mean loss: 0.34076030178918626
Epoch: 57, step: 487, loss: 0.3193202316761017, mean loss: 0.3407600428386317
Epoch: 57, step: 488, loss: 0.30829721689224243, mean loss: 0.3407596507613107
Epoch: 57, step: 489, loss: 0.32009440660476685, mean loss: 0.3407594011750386
Epoch: 57, step: 490, loss: 0.33741697669029236, mean loss: 0.3407593608071056
Epoch: 57, step: 491, loss: 0.33722156286239624, mean loss: 0.3407593180800773
Epoch: 57, step: 492, loss: 0.31359758973121643, mean loss: 0.34075899004384164
Epoch: 57, step: 493, loss: 0.32490289211273193, mean loss: 0.3407587985496998
Epoch: 57, step: 494, loss: 0.34286510944366455, mean loss: 0.34075882398731555
Epoch: 57, step: 495, loss: 0.32809802889823914, mean loss: 0.34075867108654884
Epoch: 57, step: 496, loss: 0.33917057514190674, mean loss: 0.34075865190780424
Epoch: 57, step: 497, loss: 0.3204059302806854, mean loss: 0.34075840611979824
Epoch: 57, step: 498, loss: 0.34130993485450745, mean loss: 0.34075841278021024
Epoch: 57, step: 499, loss: 0.31305694580078125, mean loss: 0.3407580782537517
Epoch: 57, step: 500, loss: 0.3536144196987152, mean loss: 0.3407582335067006
Epoch: 57, step: 501, loss: 0.29271653294563293, mean loss: 0.34075765336299135
Epoch: 57, step: 502, loss: 0.35796114802360535, mean loss: 0.34075786110706713
Epoch: 57, step: 503, loss: 0.39089179039001465, mean loss: 0.3407584665015665
Epoch: 57, step: 504, loss: 0.31277844309806824, mean loss: 0.34075812863162575
Epoch: 57, step: 505, loss: 0.32945600152015686, mean loss: 0.3407579921555817
Epoch: 57, step: 506, loss: 0.3388337790966034, mean loss: 0.3407579689205028
Epoch: 57, step: 507, loss: 0.34011128544807434, mean loss: 0.3407579611118249
Epoch: 57, step: 508, loss: 0.29401519894599915, mean loss: 0.3407573967015931
Epoch: 57, step: 509, loss: 0.3363187313079834, mean loss: 0.34075734310617434
Epoch: 57, step: 510, loss: 0.3437674641609192, mean loss: 0.34075737945195317
Epoch: 57, step: 511, loss: 0.32232534885406494, mean loss: 0.3407571568966453
Epoch: 57, step: 512, loss: 0.3192780315876007, mean loss: 0.340756897552695
Epoch: 57, step: 513, loss: 0.32957905530929565, mean loss: 0.3407567625904598
Epoch: 57, step: 514, loss: 0.34668034315109253, mean loss: 0.3407568341114209
Epoch: 57, step: 515, loss: 0.3100418448448181, mean loss: 0.34075646326493597
Epoch: 57, step: 516, loss: 0.31876546144485474, mean loss: 0.34075619775329313
Epoch: 57, step: 517, loss: 0.32839587330818176, mean loss: 0.3407560485208728
Epoch: 57, step: 518, loss: 0.3962245285511017, mean loss: 0.34075671821167447
Epoch: 57, step: 519, loss: 0.3469783663749695, mean loss: 0.34075679332695147
Epoch: 57, step: 520, loss: 0.31021425127983093, mean loss: 0.34075642458481953
Epoch: 57, step: 521, loss: 0.31455329060554504, mean loss: 0.34075610823646774
Epoch: 57, step: 522, loss: 0.3177218735218048, mean loss: 0.34075583014934197
Epoch: 57, step: 523, loss: 0.2950316369533539, mean loss: 0.3407552781381241
Epoch: 57, step: 524, loss: 0.3794799745082855, mean loss: 0.34075574564137007
Epoch: 57, step: 525, loss: 0.3070819079875946, mean loss: 0.3407553391194388
Epoch: 57, step: 526, loss: 0.34865373373031616, mean loss: 0.3407554344703727
Epoch: 57, step: 527, loss: 0.3238217234611511, mean loss: 0.34075523004583497
Epoch: 57, step: 528, loss: 0.3190150856971741, mean loss: 0.34075496760098123
Epoch: 57, step: 529, loss: 0.3589361906051636, mean loss: 0.340755187080242
Epoch: 57, step: 530, loss: 0.3200547397136688, mean loss: 0.34075493719253974
Epoch: 57, step: 531, loss: 0.3364223539829254, mean loss: 0.3407548848919216
Epoch: 57, step: 532, loss: 0.31655973196029663, mean loss: 0.3407545928245524
Epoch: 57, step: 533, loss: 0.3662710189819336, mean loss: 0.34075490083771187
Epoch: 57, step: 534, loss: 0.3227427303791046, mean loss: 0.34075468341233545
Epoch: 57, step: 535, loss: 0.34149640798568726, mean loss: 0.3407546923656039
Epoch: 57, step: 536, loss: 0.3657512962818146, mean loss: 0.3407549940929733
Epoch: 57, step: 537, loss: 0.36368247866630554, mean loss: 0.3407552708412119
Epoch: 57, step: 538, loss: 0.2959674894809723, mean loss: 0.34075473023284514
Epoch: 57, step: 539, loss: 0.35533440113067627, mean loss: 0.34075490621380905
Epoch: 57, step: 540, loss: 0.40606170892715454, mean loss: 0.34075569447682624
Epoch: 57, step: 541, loss: 0.3166433572769165, mean loss: 0.3407554034407707
Epoch: 57, step: 542, loss: 0.367910772562027, mean loss: 0.3407557312022838
Epoch: 57, step: 543, loss: 0.288266658782959, mean loss: 0.3407550976741563
Epoch: 57, step: 544, loss: 0.3159828186035156, mean loss: 0.34075479868342484
Epoch: 57, step: 545, loss: 0.3254604637622833, mean loss: 0.3407546140896222
Epoch: 57, step: 546, loss: 0.31061047315597534, mean loss: 0.34075425027161566
Epoch: 57, step: 547, loss: 0.30485808849334717, mean loss: 0.3407538170361013
Epoch: 57, step: 548, loss: 0.340942919254303, mean loss: 0.3407538193183734
Epoch: 57, step: 549, loss: 0.3397189974784851, mean loss: 0.3407538068292735
Epoch: 57, step: 550, loss: 0.3354707658290863, mean loss: 0.3407537430698629
Epoch: 57, step: 551, loss: 0.35471072793006897, mean loss: 0.3407539115104236
Epoch: 57, step: 552, loss: 0.29302024841308594, mean loss: 0.3407533354413067
Epoch: 57, step: 553, loss: 0.3351414203643799, mean loss: 0.3407532677152673
Epoch: 57, step: 554, loss: 0.3576311767101288, mean loss: 0.3407534713997706
Epoch: 57, step: 555, loss: 0.35797396302223206, mean loss: 0.34075367921609157
Epoch: 57, step: 556, loss: 0.29859206080436707, mean loss: 0.340753170417221
Epoch: 57, step: 557, loss: 0.2991560697555542, mean loss: 0.34075266843690744
Epoch: 57, step: 558, loss: 0.3464636504650116, mean loss: 0.3407527373543538
Epoch: 57, step: 559, loss: 0.33183613419532776, mean loss: 0.34075262975427706
Epoch: 57, step: 560, loss: 0.3245719075202942, mean loss: 0.34075243449764026
Epoch: 57, step: 561, loss: 0.33179906010627747, mean loss: 0.3407523264564385
Epoch: 57, step: 562, loss: 0.3543224632740021, mean loss: 0.340752490206566
Epoch: 57, step: 563, loss: 0.344622939825058, mean loss: 0.3407525369105145
Epoch: 57, step: 564, loss: 0.35027042031288147, mean loss: 0.34075265175954134
Epoch: 57, step: 565, loss: 0.33873486518859863, mean loss: 0.34075262741189827
Epoch: 57, step: 566, loss: 0.30443066358566284, mean loss: 0.34075218913782496
Epoch: 57, step: 567, loss: 0.32370299100875854, mean loss: 0.3407519834184595
Epoch: 57, step: 568, loss: 0.31125491857528687, mean loss: 0.3407516275046977
Epoch: 57, step: 569, loss: 0.3144738972187042, mean loss: 0.34075131043949
Epoch: 57, step: 570, loss: 0.31177178025245667, mean loss: 0.34075096077877753
Epoch: 57, step: 571, loss: 0.35035210847854614, mean loss: 0.34075107662274107
Epoch: 57, step: 572, loss: 0.313859224319458, mean loss: 0.340750752159326
Epoch: 57, step: 573, loss: 0.3116753101348877, mean loss: 0.3407504013540604
Epoch: 57, step: 574, loss: 0.35380643606185913, mean loss: 0.3407505588777348
Epoch: 57, step: 575, loss: 0.33962282538414, mean loss: 0.34075054527156845
Epoch: 57, step: 576, loss: 0.3448876440525055, mean loss: 0.34075059518528966
Epoch: 57, step: 577, loss: 0.3256038725376129, mean loss: 0.34075041244366083
Epoch: 57, step: 578, loss: 0.32435840368270874, mean loss: 0.34075021468033534
Epoch: 57, step: 579, loss: 0.3277931213378906, mean loss: 0.3407500583598385
Epoch: 57, step: 580, loss: 0.2863622009754181, mean loss: 0.34074940220694266
Epoch: 57, step: 581, loss: 0.2945197522640228, mean loss: 0.3407488444840576
Epoch: 57, step: 582, loss: 0.30492985248565674, mean loss: 0.3407484123624522
Epoch: 57, step: 583, loss: 0.2936897873878479, mean loss: 0.34074784465235985
Epoch: 57, step: 584, loss: 0.3198060095310211, mean loss: 0.3407475920154047
Epoch: 57, step: 585, loss: 0.40325894951820374, mean loss: 0.34074834612737304
Epoch: 57, step: 586, loss: 0.32258522510528564, mean loss: 0.3407481270174023
Epoch: 57, step: 587, loss: 0.34111830592155457, mean loss: 0.34074813148298455
Epoch: 57, step: 588, loss: 0.33597826957702637, mean loss: 0.3407480739433642
Epoch: 57, step: 589, loss: 0.3377852439880371, mean loss: 0.3407480382026955
Epoch: 57, step: 590, loss: 0.3225155770778656, mean loss: 0.3407478182668564
Epoch: 57, step: 591, loss: 0.3438871502876282, mean loss: 0.340747856135759
Epoch: 57, step: 592, loss: 0.32975873351097107, mean loss: 0.34074772357858085
Epoch: 57, step: 593, loss: 0.30603867769241333, mean loss: 0.34074730490296523
Epoch: 57, step: 594, loss: 0.3222222626209259, mean loss: 0.3407470814485392
Epoch: 57, step: 595, loss: 0.3689323961734772, mean loss: 0.3407474214238688
Epoch: 57, step: 596, loss: 0.341959148645401, mean loss: 0.34074743603972096
Epoch: 57, step: 597, loss: 0.3285911977291107, mean loss: 0.3407472894129592
Epoch: 57, step: 598, loss: 0.2845362722873688, mean loss: 0.3407466114121013
Epoch: 57, step: 599, loss: 0.3613886535167694, mean loss: 0.34074686038737634
Epoch: 57, step: 600, loss: 0.3461436629295349, mean loss: 0.3407469254804608
Epoch: 57, step: 601, loss: 0.3237287700176239, mean loss: 0.34074672021987146
Epoch: 57, step: 602, loss: 0.31538498401641846, mean loss: 0.34074641432878094
Epoch: 57, step: 603, loss: 0.34415051341056824, mean loss: 0.340746455385553
Epoch: 57, step: 604, loss: 0.30181416869163513, mean loss: 0.3407459858296728
Epoch: 57, step: 605, loss: 0.3189530670642853, mean loss: 0.3407457229920487
Epoch: 57, step: 606, loss: 0.336740106344223, mean loss: 0.3407456746821331
Epoch: 57, step: 607, loss: 0.36843141913414, mean loss: 0.34074600858324333
Epoch: 57, step: 608, loss: 0.31782063841819763, mean loss: 0.3407457320974785
Epoch: 57, step: 609, loss: 0.3038333058357239, mean loss: 0.3407452869296469
Epoch: 57, step: 610, loss: 0.3406871557235718, mean loss: 0.34074528622858674
Epoch: 57, step: 611, loss: 0.34772399067878723, mean loss: 0.34074537039048314
Epoch: 57, step: 612, loss: 0.3283900320529938, mean loss: 0.3407452213891646
Epoch: 57, step: 613, loss: 0.28815531730651855, mean loss: 0.34074458717985845
Epoch: 57, step: 614, loss: 0.2898772358894348, mean loss: 0.34074397375111987
Epoch: 57, step: 615, loss: 0.37976816296577454, mean loss: 0.3407444443529868
Epoch: 57, step: 616, loss: 0.3247632682323456, mean loss: 0.340744251634553
Epoch: 57, step: 617, loss: 0.30936259031295776, mean loss: 0.3407438732048528
Epoch: 57, step: 618, loss: 0.31779351830482483, mean loss: 0.3407435964511429
Epoch: 57, step: 619, loss: 0.3352893888950348, mean loss: 0.340743530680745
Epoch: 57, step: 620, loss: 0.30848950147628784, mean loss: 0.34074314174527964
Epoch: 57, step: 621, loss: 0.29453808069229126, mean loss: 0.3407425845879053
Epoch: 57, step: 622, loss: 0.38197189569473267, mean loss: 0.3407430817398884
Epoch: 57, step: 623, loss: 0.33891117572784424, mean loss: 0.3407430596506344
Epoch: 57, step: 624, loss: 0.34400972723960876, mean loss: 0.3407430990398714
Epoch: 57, step: 625, loss: 0.31972023844718933, mean loss: 0.34074284555082474
Epoch: 57, step: 626, loss: 0.34573623538017273, mean loss: 0.3407429057592992
Epoch: 57, step: 627, loss: 0.32083383202552795, mean loss: 0.3407426657058395
Epoch: 57, step: 628, loss: 0.3002946078777313, mean loss: 0.34074217800966256
Epoch: 57, step: 629, loss: 0.34590670466423035, mean loss: 0.34074224027939
Epoch: 57, step: 630, loss: 0.30816686153411865, mean loss: 0.34074184751629005
Epoch: 57, step: 631, loss: 0.3491847515106201, mean loss: 0.3407419493116119
Epoch: 57, step: 632, loss: 0.414249449968338, mean loss: 0.34074283557414375
Epoch: 57, step: 633, loss: 0.34092792868614197, mean loss: 0.34074283780574066
Epoch: 57, step: 634, loss: 0.34869369864463806, mean loss: 0.34074293366507585
Epoch: 57, step: 635, loss: 0.3062865138053894, mean loss: 0.34074251824720525
Epoch: 57, step: 636, loss: 0.33873453736305237, mean loss: 0.34074249403862267
Epoch: 57, step: 637, loss: 0.3507561683654785, mean loss: 0.34074261476384543
Epoch: 57, step: 638, loss: 0.3136628270149231, mean loss: 0.340742288292873
Epoch: 57, step: 639, loss: 0.3583284914493561, mean loss: 0.3407425003076673
Epoch: 57, step: 640, loss: 0.3034557104110718, mean loss: 0.340742050793027
Epoch: 57, step: 641, loss: 0.30125975608825684, mean loss: 0.3407415748159962
Epoch: 57, step: 642, loss: 0.31590554118156433, mean loss: 0.3407412754099175
Epoch: 57, step: 643, loss: 0.3531741499900818, mean loss: 0.3407414252902649
Epoch: 57, step: 644, loss: 0.3604542315006256, mean loss: 0.34074166292852043
Epoch: 57, step: 645, loss: 0.3244687616825104, mean loss: 0.3407414667607498
Epoch: 57, step: 646, loss: 0.3225449323654175, mean loss: 0.3407412474064686
Epoch: 57, step: 647, loss: 0.3430449366569519, mean loss: 0.34074127517648223
Epoch: 57, step: 648, loss: 0.3905695676803589, mean loss: 0.34074187582853693
Epoch: 57, step: 649, loss: 0.3102829158306122, mean loss: 0.34074150866732283
Epoch: 57, step: 650, loss: 0.36229410767555237, mean loss: 0.34074176846552445
Epoch: 57, step: 651, loss: 0.31194552779197693, mean loss: 0.34074142135558383
Epoch: 57, step: 652, loss: 0.35087519884109497, mean loss: 0.3407415435066848
Epoch: 57, step: 653, loss: 0.297161340713501, mean loss: 0.3407410182035003
Epoch: 57, step: 654, loss: 0.319624125957489, mean loss: 0.3407407636696449
Epoch: 57, step: 655, loss: 0.32541361451148987, mean loss: 0.34074057892506704
Epoch: 57, step: 656, loss: 0.3231048583984375, mean loss: 0.3407403663568693
Epoch: 57, step: 657, loss: 0.3008618652820587, mean loss: 0.3407398856961037
Epoch: 57, step: 658, loss: 0.32404544949531555, mean loss: 0.3407396844783159
Epoch: 57, step: 659, loss: 0.3018307089805603, mean loss: 0.3407392155146733
Epoch: 57, step: 660, loss: 0.33082911372184753, mean loss: 0.3407390960712451
Epoch: 57, step: 661, loss: 0.31619980931282043, mean loss: 0.3407388003102862
Epoch: 57, step: 662, loss: 0.3076447546482086, mean loss: 0.3407384014474828
Epoch: 57, step: 663, loss: 0.33786725997924805, mean loss: 0.34073836684374337
Epoch: 57, step: 664, loss: 0.35247519612312317, mean loss: 0.3407385082973401
Epoch: 57, step: 665, loss: 0.33358246088027954, mean loss: 0.340738422052885
Epoch: 57, step: 666, loss: 0.33262738585472107, mean loss: 0.3407383243001137
Epoch: 57, step: 667, loss: 0.36659422516822815, mean loss: 0.34073863590709486
Epoch: 57, step: 668, loss: 0.32978132367134094, mean loss: 0.34073850385469195
Epoch: 57, step: 669, loss: 0.3481060564517975, mean loss: 0.34073859264392037
Epoch: 57, step: 670, loss: 0.3374267518520355, mean loss: 0.34073855273212594
Epoch: 57, step: 671, loss: 0.35355082154273987, mean loss: 0.34073870713401566
Epoch: 57, step: 672, loss: 0.34181568026542664, mean loss: 0.34073872011256656
Epoch: 57, step: 673, loss: 0.34387415647506714, mean loss: 0.3407387578971025
Epoch: 57, step: 674, loss: 0.33258384466171265, mean loss: 0.3407386596250078
Epoch: 57, step: 675, loss: 0.3376556932926178, mean loss: 0.3407386224736734
Epoch: 57, step: 676, loss: 0.3624878227710724, mean loss: 0.34073888455959617
Epoch: 57, step: 677, loss: 0.32429859042167664, mean loss: 0.34073868645034716
Epoch: 57, step: 678, loss: 0.35601159930229187, mean loss: 0.3407388704901709
Epoch: 57, step: 679, loss: 0.33279550075531006, mean loss: 0.34073877477308245
Epoch: 57, step: 680, loss: 0.2951158881187439, mean loss: 0.34073822502689133
Epoch: 57, step: 681, loss: 0.34199488162994385, mean loss: 0.3407382401691567
Epoch: 57, step: 682, loss: 0.3062910735607147, mean loss: 0.3407378250980453
Epoch: 57, step: 683, loss: 0.38985198736190796, mean loss: 0.3407384168919804
Epoch: 57, step: 684, loss: 0.3409707248210907, mean loss: 0.3407384196911072
Epoch: 57, step: 685, loss: 0.3494361340999603, mean loss: 0.3407385244904229
Epoch: 57, step: 686, loss: 0.35262298583984375, mean loss: 0.34073866768533045
Epoch: 57, step: 687, loss: 0.3287239670753479, mean loss: 0.3407385229229249
Epoch: 57, step: 688, loss: 0.3261949121952057, mean loss: 0.3407383476923656
Epoch: 57, step: 689, loss: 0.35141345858573914, mean loss: 0.34073847631125875
Epoch: 57, step: 690, loss: 0.30338141322135925, mean loss: 0.3407380262207385
Epoch: 57, step: 691, loss: 0.2985455393791199, mean loss: 0.34073751787752354
Epoch: 57, step: 692, loss: 0.34865880012512207, mean loss: 0.3407376133135092
Epoch: 57, step: 693, loss: 0.30664870142936707, mean loss: 0.34073720261362384
Epoch: 57, step: 694, loss: 0.323686420917511, mean loss: 0.340736997189944
Epoch: 57, step: 695, loss: 0.32883235812187195, mean loss: 0.34073685376746954
Epoch: 57, step: 696, loss: 0.3440374433994293, mean loss: 0.3407368935312143
Epoch: 57, step: 697, loss: 0.33487680554389954, mean loss: 0.34073682293284807
Epoch: 57, step: 698, loss: 0.3607056736946106, mean loss: 0.3407370635011226
Epoch: 57, step: 699, loss: 0.35322803258895874, mean loss: 0.34073721398022205
Epoch: 57, step: 700, loss: 0.3447066843509674, mean loss: 0.340737261799981
Epoch: 57, step: 701, loss: 0.294937402009964, mean loss: 0.34073671006091594
Epoch: 57, step: 702, loss: 0.3484402000904083, mean loss: 0.3407368028617499
Epoch: 57, step: 703, loss: 0.364989697933197, mean loss: 0.34073709502306476
Epoch: 57, step: 704, loss: 0.322475403547287, mean loss: 0.3407368750371412
Epoch: 57, step: 705, loss: 0.3486334979534149, mean loss: 0.3407369701611313
Epoch: 57, step: 706, loss: 0.3078956604003906, mean loss: 0.3407365745541957
Epoch: 57, step: 707, loss: 0.3123451769351959, mean loss: 0.34073623255509167
Epoch: 57, step: 708, loss: 0.3224644362926483, mean loss: 0.34073601245804813
Epoch: 57, step: 709, loss: 0.3235367238521576, mean loss: 0.3407358052826331
Epoch: 57, step: 710, loss: 0.3643406331539154, mean loss: 0.3407360896130619
Epoch: 57, step: 711, loss: 0.3228067457675934, mean loss: 0.34073587364891056
Epoch: 57, step: 712, loss: 0.34915491938591003, mean loss: 0.34073597505753894
Epoch: 57, step: 713, loss: 0.31838148832321167, mean loss: 0.34073570579774354
Epoch: 57, step: 714, loss: 0.34152644872665405, mean loss: 0.3407357153221275
Epoch: 57, step: 715, loss: 0.3535681962966919, mean loss: 0.3407358698856389
Epoch: 57, step: 716, loss: 0.3180708587169647, mean loss: 0.34073559689544114
Epoch: 57, step: 717, loss: 0.3557796776294708, mean loss: 0.3407357780926653
Epoch: 57, step: 718, loss: 0.31535205245018005, mean loss: 0.3407354723640994
Epoch: 57, step: 719, loss: 0.36478182673454285, mean loss: 0.34073576198151007
Epoch: 57, step: 720, loss: 0.34977036714553833, mean loss: 0.3407358707941558
Epoch: 57, step: 721, loss: 0.36045682430267334, mean loss: 0.34073610831015616
Epoch: 57, step: 722, loss: 0.298059344291687, mean loss: 0.34073559432424705
Epoch: 57, step: 723, loss: 0.3457828760147095, mean loss: 0.3407356551114338
Epoch: 57, step: 724, loss: 0.3032291829586029, mean loss: 0.3407352034058209
Epoch: 57, step: 725, loss: 0.3569762408733368, mean loss: 0.34073539900084787
Epoch: 57, step: 726, loss: 0.3246341943740845, mean loss: 0.3407352050921994
Epoch: 57, step: 727, loss: 0.339645117521286, mean loss: 0.34073519196430824
Epoch: 57, step: 728, loss: 0.320883184671402, mean loss: 0.3407349528900727
Epoch: 57, step: 729, loss: 0.3445095717906952, mean loss: 0.34073499834659743
Epoch: 57, step: 730, loss: 0.3523511588573456, mean loss: 0.340735138234608
Epoch: 57, step: 731, loss: 0.3950433135032654, mean loss: 0.3407357922347919
Epoch: 57, step: 732, loss: 0.3277299702167511, mean loss: 0.34073563561550724
Epoch: 57, step: 733, loss: 0.35020849108695984, mean loss: 0.34073574968857234
Epoch: 57, step: 734, loss: 0.32196295261383057, mean loss: 0.34073552362741033
Epoch: 57, step: 735, loss: 0.3623276948928833, mean loss: 0.3407357836362161
Epoch: 57, step: 736, loss: 0.33531004190444946, mean loss: 0.3407357183012564
Epoch: 57, step: 737, loss: 0.31910446286201477, mean loss: 0.34073545782807957
Epoch: 57, step: 738, loss: 0.3443368375301361, mean loss: 0.34073550119364004
Epoch: 57, step: 739, loss: 0.3459525406360626, mean loss: 0.34073556401320754
Epoch: 57, step: 740, loss: 0.3223467171192169, mean loss: 0.34073534259155414
Epoch: 57, step: 741, loss: 0.2950722873210907, mean loss: 0.34073479276548224
Epoch: 57, step: 742, loss: 0.35340794920921326, mean loss: 0.340734945360351
Epoch: 57, step: 743, loss: 0.30461642146110535, mean loss: 0.34073451046987396
Epoch: 57, step: 744, loss: 0.3174995183944702, mean loss: 0.340734230708853
Epoch: 57, step: 745, loss: 0.3519918918609619, mean loss: 0.340734366255138
Epoch: 57, step: 746, loss: 0.30925577878952026, mean loss: 0.3407339872461985
Epoch: 57, step: 747, loss: 0.3579759895801544, mean loss: 0.34073419484110234
Epoch: 57, step: 748, loss: 0.31964418292045593, mean loss: 0.3407339409189534
Epoch: 57, step: 749, loss: 0.30861732363700867, mean loss: 0.3407335542419653
Epoch: 57, step: 750, loss: 0.30730316042900085, mean loss: 0.34073315175224334
Epoch: 57, step: 751, loss: 0.3271249830722809, mean loss: 0.34073298791683904
Epoch: 57, step: 752, loss: 0.28880754113197327, mean loss: 0.34073236276849284
Epoch: 57, step: 753, loss: 0.3431378901004791, mean loss: 0.3407323917291166
Epoch: 57, step: 754, loss: 0.37739118933677673, mean loss: 0.340732833066386
Epoch: 57, step: 755, loss: 0.32896044850349426, mean loss: 0.3407326913397106
Epoch: 57, step: 756, loss: 0.3508095443248749, mean loss: 0.3407328126525739
Epoch: 57, step: 757, loss: 0.32420411705970764, mean loss: 0.3407326136698903
Epoch: 57, step: 758, loss: 0.31899920105934143, mean loss: 0.3407323520327467
Epoch: 57, step: 759, loss: 0.3227407932281494, mean loss: 0.3407321354444238
Epoch: 57, step: 760, loss: 0.33530062437057495, mean loss: 0.340732070058888
Epoch: 57, step: 761, loss: 0.3623771369457245, mean loss: 0.34073233062307345
Epoch: 57, step: 762, loss: 0.33954674005508423, mean loss: 0.34073231635105833
Epoch: 57, step: 763, loss: 0.3636946380138397, mean loss: 0.3407325927657548
Epoch: 57, step: 764, loss: 0.3529386818408966, mean loss: 0.3407327396978395
Epoch: 57, step: 765, loss: 0.3309864401817322, mean loss: 0.3407326223771433
Epoch: 57, step: 766, loss: 0.3345479369163513, mean loss: 0.340732547930132
Epoch: 57, step: 767, loss: 0.3716484308242798, mean loss: 0.34073292006989436
Epoch: 57, step: 768, loss: 0.33077871799468994, mean loss: 0.34073280025090624
Epoch: 57, step: 769, loss: 0.31131410598754883, mean loss: 0.3407324461415841
Epoch: 57, step: 770, loss: 0.32173269987106323, mean loss: 0.34073221744665194
Epoch: 57, step: 771, loss: 0.3108713626861572, mean loss: 0.34073185802374917
Epoch: 57, step: 772, loss: 0.3427688777446747, mean loss: 0.34073188254222775
Epoch: 57, step: 773, loss: 0.3154711425304413, mean loss: 0.3407315784963452
Epoch: 57, step: 774, loss: 0.35457631945610046, mean loss: 0.3407317451338157
Epoch: 57, step: 775, loss: 0.3327028155326843, mean loss: 0.34073164849752474
Epoch: 57, step: 776, loss: 0.33530235290527344, mean loss: 0.34073158315124574
Epoch: 57, step: 777, loss: 0.32969576120376587, mean loss: 0.3407314503271605
Epoch: 57, step: 778, loss: 0.34876173734664917, mean loss: 0.3407315469762996
Epoch: 57, step: 779, loss: 0.3107258081436157, mean loss: 0.3407311858442609
Epoch: 57, step: 780, loss: 0.3561196029186249, mean loss: 0.34073137104828394
Epoch: 57, step: 781, loss: 0.32561245560646057, mean loss: 0.3407311890899804
Epoch: 57, step: 782, loss: 0.3635079860687256, mean loss: 0.3407314632086813
Epoch: 57, step: 783, loss: 0.3293900489807129, mean loss: 0.34073132671642903
Epoch: 57, step: 784, loss: 0.3546050786972046, mean loss: 0.34073149368298433
Epoch: 57, step: 785, loss: 0.33288782835006714, mean loss: 0.34073139928789764
Epoch: 57, step: 786, loss: 0.29700374603271484, mean loss: 0.3407308730510211
Epoch: 57, step: 787, loss: 0.3127571940422058, mean loss: 0.340730536408114
Epoch: 57, step: 788, loss: 0.3075709640979767, mean loss: 0.3407301373615502
Epoch: 57, step: 789, loss: 0.32915356755256653, mean loss: 0.3407299980492947
Epoch: 57, step: 790, loss: 0.3355279862880707, mean loss: 0.3407299354491219
Epoch: 57, step: 791, loss: 0.31463930010795593, mean loss: 0.34072962148239094
Epoch: 57, step: 792, loss: 0.3525736331939697, mean loss: 0.34072976400789257
Epoch: 57, step: 793, loss: 0.4127501845359802, mean loss: 0.3407306306587617
Epoch: 57, step: 794, loss: 0.3665643632411957, mean loss: 0.34073094152278083
Epoch: 57, step: 795, loss: 0.3345702588558197, mean loss: 0.340730867390577
Epoch: 57, step: 796, loss: 0.3089131712913513, mean loss: 0.3407304845291836
Epoch: 57, step: 797, loss: 0.423539400100708, mean loss: 0.34073148095441846
Epoch: 57, step: 798, loss: 0.3393489122390747, mean loss: 0.3407314643184105
Epoch: 57, step: 799, loss: 0.34272632002830505, mean loss: 0.3407314883215836
Epoch: 57, step: 800, loss: 0.32693448662757874, mean loss: 0.3407313223106619
Epoch: 57, step: 801, loss: 0.34783491492271423, mean loss: 0.34073140778283867
Epoch: 57, step: 802, loss: 0.3730289936065674, mean loss: 0.34073179639067425
Epoch: 57, step: 803, loss: 0.33807048201560974, mean loss: 0.3407317643698545
Epoch: 57, step: 804, loss: 0.3312070071697235, mean loss: 0.34073164976976544
Epoch: 57, step: 805, loss: 0.3111901879310608, mean loss: 0.3407312943367236
Epoch: 57, step: 806, loss: 0.29646483063697815, mean loss: 0.34073076174376565
Epoch: 57, step: 807, loss: 0.32550469040870667, mean loss: 0.3407305785531485
Epoch: 57, step: 808, loss: 0.37298938632011414, mean loss: 0.34073096666638364
Epoch: 57, step: 809, loss: 0.3283950090408325, mean loss: 0.3407308182513878
Epoch: 57, step: 810, loss: 0.3392992913722992, mean loss: 0.3407308010287687
Epoch: 57, step: 811, loss: 0.337933748960495, mean loss: 0.3407307673779979
Epoch: 57, step: 812, loss: 0.3033183515071869, mean loss: 0.34073031728216324
Epoch: 57, step: 813, loss: 0.2955535352230072, mean loss: 0.3407297737824633
Epoch: 57, step: 814, loss: 0.34228023886680603, mean loss: 0.3407297924351236
Epoch: 57, step: 815, loss: 0.3196239471435547, mean loss: 0.3407295385271633
Epoch: 57, step: 816, loss: 0.31661397218704224, mean loss: 0.34072924841508706
Epoch: 57, step: 817, loss: 0.3480806052684784, mean loss: 0.34072933685139883
Epoch: 57, step: 818, loss: 0.3423095643520355, mean loss: 0.3407293558611971
Epoch: 57, step: 819, loss: 0.32663461565971375, mean loss: 0.34072918630653204
Epoch: 57, step: 820, loss: 0.3406352698802948, mean loss: 0.34072918517676476
Epoch: 57, step: 821, loss: 0.34628885984420776, mean loss: 0.3407292520560462
Epoch: 57, step: 822, loss: 0.3213135898113251, mean loss: 0.34072901850102766
Epoch: 57, step: 823, loss: 0.33866867423057556, mean loss: 0.34072899371701826
Epoch: 57, step: 824, loss: 0.30806392431259155, mean loss: 0.3407286007915927
Epoch: 57, step: 825, loss: 0.37788185477256775, mean loss: 0.3407290476996445
Epoch: 57, step: 826, loss: 0.33793529868125916, mean loss: 0.3407290140946765
Epoch: 57, step: 827, loss: 0.32495081424713135, mean loss: 0.34072882430686074
Epoch: 57, step: 828, loss: 0.32856690883636475, mean loss: 0.3407286780192214
Epoch: 57, step: 829, loss: 0.3528650999069214, mean loss: 0.3407288239984594
Epoch: 57, step: 830, loss: 0.3460308611392975, mean loss: 0.3407288877716241
Epoch: 57, step: 831, loss: 0.3435634672641754, mean loss: 0.3407289218656762
Epoch: 57, step: 832, loss: 0.3619515597820282, mean loss: 0.3407291771264731
Epoch: 57, step: 833, loss: 0.32182586193084717, mean loss: 0.34072894976466805
Epoch: 57, step: 834, loss: 0.3189672529697418, mean loss: 0.34072868802649653
Epoch: 57, step: 835, loss: 0.3273148536682129, mean loss: 0.34072852669393666
Epoch: 57, step: 836, loss: 0.3182026445865631, mean loss: 0.3407282557710657
Epoch: 57, step: 837, loss: 0.34023433923721313, mean loss: 0.34072824983071337
Epoch: 57, step: 838, loss: 0.29646745324134827, mean loss: 0.34072771751088715
Epoch: 57, step: 839, loss: 0.32315942645072937, mean loss: 0.3407275062214868
Epoch: 57, step: 840, loss: 0.3298221230506897, mean loss: 0.34072737506677453
Epoch: 57, step: 841, loss: 0.33115172386169434, mean loss: 0.3407272599056055
Epoch: 57, step: 842, loss: 0.3274330198764801, mean loss: 0.34072710002490614
Epoch: 57, step: 843, loss: 0.31757164001464844, mean loss: 0.3407268215534321
Epoch: 57, step: 844, loss: 0.30931007862091064, mean loss: 0.3407264437349176
Epoch: 57, step: 845, loss: 0.34116750955581665, mean loss: 0.34072644903912214
Epoch: 57, step: 846, loss: 0.3501848876476288, mean loss: 0.34072656278379904
Epoch: 57, step: 847, loss: 0.35840439796447754, mean loss: 0.34072677537020507
Epoch: 57, step: 848, loss: 0.3144279718399048, mean loss: 0.3407264591153675
Epoch: 57, step: 849, loss: 0.3300074636936188, mean loss: 0.3407263302162186
Epoch: 57, step: 850, loss: 0.37268319725990295, mean loss: 0.34072671450255015
Epoch: 57, step: 851, loss: 0.3581443428993225, mean loss: 0.3407269239497411
Epoch: 57, step: 852, loss: 0.3225453495979309, mean loss: 0.3407267053187199
Epoch: 57, step: 853, loss: 0.3358319103717804, mean loss: 0.34072664646016737
Epoch: 57, step: 854, loss: 0.30003875494003296, mean loss: 0.3407261572054325
Epoch: 57, step: 855, loss: 0.30085667967796326, mean loss: 0.3407256777975453
Epoch: 57, step: 856, loss: 0.323298841714859, mean loss: 0.34072546825223077
Epoch: 57, step: 857, loss: 0.2946104407310486, mean loss: 0.3407249137584771
Epoch: 57, step: 858, loss: 0.33891013264656067, mean loss: 0.3407248919375492
Epoch: 57, step: 859, loss: 0.3263026177883148, mean loss: 0.3407247185262113
Epoch: 57, step: 860, loss: 0.3520306944847107, mean loss: 0.34072485446599604
Epoch: 57, step: 861, loss: 0.3082733154296875, mean loss: 0.3407244642827685
Epoch: 57, step: 862, loss: 0.31529009342193604, mean loss: 0.34072415847460386
Epoch: 57, step: 863, loss: 0.3117985427379608, mean loss: 0.3407238106939116
Epoch: 57, step: 864, loss: 0.3378434479236603, mean loss: 0.34072377606292836
Epoch: 57, step: 865, loss: 0.3214274048805237, mean loss: 0.3407235440628901
Epoch: 57, step: 866, loss: 0.3098297417163849, mean loss: 0.3407231726315424
Epoch: 57, step: 867, loss: 0.31952178478240967, mean loss: 0.34072291773364094
Epoch: 57, step: 868, loss: 0.3372139632701874, mean loss: 0.34072287554704533
Epoch: 57, step: 869, loss: 0.31534430384635925, mean loss: 0.34072257043545695
Epoch: 57, step: 870, loss: 0.3537408113479614, mean loss: 0.3407227269442021
Epoch: 57, step: 871, loss: 0.3473404049873352, mean loss: 0.3407228065027263
Epoch: 57, step: 872, loss: 0.32699671387672424, mean loss: 0.3407226414879678
Epoch: 57, step: 873, loss: 0.3229251801967621, mean loss: 0.34072242752988446
Epoch: 57, step: 874, loss: 0.2915540635585785, mean loss: 0.3407218364431964
Epoch: 57, step: 875, loss: 0.308712363243103, mean loss: 0.3407214516399506
Epoch: 57, step: 876, loss: 0.32939645648002625, mean loss: 0.3407213154976754
Epoch: 57, step: 877, loss: 0.3384443521499634, mean loss: 0.34072128812572167
Epoch: 57, step: 878, loss: 0.33594486117362976, mean loss: 0.3407212307077723
Epoch: 57, step: 879, loss: 0.3337474465370178, mean loss: 0.34072114687615995
Epoch: 57, step: 880, loss: 0.3090612590312958, mean loss: 0.340720766298345
Epoch: 57, step: 881, loss: 0.37706440687179565, mean loss: 0.3407212031734571
Epoch: 57, step: 882, loss: 0.32777196168899536, mean loss: 0.3407210475166976
Epoch: 57, step: 883, loss: 0.3584381341934204, mean loss: 0.34072126048292845
Epoch: 57, step: 884, loss: 0.3077261447906494, mean loss: 0.34072086387365014
Epoch: 57, step: 885, loss: 0.3021119236946106, mean loss: 0.34072039979042085
Epoch: 57, step: 886, loss: 0.3282575011253357, mean loss: 0.34072024998696315
Epoch: 57, step: 887, loss: 0.3375438451766968, mean loss: 0.34072021180718515
Epoch: 57, step: 888, loss: 0.2957480549812317, mean loss: 0.34071967125696306
Epoch: 57, step: 889, loss: 0.3204014301300049, mean loss: 0.3407194270414636
Epoch: 57, step: 890, loss: 0.3830649256706238, mean loss: 0.340719936007901
Epoch: 57, step: 891, loss: 0.34096428751945496, mean loss: 0.3407199389448182
Epoch: 57, step: 892, loss: 0.3313845098018646, mean loss: 0.3407198267414896
Epoch: 57, step: 893, loss: 0.3465452492237091, mean loss: 0.3407198967569037
Epoch: 57, step: 894, loss: 0.293438196182251, mean loss: 0.3407193284877238
Epoch: 57, step: 895, loss: 0.3077807128429413, mean loss: 0.34071893260993374
Epoch: 57, step: 896, loss: 0.334011048078537, mean loss: 0.34071885199116647
Epoch: 57, step: 897, loss: 0.3492114245891571, mean loss: 0.34071895405799574
Epoch: 57, step: 898, loss: 0.359011709690094, mean loss: 0.3407191739043504
Epoch: 57, step: 899, loss: 0.3858334422111511, mean loss: 0.34071971609101886
Epoch: 57, step: 900, loss: 0.3605775535106659, mean loss: 0.34071995474113387
Epoch: 57, step: 901, loss: 0.3017636239528656, mean loss: 0.3407194865722745
Epoch: 57, step: 902, loss: 0.3381551504135132, mean loss: 0.34071945575500084
Epoch: 57, step: 903, loss: 0.3396205008029938, mean loss: 0.3407194425483125
Epoch: 57, step: 904, loss: 0.28672707080841064, mean loss: 0.34071879370291885
Epoch: 57, step: 905, loss: 0.3809705078601837, mean loss: 0.3407192774161661
Epoch: 57, step: 906, loss: 0.3385840654373169, mean loss: 0.3407192517571866
Epoch: 57, step: 907, loss: 0.34206363558769226, mean loss: 0.3407192679125393
Epoch: 57, step: 908, loss: 0.3718199133872986, mean loss: 0.34071964164201135
Epoch: 57, step: 909, loss: 0.3088093400001526, mean loss: 0.3407192581876909
Epoch: 57, step: 910, loss: 0.3555285632610321, mean loss: 0.34071943614350714
Epoch: 57, step: 911, loss: 0.31075239181518555, mean loss: 0.340719076049247
Epoch: 57, step: 912, loss: 0.32765570282936096, mean loss: 0.34071891907717
Epoch: 57, step: 913, loss: 0.31218668818473816, mean loss: 0.3407185762323586
Epoch: 57, step: 914, loss: 0.3547039031982422, mean loss: 0.3407187442787757
Epoch: 57, step: 915, loss: 0.30931875109672546, mean loss: 0.34071836698384655
Epoch: 57, step: 916, loss: 0.32982829213142395, mean loss: 0.340718236132842
Epoch: 57, step: 917, loss: 0.34466829895973206, mean loss: 0.34071828359472683
Epoch: 57, step: 918, loss: 0.38689088821411133, mean loss: 0.34071883837388045
Epoch: 57, step: 919, loss: 0.3124142289161682, mean loss: 0.34071849828869927
Epoch: 57, step: 920, loss: 0.3397202789783478, mean loss: 0.34071848629505147
Epoch: 57, step: 921, loss: 0.3064785599708557, mean loss: 0.3407180749058129
Epoch: 57, step: 922, loss: 0.36423203349113464, mean loss: 0.34071835742024364
Epoch: 57, step: 923, loss: 0.31380632519721985, mean loss: 0.3407180340826785
Epoch: 57, step: 924, loss: 0.311780720949173, mean loss: 0.3407176864163306
Epoch: 57, step: 925, loss: 0.3629438877105713, mean loss: 0.34071795344904915
Epoch: 57, step: 926, loss: 0.36968278884887695, mean loss: 0.34071830143770054
Epoch: 57, step: 927, loss: 0.33307573199272156, mean loss: 0.3407182096196237
Epoch: 57, step: 928, loss: 0.33393263816833496, mean loss: 0.34071812809852786
Epoch: 57, step: 929, loss: 0.31439605355262756, mean loss: 0.34071781187187
Epoch: 57, step: 930, loss: 0.3508239686489105, mean loss: 0.34071793328318895
Epoch: 57, step: 931, loss: 0.3258225917816162, mean loss: 0.3407177543386731
Epoch: 57, step: 932, loss: 0.32288801670074463, mean loss: 0.3407175401444943
Epoch: 57, step: 933, loss: 0.33603280782699585, mean loss: 0.3407174838660253
Epoch: 57, step: 934, loss: 0.3105360269546509, mean loss: 0.3407171212955159
Epoch: 57, step: 935, loss: 0.3540431559085846, mean loss: 0.3407172813795413
Epoch: 57, step: 936, loss: 0.313568651676178, mean loss: 0.3407169552502879
Epoch: 57, step: 937, loss: 0.3273974657058716, mean loss: 0.3407167952487317
Epoch: 57, step: 938, loss: 0.36253249645233154, mean loss: 0.3407170573086402
Epoch: 57, step: 939, loss: 0.3395293653011322, mean loss: 0.3407170430417268
Epoch: 57, step: 940, loss: 0.33234331011772156, mean loss: 0.34071694245513806
Epoch: 57, step: 941, loss: 0.37691372632980347, mean loss: 0.34071737725134077
Epoch: 57, step: 942, loss: 0.31767475605010986, mean loss: 0.34071710046642284
Epoch: 57, step: 943, loss: 0.3137966990470886, mean loss: 0.34071677710600606
Epoch: 57, step: 944, loss: 0.3376539647579193, mean loss: 0.3407167403167931
Epoch: 57, step: 945, loss: 0.3316552937030792, mean loss: 0.34071663147581716
Epoch: 57, step: 946, loss: 0.35657498240470886, mean loss: 0.3407168219550788
Epoch: 57, step: 947, loss: 0.34823936223983765, mean loss: 0.34071691230941104
Epoch: 57, step: 948, loss: 0.29825812578201294, mean loss: 0.3407164023368378
Epoch: 57, step: 949, loss: 0.3177850842475891, mean loss: 0.34071612691203673
Epoch: 57, step: 950, loss: 0.33040207624435425, mean loss: 0.34071600303292854
Epoch: 57, step: 951, loss: 0.31577417254447937, mean loss: 0.340715703467345
Epoch: 57, step: 952, loss: 0.37945398688316345, mean loss: 0.34071616873059446
Epoch: 57, step: 953, loss: 0.3700004518032074, mean loss: 0.3407165204430572
Epoch: 57, step: 954, loss: 0.32714492082595825, mean loss: 0.34071635744629253
Epoch: 57, step: 955, loss: 0.35178467631340027, mean loss: 0.34071649037671703
Epoch: 57, step: 956, loss: 0.30619311332702637, mean loss: 0.3407160757562036
Epoch: 57, step: 957, loss: 0.33877262473106384, mean loss: 0.3407160524159324
Epoch: 57, step: 958, loss: 0.31532227993011475, mean loss: 0.340715747447908
Epoch: 57, step: 959, loss: 0.3739132285118103, mean loss: 0.3407161461302477
Epoch: 57, step: 960, loss: 0.37120920419692993, mean loss: 0.34071651232965044
Epoch: 57, step: 961, loss: 0.3427797853946686, mean loss: 0.34071653710775857
Epoch: 57, step: 962, loss: 0.32003504037857056, mean loss: 0.34071628874402177
Epoch: 57, step: 963, loss: 0.3374243676662445, mean loss: 0.34071624921187316
Epoch: 57, step: 964, loss: 0.3453112840652466, mean loss: 0.340716304392242
Epoch: 57, step: 965, loss: 0.40069642663002014, mean loss: 0.34071702466654413
Epoch: 57, step: 966, loss: 0.3159056603908539, mean loss: 0.34071672672161135
Epoch: 57, step: 967, loss: 0.30437663197517395, mean loss: 0.34071629034024403
Epoch: 57, step: 968, loss: 0.3048880994319916, mean loss: 0.34071586011111826
Epoch: 57, step: 969, loss: 0.34964612126350403, mean loss: 0.3407159673454557
Epoch: 57, step: 970, loss: 0.3259691596031189, mean loss: 0.34071579026830845
Epoch: 57, step: 971, loss: 0.2858835458755493, mean loss: 0.3407151318599944
Epoch: 57, step: 972, loss: 0.2804527282714844, mean loss: 0.3407144082567285
Epoch: 57, step: 973, loss: 0.37777191400527954, mean loss: 0.3407148532208954
Epoch: 57, step: 974, loss: 0.3291468620300293, mean loss: 0.3407147143211056
Epoch: 57, step: 975, loss: 0.32040807604789734, mean loss: 0.3407144704971025
Epoch: 57, step: 976, loss: 0.3183501958847046, mean loss: 0.34071420197006147
Epoch: 57, step: 977, loss: 0.3113037049770355, mean loss: 0.3407138488435217
Epoch: 57, step: 978, loss: 0.3289555311203003, mean loss: 0.34071370766521386
Epoch: 57, step: 979, loss: 0.36619290709495544, mean loss: 0.34071401358202574
Epoch: 57, step: 980, loss: 0.2987874448299408, mean loss: 0.340713510195399
Epoch: 57, step: 981, loss: 0.3188454210758209, mean loss: 0.3407132476418017
Epoch: 57, step: 982, loss: 0.3449989855289459, mean loss: 0.3407132990967955
Epoch: 57, step: 983, loss: 0.35113003849983215, mean loss: 0.3407134241596995
Epoch: 57, step: 984, loss: 0.3814976215362549, mean loss: 0.34071391380705734
Epoch: 57, step: 985, loss: 0.3370037376880646, mean loss: 0.34071386926391956
Epoch: 57, step: 986, loss: 0.31288355588912964, mean loss: 0.340713535146465
Epoch: 57, step: 987, loss: 0.3663715124130249, mean loss: 0.3407138431801913
Epoch: 57, step: 988, loss: 0.3145533502101898, mean loss: 0.34071352911734426
Epoch: 57, step: 989, loss: 0.33670735359191895, mean loss: 0.3407134810228459
Epoch: 57, step: 990, loss: 0.352488249540329, mean loss: 0.34071362237830655
Epoch: 57, step: 991, loss: 0.36181655526161194, mean loss: 0.34071387571483575
Epoch: 57, step: 992, loss: 0.3483009934425354, mean loss: 0.3407139667955878
Epoch: 57, step: 993, loss: 0.3200487196445465, mean loss: 0.3407137187193453
Epoch: 57, step: 994, loss: 0.3071043789386749, mean loss: 0.3407133152604089
Epoch: 57, step: 995, loss: 0.32351675629615784, mean loss: 0.34071310882903744
Epoch: 57, step: 996, loss: 0.3520697057247162, mean loss: 0.34071324515455087
Epoch: 57, step: 997, loss: 0.3226698935031891, mean loss: 0.3407130285632891
Epoch: 57, step: 998, loss: 0.2994478642940521, mean loss: 0.3407125332247909
Epoch: 57, step: 999, loss: 0.3928588032722473, mean loss: 0.3407131591703189
Epoch: 57, step: 1000, loss: 0.2674389183521271, mean loss: 0.34071227962260114
Epoch: 57, step: 1001, loss: 0.32652464509010315, mean loss: 0.3407121093233029
Epoch: 57, step: 1002, loss: 0.3229968249797821, mean loss: 0.3407118966829032
Epoch: 57, step: 1003, loss: 0.3058074116706848, mean loss: 0.340711477721829
Epoch: 57, step: 1004, loss: 0.3248046338558197, mean loss: 0.340711286793116
Epoch: 57, step: 1005, loss: 0.34461790323257446, mean loss: 0.34071133368339185
Epoch: 57, step: 1006, loss: 0.3655162453651428, mean loss: 0.3407116314078314
Epoch: 57, step: 1007, loss: 0.32296091318130493, mean loss: 0.34071141835489765
Epoch: 57, step: 1008, loss: 0.3499644696712494, mean loss: 0.34071152941328087
Epoch: 57, step: 1009, loss: 0.3351021409034729, mean loss: 0.34071146208823094
Epoch: 57, step: 1010, loss: 0.33154919743537903, mean loss: 0.34071135212214093
Epoch: 57, step: 1011, loss: 0.3318660855293274, mean loss: 0.3407112459619562
Epoch: 57, step: 1012, loss: 0.30404379963874817, mean loss: 0.34071080588746927
Epoch: 57, step: 1013, loss: 0.32140886783599854, mean loss: 0.3407105742327076
Epoch: 57, step: 1014, loss: 0.30858114361763, mean loss: 0.3407101886317257
Epoch: 57, step: 1015, loss: 0.3296580910682678, mean loss: 0.34071005599169923
Epoch: 57, step: 1016, loss: 0.34624743461608887, mean loss: 0.34071012244688825
Epoch: 57, step: 1017, loss: 0.32609307765960693, mean loss: 0.3407099470269139
Epoch: 57, step: 1018, loss: 0.32808220386505127, mean loss: 0.34070979548247854
Epoch: 57, step: 1019, loss: 0.34502288699150085, mean loss: 0.34070984724288933
Epoch: 57, step: 1020, loss: 0.33275970816612244, mean loss: 0.3407097518362593
Epoch: 57, step: 1021, loss: 0.3236877918243408, mean loss: 0.3407095475645683
Epoch: 57, step: 1022, loss: 0.37015196681022644, mean loss: 0.3407099008834922
Epoch: 57, step: 1023, loss: 0.3159833550453186, mean loss: 0.3407096041601945
Epoch: 57, step: 1024, loss: 0.35190150141716003, mean loss: 0.34070973846349883
Epoch: 57, step: 1025, loss: 0.3580642640590668, mean loss: 0.34070994671613997
Epoch: 57, step: 1026, loss: 0.375316858291626, mean loss: 0.34071036199077337
Epoch: 57, step: 1027, loss: 0.35135218501091003, mean loss: 0.34071048968856327
Epoch: 57, step: 1028, loss: 0.33250048756599426, mean loss: 0.3407103911728725
Epoch: 57, step: 1029, loss: 0.3141671419143677, mean loss: 0.34071007267171743
Epoch: 57, step: 1030, loss: 0.3486797511577606, mean loss: 0.3407101683013565
Epoch: 57, step: 1031, loss: 0.32502511143684387, mean loss: 0.34070998009573056
Epoch: 57, step: 1032, loss: 0.3038980960845947, mean loss: 0.340709538393759
Epoch: 57, step: 1033, loss: 0.31368744373321533, mean loss: 0.3407092141623431
Epoch: 57, step: 1034, loss: 0.35635238885879517, mean loss: 0.3407094018586667
Epoch: 57, step: 1035, loss: 0.3448559045791626, mean loss: 0.34070945161033117
Epoch: 57, step: 1036, loss: 0.32309120893478394, mean loss: 0.34070924022101357
Epoch: 57, step: 1037, loss: 0.39575880765914917, mean loss: 0.34070990071542767
Epoch: 57, step: 1038, loss: 0.3600022494792938, mean loss: 0.3407101321856517
Epoch: 57, step: 1039, loss: 0.3025658428668976, mean loss: 0.34070967453472645
Epoch: 57, step: 1040, loss: 0.3273189961910248, mean loss: 0.34070951387679
Epoch: 57, step: 1041, loss: 0.3180558681488037, mean loss: 0.3407092420873991
Epoch: 57, step: 1042, loss: 0.37980788946151733, mean loss: 0.3407097111717217
Epoch: 57, step: 1043, loss: 0.3535757064819336, mean loss: 0.3407098655290894
Epoch: 57, step: 1044, loss: 0.33440542221069336, mean loss: 0.34070978989361955
Epoch: 57, step: 1045, loss: 0.33690550923347473, mean loss: 0.34070974425357037
Epoch: 57, step: 1046, loss: 0.3314442038536072, mean loss: 0.34070963309598656
Epoch: 57, step: 1047, loss: 0.3223312795162201, mean loss: 0.34070941261571425
Epoch: 57, step: 1048, loss: 0.3429854214191437, mean loss: 0.34070943992006547
Epoch: 57, step: 1049, loss: 0.3115193247795105, mean loss: 0.3407090897423364
Epoch: 57, step: 1050, loss: 0.2823517620563507, mean loss: 0.3407083896700264
Epoch: 57, step: 1051, loss: 0.3489052653312683, mean loss: 0.3407084880010684
Epoch: 57, step: 1052, loss: 0.324261873960495, mean loss: 0.3407082907072015
Epoch: 57, step: 1053, loss: 0.32852810621261597, mean loss: 0.34070814459525006
Epoch: 57, step: 1054, loss: 0.3197129964828491, mean loss: 0.34070789274313207
Epoch: 57, step: 1055, loss: 0.3171621859073639, mean loss: 0.34070761029858965
Epoch: 57, step: 1056, loss: 0.3645179569721222, mean loss: 0.3407078959142158
Epoch: 57, step: 1057, loss: 0.36721494793891907, mean loss: 0.3407082138741998
Epoch: 57, step: 1058, loss: 0.30453675985336304, mean loss: 0.34070777999203994
Epoch: 57, step: 1059, loss: 0.3245554566383362, mean loss: 0.34070758624475855
Epoch: 57, step: 1060, loss: 0.3455515503883362, mean loss: 0.3407076443474603
Epoch: 57, step: 1061, loss: 0.3407228887081146, mean loss: 0.3407076445303122
Epoch: 57, step: 1062, loss: 0.3400292694568634, mean loss: 0.34070763639348917
Epoch: 57, step: 1063, loss: 0.2860789895057678, mean loss: 0.34070698115375775
Epoch: 57, step: 1064, loss: 0.32988429069519043, mean loss: 0.34070685134326206
Epoch: 57, step: 1065, loss: 0.33967334032058716, mean loss: 0.34070683894717907
Epoch: 57, step: 1066, loss: 0.32643309235572815, mean loss: 0.34070666774781966
Epoch: 57, step: 1067, loss: 0.3324441909790039, mean loss: 0.34070656864883714
Epoch: 57, step: 1068, loss: 0.28687652945518494, mean loss: 0.34070592302667285
Epoch: 57, step: 1069, loss: 0.3222118318080902, mean loss: 0.3407057012164685
Epoch: 57, step: 1070, loss: 0.3510957360267639, mean loss: 0.34070582582859876
Epoch: 57, step: 1071, loss: 0.3493488132953644, mean loss: 0.3407059294864
Epoch: 57, step: 1072, loss: 0.32686275243759155, mean loss: 0.34070576346324066
Epoch: 57, step: 1073, loss: 0.32503318786621094, mean loss: 0.3407055755021028
Epoch: 57, step: 1074, loss: 0.3154555857181549, mean loss: 0.34070527268270573
Epoch: 57, step: 1075, loss: 0.35062676668167114, mean loss: 0.3407053916682905
Epoch: 57, step: 1076, loss: 0.306231290102005, mean loss: 0.3407049782354001
Epoch: 57, step: 1077, loss: 0.36706700921058655, mean loss: 0.34070529437996844
Epoch: 57, step: 1078, loss: 0.32997289299964905, mean loss: 0.34070516567403847
Epoch: 57, step: 1079, loss: 0.31139126420021057, mean loss: 0.34070481413782855
Epoch: 57, step: 1080, loss: 0.34476569294929504, mean loss: 0.340704862835844
Epoch: 57, step: 1081, loss: 0.3364466428756714, mean loss: 0.34070481177192796
Epoch: 57, step: 1082, loss: 0.34870803356170654, mean loss: 0.34070490774417667
Epoch: 57, step: 1083, loss: 0.36689493060112, mean loss: 0.3407052218033533
Epoch: 57, step: 1084, loss: 0.30396196246147156, mean loss: 0.34070478119971337
Epoch: 57, step: 1085, loss: 0.3364104628562927, mean loss: 0.3407047297053811
Epoch: 57, step: 1086, loss: 0.32086703181266785, mean loss: 0.3407044918290349
Epoch: 57, step: 1087, loss: 0.3130543828010559, mean loss: 0.34070416027705364
Epoch: 57, step: 1088, loss: 0.3208194673061371, mean loss: 0.34070392184290166
Epoch: 57, step: 1089, loss: 0.3010185658931732, mean loss: 0.34070344598789376
Epoch: 57, step: 1090, loss: 0.33273935317993164, mean loss: 0.3407033504940292
Epoch: 57, step: 1091, loss: 0.345074325799942, mean loss: 0.3407034029038051
Epoch: 57, step: 1092, loss: 0.44058096408843994, mean loss: 0.3407046004621219
Epoch: 57, step: 1093, loss: 0.36441904306411743, mean loss: 0.3407048848011378
Epoch: 57, step: 1094, loss: 0.3236364424228668, mean loss: 0.34070468015091687
Epoch: 57, step: 1095, loss: 0.3311222195625305, mean loss: 0.3407045652588183
Epoch: 57, step: 1096, loss: 0.3346535265445709, mean loss: 0.3407044927087468
Epoch: 57, step: 1097, loss: 0.31015241146087646, mean loss: 0.34070412640319025
Epoch: 57, step: 1098, loss: 0.3122963309288025, mean loss: 0.3407037858107283
Epoch: 57, step: 1099, loss: 0.34598690271377563, mean loss: 0.3407038491513779
Epoch: 57, step: 1100, loss: 0.32730406522750854, mean loss: 0.3407036884998424
Epoch: 57, step: 1101, loss: 0.30583611130714417, mean loss: 0.3407032704735003
Epoch: 57, step: 1102, loss: 0.36282673478126526, mean loss: 0.34070353570787354
Epoch: 57, step: 1103, loss: 0.3229219615459442, mean loss: 0.3407033225302233
Epoch: 57, step: 1104, loss: 0.3564925491809845, mean loss: 0.3407035118199821
Epoch: 57, step: 1105, loss: 0.283639520406723, mean loss: 0.34070282771429944
Epoch: 57, step: 1106, loss: 0.3489050567150116, mean loss: 0.34070292604468366
Epoch: 57, step: 1107, loss: 0.31238871812820435, mean loss: 0.34070258661090697
Epoch: 57, step: 1108, loss: 0.30680620670318604, mean loss: 0.3407021802623221
Epoch: 57, step: 1109, loss: 0.3262653946876526, mean loss: 0.34070200719672983
Epoch: 57, step: 1110, loss: 0.30652177333831787, mean loss: 0.3407015974551379
Epoch: 57, step: 1111, loss: 0.37391364574432373, mean loss: 0.3407019955856616
Epoch: 57, step: 1112, loss: 0.31726670265197754, mean loss: 0.3407017146576826
Epoch: 57, step: 1113, loss: 0.36643579602241516, mean loss: 0.34070202313843545
Epoch: 57, step: 1114, loss: 0.3558039963245392, mean loss: 0.3407022041673266
Epoch: 57, step: 1115, loss: 0.30498388409614563, mean loss: 0.3407017760133173
Epoch: 57, step: 1116, loss: 0.3513857424259186, mean loss: 0.34070190408004086
Epoch: 57, step: 1117, loss: 0.3044084906578064, mean loss: 0.34070146904284115
Epoch: 57, step: 1118, loss: 0.32641395926475525, mean loss: 0.3407012977852174
Epoch: 57, step: 1119, loss: 0.33808550238609314, mean loss: 0.3407012664312907
Epoch: 57, step: 1120, loss: 0.292479008436203, mean loss: 0.3407006884277428
Epoch: 57, step: 1121, loss: 0.32061269879341125, mean loss: 0.340700447651168
Epoch: 57, step: 1122, loss: 0.3329787254333496, mean loss: 0.34070035509897256
Epoch: 57, step: 1123, loss: 0.37245142459869385, mean loss: 0.34070073566122083
Epoch: 57, step: 1124, loss: 0.36848217248916626, mean loss: 0.3407010686402199
Epoch: 57, step: 1125, loss: 0.3288002610206604, mean loss: 0.3407009260028344
Epoch: 57, step: 1126, loss: 0.33054301142692566, mean loss: 0.34070080425639016
Epoch: 57, step: 1127, loss: 0.3640151023864746, mean loss: 0.34070108368371327
Epoch: 57, step: 1128, loss: 0.35527274012565613, mean loss: 0.34070125832633513
Epoch: 57, step: 1129, loss: 0.3161745071411133, mean loss: 0.3407009643745244
Epoch: 57, step: 1130, loss: 0.34138375520706177, mean loss: 0.3407009725576382
Epoch: 57, step: 1131, loss: 0.3453013300895691, mean loss: 0.3407010276913574
Epoch: 57, step: 1132, loss: 0.317911833524704, mean loss: 0.34070075457389515
Epoch: 57, step: 1133, loss: 0.3012952506542206, mean loss: 0.3407002823236624
Epoch: 57, step: 1134, loss: 0.3580978512763977, mean loss: 0.3407004908201085
Epoch: 57, step: 1135, loss: 0.349091500043869, mean loss: 0.3407005913786774
Epoch: 57, step: 1136, loss: 0.33824312686920166, mean loss: 0.34070056192856646
Epoch: 57, step: 1137, loss: 0.33204054832458496, mean loss: 0.3407004581487136
Epoch: 57, step: 1138, loss: 0.31817957758903503, mean loss: 0.3407001882662665
Epoch: 57, step: 1139, loss: 0.32501456141471863, mean loss: 0.3407000002973895
Epoch: 57, step: 1140, loss: 0.3280506134033203, mean loss: 0.3406998487151429
Epoch: 57, step: 1141, loss: 0.31317010521888733, mean loss: 0.34069951882007404
Epoch: 57, step: 1142, loss: 0.3551294803619385, mean loss: 0.340699691735456
Epoch: 57, step: 1143, loss: 0.31866419315338135, mean loss: 0.34069942768548017
Epoch: 57, step: 1144, loss: 0.3338473439216614, mean loss: 0.3406993455783808
Epoch: 57, step: 1145, loss: 0.31994491815567017, mean loss: 0.3406990968853592
Epoch: 57, step: 1146, loss: 0.3148476481437683, mean loss: 0.3406987871202314
Epoch: 57, step: 1147, loss: 0.3543960452079773, mean loss: 0.3406989512457357
Epoch: 57, step: 1148, loss: 0.3341057002544403, mean loss: 0.3406988722439624
Epoch: 57, step: 1149, loss: 0.29652756452560425, mean loss: 0.3406983429800486
Epoch: 57, step: 1150, loss: 0.33525553345680237, mean loss: 0.3406982777646791
Epoch: 57, step: 1151, loss: 0.3335115611553192, mean loss: 0.34069819165496656
Epoch: 57, step: 1152, loss: 0.30433931946754456, mean loss: 0.34069775601589936
Epoch: 57, step: 1153, loss: 0.2948830723762512, mean loss: 0.34069720708724155
Epoch: 57, step: 1154, loss: 0.334807425737381, mean loss: 0.3406971365196685
Epoch: 57, step: 1155, loss: 0.3697989284992218, mean loss: 0.3406974851944502
Epoch: 57, step: 1156, loss: 0.34485840797424316, mean loss: 0.3406975350467569
Epoch: 57, step: 1157, loss: 0.32815074920654297, mean loss: 0.3406973847246397
Epoch: 57, step: 1158, loss: 0.3742639720439911, mean loss: 0.3406977868786325
Epoch: 57, step: 1159, loss: 0.30862903594970703, mean loss: 0.3406974026744952
Epoch: 57, step: 1160, loss: 0.3296874761581421, mean loss: 0.34069727077011736
Epoch: 57, step: 1161, loss: 0.34988468885421753, mean loss: 0.340697380838622
Epoch: 57, step: 1162, loss: 0.352456271648407, mean loss: 0.34069752171258794
Epoch: 57, step: 1163, loss: 0.3172658383846283, mean loss: 0.3406972409994946
Epoch: 57, step: 1164, loss: 0.372018963098526, mean loss: 0.3406976162312713
Epoch: 57, step: 1165, loss: 0.33251383900642395, mean loss: 0.34069751819143584
Epoch: 57, step: 1166, loss: 0.31962132453918457, mean loss: 0.3406972657063367
Epoch: 57, step: 1167, loss: 0.3047761619091034, mean loss: 0.34069683538979306
Epoch: 57, step: 1168, loss: 0.33682432770729065, mean loss: 0.3406967889996774
Epoch: 57, step: 1169, loss: 0.34073665738105774, mean loss: 0.3406967894772689
Epoch: 57, step: 1170, loss: 0.33040130138397217, mean loss: 0.3406966661469931
Epoch: 57, step: 1171, loss: 0.3502855598926544, mean loss: 0.3406967810115564
Epoch: 57, step: 1172, loss: 0.33077409863471985, mean loss: 0.3406966621499906
Epoch: 57, step: 1173, loss: 0.3206188678741455, mean loss: 0.3406964216455193
Epoch: 57, step: 1174, loss: 0.31929925084114075, mean loss: 0.3406961653397947
Epoch: 57, step: 1175, loss: 0.3107227385044098, mean loss: 0.3406958063078025
Epoch: 57, step: 1176, loss: 0.3173235058784485, mean loss: 0.34069552634972106
Epoch: 57, step: 1177, loss: 0.320334255695343, mean loss: 0.34069528246127684
Epoch: 57, step: 1178, loss: 0.3130945861339569, mean loss: 0.34069495186254495
Epoch: 57, step: 1179, loss: 0.3192380964756012, mean loss: 0.3406946948572821
Epoch: 57, step: 1180, loss: 0.35492920875549316, mean loss: 0.34069486535296295
Epoch: 57, step: 1181, loss: 0.3247610032558441, mean loss: 0.3406946745054112
Epoch: 57, step: 1182, loss: 0.3270164728164673, mean loss: 0.3406945106769544
Epoch: 57, step: 1183, loss: 0.35143011808395386, mean loss: 0.3406946392594222
Epoch: 57, step: 1184, loss: 0.33437371253967285, mean loss: 0.3406945635533544
Epoch: 57, step: 1185, loss: 0.34312987327575684, mean loss: 0.3406945927208362
Epoch: 57, step: 1186, loss: 0.3366909325122833, mean loss: 0.34069454476993843
Epoch: 57, step: 1187, loss: 0.33592694997787476, mean loss: 0.3406944876702595
Epoch: 57, step: 1188, loss: 0.3089817464351654, mean loss: 0.34069410786330556
Epoch: 57, step: 1189, loss: 0.30861586332321167, mean loss: 0.34069372368351036
Epoch: 57, step: 1190, loss: 0.34465229511260986, mean loss: 0.3406937710921192
Epoch: 57, step: 1191, loss: 0.330057293176651, mean loss: 0.3406936437091501
Epoch: 57, step: 1192, loss: 0.3246120810508728, mean loss: 0.34069345111789184
Epoch: 57, step: 1193, loss: 0.307590126991272, mean loss: 0.34069305468039185
Epoch: 57, step: 1194, loss: 0.34614336490631104, mean loss: 0.34069311995122314
Epoch: 57, step: 1195, loss: 0.3384358882904053, mean loss: 0.34069309291980354
Epoch: 57, step: 1196, loss: 0.31410351395606995, mean loss: 0.3406927745007991
Epoch: 57, step: 1197, loss: 0.3288877606391907, mean loss: 0.3406926331335457
Epoch: 57, step: 1198, loss: 0.34770044684410095, mean loss: 0.34069271705242327
Epoch: 57, step: 1199, loss: 0.3007325232028961, mean loss: 0.3406922385330736
Epoch: 57, step: 1200, loss: 0.32188475131988525, mean loss: 0.3406920133179805
Epoch: 57, step: 1201, loss: 0.3386431336402893, mean loss: 0.3406919887834376
Epoch: 57, step: 1202, loss: 0.3919069468975067, mean loss: 0.34069260205543905
Epoch: 57, step: 1203, loss: 0.3491184711456299, mean loss: 0.3406927029495512
Epoch: 57, step: 1204, loss: 0.34651342034339905, mean loss: 0.3406927726478903
Epoch: 57, step: 1205, loss: 0.3271550238132477, mean loss: 0.3406926105463404
Epoch: 57, step: 1206, loss: 0.3306526839733124, mean loss: 0.3406924903292947
Epoch: 57, step: 1207, loss: 0.3758825659751892, mean loss: 0.3406929116865873
Epoch: 57, step: 1208, loss: 0.33983010053634644, mean loss: 0.3406929013556229
Epoch: 57, step: 1209, loss: 0.34921592473983765, mean loss: 0.3406930034057604
Epoch: 57, step: 1210, loss: 0.32445839047431946, mean loss: 0.3406928090234889
Epoch: 57, step: 1211, loss: 0.3446000814437866, mean loss: 0.3406928558059652
Epoch: 57, step: 1212, loss: 0.31142759323120117, mean loss: 0.3406925054119017
Epoch: 57, step: 1213, loss: 0.3498821258544922, mean loss: 0.34069261543824736
Epoch: 57, step: 1214, loss: 0.3006538152694702, mean loss: 0.3406921360637018
Epoch: 57, step: 1215, loss: 0.3196032643318176, mean loss: 0.3406918835749353
Epoch: 57, step: 1216, loss: 0.3206649422645569, mean loss: 0.34069164380311473
Epoch: 57, step: 1217, loss: 0.35071805119514465, mean loss: 0.34069176384247246
Epoch: 57, step: 1218, loss: 0.3418351709842682, mean loss: 0.3406917775315448
Epoch: 57, step: 1219, loss: 0.33338919281959534, mean loss: 0.3406916901047572
Epoch: 57, step: 1220, loss: 0.4551638066768646, mean loss: 0.3406930605523451
Epoch: 57, step: 1221, loss: 0.3258236348628998, mean loss: 0.3406928825393475
Epoch: 57, step: 1222, loss: 0.3157619833946228, mean loss: 0.3406925840765116
Epoch: 57, step: 1223, loss: 0.30955007672309875, mean loss: 0.3406922112552293
Epoch: 57, step: 1224, loss: 0.3462072014808655, mean loss: 0.340692277276924
Epoch: 57, step: 1225, loss: 0.3157782256603241, mean loss: 0.3406919790264917
Epoch: 57, step: 1226, loss: 0.3317238986492157, mean loss: 0.34069187166933146
Epoch: 57, step: 1227, loss: 0.33905309438705444, mean loss: 0.3406918520517141
Epoch: 57, step: 1228, loss: 0.2946930527687073, mean loss: 0.3406913014118864
Epoch: 57, step: 1229, loss: 0.29063329100608826, mean loss: 0.34069070218745673
Epoch: 57, step: 1230, loss: 0.32571256160736084, mean loss: 0.3406905228922703
Epoch: 57, step: 1231, loss: 0.3586733639240265, mean loss: 0.34069073815251727
Epoch: 57, step: 1232, loss: 0.31023427844047546, mean loss: 0.3406903735835067
Epoch: 57, step: 1233, loss: 0.36286747455596924, mean loss: 0.34069063904400526
Epoch: 57, step: 1234, loss: 0.3022075593471527, mean loss: 0.34069017840601407
Epoch: 57, step: 1235, loss: 0.31851184368133545, mean loss: 0.34068991293710277
Epoch: 57, step: 1236, loss: 0.34557783603668213, mean loss: 0.34068997144357355
Epoch: 57, step: 1237, loss: 0.34079334139823914, mean loss: 0.34068997268085544
Epoch: 57, step: 1238, loss: 0.34006792306900024, mean loss: 0.3406899652353504
Epoch: 57, step: 1239, loss: 0.3189961910247803, mean loss: 0.3406897055789348
Epoch: 57, step: 1240, loss: 0.3150899410247803, mean loss: 0.34068939917473423
Epoch: 57, step: 1241, loss: 0.30367693305015564, mean loss: 0.340688956176935
Epoch: 57, step: 1242, loss: 0.31485190987586975, mean loss: 0.340688646940106
Epoch: 57, step: 1243, loss: 0.3336677551269531, mean loss: 0.34068856290989946
Epoch: 57, step: 1244, loss: 0.40301916003227234, mean loss: 0.34068930891060706
Epoch: 57, step: 1245, loss: 0.3081784248352051, mean loss: 0.34068891981033567
Epoch: 57, step: 1246, loss: 0.3093477785587311, mean loss: 0.34068854471439586
Epoch: 57, step: 1247, loss: 0.30008649826049805, mean loss: 0.3406880587882331
Epoch: 57, step: 1248, loss: 0.34209197759628296, mean loss: 0.3406880755901624
Epoch: 57, step: 1249, loss: 0.34740200638771057, mean loss: 0.3406881559407069
Epoch: 57, step: 1250, loss: 0.3158663809299469, mean loss: 0.3406878588838368
Epoch: 57, step: 1251, loss: 0.3495935797691345, mean loss: 0.3406879654625932
Epoch: 57, step: 1252, loss: 0.33751365542411804, mean loss: 0.3406879274746558
Epoch: 57, step: 1253, loss: 0.3283601999282837, mean loss: 0.3406877799467419
Epoch: 57, step: 1254, loss: 0.3576138913631439, mean loss: 0.340687982501837
Epoch: 57, step: 1255, loss: 0.2963877320289612, mean loss: 0.34068745236624665
Epoch: 57, step: 1256, loss: 0.328084260225296, mean loss: 0.3406873015472179
Epoch: 57, step: 1257, loss: 0.3116745948791504, mean loss: 0.3406869543640732
Epoch: 57, step: 1258, loss: 0.3255155682563782, mean loss: 0.3406867728164993
Epoch: 57, step: 1259, loss: 0.3434986472129822, mean loss: 0.34068680646424
Epoch: 57, step: 1260, loss: 0.3708416521549225, mean loss: 0.34068716730193926
Epoch: 57, step: 1261, loss: 0.32650771737098694, mean loss: 0.3406869976304072
Epoch: 57, step: 1262, loss: 0.31872692704200745, mean loss: 0.34068673485898426
Epoch: 57, step: 1263, loss: 0.3213917016983032, mean loss: 0.34068650397982425
Epoch: 57, step: 1264, loss: 0.31096750497817993, mean loss: 0.34068614837455696
Epoch: 57, step: 1265, loss: 0.3986435532569885, mean loss: 0.34068684186062775
Epoch: 57, step: 1266, loss: 0.3126511573791504, mean loss: 0.3406865064052346
Epoch: 57, step: 1267, loss: 0.314852237701416, mean loss: 0.3406861972941417
Epoch: 57, step: 1268, loss: 0.31171390414237976, mean loss: 0.3406858506402399
Epoch: 57, step: 1269, loss: 0.3309319019317627, mean loss: 0.3406857339355005
Epoch: 57, step: 1270, loss: 0.2998259663581848, mean loss: 0.34068524505949604
Epoch: 57, step: 1271, loss: 0.31997549533843994, mean loss: 0.3406849972759387
Epoch: 57, step: 1272, loss: 0.41361942887306213, mean loss: 0.34068586989569194
Epoch: 57, step: 1273, loss: 0.3078063428401947, mean loss: 0.34068547651521464
Epoch: 57, step: 1274, loss: 0.316741019487381, mean loss: 0.34068519004001
Epoch: 57, step: 1275, loss: 0.31684285402297974, mean loss: 0.3406849047900098
Epoch: 57, step: 1276, loss: 0.3292767405509949, mean loss: 0.340684768304226
Epoch: 57, step: 1277, loss: 0.33652517199516296, mean loss: 0.3406847185399556
Epoch: 57, step: 1278, loss: 0.328921914100647, mean loss: 0.3406845778146701
Epoch: 57, step: 1279, loss: 0.3342112600803375, mean loss: 0.34068450037152354
Epoch: 57, step: 1280, loss: 0.3079662322998047, mean loss: 0.34068410895317813
Epoch: 57, step: 1281, loss: 0.32566988468170166, mean loss: 0.3406839293357087
Epoch: 57, step: 1282, loss: 0.30580922961235046, mean loss: 0.3406835121293142
Epoch: 57, step: 1283, loss: 0.35655906796455383, mean loss: 0.34068370204648135
Epoch: 57, step: 1284, loss: 0.33795663714408875, mean loss: 0.3406836694233562
Epoch: 57, step: 1285, loss: 0.3426913619041443, mean loss: 0.3406836934405402
Epoch: 57, step: 1286, loss: 0.3201075494289398, mean loss: 0.34068344729969435
Epoch: 57, step: 1287, loss: 0.29939135909080505, mean loss: 0.34068295335156035
Epoch: 57, step: 1288, loss: 0.31608960032463074, mean loss: 0.34068265916213936
Epoch: 57, step: 1289, loss: 0.31353166699409485, mean loss: 0.3406823343817359
Epoch: 57, step: 1290, loss: 0.31260982155799866, mean loss: 0.34068199858211123
Epoch: 57, step: 1291, loss: 0.3388090133666992, mean loss: 0.34068197617798185
Epoch: 57, step: 1292, loss: 0.31993287801742554, mean loss: 0.34068172798599655
Epoch: 57, step: 1293, loss: 0.3457240164279938, mean loss: 0.3406817882990087
Epoch: 57, step: 1294, loss: 0.32778674364089966, mean loss: 0.340681634057598
Epoch: 57, step: 1295, loss: 0.36347496509552, mean loss: 0.3406819066920537
Epoch: 57, step: 1296, loss: 0.3490014970302582, mean loss: 0.340682006202733
Epoch: 57, step: 1297, loss: 0.31131625175476074, mean loss: 0.34068165496293623
Epoch: 57, step: 1298, loss: 0.286354124546051, mean loss: 0.34068100516650274
Epoch: 57, step: 1299, loss: 0.3670932352542877, mean loss: 0.34068132107203913
Epoch: 57, step: 1300, loss: 0.31924426555633545, mean loss: 0.3406810646755326
Epoch: 57, step: 1301, loss: 0.34877198934555054, mean loss: 0.3406811614453528
Epoch: 57, step: 1302, loss: 0.35350579023361206, mean loss: 0.3406813148298212
Epoch: 57, step: 1303, loss: 0.3486047089099884, mean loss: 0.3406814095936599
Epoch: 57, step: 1304, loss: 0.33667269349098206, mean loss: 0.3406813616499657
Epoch: 57, step: 1305, loss: 0.343788206577301, mean loss: 0.3406813988069601
Epoch: 57, step: 1306, loss: 0.321929931640625, mean loss: 0.3406811745473516
Epoch: 57, step: 1307, loss: 0.3394136130809784, mean loss: 0.3406811593880344
Epoch: 57, step: 1308, loss: 0.2917003035545349, mean loss: 0.34068057361174686
Epoch: 57, step: 1309, loss: 0.4297207295894623, mean loss: 0.34068163845611027
Epoch: 57, step: 1310, loss: 0.3432341516017914, mean loss: 0.34068166898162655
Epoch: 57, step: 1311, loss: 0.3441746234893799, mean loss: 0.34068171075338577
Epoch: 57, step: 1312, loss: 0.3535420894622803, mean loss: 0.3406818645470346
Epoch: 57, step: 1313, loss: 0.34246692061424255, mean loss: 0.3406818858937623
Epoch: 57, step: 1314, loss: 0.2896842062473297, mean loss: 0.34068127604145315
Epoch: 57, step: 1315, loss: 0.3851383626461029, mean loss: 0.3406818076721645
Epoch: 57, step: 1316, loss: 0.332165390253067, mean loss: 0.34068170583159746
Epoch: 57, step: 1317, loss: 0.3377246558666229, mean loss: 0.34068167047118364
Epoch: 57, step: 1318, loss: 0.3442254960536957, mean loss: 0.3406817128477556
Epoch: 57, step: 1319, loss: 0.33887818455696106, mean loss: 0.3406816912816738
Epoch: 57, step: 1320, loss: 0.3555487394332886, mean loss: 0.34068186905551007
Epoch: 57, step: 1321, loss: 0.3552178144454956, mean loss: 0.340682042868082
Epoch: 57, step: 1322, loss: 0.324580579996109, mean loss: 0.3406818503382441
Epoch: 57, step: 1323, loss: 0.3421182930469513, mean loss: 0.3406818675139987
Epoch: 57, step: 1324, loss: 0.36472761631011963, mean loss: 0.34068215502908
Epoch: 57, step: 1325, loss: 0.3272058665752411, mean loss: 0.3406819938949904
Epoch: 57, step: 1326, loss: 0.3170599341392517, mean loss: 0.34068171145271436
Epoch: 57, step: 1327, loss: 0.36616018414497375, mean loss: 0.3406820160879515
Epoch: 57, step: 1328, loss: 0.3039182126522064, mean loss: 0.34068157652408104
Epoch: 57, step: 1329, loss: 0.34265318512916565, mean loss: 0.340681600097201
Epoch: 57, step: 1330, loss: 0.3127690553665161, mean loss: 0.3406812663707728
Epoch: 57, step: 1331, loss: 0.3459966778755188, mean loss: 0.3406813299218429
Epoch: 57, step: 1332, loss: 0.324126273393631, mean loss: 0.34068113199192185
Epoch: 57, step: 1333, loss: 0.32190462946891785, mean loss: 0.3406809075053897
Epoch: 57, step: 1334, loss: 0.3898238241672516, mean loss: 0.34068149503712175
Epoch: 57, step: 1335, loss: 0.32914498448371887, mean loss: 0.3406813571131756
Epoch: 57, step: 1336, loss: 0.3084915280342102, mean loss: 0.3406809722745232
Epoch: 57, step: 1337, loss: 0.34146955609321594, mean loss: 0.34068098170215655
Epoch: 57, step: 1338, loss: 0.3432142436504364, mean loss: 0.3406810119873066
Epoch: 57, step: 1339, loss: 0.3541317284107208, mean loss: 0.34068117278871757
Epoch: 57, step: 1340, loss: 0.32834288477897644, mean loss: 0.3406810252879942
Epoch: 57, step: 1341, loss: 0.31934037804603577, mean loss: 0.3406807701696769
Epoch: 57, step: 1342, loss: 0.32260897755622864, mean loss: 0.3406805541317023
Epoch: 57, step: 1343, loss: 0.3136749863624573, mean loss: 0.3406802312993998
Epoch: 57, step: 1344, loss: 0.3504812717437744, mean loss: 0.34068034846244766
Epoch: 57, step: 1345, loss: 0.319496750831604, mean loss: 0.3406800952337003
Epoch: 57, step: 1346, loss: 0.3117595314979553, mean loss: 0.340679749521385
Epoch: 57, step: 1347, loss: 0.3233589231967926, mean loss: 0.34067954247315985
Epoch: 57, step: 1348, loss: 0.33087390661239624, mean loss: 0.3406794252607824
Epoch: 57, step: 1349, loss: 0.30359557271003723, mean loss: 0.3406789819815676
Epoch: 57, step: 1350, loss: 0.3225748538970947, mean loss: 0.34067876557773674
Epoch: 57, step: 1351, loss: 0.30279988050460815, mean loss: 0.34067831280598115
Epoch: 57, step: 1352, loss: 0.35696715116500854, mean loss: 0.3406785075064791
Epoch: 57, step: 1353, loss: 0.34501832723617554, mean loss: 0.34067855937972774
Epoch: 57, step: 1354, loss: 0.3139137923717499, mean loss: 0.34067823946809406
Epoch: 57, step: 1355, loss: 0.3152606785297394, mean loss: 0.340677935662862
Epoch: 57, step: 1356, loss: 0.30862268805503845, mean loss: 0.34067755252478027
Epoch: 57, step: 1357, loss: 0.3117561638355255, mean loss: 0.34067720684805747
Epoch: 57, step: 1358, loss: 0.3198035955429077, mean loss: 0.34067695736365733
Epoch: 57, step: 1359, loss: 0.3156486451625824, mean loss: 0.3406766582252508
Epoch: 57, step: 1360, loss: 0.3184053599834442, mean loss: 0.34067639204185857
Epoch: 57, step: 1361, loss: 0.3158924877643585, mean loss: 0.3406760958316963
Epoch: 57, step: 1362, loss: 0.3795010447502136, mean loss: 0.3406765598508776
Epoch: 57, step: 1363, loss: 0.296568363904953, mean loss: 0.34067603269488816
Epoch: 57, step: 1364, loss: 0.3311149775981903, mean loss: 0.34067591842797895
Epoch: 57, step: 1365, loss: 0.3648058772087097, mean loss: 0.3406762068085844
Epoch: 57, step: 1366, loss: 0.31658315658569336, mean loss: 0.3406759188725196
Epoch: 57, step: 1367, loss: 0.38881760835647583, mean loss: 0.34067649420701795
Epoch: 57, step: 1368, loss: 0.3506743609905243, mean loss: 0.340676613688677
Epoch: 57, step: 1369, loss: 0.2947581708431244, mean loss: 0.3406760649369998
Epoch: 57, step: 1370, loss: 0.3097982406616211, mean loss: 0.34067569593373404
Epoch: 57, step: 1371, loss: 0.32198619842529297, mean loss: 0.34067547258887854
Epoch: 57, step: 1372, loss: 0.32756561040878296, mean loss: 0.3406753159241377
Epoch: 57, step: 1373, loss: 0.2834053933620453, mean loss: 0.34067463154849464
Epoch: 57, step: 1374, loss: 0.3545876145362854, mean loss: 0.3406747978066712
Epoch: 57, step: 1375, loss: 0.3443825840950012, mean loss: 0.34067484211366283
Epoch: 57, step: 1376, loss: 0.29136592149734497, mean loss: 0.3406742528931261
Epoch: 57, step: 1377, loss: 0.31697654724121094, mean loss: 0.34067396971905095
Epoch: 57, step: 1378, loss: 0.340888112783432, mean loss: 0.3406739722779079
Epoch: 57, step: 1379, loss: 0.3627670109272003, mean loss: 0.3406742362708179
Epoch: 57, step: 1380, loss: 0.3766070306301117, mean loss: 0.34067466563183735
Epoch: 57, step: 1381, loss: 0.36556893587112427, mean loss: 0.3406749630899595
Epoch: 57, step: 1382, loss: 0.315014511346817, mean loss: 0.3406746564805063
Epoch: 57, step: 1383, loss: 0.31212466955184937, mean loss: 0.34067431534889364
Epoch: 57, step: 1384, loss: 0.30898746848106384, mean loss: 0.34067393674080376
Epoch: 57, step: 1385, loss: 0.3415181040763855, mean loss: 0.34067394682715807
Epoch: 57, step: 1386, loss: 0.32586824893951416, mean loss: 0.34067376992653214
Epoch: 57, step: 1387, loss: 0.32745975255966187, mean loss: 0.34067361204542235
Epoch: 57, step: 1388, loss: 0.3044339418411255, mean loss: 0.34067317905893296
Epoch: 57, step: 1389, loss: 0.32456114888191223, mean loss: 0.3406729865569595
Epoch: 57, step: 1390, loss: 0.30699971318244934, mean loss: 0.3406725842430325
Epoch: 57, step: 1391, loss: 0.3336271643638611, mean loss: 0.34067250006836247
Epoch: 57, step: 1392, loss: 0.31168872117996216, mean loss: 0.34067215379079246
Epoch: 57, step: 1393, loss: 0.3704836368560791, mean loss: 0.34067250995292797
Epoch: 57, step: 1394, loss: 0.34883591532707214, mean loss: 0.34067260748115724
Epoch: 57, step: 1395, loss: 0.3270818889141083, mean loss: 0.34067244511474026
Epoch: 57, step: 1396, loss: 0.3290185332298279, mean loss: 0.3406723058887456
Epoch: 57, step: 1397, loss: 0.3119599521160126, mean loss: 0.3406719628744602
Epoch: 57, step: 1398, loss: 0.33265915513038635, mean loss: 0.3406718671499958
Epoch: 57, step: 1399, loss: 0.37943750619888306, mean loss: 0.3406723302555419
Epoch: 57, step: 1400, loss: 0.34788814187049866, mean loss: 0.3406724164566865
Epoch: 57, step: 1401, loss: 0.3170396089553833, mean loss: 0.3406721341390721
Epoch: 57, step: 1402, loss: 0.3413892984390259, mean loss: 0.3406721427062174
Epoch: 57, step: 1403, loss: 0.3464818298816681, mean loss: 0.34067221210710585
Epoch: 57, step: 1404, loss: 0.3377038240432739, mean loss: 0.34067217664800076
Epoch: 57, step: 1405, loss: 0.3480377793312073, mean loss: 0.340672264633316
Epoch: 57, step: 1406, loss: 0.3204449415206909, mean loss: 0.340672023012064
Epoch: 57, step: 1407, loss: 0.3808756172657013, mean loss: 0.3406725032499427
Epoch: 57, step: 1408, loss: 0.34253281354904175, mean loss: 0.3406725254713589
Epoch: 57, step: 1409, loss: 0.3113337457180023, mean loss: 0.3406721750236684
Epoch: 57, step: 1410, loss: 0.3575269877910614, mean loss: 0.34067237634968484
Epoch: 57, step: 1411, loss: 0.31448477506637573, mean loss: 0.3406720635498606
Epoch: 57, step: 1412, loss: 0.3323225677013397, mean loss: 0.34067196381985443
Epoch: 57, step: 1413, loss: 0.33319559693336487, mean loss: 0.34067187451994657
Epoch: 57, step: 1414, loss: 0.3397339880466461, mean loss: 0.3406718633176906
Epoch: 57, step: 1415, loss: 0.3221152126789093, mean loss: 0.3406716416769348
Epoch: 57, step: 1416, loss: 0.2972806394100189, mean loss: 0.3406711234207119
Epoch: 57, step: 1417, loss: 0.362777978181839, mean loss: 0.3406713874588214
Epoch: 57, step: 1418, loss: 0.3290458917617798, mean loss: 0.34067124860880055
Epoch: 57, step: 1419, loss: 0.3061950206756592, mean loss: 0.3406708368441826
Epoch: 57, step: 1420, loss: 0.36022067070007324, mean loss: 0.3406710703335812
Epoch: 57, step: 1421, loss: 0.41779249906539917, mean loss: 0.34067199140641924
Epoch: 57, step: 1422, loss: 0.3109196126461029, mean loss: 0.3406716360735227
Epoch: 57, step: 1423, loss: 0.31503358483314514, mean loss: 0.3406713298817293
Epoch: 57, step: 1424, loss: 0.31635162234306335, mean loss: 0.340671039438206
Epoch: 57, step: 1425, loss: 0.33748650550842285, mean loss: 0.3406710014066545
Epoch: 57, step: 1426, loss: 0.31505531072616577, mean loss: 0.34067069549287077
Epoch: 57, step: 1427, loss: 0.34077078104019165, mean loss: 0.3406706966881219
Epoch: 57, step: 1428, loss: 0.2994420528411865, mean loss: 0.34067020432938144
Epoch: 57, step: 1429, loss: 0.32351064682006836, mean loss: 0.34066999940978093
Epoch: 57, step: 1430, loss: 0.3209790587425232, mean loss: 0.34066976426318657
Epoch: 57, step: 1431, loss: 0.3743576109409332, mean loss: 0.3406701665541667
Epoch: 57, step: 1432, loss: 0.3169735074043274, mean loss: 0.34066988357857353
Epoch: 57, step: 1433, loss: 0.335360586643219, mean loss: 0.3406698201779271
Epoch: 57, step: 1434, loss: 0.3278350234031677, mean loss: 0.3406696669138122
Epoch: 57, step: 1435, loss: 0.310094952583313, mean loss: 0.34066930181644006
Epoch: 57, step: 1436, loss: 0.3672560155391693, mean loss: 0.3406696192886918
Epoch: 57, step: 1437, loss: 0.3554324209690094, mean loss: 0.34066979556937005
Epoch: 57, step: 1438, loss: 0.32036834955215454, mean loss: 0.34066955315536096
Epoch: 57, step: 1439, loss: 0.3185429573059082, mean loss: 0.3406692889508922
Epoch: 57, step: 1440, loss: 0.366917222738266, mean loss: 0.3406696023627991
Epoch: 57, step: 1441, loss: 0.32893234491348267, mean loss: 0.34066946221644145
Epoch: 57, step: 1442, loss: 0.3212151527404785, mean loss: 0.34066922992895265
Epoch: 57, step: 1443, loss: 0.35426366329193115, mean loss: 0.3406693922466688
Valid: 57, mean loss: 0.1848177214463552
Epoch: 58, step: 0, loss: 0.34084609150886536, mean loss: 0.3406693943564352
Epoch: 58, step: 1, loss: 0.3112853765487671, mean loss: 0.3406690435192476
Epoch: 58, step: 2, loss: 0.32315579056739807, mean loss: 0.3406688344182632
Epoch: 58, step: 3, loss: 0.33332955837249756, mean loss: 0.3406687467913941
Epoch: 58, step: 4, loss: 0.35094645619392395, mean loss: 0.3406688695000561
Epoch: 58, step: 5, loss: 0.29040083289146423, mean loss: 0.34066826934202216
Epoch: 58, step: 6, loss: 0.2961599826812744, mean loss: 0.3406677379568974
Epoch: 58, step: 7, loss: 0.2958715260028839, mean loss: 0.34066720314061333
Epoch: 58, step: 8, loss: 0.28499019145965576, mean loss: 0.34066653842777944
Epoch: 58, step: 9, loss: 0.3008025586605072, mean loss: 0.3406660625081528
Epoch: 58, step: 10, loss: 0.3355226516723633, mean loss: 0.3406660011038235
Epoch: 58, step: 11, loss: 0.3672812879085541, mean loss: 0.34066631884517784
Epoch: 58, step: 12, loss: 0.3148888647556305, mean loss: 0.34066601110979805
Epoch: 58, step: 13, loss: 0.3203901946544647, mean loss: 0.34066576905674006
Epoch: 58, step: 14, loss: 0.30712172389030457, mean loss: 0.3406653686121119
Epoch: 58, step: 15, loss: 0.32495346665382385, mean loss: 0.3406651810476248
Epoch: 58, step: 16, loss: 0.36053451895713806, mean loss: 0.34066541823963986
Epoch: 58, step: 17, loss: 0.3184584975242615, mean loss: 0.34066515314568363
Epoch: 58, step: 18, loss: 0.2990841269493103, mean loss: 0.34066465678028035
Epoch: 58, step: 19, loss: 0.344931036233902, mean loss: 0.34066470770874635
Epoch: 58, step: 20, loss: 0.3595496416091919, mean loss: 0.3406649331385853
Epoch: 58, step: 21, loss: 0.3340698480606079, mean loss: 0.34066485441386074
Epoch: 58, step: 22, loss: 0.37250328063964844, mean loss: 0.34066523446072705
Epoch: 58, step: 23, loss: 0.3490000069141388, mean loss: 0.34066533394951204
Epoch: 58, step: 24, loss: 0.3355933725833893, mean loss: 0.34066527340829705
Epoch: 58, step: 25, loss: 0.32395726442337036, mean loss: 0.34066507397635803
Epoch: 58, step: 26, loss: 0.34365320205688477, mean loss: 0.340665109643149
Epoch: 58, step: 27, loss: 0.30540362000465393, mean loss: 0.3406646887612006
Epoch: 58, step: 28, loss: 0.29977381229400635, mean loss: 0.34066420069258757
Epoch: 58, step: 29, loss: 0.3237667679786682, mean loss: 0.34066399900925803
Epoch: 58, step: 30, loss: 0.30004817247390747, mean loss: 0.34066351423518054
Epoch: 58, step: 31, loss: 0.34473705291748047, mean loss: 0.34066356285471033
Epoch: 58, step: 32, loss: 0.3245675563812256, mean loss: 0.3406633707438734
Epoch: 58, step: 33, loss: 0.3404109477996826, mean loss: 0.34066336773116307
Epoch: 58, step: 34, loss: 0.3285400867462158, mean loss: 0.3406632230394927
Epoch: 58, step: 35, loss: 0.3417009115219116, mean loss: 0.34066323542418364
Epoch: 58, step: 36, loss: 0.3153465688228607, mean loss: 0.3406629332763289
Epoch: 58, step: 37, loss: 0.3126308023929596, mean loss: 0.3406625987241045
Epoch: 58, step: 38, loss: 0.31076014041900635, mean loss: 0.34066224185453253
Epoch: 58, step: 39, loss: 0.32497069239616394, mean loss: 0.3406620545866614
Epoch: 58, step: 40, loss: 0.3123813271522522, mean loss: 0.340661717079621
Epoch: 58, step: 41, loss: 0.3006024658679962, mean loss: 0.34066123901136774
Epoch: 58, step: 42, loss: 0.35892799496650696, mean loss: 0.34066145700475586
Epoch: 58, step: 43, loss: 0.3445793092250824, mean loss: 0.34066150375940074
Epoch: 58, step: 44, loss: 0.30728763341903687, mean loss: 0.3406611054889335
Epoch: 58, step: 45, loss: 0.31001999974250793, mean loss: 0.3406607398345534
Epoch: 58, step: 46, loss: 0.347039133310318, mean loss: 0.34066081594994235
Epoch: 58, step: 47, loss: 0.3437137007713318, mean loss: 0.34066085238054883
Epoch: 58, step: 48, loss: 0.3250003457069397, mean loss: 0.34066066550322427
Epoch: 58, step: 49, loss: 0.3098425567150116, mean loss: 0.34066029775413964
Epoch: 58, step: 50, loss: 0.31066998839378357, mean loss: 0.3406599398873645
Epoch: 58, step: 51, loss: 0.3642927408218384, mean loss: 0.3406602218882348
Epoch: 58, step: 52, loss: 0.342777281999588, mean loss: 0.34066024714997467
Epoch: 58, step: 53, loss: 0.33755847811698914, mean loss: 0.34066021013867437
Epoch: 58, step: 54, loss: 0.3563615381717682, mean loss: 0.3406603974897075
Epoch: 58, step: 55, loss: 0.3138037919998169, mean loss: 0.34066007703574736
Epoch: 58, step: 56, loss: 0.38394829630851746, mean loss: 0.3406605935461373
Epoch: 58, step: 57, loss: 0.3339681327342987, mean loss: 0.3406605136933654
Epoch: 58, step: 58, loss: 0.2902820110321045, mean loss: 0.3406599125968189
Epoch: 58, step: 59, loss: 0.39381036162376404, mean loss: 0.3406605467595763
Epoch: 58, step: 60, loss: 0.3036373555660248, mean loss: 0.3406601050239125
Epoch: 58, step: 61, loss: 0.3874204456806183, mean loss: 0.340660662929998
Epoch: 58, step: 62, loss: 0.3141760230064392, mean loss: 0.3406603469407369
Epoch: 58, step: 63, loss: 0.380359023809433, mean loss: 0.3406608205815318
Epoch: 58, step: 64, loss: 0.2921203076839447, mean loss: 0.34066024145661805
Epoch: 58, step: 65, loss: 0.32069388031959534, mean loss: 0.340660003245719
Epoch: 58, step: 66, loss: 0.34449347853660583, mean loss: 0.340660048980878
Epoch: 58, step: 67, loss: 0.45369526743888855, mean loss: 0.34066139752798436
Epoch: 58, step: 68, loss: 0.312349408864975, mean loss: 0.34066105976073435
Epoch: 58, step: 69, loss: 0.3185836672782898, mean loss: 0.34066079637650964
Epoch: 58, step: 70, loss: 0.308705598115921, mean loss: 0.3406604151541929
Epoch: 58, step: 71, loss: 0.32450199127197266, mean loss: 0.34066022238811294
Epoch: 58, step: 72, loss: 0.35252609848976135, mean loss: 0.3406603639434497
Epoch: 58, step: 73, loss: 0.34149301052093506, mean loss: 0.3406603738764845
Epoch: 58, step: 74, loss: 0.3264234960079193, mean loss: 0.3406602040400611
Epoch: 58, step: 75, loss: 0.32016995549201965, mean loss: 0.3406599596080271
Epoch: 58, step: 76, loss: 0.329881876707077, mean loss: 0.34065983103578
Epoch: 58, step: 77, loss: 0.3326476514339447, mean loss: 0.34065973545926087
Epoch: 58, step: 78, loss: 0.3530547618865967, mean loss: 0.3406598833165741
Epoch: 58, step: 79, loss: 0.3577386140823364, mean loss: 0.34066008704224887
Epoch: 58, step: 80, loss: 0.33824899792671204, mean loss: 0.34066005828162815
Epoch: 58, step: 81, loss: 0.3280359208583832, mean loss: 0.34065990769669335
Epoch: 58, step: 82, loss: 0.2987760603427887, mean loss: 0.3406594080981086
Epoch: 58, step: 83, loss: 0.2851879894733429, mean loss: 0.3406587464322535
Epoch: 58, step: 84, loss: 0.3217514455318451, mean loss: 0.34065852090771304
Epoch: 58, step: 85, loss: 0.3013356029987335, mean loss: 0.34065805187317133
Epoch: 58, step: 86, loss: 0.33013054728507996, mean loss: 0.34065792630506353
Epoch: 58, step: 87, loss: 0.33265554904937744, mean loss: 0.3406578308568615
Epoch: 58, step: 88, loss: 0.3191182613372803, mean loss: 0.34065757394712143
Epoch: 58, step: 89, loss: 0.37677013874053955, mean loss: 0.340658004668774
Epoch: 58, step: 90, loss: 0.337529718875885, mean loss: 0.34065796735754
Epoch: 58, step: 91, loss: 0.3208930492401123, mean loss: 0.3406577316231032
Epoch: 58, step: 92, loss: 0.2920900881290436, mean loss: 0.34065715236800753
Epoch: 58, step: 93, loss: 0.34841689467430115, mean loss: 0.34065724491556265
Epoch: 58, step: 94, loss: 0.34241828322410583, mean loss: 0.3406572659185599
Epoch: 58, step: 95, loss: 0.34354063868522644, mean loss: 0.3406573003066522
Epoch: 58, step: 96, loss: 0.307882696390152, mean loss: 0.340656909430149
Epoch: 58, step: 97, loss: 0.33470261096954346, mean loss: 0.3406568384188376
Epoch: 58, step: 98, loss: 0.30229678750038147, mean loss: 0.3406563809400846
Epoch: 58, step: 99, loss: 0.3198694586753845, mean loss: 0.34065613303994785
Epoch: 58, step: 100, loss: 0.33347398042678833, mean loss: 0.3406560473882405
Epoch: 58, step: 101, loss: 0.3386456072330475, mean loss: 0.34065602341275747
Epoch: 58, step: 102, loss: 0.3579410910606384, mean loss: 0.34065622954319275
Epoch: 58, step: 103, loss: 0.3240480124950409, mean loss: 0.34065603148679785
Epoch: 58, step: 104, loss: 0.33582890033721924, mean loss: 0.34065597392295527
Epoch: 58, step: 105, loss: 0.32060983777046204, mean loss: 0.34065573487437134
Epoch: 58, step: 106, loss: 0.37132617831230164, mean loss: 0.34065610061261575
Epoch: 58, step: 107, loss: 0.32792147994041443, mean loss: 0.3406559487568958
Epoch: 58, step: 108, loss: 0.3159964382648468, mean loss: 0.3406556547047084
Epoch: 58, step: 109, loss: 0.3268126845359802, mean loss: 0.3406554896362606
Epoch: 58, step: 110, loss: 0.3409220278263092, mean loss: 0.34065549281451785
Epoch: 58, step: 111, loss: 0.3486391007900238, mean loss: 0.34065558801159856
Epoch: 58, step: 112, loss: 0.31444257497787476, mean loss: 0.3406552754495878
Epoch: 58, step: 113, loss: 0.2954765260219574, mean loss: 0.34065473674797536
Epoch: 58, step: 114, loss: 0.3035115599632263, mean loss: 0.34065429386606966
Epoch: 58, step: 115, loss: 0.39031463861465454, mean loss: 0.34065488599113225
Epoch: 58, step: 116, loss: 0.37281784415245056, mean loss: 0.3406552694815538
Epoch: 58, step: 117, loss: 0.3004426956176758, mean loss: 0.34065479001841004
Epoch: 58, step: 118, loss: 0.30628329515457153, mean loss: 0.34065438020459043
Epoch: 58, step: 119, loss: 0.3184162378311157, mean loss: 0.3406541150607716
Epoch: 58, step: 120, loss: 0.35504254698753357, mean loss: 0.34065428661099545
Epoch: 58, step: 121, loss: 0.3289501965045929, mean loss: 0.3406541470672738
Epoch: 58, step: 122, loss: 0.3277607858181, mean loss: 0.3406539933461263
Epoch: 58, step: 123, loss: 0.31734544038772583, mean loss: 0.34065371545312995
Epoch: 58, step: 124, loss: 0.3700026571750641, mean loss: 0.3406540653576535
Epoch: 58, step: 125, loss: 0.32242345809936523, mean loss: 0.3406538480109445
Epoch: 58, step: 126, loss: 0.32614272832870483, mean loss: 0.3406536750103164
Epoch: 58, step: 127, loss: 0.36770811676979065, mean loss: 0.3406539975477718
Epoch: 58, step: 128, loss: 0.3576540946960449, mean loss: 0.34065420021699544
Epoch: 58, step: 129, loss: 0.39112088084220886, mean loss: 0.3406548018559719
Epoch: 58, step: 130, loss: 0.3442392647266388, mean loss: 0.3406548445876681
Epoch: 58, step: 131, loss: 0.4124765694141388, mean loss: 0.34065570079057717
Epoch: 58, step: 132, loss: 0.3498397171497345, mean loss: 0.3406558102739933
Epoch: 58, step: 133, loss: 0.3468366265296936, mean loss: 0.340655883955135
Epoch: 58, step: 134, loss: 0.3021489381790161, mean loss: 0.3406554249216045
Epoch: 58, step: 135, loss: 0.30647414922714233, mean loss: 0.34065501745837146
Epoch: 58, step: 136, loss: 0.33663833141326904, mean loss: 0.34065496957740915
Epoch: 58, step: 137, loss: 0.365487277507782, mean loss: 0.3406552655877552
Epoch: 58, step: 138, loss: 0.3289366662502289, mean loss: 0.3406551258993579
Epoch: 58, step: 139, loss: 0.28292354941368103, mean loss: 0.3406544377339013
Epoch: 58, step: 140, loss: 0.28918126225471497, mean loss: 0.3406538241764474
Epoch: 58, step: 141, loss: 0.3072231411933899, mean loss: 0.3406534256892733
Epoch: 58, step: 142, loss: 0.37076255679130554, mean loss: 0.34065378457992357
Epoch: 58, step: 143, loss: 0.3201844096183777, mean loss: 0.3406535405948115
Epoch: 58, step: 144, loss: 0.37067586183547974, mean loss: 0.34065389844218674
Epoch: 58, step: 145, loss: 0.3506105840206146, mean loss: 0.3406540171182646
Epoch: 58, step: 146, loss: 0.3460020422935486, mean loss: 0.3406540808618751
Epoch: 58, step: 147, loss: 0.3225577771663666, mean loss: 0.3406538651729157
Epoch: 58, step: 148, loss: 0.3365829288959503, mean loss: 0.34065381665220346
Epoch: 58, step: 149, loss: 0.34518134593963623, mean loss: 0.34065387061431746
Epoch: 58, step: 150, loss: 0.32309690117836, mean loss: 0.34065366136113895
Epoch: 58, step: 151, loss: 0.31004059314727783, mean loss: 0.3406532965028698
Epoch: 58, step: 152, loss: 0.3411789536476135, mean loss: 0.3406533027677783
Epoch: 58, step: 153, loss: 0.3545891344547272, mean loss: 0.3406534688563975
Epoch: 58, step: 154, loss: 0.31579554080963135, mean loss: 0.3406531726006853
Epoch: 58, step: 155, loss: 0.34792646765708923, mean loss: 0.34065325928246837
Epoch: 58, step: 156, loss: 0.3028380274772644, mean loss: 0.34065280861291203
Epoch: 58, step: 157, loss: 0.3111568093299866, mean loss: 0.3406524570934354
Epoch: 58, step: 158, loss: 0.30281901359558105, mean loss: 0.3406520062175848
Epoch: 58, step: 159, loss: 0.2808505892753601, mean loss: 0.3406512935493497
Epoch: 58, step: 160, loss: 0.28220707178115845, mean loss: 0.3406505970634444
Epoch: 58, step: 161, loss: 0.38221460580825806, mean loss: 0.3406510923801823
Epoch: 58, step: 162, loss: 0.3023522198200226, mean loss: 0.34065063597938916
Epoch: 58, step: 163, loss: 0.33955734968185425, mean loss: 0.34065062295104775
Epoch: 58, step: 164, loss: 0.3280303478240967, mean loss: 0.34065047256107756
Epoch: 58, step: 165, loss: 0.3513580858707428, mean loss: 0.3406506001572227
Epoch: 58, step: 166, loss: 0.34837713837623596, mean loss: 0.34065069222860367
Epoch: 58, step: 167, loss: 0.33864057064056396, mean loss: 0.34065066827577256
Epoch: 58, step: 168, loss: 0.27295300364494324, mean loss: 0.34064986159252725
Epoch: 58, step: 169, loss: 0.36414262652397156, mean loss: 0.3406501415282405
Epoch: 58, step: 170, loss: 0.31604939699172974, mean loss: 0.3406498483935273
Epoch: 58, step: 171, loss: 0.3516523241996765, mean loss: 0.34064997949399684
Epoch: 58, step: 172, loss: 0.3284362852573395, mean loss: 0.3406498339629365
Epoch: 58, step: 173, loss: 0.38947170972824097, mean loss: 0.3406504156882155
Epoch: 58, step: 174, loss: 0.36168286204338074, mean loss: 0.34065066629226853
Epoch: 58, step: 175, loss: 0.31940746307373047, mean loss: 0.3406504131800388
Epoch: 58, step: 176, loss: 0.33008432388305664, mean loss: 0.34065028728685176
Epoch: 58, step: 177, loss: 0.3394380509853363, mean loss: 0.340650272843431
Epoch: 58, step: 178, loss: 0.31270286440849304, mean loss: 0.34064993986266784
Epoch: 58, step: 179, loss: 0.32736241817474365, mean loss: 0.34064978154972775
Epoch: 58, step: 180, loss: 0.3468623161315918, mean loss: 0.34064985556751076
Epoch: 58, step: 181, loss: 0.3251892328262329, mean loss: 0.34064967136774976
Epoch: 58, step: 182, loss: 0.3261525630950928, mean loss: 0.3406494986494764
Epoch: 58, step: 183, loss: 0.3233223855495453, mean loss: 0.3406492922170386
Epoch: 58, step: 184, loss: 0.2928529381752014, mean loss: 0.34064872278575037
Epoch: 58, step: 185, loss: 0.4183817207813263, mean loss: 0.3406496488621162
Epoch: 58, step: 186, loss: 0.3329515755176544, mean loss: 0.34064955715178674
Epoch: 58, step: 187, loss: 0.34356221556663513, mean loss: 0.3406495918510769
Epoch: 58, step: 188, loss: 0.32684871554374695, mean loss: 0.3406494274394508
Epoch: 58, step: 189, loss: 0.3122219741344452, mean loss: 0.3406490887835538
Epoch: 58, step: 190, loss: 0.34669336676597595, mean loss: 0.3406491607881043
Epoch: 58, step: 191, loss: 0.3301621675491333, mean loss: 0.34064903585966105
Epoch: 58, step: 192, loss: 0.32862719893455505, mean loss: 0.3406488926487858
Epoch: 58, step: 193, loss: 0.31990841031074524, mean loss: 0.34064864557945146
Epoch: 58, step: 194, loss: 0.3118778169155121, mean loss: 0.3406483028533426
Epoch: 58, step: 195, loss: 0.301655113697052, mean loss: 0.34064783836116697
Epoch: 58, step: 196, loss: 0.3438061475753784, mean loss: 0.34064787598292795
Epoch: 58, step: 197, loss: 0.3378433585166931, mean loss: 0.3406478425759301
Epoch: 58, step: 198, loss: 0.2924148440361023, mean loss: 0.34064726803841966
Epoch: 58, step: 199, loss: 0.35087794065475464, mean loss: 0.3406473899017775
Epoch: 58, step: 200, loss: 0.3284527063369751, mean loss: 0.34064724464569895
Epoch: 58, step: 201, loss: 0.32651782035827637, mean loss: 0.3406470763461029
Epoch: 58, step: 202, loss: 0.3616853356361389, mean loss: 0.3406473269358151
Epoch: 58, step: 203, loss: 0.3234950304031372, mean loss: 0.34064712263479396
Epoch: 58, step: 204, loss: 0.3005925714969635, mean loss: 0.34064664555067786
Epoch: 58, step: 205, loss: 0.28559187054634094, mean loss: 0.34064598980881877
Epoch: 58, step: 206, loss: 0.3229149580001831, mean loss: 0.3406457786220275
Epoch: 58, step: 207, loss: 0.3470950424671173, mean loss: 0.3406458554355559
Epoch: 58, step: 208, loss: 0.30212801694869995, mean loss: 0.34064539667686455
Epoch: 58, step: 209, loss: 0.32945236563682556, mean loss: 0.34064526336618783
Epoch: 58, step: 210, loss: 0.34289371967315674, mean loss: 0.3406452901453204
Epoch: 58, step: 211, loss: 0.32912781834602356, mean loss: 0.34064515297377307
Epoch: 58, step: 212, loss: 0.3175613284111023, mean loss: 0.34064487805178695
Epoch: 58, step: 213, loss: 0.3504784107208252, mean loss: 0.34064499516505503
Epoch: 58, step: 214, loss: 0.3615458905696869, mean loss: 0.3406452440830276
Epoch: 58, step: 215, loss: 0.3291935622692108, mean loss: 0.34064510770152734
Epoch: 58, step: 216, loss: 0.3196384310722351, mean loss: 0.34064485752971835
Epoch: 58, step: 217, loss: 0.3184332549571991, mean loss: 0.34064459301140737
Epoch: 58, step: 218, loss: 0.35487911105155945, mean loss: 0.3406447625284792
Epoch: 58, step: 219, loss: 0.34676477313041687, mean loss: 0.34064483541004215
Epoch: 58, step: 220, loss: 0.3005036413669586, mean loss: 0.34064435738503357
Epoch: 58, step: 221, loss: 0.3616693615913391, mean loss: 0.3406446077601998
Epoch: 58, step: 222, loss: 0.3595714271068573, mean loss: 0.34064483314655697
Epoch: 58, step: 223, loss: 0.3186399042606354, mean loss: 0.34064457110824975
Epoch: 58, step: 224, loss: 0.37525811791419983, mean loss: 0.34064498328714166
Epoch: 58, step: 225, loss: 0.3629089295864105, mean loss: 0.34064524840355664
Epoch: 58, step: 226, loss: 0.33054643869400024, mean loss: 0.34064512814956804
Epoch: 58, step: 227, loss: 0.3876258432865143, mean loss: 0.3406456875769929
Epoch: 58, step: 228, loss: 0.330463171005249, mean loss: 0.3406455663291324
Epoch: 58, step: 229, loss: 0.36776047945022583, mean loss: 0.3406458891949027
Epoch: 58, step: 230, loss: 0.41079437732696533, mean loss: 0.3406467244649946
Epoch: 58, step: 231, loss: 0.32678496837615967, mean loss: 0.34064655941265026
Epoch: 58, step: 232, loss: 0.326272189617157, mean loss: 0.3406463882586371
Epoch: 58, step: 233, loss: 0.37045592069625854, mean loss: 0.340646743193179
Epoch: 58, step: 234, loss: 0.3396487534046173, mean loss: 0.3406467313105092
Epoch: 58, step: 235, loss: 0.3326800763607025, mean loss: 0.3406466364558282
Epoch: 58, step: 236, loss: 0.39999350905418396, mean loss: 0.3406473430587476
Epoch: 58, step: 237, loss: 0.33520379662513733, mean loss: 0.3406472782469077
Epoch: 58, step: 238, loss: 0.3165045976638794, mean loss: 0.3406469908032461
Epoch: 58, step: 239, loss: 0.3251035213470459, mean loss: 0.3406468057443184
Epoch: 58, step: 240, loss: 0.34779179096221924, mean loss: 0.3406468908107551
Epoch: 58, step: 241, loss: 0.33359190821647644, mean loss: 0.34064680681686754
Epoch: 58, step: 242, loss: 0.34718114137649536, mean loss: 0.3406468846111953
Epoch: 58, step: 243, loss: 0.32565850019454956, mean loss: 0.3406467061695503
Epoch: 58, step: 244, loss: 0.3179561197757721, mean loss: 0.34064643603387407
Epoch: 58, step: 245, loss: 0.32847467064857483, mean loss: 0.34064629112845507
Epoch: 58, step: 246, loss: 0.302663654088974, mean loss: 0.3406458389488215
Epoch: 58, step: 247, loss: 0.2961982786655426, mean loss: 0.34064530981119906
Epoch: 58, step: 248, loss: 0.28866928815841675, mean loss: 0.34064469105640266
Epoch: 58, step: 249, loss: 0.33613890409469604, mean loss: 0.3406446374173588
Epoch: 58, step: 250, loss: 0.3493427634239197, mean loss: 0.34064474096277986
Epoch: 58, step: 251, loss: 0.3383859395980835, mean loss: 0.34064471407356783
Epoch: 58, step: 252, loss: 0.37752828001976013, mean loss: 0.3406451531375039
Epoch: 58, step: 253, loss: 0.3319544196128845, mean loss: 0.34064504968378007
Epoch: 58, step: 254, loss: 0.3883114755153656, mean loss: 0.34064561709394625
Epoch: 58, step: 255, loss: 0.30061665177345276, mean loss: 0.3406451406040248
Epoch: 58, step: 256, loss: 0.3012974262237549, mean loss: 0.3406446722290366
Epoch: 58, step: 257, loss: 0.3519853949546814, mean loss: 0.3406448072215699
Epoch: 58, step: 258, loss: 0.3521801829338074, mean loss: 0.34064494452949046
Epoch: 58, step: 259, loss: 0.3265596628189087, mean loss: 0.34064477687151645
Epoch: 58, step: 260, loss: 0.32873767614364624, mean loss: 0.34064463514225163
Epoch: 58, step: 261, loss: 0.33786842226982117, mean loss: 0.34064460209760583
Epoch: 58, step: 262, loss: 0.351970911026001, mean loss: 0.34064473691054314
Epoch: 58, step: 263, loss: 0.3566708564758301, mean loss: 0.34064492766134735
Epoch: 58, step: 264, loss: 0.3150540292263031, mean loss: 0.34064462306943816
Epoch: 58, step: 265, loss: 0.3313961923122406, mean loss: 0.34064451299265985
Epoch: 58, step: 266, loss: 0.3628406822681427, mean loss: 0.3406447771730152
Epoch: 58, step: 267, loss: 0.3376246690750122, mean loss: 0.3406447412279057
Epoch: 58, step: 268, loss: 0.315577894449234, mean loss: 0.34064444288764817
Epoch: 58, step: 269, loss: 0.3111739158630371, mean loss: 0.34064409213990327
Epoch: 58, step: 270, loss: 0.32237446308135986, mean loss: 0.3406438747038553
Epoch: 58, step: 271, loss: 0.30887189507484436, mean loss: 0.3406434965740397
Epoch: 58, step: 272, loss: 0.3521750271320343, mean loss: 0.34064363381332036
Epoch: 58, step: 273, loss: 0.3468192517757416, mean loss: 0.3406437073098329
Epoch: 58, step: 274, loss: 0.3177354037761688, mean loss: 0.34064343467956487
Epoch: 58, step: 275, loss: 0.31461572647094727, mean loss: 0.34064312492914584
Epoch: 58, step: 276, loss: 0.330437034368515, mean loss: 0.34064300347000004
Epoch: 58, step: 277, loss: 0.3051168918609619, mean loss: 0.3406425806910924
Epoch: 58, step: 278, loss: 0.33488985896110535, mean loss: 0.3406425122315747
Epoch: 58, step: 279, loss: 0.3350647985935211, mean loss: 0.340642445855508
Epoch: 58, step: 280, loss: 0.36811360716819763, mean loss: 0.34064277276471405
Epoch: 58, step: 281, loss: 0.30814096331596375, mean loss: 0.3406423859949608
Epoch: 58, step: 282, loss: 0.32391148805618286, mean loss: 0.34064218690056036
Epoch: 58, step: 283, loss: 0.2997047007083893, mean loss: 0.3406416997583095
Epoch: 58, step: 284, loss: 0.31839296221733093, mean loss: 0.3406414350090021
Epoch: 58, step: 285, loss: 0.3196495473384857, mean loss: 0.3406411852185779
Epoch: 58, step: 286, loss: 0.34253543615341187, mean loss: 0.3406412077587192
Epoch: 58, step: 287, loss: 0.3519682288169861, mean loss: 0.3406413425400264
Epoch: 58, step: 288, loss: 0.3033232092857361, mean loss: 0.3406408984932724
Epoch: 58, step: 289, loss: 0.39291661977767944, mean loss: 0.3406415205122782
Epoch: 58, step: 290, loss: 0.3194037079811096, mean loss: 0.3406412678105359
Epoch: 58, step: 291, loss: 0.3415331244468689, mean loss: 0.3406412784223182
Epoch: 58, step: 292, loss: 0.37443268299102783, mean loss: 0.34064168048555304
Epoch: 58, step: 293, loss: 0.3256639838218689, mean loss: 0.34064150227723067
Epoch: 58, step: 294, loss: 0.350104421377182, mean loss: 0.34064161486803224
Epoch: 58, step: 295, loss: 0.29946237802505493, mean loss: 0.34064112491899307
Epoch: 58, step: 296, loss: 0.31744205951690674, mean loss: 0.3406408489006537
Epoch: 58, step: 297, loss: 0.32213374972343445, mean loss: 0.3406406287091109
Epoch: 58, step: 298, loss: 0.3497208058834076, mean loss: 0.3406407367408675
Epoch: 58, step: 299, loss: 0.3277985155582428, mean loss: 0.34064058395186564
Epoch: 58, step: 300, loss: 0.3662413954734802, mean loss: 0.3406408885312563
Epoch: 58, step: 301, loss: 0.32897675037384033, mean loss: 0.34064074976167774
Epoch: 58, step: 302, loss: 0.35368040204048157, mean loss: 0.3406409048940587
Epoch: 58, step: 303, loss: 0.3404005169868469, mean loss: 0.34064090203420444
Epoch: 58, step: 304, loss: 0.32702216506004333, mean loss: 0.34064074001632405
Epoch: 58, step: 305, loss: 0.34776580333709717, mean loss: 0.34064082477997915
Epoch: 58, step: 306, loss: 0.31470638513565063, mean loss: 0.3406405162533533
Epoch: 58, step: 307, loss: 0.31115370988845825, mean loss: 0.34064016547050335
Epoch: 58, step: 308, loss: 0.30603229999542236, mean loss: 0.340639753771077
Epoch: 58, step: 309, loss: 0.32319411635398865, mean loss: 0.3406395462380964
Epoch: 58, step: 310, loss: 0.33849233388900757, mean loss: 0.3406395206952018
Epoch: 58, step: 311, loss: 0.3569071292877197, mean loss: 0.3406397142097692
Epoch: 58, step: 312, loss: 0.3540516793727875, mean loss: 0.3406398737525654
Epoch: 58, step: 313, loss: 0.3047840893268585, mean loss: 0.3406394472331113
Epoch: 58, step: 314, loss: 0.30901065468788147, mean loss: 0.34063907099995744
Epoch: 58, step: 315, loss: 0.3545835614204407, mean loss: 0.3406392368715188
Epoch: 58, step: 316, loss: 0.35097968578338623, mean loss: 0.34063935987106575
Epoch: 58, step: 317, loss: 0.3091476559638977, mean loss: 0.34063898528198633
Epoch: 58, step: 318, loss: 0.2848719358444214, mean loss: 0.3406383219492148
Epoch: 58, step: 319, loss: 0.30741414427757263, mean loss: 0.340637926762022
Epoch: 58, step: 320, loss: 0.3351369798183441, mean loss: 0.34063786133142065
Epoch: 58, step: 321, loss: 0.3475292921066284, mean loss: 0.34063794330005276
Epoch: 58, step: 322, loss: 0.32261577248573303, mean loss: 0.3406377289417915
Epoch: 58, step: 323, loss: 0.3246717154979706, mean loss: 0.340637539042017
Epoch: 58, step: 324, loss: 0.34489595890045166, mean loss: 0.3406375896910632
Epoch: 58, step: 325, loss: 0.3550901710987091, mean loss: 0.3406377615859871
Epoch: 58, step: 326, loss: 0.3044355809688568, mean loss: 0.3406373310125904
Epoch: 58, step: 327, loss: 0.30733156204223633, mean loss: 0.3406369348925979
Epoch: 58, step: 328, loss: 0.33381134271621704, mean loss: 0.3406368537138277
Epoch: 58, step: 329, loss: 0.3952596187591553, mean loss: 0.34063750335067083
Epoch: 58, step: 330, loss: 0.39221614599227905, mean loss: 0.3406381167760082
Epoch: 58, step: 331, loss: 0.3177497386932373, mean loss: 0.3406378445675252
Epoch: 58, step: 332, loss: 0.3605850040912628, mean loss: 0.3406380817936598
Epoch: 58, step: 333, loss: 0.3852870762348175, mean loss: 0.3406386127856732
Epoch: 58, step: 334, loss: 0.3228803873062134, mean loss: 0.3406384015969582
Epoch: 58, step: 335, loss: 0.34080827236175537, mean loss: 0.34063840361711284
Epoch: 58, step: 336, loss: 0.3235152065753937, mean loss: 0.3406381999852818
Epoch: 58, step: 337, loss: 0.2896547317504883, mean loss: 0.3406375936888347
Epoch: 58, step: 338, loss: 0.3267935812473297, mean loss: 0.3406374290575134
Epoch: 58, step: 339, loss: 0.31293419003486633, mean loss: 0.34063709961786365
Epoch: 58, step: 340, loss: 0.31068605184555054, mean loss: 0.3406367434520975
Epoch: 58, step: 341, loss: 0.32664090394973755, mean loss: 0.34063657702120465
Epoch: 58, step: 342, loss: 0.3665429651737213, mean loss: 0.3406368850821851
Epoch: 58, step: 343, loss: 0.3391719162464142, mean loss: 0.3406368676619887
Epoch: 58, step: 344, loss: 0.2912711203098297, mean loss: 0.34063628065237656
Epoch: 58, step: 345, loss: 0.3060781955718994, mean loss: 0.3406358697260159
Epoch: 58, step: 346, loss: 0.3285728096961975, mean loss: 0.3406357262872113
Epoch: 58, step: 347, loss: 0.337650865316391, mean loss: 0.34063569079540423
Epoch: 58, step: 348, loss: 0.3086901903152466, mean loss: 0.3406353109485477
Epoch: 58, step: 349, loss: 0.3495691120624542, mean loss: 0.34063541717433443
Epoch: 58, step: 350, loss: 0.3315791189670563, mean loss: 0.340635309493298
Epoch: 58, step: 351, loss: 0.37733331322669983, mean loss: 0.3406357458340634
Epoch: 58, step: 352, loss: 0.34391331672668457, mean loss: 0.34063578480405204
Epoch: 58, step: 353, loss: 0.3379902243614197, mean loss: 0.34063575334897817
Epoch: 58, step: 354, loss: 0.34573590755462646, mean loss: 0.3406358139878573
Epoch: 58, step: 355, loss: 0.34800201654434204, mean loss: 0.34063590156814166
Epoch: 58, step: 356, loss: 0.3344002068042755, mean loss: 0.3406358274298834
Epoch: 58, step: 357, loss: 0.3077494204044342, mean loss: 0.3406354364370523
Epoch: 58, step: 358, loss: 0.3887270390987396, mean loss: 0.3406360082005869
Epoch: 58, step: 359, loss: 0.3238801062107086, mean loss: 0.3406358089911758
Epoch: 58, step: 360, loss: 0.3168052136898041, mean loss: 0.34063552567474076
Epoch: 58, step: 361, loss: 0.29635512828826904, mean loss: 0.3406349992415978
Epoch: 58, step: 362, loss: 0.3389589786529541, mean loss: 0.3406349793162505
Epoch: 58, step: 363, loss: 0.39337968826293945, mean loss: 0.3406356063635298
Epoch: 58, step: 364, loss: 0.364475816488266, mean loss: 0.34063588978079534
Epoch: 58, step: 365, loss: 0.33639848232269287, mean loss: 0.3406358394062327
Epoch: 58, step: 366, loss: 0.34213969111442566, mean loss: 0.34063585728390255
Epoch: 58, step: 367, loss: 0.31945329904556274, mean loss: 0.3406356054703239
Epoch: 58, step: 368, loss: 0.3079763650894165, mean loss: 0.3406352172290954
Epoch: 58, step: 369, loss: 0.35562601685523987, mean loss: 0.34063539543217697
Epoch: 58, step: 370, loss: 0.33944547176361084, mean loss: 0.3406353812871314
Epoch: 58, step: 371, loss: 0.3430386185646057, mean loss: 0.34063540985492746
Epoch: 58, step: 372, loss: 0.3563383221626282, mean loss: 0.34063559651658937
Epoch: 58, step: 373, loss: 0.3677383363246918, mean loss: 0.34063591868500115
Epoch: 58, step: 374, loss: 0.3197612464427948, mean loss: 0.3406356705521515
Epoch: 58, step: 375, loss: 0.3271905183792114, mean loss: 0.340635510734348
Epoch: 58, step: 376, loss: 0.3350219130516052, mean loss: 0.34063544400827633
Epoch: 58, step: 377, loss: 0.32033833861351013, mean loss: 0.34063520274944603
Epoch: 58, step: 378, loss: 0.3481998145580292, mean loss: 0.34063529266412446
Epoch: 58, step: 379, loss: 0.328823059797287, mean loss: 0.34063515226293506
Epoch: 58, step: 380, loss: 0.2971690893173218, mean loss: 0.3406346356278104
Epoch: 58, step: 381, loss: 0.3388075828552246, mean loss: 0.3406346139118243
Epoch: 58, step: 382, loss: 0.36013907194137573, mean loss: 0.34063484573518
Epoch: 58, step: 383, loss: 0.31243234872817993, mean loss: 0.3406345105338749
Epoch: 58, step: 384, loss: 0.35229310393333435, mean loss: 0.3406346491006576
Epoch: 58, step: 385, loss: 0.30994996428489685, mean loss: 0.3406342844059321
Epoch: 58, step: 386, loss: 0.32753628492355347, mean loss: 0.3406341287349652
Epoch: 58, step: 387, loss: 0.3053561747074127, mean loss: 0.3406337094581167
Epoch: 58, step: 388, loss: 0.32169273495674133, mean loss: 0.34063348434818813
Epoch: 58, step: 389, loss: 0.3242230713367462, mean loss: 0.34063328931582604
Epoch: 58, step: 390, loss: 0.3578788936138153, mean loss: 0.34063349427172607
Epoch: 58, step: 391, loss: 0.3515456020832062, mean loss: 0.3406336239554565
Epoch: 58, step: 392, loss: 0.30781617760658264, mean loss: 0.34063323394480405
Epoch: 58, step: 393, loss: 0.33800947666168213, mean loss: 0.3406332027637939
Epoch: 58, step: 394, loss: 0.3472272753715515, mean loss: 0.3406332811275217
Epoch: 58, step: 395, loss: 0.31250569224357605, mean loss: 0.34063294686421325
Epoch: 58, step: 396, loss: 0.30734676122665405, mean loss: 0.34063255130175096
Epoch: 58, step: 397, loss: 0.31033235788345337, mean loss: 0.34063219122815125
Epoch: 58, step: 398, loss: 0.33774784207344055, mean loss: 0.3406321569522763
Epoch: 58, step: 399, loss: 0.32693347334861755, mean loss: 0.3406319941672729
Epoch: 58, step: 400, loss: 0.3266448974609375, mean loss: 0.3406318279569571
Epoch: 58, step: 401, loss: 0.33982643485069275, mean loss: 0.3406318183864898
Epoch: 58, step: 402, loss: 0.3402859568595886, mean loss: 0.34063181427667427
Epoch: 58, step: 403, loss: 0.3511616885662079, mean loss: 0.3406319393999488
Epoch: 58, step: 404, loss: 0.32995593547821045, mean loss: 0.340631812541768
Epoch: 58, step: 405, loss: 0.3382020592689514, mean loss: 0.3406317836704394
Epoch: 58, step: 406, loss: 0.3225231468677521, mean loss: 0.3406315684987192
Epoch: 58, step: 407, loss: 0.3009219169616699, mean loss: 0.34063109666350605
Epoch: 58, step: 408, loss: 0.33223286271095276, mean loss: 0.34063099687579024
Epoch: 58, step: 409, loss: 0.3111235499382019, mean loss: 0.3406306462728229
Epoch: 58, step: 410, loss: 0.29648593068122864, mean loss: 0.3406301217583024
Epoch: 58, step: 411, loss: 0.3265681564807892, mean loss: 0.340629954680154
Epoch: 58, step: 412, loss: 0.35835522413253784, mean loss: 0.34063016528158513
Epoch: 58, step: 413, loss: 0.3211172819137573, mean loss: 0.3406299334435108
Epoch: 58, step: 414, loss: 0.3512799143791199, mean loss: 0.3406300599774366
Epoch: 58, step: 415, loss: 0.2992858588695526, mean loss: 0.3406295687669872
Epoch: 58, step: 416, loss: 0.35608503222465515, mean loss: 0.34062975239116544
Epoch: 58, step: 417, loss: 0.36146146059036255, mean loss: 0.3406299998868076
Epoch: 58, step: 418, loss: 0.35800135135650635, mean loss: 0.3406302062684767
Epoch: 58, step: 419, loss: 0.30573514103889465, mean loss: 0.340629791699912
Epoch: 58, step: 420, loss: 0.36545273661613464, mean loss: 0.3406300866037994
Epoch: 58, step: 421, loss: 0.3512929379940033, mean loss: 0.3406302132801055
Epoch: 58, step: 422, loss: 0.3061387836933136, mean loss: 0.3406298035215123
Epoch: 58, step: 423, loss: 0.4011296331882477, mean loss: 0.34063052225166895
Epoch: 58, step: 424, loss: 0.33158406615257263, mean loss: 0.3406304147822165
Epoch: 58, step: 425, loss: 0.30693763494491577, mean loss: 0.3406300145258569
Epoch: 58, step: 426, loss: 0.34995394945144653, mean loss: 0.3406301252890511
Epoch: 58, step: 427, loss: 0.3308200538158417, mean loss: 0.3406300087522078
Epoch: 58, step: 428, loss: 0.2991214692592621, mean loss: 0.3406295156654127
Epoch: 58, step: 429, loss: 0.36978939175605774, mean loss: 0.3406298620562812
Epoch: 58, step: 430, loss: 0.3522164523601532, mean loss: 0.3406299996920307
Epoch: 58, step: 431, loss: 0.3339346945285797, mean loss: 0.3406299201602294
Epoch: 58, step: 432, loss: 0.30208247900009155, mean loss: 0.34062946227056784
Epoch: 58, step: 433, loss: 0.316542387008667, mean loss: 0.3406291761532174
Epoch: 58, step: 434, loss: 0.3117811679840088, mean loss: 0.34062883348738815
Epoch: 58, step: 435, loss: 0.32543203234672546, mean loss: 0.3406286529770881
Epoch: 58, step: 436, loss: 0.35217398405075073, mean loss: 0.34062879011294994
Epoch: 58, step: 437, loss: 0.3246387243270874, mean loss: 0.3406286001846237
Epoch: 58, step: 438, loss: 0.30826467275619507, mean loss: 0.3406282157738503
Epoch: 58, step: 439, loss: 0.3136560618877411, mean loss: 0.3406278954090426
Epoch: 58, step: 440, loss: 0.3559439480304718, mean loss: 0.34062807732502876
Epoch: 58, step: 441, loss: 0.3520040810108185, mean loss: 0.34062821244158914
Epoch: 58, step: 442, loss: 0.33349043130874634, mean loss: 0.3406281276648075
Epoch: 58, step: 443, loss: 0.34734418988227844, mean loss: 0.3406282074318061
Epoch: 58, step: 444, loss: 0.29141074419021606, mean loss: 0.34062762288053655
Epoch: 58, step: 445, loss: 0.3288205564022064, mean loss: 0.3406274826507629
Epoch: 58, step: 446, loss: 0.3095792829990387, mean loss: 0.3406271139029197
Epoch: 58, step: 447, loss: 0.30586132407188416, mean loss: 0.34062670100755355
Epoch: 58, step: 448, loss: 0.32351091504096985, mean loss: 0.34062649773459996
Epoch: 58, step: 449, loss: 0.3286120891571045, mean loss: 0.3406263550490512
Epoch: 58, step: 450, loss: 0.31339967250823975, mean loss: 0.340626031703297
Epoch: 58, step: 451, loss: 0.3719210624694824, mean loss: 0.3406264033605908
Epoch: 58, step: 452, loss: 0.3083462119102478, mean loss: 0.34062602000815984
Epoch: 58, step: 453, loss: 0.28109556436538696, mean loss: 0.34062531304599986
Epoch: 58, step: 454, loss: 0.3341710567474365, mean loss: 0.3406252363984967
Epoch: 58, step: 455, loss: 0.30997639894485474, mean loss: 0.34062487243263295
Epoch: 58, step: 456, loss: 0.299988329410553, mean loss: 0.34062438986493804
Epoch: 58, step: 457, loss: 0.3291238844394684, mean loss: 0.34062425329558255
Epoch: 58, step: 458, loss: 0.31044015288352966, mean loss: 0.3406238948614063
Epoch: 58, step: 459, loss: 0.32225197553634644, mean loss: 0.34062367669868215
Epoch: 58, step: 460, loss: 0.29554468393325806, mean loss: 0.3406231414013674
Epoch: 58, step: 461, loss: 0.30611640214920044, mean loss: 0.340622731650741
Epoch: 58, step: 462, loss: 0.3310379683971405, mean loss: 0.34062261783772363
Epoch: 58, step: 463, loss: 0.33192509412765503, mean loss: 0.3406225145613425
Epoch: 58, step: 464, loss: 0.3251045048236847, mean loss: 0.340622330299142
Epoch: 58, step: 465, loss: 0.31352412700653076, mean loss: 0.34062200853653435
Epoch: 58, step: 466, loss: 0.32812798023223877, mean loss: 0.3406218601848761
Epoch: 58, step: 467, loss: 0.3486867845058441, mean loss: 0.3406219559450794
Epoch: 58, step: 468, loss: 0.30047211050987244, mean loss: 0.3406214792249569
Epoch: 58, step: 469, loss: 0.32009798288345337, mean loss: 0.3406212355416397
Epoch: 58, step: 470, loss: 0.36106300354003906, mean loss: 0.34062147825168326
Epoch: 58, step: 471, loss: 0.3430536091327667, mean loss: 0.34062150712861716
Epoch: 58, step: 472, loss: 0.34151491522789, mean loss: 0.3406215177360152
Epoch: 58, step: 473, loss: 0.3285950720310211, mean loss: 0.3406213749482097
Epoch: 58, step: 474, loss: 0.3421138525009155, mean loss: 0.34062139266791425
Epoch: 58, step: 475, loss: 0.31262433528900146, mean loss: 0.34062106027183003
Epoch: 58, step: 476, loss: 0.37416425347328186, mean loss: 0.34062145850988584
Epoch: 58, step: 477, loss: 0.31668779253959656, mean loss: 0.34062117436331135
Epoch: 58, step: 478, loss: 0.314527302980423, mean loss: 0.3406208645739062
Epoch: 58, step: 479, loss: 0.34923192858695984, mean loss: 0.34062096680422266
Epoch: 58, step: 480, loss: 0.33567118644714355, mean loss: 0.34062090804126327
Epoch: 58, step: 481, loss: 0.298425555229187, mean loss: 0.34062040711108293
Epoch: 58, step: 482, loss: 0.34203052520751953, mean loss: 0.3406204238513702
Epoch: 58, step: 483, loss: 0.3551006019115448, mean loss: 0.3406205957514849
Epoch: 58, step: 484, loss: 0.3149176239967346, mean loss: 0.34062029062461957
Epoch: 58, step: 485, loss: 0.33604952692985535, mean loss: 0.34062023636450306
Epoch: 58, step: 486, loss: 0.31762972474098206, mean loss: 0.3406199634444586
Epoch: 58, step: 487, loss: 0.3220982551574707, mean loss: 0.3406197435761266
Epoch: 58, step: 488, loss: 0.3559204041957855, mean loss: 0.34061992520574425
Epoch: 58, step: 489, loss: 0.3522909879684448, mean loss: 0.34062006374783443
Epoch: 58, step: 490, loss: 0.32577723264694214, mean loss: 0.34061988755715866
Epoch: 58, step: 491, loss: 0.34793075919151306, mean loss: 0.34061997433926344
Epoch: 58, step: 492, loss: 0.32265573740005493, mean loss: 0.3406197611012441
Epoch: 58, step: 493, loss: 0.3312613070011139, mean loss: 0.34061965001639616
Epoch: 58, step: 494, loss: 0.2991947829723358, mean loss: 0.34061915830907075
Epoch: 58, step: 495, loss: 0.35495951771736145, mean loss: 0.3406193285250926
Epoch: 58, step: 496, loss: 0.29937732219696045, mean loss: 0.34061883899991924
Epoch: 58, step: 497, loss: 0.31830722093582153, mean loss: 0.3406185741735921
Epoch: 58, step: 498, loss: 0.33107060194015503, mean loss: 0.3406184608458899
Epoch: 58, step: 499, loss: 0.3314535319805145, mean loss: 0.34061835206593377
Epoch: 58, step: 500, loss: 0.32311058044433594, mean loss: 0.3406181442659549
Epoch: 58, step: 501, loss: 0.37661391496658325, mean loss: 0.3406185714951749
Epoch: 58, step: 502, loss: 0.31183964014053345, mean loss: 0.3406182299257564
Epoch: 58, step: 503, loss: 0.3111329674720764, mean loss: 0.34061787997723697
Epoch: 58, step: 504, loss: 0.3199532628059387, mean loss: 0.34061763472025924
Epoch: 58, step: 505, loss: 0.30228742957115173, mean loss: 0.3406171798055313
Epoch: 58, step: 506, loss: 0.3175462782382965, mean loss: 0.3406169059961867
Epoch: 58, step: 507, loss: 0.2875794768333435, mean loss: 0.3406162765465171
Epoch: 58, step: 508, loss: 0.33433493971824646, mean loss: 0.3406162020003234
Epoch: 58, step: 509, loss: 0.3277697265148163, mean loss: 0.3406160495416174
Epoch: 58, step: 510, loss: 0.34443917870521545, mean loss: 0.34061609491300415
Epoch: 58, step: 511, loss: 0.3849235773086548, mean loss: 0.3406166207304635
Epoch: 58, step: 512, loss: 0.3421996533870697, mean loss: 0.34061663951682386
Epoch: 58, step: 513, loss: 0.32756444811820984, mean loss: 0.3406164846240866
Epoch: 58, step: 514, loss: 0.3503791093826294, mean loss: 0.34061660047756137
Epoch: 58, step: 515, loss: 0.32751789689064026, mean loss: 0.34061644503654476
Epoch: 58, step: 516, loss: 0.3146530091762543, mean loss: 0.3406161369346821
Epoch: 58, step: 517, loss: 0.3663703203201294, mean loss: 0.3406164425497692
Epoch: 58, step: 518, loss: 0.3138379752635956, mean loss: 0.34061612478366593
Epoch: 58, step: 519, loss: 0.3739216923713684, mean loss: 0.340616519998774
Epoch: 58, step: 520, loss: 0.31343552470207214, mean loss: 0.34061619746373556
Epoch: 58, step: 521, loss: 0.3561064898967743, mean loss: 0.3406163812724124
Epoch: 58, step: 522, loss: 0.3070230484008789, mean loss: 0.3406159826567746
Epoch: 58, step: 523, loss: 0.3626873791217804, mean loss: 0.3406162445509849
Epoch: 58, step: 524, loss: 0.3349402844905853, mean loss: 0.34061617720212267
Epoch: 58, step: 525, loss: 0.3357056975364685, mean loss: 0.34061611893686167
Epoch: 58, step: 526, loss: 0.3695656955242157, mean loss: 0.3406164624337777
Epoch: 58, step: 527, loss: 0.3374544084072113, mean loss: 0.34061642491533883
Epoch: 58, step: 528, loss: 0.31396687030792236, mean loss: 0.3406161087164968
Epoch: 58, step: 529, loss: 0.36783528327941895, mean loss: 0.34061643167008787
Epoch: 58, step: 530, loss: 0.3313627541065216, mean loss: 0.34061632187715735
Epoch: 58, step: 531, loss: 0.33095619082450867, mean loss: 0.3406162072631019
Epoch: 58, step: 532, loss: 0.3197118639945984, mean loss: 0.340615959243368
Epoch: 58, step: 533, loss: 0.3328855633735657, mean loss: 0.34061586752711775
Epoch: 58, step: 534, loss: 0.3772032856941223, mean loss: 0.3406163016085083
Epoch: 58, step: 535, loss: 0.33011576533317566, mean loss: 0.34061617702925295
Epoch: 58, step: 536, loss: 0.3310912847518921, mean loss: 0.34061606402646166
Epoch: 58, step: 537, loss: 0.307167649269104, mean loss: 0.3406156672010404
Epoch: 58, step: 538, loss: 0.328226774930954, mean loss: 0.3406155202234002
Epoch: 58, step: 539, loss: 0.3189994692802429, mean loss: 0.34061526378090334
Epoch: 58, step: 540, loss: 0.3158620595932007, mean loss: 0.34061497012420366
Epoch: 58, step: 541, loss: 0.3570489287376404, mean loss: 0.3406151650842081
Epoch: 58, step: 542, loss: 0.31260010600090027, mean loss: 0.34061483273876547
Epoch: 58, step: 543, loss: 0.3332963287830353, mean loss: 0.3406147459196524
Epoch: 58, step: 544, loss: 0.32391610741615295, mean loss: 0.34061454782673684
Epoch: 58, step: 545, loss: 0.3376578986644745, mean loss: 0.3406145127529609
Epoch: 58, step: 546, loss: 0.31075412034988403, mean loss: 0.3406141585329535
Epoch: 58, step: 547, loss: 0.30995818972587585, mean loss: 0.3406137948797055
Epoch: 58, step: 548, loss: 0.3449253439903259, mean loss: 0.3406138460244026
Epoch: 58, step: 549, loss: 0.41791588068008423, mean loss: 0.34061476299001026
Epoch: 58, step: 550, loss: 0.3514045178890228, mean loss: 0.34061489097780306
Epoch: 58, step: 551, loss: 0.3247455954551697, mean loss: 0.34061470273886396
Epoch: 58, step: 552, loss: 0.31515777111053467, mean loss: 0.34061440077656485
Epoch: 58, step: 553, loss: 0.3294212520122528, mean loss: 0.34061426800844913
Epoch: 58, step: 554, loss: 0.329273521900177, mean loss: 0.3406141334911954
Epoch: 58, step: 555, loss: 0.27357345819473267, mean loss: 0.3406133383036059
Epoch: 58, step: 556, loss: 0.3071305453777313, mean loss: 0.3406129411598499
Epoch: 58, step: 557, loss: 0.332302987575531, mean loss: 0.34061284259558017
Epoch: 58, step: 558, loss: 0.37528446316719055, mean loss: 0.3406132538304199
Epoch: 58, step: 559, loss: 0.33643248677253723, mean loss: 0.34061320424356323
Epoch: 58, step: 560, loss: 0.3649716079235077, mean loss: 0.3406134931480463
Epoch: 58, step: 561, loss: 0.3541024625301361, mean loss: 0.3406136531329762
Epoch: 58, step: 562, loss: 0.367083340883255, mean loss: 0.3406139670710388
Epoch: 58, step: 563, loss: 0.35011357069015503, mean loss: 0.3406140797377168
Epoch: 58, step: 564, loss: 0.2892574071884155, mean loss: 0.3406134706473489
Epoch: 58, step: 565, loss: 0.32660531997680664, mean loss: 0.3406133045125892
Epoch: 58, step: 566, loss: 0.3589443564414978, mean loss: 0.3406135219137909
Epoch: 58, step: 567, loss: 0.3353639245033264, mean loss: 0.3406134596557571
Epoch: 58, step: 568, loss: 0.32933634519577026, mean loss: 0.34061332591547344
Epoch: 58, step: 569, loss: 0.32208266854286194, mean loss: 0.3406131061548253
Epoch: 58, step: 570, loss: 0.34204694628715515, mean loss: 0.34061312315896575
Epoch: 58, step: 571, loss: 0.3525967299938202, mean loss: 0.3406132652727985
Epoch: 58, step: 572, loss: 0.33715003728866577, mean loss: 0.3406132242027957
Epoch: 58, step: 573, loss: 0.30781200528144836, mean loss: 0.3406128352217113
Epoch: 58, step: 574, loss: 0.3536595106124878, mean loss: 0.340612989936991
Epoch: 58, step: 575, loss: 0.3301752507686615, mean loss: 0.3406128661615052
Epoch: 58, step: 576, loss: 0.3192981481552124, mean loss: 0.34061261340482596
Epoch: 58, step: 577, loss: 0.400813490152359, mean loss: 0.3406133272774306
Epoch: 58, step: 578, loss: 0.37087348103523254, mean loss: 0.34061368610341103
Epoch: 58, step: 579, loss: 0.29634910821914673, mean loss: 0.34061316121869484
Epoch: 58, step: 580, loss: 0.33764198422431946, mean loss: 0.34061312598720783
Epoch: 58, step: 581, loss: 0.35403525829315186, mean loss: 0.3406132851416687
Epoch: 58, step: 582, loss: 0.31155192852020264, mean loss: 0.3406129405474122
Epoch: 58, step: 583, loss: 0.3534257113933563, mean loss: 0.34061309247269733
Epoch: 58, step: 584, loss: 0.3294135630130768, mean loss: 0.3406129596777264
Epoch: 58, step: 585, loss: 0.317105770111084, mean loss: 0.3406126809517717
Epoch: 58, step: 586, loss: 0.3535196781158447, mean loss: 0.3406128339888858
Epoch: 58, step: 587, loss: 0.35794055461883545, mean loss: 0.3406130394396877
Epoch: 58, step: 588, loss: 0.33213120698928833, mean loss: 0.3406129388737417
Epoch: 58, step: 589, loss: 0.3952292203903198, mean loss: 0.3406135864310858
Epoch: 58, step: 590, loss: 0.37185218930244446, mean loss: 0.34061395680684753
Epoch: 58, step: 591, loss: 0.3786669075489044, mean loss: 0.34061440797054315
Epoch: 58, step: 592, loss: 0.3355715870857239, mean loss: 0.3406143481825191
Epoch: 58, step: 593, loss: 0.3197530508041382, mean loss: 0.34061410085250493
Epoch: 58, step: 594, loss: 0.31699228286743164, mean loss: 0.34061382079728086
Epoch: 58, step: 595, loss: 0.33172479271888733, mean loss: 0.3406137154121137
Epoch: 58, step: 596, loss: 0.29974186420440674, mean loss: 0.34061323085567313
Epoch: 58, step: 597, loss: 0.3362121284008026, mean loss: 0.3406131786789991
Epoch: 58, step: 598, loss: 0.33840662240982056, mean loss: 0.34061315251978025
Epoch: 58, step: 599, loss: 0.35135477781295776, mean loss: 0.3406132798626446
Epoch: 58, step: 600, loss: 0.3209092319011688, mean loss: 0.3406130462722808
Epoch: 58, step: 601, loss: 0.36153632402420044, mean loss: 0.3406132943136037
Epoch: 58, step: 602, loss: 0.3410515785217285, mean loss: 0.3406132995093148
Epoch: 58, step: 603, loss: 0.3229734003543854, mean loss: 0.3406130903967543
Epoch: 58, step: 604, loss: 0.3235880434513092, mean loss: 0.3406128885753649
Epoch: 58, step: 605, loss: 0.3567337691783905, mean loss: 0.34061307967615684
Epoch: 58, step: 606, loss: 0.36769354343414307, mean loss: 0.34061340069067525
Epoch: 58, step: 607, loss: 0.37601301074028015, mean loss: 0.3406138203162093
Epoch: 58, step: 608, loss: 0.3700447380542755, mean loss: 0.34061416918497256
Epoch: 58, step: 609, loss: 0.31124699115753174, mean loss: 0.34061382107589466
Epoch: 58, step: 610, loss: 0.3417817950248718, mean loss: 0.3406138349205179
Epoch: 58, step: 611, loss: 0.3288233280181885, mean loss: 0.3406136951629566
Epoch: 58, step: 612, loss: 0.3239676058292389, mean loss: 0.34061349785258693
Epoch: 58, step: 613, loss: 0.33708441257476807, mean loss: 0.3406134560219291
Epoch: 58, step: 614, loss: 0.3511178195476532, mean loss: 0.3406135805298946
Epoch: 58, step: 615, loss: 0.3058983087539673, mean loss: 0.3406131690554994
Epoch: 58, step: 616, loss: 0.3468049168586731, mean loss: 0.34061324244439584
Epoch: 58, step: 617, loss: 0.2956715226173401, mean loss: 0.3406127097702246
Epoch: 58, step: 618, loss: 0.35099926590919495, mean loss: 0.34061283287598537
Epoch: 58, step: 619, loss: 0.31155335903167725, mean loss: 0.3406124884551604
Epoch: 58, step: 620, loss: 0.3545117974281311, mean loss: 0.34061265319161604
Epoch: 58, step: 621, loss: 0.3764440417289734, mean loss: 0.3406130778649578
Epoch: 58, step: 622, loss: 0.3112620711326599, mean loss: 0.3406127300011743
Epoch: 58, step: 623, loss: 0.3309629559516907, mean loss: 0.3406126156348373
Epoch: 58, step: 624, loss: 0.3409360349178314, mean loss: 0.34061261946786386
Epoch: 58, step: 625, loss: 0.3139632046222687, mean loss: 0.3406123036341768
Epoch: 58, step: 626, loss: 0.3178539574146271, mean loss: 0.34061203391841555
Epoch: 58, step: 627, loss: 0.3583056330680847, mean loss: 0.3406122436079054
Epoch: 58, step: 628, loss: 0.2959825098514557, mean loss: 0.34061171470052387
Epoch: 58, step: 629, loss: 0.3217574954032898, mean loss: 0.34061149126164714
Epoch: 58, step: 630, loss: 0.33110588788986206, mean loss: 0.34061137861332497
Epoch: 58, step: 631, loss: 0.3410690724849701, mean loss: 0.3406113840372664
Epoch: 58, step: 632, loss: 0.3703126609325409, mean loss: 0.34061173601068456
Epoch: 58, step: 633, loss: 0.3104833960533142, mean loss: 0.340611378980609
Epoch: 58, step: 634, loss: 0.35398805141448975, mean loss: 0.3406115374964045
Epoch: 58, step: 635, loss: 0.3080739378929138, mean loss: 0.3406111519250009
Epoch: 58, step: 636, loss: 0.3301917612552643, mean loss: 0.34061102845641295
Epoch: 58, step: 637, loss: 0.32238292694091797, mean loss: 0.34061081245805397
Epoch: 58, step: 638, loss: 0.36430999636650085, mean loss: 0.34061109328401773
Epoch: 58, step: 639, loss: 0.3893283009529114, mean loss: 0.3406116705568359
Epoch: 58, step: 640, loss: 0.29842236638069153, mean loss: 0.34061117064210156
Epoch: 58, step: 641, loss: 0.30031463503837585, mean loss: 0.3406106931610531
Epoch: 58, step: 642, loss: 0.3880099356174469, mean loss: 0.3406112547967241
Epoch: 58, step: 643, loss: 0.3180161714553833, mean loss: 0.34061098706977805
Epoch: 58, step: 644, loss: 0.32934385538101196, mean loss: 0.3406108535682118
Epoch: 58, step: 645, loss: 0.3185173273086548, mean loss: 0.3406105917903704
Epoch: 58, step: 646, loss: 0.31937292218208313, mean loss: 0.3406103401562324
Epoch: 58, step: 647, loss: 0.32422366738319397, mean loss: 0.34061014600134176
Epoch: 58, step: 648, loss: 0.37887853384017944, mean loss: 0.3406105994128871
Epoch: 58, step: 649, loss: 0.32562142610549927, mean loss: 0.34061042182025536
Epoch: 58, step: 650, loss: 0.3327534794807434, mean loss: 0.34061032873183034
Epoch: 58, step: 651, loss: 0.34426894783973694, mean loss: 0.3406103720783436
Epoch: 58, step: 652, loss: 0.3265456259250641, mean loss: 0.34061020544430354
Epoch: 58, step: 653, loss: 0.3607975244522095, mean loss: 0.34061044461354517
Epoch: 58, step: 654, loss: 0.33313533663749695, mean loss: 0.3406103560532602
Epoch: 58, step: 655, loss: 0.29596787691116333, mean loss: 0.3406098271640655
Epoch: 58, step: 656, loss: 0.3281973898410797, mean loss: 0.3406096801129534
Epoch: 58, step: 657, loss: 0.4004499316215515, mean loss: 0.340610389036677
Epoch: 58, step: 658, loss: 0.34179794788360596, mean loss: 0.3406104031054459
Epoch: 58, step: 659, loss: 0.3896353542804718, mean loss: 0.34061098388722066
Epoch: 58, step: 660, loss: 0.3173978328704834, mean loss: 0.3406107088922434
Epoch: 58, step: 661, loss: 0.32152867317199707, mean loss: 0.3406104828392697
Epoch: 58, step: 662, loss: 0.3723713755607605, mean loss: 0.34061085908629596
Epoch: 58, step: 663, loss: 0.3190615177154541, mean loss: 0.34061060381073954
Epoch: 58, step: 664, loss: 0.34384506940841675, mean loss: 0.3406106421260741
Epoch: 58, step: 665, loss: 0.32290637493133545, mean loss: 0.3406104324046024
Epoch: 58, step: 666, loss: 0.3188108801841736, mean loss: 0.3406101741742014
Epoch: 58, step: 667, loss: 0.3156944215297699, mean loss: 0.3406098790338005
Epoch: 58, step: 668, loss: 0.31527167558670044, mean loss: 0.3406095788927995
Epoch: 58, step: 669, loss: 0.32219409942626953, mean loss: 0.34060936075677495
Epoch: 58, step: 670, loss: 0.3498174250125885, mean loss: 0.3406094698273393
Epoch: 58, step: 671, loss: 0.3075193762779236, mean loss: 0.34060907787607486
Epoch: 58, step: 672, loss: 0.33359387516975403, mean loss: 0.3406089947821725
Epoch: 58, step: 673, loss: 0.31877079606056213, mean loss: 0.3406087361154262
Epoch: 58, step: 674, loss: 0.3507903218269348, mean loss: 0.3406088567117486
Epoch: 58, step: 675, loss: 0.39640235900878906, mean loss: 0.340609517552966
Epoch: 58, step: 676, loss: 0.3396472930908203, mean loss: 0.3406095061561182
Epoch: 58, step: 677, loss: 0.35652169585227966, mean loss: 0.34060969462218116
Epoch: 58, step: 678, loss: 0.3274131715297699, mean loss: 0.34060953832268104
Epoch: 58, step: 679, loss: 0.3155934810638428, mean loss: 0.34060924203623444
Epoch: 58, step: 680, loss: 0.3067444860935211, mean loss: 0.3406088409518724
Epoch: 58, step: 681, loss: 0.33915281295776367, mean loss: 0.3406088237073027
Epoch: 58, step: 682, loss: 0.37783902883529663, mean loss: 0.34060926464062574
Epoch: 58, step: 683, loss: 0.3488677740097046, mean loss: 0.3406093624485438
Epoch: 58, step: 684, loss: 0.3414788544178009, mean loss: 0.340609372746067
Epoch: 58, step: 685, loss: 0.34226226806640625, mean loss: 0.34060939232132126
Epoch: 58, step: 686, loss: 0.33729004859924316, mean loss: 0.340609353010769
Epoch: 58, step: 687, loss: 0.2927387058734894, mean loss: 0.34060878609168876
Epoch: 58, step: 688, loss: 0.32540297508239746, mean loss: 0.34060860601552895
Epoch: 58, step: 689, loss: 0.304610013961792, mean loss: 0.3406081797040719
Epoch: 58, step: 690, loss: 0.3034801781177521, mean loss: 0.34060774002284805
Epoch: 58, step: 691, loss: 0.3168487846851349, mean loss: 0.34060745866531716
Epoch: 58, step: 692, loss: 0.3629106879234314, mean loss: 0.3406077227807681
Epoch: 58, step: 693, loss: 0.3004988729953766, mean loss: 0.3406072478162963
Epoch: 58, step: 694, loss: 0.3116011619567871, mean loss: 0.34060690433356916
Epoch: 58, step: 695, loss: 0.31164512038230896, mean loss: 0.34060656137951517
Epoch: 58, step: 696, loss: 0.3204893469810486, mean loss: 0.34060632316219586
Epoch: 58, step: 697, loss: 0.31508105993270874, mean loss: 0.34060602090922687
Epoch: 58, step: 698, loss: 0.30157044529914856, mean loss: 0.34060555868171494
Epoch: 58, step: 699, loss: 0.3540705740451813, mean loss: 0.3406057181215786
Epoch: 58, step: 700, loss: 0.35109835863113403, mean loss: 0.34060584236394426
Epoch: 58, step: 701, loss: 0.32842862606048584, mean loss: 0.3406056981763829
Epoch: 58, step: 702, loss: 0.32236212491989136, mean loss: 0.34060548216106995
Epoch: 58, step: 703, loss: 0.3517792820930481, mean loss: 0.3406056144642803
Epoch: 58, step: 704, loss: 0.2901550531387329, mean loss: 0.3406050171122393
Epoch: 58, step: 705, loss: 0.3826243579387665, mean loss: 0.3406055146298318
Epoch: 58, step: 706, loss: 0.31665754318237305, mean loss: 0.34060523108430735
Epoch: 58, step: 707, loss: 0.3318687379360199, mean loss: 0.3406051276448905
Epoch: 58, step: 708, loss: 0.35765644907951355, mean loss: 0.3406053295288539
Epoch: 58, step: 709, loss: 0.30207428336143494, mean loss: 0.3406048733349896
Epoch: 58, step: 710, loss: 0.3396171033382416, mean loss: 0.3406048616402831
Epoch: 58, step: 711, loss: 0.3369585871696472, mean loss: 0.34060481847071417
Epoch: 58, step: 712, loss: 0.3221414089202881, mean loss: 0.34060459987828473
Epoch: 58, step: 713, loss: 0.40574848651885986, mean loss: 0.3406053711221774
Epoch: 58, step: 714, loss: 0.3589338958263397, mean loss: 0.34060558811253705
Epoch: 58, step: 715, loss: 0.40332478284835815, mean loss: 0.34060633063271906
Epoch: 58, step: 716, loss: 0.3232332170009613, mean loss: 0.3406061249582866
Epoch: 58, step: 717, loss: 0.3269891142845154, mean loss: 0.3406059637529987
Epoch: 58, step: 718, loss: 0.3534167408943176, mean loss: 0.34060611541187735
Epoch: 58, step: 719, loss: 0.2920777201652527, mean loss: 0.34060554092097806
Epoch: 58, step: 720, loss: 0.3359299898147583, mean loss: 0.34060548557132664
Epoch: 58, step: 721, loss: 0.3235880434513092, mean loss: 0.34060528411949387
Epoch: 58, step: 722, loss: 0.366580069065094, mean loss: 0.34060559160437043
Epoch: 58, step: 723, loss: 0.3568539619445801, mean loss: 0.3406057839474068
Epoch: 58, step: 724, loss: 0.3416393995285034, mean loss: 0.34060579618287423
Epoch: 58, step: 725, loss: 0.34498485922813416, mean loss: 0.3406058480196015
Epoch: 58, step: 726, loss: 0.32650044560432434, mean loss: 0.3406056810502669
Epoch: 58, step: 727, loss: 0.34896811842918396, mean loss: 0.3406057800374518
Epoch: 58, step: 728, loss: 0.35055622458457947, mean loss: 0.3406058978206758
Epoch: 58, step: 729, loss: 0.31249144673347473, mean loss: 0.34060556503438894
Epoch: 58, step: 730, loss: 0.34093013405799866, mean loss: 0.3406055688762154
Epoch: 58, step: 731, loss: 0.332890123128891, mean loss: 0.340605477551873
Epoch: 58, step: 732, loss: 0.3552131652832031, mean loss: 0.34060565045460994
Epoch: 58, step: 733, loss: 0.3514017164707184, mean loss: 0.3406057782398763
Epoch: 58, step: 734, loss: 0.3380683660507202, mean loss: 0.3406057482067092
Epoch: 58, step: 735, loss: 0.336520254611969, mean loss: 0.34060569985080547
Epoch: 58, step: 736, loss: 0.3760053813457489, mean loss: 0.34060611883648995
Epoch: 58, step: 737, loss: 0.31396496295928955, mean loss: 0.3406058035192231
Epoch: 58, step: 738, loss: 0.379533976316452, mean loss: 0.3406062642567312
Epoch: 58, step: 739, loss: 0.3687344193458557, mean loss: 0.3406065971658242
Epoch: 58, step: 740, loss: 0.33095619082450867, mean loss: 0.3406064829503704
Epoch: 58, step: 741, loss: 0.30003541707992554, mean loss: 0.3406060027853188
Epoch: 58, step: 742, loss: 0.3329135775566101, mean loss: 0.3406059117453137
Epoch: 58, step: 743, loss: 0.30330386757850647, mean loss: 0.34060547028010624
Epoch: 58, step: 744, loss: 0.3244737386703491, mean loss: 0.3406052793652618
Epoch: 58, step: 745, loss: 0.3206363022327423, mean loss: 0.34060504304041234
Epoch: 58, step: 746, loss: 0.2984367907047272, mean loss: 0.3406045440019345
Epoch: 58, step: 747, loss: 0.3478846848011017, mean loss: 0.3406046301574469
Epoch: 58, step: 748, loss: 0.3229335844516754, mean loss: 0.34060442103512045
Epoch: 58, step: 749, loss: 0.3276940584182739, mean loss: 0.3406042682533802
Epoch: 58, step: 750, loss: 0.3013591170310974, mean loss: 0.34060380383020916
Epoch: 58, step: 751, loss: 0.32999715209007263, mean loss: 0.34060367831364496
Epoch: 58, step: 752, loss: 0.2996450960636139, mean loss: 0.34060319362537506
Epoch: 58, step: 753, loss: 0.348903089761734, mean loss: 0.340603291842024
Epoch: 58, step: 754, loss: 0.33455267548561096, mean loss: 0.34060322024302797
Epoch: 58, step: 755, loss: 0.32956573367118835, mean loss: 0.34060308963425046
Epoch: 58, step: 756, loss: 0.3519926071166992, mean loss: 0.34060322440708507
Epoch: 58, step: 757, loss: 0.33464911580085754, mean loss: 0.34060315395259916
Epoch: 58, step: 758, loss: 0.31711235642433167, mean loss: 0.3406028759911796
Epoch: 58, step: 759, loss: 0.3643619418144226, mean loss: 0.3406031571236321
Epoch: 58, step: 760, loss: 0.3280908167362213, mean loss: 0.3406030090713752
Epoch: 58, step: 761, loss: 0.30578625202178955, mean loss: 0.34060259710700186
Epoch: 58, step: 762, loss: 0.345879465341568, mean loss: 0.34060265954406316
Epoch: 58, step: 763, loss: 0.3530980944633484, mean loss: 0.34060280739103793
Epoch: 58, step: 764, loss: 0.32546618580818176, mean loss: 0.3406026282954526
Epoch: 58, step: 765, loss: 0.33152636885643005, mean loss: 0.34060252090697396
Epoch: 58, step: 766, loss: 0.3273971676826477, mean loss: 0.3406023646657356
Epoch: 58, step: 767, loss: 0.37011581659317017, mean loss: 0.3406027138547078
Epoch: 58, step: 768, loss: 0.35236793756484985, mean loss: 0.3406028530535307
Epoch: 58, step: 769, loss: 0.27762752771377563, mean loss: 0.34060210797739265
Epoch: 58, step: 770, loss: 0.3346983790397644, mean loss: 0.3406020381297898
Epoch: 58, step: 771, loss: 0.304090291261673, mean loss: 0.34060160616080026
Epoch: 58, step: 772, loss: 0.3338967561721802, mean loss: 0.34060152683693173
Epoch: 58, step: 773, loss: 0.31278759241104126, mean loss: 0.34060119777919295
Epoch: 58, step: 774, loss: 0.3487771451473236, mean loss: 0.34060129450506005
Epoch: 58, step: 775, loss: 0.3034927546977997, mean loss: 0.3406008554962132
Epoch: 58, step: 776, loss: 0.32203909754753113, mean loss: 0.3406006359058011
Epoch: 58, step: 777, loss: 0.3591481149196625, mean loss: 0.340600855324694
Epoch: 58, step: 778, loss: 0.34215623140335083, mean loss: 0.34060087372476117
Epoch: 58, step: 779, loss: 0.4114064872264862, mean loss: 0.3406017113438108
Epoch: 58, step: 780, loss: 0.34296050667762756, mean loss: 0.3406017392476511
Epoch: 58, step: 781, loss: 0.3473607301712036, mean loss: 0.34060181920353777
Epoch: 58, step: 782, loss: 0.31633424758911133, mean loss: 0.3406015321322464
Epoch: 58, step: 783, loss: 0.3252788484096527, mean loss: 0.34060135087593285
Epoch: 58, step: 784, loss: 0.30349263548851013, mean loss: 0.3406009119117469
Epoch: 58, step: 785, loss: 0.3633330762386322, mean loss: 0.3406011808105182
Epoch: 58, step: 786, loss: 0.3261517882347107, mean loss: 0.3406010098906756
Epoch: 58, step: 787, loss: 0.34118011593818665, mean loss: 0.340601016740759
Epoch: 58, step: 788, loss: 0.3281129002571106, mean loss: 0.34060086902407144
Epoch: 58, step: 789, loss: 0.3045862913131714, mean loss: 0.34060044302778897
Epoch: 58, step: 790, loss: 0.32469964027404785, mean loss: 0.3406002549483175
Epoch: 58, step: 791, loss: 0.37937942147254944, mean loss: 0.34060071363452266
Epoch: 58, step: 792, loss: 0.3200671970844269, mean loss: 0.3406004707636663
Epoch: 58, step: 793, loss: 0.3171026408672333, mean loss: 0.340600192834138
Epoch: 58, step: 794, loss: 0.3375447690486908, mean loss: 0.34060015669537747
Epoch: 58, step: 795, loss: 0.3405632972717285, mean loss: 0.3406001562594189
Epoch: 58, step: 796, loss: 0.32958561182022095, mean loss: 0.34060002598532413
Epoch: 58, step: 797, loss: 0.34397202730178833, mean loss: 0.3406000658670665
Epoch: 58, step: 798, loss: 0.3517513871192932, mean loss: 0.3406001977557639
Epoch: 58, step: 799, loss: 0.3274598717689514, mean loss: 0.34060004234458513
Epoch: 58, step: 800, loss: 0.36916792392730713, mean loss: 0.3406003802141058
Epoch: 58, step: 801, loss: 0.35590413212776184, mean loss: 0.34060056120793125
Epoch: 58, step: 802, loss: 0.29398736357688904, mean loss: 0.3406000099312754
Epoch: 58, step: 803, loss: 0.37173429131507874, mean loss: 0.3406003781402894
Epoch: 58, step: 804, loss: 0.3200857639312744, mean loss: 0.34060013552744584
Epoch: 58, step: 805, loss: 0.30197885632514954, mean loss: 0.34059967878439135
Epoch: 58, step: 806, loss: 0.30722829699516296, mean loss: 0.3405992841323521
Epoch: 58, step: 807, loss: 0.29990699887275696, mean loss: 0.34059880290854344
Epoch: 58, step: 808, loss: 0.32240405678749084, mean loss: 0.34059858774143187
Epoch: 58, step: 809, loss: 0.3498731851577759, mean loss: 0.3405986974195073
Epoch: 58, step: 810, loss: 0.32429197430610657, mean loss: 0.3405985045843062
Epoch: 58, step: 811, loss: 0.37845566868782043, mean loss: 0.3405989522590153
Epoch: 58, step: 812, loss: 0.33500728011131287, mean loss: 0.3405988861362441
Epoch: 58, step: 813, loss: 0.3105054795742035, mean loss: 0.3405985302792027
Epoch: 58, step: 814, loss: 0.3336152732372284, mean loss: 0.3405984477025825
Epoch: 58, step: 815, loss: 0.3325347602367401, mean loss: 0.34059835235106106
Epoch: 58, step: 816, loss: 0.3385167717933655, mean loss: 0.3405983277370706
Epoch: 58, step: 817, loss: 0.31606996059417725, mean loss: 0.3405980377008031
Epoch: 58, step: 818, loss: 0.3160460889339447, mean loss: 0.3405977473891269
Epoch: 58, step: 819, loss: 0.332339882850647, mean loss: 0.3405976497461181
Epoch: 58, step: 820, loss: 0.3606358468532562, mean loss: 0.3405978866798571
Epoch: 58, step: 821, loss: 0.34920647740364075, mean loss: 0.34059798846753087
Epoch: 58, step: 822, loss: 0.34611776471138, mean loss: 0.34059805373239926
Epoch: 58, step: 823, loss: 0.34987491369247437, mean loss: 0.3405981634190711
Epoch: 58, step: 824, loss: 0.3484950661659241, mean loss: 0.34059825678845934
Epoch: 58, step: 825, loss: 0.30542245507240295, mean loss: 0.34059784089068784
Epoch: 58, step: 826, loss: 0.3273289203643799, mean loss: 0.34059768400871326
Epoch: 58, step: 827, loss: 0.37573206424713135, mean loss: 0.340598099406919
Epoch: 58, step: 828, loss: 0.3060919940471649, mean loss: 0.34059769144170976
Epoch: 58, step: 829, loss: 0.31477227807044983, mean loss: 0.3405973861118125
Epoch: 58, step: 830, loss: 0.30732885003089905, mean loss: 0.3405969927876684
Epoch: 58, step: 831, loss: 0.3048221170902252, mean loss: 0.3405965698368066
Epoch: 58, step: 832, loss: 0.3190363943576813, mean loss: 0.34059631494320275
Epoch: 58, step: 833, loss: 0.31885096430778503, mean loss: 0.34059605786341846
Epoch: 58, step: 834, loss: 0.30447953939437866, mean loss: 0.3405956308886059
Epoch: 58, step: 835, loss: 0.31093278527259827, mean loss: 0.34059528021421215
Epoch: 58, step: 836, loss: 0.3206775486469269, mean loss: 0.3405950447494169
Epoch: 58, step: 837, loss: 0.3410201966762543, mean loss: 0.34059504977544747
Epoch: 58, step: 838, loss: 0.32127681374549866, mean loss: 0.34059482140320896
Epoch: 58, step: 839, loss: 0.3263765871524811, mean loss: 0.3405946533230802
Epoch: 58, step: 840, loss: 0.3534676134586334, mean loss: 0.3405948054983209
Epoch: 58, step: 841, loss: 0.325514018535614, mean loss: 0.34059462722578426
Epoch: 58, step: 842, loss: 0.38821858167648315, mean loss: 0.34059519018996004
Epoch: 58, step: 843, loss: 0.4180908203125, mean loss: 0.34059610625726966
Epoch: 58, step: 844, loss: 0.30407196283340454, mean loss: 0.340595674514496
Epoch: 58, step: 845, loss: 0.3498530983924866, mean loss: 0.34059578394289713
Epoch: 58, step: 846, loss: 0.33105018734931946, mean loss: 0.3405956711094524
Epoch: 58, step: 847, loss: 0.37973910570144653, mean loss: 0.3405961337978045
Epoch: 58, step: 848, loss: 0.3363480865955353, mean loss: 0.34059608358507415
Epoch: 58, step: 849, loss: 0.32588303089141846, mean loss: 0.3405959096760331
Epoch: 58, step: 850, loss: 0.36901456117630005, mean loss: 0.340596245581988
Epoch: 58, step: 851, loss: 0.3157380521297455, mean loss: 0.3405959517638062
Epoch: 58, step: 852, loss: 0.30138570070266724, mean loss: 0.340595488313052
Epoch: 58, step: 853, loss: 0.34167566895484924, mean loss: 0.34059550108023917
Epoch: 58, step: 854, loss: 0.366729736328125, mean loss: 0.34059580996999117
Epoch: 58, step: 855, loss: 0.33234503865242004, mean loss: 0.340595712452365
Epoch: 58, step: 856, loss: 0.3525127172470093, mean loss: 0.340595853300322
Epoch: 58, step: 857, loss: 0.3089924156665802, mean loss: 0.34059547978138055
Epoch: 58, step: 858, loss: 0.35537657141685486, mean loss: 0.3405956544760613
Epoch: 58, step: 859, loss: 0.3750823140144348, mean loss: 0.3405960620619775
Epoch: 58, step: 860, loss: 0.31903526186943054, mean loss: 0.3405958072453395
Epoch: 58, step: 861, loss: 0.31380409002304077, mean loss: 0.3405954906107729
Epoch: 58, step: 862, loss: 0.3368839621543884, mean loss: 0.3405954467470554
Epoch: 58, step: 863, loss: 0.3687240481376648, mean loss: 0.34059577917356326
Epoch: 58, step: 864, loss: 0.33404356241226196, mean loss: 0.34059570173975257
Epoch: 58, step: 865, loss: 0.3603195250034332, mean loss: 0.34059593483227735
Epoch: 58, step: 866, loss: 0.3138176500797272, mean loss: 0.3405956183751607
Epoch: 58, step: 867, loss: 0.3063005208969116, mean loss: 0.34059521309156965
Epoch: 58, step: 868, loss: 0.35554635524749756, mean loss: 0.3405953897751607
Epoch: 58, step: 869, loss: 0.29894474148750305, mean loss: 0.3405948975787072
Epoch: 58, step: 870, loss: 0.31035956740379333, mean loss: 0.34059454028423436
Epoch: 58, step: 871, loss: 0.33903542160987854, mean loss: 0.3405945218601623
Epoch: 58, step: 872, loss: 0.3198518455028534, mean loss: 0.3405942767472955
Epoch: 58, step: 873, loss: 0.3233107924461365, mean loss: 0.3405940725135576
Epoch: 58, step: 874, loss: 0.35179662704467773, mean loss: 0.3405942048892123
Epoch: 58, step: 875, loss: 0.2899045944213867, mean loss: 0.34059360591948046
Epoch: 58, step: 876, loss: 0.3136642277240753, mean loss: 0.3405932877143948
Epoch: 58, step: 877, loss: 0.3250277042388916, mean loss: 0.34059310378926805
Epoch: 58, step: 878, loss: 0.3384563624858856, mean loss: 0.3405930785415302
Epoch: 58, step: 879, loss: 0.37728261947631836, mean loss: 0.3405935120600685
Epoch: 58, step: 880, loss: 0.34040045738220215, mean loss: 0.3405935097789881
Epoch: 58, step: 881, loss: 0.37876182794570923, mean loss: 0.3405939607598961
Epoch: 58, step: 882, loss: 0.3664220869541168, mean loss: 0.3405942659306434
Epoch: 58, step: 883, loss: 0.34179627895355225, mean loss: 0.3405942801327917
Epoch: 58, step: 884, loss: 0.3016201853752136, mean loss: 0.3405938196474867
Epoch: 58, step: 885, loss: 0.3401690125465393, mean loss: 0.3405938146283806
Epoch: 58, step: 886, loss: 0.327972948551178, mean loss: 0.340593665514307
Epoch: 58, step: 887, loss: 0.3323307931423187, mean loss: 0.3405935678905786
Epoch: 58, step: 888, loss: 0.33349645137786865, mean loss: 0.34059348404094886
Epoch: 58, step: 889, loss: 0.33043453097343445, mean loss: 0.340593364018347
Epoch: 58, step: 890, loss: 0.30235978960990906, mean loss: 0.34059291231443284
Epoch: 58, step: 891, loss: 0.3176880478858948, mean loss: 0.3405926417120933
Epoch: 58, step: 892, loss: 0.3187265396118164, mean loss: 0.3405923833849375
Epoch: 58, step: 893, loss: 0.31388431787490845, mean loss: 0.3405920678583266
Epoch: 58, step: 894, loss: 0.33186474442481995, mean loss: 0.3405919647557543
Epoch: 58, step: 895, loss: 0.31699883937835693, mean loss: 0.340591686035343
Epoch: 58, step: 896, loss: 0.3741924464702606, mean loss: 0.34059208297754473
Epoch: 58, step: 897, loss: 0.32424110174179077, mean loss: 0.3405918898176955
Epoch: 58, step: 898, loss: 0.31443601846694946, mean loss: 0.34059158083290675
Epoch: 58, step: 899, loss: 0.34740784764289856, mean loss: 0.3405916613539436
Epoch: 58, step: 900, loss: 0.33559107780456543, mean loss: 0.340591602282398
Epoch: 58, step: 901, loss: 0.334050714969635, mean loss: 0.34059152501626394
Epoch: 58, step: 902, loss: 0.34924542903900146, mean loss: 0.34059162724181496
Epoch: 58, step: 903, loss: 0.3259420096874237, mean loss: 0.34059145419303455
Epoch: 58, step: 904, loss: 0.30639204382896423, mean loss: 0.34059105021686764
Epoch: 58, step: 905, loss: 0.35520851612091064, mean loss: 0.34059122288177707
Epoch: 58, step: 906, loss: 0.29501402378082275, mean loss: 0.3405906845196525
Epoch: 58, step: 907, loss: 0.3201090097427368, mean loss: 0.3405904425910584
Epoch: 58, step: 908, loss: 0.3493978977203369, mean loss: 0.34059054662308175
Epoch: 58, step: 909, loss: 0.3143768012523651, mean loss: 0.3405902369948498
Epoch: 58, step: 910, loss: 0.3520630896091461, mean loss: 0.34059037250685165
Epoch: 58, step: 911, loss: 0.3457867503166199, mean loss: 0.3405904338833258
Epoch: 58, step: 912, loss: 0.331676721572876, mean loss: 0.3405903286011867
Epoch: 58, step: 913, loss: 0.30728551745414734, mean loss: 0.34058993523417813
Epoch: 58, step: 914, loss: 0.34447380900382996, mean loss: 0.3405899811065224
Epoch: 58, step: 915, loss: 0.3951227068901062, mean loss: 0.3405906251836918
Epoch: 58, step: 916, loss: 0.3196764886379242, mean loss: 0.3405903781731384
Epoch: 58, step: 917, loss: 0.3724830746650696, mean loss: 0.3405907548437005
Epoch: 58, step: 918, loss: 0.42106738686561584, mean loss: 0.3405917053064566
Epoch: 58, step: 919, loss: 0.3554489016532898, mean loss: 0.3405918807741005
Epoch: 58, step: 920, loss: 0.30498209595680237, mean loss: 0.3405914602175498
Epoch: 58, step: 921, loss: 0.3102485239505768, mean loss: 0.340591101867451
Epoch: 58, step: 922, loss: 0.2914486229419708, mean loss: 0.3405905215015942
Epoch: 58, step: 923, loss: 0.3264448642730713, mean loss: 0.34059035444531816
Epoch: 58, step: 924, loss: 0.34949755668640137, mean loss: 0.34059045963565604
Epoch: 58, step: 925, loss: 0.38789719343185425, mean loss: 0.3405910183018243
Epoch: 58, step: 926, loss: 0.37907764315605164, mean loss: 0.3405914728020529
Epoch: 58, step: 927, loss: 0.3285697102546692, mean loss: 0.34059133083508847
Epoch: 58, step: 928, loss: 0.31709837913513184, mean loss: 0.3405910534062473
Epoch: 58, step: 929, loss: 0.3097633719444275, mean loss: 0.3405906893657019
Epoch: 58, step: 930, loss: 0.3484598398208618, mean loss: 0.3405907822904974
Epoch: 58, step: 931, loss: 0.33393236994743347, mean loss: 0.3405907036639287
Epoch: 58, step: 932, loss: 0.3706103265285492, mean loss: 0.34059105814964474
Epoch: 58, step: 933, loss: 0.3225952684879303, mean loss: 0.3405908456494716
Epoch: 58, step: 934, loss: 0.3070056438446045, mean loss: 0.3405904490691015
Epoch: 58, step: 935, loss: 0.33284714818000793, mean loss: 0.3405903576358301
Epoch: 58, step: 936, loss: 0.354509174823761, mean loss: 0.340590521987956
Epoch: 58, step: 937, loss: 0.33076202869415283, mean loss: 0.3405904059353725
Epoch: 58, step: 938, loss: 0.3240315318107605, mean loss: 0.3405902104143121
Epoch: 58, step: 939, loss: 0.29907387495040894, mean loss: 0.3405897202105684
Epoch: 58, step: 940, loss: 0.35140174627304077, mean loss: 0.3405898478719579
Epoch: 58, step: 941, loss: 0.36853328347206116, mean loss: 0.3405901778060217
Epoch: 58, step: 942, loss: 0.31907665729522705, mean loss: 0.3405899237943267
Epoch: 58, step: 943, loss: 0.3500741124153137, mean loss: 0.3405900357735066
Epoch: 58, step: 944, loss: 0.36471831798553467, mean loss: 0.3405903206511553
Epoch: 58, step: 945, loss: 0.33171480894088745, mean loss: 0.3405902158610574
Epoch: 58, step: 946, loss: 0.3852479159832001, mean loss: 0.3405907431128564
Epoch: 58, step: 947, loss: 0.358568012714386, mean loss: 0.34059095535925077
Epoch: 58, step: 948, loss: 0.347163587808609, mean loss: 0.340591032957301
Epoch: 58, step: 949, loss: 0.3332951068878174, mean loss: 0.3405909468208925
Epoch: 58, step: 950, loss: 0.3621954917907715, mean loss: 0.3405912018832276
Epoch: 58, step: 951, loss: 0.3111730217933655, mean loss: 0.34059085457755034
Epoch: 58, step: 952, loss: 0.330258309841156, mean loss: 0.3405907325948488
Epoch: 58, step: 953, loss: 0.3366609215736389, mean loss: 0.3405906862013109
Epoch: 58, step: 954, loss: 0.38388535380363464, mean loss: 0.3405911973121707
Epoch: 58, step: 955, loss: 0.34533900022506714, mean loss: 0.34059125336122054
Epoch: 58, step: 956, loss: 0.3659156858921051, mean loss: 0.3405915523192124
Epoch: 58, step: 957, loss: 0.34228837490081787, mean loss: 0.3405915723501719
Epoch: 58, step: 958, loss: 0.3009975850582123, mean loss: 0.34059110494939404
Epoch: 58, step: 959, loss: 0.32892516255378723, mean loss: 0.3405909672364089
Epoch: 58, step: 960, loss: 0.41021984815597534, mean loss: 0.3405917891749652
Epoch: 58, step: 961, loss: 0.31511545181274414, mean loss: 0.3405914884414694
Epoch: 58, step: 962, loss: 0.3235408365726471, mean loss: 0.3405912871707161
Epoch: 58, step: 963, loss: 0.3509742319583893, mean loss: 0.3405914097325083
Epoch: 58, step: 964, loss: 0.3185114562511444, mean loss: 0.34059114910059873
Epoch: 58, step: 965, loss: 0.32658451795578003, mean loss: 0.3405909837681883
Epoch: 58, step: 966, loss: 0.31985464692115784, mean loss: 0.3405907390021164
Epoch: 58, step: 967, loss: 0.33281099796295166, mean loss: 0.34059064717325616
Epoch: 58, step: 968, loss: 0.32421404123306274, mean loss: 0.34059045387282366
Epoch: 58, step: 969, loss: 0.34485507011413574, mean loss: 0.3405905042094097
Epoch: 58, step: 970, loss: 0.3225359320640564, mean loss: 0.34059029110821937
Epoch: 58, step: 971, loss: 0.31699249148368835, mean loss: 0.3405900125826584
Epoch: 58, step: 972, loss: 0.3332744240760803, mean loss: 0.3405899262375595
Epoch: 58, step: 973, loss: 0.3695094883441925, mean loss: 0.34059026756799066
Epoch: 58, step: 974, loss: 0.3416002094745636, mean loss: 0.34059027948794424
Epoch: 58, step: 975, loss: 0.3890443742275238, mean loss: 0.3405908513661278
Epoch: 58, step: 976, loss: 0.3361800014972687, mean loss: 0.34059079930780223
Epoch: 58, step: 977, loss: 0.33537012338638306, mean loss: 0.34059073769236586
Epoch: 58, step: 978, loss: 0.3362599313259125, mean loss: 0.34059068657994696
Epoch: 58, step: 979, loss: 0.34347063302993774, mean loss: 0.3405907205688349
Epoch: 58, step: 980, loss: 0.32752251625061035, mean loss: 0.3405905663407972
Epoch: 58, step: 981, loss: 0.36052507162094116, mean loss: 0.34059080160061356
Epoch: 58, step: 982, loss: 0.31581082940101624, mean loss: 0.3405905091598016
Epoch: 58, step: 983, loss: 0.31901881098747253, mean loss: 0.3405902545844361
Epoch: 58, step: 984, loss: 0.32185912132263184, mean loss: 0.340590033534207
Epoch: 58, step: 985, loss: 0.3497410714626312, mean loss: 0.34059014152634665
Epoch: 58, step: 986, loss: 0.3229931592941284, mean loss: 0.34058993386538494
Epoch: 58, step: 987, loss: 0.30059534311294556, mean loss: 0.3405894618971202
Epoch: 58, step: 988, loss: 0.3589297831058502, mean loss: 0.3405896783250737
Epoch: 58, step: 989, loss: 0.33807435631752014, mean loss: 0.3405896486429561
Epoch: 58, step: 990, loss: 0.3180958330631256, mean loss: 0.34058938320727905
Epoch: 58, step: 991, loss: 0.3293936550617218, mean loss: 0.340589251094939
Epoch: 58, step: 992, loss: 0.31366294622421265, mean loss: 0.3405889333616819
Epoch: 58, step: 993, loss: 0.33111655712127686, mean loss: 0.3405888215879552
Epoch: 58, step: 994, loss: 0.3094881474971771, mean loss: 0.3405884546053589
Epoch: 58, step: 995, loss: 0.29583486914634705, mean loss: 0.34058792652699177
Epoch: 58, step: 996, loss: 0.34205880761146545, mean loss: 0.34058794388272556
Epoch: 58, step: 997, loss: 0.3491854667663574, mean loss: 0.3405880453284233
Epoch: 58, step: 998, loss: 0.33980804681777954, mean loss: 0.34058803612500965
Epoch: 58, step: 999, loss: 0.31605803966522217, mean loss: 0.34058774669235364
Epoch: 58, step: 1000, loss: 0.3445838987827301, mean loss: 0.34058779384292165
Epoch: 58, step: 1001, loss: 0.3371022045612335, mean loss: 0.34058775271696556
Epoch: 58, step: 1002, loss: 0.30499720573425293, mean loss: 0.3405873327942827
Epoch: 58, step: 1003, loss: 0.33236053586006165, mean loss: 0.34058723572980426
Epoch: 58, step: 1004, loss: 0.3417985737323761, mean loss: 0.3405872500216976
Epoch: 58, step: 1005, loss: 0.3273736536502838, mean loss: 0.3405870941237721
Epoch: 58, step: 1006, loss: 0.3149452805519104, mean loss: 0.3405867915976265
Epoch: 58, step: 1007, loss: 0.33986812829971313, mean loss: 0.340586783118824
Epoch: 58, step: 1008, loss: 0.29663240909576416, mean loss: 0.34058626455044916
Epoch: 58, step: 1009, loss: 0.3148458003997803, mean loss: 0.3405859608711571
Epoch: 58, step: 1010, loss: 0.3848695755004883, mean loss: 0.34058648331154534
Epoch: 58, step: 1011, loss: 0.2960464060306549, mean loss: 0.34058595785171236
Epoch: 58, step: 1012, loss: 0.3194987177848816, mean loss: 0.340585709078751
Epoch: 58, step: 1013, loss: 0.35344260931015015, mean loss: 0.3405858607539537
Epoch: 58, step: 1014, loss: 0.32568690180778503, mean loss: 0.3405856849902845
Epoch: 58, step: 1015, loss: 0.3505650758743286, mean loss: 0.34058580271620564
Epoch: 58, step: 1016, loss: 0.3332885503768921, mean loss: 0.34058571663223225
Epoch: 58, step: 1017, loss: 0.3397376835346222, mean loss: 0.34058570662830284
Epoch: 58, step: 1018, loss: 0.30334264039993286, mean loss: 0.340585267290956
Epoch: 58, step: 1019, loss: 0.344372034072876, mean loss: 0.3405853119609742
Epoch: 58, step: 1020, loss: 0.30114442110061646, mean loss: 0.3405848467079943
Epoch: 58, step: 1021, loss: 0.3230895400047302, mean loss: 0.34058464033213964
Epoch: 58, step: 1022, loss: 0.33674585819244385, mean loss: 0.34058459505013267
Epoch: 58, step: 1023, loss: 0.29705262184143066, mean loss: 0.3405840815560635
Epoch: 58, step: 1024, loss: 0.35103848576545715, mean loss: 0.34058420487257873
Epoch: 58, step: 1025, loss: 0.3329416811466217, mean loss: 0.34058411472509087
Epoch: 58, step: 1026, loss: 0.3253821134567261, mean loss: 0.3405839354118026
Epoch: 58, step: 1027, loss: 0.31282392144203186, mean loss: 0.34058360797592185
Epoch: 58, step: 1028, loss: 0.3236645758152008, mean loss: 0.34058340841432005
Epoch: 58, step: 1029, loss: 0.3112298846244812, mean loss: 0.3405830621907845
Epoch: 58, step: 1030, loss: 0.3375948965549469, mean loss: 0.3405830269459166
Epoch: 58, step: 1031, loss: 0.3321106731891632, mean loss: 0.3405829270172301
Epoch: 58, step: 1032, loss: 0.3235490620136261, mean loss: 0.3405827261106428
Epoch: 58, step: 1033, loss: 0.3256193697452545, mean loss: 0.34058254962683215
Epoch: 58, step: 1034, loss: 0.36513185501098633, mean loss: 0.34058283916774507
Epoch: 58, step: 1035, loss: 0.33380502462387085, mean loss: 0.34058275922937475
Epoch: 58, step: 1036, loss: 0.3094924986362457, mean loss: 0.34058239255137884
Epoch: 58, step: 1037, loss: 0.32445767521858215, mean loss: 0.3405822023789843
Epoch: 58, step: 1038, loss: 0.3419964909553528, mean loss: 0.34058221905868585
Epoch: 58, step: 1039, loss: 0.31786686182022095, mean loss: 0.340581951163634
Epoch: 58, step: 1040, loss: 0.3310081958770752, mean loss: 0.34058183825625615
Epoch: 58, step: 1041, loss: 0.3692787289619446, mean loss: 0.34058217668693175
Epoch: 58, step: 1042, loss: 0.3349926769733429, mean loss: 0.34058211076913336
Epoch: 58, step: 1043, loss: 0.32213282585144043, mean loss: 0.34058189319654836
Epoch: 58, step: 1044, loss: 0.30603331327438354, mean loss: 0.3405814857696356
Epoch: 58, step: 1045, loss: 0.2999807894229889, mean loss: 0.34058100697654675
Epoch: 58, step: 1046, loss: 0.326416552066803, mean loss: 0.3405808399409106
Epoch: 58, step: 1047, loss: 0.31458157300949097, mean loss: 0.3405805333457817
Epoch: 58, step: 1048, loss: 0.3394365608692169, mean loss: 0.3405805198556993
Epoch: 58, step: 1049, loss: 0.32872116565704346, mean loss: 0.34058038000812263
Epoch: 58, step: 1050, loss: 0.3345569372177124, mean loss: 0.34058030897947045
Epoch: 58, step: 1051, loss: 0.33119720220565796, mean loss: 0.3405801983348455
Epoch: 58, step: 1052, loss: 0.294734925031662, mean loss: 0.34057965773849735
Epoch: 58, step: 1053, loss: 0.33048081398010254, mean loss: 0.3405795386567843
Epoch: 58, step: 1054, loss: 0.35756534337997437, mean loss: 0.3405797389445521
Epoch: 58, step: 1055, loss: 0.37272536754608154, mean loss: 0.3405801179846026
Epoch: 58, step: 1056, loss: 0.3063860833644867, mean loss: 0.3405797147958535
Epoch: 58, step: 1057, loss: 0.34994497895240784, mean loss: 0.3405798252222674
Epoch: 58, step: 1058, loss: 0.3237232267856598, mean loss: 0.3405796264674073
Epoch: 58, step: 1059, loss: 0.3036104738712311, mean loss: 0.34057919057210245
Epoch: 58, step: 1060, loss: 0.30695316195487976, mean loss: 0.3405787940995261
Epoch: 58, step: 1061, loss: 0.30355003476142883, mean loss: 0.34057835751170645
Epoch: 58, step: 1062, loss: 0.3296208381652832, mean loss: 0.34057822831852896
Epoch: 58, step: 1063, loss: 0.33215802907943726, mean loss: 0.34057812904245793
Epoch: 58, step: 1064, loss: 0.32112541794776917, mean loss: 0.34057789969325797
Epoch: 58, step: 1065, loss: 0.34118735790252686, mean loss: 0.34057790687873996
Epoch: 58, step: 1066, loss: 0.35850366950035095, mean loss: 0.3405781182200977
Epoch: 58, step: 1067, loss: 0.3703175187110901, mean loss: 0.34057846883788234
Epoch: 58, step: 1068, loss: 0.3903622627258301, mean loss: 0.3405790557655758
Epoch: 58, step: 1069, loss: 0.2879699468612671, mean loss: 0.3405784355360492
Epoch: 58, step: 1070, loss: 0.34893882274627686, mean loss: 0.34057853409878824
Epoch: 58, step: 1071, loss: 0.30688074231147766, mean loss: 0.3405781368316022
Epoch: 58, step: 1072, loss: 0.3870588541030884, mean loss: 0.3405786847917233
Epoch: 58, step: 1073, loss: 0.33769094944000244, mean loss: 0.3405786507486781
Epoch: 58, step: 1074, loss: 0.2945323586463928, mean loss: 0.3405781079227842
Epoch: 58, step: 1075, loss: 0.3521758019924164, mean loss: 0.34057824464290104
Epoch: 58, step: 1076, loss: 0.3005112409591675, mean loss: 0.34057777231617686
Epoch: 58, step: 1077, loss: 0.32506510615348816, mean loss: 0.34057758944848665
Epoch: 58, step: 1078, loss: 0.31927675008773804, mean loss: 0.3405773383511359
Epoch: 58, step: 1079, loss: 0.3205961585044861, mean loss: 0.34057710281289744
Epoch: 58, step: 1080, loss: 0.3266739845275879, mean loss: 0.34057693892480806
Epoch: 58, step: 1081, loss: 0.31281664967536926, mean loss: 0.3405766116941075
Epoch: 58, step: 1082, loss: 0.32509055733680725, mean loss: 0.3405764291508841
Epoch: 58, step: 1083, loss: 0.3277932107448578, mean loss: 0.3405762784693526
Epoch: 58, step: 1084, loss: 0.3018296957015991, mean loss: 0.3405758217513785
Epoch: 58, step: 1085, loss: 0.3386611044406891, mean loss: 0.3405757991822785
Epoch: 58, step: 1086, loss: 0.3356807231903076, mean loss: 0.34057574148386155
Epoch: 58, step: 1087, loss: 0.3207237124443054, mean loss: 0.34057550749011994
Epoch: 58, step: 1088, loss: 0.2922508418560028, mean loss: 0.34057493789917176
Epoch: 58, step: 1089, loss: 0.34539881348609924, mean loss: 0.3405749947563367
Epoch: 58, step: 1090, loss: 0.34352508187294006, mean loss: 0.34057502952746826
Epoch: 58, step: 1091, loss: 0.34653812646865845, mean loss: 0.34057509981054
Epoch: 58, step: 1092, loss: 0.35178667306900024, mean loss: 0.3405752319523664
Epoch: 58, step: 1093, loss: 0.3672398626804352, mean loss: 0.34057554622328934
Epoch: 58, step: 1094, loss: 0.3765895366668701, mean loss: 0.340575970681319
Epoch: 58, step: 1095, loss: 0.32935863733291626, mean loss: 0.34057583847627765
Epoch: 58, step: 1096, loss: 0.2857031226158142, mean loss: 0.3405751917660529
Epoch: 58, step: 1097, loss: 0.3401908278465271, mean loss: 0.34057518723613045
Epoch: 58, step: 1098, loss: 0.3667907118797302, mean loss: 0.3405754961956553
Epoch: 58, step: 1099, loss: 0.32337549328804016, mean loss: 0.34057529348973314
Epoch: 58, step: 1100, loss: 0.3075111210346222, mean loss: 0.3405749038255792
Epoch: 58, step: 1101, loss: 0.37496381998062134, mean loss: 0.3405753090971769
Epoch: 58, step: 1102, loss: 0.3132745623588562, mean loss: 0.3405749873630807
Epoch: 58, step: 1103, loss: 0.33080190420150757, mean loss: 0.34057487219051585
Epoch: 58, step: 1104, loss: 0.361358642578125, mean loss: 0.34057511711751526
Epoch: 58, step: 1105, loss: 0.2926473319530487, mean loss: 0.34057455231767125
Epoch: 58, step: 1106, loss: 0.3085964620113373, mean loss: 0.3405741754797365
Epoch: 58, step: 1107, loss: 0.3472365438938141, mean loss: 0.34057425398985214
Epoch: 58, step: 1108, loss: 0.31400999426841736, mean loss: 0.34057394095724913
Epoch: 58, step: 1109, loss: 0.3706803619861603, mean loss: 0.3405742957264159
Epoch: 58, step: 1110, loss: 0.33424216508865356, mean loss: 0.340574221110498
Epoch: 58, step: 1111, loss: 0.3255014419555664, mean loss: 0.3405740434995068
Epoch: 58, step: 1112, loss: 0.3435651361942291, mean loss: 0.3405740787448105
Epoch: 58, step: 1113, loss: 0.3805778920650482, mean loss: 0.3405745501210191
Epoch: 58, step: 1114, loss: 0.33712238073349, mean loss: 0.34057450944361345
Epoch: 58, step: 1115, loss: 0.3232137858867645, mean loss: 0.34057430488213497
Epoch: 58, step: 1116, loss: 0.3098111152648926, mean loss: 0.34057394240361377
Epoch: 58, step: 1117, loss: 0.37131211161613464, mean loss: 0.34057430458305543
Epoch: 58, step: 1118, loss: 0.361470490694046, mean loss: 0.34057455079420074
Epoch: 58, step: 1119, loss: 0.30244746804237366, mean loss: 0.34057410156379786
Epoch: 58, step: 1120, loss: 0.3440015912055969, mean loss: 0.3405741419475435
Epoch: 58, step: 1121, loss: 0.3576352596282959, mean loss: 0.3405743429645532
Epoch: 58, step: 1122, loss: 0.32406356930732727, mean loss: 0.340574148434083
Epoch: 58, step: 1123, loss: 0.3470180332660675, mean loss: 0.34057422435524837
Epoch: 58, step: 1124, loss: 0.3169799745082855, mean loss: 0.34057394637358257
Epoch: 58, step: 1125, loss: 0.35347020626068115, mean loss: 0.34057409831236396
Epoch: 58, step: 1126, loss: 0.32657355070114136, mean loss: 0.340573933365232
Epoch: 58, step: 1127, loss: 0.33785176277160645, mean loss: 0.34057390129441917
Epoch: 58, step: 1128, loss: 0.3567814826965332, mean loss: 0.34057409223917007
Epoch: 58, step: 1129, loss: 0.3193860948085785, mean loss: 0.3405738426220848
Epoch: 58, step: 1130, loss: 0.33707383275032043, mean loss: 0.3405738013887416
Epoch: 58, step: 1131, loss: 0.293843150138855, mean loss: 0.34057325086507106
Epoch: 58, step: 1132, loss: 0.30629318952560425, mean loss: 0.34057284702385837
Epoch: 58, step: 1133, loss: 0.36514416337013245, mean loss: 0.34057313648638865
Epoch: 58, step: 1134, loss: 0.3436530530452728, mean loss: 0.34057317276893556
Epoch: 58, step: 1135, loss: 0.30959179997444153, mean loss: 0.3405728078012983
Epoch: 58, step: 1136, loss: 0.3271949589252472, mean loss: 0.340572650209044
Epoch: 58, step: 1137, loss: 0.3538195788860321, mean loss: 0.34057280625720837
Epoch: 58, step: 1138, loss: 0.2979690432548523, mean loss: 0.3405723043929
Epoch: 58, step: 1139, loss: 0.33679914474487305, mean loss: 0.3405722599463132
Epoch: 58, step: 1140, loss: 0.2990915775299072, mean loss: 0.3405717713231945
Epoch: 58, step: 1141, loss: 0.3390187621116638, mean loss: 0.3405717530296848
Epoch: 58, step: 1142, loss: 0.3509346842765808, mean loss: 0.3405718750973124
Epoch: 58, step: 1143, loss: 0.34128257632255554, mean loss: 0.340571883468746
Epoch: 58, step: 1144, loss: 0.39485853910446167, mean loss: 0.3405725229101354
Epoch: 58, step: 1145, loss: 0.3892430067062378, mean loss: 0.34057309619200066
Epoch: 58, step: 1146, loss: 0.3386050760746002, mean loss: 0.34057307301127865
Epoch: 58, step: 1147, loss: 0.3272497355937958, mean loss: 0.3405729160815093
Epoch: 58, step: 1148, loss: 0.30778223276138306, mean loss: 0.34057252985892866
Epoch: 58, step: 1149, loss: 0.36458227038383484, mean loss: 0.3405728126525086
Epoch: 58, step: 1150, loss: 0.341815710067749, mean loss: 0.3405728272915369
Epoch: 58, step: 1151, loss: 0.29738375544548035, mean loss: 0.3405723186102987
Epoch: 58, step: 1152, loss: 0.3441856801509857, mean loss: 0.34057236116799894
Epoch: 58, step: 1153, loss: 0.31050845980644226, mean loss: 0.3405720070834659
Epoch: 58, step: 1154, loss: 0.3245588541030884, mean loss: 0.34057181848708423
Epoch: 58, step: 1155, loss: 0.321236252784729, mean loss: 0.34057159076336324
Epoch: 58, step: 1156, loss: 0.3425474166870117, mean loss: 0.3405716140332866
Epoch: 58, step: 1157, loss: 0.3662493824958801, mean loss: 0.34057191644488083
Epoch: 58, step: 1158, loss: 0.3263966739177704, mean loss: 0.3405717495025232
Epoch: 58, step: 1159, loss: 0.34146589040756226, mean loss: 0.3405717600327299
Epoch: 58, step: 1160, loss: 0.31802836060523987, mean loss: 0.34057149454453106
Epoch: 58, step: 1161, loss: 0.34295666217803955, mean loss: 0.3405715226337464
Epoch: 58, step: 1162, loss: 0.3266739249229431, mean loss: 0.34057135896893204
Epoch: 58, step: 1163, loss: 0.3273555636405945, mean loss: 0.34057120333518426
Epoch: 58, step: 1164, loss: 0.3149254620075226, mean loss: 0.340570901325677
Epoch: 58, step: 1165, loss: 0.32440218329429626, mean loss: 0.34057071092178115
Epoch: 58, step: 1166, loss: 0.32238471508026123, mean loss: 0.3405704967648099
Epoch: 58, step: 1167, loss: 0.34080418944358826, mean loss: 0.3405704995167256
Epoch: 58, step: 1168, loss: 0.3311998248100281, mean loss: 0.34057038917093707
Epoch: 58, step: 1169, loss: 0.31234538555145264, mean loss: 0.34057005680707825
Epoch: 58, step: 1170, loss: 0.3482131063938141, mean loss: 0.3405701468068379
Epoch: 58, step: 1171, loss: 0.34354040026664734, mean loss: 0.3405701817822684
Epoch: 58, step: 1172, loss: 0.3369177579879761, mean loss: 0.3405701387746288
Epoch: 58, step: 1173, loss: 0.29304879903793335, mean loss: 0.34056957921289577
Epoch: 58, step: 1174, loss: 0.3352739214897156, mean loss: 0.34056951685748793
Epoch: 58, step: 1175, loss: 0.3373035490512848, mean loss: 0.340569478401763
Epoch: 58, step: 1176, loss: 0.3615923225879669, mean loss: 0.3405697259361056
Epoch: 58, step: 1177, loss: 0.2879951596260071, mean loss: 0.3405691069020033
Epoch: 58, step: 1178, loss: 0.32630518078804016, mean loss: 0.34056893895477425
Epoch: 58, step: 1179, loss: 0.3084730803966522, mean loss: 0.34056856105411776
Epoch: 58, step: 1180, loss: 0.3149453401565552, mean loss: 0.3405682593666594
Epoch: 58, step: 1181, loss: 0.3250506520271301, mean loss: 0.3405680766647104
Epoch: 58, step: 1182, loss: 0.3547723889350891, mean loss: 0.34056824390215396
Epoch: 58, step: 1183, loss: 0.3500297963619232, mean loss: 0.3405683552984107
Epoch: 58, step: 1184, loss: 0.3206198513507843, mean loss: 0.3405681204360545
Epoch: 58, step: 1185, loss: 0.30390018224716187, mean loss: 0.3405676887336576
Epoch: 58, step: 1186, loss: 0.3070099949836731, mean loss: 0.3405672936537326
Epoch: 58, step: 1187, loss: 0.3195130527019501, mean loss: 0.34056704578181185
Epoch: 58, step: 1188, loss: 0.2943226993083954, mean loss: 0.34056650135277905
Epoch: 58, step: 1189, loss: 0.34196165204048157, mean loss: 0.340566517777524
Epoch: 58, step: 1190, loss: 0.35270506143569946, mean loss: 0.34056666067974856
Epoch: 58, step: 1191, loss: 0.36684972047805786, mean loss: 0.3405669700960675
Epoch: 58, step: 1192, loss: 0.33428922295570374, mean loss: 0.34056689619239877
Epoch: 58, step: 1193, loss: 0.35531193017959595, mean loss: 0.340567069773662
Epoch: 58, step: 1194, loss: 0.32938218116760254, mean loss: 0.34056693810463773
Epoch: 58, step: 1195, loss: 0.33177655935287476, mean loss: 0.340566834625112
Epoch: 58, step: 1196, loss: 0.35399308800697327, mean loss: 0.3405669926758646
Epoch: 58, step: 1197, loss: 0.3552916646003723, mean loss: 0.34056716600925985
Epoch: 58, step: 1198, loss: 0.2998410165309906, mean loss: 0.3405666866017252
Epoch: 58, step: 1199, loss: 0.35057276487350464, mean loss: 0.34056680438680703
Epoch: 58, step: 1200, loss: 0.3241773843765259, mean loss: 0.34056661146342576
Epoch: 58, step: 1201, loss: 0.3098679482936859, mean loss: 0.34056625010712505
Epoch: 58, step: 1202, loss: 0.38960421085357666, mean loss: 0.34056682732989885
Epoch: 58, step: 1203, loss: 0.3217073380947113, mean loss: 0.3405666053386418
Epoch: 58, step: 1204, loss: 0.36047080159187317, mean loss: 0.34056683962417744
Epoch: 58, step: 1205, loss: 0.33479705452919006, mean loss: 0.3405667717107956
Epoch: 58, step: 1206, loss: 0.31011319160461426, mean loss: 0.340566413260483
Epoch: 58, step: 1207, loss: 0.31718170642852783, mean loss: 0.3405661380167585
Epoch: 58, step: 1208, loss: 0.33638548851013184, mean loss: 0.34056608881006945
Epoch: 58, step: 1209, loss: 0.35804468393325806, mean loss: 0.34056629453257037
Epoch: 58, step: 1210, loss: 0.3110198974609375, mean loss: 0.3405659467765228
Epoch: 58, step: 1211, loss: 0.32023680210113525, mean loss: 0.3405657075087779
Epoch: 58, step: 1212, loss: 0.3130156695842743, mean loss: 0.3405653832571693
Epoch: 58, step: 1213, loss: 0.3260290026664734, mean loss: 0.3405652121724932
Epoch: 58, step: 1214, loss: 0.31438952684402466, mean loss: 0.3405649041036508
Epoch: 58, step: 1215, loss: 0.31730881333351135, mean loss: 0.3405646303995414
Epoch: 58, step: 1216, loss: 0.3018299639225006, mean loss: 0.340564174531325
Epoch: 58, step: 1217, loss: 0.3153373897075653, mean loss: 0.3405638776408363
Epoch: 58, step: 1218, loss: 0.3153300881385803, mean loss: 0.3405635806714055
Epoch: 58, step: 1219, loss: 0.34430545568466187, mean loss: 0.34056362470797064
Epoch: 58, step: 1220, loss: 0.3390756845474243, mean loss: 0.34056360719723006
Epoch: 58, step: 1221, loss: 0.3263956308364868, mean loss: 0.34056344046415454
Epoch: 58, step: 1222, loss: 0.29969993233680725, mean loss: 0.34056295957556226
Epoch: 58, step: 1223, loss: 0.3352561295032501, mean loss: 0.3405628971246341
Epoch: 58, step: 1224, loss: 0.3227775990962982, mean loss: 0.3405626878292009
Epoch: 58, step: 1225, loss: 0.31751906871795654, mean loss: 0.340562416657614
Epoch: 58, step: 1226, loss: 0.31463074684143066, mean loss: 0.3405621115037546
Epoch: 58, step: 1227, loss: 0.32281923294067383, mean loss: 0.34056190271488
Epoch: 58, step: 1228, loss: 0.33540764451026917, mean loss: 0.3405618420629907
Epoch: 58, step: 1229, loss: 0.3095298111438751, mean loss: 0.340561476902946
Epoch: 58, step: 1230, loss: 0.3881383240222931, mean loss: 0.3405620367425271
Epoch: 58, step: 1231, loss: 0.3292039930820465, mean loss: 0.34056190309332657
Epoch: 58, step: 1232, loss: 0.322645902633667, mean loss: 0.34056169227964816
Epoch: 58, step: 1233, loss: 0.33031752705574036, mean loss: 0.34056157174020374
Epoch: 58, step: 1234, loss: 0.34265175461769104, mean loss: 0.340561596334352
Epoch: 58, step: 1235, loss: 0.351532518863678, mean loss: 0.340561725422253
Epoch: 58, step: 1236, loss: 0.33495447039604187, mean loss: 0.3405616594460087
Epoch: 58, step: 1237, loss: 0.3304491937160492, mean loss: 0.3405615404618255
Epoch: 58, step: 1238, loss: 0.2967287302017212, mean loss: 0.3405610247270976
Epoch: 58, step: 1239, loss: 0.3142583966255188, mean loss: 0.3405607152552873
Epoch: 58, step: 1240, loss: 0.3331432044506073, mean loss: 0.3405606279832672
Epoch: 58, step: 1241, loss: 0.3155750036239624, mean loss: 0.34056033401399455
Epoch: 58, step: 1242, loss: 0.3034089505672455, mean loss: 0.34055989691318334
Epoch: 58, step: 1243, loss: 0.32095077633857727, mean loss: 0.3405596662067904
Epoch: 58, step: 1244, loss: 0.2995131015777588, mean loss: 0.3405591832889859
Epoch: 58, step: 1245, loss: 0.34211868047714233, mean loss: 0.3405592016364433
Epoch: 58, step: 1246, loss: 0.3405321538448334, mean loss: 0.34055920131823025
Epoch: 58, step: 1247, loss: 0.2816023826599121, mean loss: 0.34055850770859897
Epoch: 58, step: 1248, loss: 0.3335270583629608, mean loss: 0.3405584249866387
Epoch: 58, step: 1249, loss: 0.32773658633232117, mean loss: 0.34055827414502726
Epoch: 58, step: 1250, loss: 0.3270123600959778, mean loss: 0.34055811478695697
Epoch: 58, step: 1251, loss: 0.3044317960739136, mean loss: 0.34055768979144246
Epoch: 58, step: 1252, loss: 0.3635081350803375, mean loss: 0.34055795978079945
Epoch: 58, step: 1253, loss: 0.3269672393798828, mean loss: 0.34055779990125684
Epoch: 58, step: 1254, loss: 0.331676721572876, mean loss: 0.3405576954265862
Epoch: 58, step: 1255, loss: 0.3251665234565735, mean loss: 0.34055751437101534
Epoch: 58, step: 1256, loss: 0.3130873441696167, mean loss: 0.34055719122675765
Epoch: 58, step: 1257, loss: 0.3216988742351532, mean loss: 0.3405569693903032
Epoch: 58, step: 1258, loss: 0.3533962368965149, mean loss: 0.34055712042096403
Epoch: 58, step: 1259, loss: 0.3053620159626007, mean loss: 0.34055670641935887
Epoch: 58, step: 1260, loss: 0.335339218378067, mean loss: 0.34055664504653305
Epoch: 58, step: 1261, loss: 0.31371861696243286, mean loss: 0.34055632935702207
Epoch: 58, step: 1262, loss: 0.3381415605545044, mean loss: 0.34055630095298983
Epoch: 58, step: 1263, loss: 0.33228880167007446, mean loss: 0.3405562037065976
Epoch: 58, step: 1264, loss: 0.3488278388977051, mean loss: 0.340556301000494
Epoch: 58, step: 1265, loss: 0.34281012415885925, mean loss: 0.3405563275104467
Epoch: 58, step: 1266, loss: 0.39709314703941345, mean loss: 0.340556992500855
Epoch: 58, step: 1267, loss: 0.33909356594085693, mean loss: 0.340556975288122
Epoch: 58, step: 1268, loss: 0.31919580698013306, mean loss: 0.34055672404233206
Epoch: 58, step: 1269, loss: 0.3279154896736145, mean loss: 0.3405565753604101
Epoch: 58, step: 1270, loss: 0.3108465373516083, mean loss: 0.34055622592510426
Epoch: 58, step: 1271, loss: 0.32310545444488525, mean loss: 0.34055602067986196
Epoch: 58, step: 1272, loss: 0.3288082778453827, mean loss: 0.3405558825117604
Epoch: 58, step: 1273, loss: 0.34154239296913147, mean loss: 0.3405558941142168
Epoch: 58, step: 1274, loss: 0.3511069118976593, mean loss: 0.3405560182044209
Epoch: 58, step: 1275, loss: 0.31038570404052734, mean loss: 0.3405556633764329
Epoch: 58, step: 1276, loss: 0.31837543845176697, mean loss: 0.34055540252160776
Epoch: 58, step: 1277, loss: 0.32727569341659546, mean loss: 0.3405552463448571
Epoch: 58, step: 1278, loss: 0.339144766330719, mean loss: 0.3405552297570243
Epoch: 58, step: 1279, loss: 0.3050955533981323, mean loss: 0.3405548127413554
Epoch: 58, step: 1280, loss: 0.33847981691360474, mean loss: 0.3405547883391136
Epoch: 58, step: 1281, loss: 0.3347596526145935, mean loss: 0.3405547201883066
Epoch: 58, step: 1282, loss: 0.31489306688308716, mean loss: 0.3405544184107644
Epoch: 58, step: 1283, loss: 0.350716769695282, mean loss: 0.34055453791722384
Epoch: 58, step: 1284, loss: 0.31334424018859863, mean loss: 0.34055421793536034
Epoch: 58, step: 1285, loss: 0.3192578852176666, mean loss: 0.3405539675022279
Epoch: 58, step: 1286, loss: 0.32831504940986633, mean loss: 0.3405538235809907
Epoch: 58, step: 1287, loss: 0.28943943977355957, mean loss: 0.3405532225181519
Epoch: 58, step: 1288, loss: 0.3028481900691986, mean loss: 0.340552779143398
Epoch: 58, step: 1289, loss: 0.2974022626876831, mean loss: 0.3405522717409797
Epoch: 58, step: 1290, loss: 0.2983788549900055, mean loss: 0.34055177583400614
Epoch: 58, step: 1291, loss: 0.3322193920612335, mean loss: 0.34055167785667945
Epoch: 58, step: 1292, loss: 0.34445035457611084, mean loss: 0.34055172369919484
Epoch: 58, step: 1293, loss: 0.31947100162506104, mean loss: 0.34055147582484363
Epoch: 58, step: 1294, loss: 0.3336545526981354, mean loss: 0.34055139472941254
Epoch: 58, step: 1295, loss: 0.3123722970485687, mean loss: 0.34055106339772123
Epoch: 58, step: 1296, loss: 0.2978496551513672, mean loss: 0.3405505613176468
Epoch: 58, step: 1297, loss: 0.2887747287750244, mean loss: 0.3405499525483048
Epoch: 58, step: 1298, loss: 0.335290789604187, mean loss: 0.3405498907129008
Epoch: 58, step: 1299, loss: 0.3325347900390625, mean loss: 0.34054979647525
Epoch: 58, step: 1300, loss: 0.32906749844551086, mean loss: 0.34054966147356835
Epoch: 58, step: 1301, loss: 0.3043574392795563, mean loss: 0.3405492359530497
Epoch: 58, step: 1302, loss: 0.3384271562099457, mean loss: 0.34054921100354946
Epoch: 58, step: 1303, loss: 0.3364811837673187, mean loss: 0.3405491631759155
Epoch: 58, step: 1304, loss: 0.3173735439777374, mean loss: 0.34054889070428823
Epoch: 58, step: 1305, loss: 0.2981295585632324, mean loss: 0.3405483919936186
Epoch: 58, step: 1306, loss: 0.34520936012268066, mean loss: 0.3405484467905023
Epoch: 58, step: 1307, loss: 0.3394037187099457, mean loss: 0.3405484333326128
Epoch: 58, step: 1308, loss: 0.33332550525665283, mean loss: 0.34054834841792714
Epoch: 58, step: 1309, loss: 0.3013797402381897, mean loss: 0.34054788794664526
Epoch: 58, step: 1310, loss: 0.3270184099674225, mean loss: 0.34054772889420204
Epoch: 58, step: 1311, loss: 0.2915022373199463, mean loss: 0.34054715232254335
Epoch: 58, step: 1312, loss: 0.3394063115119934, mean loss: 0.3405471389111425
Epoch: 58, step: 1313, loss: 0.32239994406700134, mean loss: 0.34054692558037764
Epoch: 58, step: 1314, loss: 0.321707159280777, mean loss: 0.3405467041106385
Epoch: 58, step: 1315, loss: 0.3697487413883209, mean loss: 0.34054704738939523
Epoch: 58, step: 1316, loss: 0.3434365391731262, mean loss: 0.34054708135584344
Epoch: 58, step: 1317, loss: 0.3513687252998352, mean loss: 0.3405472085645415
Epoch: 58, step: 1318, loss: 0.3469705283641815, mean loss: 0.3405472840699405
Epoch: 58, step: 1319, loss: 0.33223599195480347, mean loss: 0.3405471863727885
Epoch: 58, step: 1320, loss: 0.3481924831867218, mean loss: 0.3405472762402766
Epoch: 58, step: 1321, loss: 0.37679949402809143, mean loss: 0.3405477023659764
Epoch: 58, step: 1322, loss: 0.31990790367126465, mean loss: 0.3405474597588804
Epoch: 58, step: 1323, loss: 0.300836980342865, mean loss: 0.34054699299411223
Epoch: 58, step: 1324, loss: 0.355133593082428, mean loss: 0.340547164445857
Epoch: 58, step: 1325, loss: 0.32655012607574463, mean loss: 0.3405469999257887
Epoch: 58, step: 1326, loss: 0.3279770612716675, mean loss: 0.3405468521814728
Epoch: 58, step: 1327, loss: 0.34359002113342285, mean loss: 0.34054688794979615
Epoch: 58, step: 1328, loss: 0.340279221534729, mean loss: 0.3405468848037775
Epoch: 58, step: 1329, loss: 0.3082799017429352, mean loss: 0.34054650555807264
Epoch: 58, step: 1330, loss: 0.32002967596054077, mean loss: 0.34054626441907193
Epoch: 58, step: 1331, loss: 0.305685430765152, mean loss: 0.3405458546965195
Epoch: 58, step: 1332, loss: 0.3186562955379486, mean loss: 0.34054559742956103
Epoch: 58, step: 1333, loss: 0.3441157937049866, mean loss: 0.3405456393894167
Epoch: 58, step: 1334, loss: 0.29869553446769714, mean loss: 0.3405451475386648
Epoch: 58, step: 1335, loss: 0.3542018532752991, mean loss: 0.34054530803962546
Epoch: 58, step: 1336, loss: 0.32700055837631226, mean loss: 0.3405451488563037
Epoch: 58, step: 1337, loss: 0.36070188879966736, mean loss: 0.3405453857435988
Epoch: 58, step: 1338, loss: 0.3254859447479248, mean loss: 0.3405452087631779
Epoch: 58, step: 1339, loss: 0.34905439615249634, mean loss: 0.3405453087630297
Epoch: 58, step: 1340, loss: 0.32001885771751404, mean loss: 0.3405450675392975
Epoch: 58, step: 1341, loss: 0.30381104350090027, mean loss: 0.34054463585170447
Epoch: 58, step: 1342, loss: 0.2988322973251343, mean loss: 0.3405441456661645
Epoch: 58, step: 1343, loss: 0.34917864203453064, mean loss: 0.3405442471338759
Epoch: 58, step: 1344, loss: 0.3691288232803345, mean loss: 0.3405445830396792
Epoch: 58, step: 1345, loss: 0.3565817177295685, mean loss: 0.3405447714945746
Epoch: 58, step: 1346, loss: 0.35232746601104736, mean loss: 0.3405449099532465
Epoch: 58, step: 1347, loss: 0.33044546842575073, mean loss: 0.34054479127590775
Epoch: 58, step: 1348, loss: 0.32413995265960693, mean loss: 0.34054459850686136
Epoch: 58, step: 1349, loss: 0.34753793478012085, mean loss: 0.34054468068279464
Epoch: 58, step: 1350, loss: 0.3230850398540497, mean loss: 0.34054447552385986
Epoch: 58, step: 1351, loss: 0.33465418219566345, mean loss: 0.34054440631097527
Epoch: 58, step: 1352, loss: 0.32265278697013855, mean loss: 0.34054419608103176
Epoch: 58, step: 1353, loss: 0.34746965765953064, mean loss: 0.3405442774555715
Epoch: 58, step: 1354, loss: 0.3247913718223572, mean loss: 0.3405440923602722
Epoch: 58, step: 1355, loss: 0.3323290944099426, mean loss: 0.34054399583588024
Epoch: 58, step: 1356, loss: 0.33740657567977905, mean loss: 0.340543958972327
Epoch: 58, step: 1357, loss: 0.31015023589134216, mean loss: 0.340543601861258
Epoch: 58, step: 1358, loss: 0.3421223759651184, mean loss: 0.3405436204108474
Epoch: 58, step: 1359, loss: 0.3582964241504669, mean loss: 0.34054382899252494
Epoch: 58, step: 1360, loss: 0.3680279552936554, mean loss: 0.3405441519059025
Epoch: 58, step: 1361, loss: 0.3018127977848053, mean loss: 0.3405436968532188
Epoch: 58, step: 1362, loss: 0.3704335689544678, mean loss: 0.34054404802365995
Epoch: 58, step: 1363, loss: 0.3340393900871277, mean loss: 0.3405439716025648
Epoch: 58, step: 1364, loss: 0.33047428727149963, mean loss: 0.3405438532985323
Epoch: 58, step: 1365, loss: 0.3481520116329193, mean loss: 0.3405439426821919
Epoch: 58, step: 1366, loss: 0.3661250174045563, mean loss: 0.3405442432152659
Epoch: 58, step: 1367, loss: 0.3080158531665802, mean loss: 0.3405438610678264
Epoch: 58, step: 1368, loss: 0.3334060311317444, mean loss: 0.3405437772127268
Epoch: 58, step: 1369, loss: 0.29158881306648254, mean loss: 0.3405432020974317
Epoch: 58, step: 1370, loss: 0.331977903842926, mean loss: 0.3405431014748238
Epoch: 58, step: 1371, loss: 0.3546779155731201, mean loss: 0.3405432675245172
Epoch: 58, step: 1372, loss: 0.35628101229667664, mean loss: 0.34054345240257616
Epoch: 58, step: 1373, loss: 0.34279710054397583, mean loss: 0.3405434788768395
Epoch: 58, step: 1374, loss: 0.3053866922855377, mean loss: 0.3405430658846444
Epoch: 58, step: 1375, loss: 0.33096909523010254, mean loss: 0.34054295341905544
Epoch: 58, step: 1376, loss: 0.38055112957954407, mean loss: 0.34054342339023047
Epoch: 58, step: 1377, loss: 0.3163186013698578, mean loss: 0.3405431388275379
Epoch: 58, step: 1378, loss: 0.2766660749912262, mean loss: 0.3405423884890732
Epoch: 58, step: 1379, loss: 0.37282857298851013, mean loss: 0.3405427677375873
Epoch: 58, step: 1380, loss: 0.35970237851142883, mean loss: 0.3405429927926279
Epoch: 58, step: 1381, loss: 0.3134894073009491, mean loss: 0.34054267501611685
Epoch: 58, step: 1382, loss: 0.32569292187690735, mean loss: 0.34054250059016816
Epoch: 58, step: 1383, loss: 0.3238048255443573, mean loss: 0.3405423039909029
Epoch: 58, step: 1384, loss: 0.3245851695537567, mean loss: 0.34054211656200084
Epoch: 58, step: 1385, loss: 0.3210287392139435, mean loss: 0.3405418873649637
Epoch: 58, step: 1386, loss: 0.35400110483169556, mean loss: 0.3405420454501828
Epoch: 58, step: 1387, loss: 0.34685277938842773, mean loss: 0.34054211957202846
Epoch: 58, step: 1388, loss: 0.3029405176639557, mean loss: 0.3405416779328428
Epoch: 58, step: 1389, loss: 0.31705257296562195, mean loss: 0.34054140205131583
Epoch: 58, step: 1390, loss: 0.3181588053703308, mean loss: 0.34054113916891
Epoch: 58, step: 1391, loss: 0.33051061630249023, mean loss: 0.3405410213623368
Epoch: 58, step: 1392, loss: 0.33892887830734253, mean loss: 0.34054100242824725
Epoch: 58, step: 1393, loss: 0.4025036692619324, mean loss: 0.34054173015082767
Epoch: 58, step: 1394, loss: 0.3311113715171814, mean loss: 0.34054161939697103
Epoch: 58, step: 1395, loss: 0.34475308656692505, mean loss: 0.34054166885752407
Epoch: 58, step: 1396, loss: 0.34128719568252563, mean loss: 0.3405416776130799
Epoch: 58, step: 1397, loss: 0.35124096274375916, mean loss: 0.34054180326528344
Epoch: 58, step: 1398, loss: 0.29244014620780945, mean loss: 0.340541238366961
Epoch: 58, step: 1399, loss: 0.2967303395271301, mean loss: 0.3405407238646728
Epoch: 58, step: 1400, loss: 0.3667159676551819, mean loss: 0.3405410312554141
Epoch: 58, step: 1401, loss: 0.3241647183895111, mean loss: 0.34054083894133763
Epoch: 58, step: 1402, loss: 0.3238513171672821, mean loss: 0.340540642951416
Epoch: 58, step: 1403, loss: 0.34722983837127686, mean loss: 0.3405407215036662
Epoch: 58, step: 1404, loss: 0.34619036316871643, mean loss: 0.3405407878474978
Epoch: 58, step: 1405, loss: 0.32071658968925476, mean loss: 0.3405405550543585
Epoch: 58, step: 1406, loss: 0.3139568269252777, mean loss: 0.3405402428885495
Epoch: 58, step: 1407, loss: 0.3298564851284027, mean loss: 0.34054011743343254
Epoch: 58, step: 1408, loss: 0.3728711009025574, mean loss: 0.34054049707885087
Epoch: 58, step: 1409, loss: 0.3110627830028534, mean loss: 0.340540150941911
Epoch: 58, step: 1410, loss: 0.3262368142604828, mean loss: 0.34053998298943533
Epoch: 58, step: 1411, loss: 0.32839643955230713, mean loss: 0.34053984039933344
Epoch: 58, step: 1412, loss: 0.3178878426551819, mean loss: 0.34053957442155214
Epoch: 58, step: 1413, loss: 0.3409697115421295, mean loss: 0.3405395794721254
Epoch: 58, step: 1414, loss: 0.328414648771286, mean loss: 0.3405394371055902
Epoch: 58, step: 1415, loss: 0.31391191482543945, mean loss: 0.3405391244585599
Epoch: 58, step: 1416, loss: 0.32873818278312683, mean loss: 0.3405389858994401
Epoch: 58, step: 1417, loss: 0.31888827681541443, mean loss: 0.3405387316936272
Epoch: 58, step: 1418, loss: 0.3560216724872589, mean loss: 0.3405389134801601
Epoch: 58, step: 1419, loss: 0.31926649808883667, mean loss: 0.3405386637218429
Epoch: 58, step: 1420, loss: 0.3047870397567749, mean loss: 0.340538243968823
Epoch: 58, step: 1421, loss: 0.3576669692993164, mean loss: 0.3405384450715695
Epoch: 58, step: 1422, loss: 0.4177872836589813, mean loss: 0.3405393520142004
Epoch: 58, step: 1423, loss: 0.32887187600135803, mean loss: 0.3405392150334075
Epoch: 58, step: 1424, loss: 0.33661121129989624, mean loss: 0.3405391689176282
Epoch: 58, step: 1425, loss: 0.31663021445274353, mean loss: 0.3405388882236172
Epoch: 58, step: 1426, loss: 0.3160228133201599, mean loss: 0.3405386004053181
Epoch: 58, step: 1427, loss: 0.36014100909233093, mean loss: 0.34053883053455836
Epoch: 58, step: 1428, loss: 0.3235081136226654, mean loss: 0.3405386305989282
Epoch: 58, step: 1429, loss: 0.3649369478225708, mean loss: 0.3405389170246663
Epoch: 58, step: 1430, loss: 0.34155037999153137, mean loss: 0.3405389288986666
Epoch: 58, step: 1431, loss: 0.35319650173187256, mean loss: 0.3405390774896324
Epoch: 58, step: 1432, loss: 0.3370378017425537, mean loss: 0.3405390363876104
Epoch: 58, step: 1433, loss: 0.34782668948173523, mean loss: 0.34053912193750235
Epoch: 58, step: 1434, loss: 0.29909780621528625, mean loss: 0.34053863546285573
Epoch: 58, step: 1435, loss: 0.3680388331413269, mean loss: 0.3405389582805962
Epoch: 58, step: 1436, loss: 0.36025863885879517, mean loss: 0.3405391897621323
Epoch: 58, step: 1437, loss: 0.3435640335083008, mean loss: 0.3405392252691607
Epoch: 58, step: 1438, loss: 0.3208012878894806, mean loss: 0.34053899357875467
Epoch: 58, step: 1439, loss: 0.29272595047950745, mean loss: 0.34053843234010434
Epoch: 58, step: 1440, loss: 0.3115590214729309, mean loss: 0.3405380921782264
Epoch: 58, step: 1441, loss: 0.3432462215423584, mean loss: 0.3405381239660209
Epoch: 58, step: 1442, loss: 0.3478184640407562, mean loss: 0.34053820942103674
Epoch: 58, step: 1443, loss: 0.3162654936313629, mean loss: 0.34053792451663056
Valid: 58, mean loss: 0.18601726492245993
Epoch: 59, step: 0, loss: 0.31739744544029236, mean loss: 0.34053765290519966
Epoch: 59, step: 1, loss: 0.3036474585533142, mean loss: 0.3405372199115337
Epoch: 59, step: 2, loss: 0.35179340839385986, mean loss: 0.34053735202797264
Epoch: 59, step: 3, loss: 0.3366830348968506, mean loss: 0.34053730678950866
Epoch: 59, step: 4, loss: 0.3547954261302948, mean loss: 0.34053747413636304
Epoch: 59, step: 5, loss: 0.297818660736084, mean loss: 0.3405369727536091
Epoch: 59, step: 6, loss: 0.3072182834148407, mean loss: 0.34053658170294965
Epoch: 59, step: 7, loss: 0.36086973547935486, mean loss: 0.34053682034378546
Epoch: 59, step: 8, loss: 0.3440823256969452, mean loss: 0.34053686195525606
Epoch: 59, step: 9, loss: 0.33291158080101013, mean loss: 0.3405367724629532
Epoch: 59, step: 10, loss: 0.30710282921791077, mean loss: 0.3405363800780172
Epoch: 59, step: 11, loss: 0.32649606466293335, mean loss: 0.34053621530105477
Epoch: 59, step: 12, loss: 0.29788142442703247, mean loss: 0.34053571471084865
Epoch: 59, step: 13, loss: 0.31567490100860596, mean loss: 0.34053542295150463
Epoch: 59, step: 14, loss: 0.31451573967933655, mean loss: 0.34053511759558497
Epoch: 59, step: 15, loss: 0.32675623893737793, mean loss: 0.3405349558944319
Epoch: 59, step: 16, loss: 0.3115249574184418, mean loss: 0.3405346154534373
Epoch: 59, step: 17, loss: 0.3823365867137909, mean loss: 0.3405351060062955
Epoch: 59, step: 18, loss: 0.3464255928993225, mean loss: 0.3405351751312957
Epoch: 59, step: 19, loss: 0.3238767981529236, mean loss: 0.3405349796471498
Epoch: 59, step: 20, loss: 0.3178723454475403, mean loss: 0.34053471370685384
Epoch: 59, step: 21, loss: 0.3562397062778473, mean loss: 0.34053489799881764
Epoch: 59, step: 22, loss: 0.3000904321670532, mean loss: 0.34053442340435125
Epoch: 59, step: 23, loss: 0.3080650568008423, mean loss: 0.3405340423979372
Epoch: 59, step: 24, loss: 0.35936570167541504, mean loss: 0.34053426337233644
Epoch: 59, step: 25, loss: 0.32785549759864807, mean loss: 0.3405341145989472
Epoch: 59, step: 26, loss: 0.3146362006664276, mean loss: 0.34053381071485567
Epoch: 59, step: 27, loss: 0.34056147933006287, mean loss: 0.34053381103951325
Epoch: 59, step: 28, loss: 0.3473750948905945, mean loss: 0.3405338913127177
Epoch: 59, step: 29, loss: 0.3510703444480896, mean loss: 0.3405340149422807
Epoch: 59, step: 30, loss: 0.35788020491600037, mean loss: 0.340534218471561
Epoch: 59, step: 31, loss: 0.3329136073589325, mean loss: 0.34053412905715363
Epoch: 59, step: 32, loss: 0.3514478802680969, mean loss: 0.34053425710923935
Epoch: 59, step: 33, loss: 0.3244722783565521, mean loss: 0.3405340686547192
Epoch: 59, step: 34, loss: 0.31849151849746704, mean loss: 0.3405338100334411
Epoch: 59, step: 35, loss: 0.33242613077163696, mean loss: 0.340533714908614
Epoch: 59, step: 36, loss: 0.35662683844566345, mean loss: 0.34053390372190856
Epoch: 59, step: 37, loss: 0.3329259753227234, mean loss: 0.34053381446259423
Epoch: 59, step: 38, loss: 0.3296663165092468, mean loss: 0.3405336869621783
Epoch: 59, step: 39, loss: 0.34568023681640625, mean loss: 0.34053374734218034
Epoch: 59, step: 40, loss: 0.30110403895378113, mean loss: 0.34053328475306543
Epoch: 59, step: 41, loss: 0.3086996078491211, mean loss: 0.3405329112849303
Epoch: 59, step: 42, loss: 0.3510022759437561, mean loss: 0.3405330341085751
Epoch: 59, step: 43, loss: 0.2895393967628479, mean loss: 0.3405324358725668
Epoch: 59, step: 44, loss: 0.3818756937980652, mean loss: 0.3405329208886732
Epoch: 59, step: 45, loss: 0.3182799518108368, mean loss: 0.3405326598322799
Epoch: 59, step: 46, loss: 0.3243691325187683, mean loss: 0.34053247021521676
Epoch: 59, step: 47, loss: 0.2844803035259247, mean loss: 0.340531812665516
Epoch: 59, step: 48, loss: 0.310713529586792, mean loss: 0.34053146287041863
Epoch: 59, step: 49, loss: 0.31747788190841675, mean loss: 0.3405311924344925
Epoch: 59, step: 50, loss: 0.3216954171657562, mean loss: 0.34053097147920647
Epoch: 59, step: 51, loss: 0.35654908418655396, mean loss: 0.3405311593793649
Epoch: 59, step: 52, loss: 0.3676334321498871, mean loss: 0.3405314772983173
Epoch: 59, step: 53, loss: 0.37202081084251404, mean loss: 0.34053184667466385
Epoch: 59, step: 54, loss: 0.3124581575393677, mean loss: 0.3405315173683902
Epoch: 59, step: 55, loss: 0.3066437542438507, mean loss: 0.3405311198672979
Epoch: 59, step: 56, loss: 0.3328409194946289, mean loss: 0.34053102966284327
Epoch: 59, step: 57, loss: 0.3248569667339325, mean loss: 0.340530845811494
Epoch: 59, step: 58, loss: 0.30379754304885864, mean loss: 0.3405304149475826
Epoch: 59, step: 59, loss: 0.33306458592414856, mean loss: 0.34053032737803884
Epoch: 59, step: 60, loss: 0.3143048882484436, mean loss: 0.34053001977351216
Epoch: 59, step: 61, loss: 0.3455568850040436, mean loss: 0.34053007873414026
Epoch: 59, step: 62, loss: 0.3338606357574463, mean loss: 0.3405300005084635
Epoch: 59, step: 63, loss: 0.34046387672424316, mean loss: 0.34052999973290893
Epoch: 59, step: 64, loss: 0.30002596974372864, mean loss: 0.3405295246736205
Epoch: 59, step: 65, loss: 0.35707202553749084, mean loss: 0.3405297186932408
Epoch: 59, step: 66, loss: 0.376780241727829, mean loss: 0.34053014385448344
Epoch: 59, step: 67, loss: 0.3417730927467346, mean loss: 0.34053015843213513
Epoch: 59, step: 68, loss: 0.3256058990955353, mean loss: 0.3405299833983072
Epoch: 59, step: 69, loss: 0.33524060249328613, mean loss: 0.3405299213644261
Epoch: 59, step: 70, loss: 0.3225049376487732, mean loss: 0.3405297099698219
Epoch: 59, step: 71, loss: 0.36628878116607666, mean loss: 0.34053001206522926
Epoch: 59, step: 72, loss: 0.3610363006591797, mean loss: 0.3405302525546052
Epoch: 59, step: 73, loss: 0.3317878842353821, mean loss: 0.34053015002888315
Epoch: 59, step: 74, loss: 0.35707971453666687, mean loss: 0.340530344110863
Epoch: 59, step: 75, loss: 0.3099798858165741, mean loss: 0.34052998584017286
Epoch: 59, step: 76, loss: 0.3000216782093048, mean loss: 0.3405295107975728
Epoch: 59, step: 77, loss: 0.338811993598938, mean loss: 0.34052949065641375
Epoch: 59, step: 78, loss: 0.31295010447502136, mean loss: 0.3405291672393961
Epoch: 59, step: 79, loss: 0.32230061292648315, mean loss: 0.3405289534799056
Epoch: 59, step: 80, loss: 0.3597143888473511, mean loss: 0.34052917845774683
Epoch: 59, step: 81, loss: 0.3520597815513611, mean loss: 0.3405293136696783
Epoch: 59, step: 82, loss: 0.3152655065059662, mean loss: 0.34052901742081093
Epoch: 59, step: 83, loss: 0.33601853251457214, mean loss: 0.3405289645305095
Epoch: 59, step: 84, loss: 0.3082120716571808, mean loss: 0.3405285855845207
Epoch: 59, step: 85, loss: 0.3492278754711151, mean loss: 0.34052868759068716
Epoch: 59, step: 86, loss: 0.3485422134399414, mean loss: 0.34052878155461724
Epoch: 59, step: 87, loss: 0.3640036880970001, mean loss: 0.3405290568103105
Epoch: 59, step: 88, loss: 0.2897402346134186, mean loss: 0.3405284612914948
Epoch: 59, step: 89, loss: 0.33681994676589966, mean loss: 0.3405284178082206
Epoch: 59, step: 90, loss: 0.32290565967559814, mean loss: 0.3405282111793307
Epoch: 59, step: 91, loss: 0.3513853847980499, mean loss: 0.34052833847946223
Epoch: 59, step: 92, loss: 0.34897172451019287, mean loss: 0.3405284374768245
Epoch: 59, step: 93, loss: 0.3368176221847534, mean loss: 0.3405283939686138
Epoch: 59, step: 94, loss: 0.3343124985694885, mean loss: 0.3405283210899349
Epoch: 59, step: 95, loss: 0.30358660221099854, mean loss: 0.34052788796937405
Epoch: 59, step: 96, loss: 0.3144117295742035, mean loss: 0.34052758177591863
Epoch: 59, step: 97, loss: 0.3807178735733032, mean loss: 0.3405280529730931
Epoch: 59, step: 98, loss: 0.33332309126853943, mean loss: 0.3405279685020021
Epoch: 59, step: 99, loss: 0.35216885805130005, mean loss: 0.3405281049783849
Epoch: 59, step: 100, loss: 0.293708860874176, mean loss: 0.34052755608165813
Epoch: 59, step: 101, loss: 0.35329127311706543, mean loss: 0.3405277057184261
Epoch: 59, step: 102, loss: 0.4070667624473572, mean loss: 0.3405284857868528
Epoch: 59, step: 103, loss: 0.36563077569007874, mean loss: 0.3405287800692667
Epoch: 59, step: 104, loss: 0.30800098180770874, mean loss: 0.34052839873964263
Epoch: 59, step: 105, loss: 0.3486841917037964, mean loss: 0.3405284943504485
Epoch: 59, step: 106, loss: 0.3386557996273041, mean loss: 0.34052847239700346
Epoch: 59, step: 107, loss: 0.35243475437164307, mean loss: 0.3405286119717242
Epoch: 59, step: 108, loss: 0.31584370136260986, mean loss: 0.3405283225993473
Epoch: 59, step: 109, loss: 0.3250463306903839, mean loss: 0.34052814111162183
Epoch: 59, step: 110, loss: 0.33918774127960205, mean loss: 0.3405281253989625
Epoch: 59, step: 111, loss: 0.345431923866272, mean loss: 0.34052818288241615
Epoch: 59, step: 112, loss: 0.344668984413147, mean loss: 0.34052823142127525
Epoch: 59, step: 113, loss: 0.32537564635276794, mean loss: 0.3405280538033516
Epoch: 59, step: 114, loss: 0.3793424665927887, mean loss: 0.34052850877882707
Epoch: 59, step: 115, loss: 0.319638192653656, mean loss: 0.3405282639092176
Epoch: 59, step: 116, loss: 0.31967073678970337, mean loss: 0.3405280194268161
Epoch: 59, step: 117, loss: 0.3291049897670746, mean loss: 0.3405278855328519
Epoch: 59, step: 118, loss: 0.34071817994117737, mean loss: 0.3405278877633437
Epoch: 59, step: 119, loss: 0.3625698983669281, mean loss: 0.34052814612063426
Epoch: 59, step: 120, loss: 0.320891410112381, mean loss: 0.34052791595857973
Epoch: 59, step: 121, loss: 0.2819306552410126, mean loss: 0.3405272291485195
Epoch: 59, step: 122, loss: 0.30138513445854187, mean loss: 0.34052677037503776
Epoch: 59, step: 123, loss: 0.3169156312942505, mean loss: 0.3405264936387616
Epoch: 59, step: 124, loss: 0.3278105556964874, mean loss: 0.3405263446023234
Epoch: 59, step: 125, loss: 0.3140450119972229, mean loss: 0.340526034232986
Epoch: 59, step: 126, loss: 0.3123011589050293, mean loss: 0.3405257034326704
Epoch: 59, step: 127, loss: 0.3050733506679535, mean loss: 0.34052528792996584
Epoch: 59, step: 128, loss: 0.32423079013824463, mean loss: 0.34052509696017047
Epoch: 59, step: 129, loss: 0.30630937218666077, mean loss: 0.34052469596018486
Epoch: 59, step: 130, loss: 0.3608285188674927, mean loss: 0.34052493391327016
Epoch: 59, step: 131, loss: 0.33791524171829224, mean loss: 0.34052490332902824
Epoch: 59, step: 132, loss: 0.3355603814125061, mean loss: 0.3405248451480825
Epoch: 59, step: 133, loss: 0.31638655066490173, mean loss: 0.340524562266394
Epoch: 59, step: 134, loss: 0.3293772339820862, mean loss: 0.34052443163006857
Epoch: 59, step: 135, loss: 0.3354514241218567, mean loss: 0.34052437217983295
Epoch: 59, step: 136, loss: 0.31995242834091187, mean loss: 0.3405241311014244
Epoch: 59, step: 137, loss: 0.34130287170410156, mean loss: 0.3405241402272195
Epoch: 59, step: 138, loss: 0.31984296441078186, mean loss: 0.34052389787442383
Epoch: 59, step: 139, loss: 0.342678964138031, mean loss: 0.3405239231283174
Epoch: 59, step: 140, loss: 0.36393529176712036, mean loss: 0.3405241974685056
Epoch: 59, step: 141, loss: 0.2996542453765869, mean loss: 0.3405237185499454
Epoch: 59, step: 142, loss: 0.31207239627838135, mean loss: 0.34052338515815184
Epoch: 59, step: 143, loss: 0.3487887680530548, mean loss: 0.34052348201054106
Epoch: 59, step: 144, loss: 0.35380926728248596, mean loss: 0.34052363768935046
Epoch: 59, step: 145, loss: 0.3251250982284546, mean loss: 0.3405234572560414
Epoch: 59, step: 146, loss: 0.3043646216392517, mean loss: 0.34052303356768243
Epoch: 59, step: 147, loss: 0.3164517879486084, mean loss: 0.340522751518029
Epoch: 59, step: 148, loss: 0.4183692932128906, mean loss: 0.34052366365748293
Epoch: 59, step: 149, loss: 0.3597172796726227, mean loss: 0.3405238885492882
Epoch: 59, step: 150, loss: 0.3314959406852722, mean loss: 0.3405237827699654
Epoch: 59, step: 151, loss: 0.35541972517967224, mean loss: 0.34052395730179286
Epoch: 59, step: 152, loss: 0.3468053936958313, mean loss: 0.3405240308988636
Epoch: 59, step: 153, loss: 0.3783492147922516, mean loss: 0.3405244740761793
Epoch: 59, step: 154, loss: 0.3701357841491699, mean loss: 0.3405248210118927
Epoch: 59, step: 155, loss: 0.3576570153236389, mean loss: 0.3405250217358864
Epoch: 59, step: 156, loss: 0.3439854383468628, mean loss: 0.3405250622782998
Epoch: 59, step: 157, loss: 0.3935311436653137, mean loss: 0.3405256832929141
Epoch: 59, step: 158, loss: 0.32609543204307556, mean loss: 0.34052551423133304
Epoch: 59, step: 159, loss: 0.33626002073287964, mean loss: 0.34052546425835517
Epoch: 59, step: 160, loss: 0.34630095958709717, mean loss: 0.3405255319211752
Epoch: 59, step: 161, loss: 0.3323138952255249, mean loss: 0.3405254357188661
Epoch: 59, step: 162, loss: 0.30714190006256104, mean loss: 0.3405250446231919
Epoch: 59, step: 163, loss: 0.36687713861465454, mean loss: 0.34052535334031925
Epoch: 59, step: 164, loss: 0.34927672147750854, mean loss: 0.3405254558621751
Epoch: 59, step: 165, loss: 0.35042107105255127, mean loss: 0.34052557178747195
Epoch: 59, step: 166, loss: 0.3205735385417938, mean loss: 0.3405253380558406
Epoch: 59, step: 167, loss: 0.32459551095962524, mean loss: 0.34052515144524254
Epoch: 59, step: 168, loss: 0.3182935118675232, mean loss: 0.34052489101486033
Epoch: 59, step: 169, loss: 0.3379969894886017, mean loss: 0.3405248614023504
Epoch: 59, step: 170, loss: 0.313810259103775, mean loss: 0.34052454846406865
Epoch: 59, step: 171, loss: 0.30611976981163025, mean loss: 0.3405241454467946
Epoch: 59, step: 172, loss: 0.3150799870491028, mean loss: 0.34052384739763863
Epoch: 59, step: 173, loss: 0.36697685718536377, mean loss: 0.3405241572607028
Epoch: 59, step: 174, loss: 0.3194579482078552, mean loss: 0.34052391049998715
Epoch: 59, step: 175, loss: 0.3237708508968353, mean loss: 0.34052371426398936
Epoch: 59, step: 176, loss: 0.3232715427875519, mean loss: 0.3405235121840405
Epoch: 59, step: 177, loss: 0.3349781334400177, mean loss: 0.34052344723008793
Epoch: 59, step: 178, loss: 0.34265565872192383, mean loss: 0.3405234722047467
Epoch: 59, step: 179, loss: 0.2813594937324524, mean loss: 0.34052277922336466
Epoch: 59, step: 180, loss: 0.3640638291835785, mean loss: 0.34052305495394736
Epoch: 59, step: 181, loss: 0.30903708934783936, mean loss: 0.3405226861708228
Epoch: 59, step: 182, loss: 0.3366912603378296, mean loss: 0.34052264129531673
Epoch: 59, step: 183, loss: 0.28480666875839233, mean loss: 0.3405219887306349
Epoch: 59, step: 184, loss: 0.29453226923942566, mean loss: 0.3405214500894912
Epoch: 59, step: 185, loss: 0.3372417986392975, mean loss: 0.34052141167798233
Epoch: 59, step: 186, loss: 0.3060959577560425, mean loss: 0.34052100848936256
Epoch: 59, step: 187, loss: 0.31429341435432434, mean loss: 0.3405207013171273
Epoch: 59, step: 188, loss: 0.33802300691604614, mean loss: 0.3405206720649823
Epoch: 59, step: 189, loss: 0.32901912927627563, mean loss: 0.3405205373644133
Epoch: 59, step: 190, loss: 0.37439557909965515, mean loss: 0.34052093408805667
Epoch: 59, step: 191, loss: 0.3355756103992462, mean loss: 0.34052087617214705
Epoch: 59, step: 192, loss: 0.3247205317020416, mean loss: 0.3405206911325697
Epoch: 59, step: 193, loss: 0.32597407698631287, mean loss: 0.34052052077756156
Epoch: 59, step: 194, loss: 0.33088406920433044, mean loss: 0.3405204079266572
Epoch: 59, step: 195, loss: 0.3291836977005005, mean loss: 0.3405202751658573
Epoch: 59, step: 196, loss: 0.3729690611362457, mean loss: 0.3405206551593693
Epoch: 59, step: 197, loss: 0.31848153471946716, mean loss: 0.3405203970719107
Epoch: 59, step: 198, loss: 0.33132392168045044, mean loss: 0.34052028937853995
Epoch: 59, step: 199, loss: 0.308363139629364, mean loss: 0.3405199128134813
Epoch: 59, step: 200, loss: 0.3073291778564453, mean loss: 0.3405195241495358
Epoch: 59, step: 201, loss: 0.3303978741168976, mean loss: 0.34051940562626787
Epoch: 59, step: 202, loss: 0.3140769302845001, mean loss: 0.34051909599178337
Epoch: 59, step: 203, loss: 0.3503688871860504, mean loss: 0.34051921132891677
Epoch: 59, step: 204, loss: 0.32349953055381775, mean loss: 0.3405190120375645
Epoch: 59, step: 205, loss: 0.35548895597457886, mean loss: 0.340519187325543
Epoch: 59, step: 206, loss: 0.3562747836112976, mean loss: 0.34051937181082204
Epoch: 59, step: 207, loss: 0.3180811107158661, mean loss: 0.34051910908002375
Epoch: 59, step: 208, loss: 0.31463971734046936, mean loss: 0.3405188060603909
Epoch: 59, step: 209, loss: 0.344530314207077, mean loss: 0.34051885303025425
Epoch: 59, step: 210, loss: 0.3351844251155853, mean loss: 0.3405187905713467
Epoch: 59, step: 211, loss: 0.31536903977394104, mean loss: 0.3405184961053623
Epoch: 59, step: 212, loss: 0.3323229253292084, mean loss: 0.3405184001486039
Epoch: 59, step: 213, loss: 0.30896198749542236, mean loss: 0.3405180306788386
Epoch: 59, step: 214, loss: 0.3433065116405487, mean loss: 0.3405180633266353
Epoch: 59, step: 215, loss: 0.3052560091018677, mean loss: 0.34051765048003035
Epoch: 59, step: 216, loss: 0.3144768178462982, mean loss: 0.34051734559865826
Epoch: 59, step: 217, loss: 0.34784165024757385, mean loss: 0.34051743134929224
Epoch: 59, step: 218, loss: 0.30692821741104126, mean loss: 0.3405170381020413
Epoch: 59, step: 219, loss: 0.31952688097953796, mean loss: 0.3405167923616985
Epoch: 59, step: 220, loss: 0.30610567331314087, mean loss: 0.3405163895013891
Epoch: 59, step: 221, loss: 0.3247385323047638, mean loss: 0.3405162047878955
Epoch: 59, step: 222, loss: 0.3130839765071869, mean loss: 0.34051588363887386
Epoch: 59, step: 223, loss: 0.3620598614215851, mean loss: 0.3405161358512103
Epoch: 59, step: 224, loss: 0.33909618854522705, mean loss: 0.3405161192282803
Epoch: 59, step: 225, loss: 0.36019167304039, mean loss: 0.34051634956184557
Epoch: 59, step: 226, loss: 0.32719072699546814, mean loss: 0.3405161935661235
Epoch: 59, step: 227, loss: 0.33537229895591736, mean loss: 0.34051613335008807
Epoch: 59, step: 228, loss: 0.30900609493255615, mean loss: 0.34051576448806387
Epoch: 59, step: 229, loss: 0.33364617824554443, mean loss: 0.34051568407242644
Epoch: 59, step: 230, loss: 0.33928102254867554, mean loss: 0.34051566961960095
Epoch: 59, step: 231, loss: 0.29934561252593994, mean loss: 0.3405151876926321
Epoch: 59, step: 232, loss: 0.3390149772167206, mean loss: 0.340515170131728
Epoch: 59, step: 233, loss: 0.3331189751625061, mean loss: 0.3405150835556427
Epoch: 59, step: 234, loss: 0.324442982673645, mean loss: 0.3405148954260307
Epoch: 59, step: 235, loss: 0.3802267909049988, mean loss: 0.34051536026233886
Epoch: 59, step: 236, loss: 0.30623510479927063, mean loss: 0.3405149590092462
Epoch: 59, step: 237, loss: 0.3551273047924042, mean loss: 0.34051513004590356
Epoch: 59, step: 238, loss: 0.3369901180267334, mean loss: 0.34051508878632586
Epoch: 59, step: 239, loss: 0.3476821780204773, mean loss: 0.3405151726747246
Epoch: 59, step: 240, loss: 0.32138845324516296, mean loss: 0.34051494880544747
Epoch: 59, step: 241, loss: 0.3576149046421051, mean loss: 0.34051514895006507
Epoch: 59, step: 242, loss: 0.32794463634490967, mean loss: 0.340515001821557
Epoch: 59, step: 243, loss: 0.3365601599216461, mean loss: 0.3405149555336134
Epoch: 59, step: 244, loss: 0.32785090804100037, mean loss: 0.3405148073138185
Epoch: 59, step: 245, loss: 0.3256956934928894, mean loss: 0.3405146338731942
Epoch: 59, step: 246, loss: 0.3689712584018707, mean loss: 0.3405149669212441
Epoch: 59, step: 247, loss: 0.32978320121765137, mean loss: 0.34051484132125226
Epoch: 59, step: 248, loss: 0.32315120100975037, mean loss: 0.34051463810701726
Epoch: 59, step: 249, loss: 0.33892571926116943, mean loss: 0.34051461951142653
Epoch: 59, step: 250, loss: 0.3227165937423706, mean loss: 0.34051441121826503
Epoch: 59, step: 251, loss: 0.307730108499527, mean loss: 0.3405140275427815
Epoch: 59, step: 252, loss: 0.34166744351387024, mean loss: 0.34051404104107835
Epoch: 59, step: 253, loss: 0.35323694348335266, mean loss: 0.34051418993402677
Epoch: 59, step: 254, loss: 0.33707401156425476, mean loss: 0.34051414967495
Epoch: 59, step: 255, loss: 0.32655319571495056, mean loss: 0.3405139862972179
Epoch: 59, step: 256, loss: 0.3376633822917938, mean loss: 0.34051395293848263
Epoch: 59, step: 257, loss: 0.34436535835266113, mean loss: 0.34051399800840815
Epoch: 59, step: 258, loss: 0.28934237360954285, mean loss: 0.3405133991947121
Epoch: 59, step: 259, loss: 0.3405621647834778, mean loss: 0.3405133997653635
Epoch: 59, step: 260, loss: 0.3104270398616791, mean loss: 0.34051304770105156
Epoch: 59, step: 261, loss: 0.3386796712875366, mean loss: 0.340513026247514
Epoch: 59, step: 262, loss: 0.32845959067344666, mean loss: 0.34051288520402445
Epoch: 59, step: 263, loss: 0.35534200072288513, mean loss: 0.34051305872515153
Epoch: 59, step: 264, loss: 0.32665401697158813, mean loss: 0.3405128965571246
Epoch: 59, step: 265, loss: 0.34067320823669434, mean loss: 0.3405128984329487
Epoch: 59, step: 266, loss: 0.34289589524269104, mean loss: 0.3405129263163229
Epoch: 59, step: 267, loss: 0.33774271607398987, mean loss: 0.34051289390255524
Epoch: 59, step: 268, loss: 0.3518378734588623, mean loss: 0.3405130264127004
Epoch: 59, step: 269, loss: 0.3011535704135895, mean loss: 0.340512565885052
Epoch: 59, step: 270, loss: 0.3235626816749573, mean loss: 0.3405123675642474
Epoch: 59, step: 271, loss: 0.3424733877182007, mean loss: 0.34051239050874305
Epoch: 59, step: 272, loss: 0.2945293188095093, mean loss: 0.34051185249997146
Epoch: 59, step: 273, loss: 0.31077468395233154, mean loss: 0.34051150457475154
Epoch: 59, step: 274, loss: 0.3126165568828583, mean loss: 0.34051117820735566
Epoch: 59, step: 275, loss: 0.32138392329216003, mean loss: 0.3405109544234859
Epoch: 59, step: 276, loss: 0.32116231322288513, mean loss: 0.3405107280521031
Epoch: 59, step: 277, loss: 0.33976832032203674, mean loss: 0.3405107193663304
Epoch: 59, step: 278, loss: 0.33662092685699463, mean loss: 0.3405106738583748
Epoch: 59, step: 279, loss: 0.3455659747123718, mean loss: 0.3405107330013021
Epoch: 59, step: 280, loss: 0.338664174079895, mean loss: 0.3405107113983104
Epoch: 59, step: 281, loss: 0.3714742064476013, mean loss: 0.34051107363765915
Epoch: 59, step: 282, loss: 0.3266349136829376, mean loss: 0.3405109113035191
Epoch: 59, step: 283, loss: 0.3512825071811676, mean loss: 0.3405110373165734
Epoch: 59, step: 284, loss: 0.3008654713630676, mean loss: 0.3405105735226782
Epoch: 59, step: 285, loss: 0.36373084783554077, mean loss: 0.3405108451620212
Epoch: 59, step: 286, loss: 0.2911924421787262, mean loss: 0.34051026822388164
Epoch: 59, step: 287, loss: 0.3539915680885315, mean loss: 0.3405104259294156
Epoch: 59, step: 288, loss: 0.3033119738101959, mean loss: 0.3405099907834588
Epoch: 59, step: 289, loss: 0.3430250883102417, mean loss: 0.3405100202046216
Epoch: 59, step: 290, loss: 0.33806511759757996, mean loss: 0.340509991604921
Epoch: 59, step: 291, loss: 0.3077831268310547, mean loss: 0.3405096087808431
Epoch: 59, step: 292, loss: 0.29923224449157715, mean loss: 0.340509125942533
Epoch: 59, step: 293, loss: 0.33220618963241577, mean loss: 0.3405090288208076
Epoch: 59, step: 294, loss: 0.31552502512931824, mean loss: 0.34050873657947583
Epoch: 59, step: 295, loss: 0.2841474115848541, mean loss: 0.3405080773210073
Epoch: 59, step: 296, loss: 0.3418997824192047, mean loss: 0.34050809359959266
Epoch: 59, step: 297, loss: 0.324421763420105, mean loss: 0.340507905442176
Epoch: 59, step: 298, loss: 0.36460989713668823, mean loss: 0.34050818735330174
Epoch: 59, step: 299, loss: 0.2813285291194916, mean loss: 0.34050749516117307
Epoch: 59, step: 300, loss: 0.31949377059936523, mean loss: 0.3405072493779928
Epoch: 59, step: 301, loss: 0.3264637887477875, mean loss: 0.3405070851231491
Epoch: 59, step: 302, loss: 0.31877148151397705, mean loss: 0.34050683090258965
Epoch: 59, step: 303, loss: 0.3001883924007416, mean loss: 0.34050635934190543
Epoch: 59, step: 304, loss: 0.3046180009841919, mean loss: 0.3405059395999333
Epoch: 59, step: 305, loss: 0.30156734585762024, mean loss: 0.3405054841884372
Epoch: 59, step: 306, loss: 0.3353976607322693, mean loss: 0.34050542444990806
Epoch: 59, step: 307, loss: 0.3344329297542572, mean loss: 0.34050535342990085
Epoch: 59, step: 308, loss: 0.3285556435585022, mean loss: 0.34050521367538505
Epoch: 59, step: 309, loss: 0.32091420888900757, mean loss: 0.34050498455690464
Epoch: 59, step: 310, loss: 0.3183916509151459, mean loss: 0.34050472594259656
Epoch: 59, step: 311, loss: 0.3587294816970825, mean loss: 0.34050493907769214
Epoch: 59, step: 312, loss: 0.34669217467308044, mean loss: 0.3405050114354041
Epoch: 59, step: 313, loss: 0.3074355125427246, mean loss: 0.3405046247028712
Epoch: 59, step: 314, loss: 0.3196415603160858, mean loss: 0.3405043807218116
Epoch: 59, step: 315, loss: 0.3694884777069092, mean loss: 0.3405047196695264
Epoch: 59, step: 316, loss: 0.30884066224098206, mean loss: 0.34050434938597385
Epoch: 59, step: 317, loss: 0.3779132664203644, mean loss: 0.3405047868455364
Epoch: 59, step: 318, loss: 0.3198172450065613, mean loss: 0.34050454492842436
Epoch: 59, step: 319, loss: 0.38369426131248474, mean loss: 0.3405050499767941
Epoch: 59, step: 320, loss: 0.334450900554657, mean loss: 0.34050497918210504
Epoch: 59, step: 321, loss: 0.31035056710243225, mean loss: 0.3405046265731563
Epoch: 59, step: 322, loss: 0.31720176339149475, mean loss: 0.3405043540856017
Epoch: 59, step: 323, loss: 0.3303900361061096, mean loss: 0.3405042358171501
Epoch: 59, step: 324, loss: 0.3346308171749115, mean loss: 0.34050416713906356
Epoch: 59, step: 325, loss: 0.31251657009124756, mean loss: 0.34050383988295346
Epoch: 59, step: 326, loss: 0.30491939187049866, mean loss: 0.34050342380250714
Epoch: 59, step: 327, loss: 0.32232344150543213, mean loss: 0.3405032112308045
Epoch: 59, step: 328, loss: 0.39761272072792053, mean loss: 0.3405038789830348
Epoch: 59, step: 329, loss: 0.338196337223053, mean loss: 0.3405038520024469
Epoch: 59, step: 330, loss: 0.34606462717056274, mean loss: 0.34050391702022104
Epoch: 59, step: 331, loss: 0.37199538946151733, mean loss: 0.34050428522095577
Epoch: 59, step: 332, loss: 0.3103921115398407, mean loss: 0.34050393315120536
Epoch: 59, step: 333, loss: 0.3364778161048889, mean loss: 0.3405038860786338
Epoch: 59, step: 334, loss: 0.3348797857761383, mean loss: 0.34050382032352394
Epoch: 59, step: 335, loss: 0.28143373131752014, mean loss: 0.3405031297037675
Epoch: 59, step: 336, loss: 0.31319379806518555, mean loss: 0.3405028104196124
Epoch: 59, step: 337, loss: 0.30368945002555847, mean loss: 0.34050238002514477
Epoch: 59, step: 338, loss: 0.3431866765022278, mean loss: 0.3405024114075786
Epoch: 59, step: 339, loss: 0.3296545445919037, mean loss: 0.34050228458534215
Epoch: 59, step: 340, loss: 0.34240567684173584, mean loss: 0.34050230683761024
Epoch: 59, step: 341, loss: 0.3429492115974426, mean loss: 0.34050233544366554
Epoch: 59, step: 342, loss: 0.3419923186302185, mean loss: 0.3405023528624241
Epoch: 59, step: 343, loss: 0.3479149341583252, mean loss: 0.3405024395187404
Epoch: 59, step: 344, loss: 0.3708111047744751, mean loss: 0.34050279383614673
Epoch: 59, step: 345, loss: 0.33772987127304077, mean loss: 0.3405027614202275
Epoch: 59, step: 346, loss: 0.3099002540111542, mean loss: 0.34050240367608237
Epoch: 59, step: 347, loss: 0.31031572818756104, mean loss: 0.34050205079714885
Epoch: 59, step: 348, loss: 0.35015609860420227, mean loss: 0.34050216365059216
Epoch: 59, step: 349, loss: 0.33496707677841187, mean loss: 0.340502098947545
Epoch: 59, step: 350, loss: 0.34225860238075256, mean loss: 0.3405021194801579
Epoch: 59, step: 351, loss: 0.31955158710479736, mean loss: 0.3405018745821781
Epoch: 59, step: 352, loss: 0.336500883102417, mean loss: 0.3405018278137591
Epoch: 59, step: 353, loss: 0.3226014971733093, mean loss: 0.34050161857552835
Epoch: 59, step: 354, loss: 0.3606313169002533, mean loss: 0.34050185387024523
Epoch: 59, step: 355, loss: 0.3358931541442871, mean loss: 0.3405018000000876
Epoch: 59, step: 356, loss: 0.3116995692253113, mean loss: 0.34050146334058096
Epoch: 59, step: 357, loss: 0.3280630111694336, mean loss: 0.34050131795343164
Epoch: 59, step: 358, loss: 0.3738895654678345, mean loss: 0.3405017082082094
Epoch: 59, step: 359, loss: 0.3452228307723999, mean loss: 0.3405017633898748
Epoch: 59, step: 360, loss: 0.3068121373653412, mean loss: 0.3405013696216732
Epoch: 59, step: 361, loss: 0.3384503424167633, mean loss: 0.3405013456493129
Epoch: 59, step: 362, loss: 0.34659284353256226, mean loss: 0.34050141684577245
Epoch: 59, step: 363, loss: 0.3216523230075836, mean loss: 0.34050119654313293
Epoch: 59, step: 364, loss: 0.33994588255882263, mean loss: 0.340501190052863
Epoch: 59, step: 365, loss: 0.33572086691856384, mean loss: 0.3405011341831646
Epoch: 59, step: 366, loss: 0.3246881365776062, mean loss: 0.3405009493720008
Epoch: 59, step: 367, loss: 0.36051538586616516, mean loss: 0.3405011832838854
Epoch: 59, step: 368, loss: 0.33014896512031555, mean loss: 0.3405010622972885
Epoch: 59, step: 369, loss: 0.34037667512893677, mean loss: 0.34050106084358994
Epoch: 59, step: 370, loss: 0.31537044048309326, mean loss: 0.34050076714835276
Epoch: 59, step: 371, loss: 0.2980622947216034, mean loss: 0.34050027118639936
Epoch: 59, step: 372, loss: 0.3582160472869873, mean loss: 0.34050047822137813
Epoch: 59, step: 373, loss: 0.3476523458957672, mean loss: 0.3405005618005259
Epoch: 59, step: 374, loss: 0.35537707805633545, mean loss: 0.34050073565050143
Epoch: 59, step: 375, loss: 0.3228907585144043, mean loss: 0.3405005298591545
Epoch: 59, step: 376, loss: 0.33427485823631287, mean loss: 0.34050045710639815
Epoch: 59, step: 377, loss: 0.3061095178127289, mean loss: 0.34050005522102067
Epoch: 59, step: 378, loss: 0.3330095410346985, mean loss: 0.3404999676894497
Epoch: 59, step: 379, loss: 0.31015825271606445, mean loss: 0.3404996131307536
Epoch: 59, step: 380, loss: 0.31622254848480225, mean loss: 0.34049932944396105
Epoch: 59, step: 381, loss: 0.28615203499794006, mean loss: 0.3404986943824447
Epoch: 59, step: 382, loss: 0.30530792474746704, mean loss: 0.3404982831744423
Epoch: 59, step: 383, loss: 0.3286019563674927, mean loss: 0.3404981441661833
Epoch: 59, step: 384, loss: 0.35075312852859497, mean loss: 0.3404982639939998
Epoch: 59, step: 385, loss: 0.2931864857673645, mean loss: 0.3404977111700622
Epoch: 59, step: 386, loss: 0.3238767385482788, mean loss: 0.3404975169612518
Epoch: 59, step: 387, loss: 0.41503003239631653, mean loss: 0.3404983878309872
Epoch: 59, step: 388, loss: 0.30788594484329224, mean loss: 0.34049800677773034
Epoch: 59, step: 389, loss: 0.3486471176147461, mean loss: 0.3404981019931959
Epoch: 59, step: 390, loss: 0.2991653382778168, mean loss: 0.3404976190604641
Epoch: 59, step: 391, loss: 0.34123069047927856, mean loss: 0.3404976276255833
Epoch: 59, step: 392, loss: 0.35800373554229736, mean loss: 0.3404978321624737
Epoch: 59, step: 393, loss: 0.39194172620773315, mean loss: 0.34049843321276047
Epoch: 59, step: 394, loss: 0.31642165780067444, mean loss: 0.3404981519124437
Epoch: 59, step: 395, loss: 0.33814045786857605, mean loss: 0.3404981243667146
Epoch: 59, step: 396, loss: 0.3378218710422516, mean loss: 0.34049809309951606
Epoch: 59, step: 397, loss: 0.3225790858268738, mean loss: 0.340497883750645
Epoch: 59, step: 398, loss: 0.33469676971435547, mean loss: 0.34049781597666245
Epoch: 59, step: 399, loss: 0.3166883587837219, mean loss: 0.3404975378157999
Epoch: 59, step: 400, loss: 0.32026106119155884, mean loss: 0.3404973014000771
Epoch: 59, step: 401, loss: 0.32915106415748596, mean loss: 0.3404971688474796
Epoch: 59, step: 402, loss: 0.3357207179069519, mean loss: 0.34049711304716723
Epoch: 59, step: 403, loss: 0.32229557633399963, mean loss: 0.34049690041239256
Epoch: 59, step: 404, loss: 0.3269328773021698, mean loss: 0.3404967419560298
Epoch: 59, step: 405, loss: 0.31313997507095337, mean loss: 0.3404964223750985
Epoch: 59, step: 406, loss: 0.3599984347820282, mean loss: 0.34049665019436187
Epoch: 59, step: 407, loss: 0.3109203577041626, mean loss: 0.3404963046930712
Epoch: 59, step: 408, loss: 0.3283745348453522, mean loss: 0.34049616309188147
Epoch: 59, step: 409, loss: 0.3533661365509033, mean loss: 0.3404963134315009
Epoch: 59, step: 410, loss: 0.3321433961391449, mean loss: 0.34049621585867046
Epoch: 59, step: 411, loss: 0.33548247814178467, mean loss: 0.34049615729244165
Epoch: 59, step: 412, loss: 0.296996533870697, mean loss: 0.34049564917269465
Epoch: 59, step: 413, loss: 0.34076008200645447, mean loss: 0.3404956522615024
Epoch: 59, step: 414, loss: 0.28505939245224, mean loss: 0.34049500472485633
Epoch: 59, step: 415, loss: 0.32455822825431824, mean loss: 0.3404948185736571
Epoch: 59, step: 416, loss: 0.31195786595344543, mean loss: 0.34049448524866416
Epoch: 59, step: 417, loss: 0.3506624400615692, mean loss: 0.3404946040137588
Epoch: 59, step: 418, loss: 0.3467295169830322, mean loss: 0.3404946768387657
Epoch: 59, step: 419, loss: 0.3538123071193695, mean loss: 0.3404948323894838
Epoch: 59, step: 420, loss: 0.32491743564605713, mean loss: 0.34049465044668337
Epoch: 59, step: 421, loss: 0.32722461223602295, mean loss: 0.3404944954554641
Epoch: 59, step: 422, loss: 0.3664395809173584, mean loss: 0.3404947984849957
Epoch: 59, step: 423, loss: 0.3394714295864105, mean loss: 0.34049478653254417
Epoch: 59, step: 424, loss: 0.30531540513038635, mean loss: 0.3404943756592607
Epoch: 59, step: 425, loss: 0.3438275158405304, mean loss: 0.3404944145878092
Epoch: 59, step: 426, loss: 0.320294588804245, mean loss: 0.34049417867192466
Epoch: 59, step: 427, loss: 0.3705064654350281, mean loss: 0.3404945291844768
Epoch: 59, step: 428, loss: 0.342437207698822, mean loss: 0.34049455187269306
Epoch: 59, step: 429, loss: 0.34092584252357483, mean loss: 0.34049455690960534
Epoch: 59, step: 430, loss: 0.35254621505737305, mean loss: 0.3404946976556101
Epoch: 59, step: 431, loss: 0.3179525136947632, mean loss: 0.3404944343984517
Epoch: 59, step: 432, loss: 0.32965928316116333, mean loss: 0.3404943078624506
Epoch: 59, step: 433, loss: 0.32409319281578064, mean loss: 0.34049411632776594
Epoch: 59, step: 434, loss: 0.355787456035614, mean loss: 0.3404942949235982
Epoch: 59, step: 435, loss: 0.29701513051986694, mean loss: 0.34049378717924556
Epoch: 59, step: 436, loss: 0.294668048620224, mean loss: 0.3404932520381369
Epoch: 59, step: 437, loss: 0.33211398124694824, mean loss: 0.34049315418832504
Epoch: 59, step: 438, loss: 0.32919105887413025, mean loss: 0.340493022208465
Epoch: 59, step: 439, loss: 0.3022972047328949, mean loss: 0.34049257618322476
Epoch: 59, step: 440, loss: 0.311221182346344, mean loss: 0.3404922343754333
Epoch: 59, step: 441, loss: 0.31758421659469604, mean loss: 0.3404919668771524
Epoch: 59, step: 442, loss: 0.3034176528453827, mean loss: 0.34049153396324594
Epoch: 59, step: 443, loss: 0.31710055470466614, mean loss: 0.340491260831774
Epoch: 59, step: 444, loss: 0.3001788258552551, mean loss: 0.34049079011757194
Epoch: 59, step: 445, loss: 0.2900876998901367, mean loss: 0.34049020158519033
Epoch: 59, step: 446, loss: 0.29816973209381104, mean loss: 0.3404897074354117
Epoch: 59, step: 447, loss: 0.34328344464302063, mean loss: 0.3404897400557611
Epoch: 59, step: 448, loss: 0.32067254185676575, mean loss: 0.3404895086680771
Epoch: 59, step: 449, loss: 0.3344655930995941, mean loss: 0.3404894383330285
Epoch: 59, step: 450, loss: 0.3363150358200073, mean loss: 0.34048938959340525
Epoch: 59, step: 451, loss: 0.3595375120639801, mean loss: 0.34048961199349015
Epoch: 59, step: 452, loss: 0.3301756680011749, mean loss: 0.34048949157242286
Epoch: 59, step: 453, loss: 0.30817002058029175, mean loss: 0.3404891142289203
Epoch: 59, step: 454, loss: 0.3335687518119812, mean loss: 0.3404890334317035
Epoch: 59, step: 455, loss: 0.3216792345046997, mean loss: 0.3404888138244681
Epoch: 59, step: 456, loss: 0.3628374934196472, mean loss: 0.340489074745622
Epoch: 59, step: 457, loss: 0.31982290744781494, mean loss: 0.34048883347064013
Epoch: 59, step: 458, loss: 0.3182361423969269, mean loss: 0.3404885736762198
Epoch: 59, step: 459, loss: 0.36112722754478455, mean loss: 0.3404888146243597
Epoch: 59, step: 460, loss: 0.3295471668243408, mean loss: 0.3404886868864305
Epoch: 59, step: 461, loss: 0.3188328444957733, mean loss: 0.34048843406891915
Epoch: 59, step: 462, loss: 0.2961168885231018, mean loss: 0.3404879160667764
Epoch: 59, step: 463, loss: 0.3523310720920563, mean loss: 0.34048805432449325
Epoch: 59, step: 464, loss: 0.3163742125034332, mean loss: 0.3404877728213375
Epoch: 59, step: 465, loss: 0.3316936790943146, mean loss: 0.34048767016095455
Epoch: 59, step: 466, loss: 0.35079440474510193, mean loss: 0.3404877904781812
Epoch: 59, step: 467, loss: 0.33447781205177307, mean loss: 0.3404877203206071
Epoch: 59, step: 468, loss: 0.32399415969848633, mean loss: 0.3404875277850252
Epoch: 59, step: 469, loss: 0.3256474435329437, mean loss: 0.3404873545531216
Epoch: 59, step: 470, loss: 0.3161849081516266, mean loss: 0.34048707086808067
Epoch: 59, step: 471, loss: 0.38897910714149475, mean loss: 0.3404876369141687
Epoch: 59, step: 472, loss: 0.3357617259025574, mean loss: 0.34048758174939486
Epoch: 59, step: 473, loss: 0.33248069882392883, mean loss: 0.34048748828747205
Epoch: 59, step: 474, loss: 0.31191059947013855, mean loss: 0.34048715472198526
Epoch: 59, step: 475, loss: 0.33844324946403503, mean loss: 0.3404871308646543
Epoch: 59, step: 476, loss: 0.3356780409812927, mean loss: 0.34048707473156825
Epoch: 59, step: 477, loss: 0.3278283178806305, mean loss: 0.34048692697662686
Epoch: 59, step: 478, loss: 0.33038488030433655, mean loss: 0.34048680906537304
Epoch: 59, step: 479, loss: 0.31316906213760376, mean loss: 0.3404864902159061
Epoch: 59, step: 480, loss: 0.3243963122367859, mean loss: 0.34048630241546984
Epoch: 59, step: 481, loss: 0.37454846501350403, mean loss: 0.34048669997566733
Epoch: 59, step: 482, loss: 0.3225071430206299, mean loss: 0.34048649012778215
Epoch: 59, step: 483, loss: 0.33792126178741455, mean loss: 0.3404864601881423
Epoch: 59, step: 484, loss: 0.3170911371707916, mean loss: 0.3404861871366721
Epoch: 59, step: 485, loss: 0.3410058617591858, mean loss: 0.34048619320182727
Epoch: 59, step: 486, loss: 0.3183607757091522, mean loss: 0.34048593497770474
Epoch: 59, step: 487, loss: 0.2960118353366852, mean loss: 0.340485415929812
Epoch: 59, step: 488, loss: 0.32988202571868896, mean loss: 0.3404852921813121
Epoch: 59, step: 489, loss: 0.4003792107105255, mean loss: 0.3404859911743627
Epoch: 59, step: 490, loss: 0.3694571852684021, mean loss: 0.34048632927925715
Epoch: 59, step: 491, loss: 0.33816975355148315, mean loss: 0.3404863022442496
Epoch: 59, step: 492, loss: 0.3181961476802826, mean loss: 0.34048604211570843
Epoch: 59, step: 493, loss: 0.3071589469909668, mean loss: 0.3404856531894029
Epoch: 59, step: 494, loss: 0.3653944134712219, mean loss: 0.34048594387057457
Epoch: 59, step: 495, loss: 0.33163195848464966, mean loss: 0.3404858405472143
Epoch: 59, step: 496, loss: 0.3511728048324585, mean loss: 0.34048596525943453
Epoch: 59, step: 497, loss: 0.31271621584892273, mean loss: 0.3404856412023312
Epoch: 59, step: 498, loss: 0.31201544404029846, mean loss: 0.3404853089752799
Epoch: 59, step: 499, loss: 0.4170946478843689, mean loss: 0.3404862029416133
Epoch: 59, step: 500, loss: 0.2856440246105194, mean loss: 0.34048556298714194
Epoch: 59, step: 501, loss: 0.3179837465286255, mean loss: 0.3404853004160614
Epoch: 59, step: 502, loss: 0.3302801251411438, mean loss: 0.340485181334447
Epoch: 59, step: 503, loss: 0.3370508551597595, mean loss: 0.34048514126062934
Epoch: 59, step: 504, loss: 0.29683563113212585, mean loss: 0.3404846319373994
Epoch: 59, step: 505, loss: 0.32617220282554626, mean loss: 0.3404844649351228
Epoch: 59, step: 506, loss: 0.3843175768852234, mean loss: 0.3404849763887703
Epoch: 59, step: 507, loss: 0.36078429222106934, mean loss: 0.3404852132425441
Epoch: 59, step: 508, loss: 0.31357064843177795, mean loss: 0.34048489920526726
Epoch: 59, step: 509, loss: 0.3503682613372803, mean loss: 0.3404850145223061
Epoch: 59, step: 510, loss: 0.3174808621406555, mean loss: 0.34048474611771395
Epoch: 59, step: 511, loss: 0.3342647850513458, mean loss: 0.3404846735461796
Epoch: 59, step: 512, loss: 0.333636999130249, mean loss: 0.34048459365171796
Epoch: 59, step: 513, loss: 0.35600584745407104, mean loss: 0.34048477474206684
Epoch: 59, step: 514, loss: 0.3371891379356384, mean loss: 0.34048473629149684
Epoch: 59, step: 515, loss: 0.31777194142341614, mean loss: 0.34048447130182363
Epoch: 59, step: 516, loss: 0.3764684796333313, mean loss: 0.34048489112155145
Epoch: 59, step: 517, loss: 0.3732443153858185, mean loss: 0.3404852733161085
Epoch: 59, step: 518, loss: 0.34368380904197693, mean loss: 0.3404853106320477
Epoch: 59, step: 519, loss: 0.3033335506916046, mean loss: 0.34048487720351694
Epoch: 59, step: 520, loss: 0.3022938370704651, mean loss: 0.3404844316554911
Epoch: 59, step: 521, loss: 0.3295148015022278, mean loss: 0.34048430368201815
Epoch: 59, step: 522, loss: 0.3995145261287689, mean loss: 0.34048499233007107
Epoch: 59, step: 523, loss: 0.32845553755760193, mean loss: 0.34048485199578765
Epoch: 59, step: 524, loss: 0.3516849875450134, mean loss: 0.34048498265380084
Epoch: 59, step: 525, loss: 0.3351403772830963, mean loss: 0.34048492030568284
Epoch: 59, step: 526, loss: 0.33750879764556885, mean loss: 0.34048488558778145
Epoch: 59, step: 527, loss: 0.3657625615596771, mean loss: 0.3404851804605822
Epoch: 59, step: 528, loss: 0.31695064902305603, mean loss: 0.3404849059253656
Epoch: 59, step: 529, loss: 0.32720810174942017, mean loss: 0.34048475105048315
Epoch: 59, step: 530, loss: 0.3415495455265045, mean loss: 0.34048476347124296
Epoch: 59, step: 531, loss: 0.36508429050445557, mean loss: 0.34048505041981325
Epoch: 59, step: 532, loss: 0.3640040159225464, mean loss: 0.34048532476064897
Epoch: 59, step: 533, loss: 0.34501779079437256, mean loss: 0.3404853776297267
Epoch: 59, step: 534, loss: 0.30980992317199707, mean loss: 0.34048501981919777
Epoch: 59, step: 535, loss: 0.3136174976825714, mean loss: 0.34048470642954004
Epoch: 59, step: 536, loss: 0.3230949342250824, mean loss: 0.34048450359315025
Epoch: 59, step: 537, loss: 0.35861316323280334, mean loss: 0.34048471504554534
Epoch: 59, step: 538, loss: 0.33839109539985657, mean loss: 0.3404846906258842
Epoch: 59, step: 539, loss: 0.3364500403404236, mean loss: 0.34048464356688585
Epoch: 59, step: 540, loss: 0.32215574383735657, mean loss: 0.34048442978637417
Epoch: 59, step: 541, loss: 0.3649301528930664, mean loss: 0.3404847149075935
Epoch: 59, step: 542, loss: 0.3163304030895233, mean loss: 0.34048443318851795
Epoch: 59, step: 543, loss: 0.3446054458618164, mean loss: 0.3404844812525799
Epoch: 59, step: 544, loss: 0.3187316060066223, mean loss: 0.3404842275481066
Epoch: 59, step: 545, loss: 0.305921345949173, mean loss: 0.34048382444482467
Epoch: 59, step: 546, loss: 0.3369409441947937, mean loss: 0.3404837831250639
Epoch: 59, step: 547, loss: 0.33555084466934204, mean loss: 0.3404837255940593
Epoch: 59, step: 548, loss: 0.3190409541130066, mean loss: 0.3404834755180026
Epoch: 59, step: 549, loss: 0.3486436903476715, mean loss: 0.34048357068529705
Epoch: 59, step: 550, loss: 0.36235353350639343, mean loss: 0.34048382573751834
Epoch: 59, step: 551, loss: 0.3332687318325043, mean loss: 0.34048374159451905
Epoch: 59, step: 552, loss: 0.32813066244125366, mean loss: 0.3404835975336069
Epoch: 59, step: 553, loss: 0.3486664295196533, mean loss: 0.34048369296021896
Epoch: 59, step: 554, loss: 0.3357838988304138, mean loss: 0.34048363815276333
Epoch: 59, step: 555, loss: 0.34134700894355774, mean loss: 0.34048364822099253
Epoch: 59, step: 556, loss: 0.3644874095916748, mean loss: 0.3404839281384458
Epoch: 59, step: 557, loss: 0.3619261085987091, mean loss: 0.3404841781813646
Epoch: 59, step: 558, loss: 0.31617626547813416, mean loss: 0.3404838947236921
Epoch: 59, step: 559, loss: 0.3354471027851105, mean loss: 0.3404838359897034
Epoch: 59, step: 560, loss: 0.33283665776252747, mean loss: 0.3404837468170618
Epoch: 59, step: 561, loss: 0.3229773938655853, mean loss: 0.34048354268038705
Epoch: 59, step: 562, loss: 0.3239535093307495, mean loss: 0.34048334993054913
Epoch: 59, step: 563, loss: 0.34569063782691956, mean loss: 0.3404834106498576
Epoch: 59, step: 564, loss: 0.3121081292629242, mean loss: 0.3404830797852293
Epoch: 59, step: 565, loss: 0.31957730650901794, mean loss: 0.34048283602023693
Epoch: 59, step: 566, loss: 0.3020796477794647, mean loss: 0.34048238823753063
Epoch: 59, step: 567, loss: 0.31716635823249817, mean loss: 0.3404821163748609
Epoch: 59, step: 568, loss: 0.3233283758163452, mean loss: 0.34048191636622616
Epoch: 59, step: 569, loss: 0.2872806787490845, mean loss: 0.34048129605937244
Epoch: 59, step: 570, loss: 0.3424028754234314, mean loss: 0.3404813184640195
Epoch: 59, step: 571, loss: 0.3477797508239746, mean loss: 0.3404814035590708
Epoch: 59, step: 572, loss: 0.33975520730018616, mean loss: 0.34048139509218583
Epoch: 59, step: 573, loss: 0.31600573658943176, mean loss: 0.34048110972832313
Epoch: 59, step: 574, loss: 0.3194071650505066, mean loss: 0.3404808640282068
Epoch: 59, step: 575, loss: 0.3309954106807709, mean loss: 0.3404807534390478
Epoch: 59, step: 576, loss: 0.35046136379241943, mean loss: 0.34048086979979486
Epoch: 59, step: 577, loss: 0.35321658849716187, mean loss: 0.34048101827973865
Epoch: 59, step: 578, loss: 0.3489706814289093, mean loss: 0.34048111725570074
Epoch: 59, step: 579, loss: 0.31984883546829224, mean loss: 0.340480876718933
Epoch: 59, step: 580, loss: 0.3357958197593689, mean loss: 0.34048082209989805
Epoch: 59, step: 581, loss: 0.3307536542415619, mean loss: 0.3404807087005665
Epoch: 59, step: 582, loss: 0.31318405270576477, mean loss: 0.3404803904798366
Epoch: 59, step: 583, loss: 0.33695173263549805, mean loss: 0.3404803493436994
Epoch: 59, step: 584, loss: 0.3147815763950348, mean loss: 0.34048004975785934
Epoch: 59, step: 585, loss: 0.3629232347011566, mean loss: 0.34048031138832896
Epoch: 59, step: 586, loss: 0.31958290934562683, mean loss: 0.3404800677805973
Epoch: 59, step: 587, loss: 0.3251790404319763, mean loss: 0.34047988941368335
Epoch: 59, step: 588, loss: 0.3760216236114502, mean loss: 0.3404803037254418
Epoch: 59, step: 589, loss: 0.35968470573425293, mean loss: 0.340480527589499
Epoch: 59, step: 590, loss: 0.3453378975391388, mean loss: 0.34048058421078137
Epoch: 59, step: 591, loss: 0.30361536145210266, mean loss: 0.3404801544860791
Epoch: 59, step: 592, loss: 0.42134881019592285, mean loss: 0.340481097132056
Epoch: 59, step: 593, loss: 0.29122093319892883, mean loss: 0.34048052293734876
Epoch: 59, step: 594, loss: 0.3158377408981323, mean loss: 0.3404802356953066
Epoch: 59, step: 595, loss: 0.33751752972602844, mean loss: 0.34048020116171407
Epoch: 59, step: 596, loss: 0.3363032937049866, mean loss: 0.34048015247583696
Epoch: 59, step: 597, loss: 0.33612483739852905, mean loss: 0.340480101711039
Epoch: 59, step: 598, loss: 0.3210696876049042, mean loss: 0.34047987546925207
Epoch: 59, step: 599, loss: 0.3601793646812439, mean loss: 0.3404801050777328
Epoch: 59, step: 600, loss: 0.3676231801509857, mean loss: 0.3404804214416508
Epoch: 59, step: 601, loss: 0.3059568405151367, mean loss: 0.3404800190595332
Epoch: 59, step: 602, loss: 0.31642019748687744, mean loss: 0.340479738638764
Epoch: 59, step: 603, loss: 0.3350958526134491, mean loss: 0.34047967588950967
Epoch: 59, step: 604, loss: 0.343500018119812, mean loss: 0.34047971109122327
Epoch: 59, step: 605, loss: 0.31481489539146423, mean loss: 0.34047941197446957
Epoch: 59, step: 606, loss: 0.3312704861164093, mean loss: 0.340479304648084
Epoch: 59, step: 607, loss: 0.31215572357177734, mean loss: 0.34047897455180554
Epoch: 59, step: 608, loss: 0.3293386399745941, mean loss: 0.34047884471864226
Epoch: 59, step: 609, loss: 0.3432942032814026, mean loss: 0.34047887752938466
Epoch: 59, step: 610, loss: 0.3200131058692932, mean loss: 0.3404786390200362
Epoch: 59, step: 611, loss: 0.34863555431365967, mean loss: 0.34047873408011564
Epoch: 59, step: 612, loss: 0.343012273311615, mean loss: 0.3404787636054479
Epoch: 59, step: 613, loss: 0.3217100203037262, mean loss: 0.3404785448810183
Epoch: 59, step: 614, loss: 0.3095584511756897, mean loss: 0.3404781845531617
Epoch: 59, step: 615, loss: 0.34721148014068604, mean loss: 0.34047826301882606
Epoch: 59, step: 616, loss: 0.3328404426574707, mean loss: 0.3404781740134264
Epoch: 59, step: 617, loss: 0.3299863934516907, mean loss: 0.34047805175155116
Epoch: 59, step: 618, loss: 0.3771309554576874, mean loss: 0.3404784788669005
Epoch: 59, step: 619, loss: 0.3623410165309906, mean loss: 0.340478733627524
Epoch: 59, step: 620, loss: 0.32265347242355347, mean loss: 0.34047852591505207
Epoch: 59, step: 621, loss: 0.3573751151561737, mean loss: 0.3404787228036913
Epoch: 59, step: 622, loss: 0.3078700602054596, mean loss: 0.34047834283349127
Epoch: 59, step: 623, loss: 0.35981306433677673, mean loss: 0.3404785681273797
Epoch: 59, step: 624, loss: 0.35172760486602783, mean loss: 0.34047869920295254
Epoch: 59, step: 625, loss: 0.31270354986190796, mean loss: 0.340478375566247
Epoch: 59, step: 626, loss: 0.3412383496761322, mean loss: 0.34047838442138034
Epoch: 59, step: 627, loss: 0.31280699372291565, mean loss: 0.3404780620011867
Epoch: 59, step: 628, loss: 0.3158320486545563, mean loss: 0.3404777748352869
Epoch: 59, step: 629, loss: 0.3594747483730316, mean loss: 0.3404779961781613
Epoch: 59, step: 630, loss: 0.35279160737991333, mean loss: 0.34047813964829543
Epoch: 59, step: 631, loss: 0.34270381927490234, mean loss: 0.3404781655801548
Epoch: 59, step: 632, loss: 0.28615710139274597, mean loss: 0.34047753268143544
Epoch: 59, step: 633, loss: 0.3768365681171417, mean loss: 0.3404779562982994
Epoch: 59, step: 634, loss: 0.3054918944835663, mean loss: 0.34047754868261493
Epoch: 59, step: 635, loss: 0.32798707485198975, mean loss: 0.3404774031602709
Epoch: 59, step: 636, loss: 0.33002418279647827, mean loss: 0.34047728137470634
Epoch: 59, step: 637, loss: 0.32702478766441345, mean loss: 0.3404771246478416
Epoch: 59, step: 638, loss: 0.3078818917274475, mean loss: 0.3404767449049288
Epoch: 59, step: 639, loss: 0.3260534107685089, mean loss: 0.34047657687130495
Epoch: 59, step: 640, loss: 0.37721961736679077, mean loss: 0.3404770049272773
Epoch: 59, step: 641, loss: 0.2894792854785919, mean loss: 0.34047641081139096
Epoch: 59, step: 642, loss: 0.29645299911499023, mean loss: 0.34047589795113287
Epoch: 59, step: 643, loss: 0.3557797074317932, mean loss: 0.34047607623409515
Epoch: 59, step: 644, loss: 0.31460288166999817, mean loss: 0.3404757748257406
Epoch: 59, step: 645, loss: 0.33360350131988525, mean loss: 0.34047569476850165
Epoch: 59, step: 646, loss: 0.33737924695014954, mean loss: 0.3404756586974438
Epoch: 59, step: 647, loss: 0.31111475825309753, mean loss: 0.34047531667120495
Epoch: 59, step: 648, loss: 0.33267512917518616, mean loss: 0.34047522580758455
Epoch: 59, step: 649, loss: 0.29876092076301575, mean loss: 0.34047473988738974
Epoch: 59, step: 650, loss: 0.337166965007782, mean loss: 0.3404747013563417
Epoch: 59, step: 651, loss: 0.3042924702167511, mean loss: 0.3404742798878027
Epoch: 59, step: 652, loss: 0.3525938391685486, mean loss: 0.3404744210607841
Epoch: 59, step: 653, loss: 0.31997013092041016, mean loss: 0.34047418222222686
Epoch: 59, step: 654, loss: 0.29748716950416565, mean loss: 0.3404736815057213
Epoch: 59, step: 655, loss: 0.32146990299224854, mean loss: 0.34047346015061586
Epoch: 59, step: 656, loss: 0.35103753209114075, mean loss: 0.34047358319898857
Epoch: 59, step: 657, loss: 0.3419411778450012, mean loss: 0.3404736002930628
Epoch: 59, step: 658, loss: 0.3413051962852478, mean loss: 0.34047360997911474
Epoch: 59, step: 659, loss: 0.3182319104671478, mean loss: 0.34047335092092995
Epoch: 59, step: 660, loss: 0.32187044620513916, mean loss: 0.34047313424780234
Epoch: 59, step: 661, loss: 0.2899892032146454, mean loss: 0.34047254625447576
Epoch: 59, step: 662, loss: 0.3506130576133728, mean loss: 0.34047266436103835
Epoch: 59, step: 663, loss: 0.3110646903514862, mean loss: 0.34047232185027654
Epoch: 59, step: 664, loss: 0.3290501832962036, mean loss: 0.34047218881969743
Epoch: 59, step: 665, loss: 0.3191937804222107, mean loss: 0.34047194099867767
Epoch: 59, step: 666, loss: 0.30656591057777405, mean loss: 0.34047154611344865
Epoch: 59, step: 667, loss: 0.3241245746612549, mean loss: 0.3404713557313158
Epoch: 59, step: 668, loss: 0.3370515704154968, mean loss: 0.34047131590385044
Epoch: 59, step: 669, loss: 0.31752392649650574, mean loss: 0.3404710486573337
Epoch: 59, step: 670, loss: 0.30860650539398193, mean loss: 0.34047067756549093
Epoch: 59, step: 671, loss: 0.3144015967845917, mean loss: 0.3404703739706619
Epoch: 59, step: 672, loss: 0.3971736431121826, mean loss: 0.3404710343168769
Epoch: 59, step: 673, loss: 0.3240065276622772, mean loss: 0.3404708425792892
Epoch: 59, step: 674, loss: 0.3389151692390442, mean loss: 0.34047082446288973
Epoch: 59, step: 675, loss: 0.3265230655670166, mean loss: 0.34047066203789794
Epoch: 59, step: 676, loss: 0.29616856575012207, mean loss: 0.3404701461353874
Epoch: 59, step: 677, loss: 0.31410837173461914, mean loss: 0.34046983915336254
Epoch: 59, step: 678, loss: 0.3286229968070984, mean loss: 0.3404697011988665
Epoch: 59, step: 679, loss: 0.32170581817626953, mean loss: 0.3404694826991341
Epoch: 59, step: 680, loss: 0.32034197449684143, mean loss: 0.3404692483231288
Epoch: 59, step: 681, loss: 0.3437653183937073, mean loss: 0.3404692867039722
Epoch: 59, step: 682, loss: 0.31852594017982483, mean loss: 0.3404690311892768
Epoch: 59, step: 683, loss: 0.37233829498291016, mean loss: 0.3404694022799125
Epoch: 59, step: 684, loss: 0.32998690009117126, mean loss: 0.34046928022145734
Epoch: 59, step: 685, loss: 0.33623799681663513, mean loss: 0.34046923095288645
Epoch: 59, step: 686, loss: 0.3410649299621582, mean loss: 0.34046923788905553
Epoch: 59, step: 687, loss: 0.34917062520980835, mean loss: 0.34046933920463607
Epoch: 59, step: 688, loss: 0.28844794631004333, mean loss: 0.3404687334947578
Epoch: 59, step: 689, loss: 0.3125188648700714, mean loss: 0.3404684080649017
Epoch: 59, step: 690, loss: 0.30685922503471375, mean loss: 0.34046801674627336
Epoch: 59, step: 691, loss: 0.3601830005645752, mean loss: 0.3404682462892109
Epoch: 59, step: 692, loss: 0.30039605498313904, mean loss: 0.34046777973131287
Epoch: 59, step: 693, loss: 0.34149596095085144, mean loss: 0.3404677917022201
Epoch: 59, step: 694, loss: 0.3494872748851776, mean loss: 0.3404678967130266
Epoch: 59, step: 695, loss: 0.31768810749053955, mean loss: 0.3404676314986967
Epoch: 59, step: 696, loss: 0.31354740262031555, mean loss: 0.34046731808283187
Epoch: 59, step: 697, loss: 0.341147780418396, mean loss: 0.34046732600494906
Epoch: 59, step: 698, loss: 0.34098300337791443, mean loss: 0.3404673320085275
Epoch: 59, step: 699, loss: 0.3534567952156067, mean loss: 0.34046748323167186
Epoch: 59, step: 700, loss: 0.3580477237701416, mean loss: 0.3404676878981973
Epoch: 59, step: 701, loss: 0.32334673404693604, mean loss: 0.34046748858093906
Epoch: 59, step: 702, loss: 0.286952942609787, mean loss: 0.3404668655871211
Epoch: 59, step: 703, loss: 0.31977593898773193, mean loss: 0.3404666247148673
Epoch: 59, step: 704, loss: 0.2996640205383301, mean loss: 0.3404661497191842
Epoch: 59, step: 705, loss: 0.3162609040737152, mean loss: 0.34046586794174427
Epoch: 59, step: 706, loss: 0.33757907152175903, mean loss: 0.3404658343364404
Epoch: 59, step: 707, loss: 0.34571367502212524, mean loss: 0.3404658954260368
Epoch: 59, step: 708, loss: 0.3274802267551422, mean loss: 0.34046574426290693
Epoch: 59, step: 709, loss: 0.32555434107780457, mean loss: 0.34046557068477284
Epoch: 59, step: 710, loss: 0.3385799527168274, mean loss: 0.3404655487352464
Epoch: 59, step: 711, loss: 0.33221137523651123, mean loss: 0.34046545265369993
Epoch: 59, step: 712, loss: 0.3318184018135071, mean loss: 0.3404653520000916
Epoch: 59, step: 713, loss: 0.34208837151527405, mean loss: 0.3404653708921823
Epoch: 59, step: 714, loss: 0.34056204557418823, mean loss: 0.34046537201747107
Epoch: 59, step: 715, loss: 0.3431944251060486, mean loss: 0.34046540378315093
Epoch: 59, step: 716, loss: 0.3224596083164215, mean loss: 0.34046519420141746
Epoch: 59, step: 717, loss: 0.34622472524642944, mean loss: 0.340465261239747
Epoch: 59, step: 718, loss: 0.32436808943748474, mean loss: 0.34046507387814773
Epoch: 59, step: 719, loss: 0.3175375759601593, mean loss: 0.3404648070186813
Epoch: 59, step: 720, loss: 0.3538229465484619, mean loss: 0.34046496249593877
Epoch: 59, step: 721, loss: 0.3307599425315857, mean loss: 0.34046484953916645
Epoch: 59, step: 722, loss: 0.3107178807258606, mean loss: 0.3404645033180883
Epoch: 59, step: 723, loss: 0.3729058504104614, mean loss: 0.34046488089428817
Epoch: 59, step: 724, loss: 0.34356796741485596, mean loss: 0.34046491700986553
Epoch: 59, step: 725, loss: 0.31679925322532654, mean loss: 0.3404646415779181
Epoch: 59, step: 726, loss: 0.3447115421295166, mean loss: 0.3404646910047369
Epoch: 59, step: 727, loss: 0.3051707148551941, mean loss: 0.3404642802466699
Epoch: 59, step: 728, loss: 0.3336022198200226, mean loss: 0.34046420038562336
Epoch: 59, step: 729, loss: 0.3404938280582428, mean loss: 0.3404642007304279
Epoch: 59, step: 730, loss: 0.3270372152328491, mean loss: 0.3404640444700499
Epoch: 59, step: 731, loss: 0.32940158247947693, mean loss: 0.3404639157289877
Epoch: 59, step: 732, loss: 0.3031012713909149, mean loss: 0.3404634809206653
Epoch: 59, step: 733, loss: 0.3308548033237457, mean loss: 0.3404633691008399
Epoch: 59, step: 734, loss: 0.3363130986690521, mean loss: 0.3404633208031309
Epoch: 59, step: 735, loss: 0.3251115679740906, mean loss: 0.34046314215311896
Epoch: 59, step: 736, loss: 0.33670175075531006, mean loss: 0.34046309838190886
Epoch: 59, step: 737, loss: 0.33631670475006104, mean loss: 0.34046305013099964
Epoch: 59, step: 738, loss: 0.3080570697784424, mean loss: 0.34046267303225813
Epoch: 59, step: 739, loss: 0.3402291536331177, mean loss: 0.3404626703148941
Epoch: 59, step: 740, loss: 0.346053808927536, mean loss: 0.34046273537579463
Epoch: 59, step: 741, loss: 0.32326531410217285, mean loss: 0.3404625352615114
Epoch: 59, step: 742, loss: 0.3355724811553955, mean loss: 0.3404624783600568
Epoch: 59, step: 743, loss: 0.405457079410553, mean loss: 0.3404632346388682
Epoch: 59, step: 744, loss: 0.34017252922058105, mean loss: 0.340463231256252
Epoch: 59, step: 745, loss: 0.34387651085853577, mean loss: 0.340463270972335
Epoch: 59, step: 746, loss: 0.36357495188713074, mean loss: 0.34046353989104755
Epoch: 59, step: 747, loss: 0.3084246516227722, mean loss: 0.3404631671030895
Epoch: 59, step: 748, loss: 0.3454168140888214, mean loss: 0.34046322474049695
Epoch: 59, step: 749, loss: 0.3227101266384125, mean loss: 0.34046301817942254
Epoch: 59, step: 750, loss: 0.32373228669166565, mean loss: 0.3404628235160662
Epoch: 59, step: 751, loss: 0.3629559278488159, mean loss: 0.34046308522203184
Epoch: 59, step: 752, loss: 0.3434849977493286, mean loss: 0.3404631203813999
Epoch: 59, step: 753, loss: 0.32418563961982727, mean loss: 0.34046293099826136
Epoch: 59, step: 754, loss: 0.364262193441391, mean loss: 0.340463207891636
Epoch: 59, step: 755, loss: 0.3242521286010742, mean loss: 0.3404630192854454
Epoch: 59, step: 756, loss: 0.34317639470100403, mean loss: 0.3404630508535747
Epoch: 59, step: 757, loss: 0.3595251142978668, mean loss: 0.34046327262409665
Epoch: 59, step: 758, loss: 0.2954612970352173, mean loss: 0.3404627490713587
Epoch: 59, step: 759, loss: 0.3726266026496887, mean loss: 0.34046312326110206
Epoch: 59, step: 760, loss: 0.3503892719745636, mean loss: 0.340463238739175
Epoch: 59, step: 761, loss: 0.3110300600528717, mean loss: 0.340462896325686
Epoch: 59, step: 762, loss: 0.30810537934303284, mean loss: 0.3404625198960279
Epoch: 59, step: 763, loss: 0.3819563686847687, mean loss: 0.3404630026071585
Epoch: 59, step: 764, loss: 0.3184743821620941, mean loss: 0.34046274680952415
Epoch: 59, step: 765, loss: 0.3293082118034363, mean loss: 0.3404626170482924
Epoch: 59, step: 766, loss: 0.3226463496685028, mean loss: 0.34046240979322473
Epoch: 59, step: 767, loss: 0.3307560086250305, mean loss: 0.34046229688082924
Epoch: 59, step: 768, loss: 0.3672407865524292, mean loss: 0.3404626083853912
Epoch: 59, step: 769, loss: 0.35133954882621765, mean loss: 0.3404627349114648
Epoch: 59, step: 770, loss: 0.3309039771556854, mean loss: 0.34046262372045244
Epoch: 59, step: 771, loss: 0.3298436999320984, mean loss: 0.34046250019863283
Epoch: 59, step: 772, loss: 0.36335551738739014, mean loss: 0.3404627664924968
Epoch: 59, step: 773, loss: 0.30218207836151123, mean loss: 0.3404623212128861
Epoch: 59, step: 774, loss: 0.27313923835754395, mean loss: 0.34046153812227586
Epoch: 59, step: 775, loss: 0.3466925323009491, mean loss: 0.3404616105992937
Epoch: 59, step: 776, loss: 0.323459267616272, mean loss: 0.3404614128355425
Epoch: 59, step: 777, loss: 0.35367825627326965, mean loss: 0.3404615665662452
Epoch: 59, step: 778, loss: 0.33430930972099304, mean loss: 0.340461495007573
Epoch: 59, step: 779, loss: 0.4032408893108368, mean loss: 0.34046222520430586
Epoch: 59, step: 780, loss: 0.32717105746269226, mean loss: 0.34046207061449996
Epoch: 59, step: 781, loss: 0.33259037137031555, mean loss: 0.3404619790596924
Epoch: 59, step: 782, loss: 0.35399118065834045, mean loss: 0.34046213641441386
Epoch: 59, step: 783, loss: 0.3087386190891266, mean loss: 0.3404617674504999
Epoch: 59, step: 784, loss: 0.33400583267211914, mean loss: 0.34046169236490215
Epoch: 59, step: 785, loss: 0.36087194085121155, mean loss: 0.3404619297430567
Epoch: 59, step: 786, loss: 0.3390166461467743, mean loss: 0.3404619129341108
Epoch: 59, step: 787, loss: 0.3238392472267151, mean loss: 0.34046171961133326
Epoch: 59, step: 788, loss: 0.3018347918987274, mean loss: 0.34046127038265717
Epoch: 59, step: 789, loss: 0.3449041545391083, mean loss: 0.3404613220525122
Epoch: 59, step: 790, loss: 0.33811256289482117, mean loss: 0.3404612947372302
Epoch: 59, step: 791, loss: 0.3416062593460083, mean loss: 0.34046130805263014
Epoch: 59, step: 792, loss: 0.2986971437931061, mean loss: 0.3404608223606898
Epoch: 59, step: 793, loss: 0.3572990894317627, mean loss: 0.3404610181772623
Epoch: 59, step: 794, loss: 0.340363472700119, mean loss: 0.3404610170428939
Epoch: 59, step: 795, loss: 0.3191244602203369, mean loss: 0.3404607689203148
Epoch: 59, step: 796, loss: 0.3284401297569275, mean loss: 0.34046062913406283
Epoch: 59, step: 797, loss: 0.29492494463920593, mean loss: 0.340460099612416
Epoch: 59, step: 798, loss: 0.3123281002044678, mean loss: 0.34045977247712433
Epoch: 59, step: 799, loss: 0.3465815484523773, mean loss: 0.34045984366387694
Epoch: 59, step: 800, loss: 0.3679407835006714, mean loss: 0.34046016322083633
Epoch: 59, step: 801, loss: 0.3817288279533386, mean loss: 0.34046064310019086
Epoch: 59, step: 802, loss: 0.33328765630722046, mean loss: 0.34046055969239786
Epoch: 59, step: 803, loss: 0.30305010080337524, mean loss: 0.34046012468706194
Epoch: 59, step: 804, loss: 0.30640536546707153, mean loss: 0.34045972870609403
Epoch: 59, step: 805, loss: 0.29729294776916504, mean loss: 0.3404592267784535
Epoch: 59, step: 806, loss: 0.34833401441574097, mean loss: 0.34045931834255755
Epoch: 59, step: 807, loss: 0.33782699704170227, mean loss: 0.3404592877355939
Epoch: 59, step: 808, loss: 0.31315338611602783, mean loss: 0.3404589702435688
Epoch: 59, step: 809, loss: 0.29898178577423096, mean loss: 0.3404584879843721
Epoch: 59, step: 810, loss: 0.34560880064964294, mean loss: 0.34045854786685453
Epoch: 59, step: 811, loss: 0.29586124420166016, mean loss: 0.340458029341791
Epoch: 59, step: 812, loss: 0.37556886672973633, mean loss: 0.340458437564621
Epoch: 59, step: 813, loss: 0.3193032145500183, mean loss: 0.340458191602256
Epoch: 59, step: 814, loss: 0.3319772183895111, mean loss: 0.34045809299890045
Epoch: 59, step: 815, loss: 0.32625848054885864, mean loss: 0.34045792791016344
Epoch: 59, step: 816, loss: 0.31108930706977844, mean loss: 0.3404575864661859
Epoch: 59, step: 817, loss: 0.3648223280906677, mean loss: 0.34045786973102216
Epoch: 59, step: 818, loss: 0.335237592458725, mean loss: 0.34045780904070916
Epoch: 59, step: 819, loss: 0.3341592252254486, mean loss: 0.34045773581498584
Epoch: 59, step: 820, loss: 0.300266832113266, mean loss: 0.3404572685712584
Epoch: 59, step: 821, loss: 0.3438127934932709, mean loss: 0.34045730758082526
Epoch: 59, step: 822, loss: 0.36156684160232544, mean loss: 0.3404575529863057
Epoch: 59, step: 823, loss: 0.34261640906333923, mean loss: 0.3404575780834468
Epoch: 59, step: 824, loss: 0.3834823668003082, mean loss: 0.3404580782495541
Epoch: 59, step: 825, loss: 0.37039533257484436, mean loss: 0.3404584262681345
Epoch: 59, step: 826, loss: 0.3141779899597168, mean loss: 0.34045812076337056
Epoch: 59, step: 827, loss: 0.33756324648857117, mean loss: 0.34045808711143305
Epoch: 59, step: 828, loss: 0.3564763069152832, mean loss: 0.34045827331567374
Epoch: 59, step: 829, loss: 0.2912219762802124, mean loss: 0.3404577009736256
Epoch: 59, step: 830, loss: 0.38744401931762695, mean loss: 0.34045824715468903
Epoch: 59, step: 831, loss: 0.30659544467926025, mean loss: 0.34045785352932895
Epoch: 59, step: 832, loss: 0.31295740604400635, mean loss: 0.34045753386447775
Epoch: 59, step: 833, loss: 0.35316091775894165, mean loss: 0.3404576815267339
Epoch: 59, step: 834, loss: 0.30692893266677856, mean loss: 0.3404572917980447
Epoch: 59, step: 835, loss: 0.3050577938556671, mean loss: 0.34045688032908034
Epoch: 59, step: 836, loss: 0.3214181065559387, mean loss: 0.34045665903290595
Epoch: 59, step: 837, loss: 0.3825185000896454, mean loss: 0.3404571479307958
Epoch: 59, step: 838, loss: 0.339555025100708, mean loss: 0.3404571374452628
Epoch: 59, step: 839, loss: 0.3112480342388153, mean loss: 0.3404567979466435
Epoch: 59, step: 840, loss: 0.3001904785633087, mean loss: 0.34045632993498126
Epoch: 59, step: 841, loss: 0.4003312289714813, mean loss: 0.34045702584724136
Epoch: 59, step: 842, loss: 0.33024540543556213, mean loss: 0.34045690716129184
Epoch: 59, step: 843, loss: 0.3139839768409729, mean loss: 0.3404565994796284
Epoch: 59, step: 844, loss: 0.3327268362045288, mean loss: 0.34045650964148994
Epoch: 59, step: 845, loss: 0.33975905179977417, mean loss: 0.3404565015354738
Epoch: 59, step: 846, loss: 0.34265729784965515, mean loss: 0.3404565271133397
Epoch: 59, step: 847, loss: 0.3724241554737091, mean loss: 0.34045689863986517
Epoch: 59, step: 848, loss: 0.320472776889801, mean loss: 0.34045666638788363
Epoch: 59, step: 849, loss: 0.35166075825691223, mean loss: 0.3404567965983742
Epoch: 59, step: 850, loss: 0.3427368998527527, mean loss: 0.3404568230967211
Epoch: 59, step: 851, loss: 0.31767699122428894, mean loss: 0.34045655836271366
Epoch: 59, step: 852, loss: 0.2756856679916382, mean loss: 0.3404558056417015
Epoch: 59, step: 853, loss: 0.3197536766529083, mean loss: 0.340455565059145
Epoch: 59, step: 854, loss: 0.34129300713539124, mean loss: 0.3404555747910723
Epoch: 59, step: 855, loss: 0.3342604637145996, mean loss: 0.34045550279842746
Epoch: 59, step: 856, loss: 0.35962143540382385, mean loss: 0.34045572552084974
Epoch: 59, step: 857, loss: 0.3329616189002991, mean loss: 0.34045563843475707
Epoch: 59, step: 858, loss: 0.30365869402885437, mean loss: 0.3404552108367743
Epoch: 59, step: 859, loss: 0.32719025015830994, mean loss: 0.3404550566934179
Epoch: 59, step: 860, loss: 0.30888256430625916, mean loss: 0.34045468981457727
Epoch: 59, step: 861, loss: 0.32153990864753723, mean loss: 0.34045447002349255
Epoch: 59, step: 862, loss: 0.3344164490699768, mean loss: 0.3404543998620806
Epoch: 59, step: 863, loss: 0.3369596302509308, mean loss: 0.34045435925355616
Epoch: 59, step: 864, loss: 0.33041107654571533, mean loss: 0.3404542425539744
Epoch: 59, step: 865, loss: 0.3468814790248871, mean loss: 0.34045431723544206
Epoch: 59, step: 866, loss: 0.3377320170402527, mean loss: 0.3404542856039605
Epoch: 59, step: 867, loss: 0.33536791801452637, mean loss: 0.3404542265041326
Epoch: 59, step: 868, loss: 0.32859745621681213, mean loss: 0.3404540887388356
Epoch: 59, step: 869, loss: 0.34040534496307373, mean loss: 0.3404540881724821
Epoch: 59, step: 870, loss: 0.3465108275413513, mean loss: 0.3404541585448591
Epoch: 59, step: 871, loss: 0.31478267908096313, mean loss: 0.34045386027512514
Epoch: 59, step: 872, loss: 0.30115512013435364, mean loss: 0.34045340367936894
Epoch: 59, step: 873, loss: 0.3452802300453186, mean loss: 0.3404534597596102
Epoch: 59, step: 874, loss: 0.3359676003456116, mean loss: 0.340453407641482
Epoch: 59, step: 875, loss: 0.30876997113227844, mean loss: 0.3404530395376096
Epoch: 59, step: 876, loss: 0.3123539090156555, mean loss: 0.34045271308064257
Epoch: 59, step: 877, loss: 0.3318049907684326, mean loss: 0.34045261261218157
Epoch: 59, step: 878, loss: 0.3008975386619568, mean loss: 0.34045215307022453
Epoch: 59, step: 879, loss: 0.33676859736442566, mean loss: 0.3404521102759996
Epoch: 59, step: 880, loss: 0.359783411026001, mean loss: 0.34045233485748766
Epoch: 59, step: 881, loss: 0.3621014654636383, mean loss: 0.34045258636345443
Epoch: 59, step: 882, loss: 0.3367370665073395, mean loss: 0.3404525431993859
Epoch: 59, step: 883, loss: 0.3387462794780731, mean loss: 0.340452523377549
Epoch: 59, step: 884, loss: 0.36083874106407166, mean loss: 0.3404527602035348
Epoch: 59, step: 885, loss: 0.3163292706012726, mean loss: 0.3404524799650459
Epoch: 59, step: 886, loss: 0.3254116475582123, mean loss: 0.34045230524027553
Epoch: 59, step: 887, loss: 0.3140794038772583, mean loss: 0.3404519988778695
Epoch: 59, step: 888, loss: 0.33524155616760254, mean loss: 0.34045193835114923
Epoch: 59, step: 889, loss: 0.307203084230423, mean loss: 0.34045155212279476
Epoch: 59, step: 890, loss: 0.30751603841781616, mean loss: 0.3404511695387379
Epoch: 59, step: 891, loss: 0.35047560930252075, mean loss: 0.34045128598283886
Epoch: 59, step: 892, loss: 0.31062909960746765, mean loss: 0.34045093957172506
Epoch: 59, step: 893, loss: 0.3322555422782898, mean loss: 0.3404508443760311
Epoch: 59, step: 894, loss: 0.3910430073738098, mean loss: 0.34045143203517086
Epoch: 59, step: 895, loss: 0.3156125247478485, mean loss: 0.3404511435193124
Epoch: 59, step: 896, loss: 0.32695794105529785, mean loss: 0.3404509867910945
Epoch: 59, step: 897, loss: 0.38610726594924927, mean loss: 0.3404515170984232
Epoch: 59, step: 898, loss: 0.328020840883255, mean loss: 0.3404513727151696
Epoch: 59, step: 899, loss: 0.31121960282325745, mean loss: 0.3404510331898735
Epoch: 59, step: 900, loss: 0.35489925742149353, mean loss: 0.34045120100320303
Epoch: 59, step: 901, loss: 0.3905659019947052, mean loss: 0.34045178306900004
Epoch: 59, step: 902, loss: 0.3538934886455536, mean loss: 0.3404519391881835
Epoch: 59, step: 903, loss: 0.3629383444786072, mean loss: 0.3404522003543309
Epoch: 59, step: 904, loss: 0.3452417552471161, mean loss: 0.34045225598150003
Epoch: 59, step: 905, loss: 0.3166019916534424, mean loss: 0.3404519789813801
Epoch: 59, step: 906, loss: 0.3230983018875122, mean loss: 0.34045177743582306
Epoch: 59, step: 907, loss: 0.36137211322784424, mean loss: 0.34045202040172234
Epoch: 59, step: 908, loss: 0.34845536947250366, mean loss: 0.34045211335043696
Epoch: 59, step: 909, loss: 0.36537081003189087, mean loss: 0.34045240274602706
Epoch: 59, step: 910, loss: 0.3134075701236725, mean loss: 0.3404520886620081
Epoch: 59, step: 911, loss: 0.30389392375946045, mean loss: 0.34045166410023797
Epoch: 59, step: 912, loss: 0.3042292296886444, mean loss: 0.34045124344229966
Epoch: 59, step: 913, loss: 0.35203316807746887, mean loss: 0.3404513779438051
Epoch: 59, step: 914, loss: 0.3391513228416443, mean loss: 0.3404513628463715
Epoch: 59, step: 915, loss: 0.3625302314758301, mean loss: 0.34045161924348954
Epoch: 59, step: 916, loss: 0.3220973312854767, mean loss: 0.3404514061015951
Epoch: 59, step: 917, loss: 0.3206291198730469, mean loss: 0.34045117591502577
Epoch: 59, step: 918, loss: 0.32824528217315674, mean loss: 0.3404510341755641
Epoch: 59, step: 919, loss: 0.30482059717178345, mean loss: 0.3404506204262376
Epoch: 59, step: 920, loss: 0.33384138345718384, mean loss: 0.3404505436790568
Epoch: 59, step: 921, loss: 0.3094257712364197, mean loss: 0.34045018342019756
Epoch: 59, step: 922, loss: 0.3286108076572418, mean loss: 0.3404500459432672
Epoch: 59, step: 923, loss: 0.3476358950138092, mean loss: 0.34045012938322394
Epoch: 59, step: 924, loss: 0.3533743917942047, mean loss: 0.34045027945419865
Epoch: 59, step: 925, loss: 0.3179055452346802, mean loss: 0.340450017677484
Epoch: 59, step: 926, loss: 0.31325143575668335, mean loss: 0.3404497018665866
Epoch: 59, step: 927, loss: 0.41379550099372864, mean loss: 0.34045055349678405
Epoch: 59, step: 928, loss: 0.3334433436393738, mean loss: 0.34045047213585683
Epoch: 59, step: 929, loss: 0.3269740641117096, mean loss: 0.34045031566268935
Epoch: 59, step: 930, loss: 0.310149222612381, mean loss: 0.3404499638439444
Epoch: 59, step: 931, loss: 0.33405131101608276, mean loss: 0.34044988955157923
Epoch: 59, step: 932, loss: 0.3167758882045746, mean loss: 0.34044961468479396
Epoch: 59, step: 933, loss: 0.3451766073703766, mean loss: 0.3404496695668639
Epoch: 59, step: 934, loss: 0.38074302673339844, mean loss: 0.3404501373816712
Epoch: 59, step: 935, loss: 0.3595658242702484, mean loss: 0.340450359316456
Epoch: 59, step: 936, loss: 0.35854703187942505, mean loss: 0.34045056941795676
Epoch: 59, step: 937, loss: 0.325910359621048, mean loss: 0.34045040060877807
Epoch: 59, step: 938, loss: 0.3258132338523865, mean loss: 0.3404502306759197
Epoch: 59, step: 939, loss: 0.3396221995353699, mean loss: 0.34045022106285266
Epoch: 59, step: 940, loss: 0.4404374659061432, mean loss: 0.340451381856064
Epoch: 59, step: 941, loss: 0.3415258526802063, mean loss: 0.34045139432989463
Epoch: 59, step: 942, loss: 0.3014880418777466, mean loss: 0.3404509419987502
Epoch: 59, step: 943, loss: 0.3259340822696686, mean loss: 0.3404507734724009
Epoch: 59, step: 944, loss: 0.3022802770137787, mean loss: 0.3404503303559237
Epoch: 59, step: 945, loss: 0.30511245131492615, mean loss: 0.34044992012770703
Epoch: 59, step: 946, loss: 0.32734742760658264, mean loss: 0.34044976802605603
Epoch: 59, step: 947, loss: 0.34882497787475586, mean loss: 0.34044986524942444
Epoch: 59, step: 948, loss: 0.32450467348098755, mean loss: 0.3404496801523002
Epoch: 59, step: 949, loss: 0.30388733744621277, mean loss: 0.3404492557293124
Epoch: 59, step: 950, loss: 0.3421993851661682, mean loss: 0.34044927604492914
Epoch: 59, step: 951, loss: 0.33884623646736145, mean loss: 0.3404492574369571
Epoch: 59, step: 952, loss: 0.33494409918785095, mean loss: 0.34044919353420433
Epoch: 59, step: 953, loss: 0.33059608936309814, mean loss: 0.3404490791627108
Epoch: 59, step: 954, loss: 0.2898325026035309, mean loss: 0.3404484916294661
Epoch: 59, step: 955, loss: 0.3450131416320801, mean loss: 0.34044854461314616
Epoch: 59, step: 956, loss: 0.34181857109069824, mean loss: 0.3404485605153954
Epoch: 59, step: 957, loss: 0.3393370509147644, mean loss: 0.3404485476139677
Epoch: 59, step: 958, loss: 0.35416939854621887, mean loss: 0.3404487068717117
Epoch: 59, step: 959, loss: 0.31090259552001953, mean loss: 0.3404483639343498
Epoch: 59, step: 960, loss: 0.34686174988746643, mean loss: 0.34044843837271177
Epoch: 59, step: 961, loss: 0.31544625759124756, mean loss: 0.340448148182819
Epoch: 59, step: 962, loss: 0.30938345193862915, mean loss: 0.34044778763202055
Epoch: 59, step: 963, loss: 0.32352548837661743, mean loss: 0.3404475912265046
Epoch: 59, step: 964, loss: 0.3322473466396332, mean loss: 0.340447496052997
Epoch: 59, step: 965, loss: 0.3189997673034668, mean loss: 0.34044724712970426
Epoch: 59, step: 966, loss: 0.3893175423145294, mean loss: 0.3404478143139386
Epoch: 59, step: 967, loss: 0.3309464156627655, mean loss: 0.34044770404284336
Epoch: 59, step: 968, loss: 0.3621580898761749, mean loss: 0.340447956005773
Epoch: 59, step: 969, loss: 0.3122520446777344, mean loss: 0.3404476287779647
Epoch: 59, step: 970, loss: 0.2904249429702759, mean loss: 0.3404470482461392
Epoch: 59, step: 971, loss: 0.35554957389831543, mean loss: 0.34044722351451784
Epoch: 59, step: 972, loss: 0.38849663734436035, mean loss: 0.3404477811328473
Epoch: 59, step: 973, loss: 0.3133571147918701, mean loss: 0.3404474667465604
Epoch: 59, step: 974, loss: 0.3299408555030823, mean loss: 0.3404473448190994
Epoch: 59, step: 975, loss: 0.331457257270813, mean loss: 0.34044724049185215
Epoch: 59, step: 976, loss: 0.3652339577674866, mean loss: 0.3404475281308722
Epoch: 59, step: 977, loss: 0.3337832987308502, mean loss: 0.3404474507963003
Epoch: 59, step: 978, loss: 0.38032102584838867, mean loss: 0.34044791350097164
Epoch: 59, step: 979, loss: 0.3420976996421814, mean loss: 0.3404479326453522
Epoch: 59, step: 980, loss: 0.35877710580825806, mean loss: 0.34044814533752255
Epoch: 59, step: 981, loss: 0.3462061882019043, mean loss: 0.3404482121532164
Epoch: 59, step: 982, loss: 0.3594125807285309, mean loss: 0.3404484322111026
Epoch: 59, step: 983, loss: 0.35839155316352844, mean loss: 0.34044864041626566
Epoch: 59, step: 984, loss: 0.31417933106422424, mean loss: 0.3404483356007106
Epoch: 59, step: 985, loss: 0.3328293561935425, mean loss: 0.3404482471950179
Epoch: 59, step: 986, loss: 0.3662872612476349, mean loss: 0.3404485470106898
Epoch: 59, step: 987, loss: 0.4034664034843445, mean loss: 0.34044927821203197
Epoch: 59, step: 988, loss: 0.3398754894733429, mean loss: 0.3404492715543916
Epoch: 59, step: 989, loss: 0.3534248173236847, mean loss: 0.3404494221072165
Epoch: 59, step: 990, loss: 0.3356788158416748, mean loss: 0.34044936675540866
Epoch: 59, step: 991, loss: 0.36375540494918823, mean loss: 0.3404496371647254
Epoch: 59, step: 992, loss: 0.38103923201560974, mean loss: 0.3404501081017922
Epoch: 59, step: 993, loss: 0.3419351577758789, mean loss: 0.3404501253317455
Epoch: 59, step: 994, loss: 0.3547573387622833, mean loss: 0.34045029132603066
Epoch: 59, step: 995, loss: 0.3258291482925415, mean loss: 0.3404501216914586
Epoch: 59, step: 996, loss: 0.3616560399532318, mean loss: 0.3404503677197702
Epoch: 59, step: 997, loss: 0.35292840003967285, mean loss: 0.34045051248660224
Epoch: 59, step: 998, loss: 0.3363087773323059, mean loss: 0.3404504644358434
Epoch: 59, step: 999, loss: 0.3365051746368408, mean loss: 0.3404504186646963
Epoch: 59, step: 1000, loss: 0.3337826728820801, mean loss: 0.3404503413099649
Epoch: 59, step: 1001, loss: 0.29714423418045044, mean loss: 0.3404498389072742
Epoch: 59, step: 1002, loss: 0.30686575174331665, mean loss: 0.3404494492961747
Epoch: 59, step: 1003, loss: 0.3320600092411041, mean loss: 0.34044935197088405
Epoch: 59, step: 1004, loss: 0.32692110538482666, mean loss: 0.34044919503248905
Epoch: 59, step: 1005, loss: 0.3321203887462616, mean loss: 0.34044909841284815
Epoch: 59, step: 1006, loss: 0.3258633315563202, mean loss: 0.3404489292103047
Epoch: 59, step: 1007, loss: 0.37128105759620667, mean loss: 0.34044928687501147
Epoch: 59, step: 1008, loss: 0.3157700300216675, mean loss: 0.3404490005893337
Epoch: 59, step: 1009, loss: 0.326140820980072, mean loss: 0.34044883461272407
Epoch: 59, step: 1010, loss: 0.3153567910194397, mean loss: 0.3404485435453677
Epoch: 59, step: 1011, loss: 0.3173462748527527, mean loss: 0.34044827556248103
Epoch: 59, step: 1012, loss: 0.29572540521621704, mean loss: 0.34044775678984307
Epoch: 59, step: 1013, loss: 0.3294192850589752, mean loss: 0.34044762886417634
Epoch: 59, step: 1014, loss: 0.3740217387676239, mean loss: 0.34044801830531385
Epoch: 59, step: 1015, loss: 0.32567891478538513, mean loss: 0.34044784699385466
Epoch: 59, step: 1016, loss: 0.36210867762565613, mean loss: 0.34044809824170164
Epoch: 59, step: 1017, loss: 0.3162574768066406, mean loss: 0.3404478176536134
Epoch: 59, step: 1018, loss: 0.3856150209903717, mean loss: 0.34044834154392645
Epoch: 59, step: 1019, loss: 0.3645744025707245, mean loss: 0.340448621376684
Epoch: 59, step: 1020, loss: 0.33623605966567993, mean loss: 0.3404485725166946
Epoch: 59, step: 1021, loss: 0.32543331384658813, mean loss: 0.3404483983621251
Epoch: 59, step: 1022, loss: 0.31219005584716797, mean loss: 0.3404480706113681
Epoch: 59, step: 1023, loss: 0.2958381772041321, mean loss: 0.3404475532152488
Epoch: 59, step: 1024, loss: 0.3620224595069885, mean loss: 0.34044780344322445
Epoch: 59, step: 1025, loss: 0.30901193618774414, mean loss: 0.34044743885104084
Epoch: 59, step: 1026, loss: 0.3118709325790405, mean loss: 0.3404471074254784
Epoch: 59, step: 1027, loss: 0.31413203477859497, mean loss: 0.34044680223118623
Epoch: 59, step: 1028, loss: 0.3043116629123688, mean loss: 0.3404463831515768
Epoch: 59, step: 1029, loss: 0.4143231511116028, mean loss: 0.3404472399322226
Epoch: 59, step: 1030, loss: 0.3334124684333801, mean loss: 0.3404471583478987
Epoch: 59, step: 1031, loss: 0.3458004295825958, mean loss: 0.3404472204306471
Epoch: 59, step: 1032, loss: 0.32655516266822815, mean loss: 0.3404470593240848
Epoch: 59, step: 1033, loss: 0.34655529260635376, mean loss: 0.3404471301606067
Epoch: 59, step: 1034, loss: 0.33296719193458557, mean loss: 0.3404470434175766
Epoch: 59, step: 1035, loss: 0.3060944378376007, mean loss: 0.3404466450433584
Epoch: 59, step: 1036, loss: 0.34704136848449707, mean loss: 0.3404467215189935
Epoch: 59, step: 1037, loss: 0.30996736884117126, mean loss: 0.3404463680696269
Epoch: 59, step: 1038, loss: 0.3114249110221863, mean loss: 0.34044603153043695
Epoch: 59, step: 1039, loss: 0.3155122697353363, mean loss: 0.3404457423964118
Epoch: 59, step: 1040, loss: 0.35690972208976746, mean loss: 0.34044593331190853
Epoch: 59, step: 1041, loss: 0.3258243501186371, mean loss: 0.34044576376271685
Epoch: 59, step: 1042, loss: 0.3123364746570587, mean loss: 0.3404454378163457
Epoch: 59, step: 1043, loss: 0.34213826060295105, mean loss: 0.3404454574455524
Epoch: 59, step: 1044, loss: 0.31367310881614685, mean loss: 0.34044514700911693
Epoch: 59, step: 1045, loss: 0.30911460518836975, mean loss: 0.340444783722762
Epoch: 59, step: 1046, loss: 0.3084010183811188, mean loss: 0.34044441217069005
Epoch: 59, step: 1047, loss: 0.3163313865661621, mean loss: 0.3404441325799289
Epoch: 59, step: 1048, loss: 0.32955896854400635, mean loss: 0.34044400636781186
Epoch: 59, step: 1049, loss: 0.32259446382522583, mean loss: 0.3404437994069958
Epoch: 59, step: 1050, loss: 0.316438227891922, mean loss: 0.3404435210718478
Epoch: 59, step: 1051, loss: 0.3453279733657837, mean loss: 0.34044357770449196
Epoch: 59, step: 1052, loss: 0.3365113139152527, mean loss: 0.3404435321124991
Epoch: 59, step: 1053, loss: 0.3351484537124634, mean loss: 0.3404434707202858
Epoch: 59, step: 1054, loss: 0.3815065324306488, mean loss: 0.34044394680823503
Epoch: 59, step: 1055, loss: 0.34284523129463196, mean loss: 0.340443974648569
Epoch: 59, step: 1056, loss: 0.31756338477134705, mean loss: 0.3404437093755944
Epoch: 59, step: 1057, loss: 0.31628841161727905, mean loss: 0.3404434293271589
Epoch: 59, step: 1058, loss: 0.31676235795021057, mean loss: 0.34044315477992826
Epoch: 59, step: 1059, loss: 0.306689977645874, mean loss: 0.3404427634659659
Epoch: 59, step: 1060, loss: 0.3736695349216461, mean loss: 0.3404431486726327
Epoch: 59, step: 1061, loss: 0.33204612135887146, mean loss: 0.34044305132482366
Epoch: 59, step: 1062, loss: 0.37817758321762085, mean loss: 0.3404434887809951
Epoch: 59, step: 1063, loss: 0.3621983826160431, mean loss: 0.34044374098240754
Epoch: 59, step: 1064, loss: 0.3548709750175476, mean loss: 0.34044390823335563
Epoch: 59, step: 1065, loss: 0.3501301407814026, mean loss: 0.3404440205218784
Epoch: 59, step: 1066, loss: 0.33312442898750305, mean loss: 0.34044393566983827
Epoch: 59, step: 1067, loss: 0.30298036336898804, mean loss: 0.3404435013800731
Epoch: 59, step: 1068, loss: 0.3139702379703522, mean loss: 0.34044319449705673
Epoch: 59, step: 1069, loss: 0.3161320388317108, mean loss: 0.3404429126808642
Epoch: 59, step: 1070, loss: 0.3036997318267822, mean loss: 0.34044248675692046
Epoch: 59, step: 1071, loss: 0.350568562746048, mean loss: 0.3404426041362035
Epoch: 59, step: 1072, loss: 0.3460717797279358, mean loss: 0.34044266938763323
Epoch: 59, step: 1073, loss: 0.30474722385406494, mean loss: 0.3404422556233405
Epoch: 59, step: 1074, loss: 0.3347621560096741, mean loss: 0.3404421897831438
Epoch: 59, step: 1075, loss: 0.3620602786540985, mean loss: 0.3404424403637362
Epoch: 59, step: 1076, loss: 0.33617183566093445, mean loss: 0.3404423908626791
Epoch: 59, step: 1077, loss: 0.337138295173645, mean loss: 0.34044235256498
Epoch: 59, step: 1078, loss: 0.3358413875102997, mean loss: 0.34044229923591535
Epoch: 59, step: 1079, loss: 0.31089362502098083, mean loss: 0.3404419567458345
Epoch: 59, step: 1080, loss: 0.3287433683872223, mean loss: 0.34044182115247407
Epoch: 59, step: 1081, loss: 0.3362518548965454, mean loss: 0.3404417725889207
Epoch: 59, step: 1082, loss: 0.34633010625839233, mean loss: 0.340441840836509
Epoch: 59, step: 1083, loss: 0.32040300965309143, mean loss: 0.34044160858301825
Epoch: 59, step: 1084, loss: 0.36704280972480774, mean loss: 0.34044191689192915
Epoch: 59, step: 1085, loss: 0.3231496214866638, mean loss: 0.3404417164759049
Epoch: 59, step: 1086, loss: 0.35082462430000305, mean loss: 0.34044183681140344
Epoch: 59, step: 1087, loss: 0.3216789662837982, mean loss: 0.3404416193565969
Epoch: 59, step: 1088, loss: 0.3173855245113373, mean loss: 0.3404413521479877
Epoch: 59, step: 1089, loss: 0.3558046519756317, mean loss: 0.3404415301988862
Epoch: 59, step: 1090, loss: 0.3359934985637665, mean loss: 0.34044147864961877
Epoch: 59, step: 1091, loss: 0.34132784605026245, mean loss: 0.3404414889218165
Epoch: 59, step: 1092, loss: 0.37775006890296936, mean loss: 0.34044192128955725
Epoch: 59, step: 1093, loss: 0.31855133175849915, mean loss: 0.34044166760327227
Epoch: 59, step: 1094, loss: 0.32147902250289917, mean loss: 0.34044144785097946
Epoch: 59, step: 1095, loss: 0.3626748323440552, mean loss: 0.34044170550388464
Epoch: 59, step: 1096, loss: 0.32846924662590027, mean loss: 0.3404415667619371
Epoch: 59, step: 1097, loss: 0.3438797891139984, mean loss: 0.3404416066050589
Epoch: 59, step: 1098, loss: 0.2896750271320343, mean loss: 0.3404410183139705
Epoch: 59, step: 1099, loss: 0.3048747777938843, mean loss: 0.34044060617157085
Epoch: 59, step: 1100, loss: 0.36232811212539673, mean loss: 0.34044085980154587
Epoch: 59, step: 1101, loss: 0.3180050551891327, mean loss: 0.34044059982095987
Epoch: 59, step: 1102, loss: 0.41952991485595703, mean loss: 0.3404415162778717
Epoch: 59, step: 1103, loss: 0.32132673263549805, mean loss: 0.34044129478559315
Epoch: 59, step: 1104, loss: 0.3077133893966675, mean loss: 0.3404409155558578
Epoch: 59, step: 1105, loss: 0.3201356530189514, mean loss: 0.3404406802743749
Epoch: 59, step: 1106, loss: 0.3134191930294037, mean loss: 0.340440367174167
Epoch: 59, step: 1107, loss: 0.34958019852638245, mean loss: 0.3404404730769218
Epoch: 59, step: 1108, loss: 0.33046698570251465, mean loss: 0.3404403575159766
Epoch: 59, step: 1109, loss: 0.3785857558250427, mean loss: 0.3404407994944985
Epoch: 59, step: 1110, loss: 0.38809818029403687, mean loss: 0.34044135167891926
Epoch: 59, step: 1111, loss: 0.3379998803138733, mean loss: 0.34044132339102745
Epoch: 59, step: 1112, loss: 0.33229511976242065, mean loss: 0.340441229006854
Epoch: 59, step: 1113, loss: 0.3505117893218994, mean loss: 0.3404413456858056
Epoch: 59, step: 1114, loss: 0.29830965399742126, mean loss: 0.3404408575476576
Epoch: 59, step: 1115, loss: 0.31237345933914185, mean loss: 0.34044053236230437
Epoch: 59, step: 1116, loss: 0.3287024199962616, mean loss: 0.3404403963675832
Epoch: 59, step: 1117, loss: 0.2955249845981598, mean loss: 0.3404398759953172
Epoch: 59, step: 1118, loss: 0.3124890625476837, mean loss: 0.3404395521719557
Epoch: 59, step: 1119, loss: 0.37703144550323486, mean loss: 0.34043997610139326
Epoch: 59, step: 1120, loss: 0.34593069553375244, mean loss: 0.3404400397124946
Epoch: 59, step: 1121, loss: 0.3381010591983795, mean loss: 0.34044001261524354
Epoch: 59, step: 1122, loss: 0.35078349709510803, mean loss: 0.3404401324438384
Epoch: 59, step: 1123, loss: 0.2932032346725464, mean loss: 0.3404395852137901
Epoch: 59, step: 1124, loss: 0.34685084223747253, mean loss: 0.3404396594860648
Epoch: 59, step: 1125, loss: 0.32180505990982056, mean loss: 0.34043944361294354
Epoch: 59, step: 1126, loss: 0.3300861120223999, mean loss: 0.3404393236758284
Epoch: 59, step: 1127, loss: 0.3238518238067627, mean loss: 0.3404391315218519
Epoch: 59, step: 1128, loss: 0.363506555557251, mean loss: 0.34043939873788476
Epoch: 59, step: 1129, loss: 0.39507797360420227, mean loss: 0.340440031670893
Epoch: 59, step: 1130, loss: 0.312677264213562, mean loss: 0.34043971007084367
Epoch: 59, step: 1131, loss: 0.39128023386001587, mean loss: 0.34044029899360095
Epoch: 59, step: 1132, loss: 0.36159804463386536, mean loss: 0.34044054407631524
Epoch: 59, step: 1133, loss: 0.35406315326690674, mean loss: 0.3404407018732478
Epoch: 59, step: 1134, loss: 0.4193042814731598, mean loss: 0.34044161537569306
Epoch: 59, step: 1135, loss: 0.3250163197517395, mean loss: 0.34044143670155574
Epoch: 59, step: 1136, loss: 0.30185002088546753, mean loss: 0.34044098969501346
Epoch: 59, step: 1137, loss: 0.29906630516052246, mean loss: 0.34044051045526397
Epoch: 59, step: 1138, loss: 0.3218073844909668, mean loss: 0.3404402946317166
Epoch: 59, step: 1139, loss: 0.3287585973739624, mean loss: 0.3404401593266613
Epoch: 59, step: 1140, loss: 0.3308543562889099, mean loss: 0.3404400482989091
Epoch: 59, step: 1141, loss: 0.33425140380859375, mean loss: 0.34043997661964287
Epoch: 59, step: 1142, loss: 0.30619117617607117, mean loss: 0.34043957994142743
Epoch: 59, step: 1143, loss: 0.3236430585384369, mean loss: 0.3404393854021478
Epoch: 59, step: 1144, loss: 0.3015597462654114, mean loss: 0.34043893509882567
Epoch: 59, step: 1145, loss: 0.35045748949050903, mean loss: 0.34043905113220907
Epoch: 59, step: 1146, loss: 0.3217303156852722, mean loss: 0.3404388344529711
Epoch: 59, step: 1147, loss: 0.3090818524360657, mean loss: 0.3404384712895548
Epoch: 59, step: 1148, loss: 0.3380419909954071, mean loss: 0.3404384435348464
Epoch: 59, step: 1149, loss: 0.35117265582084656, mean loss: 0.3404385678511122
Epoch: 59, step: 1150, loss: 0.35671159625053406, mean loss: 0.3404387563119551
Epoch: 59, step: 1151, loss: 0.3170941472053528, mean loss: 0.34043848595700643
Epoch: 59, step: 1152, loss: 0.3418399393558502, mean loss: 0.34043850218711214
Epoch: 59, step: 1153, loss: 0.3405112624168396, mean loss: 0.34043850302973205
Epoch: 59, step: 1154, loss: 0.32004597783088684, mean loss: 0.3404382668712023
Epoch: 59, step: 1155, loss: 0.34327587485313416, mean loss: 0.3404382997321434
Epoch: 59, step: 1156, loss: 0.36637961864471436, mean loss: 0.34043860014230765
Epoch: 59, step: 1157, loss: 0.32884547114372253, mean loss: 0.34043846589109755
Epoch: 59, step: 1158, loss: 0.3132513463497162, mean loss: 0.3404381510613883
Epoch: 59, step: 1159, loss: 0.3652089238166809, mean loss: 0.3404384379062254
Epoch: 59, step: 1160, loss: 0.33737167716026306, mean loss: 0.34043840239363526
Epoch: 59, step: 1161, loss: 0.3403256833553314, mean loss: 0.34043840108838225
Epoch: 59, step: 1162, loss: 0.34050241112709045, mean loss: 0.3404384018295909
Epoch: 59, step: 1163, loss: 0.2957696318626404, mean loss: 0.34043788459047597
Epoch: 59, step: 1164, loss: 0.335243821144104, mean loss: 0.3404378244468527
Epoch: 59, step: 1165, loss: 0.3395163118839264, mean loss: 0.34043781377650506
Epoch: 59, step: 1166, loss: 0.3287161588668823, mean loss: 0.3404376780510797
Epoch: 59, step: 1167, loss: 0.3180963695049286, mean loss: 0.3404374193633331
Epoch: 59, step: 1168, loss: 0.3011297881603241, mean loss: 0.3404369642295266
Epoch: 59, step: 1169, loss: 0.3378185033798218, mean loss: 0.34043693391133595
Epoch: 59, step: 1170, loss: 0.3456084430217743, mean loss: 0.34043699378963566
Epoch: 59, step: 1171, loss: 0.33053070306777954, mean loss: 0.34043687909101206
Epoch: 59, step: 1172, loss: 0.3762487471103668, mean loss: 0.34043729372899584
Epoch: 59, step: 1173, loss: 0.3430427610874176, mean loss: 0.3404373238953425
Epoch: 59, step: 1174, loss: 0.3420925438404083, mean loss: 0.34043734305941314
Epoch: 59, step: 1175, loss: 0.30731940269470215, mean loss: 0.34043695962565723
Epoch: 59, step: 1176, loss: 0.33943766355514526, mean loss: 0.340436948056115
Epoch: 59, step: 1177, loss: 0.3244595527648926, mean loss: 0.34043676307689336
Epoch: 59, step: 1178, loss: 0.3410763740539551, mean loss: 0.3404367704819408
Epoch: 59, step: 1179, loss: 0.3244948089122772, mean loss: 0.34043658591722875
Epoch: 59, step: 1180, loss: 0.3813232481479645, mean loss: 0.34043705926849394
Epoch: 59, step: 1181, loss: 0.30680394172668457, mean loss: 0.3404366698971547
Epoch: 59, step: 1182, loss: 0.3565191924571991, mean loss: 0.34043685608271557
Epoch: 59, step: 1183, loss: 0.32523128390312195, mean loss: 0.34043668005154887
Epoch: 59, step: 1184, loss: 0.32719406485557556, mean loss: 0.3404365267468268
Epoch: 59, step: 1185, loss: 0.3307276666164398, mean loss: 0.34043641435234495
Epoch: 59, step: 1186, loss: 0.32197460532188416, mean loss: 0.34043620063194824
Epoch: 59, step: 1187, loss: 0.3085307776927948, mean loss: 0.34043583128782273
Epoch: 59, step: 1188, loss: 0.3305843472480774, mean loss: 0.34043571724621785
Epoch: 59, step: 1189, loss: 0.31368890404701233, mean loss: 0.34043540762645075
Epoch: 59, step: 1190, loss: 0.3363521099090576, mean loss: 0.3404353603589485
Epoch: 59, step: 1191, loss: 0.38292109966278076, mean loss: 0.34043585216034805
Epoch: 59, step: 1192, loss: 0.3429681360721588, mean loss: 0.34043588147292153
Epoch: 59, step: 1193, loss: 0.33882439136505127, mean loss: 0.34043586281925664
Epoch: 59, step: 1194, loss: 0.3119140863418579, mean loss: 0.3404355326717126
Epoch: 59, step: 1195, loss: 0.3223022520542145, mean loss: 0.3404353227763448
Epoch: 59, step: 1196, loss: 0.2956169843673706, mean loss: 0.340434804003546
Epoch: 59, step: 1197, loss: 0.3116971552371979, mean loss: 0.3404344713687708
Epoch: 59, step: 1198, loss: 0.3284900486469269, mean loss: 0.34043433311513666
Epoch: 59, step: 1199, loss: 0.3020192086696625, mean loss: 0.34043388847505557
Epoch: 59, step: 1200, loss: 0.32264724373817444, mean loss: 0.34043368260396356
Epoch: 59, step: 1201, loss: 0.3160052001476288, mean loss: 0.3404333998603531
Epoch: 59, step: 1202, loss: 0.2973390817642212, mean loss: 0.3404329010777503
Epoch: 59, step: 1203, loss: 0.2982145845890045, mean loss: 0.34043241243982797
Epoch: 59, step: 1204, loss: 0.28275731205940247, mean loss: 0.34043174491166994
Epoch: 59, step: 1205, loss: 0.34917256236076355, mean loss: 0.3404318460761968
Epoch: 59, step: 1206, loss: 0.32791373133659363, mean loss: 0.34043170119564015
Epoch: 59, step: 1207, loss: 0.328061580657959, mean loss: 0.3404315580295768
Epoch: 59, step: 1208, loss: 0.3315109312534332, mean loss: 0.3404314547875564
Epoch: 59, step: 1209, loss: 0.3404088318347931, mean loss: 0.3404314545257348
Epoch: 59, step: 1210, loss: 0.32509127259254456, mean loss: 0.3404312769917163
Epoch: 59, step: 1211, loss: 0.30282145738601685, mean loss: 0.34043084173318
Epoch: 59, step: 1212, loss: 0.3392723798751831, mean loss: 0.34043082832645316
Epoch: 59, step: 1213, loss: 0.31669700145721436, mean loss: 0.34043055366117286
Epoch: 59, step: 1214, loss: 0.3033094108104706, mean loss: 0.3404301240730087
Epoch: 59, step: 1215, loss: 0.30812132358551025, mean loss: 0.34042975018048816
Epoch: 59, step: 1216, loss: 0.37542784214019775, mean loss: 0.340430155190058
Epoch: 59, step: 1217, loss: 0.29992854595184326, mean loss: 0.3404296864973781
Epoch: 59, step: 1218, loss: 0.3171476423740387, mean loss: 0.34042941707604935
Epoch: 59, step: 1219, loss: 0.3299582302570343, mean loss: 0.3404292959041967
Epoch: 59, step: 1220, loss: 0.3616655766963959, mean loss: 0.34042954164613165
Epoch: 59, step: 1221, loss: 0.32766807079315186, mean loss: 0.3404293939746876
Epoch: 59, step: 1222, loss: 0.344575971364975, mean loss: 0.3404294419569298
Epoch: 59, step: 1223, loss: 0.32345980405807495, mean loss: 0.340429245594538
Epoch: 59, step: 1224, loss: 0.32536768913269043, mean loss: 0.3404290713133279
Epoch: 59, step: 1225, loss: 0.32860758900642395, mean loss: 0.34042893452544626
Epoch: 59, step: 1226, loss: 0.32287585735321045, mean loss: 0.34042873141889857
Epoch: 59, step: 1227, loss: 0.3272228538990021, mean loss: 0.3404285786155393
Epoch: 59, step: 1228, loss: 0.3404799997806549, mean loss: 0.34042857921051956
Epoch: 59, step: 1229, loss: 0.3091723918914795, mean loss: 0.3404282175579229
Epoch: 59, step: 1230, loss: 0.33305391669273376, mean loss: 0.3404281322338822
Epoch: 59, step: 1231, loss: 0.3308567702770233, mean loss: 0.3404280214901191
Epoch: 59, step: 1232, loss: 0.3043505549430847, mean loss: 0.34042760406695616
Epoch: 59, step: 1233, loss: 0.3152131140232086, mean loss: 0.34042731233387685
Epoch: 59, step: 1234, loss: 0.3194071054458618, mean loss: 0.34042706913170534
Epoch: 59, step: 1235, loss: 0.37000003457069397, mean loss: 0.3404274112846746
Epoch: 59, step: 1236, loss: 0.350039005279541, mean loss: 0.34042752248750213
Epoch: 59, step: 1237, loss: 0.31815263628959656, mean loss: 0.34042726477773283
Epoch: 59, step: 1238, loss: 0.35179710388183594, mean loss: 0.3404273963198061
Epoch: 59, step: 1239, loss: 0.3503502607345581, mean loss: 0.3404275111199405
Epoch: 59, step: 1240, loss: 0.3538689613342285, mean loss: 0.3404276666256871
Epoch: 59, step: 1241, loss: 0.3406403362751007, mean loss: 0.34042766908605926
Epoch: 59, step: 1242, loss: 0.36437931656837463, mean loss: 0.3404279461791247
Epoch: 59, step: 1243, loss: 0.34412693977355957, mean loss: 0.34042798897173915
Epoch: 59, step: 1244, loss: 0.3406841456890106, mean loss: 0.34042799193510975
Epoch: 59, step: 1245, loss: 0.3542071580886841, mean loss: 0.3404281513387116
Epoch: 59, step: 1246, loss: 0.31734320521354675, mean loss: 0.34042788428474396
Epoch: 59, step: 1247, loss: 0.32484230399131775, mean loss: 0.340427703987901
Epoch: 59, step: 1248, loss: 0.3209596872329712, mean loss: 0.3404274787809283
Epoch: 59, step: 1249, loss: 0.337360680103302, mean loss: 0.3404274433044612
Epoch: 59, step: 1250, loss: 0.34395068883895874, mean loss: 0.34042748406059536
Epoch: 59, step: 1251, loss: 0.31538358330726624, mean loss: 0.34042719436157687
Epoch: 59, step: 1252, loss: 0.35833021998405457, mean loss: 0.3404274014550727
Epoch: 59, step: 1253, loss: 0.3229212462902069, mean loss: 0.3404271989547238
Epoch: 59, step: 1254, loss: 0.33678606152534485, mean loss: 0.34042715683679076
Epoch: 59, step: 1255, loss: 0.3307689428329468, mean loss: 0.3404270451191439
Epoch: 59, step: 1256, loss: 0.3694641888141632, mean loss: 0.3404273809911633
Epoch: 59, step: 1257, loss: 0.33279240131378174, mean loss: 0.3404272926785384
Epoch: 59, step: 1258, loss: 0.3544512391090393, mean loss: 0.3404274548894739
Epoch: 59, step: 1259, loss: 0.3114565908908844, mean loss: 0.34042711979573836
Epoch: 59, step: 1260, loss: 0.34011608362197876, mean loss: 0.3404271161981561
Epoch: 59, step: 1261, loss: 0.3340926766395569, mean loss: 0.34042704293206666
Epoch: 59, step: 1262, loss: 0.3373730182647705, mean loss: 0.3404270076086802
Epoch: 59, step: 1263, loss: 0.32282528281211853, mean loss: 0.3404268040263902
Epoch: 59, step: 1264, loss: 0.3479434847831726, mean loss: 0.34042689096363077
Epoch: 59, step: 1265, loss: 0.34005072712898254, mean loss: 0.3404268866130047
Epoch: 59, step: 1266, loss: 0.3204765319824219, mean loss: 0.3404266558743693
Epoch: 59, step: 1267, loss: 0.337525337934494, mean loss: 0.34042662231915627
Epoch: 59, step: 1268, loss: 0.3561762273311615, mean loss: 0.34042680446921714
Epoch: 59, step: 1269, loss: 0.3320181965827942, mean loss: 0.3404267072216529
Epoch: 59, step: 1270, loss: 0.3416101634502411, mean loss: 0.3404267209084494
Epoch: 59, step: 1271, loss: 0.3370356559753418, mean loss: 0.34042668169087836
Epoch: 59, step: 1272, loss: 0.32514891028404236, mean loss: 0.340426505005923
Epoch: 59, step: 1273, loss: 0.332900732755661, mean loss: 0.3404264179725906
Epoch: 59, step: 1274, loss: 0.3200932741165161, mean loss: 0.3404261828285093
Epoch: 59, step: 1275, loss: 0.33782410621643066, mean loss: 0.34042615273695814
Epoch: 59, step: 1276, loss: 0.3252819776535034, mean loss: 0.3404259776051241
Epoch: 59, step: 1277, loss: 0.31734931468963623, mean loss: 0.3404257107426809
Epoch: 59, step: 1278, loss: 0.3295692801475525, mean loss: 0.34042558519852834
Epoch: 59, step: 1279, loss: 0.3542536199092865, mean loss: 0.3404257451045683
Epoch: 59, step: 1280, loss: 0.3115406632423401, mean loss: 0.3404254110841714
Epoch: 59, step: 1281, loss: 0.3098222613334656, mean loss: 0.34042505720052757
Epoch: 59, step: 1282, loss: 0.3145797550678253, mean loss: 0.3404247583383514
Epoch: 59, step: 1283, loss: 0.30516254901885986, mean loss: 0.3404243505884749
Epoch: 59, step: 1284, loss: 0.3115510940551758, mean loss: 0.3404240167202665
Epoch: 59, step: 1285, loss: 0.3354521691799164, mean loss: 0.34042395923029706
Epoch: 59, step: 1286, loss: 0.30897605419158936, mean loss: 0.3404235955992362
Epoch: 59, step: 1287, loss: 0.322704553604126, mean loss: 0.34042339071692274
Epoch: 59, step: 1288, loss: 0.34860971570014954, mean loss: 0.34042348537293227
Epoch: 59, step: 1289, loss: 0.3286321759223938, mean loss: 0.34042334903514987
Epoch: 59, step: 1290, loss: 0.3519110083580017, mean loss: 0.34042348186042215
Epoch: 59, step: 1291, loss: 0.36378026008605957, mean loss: 0.3404237519184444
Epoch: 59, step: 1292, loss: 0.3573471009731293, mean loss: 0.34042394758898115
Epoch: 59, step: 1293, loss: 0.3289334177970886, mean loss: 0.3404238147351276
Epoch: 59, step: 1294, loss: 0.3391466736793518, mean loss: 0.3404237999689548
Epoch: 59, step: 1295, loss: 0.34528714418411255, mean loss: 0.3404238561977877
Epoch: 59, step: 1296, loss: 0.31553030014038086, mean loss: 0.3404235683877215
Epoch: 59, step: 1297, loss: 0.36967116594314575, mean loss: 0.34042390653369176
Epoch: 59, step: 1298, loss: 0.3415360748767853, mean loss: 0.3404239193918725
Epoch: 59, step: 1299, loss: 0.29896602034568787, mean loss: 0.34042344008763825
Epoch: 59, step: 1300, loss: 0.3062332272529602, mean loss: 0.3404230448113531
Epoch: 59, step: 1301, loss: 0.32355639338493347, mean loss: 0.34042284981665466
Epoch: 59, step: 1302, loss: 0.3409883975982666, mean loss: 0.34042285635485486
Epoch: 59, step: 1303, loss: 0.3002071678638458, mean loss: 0.34042239143360065
Epoch: 59, step: 1304, loss: 0.32654550671577454, mean loss: 0.34042223100904234
Epoch: 59, step: 1305, loss: 0.3263159394264221, mean loss: 0.34042206793429747
Epoch: 59, step: 1306, loss: 0.33384692668914795, mean loss: 0.34042199192374006
Epoch: 59, step: 1307, loss: 0.3175147473812103, mean loss: 0.34042172711234936
Epoch: 59, step: 1308, loss: 0.33245983719825745, mean loss: 0.34042163507269946
Epoch: 59, step: 1309, loss: 0.3653644323348999, mean loss: 0.340421923408737
Epoch: 59, step: 1310, loss: 0.3258649706840515, mean loss: 0.34042175513388384
Epoch: 59, step: 1311, loss: 0.34874972701072693, mean loss: 0.34042185140211195
Epoch: 59, step: 1312, loss: 0.36014285683631897, mean loss: 0.3404220793668952
Epoch: 59, step: 1313, loss: 0.3059389591217041, mean loss: 0.3404216807641875
Epoch: 59, step: 1314, loss: 0.3053886890411377, mean loss: 0.3404212758099999
Epoch: 59, step: 1315, loss: 0.3173905909061432, mean loss: 0.3404210095962388
Epoch: 59, step: 1316, loss: 0.3208962082862854, mean loss: 0.3404207839099106
Epoch: 59, step: 1317, loss: 0.3226056396961212, mean loss: 0.3404205779878146
Epoch: 59, step: 1318, loss: 0.2988739609718323, mean loss: 0.34042009776337934
Epoch: 59, step: 1319, loss: 0.3579370081424713, mean loss: 0.3404203002335626
Epoch: 59, step: 1320, loss: 0.3314007818698883, mean loss: 0.3404201959821627
Epoch: 59, step: 1321, loss: 0.31396758556365967, mean loss: 0.34041989023526126
Epoch: 59, step: 1322, loss: 0.30205878615379333, mean loss: 0.34041944685167985
Epoch: 59, step: 1323, loss: 0.2963900864124298, mean loss: 0.34041893795939554
Epoch: 59, step: 1324, loss: 0.35666704177856445, mean loss: 0.34041912575315453
Epoch: 59, step: 1325, loss: 0.3565642237663269, mean loss: 0.34041931235422723
Epoch: 59, step: 1326, loss: 0.3371553122997284, mean loss: 0.34041927463015326
Epoch: 59, step: 1327, loss: 0.3287898004055023, mean loss: 0.3404191402226568
Epoch: 59, step: 1328, loss: 0.33276981115341187, mean loss: 0.3404190518166577
Epoch: 59, step: 1329, loss: 0.3523940145969391, mean loss: 0.34041919021393463
Epoch: 59, step: 1330, loss: 0.30859658122062683, mean loss: 0.34041882243729854
Epoch: 59, step: 1331, loss: 0.3436617851257324, mean loss: 0.3404188599160648
Epoch: 59, step: 1332, loss: 0.30957192182540894, mean loss: 0.3404185034235815
Epoch: 59, step: 1333, loss: 0.35386043787002563, mean loss: 0.340418658767791
Epoch: 59, step: 1334, loss: 0.33212828636169434, mean loss: 0.34041856295967127
Epoch: 59, step: 1335, loss: 0.32729846239089966, mean loss: 0.3404184113382992
Epoch: 59, step: 1336, loss: 0.3111068904399872, mean loss: 0.34041807260601326
Epoch: 59, step: 1337, loss: 0.3330950438976288, mean loss: 0.34041798797998524
Epoch: 59, step: 1338, loss: 0.32297465205192566, mean loss: 0.34041778640448483
Epoch: 59, step: 1339, loss: 0.31381621956825256, mean loss: 0.3404174789998574
Epoch: 59, step: 1340, loss: 0.32408562302589417, mean loss: 0.340417290273001
Epoch: 59, step: 1341, loss: 0.3878940939903259, mean loss: 0.34041783889676996
Epoch: 59, step: 1342, loss: 0.3390332758426666, mean loss: 0.34041782289747424
Epoch: 59, step: 1343, loss: 0.3067198395729065, mean loss: 0.3404174335054784
Epoch: 59, step: 1344, loss: 0.30351588129997253, mean loss: 0.3404170071000497
Epoch: 59, step: 1345, loss: 0.3432702422142029, mean loss: 0.3404170400694185
Epoch: 59, step: 1346, loss: 0.34532448649406433, mean loss: 0.3404170967747144
Epoch: 59, step: 1347, loss: 0.37342971563339233, mean loss: 0.3404174782294525
Epoch: 59, step: 1348, loss: 0.33019328117370605, mean loss: 0.34041736009210133
Epoch: 59, step: 1349, loss: 0.3401375412940979, mean loss: 0.3404173568589213
Epoch: 59, step: 1350, loss: 0.2976152300834656, mean loss: 0.34041686230536344
Epoch: 59, step: 1351, loss: 0.33983099460601807, mean loss: 0.3404168555360828
Epoch: 59, step: 1352, loss: 0.3704911172389984, mean loss: 0.34041720301856904
Epoch: 59, step: 1353, loss: 0.33750706911087036, mean loss: 0.3404171693948382
Epoch: 59, step: 1354, loss: 0.33119291067123413, mean loss: 0.3404170628188457
Epoch: 59, step: 1355, loss: 0.3286908268928528, mean loss: 0.3404169273368704
Epoch: 59, step: 1356, loss: 0.3448365032672882, mean loss: 0.3404169783989472
Epoch: 59, step: 1357, loss: 0.3231123983860016, mean loss: 0.3404167784708097
Epoch: 59, step: 1358, loss: 0.3317771852016449, mean loss: 0.3404166786545857
Epoch: 59, step: 1359, loss: 0.3097505569458008, mean loss: 0.34041632436231584
Epoch: 59, step: 1360, loss: 0.3343873620033264, mean loss: 0.3404162547092276
Epoch: 59, step: 1361, loss: 0.31618717312812805, mean loss: 0.3404159747919284
Epoch: 59, step: 1362, loss: 0.35637030005455017, mean loss: 0.3404161591092757
Epoch: 59, step: 1363, loss: 0.3255667984485626, mean loss: 0.3404159875593605
Epoch: 59, step: 1364, loss: 0.35317808389663696, mean loss: 0.34041613499407514
Epoch: 59, step: 1365, loss: 0.31173470616340637, mean loss: 0.34041580365435525
Epoch: 59, step: 1366, loss: 0.3925620913505554, mean loss: 0.34041640606286344
Epoch: 59, step: 1367, loss: 0.2851458191871643, mean loss: 0.34041576756895287
Epoch: 59, step: 1368, loss: 0.3176843523979187, mean loss: 0.3404155049753507
Epoch: 59, step: 1369, loss: 0.3021663427352905, mean loss: 0.3404150631256379
Epoch: 59, step: 1370, loss: 0.3826321065425873, mean loss: 0.3404155508062023
Epoch: 59, step: 1371, loss: 0.34160637855529785, mean loss: 0.34041556456218314
Epoch: 59, step: 1372, loss: 0.29183414578437805, mean loss: 0.34041500337493624
Epoch: 59, step: 1373, loss: 0.31411314010620117, mean loss: 0.34041469955302023
Epoch: 59, step: 1374, loss: 0.38761764764785767, mean loss: 0.34041524480429486
Epoch: 59, step: 1375, loss: 0.32061144709587097, mean loss: 0.3404150160490656
Epoch: 59, step: 1376, loss: 0.2962016761302948, mean loss: 0.3404145053431883
Epoch: 59, step: 1377, loss: 0.31265589594841003, mean loss: 0.34041418470870916
Epoch: 59, step: 1378, loss: 0.3610801696777344, mean loss: 0.34041442341485956
Epoch: 59, step: 1379, loss: 0.328966349363327, mean loss: 0.3404142911833629
Epoch: 59, step: 1380, loss: 0.32799437642097473, mean loss: 0.34041414772823325
Epoch: 59, step: 1381, loss: 0.31978029012680054, mean loss: 0.3404139094014343
Epoch: 59, step: 1382, loss: 0.33807510137557983, mean loss: 0.3404138823878626
Epoch: 59, step: 1383, loss: 0.34307360649108887, mean loss: 0.3404139131077067
Epoch: 59, step: 1384, loss: 0.32719820737838745, mean loss: 0.3404137604679159
Epoch: 59, step: 1385, loss: 0.2939056158065796, mean loss: 0.3404132233107162
Epoch: 59, step: 1386, loss: 0.3015826344490051, mean loss: 0.34041277483250615
Epoch: 59, step: 1387, loss: 0.3156849145889282, mean loss: 0.34041248923862916
Epoch: 59, step: 1388, loss: 0.3376365900039673, mean loss: 0.3404124571788124
Epoch: 59, step: 1389, loss: 0.32801517844200134, mean loss: 0.3404123140000221
Epoch: 59, step: 1390, loss: 0.3092952370643616, mean loss: 0.34041195462647944
Epoch: 59, step: 1391, loss: 0.30682656168937683, mean loss: 0.3404115667506429
Epoch: 59, step: 1392, loss: 0.3245445489883423, mean loss: 0.3404113835054528
Epoch: 59, step: 1393, loss: 0.3129352927207947, mean loss: 0.34041106619293654
Epoch: 59, step: 1394, loss: 0.2811359167098999, mean loss: 0.3404103816512465
Epoch: 59, step: 1395, loss: 0.39031773805618286, mean loss: 0.3404109580019071
Epoch: 59, step: 1396, loss: 0.3109859824180603, mean loss: 0.34041061819412144
Epoch: 59, step: 1397, loss: 0.2976739704608917, mean loss: 0.34041012466515025
Epoch: 59, step: 1398, loss: 0.3449997901916504, mean loss: 0.34041017766665754
Epoch: 59, step: 1399, loss: 0.3147661089897156, mean loss: 0.34040988153209384
Epoch: 59, step: 1400, loss: 0.3291440010070801, mean loss: 0.3404097514365879
Epoch: 59, step: 1401, loss: 0.38755685091018677, mean loss: 0.34041029587294297
Epoch: 59, step: 1402, loss: 0.3003599941730499, mean loss: 0.3404098333929871
Epoch: 59, step: 1403, loss: 0.30860182642936707, mean loss: 0.3404094660949852
Epoch: 59, step: 1404, loss: 0.33957192301750183, mean loss: 0.34040945642369874
Epoch: 59, step: 1405, loss: 0.3482947051525116, mean loss: 0.3404095474752764
Epoch: 59, step: 1406, loss: 0.3384338319301605, mean loss: 0.34040952466179947
Epoch: 59, step: 1407, loss: 0.39391574263572693, mean loss: 0.34041014248797347
Epoch: 59, step: 1408, loss: 0.3721722364425659, mean loss: 0.3404105092346273
Epoch: 59, step: 1409, loss: 0.32718563079833984, mean loss: 0.34041035653298496
Epoch: 59, step: 1410, loss: 0.369236022233963, mean loss: 0.3404106893659627
Epoch: 59, step: 1411, loss: 0.3558019697666168, mean loss: 0.340410867077957
Epoch: 59, step: 1412, loss: 0.32177847623825073, mean loss: 0.3404106519456862
Epoch: 59, step: 1413, loss: 0.37441137433052063, mean loss: 0.3404110445183959
Epoch: 59, step: 1414, loss: 0.342838853597641, mean loss: 0.3404110725495822
Epoch: 59, step: 1415, loss: 0.3190191388130188, mean loss: 0.3404108255637865
Epoch: 59, step: 1416, loss: 0.3052578270435333, mean loss: 0.3404104197009423
Epoch: 59, step: 1417, loss: 0.3234117329120636, mean loss: 0.34041022344298416
Epoch: 59, step: 1418, loss: 0.33324602246284485, mean loss: 0.3404101407298169
Epoch: 59, step: 1419, loss: 0.31279945373535156, mean loss: 0.3404098219586084
Epoch: 59, step: 1420, loss: 0.3536437153816223, mean loss: 0.340409974744937
Epoch: 59, step: 1421, loss: 0.33569788932800293, mean loss: 0.34040992034417256
Epoch: 59, step: 1422, loss: 0.35174939036369324, mean loss: 0.3404100512562129
Epoch: 59, step: 1423, loss: 0.3075054883956909, mean loss: 0.3404096713836331
Epoch: 59, step: 1424, loss: 0.3407803475856781, mean loss: 0.3404096756629211
Epoch: 59, step: 1425, loss: 0.3197060823440552, mean loss: 0.34040943665212336
Epoch: 59, step: 1426, loss: 0.34884268045425415, mean loss: 0.3404095340078349
Epoch: 59, step: 1427, loss: 0.35658782720565796, mean loss: 0.34040972077239434
Epoch: 59, step: 1428, loss: 0.31245195865631104, mean loss: 0.34040939802766573
Epoch: 59, step: 1429, loss: 0.33483991026878357, mean loss: 0.340409333734177
Epoch: 59, step: 1430, loss: 0.3157878518104553, mean loss: 0.3404090495100676
Epoch: 59, step: 1431, loss: 0.3436063528060913, mean loss: 0.34040908641849554
Epoch: 59, step: 1432, loss: 0.33850207924842834, mean loss: 0.34040906440499924
Epoch: 59, step: 1433, loss: 0.3072260916233063, mean loss: 0.34040868136248764
Epoch: 59, step: 1434, loss: 0.29670441150665283, mean loss: 0.34040817687483477
Epoch: 59, step: 1435, loss: 0.3329096734523773, mean loss: 0.3404080903190191
Epoch: 59, step: 1436, loss: 0.31042996048927307, mean loss: 0.3404077442830994
Epoch: 59, step: 1437, loss: 0.3569115102291107, mean loss: 0.3404079347829718
Epoch: 59, step: 1438, loss: 0.31944626569747925, mean loss: 0.3404076928291531
Epoch: 59, step: 1439, loss: 0.32169103622436523, mean loss: 0.3404074767912866
Epoch: 59, step: 1440, loss: 0.3683888018131256, mean loss: 0.34040779976328495
Epoch: 59, step: 1441, loss: 0.3336312174797058, mean loss: 0.34040772154607907
Epoch: 59, step: 1442, loss: 0.3780198395252228, mean loss: 0.34040815567064164
Epoch: 59, step: 1443, loss: 0.3817445635795593, mean loss: 0.3404086327759961
Valid: 59, mean loss: 0.1863272488117218
Epoch: 60, step: 0, loss: 0.29860424995422363, mean loss: 0.3404081502748382
Epoch: 60, step: 1, loss: 0.32149890065193176, mean loss: 0.3404079320290726
Epoch: 60, step: 2, loss: 0.32132646441459656, mean loss: 0.34040771179815243
Epoch: 60, step: 3, loss: 0.32551077008247375, mean loss: 0.3404075398653964
Epoch: 60, step: 4, loss: 0.34354230761528015, mean loss: 0.3404075760448384
Epoch: 60, step: 5, loss: 0.3148708641529083, mean loss: 0.34040728132018994
Epoch: 60, step: 6, loss: 0.3323032855987549, mean loss: 0.3404071877913231
Epoch: 60, step: 7, loss: 0.3648192286491394, mean loss: 0.34040746952939965
Epoch: 60, step: 8, loss: 0.33235782384872437, mean loss: 0.34040737662993537
Epoch: 60, step: 9, loss: 0.31778663396835327, mean loss: 0.3404071155711626
Epoch: 60, step: 10, loss: 0.32386401295661926, mean loss: 0.3404069246546975
Epoch: 60, step: 11, loss: 0.3785021901130676, mean loss: 0.3404073642898526
Epoch: 60, step: 12, loss: 0.3274707496166229, mean loss: 0.3404072149976795
Epoch: 60, step: 13, loss: 0.35050615668296814, mean loss: 0.340407331540963
Epoch: 60, step: 14, loss: 0.33540743589401245, mean loss: 0.3404072738420922
Epoch: 60, step: 15, loss: 0.3165188729763031, mean loss: 0.34040699817276904
Epoch: 60, step: 16, loss: 0.35162249207496643, mean loss: 0.3404071275967498
Epoch: 60, step: 17, loss: 0.3352722227573395, mean loss: 0.3404070683419223
Epoch: 60, step: 18, loss: 0.31542515754699707, mean loss: 0.3404067800636039
Epoch: 60, step: 19, loss: 0.2957428991794586, mean loss: 0.34040626467148666
Epoch: 60, step: 20, loss: 0.33651161193847656, mean loss: 0.34040621973024743
Epoch: 60, step: 21, loss: 0.33589598536491394, mean loss: 0.3404061676862793
Epoch: 60, step: 22, loss: 0.3360897898674011, mean loss: 0.3404061178798127
Epoch: 60, step: 23, loss: 0.3366142511367798, mean loss: 0.3404060741261578
Epoch: 60, step: 24, loss: 0.3193986415863037, mean loss: 0.34040583172804395
Epoch: 60, step: 25, loss: 0.3306828439235687, mean loss: 0.3404057195388601
Epoch: 60, step: 26, loss: 0.32284167408943176, mean loss: 0.3404055168775767
Epoch: 60, step: 27, loss: 0.3009454905986786, mean loss: 0.3404050615765858
Epoch: 60, step: 28, loss: 0.33598601818084717, mean loss: 0.34040501058899625
Epoch: 60, step: 29, loss: 0.3617965877056122, mean loss: 0.3404052574053931
Epoch: 60, step: 30, loss: 0.34019020199775696, mean loss: 0.3404052549241086
Epoch: 60, step: 31, loss: 0.33264923095703125, mean loss: 0.34040516543703125
Epoch: 60, step: 32, loss: 0.2949693202972412, mean loss: 0.3404046412155881
Epoch: 60, step: 33, loss: 0.33770960569381714, mean loss: 0.3404046101216554
Epoch: 60, step: 34, loss: 0.3211785554885864, mean loss: 0.34040438830389214
Epoch: 60, step: 35, loss: 0.3215997815132141, mean loss: 0.3404041713510241
Epoch: 60, step: 36, loss: 0.3203616142272949, mean loss: 0.34040394011831965
Epoch: 60, step: 37, loss: 0.31289538741111755, mean loss: 0.3404036227534438
Epoch: 60, step: 38, loss: 0.28870463371276855, mean loss: 0.34040302631152547
Epoch: 60, step: 39, loss: 0.35914599895477295, mean loss: 0.340403242543328
Epoch: 60, step: 40, loss: 0.3197896480560303, mean loss: 0.3404030047334909
Epoch: 60, step: 41, loss: 0.3128680884838104, mean loss: 0.3404026870791192
Epoch: 60, step: 42, loss: 0.32904407382011414, mean loss: 0.34040255604289227
Epoch: 60, step: 43, loss: 0.32516080141067505, mean loss: 0.3404023802116589
Epoch: 60, step: 44, loss: 0.3134419322013855, mean loss: 0.3404020691953584
Epoch: 60, step: 45, loss: 0.3282822370529175, mean loss: 0.34040192938233044
Epoch: 60, step: 46, loss: 0.3573886752128601, mean loss: 0.3404021253372698
Epoch: 60, step: 47, loss: 0.31448355317115784, mean loss: 0.3404018263504185
Epoch: 60, step: 48, loss: 0.32498401403427124, mean loss: 0.34040164849841514
Epoch: 60, step: 49, loss: 0.32688015699386597, mean loss: 0.3404014925231988
Epoch: 60, step: 50, loss: 0.3188624382019043, mean loss: 0.3404012440654082
Epoch: 60, step: 51, loss: 0.34701332449913025, mean loss: 0.3404013203363494
Epoch: 60, step: 52, loss: 0.3613995909690857, mean loss: 0.34040156255049164
Epoch: 60, step: 53, loss: 0.31643807888031006, mean loss: 0.3404012861359339
Epoch: 60, step: 54, loss: 0.3521344065666199, mean loss: 0.3404014214738476
Epoch: 60, step: 55, loss: 0.3239462375640869, mean loss: 0.34040123167058206
Epoch: 60, step: 56, loss: 0.32018089294433594, mean loss: 0.3404009984406119
Epoch: 60, step: 57, loss: 0.3241330087184906, mean loss: 0.34040081080087714
Epoch: 60, step: 58, loss: 0.35197997093200684, mean loss: 0.34040094435674434
Epoch: 60, step: 59, loss: 0.3117259442806244, mean loss: 0.34040061361856583
Epoch: 60, step: 60, loss: 0.34597980976104736, mean loss: 0.3404006779684135
Epoch: 60, step: 61, loss: 0.3162662982940674, mean loss: 0.34040039960828716
Epoch: 60, step: 62, loss: 0.30455154180526733, mean loss: 0.34039998614095845
Epoch: 60, step: 63, loss: 0.3212881088256836, mean loss: 0.3403997657142502
Epoch: 60, step: 64, loss: 0.31234875321388245, mean loss: 0.3403994421918178
Epoch: 60, step: 65, loss: 0.2906510531902313, mean loss: 0.34039886843234324
Epoch: 60, step: 66, loss: 0.30695170164108276, mean loss: 0.3403984826830174
Epoch: 60, step: 67, loss: 0.3688245117664337, mean loss: 0.340398810519308
Epoch: 60, step: 68, loss: 0.3612965941429138, mean loss: 0.34039905152985617
Epoch: 60, step: 69, loss: 0.33457252383232117, mean loss: 0.3403989843342882
Epoch: 60, step: 70, loss: 0.3486997187137604, mean loss: 0.34039908006302366
Epoch: 60, step: 71, loss: 0.33379778265953064, mean loss: 0.3403990039340288
Epoch: 60, step: 72, loss: 0.3644395172595978, mean loss: 0.34039928117634916
Epoch: 60, step: 73, loss: 0.35373160243034363, mean loss: 0.34039943492685376
Epoch: 60, step: 74, loss: 0.3038078844547272, mean loss: 0.34039901295198816
Epoch: 60, step: 75, loss: 0.3228663504123688, mean loss: 0.34039881076712564
Epoch: 60, step: 76, loss: 0.313412070274353, mean loss: 0.34039849956239654
Epoch: 60, step: 77, loss: 0.3375023901462555, mean loss: 0.34039846616553066
Epoch: 60, step: 78, loss: 0.31812044978141785, mean loss: 0.3403982092666229
Epoch: 60, step: 79, loss: 0.3356468379497528, mean loss: 0.3403981544768245
Epoch: 60, step: 80, loss: 0.34928569197654724, mean loss: 0.34039825696108433
Epoch: 60, step: 81, loss: 0.33453166484832764, mean loss: 0.34039818931282767
Epoch: 60, step: 82, loss: 0.37100860476493835, mean loss: 0.34039854228050004
Epoch: 60, step: 83, loss: 0.31087973713874817, mean loss: 0.3403982019040743
Epoch: 60, step: 84, loss: 0.3124358057975769, mean loss: 0.34039787947805983
Epoch: 60, step: 85, loss: 0.34013256430625916, mean loss: 0.3403978764188253
Epoch: 60, step: 86, loss: 0.3323895037174225, mean loss: 0.3403977840788078
Epoch: 60, step: 87, loss: 0.3112061619758606, mean loss: 0.3403974474905998
Epoch: 60, step: 88, loss: 0.30651113390922546, mean loss: 0.34039705677568804
Epoch: 60, step: 89, loss: 0.3609446883201599, mean loss: 0.34039729369061417
Epoch: 60, step: 90, loss: 0.33699461817741394, mean loss: 0.3403972544580962
Epoch: 60, step: 91, loss: 0.31853967905044556, mean loss: 0.3403970024452819
Epoch: 60, step: 92, loss: 0.339586079120636, mean loss: 0.34039699309563043
Epoch: 60, step: 93, loss: 0.33970606327056885, mean loss: 0.34039698512955224
Epoch: 60, step: 94, loss: 0.35592764616012573, mean loss: 0.3403971641883063
Epoch: 60, step: 95, loss: 0.33695051074028015, mean loss: 0.3403971244510179
Epoch: 60, step: 96, loss: 0.3013789653778076, mean loss: 0.3403966746065562
Epoch: 60, step: 97, loss: 0.3296709954738617, mean loss: 0.3403965509504985
Epoch: 60, step: 98, loss: 0.3038059175014496, mean loss: 0.3403961291029622
Epoch: 60, step: 99, loss: 0.31217464804649353, mean loss: 0.3403958037457907
Epoch: 60, step: 100, loss: 0.33333587646484375, mean loss: 0.3403957223548997
Epoch: 60, step: 101, loss: 0.3033541440963745, mean loss: 0.3403952953232627
Epoch: 60, step: 102, loss: 0.31607967615127563, mean loss: 0.3403950150053215
Epoch: 60, step: 103, loss: 0.3083631098270416, mean loss: 0.3403946457359175
Epoch: 60, step: 104, loss: 0.3082718551158905, mean loss: 0.3403942754230393
Epoch: 60, step: 105, loss: 0.2983326017856598, mean loss: 0.3403937905398904
Epoch: 60, step: 106, loss: 0.3649221658706665, mean loss: 0.3403940732975112
Epoch: 60, step: 107, loss: 0.37272360920906067, mean loss: 0.3403944459808689
Epoch: 60, step: 108, loss: 0.29810068011283875, mean loss: 0.3403939584390428
Epoch: 60, step: 109, loss: 0.32903754711151123, mean loss: 0.3403938275294021
Epoch: 60, step: 110, loss: 0.35614013671875, mean loss: 0.34039400904096034
Epoch: 60, step: 111, loss: 0.3902190029621124, mean loss: 0.34039458337923406
Epoch: 60, step: 112, loss: 0.3234873116016388, mean loss: 0.3403943884894691
Epoch: 60, step: 113, loss: 0.3376554250717163, mean loss: 0.3403943569178595
Epoch: 60, step: 114, loss: 0.3445720672607422, mean loss: 0.3403944050731283
Epoch: 60, step: 115, loss: 0.3608701825141907, mean loss: 0.34039464108882106
Epoch: 60, step: 116, loss: 0.3185943067073822, mean loss: 0.3403943898084128
Epoch: 60, step: 117, loss: 0.3162813186645508, mean loss: 0.3403941118735694
Epoch: 60, step: 118, loss: 0.32397013902664185, mean loss: 0.34039392256787376
Epoch: 60, step: 119, loss: 0.3749164044857025, mean loss: 0.34039432047568746
Epoch: 60, step: 120, loss: 0.3225559890270233, mean loss: 0.3403941148725772
Epoch: 60, step: 121, loss: 0.3511127233505249, mean loss: 0.3403942384129345
Epoch: 60, step: 122, loss: 0.2931046485900879, mean loss: 0.3403936933696577
Epoch: 60, step: 123, loss: 0.29132014513015747, mean loss: 0.3403931277716189
Epoch: 60, step: 124, loss: 0.3078821897506714, mean loss: 0.34039275307055256
Epoch: 60, step: 125, loss: 0.3547690510749817, mean loss: 0.3403929187610074
Epoch: 60, step: 126, loss: 0.3618835210800171, mean loss: 0.34039316644275647
Epoch: 60, step: 127, loss: 0.3069484829902649, mean loss: 0.3403927809932422
Epoch: 60, step: 128, loss: 0.3548099398612976, mean loss: 0.34039294714888385
Epoch: 60, step: 129, loss: 0.31444039940834045, mean loss: 0.3403926480530242
Epoch: 60, step: 130, loss: 0.3178602457046509, mean loss: 0.3403923883763771
Epoch: 60, step: 131, loss: 0.33567145466804504, mean loss: 0.34039233397018953
Epoch: 60, step: 132, loss: 0.33785197138786316, mean loss: 0.34039230469423293
Epoch: 60, step: 133, loss: 0.31996461749076843, mean loss: 0.3403920692816992
Epoch: 60, step: 134, loss: 0.3325435221195221, mean loss: 0.3403919788345985
Epoch: 60, step: 135, loss: 0.33345168828964233, mean loss: 0.34039189885522003
Epoch: 60, step: 136, loss: 0.3384265899658203, mean loss: 0.3403918762074114
Epoch: 60, step: 137, loss: 0.3587971329689026, mean loss: 0.34039208830329704
Epoch: 60, step: 138, loss: 0.3333390951156616, mean loss: 0.34039200702795175
Epoch: 60, step: 139, loss: 0.3213673532009125, mean loss: 0.34039178779939877
Epoch: 60, step: 140, loss: 0.328069269657135, mean loss: 0.3403916458038221
Epoch: 60, step: 141, loss: 0.30835771560668945, mean loss: 0.3403912766727788
Epoch: 60, step: 142, loss: 0.32392871379852295, mean loss: 0.34039108697476333
Epoch: 60, step: 143, loss: 0.3213598132133484, mean loss: 0.34039086768003435
Epoch: 60, step: 144, loss: 0.3312924802303314, mean loss: 0.3403907628417852
Epoch: 60, step: 145, loss: 0.3377545177936554, mean loss: 0.3403907324653991
Epoch: 60, step: 146, loss: 0.3510083854198456, mean loss: 0.34039085480691283
Epoch: 60, step: 147, loss: 0.29297447204589844, mean loss: 0.34039030845969015
Epoch: 60, step: 148, loss: 0.3343680500984192, mean loss: 0.34039023907003985
Epoch: 60, step: 149, loss: 0.3093944787979126, mean loss: 0.3403898819348829
Epoch: 60, step: 150, loss: 0.3171755373477936, mean loss: 0.3403896144607832
Epoch: 60, step: 151, loss: 0.31099358201026917, mean loss: 0.34038927576559874
Epoch: 60, step: 152, loss: 0.3252186179161072, mean loss: 0.3403891009743385
Epoch: 60, step: 153, loss: 0.32111653685569763, mean loss: 0.3403888789248406
Epoch: 60, step: 154, loss: 0.3446834087371826, mean loss: 0.34038892840384066
Epoch: 60, step: 155, loss: 0.3239802420139313, mean loss: 0.34038873935496294
Epoch: 60, step: 156, loss: 0.33564239740371704, mean loss: 0.34038868467171407
Epoch: 60, step: 157, loss: 0.33288124203681946, mean loss: 0.3403885981784465
Epoch: 60, step: 158, loss: 0.31206923723220825, mean loss: 0.340388271914769
Epoch: 60, step: 159, loss: 0.3504844307899475, mean loss: 0.3403883882299634
Epoch: 60, step: 160, loss: 0.3145677149295807, mean loss: 0.34038809076019577
Epoch: 60, step: 161, loss: 0.3117687702178955, mean loss: 0.34038776105211827
Epoch: 60, step: 162, loss: 0.33298519253730774, mean loss: 0.34038767577201834
Epoch: 60, step: 163, loss: 0.31930646300315857, mean loss: 0.34038743291209517
Epoch: 60, step: 164, loss: 0.391104131937027, mean loss: 0.3403880171722072
Epoch: 60, step: 165, loss: 0.333919495344162, mean loss: 0.34038794265521727
Epoch: 60, step: 166, loss: 0.3483142554759979, mean loss: 0.3403880339648216
Epoch: 60, step: 167, loss: 0.3139088749885559, mean loss: 0.3403877289334999
Epoch: 60, step: 168, loss: 0.33059045672416687, mean loss: 0.34038761607340234
Epoch: 60, step: 169, loss: 0.37246695160865784, mean loss: 0.34038798560842753
Epoch: 60, step: 170, loss: 0.34234127402305603, mean loss: 0.34038800810889885
Epoch: 60, step: 171, loss: 0.3693080246448517, mean loss: 0.34038834124275746
Epoch: 60, step: 172, loss: 0.3097451329231262, mean loss: 0.34038798826326916
Epoch: 60, step: 173, loss: 0.32100486755371094, mean loss: 0.34038776499143847
Epoch: 60, step: 174, loss: 0.3248119354248047, mean loss: 0.3403875855774021
Epoch: 60, step: 175, loss: 0.3295297920703888, mean loss: 0.3403874605106689
Epoch: 60, step: 176, loss: 0.3269951045513153, mean loss: 0.34038730625106584
Epoch: 60, step: 177, loss: 0.34303611516952515, mean loss: 0.34038733676097066
Epoch: 60, step: 178, loss: 0.3230991065502167, mean loss: 0.3403871376313998
Epoch: 60, step: 179, loss: 0.30888956785202026, mean loss: 0.3403867748397645
Epoch: 60, step: 180, loss: 0.3813067674636841, mean loss: 0.3403872461542232
Epoch: 60, step: 181, loss: 0.36614951491355896, mean loss: 0.34038754287934775
Epoch: 60, step: 182, loss: 0.3324805796146393, mean loss: 0.34038745180943236
Epoch: 60, step: 183, loss: 0.33651307225227356, mean loss: 0.3403874071860614
Epoch: 60, step: 184, loss: 0.3454408645629883, mean loss: 0.34038746538885295
Epoch: 60, step: 185, loss: 0.2972334027290344, mean loss: 0.3403869683711087
Epoch: 60, step: 186, loss: 0.30549174547195435, mean loss: 0.3403865664774247
Epoch: 60, step: 187, loss: 0.38117456436157227, mean loss: 0.34038703623370015
Epoch: 60, step: 188, loss: 0.3232448995113373, mean loss: 0.3403868388096054
Epoch: 60, step: 189, loss: 0.3369990587234497, mean loss: 0.3403867997933658
Epoch: 60, step: 190, loss: 0.3569425046443939, mean loss: 0.3403869904591977
Epoch: 60, step: 191, loss: 0.30044302344322205, mean loss: 0.3403865304448364
Epoch: 60, step: 192, loss: 0.2962990999221802, mean loss: 0.34038602271815965
Epoch: 60, step: 193, loss: 0.3373998701572418, mean loss: 0.3403859883289508
Epoch: 60, step: 194, loss: 0.3451923131942749, mean loss: 0.34038604367903846
Epoch: 60, step: 195, loss: 0.3812600374221802, mean loss: 0.34038651438236134
Epoch: 60, step: 196, loss: 0.3527129888534546, mean loss: 0.34038665633192744
Epoch: 60, step: 197, loss: 0.3192259967327118, mean loss: 0.3403864126522066
Epoch: 60, step: 198, loss: 0.3224020004272461, mean loss: 0.3403862055515695
Epoch: 60, step: 199, loss: 0.3472820520401001, mean loss: 0.3403862849602117
Epoch: 60, step: 200, loss: 0.37323543429374695, mean loss: 0.34038666322795774
Epoch: 60, step: 201, loss: 0.3608284890651703, mean loss: 0.3403868986189648
Epoch: 60, step: 202, loss: 0.3048049509525299, mean loss: 0.34038648889166767
Epoch: 60, step: 203, loss: 0.29417574405670166, mean loss: 0.34038595677954897
Epoch: 60, step: 204, loss: 0.3199874758720398, mean loss: 0.3403857218957801
Epoch: 60, step: 205, loss: 0.31292724609375, mean loss: 0.3403854057214508
Epoch: 60, step: 206, loss: 0.34812483191490173, mean loss: 0.3403854948370932
Epoch: 60, step: 207, loss: 0.3073234260082245, mean loss: 0.34038511414820194
Epoch: 60, step: 208, loss: 0.34122908115386963, mean loss: 0.34038512386583836
Epoch: 60, step: 209, loss: 0.3231966495513916, mean loss: 0.3403849259559441
Epoch: 60, step: 210, loss: 0.29537233710289, mean loss: 0.34038440768224715
Epoch: 60, step: 211, loss: 0.3407835066318512, mean loss: 0.34038441227740845
Epoch: 60, step: 212, loss: 0.31345924735069275, mean loss: 0.3403841022689467
Epoch: 60, step: 213, loss: 0.3727976083755493, mean loss: 0.3403844754642642
Epoch: 60, step: 214, loss: 0.32265815138816833, mean loss: 0.3403842713732611
Epoch: 60, step: 215, loss: 0.3169075548648834, mean loss: 0.3403840010785606
Epoch: 60, step: 216, loss: 0.37463125586509705, mean loss: 0.34038439537326093
Epoch: 60, step: 217, loss: 0.34319448471069336, mean loss: 0.3403844277259439
Epoch: 60, step: 218, loss: 0.3063127100467682, mean loss: 0.3403840354612658
Epoch: 60, step: 219, loss: 0.31233376264572144, mean loss: 0.34038371252466876
Epoch: 60, step: 220, loss: 0.33020874857902527, mean loss: 0.3403835953839043
Epoch: 60, step: 221, loss: 0.31755852699279785, mean loss: 0.34038333260998255
Epoch: 60, step: 222, loss: 0.39916422963142395, mean loss: 0.34038400931809787
Epoch: 60, step: 223, loss: 0.34511831402778625, mean loss: 0.34038406382059266
Epoch: 60, step: 224, loss: 0.31007909774780273, mean loss: 0.3403837149462926
Epoch: 60, step: 225, loss: 0.32527872920036316, mean loss: 0.3403835410579388
Epoch: 60, step: 226, loss: 0.35233116149902344, mean loss: 0.3403836785971705
Epoch: 60, step: 227, loss: 0.3477911651134491, mean loss: 0.34038376387007324
Epoch: 60, step: 228, loss: 0.3168221712112427, mean loss: 0.34038349263876333
Epoch: 60, step: 229, loss: 0.3467095196247101, mean loss: 0.34038356546053133
Epoch: 60, step: 230, loss: 0.3245308995246887, mean loss: 0.34038338297539894
Epoch: 60, step: 231, loss: 0.3062567412853241, mean loss: 0.34038299013718076
Epoch: 60, step: 232, loss: 0.3345819413661957, mean loss: 0.34038292336098136
Epoch: 60, step: 233, loss: 0.33852705359458923, mean loss: 0.34038290199820576
Epoch: 60, step: 234, loss: 0.32143086194992065, mean loss: 0.3403826838452268
Epoch: 60, step: 235, loss: 0.3119679391384125, mean loss: 0.3403823567727936
Epoch: 60, step: 236, loss: 0.3394257426261902, mean loss: 0.34038234576166126
Epoch: 60, step: 237, loss: 0.3430718183517456, mean loss: 0.3403823767185501
Epoch: 60, step: 238, loss: 0.3913203775882721, mean loss: 0.3403829630282552
Epoch: 60, step: 239, loss: 0.3333439826965332, mean loss: 0.34038288200868416
Epoch: 60, step: 240, loss: 0.34851765632629395, mean loss: 0.34038297563990755
Epoch: 60, step: 241, loss: 0.3274787962436676, mean loss: 0.34038282711455825
Epoch: 60, step: 242, loss: 0.3212880790233612, mean loss: 0.34038260733913506
Epoch: 60, step: 243, loss: 0.3147173523902893, mean loss: 0.3403823119423422
Epoch: 60, step: 244, loss: 0.3335455060005188, mean loss: 0.340382233254353
Epoch: 60, step: 245, loss: 0.3625955283641815, mean loss: 0.3403824889145872
Epoch: 60, step: 246, loss: 0.35032325983047485, mean loss: 0.3403826033249238
Epoch: 60, step: 247, loss: 0.30719149112701416, mean loss: 0.3403822213261185
Epoch: 60, step: 248, loss: 0.3139735460281372, mean loss: 0.34038191739034646
Epoch: 60, step: 249, loss: 0.295655757188797, mean loss: 0.34038140264572453
Epoch: 60, step: 250, loss: 0.32276931405067444, mean loss: 0.3403811999539775
Epoch: 60, step: 251, loss: 0.29792484641075134, mean loss: 0.3403807113433627
Epoch: 60, step: 252, loss: 0.3501972258090973, mean loss: 0.3403808243158054
Epoch: 60, step: 253, loss: 0.38586628437042236, mean loss: 0.34038134777496315
Epoch: 60, step: 254, loss: 0.3084815442562103, mean loss: 0.34038098066749417
Epoch: 60, step: 255, loss: 0.3319167196750641, mean loss: 0.34038088326069765
Epoch: 60, step: 256, loss: 0.31278496980667114, mean loss: 0.340380565690316
Epoch: 60, step: 257, loss: 0.3043164014816284, mean loss: 0.340380150673121
Epoch: 60, step: 258, loss: 0.3024258315563202, mean loss: 0.34037971390953203
Epoch: 60, step: 259, loss: 0.3143557012081146, mean loss: 0.34037941443872993
Epoch: 60, step: 260, loss: 0.3276109993457794, mean loss: 0.3403792675081412
Epoch: 60, step: 261, loss: 0.33832985162734985, mean loss: 0.34037924392507196
Epoch: 60, step: 262, loss: 0.34386295080184937, mean loss: 0.34037928401237477
Epoch: 60, step: 263, loss: 0.33762049674987793, mean loss: 0.34037925226714716
Epoch: 60, step: 264, loss: 0.3123607039451599, mean loss: 0.34037892986281687
Epoch: 60, step: 265, loss: 0.34297817945480347, mean loss: 0.3403789597715642
Epoch: 60, step: 266, loss: 0.32336893677711487, mean loss: 0.34037876404483336
Epoch: 60, step: 267, loss: 0.29585322737693787, mean loss: 0.3403782517152818
Epoch: 60, step: 268, loss: 0.3458629548549652, mean loss: 0.3403783148238567
Epoch: 60, step: 269, loss: 0.38338103890419006, mean loss: 0.3403788096198995
Epoch: 60, step: 270, loss: 0.31375575065612793, mean loss: 0.34037850329436004
Epoch: 60, step: 271, loss: 0.34593141078948975, mean loss: 0.3403785671855085
Epoch: 60, step: 272, loss: 0.34003108739852905, mean loss: 0.34037856318748994
Epoch: 60, step: 273, loss: 0.3138270080089569, mean loss: 0.3403782576952197
Epoch: 60, step: 274, loss: 0.3223486840724945, mean loss: 0.3403780502560708
Epoch: 60, step: 275, loss: 0.36803483963012695, mean loss: 0.34037836845743047
Epoch: 60, step: 276, loss: 0.32620909810066223, mean loss: 0.3403782054367285
Epoch: 60, step: 277, loss: 0.34384334087371826, mean loss: 0.34037824530344696
Epoch: 60, step: 278, loss: 0.3490229547023773, mean loss: 0.34037834476052076
Epoch: 60, step: 279, loss: 0.31019338965415955, mean loss: 0.34037799748768244
Epoch: 60, step: 280, loss: 0.3744044899940491, mean loss: 0.3403783889522595
Epoch: 60, step: 281, loss: 0.37296774983406067, mean loss: 0.3403787638787555
Epoch: 60, step: 282, loss: 0.3402579426765442, mean loss: 0.3403787624887758
Epoch: 60, step: 283, loss: 0.39845308661460876, mean loss: 0.3403794305933744
Epoch: 60, step: 284, loss: 0.35262084007263184, mean loss: 0.3403795714206333
Epoch: 60, step: 285, loss: 0.31874099373817444, mean loss: 0.34037932248961517
Epoch: 60, step: 286, loss: 0.34600430727005005, mean loss: 0.3403793871989089
Epoch: 60, step: 287, loss: 0.32534605264663696, mean loss: 0.3403792142588372
Epoch: 60, step: 288, loss: 0.3661029040813446, mean loss: 0.3403795101749276
Epoch: 60, step: 289, loss: 0.32009953260421753, mean loss: 0.34037927688403186
Epoch: 60, step: 290, loss: 0.36018630862236023, mean loss: 0.34037950473177014
Epoch: 60, step: 291, loss: 0.3290826082229614, mean loss: 0.34037937478081415
Epoch: 60, step: 292, loss: 0.3701654076576233, mean loss: 0.3403797174128742
Epoch: 60, step: 293, loss: 0.28893178701400757, mean loss: 0.3403791256083973
Epoch: 60, step: 294, loss: 0.33571285009384155, mean loss: 0.3403790719329442
Epoch: 60, step: 295, loss: 0.30108267068862915, mean loss: 0.3403786199176543
Epoch: 60, step: 296, loss: 0.3715932071208954, mean loss: 0.3403789789660135
Epoch: 60, step: 297, loss: 0.3120502829551697, mean loss: 0.3403786531166034
Epoch: 60, step: 298, loss: 0.3419252336025238, mean loss: 0.34037867090586355
Epoch: 60, step: 299, loss: 0.31110596656799316, mean loss: 0.34037833420579067
Epoch: 60, step: 300, loss: 0.3733271360397339, mean loss: 0.3403787131846595
Epoch: 60, step: 301, loss: 0.2991905212402344, mean loss: 0.340378239441337
Epoch: 60, step: 302, loss: 0.34165817499160767, mean loss: 0.34037825416288503
Epoch: 60, step: 303, loss: 0.3388938009738922, mean loss: 0.3403782370892148
Epoch: 60, step: 304, loss: 0.3372393250465393, mean loss: 0.3403782009869427
Epoch: 60, step: 305, loss: 0.38929274678230286, mean loss: 0.3403787635722922
Epoch: 60, step: 306, loss: 0.3477657437324524, mean loss: 0.3403788485318671
Epoch: 60, step: 307, loss: 0.34010207653045654, mean loss: 0.34037884534867713
Epoch: 60, step: 308, loss: 0.33120492100715637, mean loss: 0.34037873983942063
Epoch: 60, step: 309, loss: 0.3310600221157074, mean loss: 0.34037863266612883
Epoch: 60, step: 310, loss: 0.3840663731098175, mean loss: 0.3403791351070489
Epoch: 60, step: 311, loss: 0.31859108805656433, mean loss: 0.3403788845314779
Epoch: 60, step: 312, loss: 0.32044199109077454, mean loss: 0.3403786552479174
Epoch: 60, step: 313, loss: 0.3113400936126709, mean loss: 0.3403783212947739
Epoch: 60, step: 314, loss: 0.3350023329257965, mean loss: 0.34037825946982575
Epoch: 60, step: 315, loss: 0.33341193199157715, mean loss: 0.34037817935657905
Epoch: 60, step: 316, loss: 0.4139693081378937, mean loss: 0.3403790256499054
Epoch: 60, step: 317, loss: 0.31046298146247864, mean loss: 0.34037868162124574
Epoch: 60, step: 318, loss: 0.307197242975235, mean loss: 0.34037830004557623
Epoch: 60, step: 319, loss: 0.3362913727760315, mean loss: 0.34037825304779257
Epoch: 60, step: 320, loss: 0.3054359257221222, mean loss: 0.3403778512317219
Epoch: 60, step: 321, loss: 0.36288774013519287, mean loss: 0.3403781100791369
Epoch: 60, step: 322, loss: 0.34703755378723145, mean loss: 0.34037818665703445
Epoch: 60, step: 323, loss: 0.33515557646751404, mean loss: 0.340378126602182
Epoch: 60, step: 324, loss: 0.32515862584114075, mean loss: 0.3403779515949864
Epoch: 60, step: 325, loss: 0.3238818049430847, mean loss: 0.3403777619099756
Epoch: 60, step: 326, loss: 0.35872653126716614, mean loss: 0.34037797289539945
Epoch: 60, step: 327, loss: 0.33355712890625, mean loss: 0.34037789446604627
Epoch: 60, step: 328, loss: 0.3132242262363434, mean loss: 0.34037758224366554
Epoch: 60, step: 329, loss: 0.31886422634124756, mean loss: 0.34037733487841426
Epoch: 60, step: 330, loss: 0.32418644428253174, mean loss: 0.34037714871416874
Epoch: 60, step: 331, loss: 0.32661470770835876, mean loss: 0.3403769904742639
Epoch: 60, step: 332, loss: 0.3340022563934326, mean loss: 0.3403769171787115
Epoch: 60, step: 333, loss: 0.368836373090744, mean loss: 0.34037724439668365
Epoch: 60, step: 334, loss: 0.34152814745903015, mean loss: 0.34037725762925697
Epoch: 60, step: 335, loss: 0.33720308542251587, mean loss: 0.3403772211344514
Epoch: 60, step: 336, loss: 0.3575953543186188, mean loss: 0.340377419096363
Epoch: 60, step: 337, loss: 0.30663132667541504, mean loss: 0.34037703111213224
Epoch: 60, step: 338, loss: 0.34605640172958374, mean loss: 0.34037709640801533
Epoch: 60, step: 339, loss: 0.30810242891311646, mean loss: 0.34037672534952496
Epoch: 60, step: 340, loss: 0.3556974530220032, mean loss: 0.3403769014883101
Epoch: 60, step: 341, loss: 0.33787307143211365, mean loss: 0.3403768727026987
Epoch: 60, step: 342, loss: 0.290425181388855, mean loss: 0.3403762984331137
Epoch: 60, step: 343, loss: 0.3164721131324768, mean loss: 0.34037602362182307
Epoch: 60, step: 344, loss: 0.31710922718048096, mean loss: 0.34037575614126386
Epoch: 60, step: 345, loss: 0.32004284858703613, mean loss: 0.340375522392068
Epoch: 60, step: 346, loss: 0.3662818372249603, mean loss: 0.34037582021030327
Epoch: 60, step: 347, loss: 0.30380430817604065, mean loss: 0.340375399790107
Epoch: 60, step: 348, loss: 0.31169062852859497, mean loss: 0.3403750700383998
Epoch: 60, step: 349, loss: 0.3062955141067505, mean loss: 0.34037467827433576
Epoch: 60, step: 350, loss: 0.31408804655075073, mean loss: 0.3403743760978839
Epoch: 60, step: 351, loss: 0.34011268615722656, mean loss: 0.34037437308967694
Epoch: 60, step: 352, loss: 0.31818631291389465, mean loss: 0.34037411803398077
Epoch: 60, step: 353, loss: 0.43482843041419983, mean loss: 0.34037520379061204
Epoch: 60, step: 354, loss: 0.3210625946521759, mean loss: 0.3403749817938405
Epoch: 60, step: 355, loss: 0.33703944087028503, mean loss: 0.34037494345252683
Epoch: 60, step: 356, loss: 0.4000338315963745, mean loss: 0.34037562921052017
Epoch: 60, step: 357, loss: 0.3157990276813507, mean loss: 0.34037534671435327
Epoch: 60, step: 358, loss: 0.3154941499233246, mean loss: 0.3403750607202983
Epoch: 60, step: 359, loss: 0.3136986196041107, mean loss: 0.3403747540945383
Epoch: 60, step: 360, loss: 0.30616870522499084, mean loss: 0.340374360926082
Epoch: 60, step: 361, loss: 0.31990960240364075, mean loss: 0.3403741257043799
Epoch: 60, step: 362, loss: 0.3373629152774811, mean loss: 0.3403740910939593
Epoch: 60, step: 363, loss: 0.29159998893737793, mean loss: 0.34037353049786995
Epoch: 60, step: 364, loss: 0.3362712562084198, mean loss: 0.34037348334800166
Epoch: 60, step: 365, loss: 0.30305880308151245, mean loss: 0.34037305447320837
Epoch: 60, step: 366, loss: 0.3281882405281067, mean loss: 0.3403729144291436
Epoch: 60, step: 367, loss: 0.36077865958213806, mean loss: 0.3403731489563727
Epoch: 60, step: 368, loss: 0.3261087238788605, mean loss: 0.3403729850144233
Epoch: 60, step: 369, loss: 0.3190000653266907, mean loss: 0.340372739376914
Epoch: 60, step: 370, loss: 0.3135455548763275, mean loss: 0.34037243105745435
Epoch: 60, step: 371, loss: 0.3429183065891266, mean loss: 0.34037246031635576
Epoch: 60, step: 372, loss: 0.3378400504589081, mean loss: 0.34037243121254535
Epoch: 60, step: 373, loss: 0.32143497467041016, mean loss: 0.3403722135756531
Epoch: 60, step: 374, loss: 0.310830682516098, mean loss: 0.3403718740763592
Epoch: 60, step: 375, loss: 0.33258670568466187, mean loss: 0.340371784608119
Epoch: 60, step: 376, loss: 0.34459662437438965, mean loss: 0.34037183316000846
Epoch: 60, step: 377, loss: 0.3061428368091583, mean loss: 0.3403714398046527
Epoch: 60, step: 378, loss: 0.34886494278907776, mean loss: 0.3403715374098077
Epoch: 60, step: 379, loss: 0.3297804296016693, mean loss: 0.3403714157009154
Epoch: 60, step: 380, loss: 0.36744609475135803, mean loss: 0.340371726829023
Epoch: 60, step: 381, loss: 0.34222111105918884, mean loss: 0.34037174808093895
Epoch: 60, step: 382, loss: 0.33111894130706787, mean loss: 0.3403716417549473
Epoch: 60, step: 383, loss: 0.30757516622543335, mean loss: 0.3403712648879275
Epoch: 60, step: 384, loss: 0.35347113013267517, mean loss: 0.34037141541783555
Epoch: 60, step: 385, loss: 0.3167288601398468, mean loss: 0.340371143745516
Epoch: 60, step: 386, loss: 0.33213669061660767, mean loss: 0.34037104912599414
Epoch: 60, step: 387, loss: 0.3147393465042114, mean loss: 0.34037075460351146
Epoch: 60, step: 388, loss: 0.36755356192588806, mean loss: 0.34037106694545866
Epoch: 60, step: 389, loss: 0.344073086977005, mean loss: 0.340371109482745
Epoch: 60, step: 390, loss: 0.34317782521247864, mean loss: 0.3403711417323541
Epoch: 60, step: 391, loss: 0.32257184386253357, mean loss: 0.3403709372179471
Epoch: 60, step: 392, loss: 0.3203325867652893, mean loss: 0.3403707069794117
Epoch: 60, step: 393, loss: 0.34498703479766846, mean loss: 0.3403707600199225
Epoch: 60, step: 394, loss: 0.3803211450576782, mean loss: 0.34037121903508927
Epoch: 60, step: 395, loss: 0.30449944734573364, mean loss: 0.34037080688641874
Epoch: 60, step: 396, loss: 0.35588905215263367, mean loss: 0.34037098518122744
Epoch: 60, step: 397, loss: 0.37315383553504944, mean loss: 0.3403713618310856
Epoch: 60, step: 398, loss: 0.34460610151290894, mean loss: 0.3403714104844442
Epoch: 60, step: 399, loss: 0.3306095004081726, mean loss: 0.34037129833014645
Epoch: 60, step: 400, loss: 0.35522183775901794, mean loss: 0.340371468945597
Epoch: 60, step: 401, loss: 0.37001702189445496, mean loss: 0.34037180953465684
Epoch: 60, step: 402, loss: 0.34370726346969604, mean loss: 0.3403718478542682
Epoch: 60, step: 403, loss: 0.31036368012428284, mean loss: 0.3403715031071549
Epoch: 60, step: 404, loss: 0.3579237163066864, mean loss: 0.3403717047524326
Epoch: 60, step: 405, loss: 0.3413048982620239, mean loss: 0.3403717154731264
Epoch: 60, step: 406, loss: 0.336842805147171, mean loss: 0.3403716749328398
Epoch: 60, step: 407, loss: 0.3393538296222687, mean loss: 0.3403716632399197
Epoch: 60, step: 408, loss: 0.3147815465927124, mean loss: 0.34037136926621925
Epoch: 60, step: 409, loss: 0.35720205307006836, mean loss: 0.3403715626112371
Epoch: 60, step: 410, loss: 0.3057495653629303, mean loss: 0.34037116489039243
Epoch: 60, step: 411, loss: 0.3481656312942505, mean loss: 0.3403712544284433
Epoch: 60, step: 412, loss: 0.32931140065193176, mean loss: 0.3403711273810839
Epoch: 60, step: 413, loss: 0.3186396360397339, mean loss: 0.3403708777487713
Epoch: 60, step: 414, loss: 0.31207403540611267, mean loss: 0.34037055270319844
Epoch: 60, step: 415, loss: 0.34721195697784424, mean loss: 0.34037063128944495
Epoch: 60, step: 416, loss: 0.37277036905288696, mean loss: 0.3403710034563903
Epoch: 60, step: 417, loss: 0.3089115023612976, mean loss: 0.3403706420938378
Epoch: 60, step: 418, loss: 0.32209375500679016, mean loss: 0.3403704321570468
Epoch: 60, step: 419, loss: 0.3326244652271271, mean loss: 0.3403703431843047
Epoch: 60, step: 420, loss: 0.30844295024871826, mean loss: 0.3403699764599053
Epoch: 60, step: 421, loss: 0.327790766954422, mean loss: 0.3403698319742571
Epoch: 60, step: 422, loss: 0.3112589120864868, mean loss: 0.3403694976081097
Epoch: 60, step: 423, loss: 0.3191727101802826, mean loss: 0.34036925414597347
Epoch: 60, step: 424, loss: 0.3645215630531311, mean loss: 0.34036953155146255
Epoch: 60, step: 425, loss: 0.3237113952636719, mean loss: 0.3403693402237768
Epoch: 60, step: 426, loss: 0.3170533776283264, mean loss: 0.3403690724304384
Epoch: 60, step: 427, loss: 0.31826600432395935, mean loss: 0.34036881857060347
Epoch: 60, step: 428, loss: 0.324366956949234, mean loss: 0.34036863478691903
Epoch: 60, step: 429, loss: 0.32731232047080994, mean loss: 0.34036848483499166
Epoch: 60, step: 430, loss: 0.32842764258384705, mean loss: 0.34036834769584945
Epoch: 60, step: 431, loss: 0.3148006498813629, mean loss: 0.3403680540572766
Epoch: 60, step: 432, loss: 0.32781779766082764, mean loss: 0.34036790992239674
Epoch: 60, step: 433, loss: 0.3657684922218323, mean loss: 0.3403682016349895
Epoch: 60, step: 434, loss: 0.3369237184524536, mean loss: 0.34036816207733017
Epoch: 60, step: 435, loss: 0.3812388777732849, mean loss: 0.3403686314456486
Epoch: 60, step: 436, loss: 0.3082503378391266, mean loss: 0.34036826259631286
Epoch: 60, step: 437, loss: 0.3192284107208252, mean loss: 0.3403680198271648
Epoch: 60, step: 438, loss: 0.3906634449958801, mean loss: 0.3403685974110274
Epoch: 60, step: 439, loss: 0.3250437378883362, mean loss: 0.340368421425043
Epoch: 60, step: 440, loss: 0.3433230519294739, mean loss: 0.34036845535472343
Epoch: 60, step: 441, loss: 0.31223833560943604, mean loss: 0.340368132324479
Epoch: 60, step: 442, loss: 0.33354637026786804, mean loss: 0.3403680539881555
Epoch: 60, step: 443, loss: 0.3262229561805725, mean loss: 0.34036789155765385
Epoch: 60, step: 444, loss: 0.3680848777294159, mean loss: 0.34036820983274335
Epoch: 60, step: 445, loss: 0.332858145236969, mean loss: 0.3403681235954079
Epoch: 60, step: 446, loss: 0.36194318532943726, mean loss: 0.34036837133688175
Epoch: 60, step: 447, loss: 0.32117903232574463, mean loss: 0.3403681509926436
Epoch: 60, step: 448, loss: 0.35127121210098267, mean loss: 0.3403682761871126
Epoch: 60, step: 449, loss: 0.32730501890182495, mean loss: 0.34036812618989953
Epoch: 60, step: 450, loss: 0.33216592669487, mean loss: 0.3403680320102542
Epoch: 60, step: 451, loss: 0.35905006527900696, mean loss: 0.3403682465194315
Epoch: 60, step: 452, loss: 0.34967777132987976, mean loss: 0.3403683534112002
Epoch: 60, step: 453, loss: 0.3506968021392822, mean loss: 0.3403684720008703
Epoch: 60, step: 454, loss: 0.338226854801178, mean loss: 0.3403684474114312
Epoch: 60, step: 455, loss: 0.33175936341285706, mean loss: 0.34036834856551407
Epoch: 60, step: 456, loss: 0.3374844193458557, mean loss: 0.34036831545381996
Epoch: 60, step: 457, loss: 0.32402169704437256, mean loss: 0.34036812777306485
Epoch: 60, step: 458, loss: 0.3306809067726135, mean loss: 0.3403680165522586
Epoch: 60, step: 459, loss: 0.3365474343299866, mean loss: 0.34036797268793917
Epoch: 60, step: 460, loss: 0.35959047079086304, mean loss: 0.3403681933799875
Epoch: 60, step: 461, loss: 0.2871106266975403, mean loss: 0.34036758194090827
Epoch: 60, step: 462, loss: 0.3504590690135956, mean loss: 0.3403676977978486
Epoch: 60, step: 463, loss: 0.33317330479621887, mean loss: 0.34036761520241093
Epoch: 60, step: 464, loss: 0.37204861640930176, mean loss: 0.34036797891288917
Epoch: 60, step: 465, loss: 0.3605487644672394, mean loss: 0.3403682105936638
Epoch: 60, step: 466, loss: 0.29260677099227905, mean loss: 0.3403676622859549
Epoch: 60, step: 467, loss: 0.34557050466537476, mean loss: 0.340367722014595
Epoch: 60, step: 468, loss: 0.3706933856010437, mean loss: 0.34036807014927206
Epoch: 60, step: 469, loss: 0.3766227960586548, mean loss: 0.34036848634403627
Epoch: 60, step: 470, loss: 0.31048959493637085, mean loss: 0.34036814334612087
Epoch: 60, step: 471, loss: 0.33938470482826233, mean loss: 0.3403681320567633
Epoch: 60, step: 472, loss: 0.30399319529533386, mean loss: 0.3403677144963904
Epoch: 60, step: 473, loss: 0.2939288318157196, mean loss: 0.3403671814146506
Epoch: 60, step: 474, loss: 0.34720703959465027, mean loss: 0.3403672599299256
Epoch: 60, step: 475, loss: 0.3247250020503998, mean loss: 0.3403670803732669
Epoch: 60, step: 476, loss: 0.3526477515697479, mean loss: 0.34036722134083003
Epoch: 60, step: 477, loss: 0.3453509211540222, mean loss: 0.34036727854714577
Epoch: 60, step: 478, loss: 0.3192807137966156, mean loss: 0.3403670365039089
Epoch: 60, step: 479, loss: 0.3113323450088501, mean loss: 0.34036670323150886
Epoch: 60, step: 480, loss: 0.3630467653274536, mean loss: 0.340366963559812
Epoch: 60, step: 481, loss: 0.3367854356765747, mean loss: 0.3403669224504724
Epoch: 60, step: 482, loss: 0.3444962799549103, mean loss: 0.3403669698473424
Epoch: 60, step: 483, loss: 0.35579729080200195, mean loss: 0.34036714695492415
Epoch: 60, step: 484, loss: 0.3002946376800537, mean loss: 0.3403666870122065
Epoch: 60, step: 485, loss: 0.32787495851516724, mean loss: 0.34036654363676755
Epoch: 60, step: 486, loss: 0.32396432757377625, mean loss: 0.34036635538035953
Epoch: 60, step: 487, loss: 0.40794676542282104, mean loss: 0.3403671310255028
Epoch: 60, step: 488, loss: 0.30508893728256226, mean loss: 0.34036672612938623
Epoch: 60, step: 489, loss: 0.3071501553058624, mean loss: 0.3403663448993756
Epoch: 60, step: 490, loss: 0.3207267224788666, mean loss: 0.34036611949598966
Epoch: 60, step: 491, loss: 0.345946729183197, mean loss: 0.3403661835437527
Epoch: 60, step: 492, loss: 0.3564508259296417, mean loss: 0.340366368142497
Epoch: 60, step: 493, loss: 0.33206725120544434, mean loss: 0.3403662728970482
Epoch: 60, step: 494, loss: 0.3379896879196167, mean loss: 0.34036624562230233
Epoch: 60, step: 495, loss: 0.3330264389514923, mean loss: 0.34036616138838444
Epoch: 60, step: 496, loss: 0.41118645668029785, mean loss: 0.34036697413492484
Epoch: 60, step: 497, loss: 0.3070995807647705, mean loss: 0.34036659235667227
Epoch: 60, step: 498, loss: 0.2964968681335449, mean loss: 0.34036608891132375
Epoch: 60, step: 499, loss: 0.3629273772239685, mean loss: 0.3403663478198424
Epoch: 60, step: 500, loss: 0.33220764994621277, mean loss: 0.34036625419344524
Epoch: 60, step: 501, loss: 0.39752230048179626, mean loss: 0.3403669100889524
Epoch: 60, step: 502, loss: 0.3367009460926056, mean loss: 0.3403668680205821
Epoch: 60, step: 503, loss: 0.31389638781547546, mean loss: 0.3403665642649569
Epoch: 60, step: 504, loss: 0.3313130736351013, mean loss: 0.3403664603749961
Epoch: 60, step: 505, loss: 0.3304338753223419, mean loss: 0.34036634639862257
Epoch: 60, step: 506, loss: 0.3758276700973511, mean loss: 0.34036675331250027
Epoch: 60, step: 507, loss: 0.33832263946533203, mean loss: 0.3403667298568404
Epoch: 60, step: 508, loss: 0.3324127793312073, mean loss: 0.34036663858843197
Epoch: 60, step: 509, loss: 0.37161603569984436, mean loss: 0.34036699715867996
Epoch: 60, step: 510, loss: 0.3097509741783142, mean loss: 0.34036664586009496
Epoch: 60, step: 511, loss: 0.34932971000671387, mean loss: 0.34036674870413924
Epoch: 60, step: 512, loss: 0.3624194860458374, mean loss: 0.3403670017388867
Epoch: 60, step: 513, loss: 0.3484435975551605, mean loss: 0.3403670944092841
Epoch: 60, step: 514, loss: 0.3167765736579895, mean loss: 0.340366823736107
Epoch: 60, step: 515, loss: 0.3538742959499359, mean loss: 0.3403669787165124
Epoch: 60, step: 516, loss: 0.29880234599113464, mean loss: 0.3403665018227147
Epoch: 60, step: 517, loss: 0.3101204037666321, mean loss: 0.34036615479664645
Epoch: 60, step: 518, loss: 0.36508652567863464, mean loss: 0.34036643842049347
Epoch: 60, step: 519, loss: 0.32808083295822144, mean loss: 0.3403662974658645
Epoch: 60, step: 520, loss: 0.3069084584712982, mean loss: 0.3403659136033687
Epoch: 60, step: 521, loss: 0.3216246962547302, mean loss: 0.3403656985874518
Epoch: 60, step: 522, loss: 0.3155724108219147, mean loss: 0.3403654141400628
Epoch: 60, step: 523, loss: 0.33577078580856323, mean loss: 0.3403653614276089
Epoch: 60, step: 524, loss: 0.3671184182167053, mean loss: 0.340365668351911
Epoch: 60, step: 525, loss: 0.3013085722923279, mean loss: 0.34036522027472427
Epoch: 60, step: 526, loss: 0.33801162242889404, mean loss: 0.340365193273705
Epoch: 60, step: 527, loss: 0.35257890820503235, mean loss: 0.3403653333906623
Epoch: 60, step: 528, loss: 0.3201296925544739, mean loss: 0.34036510124803315
Epoch: 60, step: 529, loss: 0.3149459660053253, mean loss: 0.3403648096438661
Epoch: 60, step: 530, loss: 0.32990968227386475, mean loss: 0.34036468970572875
Epoch: 60, step: 531, loss: 0.3433748781681061, mean loss: 0.3403647242373268
Epoch: 60, step: 532, loss: 0.3353540599346161, mean loss: 0.3403646667577826
Epoch: 60, step: 533, loss: 0.31568413972854614, mean loss: 0.3403643836397998
Epoch: 60, step: 534, loss: 0.342160701751709, mean loss: 0.3403644042456858
Epoch: 60, step: 535, loss: 0.30402672290802, mean loss: 0.3403639874144325
Epoch: 60, step: 536, loss: 0.33280467987060547, mean loss: 0.3403639007022545
Epoch: 60, step: 537, loss: 0.2935678958892822, mean loss: 0.34036336391539523
Epoch: 60, step: 538, loss: 0.3016517460346222, mean loss: 0.34036291986788514
Epoch: 60, step: 539, loss: 0.3443411588668823, mean loss: 0.34036296550035816
Epoch: 60, step: 540, loss: 0.34485509991645813, mean loss: 0.3403630170268882
Epoch: 60, step: 541, loss: 0.3394221365451813, mean loss: 0.3403630062347467
Epoch: 60, step: 542, loss: 0.3183601200580597, mean loss: 0.3403627538588686
Epoch: 60, step: 543, loss: 0.3382735848426819, mean loss: 0.3403627298961115
Epoch: 60, step: 544, loss: 0.35669365525245667, mean loss: 0.34036291720958695
Epoch: 60, step: 545, loss: 0.32802149653434753, mean loss: 0.34036277565680695
Epoch: 60, step: 546, loss: 0.3107309639453888, mean loss: 0.3403624357917845
Epoch: 60, step: 547, loss: 0.311533123254776, mean loss: 0.34036210513489895
Epoch: 60, step: 548, loss: 0.2923072278499603, mean loss: 0.3403615539773299
Epoch: 60, step: 549, loss: 0.30637115240097046, mean loss: 0.34036116413443995
Epoch: 60, step: 550, loss: 0.3337048590183258, mean loss: 0.3403610877927864
Epoch: 60, step: 551, loss: 0.32710713148117065, mean loss: 0.3403609357839288
Epoch: 60, step: 552, loss: 0.30179449915885925, mean loss: 0.3403604934727728
Epoch: 60, step: 553, loss: 0.3270016610622406, mean loss: 0.3403603402646116
Epoch: 60, step: 554, loss: 0.3500624895095825, mean loss: 0.34036045153417116
Epoch: 60, step: 555, loss: 0.3564471900463104, mean loss: 0.34036063602358024
Epoch: 60, step: 556, loss: 0.34816083312034607, mean loss: 0.3403607254784594
Epoch: 60, step: 557, loss: 0.32944828271865845, mean loss: 0.3403606003328969
Epoch: 60, step: 558, loss: 0.32634350657463074, mean loss: 0.3403604395845654
Epoch: 60, step: 559, loss: 0.3655862808227539, mean loss: 0.3403607288717356
Epoch: 60, step: 560, loss: 0.32917073369026184, mean loss: 0.3403606005475744
Epoch: 60, step: 561, loss: 0.3448874354362488, mean loss: 0.3403606524596279
Epoch: 60, step: 562, loss: 0.3589017391204834, mean loss: 0.34036086507945357
Epoch: 60, step: 563, loss: 0.3964806795120239, mean loss: 0.3403615086257867
Epoch: 60, step: 564, loss: 0.32826370000839233, mean loss: 0.34036136989740395
Epoch: 60, step: 565, loss: 0.338975727558136, mean loss: 0.34036135400810347
Epoch: 60, step: 566, loss: 0.3425021767616272, mean loss: 0.34036137855685245
Epoch: 60, step: 567, loss: 0.2854912579059601, mean loss: 0.3403607493700731
Epoch: 60, step: 568, loss: 0.3186083734035492, mean loss: 0.340360499941964
Epoch: 60, step: 569, loss: 0.3132094740867615, mean loss: 0.34036018861269146
Epoch: 60, step: 570, loss: 0.29101312160491943, mean loss: 0.34035962277733806
Epoch: 60, step: 571, loss: 0.3396407961845398, mean loss: 0.3403596145350481
Epoch: 60, step: 572, loss: 0.34047603607177734, mean loss: 0.34035961586995844
Epoch: 60, step: 573, loss: 0.3026769459247589, mean loss: 0.3403591837986173
Epoch: 60, step: 574, loss: 0.3238641023635864, mean loss: 0.3403589946673734
Epoch: 60, step: 575, loss: 0.3150424659252167, mean loss: 0.3403587043934702
Epoch: 60, step: 576, loss: 0.3184030055999756, mean loss: 0.34035845265701065
Epoch: 60, step: 577, loss: 0.3148384392261505, mean loss: 0.34035816005670533
Epoch: 60, step: 578, loss: 0.3244250416755676, mean loss: 0.34035797737726187
Epoch: 60, step: 579, loss: 0.36483240127563477, mean loss: 0.3403582579829016
Epoch: 60, step: 580, loss: 0.31473132967948914, mean loss: 0.3403579641668676
Epoch: 60, step: 581, loss: 0.2933005690574646, mean loss: 0.34035742465395674
Epoch: 60, step: 582, loss: 0.33122438192367554, mean loss: 0.3403573199448464
Epoch: 60, step: 583, loss: 0.38996851444244385, mean loss: 0.3403578887240184
Epoch: 60, step: 584, loss: 0.3554919958114624, mean loss: 0.3403580622305485
Epoch: 60, step: 585, loss: 0.3970441222190857, mean loss: 0.3403587121062735
Epoch: 60, step: 586, loss: 0.32368382811546326, mean loss: 0.3403585209397311
Epoch: 60, step: 587, loss: 0.3513844907283783, mean loss: 0.3403586473437503
Epoch: 60, step: 588, loss: 0.3078109622001648, mean loss: 0.34035827421457143
Epoch: 60, step: 589, loss: 0.3547195792198181, mean loss: 0.3403584388517949
Epoch: 60, step: 590, loss: 0.3085229694843292, mean loss: 0.3403580738958805
Epoch: 60, step: 591, loss: 0.4747205078601837, mean loss: 0.3403596141842376
Epoch: 60, step: 592, loss: 0.33310478925704956, mean loss: 0.34035953101817745
Epoch: 60, step: 593, loss: 0.31582000851631165, mean loss: 0.34035924971131887
Epoch: 60, step: 594, loss: 0.3153899013996124, mean loss: 0.34035896348046757
Epoch: 60, step: 595, loss: 0.3364933729171753, mean loss: 0.34035891916859445
Epoch: 60, step: 596, loss: 0.3284637928009033, mean loss: 0.34035878281445153
Epoch: 60, step: 597, loss: 0.32121923565864563, mean loss: 0.3403585634198396
Epoch: 60, step: 598, loss: 0.3006214499473572, mean loss: 0.3403581079227171
Epoch: 60, step: 599, loss: 0.31275418400764465, mean loss: 0.34035779150910045
Epoch: 60, step: 600, loss: 0.29734131693840027, mean loss: 0.3403572984327422
Epoch: 60, step: 601, loss: 0.3269902467727661, mean loss: 0.3403571452146631
Epoch: 60, step: 602, loss: 0.3139350414276123, mean loss: 0.34035684235823005
Epoch: 60, step: 603, loss: 0.31316059827804565, mean loss: 0.34035653063199006
Epoch: 60, step: 604, loss: 0.3142987787723541, mean loss: 0.34035623195869236
Epoch: 60, step: 605, loss: 0.3495209515094757, mean loss: 0.3403563370032738
Epoch: 60, step: 606, loss: 0.3021659851074219, mean loss: 0.34035589927645343
Epoch: 60, step: 607, loss: 0.3513701260089874, mean loss: 0.34035602551690286
Epoch: 60, step: 608, loss: 0.3270336091518402, mean loss: 0.34035587282270163
Epoch: 60, step: 609, loss: 0.3330296576023102, mean loss: 0.34035578885461887
Epoch: 60, step: 610, loss: 0.35957610607147217, mean loss: 0.34035600914226277
Epoch: 60, step: 611, loss: 0.33194753527641296, mean loss: 0.3403559127722785
Epoch: 60, step: 612, loss: 0.31079667806625366, mean loss: 0.34035557399613664
Epoch: 60, step: 613, loss: 0.34843483567237854, mean loss: 0.3403556665908793
Epoch: 60, step: 614, loss: 0.34332942962646484, mean loss: 0.3403557006721702
Epoch: 60, step: 615, loss: 0.3551275134086609, mean loss: 0.34035586996497225
Epoch: 60, step: 616, loss: 0.3785199224948883, mean loss: 0.34035630734022615
Epoch: 60, step: 617, loss: 0.3113854229450226, mean loss: 0.3403559753261484
Epoch: 60, step: 618, loss: 0.32937830686569214, mean loss: 0.3403558495205758
Epoch: 60, step: 619, loss: 0.3502410352230072, mean loss: 0.34035596280484925
Epoch: 60, step: 620, loss: 0.29017531871795654, mean loss: 0.34035538774102825
Epoch: 60, step: 621, loss: 0.32265931367874146, mean loss: 0.34035518494858635
Epoch: 60, step: 622, loss: 0.40431052446365356, mean loss: 0.34035591785187314
Epoch: 60, step: 623, loss: 0.29686710238456726, mean loss: 0.3403554194926933
Epoch: 60, step: 624, loss: 0.3195521831512451, mean loss: 0.3403551811011693
Epoch: 60, step: 625, loss: 0.31322672963142395, mean loss: 0.3403548702303666
Epoch: 60, step: 626, loss: 0.3181924521923065, mean loss: 0.34035461626932706
Epoch: 60, step: 627, loss: 0.3300565183162689, mean loss: 0.3403544982638961
Epoch: 60, step: 628, loss: 0.34752407670021057, mean loss: 0.3403545804188244
Epoch: 60, step: 629, loss: 0.37300625443458557, mean loss: 0.34035495456428116
Epoch: 60, step: 630, loss: 0.3511941432952881, mean loss: 0.34035507876577686
Epoch: 60, step: 631, loss: 0.32468628883361816, mean loss: 0.3403548992260627
Epoch: 60, step: 632, loss: 0.29817262291908264, mean loss: 0.34035441588899046
Epoch: 60, step: 633, loss: 0.3121120035648346, mean loss: 0.34035409228273517
Epoch: 60, step: 634, loss: 0.3241073489189148, mean loss: 0.3403539061269819
Epoch: 60, step: 635, loss: 0.34712326526641846, mean loss: 0.34035398368964676
Epoch: 60, step: 636, loss: 0.3327641785144806, mean loss: 0.34035389672738664
Epoch: 60, step: 637, loss: 0.3052229583263397, mean loss: 0.3403534942097029
Epoch: 60, step: 638, loss: 0.37248608469963074, mean loss: 0.34035386236917414
Epoch: 60, step: 639, loss: 0.36250507831573486, mean loss: 0.3403541161640406
Epoch: 60, step: 640, loss: 0.3092367351055145, mean loss: 0.34035375964451103
Epoch: 60, step: 641, loss: 0.3123851418495178, mean loss: 0.3403534392048122
Epoch: 60, step: 642, loss: 0.3242858946323395, mean loss: 0.34035325511919906
Epoch: 60, step: 643, loss: 0.34753355383872986, mean loss: 0.3403533373828295
Epoch: 60, step: 644, loss: 0.31054267287254333, mean loss: 0.3403529958503267
Epoch: 60, step: 645, loss: 0.38727518916130066, mean loss: 0.34035353341870317
Epoch: 60, step: 646, loss: 0.312350332736969, mean loss: 0.3403532126011624
Epoch: 60, step: 647, loss: 0.3262552320957184, mean loss: 0.3403530510900669
Epoch: 60, step: 648, loss: 0.3629956543445587, mean loss: 0.3403533104881956
Epoch: 60, step: 649, loss: 0.3249269723892212, mean loss: 0.34035313376304843
Epoch: 60, step: 650, loss: 0.3326893150806427, mean loss: 0.3403530459668417
Epoch: 60, step: 651, loss: 0.3705241084098816, mean loss: 0.34035339160060474
Epoch: 60, step: 652, loss: 0.3113401532173157, mean loss: 0.34035305923445414
Epoch: 60, step: 653, loss: 0.33888891339302063, mean loss: 0.34035304246187137
Epoch: 60, step: 654, loss: 0.3309580981731415, mean loss: 0.3403529348389343
Epoch: 60, step: 655, loss: 0.32914888858795166, mean loss: 0.34035280649346317
Epoch: 60, step: 656, loss: 0.34677085280418396, mean loss: 0.34035288001312947
Epoch: 60, step: 657, loss: 0.31780481338500977, mean loss: 0.3403526217246621
Epoch: 60, step: 658, loss: 0.32827672362327576, mean loss: 0.3403524833966388
Epoch: 60, step: 659, loss: 0.42293471097946167, mean loss: 0.34035342935571766
Epoch: 60, step: 660, loss: 0.3161630630493164, mean loss: 0.34035315226420315
Epoch: 60, step: 661, loss: 0.3197588622570038, mean loss: 0.3403529163670873
Epoch: 60, step: 662, loss: 0.326673299074173, mean loss: 0.3403527596758248
Epoch: 60, step: 663, loss: 0.34864571690559387, mean loss: 0.34035285466525517
Epoch: 60, step: 664, loss: 0.3155200779438019, mean loss: 0.34035257022820437
Epoch: 60, step: 665, loss: 0.31695154309272766, mean loss: 0.3403523021936233
Epoch: 60, step: 666, loss: 0.3840668499469757, mean loss: 0.3403528028928542
Epoch: 60, step: 667, loss: 0.3353138566017151, mean loss: 0.34035274517825426
Epoch: 60, step: 668, loss: 0.3434414267539978, mean loss: 0.340352780554694
Epoch: 60, step: 669, loss: 0.31702864170074463, mean loss: 0.340352513413028
Epoch: 60, step: 670, loss: 0.31033140420913696, mean loss: 0.34035216957194037
Epoch: 60, step: 671, loss: 0.3234565556049347, mean loss: 0.3403519760634425
Epoch: 60, step: 672, loss: 0.3318352997303009, mean loss: 0.3403518785215377
Epoch: 60, step: 673, loss: 0.31183311343193054, mean loss: 0.34035155189848654
Epoch: 60, step: 674, loss: 0.3463570177555084, mean loss: 0.34035162067780117
Epoch: 60, step: 675, loss: 0.3008725047111511, mean loss: 0.34035116853711717
Epoch: 60, step: 676, loss: 0.32043588161468506, mean loss: 0.3403509404568244
Epoch: 60, step: 677, loss: 0.3411470353603363, mean loss: 0.3403509495740156
Epoch: 60, step: 678, loss: 0.32551974058151245, mean loss: 0.3403507797231356
Epoch: 60, step: 679, loss: 0.37179067730903625, mean loss: 0.340351139776933
Epoch: 60, step: 680, loss: 0.36837008595466614, mean loss: 0.3403514606498751
Epoch: 60, step: 681, loss: 0.30188801884651184, mean loss: 0.34035102017162444
Epoch: 60, step: 682, loss: 0.3275248408317566, mean loss: 0.34035087328959635
Epoch: 60, step: 683, loss: 0.3126487731933594, mean loss: 0.3403505560560741
Epoch: 60, step: 684, loss: 0.3529573082923889, mean loss: 0.34035070042197435
Epoch: 60, step: 685, loss: 0.3227578401565552, mean loss: 0.34035049896009284
Epoch: 60, step: 686, loss: 0.27709200978279114, mean loss: 0.34034977457371546
Epoch: 60, step: 687, loss: 0.3279469311237335, mean loss: 0.3403496325477507
Epoch: 60, step: 688, loss: 0.3592832386493683, mean loss: 0.34034984935552476
Epoch: 60, step: 689, loss: 0.35937386751174927, mean loss: 0.3403500671961083
Epoch: 60, step: 690, loss: 0.3599749803543091, mean loss: 0.34035029191485827
Epoch: 60, step: 691, loss: 0.33628344535827637, mean loss: 0.340350245347202
Epoch: 60, step: 692, loss: 0.339420884847641, mean loss: 0.3403502347056289
Epoch: 60, step: 693, loss: 0.3084649443626404, mean loss: 0.3403498696096715
Epoch: 60, step: 694, loss: 0.3533323407173157, mean loss: 0.34035001826108396
Epoch: 60, step: 695, loss: 0.3309331238269806, mean loss: 0.3403499104373408
Epoch: 60, step: 696, loss: 0.3199560046195984, mean loss: 0.34034967692913903
Epoch: 60, step: 697, loss: 0.3102467358112335, mean loss: 0.3403493322573911
Epoch: 60, step: 698, loss: 0.33765456080436707, mean loss: 0.34034930140323144
Epoch: 60, step: 699, loss: 0.32791876792907715, mean loss: 0.34034915907974306
Epoch: 60, step: 700, loss: 0.3392408788204193, mean loss: 0.340349146390625
Epoch: 60, step: 701, loss: 0.30586281418800354, mean loss: 0.3403487515481414
Epoch: 60, step: 702, loss: 0.33839118480682373, mean loss: 0.34034872913573583
Epoch: 60, step: 703, loss: 0.298479288816452, mean loss: 0.34034824977321154
Epoch: 60, step: 704, loss: 0.3903942406177521, mean loss: 0.34034882274236655
Epoch: 60, step: 705, loss: 0.29481178522109985, mean loss: 0.3403483014015207
Epoch: 60, step: 706, loss: 0.3346128463745117, mean loss: 0.34034823573864703
Epoch: 60, step: 707, loss: 0.3522969186306, mean loss: 0.34034837253265365
Epoch: 60, step: 708, loss: 0.3132171332836151, mean loss: 0.34034806192532846
Epoch: 60, step: 709, loss: 0.32436907291412354, mean loss: 0.34034787899471586
Epoch: 60, step: 710, loss: 0.37137264013290405, mean loss: 0.34034823416822435
Epoch: 60, step: 711, loss: 0.32600370049476624, mean loss: 0.3403480699529382
Epoch: 60, step: 712, loss: 0.40095871686935425, mean loss: 0.34034876381172857
Epoch: 60, step: 713, loss: 0.30635398626327515, mean loss: 0.3403483746506421
Epoch: 60, step: 714, loss: 0.36126628518104553, mean loss: 0.34034861410929396
Epoch: 60, step: 715, loss: 0.3529858887195587, mean loss: 0.34034875877336523
Epoch: 60, step: 716, loss: 0.3142475485801697, mean loss: 0.34034845998551544
Epoch: 60, step: 717, loss: 0.3418581187725067, mean loss: 0.3403484772668038
Epoch: 60, step: 718, loss: 0.3199971318244934, mean loss: 0.34034824430459676
Epoch: 60, step: 719, loss: 0.3209759294986725, mean loss: 0.34034802255190894
Epoch: 60, step: 720, loss: 0.3403502404689789, mean loss: 0.3403480225772969
Epoch: 60, step: 721, loss: 0.3012577295303345, mean loss: 0.3403475751253951
Epoch: 60, step: 722, loss: 0.3176540732383728, mean loss: 0.3403473153643763
Epoch: 60, step: 723, loss: 0.30652546882629395, mean loss: 0.3403469282272656
Epoch: 60, step: 724, loss: 0.32611265778541565, mean loss: 0.3403467652985133
Epoch: 60, step: 725, loss: 0.3716956079006195, mean loss: 0.34034712412051044
Epoch: 60, step: 726, loss: 0.31427088379859924, mean loss: 0.3403468256526642
Epoch: 60, step: 727, loss: 0.37273654341697693, mean loss: 0.3403471963801361
Epoch: 60, step: 728, loss: 0.379266619682312, mean loss: 0.340347641840463
Epoch: 60, step: 729, loss: 0.3089957535266876, mean loss: 0.34034728300003364
Epoch: 60, step: 730, loss: 0.3787881135940552, mean loss: 0.3403477229724569
Epoch: 60, step: 731, loss: 0.3405858874320984, mean loss: 0.340347725698324
Epoch: 60, step: 732, loss: 0.3623284101486206, mean loss: 0.34034797727128646
Epoch: 60, step: 733, loss: 0.37090444564819336, mean loss: 0.3403483269916653
Epoch: 60, step: 734, loss: 0.3077595829963684, mean loss: 0.34034795401605444
Epoch: 60, step: 735, loss: 0.38651329278945923, mean loss: 0.34034848236867726
Epoch: 60, step: 736, loss: 0.3232826590538025, mean loss: 0.3403482870561429
Epoch: 60, step: 737, loss: 0.34887462854385376, mean loss: 0.34034838463609995
Epoch: 60, step: 738, loss: 0.29440969228744507, mean loss: 0.3403478588954489
Epoch: 60, step: 739, loss: 0.32631197571754456, mean loss: 0.34034769826506234
Epoch: 60, step: 740, loss: 0.29089680314064026, mean loss: 0.3403471323423203
Epoch: 60, step: 741, loss: 0.2890731990337372, mean loss: 0.3403465455631975
Epoch: 60, step: 742, loss: 0.3466285169124603, mean loss: 0.3403466174532831
Epoch: 60, step: 743, loss: 0.3136177062988281, mean loss: 0.3403463115745049
Epoch: 60, step: 744, loss: 0.32056137919425964, mean loss: 0.34034608516342313
Epoch: 60, step: 745, loss: 0.33830001950263977, mean loss: 0.3403460617493103
Epoch: 60, step: 746, loss: 0.3439854681491852, mean loss: 0.34034610339631044
Epoch: 60, step: 747, loss: 0.32903075218200684, mean loss: 0.3403459739122713
Epoch: 60, step: 748, loss: 0.3281620144844055, mean loss: 0.34034583449015376
Epoch: 60, step: 749, loss: 0.31082645058631897, mean loss: 0.34034549670111724
Epoch: 60, step: 750, loss: 0.3164599537849426, mean loss: 0.34034522338300766
Epoch: 60, step: 751, loss: 0.3319782614707947, mean loss: 0.34034512764241454
Epoch: 60, step: 752, loss: 0.32568275928497314, mean loss: 0.3403449598673255
Epoch: 60, step: 753, loss: 0.34283843636512756, mean loss: 0.34034498839876354
Epoch: 60, step: 754, loss: 0.3535730540752411, mean loss: 0.3403451397582884
Epoch: 60, step: 755, loss: 0.31800177693367004, mean loss: 0.34034488410170427
Epoch: 60, step: 756, loss: 0.3264797031879425, mean loss: 0.34034472545574485
Epoch: 60, step: 757, loss: 0.34866541624069214, mean loss: 0.34034482066033517
Epoch: 60, step: 758, loss: 0.32834720611572266, mean loss: 0.3403446833862869
Epoch: 60, step: 759, loss: 0.3077380955219269, mean loss: 0.34034431031319917
Epoch: 60, step: 760, loss: 0.32701122760772705, mean loss: 0.3403441577625109
Epoch: 60, step: 761, loss: 0.29452016949653625, mean loss: 0.3403436334725832
Epoch: 60, step: 762, loss: 0.29970183968544006, mean loss: 0.3403431684794618
Epoch: 60, step: 763, loss: 0.37954986095428467, mean loss: 0.3403436170480911
Epoch: 60, step: 764, loss: 0.3512986898422241, mean loss: 0.3403437423850031
Epoch: 60, step: 765, loss: 0.336419016122818, mean loss: 0.34034369748275084
Epoch: 60, step: 766, loss: 0.31205108761787415, mean loss: 0.34034337379460383
Epoch: 60, step: 767, loss: 0.3292231559753418, mean loss: 0.34034324657263537
Epoch: 60, step: 768, loss: 0.2925352156162262, mean loss: 0.3403426996263145
Epoch: 60, step: 769, loss: 0.318952351808548, mean loss: 0.34034245491349197
Epoch: 60, step: 770, loss: 0.3354361951351166, mean loss: 0.3403423987848608
Epoch: 60, step: 771, loss: 0.29642927646636963, mean loss: 0.34034189641536555
Epoch: 60, step: 772, loss: 0.3163195848464966, mean loss: 0.34034162160141834
Epoch: 60, step: 773, loss: 0.35820794105529785, mean loss: 0.34034182598881
Epoch: 60, step: 774, loss: 0.3181878328323364, mean loss: 0.3403415725541231
Epoch: 60, step: 775, loss: 0.2892366051673889, mean loss: 0.3403409879361197
Epoch: 60, step: 776, loss: 0.3505435883998871, mean loss: 0.3403411046479774
Epoch: 60, step: 777, loss: 0.30741292238235474, mean loss: 0.340340727972896
Epoch: 60, step: 778, loss: 0.3276536464691162, mean loss: 0.3403405828433303
Epoch: 60, step: 779, loss: 0.2965530455112457, mean loss: 0.34034008195637844
Epoch: 60, step: 780, loss: 0.3368867039680481, mean loss: 0.340340042453536
Epoch: 60, step: 781, loss: 0.3153475821018219, mean loss: 0.34033975657057347
Epoch: 60, step: 782, loss: 0.34000271558761597, mean loss: 0.3403397527152839
Epoch: 60, step: 783, loss: 0.34686508774757385, mean loss: 0.34033982735537166
Epoch: 60, step: 784, loss: 0.3245672583580017, mean loss: 0.3403396469428009
Epoch: 60, step: 785, loss: 0.3211834132671356, mean loss: 0.3403394278291084
Epoch: 60, step: 786, loss: 0.34574201703071594, mean loss: 0.3403394896245401
Epoch: 60, step: 787, loss: 0.3093724250793457, mean loss: 0.34033913542377436
Epoch: 60, step: 788, loss: 0.33197811245918274, mean loss: 0.34033903979162755
Epoch: 60, step: 789, loss: 0.3121412396430969, mean loss: 0.34033871727303955
Epoch: 60, step: 790, loss: 0.33029839396476746, mean loss: 0.34033860243593017
Epoch: 60, step: 791, loss: 0.31794241070747375, mean loss: 0.34033834628038384
Epoch: 60, step: 792, loss: 0.3337589502334595, mean loss: 0.34033827102966563
Epoch: 60, step: 793, loss: 0.38287246227264404, mean loss: 0.34033875750164727
Epoch: 60, step: 794, loss: 0.30926012992858887, mean loss: 0.3403384020532848
Epoch: 60, step: 795, loss: 0.29633480310440063, mean loss: 0.3403378987869077
Epoch: 60, step: 796, loss: 0.3129679262638092, mean loss: 0.34033758576184364
Epoch: 60, step: 797, loss: 0.3368023633956909, mean loss: 0.3403375453306539
Epoch: 60, step: 798, loss: 0.3292050361633301, mean loss: 0.34033741801321926
Epoch: 60, step: 799, loss: 0.32521671056747437, mean loss: 0.3403372450865559
Epoch: 60, step: 800, loss: 0.3515683710575104, mean loss: 0.3403373735288881
Epoch: 60, step: 801, loss: 0.3334571421146393, mean loss: 0.3403372948455161
Epoch: 60, step: 802, loss: 0.3319328725337982, mean loss: 0.34033719873236457
Epoch: 60, step: 803, loss: 0.328649640083313, mean loss: 0.34033706507472483
Epoch: 60, step: 804, loss: 0.386772096157074, mean loss: 0.34033759609457825
Epoch: 60, step: 805, loss: 0.3496733605861664, mean loss: 0.340337702854916
Epoch: 60, step: 806, loss: 0.3456589877605438, mean loss: 0.3403377637064593
Epoch: 60, step: 807, loss: 0.34757891297340393, mean loss: 0.3403378465116609
Epoch: 60, step: 808, loss: 0.31334787607192993, mean loss: 0.34033753787496474
Epoch: 60, step: 809, loss: 0.31697314977645874, mean loss: 0.34033727070071546
Epoch: 60, step: 810, loss: 0.319600373506546, mean loss: 0.34033703357481415
Epoch: 60, step: 811, loss: 0.2920288145542145, mean loss: 0.3403364811778533
Epoch: 60, step: 812, loss: 0.34318631887435913, mean loss: 0.3403365137649309
Epoch: 60, step: 813, loss: 0.37561002373695374, mean loss: 0.3403369171027996
Epoch: 60, step: 814, loss: 0.3338989317417145, mean loss: 0.340336843487965
Epoch: 60, step: 815, loss: 0.3398894667625427, mean loss: 0.3403368383725158
Epoch: 60, step: 816, loss: 0.3457190692424774, mean loss: 0.340336899913969
Epoch: 60, step: 817, loss: 0.30913665890693665, mean loss: 0.3403365431685482
Epoch: 60, step: 818, loss: 0.3031248152256012, mean loss: 0.34033611769229144
Epoch: 60, step: 819, loss: 0.33676111698150635, mean loss: 0.34033607681645434
Epoch: 60, step: 820, loss: 0.3226264417171478, mean loss: 0.3403358743303737
Epoch: 60, step: 821, loss: 0.3756147623062134, mean loss: 0.3403362776928394
Epoch: 60, step: 822, loss: 0.35363197326660156, mean loss: 0.34033642970792666
Epoch: 60, step: 823, loss: 0.33600306510925293, mean loss: 0.34033638016337575
Epoch: 60, step: 824, loss: 0.3238106369972229, mean loss: 0.3403361912221631
Epoch: 60, step: 825, loss: 0.2858884036540985, mean loss: 0.3403355687198471
Epoch: 60, step: 826, loss: 0.29788675904273987, mean loss: 0.3403350834075616
Epoch: 60, step: 827, loss: 0.29874342679977417, mean loss: 0.34033460790044345
Epoch: 60, step: 828, loss: 0.3098088204860687, mean loss: 0.3403342589106595
Epoch: 60, step: 829, loss: 0.3181014060974121, mean loss: 0.3403340047337667
Epoch: 60, step: 830, loss: 0.31865039467811584, mean loss: 0.3403337568389209
Epoch: 60, step: 831, loss: 0.325553297996521, mean loss: 0.34033358786531975
Epoch: 60, step: 832, loss: 0.34376662969589233, mean loss: 0.340333627112194
Epoch: 60, step: 833, loss: 0.33698540925979614, mean loss: 0.3403335888354735
Epoch: 60, step: 834, loss: 0.33441099524497986, mean loss: 0.340333521129345
Epoch: 60, step: 835, loss: 0.2967555522918701, mean loss: 0.3403330229587744
Epoch: 60, step: 836, loss: 0.3116418123245239, mean loss: 0.3403326949730109
Epoch: 60, step: 837, loss: 0.3126905858516693, mean loss: 0.34033237898374363
Epoch: 60, step: 838, loss: 0.38589173555374146, mean loss: 0.34033289978709724
Epoch: 60, step: 839, loss: 0.3225940465927124, mean loss: 0.3403326970109976
Epoch: 60, step: 840, loss: 0.35118845105171204, mean loss: 0.34033282110370394
Epoch: 60, step: 841, loss: 0.3233659863471985, mean loss: 0.3403326271571234
Epoch: 60, step: 842, loss: 0.34050536155700684, mean loss: 0.34033262913161444
Epoch: 60, step: 843, loss: 0.328928679227829, mean loss: 0.3403324987769221
Epoch: 60, step: 844, loss: 0.3896714746952057, mean loss: 0.3403330627476133
Epoch: 60, step: 845, loss: 0.37246283888816833, mean loss: 0.34033343000381594
Epoch: 60, step: 846, loss: 0.32864782214164734, mean loss: 0.34033329643416715
Epoch: 60, step: 847, loss: 0.3242150545120239, mean loss: 0.34033311220042173
Epoch: 60, step: 848, loss: 0.3134405016899109, mean loss: 0.3403328048176592
Epoch: 60, step: 849, loss: 0.31689801812171936, mean loss: 0.3403325369609133
Epoch: 60, step: 850, loss: 0.33050134778022766, mean loss: 0.3403324245929077
Epoch: 60, step: 851, loss: 0.37441468238830566, mean loss: 0.3403328141400411
Epoch: 60, step: 852, loss: 0.3330425024032593, mean loss: 0.3403327308155267
Epoch: 60, step: 853, loss: 0.3173809051513672, mean loss: 0.34033246849095966
Epoch: 60, step: 854, loss: 0.3567914664745331, mean loss: 0.3403326566045431
Epoch: 60, step: 855, loss: 0.32648342847824097, mean loss: 0.3403324983204144
Epoch: 60, step: 856, loss: 0.3392504155635834, mean loss: 0.3403324859533303
Epoch: 60, step: 857, loss: 0.33487334847450256, mean loss: 0.34033242356176163
Epoch: 60, step: 858, loss: 0.2948340177536011, mean loss: 0.34033190357403825
Epoch: 60, step: 859, loss: 0.3066098392009735, mean loss: 0.34033151817901686
Epoch: 60, step: 860, loss: 0.37587761878967285, mean loss: 0.340331924415524
Epoch: 60, step: 861, loss: 0.35983121395111084, mean loss: 0.3403321472594537
Epoch: 60, step: 862, loss: 0.3790912330150604, mean loss: 0.3403325902052471
Epoch: 60, step: 863, loss: 0.35053953528404236, mean loss: 0.34033270685071565
Epoch: 60, step: 864, loss: 0.3622107207775116, mean loss: 0.34033295687087367
Epoch: 60, step: 865, loss: 0.30493319034576416, mean loss: 0.3403325523298533
Epoch: 60, step: 866, loss: 0.32796022295951843, mean loss: 0.34033241094311434
Epoch: 60, step: 867, loss: 0.3413916528224945, mean loss: 0.3403324230476291
Epoch: 60, step: 868, loss: 0.3259374499320984, mean loss: 0.34033225855057037
Epoch: 60, step: 869, loss: 0.33839741349220276, mean loss: 0.34033223644058225
Epoch: 60, step: 870, loss: 0.3686445951461792, mean loss: 0.3403325599697238
Epoch: 60, step: 871, loss: 0.3111671507358551, mean loss: 0.3403322266964672
Epoch: 60, step: 872, loss: 0.30454787611961365, mean loss: 0.3403318177932119
Epoch: 60, step: 873, loss: 0.33362534642219543, mean loss: 0.34033174116008613
Epoch: 60, step: 874, loss: 0.3060721158981323, mean loss: 0.3403313496886211
Epoch: 60, step: 875, loss: 0.3427269160747528, mean loss: 0.34033137706151734
Epoch: 60, step: 876, loss: 0.3421202600002289, mean loss: 0.3403313975019225
Epoch: 60, step: 877, loss: 0.3390667140483856, mean loss: 0.34033138305137
Epoch: 60, step: 878, loss: 0.3285035789012909, mean loss: 0.3403312479058113
Epoch: 60, step: 879, loss: 0.361581027507782, mean loss: 0.3403314907049384
Epoch: 60, step: 880, loss: 0.29438310861587524, mean loss: 0.3403309657065713
Epoch: 60, step: 881, loss: 0.31121358275413513, mean loss: 0.3403306330201273
Epoch: 60, step: 882, loss: 0.30000627040863037, mean loss: 0.3403301722913747
Epoch: 60, step: 883, loss: 0.30638188123703003, mean loss: 0.34032978441729383
Epoch: 60, step: 884, loss: 0.39753246307373047, mean loss: 0.34033043797546186
Epoch: 60, step: 885, loss: 0.33733487129211426, mean loss: 0.3403304037505837
Epoch: 60, step: 886, loss: 0.33959800004959106, mean loss: 0.34033039538283777
Epoch: 60, step: 887, loss: 0.372363805770874, mean loss: 0.3403307613618432
Epoch: 60, step: 888, loss: 0.3296998143196106, mean loss: 0.3403306399055597
Epoch: 60, step: 889, loss: 0.3491641879081726, mean loss: 0.3403307408257928
Epoch: 60, step: 890, loss: 0.30149006843566895, mean loss: 0.34033029708960344
Epoch: 60, step: 891, loss: 0.2895069122314453, mean loss: 0.3403297164632627
Epoch: 60, step: 892, loss: 0.36727893352508545, mean loss: 0.34033002433820203
Epoch: 60, step: 893, loss: 0.2856443226337433, mean loss: 0.3403293996015088
Epoch: 60, step: 894, loss: 0.3377401828765869, mean loss: 0.34032937002229224
Epoch: 60, step: 895, loss: 0.30585286021232605, mean loss: 0.3403289761670806
Epoch: 60, step: 896, loss: 0.31816771626472473, mean loss: 0.34032872300259126
Epoch: 60, step: 897, loss: 0.3399930000305176, mean loss: 0.34032871916742286
Epoch: 60, step: 898, loss: 0.34280234575271606, mean loss: 0.34032874742484626
Epoch: 60, step: 899, loss: 0.31007102131843567, mean loss: 0.34032840178027113
Epoch: 60, step: 900, loss: 0.31048762798309326, mean loss: 0.34032806090258183
Epoch: 60, step: 901, loss: 0.3097057640552521, mean loss: 0.3403277111013796
Epoch: 60, step: 902, loss: 0.3120505213737488, mean loss: 0.34032738809223295
Epoch: 60, step: 903, loss: 0.3406708538532257, mean loss: 0.34032739201558304
Epoch: 60, step: 904, loss: 0.36441129446029663, mean loss: 0.3403276671187008
Epoch: 60, step: 905, loss: 0.3179188370704651, mean loss: 0.34032741115235116
Epoch: 60, step: 906, loss: 0.29980194568634033, mean loss: 0.34032694825281756
Epoch: 60, step: 907, loss: 0.33886805176734924, mean loss: 0.34032693158885624
Epoch: 60, step: 908, loss: 0.3311145603656769, mean loss: 0.3403268263635399
Epoch: 60, step: 909, loss: 0.33794596791267395, mean loss: 0.3403267991692686
Epoch: 60, step: 910, loss: 0.3488208055496216, mean loss: 0.34032689618707973
Epoch: 60, step: 911, loss: 0.31565678119659424, mean loss: 0.34032661441036427
Epoch: 60, step: 912, loss: 0.31387749314308167, mean loss: 0.3403263123176745
Epoch: 60, step: 913, loss: 0.33469682931900024, mean loss: 0.34032624802040656
Epoch: 60, step: 914, loss: 0.31312820315361023, mean loss: 0.34032593738086725
Epoch: 60, step: 915, loss: 0.3112489581108093, mean loss: 0.34032560528507405
Epoch: 60, step: 916, loss: 0.32720696926116943, mean loss: 0.34032545545540854
Epoch: 60, step: 917, loss: 0.30851614475250244, mean loss: 0.34032509216124124
Epoch: 60, step: 918, loss: 0.32079240679740906, mean loss: 0.3403248690809712
Epoch: 60, step: 919, loss: 0.35118189454078674, mean loss: 0.34032499307623687
Epoch: 60, step: 920, loss: 0.3452082872390747, mean loss: 0.3403250488464332
Epoch: 60, step: 921, loss: 0.3291352689266205, mean loss: 0.34032492105378437
Epoch: 60, step: 922, loss: 0.36280569434165955, mean loss: 0.3403251777920561
Epoch: 60, step: 923, loss: 0.31465163826942444, mean loss: 0.34032488459462884
Epoch: 60, step: 924, loss: 0.31685149669647217, mean loss: 0.34032461652647494
Epoch: 60, step: 925, loss: 0.3173130750656128, mean loss: 0.34032435373564907
Epoch: 60, step: 926, loss: 0.3383292555809021, mean loss: 0.34032433095197306
Epoch: 60, step: 927, loss: 0.3210446536540985, mean loss: 0.340324110783906
Epoch: 60, step: 928, loss: 0.35177645087242126, mean loss: 0.3403242415646628
Epoch: 60, step: 929, loss: 0.33057692646980286, mean loss: 0.3403241302558231
Epoch: 60, step: 930, loss: 0.293746680021286, mean loss: 0.3403235983736905
Epoch: 60, step: 931, loss: 0.3219987452030182, mean loss: 0.3403233891189838
Epoch: 60, step: 932, loss: 0.3177322447299957, mean loss: 0.3403231311496966
Epoch: 60, step: 933, loss: 0.3182373642921448, mean loss: 0.3403228789542178
Epoch: 60, step: 934, loss: 0.32521340250968933, mean loss: 0.34032270642237145
Epoch: 60, step: 935, loss: 0.3541191518306732, mean loss: 0.34032286395920125
Epoch: 60, step: 936, loss: 0.3412242531776428, mean loss: 0.3403228742517349
Epoch: 60, step: 937, loss: 0.3152337372303009, mean loss: 0.3403225877741147
Epoch: 60, step: 938, loss: 0.3377457857131958, mean loss: 0.3403225583515127
Epoch: 60, step: 939, loss: 0.33624476194381714, mean loss: 0.34032251179069506
Epoch: 60, step: 940, loss: 0.30408039689064026, mean loss: 0.34032209797816837
Epoch: 60, step: 941, loss: 0.31053322553634644, mean loss: 0.34032175785265806
Epoch: 60, step: 942, loss: 0.3094943165779114, mean loss: 0.3403214058729214
Epoch: 60, step: 943, loss: 0.327401340007782, mean loss: 0.34032125835664145
Epoch: 60, step: 944, loss: 0.3577713072299957, mean loss: 0.3403214575922283
Epoch: 60, step: 945, loss: 0.3459142744541168, mean loss: 0.3403215214473748
Epoch: 60, step: 946, loss: 0.331022709608078, mean loss: 0.3403214152807994
Epoch: 60, step: 947, loss: 0.29630064964294434, mean loss: 0.34032091269179593
Epoch: 60, step: 948, loss: 0.2964310348033905, mean loss: 0.3403204116028705
Epoch: 60, step: 949, loss: 0.3616056442260742, mean loss: 0.34032065461271893
Epoch: 60, step: 950, loss: 0.31469830870628357, mean loss: 0.34032036209013206
Epoch: 60, step: 951, loss: 0.32640284299850464, mean loss: 0.3403202031998328
Epoch: 60, step: 952, loss: 0.31691133975982666, mean loss: 0.34031993595400906
Epoch: 60, step: 953, loss: 0.3251487910747528, mean loss: 0.34031976275556075
Epoch: 60, step: 954, loss: 0.3116934597492218, mean loss: 0.3403194359526267
Epoch: 60, step: 955, loss: 0.3508276641368866, mean loss: 0.3403195559150472
Epoch: 60, step: 956, loss: 0.3126411736011505, mean loss: 0.34031923994095775
Epoch: 60, step: 957, loss: 0.3193412721157074, mean loss: 0.34031900046097163
Epoch: 60, step: 958, loss: 0.30111464858055115, mean loss: 0.3403185529175992
Epoch: 60, step: 959, loss: 0.33881253004074097, mean loss: 0.34031853572555726
Epoch: 60, step: 960, loss: 0.3304320275783539, mean loss: 0.3403184228671636
Epoch: 60, step: 961, loss: 0.3388797640800476, mean loss: 0.340318406444493
Epoch: 60, step: 962, loss: 0.338845431804657, mean loss: 0.3403183896302899
Epoch: 60, step: 963, loss: 0.33683231472969055, mean loss: 0.34031834983673137
Epoch: 60, step: 964, loss: 0.37588372826576233, mean loss: 0.34031875581103
Epoch: 60, step: 965, loss: 0.3528287708759308, mean loss: 0.34031889860964043
Epoch: 60, step: 966, loss: 0.39249640703201294, mean loss: 0.34031949419570573
Epoch: 60, step: 967, loss: 0.3755558133125305, mean loss: 0.34031989640006055
Epoch: 60, step: 968, loss: 0.34997573494911194, mean loss: 0.3403200066152045
Epoch: 60, step: 969, loss: 0.3354974687099457, mean loss: 0.3403199515696857
Epoch: 60, step: 970, loss: 0.34638452529907227, mean loss: 0.3403200207912872
Epoch: 60, step: 971, loss: 0.32732975482940674, mean loss: 0.3403198725208909
Epoch: 60, step: 972, loss: 0.3363696038722992, mean loss: 0.34031982743319106
Epoch: 60, step: 973, loss: 0.35035061836242676, mean loss: 0.34031994192163956
Epoch: 60, step: 974, loss: 0.32638269662857056, mean loss: 0.34031978284790454
Epoch: 60, step: 975, loss: 0.3166322708129883, mean loss: 0.3403195124918961
Epoch: 60, step: 976, loss: 0.32110676169395447, mean loss: 0.34031929321081145
Epoch: 60, step: 977, loss: 0.33710625767707825, mean loss: 0.3403192565398587
Epoch: 60, step: 978, loss: 0.34454765915870667, mean loss: 0.3403193047988279
Epoch: 60, step: 979, loss: 0.3658420741558075, mean loss: 0.34031959608813805
Epoch: 60, step: 980, loss: 0.3033592700958252, mean loss: 0.3403191742677298
Epoch: 60, step: 981, loss: 0.3180583417415619, mean loss: 0.34031892021244087
Epoch: 60, step: 982, loss: 0.33707138895988464, mean loss: 0.34031888314989733
Epoch: 60, step: 983, loss: 0.369114488363266, mean loss: 0.34031921177681707
Epoch: 60, step: 984, loss: 0.3164549469947815, mean loss: 0.34031893943142727
Epoch: 60, step: 985, loss: 0.317162424325943, mean loss: 0.34031867516608244
Epoch: 60, step: 986, loss: 0.34826457500457764, mean loss: 0.3403187658447527
Epoch: 60, step: 987, loss: 0.34146326780319214, mean loss: 0.3403187789056688
Epoch: 60, step: 988, loss: 0.30218151211738586, mean loss: 0.3403183436928193
Epoch: 60, step: 989, loss: 0.3449398875236511, mean loss: 0.3403183964321076
Epoch: 60, step: 990, loss: 0.331121563911438, mean loss: 0.34031829148257464
Epoch: 60, step: 991, loss: 0.35826098918914795, mean loss: 0.34031849623309623
Epoch: 60, step: 992, loss: 0.31709274649620056, mean loss: 0.3403182311988085
Epoch: 60, step: 993, loss: 0.3070259392261505, mean loss: 0.3403178512972637
Epoch: 60, step: 994, loss: 0.33920562267303467, mean loss: 0.3403178386056608
Epoch: 60, step: 995, loss: 0.3056679666042328, mean loss: 0.3403174432216633
Epoch: 60, step: 996, loss: 0.3382526636123657, mean loss: 0.3403174196610712
Epoch: 60, step: 997, loss: 0.3688771724700928, mean loss: 0.3403177455442818
Epoch: 60, step: 998, loss: 0.31067898869514465, mean loss: 0.3403174073528733
Epoch: 60, step: 999, loss: 0.3128758370876312, mean loss: 0.34031709423591455
Epoch: 60, step: 1000, loss: 0.33430415391921997, mean loss: 0.34031702562715477
Epoch: 60, step: 1001, loss: 0.30453023314476013, mean loss: 0.34031661729790075
Epoch: 60, step: 1002, loss: 0.4170524775981903, mean loss: 0.34031749284826185
Epoch: 60, step: 1003, loss: 0.31188198924064636, mean loss: 0.34031716840501863
Epoch: 60, step: 1004, loss: 0.32876530289649963, mean loss: 0.34031703660211476
Epoch: 60, step: 1005, loss: 0.3356530964374542, mean loss: 0.3403169833887318
Epoch: 60, step: 1006, loss: 0.32191023230552673, mean loss: 0.34031677337867916
Epoch: 60, step: 1007, loss: 0.3086808919906616, mean loss: 0.3403164124362573
Epoch: 60, step: 1008, loss: 0.29391783475875854, mean loss: 0.3403158830682363
Epoch: 60, step: 1009, loss: 0.3141154646873474, mean loss: 0.3403155841473192
Epoch: 60, step: 1010, loss: 0.31332653760910034, mean loss: 0.3403152762324462
Epoch: 60, step: 1011, loss: 0.3209027051925659, mean loss: 0.3403150547592221
Epoch: 60, step: 1012, loss: 0.31303849816322327, mean loss: 0.34031474357128105
Epoch: 60, step: 1013, loss: 0.35210737586021423, mean loss: 0.3403148781074379
Epoch: 60, step: 1014, loss: 0.3143400549888611, mean loss: 0.3403145817772443
Epoch: 60, step: 1015, loss: 0.34895801544189453, mean loss: 0.34031468038354235
Epoch: 60, step: 1016, loss: 0.3204275965690613, mean loss: 0.34031445350966105
Epoch: 60, step: 1017, loss: 0.3471575677394867, mean loss: 0.34031453157571584
Epoch: 60, step: 1018, loss: 0.33155760169029236, mean loss: 0.3403144316780455
Epoch: 60, step: 1019, loss: 0.3242535889148712, mean loss: 0.340314248460583
Epoch: 60, step: 1020, loss: 0.356249064207077, mean loss: 0.340314430238292
Epoch: 60, step: 1021, loss: 0.3371741771697998, mean loss: 0.3403143944160079
Epoch: 60, step: 1022, loss: 0.3677675127983093, mean loss: 0.3403147075825478
Epoch: 60, step: 1023, loss: 0.3063761293888092, mean loss: 0.3403143204387009
Epoch: 60, step: 1024, loss: 0.3093205690383911, mean loss: 0.340313966891089
Epoch: 60, step: 1025, loss: 0.32482439279556274, mean loss: 0.3403137902025884
Epoch: 60, step: 1026, loss: 0.3366755545139313, mean loss: 0.34031374870195885
Epoch: 60, step: 1027, loss: 0.32643356919288635, mean loss: 0.34031359037532305
Epoch: 60, step: 1028, loss: 0.3414223790168762, mean loss: 0.3403136030227656
Epoch: 60, step: 1029, loss: 0.3106946051120758, mean loss: 0.3403132651763197
Epoch: 60, step: 1030, loss: 0.3150336742401123, mean loss: 0.34031297683021966
Epoch: 60, step: 1031, loss: 0.32573896646499634, mean loss: 0.34031281059686846
Epoch: 60, step: 1032, loss: 0.3235420882701874, mean loss: 0.34031261930967255
Epoch: 60, step: 1033, loss: 0.33970895409584045, mean loss: 0.3403126124243335
Epoch: 60, step: 1034, loss: 0.28810304403305054, mean loss: 0.3403120169345315
Epoch: 60, step: 1035, loss: 0.29877132177352905, mean loss: 0.34031154313674006
Epoch: 60, step: 1036, loss: 0.30333584547042847, mean loss: 0.34031112141043024
Epoch: 60, step: 1037, loss: 0.3368120491504669, mean loss: 0.34031108150221767
Epoch: 60, step: 1038, loss: 0.3435473144054413, mean loss: 0.3403111184122292
Epoch: 60, step: 1039, loss: 0.3281155824661255, mean loss: 0.34031097932080645
Epoch: 60, step: 1040, loss: 0.3544260263442993, mean loss: 0.34031114030262716
Epoch: 60, step: 1041, loss: 0.309052437543869, mean loss: 0.34031078380183155
Epoch: 60, step: 1042, loss: 0.32422930002212524, mean loss: 0.34031060039702354
Epoch: 60, step: 1043, loss: 0.31651434302330017, mean loss: 0.3403103290104835
Epoch: 60, step: 1044, loss: 0.301799476146698, mean loss: 0.34030988981503546
Epoch: 60, step: 1045, loss: 0.3211315870285034, mean loss: 0.3403096710993592
Epoch: 60, step: 1046, loss: 0.3937613070011139, mean loss: 0.34031028067245334
Epoch: 60, step: 1047, loss: 0.3217589259147644, mean loss: 0.34031006911152417
Epoch: 60, step: 1048, loss: 0.3418370485305786, mean loss: 0.3403100865251042
Epoch: 60, step: 1049, loss: 0.3337131142616272, mean loss: 0.34031001129449334
Epoch: 60, step: 1050, loss: 0.35829785466194153, mean loss: 0.34031021642208187
Epoch: 60, step: 1051, loss: 0.3231942057609558, mean loss: 0.3403100212388193
Epoch: 60, step: 1052, loss: 0.30714938044548035, mean loss: 0.3403096430941465
Epoch: 60, step: 1053, loss: 0.29509350657463074, mean loss: 0.3403091274814875
Epoch: 60, step: 1054, loss: 0.29791146516799927, mean loss: 0.3403086440142167
Epoch: 60, step: 1055, loss: 0.33771049976348877, mean loss: 0.34030861438750337
Epoch: 60, step: 1056, loss: 0.33360719680786133, mean loss: 0.3403085379719181
Epoch: 60, step: 1057, loss: 0.346671462059021, mean loss: 0.34030861052686906
Epoch: 60, step: 1058, loss: 0.31765809655189514, mean loss: 0.3403083522512448
Epoch: 60, step: 1059, loss: 0.31990480422973633, mean loss: 0.340308119599614
Epoch: 60, step: 1060, loss: 0.3976720869541168, mean loss: 0.3403087736852841
Epoch: 60, step: 1061, loss: 0.33772411942481995, mean loss: 0.34030874421441387
Epoch: 60, step: 1062, loss: 0.3282727897167206, mean loss: 0.34030860697903426
Epoch: 60, step: 1063, loss: 0.31354111433029175, mean loss: 0.3403083017763907
Epoch: 60, step: 1064, loss: 0.3093280494213104, mean loss: 0.340307948543937
Epoch: 60, step: 1065, loss: 0.3516552150249481, mean loss: 0.34030807792238865
Epoch: 60, step: 1066, loss: 0.3301412761211395, mean loss: 0.34030796200459645
Epoch: 60, step: 1067, loss: 0.3237702548503876, mean loss: 0.3403077734504491
Epoch: 60, step: 1068, loss: 0.33802106976509094, mean loss: 0.3403077473789663
Epoch: 60, step: 1069, loss: 0.2940210700035095, mean loss: 0.34030721965490546
Epoch: 60, step: 1070, loss: 0.32371291518211365, mean loss: 0.34030703046193683
Epoch: 60, step: 1071, loss: 0.3211873471736908, mean loss: 0.3403068124794112
Epoch: 60, step: 1072, loss: 0.3466861844062805, mean loss: 0.34030688520947316
Epoch: 60, step: 1073, loss: 0.3118637502193451, mean loss: 0.34030656093814826
Epoch: 60, step: 1074, loss: 0.3418477773666382, mean loss: 0.3403065785088765
Epoch: 60, step: 1075, loss: 0.325825572013855, mean loss: 0.3403064134191951
Epoch: 60, step: 1076, loss: 0.361457496881485, mean loss: 0.34030665454786413
Epoch: 60, step: 1077, loss: 0.3812209367752075, mean loss: 0.3403071209775847
Epoch: 60, step: 1078, loss: 0.32023051381111145, mean loss: 0.3403068921034848
Epoch: 60, step: 1079, loss: 0.3195610046386719, mean loss: 0.3403066556022597
Epoch: 60, step: 1080, loss: 0.3096943497657776, mean loss: 0.3403063066287432
Epoch: 60, step: 1081, loss: 0.28625914454460144, mean loss: 0.3403056905100719
Epoch: 60, step: 1082, loss: 0.3329531252384186, mean loss: 0.3403056066943648
Epoch: 60, step: 1083, loss: 0.3075545132160187, mean loss: 0.3403052333519103
Epoch: 60, step: 1084, loss: 0.31512683629989624, mean loss: 0.3403049463368399
Epoch: 60, step: 1085, loss: 0.3986817002296448, mean loss: 0.34030561178099433
Epoch: 60, step: 1086, loss: 0.325657457113266, mean loss: 0.34030544480669145
Epoch: 60, step: 1087, loss: 0.3299718201160431, mean loss: 0.3403053270150549
Epoch: 60, step: 1088, loss: 0.29607048630714417, mean loss: 0.3403048227936377
Epoch: 60, step: 1089, loss: 0.3341742157936096, mean loss: 0.3403047529132433
Epoch: 60, step: 1090, loss: 0.32374778389930725, mean loss: 0.34030456418897237
Epoch: 60, step: 1091, loss: 0.28951355814933777, mean loss: 0.3403039852553331
Epoch: 60, step: 1092, loss: 0.3652474880218506, mean loss: 0.3403042695668552
Epoch: 60, step: 1093, loss: 0.31451651453971863, mean loss: 0.3403039756357108
Epoch: 60, step: 1094, loss: 0.3029688894748688, mean loss: 0.3403035500919009
Epoch: 60, step: 1095, loss: 0.33949899673461914, mean loss: 0.3403035409217386
Epoch: 60, step: 1096, loss: 0.36798155307769775, mean loss: 0.34030385638741617
Epoch: 60, step: 1097, loss: 0.30592355132102966, mean loss: 0.34030346453548127
Epoch: 60, step: 1098, loss: 0.3173592686653137, mean loss: 0.3403032030303824
Epoch: 60, step: 1099, loss: 0.34318599104881287, mean loss: 0.3403032358864118
Epoch: 60, step: 1100, loss: 0.35053202509880066, mean loss: 0.3403033524657671
Epoch: 60, step: 1101, loss: 0.3619067668914795, mean loss: 0.34030359868097104
Epoch: 60, step: 1102, loss: 0.32678651809692383, mean loss: 0.34030344462787754
Epoch: 60, step: 1103, loss: 0.3434731364250183, mean loss: 0.3403034807521914
Epoch: 60, step: 1104, loss: 0.3760671317577362, mean loss: 0.3403038883383901
Epoch: 60, step: 1105, loss: 0.3137590289115906, mean loss: 0.3403035858190795
Epoch: 60, step: 1106, loss: 0.36510249972343445, mean loss: 0.34030386843744714
Epoch: 60, step: 1107, loss: 0.36347123980522156, mean loss: 0.34030413245909286
Epoch: 60, step: 1108, loss: 0.3425807058811188, mean loss: 0.3403041584032452
Epoch: 60, step: 1109, loss: 0.3642551004886627, mean loss: 0.3403044313484541
Epoch: 60, step: 1110, loss: 0.30126500129699707, mean loss: 0.3403039864597343
Epoch: 60, step: 1111, loss: 0.2987896502017975, mean loss: 0.34030351337266784
Epoch: 60, step: 1112, loss: 0.39907991886138916, mean loss: 0.3403041831663557
Epoch: 60, step: 1113, loss: 0.32449668645858765, mean loss: 0.3403040030321543
Epoch: 60, step: 1114, loss: 0.33038291335105896, mean loss: 0.3403038899777451
Epoch: 60, step: 1115, loss: 0.35804954171180725, mean loss: 0.3403040921935677
Epoch: 60, step: 1116, loss: 0.3300243318080902, mean loss: 0.34030397505464566
Epoch: 60, step: 1117, loss: 0.3224432170391083, mean loss: 0.3403037715317986
Epoch: 60, step: 1118, loss: 0.39879265427589417, mean loss: 0.3403044380034168
Epoch: 60, step: 1119, loss: 0.329931378364563, mean loss: 0.34030431980538084
Epoch: 60, step: 1120, loss: 0.32794371247291565, mean loss: 0.34030417896141446
Epoch: 60, step: 1121, loss: 0.3063419461250305, mean loss: 0.3403037919803425
Epoch: 60, step: 1122, loss: 0.3742607831954956, mean loss: 0.3403041788972803
Epoch: 60, step: 1123, loss: 0.3090204894542694, mean loss: 0.34030382244486884
Epoch: 60, step: 1124, loss: 0.3570229709148407, mean loss: 0.3403040129439114
Epoch: 60, step: 1125, loss: 0.32031577825546265, mean loss: 0.34030378519928717
Epoch: 60, step: 1126, loss: 0.35470685362815857, mean loss: 0.34030394930502655
Epoch: 60, step: 1127, loss: 0.33871129155158997, mean loss: 0.340303931158803
Epoch: 60, step: 1128, loss: 0.3457880914211273, mean loss: 0.34030399364282654
Epoch: 60, step: 1129, loss: 0.35882899165153503, mean loss: 0.3403042047058094
Epoch: 60, step: 1130, loss: 0.3421531617641449, mean loss: 0.34030422577150377
Epoch: 60, step: 1131, loss: 0.34957069158554077, mean loss: 0.340304331345785
Epoch: 60, step: 1132, loss: 0.33118557929992676, mean loss: 0.3403042274556133
Epoch: 60, step: 1133, loss: 0.33529141545295715, mean loss: 0.3403041703451705
Epoch: 60, step: 1134, loss: 0.3359616696834564, mean loss: 0.3403041208720784
Epoch: 60, step: 1135, loss: 0.3352124094963074, mean loss: 0.3403040628640651
Epoch: 60, step: 1136, loss: 0.404767781496048, mean loss: 0.340304797267367
Epoch: 60, step: 1137, loss: 0.31452465057373047, mean loss: 0.34030450357023684
Epoch: 60, step: 1138, loss: 0.3391982913017273, mean loss: 0.3403044909679941
Epoch: 60, step: 1139, loss: 0.3468524217605591, mean loss: 0.34030456556278554
Epoch: 60, step: 1140, loss: 0.3573991358280182, mean loss: 0.34030476030390566
Epoch: 60, step: 1141, loss: 0.3305785655975342, mean loss: 0.3403046495044854
Epoch: 60, step: 1142, loss: 0.31000348925590515, mean loss: 0.34030430432193015
Epoch: 60, step: 1143, loss: 0.3470776677131653, mean loss: 0.34030438148136
Epoch: 60, step: 1144, loss: 0.31681886315345764, mean loss: 0.3403041139468344
Epoch: 60, step: 1145, loss: 0.3492637574672699, mean loss: 0.34030421600916233
Epoch: 60, step: 1146, loss: 0.35634520649909973, mean loss: 0.3403043987354258
Epoch: 60, step: 1147, loss: 0.3317151963710785, mean loss: 0.34030430089514735
Epoch: 60, step: 1148, loss: 0.3058048188686371, mean loss: 0.3403039079133156
Epoch: 60, step: 1149, loss: 0.3365142345428467, mean loss: 0.3403038647458322
Epoch: 60, step: 1150, loss: 0.3164936304092407, mean loss: 0.3403035935308519
Epoch: 60, step: 1151, loss: 0.3021600544452667, mean loss: 0.34030315905460023
Epoch: 60, step: 1152, loss: 0.31132981181144714, mean loss: 0.3403028290357235
Epoch: 60, step: 1153, loss: 0.39892029762268066, mean loss: 0.34030349670627713
Epoch: 60, step: 1154, loss: 0.3489993214607239, mean loss: 0.34030359575320185
Epoch: 60, step: 1155, loss: 0.3541885018348694, mean loss: 0.3403037539028451
Epoch: 60, step: 1156, loss: 0.3202228248119354, mean loss: 0.3403035251828537
Epoch: 60, step: 1157, loss: 0.3983500003814697, mean loss: 0.34030418631949916
Epoch: 60, step: 1158, loss: 0.3330840766429901, mean loss: 0.34030410408496714
Epoch: 60, step: 1159, loss: 0.3183581233024597, mean loss: 0.3403038541307441
Epoch: 60, step: 1160, loss: 0.3235669732093811, mean loss: 0.34030366350784774
Epoch: 60, step: 1161, loss: 0.3030296266078949, mean loss: 0.3403032389840681
Epoch: 60, step: 1162, loss: 0.3462594151496887, mean loss: 0.3403033068197476
Epoch: 60, step: 1163, loss: 0.3506350517272949, mean loss: 0.34030342448801904
Epoch: 60, step: 1164, loss: 0.3505631983280182, mean loss: 0.340303541335281
Epoch: 60, step: 1165, loss: 0.32289236783981323, mean loss: 0.34030334304389437
Epoch: 60, step: 1166, loss: 0.3313572108745575, mean loss: 0.3403032411598513
Epoch: 60, step: 1167, loss: 0.3446217179298401, mean loss: 0.34030329034075474
Epoch: 60, step: 1168, loss: 0.3246113955974579, mean loss: 0.34030311163589827
Epoch: 60, step: 1169, loss: 0.30084124207496643, mean loss: 0.3403026622352655
Epoch: 60, step: 1170, loss: 0.3217024803161621, mean loss: 0.3403024504146289
Epoch: 60, step: 1171, loss: 0.31092140078544617, mean loss: 0.34030211582425823
Epoch: 60, step: 1172, loss: 0.2992134988307953, mean loss: 0.34030164791384643
Epoch: 60, step: 1173, loss: 0.32832980155944824, mean loss: 0.34030151158198185
Epoch: 60, step: 1174, loss: 0.33635130524635315, mean loss: 0.34030146659870636
Epoch: 60, step: 1175, loss: 0.3366723358631134, mean loss: 0.34030142527217433
Epoch: 60, step: 1176, loss: 0.33205947279930115, mean loss: 0.3403013314184504
Epoch: 60, step: 1177, loss: 0.3149459660053253, mean loss: 0.34030104269215955
Epoch: 60, step: 1178, loss: 0.3105158507823944, mean loss: 0.3403007035264675
Epoch: 60, step: 1179, loss: 0.32207340002059937, mean loss: 0.3403004959734784
Epoch: 60, step: 1180, loss: 0.34680068492889404, mean loss: 0.34030056998981795
Epoch: 60, step: 1181, loss: 0.3337915241718292, mean loss: 0.34030049587347105
Epoch: 60, step: 1182, loss: 0.31779754161834717, mean loss: 0.34030023964270856
Epoch: 60, step: 1183, loss: 0.33091282844543457, mean loss: 0.3403001327538035
Epoch: 60, step: 1184, loss: 0.31813523173332214, mean loss: 0.34029988037804465
Epoch: 60, step: 1185, loss: 0.30773958563804626, mean loss: 0.34029950964164835
Epoch: 60, step: 1186, loss: 0.3089899718761444, mean loss: 0.3402991531506175
Epoch: 60, step: 1187, loss: 0.31173473596572876, mean loss: 0.3402988279192882
Epoch: 60, step: 1188, loss: 0.31781715154647827, mean loss: 0.3402985719482949
Epoch: 60, step: 1189, loss: 0.3347320556640625, mean loss: 0.34029850856999266
Epoch: 60, step: 1190, loss: 0.3025352656841278, mean loss: 0.3402980786165265
Epoch: 60, step: 1191, loss: 0.32907402515411377, mean loss: 0.34029795082650166
Epoch: 60, step: 1192, loss: 0.3299576938152313, mean loss: 0.3402978331001686
Epoch: 60, step: 1193, loss: 0.3282400965690613, mean loss: 0.34029769582147773
Epoch: 60, step: 1194, loss: 0.32805562019348145, mean loss: 0.3402975564456523
Epoch: 60, step: 1195, loss: 0.3299624025821686, mean loss: 0.3402974387814387
Epoch: 60, step: 1196, loss: 0.33635789155960083, mean loss: 0.34029739393078096
Epoch: 60, step: 1197, loss: 0.3034683167934418, mean loss: 0.34029697464667685
Epoch: 60, step: 1198, loss: 0.3500319719314575, mean loss: 0.3402970854744104
Epoch: 60, step: 1199, loss: 0.3024621903896332, mean loss: 0.3402966547492842
Epoch: 60, step: 1200, loss: 0.3108959197998047, mean loss: 0.34029632004527416
Epoch: 60, step: 1201, loss: 0.3254132866859436, mean loss: 0.34029615061569196
Epoch: 60, step: 1202, loss: 0.3434693515300751, mean loss: 0.34029618673924095
Epoch: 60, step: 1203, loss: 0.33423739671707153, mean loss: 0.3402961177670855
Epoch: 60, step: 1204, loss: 0.32563409209251404, mean loss: 0.34029595085917186
Epoch: 60, step: 1205, loss: 0.3227512836456299, mean loss: 0.34029575113844224
Epoch: 60, step: 1206, loss: 0.3636840879917145, mean loss: 0.340296017377891
Epoch: 60, step: 1207, loss: 0.31499484181404114, mean loss: 0.34029572936705904
Epoch: 60, step: 1208, loss: 0.3224365711212158, mean loss: 0.34029552607324526
Epoch: 60, step: 1209, loss: 0.3280414342880249, mean loss: 0.34029538658443725
Epoch: 60, step: 1210, loss: 0.32292604446411133, mean loss: 0.34029518887078436
Epoch: 60, step: 1211, loss: 0.28989937901496887, mean loss: 0.3402946152263613
Epoch: 60, step: 1212, loss: 0.32481488585472107, mean loss: 0.34029443902601103
Epoch: 60, step: 1213, loss: 0.2984883189201355, mean loss: 0.34029396316697097
Epoch: 60, step: 1214, loss: 0.3335881531238556, mean loss: 0.3402938868388161
Epoch: 60, step: 1215, loss: 0.324261337518692, mean loss: 0.3402937043521411
Epoch: 60, step: 1216, loss: 0.31014159321784973, mean loss: 0.3402933611568222
Epoch: 60, step: 1217, loss: 0.31397631764411926, mean loss: 0.34029306161615985
Epoch: 60, step: 1218, loss: 0.3329036235809326, mean loss: 0.3402929775105129
Epoch: 60, step: 1219, loss: 0.3488328754901886, mean loss: 0.3402930747094428
Epoch: 60, step: 1220, loss: 0.28287792205810547, mean loss: 0.3402924212323295
Epoch: 60, step: 1221, loss: 0.3107821047306061, mean loss: 0.34029208536111666
Epoch: 60, step: 1222, loss: 0.3225642740726471, mean loss: 0.3402918835946019
Epoch: 60, step: 1223, loss: 0.31457072496414185, mean loss: 0.3402915908562946
Epoch: 60, step: 1224, loss: 0.31648871302604675, mean loss: 0.34029131995345696
Epoch: 60, step: 1225, loss: 0.30789855122566223, mean loss: 0.34029095129244213
Epoch: 60, step: 1226, loss: 0.3628483712673187, mean loss: 0.3402912080147608
Epoch: 60, step: 1227, loss: 0.3068384826183319, mean loss: 0.3402908272990805
Epoch: 60, step: 1228, loss: 0.33126139640808105, mean loss: 0.3402907245389388
Epoch: 60, step: 1229, loss: 0.32781514525413513, mean loss: 0.34029058256125266
Epoch: 60, step: 1230, loss: 0.35159775614738464, mean loss: 0.34029071124049365
Epoch: 60, step: 1231, loss: 0.28415173292160034, mean loss: 0.34029007236828956
Epoch: 60, step: 1232, loss: 0.3426201045513153, mean loss: 0.34029009888419526
Epoch: 60, step: 1233, loss: 0.3142186403274536, mean loss: 0.34028980219281263
Epoch: 60, step: 1234, loss: 0.29997718334198, mean loss: 0.34028934344323825
Epoch: 60, step: 1235, loss: 0.3738113343715668, mean loss: 0.34028972491247816
Epoch: 60, step: 1236, loss: 0.33587872982025146, mean loss: 0.34028967471737487
Epoch: 60, step: 1237, loss: 0.3244786262512207, mean loss: 0.34028949479693443
Epoch: 60, step: 1238, loss: 0.3338100016117096, mean loss: 0.3402894210649486
Epoch: 60, step: 1239, loss: 0.33810701966285706, mean loss: 0.34028939623106824
Epoch: 60, step: 1240, loss: 0.345441997051239, mean loss: 0.3402894548626362
Epoch: 60, step: 1241, loss: 0.3219568729400635, mean loss: 0.3402892462581219
Epoch: 60, step: 1242, loss: 0.3541335165500641, mean loss: 0.34028940378881944
Epoch: 60, step: 1243, loss: 0.30974116921424866, mean loss: 0.34028905619159383
Epoch: 60, step: 1244, loss: 0.35087499022483826, mean loss: 0.3402891766437078
Epoch: 60, step: 1245, loss: 0.34265434741973877, mean loss: 0.34028920355551145
Epoch: 60, step: 1246, loss: 0.3396267294883728, mean loss: 0.34028919601771784
Epoch: 60, step: 1247, loss: 0.3398377299308777, mean loss: 0.3402891908808836
Epoch: 60, step: 1248, loss: 0.32710206508636475, mean loss: 0.34028904083792266
Epoch: 60, step: 1249, loss: 0.34015676379203796, mean loss: 0.3402890393328931
Epoch: 60, step: 1250, loss: 0.329926460981369, mean loss: 0.3402889214302825
Epoch: 60, step: 1251, loss: 0.3048378527164459, mean loss: 0.34028851808221083
Epoch: 60, step: 1252, loss: 0.3291572034358978, mean loss: 0.3402883914360087
Epoch: 60, step: 1253, loss: 0.3459574282169342, mean loss: 0.3402884559345727
Epoch: 60, step: 1254, loss: 0.34026697278022766, mean loss: 0.3402884556901543
Epoch: 60, step: 1255, loss: 0.3286077678203583, mean loss: 0.3402883227980105
Epoch: 60, step: 1256, loss: 0.2757123112678528, mean loss: 0.3402875881197902
Epoch: 60, step: 1257, loss: 0.364115446805954, mean loss: 0.34028785920512417
Epoch: 60, step: 1258, loss: 0.3167707920074463, mean loss: 0.3402875916586538
Epoch: 60, step: 1259, loss: 0.311324805021286, mean loss: 0.34028726216164995
Epoch: 60, step: 1260, loss: 0.32679593563079834, mean loss: 0.3402871086784526
Epoch: 60, step: 1261, loss: 0.30807143449783325, mean loss: 0.34028674218310345
Epoch: 60, step: 1262, loss: 0.3290782570838928, mean loss: 0.34028661467340415
Epoch: 60, step: 1263, loss: 0.327113538980484, mean loss: 0.34028646481588126
Epoch: 60, step: 1264, loss: 0.3589288294315338, mean loss: 0.34028667688987724
Epoch: 60, step: 1265, loss: 0.3477880358695984, mean loss: 0.340286762223745
Epoch: 60, step: 1266, loss: 0.3286276161670685, mean loss: 0.3402866295932826
Epoch: 60, step: 1267, loss: 0.32457488775253296, mean loss: 0.34028645086390824
Epoch: 60, step: 1268, loss: 0.3292046785354614, mean loss: 0.34028632480432014
Epoch: 60, step: 1269, loss: 0.36167338490486145, mean loss: 0.34028656808790675
Epoch: 60, step: 1270, loss: 0.33289849758148193, mean loss: 0.34028648404756473
Epoch: 60, step: 1271, loss: 0.34749314188957214, mean loss: 0.34028656602337964
Epoch: 60, step: 1272, loss: 0.33498385548591614, mean loss: 0.3402865057056731
Epoch: 60, step: 1273, loss: 0.3096182942390442, mean loss: 0.340286156862355
Epoch: 60, step: 1274, loss: 0.30132219195365906, mean loss: 0.3402857136619352
Epoch: 60, step: 1275, loss: 0.33967235684394836, mean loss: 0.3402857066853119
Epoch: 60, step: 1276, loss: 0.3270570635795593, mean loss: 0.3402855562179039
Epoch: 60, step: 1277, loss: 0.3649744391441345, mean loss: 0.3402858370350622
Epoch: 60, step: 1278, loss: 0.36731335520744324, mean loss: 0.34028614444891103
Epoch: 60, step: 1279, loss: 0.34001296758651733, mean loss: 0.34028614134180385
Epoch: 60, step: 1280, loss: 0.31012672185897827, mean loss: 0.3402857983131818
Epoch: 60, step: 1281, loss: 0.3366096615791321, mean loss: 0.3402857565018407
Epoch: 60, step: 1282, loss: 0.3267483711242676, mean loss: 0.34028560253319334
Epoch: 60, step: 1283, loss: 0.34519675374031067, mean loss: 0.3402856583899697
Epoch: 60, step: 1284, loss: 0.3287431597709656, mean loss: 0.34028552711332916
Epoch: 60, step: 1285, loss: 0.3465697467327118, mean loss: 0.34028559858501695
Epoch: 60, step: 1286, loss: 0.30606675148010254, mean loss: 0.34028520941164464
Epoch: 60, step: 1287, loss: 0.32128965854644775, mean loss: 0.3402849933763559
Epoch: 60, step: 1288, loss: 0.2965182065963745, mean loss: 0.34028449562491125
Epoch: 60, step: 1289, loss: 0.36776790022850037, mean loss: 0.3402848081849545
Epoch: 60, step: 1290, loss: 0.3532947897911072, mean loss: 0.3402849561416661
Epoch: 60, step: 1291, loss: 0.34808266162872314, mean loss: 0.3402850448204803
Epoch: 60, step: 1292, loss: 0.35264432430267334, mean loss: 0.3402851853738503
Epoch: 60, step: 1293, loss: 0.36776337027549744, mean loss: 0.34028549786031626
Epoch: 60, step: 1294, loss: 0.32671767473220825, mean loss: 0.340285343566541
Epoch: 60, step: 1295, loss: 0.3356981575489044, mean loss: 0.34028529140148894
Epoch: 60, step: 1296, loss: 0.3168560266494751, mean loss: 0.3402850249691027
Epoch: 60, step: 1297, loss: 0.3274943232536316, mean loss: 0.34028487951774244
Epoch: 60, step: 1298, loss: 0.39322084188461304, mean loss: 0.3402854814800387
Epoch: 60, step: 1299, loss: 0.3500584363937378, mean loss: 0.3402855926121164
Epoch: 60, step: 1300, loss: 0.3711506128311157, mean loss: 0.3402859435862947
Epoch: 60, step: 1301, loss: 0.2918936610221863, mean loss: 0.34028539331131163
Epoch: 60, step: 1302, loss: 0.35586538910865784, mean loss: 0.3402855704714699
Epoch: 60, step: 1303, loss: 0.33913034200668335, mean loss: 0.34028555733551447
Epoch: 60, step: 1304, loss: 0.32298576831817627, mean loss: 0.34028536062405823
Epoch: 60, step: 1305, loss: 0.35080572962760925, mean loss: 0.340285480247111
Epoch: 60, step: 1306, loss: 0.3238636553287506, mean loss: 0.3402852935230054
Epoch: 60, step: 1307, loss: 0.32436463236808777, mean loss: 0.3402851124994329
Epoch: 60, step: 1308, loss: 0.3380904495716095, mean loss: 0.34028508754561954
Epoch: 60, step: 1309, loss: 0.30300459265708923, mean loss: 0.34028466366278964
Epoch: 60, step: 1310, loss: 0.3106369078159332, mean loss: 0.3402843265687731
Epoch: 60, step: 1311, loss: 0.337628573179245, mean loss: 0.34028429637328705
Epoch: 60, step: 1312, loss: 0.38494792580604553, mean loss: 0.34028480418574863
Epoch: 60, step: 1313, loss: 0.32688602805137634, mean loss: 0.34028465184729745
Epoch: 60, step: 1314, loss: 0.3346611261367798, mean loss: 0.34028458791090144
Epoch: 60, step: 1315, loss: 0.3669942617416382, mean loss: 0.3402848915817577
Epoch: 60, step: 1316, loss: 0.34516602754592896, mean loss: 0.3402849470763285
Epoch: 60, step: 1317, loss: 0.3390386402606964, mean loss: 0.3402849329069884
Epoch: 60, step: 1318, loss: 0.3351275324821472, mean loss: 0.3402848742728472
Epoch: 60, step: 1319, loss: 0.361204594373703, mean loss: 0.3402851121050448
Epoch: 60, step: 1320, loss: 0.3219165802001953, mean loss: 0.3402849032791799
Epoch: 60, step: 1321, loss: 0.355457603931427, mean loss: 0.3402850757707177
Epoch: 60, step: 1322, loss: 0.3780781924724579, mean loss: 0.34028550541860036
Epoch: 60, step: 1323, loss: 0.3497399389743805, mean loss: 0.3402856128993147
Epoch: 60, step: 1324, loss: 0.3372529149055481, mean loss: 0.34028557842312535
Epoch: 60, step: 1325, loss: 0.31680530309677124, mean loss: 0.3402853114986849
Epoch: 60, step: 1326, loss: 0.2814796268939972, mean loss: 0.3402846430015825
Epoch: 60, step: 1327, loss: 0.3577161431312561, mean loss: 0.3402848411588685
Epoch: 60, step: 1328, loss: 0.3435116410255432, mean loss: 0.3402848778399705
Epoch: 60, step: 1329, loss: 0.3155513107776642, mean loss: 0.34028459668085875
Epoch: 60, step: 1330, loss: 0.3121010959148407, mean loss: 0.3402842763082273
Epoch: 60, step: 1331, loss: 0.3479821979999542, mean loss: 0.34028436381245236
Epoch: 60, step: 1332, loss: 0.3242584466934204, mean loss: 0.3402841816438652
Epoch: 60, step: 1333, loss: 0.3515118360519409, mean loss: 0.3402843092685544
Epoch: 60, step: 1334, loss: 0.3237132132053375, mean loss: 0.34028412090713284
Epoch: 60, step: 1335, loss: 0.30859795212745667, mean loss: 0.34028376073880534
Epoch: 60, step: 1336, loss: 0.3391646444797516, mean loss: 0.34028374801825045
Epoch: 60, step: 1337, loss: 0.4033954441547394, mean loss: 0.3402844653759551
Epoch: 60, step: 1338, loss: 0.33750277757644653, mean loss: 0.34028443375832135
Epoch: 60, step: 1339, loss: 0.33298832178115845, mean loss: 0.3402843508291104
Epoch: 60, step: 1340, loss: 0.30366265773773193, mean loss: 0.3402839345836359
Epoch: 60, step: 1341, loss: 0.3421909213066101, mean loss: 0.34028395625837304
Epoch: 60, step: 1342, loss: 0.3065003752708435, mean loss: 0.340283572279866
Epoch: 60, step: 1343, loss: 0.3044991195201874, mean loss: 0.3402831655644091
Epoch: 60, step: 1344, loss: 0.2957104444503784, mean loss: 0.34028265896986326
Epoch: 60, step: 1345, loss: 0.31831830739974976, mean loss: 0.34028240933524445
Epoch: 60, step: 1346, loss: 0.34292641282081604, mean loss: 0.3402824393851778
Epoch: 60, step: 1347, loss: 0.338735431432724, mean loss: 0.34028242180314444
Epoch: 60, step: 1348, loss: 0.4180690050125122, mean loss: 0.3402833058520961
Epoch: 60, step: 1349, loss: 0.3082224726676941, mean loss: 0.3402829414830407
Epoch: 60, step: 1350, loss: 0.3063359558582306, mean loss: 0.3402825556823836
Epoch: 60, step: 1351, loss: 0.2938389182090759, mean loss: 0.3402820278657926
Epoch: 60, step: 1352, loss: 0.3462009131908417, mean loss: 0.3402820951312038
Epoch: 60, step: 1353, loss: 0.3643280863761902, mean loss: 0.34028236839973625
Epoch: 60, step: 1354, loss: 0.3382377624511719, mean loss: 0.34028234516425754
Epoch: 60, step: 1355, loss: 0.2985122799873352, mean loss: 0.3402818704828496
Epoch: 60, step: 1356, loss: 0.3583391308784485, mean loss: 0.340282075685986
Epoch: 60, step: 1357, loss: 0.3183801770210266, mean loss: 0.3402818267951173
Epoch: 60, step: 1358, loss: 0.3277018964290619, mean loss: 0.34028168383973867
Epoch: 60, step: 1359, loss: 0.3651809096336365, mean loss: 0.34028196678548633
Epoch: 60, step: 1360, loss: 0.322797566652298, mean loss: 0.34028176810137895
Epoch: 60, step: 1361, loss: 0.36189788579940796, mean loss: 0.34028201373349753
Epoch: 60, step: 1362, loss: 0.37256020307540894, mean loss: 0.34028238051859966
Epoch: 60, step: 1363, loss: 0.32967710494995117, mean loss: 0.3402822600095822
Epoch: 60, step: 1364, loss: 0.35447099804878235, mean loss: 0.34028242123608116
Epoch: 60, step: 1365, loss: 0.34250807762145996, mean loss: 0.34028244652590667
Epoch: 60, step: 1366, loss: 0.33465638756752014, mean loss: 0.34028238259850363
Epoch: 60, step: 1367, loss: 0.3410778343677521, mean loss: 0.3402823916369066
Epoch: 60, step: 1368, loss: 0.3007736802101135, mean loss: 0.3402819427201887
Epoch: 60, step: 1369, loss: 0.33465254306793213, mean loss: 0.34028187875700666
Epoch: 60, step: 1370, loss: 0.38906803727149963, mean loss: 0.34028243307588174
Epoch: 60, step: 1371, loss: 0.31257206201553345, mean loss: 0.3402821182282353
Epoch: 60, step: 1372, loss: 0.30555853247642517, mean loss: 0.3402817237003161
Epoch: 60, step: 1373, loss: 0.2979239225387573, mean loss: 0.340281242438231
Epoch: 60, step: 1374, loss: 0.3547544777393341, mean loss: 0.34028140687878433
Epoch: 60, step: 1375, loss: 0.33689096570014954, mean loss: 0.34028136835804745
Epoch: 60, step: 1376, loss: 0.33592817187309265, mean loss: 0.34028131889946006
Epoch: 60, step: 1377, loss: 0.30218517780303955, mean loss: 0.3402808860772976
Epoch: 60, step: 1378, loss: 0.32434889674186707, mean loss: 0.34028070507104513
Epoch: 60, step: 1379, loss: 0.29598188400268555, mean loss: 0.3402802017897333
Epoch: 60, step: 1380, loss: 0.30783718824386597, mean loss: 0.34027983320708205
Epoch: 60, step: 1381, loss: 0.30545032024383545, mean loss: 0.34027943751608475
Epoch: 60, step: 1382, loss: 0.3317285478115082, mean loss: 0.3402793403722734
Epoch: 60, step: 1383, loss: 0.3401228189468384, mean loss: 0.3402793385941058
Epoch: 60, step: 1384, loss: 0.3379283547401428, mean loss: 0.3402793118859677
Epoch: 60, step: 1385, loss: 0.3060895800590515, mean loss: 0.3402789234810439
Epoch: 60, step: 1386, loss: 0.3741317689418793, mean loss: 0.3402793080544754
Epoch: 60, step: 1387, loss: 0.32846540212631226, mean loss: 0.3402791738482464
Epoch: 60, step: 1388, loss: 0.31676042079925537, mean loss: 0.34027890667773386
Epoch: 60, step: 1389, loss: 0.3149949312210083, mean loss: 0.34027861945774684
Epoch: 60, step: 1390, loss: 0.31812962889671326, mean loss: 0.3402783678533057
Epoch: 60, step: 1391, loss: 0.3563510477542877, mean loss: 0.3402785504310036
Epoch: 60, step: 1392, loss: 0.4027620851993561, mean loss: 0.34027926020500615
Epoch: 60, step: 1393, loss: 0.3398270606994629, mean loss: 0.34027925506836004
Epoch: 60, step: 1394, loss: 0.2999791204929352, mean loss: 0.3402787972943545
Epoch: 60, step: 1395, loss: 0.30517470836639404, mean loss: 0.3402783985473768
Epoch: 60, step: 1396, loss: 0.34245020151138306, mean loss: 0.34027842321658364
Epoch: 60, step: 1397, loss: 0.37231266498565674, mean loss: 0.3402787870849333
Epoch: 60, step: 1398, loss: 0.3444456458091736, mean loss: 0.340278834414625
Epoch: 60, step: 1399, loss: 0.33734679222106934, mean loss: 0.34027880111110165
Epoch: 60, step: 1400, loss: 0.31840699911117554, mean loss: 0.3402785526836417
Epoch: 60, step: 1401, loss: 0.32852065563201904, mean loss: 0.34027841913491436
Epoch: 60, step: 1402, loss: 0.3359679877758026, mean loss: 0.3402783701766626
Epoch: 60, step: 1403, loss: 0.3187991678714752, mean loss: 0.3402781262167982
Epoch: 60, step: 1404, loss: 0.31861332058906555, mean loss: 0.34027788015165394
Epoch: 60, step: 1405, loss: 0.3297913670539856, mean loss: 0.3402777610489906
Epoch: 60, step: 1406, loss: 0.3906864821910858, mean loss: 0.34027833356958914
Epoch: 60, step: 1407, loss: 0.31823182106018066, mean loss: 0.3402780831776153
Epoch: 60, step: 1408, loss: 0.32624074816703796, mean loss: 0.34027792375121624
Epoch: 60, step: 1409, loss: 0.34700265526771545, mean loss: 0.3402780001252255
Epoch: 60, step: 1410, loss: 0.2976832389831543, mean loss: 0.3402775163742046
Epoch: 60, step: 1411, loss: 0.33899182081222534, mean loss: 0.340277501772656
Epoch: 60, step: 1412, loss: 0.2858348786830902, mean loss: 0.340276883478866
Epoch: 60, step: 1413, loss: 0.3511073589324951, mean loss: 0.34027700647697456
Epoch: 60, step: 1414, loss: 0.3440374433994293, mean loss: 0.34027704918252133
Epoch: 60, step: 1415, loss: 0.3282829821109772, mean loss: 0.3402769129729834
Epoch: 60, step: 1416, loss: 0.3018133342266083, mean loss: 0.3402764761697906
Epoch: 60, step: 1417, loss: 0.3590882420539856, mean loss: 0.3402766897990564
Epoch: 60, step: 1418, loss: 0.3111143410205841, mean loss: 0.34027635863076267
Epoch: 60, step: 1419, loss: 0.3221530616283417, mean loss: 0.3402761528245283
Epoch: 60, step: 1420, loss: 0.3112683892250061, mean loss: 0.3402758234191888
Epoch: 60, step: 1421, loss: 0.36734846234321594, mean loss: 0.34027613084621666
Epoch: 60, step: 1422, loss: 0.33819475769996643, mean loss: 0.34027610721116963
Epoch: 60, step: 1423, loss: 0.34398967027664185, mean loss: 0.3402761493800816
Epoch: 60, step: 1424, loss: 0.3151743412017822, mean loss: 0.34027586434280027
Epoch: 60, step: 1425, loss: 0.34112778306007385, mean loss: 0.34027587401643955
Epoch: 60, step: 1426, loss: 0.34301578998565674, mean loss: 0.34027590512816097
Epoch: 60, step: 1427, loss: 0.34445425868034363, mean loss: 0.3402759525727896
Epoch: 60, step: 1428, loss: 0.29971012473106384, mean loss: 0.3402754919586366
Epoch: 60, step: 1429, loss: 0.2922603487968445, mean loss: 0.340274946765686
Epoch: 60, step: 1430, loss: 0.31843283772468567, mean loss: 0.34027469875999694
Epoch: 60, step: 1431, loss: 0.319915771484375, mean loss: 0.3402744675976834
Epoch: 60, step: 1432, loss: 0.31288182735443115, mean loss: 0.34027415657568755
Epoch: 60, step: 1433, loss: 0.3000617027282715, mean loss: 0.34027369999992346
Epoch: 60, step: 1434, loss: 0.35205578804016113, mean loss: 0.3402738337732762
Epoch: 60, step: 1435, loss: 0.33206185698509216, mean loss: 0.34027374053588133
Epoch: 60, step: 1436, loss: 0.30928850173950195, mean loss: 0.34027338873871754
Epoch: 60, step: 1437, loss: 0.28422361612319946, mean loss: 0.3402727523735342
Epoch: 60, step: 1438, loss: 0.2976372539997101, mean loss: 0.34027226831378815
Epoch: 60, step: 1439, loss: 0.31759119033813477, mean loss: 0.34027201080836156
Epoch: 60, step: 1440, loss: 0.31087952852249146, mean loss: 0.3402716771100352
Epoch: 60, step: 1441, loss: 0.3604416847229004, mean loss: 0.34027190610128893
Epoch: 60, step: 1442, loss: 0.2907315492630005, mean loss: 0.3402713436731605
Epoch: 60, step: 1443, loss: 0.32977548241615295, mean loss: 0.340271224515751
Valid: 60, mean loss: 0.1853262186050415
Epoch: 61, step: 0, loss: 0.34245941042900085, mean loss: 0.34027124935750513
Epoch: 61, step: 1, loss: 0.35139200091362, mean loss: 0.3402713756063024
Epoch: 61, step: 2, loss: 0.32157376408576965, mean loss: 0.3402711633432951
Epoch: 61, step: 3, loss: 0.2896397113800049, mean loss: 0.34027058856066905
Epoch: 61, step: 4, loss: 0.30877161026000977, mean loss: 0.34027023097937853
Epoch: 61, step: 5, loss: 0.3309169411659241, mean loss: 0.3402701248005862
Epoch: 61, step: 6, loss: 0.3407647907733917, mean loss: 0.34027013041598364
Epoch: 61, step: 7, loss: 0.345261812210083, mean loss: 0.3402701870804003
Epoch: 61, step: 8, loss: 0.3306520879268646, mean loss: 0.34027007789920366
Epoch: 61, step: 9, loss: 0.33609816431999207, mean loss: 0.34027003054168126
Epoch: 61, step: 10, loss: 0.31077685952186584, mean loss: 0.3402696957534297
Epoch: 61, step: 11, loss: 0.3290327787399292, mean loss: 0.3402695682003397
Epoch: 61, step: 12, loss: 0.3538612425327301, mean loss: 0.3402697224811249
Epoch: 61, step: 13, loss: 0.40588846802711487, mean loss: 0.3402704673192092
Epoch: 61, step: 14, loss: 0.3097575008869171, mean loss: 0.34027012097059645
Epoch: 61, step: 15, loss: 0.3375299870967865, mean loss: 0.3402700898680553
Epoch: 61, step: 16, loss: 0.3159041404724121, mean loss: 0.34026981329969175
Epoch: 61, step: 17, loss: 0.3556743860244751, mean loss: 0.3402699881489883
Epoch: 61, step: 18, loss: 0.3152572810649872, mean loss: 0.3402697042459761
Epoch: 61, step: 19, loss: 0.32521697878837585, mean loss: 0.3402695333941934
Epoch: 61, step: 20, loss: 0.36721447110176086, mean loss: 0.34026983922175946
Epoch: 61, step: 21, loss: 0.3601825535297394, mean loss: 0.34027006523036624
Epoch: 61, step: 22, loss: 0.3215598464012146, mean loss: 0.3402698528724511
Epoch: 61, step: 23, loss: 0.3040679693222046, mean loss: 0.3402694419916735
Epoch: 61, step: 24, loss: 0.3164121210575104, mean loss: 0.34026917122114003
Epoch: 61, step: 25, loss: 0.3383316993713379, mean loss: 0.340269149231901
Epoch: 61, step: 26, loss: 0.3171638548374176, mean loss: 0.340268887002504
Epoch: 61, step: 27, loss: 0.31414783000946045, mean loss: 0.3402685905496146
Epoch: 61, step: 28, loss: 0.33040574193000793, mean loss: 0.34026847861552295
Epoch: 61, step: 29, loss: 0.32998716831207275, mean loss: 0.34026836193360743
Epoch: 61, step: 30, loss: 0.3617439568042755, mean loss: 0.34026860565595746
Epoch: 61, step: 31, loss: 0.37180668115615845, mean loss: 0.3402689635713814
Epoch: 61, step: 32, loss: 0.33740508556365967, mean loss: 0.3402689310705245
Epoch: 61, step: 33, loss: 0.32089313864707947, mean loss: 0.34026871118591046
Epoch: 61, step: 34, loss: 0.33744487166404724, mean loss: 0.34026867914015957
Epoch: 61, step: 35, loss: 0.31760767102241516, mean loss: 0.34026842197937746
Epoch: 61, step: 36, loss: 0.37056946754455566, mean loss: 0.34026876583663695
Epoch: 61, step: 37, loss: 0.33358117938041687, mean loss: 0.3402686899465476
Epoch: 61, step: 38, loss: 0.31219223141670227, mean loss: 0.34026837134120586
Epoch: 61, step: 39, loss: 0.3549021780490875, mean loss: 0.3402685374004713
Epoch: 61, step: 40, loss: 0.3173976540565491, mean loss: 0.3402682778727171
Epoch: 61, step: 41, loss: 0.30734962224960327, mean loss: 0.3402679043319275
Epoch: 61, step: 42, loss: 0.3098410964012146, mean loss: 0.34026755907102074
Epoch: 61, step: 43, loss: 0.30079564452171326, mean loss: 0.34026711117801794
Epoch: 61, step: 44, loss: 0.3342391550540924, mean loss: 0.3402670427787836
Epoch: 61, step: 45, loss: 0.2886354625225067, mean loss: 0.34026645692175134
Epoch: 61, step: 46, loss: 0.31965315341949463, mean loss: 0.34026622302784904
Epoch: 61, step: 47, loss: 0.3281850814819336, mean loss: 0.34026608594776975
Epoch: 61, step: 48, loss: 0.3269173800945282, mean loss: 0.34026593448684306
Epoch: 61, step: 49, loss: 0.3222391605377197, mean loss: 0.34026572994859505
Epoch: 61, step: 50, loss: 0.356651246547699, mean loss: 0.3402659158624386
Epoch: 61, step: 51, loss: 0.3283524513244629, mean loss: 0.34026578069106095
Epoch: 61, step: 52, loss: 0.2921311855316162, mean loss: 0.3402652345572561
Epoch: 61, step: 53, loss: 0.36498403549194336, mean loss: 0.3402655150129158
Epoch: 61, step: 54, loss: 0.32890018820762634, mean loss: 0.34026538606515366
Epoch: 61, step: 55, loss: 0.3301859498023987, mean loss: 0.340265271708037
Epoch: 61, step: 56, loss: 0.308851420879364, mean loss: 0.34026491530351666
Epoch: 61, step: 57, loss: 0.3118892312049866, mean loss: 0.34026459337204135
Epoch: 61, step: 58, loss: 0.28862717747688293, mean loss: 0.3402640075352092
Epoch: 61, step: 59, loss: 0.3717164993286133, mean loss: 0.34026436436598373
Epoch: 61, step: 60, loss: 0.29304206371307373, mean loss: 0.34026382863167487
Epoch: 61, step: 61, loss: 0.3440411686897278, mean loss: 0.34026387148489634
Epoch: 61, step: 62, loss: 0.322941392660141, mean loss: 0.3402636749668206
Epoch: 61, step: 63, loss: 0.3177410066127777, mean loss: 0.3402634194571283
Epoch: 61, step: 64, loss: 0.32600194215774536, mean loss: 0.34026325766882326
Epoch: 61, step: 65, loss: 0.3419322073459625, mean loss: 0.3402632766018882
Epoch: 61, step: 66, loss: 0.3227596580982208, mean loss: 0.34026307803785033
Epoch: 61, step: 67, loss: 0.34828922152519226, mean loss: 0.34026316908676
Epoch: 61, step: 68, loss: 0.3276757001876831, mean loss: 0.3402630262956026
Epoch: 61, step: 69, loss: 0.40652093291282654, mean loss: 0.3402637779110326
Epoch: 61, step: 70, loss: 0.3753569722175598, mean loss: 0.3402641759961589
Epoch: 61, step: 71, loss: 0.3371945321559906, mean loss: 0.3402641411755699
Epoch: 61, step: 72, loss: 0.343244343996048, mean loss: 0.34026417498119876
Epoch: 61, step: 73, loss: 0.39058151841163635, mean loss: 0.3402647457444129
Epoch: 61, step: 74, loss: 0.31366869807243347, mean loss: 0.34026444406168427
Epoch: 61, step: 75, loss: 0.30165305733680725, mean loss: 0.3402640060922341
Epoch: 61, step: 76, loss: 0.3806817829608917, mean loss: 0.34026446454639037
Epoch: 61, step: 77, loss: 0.34329912066459656, mean loss: 0.3402644989677524
Epoch: 61, step: 78, loss: 0.3166965842247009, mean loss: 0.34026423164569275
Epoch: 61, step: 79, loss: 0.35042375326156616, mean loss: 0.3402643468800471
Epoch: 61, step: 80, loss: 0.32552939653396606, mean loss: 0.34026417975079687
Epoch: 61, step: 81, loss: 0.37177574634552, mean loss: 0.3402645371625723
Epoch: 61, step: 82, loss: 0.2824549376964569, mean loss: 0.3402638814796131
Epoch: 61, step: 83, loss: 0.2994726300239563, mean loss: 0.3402634188259127
Epoch: 61, step: 84, loss: 0.33848220109939575, mean loss: 0.34026339862359983
Epoch: 61, step: 85, loss: 0.3167405128479004, mean loss: 0.3402631318334697
Epoch: 61, step: 86, loss: 0.3592735230922699, mean loss: 0.34026334744167713
Epoch: 61, step: 87, loss: 0.30207666754722595, mean loss: 0.3402629143486329
Epoch: 61, step: 88, loss: 0.3289392292499542, mean loss: 0.3402627859228666
Epoch: 61, step: 89, loss: 0.3460855484008789, mean loss: 0.34026285196004846
Epoch: 61, step: 90, loss: 0.3274737298488617, mean loss: 0.34026270691755217
Epoch: 61, step: 91, loss: 0.33942243456840515, mean loss: 0.34026269738806175
Epoch: 61, step: 92, loss: 0.3362828195095062, mean loss: 0.3402626522529599
Epoch: 61, step: 93, loss: 0.36796247959136963, mean loss: 0.34026296638831494
Epoch: 61, step: 94, loss: 0.3204931318759918, mean loss: 0.34026274218715014
Epoch: 61, step: 95, loss: 0.3187180161476135, mean loss: 0.34026249786047696
Epoch: 61, step: 96, loss: 0.3380454480648041, mean loss: 0.3402624727184419
Epoch: 61, step: 97, loss: 0.33364608883857727, mean loss: 0.3402623976874392
Epoch: 61, step: 98, loss: 0.33429792523384094, mean loss: 0.3402623300499983
Epoch: 61, step: 99, loss: 0.3687661290168762, mean loss: 0.34026265328095817
Epoch: 61, step: 100, loss: 0.33266782760620117, mean loss: 0.3402625671571766
Epoch: 61, step: 101, loss: 0.33779779076576233, mean loss: 0.3402625392074296
Epoch: 61, step: 102, loss: 0.3413503170013428, mean loss: 0.34026255154232926
Epoch: 61, step: 103, loss: 0.31437447667121887, mean loss: 0.34026225798680165
Epoch: 61, step: 104, loss: 0.3353525996208191, mean loss: 0.3402622023147976
Epoch: 61, step: 105, loss: 0.32033756375312805, mean loss: 0.34026197638625055
Epoch: 61, step: 106, loss: 0.34410181641578674, mean loss: 0.3402620199262947
Epoch: 61, step: 107, loss: 0.34755176305770874, mean loss: 0.34026210258394085
Epoch: 61, step: 108, loss: 0.32750359177589417, mean loss: 0.3402619579181419
Epoch: 61, step: 109, loss: 0.28128546476364136, mean loss: 0.3402612892049284
Epoch: 61, step: 110, loss: 0.32775941491127014, mean loss: 0.34026114745228603
Epoch: 61, step: 111, loss: 0.32034918665885925, mean loss: 0.3402609216828544
Epoch: 61, step: 112, loss: 0.33532464504241943, mean loss: 0.34026086571409536
Epoch: 61, step: 113, loss: 0.32557058334350586, mean loss: 0.340260699153829
Epoch: 61, step: 114, loss: 0.3365497589111328, mean loss: 0.34026065707919956
Epoch: 61, step: 115, loss: 0.3866342604160309, mean loss: 0.3402611828570152
Epoch: 61, step: 116, loss: 0.34488415718078613, mean loss: 0.3402612352710958
Epoch: 61, step: 117, loss: 0.3460172116756439, mean loss: 0.34026130053011944
Epoch: 61, step: 118, loss: 0.3664938807487488, mean loss: 0.3402615979415478
Epoch: 61, step: 119, loss: 0.3636634647846222, mean loss: 0.34026186325680385
Epoch: 61, step: 120, loss: 0.3319384455680847, mean loss: 0.3402617688923382
Epoch: 61, step: 121, loss: 0.3448217511177063, mean loss: 0.34026182058930016
Epoch: 61, step: 122, loss: 0.3108513653278351, mean loss: 0.34026148716388877
Epoch: 61, step: 123, loss: 0.3027228116989136, mean loss: 0.34026106159392383
Epoch: 61, step: 124, loss: 0.3577732741832733, mean loss: 0.3402612601248287
Epoch: 61, step: 125, loss: 0.3039246201515198, mean loss: 0.3402608481914881
Epoch: 61, step: 126, loss: 0.3290165662765503, mean loss: 0.34026072072119623
Epoch: 61, step: 127, loss: 0.34436413645744324, mean loss: 0.34026076723885523
Epoch: 61, step: 128, loss: 0.38701626658439636, mean loss: 0.3402612972684353
Epoch: 61, step: 129, loss: 0.3346759080886841, mean loss: 0.3402612339520776
Epoch: 61, step: 130, loss: 0.36648470163345337, mean loss: 0.34026153121974956
Epoch: 61, step: 131, loss: 0.34212490916252136, mean loss: 0.34026155234265176
Epoch: 61, step: 132, loss: 0.3508358299732208, mean loss: 0.34026167220931725
Epoch: 61, step: 133, loss: 0.36076194047927856, mean loss: 0.34026190459123784
Epoch: 61, step: 134, loss: 0.33065682649612427, mean loss: 0.34026179571358
Epoch: 61, step: 135, loss: 0.3015739619731903, mean loss: 0.34026135717545103
Epoch: 61, step: 136, loss: 0.33576592803001404, mean loss: 0.3402613062189991
Epoch: 61, step: 137, loss: 0.3465716540813446, mean loss: 0.34026137774705173
Epoch: 61, step: 138, loss: 0.3301224708557129, mean loss: 0.3402612628234276
Epoch: 61, step: 139, loss: 0.3261418044567108, mean loss: 0.3402611027824142
Epoch: 61, step: 140, loss: 0.33455103635787964, mean loss: 0.34026103806077723
Epoch: 61, step: 141, loss: 0.3143986165523529, mean loss: 0.3402607449224562
Epoch: 61, step: 142, loss: 0.3233304023742676, mean loss: 0.34026055302720254
Epoch: 61, step: 143, loss: 0.30356529355049133, mean loss: 0.3402601371132129
Epoch: 61, step: 144, loss: 0.32977911829948425, mean loss: 0.3402600183198591
Epoch: 61, step: 145, loss: 0.30939626693725586, mean loss: 0.34025966850968814
Epoch: 61, step: 146, loss: 0.35441938042640686, mean loss: 0.34025982899423346
Epoch: 61, step: 147, loss: 0.3157106637954712, mean loss: 0.3402595507599738
Epoch: 61, step: 148, loss: 0.3152293860912323, mean loss: 0.34025926707739845
Epoch: 61, step: 149, loss: 0.35040467977523804, mean loss: 0.34025938206042877
Epoch: 61, step: 150, loss: 0.31170326471328735, mean loss: 0.34025905842335336
Epoch: 61, step: 151, loss: 0.329744815826416, mean loss: 0.3402589392628905
Epoch: 61, step: 152, loss: 0.33158159255981445, mean loss: 0.34025884092152914
Epoch: 61, step: 153, loss: 0.30265969038009644, mean loss: 0.3402584148108904
Epoch: 61, step: 154, loss: 0.32539263367652893, mean loss: 0.3402582463391134
Epoch: 61, step: 155, loss: 0.33264052867889404, mean loss: 0.34025816000958414
Epoch: 61, step: 156, loss: 0.34455034136772156, mean loss: 0.3402582086511607
Epoch: 61, step: 157, loss: 0.3164243698120117, mean loss: 0.3402579385548478
Epoch: 61, step: 158, loss: 0.3445015549659729, mean loss: 0.34025798664496726
Epoch: 61, step: 159, loss: 0.32721176743507385, mean loss: 0.34025783880240335
Epoch: 61, step: 160, loss: 0.33281731605529785, mean loss: 0.3402577544857537
Epoch: 61, step: 161, loss: 0.2939874827861786, mean loss: 0.3402572301529601
Epoch: 61, step: 162, loss: 0.3066001832485199, mean loss: 0.34025684875702705
Epoch: 61, step: 163, loss: 0.33689719438552856, mean loss: 0.3402568106864263
Epoch: 61, step: 164, loss: 0.32861387729644775, mean loss: 0.34025667875367477
Epoch: 61, step: 165, loss: 0.34332120418548584, mean loss: 0.3402567134791754
Epoch: 61, step: 166, loss: 0.36542657017707825, mean loss: 0.3402569986867844
Epoch: 61, step: 167, loss: 0.29440659284591675, mean loss: 0.3402564791472177
Epoch: 61, step: 168, loss: 0.32329103350639343, mean loss: 0.34025628691074256
Epoch: 61, step: 169, loss: 0.3256565034389496, mean loss: 0.34025612148160084
Epoch: 61, step: 170, loss: 0.36237314343452454, mean loss: 0.3402563720852148
Epoch: 61, step: 171, loss: 0.3115835189819336, mean loss: 0.3402560472024521
Epoch: 61, step: 172, loss: 0.2997616231441498, mean loss: 0.3402555883785168
Epoch: 61, step: 173, loss: 0.3291996717453003, mean loss: 0.340255463110364
Epoch: 61, step: 174, loss: 0.3091079592704773, mean loss: 0.34025511020013566
Epoch: 61, step: 175, loss: 0.31647682189941406, mean loss: 0.34025484078830354
Epoch: 61, step: 176, loss: 0.2958465814590454, mean loss: 0.3402543376412813
Epoch: 61, step: 177, loss: 0.3176595866680145, mean loss: 0.34025408164491855
Epoch: 61, step: 178, loss: 0.3301299810409546, mean loss: 0.3402539669411287
Epoch: 61, step: 179, loss: 0.34592413902282715, mean loss: 0.3402540311821792
Epoch: 61, step: 180, loss: 0.3165743947029114, mean loss: 0.3402537629032863
Epoch: 61, step: 181, loss: 0.34556737542152405, mean loss: 0.34025382310327856
Epoch: 61, step: 182, loss: 0.3123672604560852, mean loss: 0.34025350716909425
Epoch: 61, step: 183, loss: 0.3234834372997284, mean loss: 0.3402533171787255
Epoch: 61, step: 184, loss: 0.3305390179157257, mean loss: 0.3402532071253742
Epoch: 61, step: 185, loss: 0.37657877802848816, mean loss: 0.3402536186533101
Epoch: 61, step: 186, loss: 0.3525349795818329, mean loss: 0.34025375778576505
Epoch: 61, step: 187, loss: 0.3678441345691681, mean loss: 0.3402540703466766
Epoch: 61, step: 188, loss: 0.3205692172050476, mean loss: 0.3402538473469695
Epoch: 61, step: 189, loss: 0.3613326847553253, mean loss: 0.34025408613571145
Epoch: 61, step: 190, loss: 0.35336077213287354, mean loss: 0.34025423461133875
Epoch: 61, step: 191, loss: 0.3229939043521881, mean loss: 0.34025403908446555
Epoch: 61, step: 192, loss: 0.3705291748046875, mean loss: 0.34025438204056646
Epoch: 61, step: 193, loss: 0.3819660544395447, mean loss: 0.34025485454416193
Epoch: 61, step: 194, loss: 0.324261873960495, mean loss: 0.34025467338011856
Epoch: 61, step: 195, loss: 0.30770328640937805, mean loss: 0.3402543046512222
Epoch: 61, step: 196, loss: 0.3354056775569916, mean loss: 0.34025424972856505
Epoch: 61, step: 197, loss: 0.3760116696357727, mean loss: 0.3402546547649248
Epoch: 61, step: 198, loss: 0.32646888494491577, mean loss: 0.34025449861062756
Epoch: 61, step: 199, loss: 0.34651175141334534, mean loss: 0.34025456948703553
Epoch: 61, step: 200, loss: 0.3267066478729248, mean loss: 0.34025441603037115
Epoch: 61, step: 201, loss: 0.3488522469997406, mean loss: 0.34025451341649093
Epoch: 61, step: 202, loss: 0.35449206829071045, mean loss: 0.3402546746809452
Epoch: 61, step: 203, loss: 0.3233497142791748, mean loss: 0.3402544832057685
Epoch: 61, step: 204, loss: 0.29976657032966614, mean loss: 0.34025402462188065
Epoch: 61, step: 205, loss: 0.36233651638031006, mean loss: 0.34025427473505043
Epoch: 61, step: 206, loss: 0.31957677006721497, mean loss: 0.340254040537854
Epoch: 61, step: 207, loss: 0.3245951533317566, mean loss: 0.3402538631844448
Epoch: 61, step: 208, loss: 0.3680218756198883, mean loss: 0.3402541776829037
Epoch: 61, step: 209, loss: 0.4155292212963104, mean loss: 0.34025503023283477
Epoch: 61, step: 210, loss: 0.3507744371891022, mean loss: 0.34025514937216267
Epoch: 61, step: 211, loss: 0.3329446613788605, mean loss: 0.34025506657692856
Epoch: 61, step: 212, loss: 0.32076823711395264, mean loss: 0.340254845880535
Epoch: 61, step: 213, loss: 0.3159143328666687, mean loss: 0.3402545702172922
Epoch: 61, step: 214, loss: 0.3049575090408325, mean loss: 0.3402541704725479
Epoch: 61, step: 215, loss: 0.3512970805168152, mean loss: 0.3402542955338168
Epoch: 61, step: 216, loss: 0.33667901158332825, mean loss: 0.3402542550440834
Epoch: 61, step: 217, loss: 0.2926618456840515, mean loss: 0.3402537160709077
Epoch: 61, step: 218, loss: 0.3276576101779938, mean loss: 0.34025357342449825
Epoch: 61, step: 219, loss: 0.34476709365844727, mean loss: 0.34025362453792724
Epoch: 61, step: 220, loss: 0.32223063707351685, mean loss: 0.3402534204386411
Epoch: 61, step: 221, loss: 0.3572027087211609, mean loss: 0.34025361237676854
Epoch: 61, step: 222, loss: 0.34371256828308105, mean loss: 0.34025365154643694
Epoch: 61, step: 223, loss: 0.32506459951400757, mean loss: 0.34025347954557594
Epoch: 61, step: 224, loss: 0.3142768442630768, mean loss: 0.34025318538942784
Epoch: 61, step: 225, loss: 0.3105463683605194, mean loss: 0.34025284899698044
Epoch: 61, step: 226, loss: 0.3207959830760956, mean loss: 0.3402526286748697
Epoch: 61, step: 227, loss: 0.340748131275177, mean loss: 0.3402526342856882
Epoch: 61, step: 228, loss: 0.3563151955604553, mean loss: 0.34025281616787173
Epoch: 61, step: 229, loss: 0.32837483286857605, mean loss: 0.34025268167069916
Epoch: 61, step: 230, loss: 0.357423335313797, mean loss: 0.3402528760958098
Epoch: 61, step: 231, loss: 0.30271729826927185, mean loss: 0.340252451081341
Epoch: 61, step: 232, loss: 0.37836235761642456, mean loss: 0.3402528825940343
Epoch: 61, step: 233, loss: 0.3338780105113983, mean loss: 0.3402528104131416
Epoch: 61, step: 234, loss: 0.2943129241466522, mean loss: 0.34025229025455433
Epoch: 61, step: 235, loss: 0.31031671166419983, mean loss: 0.34025195131005037
Epoch: 61, step: 236, loss: 0.2971177101135254, mean loss: 0.34025146292969694
Epoch: 61, step: 237, loss: 0.31756919622421265, mean loss: 0.3402512061163695
Epoch: 61, step: 238, loss: 0.37171098589897156, mean loss: 0.3402515623064874
Epoch: 61, step: 239, loss: 0.35433635115623474, mean loss: 0.3402517217737766
Epoch: 61, step: 240, loss: 0.3076951205730438, mean loss: 0.3402513531737064
Epoch: 61, step: 241, loss: 0.34716325998306274, mean loss: 0.34025143142820463
Epoch: 61, step: 242, loss: 0.31130778789520264, mean loss: 0.340251103740821
Epoch: 61, step: 243, loss: 0.33405575156211853, mean loss: 0.3402510336005237
Epoch: 61, step: 244, loss: 0.33265918493270874, mean loss: 0.34025094765085073
Epoch: 61, step: 245, loss: 0.32992231845855713, mean loss: 0.34025083071856055
Epoch: 61, step: 246, loss: 0.3473833203315735, mean loss: 0.34025091146585895
Epoch: 61, step: 247, loss: 0.28620269894599915, mean loss: 0.34025029959006625
Epoch: 61, step: 248, loss: 0.3115099370479584, mean loss: 0.34024997422624365
Epoch: 61, step: 249, loss: 0.30047884583473206, mean loss: 0.34024952399045233
Epoch: 61, step: 250, loss: 0.3421207368373871, mean loss: 0.3402495451735943
Epoch: 61, step: 251, loss: 0.37377163767814636, mean loss: 0.340249924657525
Epoch: 61, step: 252, loss: 0.3505445122718811, mean loss: 0.3402500411951889
Epoch: 61, step: 253, loss: 0.3510728180408478, mean loss: 0.3402501637107184
Epoch: 61, step: 254, loss: 0.3434068560600281, mean loss: 0.34025019944456586
Epoch: 61, step: 255, loss: 0.33354419469833374, mean loss: 0.3402501235332602
Epoch: 61, step: 256, loss: 0.3595414459705353, mean loss: 0.3402503419066365
Epoch: 61, step: 257, loss: 0.3811626732349396, mean loss: 0.34025080501966687
Epoch: 61, step: 258, loss: 0.3284952938556671, mean loss: 0.34025067195297043
Epoch: 61, step: 259, loss: 0.334771990776062, mean loss: 0.34025060993765327
Epoch: 61, step: 260, loss: 0.3542992174625397, mean loss: 0.34025076895749057
Epoch: 61, step: 261, loss: 0.33507347106933594, mean loss: 0.34025071035497445
Epoch: 61, step: 262, loss: 0.29777806997299194, mean loss: 0.3402502296070104
Epoch: 61, step: 263, loss: 0.3087100088596344, mean loss: 0.34024987260718303
Epoch: 61, step: 264, loss: 0.3332879841327667, mean loss: 0.34024979380732706
Epoch: 61, step: 265, loss: 0.3048231303691864, mean loss: 0.3402493928264166
Epoch: 61, step: 266, loss: 0.3375093340873718, mean loss: 0.34024936181308635
Epoch: 61, step: 267, loss: 0.2954007685184479, mean loss: 0.3402488542004313
Epoch: 61, step: 268, loss: 0.34540486335754395, mean loss: 0.3402489125573536
Epoch: 61, step: 269, loss: 0.3413061499595642, mean loss: 0.3402489245232794
Epoch: 61, step: 270, loss: 0.32565340399742126, mean loss: 0.3402487593314903
Epoch: 61, step: 271, loss: 0.35930952429771423, mean loss: 0.34024897505837887
Epoch: 61, step: 272, loss: 0.3386550843715668, mean loss: 0.3402489570191665
Epoch: 61, step: 273, loss: 0.3132929801940918, mean loss: 0.340248651942356
Epoch: 61, step: 274, loss: 0.35529106855392456, mean loss: 0.3402488221843982
Epoch: 61, step: 275, loss: 0.3537522852420807, mean loss: 0.340248975007656
Epoch: 61, step: 276, loss: 0.297438383102417, mean loss: 0.3402484905111937
Epoch: 61, step: 277, loss: 0.32135438919067383, mean loss: 0.34024827668509966
Epoch: 61, step: 278, loss: 0.30020105838775635, mean loss: 0.3402478234725752
Epoch: 61, step: 279, loss: 0.328258752822876, mean loss: 0.3402476877943505
Epoch: 61, step: 280, loss: 0.3444128632545471, mean loss: 0.3402477349303824
Epoch: 61, step: 281, loss: 0.29071173071861267, mean loss: 0.34024717435273705
Epoch: 61, step: 282, loss: 0.31205442547798157, mean loss: 0.34024685531113924
Epoch: 61, step: 283, loss: 0.33905529975891113, mean loss: 0.34024684182712295
Epoch: 61, step: 284, loss: 0.3433923125267029, mean loss: 0.340246877421853
Epoch: 61, step: 285, loss: 0.37474721670150757, mean loss: 0.34024726782967557
Epoch: 61, step: 286, loss: 0.3307424485683441, mean loss: 0.3402471602738115
Epoch: 61, step: 287, loss: 0.3413172662258148, mean loss: 0.34024717238291796
Epoch: 61, step: 288, loss: 0.38505494594573975, mean loss: 0.3402476794130467
Epoch: 61, step: 289, loss: 0.3099520802497864, mean loss: 0.34024733660182205
Epoch: 61, step: 290, loss: 0.3409107029438019, mean loss: 0.340247344108089
Epoch: 61, step: 291, loss: 0.3340631127357483, mean loss: 0.3402472741317224
Epoch: 61, step: 292, loss: 0.3507165014743805, mean loss: 0.34024739259271725
Epoch: 61, step: 293, loss: 0.31729376316070557, mean loss: 0.3402471328716392
Epoch: 61, step: 294, loss: 0.3030158579349518, mean loss: 0.3402467116032956
Epoch: 61, step: 295, loss: 0.31387436389923096, mean loss: 0.34024641320605975
Epoch: 61, step: 296, loss: 0.3343809247016907, mean loss: 0.3402463468401157
Epoch: 61, step: 297, loss: 0.32552945613861084, mean loss: 0.34024618032554593
Epoch: 61, step: 298, loss: 0.3681817948818207, mean loss: 0.3402464964000688
Epoch: 61, step: 299, loss: 0.36536526679992676, mean loss: 0.34024678060049424
Epoch: 61, step: 300, loss: 0.2941570281982422, mean loss: 0.3402462591347206
Epoch: 61, step: 301, loss: 0.3529508411884308, mean loss: 0.3402464028744764
Epoch: 61, step: 302, loss: 0.3627247214317322, mean loss: 0.34024665719149766
Epoch: 61, step: 303, loss: 0.3056815266609192, mean loss: 0.34024626613014847
Epoch: 61, step: 304, loss: 0.31858447194099426, mean loss: 0.34024602105673224
Epoch: 61, step: 305, loss: 0.3975558578968048, mean loss: 0.34024666943139953
Epoch: 61, step: 306, loss: 0.343099445104599, mean loss: 0.34024670170590343
Epoch: 61, step: 307, loss: 0.3586091995239258, mean loss: 0.3402469094452669
Epoch: 61, step: 308, loss: 0.30807259678840637, mean loss: 0.3402465454536312
Epoch: 61, step: 309, loss: 0.3056417405605316, mean loss: 0.34024615396999097
Epoch: 61, step: 310, loss: 0.3134137988090515, mean loss: 0.34024585041939237
Epoch: 61, step: 311, loss: 0.32896074652671814, mean loss: 0.34024572275406934
Epoch: 61, step: 312, loss: 0.3817930519580841, mean loss: 0.3402461927624317
Epoch: 61, step: 313, loss: 0.3559168875217438, mean loss: 0.3402463700367451
Epoch: 61, step: 314, loss: 0.3485170006752014, mean loss: 0.34024646359697364
Epoch: 61, step: 315, loss: 0.29568472504615784, mean loss: 0.3402459595049086
Epoch: 61, step: 316, loss: 0.3429776430130005, mean loss: 0.3402459904059562
Epoch: 61, step: 317, loss: 0.3480842113494873, mean loss: 0.3402460790716079
Epoch: 61, step: 318, loss: 0.3436298668384552, mean loss: 0.3402461173484511
Epoch: 61, step: 319, loss: 0.31129029393196106, mean loss: 0.3402457898087084
Epoch: 61, step: 320, loss: 0.3320494592189789, mean loss: 0.3402456970952805
Epoch: 61, step: 321, loss: 0.35651683807373047, mean loss: 0.34024588114546916
Epoch: 61, step: 322, loss: 0.33048200607299805, mean loss: 0.3402457707031391
Epoch: 61, step: 323, loss: 0.29494020342826843, mean loss: 0.3402452582430984
Epoch: 61, step: 324, loss: 0.3076727092266083, mean loss: 0.3402448898128592
Epoch: 61, step: 325, loss: 0.3436915874481201, mean loss: 0.34024492879824136
Epoch: 61, step: 326, loss: 0.325817346572876, mean loss: 0.3402447656106038
Epoch: 61, step: 327, loss: 0.334235817193985, mean loss: 0.34024469764530024
Epoch: 61, step: 328, loss: 0.34896230697631836, mean loss: 0.3402447962462903
Epoch: 61, step: 329, loss: 0.3420666754245758, mean loss: 0.34024481685251984
Epoch: 61, step: 330, loss: 0.3123384118080139, mean loss: 0.34024450122276195
Epoch: 61, step: 331, loss: 0.3092135488986969, mean loss: 0.34024415025741267
Epoch: 61, step: 332, loss: 0.3481210172176361, mean loss: 0.3402442393451103
Epoch: 61, step: 333, loss: 0.31591033935546875, mean loss: 0.3402439641307875
Epoch: 61, step: 334, loss: 0.32970932126045227, mean loss: 0.3402438449862273
Epoch: 61, step: 335, loss: 0.33072295784950256, mean loss: 0.34024373730824564
Epoch: 61, step: 336, loss: 0.3663668930530548, mean loss: 0.3402440327488734
Epoch: 61, step: 337, loss: 0.3285229504108429, mean loss: 0.3402439001904339
Epoch: 61, step: 338, loss: 0.3242020905017853, mean loss: 0.34024371876920084
Epoch: 61, step: 339, loss: 0.3341941237449646, mean loss: 0.3402436503534424
Epoch: 61, step: 340, loss: 0.3239840269088745, mean loss: 0.34024346647305287
Epoch: 61, step: 341, loss: 0.34416019916534424, mean loss: 0.34024351076695614
Epoch: 61, step: 342, loss: 0.358188271522522, mean loss: 0.3402437137000055
Epoch: 61, step: 343, loss: 0.3115689754486084, mean loss: 0.34024338942784904
Epoch: 61, step: 344, loss: 0.3652607798576355, mean loss: 0.3402436723371936
Epoch: 61, step: 345, loss: 0.331875205039978, mean loss: 0.3402435777033895
Epoch: 61, step: 346, loss: 0.36561185121536255, mean loss: 0.3402438645742098
Epoch: 61, step: 347, loss: 0.33891981840133667, mean loss: 0.3402438496017318
Epoch: 61, step: 348, loss: 0.3009340167045593, mean loss: 0.34024340508630324
Epoch: 61, step: 349, loss: 0.3324386477470398, mean loss: 0.34024331683113734
Epoch: 61, step: 350, loss: 0.36619651317596436, mean loss: 0.3402436103031376
Epoch: 61, step: 351, loss: 0.33975550532341003, mean loss: 0.34024360478383575
Epoch: 61, step: 352, loss: 0.2962997257709503, mean loss: 0.3402431078891083
Epoch: 61, step: 353, loss: 0.3071655035018921, mean loss: 0.34024273386884113
Epoch: 61, step: 354, loss: 0.33120691776275635, mean loss: 0.3402426316988018
Epoch: 61, step: 355, loss: 0.3151100277900696, mean loss: 0.34024234752191457
Epoch: 61, step: 356, loss: 0.3192293643951416, mean loss: 0.3402421099286815
Epoch: 61, step: 357, loss: 0.33000361919403076, mean loss: 0.34024199416365203
Epoch: 61, step: 358, loss: 0.3295671045780182, mean loss: 0.34024187346569307
Epoch: 61, step: 359, loss: 0.32648468017578125, mean loss: 0.3402417179187561
Epoch: 61, step: 360, loss: 0.3092420697212219, mean loss: 0.34024136742242284
Epoch: 61, step: 361, loss: 0.2922024726867676, mean loss: 0.34024082427864316
Epoch: 61, step: 362, loss: 0.35653916001319885, mean loss: 0.34024100855098405
Epoch: 61, step: 363, loss: 0.3065604567527771, mean loss: 0.34024062775603336
Epoch: 61, step: 364, loss: 0.3762008845806122, mean loss: 0.3402410343209106
Epoch: 61, step: 365, loss: 0.3435877859592438, mean loss: 0.34024107215869054
Epoch: 61, step: 366, loss: 0.3700640797615051, mean loss: 0.3402414093285089
Epoch: 61, step: 367, loss: 0.3235737383365631, mean loss: 0.3402412208910401
Epoch: 61, step: 368, loss: 0.3425787389278412, mean loss: 0.3402412473177078
Epoch: 61, step: 369, loss: 0.31513360142707825, mean loss: 0.34024096346795657
Epoch: 61, step: 370, loss: 0.34536680579185486, mean loss: 0.3402410214165443
Epoch: 61, step: 371, loss: 0.3585924208164215, mean loss: 0.3402412288801352
Epoch: 61, step: 372, loss: 0.316986083984375, mean loss: 0.3402409659824007
Epoch: 61, step: 373, loss: 0.3330032527446747, mean loss: 0.3402408841615
Epoch: 61, step: 374, loss: 0.3397115468978882, mean loss: 0.34024087817751575
Epoch: 61, step: 375, loss: 0.34391942620277405, mean loss: 0.3402409197618253
Epoch: 61, step: 376, loss: 0.35475578904151917, mean loss: 0.34024108384395507
Epoch: 61, step: 377, loss: 0.32346078753471375, mean loss: 0.34024089415463865
Epoch: 61, step: 378, loss: 0.329603374004364, mean loss: 0.34024077390639756
Epoch: 61, step: 379, loss: 0.36067062616348267, mean loss: 0.34024100484612735
Epoch: 61, step: 380, loss: 0.3904998302459717, mean loss: 0.3402415729671402
Epoch: 61, step: 381, loss: 0.3258112967014313, mean loss: 0.34024140985050483
Epoch: 61, step: 382, loss: 0.32187986373901367, mean loss: 0.3402412022980151
Epoch: 61, step: 383, loss: 0.3074035942554474, mean loss: 0.3402408311173843
Epoch: 61, step: 384, loss: 0.3617594540119171, mean loss: 0.34024107435086604
Epoch: 61, step: 385, loss: 0.33940279483795166, mean loss: 0.34024106487556915
Epoch: 61, step: 386, loss: 0.3601970672607422, mean loss: 0.3402412904410356
Epoch: 61, step: 387, loss: 0.3480886220932007, mean loss: 0.3402413791395126
Epoch: 61, step: 388, loss: 0.3162011504173279, mean loss: 0.34024110741561125
Epoch: 61, step: 389, loss: 0.3272840678691864, mean loss: 0.34024096096535983
Epoch: 61, step: 390, loss: 0.3096109926700592, mean loss: 0.3402406147662268
Epoch: 61, step: 391, loss: 0.3234390616416931, mean loss: 0.3402404248666707
Epoch: 61, step: 392, loss: 0.34828075766563416, mean loss: 0.340240515741506
Epoch: 61, step: 393, loss: 0.3697845935821533, mean loss: 0.340240849655901
Epoch: 61, step: 394, loss: 0.3679700195789337, mean loss: 0.34024116305422064
Epoch: 61, step: 395, loss: 0.30022764205932617, mean loss: 0.3402407108218405
Epoch: 61, step: 396, loss: 0.3182871639728546, mean loss: 0.3402404627058964
Epoch: 61, step: 397, loss: 0.3773578107357025, mean loss: 0.34024088219627896
Epoch: 61, step: 398, loss: 0.30441123247146606, mean loss: 0.34024047726369616
Epoch: 61, step: 399, loss: 0.3367948532104492, mean loss: 0.3402404383230509
Epoch: 61, step: 400, loss: 0.3162493407726288, mean loss: 0.34024016719124833
Epoch: 61, step: 401, loss: 0.3532620072364807, mean loss: 0.34024031435396385
Epoch: 61, step: 402, loss: 0.38345083594322205, mean loss: 0.3402408026801766
Epoch: 61, step: 403, loss: 0.335109144449234, mean loss: 0.3402407446874744
Epoch: 61, step: 404, loss: 0.32332465052604675, mean loss: 0.34024055352140675
Epoch: 61, step: 405, loss: 0.3435581624507904, mean loss: 0.3402405910127496
Epoch: 61, step: 406, loss: 0.2987535893917084, mean loss: 0.3402401221853929
Epoch: 61, step: 407, loss: 0.33029600977897644, mean loss: 0.34024000981238284
Epoch: 61, step: 408, loss: 0.32770460844039917, mean loss: 0.3402398681582252
Epoch: 61, step: 409, loss: 0.34348955750465393, mean loss: 0.3402399048803685
Epoch: 61, step: 410, loss: 0.33831992745399475, mean loss: 0.34023988318448256
Epoch: 61, step: 411, loss: 0.3392843008041382, mean loss: 0.3402398723864535
Epoch: 61, step: 412, loss: 0.35824623703956604, mean loss: 0.3402400758550982
Epoch: 61, step: 413, loss: 0.32102468609809875, mean loss: 0.34023985872714324
Epoch: 61, step: 414, loss: 0.36617881059646606, mean loss: 0.34024015182595646
Epoch: 61, step: 415, loss: 0.34309500455856323, mean loss: 0.34024018408417944
Epoch: 61, step: 416, loss: 0.3569127321243286, mean loss: 0.3402403724724241
Epoch: 61, step: 417, loss: 0.3127233386039734, mean loss: 0.3402400615525142
Epoch: 61, step: 418, loss: 0.3417266607284546, mean loss: 0.34024007834967557
Epoch: 61, step: 419, loss: 0.30909639596939087, mean loss: 0.34023972645956463
Epoch: 61, step: 420, loss: 0.30906322598457336, mean loss: 0.3402393742026246
Epoch: 61, step: 421, loss: 0.2871319651603699, mean loss: 0.34023877415958753
Epoch: 61, step: 422, loss: 0.3664076030254364, mean loss: 0.3402390698291828
Epoch: 61, step: 423, loss: 0.29708755016326904, mean loss: 0.3402385822854617
Epoch: 61, step: 424, loss: 0.30178889632225037, mean loss: 0.3402381478699112
Epoch: 61, step: 425, loss: 0.35357534885406494, mean loss: 0.3402382985557205
Epoch: 61, step: 426, loss: 0.31624364852905273, mean loss: 0.34023802746342663
Epoch: 61, step: 427, loss: 0.3279217481613159, mean loss: 0.3402378883152964
Epoch: 61, step: 428, loss: 0.35125401616096497, mean loss: 0.34023801277303534
Epoch: 61, step: 429, loss: 0.33244359493255615, mean loss: 0.3402379247144475
Epoch: 61, step: 430, loss: 0.38620784878730774, mean loss: 0.34023844406059306
Epoch: 61, step: 431, loss: 0.3399936556816101, mean loss: 0.34023844129512265
Epoch: 61, step: 432, loss: 0.3649183511734009, mean loss: 0.340238720110603
Epoch: 61, step: 433, loss: 0.34536805748939514, mean loss: 0.3402387780574317
Epoch: 61, step: 434, loss: 0.38464900851249695, mean loss: 0.3402392797602351
Epoch: 61, step: 435, loss: 0.3322213590145111, mean loss: 0.34023918918273005
Epoch: 61, step: 436, loss: 0.33317020535469055, mean loss: 0.3402391093261556
Epoch: 61, step: 437, loss: 0.32177427411079407, mean loss: 0.3402389007358027
Epoch: 61, step: 438, loss: 0.3833017945289612, mean loss: 0.34023938719574864
Epoch: 61, step: 439, loss: 0.3372660279273987, mean loss: 0.34023935360757745
Epoch: 61, step: 440, loss: 0.3468906879425049, mean loss: 0.34023942874267304
Epoch: 61, step: 441, loss: 0.34268394112586975, mean loss: 0.3402394563561695
Epoch: 61, step: 442, loss: 0.3193403482437134, mean loss: 0.3402392202800784
Epoch: 61, step: 443, loss: 0.365862101316452, mean loss: 0.34023950971258604
Epoch: 61, step: 444, loss: 0.31013163924217224, mean loss: 0.3402391696221019
Epoch: 61, step: 445, loss: 0.3665955066680908, mean loss: 0.340239467332901
Epoch: 61, step: 446, loss: 0.33916038274765015, mean loss: 0.34023945514412435
Epoch: 61, step: 447, loss: 0.32326769828796387, mean loss: 0.3402392634421764
Epoch: 61, step: 448, loss: 0.3513960838317871, mean loss: 0.3402393894609535
Epoch: 61, step: 449, loss: 0.29702869057655334, mean loss: 0.34023890139197566
Epoch: 61, step: 450, loss: 0.2959708869457245, mean loss: 0.340238401386165
Epoch: 61, step: 451, loss: 0.3869670033454895, mean loss: 0.3402389291782717
Epoch: 61, step: 452, loss: 0.32872095704078674, mean loss: 0.3402387990860827
Epoch: 61, step: 453, loss: 0.373831182718277, mean loss: 0.34023917849812757
Epoch: 61, step: 454, loss: 0.3011440336704254, mean loss: 0.3402387369396638
Epoch: 61, step: 455, loss: 0.350870281457901, mean loss: 0.3402388570158386
Epoch: 61, step: 456, loss: 0.33735108375549316, mean loss: 0.3402388244007421
Epoch: 61, step: 457, loss: 0.31769517064094543, mean loss: 0.34023856979102285
Epoch: 61, step: 458, loss: 0.3197714686393738, mean loss: 0.3402383386366555
Epoch: 61, step: 459, loss: 0.30299922823905945, mean loss: 0.3402379180648449
Epoch: 61, step: 460, loss: 0.3201163709163666, mean loss: 0.3402376908182793
Epoch: 61, step: 461, loss: 0.34822413325309753, mean loss: 0.34023778101368546
Epoch: 61, step: 462, loss: 0.3070319890975952, mean loss: 0.3402374060061537
Epoch: 61, step: 463, loss: 0.30679163336753845, mean loss: 0.3402370282926804
Epoch: 61, step: 464, loss: 0.33829519152641296, mean loss: 0.3402370063631638
Epoch: 61, step: 465, loss: 0.3680412471294403, mean loss: 0.34023732035797766
Epoch: 61, step: 466, loss: 0.3326798677444458, mean loss: 0.3402372350122152
Epoch: 61, step: 467, loss: 0.3026294708251953, mean loss: 0.34023681031526665
Epoch: 61, step: 468, loss: 0.34117183089256287, mean loss: 0.3402368208741475
Epoch: 61, step: 469, loss: 0.3454219400882721, mean loss: 0.3402368794273378
Epoch: 61, step: 470, loss: 0.3230731189250946, mean loss: 0.3402366856069945
Epoch: 61, step: 471, loss: 0.2971028685569763, mean loss: 0.34023619852743975
Epoch: 61, step: 472, loss: 0.3064582347869873, mean loss: 0.34023581710119744
Epoch: 61, step: 473, loss: 0.32985737919807434, mean loss: 0.34023569990751756
Epoch: 61, step: 474, loss: 0.3052979111671448, mean loss: 0.3402353053932532
Epoch: 61, step: 475, loss: 0.3258309066295624, mean loss: 0.3402351427419573
Epoch: 61, step: 476, loss: 0.33551546931266785, mean loss: 0.340235089449047
Epoch: 61, step: 477, loss: 0.3190779685974121, mean loss: 0.3402348505528968
Epoch: 61, step: 478, loss: 0.3085389733314514, mean loss: 0.34023449266216116
Epoch: 61, step: 479, loss: 0.32475560903549194, mean loss: 0.3402343178859132
Epoch: 61, step: 480, loss: 0.3310874402523041, mean loss: 0.3402342146072181
Epoch: 61, step: 481, loss: 0.2972961366176605, mean loss: 0.3402337297927522
Epoch: 61, step: 482, loss: 0.3318476676940918, mean loss: 0.3402336351066716
Epoch: 61, step: 483, loss: 0.3330053985118866, mean loss: 0.34023355349438955
Epoch: 61, step: 484, loss: 0.31855252385139465, mean loss: 0.34023330870185897
Epoch: 61, step: 485, loss: 0.36037367582321167, mean loss: 0.3402335360967683
Epoch: 61, step: 486, loss: 0.3453291952610016, mean loss: 0.34023359362868244
Epoch: 61, step: 487, loss: 0.2937171459197998, mean loss: 0.3402330684463708
Epoch: 61, step: 488, loss: 0.33564260601997375, mean loss: 0.34023301661948874
Epoch: 61, step: 489, loss: 0.3462402820587158, mean loss: 0.34023308444148437
Epoch: 61, step: 490, loss: 0.35283857583999634, mean loss: 0.3402332267558101
Epoch: 61, step: 491, loss: 0.30885690450668335, mean loss: 0.3402328725252934
Epoch: 61, step: 492, loss: 0.32608821988105774, mean loss: 0.3402327128376471
Epoch: 61, step: 493, loss: 0.3714474141597748, mean loss: 0.34023306523554864
Epoch: 61, step: 494, loss: 0.3243236243724823, mean loss: 0.34023288562818277
Epoch: 61, step: 495, loss: 0.308201402425766, mean loss: 0.3402325240173993
Epoch: 61, step: 496, loss: 0.333851158618927, mean loss: 0.3402324519775104
Epoch: 61, step: 497, loss: 0.31352776288986206, mean loss: 0.3402321505089379
Epoch: 61, step: 498, loss: 0.311831533908844, mean loss: 0.34023182989870115
Epoch: 61, step: 499, loss: 0.3403221666812897, mean loss: 0.34023183091848785
Epoch: 61, step: 500, loss: 0.3224392831325531, mean loss: 0.34023163006565965
Epoch: 61, step: 501, loss: 0.33773571252822876, mean loss: 0.34023160189058077
Epoch: 61, step: 502, loss: 0.3128046691417694, mean loss: 0.3402312922860931
Epoch: 61, step: 503, loss: 0.3115023672580719, mean loss: 0.3402309679879373
Epoch: 61, step: 504, loss: 0.3205178380012512, mean loss: 0.34023074546448645
Epoch: 61, step: 505, loss: 0.33518555760383606, mean loss: 0.3402306885146291
Epoch: 61, step: 506, loss: 0.32729002833366394, mean loss: 0.3402305424426785
Epoch: 61, step: 507, loss: 0.36042436957359314, mean loss: 0.34023077038455957
Epoch: 61, step: 508, loss: 0.33027249574661255, mean loss: 0.34023065797980256
Epoch: 61, step: 509, loss: 0.33761027455329895, mean loss: 0.34023062840236584
Epoch: 61, step: 510, loss: 0.3069024085998535, mean loss: 0.3402302522161273
Epoch: 61, step: 511, loss: 0.3398458957672119, mean loss: 0.3402302478778225
Epoch: 61, step: 512, loss: 0.2971438467502594, mean loss: 0.3402297615588599
Epoch: 61, step: 513, loss: 0.30785998702049255, mean loss: 0.3402293962032702
Epoch: 61, step: 514, loss: 0.3344111740589142, mean loss: 0.34022933053410753
Epoch: 61, step: 515, loss: 0.3267042338848114, mean loss: 0.3402291778806465
Epoch: 61, step: 516, loss: 0.3391254246234894, mean loss: 0.3402291654230754
Epoch: 61, step: 517, loss: 0.34150224924087524, mean loss: 0.3402291797916429
Epoch: 61, step: 518, loss: 0.34663328528404236, mean loss: 0.3402292520702959
Epoch: 61, step: 519, loss: 0.35708844661712646, mean loss: 0.34022944234606844
Epoch: 61, step: 520, loss: 0.3701327443122864, mean loss: 0.3402297798360743
Epoch: 61, step: 521, loss: 0.329942911863327, mean loss: 0.3402296637393317
Epoch: 61, step: 522, loss: 0.33469316363334656, mean loss: 0.34022960125555385
Epoch: 61, step: 523, loss: 0.32648342847824097, mean loss: 0.34022944612088457
Epoch: 61, step: 524, loss: 0.33054155111312866, mean loss: 0.3402293367878032
Epoch: 61, step: 525, loss: 0.30129390954971313, mean loss: 0.34022889738562245
Epoch: 61, step: 526, loss: 0.3122428059577942, mean loss: 0.34022858155472757
Epoch: 61, step: 527, loss: 0.3212178945541382, mean loss: 0.34022836701621134
Epoch: 61, step: 528, loss: 0.37334007024765015, mean loss: 0.34022874068263986
Epoch: 61, step: 529, loss: 0.3360927700996399, mean loss: 0.3402286940086314
Epoch: 61, step: 530, loss: 0.33174023032188416, mean loss: 0.34022859821826085
Epoch: 61, step: 531, loss: 0.33088475465774536, mean loss: 0.340228492776314
Epoch: 61, step: 532, loss: 0.3644159138202667, mean loss: 0.3402287657196662
Epoch: 61, step: 533, loss: 0.36110976338386536, mean loss: 0.3402290013489702
Epoch: 61, step: 534, loss: 0.3446679711341858, mean loss: 0.3402290514394676
Epoch: 61, step: 535, loss: 0.3085314929485321, mean loss: 0.340228693759954
Epoch: 61, step: 536, loss: 0.3215668797492981, mean loss: 0.3402284831799108
Epoch: 61, step: 537, loss: 0.30580782890319824, mean loss: 0.3402280947813836
Epoch: 61, step: 538, loss: 0.34239253401756287, mean loss: 0.3402281192043803
Epoch: 61, step: 539, loss: 0.3582659959793091, mean loss: 0.34022832273702125
Epoch: 61, step: 540, loss: 0.30763596296310425, mean loss: 0.3402279549811987
Epoch: 61, step: 541, loss: 0.3078487515449524, mean loss: 0.3402275896346476
Epoch: 61, step: 542, loss: 0.3230372369289398, mean loss: 0.3402273956717164
Epoch: 61, step: 543, loss: 0.30037251114845276, mean loss: 0.3402269459844333
Epoch: 61, step: 544, loss: 0.3483069837093353, mean loss: 0.3402270371514072
Epoch: 61, step: 545, loss: 0.32200080156326294, mean loss: 0.3402268315073184
Epoch: 61, step: 546, loss: 0.34424862265586853, mean loss: 0.3402268768841183
Epoch: 61, step: 547, loss: 0.36053648591041565, mean loss: 0.34022710602944983
Epoch: 61, step: 548, loss: 0.3967157006263733, mean loss: 0.3402277433608568
Epoch: 61, step: 549, loss: 0.3091394305229187, mean loss: 0.3402273926115638
Epoch: 61, step: 550, loss: 0.3026784360408783, mean loss: 0.34022696897579274
Epoch: 61, step: 551, loss: 0.39068880677223206, mean loss: 0.3402275382911702
Epoch: 61, step: 552, loss: 0.3377155661582947, mean loss: 0.34022750995117523
Epoch: 61, step: 553, loss: 0.3456859886646271, mean loss: 0.3402275715328751
Epoch: 61, step: 554, loss: 0.3237299621105194, mean loss: 0.34022738541153547
Epoch: 61, step: 555, loss: 0.3335774540901184, mean loss: 0.3402273103897471
Epoch: 61, step: 556, loss: 0.36933013796806335, mean loss: 0.3402276387121665
Epoch: 61, step: 557, loss: 0.30092084407806396, mean loss: 0.3402271952790915
Epoch: 61, step: 558, loss: 0.3678838610649109, mean loss: 0.3402275072796532
Epoch: 61, step: 559, loss: 0.33189669251441956, mean loss: 0.3402274132990706
Epoch: 61, step: 560, loss: 0.3288475275039673, mean loss: 0.3402272849231239
Epoch: 61, step: 561, loss: 0.3239467740058899, mean loss: 0.3402271012655317
Epoch: 61, step: 562, loss: 0.3538750112056732, mean loss: 0.3402272552234766
Epoch: 61, step: 563, loss: 0.31034451723098755, mean loss: 0.3402269181291485
Epoch: 61, step: 564, loss: 0.3167646527290344, mean loss: 0.3402266534643988
Epoch: 61, step: 565, loss: 0.3323555886745453, mean loss: 0.3402265646763019
Epoch: 61, step: 566, loss: 0.35069483518600464, mean loss: 0.3402266827603676
Epoch: 61, step: 567, loss: 0.32241925597190857, mean loss: 0.34022648189150073
Epoch: 61, step: 568, loss: 0.4671419560909271, mean loss: 0.34022791348968917
Epoch: 61, step: 569, loss: 0.3126160204410553, mean loss: 0.3402276020328677
Epoch: 61, step: 570, loss: 0.3212910294532776, mean loss: 0.3402273884343952
Epoch: 61, step: 571, loss: 0.3436412513256073, mean loss: 0.34022742694124064
Epoch: 61, step: 572, loss: 0.30149489641189575, mean loss: 0.34022699006055973
Epoch: 61, step: 573, loss: 0.3089107871055603, mean loss: 0.3402266368357751
Epoch: 61, step: 574, loss: 0.31475648283958435, mean loss: 0.340226349553559
Epoch: 61, step: 575, loss: 0.3049885332584381, mean loss: 0.34022595210469486
Epoch: 61, step: 576, loss: 0.331298828125, mean loss: 0.3402258514164105
Epoch: 61, step: 577, loss: 0.352594256401062, mean loss: 0.3402259909170419
Epoch: 61, step: 578, loss: 0.331066757440567, mean loss: 0.34022588761314426
Epoch: 61, step: 579, loss: 0.3382554054260254, mean loss: 0.3402258653889926
Epoch: 61, step: 580, loss: 0.3194739520549774, mean loss: 0.3402256313404578
Epoch: 61, step: 581, loss: 0.3292143940925598, mean loss: 0.34022550715263783
Epoch: 61, step: 582, loss: 0.355168879032135, mean loss: 0.34022567568627354
Epoch: 61, step: 583, loss: 0.3183042109012604, mean loss: 0.3402254284554261
Epoch: 61, step: 584, loss: 0.2909320294857025, mean loss: 0.3402248725294658
Epoch: 61, step: 585, loss: 0.35222968459129333, mean loss: 0.3402250079169933
Epoch: 61, step: 586, loss: 0.34581345319747925, mean loss: 0.3402250709414915
Epoch: 61, step: 587, loss: 0.32676345109939575, mean loss: 0.340224919127843
Epoch: 61, step: 588, loss: 0.37956157326698303, mean loss: 0.34022536274263143
Epoch: 61, step: 589, loss: 0.36717092990875244, mean loss: 0.3402256666148732
Epoch: 61, step: 590, loss: 0.3080546259880066, mean loss: 0.3402253038176854
Epoch: 61, step: 591, loss: 0.3238409757614136, mean loss: 0.34022511905147973
Epoch: 61, step: 592, loss: 0.3143996596336365, mean loss: 0.34022482782084024
Epoch: 61, step: 593, loss: 0.3878632187843323, mean loss: 0.3402253650272608
Epoch: 61, step: 594, loss: 0.36768248677253723, mean loss: 0.34022567465097947
Epoch: 61, step: 595, loss: 0.2905491888523102, mean loss: 0.3402251144740986
Epoch: 61, step: 596, loss: 0.32028454542160034, mean loss: 0.34022488961681174
Epoch: 61, step: 597, loss: 0.3403419852256775, mean loss: 0.3402248909372106
Epoch: 61, step: 598, loss: 0.41251271963119507, mean loss: 0.34022570606331926
Epoch: 61, step: 599, loss: 0.30212920904159546, mean loss: 0.34022527648755563
Epoch: 61, step: 600, loss: 0.36345672607421875, mean loss: 0.340225538442222
Epoch: 61, step: 601, loss: 0.3299805819988251, mean loss: 0.3402254229227889
Epoch: 61, step: 602, loss: 0.34348875284194946, mean loss: 0.3402254597188235
Epoch: 61, step: 603, loss: 0.30681470036506653, mean loss: 0.3402250829963881
Epoch: 61, step: 604, loss: 0.2889736592769623, mean loss: 0.34022450511836805
Epoch: 61, step: 605, loss: 0.29416584968566895, mean loss: 0.34022398579651175
Epoch: 61, step: 606, loss: 0.35720473527908325, mean loss: 0.34022417725618054
Epoch: 61, step: 607, loss: 0.404387503862381, mean loss: 0.3402249006960241
Epoch: 61, step: 608, loss: 0.36355555057525635, mean loss: 0.34022516374553063
Epoch: 61, step: 609, loss: 0.3150124251842499, mean loss: 0.3402248794789674
Epoch: 61, step: 610, loss: 0.32225868105888367, mean loss: 0.3402246769173978
Epoch: 61, step: 611, loss: 0.36272454261779785, mean loss: 0.3402249305913594
Epoch: 61, step: 612, loss: 0.3145788013935089, mean loss: 0.3402246414482182
Epoch: 61, step: 613, loss: 0.31659457087516785, mean loss: 0.3402243750378079
Epoch: 61, step: 614, loss: 0.3309558629989624, mean loss: 0.3402242705438222
Epoch: 61, step: 615, loss: 0.3196825087070465, mean loss: 0.3402240389568793
Epoch: 61, step: 616, loss: 0.3252417743206024, mean loss: 0.34022387004937393
Epoch: 61, step: 617, loss: 0.33034342527389526, mean loss: 0.3402237586601744
Epoch: 61, step: 618, loss: 0.34166646003723145, mean loss: 0.34022377492457784
Epoch: 61, step: 619, loss: 0.32578331232070923, mean loss: 0.3402236121307624
Epoch: 61, step: 620, loss: 0.3531883955001831, mean loss: 0.3402237582869359
Epoch: 61, step: 621, loss: 0.3068903684616089, mean loss: 0.3402233825131458
Epoch: 61, step: 622, loss: 0.3261031210422516, mean loss: 0.34022322333448496
Epoch: 61, step: 623, loss: 0.3315846621990204, mean loss: 0.34022312595249987
Epoch: 61, step: 624, loss: 0.32620272040367126, mean loss: 0.3402229679030849
Epoch: 61, step: 625, loss: 0.31394580006599426, mean loss: 0.34022267168881554
Epoch: 61, step: 626, loss: 0.3020153343677521, mean loss: 0.34022224099434334
Epoch: 61, step: 627, loss: 0.3196501135826111, mean loss: 0.34022200909643313
Epoch: 61, step: 628, loss: 0.3431534171104431, mean loss: 0.34022204214015855
Epoch: 61, step: 629, loss: 0.3289043605327606, mean loss: 0.3402219145652368
Epoch: 61, step: 630, loss: 0.32086026668548584, mean loss: 0.34022169631975546
Epoch: 61, step: 631, loss: 0.3226390480995178, mean loss: 0.3402214981294829
Epoch: 61, step: 632, loss: 0.34503281116485596, mean loss: 0.34022155236162593
Epoch: 61, step: 633, loss: 0.37053734064102173, mean loss: 0.3402218940711807
Epoch: 61, step: 634, loss: 0.3945702314376831, mean loss: 0.34022250666078796
Epoch: 61, step: 635, loss: 0.314042866230011, mean loss: 0.34022221157917804
Epoch: 61, step: 636, loss: 0.32217341661453247, mean loss: 0.3402220081460003
Epoch: 61, step: 637, loss: 0.365739107131958, mean loss: 0.34022229575334667
Epoch: 61, step: 638, loss: 0.3362259864807129, mean loss: 0.3402222507108067
Epoch: 61, step: 639, loss: 0.35126394033432007, mean loss: 0.34022237516066944
Epoch: 61, step: 640, loss: 0.33987957239151, mean loss: 0.34022237129701466
Epoch: 61, step: 641, loss: 0.3602141737937927, mean loss: 0.3402225966176929
Epoch: 61, step: 642, loss: 0.36993178725242615, mean loss: 0.34022293145591165
Epoch: 61, step: 643, loss: 0.31851470470428467, mean loss: 0.3402226867955254
Epoch: 61, step: 644, loss: 0.30835551023483276, mean loss: 0.34022232764376487
Epoch: 61, step: 645, loss: 0.387584388256073, mean loss: 0.3402228614210737
Epoch: 61, step: 646, loss: 0.3074742257595062, mean loss: 0.3402224923433482
Epoch: 61, step: 647, loss: 0.3248794674873352, mean loss: 0.340222319429125
Epoch: 61, step: 648, loss: 0.3052615523338318, mean loss: 0.3402219254295184
Epoch: 61, step: 649, loss: 0.30213987827301025, mean loss: 0.34022149625865766
Epoch: 61, step: 650, loss: 0.36155831813812256, mean loss: 0.3402217367141924
Epoch: 61, step: 651, loss: 0.32376629114151, mean loss: 0.34022155127146825
Epoch: 61, step: 652, loss: 0.3204100430011749, mean loss: 0.34022132801050303
Epoch: 61, step: 653, loss: 0.34960758686065674, mean loss: 0.3402214337854681
Epoch: 61, step: 654, loss: 0.32173222303390503, mean loss: 0.3402212254305086
Epoch: 61, step: 655, loss: 0.3172612488269806, mean loss: 0.3402209666973938
Epoch: 61, step: 656, loss: 0.3260085880756378, mean loss: 0.34022080654167525
Epoch: 61, step: 657, loss: 0.3262283205986023, mean loss: 0.34022064886564873
Epoch: 61, step: 658, loss: 0.32731905579566956, mean loss: 0.34022050348411925
Epoch: 61, step: 659, loss: 0.3036777675151825, mean loss: 0.3402200917071431
Epoch: 61, step: 660, loss: 0.31517502665519714, mean loss: 0.3402198094933277
Epoch: 61, step: 661, loss: 0.3613761365413666, mean loss: 0.340220047885222
Epoch: 61, step: 662, loss: 0.30418214201927185, mean loss: 0.34021964181058434
Epoch: 61, step: 663, loss: 0.33858588337898254, mean loss: 0.34021962340162376
Epoch: 61, step: 664, loss: 0.3431631326675415, mean loss: 0.34021965656829906
Epoch: 61, step: 665, loss: 0.3090737760066986, mean loss: 0.34021930562879976
Epoch: 61, step: 666, loss: 0.3314080834388733, mean loss: 0.34021920634854164
Epoch: 61, step: 667, loss: 0.3377704322338104, mean loss: 0.3402191787573424
Epoch: 61, step: 668, loss: 0.3089359998703003, mean loss: 0.34021882628273437
Epoch: 61, step: 669, loss: 0.33192363381385803, mean loss: 0.3402187328199894
Epoch: 61, step: 670, loss: 0.35745692253112793, mean loss: 0.34021892704217077
Epoch: 61, step: 671, loss: 0.3272203207015991, mean loss: 0.3402187805889018
Epoch: 61, step: 672, loss: 0.3326575458049774, mean loss: 0.3402186953986094
Epoch: 61, step: 673, loss: 0.32931384444236755, mean loss: 0.34021857253812404
Epoch: 61, step: 674, loss: 0.38179266452789307, mean loss: 0.34021904093109817
Epoch: 61, step: 675, loss: 0.34622547030448914, mean loss: 0.3402191086015508
Epoch: 61, step: 676, loss: 0.3622819781303406, mean loss: 0.34021935716645574
Epoch: 61, step: 677, loss: 0.3746162950992584, mean loss: 0.34021974468519045
Epoch: 61, step: 678, loss: 0.31217578053474426, mean loss: 0.3402194287431408
Epoch: 61, step: 679, loss: 0.3379378020763397, mean loss: 0.3402194030387261
Epoch: 61, step: 680, loss: 0.3749013841152191, mean loss: 0.3402197937555748
Epoch: 61, step: 681, loss: 0.32736706733703613, mean loss: 0.3402196489622258
Epoch: 61, step: 682, loss: 0.37136366963386536, mean loss: 0.3402199998135632
Epoch: 61, step: 683, loss: 0.3403845429420471, mean loss: 0.34022000166719435
Epoch: 61, step: 684, loss: 0.3720986247062683, mean loss: 0.3402203607860651
Epoch: 61, step: 685, loss: 0.3213759958744049, mean loss: 0.3402201485030313
Epoch: 61, step: 686, loss: 0.3460107743740082, mean loss: 0.340220213734085
Epoch: 61, step: 687, loss: 0.3542943298816681, mean loss: 0.3402203722763748
Epoch: 61, step: 688, loss: 0.3327273726463318, mean loss: 0.3402202878700843
Epoch: 61, step: 689, loss: 0.30172619223594666, mean loss: 0.34021985425105583
Epoch: 61, step: 690, loss: 0.3217645585536957, mean loss: 0.3402196463626222
Epoch: 61, step: 691, loss: 0.3095586895942688, mean loss: 0.34021930098823305
Epoch: 61, step: 692, loss: 0.3451918065547943, mean loss: 0.34021935699942474
Epoch: 61, step: 693, loss: 0.3563989996910095, mean loss: 0.34021953924775983
Epoch: 61, step: 694, loss: 0.31251761317253113, mean loss: 0.3402192272153414
Epoch: 61, step: 695, loss: 0.3362000584602356, mean loss: 0.34021918194423584
Epoch: 61, step: 696, loss: 0.3079102635383606, mean loss: 0.34021881802719944
Epoch: 61, step: 697, loss: 0.32537221908569336, mean loss: 0.3402186508018729
Epoch: 61, step: 698, loss: 0.3338174521923065, mean loss: 0.34021857870250016
Epoch: 61, step: 699, loss: 0.3319329619407654, mean loss: 0.3402184853791901
Epoch: 61, step: 700, loss: 0.3361283242702484, mean loss: 0.34021843931103546
Epoch: 61, step: 701, loss: 0.29940399527549744, mean loss: 0.34021797961644357
Epoch: 61, step: 702, loss: 0.35578805208206177, mean loss: 0.3402181549807702
Epoch: 61, step: 703, loss: 0.31781360507011414, mean loss: 0.3402179026431805
Epoch: 61, step: 704, loss: 0.31230607628822327, mean loss: 0.3402175882818705
Epoch: 61, step: 705, loss: 0.31332308053970337, mean loss: 0.34021728538168194
Epoch: 61, step: 706, loss: 0.32086727023124695, mean loss: 0.34021706745401864
Epoch: 61, step: 707, loss: 0.3039689064025879, mean loss: 0.3402166592172287
Epoch: 61, step: 708, loss: 0.37565335631370544, mean loss: 0.340217058310593
Epoch: 61, step: 709, loss: 0.3325590491294861, mean loss: 0.34021697206592355
Epoch: 61, step: 710, loss: 0.3159331977367401, mean loss: 0.3402166985845977
Epoch: 61, step: 711, loss: 0.30407604575157166, mean loss: 0.3402162915769303
Epoch: 61, step: 712, loss: 0.38721123337745667, mean loss: 0.3402168208171276
Epoch: 61, step: 713, loss: 0.3496486246585846, mean loss: 0.34021692703352713
Epoch: 61, step: 714, loss: 0.35322409868240356, mean loss: 0.3402170735123349
Epoch: 61, step: 715, loss: 0.33456137776374817, mean loss: 0.34021700982206743
Epoch: 61, step: 716, loss: 0.31540706753730774, mean loss: 0.34021673043397177
Epoch: 61, step: 717, loss: 0.3491705060005188, mean loss: 0.3402168312625068
Epoch: 61, step: 718, loss: 0.307767778635025, mean loss: 0.34021646585759224
Epoch: 61, step: 719, loss: 0.31287142634391785, mean loss: 0.34021615793182863
Epoch: 61, step: 720, loss: 0.372968465089798, mean loss: 0.34021652674335
Epoch: 61, step: 721, loss: 0.3415287435054779, mean loss: 0.34021654151956743
Epoch: 61, step: 722, loss: 0.3094261884689331, mean loss: 0.3402161948086882
Epoch: 61, step: 723, loss: 0.3396490812301636, mean loss: 0.34021618842284934
Epoch: 61, step: 724, loss: 0.3206658959388733, mean loss: 0.3402159682842093
Epoch: 61, step: 725, loss: 0.3584386110305786, mean loss: 0.3402161734710435
Epoch: 61, step: 726, loss: 0.3254619836807251, mean loss: 0.34021600734083673
Epoch: 61, step: 727, loss: 0.30923327803611755, mean loss: 0.3402156584833704
Epoch: 61, step: 728, loss: 0.337228387594223, mean loss: 0.34021562484785656
Epoch: 61, step: 729, loss: 0.32842519879341125, mean loss: 0.3402154920937181
Epoch: 61, step: 730, loss: 0.3065498173236847, mean loss: 0.34021511303978835
Epoch: 61, step: 731, loss: 0.33372315764427185, mean loss: 0.34021503994535274
Epoch: 61, step: 732, loss: 0.3684370219707489, mean loss: 0.3402153576996343
Epoch: 61, step: 733, loss: 0.3084949553012848, mean loss: 0.3402150005602887
Epoch: 61, step: 734, loss: 0.32799211144447327, mean loss: 0.3402148629445858
Epoch: 61, step: 735, loss: 0.3248501718044281, mean loss: 0.3402146899577457
Epoch: 61, step: 736, loss: 0.31880924105644226, mean loss: 0.34021444896238534
Epoch: 61, step: 737, loss: 0.32538706064224243, mean loss: 0.3402142820286491
Epoch: 61, step: 738, loss: 0.32850968837738037, mean loss: 0.3402141502542928
Epoch: 61, step: 739, loss: 0.34150031208992004, mean loss: 0.34021416473418375
Epoch: 61, step: 740, loss: 0.3190230429172516, mean loss: 0.34021392616259
Epoch: 61, step: 741, loss: 0.33746516704559326, mean loss: 0.34021389521715606
Epoch: 61, step: 742, loss: 0.3155730962753296, mean loss: 0.34021361781502674
Epoch: 61, step: 743, loss: 0.3207329213619232, mean loss: 0.34021339850696564
Epoch: 61, step: 744, loss: 0.3326319754123688, mean loss: 0.34021331315845227
Epoch: 61, step: 745, loss: 0.33850836753845215, mean loss: 0.3402132939650985
Epoch: 61, step: 746, loss: 0.34180107712745667, mean loss: 0.34021331183929965
Epoch: 61, step: 747, loss: 0.38650843501091003, mean loss: 0.3402138329929737
Epoch: 61, step: 748, loss: 0.3045060932636261, mean loss: 0.34021343102816637
Epoch: 61, step: 749, loss: 0.34805166721343994, mean loss: 0.34021351926280835
Epoch: 61, step: 750, loss: 0.3576335310935974, mean loss: 0.34021371535682343
Epoch: 61, step: 751, loss: 0.3697834312915802, mean loss: 0.34021404821417783
Epoch: 61, step: 752, loss: 0.3416953384876251, mean loss: 0.340214064888427
Epoch: 61, step: 753, loss: 0.3685588836669922, mean loss: 0.3402143839503012
Epoch: 61, step: 754, loss: 0.3212447166442871, mean loss: 0.34021417042170105
Epoch: 61, step: 755, loss: 0.3196362555027008, mean loss: 0.3402139387927623
Epoch: 61, step: 756, loss: 0.29584088921546936, mean loss: 0.3402134393268673
Epoch: 61, step: 757, loss: 0.31379634141921997, mean loss: 0.34021314197766417
Epoch: 61, step: 758, loss: 0.37759366631507874, mean loss: 0.3402135627257742
Epoch: 61, step: 759, loss: 0.31120070815086365, mean loss: 0.34021323616624766
Epoch: 61, step: 760, loss: 0.34774264693260193, mean loss: 0.34021332091396295
Epoch: 61, step: 761, loss: 0.3138900399208069, mean loss: 0.34021302463409675
Epoch: 61, step: 762, loss: 0.3405296802520752, mean loss: 0.340213028198152
Epoch: 61, step: 763, loss: 0.28598013520240784, mean loss: 0.3402124177973214
Epoch: 61, step: 764, loss: 0.3434508442878723, mean loss: 0.3402124542459758
Epoch: 61, step: 765, loss: 0.330486923456192, mean loss: 0.3402123447858656
Epoch: 61, step: 766, loss: 0.3542821705341339, mean loss: 0.3402125031389032
Epoch: 61, step: 767, loss: 0.32011207938194275, mean loss: 0.34021227691525313
Epoch: 61, step: 768, loss: 0.3305000960826874, mean loss: 0.3402121676090864
Epoch: 61, step: 769, loss: 0.3369196951389313, mean loss: 0.34021213055422705
Epoch: 61, step: 770, loss: 0.34210407733917236, mean loss: 0.34021215184674614
Epoch: 61, step: 771, loss: 0.34282782673835754, mean loss: 0.34021218128398045
Epoch: 61, step: 772, loss: 0.3075411319732666, mean loss: 0.3402118136027701
Epoch: 61, step: 773, loss: 0.3450612723827362, mean loss: 0.3402118681781463
Epoch: 61, step: 774, loss: 0.3185330927371979, mean loss: 0.34021162420988826
Epoch: 61, step: 775, loss: 0.31013473868370056, mean loss: 0.3402112857349217
Epoch: 61, step: 776, loss: 0.3435423970222473, mean loss: 0.3402113232216852
Epoch: 61, step: 777, loss: 0.42331382632255554, mean loss: 0.34021225840773883
Epoch: 61, step: 778, loss: 0.3782413899898529, mean loss: 0.34021268636011026
Epoch: 61, step: 779, loss: 0.37923821806907654, mean loss: 0.34021312552030686
Epoch: 61, step: 780, loss: 0.3273596465587616, mean loss: 0.3402129808797964
Epoch: 61, step: 781, loss: 0.3264094889163971, mean loss: 0.3402128255505145
Epoch: 61, step: 782, loss: 0.2953035831451416, mean loss: 0.3402123201970942
Epoch: 61, step: 783, loss: 0.31493377685546875, mean loss: 0.3402120357466357
Epoch: 61, step: 784, loss: 0.3179422616958618, mean loss: 0.3402117851556079
Epoch: 61, step: 785, loss: 0.31613388657569885, mean loss: 0.3402115142216754
Epoch: 61, step: 786, loss: 0.31613069772720337, mean loss: 0.3402112432579584
Epoch: 61, step: 787, loss: 0.3167460858821869, mean loss: 0.3402109792247716
Epoch: 61, step: 788, loss: 0.35116347670555115, mean loss: 0.340211102462397
Epoch: 61, step: 789, loss: 0.34701502323150635, mean loss: 0.34021117901932896
Epoch: 61, step: 790, loss: 0.34251657128334045, mean loss: 0.340211204959045
Epoch: 61, step: 791, loss: 0.3632243871688843, mean loss: 0.34021146389489054
Epoch: 61, step: 792, loss: 0.3721778392791748, mean loss: 0.34021182356471946
Epoch: 61, step: 793, loss: 0.3363935053348541, mean loss: 0.3402117806033766
Epoch: 61, step: 794, loss: 0.29433009028434753, mean loss: 0.34021126437693033
Epoch: 61, step: 795, loss: 0.37168174982070923, mean loss: 0.3402116184552994
Epoch: 61, step: 796, loss: 0.346403568983078, mean loss: 0.34021168812092567
Epoch: 61, step: 797, loss: 0.3025972843170166, mean loss: 0.3402112649260853
Epoch: 61, step: 798, loss: 0.30775773525238037, mean loss: 0.34021089979968683
Epoch: 61, step: 799, loss: 0.3080619275569916, mean loss: 0.3402105381038558
Epoch: 61, step: 800, loss: 0.3231225311756134, mean loss: 0.340210345855367
Epoch: 61, step: 801, loss: 0.30691349506378174, mean loss: 0.34020997125362107
Epoch: 61, step: 802, loss: 0.30399519205093384, mean loss: 0.34020956382869727
Epoch: 61, step: 803, loss: 0.3638400435447693, mean loss: 0.3402098296742525
Epoch: 61, step: 804, loss: 0.30528855323791504, mean loss: 0.3402094368103837
Epoch: 61, step: 805, loss: 0.31072545051574707, mean loss: 0.340209105119684
Epoch: 61, step: 806, loss: 0.2982501685619354, mean loss: 0.34020863309285837
Epoch: 61, step: 807, loss: 0.2964760661125183, mean loss: 0.34020814111869896
Epoch: 61, step: 808, loss: 0.3193231225013733, mean loss: 0.34020790617310576
Epoch: 61, step: 809, loss: 0.3294995427131653, mean loss: 0.3402077857109434
Epoch: 61, step: 810, loss: 0.31258419156074524, mean loss: 0.34020747496687287
Epoch: 61, step: 811, loss: 0.3176814317703247, mean loss: 0.3402072215691587
Epoch: 61, step: 812, loss: 0.37996912002563477, mean loss: 0.340207668849702
Epoch: 61, step: 813, loss: 0.2938304543495178, mean loss: 0.3402071471595121
Epoch: 61, step: 814, loss: 0.31174159049987793, mean loss: 0.3402068269584226
Epoch: 61, step: 815, loss: 0.3415941298007965, mean loss: 0.34020684256362893
Epoch: 61, step: 816, loss: 0.31187358498573303, mean loss: 0.34020652385790484
Epoch: 61, step: 817, loss: 0.3419342637062073, mean loss: 0.3402065432921116
Epoch: 61, step: 818, loss: 0.3513370752334595, mean loss: 0.3402066684907206
Epoch: 61, step: 819, loss: 0.3121681213378906, mean loss: 0.34020635311067976
Epoch: 61, step: 820, loss: 0.40719443559646606, mean loss: 0.3402071065900396
Epoch: 61, step: 821, loss: 0.3198499083518982, mean loss: 0.340206877615637
Epoch: 61, step: 822, loss: 0.31734493374824524, mean loss: 0.3402066204711617
Epoch: 61, step: 823, loss: 0.3638378977775574, mean loss: 0.3402068862658855
Epoch: 61, step: 824, loss: 0.31218865513801575, mean loss: 0.34020657113208436
Epoch: 61, step: 825, loss: 0.36489221453666687, mean loss: 0.34020684877963137
Epoch: 61, step: 826, loss: 0.2875918447971344, mean loss: 0.34020625700803975
Epoch: 61, step: 827, loss: 0.33813783526420593, mean loss: 0.34020623374434367
Epoch: 61, step: 828, loss: 0.33922669291496277, mean loss: 0.3402062227274977
Epoch: 61, step: 829, loss: 0.30146220326423645, mean loss: 0.3402057869803773
Epoch: 61, step: 830, loss: 0.3343600034713745, mean loss: 0.3402057212346256
Epoch: 61, step: 831, loss: 0.3427799344062805, mean loss: 0.3402057501856937
Epoch: 61, step: 832, loss: 0.3688797652721405, mean loss: 0.3402060726663789
Epoch: 61, step: 833, loss: 0.31426650285720825, mean loss: 0.3402057809417584
Epoch: 61, step: 834, loss: 0.33336129784584045, mean loss: 0.34020570396739863
Epoch: 61, step: 835, loss: 0.3153449296951294, mean loss: 0.3402054243815431
Epoch: 61, step: 836, loss: 0.3305501341819763, mean loss: 0.3402053157987539
Epoch: 61, step: 837, loss: 0.2899680733680725, mean loss: 0.3402047508402236
Epoch: 61, step: 838, loss: 0.34497693181037903, mean loss: 0.340204804506665
Epoch: 61, step: 839, loss: 0.34121114015579224, mean loss: 0.34020481582347095
Epoch: 61, step: 840, loss: 0.3033773601055145, mean loss: 0.3402044016828388
Epoch: 61, step: 841, loss: 0.30795931816101074, mean loss: 0.34020403907703706
Epoch: 61, step: 842, loss: 0.29379332065582275, mean loss: 0.3402035171802181
Epoch: 61, step: 843, loss: 0.33700239658355713, mean loss: 0.34020348118344995
Epoch: 61, step: 844, loss: 0.3043712377548218, mean loss: 0.34020307825253393
Epoch: 61, step: 845, loss: 0.35175150632858276, mean loss: 0.34020320811228966
Epoch: 61, step: 846, loss: 0.3135335445404053, mean loss: 0.34020290822064814
Epoch: 61, step: 847, loss: 0.30466505885124207, mean loss: 0.34020250861365214
Epoch: 61, step: 848, loss: 0.3170980215072632, mean loss: 0.34020224881709626
Epoch: 61, step: 849, loss: 0.33658504486083984, mean loss: 0.3402022081441933
Epoch: 61, step: 850, loss: 0.31788572669029236, mean loss: 0.34020195721394697
Epoch: 61, step: 851, loss: 0.313538134098053, mean loss: 0.34020165740483577
Epoch: 61, step: 852, loss: 0.33558517694473267, mean loss: 0.34020160549752543
Epoch: 61, step: 853, loss: 0.3567447364330292, mean loss: 0.3402017915049793
Epoch: 61, step: 854, loss: 0.3107926547527313, mean loss: 0.34020146083860403
Epoch: 61, step: 855, loss: 0.3258397579193115, mean loss: 0.34020129936229504
Epoch: 61, step: 856, loss: 0.3272134065628052, mean loss: 0.34020115333411005
Epoch: 61, step: 857, loss: 0.41124337911605835, mean loss: 0.3402019520818983
Epoch: 61, step: 858, loss: 0.33987993001937866, mean loss: 0.3402019484613541
Epoch: 61, step: 859, loss: 0.34343865513801575, mean loss: 0.3402019848517422
Epoch: 61, step: 860, loss: 0.32103031873703003, mean loss: 0.3402017693065613
Epoch: 61, step: 861, loss: 0.3151368200778961, mean loss: 0.34020148750693874
Epoch: 61, step: 862, loss: 0.3665735721588135, mean loss: 0.34020178399905937
Epoch: 61, step: 863, loss: 0.37129753828048706, mean loss: 0.3402021335938145
Epoch: 61, step: 864, loss: 0.3829106390476227, mean loss: 0.34020261373980215
Epoch: 61, step: 865, loss: 0.3234472870826721, mean loss: 0.3402024253718802
Epoch: 61, step: 866, loss: 0.35079890489578247, mean loss: 0.34020254449903475
Epoch: 61, step: 867, loss: 0.3670571744441986, mean loss: 0.34020284639927245
Epoch: 61, step: 868, loss: 0.3283601403236389, mean loss: 0.3402027132648523
Epoch: 61, step: 869, loss: 0.31614619493484497, mean loss: 0.3402024428271167
Epoch: 61, step: 870, loss: 0.34918534755706787, mean loss: 0.3402025438096891
Epoch: 61, step: 871, loss: 0.3027145564556122, mean loss: 0.34020212238800474
Epoch: 61, step: 872, loss: 0.3003688454627991, mean loss: 0.3402016746067517
Epoch: 61, step: 873, loss: 0.3436829745769501, mean loss: 0.34020171374094954
Epoch: 61, step: 874, loss: 0.3017490804195404, mean loss: 0.3402012814897628
Epoch: 61, step: 875, loss: 0.31523600220680237, mean loss: 0.34020100085487875
Epoch: 61, step: 876, loss: 0.337131530046463, mean loss: 0.3402009663513232
Epoch: 61, step: 877, loss: 0.3499654233455658, mean loss: 0.3402010761111869
Epoch: 61, step: 878, loss: 0.35149896144866943, mean loss: 0.3402012031065146
Epoch: 61, step: 879, loss: 0.3533155918121338, mean loss: 0.3402013505188241
Epoch: 61, step: 880, loss: 0.32261574268341064, mean loss: 0.3402011528499899
Epoch: 61, step: 881, loss: 0.3129388988018036, mean loss: 0.34020084641546383
Epoch: 61, step: 882, loss: 0.3527170717716217, mean loss: 0.3402009870993731
Epoch: 61, step: 883, loss: 0.32224687933921814, mean loss: 0.34020078529526643
Epoch: 61, step: 884, loss: 0.34452956914901733, mean loss: 0.3402008339502345
Epoch: 61, step: 885, loss: 0.2838251292705536, mean loss: 0.34020020030176107
Epoch: 61, step: 886, loss: 0.27359870076179504, mean loss: 0.34019945172638777
Epoch: 61, step: 887, loss: 0.3525996208190918, mean loss: 0.34019959109797765
Epoch: 61, step: 888, loss: 0.3605336844921112, mean loss: 0.3401998196402702
Epoch: 61, step: 889, loss: 0.3286106586456299, mean loss: 0.3401996893869266
Epoch: 61, step: 890, loss: 0.2942551076412201, mean loss: 0.34019917301062147
Epoch: 61, step: 891, loss: 0.3404615819454193, mean loss: 0.34019917595983173
Epoch: 61, step: 892, loss: 0.3620239198207855, mean loss: 0.3401994212450612
Epoch: 61, step: 893, loss: 0.30751749873161316, mean loss: 0.34019905394165456
Epoch: 61, step: 894, loss: 0.35073962807655334, mean loss: 0.3401991724030234
Epoch: 61, step: 895, loss: 0.3301335573196411, mean loss: 0.34019905928080396
Epoch: 61, step: 896, loss: 0.3465324342250824, mean loss: 0.3401991304575152
Epoch: 61, step: 897, loss: 0.3690703511238098, mean loss: 0.34019945491887443
Epoch: 61, step: 898, loss: 0.3161492645740509, mean loss: 0.3401991846403904
Epoch: 61, step: 899, loss: 0.30351921916007996, mean loss: 0.3401987724318419
Epoch: 61, step: 900, loss: 0.3214452564716339, mean loss: 0.3401985616826599
Epoch: 61, step: 901, loss: 0.35198816657066345, mean loss: 0.34019869417097137
Epoch: 61, step: 902, loss: 0.4045379161834717, mean loss: 0.34019941718918767
Epoch: 61, step: 903, loss: 0.35957032442092896, mean loss: 0.3401996348691808
Epoch: 61, step: 904, loss: 0.3566553294658661, mean loss: 0.34019981978748076
Epoch: 61, step: 905, loss: 0.33343738317489624, mean loss: 0.3401997437965086
Epoch: 61, step: 906, loss: 0.3204570710659027, mean loss: 0.3401995219462908
Epoch: 61, step: 907, loss: 0.3246307671070099, mean loss: 0.3401993470007357
Epoch: 61, step: 908, loss: 0.326639860868454, mean loss: 0.3401991946349751
Epoch: 61, step: 909, loss: 0.32822906970977783, mean loss: 0.3401990601301217
Epoch: 61, step: 910, loss: 0.3659386932849884, mean loss: 0.3401993493557316
Epoch: 61, step: 911, loss: 0.31295594573020935, mean loss: 0.3401990432363147
Epoch: 61, step: 912, loss: 0.36036932468414307, mean loss: 0.3401992698763301
Epoch: 61, step: 913, loss: 0.31259381771087646, mean loss: 0.3401989596957399
Epoch: 61, step: 914, loss: 0.29244494438171387, mean loss: 0.3401984231277412
Epoch: 61, step: 915, loss: 0.34510311484336853, mean loss: 0.34019847823663685
Epoch: 61, step: 916, loss: 0.30411723256111145, mean loss: 0.34019807283393716
Epoch: 61, step: 917, loss: 0.28369078040122986, mean loss: 0.34019743793480645
Epoch: 61, step: 918, loss: 0.3199632167816162, mean loss: 0.34019721059167024
Epoch: 61, step: 919, loss: 0.3463682234287262, mean loss: 0.340197279925777
Epoch: 61, step: 920, loss: 0.34934136271476746, mean loss: 0.3401973826625085
Epoch: 61, step: 921, loss: 0.33413946628570557, mean loss: 0.3401973146006208
Epoch: 61, step: 922, loss: 0.3341819643974304, mean loss: 0.3401972470177318
Epoch: 61, step: 923, loss: 0.31623154878616333, mean loss: 0.34019697776442615
Epoch: 61, step: 924, loss: 0.3295555114746094, mean loss: 0.340196858209479
Epoch: 61, step: 925, loss: 0.33697593212127686, mean loss: 0.34019682202336404
Epoch: 61, step: 926, loss: 0.30159106850624084, mean loss: 0.3401963883044583
Epoch: 61, step: 927, loss: 0.3145151734352112, mean loss: 0.340196099790383
Epoch: 61, step: 928, loss: 0.32674089074134827, mean loss: 0.3401959486303384
Epoch: 61, step: 929, loss: 0.29893285036087036, mean loss: 0.34019548507293995
Epoch: 61, step: 930, loss: 0.30700021982192993, mean loss: 0.3401951121552828
Epoch: 61, step: 931, loss: 0.3604693114757538, mean loss: 0.3401953399143297
Epoch: 61, step: 932, loss: 0.3058278262615204, mean loss: 0.34019495383623616
Epoch: 61, step: 933, loss: 0.3086158037185669, mean loss: 0.34019459908607197
Epoch: 61, step: 934, loss: 0.34692949056625366, mean loss: 0.3401946747428585
Epoch: 61, step: 935, loss: 0.31709951162338257, mean loss: 0.3401944153049444
Epoch: 61, step: 936, loss: 0.30288928747177124, mean loss: 0.34019399624508395
Epoch: 61, step: 937, loss: 0.33407294750213623, mean loss: 0.34019392748625193
Epoch: 61, step: 938, loss: 0.3169788718223572, mean loss: 0.3401936667103214
Epoch: 61, step: 939, loss: 0.33541446924209595, mean loss: 0.34019361302595014
Epoch: 61, step: 940, loss: 0.3137317895889282, mean loss: 0.34019331578558576
Epoch: 61, step: 941, loss: 0.3318272829055786, mean loss: 0.3401932218126691
Epoch: 61, step: 942, loss: 0.3114486038684845, mean loss: 0.3401928989373847
Epoch: 61, step: 943, loss: 0.34271323680877686, mean loss: 0.3401929272468814
Epoch: 61, step: 944, loss: 0.34323787689208984, mean loss: 0.34019296144865435
Epoch: 61, step: 945, loss: 0.33440133929252625, mean loss: 0.3401928963961759
Epoch: 61, step: 946, loss: 0.34408143162727356, mean loss: 0.34019294007236994
Epoch: 61, step: 947, loss: 0.31650659441947937, mean loss: 0.3401926740293107
Epoch: 61, step: 948, loss: 0.34255364537239075, mean loss: 0.3401927005472461
Epoch: 61, step: 949, loss: 0.31842315196990967, mean loss: 0.34019245603898435
Epoch: 61, step: 950, loss: 0.3375709056854248, mean loss: 0.34019242659494153
Epoch: 61, step: 951, loss: 0.3276654779911041, mean loss: 0.3401922858996205
Epoch: 61, step: 952, loss: 0.30361104011535645, mean loss: 0.3401918750451916
Epoch: 61, step: 953, loss: 0.3190605938434601, mean loss: 0.34019163771639715
Epoch: 61, step: 954, loss: 0.32407698035240173, mean loss: 0.34019145673213896
Epoch: 61, step: 955, loss: 0.35151761770248413, mean loss: 0.34019158393520466
Epoch: 61, step: 956, loss: 0.3344438374042511, mean loss: 0.34019151938352027
Epoch: 61, step: 957, loss: 0.3167848289012909, mean loss: 0.3401912565110502
Epoch: 61, step: 958, loss: 0.29346996545791626, mean loss: 0.3401907318062328
Epoch: 61, step: 959, loss: 0.307807981967926, mean loss: 0.3401903681349036
Epoch: 61, step: 960, loss: 0.35252895951271057, mean loss: 0.34019050670070045
Epoch: 61, step: 961, loss: 0.30979466438293457, mean loss: 0.3401901653508103
Epoch: 61, step: 962, loss: 0.3132741153240204, mean loss: 0.34018986308290655
Epoch: 61, step: 963, loss: 0.3518214523792267, mean loss: 0.3401899937044735
Epoch: 61, step: 964, loss: 0.37484505772590637, mean loss: 0.340190382872954
Epoch: 61, step: 965, loss: 0.32008686661720276, mean loss: 0.3401901571175777
Epoch: 61, step: 966, loss: 0.3187941312789917, mean loss: 0.34018991685047417
Epoch: 61, step: 967, loss: 0.28506213426589966, mean loss: 0.3401892977988798
Epoch: 61, step: 968, loss: 0.322420597076416, mean loss: 0.340189098269378
Epoch: 61, step: 969, loss: 0.32052531838417053, mean loss: 0.340188877462004
Epoch: 61, step: 970, loss: 0.34402787685394287, mean loss: 0.34018892057018874
Epoch: 61, step: 971, loss: 0.3565160930156708, mean loss: 0.34018910390620705
Epoch: 61, step: 972, loss: 0.38136664032936096, mean loss: 0.3401895662790292
Epoch: 61, step: 973, loss: 0.3184707760810852, mean loss: 0.34018932240660676
Epoch: 61, step: 974, loss: 0.3003309667110443, mean loss: 0.340188874856604
Epoch: 61, step: 975, loss: 0.30583813786506653, mean loss: 0.3401884891532917
Epoch: 61, step: 976, loss: 0.41663455963134766, mean loss: 0.3401893475095922
Epoch: 61, step: 977, loss: 0.3185511827468872, mean loss: 0.3401891045533958
Epoch: 61, step: 978, loss: 0.3554530441761017, mean loss: 0.34018927593701886
Epoch: 61, step: 979, loss: 0.34802764654159546, mean loss: 0.34018936394531185
Epoch: 61, step: 980, loss: 0.313133180141449, mean loss: 0.3401890601651086
Epoch: 61, step: 981, loss: 0.33472710847854614, mean loss: 0.3401889988403417
Epoch: 61, step: 982, loss: 0.37900349497795105, mean loss: 0.3401894346302093
Epoch: 61, step: 983, loss: 0.30547043681144714, mean loss: 0.3401890448269374
Epoch: 61, step: 984, loss: 0.3072378933429718, mean loss: 0.3401886748760961
Epoch: 61, step: 985, loss: 0.3278534412384033, mean loss: 0.34018853638688945
Epoch: 61, step: 986, loss: 0.34922847151756287, mean loss: 0.3401886378782293
Epoch: 61, step: 987, loss: 0.3123866617679596, mean loss: 0.3401883257489843
Epoch: 61, step: 988, loss: 0.34094634652137756, mean loss: 0.3401883342590914
Epoch: 61, step: 989, loss: 0.31408920884132385, mean loss: 0.34018804125411334
Epoch: 61, step: 990, loss: 0.31946805119514465, mean loss: 0.34018780864125836
Epoch: 61, step: 991, loss: 0.347539484500885, mean loss: 0.3401878911738806
Epoch: 61, step: 992, loss: 0.3879517912864685, mean loss: 0.3401884273830043
Epoch: 61, step: 993, loss: 0.3526759743690491, mean loss: 0.3401885675696608
Epoch: 61, step: 994, loss: 0.32681092619895935, mean loss: 0.34018841739238703
Epoch: 61, step: 995, loss: 0.32214295864105225, mean loss: 0.34018821481651423
Epoch: 61, step: 996, loss: 0.34302982687950134, mean loss: 0.3401882467157078
Epoch: 61, step: 997, loss: 0.32092517614364624, mean loss: 0.34018803047594476
Epoch: 61, step: 998, loss: 0.393820583820343, mean loss: 0.3401886325274399
Epoch: 61, step: 999, loss: 0.30966508388519287, mean loss: 0.34018828988960775
Epoch: 61, step: 1000, loss: 0.30371934175491333, mean loss: 0.3401878805171193
Epoch: 61, step: 1001, loss: 0.3461087644100189, mean loss: 0.34018794697968235
Epoch: 61, step: 1002, loss: 0.37787607312202454, mean loss: 0.340188370028232
Epoch: 61, step: 1003, loss: 0.3429343104362488, mean loss: 0.34018840085101854
Epoch: 61, step: 1004, loss: 0.34026339650154114, mean loss: 0.3401884016928245
Epoch: 61, step: 1005, loss: 0.3564069867134094, mean loss: 0.3401885837400242
Epoch: 61, step: 1006, loss: 0.3379760682582855, mean loss: 0.3401885589056921
Epoch: 61, step: 1007, loss: 0.38859322667121887, mean loss: 0.3401891022167387
Epoch: 61, step: 1008, loss: 0.3093346357345581, mean loss: 0.3401887558992224
Epoch: 61, step: 1009, loss: 0.35470399260520935, mean loss: 0.3401889188196963
Epoch: 61, step: 1010, loss: 0.35177406668663025, mean loss: 0.3401890488510995
Epoch: 61, step: 1011, loss: 0.3307383954524994, mean loss: 0.3401889427783982
Epoch: 61, step: 1012, loss: 0.32631877064704895, mean loss: 0.3401887871034357
Epoch: 61, step: 1013, loss: 0.3183043599128723, mean loss: 0.3401885414814555
Epoch: 61, step: 1014, loss: 0.32189950346946716, mean loss: 0.3401883362149765
Epoch: 61, step: 1015, loss: 0.36486107110977173, mean loss: 0.3401886131255814
Epoch: 61, step: 1016, loss: 0.3287757337093353, mean loss: 0.3401884850363409
Epoch: 61, step: 1017, loss: 0.3610673248767853, mean loss: 0.3401887193614946
Epoch: 61, step: 1018, loss: 0.35555315017700195, mean loss: 0.34018889179598966
Epoch: 61, step: 1019, loss: 0.36639803647994995, mean loss: 0.340189185937046
Epoch: 61, step: 1020, loss: 0.31530633568763733, mean loss: 0.3401889066839149
Epoch: 61, step: 1021, loss: 0.3529540002346039, mean loss: 0.34018904994131116
Epoch: 61, step: 1022, loss: 0.3270166218280792, mean loss: 0.3401889021142256
Epoch: 61, step: 1023, loss: 0.3048022985458374, mean loss: 0.3401885049938372
Epoch: 61, step: 1024, loss: 0.3313552737236023, mean loss: 0.34018840586545207
Epoch: 61, step: 1025, loss: 0.3737834692001343, mean loss: 0.3401887828721105
Epoch: 61, step: 1026, loss: 0.2875629961490631, mean loss: 0.34018819230768277
Epoch: 61, step: 1027, loss: 0.3274102210998535, mean loss: 0.34018804891542126
Epoch: 61, step: 1028, loss: 0.34098610281944275, mean loss: 0.3401880578709486
Epoch: 61, step: 1029, loss: 0.3131664991378784, mean loss: 0.34018775464632917
Epoch: 61, step: 1030, loss: 0.3319603204727173, mean loss: 0.3401876623225433
Epoch: 61, step: 1031, loss: 0.35232165455818176, mean loss: 0.34018779848206837
Epoch: 61, step: 1032, loss: 0.33663785457611084, mean loss: 0.34018775864742506
Epoch: 61, step: 1033, loss: 0.3438848555088043, mean loss: 0.3401878001328361
Epoch: 61, step: 1034, loss: 0.31838592886924744, mean loss: 0.3401875554950904
Epoch: 61, step: 1035, loss: 0.3609886169433594, mean loss: 0.3401877889001785
Epoch: 61, step: 1036, loss: 0.337089866399765, mean loss: 0.3401877541393196
Epoch: 61, step: 1037, loss: 0.3033793270587921, mean loss: 0.3401873411276381
Epoch: 61, step: 1038, loss: 0.3275599181652069, mean loss: 0.34018719944229353
Epoch: 61, step: 1039, loss: 0.3816402554512024, mean loss: 0.3401876645589401
Epoch: 61, step: 1040, loss: 0.3435021936893463, mean loss: 0.3401877017486078
Epoch: 61, step: 1041, loss: 0.3243001401424408, mean loss: 0.34018752348904713
Epoch: 61, step: 1042, loss: 0.3266936242580414, mean loss: 0.3401873720882457
Epoch: 61, step: 1043, loss: 0.30821672081947327, mean loss: 0.3401870133833351
Epoch: 61, step: 1044, loss: 0.29390963912010193, mean loss: 0.3401864941654121
Epoch: 61, step: 1045, loss: 0.31617653369903564, mean loss: 0.34018622478405375
Epoch: 61, step: 1046, loss: 0.32118523120880127, mean loss: 0.34018601160352646
Epoch: 61, step: 1047, loss: 0.3062877655029297, mean loss: 0.34018563128841967
Epoch: 61, step: 1048, loss: 0.33673664927482605, mean loss: 0.34018559259363756
Epoch: 61, step: 1049, loss: 0.34213992953300476, mean loss: 0.34018561451946766
Epoch: 61, step: 1050, loss: 0.35761281847953796, mean loss: 0.34018581003418086
Epoch: 61, step: 1051, loss: 0.313287615776062, mean loss: 0.3401855082684043
Epoch: 61, step: 1052, loss: 0.3119019567966461, mean loss: 0.34018519096412586
Epoch: 61, step: 1053, loss: 0.28935298323631287, mean loss: 0.34018462069995425
Epoch: 61, step: 1054, loss: 0.3200524151325226, mean loss: 0.3401843948481322
Epoch: 61, step: 1055, loss: 0.3090709149837494, mean loss: 0.3401840458075234
Epoch: 61, step: 1056, loss: 0.3348533809185028, mean loss: 0.3401839860071522
Epoch: 61, step: 1057, loss: 0.31236958503723145, mean loss: 0.3401836739836283
Epoch: 61, step: 1058, loss: 0.3591359555721283, mean loss: 0.34018388658901055
Epoch: 61, step: 1059, loss: 0.3174181580543518, mean loss: 0.34018363120750944
Epoch: 61, step: 1060, loss: 0.33613207936286926, mean loss: 0.34018358575850116
Epoch: 61, step: 1061, loss: 0.3188022971153259, mean loss: 0.34018334591275773
Epoch: 61, step: 1062, loss: 0.32653218507766724, mean loss: 0.3401831927818522
Epoch: 61, step: 1063, loss: 0.31309840083122253, mean loss: 0.34018288896357307
Epoch: 61, step: 1064, loss: 0.33282867074012756, mean loss: 0.3401828064700148
Epoch: 61, step: 1065, loss: 0.37562233209609985, mean loss: 0.34018320399694274
Epoch: 61, step: 1066, loss: 0.374436616897583, mean loss: 0.34018358821487527
Epoch: 61, step: 1067, loss: 0.3328511416912079, mean loss: 0.3401835059683017
Epoch: 61, step: 1068, loss: 0.3316899538040161, mean loss: 0.34018341069890906
Epoch: 61, step: 1069, loss: 0.3487693965435028, mean loss: 0.34018350700401984
Epoch: 61, step: 1070, loss: 0.2820832133293152, mean loss: 0.340182855326675
Epoch: 61, step: 1071, loss: 0.2928875684738159, mean loss: 0.34018232484878397
Epoch: 61, step: 1072, loss: 0.33651304244995117, mean loss: 0.3401822836934916
Epoch: 61, step: 1073, loss: 0.35149306058883667, mean loss: 0.3401824105556565
Epoch: 61, step: 1074, loss: 0.390222430229187, mean loss: 0.34018297180039536
Epoch: 61, step: 1075, loss: 0.348102331161499, mean loss: 0.34018306062228143
Epoch: 61, step: 1076, loss: 0.31002122163772583, mean loss: 0.3401827223371682
Epoch: 61, step: 1077, loss: 0.32056471705436707, mean loss: 0.34018250231064023
Epoch: 61, step: 1078, loss: 0.3231249451637268, mean loss: 0.34018231100306706
Epoch: 61, step: 1079, loss: 0.3402614891529083, mean loss: 0.34018231189107284
Epoch: 61, step: 1080, loss: 0.33976325392723083, mean loss: 0.3401823071912695
Epoch: 61, step: 1081, loss: 0.34621500968933105, mean loss: 0.340182374848252
Epoch: 61, step: 1082, loss: 0.32634758949279785, mean loss: 0.34018221969236073
Epoch: 61, step: 1083, loss: 0.31937333941459656, mean loss: 0.3401819863252304
Epoch: 61, step: 1084, loss: 0.3525694012641907, mean loss: 0.34018212524587477
Epoch: 61, step: 1085, loss: 0.3552318811416626, mean loss: 0.3401822940218745
Epoch: 61, step: 1086, loss: 0.3560572564601898, mean loss: 0.3401824720501846
Epoch: 61, step: 1087, loss: 0.3470393419265747, mean loss: 0.3401825489450605
Epoch: 61, step: 1088, loss: 0.2813751697540283, mean loss: 0.3401818894698921
Epoch: 61, step: 1089, loss: 0.35990461707115173, mean loss: 0.3401821106411707
Epoch: 61, step: 1090, loss: 0.37679922580718994, mean loss: 0.3401825212620304
Epoch: 61, step: 1091, loss: 0.35625597834587097, mean loss: 0.3401827015062338
Epoch: 61, step: 1092, loss: 0.28758832812309265, mean loss: 0.34018211173114177
Epoch: 61, step: 1093, loss: 0.34628206491470337, mean loss: 0.3401821801331376
Epoch: 61, step: 1094, loss: 0.31887802481651306, mean loss: 0.34018194124107426
Epoch: 61, step: 1095, loss: 0.350249320268631, mean loss: 0.34018205412937913
Epoch: 61, step: 1096, loss: 0.3565625548362732, mean loss: 0.34018223780640344
Epoch: 61, step: 1097, loss: 0.3278139531612396, mean loss: 0.3401820991205179
Epoch: 61, step: 1098, loss: 0.30526235699653625, mean loss: 0.3401817075689652
Epoch: 61, step: 1099, loss: 0.3782751262187958, mean loss: 0.3401821347018439
Epoch: 61, step: 1100, loss: 0.337656706571579, mean loss: 0.34018210638510754
Epoch: 61, step: 1101, loss: 0.3387005031108856, mean loss: 0.340182089772598
Epoch: 61, step: 1102, loss: 0.3284095823764801, mean loss: 0.34018195777457816
Epoch: 61, step: 1103, loss: 0.34196120500564575, mean loss: 0.3401819777239798
Epoch: 61, step: 1104, loss: 0.31508558988571167, mean loss: 0.34018169633964046
Epoch: 61, step: 1105, loss: 0.32232338190078735, mean loss: 0.3401814961118746
Epoch: 61, step: 1106, loss: 0.35372984409332275, mean loss: 0.3401816480145103
Epoch: 61, step: 1107, loss: 0.31382760405540466, mean loss: 0.34018135253908693
Epoch: 61, step: 1108, loss: 0.3508961498737335, mean loss: 0.34018147266956056
Epoch: 61, step: 1109, loss: 0.3138066828250885, mean loss: 0.34018117696816985
Epoch: 61, step: 1110, loss: 0.3390948474407196, mean loss: 0.34018116478890503
Epoch: 61, step: 1111, loss: 0.3244117796421051, mean loss: 0.34018098799414803
Epoch: 61, step: 1112, loss: 0.4993075430393219, mean loss: 0.340182771984137
Epoch: 61, step: 1113, loss: 0.32226166129112244, mean loss: 0.3401825710703195
Epoch: 61, step: 1114, loss: 0.30895352363586426, mean loss: 0.3401822209649659
Epoch: 61, step: 1115, loss: 0.30402112007141113, mean loss: 0.34018181557145816
Epoch: 61, step: 1116, loss: 0.33637794852256775, mean loss: 0.3401817729276868
Epoch: 61, step: 1117, loss: 0.314433753490448, mean loss: 0.34018148427923234
Epoch: 61, step: 1118, loss: 0.3623030483722687, mean loss: 0.34018173227048926
Epoch: 61, step: 1119, loss: 0.39633893966674805, mean loss: 0.3401823618073642
Epoch: 61, step: 1120, loss: 0.3323933780193329, mean loss: 0.34018227449181254
Epoch: 61, step: 1121, loss: 0.3984636962413788, mean loss: 0.3401829278270338
Epoch: 61, step: 1122, loss: 0.3507823050022125, mean loss: 0.3401830466448079
Epoch: 61, step: 1123, loss: 0.3133746087551117, mean loss: 0.34018274612873434
Epoch: 61, step: 1124, loss: 0.39296188950538635, mean loss: 0.3401833377634727
Epoch: 61, step: 1125, loss: 0.3572251498699188, mean loss: 0.34018352879376196
Epoch: 61, step: 1126, loss: 0.3299400508403778, mean loss: 0.34018341397072493
Epoch: 61, step: 1127, loss: 0.3592791259288788, mean loss: 0.3401836280194175
Epoch: 61, step: 1128, loss: 0.3336107134819031, mean loss: 0.3401835543427724
Epoch: 61, step: 1129, loss: 0.3134121894836426, mean loss: 0.3401832542624615
Epoch: 61, step: 1130, loss: 0.31538549065589905, mean loss: 0.34018297630736866
Epoch: 61, step: 1131, loss: 0.3252418339252472, mean loss: 0.3401828088358122
Epoch: 61, step: 1132, loss: 0.32074299454689026, mean loss: 0.34018259094220127
Epoch: 61, step: 1133, loss: 0.30991190671920776, mean loss: 0.3401822516532212
Epoch: 61, step: 1134, loss: 0.35530558228492737, mean loss: 0.34018242116118064
Epoch: 61, step: 1135, loss: 0.3080052435398102, mean loss: 0.340182060511353
Epoch: 61, step: 1136, loss: 0.35835838317871094, mean loss: 0.34018226423382497
Epoch: 61, step: 1137, loss: 0.31375423073768616, mean loss: 0.34018196802847767
Epoch: 61, step: 1138, loss: 0.3115253448486328, mean loss: 0.3401816468487014
Epoch: 61, step: 1139, loss: 0.3428928554058075, mean loss: 0.3401816772352404
Epoch: 61, step: 1140, loss: 0.39115890860557556, mean loss: 0.3401822485687385
Epoch: 61, step: 1141, loss: 0.3556922972202301, mean loss: 0.3401824223975401
Epoch: 61, step: 1142, loss: 0.3313509523868561, mean loss: 0.34018232341998833
Epoch: 61, step: 1143, loss: 0.30274471640586853, mean loss: 0.3401819038475782
Epoch: 61, step: 1144, loss: 0.37838056683540344, mean loss: 0.34018233194453085
Epoch: 61, step: 1145, loss: 0.3992636203765869, mean loss: 0.3401829940681264
Epoch: 61, step: 1146, loss: 0.3206155598163605, mean loss: 0.3401827747784821
Epoch: 61, step: 1147, loss: 0.31305477023124695, mean loss: 0.3401824707619348
Epoch: 61, step: 1148, loss: 0.34626609086990356, mean loss: 0.34018253893873157
Epoch: 61, step: 1149, loss: 0.3252066373825073, mean loss: 0.34018237111142857
Epoch: 61, step: 1150, loss: 0.2875708043575287, mean loss: 0.34018178152699696
Epoch: 61, step: 1151, loss: 0.31015831232070923, mean loss: 0.34018144507680637
Epoch: 61, step: 1152, loss: 0.3378681540489197, mean loss: 0.3401814191538033
Epoch: 61, step: 1153, loss: 0.300753116607666, mean loss: 0.3401809773206992
Epoch: 61, step: 1154, loss: 0.36593714356422424, mean loss: 0.34018126594076714
Epoch: 61, step: 1155, loss: 0.3262704610824585, mean loss: 0.3401811100599417
Epoch: 61, step: 1156, loss: 0.3309287130832672, mean loss: 0.34018100638117327
Epoch: 61, step: 1157, loss: 0.32054123282432556, mean loss: 0.3401807863079616
Epoch: 61, step: 1158, loss: 0.3330710530281067, mean loss: 0.3401807066408361
Epoch: 61, step: 1159, loss: 0.3478947877883911, mean loss: 0.34018079307892884
Epoch: 61, step: 1160, loss: 0.33360791206359863, mean loss: 0.3401807194290771
Epoch: 61, step: 1161, loss: 0.3193436563014984, mean loss: 0.3401804859501187
Epoch: 61, step: 1162, loss: 0.3171634376049042, mean loss: 0.3401802280473506
Epoch: 61, step: 1163, loss: 0.30733051896095276, mean loss: 0.3401798599751351
Epoch: 61, step: 1164, loss: 0.3364059031009674, mean loss: 0.34017981768943023
Epoch: 61, step: 1165, loss: 0.2951984107494354, mean loss: 0.3401793136960752
Epoch: 61, step: 1166, loss: 0.313458651304245, mean loss: 0.3401790143082544
Epoch: 61, step: 1167, loss: 0.33272796869277954, mean loss: 0.34017893082502026
Epoch: 61, step: 1168, loss: 0.3311925232410431, mean loss: 0.3401788301403645
Epoch: 61, step: 1169, loss: 0.30197030305862427, mean loss: 0.3401784020528045
Epoch: 61, step: 1170, loss: 0.31598252058029175, mean loss: 0.340178130965678
Epoch: 61, step: 1171, loss: 0.3326709270477295, mean loss: 0.34017804685700276
Epoch: 61, step: 1172, loss: 0.33913931250572205, mean loss: 0.3401780352194354
Epoch: 61, step: 1173, loss: 0.41412144899368286, mean loss: 0.3401788636428123
Epoch: 61, step: 1174, loss: 0.3390825390815735, mean loss: 0.3401788513603023
Epoch: 61, step: 1175, loss: 0.3245863616466522, mean loss: 0.3401786766741079
Epoch: 61, step: 1176, loss: 0.37241435050964355, mean loss: 0.34017903781361825
Epoch: 61, step: 1177, loss: 0.3543623089790344, mean loss: 0.34017919670845775
Epoch: 61, step: 1178, loss: 0.32579120993614197, mean loss: 0.3401790355220001
Epoch: 61, step: 1179, loss: 0.2950921654701233, mean loss: 0.3401785304262162
Epoch: 61, step: 1180, loss: 0.3238806128501892, mean loss: 0.34017834784718104
Epoch: 61, step: 1181, loss: 0.2934384346008301, mean loss: 0.34017782424454124
Epoch: 61, step: 1182, loss: 0.38471919298171997, mean loss: 0.3401783232124548
Epoch: 61, step: 1183, loss: 0.33040374517440796, mean loss: 0.34017821371545653
Epoch: 61, step: 1184, loss: 0.3953993320465088, mean loss: 0.34017883230778234
Epoch: 61, step: 1185, loss: 0.30380138754844666, mean loss: 0.3401784248086812
Epoch: 61, step: 1186, loss: 0.3259162902832031, mean loss: 0.3401782650464457
Epoch: 61, step: 1187, loss: 0.37887394428253174, mean loss: 0.34017869850463234
Epoch: 61, step: 1188, loss: 0.34266749024391174, mean loss: 0.34017872638306973
Epoch: 61, step: 1189, loss: 0.32184091210365295, mean loss: 0.34017852097259993
Epoch: 61, step: 1190, loss: 0.3060034513473511, mean loss: 0.3401781381658833
Epoch: 61, step: 1191, loss: 0.3202041685581207, mean loss: 0.3401779144330816
Epoch: 61, step: 1192, loss: 0.33365437388420105, mean loss: 0.34017784136229573
Epoch: 61, step: 1193, loss: 0.3018655776977539, mean loss: 0.34017741222786546
Epoch: 61, step: 1194, loss: 0.319070965051651, mean loss: 0.34017717581787904
Epoch: 61, step: 1195, loss: 0.3256320059299469, mean loss: 0.34017701290154967
Epoch: 61, step: 1196, loss: 0.3525030016899109, mean loss: 0.3401771509599136
Epoch: 61, step: 1197, loss: 0.3557775020599365, mean loss: 0.3401773256911147
Epoch: 61, step: 1198, loss: 0.3369874358177185, mean loss: 0.34017728996326196
Epoch: 61, step: 1199, loss: 0.3113747239112854, mean loss: 0.34017696736832836
Epoch: 61, step: 1200, loss: 0.38647517561912537, mean loss: 0.34017748591240915
Epoch: 61, step: 1201, loss: 0.3281584084033966, mean loss: 0.3401773512991718
Epoch: 61, step: 1202, loss: 0.3419952988624573, mean loss: 0.3401773716598913
Epoch: 61, step: 1203, loss: 0.28179433941841125, mean loss: 0.34017671778666936
Epoch: 61, step: 1204, loss: 0.3055379390716553, mean loss: 0.34017632984662394
Epoch: 61, step: 1205, loss: 0.32026857137680054, mean loss: 0.340176106890431
Epoch: 61, step: 1206, loss: 0.3218814432621002, mean loss: 0.3401759020023277
Epoch: 61, step: 1207, loss: 0.3436598777770996, mean loss: 0.34017594102010956
Epoch: 61, step: 1208, loss: 0.3472762703895569, mean loss: 0.3401760205373099
Epoch: 61, step: 1209, loss: 0.36789608001708984, mean loss: 0.34017633097316763
Epoch: 61, step: 1210, loss: 0.32568106055259705, mean loss: 0.34017616864302125
Epoch: 61, step: 1211, loss: 0.32933834195137024, mean loss: 0.3401760472733441
Epoch: 61, step: 1212, loss: 0.31520771980285645, mean loss: 0.3401757676634191
Epoch: 61, step: 1213, loss: 0.3365260064601898, mean loss: 0.3401757267917176
Epoch: 61, step: 1214, loss: 0.360871821641922, mean loss: 0.34017595855349375
Epoch: 61, step: 1215, loss: 0.29843205213546753, mean loss: 0.340175491096535
Epoch: 61, step: 1216, loss: 0.33152541518211365, mean loss: 0.34017539423226795
Epoch: 61, step: 1217, loss: 0.3348133862018585, mean loss: 0.34017533418872997
Epoch: 61, step: 1218, loss: 0.3193349540233612, mean loss: 0.340175100821652
Epoch: 61, step: 1219, loss: 0.32382386922836304, mean loss: 0.34017491772535624
Epoch: 61, step: 1220, loss: 0.34595564007759094, mean loss: 0.3401749824554649
Epoch: 61, step: 1221, loss: 0.2793527841567993, mean loss: 0.3401743014015794
Epoch: 61, step: 1222, loss: 0.3360448479652405, mean loss: 0.34017425516272426
Epoch: 61, step: 1223, loss: 0.3116879165172577, mean loss: 0.3401739361953457
Epoch: 61, step: 1224, loss: 0.3542565107345581, mean loss: 0.3401740938790566
Epoch: 61, step: 1225, loss: 0.35160332918167114, mean loss: 0.34017422185168344
Epoch: 61, step: 1226, loss: 0.3378795385360718, mean loss: 0.34017419615850664
Epoch: 61, step: 1227, loss: 0.32113438844680786, mean loss: 0.34017398297542134
Epoch: 61, step: 1228, loss: 0.3094463646411896, mean loss: 0.3401736389312359
Epoch: 61, step: 1229, loss: 0.2842297852039337, mean loss: 0.34017301255850907
Epoch: 61, step: 1230, loss: 0.3269743025302887, mean loss: 0.3401728647814276
Epoch: 61, step: 1231, loss: 0.3136400282382965, mean loss: 0.34017256771442345
Epoch: 61, step: 1232, loss: 0.3265964388847351, mean loss: 0.34017241571504114
Epoch: 61, step: 1233, loss: 0.34177568554878235, mean loss: 0.3401724336651725
Epoch: 61, step: 1234, loss: 0.34880125522613525, mean loss: 0.340172530271959
Epoch: 61, step: 1235, loss: 0.31017962098121643, mean loss: 0.34017219448031893
Epoch: 61, step: 1236, loss: 0.35327059030532837, mean loss: 0.3401723411243984
Epoch: 61, step: 1237, loss: 0.3521480858325958, mean loss: 0.34017247519825156
Epoch: 61, step: 1238, loss: 0.33048734068870544, mean loss: 0.34017236677002466
Epoch: 61, step: 1239, loss: 0.32756751775741577, mean loss: 0.3401722256562253
Epoch: 61, step: 1240, loss: 0.3283582627773285, mean loss: 0.34017209339803467
Epoch: 61, step: 1241, loss: 0.3251689076423645, mean loss: 0.34017192543813773
Epoch: 61, step: 1242, loss: 0.30581164360046387, mean loss: 0.34017154078084666
Epoch: 61, step: 1243, loss: 0.3593061864376068, mean loss: 0.3401717549874298
Epoch: 61, step: 1244, loss: 0.2920667231082916, mean loss: 0.340171216472145
Epoch: 61, step: 1245, loss: 0.34905779361724854, mean loss: 0.34017131595246675
Epoch: 61, step: 1246, loss: 0.36574235558509827, mean loss: 0.3401716022029244
Epoch: 61, step: 1247, loss: 0.29382094740867615, mean loss: 0.3401710833445669
Epoch: 61, step: 1248, loss: 0.3437734842300415, mean loss: 0.34017112367010044
Epoch: 61, step: 1249, loss: 0.3528275191783905, mean loss: 0.3401712653451123
Epoch: 61, step: 1250, loss: 0.36605626344680786, mean loss: 0.3401715550971479
Epoch: 61, step: 1251, loss: 0.32247382402420044, mean loss: 0.34017135699413154
Epoch: 61, step: 1252, loss: 0.3349634110927582, mean loss: 0.3401712986986224
Epoch: 61, step: 1253, loss: 0.3790699243545532, mean loss: 0.34017173410825385
Epoch: 61, step: 1254, loss: 0.3596135675907135, mean loss: 0.34017195172691406
Epoch: 61, step: 1255, loss: 0.3087086081504822, mean loss: 0.3401715995515886
Epoch: 61, step: 1256, loss: 0.3380796015262604, mean loss: 0.3401715761357098
Epoch: 61, step: 1257, loss: 0.27168235182762146, mean loss: 0.3401708095396597
Epoch: 61, step: 1258, loss: 0.3214976489543915, mean loss: 0.340170600534359
Epoch: 61, step: 1259, loss: 0.2765923738479614, mean loss: 0.3401698889227602
Epoch: 61, step: 1260, loss: 0.3196714222431183, mean loss: 0.34016965949227523
Epoch: 61, step: 1261, loss: 0.3383435010910034, mean loss: 0.34016963905310166
Epoch: 61, step: 1262, loss: 0.3270450234413147, mean loss: 0.34016949215823544
Epoch: 61, step: 1263, loss: 0.32898059487342834, mean loss: 0.3401693669299451
Epoch: 61, step: 1264, loss: 0.32590559124946594, mean loss: 0.3401692072888111
Epoch: 61, step: 1265, loss: 0.2918723523616791, mean loss: 0.34016866675322155
Epoch: 61, step: 1266, loss: 0.31859833002090454, mean loss: 0.34016842534197006
Epoch: 61, step: 1267, loss: 0.32938364148139954, mean loss: 0.3401683046419985
Epoch: 61, step: 1268, loss: 0.3384050130844116, mean loss: 0.3401682849080046
Epoch: 61, step: 1269, loss: 0.34502846002578735, mean loss: 0.34016833930036666
Epoch: 61, step: 1270, loss: 0.38990092277526855, mean loss: 0.34016889587340093
Epoch: 61, step: 1271, loss: 0.3320336639881134, mean loss: 0.3401688048304728
Epoch: 61, step: 1272, loss: 0.3283056318759918, mean loss: 0.34016867206893253
Epoch: 61, step: 1273, loss: 0.33010604977607727, mean loss: 0.3401685594587321
Epoch: 61, step: 1274, loss: 0.3067133128643036, mean loss: 0.34016818506727076
Epoch: 61, step: 1275, loss: 0.3115376830101013, mean loss: 0.3401678646722164
Epoch: 61, step: 1276, loss: 0.3361054062843323, mean loss: 0.3401678192110153
Epoch: 61, step: 1277, loss: 0.35484713315963745, mean loss: 0.340167983478981
Epoch: 61, step: 1278, loss: 0.3198517858982086, mean loss: 0.34016775613435757
Epoch: 61, step: 1279, loss: 0.3171474039554596, mean loss: 0.3401674985322787
Epoch: 61, step: 1280, loss: 0.2960332930088043, mean loss: 0.34016700466772853
Epoch: 61, step: 1281, loss: 0.35615605115890503, mean loss: 0.3401671835841676
Epoch: 61, step: 1282, loss: 0.32389888167381287, mean loss: 0.34016700154491475
Epoch: 61, step: 1283, loss: 0.3071214258670807, mean loss: 0.34016663177524686
Epoch: 61, step: 1284, loss: 0.32378891110420227, mean loss: 0.3401664485157198
Epoch: 61, step: 1285, loss: 0.3288489282131195, mean loss: 0.34016632187903745
Epoch: 61, step: 1286, loss: 0.35658523440361023, mean loss: 0.34016650559537187
Epoch: 61, step: 1287, loss: 0.3172384798526764, mean loss: 0.34016624904940956
Epoch: 61, step: 1288, loss: 0.32515794038772583, mean loss: 0.3401660811205198
Epoch: 61, step: 1289, loss: 0.3136124014854431, mean loss: 0.3401657840130877
Epoch: 61, step: 1290, loss: 0.3282961845397949, mean loss: 0.3401656512063803
Epoch: 61, step: 1291, loss: 0.3687761127948761, mean loss: 0.3401659713198514
Epoch: 61, step: 1292, loss: 0.35704749822616577, mean loss: 0.3401661601998418
Epoch: 61, step: 1293, loss: 0.3223625719547272, mean loss: 0.3401659610055407
Epoch: 61, step: 1294, loss: 0.3256109952926636, mean loss: 0.34016579816006565
Epoch: 61, step: 1295, loss: 0.3321051001548767, mean loss: 0.3401657079754829
Epoch: 61, step: 1296, loss: 0.332074373960495, mean loss: 0.34016561744915164
Epoch: 61, step: 1297, loss: 0.3264833390712738, mean loss: 0.34016546437271145
Epoch: 61, step: 1298, loss: 0.3043085038661957, mean loss: 0.34016506321185863
Epoch: 61, step: 1299, loss: 0.3315165936946869, mean loss: 0.3401649664555094
Epoch: 61, step: 1300, loss: 0.34381303191185, mean loss: 0.34016500726845855
Epoch: 61, step: 1301, loss: 0.3409394323825836, mean loss: 0.3401650159322886
Epoch: 61, step: 1302, loss: 0.33440670371055603, mean loss: 0.3401649515122698
Epoch: 61, step: 1303, loss: 0.2822982668876648, mean loss: 0.3401643041470236
Epoch: 61, step: 1304, loss: 0.3616000711917877, mean loss: 0.3401645439502102
Epoch: 61, step: 1305, loss: 0.3187573254108429, mean loss: 0.3401643044690765
Epoch: 61, step: 1306, loss: 0.364169180393219, mean loss: 0.34016457300702685
Epoch: 61, step: 1307, loss: 0.34575149416923523, mean loss: 0.3401646355061449
Epoch: 61, step: 1308, loss: 0.34436148405075073, mean loss: 0.34016468245443554
Epoch: 61, step: 1309, loss: 0.31813889741897583, mean loss: 0.3401644360644649
Epoch: 61, step: 1310, loss: 0.31690794229507446, mean loss: 0.3401641759101635
Epoch: 61, step: 1311, loss: 0.34187501668930054, mean loss: 0.34016419504794126
Epoch: 61, step: 1312, loss: 0.33573028445243835, mean loss: 0.34016414544996154
Epoch: 61, step: 1313, loss: 0.3286900818347931, mean loss: 0.3401640171018596
Epoch: 61, step: 1314, loss: 0.3246081471443176, mean loss: 0.34016384309689357
Epoch: 61, step: 1315, loss: 0.36375609040260315, mean loss: 0.3401641069922773
Epoch: 61, step: 1316, loss: 0.31753847002983093, mean loss: 0.34016385391192067
Epoch: 61, step: 1317, loss: 0.36464643478393555, mean loss: 0.34016412776016647
Epoch: 61, step: 1318, loss: 0.43822866678237915, mean loss: 0.34016522464213933
Epoch: 61, step: 1319, loss: 0.3180202841758728, mean loss: 0.3401649769469527
Epoch: 61, step: 1320, loss: 0.36751294136047363, mean loss: 0.340165282835487
Epoch: 61, step: 1321, loss: 0.2891087234020233, mean loss: 0.340164711771359
Epoch: 61, step: 1322, loss: 0.308709055185318, mean loss: 0.34016435994592487
Epoch: 61, step: 1323, loss: 0.36169883608818054, mean loss: 0.3401646008021809
Epoch: 61, step: 1324, loss: 0.3314565420150757, mean loss: 0.3401645034064066
Epoch: 61, step: 1325, loss: 0.32427978515625, mean loss: 0.34016432574486705
Epoch: 61, step: 1326, loss: 0.32350820302963257, mean loss: 0.3401641394576908
Epoch: 61, step: 1327, loss: 0.2893093526363373, mean loss: 0.34016357068854547
Epoch: 61, step: 1328, loss: 0.324258953332901, mean loss: 0.34016339281041413
Epoch: 61, step: 1329, loss: 0.3253980278968811, mean loss: 0.3401632276755928
Epoch: 61, step: 1330, loss: 0.3409907817840576, mean loss: 0.3401632369307973
Epoch: 61, step: 1331, loss: 0.34490492939949036, mean loss: 0.3401632899603722
Epoch: 61, step: 1332, loss: 0.3005687892436981, mean loss: 0.34016284715306805
Epoch: 61, step: 1333, loss: 0.32105380296707153, mean loss: 0.340162633448398
Epoch: 61, step: 1334, loss: 0.30370986461639404, mean loss: 0.34016222578594557
Epoch: 61, step: 1335, loss: 0.35090357065200806, mean loss: 0.340162345908344
Epoch: 61, step: 1336, loss: 0.3588147759437561, mean loss: 0.34016255449950306
Epoch: 61, step: 1337, loss: 0.3259434700012207, mean loss: 0.3401623954884711
Epoch: 61, step: 1338, loss: 0.3404477536678314, mean loss: 0.3401623986795761
Epoch: 61, step: 1339, loss: 0.3605361878871918, mean loss: 0.3401626265131466
Epoch: 61, step: 1340, loss: 0.3072071969509125, mean loss: 0.3401622579872359
Epoch: 61, step: 1341, loss: 0.31148838996887207, mean loss: 0.34016193734370925
Epoch: 61, step: 1342, loss: 0.3302014172077179, mean loss: 0.34016182596213396
Epoch: 61, step: 1343, loss: 0.34303343296051025, mean loss: 0.3401618580729605
Epoch: 61, step: 1344, loss: 0.33910661935806274, mean loss: 0.3401618462732231
Epoch: 61, step: 1345, loss: 0.3430732488632202, mean loss: 0.34016187882832305
Epoch: 61, step: 1346, loss: 0.3058546781539917, mean loss: 0.34016149521189615
Epoch: 61, step: 1347, loss: 0.3227832317352295, mean loss: 0.3401613008937161
Epoch: 61, step: 1348, loss: 0.3383192718029022, mean loss: 0.3401612802969667
Epoch: 61, step: 1349, loss: 0.3242339789867401, mean loss: 0.3401611022069639
Epoch: 61, step: 1350, loss: 0.3047473132610321, mean loss: 0.3401607062345935
Epoch: 61, step: 1351, loss: 0.3302852213382721, mean loss: 0.3401605958150209
Epoch: 61, step: 1352, loss: 0.31665554642677307, mean loss: 0.34016033300377513
Epoch: 61, step: 1353, loss: 0.35841161012649536, mean loss: 0.3401605370700235
Epoch: 61, step: 1354, loss: 0.3411552608013153, mean loss: 0.3401605481918354
Epoch: 61, step: 1355, loss: 0.35780689120292664, mean loss: 0.34016074548994596
Epoch: 61, step: 1356, loss: 0.3241179287433624, mean loss: 0.3401605661223545
Epoch: 61, step: 1357, loss: 0.3529398739337921, mean loss: 0.3401607090005081
Epoch: 61, step: 1358, loss: 0.356365829706192, mean loss: 0.3401608901786965
Epoch: 61, step: 1359, loss: 0.32920747995376587, mean loss: 0.340160767717601
Epoch: 61, step: 1360, loss: 0.33674314618110657, mean loss: 0.340160729508405
Epoch: 61, step: 1361, loss: 0.3831111192703247, mean loss: 0.340161209690747
Epoch: 61, step: 1362, loss: 0.34353145956993103, mean loss: 0.3401612473694828
Epoch: 61, step: 1363, loss: 0.3272647261619568, mean loss: 0.34016110319050497
Epoch: 61, step: 1364, loss: 0.3104725182056427, mean loss: 0.3401607712853413
Epoch: 61, step: 1365, loss: 0.3377162516117096, mean loss: 0.3401607439570051
Epoch: 61, step: 1366, loss: 0.3179304897785187, mean loss: 0.34016049543821625
Epoch: 61, step: 1367, loss: 0.33604273200035095, mean loss: 0.340160449404998
Epoch: 61, step: 1368, loss: 0.33655285835266113, mean loss: 0.3401604090755395
Epoch: 61, step: 1369, loss: 0.3444724380970001, mean loss: 0.3401604572794099
Epoch: 61, step: 1370, loss: 0.33036208152770996, mean loss: 0.3401603477452782
Epoch: 61, step: 1371, loss: 0.35671791434288025, mean loss: 0.34016053283701714
Epoch: 61, step: 1372, loss: 0.2958259880542755, mean loss: 0.34016003724086724
Epoch: 61, step: 1373, loss: 0.3333888053894043, mean loss: 0.3401599615491253
Epoch: 61, step: 1374, loss: 0.32154396176338196, mean loss: 0.3401597534537991
Epoch: 61, step: 1375, loss: 0.3366657495498657, mean loss: 0.3401597143971939
Epoch: 61, step: 1376, loss: 0.36031675338745117, mean loss: 0.34015993971368924
Epoch: 61, step: 1377, loss: 0.32258471846580505, mean loss: 0.3401597432590912
Epoch: 61, step: 1378, loss: 0.3121793568134308, mean loss: 0.3401594304997779
Epoch: 61, step: 1379, loss: 0.33127710223197937, mean loss: 0.34015933121595127
Epoch: 61, step: 1380, loss: 0.32236263155937195, mean loss: 0.34015913229235367
Epoch: 61, step: 1381, loss: 0.30943381786346436, mean loss: 0.34015878886228607
Epoch: 61, step: 1382, loss: 0.31434187293052673, mean loss: 0.3401585002987271
Epoch: 61, step: 1383, loss: 0.3254360556602478, mean loss: 0.34015833574330345
Epoch: 61, step: 1384, loss: 0.31951263546943665, mean loss: 0.3401581049851607
Epoch: 61, step: 1385, loss: 0.356353223323822, mean loss: 0.3401582859968779
Epoch: 61, step: 1386, loss: 0.35775673389434814, mean loss: 0.3401584826913141
Epoch: 61, step: 1387, loss: 0.3131490647792816, mean loss: 0.34015818081566684
Epoch: 61, step: 1388, loss: 0.3817174434661865, mean loss: 0.3401586453050955
Epoch: 61, step: 1389, loss: 0.2967502772808075, mean loss: 0.34015816015445927
Epoch: 61, step: 1390, loss: 0.3460903465747833, mean loss: 0.3401582264543913
Epoch: 61, step: 1391, loss: 0.3399287462234497, mean loss: 0.34015822388967865
Epoch: 61, step: 1392, loss: 0.31446221470832825, mean loss: 0.34015793670963035
Epoch: 61, step: 1393, loss: 0.3182010352611542, mean loss: 0.3401576913208035
Epoch: 61, step: 1394, loss: 0.3265818953514099, mean loss: 0.34015753960033307
Epoch: 61, step: 1395, loss: 0.2883477807044983, mean loss: 0.34015696059095785
Epoch: 61, step: 1396, loss: 0.3877839148044586, mean loss: 0.3401574928486909
Epoch: 61, step: 1397, loss: 0.3159942030906677, mean loss: 0.340157222813491
Epoch: 61, step: 1398, loss: 0.30801495909690857, mean loss: 0.3401568636138249
Epoch: 61, step: 1399, loss: 0.3536706566810608, mean loss: 0.340157014632924
Epoch: 61, step: 1400, loss: 0.3503451943397522, mean loss: 0.34015712848641577
Epoch: 61, step: 1401, loss: 0.3550243675708771, mean loss: 0.3401572946268074
Epoch: 61, step: 1402, loss: 0.3282306492328644, mean loss: 0.34015716134884083
Epoch: 61, step: 1403, loss: 0.3553121089935303, mean loss: 0.3401573307005712
Epoch: 61, step: 1404, loss: 0.31132155656814575, mean loss: 0.3401570084735474
Epoch: 61, step: 1405, loss: 0.3774898648262024, mean loss: 0.3401574256470456
Epoch: 61, step: 1406, loss: 0.38155969977378845, mean loss: 0.3401578882888099
Epoch: 61, step: 1407, loss: 0.3321768045425415, mean loss: 0.34015779910671823
Epoch: 61, step: 1408, loss: 0.30294734239578247, mean loss: 0.34015738331490536
Epoch: 61, step: 1409, loss: 0.3027385175228119, mean loss: 0.3401569651989893
Epoch: 61, step: 1410, loss: 0.30621424317359924, mean loss: 0.34015658592951026
Epoch: 61, step: 1411, loss: 0.3041020333766937, mean loss: 0.34015618306734263
Epoch: 61, step: 1412, loss: 0.2988128066062927, mean loss: 0.340155721114691
Epoch: 61, step: 1413, loss: 0.3257799744606018, mean loss: 0.3401555604882339
Epoch: 61, step: 1414, loss: 0.3075016140937805, mean loss: 0.34015519563559427
Epoch: 61, step: 1415, loss: 0.32585251331329346, mean loss: 0.34015503582908785
Epoch: 61, step: 1416, loss: 0.3093004524707794, mean loss: 0.34015469108899155
Epoch: 61, step: 1417, loss: 0.31499141454696655, mean loss: 0.3401544099413463
Epoch: 61, step: 1418, loss: 0.3597660958766937, mean loss: 0.34015462905898414
Epoch: 61, step: 1419, loss: 0.33870378136634827, mean loss: 0.34015461284911985
Epoch: 61, step: 1420, loss: 0.3333114981651306, mean loss: 0.34015453639400917
Epoch: 61, step: 1421, loss: 0.3351377546787262, mean loss: 0.3401544803443397
Epoch: 61, step: 1422, loss: 0.29359978437423706, mean loss: 0.34015396022081895
Epoch: 61, step: 1423, loss: 0.31049424409866333, mean loss: 0.3401536288569618
Epoch: 61, step: 1424, loss: 0.34741663932800293, mean loss: 0.3401537099997572
Epoch: 61, step: 1425, loss: 0.32080110907554626, mean loss: 0.3401534937937364
Epoch: 61, step: 1426, loss: 0.32267898321151733, mean loss: 0.3401532985718018
Epoch: 61, step: 1427, loss: 0.37612202763557434, mean loss: 0.34015370040316595
Epoch: 61, step: 1428, loss: 0.3197188675403595, mean loss: 0.34015347211417035
Epoch: 61, step: 1429, loss: 0.32301953434944153, mean loss: 0.3401532807034663
Epoch: 61, step: 1430, loss: 0.3409501612186432, mean loss: 0.3401532896056672
Epoch: 61, step: 1431, loss: 0.34419432282447815, mean loss: 0.3401533347488061
Epoch: 61, step: 1432, loss: 0.32172122597694397, mean loss: 0.3401531288425674
Epoch: 61, step: 1433, loss: 0.31640923023223877, mean loss: 0.34015286360095554
Epoch: 61, step: 1434, loss: 0.3173462748527527, mean loss: 0.3401526088328197
Epoch: 61, step: 1435, loss: 0.3403947949409485, mean loss: 0.3401526115382052
Epoch: 61, step: 1436, loss: 0.34055694937705994, mean loss: 0.3401526160548866
Epoch: 61, step: 1437, loss: 0.3640495240688324, mean loss: 0.3401528829938292
Epoch: 61, step: 1438, loss: 0.3607322871685028, mean loss: 0.3401531128722311
Epoch: 61, step: 1439, loss: 0.3123777210712433, mean loss: 0.3401528026158551
Epoch: 61, step: 1440, loss: 0.3539997339248657, mean loss: 0.3401529572869672
Epoch: 61, step: 1441, loss: 0.3539823889732361, mean loss: 0.34015311176088187
Epoch: 61, step: 1442, loss: 0.29518672823905945, mean loss: 0.34015260949471054
Epoch: 61, step: 1443, loss: 0.3745115399360657, mean loss: 0.3401529932733099
Valid: 61, mean loss: 0.18536726633707684
Epoch: 62, step: 0, loss: 0.3033747673034668, mean loss: 0.34015258247651814
Epoch: 62, step: 1, loss: 0.3449457883834839, mean loss: 0.3401526360139459
Epoch: 62, step: 2, loss: 0.32839861512184143, mean loss: 0.3401525047295763
Epoch: 62, step: 3, loss: 0.3425644040107727, mean loss: 0.3401525316685398
Epoch: 62, step: 4, loss: 0.31630799174308777, mean loss: 0.340152265347296
Epoch: 62, step: 5, loss: 0.31779944896698, mean loss: 0.34015201568999953
Epoch: 62, step: 6, loss: 0.3556515574455261, mean loss: 0.3401521888015398
Epoch: 62, step: 7, loss: 0.35405924916267395, mean loss: 0.3401523441252125
Epoch: 62, step: 8, loss: 0.32484114170074463, mean loss: 0.34015217312101953
Epoch: 62, step: 9, loss: 0.32233956456184387, mean loss: 0.34015197418192594
Epoch: 62, step: 10, loss: 0.3207980990409851, mean loss: 0.34015175803169934
Epoch: 62, step: 11, loss: 0.3213464021682739, mean loss: 0.34015154800985586
Epoch: 62, step: 12, loss: 0.3786740005016327, mean loss: 0.34015197823123483
Epoch: 62, step: 13, loss: 0.3530263602733612, mean loss: 0.34015212201160655
Epoch: 62, step: 14, loss: 0.31708839535713196, mean loss: 0.3401518644400861
Epoch: 62, step: 15, loss: 0.3124484419822693, mean loss: 0.3401515550567387
Epoch: 62, step: 16, loss: 0.35070785880088806, mean loss: 0.34015167294499316
Epoch: 62, step: 17, loss: 0.375575989484787, mean loss: 0.3401520685440879
Epoch: 62, step: 18, loss: 0.38411545753479004, mean loss: 0.3401525594973191
Epoch: 62, step: 19, loss: 0.3156086206436157, mean loss: 0.3401522854103618
Epoch: 62, step: 20, loss: 0.3582736551761627, mean loss: 0.3401524877729763
Epoch: 62, step: 21, loss: 0.309990257024765, mean loss: 0.3401521509529791
Epoch: 62, step: 22, loss: 0.3767589330673218, mean loss: 0.34015255973436753
Epoch: 62, step: 23, loss: 0.32795631885528564, mean loss: 0.34015242354264785
Epoch: 62, step: 24, loss: 0.35170191526412964, mean loss: 0.34015255251087584
Epoch: 62, step: 25, loss: 0.3308469355106354, mean loss: 0.3401524486001962
Epoch: 62, step: 26, loss: 0.3221483528614044, mean loss: 0.3401522475606592
Epoch: 62, step: 27, loss: 0.3268885016441345, mean loss: 0.34015209945505026
Epoch: 62, step: 28, loss: 0.3315425515174866, mean loss: 0.34015200332020945
Epoch: 62, step: 29, loss: 0.3228130340576172, mean loss: 0.3401518097141747
Epoch: 62, step: 30, loss: 0.35500457882881165, mean loss: 0.3401519755575753
Epoch: 62, step: 31, loss: 0.3639112114906311, mean loss: 0.34015224084605156
Epoch: 62, step: 32, loss: 0.33571934700012207, mean loss: 0.34015219135024594
Epoch: 62, step: 33, loss: 0.3132728040218353, mean loss: 0.34015189122980055
Epoch: 62, step: 34, loss: 0.36790698766708374, mean loss: 0.34015220112447175
Epoch: 62, step: 35, loss: 0.3416043519973755, mean loss: 0.34015221733802714
Epoch: 62, step: 36, loss: 0.36616143584251404, mean loss: 0.34015250773291916
Epoch: 62, step: 37, loss: 0.29256656765937805, mean loss: 0.34015197643823064
Epoch: 62, step: 38, loss: 0.33596670627593994, mean loss: 0.34015192971041613
Epoch: 62, step: 39, loss: 0.3161882162094116, mean loss: 0.34015166216270376
Epoch: 62, step: 40, loss: 0.31593531370162964, mean loss: 0.340151391797416
Epoch: 62, step: 41, loss: 0.3267081379890442, mean loss: 0.340151241710849
Epoch: 62, step: 42, loss: 0.2952307462692261, mean loss: 0.3401507402037156
Epoch: 62, step: 43, loss: 0.3619084656238556, mean loss: 0.3401509831113812
Epoch: 62, step: 44, loss: 0.2877253592014313, mean loss: 0.3401503978276025
Epoch: 62, step: 45, loss: 0.32965102791786194, mean loss: 0.3401502806131216
Epoch: 62, step: 46, loss: 0.37461939454078674, mean loss: 0.34015066542042194
Epoch: 62, step: 47, loss: 0.3100316822528839, mean loss: 0.3401503291809921
Epoch: 62, step: 48, loss: 0.3776417672634125, mean loss: 0.3401507477196581
Epoch: 62, step: 49, loss: 0.3483257293701172, mean loss: 0.3401508389807004
Epoch: 62, step: 50, loss: 0.37185829877853394, mean loss: 0.34015119294155954
Epoch: 62, step: 51, loss: 0.35087850689888, mean loss: 0.3401513126927759
Epoch: 62, step: 52, loss: 0.31311267614364624, mean loss: 0.3401510108582736
Epoch: 62, step: 53, loss: 0.33885741233825684, mean loss: 0.34015099641788915
Epoch: 62, step: 54, loss: 0.3659380078315735, mean loss: 0.3401512842739714
Epoch: 62, step: 55, loss: 0.32515501976013184, mean loss: 0.34015111687505517
Epoch: 62, step: 56, loss: 0.32081615924835205, mean loss: 0.3401509010469854
Epoch: 62, step: 57, loss: 0.31999003887176514, mean loss: 0.34015067600219967
Epoch: 62, step: 58, loss: 0.348240464925766, mean loss: 0.3401507663031242
Epoch: 62, step: 59, loss: 0.29500916600227356, mean loss: 0.3401502624231369
Epoch: 62, step: 60, loss: 0.34662148356437683, mean loss: 0.34015033465545497
Epoch: 62, step: 61, loss: 0.3063722550868988, mean loss: 0.3401499576258806
Epoch: 62, step: 62, loss: 0.296720951795578, mean loss: 0.34014947287846364
Epoch: 62, step: 63, loss: 0.3282335102558136, mean loss: 0.34014933987593415
Epoch: 62, step: 64, loss: 0.3056228756904602, mean loss: 0.34014895450582505
Epoch: 62, step: 65, loss: 0.32419249415397644, mean loss: 0.3401487764084039
Epoch: 62, step: 66, loss: 0.28918811678886414, mean loss: 0.34014820761930165
Epoch: 62, step: 67, loss: 0.36602675914764404, mean loss: 0.34014849645531586
Epoch: 62, step: 68, loss: 0.38734084367752075, mean loss: 0.34014902317325535
Epoch: 62, step: 69, loss: 0.34159091114997864, mean loss: 0.3401490392661143
Epoch: 62, step: 70, loss: 0.34726160764694214, mean loss: 0.3401491186483438
Epoch: 62, step: 71, loss: 0.3447675406932831, mean loss: 0.3401491701932327
Epoch: 62, step: 72, loss: 0.3081890940666199, mean loss: 0.3401488134999355
Epoch: 62, step: 73, loss: 0.3270803987979889, mean loss: 0.3401486676503484
Epoch: 62, step: 74, loss: 0.3350100517272949, mean loss: 0.3401486103016444
Epoch: 62, step: 75, loss: 0.3458915948867798, mean loss: 0.34014867439459323
Epoch: 62, step: 76, loss: 0.34237101674079895, mean loss: 0.34014869919613716
Epoch: 62, step: 77, loss: 0.35178688168525696, mean loss: 0.3401488290778693
Epoch: 62, step: 78, loss: 0.29912784695625305, mean loss: 0.3401483712901728
Epoch: 62, step: 79, loss: 0.3608560264110565, mean loss: 0.3401486023817619
Epoch: 62, step: 80, loss: 0.3440839350223541, mean loss: 0.34014864629847386
Epoch: 62, step: 81, loss: 0.3180684745311737, mean loss: 0.34014839989548573
Epoch: 62, step: 82, loss: 0.3382551074028015, mean loss: 0.34014837876758297
Epoch: 62, step: 83, loss: 0.3402348756790161, mean loss: 0.340148379732821
Epoch: 62, step: 84, loss: 0.3275827467441559, mean loss: 0.340148239511726
Epoch: 62, step: 85, loss: 0.3148452937602997, mean loss: 0.34014795715689583
Epoch: 62, step: 86, loss: 0.3289822041988373, mean loss: 0.34014783255997616
Epoch: 62, step: 87, loss: 0.34201672673225403, mean loss: 0.34014785341444603
Epoch: 62, step: 88, loss: 0.2982841432094574, mean loss: 0.340147386274169
Epoch: 62, step: 89, loss: 0.3124837279319763, mean loss: 0.34014707758999463
Epoch: 62, step: 90, loss: 0.33985623717308044, mean loss: 0.340147074344696
Epoch: 62, step: 91, loss: 0.29679617285728455, mean loss: 0.34014659062564345
Epoch: 62, step: 92, loss: 0.34108731150627136, mean loss: 0.3401466011223003
Epoch: 62, step: 93, loss: 0.3661474585533142, mean loss: 0.34014689123920716
Epoch: 62, step: 94, loss: 0.31247448921203613, mean loss: 0.34014658247469326
Epoch: 62, step: 95, loss: 0.34697917103767395, mean loss: 0.34014665871084165
Epoch: 62, step: 96, loss: 0.3289765417575836, mean loss: 0.34014653407913226
Epoch: 62, step: 97, loss: 0.3280121386051178, mean loss: 0.3401463986898984
Epoch: 62, step: 98, loss: 0.34655436873435974, mean loss: 0.3401464701858766
Epoch: 62, step: 99, loss: 0.33544492721557617, mean loss: 0.3401464177296914
Epoch: 62, step: 100, loss: 0.31427717208862305, mean loss: 0.34014612910384884
Epoch: 62, step: 101, loss: 0.34878137707710266, mean loss: 0.34014622544712647
Epoch: 62, step: 102, loss: 0.315400093793869, mean loss: 0.3401459493581433
Epoch: 62, step: 103, loss: 0.32681748270988464, mean loss: 0.34014580065604305
Epoch: 62, step: 104, loss: 0.335701048374176, mean loss: 0.34014575106769634
Epoch: 62, step: 105, loss: 0.337969034910202, mean loss: 0.3401457267832043
Epoch: 62, step: 106, loss: 0.3853120505809784, mean loss: 0.3401462306748069
Epoch: 62, step: 107, loss: 0.31719252467155457, mean loss: 0.34014597459794044
Epoch: 62, step: 108, loss: 0.3583231568336487, mean loss: 0.3401461773845379
Epoch: 62, step: 109, loss: 0.35014012455940247, mean loss: 0.34014628887684223
Epoch: 62, step: 110, loss: 0.3165420591831207, mean loss: 0.3401460255513958
Epoch: 62, step: 111, loss: 0.34256741404533386, mean loss: 0.34014605256376185
Epoch: 62, step: 112, loss: 0.3129064440727234, mean loss: 0.3401457486893239
Epoch: 62, step: 113, loss: 0.3017370402812958, mean loss: 0.34014532022154753
Epoch: 62, step: 114, loss: 0.3125550150871277, mean loss: 0.3401450124417417
Epoch: 62, step: 115, loss: 0.3445083498954773, mean loss: 0.34014506111580195
Epoch: 62, step: 116, loss: 0.32109254598617554, mean loss: 0.34014484858286503
Epoch: 62, step: 117, loss: 0.29487234354019165, mean loss: 0.3401443435686419
Epoch: 62, step: 118, loss: 0.2998071014881134, mean loss: 0.34014389361223424
Epoch: 62, step: 119, loss: 0.34652599692344666, mean loss: 0.34014396480292797
Epoch: 62, step: 120, loss: 0.30209237337112427, mean loss: 0.3401435403521094
Epoch: 62, step: 121, loss: 0.3654780089855194, mean loss: 0.34014382294517836
Epoch: 62, step: 122, loss: 0.3289031386375427, mean loss: 0.3401436975624798
Epoch: 62, step: 123, loss: 0.3068622350692749, mean loss: 0.34014332633303157
Epoch: 62, step: 124, loss: 0.33362114429473877, mean loss: 0.3401432535838538
Epoch: 62, step: 125, loss: 0.3186783194541931, mean loss: 0.34014301416414994
Epoch: 62, step: 126, loss: 0.35542601346969604, mean loss: 0.3401431846287008
Epoch: 62, step: 127, loss: 0.3695674240589142, mean loss: 0.34014351281911115
Epoch: 62, step: 128, loss: 0.32765161991119385, mean loss: 0.3401433734892997
Epoch: 62, step: 129, loss: 0.31593888998031616, mean loss: 0.34014310352472865
Epoch: 62, step: 130, loss: 0.3346922695636749, mean loss: 0.34014304272956075
Epoch: 62, step: 131, loss: 0.3993627727031708, mean loss: 0.3401437032217532
Epoch: 62, step: 132, loss: 0.3193790316581726, mean loss: 0.34014347163085457
Epoch: 62, step: 133, loss: 0.31014126539230347, mean loss: 0.3401431370163441
Epoch: 62, step: 134, loss: 0.39777031540870667, mean loss: 0.3401437797249127
Epoch: 62, step: 135, loss: 0.35018134117126465, mean loss: 0.34014389167130643
Epoch: 62, step: 136, loss: 0.29457706212997437, mean loss: 0.34014338348160544
Epoch: 62, step: 137, loss: 0.351076602935791, mean loss: 0.3401435054143275
Epoch: 62, step: 138, loss: 0.31030479073524475, mean loss: 0.3401431726417949
Epoch: 62, step: 139, loss: 0.3385154604911804, mean loss: 0.34014315448914123
Epoch: 62, step: 140, loss: 0.3404271602630615, mean loss: 0.34014315765640946
Epoch: 62, step: 141, loss: 0.3297502398490906, mean loss: 0.34014304175457155
Epoch: 62, step: 142, loss: 0.34347963333129883, mean loss: 0.34014307896383184
Epoch: 62, step: 143, loss: 0.30242598056793213, mean loss: 0.34014265835206453
Epoch: 62, step: 144, loss: 0.3347131013870239, mean loss: 0.3401425978036613
Epoch: 62, step: 145, loss: 0.30397018790245056, mean loss: 0.3401421944268754
Epoch: 62, step: 146, loss: 0.34250015020370483, mean loss: 0.3401422207213362
Epoch: 62, step: 147, loss: 0.3649227023124695, mean loss: 0.3401424970548211
Epoch: 62, step: 148, loss: 0.3238335847854614, mean loss: 0.3401423151919993
Epoch: 62, step: 149, loss: 0.3811652660369873, mean loss: 0.34014277263920867
Epoch: 62, step: 150, loss: 0.320756196975708, mean loss: 0.3401425564617796
Epoch: 62, step: 151, loss: 0.3661480247974396, mean loss: 0.3401428464424702
Epoch: 62, step: 152, loss: 0.3350183069705963, mean loss: 0.3401427893006066
Epoch: 62, step: 153, loss: 0.3390442132949829, mean loss: 0.3401427770509243
Epoch: 62, step: 154, loss: 0.3071597218513489, mean loss: 0.3401424092771523
Epoch: 62, step: 155, loss: 0.3471904397010803, mean loss: 0.34014248786453044
Epoch: 62, step: 156, loss: 0.3361245393753052, mean loss: 0.340142443063856
Epoch: 62, step: 157, loss: 0.3311100900173187, mean loss: 0.3401423423530087
Epoch: 62, step: 158, loss: 0.33366137742996216, mean loss: 0.3401422700909761
Epoch: 62, step: 159, loss: 0.32117190957069397, mean loss: 0.3401420585759404
Epoch: 62, step: 160, loss: 0.2897369861602783, mean loss: 0.3401414965775636
Epoch: 62, step: 161, loss: 0.33257392048835754, mean loss: 0.3401414122027605
Epoch: 62, step: 162, loss: 0.3058910071849823, mean loss: 0.3401410303316138
Epoch: 62, step: 163, loss: 0.3462977707386017, mean loss: 0.34014109897475264
Epoch: 62, step: 164, loss: 0.34020233154296875, mean loss: 0.34014109965744327
Epoch: 62, step: 165, loss: 0.3256896138191223, mean loss: 0.3401409385375708
Epoch: 62, step: 166, loss: 0.37207266688346863, mean loss: 0.34014129454100855
Epoch: 62, step: 167, loss: 0.3062896132469177, mean loss: 0.3401409171364276
Epoch: 62, step: 168, loss: 0.32446542382240295, mean loss: 0.3401407423759193
Epoch: 62, step: 169, loss: 0.33417126536369324, mean loss: 0.3401406758250819
Epoch: 62, step: 170, loss: 0.3318668603897095, mean loss: 0.34014058358530846
Epoch: 62, step: 171, loss: 0.33884191513061523, mean loss: 0.34014056910739926
Epoch: 62, step: 172, loss: 0.32672443985939026, mean loss: 0.34014041954240837
Epoch: 62, step: 173, loss: 0.30216291546821594, mean loss: 0.34013999616830215
Epoch: 62, step: 174, loss: 0.3106030523777008, mean loss: 0.3401396668934307
Epoch: 62, step: 175, loss: 0.32818570733070374, mean loss: 0.3401395336333803
Epoch: 62, step: 176, loss: 0.32297483086586, mean loss: 0.3401393422872706
Epoch: 62, step: 177, loss: 0.35576897859573364, mean loss: 0.3401395165190534
Epoch: 62, step: 178, loss: 0.2751244902610779, mean loss: 0.3401387917704133
Epoch: 62, step: 179, loss: 0.32095786929130554, mean loss: 0.3401385779553413
Epoch: 62, step: 180, loss: 0.3193367123603821, mean loss: 0.3401383460737509
Epoch: 62, step: 181, loss: 0.3128468692302704, mean loss: 0.3401380418548584
Epoch: 62, step: 182, loss: 0.36580735445022583, mean loss: 0.3401383279882489
Epoch: 62, step: 183, loss: 0.3383105397224426, mean loss: 0.3401383076142937
Epoch: 62, step: 184, loss: 0.3423342704772949, mean loss: 0.34013833209193756
Epoch: 62, step: 185, loss: 0.3742109537124634, mean loss: 0.34013871188351547
Epoch: 62, step: 186, loss: 0.34650933742523193, mean loss: 0.3401387828931074
Epoch: 62, step: 187, loss: 0.31783971190452576, mean loss: 0.340138534341333
Epoch: 62, step: 188, loss: 0.3204864263534546, mean loss: 0.3401383152958011
Epoch: 62, step: 189, loss: 0.297324538230896, mean loss: 0.3401378380919282
Epoch: 62, step: 190, loss: 0.37871795892715454, mean loss: 0.3401382681025261
Epoch: 62, step: 191, loss: 0.35132476687431335, mean loss: 0.3401383927848575
Epoch: 62, step: 192, loss: 0.32834792137145996, mean loss: 0.34013826137224046
Epoch: 62, step: 193, loss: 0.40731358528137207, mean loss: 0.3401390100773954
Epoch: 62, step: 194, loss: 0.3649211823940277, mean loss: 0.3401392862849711
Epoch: 62, step: 195, loss: 0.32622382044792175, mean loss: 0.3401391311930688
Epoch: 62, step: 196, loss: 0.31495317816734314, mean loss: 0.34013885049144693
Epoch: 62, step: 197, loss: 0.3360905051231384, mean loss: 0.3401388053724695
Epoch: 62, step: 198, loss: 0.31195586919784546, mean loss: 0.34013849127597484
Epoch: 62, step: 199, loss: 0.3581259250640869, mean loss: 0.34013869174220374
Epoch: 62, step: 200, loss: 0.34707513451576233, mean loss: 0.3401387690465621
Epoch: 62, step: 201, loss: 0.31442612409591675, mean loss: 0.34013848249083994
Epoch: 62, step: 202, loss: 0.3277684152126312, mean loss: 0.34013834463360804
Epoch: 62, step: 203, loss: 0.33502036333084106, mean loss: 0.3401382875973077
Epoch: 62, step: 204, loss: 0.3267580568790436, mean loss: 0.34013813848571306
Epoch: 62, step: 205, loss: 0.3667937219142914, mean loss: 0.3401384355368133
Epoch: 62, step: 206, loss: 0.2989735007286072, mean loss: 0.3401379767979176
Epoch: 62, step: 207, loss: 0.32974153757095337, mean loss: 0.34013786094208237
Epoch: 62, step: 208, loss: 0.30576032400131226, mean loss: 0.3401374778499694
Epoch: 62, step: 209, loss: 0.3813750445842743, mean loss: 0.34013793738290676
Epoch: 62, step: 210, loss: 0.3390759229660034, mean loss: 0.3401379255484266
Epoch: 62, step: 211, loss: 0.35457026958465576, mean loss: 0.3401380863724074
Epoch: 62, step: 212, loss: 0.3208617866039276, mean loss: 0.34013787157315434
Epoch: 62, step: 213, loss: 0.3762204647064209, mean loss: 0.34013827364345733
Epoch: 62, step: 214, loss: 0.30459949374198914, mean loss: 0.3401378776373075
Epoch: 62, step: 215, loss: 0.3713477849960327, mean loss: 0.3401382254032569
Epoch: 62, step: 216, loss: 0.323488712310791, mean loss: 0.3401380398830263
Epoch: 62, step: 217, loss: 0.3200535476207733, mean loss: 0.34013781609040866
Epoch: 62, step: 218, loss: 0.37740951776504517, mean loss: 0.3401382313878746
Epoch: 62, step: 219, loss: 0.3156794011592865, mean loss: 0.34013795886001624
Epoch: 62, step: 220, loss: 0.3238063454627991, mean loss: 0.34013777689015146
Epoch: 62, step: 221, loss: 0.3475572168827057, mean loss: 0.3401378595580065
Epoch: 62, step: 222, loss: 0.3204498589038849, mean loss: 0.3401376401955409
Epoch: 62, step: 223, loss: 0.3701035976409912, mean loss: 0.34013797407063495
Epoch: 62, step: 224, loss: 0.39396676421165466, mean loss: 0.34013857381426627
Epoch: 62, step: 225, loss: 0.3409506678581238, mean loss: 0.3401385828622646
Epoch: 62, step: 226, loss: 0.31850266456604004, mean loss: 0.34013834180696634
Epoch: 62, step: 227, loss: 0.33523932099342346, mean loss: 0.3401382872254251
Epoch: 62, step: 228, loss: 0.3035489618778229, mean loss: 0.34013787957671415
Epoch: 62, step: 229, loss: 0.2967108190059662, mean loss: 0.3401373957528704
Epoch: 62, step: 230, loss: 0.3015097379684448, mean loss: 0.34013696540429494
Epoch: 62, step: 231, loss: 0.3288610875606537, mean loss: 0.34013683978176995
Epoch: 62, step: 232, loss: 0.3581564128398895, mean loss: 0.3401370405323527
Epoch: 62, step: 233, loss: 0.31407374143600464, mean loss: 0.3401367501722995
Epoch: 62, step: 234, loss: 0.3538186848163605, mean loss: 0.34013690259517576
Epoch: 62, step: 235, loss: 0.3023078739643097, mean loss: 0.34013648116755857
Epoch: 62, step: 236, loss: 0.3190726041793823, mean loss: 0.3401362465117686
Epoch: 62, step: 237, loss: 0.32795655727386475, mean loss: 0.34013611082911327
Epoch: 62, step: 238, loss: 0.3033849596977234, mean loss: 0.34013570142308286
Epoch: 62, step: 239, loss: 0.3319120407104492, mean loss: 0.3401356098129243
Epoch: 62, step: 240, loss: 0.3367961645126343, mean loss: 0.3401355726124954
Epoch: 62, step: 241, loss: 0.3263813853263855, mean loss: 0.3401354193966406
Epoch: 62, step: 242, loss: 0.38790908455848694, mean loss: 0.340135951569226
Epoch: 62, step: 243, loss: 0.3134114444255829, mean loss: 0.34013565387610184
Epoch: 62, step: 244, loss: 0.34707483649253845, mean loss: 0.3401357311730911
Epoch: 62, step: 245, loss: 0.35745859146118164, mean loss: 0.34013592413386246
Epoch: 62, step: 246, loss: 0.3133069574832916, mean loss: 0.34013562528711616
Epoch: 62, step: 247, loss: 0.33351507782936096, mean loss: 0.3401355515419342
Epoch: 62, step: 248, loss: 0.3221045434474945, mean loss: 0.34013535069975753
Epoch: 62, step: 249, loss: 0.35232406854629517, mean loss: 0.34013548646484304
Epoch: 62, step: 250, loss: 0.3199309706687927, mean loss: 0.3401352614176071
Epoch: 62, step: 251, loss: 0.325833797454834, mean loss: 0.3401351021230653
Epoch: 62, step: 252, loss: 0.30511555075645447, mean loss: 0.34013471206780455
Epoch: 62, step: 253, loss: 0.3281829059123993, mean loss: 0.3401345789475114
Epoch: 62, step: 254, loss: 0.3304380774497986, mean loss: 0.3401344709482076
Epoch: 62, step: 255, loss: 0.3311399519443512, mean loss: 0.3401343707686767
Epoch: 62, step: 256, loss: 0.3444046974182129, mean loss: 0.34013441833037017
Epoch: 62, step: 257, loss: 0.3412471413612366, mean loss: 0.34013443072342736
Epoch: 62, step: 258, loss: 0.33431267738342285, mean loss: 0.3401343658838254
Epoch: 62, step: 259, loss: 0.3481937050819397, mean loss: 0.34013445564347256
Epoch: 62, step: 260, loss: 0.32329651713371277, mean loss: 0.34013426811561825
Epoch: 62, step: 261, loss: 0.36930176615715027, mean loss: 0.3401345929568928
Epoch: 62, step: 262, loss: 0.33106935024261475, mean loss: 0.34013449199752366
Epoch: 62, step: 263, loss: 0.31468525528907776, mean loss: 0.3401342085732018
Epoch: 62, step: 264, loss: 0.3423694670200348, mean loss: 0.3401342334666617
Epoch: 62, step: 265, loss: 0.32783663272857666, mean loss: 0.3401340965131822
Epoch: 62, step: 266, loss: 0.34235337376594543, mean loss: 0.3401341212281135
Epoch: 62, step: 267, loss: 0.31564927101135254, mean loss: 0.3401338485561658
Epoch: 62, step: 268, loss: 0.3415065407752991, mean loss: 0.3401338638427814
Epoch: 62, step: 269, loss: 0.3717251420021057, mean loss: 0.34013421564658725
Epoch: 62, step: 270, loss: 0.3252338469028473, mean loss: 0.340134049716357
Epoch: 62, step: 271, loss: 0.34485170245170593, mean loss: 0.34013410225146545
Epoch: 62, step: 272, loss: 0.30525636672973633, mean loss: 0.3401337138622992
Epoch: 62, step: 273, loss: 0.3424467444419861, mean loss: 0.3401337396193044
Epoch: 62, step: 274, loss: 0.3076710104942322, mean loss: 0.3401333781310565
Epoch: 62, step: 275, loss: 0.28603002429008484, mean loss: 0.3401327756706556
Epoch: 62, step: 276, loss: 0.3354046940803528, mean loss: 0.3401327230223444
Epoch: 62, step: 277, loss: 0.3333684802055359, mean loss: 0.34013264770173307
Epoch: 62, step: 278, loss: 0.3506597578525543, mean loss: 0.3401327649209938
Epoch: 62, step: 279, loss: 0.3416227102279663, mean loss: 0.3401327815113344
Epoch: 62, step: 280, loss: 0.29328620433807373, mean loss: 0.3401322598868071
Epoch: 62, step: 281, loss: 0.37029018998146057, mean loss: 0.3401325956838241
Epoch: 62, step: 282, loss: 0.35181334614753723, mean loss: 0.34013272574306475
Epoch: 62, step: 283, loss: 0.32597145438194275, mean loss: 0.3401325680662358
Epoch: 62, step: 284, loss: 0.3276025354862213, mean loss: 0.34013242855377573
Epoch: 62, step: 285, loss: 0.3135643005371094, mean loss: 0.34013213274100695
Epoch: 62, step: 286, loss: 0.3134978115558624, mean loss: 0.34013183619453713
Epoch: 62, step: 287, loss: 0.3465979993343353, mean loss: 0.34013190818798084
Epoch: 62, step: 288, loss: 0.344719797372818, mean loss: 0.34013195926839085
Epoch: 62, step: 289, loss: 0.35819706320762634, mean loss: 0.3401321603984977
Epoch: 62, step: 290, loss: 0.3203030824661255, mean loss: 0.34013193963142246
Epoch: 62, step: 291, loss: 0.3265829384326935, mean loss: 0.3401317887852724
Epoch: 62, step: 292, loss: 0.3339865505695343, mean loss: 0.340131720368775
Epoch: 62, step: 293, loss: 0.3999583125114441, mean loss: 0.34013238642600085
Epoch: 62, step: 294, loss: 0.34821999073028564, mean loss: 0.3401324764653483
Epoch: 62, step: 295, loss: 0.32863539457321167, mean loss: 0.3401323484696913
Epoch: 62, step: 296, loss: 0.3304804265499115, mean loss: 0.340132241017179
Epoch: 62, step: 297, loss: 0.2932402193546295, mean loss: 0.34013171898545475
Epoch: 62, step: 298, loss: 0.33575186133384705, mean loss: 0.3401316702266445
Epoch: 62, step: 299, loss: 0.3501707911491394, mean loss: 0.34013178198601707
Epoch: 62, step: 300, loss: 0.30297550559043884, mean loss: 0.34013136835259805
Epoch: 62, step: 301, loss: 0.3064842224121094, mean loss: 0.34013099378790984
Epoch: 62, step: 302, loss: 0.35344961285591125, mean loss: 0.3401311420509712
Epoch: 62, step: 303, loss: 0.3514557480812073, mean loss: 0.3401312681152471
Epoch: 62, step: 304, loss: 0.36672499775886536, mean loss: 0.34013156415044177
Epoch: 62, step: 305, loss: 0.3490249216556549, mean loss: 0.3401316631481209
Epoch: 62, step: 306, loss: 0.3490530252456665, mean loss: 0.3401317624564316
Epoch: 62, step: 307, loss: 0.37171319127082825, mean loss: 0.34013211400179
Epoch: 62, step: 308, loss: 0.30053040385246277, mean loss: 0.3401316731844191
Epoch: 62, step: 309, loss: 0.33800646662712097, mean loss: 0.34013164952843217
Epoch: 62, step: 310, loss: 0.32935062050819397, mean loss: 0.3401315295245472
Epoch: 62, step: 311, loss: 0.3481537103652954, mean loss: 0.34013161881863496
Epoch: 62, step: 312, loss: 0.3287027180194855, mean loss: 0.3401314916061062
Epoch: 62, step: 313, loss: 0.3051338195800781, mean loss: 0.34013110205921243
Epoch: 62, step: 314, loss: 0.3341996371746063, mean loss: 0.34013103603887823
Epoch: 62, step: 315, loss: 0.33445367217063904, mean loss: 0.3401309728475258
Epoch: 62, step: 316, loss: 0.30597198009490967, mean loss: 0.3401305926483745
Epoch: 62, step: 317, loss: 0.34228086471557617, mean loss: 0.3401306165812381
Epoch: 62, step: 318, loss: 0.33508896827697754, mean loss: 0.3401305604675303
Epoch: 62, step: 319, loss: 0.35134363174438477, mean loss: 0.3401306852679853
Epoch: 62, step: 320, loss: 0.29730820655822754, mean loss: 0.34013020866302907
Epoch: 62, step: 321, loss: 0.32015931606292725, mean loss: 0.3401299863937736
Epoch: 62, step: 322, loss: 0.34824517369270325, mean loss: 0.3401300767120483
Epoch: 62, step: 323, loss: 0.34392037987709045, mean loss: 0.3401301188958969
Epoch: 62, step: 324, loss: 0.40865713357925415, mean loss: 0.34013088155284416
Epoch: 62, step: 325, loss: 0.35686132311820984, mean loss: 0.34013106774869034
Epoch: 62, step: 326, loss: 0.3558295965194702, mean loss: 0.3401312424582643
Epoch: 62, step: 327, loss: 0.31610366702079773, mean loss: 0.34013097505736245
Epoch: 62, step: 328, loss: 0.31265199184417725, mean loss: 0.3401306692494319
Epoch: 62, step: 329, loss: 0.39371779561042786, mean loss: 0.3401312656028602
Epoch: 62, step: 330, loss: 0.3227675259113312, mean loss: 0.34013107236968726
Epoch: 62, step: 331, loss: 0.3513283133506775, mean loss: 0.34013119697731004
Epoch: 62, step: 332, loss: 0.36587876081466675, mean loss: 0.34013148350387706
Epoch: 62, step: 333, loss: 0.3133230209350586, mean loss: 0.3401311851746326
Epoch: 62, step: 334, loss: 0.32230302691459656, mean loss: 0.34013098678198755
Epoch: 62, step: 335, loss: 0.31586211919784546, mean loss: 0.3401307167198093
Epoch: 62, step: 336, loss: 0.35061368346214294, mean loss: 0.34013083337219613
Epoch: 62, step: 337, loss: 0.3612131178379059, mean loss: 0.34013106796909
Epoch: 62, step: 338, loss: 0.29140231013298035, mean loss: 0.340130525737149
Epoch: 62, step: 339, loss: 0.3256429433822632, mean loss: 0.34013036452757106
Epoch: 62, step: 340, loss: 0.354620099067688, mean loss: 0.34013052575930325
Epoch: 62, step: 341, loss: 0.34448865056037903, mean loss: 0.34013057425295856
Epoch: 62, step: 342, loss: 0.32411572337150574, mean loss: 0.34013039605475354
Epoch: 62, step: 343, loss: 0.2852276563644409, mean loss: 0.340129785155478
Epoch: 62, step: 344, loss: 0.3199162781238556, mean loss: 0.3401295602435797
Epoch: 62, step: 345, loss: 0.35765132308006287, mean loss: 0.34012975520277633
Epoch: 62, step: 346, loss: 0.3185408413410187, mean loss: 0.34012951499233
Epoch: 62, step: 347, loss: 0.314542680978775, mean loss: 0.3401292303019342
Epoch: 62, step: 348, loss: 0.3013279139995575, mean loss: 0.340128798586186
Epoch: 62, step: 349, loss: 0.3266063332557678, mean loss: 0.34012864813262306
Epoch: 62, step: 350, loss: 0.33367839455604553, mean loss: 0.3401285763666535
Epoch: 62, step: 351, loss: 0.3308747410774231, mean loss: 0.3401284734089845
Epoch: 62, step: 352, loss: 0.37249717116355896, mean loss: 0.3401288335373515
Epoch: 62, step: 353, loss: 0.32560786604881287, mean loss: 0.3401286719814506
Epoch: 62, step: 354, loss: 0.3181389570236206, mean loss: 0.3401284273332417
Epoch: 62, step: 355, loss: 0.31524190306663513, mean loss: 0.3401281504594459
Epoch: 62, step: 356, loss: 0.372060626745224, mean loss: 0.3401285057186803
Epoch: 62, step: 357, loss: 0.3804023563861847, mean loss: 0.340128953773446
Epoch: 62, step: 358, loss: 0.3196427822113037, mean loss: 0.3401287258631635
Epoch: 62, step: 359, loss: 0.3201700448989868, mean loss: 0.34012850382372595
Epoch: 62, step: 360, loss: 0.30110085010528564, mean loss: 0.34012806964764525
Epoch: 62, step: 361, loss: 0.32695257663726807, mean loss: 0.3401279230741331
Epoch: 62, step: 362, loss: 0.3241788148880005, mean loss: 0.3401277456469359
Epoch: 62, step: 363, loss: 0.31138381361961365, mean loss: 0.3401274258862005
Epoch: 62, step: 364, loss: 0.3095487952232361, mean loss: 0.3401270857192168
Epoch: 62, step: 365, loss: 0.30408650636672974, mean loss: 0.3401266847961368
Epoch: 62, step: 366, loss: 0.37463605403900146, mean loss: 0.340127068681439
Epoch: 62, step: 367, loss: 0.3577742278575897, mean loss: 0.34012726498782836
Epoch: 62, step: 368, loss: 0.3411202132701874, mean loss: 0.3401272760332279
Epoch: 62, step: 369, loss: 0.30147889256477356, mean loss: 0.3401268461195094
Epoch: 62, step: 370, loss: 0.3225242495536804, mean loss: 0.3401266503153673
Epoch: 62, step: 371, loss: 0.3097175657749176, mean loss: 0.3401263120608118
Epoch: 62, step: 372, loss: 0.333001971244812, mean loss: 0.3401262328142982
Epoch: 62, step: 373, loss: 0.3866162598133087, mean loss: 0.3401267499332388
Epoch: 62, step: 374, loss: 0.31239089369773865, mean loss: 0.3401264414245546
Epoch: 62, step: 375, loss: 0.30034929513931274, mean loss: 0.3401259989843263
Epoch: 62, step: 376, loss: 0.3614320755004883, mean loss: 0.34012623596866
Epoch: 62, step: 377, loss: 0.2900034189224243, mean loss: 0.34012567846619024
Epoch: 62, step: 378, loss: 0.3241663873195648, mean loss: 0.3401255009573072
Epoch: 62, step: 379, loss: 0.3156569302082062, mean loss: 0.34012522880609986
Epoch: 62, step: 380, loss: 0.3110189735889435, mean loss: 0.34012490507593696
Epoch: 62, step: 381, loss: 0.3213915526866913, mean loss: 0.34012469671922035
Epoch: 62, step: 382, loss: 0.32006052136421204, mean loss: 0.3401244735632622
Epoch: 62, step: 383, loss: 0.39046651124954224, mean loss: 0.34012503346669765
Epoch: 62, step: 384, loss: 0.3310603201389313, mean loss: 0.3401249326502047
Epoch: 62, step: 385, loss: 0.3294505774974823, mean loss: 0.3401248139328175
Epoch: 62, step: 386, loss: 0.3381787836551666, mean loss: 0.3401247922898183
Epoch: 62, step: 387, loss: 0.3327317237854004, mean loss: 0.3401247100678722
Epoch: 62, step: 388, loss: 0.3272770643234253, mean loss: 0.3401245671844826
Epoch: 62, step: 389, loss: 0.3719973564147949, mean loss: 0.3401249216495422
Epoch: 62, step: 390, loss: 0.30223265290260315, mean loss: 0.3401245002450699
Epoch: 62, step: 391, loss: 0.3338412344455719, mean loss: 0.3401244303688933
Epoch: 62, step: 392, loss: 0.28760144114494324, mean loss: 0.3401238462674128
Epoch: 62, step: 393, loss: 0.3514306843280792, mean loss: 0.34012397200792194
Epoch: 62, step: 394, loss: 0.32944124937057495, mean loss: 0.340123853209365
Epoch: 62, step: 395, loss: 0.35687699913978577, mean loss: 0.3401240395127538
Epoch: 62, step: 396, loss: 0.3415367305278778, mean loss: 0.340124055222412
Epoch: 62, step: 397, loss: 0.3023805618286133, mean loss: 0.34012363550516234
Epoch: 62, step: 398, loss: 0.3110783100128174, mean loss: 0.3401233125173445
Epoch: 62, step: 399, loss: 0.30566802620887756, mean loss: 0.34012292937431554
Epoch: 62, step: 400, loss: 0.3121598958969116, mean loss: 0.340122618428642
Epoch: 62, step: 401, loss: 0.2893763482570648, mean loss: 0.3401220541423063
Epoch: 62, step: 402, loss: 0.34344568848609924, mean loss: 0.34012209109991093
Epoch: 62, step: 403, loss: 0.33353567123413086, mean loss: 0.34012201786213275
Epoch: 62, step: 404, loss: 0.3347497284412384, mean loss: 0.3401219581255575
Epoch: 62, step: 405, loss: 0.29553428292274475, mean loss: 0.34012146234337054
Epoch: 62, step: 406, loss: 0.3222532272338867, mean loss: 0.3401212636639342
Epoch: 62, step: 407, loss: 0.31064626574516296, mean loss: 0.3401209359309027
Epoch: 62, step: 408, loss: 0.29376456141471863, mean loss: 0.3401204204992726
Epoch: 62, step: 409, loss: 0.3714425563812256, mean loss: 0.3401207687629196
Epoch: 62, step: 410, loss: 0.290500283241272, mean loss: 0.34012021705025297
Epoch: 62, step: 411, loss: 0.3479885458946228, mean loss: 0.3401203045344518
Epoch: 62, step: 412, loss: 0.3345775902271271, mean loss: 0.3401202429083379
Epoch: 62, step: 413, loss: 0.35190099477767944, mean loss: 0.34012037388999133
Epoch: 62, step: 414, loss: 0.32017505168914795, mean loss: 0.3401201521348553
Epoch: 62, step: 415, loss: 0.329367071390152, mean loss: 0.3401200325817918
Epoch: 62, step: 416, loss: 0.3273719549179077, mean loss: 0.3401198908498705
Epoch: 62, step: 417, loss: 0.37310802936553955, mean loss: 0.34012025760479586
Epoch: 62, step: 418, loss: 0.3353347182273865, mean loss: 0.34012020440080487
Epoch: 62, step: 419, loss: 0.38093996047973633, mean loss: 0.34012065821585447
Epoch: 62, step: 420, loss: 0.35396385192871094, mean loss: 0.3401208121163282
Epoch: 62, step: 421, loss: 0.3350464701652527, mean loss: 0.3401207557034105
Epoch: 62, step: 422, loss: 0.2794840931892395, mean loss: 0.3401200815957017
Epoch: 62, step: 423, loss: 0.33777832984924316, mean loss: 0.34012005556235336
Epoch: 62, step: 424, loss: 0.30899834632873535, mean loss: 0.340119709584907
Epoch: 62, step: 425, loss: 0.3067607581615448, mean loss: 0.3401193387403484
Epoch: 62, step: 426, loss: 0.34879523515701294, mean loss: 0.340119435187421
Epoch: 62, step: 427, loss: 0.3024871051311493, mean loss: 0.34011901684589785
Epoch: 62, step: 428, loss: 0.35530683398246765, mean loss: 0.3401191856800868
Epoch: 62, step: 429, loss: 0.33785977959632874, mean loss: 0.3401191605638539
Epoch: 62, step: 430, loss: 0.3299580216407776, mean loss: 0.34011904761085393
Epoch: 62, step: 431, loss: 0.30545634031295776, mean loss: 0.34011866229841176
Epoch: 62, step: 432, loss: 0.34361565113067627, mean loss: 0.3401187011706879
Epoch: 62, step: 433, loss: 0.3235990107059479, mean loss: 0.34011851754103906
Epoch: 62, step: 434, loss: 0.36167487502098083, mean loss: 0.34011875715462997
Epoch: 62, step: 435, loss: 0.36560842394828796, mean loss: 0.3401190404864826
Epoch: 62, step: 436, loss: 0.3643582761287689, mean loss: 0.3401193099161013
Epoch: 62, step: 437, loss: 0.3071683645248413, mean loss: 0.34011894365612094
Epoch: 62, step: 438, loss: 0.3896150588989258, mean loss: 0.34011949381468176
Epoch: 62, step: 439, loss: 0.3762490153312683, mean loss: 0.34011989539659443
Epoch: 62, step: 440, loss: 0.3029046356678009, mean loss: 0.3401194817512307
Epoch: 62, step: 441, loss: 0.33706265687942505, mean loss: 0.34011944777518455
Epoch: 62, step: 442, loss: 0.3238022029399872, mean loss: 0.34011926641402557
Epoch: 62, step: 443, loss: 0.324131578207016, mean loss: 0.3401190887177622
Epoch: 62, step: 444, loss: 0.30271971225738525, mean loss: 0.3401186730444329
Epoch: 62, step: 445, loss: 0.3856692314147949, mean loss: 0.340119179308002
Epoch: 62, step: 446, loss: 0.3168947398662567, mean loss: 0.34011892118697457
Epoch: 62, step: 447, loss: 0.3003126382827759, mean loss: 0.34011847877696627
Epoch: 62, step: 448, loss: 0.31608474254608154, mean loss: 0.3401182116671912
Epoch: 62, step: 449, loss: 0.3832477033138275, mean loss: 0.3401186910009355
Epoch: 62, step: 450, loss: 0.3336556553840637, mean loss: 0.3401186191726687
Epoch: 62, step: 451, loss: 0.33742913603782654, mean loss: 0.3401185892828806
Epoch: 62, step: 452, loss: 0.40487855672836304, mean loss: 0.3401193089900126
Epoch: 62, step: 453, loss: 0.34343215823173523, mean loss: 0.34011934580681197
Epoch: 62, step: 454, loss: 0.3303234577178955, mean loss: 0.3401192369430478
Epoch: 62, step: 455, loss: 0.3321162760257721, mean loss: 0.3401191480054487
Epoch: 62, step: 456, loss: 0.3585943281650543, mean loss: 0.3401193533194472
Epoch: 62, step: 457, loss: 0.33258888125419617, mean loss: 0.3401192696345177
Epoch: 62, step: 458, loss: 0.31532546877861023, mean loss: 0.34011899410804325
Epoch: 62, step: 459, loss: 0.323540061712265, mean loss: 0.34011880987311865
Epoch: 62, step: 460, loss: 0.3351731598377228, mean loss: 0.3401187549147345
Epoch: 62, step: 461, loss: 0.31445252895355225, mean loss: 0.3401184697027558
Epoch: 62, step: 462, loss: 0.3117837607860565, mean loss: 0.34011815484117053
Epoch: 62, step: 463, loss: 0.33807864785194397, mean loss: 0.34011813217796727
Epoch: 62, step: 464, loss: 0.33323678374290466, mean loss: 0.3401180557125929
Epoch: 62, step: 465, loss: 0.3433688282966614, mean loss: 0.34011809183469643
Epoch: 62, step: 466, loss: 0.34695902466773987, mean loss: 0.3401181678492843
Epoch: 62, step: 467, loss: 0.36180782318115234, mean loss: 0.34011840885616607
Epoch: 62, step: 468, loss: 0.36065107583999634, mean loss: 0.3401186370045153
Epoch: 62, step: 469, loss: 0.3300440013408661, mean loss: 0.34011852506163137
Epoch: 62, step: 470, loss: 0.3523608446121216, mean loss: 0.3401186610889156
Epoch: 62, step: 471, loss: 0.3714344799518585, mean loss: 0.3401190090424585
Epoch: 62, step: 472, loss: 0.33538728952407837, mean loss: 0.34011895646838136
Epoch: 62, step: 473, loss: 0.3340339660644531, mean loss: 0.3401188888588793
Epoch: 62, step: 474, loss: 0.3402090072631836, mean loss: 0.34011888986016153
Epoch: 62, step: 475, loss: 0.3525947332382202, mean loss: 0.3401190284744829
Epoch: 62, step: 476, loss: 0.2974346876144409, mean loss: 0.3401185542303758
Epoch: 62, step: 477, loss: 0.38123828172683716, mean loss: 0.34011901108577985
Epoch: 62, step: 478, loss: 0.3538435399532318, mean loss: 0.34011916356868527
Epoch: 62, step: 479, loss: 0.31395602226257324, mean loss: 0.34011887289295306
Epoch: 62, step: 480, loss: 0.34536290168762207, mean loss: 0.34011893115411357
Epoch: 62, step: 481, loss: 0.35499775409698486, mean loss: 0.34011909645600163
Epoch: 62, step: 482, loss: 0.2952606678009033, mean loss: 0.340118598089928
Epoch: 62, step: 483, loss: 0.32511481642723083, mean loss: 0.3401184314034677
Epoch: 62, step: 484, loss: 0.3442782759666443, mean loss: 0.34011847761728753
Epoch: 62, step: 485, loss: 0.3387615978717804, mean loss: 0.3401184625431908
Epoch: 62, step: 486, loss: 0.3027151823043823, mean loss: 0.3401180470204419
Epoch: 62, step: 487, loss: 0.3514050841331482, mean loss: 0.34011817240967396
Epoch: 62, step: 488, loss: 0.3202672600746155, mean loss: 0.34011795188563587
Epoch: 62, step: 489, loss: 0.3544733226299286, mean loss: 0.3401181113578608
Epoch: 62, step: 490, loss: 0.32477080821990967, mean loss: 0.34011794086826264
Epoch: 62, step: 491, loss: 0.3274858891963959, mean loss: 0.34011780054331625
Epoch: 62, step: 492, loss: 0.3272833824157715, mean loss: 0.34011765797193705
Epoch: 62, step: 493, loss: 0.3361888527870178, mean loss: 0.34011761432921434
Epoch: 62, step: 494, loss: 0.2952803373336792, mean loss: 0.3401171162645309
Epoch: 62, step: 495, loss: 0.3399617075920105, mean loss: 0.34011711453822824
Epoch: 62, step: 496, loss: 0.3409018814563751, mean loss: 0.3401171232554392
Epoch: 62, step: 497, loss: 0.31776243448257446, mean loss: 0.3401168749417435
Epoch: 62, step: 498, loss: 0.31935831904411316, mean loss: 0.3401166443602968
Epoch: 62, step: 499, loss: 0.30060574412345886, mean loss: 0.3401162054868326
Epoch: 62, step: 500, loss: 0.3519120216369629, mean loss: 0.3401163365092381
Epoch: 62, step: 501, loss: 0.2967989444732666, mean loss: 0.3401158553652635
Epoch: 62, step: 502, loss: 0.37338128685951233, mean loss: 0.3401162248539007
Epoch: 62, step: 503, loss: 0.3594400882720947, mean loss: 0.3401164394871802
Epoch: 62, step: 504, loss: 0.36470827460289, mean loss: 0.3401167126296403
Epoch: 62, step: 505, loss: 0.31667032837867737, mean loss: 0.34011645221263953
Epoch: 62, step: 506, loss: 0.32457882165908813, mean loss: 0.3401162796394119
Epoch: 62, step: 507, loss: 0.31841835379600525, mean loss: 0.34011603864774365
Epoch: 62, step: 508, loss: 0.304521769285202, mean loss: 0.3401156433183861
Epoch: 62, step: 509, loss: 0.3180006742477417, mean loss: 0.340115397700213
Epoch: 62, step: 510, loss: 0.351470947265625, mean loss: 0.34011552381833476
Epoch: 62, step: 511, loss: 0.3439733386039734, mean loss: 0.340115566663901
Epoch: 62, step: 512, loss: 0.3856599032878876, mean loss: 0.34011607248165765
Epoch: 62, step: 513, loss: 0.31642332673072815, mean loss: 0.34011580935172103
Epoch: 62, step: 514, loss: 0.34682926535606384, mean loss: 0.3401158839100543
Epoch: 62, step: 515, loss: 0.30755478143692017, mean loss: 0.3401155222968155
Epoch: 62, step: 516, loss: 0.34783244132995605, mean loss: 0.34011560799751
Epoch: 62, step: 517, loss: 0.3431330919265747, mean loss: 0.3401156415079816
Epoch: 62, step: 518, loss: 0.3001532554626465, mean loss: 0.3401151977132295
Epoch: 62, step: 519, loss: 0.3118628263473511, mean loss: 0.34011488396532435
Epoch: 62, step: 520, loss: 0.3605964481830597, mean loss: 0.3401151114144267
Epoch: 62, step: 521, loss: 0.30969834327697754, mean loss: 0.34011477363798986
Epoch: 62, step: 522, loss: 0.3368709981441498, mean loss: 0.3401147376164521
Epoch: 62, step: 523, loss: 0.29868176579475403, mean loss: 0.34011427751593437
Epoch: 62, step: 524, loss: 0.3432603180408478, mean loss: 0.34011431245136714
Epoch: 62, step: 525, loss: 0.35169851779937744, mean loss: 0.34011444108757816
Epoch: 62, step: 526, loss: 0.34979525208473206, mean loss: 0.340114548586451
Epoch: 62, step: 527, loss: 0.32044142484664917, mean loss: 0.3401143301321144
Epoch: 62, step: 528, loss: 0.3810761868953705, mean loss: 0.34011478497578856
Epoch: 62, step: 529, loss: 0.34109389781951904, mean loss: 0.34011479584781373
Epoch: 62, step: 530, loss: 0.3590570092201233, mean loss: 0.34011500617896745
Epoch: 62, step: 531, loss: 0.3055335581302643, mean loss: 0.340114622196644
Epoch: 62, step: 532, loss: 0.314433753490448, mean loss: 0.3401143370469265
Epoch: 62, step: 533, loss: 0.35531702637672424, mean loss: 0.34011450584941066
Epoch: 62, step: 534, loss: 0.3502536118030548, mean loss: 0.3401146184273389
Epoch: 62, step: 535, loss: 0.3657013475894928, mean loss: 0.34011490252230653
Epoch: 62, step: 536, loss: 0.3169631063938141, mean loss: 0.34011464546577924
Epoch: 62, step: 537, loss: 0.35466381907463074, mean loss: 0.34011480700480184
Epoch: 62, step: 538, loss: 0.34330499172210693, mean loss: 0.3401148424249304
Epoch: 62, step: 539, loss: 0.31725773215293884, mean loss: 0.34011458864878047
Epoch: 62, step: 540, loss: 0.3461672067642212, mean loss: 0.34011465584857303
Epoch: 62, step: 541, loss: 0.34273073077201843, mean loss: 0.3401146848934817
Epoch: 62, step: 542, loss: 0.32753172516822815, mean loss: 0.3401145451930262
Epoch: 62, step: 543, loss: 0.2955232858657837, mean loss: 0.3401140501306391
Epoch: 62, step: 544, loss: 0.30781444907188416, mean loss: 0.34011369153704213
Epoch: 62, step: 545, loss: 0.3469759225845337, mean loss: 0.3401137677214133
Epoch: 62, step: 546, loss: 0.3325357139110565, mean loss: 0.34011368359092414
Epoch: 62, step: 547, loss: 0.3106353282928467, mean loss: 0.34011335632999673
Epoch: 62, step: 548, loss: 0.30833661556243896, mean loss: 0.34011300355691626
Epoch: 62, step: 549, loss: 0.45185762643814087, mean loss: 0.3401142440887096
Epoch: 62, step: 550, loss: 0.338737815618515, mean loss: 0.3401142288084726
Epoch: 62, step: 551, loss: 0.3213159739971161, mean loss: 0.34011402012447156
Epoch: 62, step: 552, loss: 0.30234771966934204, mean loss: 0.3401136008762344
Epoch: 62, step: 553, loss: 0.31503868103027344, mean loss: 0.34011332251962767
Epoch: 62, step: 554, loss: 0.3571071922779083, mean loss: 0.3401135111664285
Epoch: 62, step: 555, loss: 0.3275253474712372, mean loss: 0.34011337142836523
Epoch: 62, step: 556, loss: 0.3385953903198242, mean loss: 0.3401133545778229
Epoch: 62, step: 557, loss: 0.33491531014442444, mean loss: 0.34011329687691005
Epoch: 62, step: 558, loss: 0.40005043148994446, mean loss: 0.3401139622019249
Epoch: 62, step: 559, loss: 0.3055732250213623, mean loss: 0.3401135787908471
Epoch: 62, step: 560, loss: 0.3075711727142334, mean loss: 0.3401132175657688
Epoch: 62, step: 561, loss: 0.31283798813819885, mean loss: 0.3401129148104194
Epoch: 62, step: 562, loss: 0.31593671441078186, mean loss: 0.3401126464573053
Epoch: 62, step: 563, loss: 0.3008921146392822, mean loss: 0.3401122111186313
Epoch: 62, step: 564, loss: 0.3217300772666931, mean loss: 0.3401120070835359
Epoch: 62, step: 565, loss: 0.33249232172966003, mean loss: 0.34011192250869904
Epoch: 62, step: 566, loss: 0.39619579911231995, mean loss: 0.34011254500580324
Epoch: 62, step: 567, loss: 0.3151944875717163, mean loss: 0.34011226843350884
Epoch: 62, step: 568, loss: 0.31348419189453125, mean loss: 0.3401119728845279
Epoch: 62, step: 569, loss: 0.3450589179992676, mean loss: 0.3401120277907979
Epoch: 62, step: 570, loss: 0.3442007899284363, mean loss: 0.3401120731715695
Epoch: 62, step: 571, loss: 0.3201413154602051, mean loss: 0.3401118515205405
Epoch: 62, step: 572, loss: 0.3129839599132538, mean loss: 0.3401115504374048
Epoch: 62, step: 573, loss: 0.29319536685943604, mean loss: 0.34011102973660373
Epoch: 62, step: 574, loss: 0.3087252378463745, mean loss: 0.3401106814042298
Epoch: 62, step: 575, loss: 0.3191908299922943, mean loss: 0.34011044922972683
Epoch: 62, step: 576, loss: 0.3143979012966156, mean loss: 0.3401101638676722
Epoch: 62, step: 577, loss: 0.32972288131713867, mean loss: 0.340110048589194
Epoch: 62, step: 578, loss: 0.3270348310470581, mean loss: 0.34010990348151604
Epoch: 62, step: 579, loss: 0.33910736441612244, mean loss: 0.3401098923555443
Epoch: 62, step: 580, loss: 0.32146215438842773, mean loss: 0.3401096854090909
Epoch: 62, step: 581, loss: 0.2859024703502655, mean loss: 0.3401090838419501
Epoch: 62, step: 582, loss: 0.3120723366737366, mean loss: 0.3401087727062711
Epoch: 62, step: 583, loss: 0.3147747814655304, mean loss: 0.3401084915673413
Epoch: 62, step: 584, loss: 0.3772833049297333, mean loss: 0.3401089041028618
Epoch: 62, step: 585, loss: 0.30944710969924927, mean loss: 0.3401085638472478
Epoch: 62, step: 586, loss: 0.35980024933815, mean loss: 0.34010878236453673
Epoch: 62, step: 587, loss: 0.3320819139480591, mean loss: 0.3401086932919146
Epoch: 62, step: 588, loss: 0.3563791811466217, mean loss: 0.34010887384039995
Epoch: 62, step: 589, loss: 0.3171982169151306, mean loss: 0.3401086196108684
Epoch: 62, step: 590, loss: 0.3248913586139679, mean loss: 0.3401084507534577
Epoch: 62, step: 591, loss: 0.3128816783428192, mean loss: 0.3401081486365867
Epoch: 62, step: 592, loss: 0.3245573937892914, mean loss: 0.3401079760824113
Epoch: 62, step: 593, loss: 0.31107673048973083, mean loss: 0.3401076539496846
Epoch: 62, step: 594, loss: 0.31219014525413513, mean loss: 0.34010734417849753
Epoch: 62, step: 595, loss: 0.3464672863483429, mean loss: 0.3401074147472935
Epoch: 62, step: 596, loss: 0.3371661901473999, mean loss: 0.3401073821123465
Epoch: 62, step: 597, loss: 0.31097230315208435, mean loss: 0.3401070588418256
Epoch: 62, step: 598, loss: 0.3129926025867462, mean loss: 0.3401067579946183
Epoch: 62, step: 599, loss: 0.3279343247413635, mean loss: 0.34010662293744126
Epoch: 62, step: 600, loss: 0.29820457100868225, mean loss: 0.34010615802546035
Epoch: 62, step: 601, loss: 0.3431088328361511, mean loss: 0.3401061913403922
Epoch: 62, step: 602, loss: 0.36065924167633057, mean loss: 0.34010641937570013
Epoch: 62, step: 603, loss: 0.31741490960121155, mean loss: 0.34010616761705975
Epoch: 62, step: 604, loss: 0.3692251145839691, mean loss: 0.3401064906834945
Epoch: 62, step: 605, loss: 0.34922483563423157, mean loss: 0.340106591847816
Epoch: 62, step: 606, loss: 0.34117045998573303, mean loss: 0.34010660365086853
Epoch: 62, step: 607, loss: 0.3438188135623932, mean loss: 0.3401066448354109
Epoch: 62, step: 608, loss: 0.30933594703674316, mean loss: 0.34010630345842036
Epoch: 62, step: 609, loss: 0.3266112804412842, mean loss: 0.3401061537432834
Epoch: 62, step: 610, loss: 0.32734769582748413, mean loss: 0.3401060122012437
Epoch: 62, step: 611, loss: 0.3138597905635834, mean loss: 0.34010572102949266
Epoch: 62, step: 612, loss: 0.3204907178878784, mean loss: 0.34010550342592555
Epoch: 62, step: 613, loss: 0.337176114320755, mean loss: 0.3401054709284315
Epoch: 62, step: 614, loss: 0.350359708070755, mean loss: 0.34010558468365537
Epoch: 62, step: 615, loss: 0.3317747116088867, mean loss: 0.3401054922662668
Epoch: 62, step: 616, loss: 0.3633160889148712, mean loss: 0.3401057497469551
Epoch: 62, step: 617, loss: 0.3357032537460327, mean loss: 0.340105700909558
Epoch: 62, step: 618, loss: 0.33696553111076355, mean loss: 0.34010566607567777
Epoch: 62, step: 619, loss: 0.3570757806301117, mean loss: 0.340105854322944
Epoch: 62, step: 620, loss: 0.3575664162635803, mean loss: 0.3401060480085305
Epoch: 62, step: 621, loss: 0.2847641706466675, mean loss: 0.3401054341219264
Epoch: 62, step: 622, loss: 0.2992388904094696, mean loss: 0.3401049808097755
Epoch: 62, step: 623, loss: 0.3539292812347412, mean loss: 0.340105134154132
Epoch: 62, step: 624, loss: 0.31243035197257996, mean loss: 0.34010482717841095
Epoch: 62, step: 625, loss: 0.35546308755874634, mean loss: 0.3401049975342507
Epoch: 62, step: 626, loss: 0.3149152398109436, mean loss: 0.3401047181292513
Epoch: 62, step: 627, loss: 0.32753312587738037, mean loss: 0.34010457868659355
Epoch: 62, step: 628, loss: 0.3310069441795349, mean loss: 0.3401044777777955
Epoch: 62, step: 629, loss: 0.3747113049030304, mean loss: 0.34010486162423315
Epoch: 62, step: 630, loss: 0.3065820634365082, mean loss: 0.34010448980557734
Epoch: 62, step: 631, loss: 0.3605251610279083, mean loss: 0.3401047162992688
Epoch: 62, step: 632, loss: 0.38877201080322266, mean loss: 0.3401052560813753
Epoch: 62, step: 633, loss: 0.2979482412338257, mean loss: 0.3401047885117246
Epoch: 62, step: 634, loss: 0.3491474688053131, mean loss: 0.34010488880430906
Epoch: 62, step: 635, loss: 0.3021790683269501, mean loss: 0.34010446817278783
Epoch: 62, step: 636, loss: 0.35341551899909973, mean loss: 0.34010461580269774
Epoch: 62, step: 637, loss: 0.3120270371437073, mean loss: 0.3401043044039592
Epoch: 62, step: 638, loss: 0.31620460748672485, mean loss: 0.34010403934360545
Epoch: 62, step: 639, loss: 0.27061063051223755, mean loss: 0.3401032686332777
Epoch: 62, step: 640, loss: 0.32144883275032043, mean loss: 0.3401030617502483
Epoch: 62, step: 641, loss: 0.303763747215271, mean loss: 0.3401026587413259
Epoch: 62, step: 642, loss: 0.28816381096839905, mean loss: 0.3401020827374247
Epoch: 62, step: 643, loss: 0.42458635568618774, mean loss: 0.34010301966100354
Epoch: 62, step: 644, loss: 0.30863019824028015, mean loss: 0.34010267063389543
Epoch: 62, step: 645, loss: 0.4138987362384796, mean loss: 0.34010348900799003
Epoch: 62, step: 646, loss: 0.3261886537075043, mean loss: 0.34010333469875464
Epoch: 62, step: 647, loss: 0.3238723874092102, mean loss: 0.34010315470687996
Epoch: 62, step: 648, loss: 0.3247964680194855, mean loss: 0.34010298496640634
Epoch: 62, step: 649, loss: 0.330644816160202, mean loss: 0.34010288008307776
Epoch: 62, step: 650, loss: 0.37052375078201294, mean loss: 0.3401032174218229
Epoch: 62, step: 651, loss: 0.3391270041465759, mean loss: 0.3401032065966591
Epoch: 62, step: 652, loss: 0.3296636641025543, mean loss: 0.340103090834553
Epoch: 62, step: 653, loss: 0.30317026376724243, mean loss: 0.34010268129798177
Epoch: 62, step: 654, loss: 0.3525523245334625, mean loss: 0.3401028193466521
Epoch: 62, step: 655, loss: 0.3402535617351532, mean loss: 0.34010282101815026
Epoch: 62, step: 656, loss: 0.3291985094547272, mean loss: 0.3401027001076711
Epoch: 62, step: 657, loss: 0.382512629032135, mean loss: 0.3401031703572544
Epoch: 62, step: 658, loss: 0.3280111849308014, mean loss: 0.3401030362804426
Epoch: 62, step: 659, loss: 0.335996150970459, mean loss: 0.3401029907435052
Epoch: 62, step: 660, loss: 0.3396415114402771, mean loss: 0.34010298562670266
Epoch: 62, step: 661, loss: 0.31200382113456726, mean loss: 0.34010267407149153
Epoch: 62, step: 662, loss: 0.3159436583518982, mean loss: 0.34010240620645266
Epoch: 62, step: 663, loss: 0.333576500415802, mean loss: 0.3401023338507472
Epoch: 62, step: 664, loss: 0.32244330644607544, mean loss: 0.34010213805919565
Epoch: 62, step: 665, loss: 0.37938299775123596, mean loss: 0.340102573574415
Epoch: 62, step: 666, loss: 0.3644411563873291, mean loss: 0.3401028434184508
Epoch: 62, step: 667, loss: 0.36806344985961914, mean loss: 0.3401031534167483
Epoch: 62, step: 668, loss: 0.34685271978378296, mean loss: 0.34010322824813255
Epoch: 62, step: 669, loss: 0.3215593695640564, mean loss: 0.34010302265755754
Epoch: 62, step: 670, loss: 0.40232473611831665, mean loss: 0.340103712484645
Epoch: 62, step: 671, loss: 0.3181009888648987, mean loss: 0.3401034685520106
Epoch: 62, step: 672, loss: 0.30141881108283997, mean loss: 0.3401030396802967
Epoch: 62, step: 673, loss: 0.3390531539916992, mean loss: 0.3401030280410239
Epoch: 62, step: 674, loss: 0.32715025544166565, mean loss: 0.34010288444521664
Epoch: 62, step: 675, loss: 0.31772658228874207, mean loss: 0.34010263638191396
Epoch: 62, step: 676, loss: 0.328298419713974, mean loss: 0.34010250552202076
Epoch: 62, step: 677, loss: 0.3227176070213318, mean loss: 0.3401023127976066
Epoch: 62, step: 678, loss: 0.3563421070575714, mean loss: 0.34010249282570043
Epoch: 62, step: 679, loss: 0.3828446567058563, mean loss: 0.34010296664358663
Epoch: 62, step: 680, loss: 0.30408263206481934, mean loss: 0.3401025673449071
Epoch: 62, step: 681, loss: 0.3149307668209076, mean loss: 0.34010228830931766
Epoch: 62, step: 682, loss: 0.3156840205192566, mean loss: 0.3401020176298241
Epoch: 62, step: 683, loss: 0.355674684047699, mean loss: 0.3401021902528279
Epoch: 62, step: 684, loss: 0.31683412194252014, mean loss: 0.3401019323291549
Epoch: 62, step: 685, loss: 0.32278597354888916, mean loss: 0.34010174038601104
Epoch: 62, step: 686, loss: 0.3545466661453247, mean loss: 0.3401019005026852
Epoch: 62, step: 687, loss: 0.3557092845439911, mean loss: 0.340102073502863
Epoch: 62, step: 688, loss: 0.27082863450050354, mean loss: 0.34010130564936525
Epoch: 62, step: 689, loss: 0.34529316425323486, mean loss: 0.34010136319728923
Epoch: 62, step: 690, loss: 0.32731539011001587, mean loss: 0.34010122147577726
Epoch: 62, step: 691, loss: 0.36195728182792664, mean loss: 0.3401014637287184
Epoch: 62, step: 692, loss: 0.34867537021636963, mean loss: 0.340101558760989
Epoch: 62, step: 693, loss: 0.3286500573158264, mean loss: 0.3401014318351678
Epoch: 62, step: 694, loss: 0.34954169392585754, mean loss: 0.3401015364677126
Epoch: 62, step: 695, loss: 0.36481979489326477, mean loss: 0.34010181043315885
Epoch: 62, step: 696, loss: 0.3494253158569336, mean loss: 0.34010191376932314
Epoch: 62, step: 697, loss: 0.349397212266922, mean loss: 0.34010201679171687
Epoch: 62, step: 698, loss: 0.39178192615509033, mean loss: 0.3401025895682623
Epoch: 62, step: 699, loss: 0.3261834383010864, mean loss: 0.34010243530183426
Epoch: 62, step: 700, loss: 0.31594446301460266, mean loss: 0.3401021675611712
Epoch: 62, step: 701, loss: 0.31995418667793274, mean loss: 0.3401019442653618
Epoch: 62, step: 702, loss: 0.3169613182544708, mean loss: 0.34010168780554184
Epoch: 62, step: 703, loss: 0.33123093843460083, mean loss: 0.34010158949508246
Epoch: 62, step: 704, loss: 0.3339883089065552, mean loss: 0.34010152174513963
Epoch: 62, step: 705, loss: 0.30866676568984985, mean loss: 0.34010117337583257
Epoch: 62, step: 706, loss: 0.36393842101097107, mean loss: 0.3401014375443662
Epoch: 62, step: 707, loss: 0.3140832185745239, mean loss: 0.34010114920912343
Epoch: 62, step: 708, loss: 0.3458486497402191, mean loss: 0.3401012129025145
Epoch: 62, step: 709, loss: 0.3588114380836487, mean loss: 0.34010142024559814
Epoch: 62, step: 710, loss: 0.31869596242904663, mean loss: 0.3401011830370983
Epoch: 62, step: 711, loss: 0.3542833626270294, mean loss: 0.3401013401977764
Epoch: 62, step: 712, loss: 0.33296215534210205, mean loss: 0.3401012610853457
Epoch: 62, step: 713, loss: 0.3009311556816101, mean loss: 0.3401008270290814
Epoch: 62, step: 714, loss: 0.3284710943698883, mean loss: 0.34010069815778216
Epoch: 62, step: 715, loss: 0.3476412296295166, mean loss: 0.34010078171493247
Epoch: 62, step: 716, loss: 0.31079360842704773, mean loss: 0.34010045696371866
Epoch: 62, step: 717, loss: 0.3753602206707001, mean loss: 0.3401008476709379
Epoch: 62, step: 718, loss: 0.3247886002063751, mean loss: 0.34010067800050603
Epoch: 62, step: 719, loss: 0.36253684759140015, mean loss: 0.34010092660623237
Epoch: 62, step: 720, loss: 0.3764057755470276, mean loss: 0.34010132888048406
Epoch: 62, step: 721, loss: 0.3388257324695587, mean loss: 0.3401013147464518
Epoch: 62, step: 722, loss: 0.2977263033390045, mean loss: 0.340100845222442
Epoch: 62, step: 723, loss: 0.36770567297935486, mean loss: 0.3401011510863315
Epoch: 62, step: 724, loss: 0.34453651309013367, mean loss: 0.34010120022998325
Epoch: 62, step: 725, loss: 0.3575075566768646, mean loss: 0.3401013930896509
Epoch: 62, step: 726, loss: 0.36282113194465637, mean loss: 0.34010164481796357
Epoch: 62, step: 727, loss: 0.29109442234039307, mean loss: 0.34010110183774644
Epoch: 62, step: 728, loss: 0.345350980758667, mean loss: 0.3401011600036385
Epoch: 62, step: 729, loss: 0.3454703390598297, mean loss: 0.34010121949065414
Epoch: 62, step: 730, loss: 0.3227723240852356, mean loss: 0.34010102749987864
Epoch: 62, step: 731, loss: 0.32440513372421265, mean loss: 0.34010085360342646
Epoch: 62, step: 732, loss: 0.3575616478919983, mean loss: 0.3401010470512532
Epoch: 62, step: 733, loss: 0.3063158690929413, mean loss: 0.3401006727500195
Epoch: 62, step: 734, loss: 0.32408595085144043, mean loss: 0.34010049532713416
Epoch: 62, step: 735, loss: 0.36034464836120605, mean loss: 0.3401007196042882
Epoch: 62, step: 736, loss: 0.31158697605133057, mean loss: 0.34010040371503375
Epoch: 62, step: 737, loss: 0.3163830637931824, mean loss: 0.34010014096560515
Epoch: 62, step: 738, loss: 0.34751537442207336, mean loss: 0.34010022311338295
Epoch: 62, step: 739, loss: 0.3346605896949768, mean loss: 0.3401001628524553
Epoch: 62, step: 740, loss: 0.3191867470741272, mean loss: 0.34009993117363113
Epoch: 62, step: 741, loss: 0.37748533487319946, mean loss: 0.3401003453245528
Epoch: 62, step: 742, loss: 0.36104947328567505, mean loss: 0.3401005773938548
Epoch: 62, step: 743, loss: 0.3342421352863312, mean loss: 0.3401005124961888
Epoch: 62, step: 744, loss: 0.3742949962615967, mean loss: 0.3401008912859018
Epoch: 62, step: 745, loss: 0.3273119032382965, mean loss: 0.3401007496173367
Epoch: 62, step: 746, loss: 0.31024861335754395, mean loss: 0.34010041893734494
Epoch: 62, step: 747, loss: 0.3429667055606842, mean loss: 0.34010045068760664
Epoch: 62, step: 748, loss: 0.3527662754058838, mean loss: 0.3401005909871815
Epoch: 62, step: 749, loss: 0.3016344904899597, mean loss: 0.340100164902194
Epoch: 62, step: 750, loss: 0.3108516335487366, mean loss: 0.3400998409228483
Epoch: 62, step: 751, loss: 0.34065690636634827, mean loss: 0.34009984709326746
Epoch: 62, step: 752, loss: 0.3189218044281006, mean loss: 0.3400996125140906
Epoch: 62, step: 753, loss: 0.3119930326938629, mean loss: 0.34009930119422815
Epoch: 62, step: 754, loss: 0.33049026131629944, mean loss: 0.3400991947617893
Epoch: 62, step: 755, loss: 0.36618831753730774, mean loss: 0.3400994837290789
Epoch: 62, step: 756, loss: 0.3213970363140106, mean loss: 0.34009927658007943
Epoch: 62, step: 757, loss: 0.32712307572364807, mean loss: 0.3400991328567906
Epoch: 62, step: 758, loss: 0.3529037833213806, mean loss: 0.3400992746784312
Epoch: 62, step: 759, loss: 0.2876650393009186, mean loss: 0.34009869393419745
Epoch: 62, step: 760, loss: 0.34657981991767883, mean loss: 0.34009876571620834
Epoch: 62, step: 761, loss: 0.39695796370506287, mean loss: 0.3400993954559136
Epoch: 62, step: 762, loss: 0.3261898458003998, mean loss: 0.3400992414034648
Epoch: 62, step: 763, loss: 0.3246828019618988, mean loss: 0.3400990706636491
Epoch: 62, step: 764, loss: 0.33468249440193176, mean loss: 0.34009901067476556
Epoch: 62, step: 765, loss: 0.30269157886505127, mean loss: 0.3400985963899647
Epoch: 62, step: 766, loss: 0.30746954679489136, mean loss: 0.34009823502942876
Epoch: 62, step: 767, loss: 0.39037442207336426, mean loss: 0.3400987918224987
Epoch: 62, step: 768, loss: 0.31221646070480347, mean loss: 0.3400984830378091
Epoch: 62, step: 769, loss: 0.33992043137550354, mean loss: 0.3400984810659862
Epoch: 62, step: 770, loss: 0.3671267032623291, mean loss: 0.3400987803851614
Epoch: 62, step: 771, loss: 0.30465126037597656, mean loss: 0.34009838783233737
Epoch: 62, step: 772, loss: 0.3093198537826538, mean loss: 0.3400980469885588
Epoch: 62, step: 773, loss: 0.33643901348114014, mean loss: 0.3400980064685979
Epoch: 62, step: 774, loss: 0.32625341415405273, mean loss: 0.340097853155947
Epoch: 62, step: 775, loss: 0.3204001486301422, mean loss: 0.34009763502934653
Epoch: 62, step: 776, loss: 0.36605799198150635, mean loss: 0.34009792250353904
Epoch: 62, step: 777, loss: 0.3274761736392975, mean loss: 0.3400977827370909
Epoch: 62, step: 778, loss: 0.38488075137138367, mean loss: 0.3400982786340716
Epoch: 62, step: 779, loss: 0.3487982749938965, mean loss: 0.3400983749710114
Epoch: 62, step: 780, loss: 0.3312416970729828, mean loss: 0.34009827690018907
Epoch: 62, step: 781, loss: 0.37401947379112244, mean loss: 0.3400986525086144
Epoch: 62, step: 782, loss: 0.3617892563343048, mean loss: 0.3400988926853794
Epoch: 62, step: 783, loss: 0.32282325625419617, mean loss: 0.34009870139699655
Epoch: 62, step: 784, loss: 0.34247490763664246, mean loss: 0.34009872770778504
Epoch: 62, step: 785, loss: 0.39630189538002014, mean loss: 0.34009935001626074
Epoch: 62, step: 786, loss: 0.335910826921463, mean loss: 0.34009930363943414
Epoch: 62, step: 787, loss: 0.31360745429992676, mean loss: 0.3400990103154457
Epoch: 62, step: 788, loss: 0.3168819546699524, mean loss: 0.34009875325358974
Epoch: 62, step: 789, loss: 0.3113727867603302, mean loss: 0.3400984351999737
Epoch: 62, step: 790, loss: 0.31507784128189087, mean loss: 0.3400981581752732
Epoch: 62, step: 791, loss: 0.3590810000896454, mean loss: 0.3400983683484565
Epoch: 62, step: 792, loss: 0.4010927975177765, mean loss: 0.34009904365574023
Epoch: 62, step: 793, loss: 0.3247341811656952, mean loss: 0.3400988735436691
Epoch: 62, step: 794, loss: 0.35400253534317017, mean loss: 0.3400990274763529
Epoch: 62, step: 795, loss: 0.319067120552063, mean loss: 0.34009879462675674
Epoch: 62, step: 796, loss: 0.29497140645980835, mean loss: 0.3400982950154845
Epoch: 62, step: 797, loss: 0.29889917373657227, mean loss: 0.3400978388996233
Epoch: 62, step: 798, loss: 0.3101976811885834, mean loss: 0.34009750787835935
Epoch: 62, step: 799, loss: 0.365645170211792, mean loss: 0.3400977907105081
Epoch: 62, step: 800, loss: 0.3694863021373749, mean loss: 0.34009811606019014
Epoch: 62, step: 801, loss: 0.34355106949806213, mean loss: 0.3400981542861775
Epoch: 62, step: 802, loss: 0.32868143916130066, mean loss: 0.3400980278986126
Epoch: 62, step: 803, loss: 0.3170052170753479, mean loss: 0.34009777225486704
Epoch: 62, step: 804, loss: 0.3697248697280884, mean loss: 0.3400981002313261
Epoch: 62, step: 805, loss: 0.3164222836494446, mean loss: 0.34009783813934985
Epoch: 62, step: 806, loss: 0.34238341450691223, mean loss: 0.34009786344046644
Epoch: 62, step: 807, loss: 0.3467162251472473, mean loss: 0.34009793670430044
Epoch: 62, step: 808, loss: 0.3377074599266052, mean loss: 0.340097910242532
Epoch: 62, step: 809, loss: 0.3153124749660492, mean loss: 0.34009763587919345
Epoch: 62, step: 810, loss: 0.33460280299186707, mean loss: 0.34009757505460064
Epoch: 62, step: 811, loss: 0.32483425736427307, mean loss: 0.3400974061004531
Epoch: 62, step: 812, loss: 0.37044182419776917, mean loss: 0.3400977419880135
Epoch: 62, step: 813, loss: 0.3346383571624756, mean loss: 0.3400976815578169
Epoch: 62, step: 814, loss: 0.3498906195163727, mean loss: 0.34009778995512446
Epoch: 62, step: 815, loss: 0.3438297212123871, mean loss: 0.3400978312631389
Epoch: 62, step: 816, loss: 0.36008408665657043, mean loss: 0.3400980524846276
Epoch: 62, step: 817, loss: 0.3236311674118042, mean loss: 0.34009787021994436
Epoch: 62, step: 818, loss: 0.3103782832622528, mean loss: 0.340097541270594
Epoch: 62, step: 819, loss: 0.33781251311302185, mean loss: 0.3400975159791857
Epoch: 62, step: 820, loss: 0.3464665114879608, mean loss: 0.34009758647244526
Epoch: 62, step: 821, loss: 0.36561280488967896, mean loss: 0.3400978688766336
Epoch: 62, step: 822, loss: 0.3399738371372223, mean loss: 0.340097867503857
Epoch: 62, step: 823, loss: 0.3549279570579529, mean loss: 0.34009803164067254
Epoch: 62, step: 824, loss: 0.32891908288002014, mean loss: 0.3400979079154087
Epoch: 62, step: 825, loss: 0.3263375759124756, mean loss: 0.34009775562185224
Epoch: 62, step: 826, loss: 0.30834969878196716, mean loss: 0.3400974042516255
Epoch: 62, step: 827, loss: 0.3447103500366211, mean loss: 0.34009745530463564
Epoch: 62, step: 828, loss: 0.31465670466423035, mean loss: 0.3400971737464759
Epoch: 62, step: 829, loss: 0.34537890553474426, mean loss: 0.34009723219987004
Epoch: 62, step: 830, loss: 0.3150365352630615, mean loss: 0.3400969548539838
Epoch: 62, step: 831, loss: 0.33986106514930725, mean loss: 0.3400969522434293
Epoch: 62, step: 832, loss: 0.32972994446754456, mean loss: 0.3400968375146439
Epoch: 62, step: 833, loss: 0.33088192343711853, mean loss: 0.3400967355368869
Epoch: 62, step: 834, loss: 0.3401328921318054, mean loss: 0.340096735937013
Epoch: 62, step: 835, loss: 0.3106597363948822, mean loss: 0.34009641017675957
Epoch: 62, step: 836, loss: 0.33458513021469116, mean loss: 0.34009634918766024
Epoch: 62, step: 837, loss: 0.33681240677833557, mean loss: 0.3400963128471958
Epoch: 62, step: 838, loss: 0.3149709701538086, mean loss: 0.34009603481049333
Epoch: 62, step: 839, loss: 0.3188423216342926, mean loss: 0.34009579961979336
Epoch: 62, step: 840, loss: 0.2888334095478058, mean loss: 0.34009523236343253
Epoch: 62, step: 841, loss: 0.3412715196609497, mean loss: 0.34009524537977975
Epoch: 62, step: 842, loss: 0.328652560710907, mean loss: 0.3400951187607906
Epoch: 62, step: 843, loss: 0.331983745098114, mean loss: 0.3400950290054055
Epoch: 62, step: 844, loss: 0.33199915289878845, mean loss: 0.3400949394224979
Epoch: 62, step: 845, loss: 0.3057672381401062, mean loss: 0.3400945595820429
Epoch: 62, step: 846, loss: 0.3397890627384186, mean loss: 0.3400945562017182
Epoch: 62, step: 847, loss: 0.35816606879234314, mean loss: 0.34009475616091744
Epoch: 62, step: 848, loss: 0.3146979510784149, mean loss: 0.3400944751513123
Epoch: 62, step: 849, loss: 0.3592242896556854, mean loss: 0.3400946868158159
Epoch: 62, step: 850, loss: 0.3447190821170807, mean loss: 0.34009473798251727
Epoch: 62, step: 851, loss: 0.35148540139198303, mean loss: 0.340094864013314
Epoch: 62, step: 852, loss: 0.3090406358242035, mean loss: 0.34009452042087546
Epoch: 62, step: 853, loss: 0.3475300371646881, mean loss: 0.3400946026885476
Epoch: 62, step: 854, loss: 0.35904642939567566, mean loss: 0.34009481237207995
Epoch: 62, step: 855, loss: 0.3435080051422119, mean loss: 0.3400948501353209
Epoch: 62, step: 856, loss: 0.3247531056404114, mean loss: 0.3400946803975935
Epoch: 62, step: 857, loss: 0.3611072599887848, mean loss: 0.34009491287363613
Epoch: 62, step: 858, loss: 0.28297877311706543, mean loss: 0.34009428096705935
Epoch: 62, step: 859, loss: 0.3182329535484314, mean loss: 0.3400940391061108
Epoch: 62, step: 860, loss: 0.33944588899612427, mean loss: 0.34009403193543614
Epoch: 62, step: 861, loss: 0.308170884847641, mean loss: 0.3400936787642105
Epoch: 62, step: 862, loss: 0.363749623298645, mean loss: 0.3400939404710677
Epoch: 62, step: 863, loss: 0.35935893654823303, mean loss: 0.3400941535982922
Epoch: 62, step: 864, loss: 0.3272910714149475, mean loss: 0.34009401196030936
Epoch: 62, step: 865, loss: 0.3088493049144745, mean loss: 0.34009366631007765
Epoch: 62, step: 866, loss: 0.38184893131256104, mean loss: 0.34009412823015067
Epoch: 62, step: 867, loss: 0.32114937901496887, mean loss: 0.34009391865506755
Epoch: 62, step: 868, loss: 0.31510844826698303, mean loss: 0.3400936422579483
Epoch: 62, step: 869, loss: 0.37930119037628174, mean loss: 0.34009407597935937
Epoch: 62, step: 870, loss: 0.34432002902030945, mean loss: 0.3400941227271446
Epoch: 62, step: 871, loss: 0.299134761095047, mean loss: 0.3400936696368611
Epoch: 62, step: 872, loss: 0.3354899287223816, mean loss: 0.3400936187110869
Epoch: 62, step: 873, loss: 0.30390021204948425, mean loss: 0.34009321835040174
Epoch: 62, step: 874, loss: 0.37343481183052063, mean loss: 0.34009358716109916
Epoch: 62, step: 875, loss: 0.3372879922389984, mean loss: 0.34009355612713027
Epoch: 62, step: 876, loss: 0.30424395203590393, mean loss: 0.3400931595826461
Epoch: 62, step: 877, loss: 0.37788814306259155, mean loss: 0.3400935776409993
Epoch: 62, step: 878, loss: 0.33817431330680847, mean loss: 0.34009355641184297
Epoch: 62, step: 879, loss: 0.34250104427337646, mean loss: 0.3400935830409893
Epoch: 62, step: 880, loss: 0.32513099908828735, mean loss: 0.3400934175421567
Epoch: 62, step: 881, loss: 0.31098473072052, mean loss: 0.34009309557902406
Epoch: 62, step: 882, loss: 0.3248632848262787, mean loss: 0.3400929271281635
Epoch: 62, step: 883, loss: 0.34669408202171326, mean loss: 0.3400930001400966
Epoch: 62, step: 884, loss: 0.3202837109565735, mean loss: 0.3400927810422989
Epoch: 62, step: 885, loss: 0.3850959539413452, mean loss: 0.34009327878792345
Epoch: 62, step: 886, loss: 0.33206427097320557, mean loss: 0.34009318998620014
Epoch: 62, step: 887, loss: 0.3647984564304352, mean loss: 0.3400934632261847
Epoch: 62, step: 888, loss: 0.3169604241847992, mean loss: 0.3400932073778482
Epoch: 62, step: 889, loss: 0.31714123487472534, mean loss: 0.340092953534891
Epoch: 62, step: 890, loss: 0.3389124274253845, mean loss: 0.34009294047871796
Epoch: 62, step: 891, loss: 0.3374362289905548, mean loss: 0.34009291109681694
Epoch: 62, step: 892, loss: 0.3213790953159332, mean loss: 0.34009270413365816
Epoch: 62, step: 893, loss: 0.39101022481918335, mean loss: 0.3400932672435284
Epoch: 62, step: 894, loss: 0.3300313353538513, mean loss: 0.3400931559672835
Epoch: 62, step: 895, loss: 0.3415099084377289, mean loss: 0.3400931716351645
Epoch: 62, step: 896, loss: 0.30578380823135376, mean loss: 0.3400927922117373
Epoch: 62, step: 897, loss: 0.35209986567497253, mean loss: 0.34009292499515653
Epoch: 62, step: 898, loss: 0.33137696981430054, mean loss: 0.34009282860851114
Epoch: 62, step: 899, loss: 0.36354774236679077, mean loss: 0.34009308798518384
Epoch: 62, step: 900, loss: 0.35320061445236206, mean loss: 0.34009323293344673
Epoch: 62, step: 901, loss: 0.31941795349121094, mean loss: 0.3400930043004771
Epoch: 62, step: 902, loss: 0.37460729479789734, mean loss: 0.3400933859648455
Epoch: 62, step: 903, loss: 0.3063027262687683, mean loss: 0.3400930123066305
Epoch: 62, step: 904, loss: 0.35965588688850403, mean loss: 0.3400932286311424
Epoch: 62, step: 905, loss: 0.32888612151145935, mean loss: 0.3400931047053278
Epoch: 62, step: 906, loss: 0.3579593002796173, mean loss: 0.34009330226374623
Epoch: 62, step: 907, loss: 0.29194507002830505, mean loss: 0.34009276986257597
Epoch: 62, step: 908, loss: 0.35465100407600403, mean loss: 0.3400929308391034
Epoch: 62, step: 909, loss: 0.3096897602081299, mean loss: 0.3400925946621575
Epoch: 62, step: 910, loss: 0.3410755395889282, mean loss: 0.3400926055307532
Epoch: 62, step: 911, loss: 0.3249581456184387, mean loss: 0.3400924381882066
Epoch: 62, step: 912, loss: 0.3478908836841583, mean loss: 0.3400925244150893
Epoch: 62, step: 913, loss: 0.359091579914093, mean loss: 0.34009273448403404
Epoch: 62, step: 914, loss: 0.3383543789386749, mean loss: 0.34009271526357976
Epoch: 62, step: 915, loss: 0.3669070303440094, mean loss: 0.3400930117378078
Epoch: 62, step: 916, loss: 0.35065987706184387, mean loss: 0.3400931285697535
Epoch: 62, step: 917, loss: 0.30565986037254333, mean loss: 0.34009274786449073
Epoch: 62, step: 918, loss: 0.34721365571022034, mean loss: 0.3400928265946625
Epoch: 62, step: 919, loss: 0.31279638409614563, mean loss: 0.34009252480310825
Epoch: 62, step: 920, loss: 0.34065353870391846, mean loss: 0.34009253100565223
Epoch: 62, step: 921, loss: 0.2994626462459564, mean loss: 0.3400920818084741
Epoch: 62, step: 922, loss: 0.3135205805301666, mean loss: 0.3400917880416691
Epoch: 62, step: 923, loss: 0.31918570399284363, mean loss: 0.34009155691262777
Epoch: 62, step: 924, loss: 0.32320353388786316, mean loss: 0.34009137020767577
Epoch: 62, step: 925, loss: 0.3785187602043152, mean loss: 0.3400917950356546
Epoch: 62, step: 926, loss: 0.2999030351638794, mean loss: 0.34009135074003943
Epoch: 62, step: 927, loss: 0.31713464856147766, mean loss: 0.3400910969514331
Epoch: 62, step: 928, loss: 0.3051656186580658, mean loss: 0.3400907108510949
Epoch: 62, step: 929, loss: 0.3498172163963318, mean loss: 0.3400908183761954
Epoch: 62, step: 930, loss: 0.32190555334091187, mean loss: 0.34009061734296453
Epoch: 62, step: 931, loss: 0.37023788690567017, mean loss: 0.34009095060926525
Epoch: 62, step: 932, loss: 0.3451167643070221, mean loss: 0.3400910061670603
Epoch: 62, step: 933, loss: 0.3278346359729767, mean loss: 0.34009087068066607
Epoch: 62, step: 934, loss: 0.331484317779541, mean loss: 0.34009077554173744
Epoch: 62, step: 935, loss: 0.3588296175003052, mean loss: 0.3400909826831634
Epoch: 62, step: 936, loss: 0.315510630607605, mean loss: 0.34009071097198146
Epoch: 62, step: 937, loss: 0.3194674253463745, mean loss: 0.34009048300472716
Epoch: 62, step: 938, loss: 0.3320484161376953, mean loss: 0.3400903941096951
Epoch: 62, step: 939, loss: 0.34346213936805725, mean loss: 0.34009043137972716
Epoch: 62, step: 940, loss: 0.32822391390800476, mean loss: 0.34009030021305714
Epoch: 62, step: 941, loss: 0.3310835659503937, mean loss: 0.34009020065812995
Epoch: 62, step: 942, loss: 0.3246411979198456, mean loss: 0.3400900298961981
Epoch: 62, step: 943, loss: 0.2994249165058136, mean loss: 0.3400895804188638
Epoch: 62, step: 944, loss: 0.3203442692756653, mean loss: 0.34008936217351826
Epoch: 62, step: 945, loss: 0.31956154108047485, mean loss: 0.3400891352815814
Epoch: 62, step: 946, loss: 0.31606942415237427, mean loss: 0.3400888697970704
Epoch: 62, step: 947, loss: 0.35764437913894653, mean loss: 0.34008906383205584
Epoch: 62, step: 948, loss: 0.33474215865135193, mean loss: 0.34008900473521153
Epoch: 62, step: 949, loss: 0.31455084681510925, mean loss: 0.340088722477006
Epoch: 62, step: 950, loss: 0.35268837213516235, mean loss: 0.34008886173196745
Epoch: 62, step: 951, loss: 0.33022555708885193, mean loss: 0.340088752721085
Epoch: 62, step: 952, loss: 0.331148236989975, mean loss: 0.3400886539101111
Epoch: 62, step: 953, loss: 0.3145609200000763, mean loss: 0.3400883717795889
Epoch: 62, step: 954, loss: 0.31946101784706116, mean loss: 0.34008814381020314
Epoch: 62, step: 955, loss: 0.3572331964969635, mean loss: 0.3400883332917986
Epoch: 62, step: 956, loss: 0.3399903178215027, mean loss: 0.3400883322085752
Epoch: 62, step: 957, loss: 0.3420838415622711, mean loss: 0.3400883542618139
Epoch: 62, step: 958, loss: 0.32063907384872437, mean loss: 0.3400881393217627
Epoch: 62, step: 959, loss: 0.32309678196907043, mean loss: 0.3400879515470594
Epoch: 62, step: 960, loss: 0.33565571904182434, mean loss: 0.3400879025661611
Epoch: 62, step: 961, loss: 0.36164724826812744, mean loss: 0.3400881408173016
Epoch: 62, step: 962, loss: 0.34273049235343933, mean loss: 0.34008817001746
Epoch: 62, step: 963, loss: 0.2806900441646576, mean loss: 0.34008751362655415
Epoch: 62, step: 964, loss: 0.3245302438735962, mean loss: 0.34008734170972355
Epoch: 62, step: 965, loss: 0.35177475214004517, mean loss: 0.34008747086094276
Epoch: 62, step: 966, loss: 0.30624279379844666, mean loss: 0.3400870968659479
Epoch: 62, step: 967, loss: 0.31830450892448425, mean loss: 0.3400868561637297
Epoch: 62, step: 968, loss: 0.33820345997810364, mean loss: 0.3400868353520322
Epoch: 62, step: 969, loss: 0.3489433228969574, mean loss: 0.3400869332159358
Epoch: 62, step: 970, loss: 0.29789650440216064, mean loss: 0.3400864670182009
Epoch: 62, step: 971, loss: 0.3783494234085083, mean loss: 0.3400868898132991
Epoch: 62, step: 972, loss: 0.27168235182762146, mean loss: 0.3400861339704025
Epoch: 62, step: 973, loss: 0.3082595467567444, mean loss: 0.3400857823031773
Epoch: 62, step: 974, loss: 0.3143763840198517, mean loss: 0.3400854982308451
Epoch: 62, step: 975, loss: 0.34089264273643494, mean loss: 0.34008550714917474
Epoch: 62, step: 976, loss: 0.3407481908798218, mean loss: 0.34008551447124236
Epoch: 62, step: 977, loss: 0.32353636622428894, mean loss: 0.34008533161984855
Epoch: 62, step: 978, loss: 0.3708491921424866, mean loss: 0.34008567152571795
Epoch: 62, step: 979, loss: 0.32165849208831787, mean loss: 0.3400854679284731
Epoch: 62, step: 980, loss: 0.34172526001930237, mean loss: 0.340085486045921
Epoch: 62, step: 981, loss: 0.3458535671234131, mean loss: 0.34008554977458166
Epoch: 62, step: 982, loss: 0.33679044246673584, mean loss: 0.34008551336898113
Epoch: 62, step: 983, loss: 0.34815171360969543, mean loss: 0.34008560248644887
Epoch: 62, step: 984, loss: 0.32879042625427246, mean loss: 0.34008547769579744
Epoch: 62, step: 985, loss: 0.30440014600753784, mean loss: 0.3400850834437294
Epoch: 62, step: 986, loss: 0.3575598895549774, mean loss: 0.3400852765035108
Epoch: 62, step: 987, loss: 0.34559789299964905, mean loss: 0.340085337405633
Epoch: 62, step: 988, loss: 0.3375965654850006, mean loss: 0.34008530991055563
Epoch: 62, step: 989, loss: 0.33360058069229126, mean loss: 0.34008523827033804
Epoch: 62, step: 990, loss: 0.3404806852340698, mean loss: 0.3400852426390006
Epoch: 62, step: 991, loss: 0.35455864667892456, mean loss: 0.34008540253078184
Epoch: 62, step: 992, loss: 0.3594101667404175, mean loss: 0.34008561601455034
Epoch: 62, step: 993, loss: 0.3396267592906952, mean loss: 0.3400856109455425
Epoch: 62, step: 994, loss: 0.32385197281837463, mean loss: 0.34008543161390165
Epoch: 62, step: 995, loss: 0.3139762282371521, mean loss: 0.34008514319090466
Epoch: 62, step: 996, loss: 0.32663822174072266, mean loss: 0.34008499464717146
Epoch: 62, step: 997, loss: 0.30345726013183594, mean loss: 0.3400845900370648
Epoch: 62, step: 998, loss: 0.2925991714000702, mean loss: 0.3400840654928003
Epoch: 62, step: 999, loss: 0.3437536358833313, mean loss: 0.34008410602799816
Epoch: 62, step: 1000, loss: 0.39373114705085754, mean loss: 0.3400846986230895
Epoch: 62, step: 1001, loss: 0.3616354465484619, mean loss: 0.3400849366739889
Epoch: 62, step: 1002, loss: 0.292822927236557, mean loss: 0.34008441462066535
Epoch: 62, step: 1003, loss: 0.35261082649230957, mean loss: 0.34008455298513174
Epoch: 62, step: 1004, loss: 0.32443568110466003, mean loss: 0.3400843801324495
Epoch: 62, step: 1005, loss: 0.30276191234588623, mean loss: 0.3400839678843683
Epoch: 62, step: 1006, loss: 0.3671846389770508, mean loss: 0.34008426722353097
Epoch: 62, step: 1007, loss: 0.34078270196914673, mean loss: 0.3400842749379732
Epoch: 62, step: 1008, loss: 0.31539854407310486, mean loss: 0.34008400227894026
Epoch: 62, step: 1009, loss: 0.31479117274284363, mean loss: 0.3400837229174618
Epoch: 62, step: 1010, loss: 0.3521715998649597, mean loss: 0.3400838564276281
Epoch: 62, step: 1011, loss: 0.31634047627449036, mean loss: 0.3400835941857444
Epoch: 62, step: 1012, loss: 0.32116827368736267, mean loss: 0.3400833852713244
Epoch: 62, step: 1013, loss: 0.3008325397968292, mean loss: 0.3400829517615116
Epoch: 62, step: 1014, loss: 0.36951160430908203, mean loss: 0.3400832767855615
Epoch: 62, step: 1015, loss: 0.3137701153755188, mean loss: 0.3400829861736887
Epoch: 62, step: 1016, loss: 0.3693452477455139, mean loss: 0.3400833093528987
Epoch: 62, step: 1017, loss: 0.3357335925102234, mean loss: 0.3400832613141467
Epoch: 62, step: 1018, loss: 0.31884604692459106, mean loss: 0.3400830267706014
Epoch: 62, step: 1019, loss: 0.3895404040813446, mean loss: 0.34008357297126085
Epoch: 62, step: 1020, loss: 0.31402096152305603, mean loss: 0.34008328514244496
Epoch: 62, step: 1021, loss: 0.34058552980422974, mean loss: 0.3400832906890453
Epoch: 62, step: 1022, loss: 0.3430873155593872, mean loss: 0.340083323863995
Epoch: 62, step: 1023, loss: 0.3167201280593872, mean loss: 0.3400830658553833
Epoch: 62, step: 1024, loss: 0.3504711389541626, mean loss: 0.34008318057353837
Epoch: 62, step: 1025, loss: 0.31124669313430786, mean loss: 0.34008286212832955
Epoch: 62, step: 1026, loss: 0.3155243694782257, mean loss: 0.3400825909285874
Epoch: 62, step: 1027, loss: 0.363978773355484, mean loss: 0.3400828548115154
Epoch: 62, step: 1028, loss: 0.30476778745651245, mean loss: 0.340082464835397
Epoch: 62, step: 1029, loss: 0.3294120132923126, mean loss: 0.3400823470053705
Epoch: 62, step: 1030, loss: 0.3177807927131653, mean loss: 0.34008210073990497
Epoch: 62, step: 1031, loss: 0.3650085926055908, mean loss: 0.34008237598826924
Epoch: 62, step: 1032, loss: 0.3556980788707733, mean loss: 0.3400825484212468
Epoch: 62, step: 1033, loss: 0.3483531177043915, mean loss: 0.3400826397461875
Epoch: 62, step: 1034, loss: 0.3283686339855194, mean loss: 0.3400825103997021
Epoch: 62, step: 1035, loss: 0.37600135803222656, mean loss: 0.3400829070125685
Epoch: 62, step: 1036, loss: 0.3322044312953949, mean loss: 0.340082820020069
Epoch: 62, step: 1037, loss: 0.35606956481933594, mean loss: 0.3400829965404497
Epoch: 62, step: 1038, loss: 0.3129645884037018, mean loss: 0.340082697111208
Epoch: 62, step: 1039, loss: 0.4010644853115082, mean loss: 0.3400833704371973
Epoch: 62, step: 1040, loss: 0.3466304838657379, mean loss: 0.3400834427258769
Epoch: 62, step: 1041, loss: 0.33193090558052063, mean loss: 0.3400833527122174
Epoch: 62, step: 1042, loss: 0.32659777998924255, mean loss: 0.34008320381717677
Epoch: 62, step: 1043, loss: 0.31569477915763855, mean loss: 0.34008293454604815
Epoch: 62, step: 1044, loss: 0.31197917461395264, mean loss: 0.3400826242575523
Epoch: 62, step: 1045, loss: 0.3171369135379791, mean loss: 0.34008237092093563
Epoch: 62, step: 1046, loss: 0.3251636326313019, mean loss: 0.3400822062094999
Epoch: 62, step: 1047, loss: 0.3270660638809204, mean loss: 0.34008206250540246
Epoch: 62, step: 1048, loss: 0.33345890045166016, mean loss: 0.3400819893835056
Epoch: 62, step: 1049, loss: 0.3161604404449463, mean loss: 0.3400817252846191
Epoch: 62, step: 1050, loss: 0.34509795904159546, mean loss: 0.34008178066427397
Epoch: 62, step: 1051, loss: 0.36510220170021057, mean loss: 0.3400820568888383
Epoch: 62, step: 1052, loss: 0.37876826524734497, mean loss: 0.34008248397849683
Epoch: 62, step: 1053, loss: 0.3223899304866791, mean loss: 0.340082288657644
Epoch: 62, step: 1054, loss: 0.3057825565338135, mean loss: 0.3400819100023541
Epoch: 62, step: 1055, loss: 0.36171963810920715, mean loss: 0.3400821488715596
Epoch: 62, step: 1056, loss: 0.32033446431159973, mean loss: 0.34008193086985333
Epoch: 62, step: 1057, loss: 0.29624930024147034, mean loss: 0.34008144699121173
Epoch: 62, step: 1058, loss: 0.3466658592224121, mean loss: 0.340081519677273
Epoch: 62, step: 1059, loss: 0.31144464015960693, mean loss: 0.34008120355505467
Epoch: 62, step: 1060, loss: 0.3144773244857788, mean loss: 0.3400809209172171
Epoch: 62, step: 1061, loss: 0.33905842900276184, mean loss: 0.34008090963018855
Epoch: 62, step: 1062, loss: 0.3296838104724884, mean loss: 0.34008079486051873
Epoch: 62, step: 1063, loss: 0.3029533922672272, mean loss: 0.3400803850296
Epoch: 62, step: 1064, loss: 0.30863678455352783, mean loss: 0.34008003794317526
Epoch: 62, step: 1065, loss: 0.3414801061153412, mean loss: 0.3400800533974898
Epoch: 62, step: 1066, loss: 0.3605678379535675, mean loss: 0.3400802795444577
Epoch: 62, step: 1067, loss: 0.3162141740322113, mean loss: 0.34008001611002886
Epoch: 62, step: 1068, loss: 0.32618051767349243, mean loss: 0.34007986268885115
Epoch: 62, step: 1069, loss: 0.3302691578865051, mean loss: 0.3400797544005357
Epoch: 62, step: 1070, loss: 0.31020206212997437, mean loss: 0.3400794246210429
Epoch: 62, step: 1071, loss: 0.37620633840560913, mean loss: 0.3400798233728507
Epoch: 62, step: 1072, loss: 0.3634239137172699, mean loss: 0.34008008103104814
Epoch: 62, step: 1073, loss: 0.3256250023841858, mean loss: 0.34007992148624067
Epoch: 62, step: 1074, loss: 0.3491431474685669, mean loss: 0.3400800215185352
Epoch: 62, step: 1075, loss: 0.3744024336338043, mean loss: 0.3400804003363812
Epoch: 62, step: 1076, loss: 0.34921908378601074, mean loss: 0.34008050119928557
Epoch: 62, step: 1077, loss: 0.35103750228881836, mean loss: 0.3400806221294788
Epoch: 62, step: 1078, loss: 0.31634947657585144, mean loss: 0.34008036021654103
Epoch: 62, step: 1079, loss: 0.3722013533115387, mean loss: 0.3400807147215858
Epoch: 62, step: 1080, loss: 0.3265790045261383, mean loss: 0.34008056571088935
Epoch: 62, step: 1081, loss: 0.3592585325241089, mean loss: 0.34008077736486586
Epoch: 62, step: 1082, loss: 0.34621110558509827, mean loss: 0.3400808450203185
Epoch: 62, step: 1083, loss: 0.33661672472953796, mean loss: 0.3400808067900588
Epoch: 62, step: 1084, loss: 0.33419713377952576, mean loss: 0.34008074185817255
Epoch: 62, step: 1085, loss: 0.3226526975631714, mean loss: 0.34008054952537303
Epoch: 62, step: 1086, loss: 0.3248930275440216, mean loss: 0.3400803819204292
Epoch: 62, step: 1087, loss: 0.30608224868774414, mean loss: 0.3400800067313541
Epoch: 62, step: 1088, loss: 0.3283495008945465, mean loss: 0.3400798772798622
Epoch: 62, step: 1089, loss: 0.34703755378723145, mean loss: 0.3400799540601543
Epoch: 62, step: 1090, loss: 0.33163538575172424, mean loss: 0.3400798608725412
Epoch: 62, step: 1091, loss: 0.3156018853187561, mean loss: 0.340079590755839
Epoch: 62, step: 1092, loss: 0.32384783029556274, mean loss: 0.3400794116388522
Epoch: 62, step: 1093, loss: 0.3189184069633484, mean loss: 0.340079178130381
Epoch: 62, step: 1094, loss: 0.42417794466018677, mean loss: 0.3400801061372505
Epoch: 62, step: 1095, loss: 0.32962557673454285, mean loss: 0.3400799907756531
Epoch: 62, step: 1096, loss: 0.3379088044166565, mean loss: 0.34007996681773467
Epoch: 62, step: 1097, loss: 0.32293152809143066, mean loss: 0.34007977759567115
Epoch: 62, step: 1098, loss: 0.3063160479068756, mean loss: 0.34007940503859996
Epoch: 62, step: 1099, loss: 0.3806416392326355, mean loss: 0.34007985260705775
Epoch: 62, step: 1100, loss: 0.30679887533187866, mean loss: 0.34007948538489624
Epoch: 62, step: 1101, loss: 0.37676146626472473, mean loss: 0.3400798901292511
Epoch: 62, step: 1102, loss: 0.30061665177345276, mean loss: 0.3400794547016562
Epoch: 62, step: 1103, loss: 0.33184584975242615, mean loss: 0.34007936385510146
Epoch: 62, step: 1104, loss: 0.36896467208862305, mean loss: 0.3400796825614031
Epoch: 62, step: 1105, loss: 0.31895604729652405, mean loss: 0.34007944949615976
Epoch: 62, step: 1106, loss: 0.3086831569671631, mean loss: 0.34007910309253503
Epoch: 62, step: 1107, loss: 0.29948005080223083, mean loss: 0.3400786551573626
Epoch: 62, step: 1108, loss: 0.34592923521995544, mean loss: 0.34007871970694015
Epoch: 62, step: 1109, loss: 0.330935537815094, mean loss: 0.34007861883112767
Epoch: 62, step: 1110, loss: 0.31536200642585754, mean loss: 0.3400783461382206
Epoch: 62, step: 1111, loss: 0.3323250412940979, mean loss: 0.34007826059867025
Epoch: 62, step: 1112, loss: 0.35729482769966125, mean loss: 0.3400784505410484
Epoch: 62, step: 1113, loss: 0.3719615340232849, mean loss: 0.34007880228840043
Epoch: 62, step: 1114, loss: 0.37755143642425537, mean loss: 0.3400792156974241
Epoch: 62, step: 1115, loss: 0.33770760893821716, mean loss: 0.3400791895334556
Epoch: 62, step: 1116, loss: 0.319364994764328, mean loss: 0.3400789610134626
Epoch: 62, step: 1117, loss: 0.31370410323143005, mean loss: 0.3400786700479729
Epoch: 62, step: 1118, loss: 0.302199125289917, mean loss: 0.34007825216823323
Epoch: 62, step: 1119, loss: 0.320389062166214, mean loss: 0.3400780349633307
Epoch: 62, step: 1120, loss: 0.32734039425849915, mean loss: 0.3400778944472665
Epoch: 62, step: 1121, loss: 0.31091055274009705, mean loss: 0.34007757268949806
Epoch: 62, step: 1122, loss: 0.31990960240364075, mean loss: 0.3400773502102062
Epoch: 62, step: 1123, loss: 0.29270899295806885, mean loss: 0.3400768276805626
Epoch: 62, step: 1124, loss: 0.3415369391441345, mean loss: 0.34007684378716097
Epoch: 62, step: 1125, loss: 0.3496338725090027, mean loss: 0.34007694921029424
Epoch: 62, step: 1126, loss: 0.3131849765777588, mean loss: 0.3400766525694842
Epoch: 62, step: 1127, loss: 0.3185436725616455, mean loss: 0.3400764150454372
Epoch: 62, step: 1128, loss: 0.29012736678123474, mean loss: 0.3400758640780738
Epoch: 62, step: 1129, loss: 0.33481451869010925, mean loss: 0.3400758060429816
Epoch: 62, step: 1130, loss: 0.4044131636619568, mean loss: 0.3400765157061989
Epoch: 62, step: 1131, loss: 0.34404540061950684, mean loss: 0.3400765594838838
Epoch: 62, step: 1132, loss: 0.3516485393047333, mean loss: 0.3400766871239917
Epoch: 62, step: 1133, loss: 0.31240785121917725, mean loss: 0.34007638193729933
Epoch: 62, step: 1134, loss: 0.3122095465660095, mean loss: 0.34007607457006717
Epoch: 62, step: 1135, loss: 0.29101061820983887, mean loss: 0.34007553339102853
Epoch: 62, step: 1136, loss: 0.300900399684906, mean loss: 0.34007510130440516
Epoch: 62, step: 1137, loss: 0.32824593782424927, mean loss: 0.340074970834731
Epoch: 62, step: 1138, loss: 0.3334171175956726, mean loss: 0.3400748974027961
Epoch: 62, step: 1139, loss: 0.36713936924934387, mean loss: 0.34007519590361057
Epoch: 62, step: 1140, loss: 0.3336457312107086, mean loss: 0.340075124992222
Epoch: 62, step: 1141, loss: 0.337758332490921, mean loss: 0.3400750994403029
Epoch: 62, step: 1142, loss: 0.3083552420139313, mean loss: 0.34007474960565426
Epoch: 62, step: 1143, loss: 0.3455668091773987, mean loss: 0.3400748101762777
Epoch: 62, step: 1144, loss: 0.3058463931083679, mean loss: 0.3400744326833408
Epoch: 62, step: 1145, loss: 0.41921693086624146, mean loss: 0.34007530550794524
Epoch: 62, step: 1146, loss: 0.3118508756160736, mean loss: 0.34007499423769555
Epoch: 62, step: 1147, loss: 0.3496186137199402, mean loss: 0.34007509948737
Epoch: 62, step: 1148, loss: 0.36391881108283997, mean loss: 0.3400753624395144
Epoch: 62, step: 1149, loss: 0.30205440521240234, mean loss: 0.3400749431431335
Epoch: 62, step: 1150, loss: 0.32190966606140137, mean loss: 0.3400747428180629
Epoch: 62, step: 1151, loss: 0.3908243179321289, mean loss: 0.3400753024737214
Epoch: 62, step: 1152, loss: 0.3501829504966736, mean loss: 0.34007541393751234
Epoch: 62, step: 1153, loss: 0.36190930008888245, mean loss: 0.34007565471171397
Epoch: 62, step: 1154, loss: 0.37066376209259033, mean loss: 0.34007599201978034
Epoch: 62, step: 1155, loss: 0.32216402888298035, mean loss: 0.3400757944991247
Epoch: 62, step: 1156, loss: 0.33001866936683655, mean loss: 0.3400756835973754
Epoch: 62, step: 1157, loss: 0.34357351064682007, mean loss: 0.34007572216812554
Epoch: 62, step: 1158, loss: 0.34256109595298767, mean loss: 0.3400757495741902
Epoch: 62, step: 1159, loss: 0.33313414454460144, mean loss: 0.34007567303038033
Epoch: 62, step: 1160, loss: 0.3459570109844208, mean loss: 0.3400757378821038
Epoch: 62, step: 1161, loss: 0.34153228998184204, mean loss: 0.3400757539428834
Epoch: 62, step: 1162, loss: 0.3078484535217285, mean loss: 0.34007539859008745
Epoch: 62, step: 1163, loss: 0.3234056532382965, mean loss: 0.3400752147839595
Epoch: 62, step: 1164, loss: 0.3192529082298279, mean loss: 0.34007498519284934
Epoch: 62, step: 1165, loss: 0.32328131794929504, mean loss: 0.3400748000244011
Epoch: 62, step: 1166, loss: 0.3218747079372406, mean loss: 0.3400745993508018
Epoch: 62, step: 1167, loss: 0.3941396474838257, mean loss: 0.3400751954636197
Epoch: 62, step: 1168, loss: 0.29784348607063293, mean loss: 0.34007472982848963
Epoch: 62, step: 1169, loss: 0.3395013213157654, mean loss: 0.3400747235063159
Epoch: 62, step: 1170, loss: 0.33115851879119873, mean loss: 0.34007462520088017
Epoch: 62, step: 1171, loss: 0.3512375056743622, mean loss: 0.34007474827563733
Epoch: 62, step: 1172, loss: 0.32867366075515747, mean loss: 0.340074622575948
Epoch: 62, step: 1173, loss: 0.3137775659561157, mean loss: 0.340074332647869
Epoch: 62, step: 1174, loss: 0.36329594254493713, mean loss: 0.3400745886659709
Epoch: 62, step: 1175, loss: 0.2974157929420471, mean loss: 0.3400741183582036
Epoch: 62, step: 1176, loss: 0.32146531343460083, mean loss: 0.340073913200771
Epoch: 62, step: 1177, loss: 0.3498765230178833, mean loss: 0.3400740212709077
Epoch: 62, step: 1178, loss: 0.335523396730423, mean loss: 0.3400739711025134
Epoch: 62, step: 1179, loss: 0.32289808988571167, mean loss: 0.34007378174897
Epoch: 62, step: 1180, loss: 0.355852872133255, mean loss: 0.3400739557018345
Epoch: 62, step: 1181, loss: 0.3663370609283447, mean loss: 0.3400742452300588
Epoch: 62, step: 1182, loss: 0.34377992153167725, mean loss: 0.34007428608151347
Epoch: 62, step: 1183, loss: 0.32152676582336426, mean loss: 0.34007408161550834
Epoch: 62, step: 1184, loss: 0.35921332240104675, mean loss: 0.3400742926022554
Epoch: 62, step: 1185, loss: 0.3181125819683075, mean loss: 0.34007405050389533
Epoch: 62, step: 1186, loss: 0.33267444372177124, mean loss: 0.34007396893406916
Epoch: 62, step: 1187, loss: 0.31818896532058716, mean loss: 0.3400737276866198
Epoch: 62, step: 1188, loss: 0.32412686944007874, mean loss: 0.3400735518997414
Epoch: 62, step: 1189, loss: 0.31145262718200684, mean loss: 0.3400732364064025
Epoch: 62, step: 1190, loss: 0.33477652072906494, mean loss: 0.340073178020445
Epoch: 62, step: 1191, loss: 0.33130186796188354, mean loss: 0.3400730813349285
Epoch: 62, step: 1192, loss: 0.3307574987411499, mean loss: 0.34007297865106706
Epoch: 62, step: 1193, loss: 0.35598358511924744, mean loss: 0.3400731540286653
Epoch: 62, step: 1194, loss: 0.3262868821620941, mean loss: 0.3400730020686125
Epoch: 62, step: 1195, loss: 0.3302055597305298, mean loss: 0.3400728933053047
Epoch: 62, step: 1196, loss: 0.3266315758228302, mean loss: 0.34007274515079955
Epoch: 62, step: 1197, loss: 0.353386253118515, mean loss: 0.3400728918949299
Epoch: 62, step: 1198, loss: 0.34323829412460327, mean loss: 0.34007292678423773
Epoch: 62, step: 1199, loss: 0.31198352575302124, mean loss: 0.3400726171841029
Epoch: 62, step: 1200, loss: 0.36846888065338135, mean loss: 0.3400729301630123
Epoch: 62, step: 1201, loss: 0.3489066958427429, mean loss: 0.34007302752624036
Epoch: 62, step: 1202, loss: 0.32808488607406616, mean loss: 0.34007289539784485
Epoch: 62, step: 1203, loss: 0.29358404874801636, mean loss: 0.3400723830224244
Epoch: 62, step: 1204, loss: 0.3163105547428131, mean loss: 0.34007212113503743
Epoch: 62, step: 1205, loss: 0.3461969494819641, mean loss: 0.34007218863816024
Epoch: 62, step: 1206, loss: 0.3480491638183594, mean loss: 0.3400722765532446
Epoch: 62, step: 1207, loss: 0.35425838828086853, mean loss: 0.3400724328981543
Epoch: 62, step: 1208, loss: 0.34627655148506165, mean loss: 0.3400725012728921
Epoch: 62, step: 1209, loss: 0.3250713348388672, mean loss: 0.3400723359489216
Epoch: 62, step: 1210, loss: 0.30174532532691956, mean loss: 0.34007191356151795
Epoch: 62, step: 1211, loss: 0.347425252199173, mean loss: 0.34007199459897264
Epoch: 62, step: 1212, loss: 0.3439633846282959, mean loss: 0.3400720374835566
Epoch: 62, step: 1213, loss: 0.3239176273345947, mean loss: 0.34007185945783364
Epoch: 62, step: 1214, loss: 0.3180030584335327, mean loss: 0.3400716162566939
Epoch: 62, step: 1215, loss: 0.3228228986263275, mean loss: 0.34007142617561276
Epoch: 62, step: 1216, loss: 0.33186832070350647, mean loss: 0.3400713357782854
Epoch: 62, step: 1217, loss: 0.31724685430526733, mean loss: 0.3400710842577614
Epoch: 62, step: 1218, loss: 0.3201499581336975, mean loss: 0.3400708647339631
Epoch: 62, step: 1219, loss: 0.3721584975719452, mean loss: 0.3400712183244867
Epoch: 62, step: 1220, loss: 0.31992626190185547, mean loss: 0.34007099633904975
Epoch: 62, step: 1221, loss: 0.3280411958694458, mean loss: 0.34007086377926493
Epoch: 62, step: 1222, loss: 0.3289644122123718, mean loss: 0.3400707413954723
Epoch: 62, step: 1223, loss: 0.3406496047973633, mean loss: 0.34007074777399177
Epoch: 62, step: 1224, loss: 0.37638938426971436, mean loss: 0.3400711479661231
Epoch: 62, step: 1225, loss: 0.2982823848724365, mean loss: 0.34007068750418096
Epoch: 62, step: 1226, loss: 0.30076664686203003, mean loss: 0.3400702544256658
Epoch: 62, step: 1227, loss: 0.371734619140625, mean loss: 0.34007060332121775
Epoch: 62, step: 1228, loss: 0.32541438937187195, mean loss: 0.340070441832694
Epoch: 62, step: 1229, loss: 0.34387949109077454, mean loss: 0.34007048380198884
Epoch: 62, step: 1230, loss: 0.3777429461479187, mean loss: 0.3400708988843757
Epoch: 62, step: 1231, loss: 0.3343146741390228, mean loss: 0.3400708354618906
Epoch: 62, step: 1232, loss: 0.28912481665611267, mean loss: 0.3400702741412925
Epoch: 62, step: 1233, loss: 0.35014787316322327, mean loss: 0.34007038517453353
Epoch: 62, step: 1234, loss: 0.3380087912082672, mean loss: 0.34007036246049843
Epoch: 62, step: 1235, loss: 0.306746244430542, mean loss: 0.34006999530922666
Epoch: 62, step: 1236, loss: 0.3105553984642029, mean loss: 0.34006967013325745
Epoch: 62, step: 1237, loss: 0.33276721835136414, mean loss: 0.3400695896796539
Epoch: 62, step: 1238, loss: 0.34711503982543945, mean loss: 0.3400696673009275
Epoch: 62, step: 1239, loss: 0.3452671766281128, mean loss: 0.3400697245623999
Epoch: 62, step: 1240, loss: 0.31985700130462646, mean loss: 0.3400695018792894
Epoch: 62, step: 1241, loss: 0.33073562383651733, mean loss: 0.34006939904930106
Epoch: 62, step: 1242, loss: 0.3148335814476013, mean loss: 0.3400691210330007
Epoch: 62, step: 1243, loss: 0.42984527349472046, mean loss: 0.3400701100621337
Epoch: 62, step: 1244, loss: 0.3323989808559418, mean loss: 0.3400700255532026
Epoch: 62, step: 1245, loss: 0.32781094312667847, mean loss: 0.3400698905026107
Epoch: 62, step: 1246, loss: 0.3400095999240875, mean loss: 0.34006988983843467
Epoch: 62, step: 1247, loss: 0.32564234733581543, mean loss: 0.34006973090278536
Epoch: 62, step: 1248, loss: 0.30201977491378784, mean loss: 0.3400693117442321
Epoch: 62, step: 1249, loss: 0.31932303309440613, mean loss: 0.3400690832056143
Epoch: 62, step: 1250, loss: 0.3435901999473572, mean loss: 0.3400691219934038
Epoch: 62, step: 1251, loss: 0.3446960151195526, mean loss: 0.340069172961603
Epoch: 62, step: 1252, loss: 0.3608599603176117, mean loss: 0.340069401982955
Epoch: 62, step: 1253, loss: 0.31702539324760437, mean loss: 0.34006914814399203
Epoch: 62, step: 1254, loss: 0.32072895765304565, mean loss: 0.3400689351064135
Epoch: 62, step: 1255, loss: 0.3062191605567932, mean loss: 0.3400685622458373
Epoch: 62, step: 1256, loss: 0.31434890627861023, mean loss: 0.3400682789429132
Epoch: 62, step: 1257, loss: 0.3399941921234131, mean loss: 0.34006827812685325
Epoch: 62, step: 1258, loss: 0.34683817625045776, mean loss: 0.3400683526958788
Epoch: 62, step: 1259, loss: 0.3333863317966461, mean loss: 0.3400682790956134
Epoch: 62, step: 1260, loss: 0.29572734236717224, mean loss: 0.3400677907001389
Epoch: 62, step: 1261, loss: 0.3394615054130554, mean loss: 0.34006778402225274
Epoch: 62, step: 1262, loss: 0.3712877929210663, mean loss: 0.34006812788903357
Epoch: 62, step: 1263, loss: 0.3033670485019684, mean loss: 0.34006772365650884
Epoch: 62, step: 1264, loss: 0.3268097937107086, mean loss: 0.34006757763280715
Epoch: 62, step: 1265, loss: 0.35213619470596313, mean loss: 0.34006771055587554
Epoch: 62, step: 1266, loss: 0.3063387870788574, mean loss: 0.3400673390715044
Epoch: 62, step: 1267, loss: 0.3207094371318817, mean loss: 0.34006712586935955
Epoch: 62, step: 1268, loss: 0.3351829946041107, mean loss: 0.3400670720775904
Epoch: 62, step: 1269, loss: 0.3445364534854889, mean loss: 0.3400671213009368
Epoch: 62, step: 1270, loss: 0.34158411622047424, mean loss: 0.34006713800811333
Epoch: 62, step: 1271, loss: 0.31487128138542175, mean loss: 0.3400668605207056
Epoch: 62, step: 1272, loss: 0.34055987000465393, mean loss: 0.3400668659502657
Epoch: 62, step: 1273, loss: 0.30289626121520996, mean loss: 0.34006645659138884
Epoch: 62, step: 1274, loss: 0.35897722840309143, mean loss: 0.34006666485292
Epoch: 62, step: 1275, loss: 0.38811516761779785, mean loss: 0.3400671939981423
Epoch: 62, step: 1276, loss: 0.33085155487060547, mean loss: 0.34006709250990785
Epoch: 62, step: 1277, loss: 0.35465681552886963, mean loss: 0.3400672531790599
Epoch: 62, step: 1278, loss: 0.2940811514854431, mean loss: 0.3400667467632363
Epoch: 62, step: 1279, loss: 0.3506006896495819, mean loss: 0.34006686276560266
Epoch: 62, step: 1280, loss: 0.3350510597229004, mean loss: 0.34006680753095586
Epoch: 62, step: 1281, loss: 0.33547714352607727, mean loss: 0.3400667569895617
Epoch: 62, step: 1282, loss: 0.3734111189842224, mean loss: 0.34006712417373536
Epoch: 62, step: 1283, loss: 0.34689900279045105, mean loss: 0.3400671994047469
Epoch: 62, step: 1284, loss: 0.32662323117256165, mean loss: 0.3400670513646179
Epoch: 62, step: 1285, loss: 0.3554943799972534, mean loss: 0.34006722124292554
Epoch: 62, step: 1286, loss: 0.31584230065345764, mean loss: 0.34006695449271257
Epoch: 62, step: 1287, loss: 0.3091975152492523, mean loss: 0.3400666145808111
Epoch: 62, step: 1288, loss: 0.28549811244010925, mean loss: 0.34006601371861417
Epoch: 62, step: 1289, loss: 0.30048978328704834, mean loss: 0.3400655779434327
Epoch: 62, step: 1290, loss: 0.32813042402267456, mean loss: 0.3400654465265054
Epoch: 62, step: 1291, loss: 0.31475579738616943, mean loss: 0.3400651678472592
Epoch: 62, step: 1292, loss: 0.33983278274536133, mean loss: 0.3400651652885437
Epoch: 62, step: 1293, loss: 0.3696439564228058, mean loss: 0.34006549096724636
Epoch: 62, step: 1294, loss: 0.3270114064216614, mean loss: 0.3400653472362031
Epoch: 62, step: 1295, loss: 0.3319413363933563, mean loss: 0.3400652577883606
Epoch: 62, step: 1296, loss: 0.32081079483032227, mean loss: 0.34006504579317254
Epoch: 62, step: 1297, loss: 0.31436264514923096, mean loss: 0.3400647628081171
Epoch: 62, step: 1298, loss: 0.37178391218185425, mean loss: 0.34006511203411127
Epoch: 62, step: 1299, loss: 0.3348621726036072, mean loss: 0.3400650547506807
Epoch: 62, step: 1300, loss: 0.3272523880004883, mean loss: 0.3400649136870694
Epoch: 62, step: 1301, loss: 0.37597155570983887, mean loss: 0.34006530900405746
Epoch: 62, step: 1302, loss: 0.3249601125717163, mean loss: 0.340065142704045
Epoch: 62, step: 1303, loss: 0.34330227971076965, mean loss: 0.34006517834277367
Epoch: 62, step: 1304, loss: 0.3495766818523407, mean loss: 0.34006528305695805
Epoch: 62, step: 1305, loss: 0.3585454821586609, mean loss: 0.3400654865071981
Epoch: 62, step: 1306, loss: 0.32914960384368896, mean loss: 0.3400653663345481
Epoch: 62, step: 1307, loss: 0.3013606667518616, mean loss: 0.3400649402402729
Epoch: 62, step: 1308, loss: 0.3298211693763733, mean loss: 0.34006482746936606
Epoch: 62, step: 1309, loss: 0.33318647742271423, mean loss: 0.3400647517483017
Epoch: 62, step: 1310, loss: 0.35408639907836914, mean loss: 0.34006490610543166
Epoch: 62, step: 1311, loss: 0.3401280343532562, mean loss: 0.34006490680037055
Epoch: 62, step: 1312, loss: 0.3213655948638916, mean loss: 0.3400647009537601
Epoch: 62, step: 1313, loss: 0.31933701038360596, mean loss: 0.3400644727807722
Epoch: 62, step: 1314, loss: 0.38294804096221924, mean loss: 0.3400649448432116
Epoch: 62, step: 1315, loss: 0.3156287670135498, mean loss: 0.3400646758526582
Epoch: 62, step: 1316, loss: 0.3090512752532959, mean loss: 0.340064334464573
Epoch: 62, step: 1317, loss: 0.3074144721031189, mean loss: 0.3400639750666649
Epoch: 62, step: 1318, loss: 0.3996157944202423, mean loss: 0.3400646305843964
Epoch: 62, step: 1319, loss: 0.3574332594871521, mean loss: 0.34006482176778957
Epoch: 62, step: 1320, loss: 0.3369545340538025, mean loss: 0.34006478753199487
Epoch: 62, step: 1321, loss: 0.33933085203170776, mean loss: 0.3400647794534533
Epoch: 62, step: 1322, loss: 0.33961862325668335, mean loss: 0.3400647745425971
Epoch: 62, step: 1323, loss: 0.32105153799057007, mean loss: 0.34006456526556905
Epoch: 62, step: 1324, loss: 0.3308616280555725, mean loss: 0.34006446397076084
Epoch: 62, step: 1325, loss: 0.34112751483917236, mean loss: 0.340064475671411
Epoch: 62, step: 1326, loss: 0.36538511514663696, mean loss: 0.3400647543642675
Epoch: 62, step: 1327, loss: 0.30554965138435364, mean loss: 0.34006437447628013
Epoch: 62, step: 1328, loss: 0.3157689571380615, mean loss: 0.34006410707346757
Epoch: 62, step: 1329, loss: 0.30776870250701904, mean loss: 0.3400637516242549
Epoch: 62, step: 1330, loss: 0.34199509024620056, mean loss: 0.34006377288069206
Epoch: 62, step: 1331, loss: 0.36502811312675476, mean loss: 0.3400640476368031
Epoch: 62, step: 1332, loss: 0.3366146683692932, mean loss: 0.3400640096735486
Epoch: 62, step: 1333, loss: 0.3606894612312317, mean loss: 0.3400642366711005
Epoch: 62, step: 1334, loss: 0.2970356047153473, mean loss: 0.34006376311605657
Epoch: 62, step: 1335, loss: 0.3238840401172638, mean loss: 0.3400635850507832
Epoch: 62, step: 1336, loss: 0.34705907106399536, mean loss: 0.3400636620384684
Epoch: 62, step: 1337, loss: 0.29601940512657166, mean loss: 0.3400631773218867
Epoch: 62, step: 1338, loss: 0.33554577827453613, mean loss: 0.34006312760747937
Epoch: 62, step: 1339, loss: 0.35157161951065063, mean loss: 0.3400632542581364
Epoch: 62, step: 1340, loss: 0.3172464668750763, mean loss: 0.3400630031627421
Epoch: 62, step: 1341, loss: 0.3268641531467438, mean loss: 0.3400628579129345
Epoch: 62, step: 1342, loss: 0.3526107966899872, mean loss: 0.34006299599811873
Epoch: 62, step: 1343, loss: 0.33751633763313293, mean loss: 0.34006296797344265
Epoch: 62, step: 1344, loss: 0.3648756444454193, mean loss: 0.3400632410212838
Epoch: 62, step: 1345, loss: 0.3182356655597687, mean loss: 0.34006300082523805
Epoch: 62, step: 1346, loss: 0.30252084136009216, mean loss: 0.34006258770656445
Epoch: 62, step: 1347, loss: 0.3171236217021942, mean loss: 0.34006233528605734
Epoch: 62, step: 1348, loss: 0.35240980982780457, mean loss: 0.3400624711562395
Epoch: 62, step: 1349, loss: 0.32847487926483154, mean loss: 0.34006234364912125
Epoch: 62, step: 1350, loss: 0.370228111743927, mean loss: 0.34006267558244024
Epoch: 62, step: 1351, loss: 0.3234277069568634, mean loss: 0.3400624925392115
Epoch: 62, step: 1352, loss: 0.33098214864730835, mean loss: 0.34006239262455507
Epoch: 62, step: 1353, loss: 0.3618415296077728, mean loss: 0.34006263226647515
Epoch: 62, step: 1354, loss: 0.3386807441711426, mean loss: 0.3400626170613422
Epoch: 62, step: 1355, loss: 0.31841903924942017, mean loss: 0.34006237891625823
Epoch: 62, step: 1356, loss: 0.3711484372615814, mean loss: 0.3400627209535399
Epoch: 62, step: 1357, loss: 0.31108227372169495, mean loss: 0.3400624020876284
Epoch: 62, step: 1358, loss: 0.32173651456832886, mean loss: 0.3400622004538687
Epoch: 62, step: 1359, loss: 0.35034650564193726, mean loss: 0.3400623136074774
Epoch: 62, step: 1360, loss: 0.3093588650226593, mean loss: 0.3400619757948864
Epoch: 62, step: 1361, loss: 0.34905675053596497, mean loss: 0.34006207475819084
Epoch: 62, step: 1362, loss: 0.38846921920776367, mean loss: 0.3400626073427641
Epoch: 62, step: 1363, loss: 0.298017680644989, mean loss: 0.3400621447616052
Epoch: 62, step: 1364, loss: 0.33049553632736206, mean loss: 0.3400620395102829
Epoch: 62, step: 1365, loss: 0.3859763443470001, mean loss: 0.34006254465148955
Epoch: 62, step: 1366, loss: 0.3428596258163452, mean loss: 0.34006257542415214
Epoch: 62, step: 1367, loss: 0.311056524515152, mean loss: 0.34006225631163994
Epoch: 62, step: 1368, loss: 0.36180004477500916, mean loss: 0.34006249545911965
Epoch: 62, step: 1369, loss: 0.32805219292640686, mean loss: 0.340062363329672
Epoch: 62, step: 1370, loss: 0.31918495893478394, mean loss: 0.3400621336527295
Epoch: 62, step: 1371, loss: 0.31802961230278015, mean loss: 0.3400618912707565
Epoch: 62, step: 1372, loss: 0.33290204405784607, mean loss: 0.340061812505427
Epoch: 62, step: 1373, loss: 0.3281337320804596, mean loss: 0.3400616812863072
Epoch: 62, step: 1374, loss: 0.3797243535518646, mean loss: 0.3400621176049355
Epoch: 62, step: 1375, loss: 0.33895835280418396, mean loss: 0.3400621054628427
Epoch: 62, step: 1376, loss: 0.31593403220176697, mean loss: 0.3400618400420929
Epoch: 62, step: 1377, loss: 0.33177271485328674, mean loss: 0.34006174885861556
Epoch: 62, step: 1378, loss: 0.3550516963005066, mean loss: 0.34006191375183
Epoch: 62, step: 1379, loss: 0.3414565324783325, mean loss: 0.34006192909282007
Epoch: 62, step: 1380, loss: 0.4038383960723877, mean loss: 0.3400626306346584
Epoch: 62, step: 1381, loss: 0.33469030261039734, mean loss: 0.3400625715396411
Epoch: 62, step: 1382, loss: 0.3490176498889923, mean loss: 0.3400626700434344
Epoch: 62, step: 1383, loss: 0.3070772886276245, mean loss: 0.3400623072158493
Epoch: 62, step: 1384, loss: 0.3470791280269623, mean loss: 0.3400623843975594
Epoch: 62, step: 1385, loss: 0.32889148592948914, mean loss: 0.3400622615243114
Epoch: 62, step: 1386, loss: 0.324006050825119, mean loss: 0.34006208491747314
Epoch: 62, step: 1387, loss: 0.38281118869781494, mean loss: 0.34006255512187916
Epoch: 62, step: 1388, loss: 0.3163929283618927, mean loss: 0.34006229477863464
Epoch: 62, step: 1389, loss: 0.3324342966079712, mean loss: 0.34006221087887695
Epoch: 62, step: 1390, loss: 0.3206331431865692, mean loss: 0.34006199718242525
Epoch: 62, step: 1391, loss: 0.31167715787887573, mean loss: 0.3400616849866564
Epoch: 62, step: 1392, loss: 0.3458206355571747, mean loss: 0.3400617483268151
Epoch: 62, step: 1393, loss: 0.32980969548225403, mean loss: 0.34006163557024527
Epoch: 62, step: 1394, loss: 0.31730589270591736, mean loss: 0.34006138529536584
Epoch: 62, step: 1395, loss: 0.3453008234500885, mean loss: 0.34006144291973517
Epoch: 62, step: 1396, loss: 0.32149457931518555, mean loss: 0.34006123871997046
Epoch: 62, step: 1397, loss: 0.3313652276992798, mean loss: 0.340061143081638
Epoch: 62, step: 1398, loss: 0.33214637637138367, mean loss: 0.3400610560363521
Epoch: 62, step: 1399, loss: 0.2924584448337555, mean loss: 0.340060532516521
Epoch: 62, step: 1400, loss: 0.32844215631484985, mean loss: 0.3400604047423653
Epoch: 62, step: 1401, loss: 0.3475320041179657, mean loss: 0.34006048691105967
Epoch: 62, step: 1402, loss: 0.36958256363868713, mean loss: 0.3400608115756595
Epoch: 62, step: 1403, loss: 0.3401348888874054, mean loss: 0.3400608123903046
Epoch: 62, step: 1404, loss: 0.31880417466163635, mean loss: 0.3400605786287689
Epoch: 62, step: 1405, loss: 0.34190112352371216, mean loss: 0.34006059886921686
Epoch: 62, step: 1406, loss: 0.3424994945526123, mean loss: 0.34006062568942563
Epoch: 62, step: 1407, loss: 0.38152143359184265, mean loss: 0.34006108162335613
Epoch: 62, step: 1408, loss: 0.33866602182388306, mean loss: 0.340061066282408
Epoch: 62, step: 1409, loss: 0.3111895024776459, mean loss: 0.34006074879616677
Epoch: 62, step: 1410, loss: 0.32973653078079224, mean loss: 0.34006063526711966
Epoch: 62, step: 1411, loss: 0.39239615201950073, mean loss: 0.34006121076213564
Epoch: 62, step: 1412, loss: 0.36096397042274475, mean loss: 0.34006144061181465
Epoch: 62, step: 1413, loss: 0.32441967725753784, mean loss: 0.3400612686146807
Epoch: 62, step: 1414, loss: 0.3258243203163147, mean loss: 0.34006111206664186
Epoch: 62, step: 1415, loss: 0.3278276026248932, mean loss: 0.3400609775496925
Epoch: 62, step: 1416, loss: 0.33667078614234924, mean loss: 0.3400609402723116
Epoch: 62, step: 1417, loss: 0.32116952538490295, mean loss: 0.34006073255108266
Epoch: 62, step: 1418, loss: 0.3345133662223816, mean loss: 0.3400606715554882
Epoch: 62, step: 1419, loss: 0.3786045014858246, mean loss: 0.3400610953562307
Epoch: 62, step: 1420, loss: 0.3481154441833496, mean loss: 0.3400611839151904
Epoch: 62, step: 1421, loss: 0.29574862122535706, mean loss: 0.34006069669624933
Epoch: 62, step: 1422, loss: 0.3383542597293854, mean loss: 0.34006067793409206
Epoch: 62, step: 1423, loss: 0.342376708984375, mean loss: 0.34006070339841443
Epoch: 62, step: 1424, loss: 0.29067733883857727, mean loss: 0.34006016044365145
Epoch: 62, step: 1425, loss: 0.418615460395813, mean loss: 0.3400610241252922
Epoch: 62, step: 1426, loss: 0.32940417528152466, mean loss: 0.34006090695912383
Epoch: 62, step: 1427, loss: 0.312697172164917, mean loss: 0.34006060611327754
Epoch: 62, step: 1428, loss: 0.35116225481033325, mean loss: 0.3400607281670909
Epoch: 62, step: 1429, loss: 0.3073764443397522, mean loss: 0.3400603688332904
Epoch: 62, step: 1430, loss: 0.3564804196357727, mean loss: 0.34006054935474295
Epoch: 62, step: 1431, loss: 0.32587388157844543, mean loss: 0.3400603933887384
Epoch: 62, step: 1432, loss: 0.36207398772239685, mean loss: 0.3400606354000876
Epoch: 62, step: 1433, loss: 0.3220328390598297, mean loss: 0.34006043720967466
Epoch: 62, step: 1434, loss: 0.31749337911605835, mean loss: 0.3400601891191533
Epoch: 62, step: 1435, loss: 0.35530364513397217, mean loss: 0.3400603566959531
Epoch: 62, step: 1436, loss: 0.30320537090301514, mean loss: 0.34005995154028007
Epoch: 62, step: 1437, loss: 0.3047468960285187, mean loss: 0.340059563339683
Epoch: 62, step: 1438, loss: 0.33973950147628784, mean loss: 0.34005955982124375
Epoch: 62, step: 1439, loss: 0.30967187881469727, mean loss: 0.3400592257732158
Epoch: 62, step: 1440, loss: 0.31136658787727356, mean loss: 0.3400589103620549
Epoch: 62, step: 1441, loss: 0.3333243131637573, mean loss: 0.34005883633108647
Epoch: 62, step: 1442, loss: 0.30101433396339417, mean loss: 0.3400584071338437
Epoch: 62, step: 1443, loss: 0.3530403673648834, mean loss: 0.3400585498366559
Valid: 62, mean loss: 0.18491086860497793
Epoch: 63, step: 0, loss: 0.3101361095905304, mean loss: 0.3400582209210409
Epoch: 63, step: 1, loss: 0.3026873767375946, mean loss: 0.34005781013505604
Epoch: 63, step: 2, loss: 0.33206257224082947, mean loss: 0.34005772225115505
Epoch: 63, step: 3, loss: 0.3266425132751465, mean loss: 0.34005757479238596
Epoch: 63, step: 4, loss: 0.37230053544044495, mean loss: 0.34005792920021044
Epoch: 63, step: 5, loss: 0.3300744295120239, mean loss: 0.3400578194648932
Epoch: 63, step: 6, loss: 0.31834810972213745, mean loss: 0.3400575808415874
Epoch: 63, step: 7, loss: 0.326227605342865, mean loss: 0.3400574288304256
Epoch: 63, step: 8, loss: 0.32088038325309753, mean loss: 0.34005721804965183
Epoch: 63, step: 9, loss: 0.31667250394821167, mean loss: 0.34005696102393135
Epoch: 63, step: 10, loss: 0.33961474895477295, mean loss: 0.3400569561635501
Epoch: 63, step: 11, loss: 0.2871781289577484, mean loss: 0.3400563749753499
Epoch: 63, step: 12, loss: 0.32109692692756653, mean loss: 0.3400561665954186
Epoch: 63, step: 13, loss: 0.32144036889076233, mean loss: 0.34005596199473603
Epoch: 63, step: 14, loss: 0.33849021792411804, mean loss: 0.3400559447862989
Epoch: 63, step: 15, loss: 0.3607316315174103, mean loss: 0.3400561720216127
Epoch: 63, step: 16, loss: 0.33932095766067505, mean loss: 0.3400561639413573
Epoch: 63, step: 17, loss: 0.2777779996395111, mean loss: 0.340055479490711
Epoch: 63, step: 18, loss: 0.3227542042732239, mean loss: 0.3400552893480022
Epoch: 63, step: 19, loss: 0.3132524788379669, mean loss: 0.3400549947857274
Epoch: 63, step: 20, loss: 0.35401514172554016, mean loss: 0.3400551482057371
Epoch: 63, step: 21, loss: 0.35515183210372925, mean loss: 0.3400553141143014
Epoch: 63, step: 22, loss: 0.3292229175567627, mean loss: 0.34005519507043575
Epoch: 63, step: 23, loss: 0.3111831545829773, mean loss: 0.34005487778131877
Epoch: 63, step: 24, loss: 0.37108299136161804, mean loss: 0.34005521876084094
Epoch: 63, step: 25, loss: 0.3599219024181366, mean loss: 0.3400554370808442
Epoch: 63, step: 26, loss: 0.3326656222343445, mean loss: 0.34005535587319524
Epoch: 63, step: 27, loss: 0.33170023560523987, mean loss: 0.3400552640586868
Epoch: 63, step: 28, loss: 0.341009259223938, mean loss: 0.34005527454203494
Epoch: 63, step: 29, loss: 0.31631121039390564, mean loss: 0.34005501362398755
Epoch: 63, step: 30, loss: 0.36571457982063293, mean loss: 0.34005529558794695
Epoch: 63, step: 31, loss: 0.33174437284469604, mean loss: 0.3400552042631399
Epoch: 63, step: 32, loss: 0.31661438941955566, mean loss: 0.34005494668592057
Epoch: 63, step: 33, loss: 0.314267098903656, mean loss: 0.3400546633216613
Epoch: 63, step: 34, loss: 0.35838326811790466, mean loss: 0.34005486471940866
Epoch: 63, step: 35, loss: 0.34687817096710205, mean loss: 0.3400549396942048
Epoch: 63, step: 36, loss: 0.3381715416908264, mean loss: 0.3400549189995702
Epoch: 63, step: 37, loss: 0.3151158392429352, mean loss: 0.3400546449738614
Epoch: 63, step: 38, loss: 0.33902278542518616, mean loss: 0.340054633636116
Epoch: 63, step: 39, loss: 0.3426283299922943, mean loss: 0.34005466191476447
Epoch: 63, step: 40, loss: 0.30107665061950684, mean loss: 0.3400542336461512
Epoch: 63, step: 41, loss: 0.2906401455402374, mean loss: 0.34005369071772146
Epoch: 63, step: 42, loss: 0.34269392490386963, mean loss: 0.3400537197265023
Epoch: 63, step: 43, loss: 0.33142566680908203, mean loss: 0.34005362492940155
Epoch: 63, step: 44, loss: 0.3298262357711792, mean loss: 0.3400535125615015
Epoch: 63, step: 45, loss: 0.3772352933883667, mean loss: 0.3400539210716954
Epoch: 63, step: 46, loss: 0.3303176462650299, mean loss: 0.3400538141019989
Epoch: 63, step: 47, loss: 0.3190995156764984, mean loss: 0.34005358388558027
Epoch: 63, step: 48, loss: 0.36444252729415894, mean loss: 0.34005385183411313
Epoch: 63, step: 49, loss: 0.3242235779762268, mean loss: 0.3400536779171056
Epoch: 63, step: 50, loss: 0.3083447515964508, mean loss: 0.3400533295554133
Epoch: 63, step: 51, loss: 0.37058791518211365, mean loss: 0.34005366501183826
Epoch: 63, step: 52, loss: 0.32813411951065063, mean loss: 0.3400535340637965
Epoch: 63, step: 53, loss: 0.3367825448513031, mean loss: 0.34005349812912716
Epoch: 63, step: 54, loss: 0.36938968300819397, mean loss: 0.3400538204091636
Epoch: 63, step: 55, loss: 0.3176991939544678, mean loss: 0.34005357482949083
Epoch: 63, step: 56, loss: 0.3620482087135315, mean loss: 0.3400538164517638
Epoch: 63, step: 57, loss: 0.33003848791122437, mean loss: 0.3400537064294795
Epoch: 63, step: 58, loss: 0.3335499167442322, mean loss: 0.3400536349836019
Epoch: 63, step: 59, loss: 0.3125714957714081, mean loss: 0.3400533330882331
Epoch: 63, step: 60, loss: 0.35049399733543396, mean loss: 0.34005344777921603
Epoch: 63, step: 61, loss: 0.3546091616153717, mean loss: 0.340053607672375
Epoch: 63, step: 62, loss: 0.308760404586792, mean loss: 0.34005326392323365
Epoch: 63, step: 63, loss: 0.3170567452907562, mean loss: 0.3400530113141709
Epoch: 63, step: 64, loss: 0.32752421498298645, mean loss: 0.34005287369104703
Epoch: 63, step: 65, loss: 0.3431868255138397, mean loss: 0.34005290811570293
Epoch: 63, step: 66, loss: 0.3538541793823242, mean loss: 0.3400530597130543
Epoch: 63, step: 67, loss: 0.30427423119544983, mean loss: 0.3400526667118623
Epoch: 63, step: 68, loss: 0.35703158378601074, mean loss: 0.34005285320934225
Epoch: 63, step: 69, loss: 0.324266254901886, mean loss: 0.3400526798102703
Epoch: 63, step: 70, loss: 0.3202325105667114, mean loss: 0.34005246210908247
Epoch: 63, step: 71, loss: 0.32879385352134705, mean loss: 0.34005233844790117
Epoch: 63, step: 72, loss: 0.3220006227493286, mean loss: 0.3400521401754458
Epoch: 63, step: 73, loss: 0.3020596504211426, mean loss: 0.3400517228864957
Epoch: 63, step: 74, loss: 0.3240542709827423, mean loss: 0.3400515471810699
Epoch: 63, step: 75, loss: 0.3220757246017456, mean loss: 0.34005134974869816
Epoch: 63, step: 76, loss: 0.31736576557159424, mean loss: 0.34005110059072635
Epoch: 63, step: 77, loss: 0.34977439045906067, mean loss: 0.3400512073813894
Epoch: 63, step: 78, loss: 0.3325018286705017, mean loss: 0.3400511244676519
Epoch: 63, step: 79, loss: 0.33905482292175293, mean loss: 0.3400511135255359
Epoch: 63, step: 80, loss: 0.3516724407672882, mean loss: 0.3400512411580932
Epoch: 63, step: 81, loss: 0.3139100968837738, mean loss: 0.34005095406313557
Epoch: 63, step: 82, loss: 0.32267001271247864, mean loss: 0.3400507631791495
Epoch: 63, step: 83, loss: 0.3154613971710205, mean loss: 0.3400504931325188
Epoch: 63, step: 84, loss: 0.39190980792045593, mean loss: 0.3400510626583629
Epoch: 63, step: 85, loss: 0.3383942246437073, mean loss: 0.3400510444629488
Epoch: 63, step: 86, loss: 0.3742911219596863, mean loss: 0.340051420483743
Epoch: 63, step: 87, loss: 0.29894065856933594, mean loss: 0.34005096901480036
Epoch: 63, step: 88, loss: 0.35326263308525085, mean loss: 0.34005111410066663
Epoch: 63, step: 89, loss: 0.36235833168029785, mean loss: 0.3400513590680249
Epoch: 63, step: 90, loss: 0.34772244095802307, mean loss: 0.3400514433073086
Epoch: 63, step: 91, loss: 0.30248400568962097, mean loss: 0.340051030768461
Epoch: 63, step: 92, loss: 0.32119083404541016, mean loss: 0.3400508236614855
Epoch: 63, step: 93, loss: 0.2841191589832306, mean loss: 0.34005020947326287
Epoch: 63, step: 94, loss: 0.30678707361221313, mean loss: 0.3400498442132251
Epoch: 63, step: 95, loss: 0.32150980830192566, mean loss: 0.3400496406286958
Epoch: 63, step: 96, loss: 0.3226364850997925, mean loss: 0.3400494494203205
Epoch: 63, step: 97, loss: 0.329203337430954, mean loss: 0.3400493303238893
Epoch: 63, step: 98, loss: 0.3068942427635193, mean loss: 0.34004896626631265
Epoch: 63, step: 99, loss: 0.37835946679115295, mean loss: 0.3400493869279927
Epoch: 63, step: 100, loss: 0.3852854371070862, mean loss: 0.34004988362899274
Epoch: 63, step: 101, loss: 0.3293934166431427, mean loss: 0.34004976662011
Epoch: 63, step: 102, loss: 0.33758625388145447, mean loss: 0.3400497395708348
Epoch: 63, step: 103, loss: 0.33530133962631226, mean loss: 0.3400496874341583
Epoch: 63, step: 104, loss: 0.3038124144077301, mean loss: 0.34004928955903035
Epoch: 63, step: 105, loss: 0.34826022386550903, mean loss: 0.3400493797118039
Epoch: 63, step: 106, loss: 0.35024717450141907, mean loss: 0.3400494916782812
Epoch: 63, step: 107, loss: 0.3653143048286438, mean loss: 0.34004976906972995
Epoch: 63, step: 108, loss: 0.3357008695602417, mean loss: 0.3400497213221261
Epoch: 63, step: 109, loss: 0.333429217338562, mean loss: 0.3400496486348335
Epoch: 63, step: 110, loss: 0.30902811884880066, mean loss: 0.34004930804954553
Epoch: 63, step: 111, loss: 0.32160139083862305, mean loss: 0.3400491055121382
Epoch: 63, step: 112, loss: 0.30958813428878784, mean loss: 0.34004877108856435
Epoch: 63, step: 113, loss: 0.30728697776794434, mean loss: 0.3400484114087747
Epoch: 63, step: 114, loss: 0.33552461862564087, mean loss: 0.3400483617442475
Epoch: 63, step: 115, loss: 0.30986273288726807, mean loss: 0.3400480303545051
Epoch: 63, step: 116, loss: 0.3116495907306671, mean loss: 0.34004771858865385
Epoch: 63, step: 117, loss: 0.2915163040161133, mean loss: 0.3400471858033363
Epoch: 63, step: 118, loss: 0.36595144867897034, mean loss: 0.34004747018118786
Epoch: 63, step: 119, loss: 0.2915385365486145, mean loss: 0.3400469376543619
Epoch: 63, step: 120, loss: 0.30893364548683167, mean loss: 0.3400465960991143
Epoch: 63, step: 121, loss: 0.306016206741333, mean loss: 0.34004622252468175
Epoch: 63, step: 122, loss: 0.3231569230556488, mean loss: 0.340046037121537
Epoch: 63, step: 123, loss: 0.38018378615379333, mean loss: 0.3400464777308836
Epoch: 63, step: 124, loss: 0.3294963240623474, mean loss: 0.3400463619185773
Epoch: 63, step: 125, loss: 0.3167388141155243, mean loss: 0.3400461060672106
Epoch: 63, step: 126, loss: 0.3144818842411041, mean loss: 0.34004582544698614
Epoch: 63, step: 127, loss: 0.40210944414138794, mean loss: 0.3400465067161266
Epoch: 63, step: 128, loss: 0.30170848965644836, mean loss: 0.34004608588631063
Epoch: 63, step: 129, loss: 0.3497666120529175, mean loss: 0.3400461925856824
Epoch: 63, step: 130, loss: 0.3616337776184082, mean loss: 0.34004642954368636
Epoch: 63, step: 131, loss: 0.3990674614906311, mean loss: 0.3400470773860637
Epoch: 63, step: 132, loss: 0.38136324286460876, mean loss: 0.34004753088659034
Epoch: 63, step: 133, loss: 0.3105345368385315, mean loss: 0.3400472069453126
Epoch: 63, step: 134, loss: 0.31551870703697205, mean loss: 0.34004693771792166
Epoch: 63, step: 135, loss: 0.3328339457511902, mean loss: 0.3400468585482333
Epoch: 63, step: 136, loss: 0.35667601227760315, mean loss: 0.34004704106756434
Epoch: 63, step: 137, loss: 0.36021846532821655, mean loss: 0.3400472624639452
Epoch: 63, step: 138, loss: 0.30389854311943054, mean loss: 0.3400468657092246
Epoch: 63, step: 139, loss: 0.33082064986228943, mean loss: 0.3400467644468679
Epoch: 63, step: 140, loss: 0.32280486822128296, mean loss: 0.34004657521046666
Epoch: 63, step: 141, loss: 0.32477301359176636, mean loss: 0.3400464075791299
Epoch: 63, step: 142, loss: 0.29834702610969543, mean loss: 0.34004594992252596
Epoch: 63, step: 143, loss: 0.3116503357887268, mean loss: 0.34004563828006873
Epoch: 63, step: 144, loss: 0.32380035519599915, mean loss: 0.34004545998970487
Epoch: 63, step: 145, loss: 0.3082845211029053, mean loss: 0.3400451114203894
Epoch: 63, step: 146, loss: 0.32743605971336365, mean loss: 0.34004497304034015
Epoch: 63, step: 147, loss: 0.3610690236091614, mean loss: 0.3400452037696045
Epoch: 63, step: 148, loss: 0.3520243465900421, mean loss: 0.34004533523373265
Epoch: 63, step: 149, loss: 0.31438279151916504, mean loss: 0.3400450536053255
Epoch: 63, step: 150, loss: 0.3258349895477295, mean loss: 0.34004489766155654
Epoch: 63, step: 151, loss: 0.3046109676361084, mean loss: 0.3400445088075771
Epoch: 63, step: 152, loss: 0.3156530559062958, mean loss: 0.3400442411373121
Epoch: 63, step: 153, loss: 0.33520564436912537, mean loss: 0.34004418803943914
Epoch: 63, step: 154, loss: 0.32728999853134155, mean loss: 0.3400440480788401
Epoch: 63, step: 155, loss: 0.31598562002182007, mean loss: 0.34004378407186026
Epoch: 63, step: 156, loss: 0.3259720504283905, mean loss: 0.34004362965632134
Epoch: 63, step: 157, loss: 0.3251526653766632, mean loss: 0.34004346625278487
Epoch: 63, step: 158, loss: 0.3702039122581482, mean loss: 0.3400437972098248
Epoch: 63, step: 159, loss: 0.3065146803855896, mean loss: 0.340043429291675
Epoch: 63, step: 160, loss: 0.3052006959915161, mean loss: 0.3400430469632836
Epoch: 63, step: 161, loss: 0.31752291321754456, mean loss: 0.3400427998531628
Epoch: 63, step: 162, loss: 0.3234381675720215, mean loss: 0.34004261765497024
Epoch: 63, step: 163, loss: 0.40144822001457214, mean loss: 0.34004329143484163
Epoch: 63, step: 164, loss: 0.35038501024246216, mean loss: 0.34004340490926815
Epoch: 63, step: 165, loss: 0.30774158239364624, mean loss: 0.34004305048166916
Epoch: 63, step: 166, loss: 0.4848411977291107, mean loss: 0.3400446392433107
Epoch: 63, step: 167, loss: 0.3207886517047882, mean loss: 0.34004442796409695
Epoch: 63, step: 168, loss: 0.31753137707710266, mean loss: 0.34004418095066846
Epoch: 63, step: 169, loss: 0.35926514863967896, mean loss: 0.340044391841012
Epoch: 63, step: 170, loss: 0.3261602222919464, mean loss: 0.3400442395071021
Epoch: 63, step: 171, loss: 0.3372155427932739, mean loss: 0.3400442084716339
Epoch: 63, step: 172, loss: 0.3271135687828064, mean loss: 0.3400440666027471
Epoch: 63, step: 173, loss: 0.3122834861278534, mean loss: 0.34004376203007824
Epoch: 63, step: 174, loss: 0.3311568796634674, mean loss: 0.34004366452953116
Epoch: 63, step: 175, loss: 0.33858442306518555, mean loss: 0.3400436485199482
Epoch: 63, step: 176, loss: 0.30197662115097046, mean loss: 0.3400432308847864
Epoch: 63, step: 177, loss: 0.3109528124332428, mean loss: 0.3400429117359279
Epoch: 63, step: 178, loss: 0.32072436809539795, mean loss: 0.34004269979592017
Epoch: 63, step: 179, loss: 0.3328412175178528, mean loss: 0.340042620790717
Epoch: 63, step: 180, loss: 0.3339979946613312, mean loss: 0.3400425544777473
Epoch: 63, step: 181, loss: 0.3301027715206146, mean loss: 0.3400424454338989
Epoch: 63, step: 182, loss: 0.3470504879951477, mean loss: 0.3400425223144053
Epoch: 63, step: 183, loss: 0.3101274073123932, mean loss: 0.3400421941394634
Epoch: 63, step: 184, loss: 0.35459989309310913, mean loss: 0.3400423538386522
Epoch: 63, step: 185, loss: 0.3359013795852661, mean loss: 0.34004230841231275
Epoch: 63, step: 186, loss: 0.30445370078086853, mean loss: 0.34004191801084244
Epoch: 63, step: 187, loss: 0.32890215516090393, mean loss: 0.3400417958107234
Epoch: 63, step: 188, loss: 0.32384276390075684, mean loss: 0.34004161811377065
Epoch: 63, step: 189, loss: 0.33442580699920654, mean loss: 0.34004155651122664
Epoch: 63, step: 190, loss: 0.3729934096336365, mean loss: 0.3400419179720509
Epoch: 63, step: 191, loss: 0.32146579027175903, mean loss: 0.3400417142060062
Epoch: 63, step: 192, loss: 0.3068101704120636, mean loss: 0.3400413496851507
Epoch: 63, step: 193, loss: 0.3376256823539734, mean loss: 0.34004132318769187
Epoch: 63, step: 194, loss: 0.34212666749954224, mean loss: 0.34004134606158604
Epoch: 63, step: 195, loss: 0.29130610823631287, mean loss: 0.3400408114964116
Epoch: 63, step: 196, loss: 0.30594390630722046, mean loss: 0.3400404374997111
Epoch: 63, step: 197, loss: 0.3144950866699219, mean loss: 0.34004015730501075
Epoch: 63, step: 198, loss: 0.3198685944080353, mean loss: 0.34003993605523947
Epoch: 63, step: 199, loss: 0.3308243751525879, mean loss: 0.34003983497638957
Epoch: 63, step: 200, loss: 0.3168784976005554, mean loss: 0.34003958093914854
Epoch: 63, step: 201, loss: 0.35349681973457336, mean loss: 0.34003972853867026
Epoch: 63, step: 202, loss: 0.3367360234260559, mean loss: 0.34003969230390074
Epoch: 63, step: 203, loss: 0.36035266518592834, mean loss: 0.34003991509249515
Epoch: 63, step: 204, loss: 0.3401079475879669, mean loss: 0.3400399158386537
Epoch: 63, step: 205, loss: 0.3113049864768982, mean loss: 0.34003960068665035
Epoch: 63, step: 206, loss: 0.30249378085136414, mean loss: 0.34003918890521123
Epoch: 63, step: 207, loss: 0.3391224145889282, mean loss: 0.3400391788506563
Epoch: 63, step: 208, loss: 0.3399944007396698, mean loss: 0.34003917835956593
Epoch: 63, step: 209, loss: 0.3352601230144501, mean loss: 0.34003912594729874
Epoch: 63, step: 210, loss: 0.32673919200897217, mean loss: 0.340038980087501
Epoch: 63, step: 211, loss: 0.3308223783969879, mean loss: 0.34003887901053914
Epoch: 63, step: 212, loss: 0.3366418480873108, mean loss: 0.3400388417562657
Epoch: 63, step: 213, loss: 0.3571101129055023, mean loss: 0.3400390289699953
Epoch: 63, step: 214, loss: 0.3464665114879608, mean loss: 0.3400390994568248
Epoch: 63, step: 215, loss: 0.3429194688796997, mean loss: 0.3400391310439791
Epoch: 63, step: 216, loss: 0.341897189617157, mean loss: 0.340039151419886
Epoch: 63, step: 217, loss: 0.337919682264328, mean loss: 0.3400391281775441
Epoch: 63, step: 218, loss: 0.3064008057117462, mean loss: 0.3400387592998866
Epoch: 63, step: 219, loss: 0.3059651553630829, mean loss: 0.3400383856530323
Epoch: 63, step: 220, loss: 0.3285982608795166, mean loss: 0.34003826020343886
Epoch: 63, step: 221, loss: 0.3195244371891022, mean loss: 0.34003803525636983
Epoch: 63, step: 222, loss: 0.3319474756717682, mean loss: 0.3400379465392298
Epoch: 63, step: 223, loss: 0.3288624882698059, mean loss: 0.34003782399593546
Epoch: 63, step: 224, loss: 0.33572274446487427, mean loss: 0.3400377766799105
Epoch: 63, step: 225, loss: 0.3573383092880249, mean loss: 0.3400379663828931
Epoch: 63, step: 226, loss: 0.3278934955596924, mean loss: 0.34003783321837566
Epoch: 63, step: 227, loss: 0.3035706877708435, mean loss: 0.3400374333593247
Epoch: 63, step: 228, loss: 0.31819310784339905, mean loss: 0.34003719384083786
Epoch: 63, step: 229, loss: 0.3219383955001831, mean loss: 0.3400369953934536
Epoch: 63, step: 230, loss: 0.33509668707847595, mean loss: 0.3400369412251881
Epoch: 63, step: 231, loss: 0.2962048649787903, mean loss: 0.3400364606313957
Epoch: 63, step: 232, loss: 0.313041090965271, mean loss: 0.3400361646457626
Epoch: 63, step: 233, loss: 0.3546406924724579, mean loss: 0.34003632477259443
Epoch: 63, step: 234, loss: 0.33871990442276, mean loss: 0.3400363103392686
Epoch: 63, step: 235, loss: 0.3093520998954773, mean loss: 0.34003597391910323
Epoch: 63, step: 236, loss: 0.314498633146286, mean loss: 0.3400356939320321
Epoch: 63, step: 237, loss: 0.34476011991500854, mean loss: 0.34003574572926903
Epoch: 63, step: 238, loss: 0.34461450576782227, mean loss: 0.3400357959289164
Epoch: 63, step: 239, loss: 0.3058598041534424, mean loss: 0.34003542124146546
Epoch: 63, step: 240, loss: 0.31634435057640076, mean loss: 0.3400351615079772
Epoch: 63, step: 241, loss: 0.3357694745063782, mean loss: 0.3400351147422723
Epoch: 63, step: 242, loss: 0.27062639594078064, mean loss: 0.340034353806913
Epoch: 63, step: 243, loss: 0.3168054223060608, mean loss: 0.34003409914839366
Epoch: 63, step: 244, loss: 0.30536484718322754, mean loss: 0.34003371907393426
Epoch: 63, step: 245, loss: 0.3616097867488861, mean loss: 0.34003395560693955
Epoch: 63, step: 246, loss: 0.37960198521614075, mean loss: 0.3400343893765447
Epoch: 63, step: 247, loss: 0.3320884704589844, mean loss: 0.3400343022693432
Epoch: 63, step: 248, loss: 0.32389482855796814, mean loss: 0.34003412534216954
Epoch: 63, step: 249, loss: 0.35556450486183167, mean loss: 0.34003429559035003
Epoch: 63, step: 250, loss: 0.34364771842956543, mean loss: 0.3400343352012249
Epoch: 63, step: 251, loss: 0.40185001492500305, mean loss: 0.34003501282640824
Epoch: 63, step: 252, loss: 0.31970518827438354, mean loss: 0.3400347899727546
Epoch: 63, step: 253, loss: 0.371427983045578, mean loss: 0.3400351340982569
Epoch: 63, step: 254, loss: 0.3279948830604553, mean loss: 0.34003500211703386
Epoch: 63, step: 255, loss: 0.30573412775993347, mean loss: 0.3400346261263911
Epoch: 63, step: 256, loss: 0.37789952754974365, mean loss: 0.34003504117973404
Epoch: 63, step: 257, loss: 0.33755603432655334, mean loss: 0.34003501400657987
Epoch: 63, step: 258, loss: 0.34116658568382263, mean loss: 0.340035026409948
Epoch: 63, step: 259, loss: 0.36994799971580505, mean loss: 0.3400353542880314
Epoch: 63, step: 260, loss: 0.33145228028297424, mean loss: 0.34003526020941943
Epoch: 63, step: 261, loss: 0.31692564487457275, mean loss: 0.3400350069089466
Epoch: 63, step: 262, loss: 0.3633888363838196, mean loss: 0.3400352628834024
Epoch: 63, step: 263, loss: 0.32606494426727295, mean loss: 0.3400351097605275
Epoch: 63, step: 264, loss: 0.32003048062324524, mean loss: 0.34003489050047797
Epoch: 63, step: 265, loss: 0.3609469532966614, mean loss: 0.3400351197039107
Epoch: 63, step: 266, loss: 0.32028570771217346, mean loss: 0.3400349032459049
Epoch: 63, step: 267, loss: 0.3487662076950073, mean loss: 0.34003499894192035
Epoch: 63, step: 268, loss: 0.31798315048217773, mean loss: 0.3400347572539899
Epoch: 63, step: 269, loss: 0.3197149336338043, mean loss: 0.3400345345514667
Epoch: 63, step: 270, loss: 0.331092894077301, mean loss: 0.3400344365533685
Epoch: 63, step: 271, loss: 0.3478236794471741, mean loss: 0.34003452192054767
Epoch: 63, step: 272, loss: 0.31535544991493225, mean loss: 0.34003425145014377
Epoch: 63, step: 273, loss: 0.3065005838871002, mean loss: 0.3400338839417865
Epoch: 63, step: 274, loss: 0.3196474015712738, mean loss: 0.34003366052093575
Epoch: 63, step: 275, loss: 0.3240170180797577, mean loss: 0.3400334849922399
Epoch: 63, step: 276, loss: 0.2947582006454468, mean loss: 0.3400329888193027
Epoch: 63, step: 277, loss: 0.2914237976074219, mean loss: 0.3400324561158374
Epoch: 63, step: 278, loss: 0.32566091418266296, mean loss: 0.34003229862121337
Epoch: 63, step: 279, loss: 0.3286195397377014, mean loss: 0.3400321735526244
Epoch: 63, step: 280, loss: 0.383573979139328, mean loss: 0.3400326507074093
Epoch: 63, step: 281, loss: 0.36668944358825684, mean loss: 0.3400329428238412
Epoch: 63, step: 282, loss: 0.36083921790122986, mean loss: 0.3400331708253214
Epoch: 63, step: 283, loss: 0.3413983881473541, mean loss: 0.34003318578562347
Epoch: 63, step: 284, loss: 0.3415328860282898, mean loss: 0.34003320221943395
Epoch: 63, step: 285, loss: 0.33128565549850464, mean loss: 0.340033106364312
Epoch: 63, step: 286, loss: 0.30312785506248474, mean loss: 0.340032701963088
Epoch: 63, step: 287, loss: 0.314760684967041, mean loss: 0.34003242503982484
Epoch: 63, step: 288, loss: 0.33671021461486816, mean loss: 0.3400323886364277
Epoch: 63, step: 289, loss: 0.31020089983940125, mean loss: 0.34003206175898915
Epoch: 63, step: 290, loss: 0.3304831385612488, mean loss: 0.34003195712816175
Epoch: 63, step: 291, loss: 0.35442858934402466, mean loss: 0.3400321148752714
Epoch: 63, step: 292, loss: 0.3398093283176422, mean loss: 0.34003211243417614
Epoch: 63, step: 293, loss: 0.32884547114372253, mean loss: 0.34003198986233896
Epoch: 63, step: 294, loss: 0.3390871286392212, mean loss: 0.34003197950962416
Epoch: 63, step: 295, loss: 0.29902219772338867, mean loss: 0.3400315301759937
Epoch: 63, step: 296, loss: 0.3357422947883606, mean loss: 0.3400314831804597
Epoch: 63, step: 297, loss: 0.3312343955039978, mean loss: 0.340031386795145
Epoch: 63, step: 298, loss: 0.31049513816833496, mean loss: 0.3400310631847033
Epoch: 63, step: 299, loss: 0.3121900260448456, mean loss: 0.3400307581509893
Epoch: 63, step: 300, loss: 0.30119428038597107, mean loss: 0.34003033265300237
Epoch: 63, step: 301, loss: 0.35419371724128723, mean loss: 0.34003048782736295
Epoch: 63, step: 302, loss: 0.32059580087661743, mean loss: 0.3400302749028277
Epoch: 63, step: 303, loss: 0.3576846122741699, mean loss: 0.34003046831990746
Epoch: 63, step: 304, loss: 0.32150760293006897, mean loss: 0.3400302653896469
Epoch: 63, step: 305, loss: 0.3229489028453827, mean loss: 0.3400300782540552
Epoch: 63, step: 306, loss: 0.3213801085948944, mean loss: 0.34002987393576006
Epoch: 63, step: 307, loss: 0.3615982234477997, mean loss: 0.3400301102235505
Epoch: 63, step: 308, loss: 0.3359009623527527, mean loss: 0.34003006498798266
Epoch: 63, step: 309, loss: 0.3266081213951111, mean loss: 0.34002991794975396
Epoch: 63, step: 310, loss: 0.31930965185165405, mean loss: 0.34002969096043395
Epoch: 63, step: 311, loss: 0.28848206996917725, mean loss: 0.3400291262654053
Epoch: 63, step: 312, loss: 0.35032105445861816, mean loss: 0.3400292390104148
Epoch: 63, step: 313, loss: 0.3168347477912903, mean loss: 0.3400289849244518
Epoch: 63, step: 314, loss: 0.3072338104248047, mean loss: 0.34002862567094916
Epoch: 63, step: 315, loss: 0.3769097924232483, mean loss: 0.34002902967987425
Epoch: 63, step: 316, loss: 0.34472641348838806, mean loss: 0.34002908113606073
Epoch: 63, step: 317, loss: 0.2821020781993866, mean loss: 0.34002844659774395
Epoch: 63, step: 318, loss: 0.2971988618373871, mean loss: 0.3400279774432297
Epoch: 63, step: 319, loss: 0.34665432572364807, mean loss: 0.34002805002733655
Epoch: 63, step: 320, loss: 0.32541200518608093, mean loss: 0.3400278899269472
Epoch: 63, step: 321, loss: 0.310255765914917, mean loss: 0.34002756381434385
Epoch: 63, step: 322, loss: 0.3947874903678894, mean loss: 0.3400281636273298
Epoch: 63, step: 323, loss: 0.2978989779949188, mean loss: 0.3400277021702492
Epoch: 63, step: 324, loss: 0.33540061116218567, mean loss: 0.3400276514885071
Epoch: 63, step: 325, loss: 0.33337125182151794, mean loss: 0.3400275785800133
Epoch: 63, step: 326, loss: 0.33919718861579895, mean loss: 0.34002756948473334
Epoch: 63, step: 327, loss: 0.3437209129333496, mean loss: 0.3400276099375641
Epoch: 63, step: 328, loss: 0.3112020790576935, mean loss: 0.3400272942177924
Epoch: 63, step: 329, loss: 0.3411277234554291, mean loss: 0.34002730627042255
Epoch: 63, step: 330, loss: 0.3187558054924011, mean loss: 0.3400270732934034
Epoch: 63, step: 331, loss: 0.33781468868255615, mean loss: 0.34002704906243203
Epoch: 63, step: 332, loss: 0.31719377636909485, mean loss: 0.34002679898551735
Epoch: 63, step: 333, loss: 0.3157721161842346, mean loss: 0.3400265333437983
Epoch: 63, step: 334, loss: 0.3061555027961731, mean loss: 0.3400261623861439
Epoch: 63, step: 335, loss: 0.36814776062965393, mean loss: 0.3400264703722814
Epoch: 63, step: 336, loss: 0.3679150342941284, mean loss: 0.34002677580289525
Epoch: 63, step: 337, loss: 0.33855175971984863, mean loss: 0.34002675964895723
Epoch: 63, step: 338, loss: 0.308179646730423, mean loss: 0.34002641087265517
Epoch: 63, step: 339, loss: 0.37778857350349426, mean loss: 0.3400268244235864
Epoch: 63, step: 340, loss: 0.32639700174331665, mean loss: 0.3400266751587207
Epoch: 63, step: 341, loss: 0.31358495354652405, mean loss: 0.3400263855895242
Epoch: 63, step: 342, loss: 0.3297939598560333, mean loss: 0.3400262735331727
Epoch: 63, step: 343, loss: 0.3475346863269806, mean loss: 0.3400263557576766
Epoch: 63, step: 344, loss: 0.2938408851623535, mean loss: 0.34002584998689356
Epoch: 63, step: 345, loss: 0.2836802303791046, mean loss: 0.3400252329604628
Epoch: 63, step: 346, loss: 0.32997050881385803, mean loss: 0.34002512285496284
Epoch: 63, step: 347, loss: 0.30535823106765747, mean loss: 0.34002474323503523
Epoch: 63, step: 348, loss: 0.32828742265701294, mean loss: 0.34002461470687
Epoch: 63, step: 349, loss: 0.3352815508842468, mean loss: 0.34002456276906945
Epoch: 63, step: 350, loss: 0.31672462821006775, mean loss: 0.340024307631431
Epoch: 63, step: 351, loss: 0.3525540828704834, mean loss: 0.3400244448327717
Epoch: 63, step: 352, loss: 0.3900085985660553, mean loss: 0.340024992154466
Epoch: 63, step: 353, loss: 0.27720823884010315, mean loss: 0.3400243043245675
Epoch: 63, step: 354, loss: 0.3448783755302429, mean loss: 0.34002435747501814
Epoch: 63, step: 355, loss: 0.30663979053497314, mean loss: 0.34002399192921684
Epoch: 63, step: 356, loss: 0.3658759295940399, mean loss: 0.34002427499305926
Epoch: 63, step: 357, loss: 0.32844147086143494, mean loss: 0.34002414816940735
Epoch: 63, step: 358, loss: 0.3567265570163727, mean loss: 0.34002433104716895
Epoch: 63, step: 359, loss: 0.3270047903060913, mean loss: 0.34002418849537175
Epoch: 63, step: 360, loss: 0.3265419006347656, mean loss: 0.34002404087854254
Epoch: 63, step: 361, loss: 0.3240255117416382, mean loss: 0.34002386571344373
Epoch: 63, step: 362, loss: 0.3341430425643921, mean loss: 0.34002380132604404
Epoch: 63, step: 363, loss: 0.3104579448699951, mean loss: 0.34002347762173846
Epoch: 63, step: 364, loss: 0.32400035858154297, mean loss: 0.3400233021931713
Epoch: 63, step: 365, loss: 0.3065590262413025, mean loss: 0.3400229358147094
Epoch: 63, step: 366, loss: 0.3056553304195404, mean loss: 0.34002255955040395
Epoch: 63, step: 367, loss: 0.3192785978317261, mean loss: 0.34002233244331265
Epoch: 63, step: 368, loss: 0.317597895860672, mean loss: 0.34002208694089225
Epoch: 63, step: 369, loss: 0.35239410400390625, mean loss: 0.34002222238808044
Epoch: 63, step: 370, loss: 0.3303827941417694, mean loss: 0.3400221168580645
Epoch: 63, step: 371, loss: 0.3575180470943451, mean loss: 0.34002230839697495
Epoch: 63, step: 372, loss: 0.29833123087882996, mean loss: 0.3400218519836243
Epoch: 63, step: 373, loss: 0.32897862792015076, mean loss: 0.34002173108917827
Epoch: 63, step: 374, loss: 0.3161837160587311, mean loss: 0.3400214701280626
Epoch: 63, step: 375, loss: 0.339394211769104, mean loss: 0.34002146326137306
Epoch: 63, step: 376, loss: 0.3538769483566284, mean loss: 0.34002161493774713
Epoch: 63, step: 377, loss: 0.34322240948677063, mean loss: 0.340021649976549
Epoch: 63, step: 378, loss: 0.4327738583087921, mean loss: 0.3400226653152791
Epoch: 63, step: 379, loss: 0.33222824335098267, mean loss: 0.3400225799923309
Epoch: 63, step: 380, loss: 0.29926517605781555, mean loss: 0.3400221338394521
Epoch: 63, step: 381, loss: 0.2941831052303314, mean loss: 0.3400216320658176
Epoch: 63, step: 382, loss: 0.3219261169433594, mean loss: 0.3400214339867292
Epoch: 63, step: 383, loss: 0.34917694330215454, mean loss: 0.3400215342046603
Epoch: 63, step: 384, loss: 0.3234900236129761, mean loss: 0.3400213532496093
Epoch: 63, step: 385, loss: 0.32247430086135864, mean loss: 0.34002116118047043
Epoch: 63, step: 386, loss: 0.3307570219039917, mean loss: 0.3400210597767852
Epoch: 63, step: 387, loss: 0.36969229578971863, mean loss: 0.34002138454950864
Epoch: 63, step: 388, loss: 0.34105899930000305, mean loss: 0.34002139590681374
Epoch: 63, step: 389, loss: 0.26992446184158325, mean loss: 0.34002062866294797
Epoch: 63, step: 390, loss: 0.3326779305934906, mean loss: 0.34002054829454864
Epoch: 63, step: 391, loss: 0.3282054662704468, mean loss: 0.34002041897575763
Epoch: 63, step: 392, loss: 0.31384196877479553, mean loss: 0.34002013244973345
Epoch: 63, step: 393, loss: 0.3280121386051178, mean loss: 0.34002000102235513
Epoch: 63, step: 394, loss: 0.29493606090545654, mean loss: 0.34001950758446053
Epoch: 63, step: 395, loss: 0.3139825761318207, mean loss: 0.3400192226167317
Epoch: 63, step: 396, loss: 0.34621649980545044, mean loss: 0.3400192904436444
Epoch: 63, step: 397, loss: 0.3115313947200775, mean loss: 0.34001897865754693
Epoch: 63, step: 398, loss: 0.316455215215683, mean loss: 0.34001872076649353
Epoch: 63, step: 399, loss: 0.3489912748336792, mean loss: 0.3400188189645637
Epoch: 63, step: 400, loss: 0.357932448387146, mean loss: 0.34001901501404685
Epoch: 63, step: 401, loss: 0.32659801840782166, mean loss: 0.3400188681342276
Epoch: 63, step: 402, loss: 0.32187899947166443, mean loss: 0.3400186696130931
Epoch: 63, step: 403, loss: 0.2897292971611023, mean loss: 0.34001811925662695
Epoch: 63, step: 404, loss: 0.3385380506515503, mean loss: 0.34001810305924024
Epoch: 63, step: 405, loss: 0.314829021692276, mean loss: 0.3400178274011894
Epoch: 63, step: 406, loss: 0.31201794743537903, mean loss: 0.340017520986368
Epoch: 63, step: 407, loss: 0.38093724846839905, mean loss: 0.3400179687837797
Epoch: 63, step: 408, loss: 0.34257251024246216, mean loss: 0.34001799673862215
Epoch: 63, step: 409, loss: 0.3036683201789856, mean loss: 0.34001759896141703
Epoch: 63, step: 410, loss: 0.3324073553085327, mean loss: 0.3400175156828679
Epoch: 63, step: 411, loss: 0.31986570358276367, mean loss: 0.3400172951649206
Epoch: 63, step: 412, loss: 0.3419898450374603, mean loss: 0.34001731674997143
Epoch: 63, step: 413, loss: 0.3558262586593628, mean loss: 0.3400174897408224
Epoch: 63, step: 414, loss: 0.298689067363739, mean loss: 0.34001703750557694
Epoch: 63, step: 415, loss: 0.31696513295173645, mean loss: 0.3400167852634384
Epoch: 63, step: 416, loss: 0.3511388301849365, mean loss: 0.340016906963478
Epoch: 63, step: 417, loss: 0.3338123857975006, mean loss: 0.34001683907288643
Epoch: 63, step: 418, loss: 0.29892247915267944, mean loss: 0.34001638941854495
Epoch: 63, step: 419, loss: 0.323152631521225, mean loss: 0.3400162048973845
Epoch: 63, step: 420, loss: 0.37847405672073364, mean loss: 0.34001662569385493
Epoch: 63, step: 421, loss: 0.3309195637702942, mean loss: 0.3400165261571028
Epoch: 63, step: 422, loss: 0.30632489919662476, mean loss: 0.34001615751957387
Epoch: 63, step: 423, loss: 0.35407838225364685, mean loss: 0.3400163113799697
Epoch: 63, step: 424, loss: 0.30583637952804565, mean loss: 0.3400159374078278
Epoch: 63, step: 425, loss: 0.32790324091911316, mean loss: 0.3400158048808963
Epoch: 63, step: 426, loss: 0.3482815623283386, mean loss: 0.34001589531686877
Epoch: 63, step: 427, loss: 0.33444440364837646, mean loss: 0.3400158343596295
Epoch: 63, step: 428, loss: 0.33394017815589905, mean loss: 0.34001576788709414
Epoch: 63, step: 429, loss: 0.2860919237136841, mean loss: 0.3400151779235904
Epoch: 63, step: 430, loss: 0.31925374269485474, mean loss: 0.34001495078186383
Epoch: 63, step: 431, loss: 0.3209945261478424, mean loss: 0.3400147426900447
Epoch: 63, step: 432, loss: 0.30799251794815063, mean loss: 0.34001439235664127
Epoch: 63, step: 433, loss: 0.3549453914165497, mean loss: 0.34001455570477007
Epoch: 63, step: 434, loss: 0.3000246286392212, mean loss: 0.3400141182117218
Epoch: 63, step: 435, loss: 0.3096410036087036, mean loss: 0.34001378593101766
Epoch: 63, step: 436, loss: 0.3330667316913605, mean loss: 0.3400137099313432
Epoch: 63, step: 437, loss: 0.28577151894569397, mean loss: 0.34001311653684607
Epoch: 63, step: 438, loss: 0.36272677779197693, mean loss: 0.3400133650152705
Epoch: 63, step: 439, loss: 0.3750832974910736, mean loss: 0.34001374866219297
Epoch: 63, step: 440, loss: 0.3671419024467468, mean loss: 0.3400140454269177
Epoch: 63, step: 441, loss: 0.3228846490383148, mean loss: 0.3400138580442806
Epoch: 63, step: 442, loss: 0.3403056561946869, mean loss: 0.3400138612362967
Epoch: 63, step: 443, loss: 0.3365841209888458, mean loss: 0.340013823718354
Epoch: 63, step: 444, loss: 0.3152415156364441, mean loss: 0.34001355273693823
Epoch: 63, step: 445, loss: 0.3341224193572998, mean loss: 0.3400134882952158
Epoch: 63, step: 446, loss: 0.35748857259750366, mean loss: 0.34001367944896177
Epoch: 63, step: 447, loss: 0.35782429575920105, mean loss: 0.34001387427084223
Epoch: 63, step: 448, loss: 0.32174453139305115, mean loss: 0.34001367443335545
Epoch: 63, step: 449, loss: 0.3115266263484955, mean loss: 0.3400133628338708
Epoch: 63, step: 450, loss: 0.3425576686859131, mean loss: 0.34001339066391195
Epoch: 63, step: 451, loss: 0.31141743063926697, mean loss: 0.34001307787996
Epoch: 63, step: 452, loss: 0.32794782519340515, mean loss: 0.3400129459111037
Epoch: 63, step: 453, loss: 0.2953667640686035, mean loss: 0.34001245757975546
Epoch: 63, step: 454, loss: 0.3733963966369629, mean loss: 0.3400128227228648
Epoch: 63, step: 455, loss: 0.3395025134086609, mean loss: 0.3400128171413218
Epoch: 63, step: 456, loss: 0.3035145401954651, mean loss: 0.34001241794328896
Epoch: 63, step: 457, loss: 0.3070780038833618, mean loss: 0.34001205772876353
Epoch: 63, step: 458, loss: 0.3531017303466797, mean loss: 0.34001220089325496
Epoch: 63, step: 459, loss: 0.30061668157577515, mean loss: 0.34001177002092015
Epoch: 63, step: 460, loss: 0.29605644941329956, mean loss: 0.34001128928288676
Epoch: 63, step: 461, loss: 0.31141212582588196, mean loss: 0.3400109764981081
Epoch: 63, step: 462, loss: 0.30169427394866943, mean loss: 0.34001055743863906
Epoch: 63, step: 463, loss: 0.2903502881526947, mean loss: 0.34001001432357186
Epoch: 63, step: 464, loss: 0.340165376663208, mean loss: 0.3400100160226908
Epoch: 63, step: 465, loss: 0.3316221535205841, mean loss: 0.3400099242899046
Epoch: 63, step: 466, loss: 0.365204781293869, mean loss: 0.34001019982722464
Epoch: 63, step: 467, loss: 0.4014221727848053, mean loss: 0.34001087143672765
Epoch: 63, step: 468, loss: 0.3410038650035858, mean loss: 0.3400108822961186
Epoch: 63, step: 469, loss: 0.3553219735622406, mean loss: 0.34001104973658647
Epoch: 63, step: 470, loss: 0.3507920801639557, mean loss: 0.3400111676355008
Epoch: 63, step: 471, loss: 0.36335957050323486, mean loss: 0.34001142296557024
Epoch: 63, step: 472, loss: 0.3217082917690277, mean loss: 0.34001122281103807
Epoch: 63, step: 473, loss: 0.35428687930107117, mean loss: 0.3400113789212724
Epoch: 63, step: 474, loss: 0.31880903244018555, mean loss: 0.34001114706734087
Epoch: 63, step: 475, loss: 0.33622121810913086, mean loss: 0.34001110562379966
Epoch: 63, step: 476, loss: 0.3630020320415497, mean loss: 0.3400113570308836
Epoch: 63, step: 477, loss: 0.31798720359802246, mean loss: 0.3400111161981506
Epoch: 63, step: 478, loss: 0.31342601776123047, mean loss: 0.3400108254949496
Epoch: 63, step: 479, loss: 0.3132426142692566, mean loss: 0.34001053279264426
Epoch: 63, step: 480, loss: 0.31814274191856384, mean loss: 0.34001029367757013
Epoch: 63, step: 481, loss: 0.3146199882030487, mean loss: 0.34001001604831965
Epoch: 63, step: 482, loss: 0.28861069679260254, mean loss: 0.3400094540307235
Epoch: 63, step: 483, loss: 0.36162078380584717, mean loss: 0.34000969033375206
Epoch: 63, step: 484, loss: 0.31009405851364136, mean loss: 0.3400093632332368
Epoch: 63, step: 485, loss: 0.3342384397983551, mean loss: 0.3400093001340718
Epoch: 63, step: 486, loss: 0.4152170717716217, mean loss: 0.34001012244539863
Epoch: 63, step: 487, loss: 0.32692763209342957, mean loss: 0.3400099794048306
Epoch: 63, step: 488, loss: 0.32342779636383057, mean loss: 0.3400097981015096
Epoch: 63, step: 489, loss: 0.3678140640258789, mean loss: 0.3400101020995189
Epoch: 63, step: 490, loss: 0.3106963336467743, mean loss: 0.3400097816008642
Epoch: 63, step: 491, loss: 0.2979486584663391, mean loss: 0.3400093217355277
Epoch: 63, step: 492, loss: 0.34675902128219604, mean loss: 0.34000939553096365
Epoch: 63, step: 493, loss: 0.3420657515525818, mean loss: 0.340009418013154
Epoch: 63, step: 494, loss: 0.31173479557037354, mean loss: 0.3400091088893996
Epoch: 63, step: 495, loss: 0.35226279497146606, mean loss: 0.3400092428563179
Epoch: 63, step: 496, loss: 0.3353849947452545, mean loss: 0.3400091923009591
Epoch: 63, step: 497, loss: 0.31966155767440796, mean loss: 0.3400089698495037
Epoch: 63, step: 498, loss: 0.3398635983467102, mean loss: 0.3400089682602404
Epoch: 63, step: 499, loss: 0.3570103049278259, mean loss: 0.3400091541240749
Epoch: 63, step: 500, loss: 0.36389464139938354, mean loss: 0.3400094152447037
Epoch: 63, step: 501, loss: 0.33470866084098816, mean loss: 0.3400093572964954
Epoch: 63, step: 502, loss: 0.29857271909713745, mean loss: 0.3400089043132956
Epoch: 63, step: 503, loss: 0.3446992337703705, mean loss: 0.3400089555871757
Epoch: 63, step: 504, loss: 0.31608378887176514, mean loss: 0.3400086940442008
Epoch: 63, step: 505, loss: 0.34818267822265625, mean loss: 0.3400087833988454
Epoch: 63, step: 506, loss: 0.35334259271621704, mean loss: 0.34000892915699005
Epoch: 63, step: 507, loss: 0.3238263428211212, mean loss: 0.34000875225945687
Epoch: 63, step: 508, loss: 0.3652574419975281, mean loss: 0.3400090282587325
Epoch: 63, step: 509, loss: 0.30274203419685364, mean loss: 0.34000862088904166
Epoch: 63, step: 510, loss: 0.33426013588905334, mean loss: 0.34000855805239444
Epoch: 63, step: 511, loss: 0.329506516456604, mean loss: 0.34000844325590984
Epoch: 63, step: 512, loss: 0.3965068459510803, mean loss: 0.34000906082603277
Epoch: 63, step: 513, loss: 0.36492204666137695, mean loss: 0.34000933314076764
Epoch: 63, step: 514, loss: 0.29073694348335266, mean loss: 0.34000879456818733
Epoch: 63, step: 515, loss: 0.3719988167285919, mean loss: 0.34000914423177336
Epoch: 63, step: 516, loss: 0.308260440826416, mean loss: 0.3400087972096898
Epoch: 63, step: 517, loss: 0.2904583513736725, mean loss: 0.340008255615572
Epoch: 63, step: 518, loss: 0.34084054827690125, mean loss: 0.34000826471256146
Epoch: 63, step: 519, loss: 0.34269416332244873, mean loss: 0.34000829406921135
Epoch: 63, step: 520, loss: 0.2935786247253418, mean loss: 0.34000778660230846
Epoch: 63, step: 521, loss: 0.32293349504470825, mean loss: 0.340007599985792
Epoch: 63, step: 522, loss: 0.3289269208908081, mean loss: 0.34000747887885613
Epoch: 63, step: 523, loss: 0.3813268542289734, mean loss: 0.34000793047647077
Epoch: 63, step: 524, loss: 0.37197044491767883, mean loss: 0.34000827980502185
Epoch: 63, step: 525, loss: 0.30510032176971436, mean loss: 0.3400078982889446
Epoch: 63, step: 526, loss: 0.3046167492866516, mean loss: 0.3400075114962037
Epoch: 63, step: 527, loss: 0.3592430055141449, mean loss: 0.340007721720182
Epoch: 63, step: 528, loss: 0.34351012110710144, mean loss: 0.3400077599973526
Epoch: 63, step: 529, loss: 0.4000703990459442, mean loss: 0.34000841640528956
Epoch: 63, step: 530, loss: 0.30053195357322693, mean loss: 0.3400079849826823
Epoch: 63, step: 531, loss: 0.342380166053772, mean loss: 0.3400080109070252
Epoch: 63, step: 532, loss: 0.3029993176460266, mean loss: 0.340007606462533
Epoch: 63, step: 533, loss: 0.32012608647346497, mean loss: 0.34000738919240875
Epoch: 63, step: 534, loss: 0.3676825761795044, mean loss: 0.3400076916303314
Epoch: 63, step: 535, loss: 0.35493579506874084, mean loss: 0.3400078547647397
Epoch: 63, step: 536, loss: 0.3620065450668335, mean loss: 0.3400080951639387
Epoch: 63, step: 537, loss: 0.3058990240097046, mean loss: 0.340007722427941
Epoch: 63, step: 538, loss: 0.3067430257797241, mean loss: 0.3400073589230438
Epoch: 63, step: 539, loss: 0.3486892580986023, mean loss: 0.3400074537947456
Epoch: 63, step: 540, loss: 0.30374687910079956, mean loss: 0.34000705756060734
Epoch: 63, step: 541, loss: 0.28970351815223694, mean loss: 0.34000650787925357
Epoch: 63, step: 542, loss: 0.33446556329727173, mean loss: 0.3400064473324079
Epoch: 63, step: 543, loss: 0.3202671408653259, mean loss: 0.3400062316399993
Epoch: 63, step: 544, loss: 0.3281925320625305, mean loss: 0.340006102552512
Epoch: 63, step: 545, loss: 0.3276679813861847, mean loss: 0.34000596773617897
Epoch: 63, step: 546, loss: 0.2886982560157776, mean loss: 0.3400054071125738
Epoch: 63, step: 547, loss: 0.3277406096458435, mean loss: 0.3400052731003637
Epoch: 63, step: 548, loss: 0.3093026578426361, mean loss: 0.3400049376296493
Epoch: 63, step: 549, loss: 0.34426364302635193, mean loss: 0.3400049841616896
Epoch: 63, step: 550, loss: 0.35646551847457886, mean loss: 0.34000516401303094
Epoch: 63, step: 551, loss: 0.31696686148643494, mean loss: 0.34000491229432844
Epoch: 63, step: 552, loss: 0.3156055212020874, mean loss: 0.34000464570715455
Epoch: 63, step: 553, loss: 0.33880341053009033, mean loss: 0.34000463258263064
Epoch: 63, step: 554, loss: 0.3340263366699219, mean loss: 0.34000456726533723
Epoch: 63, step: 555, loss: 0.3767169713973999, mean loss: 0.340004968371055
Epoch: 63, step: 556, loss: 0.39037391543388367, mean loss: 0.34000551867693685
Epoch: 63, step: 557, loss: 0.33734753727912903, mean loss: 0.34000548963748095
Epoch: 63, step: 558, loss: 0.3362124562263489, mean loss: 0.34000544819760364
Epoch: 63, step: 559, loss: 0.3086928725242615, mean loss: 0.34000510610330137
Epoch: 63, step: 560, loss: 0.3479989767074585, mean loss: 0.3400051934365102
Epoch: 63, step: 561, loss: 0.33514681458473206, mean loss: 0.34000514035919627
Epoch: 63, step: 562, loss: 0.3092516362667084, mean loss: 0.34000480438384156
Epoch: 63, step: 563, loss: 0.31360921263694763, mean loss: 0.34000451602088333
Epoch: 63, step: 564, loss: 0.3307655155658722, mean loss: 0.34000441508901474
Epoch: 63, step: 565, loss: 0.3456973433494568, mean loss: 0.3400044772809816
Epoch: 63, step: 566, loss: 0.3458096981048584, mean loss: 0.3400045406989873
Epoch: 63, step: 567, loss: 0.3049393594264984, mean loss: 0.34000415764041975
Epoch: 63, step: 568, loss: 0.3364676833152771, mean loss: 0.3400041190077379
Epoch: 63, step: 569, loss: 0.38706713914871216, mean loss: 0.3400046331216981
Epoch: 63, step: 570, loss: 0.34373435378074646, mean loss: 0.3400046738645256
Epoch: 63, step: 571, loss: 0.3184444308280945, mean loss: 0.3400044383467086
Epoch: 63, step: 572, loss: 0.31912681460380554, mean loss: 0.3400042102881173
Epoch: 63, step: 573, loss: 0.355140745639801, mean loss: 0.3400043756316096
Epoch: 63, step: 574, loss: 0.3353256285190582, mean loss: 0.3400043245240134
Epoch: 63, step: 575, loss: 0.30070915818214417, mean loss: 0.3400038952938135
Epoch: 63, step: 576, loss: 0.324978232383728, mean loss: 0.34000373116681143
Epoch: 63, step: 577, loss: 0.3120313882827759, mean loss: 0.3400034256251087
Epoch: 63, step: 578, loss: 0.32137632369995117, mean loss: 0.34000322216362905
Epoch: 63, step: 579, loss: 0.34167835116386414, mean loss: 0.3400032404606515
Epoch: 63, step: 580, loss: 0.3334719240665436, mean loss: 0.3400031691214666
Epoch: 63, step: 581, loss: 0.3146405816078186, mean loss: 0.34000289209820694
Epoch: 63, step: 582, loss: 0.31777334213256836, mean loss: 0.340002649298251
Epoch: 63, step: 583, loss: 0.35197770595550537, mean loss: 0.34000278009313784
Epoch: 63, step: 584, loss: 0.3211371600627899, mean loss: 0.34000257403985923
Epoch: 63, step: 585, loss: 0.34119120240211487, mean loss: 0.34000258702210395
Epoch: 63, step: 586, loss: 0.37816017866134644, mean loss: 0.3400030037762367
Epoch: 63, step: 587, loss: 0.3448607623577118, mean loss: 0.34000305683170395
Epoch: 63, step: 588, loss: 0.319184809923172, mean loss: 0.34000282946146
Epoch: 63, step: 589, loss: 0.306140661239624, mean loss: 0.34000245963371245
Epoch: 63, step: 590, loss: 0.3355388045310974, mean loss: 0.34000241088416183
Epoch: 63, step: 591, loss: 0.35912734270095825, mean loss: 0.34000261975371554
Epoch: 63, step: 592, loss: 0.4034208059310913, mean loss: 0.34000331235663345
Epoch: 63, step: 593, loss: 0.32369285821914673, mean loss: 0.34000313422878975
Epoch: 63, step: 594, loss: 0.2964748442173004, mean loss: 0.3400026588578591
Epoch: 63, step: 595, loss: 0.33772513270378113, mean loss: 0.34000263398534736
Epoch: 63, step: 596, loss: 0.34957820177078247, mean loss: 0.34000273855750374
Epoch: 63, step: 597, loss: 0.360662579536438, mean loss: 0.34000296417551157
Epoch: 63, step: 598, loss: 0.3065066635608673, mean loss: 0.3400025983795651
Epoch: 63, step: 599, loss: 0.306806743144989, mean loss: 0.3400022358685876
Epoch: 63, step: 600, loss: 0.3192947208881378, mean loss: 0.34000200973735917
Epoch: 63, step: 601, loss: 0.3092884421348572, mean loss: 0.34000167434120304
Epoch: 63, step: 602, loss: 0.3212704062461853, mean loss: 0.3400014697955509
Epoch: 63, step: 603, loss: 0.33080366253852844, mean loss: 0.340001369356492
Epoch: 63, step: 604, loss: 0.3515457510948181, mean loss: 0.34000149541851343
Epoch: 63, step: 605, loss: 0.31638890504837036, mean loss: 0.3400012375772156
Epoch: 63, step: 606, loss: 0.29778680205345154, mean loss: 0.3400007766152536
Epoch: 63, step: 607, loss: 0.3138929605484009, mean loss: 0.3400004915331825
Epoch: 63, step: 608, loss: 0.3165746331214905, mean loss: 0.3400002357393125
Epoch: 63, step: 609, loss: 0.3372654318809509, mean loss: 0.3400002058775071
Epoch: 63, step: 610, loss: 0.3385535180568695, mean loss: 0.3400001900810403
Epoch: 63, step: 611, loss: 0.3363984525203705, mean loss: 0.3400001507538919
Epoch: 63, step: 612, loss: 0.313460111618042, mean loss: 0.3399998609680194
Epoch: 63, step: 613, loss: 0.3155673146247864, mean loss: 0.33999959419639114
Epoch: 63, step: 614, loss: 0.3141772449016571, mean loss: 0.3399993122530008
Epoch: 63, step: 615, loss: 0.370002418756485, mean loss: 0.33999963984074705
Epoch: 63, step: 616, loss: 0.35461506247520447, mean loss: 0.33999979941692576
Epoch: 63, step: 617, loss: 0.3230886161327362, mean loss: 0.3399996147768637
Epoch: 63, step: 618, loss: 0.34472957253456116, mean loss: 0.3399996664190311
Epoch: 63, step: 619, loss: 0.36895814538002014, mean loss: 0.33999998258724407
Epoch: 63, step: 620, loss: 0.308432400226593, mean loss: 0.33999963793664456
Epoch: 63, step: 621, loss: 0.30643460154533386, mean loss: 0.3399992714821127
Epoch: 63, step: 622, loss: 0.3567740321159363, mean loss: 0.33999945462268405
Epoch: 63, step: 623, loss: 0.33062300086021423, mean loss: 0.3399993522551815
Epoch: 63, step: 624, loss: 0.352849543094635, mean loss: 0.3399994925457024
Epoch: 63, step: 625, loss: 0.3643378019332886, mean loss: 0.3399997582535714
Epoch: 63, step: 626, loss: 0.3116300404071808, mean loss: 0.33999944853711334
Epoch: 63, step: 627, loss: 0.31681400537490845, mean loss: 0.3399991954209216
Epoch: 63, step: 628, loss: 0.33914241194725037, mean loss: 0.33999918606749235
Epoch: 63, step: 629, loss: 0.3204115033149719, mean loss: 0.3399989722328299
Epoch: 63, step: 630, loss: 0.32390469312667847, mean loss: 0.33999879653684717
Epoch: 63, step: 631, loss: 0.3553527891635895, mean loss: 0.3399989641495347
Epoch: 63, step: 632, loss: 0.32549765706062317, mean loss: 0.3399988058469629
Epoch: 63, step: 633, loss: 0.40771645307540894, mean loss: 0.3399995450741667
Epoch: 63, step: 634, loss: 0.3352036774158478, mean loss: 0.3399994927215336
Epoch: 63, step: 635, loss: 0.3234175443649292, mean loss: 0.3399993117117053
Epoch: 63, step: 636, loss: 0.29868462681770325, mean loss: 0.3399988607223386
Epoch: 63, step: 637, loss: 0.35982587933540344, mean loss: 0.3399990771508793
Epoch: 63, step: 638, loss: 0.3140694797039032, mean loss: 0.3399987941106609
Epoch: 63, step: 639, loss: 0.33482328057289124, mean loss: 0.33999873761682237
Epoch: 63, step: 640, loss: 0.319650262594223, mean loss: 0.3399985155034212
Epoch: 63, step: 641, loss: 0.31194841861724854, mean loss: 0.3399982093264517
Epoch: 63, step: 642, loss: 0.3296510875225067, mean loss: 0.3399980963851014
Epoch: 63, step: 643, loss: 0.3322339951992035, mean loss: 0.33999801163897425
Epoch: 63, step: 644, loss: 0.3804453909397125, mean loss: 0.3399984531223158
Epoch: 63, step: 645, loss: 0.33596545457839966, mean loss: 0.3399984091025976
Epoch: 63, step: 646, loss: 0.3036860525608063, mean loss: 0.3399980127617017
Epoch: 63, step: 647, loss: 0.37413620948791504, mean loss: 0.3399983853680838
Epoch: 63, step: 648, loss: 0.3442440629005432, mean loss: 0.3399984317076515
Epoch: 63, step: 649, loss: 0.33651480078697205, mean loss: 0.3399983936858781
Epoch: 63, step: 650, loss: 0.3162279427051544, mean loss: 0.33999813424828074
Epoch: 63, step: 651, loss: 0.37053725123405457, mean loss: 0.33999846755742447
Epoch: 63, step: 652, loss: 0.30501386523246765, mean loss: 0.339998085733661
Epoch: 63, step: 653, loss: 0.33852827548980713, mean loss: 0.3399980696922509
Epoch: 63, step: 654, loss: 0.2870662212371826, mean loss: 0.3399974920039226
Epoch: 63, step: 655, loss: 0.3396402895450592, mean loss: 0.3399974881055241
Epoch: 63, step: 656, loss: 0.3225127160549164, mean loss: 0.339997297284146
Epoch: 63, step: 657, loss: 0.36677297949790955, mean loss: 0.3399975894993835
Epoch: 63, step: 658, loss: 0.31155434250831604, mean loss: 0.33999727908863836
Epoch: 63, step: 659, loss: 0.32458001375198364, mean loss: 0.3399971108366594
Epoch: 63, step: 660, loss: 0.3335942029953003, mean loss: 0.3399970409610923
Epoch: 63, step: 661, loss: 0.3240600526332855, mean loss: 0.339996867041059
Epoch: 63, step: 662, loss: 0.34483659267425537, mean loss: 0.3399969198563112
Epoch: 63, step: 663, loss: 0.3162738084793091, mean loss: 0.339996660972124
Epoch: 63, step: 664, loss: 0.3330524265766144, mean loss: 0.33999658519231457
Epoch: 63, step: 665, loss: 0.3521341383457184, mean loss: 0.3399967176434064
Epoch: 63, step: 666, loss: 0.32116496562957764, mean loss: 0.33999651214408827
Epoch: 63, step: 667, loss: 0.30112606287002563, mean loss: 0.3399960879794301
Epoch: 63, step: 668, loss: 0.3479914963245392, mean loss: 0.3399961752264958
Epoch: 63, step: 669, loss: 0.3257298767566681, mean loss: 0.33999601955225833
Epoch: 63, step: 670, loss: 0.3104560673236847, mean loss: 0.3399956972150124
Epoch: 63, step: 671, loss: 0.34943920373916626, mean loss: 0.3399958002605639
Epoch: 63, step: 672, loss: 0.32681718468666077, mean loss: 0.3399956564598593
Epoch: 63, step: 673, loss: 0.3371720314025879, mean loss: 0.33999562564973057
Epoch: 63, step: 674, loss: 0.3461657464504242, mean loss: 0.33999569297458354
Epoch: 63, step: 675, loss: 0.42235758900642395, mean loss: 0.339996591650998
Epoch: 63, step: 676, loss: 0.3380855321884155, mean loss: 0.3399965707990578
Epoch: 63, step: 677, loss: 0.29650336503982544, mean loss: 0.33999609624143906
Epoch: 63, step: 678, loss: 0.299242228269577, mean loss: 0.3399956515777914
Epoch: 63, step: 679, loss: 0.31325235962867737, mean loss: 0.3399953597861016
Epoch: 63, step: 680, loss: 0.33312663435935974, mean loss: 0.3399952848433782
Epoch: 63, step: 681, loss: 0.36659324169158936, mean loss: 0.33999557504300776
Epoch: 63, step: 682, loss: 0.30649805068969727, mean loss: 0.33999520956895446
Epoch: 63, step: 683, loss: 0.3251968026161194, mean loss: 0.3399950481130001
Epoch: 63, step: 684, loss: 0.3225712776184082, mean loss: 0.33999485801545715
Epoch: 63, step: 685, loss: 0.32689619064331055, mean loss: 0.3399947151073927
Epoch: 63, step: 686, loss: 0.3117583990097046, mean loss: 0.33999440704908857
Epoch: 63, step: 687, loss: 0.34207525849342346, mean loss: 0.3399944297509372
Epoch: 63, step: 688, loss: 0.3310379981994629, mean loss: 0.33999433203837076
Epoch: 63, step: 689, loss: 0.3639342188835144, mean loss: 0.33999459321406894
Epoch: 63, step: 690, loss: 0.4150637090206146, mean loss: 0.33999541218263646
Epoch: 63, step: 691, loss: 0.39203202724456787, mean loss: 0.33999597987131536
Epoch: 63, step: 692, loss: 0.3059948980808258, mean loss: 0.339995608943679
Epoch: 63, step: 693, loss: 0.32843679189682007, mean loss: 0.33999548284657594
Epoch: 63, step: 694, loss: 0.32066109776496887, mean loss: 0.33999527192677836
Epoch: 63, step: 695, loss: 0.3265271782875061, mean loss: 0.33999512500425755
Epoch: 63, step: 696, loss: 0.31084591150283813, mean loss: 0.33999480702093166
Epoch: 63, step: 697, loss: 0.32314109802246094, mean loss: 0.33999462316897355
Epoch: 63, step: 698, loss: 0.3565071225166321, mean loss: 0.3399948032968149
Epoch: 63, step: 699, loss: 0.3009088933467865, mean loss: 0.33999437692987683
Epoch: 63, step: 700, loss: 0.3460926115512848, mean loss: 0.33999444345147667
Epoch: 63, step: 701, loss: 0.3312334716320038, mean loss: 0.339994347884884
Epoch: 63, step: 702, loss: 0.3276349902153015, mean loss: 0.33999421306778366
Epoch: 63, step: 703, loss: 0.3392243981361389, mean loss: 0.33999420467065755
Epoch: 63, step: 704, loss: 0.31105342507362366, mean loss: 0.3399938889886479
Epoch: 63, step: 705, loss: 0.29745855927467346, mean loss: 0.3399934250242321
Epoch: 63, step: 706, loss: 0.30904272198677063, mean loss: 0.3399930874256213
Epoch: 63, step: 707, loss: 0.35889407992362976, mean loss: 0.3399932935882794
Epoch: 63, step: 708, loss: 0.33115485310554504, mean loss: 0.3399931971840028
Epoch: 63, step: 709, loss: 0.30456748604774475, mean loss: 0.33999281078633325
Epoch: 63, step: 710, loss: 0.4184013605117798, mean loss: 0.33999366599994674
Epoch: 63, step: 711, loss: 0.33975672721862793, mean loss: 0.3399936634156487
Epoch: 63, step: 712, loss: 0.29073566198349, mean loss: 0.3399931261630836
Epoch: 63, step: 713, loss: 0.309000700712204, mean loss: 0.33999278813519
Epoch: 63, step: 714, loss: 0.32569336891174316, mean loss: 0.3399926321761203
Epoch: 63, step: 715, loss: 0.341939240694046, mean loss: 0.3399926534069086
Epoch: 63, step: 716, loss: 0.3038984537124634, mean loss: 0.3399922597479125
Epoch: 63, step: 717, loss: 0.28765109181404114, mean loss: 0.33999168889866027
Epoch: 63, step: 718, loss: 0.33859655261039734, mean loss: 0.33999167368303074
Epoch: 63, step: 719, loss: 0.3600611388683319, mean loss: 0.3399918925621607
Epoch: 63, step: 720, loss: 0.3653917908668518, mean loss: 0.33999216957238293
Epoch: 63, step: 721, loss: 0.3001698851585388, mean loss: 0.339991735276961
Epoch: 63, step: 722, loss: 0.3276161849498749, mean loss: 0.33999160031267367
Epoch: 63, step: 723, loss: 0.3143104016780853, mean loss: 0.33999132024376516
Epoch: 63, step: 724, loss: 0.3000510036945343, mean loss: 0.33999088467535454
Epoch: 63, step: 725, loss: 0.367065966129303, mean loss: 0.339991179938953
Epoch: 63, step: 726, loss: 0.3464148938655853, mean loss: 0.3399912499911229
Epoch: 63, step: 727, loss: 0.321139931678772, mean loss: 0.33999104441513256
Epoch: 63, step: 728, loss: 0.2996470034122467, mean loss: 0.33999060446310364
Epoch: 63, step: 729, loss: 0.34615767002105713, mean loss: 0.3399906717142602
Epoch: 63, step: 730, loss: 0.36634305119514465, mean loss: 0.3399909590808619
Epoch: 63, step: 731, loss: 0.3311848044395447, mean loss: 0.33999086305282994
Epoch: 63, step: 732, loss: 0.3190928101539612, mean loss: 0.3399906351693678
Epoch: 63, step: 733, loss: 0.362597793340683, mean loss: 0.33999088168713293
Epoch: 63, step: 734, loss: 0.34756791591644287, mean loss: 0.3399909643093344
Epoch: 63, step: 735, loss: 0.354436993598938, mean loss: 0.3399911218313531
Epoch: 63, step: 736, loss: 0.34223613142967224, mean loss: 0.33999114631106175
Epoch: 63, step: 737, loss: 0.3343968391418457, mean loss: 0.3399910853110926
Epoch: 63, step: 738, loss: 0.3173036575317383, mean loss: 0.33999083793152224
Epoch: 63, step: 739, loss: 0.31375008821487427, mean loss: 0.339990551810298
Epoch: 63, step: 740, loss: 0.32995864748954773, mean loss: 0.3399904424266303
Epoch: 63, step: 741, loss: 0.3131791949272156, mean loss: 0.3399901500912453
Epoch: 63, step: 742, loss: 0.31392064690589905, mean loss: 0.33998986584653956
Epoch: 63, step: 743, loss: 0.3511902391910553, mean loss: 0.33998998796670776
Epoch: 63, step: 744, loss: 0.3555794060230255, mean loss: 0.3399901579397559
Epoch: 63, step: 745, loss: 0.3598058521747589, mean loss: 0.3399903739899776
Epoch: 63, step: 746, loss: 0.36027300357818604, mean loss: 0.3399905951287775
Epoch: 63, step: 747, loss: 0.30709412693977356, mean loss: 0.3399902364668914
Epoch: 63, step: 748, loss: 0.3294665515422821, mean loss: 0.3399901217310629
Epoch: 63, step: 749, loss: 0.32145214080810547, mean loss: 0.33998991962054503
Epoch: 63, step: 750, loss: 0.33050987124443054, mean loss: 0.33998981626535196
Epoch: 63, step: 751, loss: 0.3469950556755066, mean loss: 0.3399898926383777
Epoch: 63, step: 752, loss: 0.32221221923828125, mean loss: 0.3399896988234592
Epoch: 63, step: 753, loss: 0.3126675486564636, mean loss: 0.33998940095644037
Epoch: 63, step: 754, loss: 0.3314937353134155, mean loss: 0.3399893083374117
Epoch: 63, step: 755, loss: 0.37411776185035706, mean loss: 0.33998968039887073
Epoch: 63, step: 756, loss: 0.357485294342041, mean loss: 0.3399898711304163
Epoch: 63, step: 757, loss: 0.3490231931209564, mean loss: 0.3399899696077082
Epoch: 63, step: 758, loss: 0.35713857412338257, mean loss: 0.33999015655219283
Epoch: 63, step: 759, loss: 0.32263538241386414, mean loss: 0.3399899673622249
Epoch: 63, step: 760, loss: 0.2948302924633026, mean loss: 0.3399894750674684
Epoch: 63, step: 761, loss: 0.4002595543861389, mean loss: 0.3399901320766397
Epoch: 63, step: 762, loss: 0.31907880306243896, mean loss: 0.3399899041229795
Epoch: 63, step: 763, loss: 0.34721270203590393, mean loss: 0.3399899828575866
Epoch: 63, step: 764, loss: 0.341248482465744, mean loss: 0.3399899965761473
Epoch: 63, step: 765, loss: 0.33269980549812317, mean loss: 0.3399899171086303
Epoch: 63, step: 766, loss: 0.3102964460849762, mean loss: 0.3399895934352632
Epoch: 63, step: 767, loss: 0.3114352226257324, mean loss: 0.3399892821820388
Epoch: 63, step: 768, loss: 0.2852244973182678, mean loss: 0.33998868523209425
Epoch: 63, step: 769, loss: 0.3295885920524597, mean loss: 0.33998857186969555
Epoch: 63, step: 770, loss: 0.3008599579334259, mean loss: 0.3399881453672492
Epoch: 63, step: 771, loss: 0.3262106776237488, mean loss: 0.33998799519429246
Epoch: 63, step: 772, loss: 0.35014835000038147, mean loss: 0.33998810593988954
Epoch: 63, step: 773, loss: 0.3272821605205536, mean loss: 0.33998796744943305
Epoch: 63, step: 774, loss: 0.3422035872936249, mean loss: 0.3399879915986678
Epoch: 63, step: 775, loss: 0.3298722505569458, mean loss: 0.3399878813429561
Epoch: 63, step: 776, loss: 0.31845030188560486, mean loss: 0.33998764659838715
Epoch: 63, step: 777, loss: 0.3294828236103058, mean loss: 0.33998753210440363
Epoch: 63, step: 778, loss: 0.343559592962265, mean loss: 0.3399875710365227
Epoch: 63, step: 779, loss: 0.33806467056274414, mean loss: 0.3399875500789363
Epoch: 63, step: 780, loss: 0.29420098662376404, mean loss: 0.33998705105913907
Epoch: 63, step: 781, loss: 0.32263898849487305, mean loss: 0.33998686198768097
Epoch: 63, step: 782, loss: 0.3846398591995239, mean loss: 0.3399873486423288
Epoch: 63, step: 783, loss: 0.37115713953971863, mean loss: 0.3399876883453553
Epoch: 63, step: 784, loss: 0.34580788016319275, mean loss: 0.3399877517758491
Epoch: 63, step: 785, loss: 0.3928443193435669, mean loss: 0.3399883278190014
Epoch: 63, step: 786, loss: 0.31786689162254333, mean loss: 0.33998808673707814
Epoch: 63, step: 787, loss: 0.32174330949783325, mean loss: 0.3399878879055912
Epoch: 63, step: 788, loss: 0.33134108781814575, mean loss: 0.339987793673836
Epoch: 63, step: 789, loss: 0.32760900259017944, mean loss: 0.33998765877277587
Epoch: 63, step: 790, loss: 0.34450992941856384, mean loss: 0.33998770805484646
Epoch: 63, step: 791, loss: 0.31809282302856445, mean loss: 0.33998746945490504
Epoch: 63, step: 792, loss: 0.34322747588157654, mean loss: 0.33998750476255424
Epoch: 63, step: 793, loss: 0.3343558609485626, mean loss: 0.33998744339294223
Epoch: 63, step: 794, loss: 0.2948842942714691, mean loss: 0.3399869518965533
Epoch: 63, step: 795, loss: 0.35211342573165894, mean loss: 0.339987084039281
Epoch: 63, step: 796, loss: 0.32346341013908386, mean loss: 0.33998690398202963
Epoch: 63, step: 797, loss: 0.38487592339515686, mean loss: 0.33998739312902115
Epoch: 63, step: 798, loss: 0.3075021207332611, mean loss: 0.33998703914712713
Epoch: 63, step: 799, loss: 0.33239954710006714, mean loss: 0.33998695646949073
Epoch: 63, step: 800, loss: 0.3583027124404907, mean loss: 0.33998715604622864
Epoch: 63, step: 801, loss: 0.3195095360279083, mean loss: 0.3399869329152763
Epoch: 63, step: 802, loss: 0.3096652328968048, mean loss: 0.3399866025235572
Epoch: 63, step: 803, loss: 0.3090229034423828, mean loss: 0.33998626514015545
Epoch: 63, step: 804, loss: 0.31104782223701477, mean loss: 0.33998594982757274
Epoch: 63, step: 805, loss: 0.31837818026542664, mean loss: 0.33998571439239694
Epoch: 63, step: 806, loss: 0.3365235924720764, mean loss: 0.3399856766700212
Epoch: 63, step: 807, loss: 0.30786699056625366, mean loss: 0.3399853267170238
Epoch: 63, step: 808, loss: 0.37307998538017273, mean loss: 0.33998568729991857
Epoch: 63, step: 809, loss: 0.30955183506011963, mean loss: 0.3399853557114563
Epoch: 63, step: 810, loss: 0.35296034812927246, mean loss: 0.33998549707742187
Epoch: 63, step: 811, loss: 0.32421237230300903, mean loss: 0.3399853252269384
Epoch: 63, step: 812, loss: 0.3439227342605591, mean loss: 0.3399853681251139
Epoch: 63, step: 813, loss: 0.3362785875797272, mean loss: 0.3399853277400819
Epoch: 63, step: 814, loss: 0.27572351694107056, mean loss: 0.339984627621211
Epoch: 63, step: 815, loss: 0.29736825823783875, mean loss: 0.33998416332991604
Epoch: 63, step: 816, loss: 0.31829947233200073, mean loss: 0.3399839270849303
Epoch: 63, step: 817, loss: 0.3587970435619354, mean loss: 0.33998413204316624
Epoch: 63, step: 818, loss: 0.3473946154117584, mean loss: 0.3399842127753009
Epoch: 63, step: 819, loss: 0.3337339460849762, mean loss: 0.33998414468367316
Epoch: 63, step: 820, loss: 0.32242289185523987, mean loss: 0.33998395337003456
Epoch: 63, step: 821, loss: 0.36280471086502075, mean loss: 0.33998420197841306
Epoch: 63, step: 822, loss: 0.3553374707698822, mean loss: 0.33998436923445957
Epoch: 63, step: 823, loss: 0.3279661238193512, mean loss: 0.3399842383110488
Epoch: 63, step: 824, loss: 0.333004355430603, mean loss: 0.3399841622749814
Epoch: 63, step: 825, loss: 0.3204374611377716, mean loss: 0.3399839493433147
Epoch: 63, step: 826, loss: 0.3246929347515106, mean loss: 0.3399837827727138
Epoch: 63, step: 827, loss: 0.36330679059028625, mean loss: 0.3399840368359798
Epoch: 63, step: 828, loss: 0.3272188603878021, mean loss: 0.33998389778328486
Epoch: 63, step: 829, loss: 0.3511981964111328, mean loss: 0.33998401994073923
Epoch: 63, step: 830, loss: 0.32971328496932983, mean loss: 0.3399839080627508
Epoch: 63, step: 831, loss: 0.36455732583999634, mean loss: 0.33998417573537704
Epoch: 63, step: 832, loss: 0.3125245273113251, mean loss: 0.33998387662695784
Epoch: 63, step: 833, loss: 0.37187451124191284, mean loss: 0.33998422399678785
Epoch: 63, step: 834, loss: 0.3648345470428467, mean loss: 0.33998449467683456
Epoch: 63, step: 835, loss: 0.31108716130256653, mean loss: 0.3399841799184979
Epoch: 63, step: 836, loss: 0.35739073157310486, mean loss: 0.33998436951376254
Epoch: 63, step: 837, loss: 0.3160783350467682, mean loss: 0.3399841091278082
Epoch: 63, step: 838, loss: 0.34087929129600525, mean loss: 0.3399841188780796
Epoch: 63, step: 839, loss: 0.3118409514427185, mean loss: 0.3399838123476976
Epoch: 63, step: 840, loss: 0.33765989542007446, mean loss: 0.3399837870362828
Epoch: 63, step: 841, loss: 0.3419075012207031, mean loss: 0.33998380798857963
Epoch: 63, step: 842, loss: 0.3619228005409241, mean loss: 0.33998404693638284
Epoch: 63, step: 843, loss: 0.34642547369003296, mean loss: 0.33998411709220266
Epoch: 63, step: 844, loss: 0.3446574807167053, mean loss: 0.3399841679908775
Epoch: 63, step: 845, loss: 0.31179189682006836, mean loss: 0.33998386094573196
Epoch: 63, step: 846, loss: 0.3536945879459381, mean loss: 0.33998401026915087
Epoch: 63, step: 847, loss: 0.3698044419288635, mean loss: 0.33998433503969827
Epoch: 63, step: 848, loss: 0.34882280230522156, mean loss: 0.3399844312972784
Epoch: 63, step: 849, loss: 0.3466273844242096, mean loss: 0.3399845036432644
Epoch: 63, step: 850, loss: 0.30872032046318054, mean loss: 0.33998416316012636
Epoch: 63, step: 851, loss: 0.35034456849098206, mean loss: 0.3399842759890745
Epoch: 63, step: 852, loss: 0.30322951078414917, mean loss: 0.33998387571937444
Epoch: 63, step: 853, loss: 0.32765528559684753, mean loss: 0.3399837414590329
Epoch: 63, step: 854, loss: 0.27909958362579346, mean loss: 0.33998307842792186
Epoch: 63, step: 855, loss: 0.31670239567756653, mean loss: 0.3399828249030411
Epoch: 63, step: 856, loss: 0.32344377040863037, mean loss: 0.33998264479594537
Epoch: 63, step: 857, loss: 0.3405422568321228, mean loss: 0.33998265088994556
Epoch: 63, step: 858, loss: 0.3018084168434143, mean loss: 0.3399822351889944
Epoch: 63, step: 859, loss: 0.34208178520202637, mean loss: 0.33998225805193993
Epoch: 63, step: 860, loss: 0.3378242552280426, mean loss: 0.33998223455273135
Epoch: 63, step: 861, loss: 0.32761436700820923, mean loss: 0.3399820998763855
Epoch: 63, step: 862, loss: 0.35717451572418213, mean loss: 0.3399822870862276
Epoch: 63, step: 863, loss: 0.3517421782016754, mean loss: 0.3399824151393997
Epoch: 63, step: 864, loss: 0.331409752368927, mean loss: 0.339982321792897
Epoch: 63, step: 865, loss: 0.3131832182407379, mean loss: 0.3399820299844566
Epoch: 63, step: 866, loss: 0.2996525764465332, mean loss: 0.33998159085234997
Epoch: 63, step: 867, loss: 0.3593461215496063, mean loss: 0.3399818017030762
Epoch: 63, step: 868, loss: 0.30930355191230774, mean loss: 0.33998146766653703
Epoch: 63, step: 869, loss: 0.30481457710266113, mean loss: 0.3399810847601264
Epoch: 63, step: 870, loss: 0.32806137204170227, mean loss: 0.3399809549765531
Epoch: 63, step: 871, loss: 0.353549987077713, mean loss: 0.33998110271654813
Epoch: 63, step: 872, loss: 0.35646891593933105, mean loss: 0.33998128223435775
Epoch: 63, step: 873, loss: 0.3308611810207367, mean loss: 0.339981182936607
Epoch: 63, step: 874, loss: 0.3928629159927368, mean loss: 0.33998175869556546
Epoch: 63, step: 875, loss: 0.31233668327331543, mean loss: 0.339981457708332
Epoch: 63, step: 876, loss: 0.31939876079559326, mean loss: 0.3399812336155611
Epoch: 63, step: 877, loss: 0.3231810927391052, mean loss: 0.3399810507071139
Epoch: 63, step: 878, loss: 0.2975864112377167, mean loss: 0.33998058914829066
Epoch: 63, step: 879, loss: 0.33457931876182556, mean loss: 0.3399805303442321
Epoch: 63, step: 880, loss: 0.3197268843650818, mean loss: 0.3399803098435845
Epoch: 63, step: 881, loss: 0.3473629951477051, mean loss: 0.33998039021771415
Epoch: 63, step: 882, loss: 0.32225194573402405, mean loss: 0.33998019721303846
Epoch: 63, step: 883, loss: 0.34353724122047424, mean loss: 0.33998023593717197
Epoch: 63, step: 884, loss: 0.34320080280303955, mean loss: 0.33998027099783
Epoch: 63, step: 885, loss: 0.29990288615226746, mean loss: 0.3399798347006665
Epoch: 63, step: 886, loss: 0.44595786929130554, mean loss: 0.3399809884040009
Epoch: 63, step: 887, loss: 0.35411012172698975, mean loss: 0.3399811422155981
Epoch: 63, step: 888, loss: 0.29620474576950073, mean loss: 0.33998066566519647
Epoch: 63, step: 889, loss: 0.31476181745529175, mean loss: 0.33998039113548656
Epoch: 63, step: 890, loss: 0.3348216414451599, mean loss: 0.3399803349784953
Epoch: 63, step: 891, loss: 0.3286517560482025, mean loss: 0.33998021165947007
Epoch: 63, step: 892, loss: 0.3309169411659241, mean loss: 0.3399801130008896
Epoch: 63, step: 893, loss: 0.29308563470840454, mean loss: 0.3399796025347945
Epoch: 63, step: 894, loss: 0.32364580035209656, mean loss: 0.33997942473643183
Epoch: 63, step: 895, loss: 0.28624263405799866, mean loss: 0.3399788398016267
Epoch: 63, step: 896, loss: 0.33203375339508057, mean loss: 0.33997875331884786
Epoch: 63, step: 897, loss: 0.3843992054462433, mean loss: 0.33997923683307585
Epoch: 63, step: 898, loss: 0.30014777183532715, mean loss: 0.33997880327444474
Epoch: 63, step: 899, loss: 0.32070884108543396, mean loss: 0.3399785935265108
Epoch: 63, step: 900, loss: 0.33916929364204407, mean loss: 0.3399785847176128
Epoch: 63, step: 901, loss: 0.3378976881504059, mean loss: 0.3399785620681519
Epoch: 63, step: 902, loss: 0.3636961579322815, mean loss: 0.33997882021885517
Epoch: 63, step: 903, loss: 0.33980581164360046, mean loss: 0.33997881833578913
Epoch: 63, step: 904, loss: 0.3233708143234253, mean loss: 0.3399786375723335
Epoch: 63, step: 905, loss: 0.3244754672050476, mean loss: 0.33997846883585287
Epoch: 63, step: 906, loss: 0.2985352575778961, mean loss: 0.33997801777291947
Epoch: 63, step: 907, loss: 0.314365953207016, mean loss: 0.33997773901731904
Epoch: 63, step: 908, loss: 0.34230175614356995, mean loss: 0.3399777643110917
Epoch: 63, step: 909, loss: 0.3216448724269867, mean loss: 0.3399775647846134
Epoch: 63, step: 910, loss: 0.300013929605484, mean loss: 0.3399771298441437
Epoch: 63, step: 911, loss: 0.3444594442844391, mean loss: 0.339977178626461
Epoch: 63, step: 912, loss: 0.35619834065437317, mean loss: 0.3399773551641116
Epoch: 63, step: 913, loss: 0.3168289363384247, mean loss: 0.339977103238695
Epoch: 63, step: 914, loss: 0.31849023699760437, mean loss: 0.3399768693985844
Epoch: 63, step: 915, loss: 0.37801480293273926, mean loss: 0.3399772833583347
Epoch: 63, step: 916, loss: 0.3364824652671814, mean loss: 0.3399772453252939
Epoch: 63, step: 917, loss: 0.34670475125312805, mean loss: 0.33997731853789515
Epoch: 63, step: 918, loss: 0.32850125432014465, mean loss: 0.3399771936501018
Epoch: 63, step: 919, loss: 0.31563058495521545, mean loss: 0.3399769287020248
Epoch: 63, step: 920, loss: 0.3092708885669708, mean loss: 0.33997659455208806
Epoch: 63, step: 921, loss: 0.3275667130947113, mean loss: 0.3399764595064762
Epoch: 63, step: 922, loss: 0.33951810002326965, mean loss: 0.33997645451861525
Epoch: 63, step: 923, loss: 0.3095916509628296, mean loss: 0.3399761238752406
Epoch: 63, step: 924, loss: 0.31587061285972595, mean loss: 0.33997586156514326
Epoch: 63, step: 925, loss: 0.33878788352012634, mean loss: 0.3399758486380062
Epoch: 63, step: 926, loss: 0.315369188785553, mean loss: 0.3399755808803608
Epoch: 63, step: 927, loss: 0.3151114284992218, mean loss: 0.3399753103237516
Epoch: 63, step: 928, loss: 0.33314719796180725, mean loss: 0.33997523602518726
Epoch: 63, step: 929, loss: 0.3091143071651459, mean loss: 0.33997490022260557
Epoch: 63, step: 930, loss: 0.29757726192474365, mean loss: 0.33997443889230844
Epoch: 63, step: 931, loss: 0.3594665825366974, mean loss: 0.3399746509847489
Epoch: 63, step: 932, loss: 0.32922619581222534, mean loss: 0.33997453403294897
Epoch: 63, step: 933, loss: 0.3080320656299591, mean loss: 0.33997418647709404
Epoch: 63, step: 934, loss: 0.37046581506729126, mean loss: 0.33997451824321184
Epoch: 63, step: 935, loss: 0.36571717262268066, mean loss: 0.339974798334764
Epoch: 63, step: 936, loss: 0.3202819526195526, mean loss: 0.33997458407015757
Epoch: 63, step: 937, loss: 0.30420586466789246, mean loss: 0.33997419489901837
Epoch: 63, step: 938, loss: 0.3268062472343445, mean loss: 0.3399740516305558
Epoch: 63, step: 939, loss: 0.3128477931022644, mean loss: 0.3399737564976185
Epoch: 63, step: 940, loss: 0.3406077027320862, mean loss: 0.33997376339486085
Epoch: 63, step: 941, loss: 0.3453482687473297, mean loss: 0.339973821868057
Epoch: 63, step: 942, loss: 0.3912545442581177, mean loss: 0.339974379782678
Epoch: 63, step: 943, loss: 0.35618922114372253, mean loss: 0.3399745561920231
Epoch: 63, step: 944, loss: 0.31776872277259827, mean loss: 0.3399743146063162
Epoch: 63, step: 945, loss: 0.3549000024795532, mean loss: 0.3399744769867844
Epoch: 63, step: 946, loss: 0.38151654601097107, mean loss: 0.3399749289289185
Epoch: 63, step: 947, loss: 0.33312052488327026, mean loss: 0.3399748543596839
Epoch: 63, step: 948, loss: 0.35271281003952026, mean loss: 0.33997499293471767
Epoch: 63, step: 949, loss: 0.38377928733825684, mean loss: 0.33997546947237356
Epoch: 63, step: 950, loss: 0.33836230635643005, mean loss: 0.33997545192330403
Epoch: 63, step: 951, loss: 0.3235449492931366, mean loss: 0.3399752731832293
Epoch: 63, step: 952, loss: 0.343872606754303, mean loss: 0.3399753155801134
Epoch: 63, step: 953, loss: 0.3169945776462555, mean loss: 0.3399750655884034
Epoch: 63, step: 954, loss: 0.3332020044326782, mean loss: 0.33997499190971103
Epoch: 63, step: 955, loss: 0.32816386222839355, mean loss: 0.33997486342731525
Epoch: 63, step: 956, loss: 0.410219669342041, mean loss: 0.3399756275475158
Epoch: 63, step: 957, loss: 0.3988293707370758, mean loss: 0.3399762677492257
Epoch: 63, step: 958, loss: 0.3761534094810486, mean loss: 0.3399766612741708
Epoch: 63, step: 959, loss: 0.3468599319458008, mean loss: 0.33997673614767154
Epoch: 63, step: 960, loss: 0.31275486946105957, mean loss: 0.3399764400421742
Epoch: 63, step: 961, loss: 0.3258179724216461, mean loss: 0.33997628603530383
Epoch: 63, step: 962, loss: 0.3364744484424591, mean loss: 0.3399762479449401
Epoch: 63, step: 963, loss: 0.3044682741165161, mean loss: 0.3399758617200246
Epoch: 63, step: 964, loss: 0.2961834967136383, mean loss: 0.33997538538987454
Epoch: 63, step: 965, loss: 0.3626807928085327, mean loss: 0.33997563235421374
Epoch: 63, step: 966, loss: 0.29668474197387695, mean loss: 0.3399751614888532
Epoch: 63, step: 967, loss: 0.31757447123527527, mean loss: 0.33997491784419087
Epoch: 63, step: 968, loss: 0.38077184557914734, mean loss: 0.3399753615736232
Epoch: 63, step: 969, loss: 0.33747759461402893, mean loss: 0.33997533440685546
Epoch: 63, step: 970, loss: 0.3198719620704651, mean loss: 0.3399751157564706
Epoch: 63, step: 971, loss: 0.33382704854011536, mean loss: 0.3399750488889511
Epoch: 63, step: 972, loss: 0.3313569724559784, mean loss: 0.33997495515817255
Epoch: 63, step: 973, loss: 0.3016476631164551, mean loss: 0.3399745383125018
Epoch: 63, step: 974, loss: 0.3317931294441223, mean loss: 0.3399744493328845
Epoch: 63, step: 975, loss: 0.32979583740234375, mean loss: 0.33997433863322896
Epoch: 63, step: 976, loss: 0.35183456540107727, mean loss: 0.33997446762024097
Epoch: 63, step: 977, loss: 0.3768541216850281, mean loss: 0.3399748687040263
Epoch: 63, step: 978, loss: 0.40162503719329834, mean loss: 0.33997553917165024
Epoch: 63, step: 979, loss: 0.28441789746284485, mean loss: 0.3399749349690042
Epoch: 63, step: 980, loss: 0.3380090892314911, mean loss: 0.339974913590194
Epoch: 63, step: 981, loss: 0.3427298665046692, mean loss: 0.33997494355031443
Epoch: 63, step: 982, loss: 0.35138487815856934, mean loss: 0.33997506763203494
Epoch: 63, step: 983, loss: 0.33210623264312744, mean loss: 0.33997498206029425
Epoch: 63, step: 984, loss: 0.3450435698032379, mean loss: 0.3399750371794015
Epoch: 63, step: 985, loss: 0.34641292691230774, mean loss: 0.33997510718842444
Epoch: 63, step: 986, loss: 0.3422016501426697, mean loss: 0.33997513140076857
Epoch: 63, step: 987, loss: 0.3250509798526764, mean loss: 0.3399749691111693
Epoch: 63, step: 988, loss: 0.32675760984420776, mean loss: 0.33997482538329266
Epoch: 63, step: 989, loss: 0.3357808291912079, mean loss: 0.33997477977754037
Epoch: 63, step: 990, loss: 0.32287055253982544, mean loss: 0.33997459378722644
Epoch: 63, step: 991, loss: 0.3148881494998932, mean loss: 0.339974321001742
Epoch: 63, step: 992, loss: 0.31991416215896606, mean loss: 0.3399741028735537
Epoch: 63, step: 993, loss: 0.33324339985847473, mean loss: 0.339974029686691
Epoch: 63, step: 994, loss: 0.32674741744995117, mean loss: 0.3399738858675794
Epoch: 63, step: 995, loss: 0.3375091850757599, mean loss: 0.3399738590680318
Epoch: 63, step: 996, loss: 0.28659576177597046, mean loss: 0.3399732786757551
Epoch: 63, step: 997, loss: 0.33550238609313965, mean loss: 0.3399732300632447
Epoch: 63, step: 998, loss: 0.3033578395843506, mean loss: 0.33997283194437594
Epoch: 63, step: 999, loss: 0.33171647787094116, mean loss: 0.33997274217407547
Epoch: 63, step: 1000, loss: 0.3138889670372009, mean loss: 0.33997245857154934
Epoch: 63, step: 1001, loss: 0.37172871828079224, mean loss: 0.3399728038458628
Epoch: 63, step: 1002, loss: 0.29114484786987305, mean loss: 0.33997227296294924
Epoch: 63, step: 1003, loss: 0.2945866882801056, mean loss: 0.33997177951265045
Epoch: 63, step: 1004, loss: 0.37728622555732727, mean loss: 0.3399721852058786
Epoch: 63, step: 1005, loss: 0.4172074794769287, mean loss: 0.3399730249207481
Epoch: 63, step: 1006, loss: 0.3504592478275299, mean loss: 0.3399731389274551
Epoch: 63, step: 1007, loss: 0.36717209219932556, mean loss: 0.33997343463253527
Epoch: 63, step: 1008, loss: 0.36316540837287903, mean loss: 0.3399736867712785
Epoch: 63, step: 1009, loss: 0.30897536873817444, mean loss: 0.3399733497671034
Epoch: 63, step: 1010, loss: 0.32888028025627136, mean loss: 0.3399732291679763
Epoch: 63, step: 1011, loss: 0.36469975113868713, mean loss: 0.3399734979812696
Epoch: 63, step: 1012, loss: 0.34366628527641296, mean loss: 0.33997353812680736
Epoch: 63, step: 1013, loss: 0.35470572113990784, mean loss: 0.3399736982836031
Epoch: 63, step: 1014, loss: 0.3492453694343567, mean loss: 0.33997379907687986
Epoch: 63, step: 1015, loss: 0.35070234537124634, mean loss: 0.3399739157067261
Epoch: 63, step: 1016, loss: 0.32459592819213867, mean loss: 0.3399737485346999
Epoch: 63, step: 1017, loss: 0.32952892780303955, mean loss: 0.33997363499169814
Epoch: 63, step: 1018, loss: 0.3245169520378113, mean loss: 0.3399734669678376
Epoch: 63, step: 1019, loss: 0.3595777451992035, mean loss: 0.33997368007634954
Epoch: 63, step: 1020, loss: 0.322496235370636, mean loss: 0.339973490089669
Epoch: 63, step: 1021, loss: 0.3734385073184967, mean loss: 0.33997385386358064
Epoch: 63, step: 1022, loss: 0.3349623382091522, mean loss: 0.33997379938762373
Epoch: 63, step: 1023, loss: 0.31299349665641785, mean loss: 0.3399735061107124
Epoch: 63, step: 1024, loss: 0.3519538342952728, mean loss: 0.33997363633591743
Epoch: 63, step: 1025, loss: 0.3143477737903595, mean loss: 0.33997335778787785
Epoch: 63, step: 1026, loss: 0.3068188428878784, mean loss: 0.3399729974087987
Epoch: 63, step: 1027, loss: 0.2958504259586334, mean loss: 0.33997251781563076
Epoch: 63, step: 1028, loss: 0.30157774686813354, mean loss: 0.33997210048570015
Epoch: 63, step: 1029, loss: 0.29857078194618225, mean loss: 0.3399716504811509
Epoch: 63, step: 1030, loss: 0.33933955430984497, mean loss: 0.3399716436107644
Epoch: 63, step: 1031, loss: 0.320779412984848, mean loss: 0.3399714350086316
Epoch: 63, step: 1032, loss: 0.3134726583957672, mean loss: 0.33997114699410397
Epoch: 63, step: 1033, loss: 0.31406527757644653, mean loss: 0.3399708654269299
Epoch: 63, step: 1034, loss: 0.3053749203681946, mean loss: 0.3399704894126586
Epoch: 63, step: 1035, loss: 0.3266266882419586, mean loss: 0.33997034438395274
Epoch: 63, step: 1036, loss: 0.31670844554901123, mean loss: 0.33997009156195884
Epoch: 63, step: 1037, loss: 0.3331531286239624, mean loss: 0.3399700174725888
Epoch: 63, step: 1038, loss: 0.35076120495796204, mean loss: 0.33997013475408216
Epoch: 63, step: 1039, loss: 0.3653426468372345, mean loss: 0.3399704105062893
Epoch: 63, step: 1040, loss: 0.37538790702819824, mean loss: 0.33997079542468694
Epoch: 63, step: 1041, loss: 0.3297654390335083, mean loss: 0.3399706845137778
Epoch: 63, step: 1042, loss: 0.33010438084602356, mean loss: 0.33997057728882896
Epoch: 63, step: 1043, loss: 0.34134599566459656, mean loss: 0.3399705922364291
Epoch: 63, step: 1044, loss: 0.33562925457954407, mean loss: 0.33997054505669433
Epoch: 63, step: 1045, loss: 0.361113041639328, mean loss: 0.3399707748214858
Epoch: 63, step: 1046, loss: 0.3225140869617462, mean loss: 0.3399705851140573
Epoch: 63, step: 1047, loss: 0.3350839614868164, mean loss: 0.33997053201012745
Epoch: 63, step: 1048, loss: 0.3447822332382202, mean loss: 0.33997058429929217
Epoch: 63, step: 1049, loss: 0.3670784533023834, mean loss: 0.3399708788795991
Epoch: 63, step: 1050, loss: 0.31597641110420227, mean loss: 0.3399706181353528
Epoch: 63, step: 1051, loss: 0.3501139283180237, mean loss: 0.3399707283599701
Epoch: 63, step: 1052, loss: 0.32706549763679504, mean loss: 0.33997058812383074
Epoch: 63, step: 1053, loss: 0.3982628583908081, mean loss: 0.3399712215564505
Epoch: 63, step: 1054, loss: 0.33458080887794495, mean loss: 0.3399711629821986
Epoch: 63, step: 1055, loss: 0.2933230698108673, mean loss: 0.3399706560919785
Epoch: 63, step: 1056, loss: 0.33092159032821655, mean loss: 0.3399705577635629
Epoch: 63, step: 1057, loss: 0.3396328091621399, mean loss: 0.3399705540935792
Epoch: 63, step: 1058, loss: 0.38019317388534546, mean loss: 0.33997099114869966
Epoch: 63, step: 1059, loss: 0.3399667739868164, mean loss: 0.3399709911028769
Epoch: 63, step: 1060, loss: 0.3689723014831543, mean loss: 0.33997130622147975
Epoch: 63, step: 1061, loss: 0.3066615164279938, mean loss: 0.3399709442923036
Epoch: 63, step: 1062, loss: 0.32547497749328613, mean loss: 0.3399707867873675
Epoch: 63, step: 1063, loss: 0.33775466680526733, mean loss: 0.33997076270852894
Epoch: 63, step: 1064, loss: 0.3155602514743805, mean loss: 0.3399704974835517
Epoch: 63, step: 1065, loss: 0.36189156770706177, mean loss: 0.3399707356576778
Epoch: 63, step: 1066, loss: 0.3408960998058319, mean loss: 0.33997074571172176
Epoch: 63, step: 1067, loss: 0.33370065689086914, mean loss: 0.3399706775882013
Epoch: 63, step: 1068, loss: 0.34052789211273193, mean loss: 0.33997068364218297
Epoch: 63, step: 1069, loss: 0.317411333322525, mean loss: 0.33997043854374615
Epoch: 63, step: 1070, loss: 0.38752448558807373, mean loss: 0.339970955194084
Epoch: 63, step: 1071, loss: 0.3437168300151825, mean loss: 0.3399709958906511
Epoch: 63, step: 1072, loss: 0.34526535868644714, mean loss: 0.3399710534099384
Epoch: 63, step: 1073, loss: 0.3191632926464081, mean loss: 0.3399708273516549
Epoch: 63, step: 1074, loss: 0.32150155305862427, mean loss: 0.33997062670117967
Epoch: 63, step: 1075, loss: 0.34723106026649475, mean loss: 0.3399707055777828
Epoch: 63, step: 1076, loss: 0.32801541686058044, mean loss: 0.3399705756981674
Epoch: 63, step: 1077, loss: 0.32976216077804565, mean loss: 0.33997046479740783
Epoch: 63, step: 1078, loss: 0.3347080647945404, mean loss: 0.3399704076290989
Epoch: 63, step: 1079, loss: 0.2889360189437866, mean loss: 0.33996985322084394
Epoch: 63, step: 1080, loss: 0.34385403990745544, mean loss: 0.3399698954159564
Epoch: 63, step: 1081, loss: 0.31165260076522827, mean loss: 0.3399695877998327
Epoch: 63, step: 1082, loss: 0.3176801800727844, mean loss: 0.33996934566841425
Epoch: 63, step: 1083, loss: 0.31721723079681396, mean loss: 0.33996909851326007
Epoch: 63, step: 1084, loss: 0.30842024087905884, mean loss: 0.3399687558032257
Epoch: 63, step: 1085, loss: 0.36993545293807983, mean loss: 0.3399690813229756
Epoch: 63, step: 1086, loss: 0.3176891803741455, mean loss: 0.33996883930534616
Epoch: 63, step: 1087, loss: 0.3553392291069031, mean loss: 0.3399690062659132
Epoch: 63, step: 1088, loss: 0.33370816707611084, mean loss: 0.33996893825840524
Epoch: 63, step: 1089, loss: 0.3435206413269043, mean loss: 0.3399689768378742
Epoch: 63, step: 1090, loss: 0.2994298040866852, mean loss: 0.33996853649623043
Epoch: 63, step: 1091, loss: 0.3407442569732666, mean loss: 0.33996854492211326
Epoch: 63, step: 1092, loss: 0.3989261984825134, mean loss: 0.3399691853137231
Epoch: 63, step: 1093, loss: 0.31050145626068115, mean loss: 0.3399688652419371
Epoch: 63, step: 1094, loss: 0.34456413984298706, mean loss: 0.3399689151542249
Epoch: 63, step: 1095, loss: 0.33463549613952637, mean loss: 0.3399688572250963
Epoch: 63, step: 1096, loss: 0.3330594003200531, mean loss: 0.3399687821785887
Epoch: 63, step: 1097, loss: 0.30105310678482056, mean loss: 0.3399683595037175
Epoch: 63, step: 1098, loss: 0.3545154929161072, mean loss: 0.3399685175027988
Epoch: 63, step: 1099, loss: 0.30909475684165955, mean loss: 0.3399681821808696
Epoch: 63, step: 1100, loss: 0.339199960231781, mean loss: 0.33996817383725153
Epoch: 63, step: 1101, loss: 0.3470746576786041, mean loss: 0.3399682510195597
Epoch: 63, step: 1102, loss: 0.3423730432987213, mean loss: 0.33996827713731453
Epoch: 63, step: 1103, loss: 0.3206799328327179, mean loss: 0.33996806765444926
Epoch: 63, step: 1104, loss: 0.3220866918563843, mean loss: 0.339967873454206
Epoch: 63, step: 1105, loss: 0.3531988561153412, mean loss: 0.33996801714740804
Epoch: 63, step: 1106, loss: 0.31304097175598145, mean loss: 0.339967724713244
Epoch: 63, step: 1107, loss: 0.28970739245414734, mean loss: 0.33996717887992234
Epoch: 63, step: 1108, loss: 0.35230863094329834, mean loss: 0.3399673129081373
Epoch: 63, step: 1109, loss: 0.29775911569595337, mean loss: 0.3399668545319377
Epoch: 63, step: 1110, loss: 0.34935417771339417, mean loss: 0.3399669564760879
Epoch: 63, step: 1111, loss: 0.3213789761066437, mean loss: 0.339966754617129
Epoch: 63, step: 1112, loss: 0.30337950587272644, mean loss: 0.33996635729673214
Epoch: 63, step: 1113, loss: 0.333094984292984, mean loss: 0.3399662826776478
Epoch: 63, step: 1114, loss: 0.34340864419937134, mean loss: 0.33996632005927085
Epoch: 63, step: 1115, loss: 0.33145302534103394, mean loss: 0.3399662276118866
Epoch: 63, step: 1116, loss: 0.3138256371021271, mean loss: 0.3399659437496391
Epoch: 63, step: 1117, loss: 0.3427070081233978, mean loss: 0.3399659735146991
Epoch: 63, step: 1118, loss: 0.3338293433189392, mean loss: 0.33996590687810924
Epoch: 63, step: 1119, loss: 0.342755526304245, mean loss: 0.33996593716976786
Epoch: 63, step: 1120, loss: 0.3124220073223114, mean loss: 0.3399656380815652
Epoch: 63, step: 1121, loss: 0.31305578351020813, mean loss: 0.339965345881698
Epoch: 63, step: 1122, loss: 0.36205169558525085, mean loss: 0.3399655857030749
Epoch: 63, step: 1123, loss: 0.37821388244628906, mean loss: 0.33996600101206487
Epoch: 63, step: 1124, loss: 0.30874359607696533, mean loss: 0.3399656619955395
Epoch: 63, step: 1125, loss: 0.35463187098503113, mean loss: 0.3399658212412233
Epoch: 63, step: 1126, loss: 0.3171047270298004, mean loss: 0.3399655730181784
Epoch: 63, step: 1127, loss: 0.34684664011001587, mean loss: 0.33996564773117616
Epoch: 63, step: 1128, loss: 0.3511465787887573, mean loss: 0.33996576912976095
Epoch: 63, step: 1129, loss: 0.33796170353889465, mean loss: 0.3399657473705636
Epoch: 63, step: 1130, loss: 0.37461352348327637, mean loss: 0.33996612355566197
Epoch: 63, step: 1131, loss: 0.3062320053577423, mean loss: 0.3399657572944985
Epoch: 63, step: 1132, loss: 0.31443530321121216, mean loss: 0.33996548010591937
Epoch: 63, step: 1133, loss: 0.3538914620876312, mean loss: 0.3399656313010856
Epoch: 63, step: 1134, loss: 0.3466389775276184, mean loss: 0.3399657037531927
Epoch: 63, step: 1135, loss: 0.2904854714870453, mean loss: 0.3399651665552048
Epoch: 63, step: 1136, loss: 0.32633864879608154, mean loss: 0.33996501861615697
Epoch: 63, step: 1137, loss: 0.30951955914497375, mean loss: 0.339964688082453
Epoch: 63, step: 1138, loss: 0.3090479373931885, mean loss: 0.3399643524357801
Epoch: 63, step: 1139, loss: 0.3228669762611389, mean loss: 0.3399641668207009
Epoch: 63, step: 1140, loss: 0.3122688829898834, mean loss: 0.33996386615430385
Epoch: 63, step: 1141, loss: 0.3328644037246704, mean loss: 0.3399637890817369
Epoch: 63, step: 1142, loss: 0.34165579080581665, mean loss: 0.3399638074500995
Epoch: 63, step: 1143, loss: 0.3230425715446472, mean loss: 0.33996362375523753
Epoch: 63, step: 1144, loss: 0.3456025719642639, mean loss: 0.33996368497030327
Epoch: 63, step: 1145, loss: 0.3253154754638672, mean loss: 0.3399635259545897
Epoch: 63, step: 1146, loss: 0.32327204942703247, mean loss: 0.3399633447598684
Epoch: 63, step: 1147, loss: 0.33320382237434387, mean loss: 0.3399632713825086
Epoch: 63, step: 1148, loss: 0.3173736333847046, mean loss: 0.33996302616547885
Epoch: 63, step: 1149, loss: 0.35905325412750244, mean loss: 0.33996323339315476
Epoch: 63, step: 1150, loss: 0.2941679358482361, mean loss: 0.3399627362827964
Epoch: 63, step: 1151, loss: 0.37157297134399414, mean loss: 0.33996307940983234
Epoch: 63, step: 1152, loss: 0.303609162569046, mean loss: 0.33996268479472413
Epoch: 63, step: 1153, loss: 0.34506756067276, mean loss: 0.3399627402066152
Epoch: 63, step: 1154, loss: 0.3275330066680908, mean loss: 0.3399626052870635
Epoch: 63, step: 1155, loss: 0.3932686448097229, mean loss: 0.3399631838955161
Epoch: 63, step: 1156, loss: 0.37747737765312195, mean loss: 0.3399635910875377
Epoch: 63, step: 1157, loss: 0.3461931645870209, mean loss: 0.3399636587047471
Epoch: 63, step: 1158, loss: 0.35084420442581177, mean loss: 0.33996377680338624
Epoch: 63, step: 1159, loss: 0.32894366979599, mean loss: 0.33996365719123184
Epoch: 63, step: 1160, loss: 0.34464162588119507, mean loss: 0.33996370796531594
Epoch: 63, step: 1161, loss: 0.33921244740486145, mean loss: 0.33996369981131674
Epoch: 63, step: 1162, loss: 0.29941582679748535, mean loss: 0.3399632597193537
Epoch: 63, step: 1163, loss: 0.31557121872901917, mean loss: 0.33996299497982746
Epoch: 63, step: 1164, loss: 0.3610333800315857, mean loss: 0.3399632236652096
Epoch: 63, step: 1165, loss: 0.36326056718826294, mean loss: 0.33996347651792536
Epoch: 63, step: 1166, loss: 0.331807941198349, mean loss: 0.3399633880045345
Epoch: 63, step: 1167, loss: 0.36104699969291687, mean loss: 0.33996361682602017
Epoch: 63, step: 1168, loss: 0.3744008243083954, mean loss: 0.3399639905706885
Epoch: 63, step: 1169, loss: 0.33052802085876465, mean loss: 0.339963888163863
Epoch: 63, step: 1170, loss: 0.32612332701683044, mean loss: 0.33996373795645557
Epoch: 63, step: 1171, loss: 0.3471006155014038, mean loss: 0.3399638154099799
Epoch: 63, step: 1172, loss: 0.3370601236820221, mean loss: 0.33996378389777926
Epoch: 63, step: 1173, loss: 0.35442668199539185, mean loss: 0.33996394085411047
Epoch: 63, step: 1174, loss: 0.3230028748512268, mean loss: 0.33996375678880175
Epoch: 63, step: 1175, loss: 0.34247371554374695, mean loss: 0.33996378402714394
Epoch: 63, step: 1176, loss: 0.3238752484321594, mean loss: 0.3399636094345212
Epoch: 63, step: 1177, loss: 0.33763420581817627, mean loss: 0.3399635841561314
Epoch: 63, step: 1178, loss: 0.33350804448127747, mean loss: 0.3399635141022017
Epoch: 63, step: 1179, loss: 0.31912416219711304, mean loss: 0.33996328796113146
Epoch: 63, step: 1180, loss: 0.3258517384529114, mean loss: 0.3399631348293885
Epoch: 63, step: 1181, loss: 0.33628636598587036, mean loss: 0.33996309493129573
Epoch: 63, step: 1182, loss: 0.36995723843574524, mean loss: 0.33996342040624017
Epoch: 63, step: 1183, loss: 0.33626222610473633, mean loss: 0.33996338024396855
Epoch: 63, step: 1184, loss: 0.3334271013736725, mean loss: 0.33996330931849494
Epoch: 63, step: 1185, loss: 0.32150450348854065, mean loss: 0.3399631090232864
Epoch: 63, step: 1186, loss: 0.3402019739151001, mean loss: 0.3399631116151645
Epoch: 63, step: 1187, loss: 0.3169746696949005, mean loss: 0.3399628621746055
Epoch: 63, step: 1188, loss: 0.3317171335220337, mean loss: 0.33996277270369424
Epoch: 63, step: 1189, loss: 0.31875360012054443, mean loss: 0.33996254257443725
Epoch: 63, step: 1190, loss: 0.3236134946346283, mean loss: 0.3399623651816881
Epoch: 63, step: 1191, loss: 0.3266655504703522, mean loss: 0.33996222090827644
Epoch: 63, step: 1192, loss: 0.31979620456695557, mean loss: 0.3399620021048658
Epoch: 63, step: 1193, loss: 0.3583083152770996, mean loss: 0.33996220116214476
Epoch: 63, step: 1194, loss: 0.3306010663509369, mean loss: 0.3399620995950458
Epoch: 63, step: 1195, loss: 0.32588741183280945, mean loss: 0.3399619468881653
Epoch: 63, step: 1196, loss: 0.31454557180404663, mean loss: 0.3399616711297749
Epoch: 63, step: 1197, loss: 0.3151417672634125, mean loss: 0.3399614018458011
Epoch: 63, step: 1198, loss: 0.3011883795261383, mean loss: 0.3399609811817927
Epoch: 63, step: 1199, loss: 0.3361613154411316, mean loss: 0.3399609399581484
Epoch: 63, step: 1200, loss: 0.33947545289993286, mean loss: 0.3399609346910197
Epoch: 63, step: 1201, loss: 0.35152173042297363, mean loss: 0.3399610601146286
Epoch: 63, step: 1202, loss: 0.34767842292785645, mean loss: 0.3399611438397473
Epoch: 63, step: 1203, loss: 0.30945199728012085, mean loss: 0.3399608128517834
Epoch: 63, step: 1204, loss: 0.3293205201625824, mean loss: 0.3399606974185117
Epoch: 63, step: 1205, loss: 0.3676193654537201, mean loss: 0.3399609974756624
Epoch: 63, step: 1206, loss: 0.344135046005249, mean loss: 0.3399610427576521
Epoch: 63, step: 1207, loss: 0.3362370729446411, mean loss: 0.33996100235876064
Epoch: 63, step: 1208, loss: 0.337271124124527, mean loss: 0.339960973178363
Epoch: 63, step: 1209, loss: 0.31154003739356995, mean loss: 0.33996066486507204
Epoch: 63, step: 1210, loss: 0.33668839931488037, mean loss: 0.33996062936757737
Epoch: 63, step: 1211, loss: 0.31820881366729736, mean loss: 0.33996039340671974
Epoch: 63, step: 1212, loss: 0.3174504041671753, mean loss: 0.33996014922394335
Epoch: 63, step: 1213, loss: 0.3123815953731537, mean loss: 0.33995985006188134
Epoch: 63, step: 1214, loss: 0.3473978042602539, mean loss: 0.33995993074521197
Epoch: 63, step: 1215, loss: 0.3535473048686981, mean loss: 0.33996007813287765
Epoch: 63, step: 1216, loss: 0.33254188299179077, mean loss: 0.3399599976656295
Epoch: 63, step: 1217, loss: 0.3213443458080292, mean loss: 0.3399597957386108
Epoch: 63, step: 1218, loss: 0.32839053869247437, mean loss: 0.33995967024634965
Epoch: 63, step: 1219, loss: 0.3302839994430542, mean loss: 0.3399595652950437
Epoch: 63, step: 1220, loss: 0.35523784160614014, mean loss: 0.3399597310156115
Epoch: 63, step: 1221, loss: 0.3623298704624176, mean loss: 0.33995997365764297
Epoch: 63, step: 1222, loss: 0.3317328989505768, mean loss: 0.33995988442205854
Epoch: 63, step: 1223, loss: 0.3241727948188782, mean loss: 0.3399597131880614
Epoch: 63, step: 1224, loss: 0.3325830101966858, mean loss: 0.3399596331778334
Epoch: 63, step: 1225, loss: 0.3157730996608734, mean loss: 0.33995937084531513
Epoch: 63, step: 1226, loss: 0.3204939663410187, mean loss: 0.33995915972150137
Epoch: 63, step: 1227, loss: 0.3055948317050934, mean loss: 0.33995878700644694
Epoch: 63, step: 1228, loss: 0.3711756467819214, mean loss: 0.3399591255804296
Epoch: 63, step: 1229, loss: 0.30782362818717957, mean loss: 0.33995877704680355
Epoch: 63, step: 1230, loss: 0.32863304018974304, mean loss: 0.3399586542120058
Epoch: 63, step: 1231, loss: 0.35471609234809875, mean loss: 0.33995881426404406
Epoch: 63, step: 1232, loss: 0.30268192291259766, mean loss: 0.33995840998128984
Epoch: 63, step: 1233, loss: 0.3050580620765686, mean loss: 0.3399580314772022
Epoch: 63, step: 1234, loss: 0.3604307472705841, mean loss: 0.3399582535071543
Epoch: 63, step: 1235, loss: 0.32178688049316406, mean loss: 0.3399580564377784
Epoch: 63, step: 1236, loss: 0.2849997878074646, mean loss: 0.33995746041929176
Epoch: 63, step: 1237, loss: 0.3721349835395813, mean loss: 0.33995780937844067
Epoch: 63, step: 1238, loss: 0.3749825060367584, mean loss: 0.33995818921052856
Epoch: 63, step: 1239, loss: 0.34867504239082336, mean loss: 0.3399582837411014
Epoch: 63, step: 1240, loss: 0.3223014771938324, mean loss: 0.3399580922626054
Epoch: 63, step: 1241, loss: 0.33743464946746826, mean loss: 0.33995806489753294
Epoch: 63, step: 1242, loss: 0.38604649901390076, mean loss: 0.33995856469077823
Epoch: 63, step: 1243, loss: 0.3733108937740326, mean loss: 0.33995892636694164
Epoch: 63, step: 1244, loss: 0.3136690855026245, mean loss: 0.33995864128023456
Epoch: 63, step: 1245, loss: 0.32478067278862, mean loss: 0.339958476692318
Epoch: 63, step: 1246, loss: 0.367446631193161, mean loss: 0.33995877476705855
Epoch: 63, step: 1247, loss: 0.34850040078163147, mean loss: 0.3399588673893315
Epoch: 63, step: 1248, loss: 0.36153239011764526, mean loss: 0.33995910132219637
Epoch: 63, step: 1249, loss: 0.3371995985507965, mean loss: 0.3399590713998051
Epoch: 63, step: 1250, loss: 0.3188101351261139, mean loss: 0.33995884207592414
Epoch: 63, step: 1251, loss: 0.3738303482532501, mean loss: 0.33995920935023644
Epoch: 63, step: 1252, loss: 0.3337969183921814, mean loss: 0.3399591425322266
Epoch: 63, step: 1253, loss: 0.3198421597480774, mean loss: 0.33995892440520403
Epoch: 63, step: 1254, loss: 0.35149577260017395, mean loss: 0.3399590494970773
Epoch: 63, step: 1255, loss: 0.34974613785743713, mean loss: 0.3399591556154834
Epoch: 63, step: 1256, loss: 0.31813719868659973, mean loss: 0.3399589190092432
Epoch: 63, step: 1257, loss: 0.3020825982093811, mean loss: 0.3399585083367852
Epoch: 63, step: 1258, loss: 0.32446563243865967, mean loss: 0.3399583403577337
Epoch: 63, step: 1259, loss: 0.29611119627952576, mean loss: 0.3399578649571777
Epoch: 63, step: 1260, loss: 0.2991570830345154, mean loss: 0.33995742259075873
Epoch: 63, step: 1261, loss: 0.3228287994861603, mean loss: 0.3399572368824179
Epoch: 63, step: 1262, loss: 0.3286517560482025, mean loss: 0.33995711430984965
Epoch: 63, step: 1263, loss: 0.31480327248573303, mean loss: 0.3399568415980904
Epoch: 63, step: 1264, loss: 0.3474899232387543, mean loss: 0.33995692326902116
Epoch: 63, step: 1265, loss: 0.32917705178260803, mean loss: 0.33995680639884307
Epoch: 63, step: 1266, loss: 0.33158937096595764, mean loss: 0.339956715684119
Epoch: 63, step: 1267, loss: 0.32232463359832764, mean loss: 0.33995652452971653
Epoch: 63, step: 1268, loss: 0.3432830274105072, mean loss: 0.3399565605928867
Epoch: 63, step: 1269, loss: 0.31939953565597534, mean loss: 0.3399563377331814
Epoch: 63, step: 1270, loss: 0.3260101079940796, mean loss: 0.3399561865430668
Epoch: 63, step: 1271, loss: 0.3550305664539337, mean loss: 0.33995634996160795
Epoch: 63, step: 1272, loss: 0.4088295102119446, mean loss: 0.3399570965945989
Epoch: 63, step: 1273, loss: 0.312898188829422, mean loss: 0.3399568032603864
Epoch: 63, step: 1274, loss: 0.3365142345428467, mean loss: 0.3399567659413547
Epoch: 63, step: 1275, loss: 0.3285016119480133, mean loss: 0.33995664176355145
Epoch: 63, step: 1276, loss: 0.30193182826042175, mean loss: 0.33995622956598287
Epoch: 63, step: 1277, loss: 0.33421850204467773, mean loss: 0.33995616736839457
Epoch: 63, step: 1278, loss: 0.3440984785556793, mean loss: 0.33995621227101014
Epoch: 63, step: 1279, loss: 0.3363191783428192, mean loss: 0.33995617284602286
Epoch: 63, step: 1280, loss: 0.35277777910232544, mean loss: 0.3399563118291048
Epoch: 63, step: 1281, loss: 0.3544884920120239, mean loss: 0.339956469352683
Epoch: 63, step: 1282, loss: 0.3614864945411682, mean loss: 0.33995670272784084
Epoch: 63, step: 1283, loss: 0.36606329679489136, mean loss: 0.3399569857077453
Epoch: 63, step: 1284, loss: 0.33571094274520874, mean loss: 0.33995693968367163
Epoch: 63, step: 1285, loss: 0.31347203254699707, mean loss: 0.33995665260930263
Epoch: 63, step: 1286, loss: 0.3263324201107025, mean loss: 0.3399565049355527
Epoch: 63, step: 1287, loss: 0.3599245846271515, mean loss: 0.33995672136823957
Epoch: 63, step: 1288, loss: 0.3029981255531311, mean loss: 0.3399563207808211
Epoch: 63, step: 1289, loss: 0.3518121838569641, mean loss: 0.3399564492829463
Epoch: 63, step: 1290, loss: 0.29948553442955017, mean loss: 0.339956010635657
Epoch: 63, step: 1291, loss: 0.34775272011756897, mean loss: 0.33995609514000846
Epoch: 63, step: 1292, loss: 0.3115527927875519, mean loss: 0.3399557872951881
Epoch: 63, step: 1293, loss: 0.3207458257675171, mean loss: 0.33995557909323365
Epoch: 63, step: 1294, loss: 0.3464963138103485, mean loss: 0.33995564998244343
Epoch: 63, step: 1295, loss: 0.3215656876564026, mean loss: 0.33995545067214816
Epoch: 63, step: 1296, loss: 0.32243549823760986, mean loss: 0.3399552607930725
Epoch: 63, step: 1297, loss: 0.3510856330394745, mean loss: 0.3399553814213617
Epoch: 63, step: 1298, loss: 0.3263266980648041, mean loss: 0.33995523371858016
Epoch: 63, step: 1299, loss: 0.329961359500885, mean loss: 0.33995512540973005
Epoch: 63, step: 1300, loss: 0.3500500023365021, mean loss: 0.3399552348120138
Epoch: 63, step: 1301, loss: 0.30660831928253174, mean loss: 0.3399548734218548
Epoch: 63, step: 1302, loss: 0.3468121886253357, mean loss: 0.3399549477357557
Epoch: 63, step: 1303, loss: 0.3158104717731476, mean loss: 0.33995468608076457
Epoch: 63, step: 1304, loss: 0.28195732831954956, mean loss: 0.3399540575670747
Epoch: 63, step: 1305, loss: 0.34357506036758423, mean loss: 0.33995409680722727
Epoch: 63, step: 1306, loss: 0.34370627999305725, mean loss: 0.3399541374685173
Epoch: 63, step: 1307, loss: 0.34627094864845276, mean loss: 0.33995420592117426
Epoch: 63, step: 1308, loss: 0.34853696823120117, mean loss: 0.3399542989279938
Epoch: 63, step: 1309, loss: 0.30246198177337646, mean loss: 0.3399538926481434
Epoch: 63, step: 1310, loss: 0.3698045313358307, mean loss: 0.3399542161165903
Epoch: 63, step: 1311, loss: 0.3252812922000885, mean loss: 0.3399540571191052
Epoch: 63, step: 1312, loss: 0.31908875703811646, mean loss: 0.3399538310227723
Epoch: 63, step: 1313, loss: 0.30710262060165405, mean loss: 0.33995347505100604
Epoch: 63, step: 1314, loss: 0.35009056329727173, mean loss: 0.33995358489408517
Epoch: 63, step: 1315, loss: 0.3341185450553894, mean loss: 0.3399535216676653
Epoch: 63, step: 1316, loss: 0.37811192870140076, mean loss: 0.33995393513413513
Epoch: 63, step: 1317, loss: 0.3084571063518524, mean loss: 0.3399535938530778
Epoch: 63, step: 1318, loss: 0.3141371011734009, mean loss: 0.3399533141238227
Epoch: 63, step: 1319, loss: 0.34768325090408325, mean loss: 0.33995339787904283
Epoch: 63, step: 1320, loss: 0.3251368999481201, mean loss: 0.3399532373414297
Epoch: 63, step: 1321, loss: 0.35392850637435913, mean loss: 0.33995338876263836
Epoch: 63, step: 1322, loss: 0.3152911067008972, mean loss: 0.33995312155117446
Epoch: 63, step: 1323, loss: 0.3688293695449829, mean loss: 0.339953434416824
Epoch: 63, step: 1324, loss: 0.34430602192878723, mean loss: 0.3399534815753179
Epoch: 63, step: 1325, loss: 0.3128243684768677, mean loss: 0.33995318764573007
Epoch: 63, step: 1326, loss: 0.31653133034706116, mean loss: 0.3399529338850469
Epoch: 63, step: 1327, loss: 0.3066692650318146, mean loss: 0.33995257328191736
Epoch: 63, step: 1328, loss: 0.33739835023880005, mean loss: 0.33995254560916144
Epoch: 63, step: 1329, loss: 0.31248554587364197, mean loss: 0.33995224803164703
Epoch: 63, step: 1330, loss: 0.3181861340999603, mean loss: 0.33995201222009236
Epoch: 63, step: 1331, loss: 0.34821847081184387, mean loss: 0.33995210177697605
Epoch: 63, step: 1332, loss: 0.3231349587440491, mean loss: 0.33995191958594595
Epoch: 63, step: 1333, loss: 0.34807145595550537, mean loss: 0.33995200754920263
Epoch: 63, step: 1334, loss: 0.37478360533714294, mean loss: 0.3399523848943421
Epoch: 63, step: 1335, loss: 0.33093494176864624, mean loss: 0.33995228720570053
Epoch: 63, step: 1336, loss: 0.33297860622406006, mean loss: 0.33995221165856015
Epoch: 63, step: 1337, loss: 0.3253314197063446, mean loss: 0.339952053270607
Epoch: 63, step: 1338, loss: 0.3303663432598114, mean loss: 0.3399519494291362
Epoch: 63, step: 1339, loss: 0.32595300674438477, mean loss: 0.3399517977810007
Epoch: 63, step: 1340, loss: 0.3313562572002411, mean loss: 0.3399517046679984
Epoch: 63, step: 1341, loss: 0.31066808104515076, mean loss: 0.33995138745041903
Epoch: 63, step: 1342, loss: 0.3069368898868561, mean loss: 0.33995102982167436
Epoch: 63, step: 1343, loss: 0.29611414670944214, mean loss: 0.33995055496484444
Epoch: 63, step: 1344, loss: 0.3276122212409973, mean loss: 0.339950421313039
Epoch: 63, step: 1345, loss: 0.3211002051830292, mean loss: 0.3399502171251652
Epoch: 63, step: 1346, loss: 0.3630092740058899, mean loss: 0.3399504669010172
Epoch: 63, step: 1347, loss: 0.38468408584594727, mean loss: 0.3399509514506158
Epoch: 63, step: 1348, loss: 0.3302977681159973, mean loss: 0.33995084688953725
Epoch: 63, step: 1349, loss: 0.3620157241821289, mean loss: 0.3399510858886631
Epoch: 63, step: 1350, loss: 0.3395257890224457, mean loss: 0.33995108128204427
Epoch: 63, step: 1351, loss: 0.36591339111328125, mean loss: 0.33995136249072055
Epoch: 63, step: 1352, loss: 0.2866816520690918, mean loss: 0.3399507855103748
Epoch: 63, step: 1353, loss: 0.300126314163208, mean loss: 0.3399503541641522
Epoch: 63, step: 1354, loss: 0.3134510815143585, mean loss: 0.33995006714873255
Epoch: 63, step: 1355, loss: 0.35763660073280334, mean loss: 0.3399502587107027
Epoch: 63, step: 1356, loss: 0.31312090158462524, mean loss: 0.3399499681264104
Epoch: 63, step: 1357, loss: 0.3105108439922333, mean loss: 0.33994964927962024
Epoch: 63, step: 1358, loss: 0.32674679160118103, mean loss: 0.3399495062847683
Epoch: 63, step: 1359, loss: 0.33176350593566895, mean loss: 0.33994941762644454
Epoch: 63, step: 1360, loss: 0.34968364238739014, mean loss: 0.33994952305164206
Epoch: 63, step: 1361, loss: 0.35373935103416443, mean loss: 0.33994967239888124
Epoch: 63, step: 1362, loss: 0.3533918857574463, mean loss: 0.3399498179797916
Epoch: 63, step: 1363, loss: 0.33625519275665283, mean loss: 0.33994977796695564
Epoch: 63, step: 1364, loss: 0.3184942603111267, mean loss: 0.33994954560595564
Epoch: 63, step: 1365, loss: 0.39054369926452637, mean loss: 0.33995009352938543
Epoch: 63, step: 1366, loss: 0.3004607558250427, mean loss: 0.3399496658732737
Epoch: 63, step: 1367, loss: 0.31381136178970337, mean loss: 0.33994938280738585
Epoch: 63, step: 1368, loss: 0.312094122171402, mean loss: 0.33994908115091
Epoch: 63, step: 1369, loss: 0.3114283084869385, mean loss: 0.33994877229066583
Epoch: 63, step: 1370, loss: 0.3273746073246002, mean loss: 0.33994863612262965
Epoch: 63, step: 1371, loss: 0.3547562062740326, mean loss: 0.33994879647490106
Epoch: 63, step: 1372, loss: 0.3101661801338196, mean loss: 0.33994847396024036
Epoch: 63, step: 1373, loss: 0.3060254156589508, mean loss: 0.33994810661289127
Epoch: 63, step: 1374, loss: 0.3500438928604126, mean loss: 0.33994821593735497
Epoch: 63, step: 1375, loss: 0.32434430718421936, mean loss: 0.3399480469687931
Epoch: 63, step: 1376, loss: 0.32506534457206726, mean loss: 0.339947885811635
Epoch: 63, step: 1377, loss: 0.342097669839859, mean loss: 0.3399479090902926
Epoch: 63, step: 1378, loss: 0.34390315413475037, mean loss: 0.33994795191868693
Epoch: 63, step: 1379, loss: 0.3177339434623718, mean loss: 0.33994771138238605
Epoch: 63, step: 1380, loss: 0.3239045739173889, mean loss: 0.3399475376669955
Epoch: 63, step: 1381, loss: 0.3381173014640808, mean loss: 0.33994751784937843
Epoch: 63, step: 1382, loss: 0.32227614521980286, mean loss: 0.339947326507571
Epoch: 63, step: 1383, loss: 0.36189910769462585, mean loss: 0.3399475641941445
Epoch: 63, step: 1384, loss: 0.3118843138217926, mean loss: 0.3399472603379087
Epoch: 63, step: 1385, loss: 0.3235146403312683, mean loss: 0.3399470824148267
Epoch: 63, step: 1386, loss: 0.30954623222351074, mean loss: 0.3399467532552408
Epoch: 63, step: 1387, loss: 0.33386847376823425, mean loss: 0.3399466874445058
Epoch: 63, step: 1388, loss: 0.33478277921676636, mean loss: 0.3399466315344547
Epoch: 63, step: 1389, loss: 0.3096148371696472, mean loss: 0.33994630313322516
Epoch: 63, step: 1390, loss: 0.3253597915172577, mean loss: 0.3399461452073066
Epoch: 63, step: 1391, loss: 0.3153494894504547, mean loss: 0.3399458789059797
Epoch: 63, step: 1392, loss: 0.3066825568675995, mean loss: 0.33994551877690443
Epoch: 63, step: 1393, loss: 0.284302294254303, mean loss: 0.33994491635583474
Epoch: 63, step: 1394, loss: 0.3591682016849518, mean loss: 0.3399451244743763
Epoch: 63, step: 1395, loss: 0.30200740694999695, mean loss: 0.3399447137507759
Epoch: 63, step: 1396, loss: 0.32525306940078735, mean loss: 0.3399445546969337
Epoch: 63, step: 1397, loss: 0.31298139691352844, mean loss: 0.3399442627930928
Epoch: 63, step: 1398, loss: 0.3071541488170624, mean loss: 0.3399439078103171
Epoch: 63, step: 1399, loss: 0.3330417275428772, mean loss: 0.33994383308875353
Epoch: 63, step: 1400, loss: 0.3093201220035553, mean loss: 0.3399435015664355
Epoch: 63, step: 1401, loss: 0.31520360708236694, mean loss: 0.3399432337432982
Epoch: 63, step: 1402, loss: 0.3151935040950775, mean loss: 0.3399429658165902
Epoch: 63, step: 1403, loss: 0.31713050603866577, mean loss: 0.33994271886435395
Epoch: 63, step: 1404, loss: 0.3618837893009186, mean loss: 0.3399429563809483
Epoch: 63, step: 1405, loss: 0.32890209555625916, mean loss: 0.3399428368626558
Epoch: 63, step: 1406, loss: 0.295183926820755, mean loss: 0.3399423523487507
Epoch: 63, step: 1407, loss: 0.31553536653518677, mean loss: 0.339942088146696
Epoch: 63, step: 1408, loss: 0.31017106771469116, mean loss: 0.3399417658832389
Epoch: 63, step: 1409, loss: 0.3345482647418976, mean loss: 0.3399417075006412
Epoch: 63, step: 1410, loss: 0.33923232555389404, mean loss: 0.3399416998219346
Epoch: 63, step: 1411, loss: 0.3280434012413025, mean loss: 0.33994157103016787
Epoch: 63, step: 1412, loss: 0.3158703148365021, mean loss: 0.3399413104764395
Epoch: 63, step: 1413, loss: 0.3501366376876831, mean loss: 0.33994142083219914
Epoch: 63, step: 1414, loss: 0.3402649164199829, mean loss: 0.33994142433372626
Epoch: 63, step: 1415, loss: 0.3350856900215149, mean loss: 0.3399413717756634
Epoch: 63, step: 1416, loss: 0.3572930693626404, mean loss: 0.3399415595869568
Epoch: 63, step: 1417, loss: 0.34573549032211304, mean loss: 0.3399416222986219
Epoch: 63, step: 1418, loss: 0.30883029103279114, mean loss: 0.33994128556310366
Epoch: 63, step: 1419, loss: 0.3296314477920532, mean loss: 0.3399411739751115
Epoch: 63, step: 1420, loss: 0.3334471881389618, mean loss: 0.33994110368855474
Epoch: 63, step: 1421, loss: 0.34877026081085205, mean loss: 0.33994119924840843
Epoch: 63, step: 1422, loss: 0.3601168096065521, mean loss: 0.33994141761098606
Epoch: 63, step: 1423, loss: 0.3308769464492798, mean loss: 0.3399413195064019
Epoch: 63, step: 1424, loss: 0.3723853826522827, mean loss: 0.33994167064402697
Epoch: 63, step: 1425, loss: 0.32635268568992615, mean loss: 0.3399415235739069
Epoch: 63, step: 1426, loss: 0.3145446181297302, mean loss: 0.3399412487126482
Epoch: 63, step: 1427, loss: 0.33224064111709595, mean loss: 0.33994116537273916
Epoch: 63, step: 1428, loss: 0.349187433719635, mean loss: 0.33994126543949543
Epoch: 63, step: 1429, loss: 0.323932409286499, mean loss: 0.3399410921872265
Epoch: 63, step: 1430, loss: 0.3062320947647095, mean loss: 0.3399407273830814
Epoch: 63, step: 1431, loss: 0.3286232054233551, mean loss: 0.3399406049043796
Epoch: 63, step: 1432, loss: 0.27814584970474243, mean loss: 0.3399399361661598
Epoch: 63, step: 1433, loss: 0.3835732340812683, mean loss: 0.33994040835733697
Epoch: 63, step: 1434, loss: 0.3453078866004944, mean loss: 0.33994046644252796
Epoch: 63, step: 1435, loss: 0.3488803803920746, mean loss: 0.3399405631864673
Epoch: 63, step: 1436, loss: 0.32149890065193176, mean loss: 0.33994036362081315
Epoch: 63, step: 1437, loss: 0.3166886866092682, mean loss: 0.339940112006518
Epoch: 63, step: 1438, loss: 0.33624398708343506, mean loss: 0.33994007200992754
Epoch: 63, step: 1439, loss: 0.35245996713638306, mean loss: 0.33994020748903336
Epoch: 63, step: 1440, loss: 0.33668240904808044, mean loss: 0.33994017223643425
Epoch: 63, step: 1441, loss: 0.3539080023765564, mean loss: 0.3399403233805265
Epoch: 63, step: 1442, loss: 0.2904188930988312, mean loss: 0.33993978752130144
Epoch: 63, step: 1443, loss: 0.3206256926059723, mean loss: 0.33993957853048906
Valid: 63, mean loss: 0.18602798630793888
Epoch: 64, step: 0, loss: 0.39160624146461487, mean loss: 0.33994013759065045
Epoch: 64, step: 1, loss: 0.33296632766723633, mean loss: 0.33994006213121697
Epoch: 64, step: 2, loss: 0.33694443106651306, mean loss: 0.3399400297176325
Epoch: 64, step: 3, loss: 0.3200092315673828, mean loss: 0.3399398140630323
Epoch: 64, step: 4, loss: 0.2967204451560974, mean loss: 0.33993934642722545
Epoch: 64, step: 5, loss: 0.32282933592796326, mean loss: 0.33993916129803003
Epoch: 64, step: 6, loss: 0.3038659393787384, mean loss: 0.3399387709923494
Epoch: 64, step: 7, loss: 0.35744228959083557, mean loss: 0.33993896037517857
Epoch: 64, step: 8, loss: 0.3310509920120239, mean loss: 0.3399388642110632
Epoch: 64, step: 9, loss: 0.36049267649650574, mean loss: 0.33993908659234423
Epoch: 64, step: 10, loss: 0.3327266275882721, mean loss: 0.3399390085582308
Epoch: 64, step: 11, loss: 0.3246898055076599, mean loss: 0.3399388435735611
Epoch: 64, step: 12, loss: 0.3617914319038391, mean loss: 0.3399390799992319
Epoch: 64, step: 13, loss: 0.3513360619544983, mean loss: 0.3399392033031587
Epoch: 64, step: 14, loss: 0.3407055139541626, mean loss: 0.33993921159378254
Epoch: 64, step: 15, loss: 0.3285979628562927, mean loss: 0.33993908889548824
Epoch: 64, step: 16, loss: 0.3183210790157318, mean loss: 0.3399388550178701
Epoch: 64, step: 17, loss: 0.3413113057613373, mean loss: 0.3399388698657696
Epoch: 64, step: 18, loss: 0.3237558603286743, mean loss: 0.33993869479128985
Epoch: 64, step: 19, loss: 0.3819532096385956, mean loss: 0.3399391493167436
Epoch: 64, step: 20, loss: 0.3207128643989563, mean loss: 0.33993894132335445
Epoch: 64, step: 21, loss: 0.31214872002601624, mean loss: 0.339938640687022
Epoch: 64, step: 22, loss: 0.29798418283462524, mean loss: 0.33993818682601257
Epoch: 64, step: 23, loss: 0.31127581000328064, mean loss: 0.33993787676135634
Epoch: 64, step: 24, loss: 0.3174704611301422, mean loss: 0.3399376337153526
Epoch: 64, step: 25, loss: 0.34073325991630554, mean loss: 0.33993764232211365
Epoch: 64, step: 26, loss: 0.3258177638053894, mean loss: 0.33993748958065656
Epoch: 64, step: 27, loss: 0.35963261127471924, mean loss: 0.3399377026298722
Epoch: 64, step: 28, loss: 0.3062083125114441, mean loss: 0.3399373377708737
Epoch: 64, step: 29, loss: 0.3177850544452667, mean loss: 0.33993709814684103
Epoch: 64, step: 30, loss: 0.2864786982536316, mean loss: 0.3399365198868662
Epoch: 64, step: 31, loss: 0.33139267563819885, mean loss: 0.3399364274690286
Epoch: 64, step: 32, loss: 0.35212472081184387, mean loss: 0.3399365593070511
Epoch: 64, step: 33, loss: 0.3229696452617645, mean loss: 0.3399363757817504
Epoch: 64, step: 34, loss: 0.34860098361968994, mean loss: 0.33993646950283335
Epoch: 64, step: 35, loss: 0.3124310374259949, mean loss: 0.3399361719924271
Epoch: 64, step: 36, loss: 0.3169105648994446, mean loss: 0.33993592294039965
Epoch: 64, step: 37, loss: 0.3415558636188507, mean loss: 0.3399359404619853
Epoch: 64, step: 38, loss: 0.33538591861724854, mean loss: 0.3399358912486183
Epoch: 64, step: 39, loss: 0.3483527600765228, mean loss: 0.33993598228509864
Epoch: 64, step: 40, loss: 0.3557265102863312, mean loss: 0.3399361530729027
Epoch: 64, step: 41, loss: 0.3510822057723999, mean loss: 0.3399362736255071
Epoch: 64, step: 42, loss: 0.32541748881340027, mean loss: 0.33993611659606904
Epoch: 64, step: 43, loss: 0.33733588457107544, mean loss: 0.3399360884732914
Epoch: 64, step: 44, loss: 0.2989310324192047, mean loss: 0.3399356449884053
Epoch: 64, step: 45, loss: 0.3409096598625183, mean loss: 0.3399356555226234
Epoch: 64, step: 46, loss: 0.35173991322517395, mean loss: 0.33993578318728607
Epoch: 64, step: 47, loss: 0.3213944137096405, mean loss: 0.3399355826620062
Epoch: 64, step: 48, loss: 0.3802277147769928, mean loss: 0.3399360184175041
Epoch: 64, step: 49, loss: 0.3350091278553009, mean loss: 0.33993596513423713
Epoch: 64, step: 50, loss: 0.353094220161438, mean loss: 0.33993610743641006
Epoch: 64, step: 51, loss: 0.3295344114303589, mean loss: 0.3399359949467271
Epoch: 64, step: 52, loss: 0.37987637519836426, mean loss: 0.33993642687937753
Epoch: 64, step: 53, loss: 0.4130619764328003, mean loss: 0.3399372176823358
Epoch: 64, step: 54, loss: 0.3267318308353424, mean loss: 0.3399370748766254
Epoch: 64, step: 55, loss: 0.306232213973999, mean loss: 0.3399367103894195
Epoch: 64, step: 56, loss: 0.3317149877548218, mean loss: 0.33993662147997966
Epoch: 64, step: 57, loss: 0.3217262327671051, mean loss: 0.3399364245555608
Epoch: 64, step: 58, loss: 0.3142322301864624, mean loss: 0.3399361465972545
Epoch: 64, step: 59, loss: 0.34542885422706604, mean loss: 0.3399362059932884
Epoch: 64, step: 60, loss: 0.32408738136291504, mean loss: 0.33993603461203004
Epoch: 64, step: 61, loss: 0.34888896346092224, mean loss: 0.33993613142347545
Epoch: 64, step: 62, loss: 0.2995566427707672, mean loss: 0.3399356947893352
Epoch: 64, step: 63, loss: 0.33315983414649963, mean loss: 0.3399356215209459
Epoch: 64, step: 64, loss: 0.3340509235858917, mean loss: 0.3399355578895196
Epoch: 64, step: 65, loss: 0.30400189757347107, mean loss: 0.33993516934190693
Epoch: 64, step: 66, loss: 0.32431894540786743, mean loss: 0.33993500048683156
Epoch: 64, step: 67, loss: 0.3272974193096161, mean loss: 0.33993486384069627
Epoch: 64, step: 68, loss: 0.3348892629146576, mean loss: 0.33993480928481234
Epoch: 64, step: 69, loss: 0.3194701373577118, mean loss: 0.33993458801162585
Epoch: 64, step: 70, loss: 0.311198890209198, mean loss: 0.33993427731176745
Epoch: 64, step: 71, loss: 0.33111563324928284, mean loss: 0.33993418196270525
Epoch: 64, step: 72, loss: 0.3416583836078644, mean loss: 0.33993420060493995
Epoch: 64, step: 73, loss: 0.34510675072669983, mean loss: 0.33993425653044673
Epoch: 64, step: 74, loss: 0.3299301266670227, mean loss: 0.33993414836716745
Epoch: 64, step: 75, loss: 0.34713470935821533, mean loss: 0.3399342262178031
Epoch: 64, step: 76, loss: 0.3452184200286865, mean loss: 0.3399342833485461
Epoch: 64, step: 77, loss: 0.3548862636089325, mean loss: 0.33993444500206155
Epoch: 64, step: 78, loss: 0.29043304920196533, mean loss: 0.33993390982290805
Epoch: 64, step: 79, loss: 0.34852924942970276, mean loss: 0.33993400274951685
Epoch: 64, step: 80, loss: 0.3466813266277313, mean loss: 0.3399340756959246
Epoch: 64, step: 81, loss: 0.3194045424461365, mean loss: 0.3399338537502258
Epoch: 64, step: 82, loss: 0.33790984749794006, mean loss: 0.3399338318688406
Epoch: 64, step: 83, loss: 0.35720399022102356, mean loss: 0.33993401857325517
Epoch: 64, step: 84, loss: 0.32868802547454834, mean loss: 0.33993389699626575
Epoch: 64, step: 85, loss: 0.35517555475234985, mean loss: 0.33993406176738156
Epoch: 64, step: 86, loss: 0.30697882175445557, mean loss: 0.339933705506071
Epoch: 64, step: 87, loss: 0.3560134768486023, mean loss: 0.33993387933392
Epoch: 64, step: 88, loss: 0.3457947075366974, mean loss: 0.3399339426908002
Epoch: 64, step: 89, loss: 0.31975963711738586, mean loss: 0.33993372460434557
Epoch: 64, step: 90, loss: 0.29465994238853455, mean loss: 0.3399332351950877
Epoch: 64, step: 91, loss: 0.3270775079727173, mean loss: 0.3399330962262718
Epoch: 64, step: 92, loss: 0.33943140506744385, mean loss: 0.3399330908031113
Epoch: 64, step: 93, loss: 0.3279046416282654, mean loss: 0.3399329607798795
Epoch: 64, step: 94, loss: 0.3429052531719208, mean loss: 0.33993299290894946
Epoch: 64, step: 95, loss: 0.32288217544555664, mean loss: 0.3399328085996981
Epoch: 64, step: 96, loss: 0.3173694908618927, mean loss: 0.3399325647062157
Epoch: 64, step: 97, loss: 0.31463655829429626, mean loss: 0.33993229127725993
Epoch: 64, step: 98, loss: 0.34434178471565247, mean loss: 0.33993233893973024
Epoch: 64, step: 99, loss: 0.3168541491031647, mean loss: 0.33993208948893433
Epoch: 64, step: 100, loss: 0.32731759548187256, mean loss: 0.33993195314108465
Epoch: 64, step: 101, loss: 0.32051289081573486, mean loss: 0.33993174324612013
Epoch: 64, step: 102, loss: 0.3637142777442932, mean loss: 0.33993200030180054
Epoch: 64, step: 103, loss: 0.3106527328491211, mean loss: 0.33993168383760414
Epoch: 64, step: 104, loss: 0.32442256808280945, mean loss: 0.339931516209544
Epoch: 64, step: 105, loss: 0.32551661133766174, mean loss: 0.3399313604097896
Epoch: 64, step: 106, loss: 0.3378969430923462, mean loss: 0.3399313384215562
Epoch: 64, step: 107, loss: 0.3067682981491089, mean loss: 0.339930979995199
Epoch: 64, step: 108, loss: 0.33196932077407837, mean loss: 0.33993089394646386
Epoch: 64, step: 109, loss: 0.3686080873012543, mean loss: 0.3399312038830585
Epoch: 64, step: 110, loss: 0.33384495973587036, mean loss: 0.3399311381050245
Epoch: 64, step: 111, loss: 0.3248178958892822, mean loss: 0.3399309747680647
Epoch: 64, step: 112, loss: 0.3413121700286865, mean loss: 0.3399309896952255
Epoch: 64, step: 113, loss: 0.3298816680908203, mean loss: 0.33993088108913444
Epoch: 64, step: 114, loss: 0.321537047624588, mean loss: 0.3399306823035008
Epoch: 64, step: 115, loss: 0.3021567463874817, mean loss: 0.33993027407785004
Epoch: 64, step: 116, loss: 0.3756355345249176, mean loss: 0.3399306599430057
Epoch: 64, step: 117, loss: 0.3556545078754425, mean loss: 0.339930829868092
Epoch: 64, step: 118, loss: 0.3318846523761749, mean loss: 0.3399307429152904
Epoch: 64, step: 119, loss: 0.3281248211860657, mean loss: 0.33993061533335767
Epoch: 64, step: 120, loss: 0.3488825559616089, mean loss: 0.33993071207239856
Epoch: 64, step: 121, loss: 0.3548796474933624, mean loss: 0.3399308736161473
Epoch: 64, step: 122, loss: 0.3099299371242523, mean loss: 0.3399305494183876
Epoch: 64, step: 123, loss: 0.3123001754283905, mean loss: 0.3399302508407564
Epoch: 64, step: 124, loss: 0.33326035737991333, mean loss: 0.3399301787657468
Epoch: 64, step: 125, loss: 0.3206559121608734, mean loss: 0.33992997048986556
Epoch: 64, step: 126, loss: 0.35691124200820923, mean loss: 0.33993015398587845
Epoch: 64, step: 127, loss: 0.3425181806087494, mean loss: 0.3399301819512422
Epoch: 64, step: 128, loss: 0.3312469720840454, mean loss: 0.3399300881243486
Epoch: 64, step: 129, loss: 0.3614879250526428, mean loss: 0.3399303210662038
Epoch: 64, step: 130, loss: 0.3084470331668854, mean loss: 0.3399299808791864
Epoch: 64, step: 131, loss: 0.3753194212913513, mean loss: 0.3399303632693019
Epoch: 64, step: 132, loss: 0.3292267620563507, mean loss: 0.33993024761595925
Epoch: 64, step: 133, loss: 0.35226383805274963, mean loss: 0.33993038088003746
Epoch: 64, step: 134, loss: 0.330771267414093, mean loss: 0.3399302819171579
Epoch: 64, step: 135, loss: 0.35643452405929565, mean loss: 0.33993046024115026
Epoch: 64, step: 136, loss: 0.31195712089538574, mean loss: 0.33993015799984694
Epoch: 64, step: 137, loss: 0.31548401713371277, mean loss: 0.33992989387143685
Epoch: 64, step: 138, loss: 0.3762090802192688, mean loss: 0.339930285845791
Epoch: 64, step: 139, loss: 0.3547552227973938, mean loss: 0.33993044601841027
Epoch: 64, step: 140, loss: 0.34372735023498535, mean loss: 0.3399304870407448
Epoch: 64, step: 141, loss: 0.30585551261901855, mean loss: 0.33993011889348124
Epoch: 64, step: 142, loss: 0.3255356252193451, mean loss: 0.33992996337652803
Epoch: 64, step: 143, loss: 0.32983148097991943, mean loss: 0.3399298542745142
Epoch: 64, step: 144, loss: 0.32542335987091064, mean loss: 0.3399296975509006
Epoch: 64, step: 145, loss: 0.3330443799495697, mean loss: 0.33992962316489334
Epoch: 64, step: 146, loss: 0.3399495482444763, mean loss: 0.339929623380153
Epoch: 64, step: 147, loss: 0.30260932445526123, mean loss: 0.33992922019642147
Epoch: 64, step: 148, loss: 0.30449628829956055, mean loss: 0.3399288374066856
Epoch: 64, step: 149, loss: 0.3192075490951538, mean loss: 0.33992861355248094
Epoch: 64, step: 150, loss: 0.2929111123085022, mean loss: 0.3399281056230758
Epoch: 64, step: 151, loss: 0.34236061573028564, mean loss: 0.3399281319011644
Epoch: 64, step: 152, loss: 0.3876534402370453, mean loss: 0.3399286474658603
Epoch: 64, step: 153, loss: 0.3278863728046417, mean loss: 0.3399285173775524
Epoch: 64, step: 154, loss: 0.29929783940315247, mean loss: 0.3399280784638756
Epoch: 64, step: 155, loss: 0.30556732416152954, mean loss: 0.339927707285179
Epoch: 64, step: 156, loss: 0.3230082392692566, mean loss: 0.3399275245162505
Epoch: 64, step: 157, loss: 0.31674256920814514, mean loss: 0.33992727406844325
Epoch: 64, step: 158, loss: 0.3318786919116974, mean loss: 0.33992718712723713
Epoch: 64, step: 159, loss: 0.3249078094959259, mean loss: 0.3399270248888856
Epoch: 64, step: 160, loss: 0.32679370045661926, mean loss: 0.3399268830250919
Epoch: 64, step: 161, loss: 0.31483107805252075, mean loss: 0.33992661194767637
Epoch: 64, step: 162, loss: 0.3333097994327545, mean loss: 0.3399265404756091
Epoch: 64, step: 163, loss: 0.35189029574394226, mean loss: 0.33992666970174074
Epoch: 64, step: 164, loss: 0.3308849036693573, mean loss: 0.3399265720384401
Epoch: 64, step: 165, loss: 0.32704609632492065, mean loss: 0.33992643291338653
Epoch: 64, step: 166, loss: 0.32525378465652466, mean loss: 0.3399262744323667
Epoch: 64, step: 167, loss: 0.3006139099597931, mean loss: 0.33992584981942636
Epoch: 64, step: 168, loss: 0.3189755380153656, mean loss: 0.3399256235375038
Epoch: 64, step: 169, loss: 0.3612172305583954, mean loss: 0.3399258535032332
Epoch: 64, step: 170, loss: 0.388942688703537, mean loss: 0.3399263829170299
Epoch: 64, step: 171, loss: 0.3488108813762665, mean loss: 0.3399264788743728
Epoch: 64, step: 172, loss: 0.3333098292350769, mean loss: 0.3399264074117839
Epoch: 64, step: 173, loss: 0.3745858371257782, mean loss: 0.3399267817441061
Epoch: 64, step: 174, loss: 0.3457071781158447, mean loss: 0.3399268441734607
Epoch: 64, step: 175, loss: 0.33434075117111206, mean loss: 0.33992678384327013
Epoch: 64, step: 176, loss: 0.3464363217353821, mean loss: 0.33992685414597
Epoch: 64, step: 177, loss: 0.3026222586631775, mean loss: 0.3399264512624626
Epoch: 64, step: 178, loss: 0.33837971091270447, mean loss: 0.3399264345581012
Epoch: 64, step: 179, loss: 0.3092346787452698, mean loss: 0.3399261030993361
Epoch: 64, step: 180, loss: 0.35602355003356934, mean loss: 0.339926276943488
Epoch: 64, step: 181, loss: 0.3336929678916931, mean loss: 0.33992620962768144
Epoch: 64, step: 182, loss: 0.3184156119823456, mean loss: 0.3399259773293019
Epoch: 64, step: 183, loss: 0.3389153480529785, mean loss: 0.33992596641537887
Epoch: 64, step: 184, loss: 0.3323615789413452, mean loss: 0.3399258847274114
Epoch: 64, step: 185, loss: 0.2998412251472473, mean loss: 0.3399254518570676
Epoch: 64, step: 186, loss: 0.3344202935695648, mean loss: 0.33992539240804015
Epoch: 64, step: 187, loss: 0.29449963569641113, mean loss: 0.3399249018703019
Epoch: 64, step: 188, loss: 0.3392499089241028, mean loss: 0.3399248945813548
Epoch: 64, step: 189, loss: 0.30869153141975403, mean loss: 0.33992455730986953
Epoch: 64, step: 190, loss: 0.34082064032554626, mean loss: 0.3399245669860605
Epoch: 64, step: 191, loss: 0.3317777216434479, mean loss: 0.33992447901476924
Epoch: 64, step: 192, loss: 0.330122709274292, mean loss: 0.33992437317441093
Epoch: 64, step: 193, loss: 0.3180326223373413, mean loss: 0.33992413678794253
Epoch: 64, step: 194, loss: 0.3707846701145172, mean loss: 0.33992447001545684
Epoch: 64, step: 195, loss: 0.36809781193733215, mean loss: 0.33992477422378753
Epoch: 64, step: 196, loss: 0.330513060092926, mean loss: 0.33992467259967285
Epoch: 64, step: 197, loss: 0.31983715295791626, mean loss: 0.33992445570460683
Epoch: 64, step: 198, loss: 0.3130563497543335, mean loss: 0.3399241655992681
Epoch: 64, step: 199, loss: 0.3395039439201355, mean loss: 0.33992416106202095
Epoch: 64, step: 200, loss: 0.37535446882247925, mean loss: 0.3399245436085055
Epoch: 64, step: 201, loss: 0.31783074140548706, mean loss: 0.33992430506089916
Epoch: 64, step: 202, loss: 0.35563674569129944, mean loss: 0.3399244747068749
Epoch: 64, step: 203, loss: 0.3260960578918457, mean loss: 0.33992432540416695
Epoch: 64, step: 204, loss: 0.32919788360595703, mean loss: 0.33992420959412606
Epoch: 64, step: 205, loss: 0.3138110041618347, mean loss: 0.33992392766104934
Epoch: 64, step: 206, loss: 0.3568512499332428, mean loss: 0.33992411041611315
Epoch: 64, step: 207, loss: 0.34990406036376953, mean loss: 0.3399242181630248
Epoch: 64, step: 208, loss: 0.32507967948913574, mean loss: 0.3399240578980999
Epoch: 64, step: 209, loss: 0.3184407651424408, mean loss: 0.3399238259622206
Epoch: 64, step: 210, loss: 0.37821733951568604, mean loss: 0.3399242393785415
Epoch: 64, step: 211, loss: 0.3052397668361664, mean loss: 0.3399238649294274
Epoch: 64, step: 212, loss: 0.315306156873703, mean loss: 0.3399235991626799
Epoch: 64, step: 213, loss: 0.3342939615249634, mean loss: 0.33992353838714673
Epoch: 64, step: 214, loss: 0.34324872493743896, mean loss: 0.33992357428427133
Epoch: 64, step: 215, loss: 0.32039985060691833, mean loss: 0.33992336351775787
Epoch: 64, step: 216, loss: 0.3085689842700958, mean loss: 0.3399230250381745
Epoch: 64, step: 217, loss: 0.365569531917572, mean loss: 0.3399233018966377
Epoch: 64, step: 218, loss: 0.3512956500053406, mean loss: 0.3399234246617709
Epoch: 64, step: 219, loss: 0.3382726311683655, mean loss: 0.33992340684155525
Epoch: 64, step: 220, loss: 0.3378106653690338, mean loss: 0.3399233840348854
Epoch: 64, step: 221, loss: 0.32198506593704224, mean loss: 0.3399231903960105
Epoch: 64, step: 222, loss: 0.31093186140060425, mean loss: 0.3399228774465076
Epoch: 64, step: 223, loss: 0.3452312648296356, mean loss: 0.33992293474775315
Epoch: 64, step: 224, loss: 0.3262415826320648, mean loss: 0.33992278706635815
Epoch: 64, step: 225, loss: 0.3252933621406555, mean loss: 0.3399226291528316
Epoch: 64, step: 226, loss: 0.32580259442329407, mean loss: 0.3399224767394304
Epoch: 64, step: 227, loss: 0.32419902086257935, mean loss: 0.33992230702033494
Epoch: 64, step: 228, loss: 0.3237282931804657, mean loss: 0.33992213222392026
Epoch: 64, step: 229, loss: 0.3574671149253845, mean loss: 0.339922321600501
Epoch: 64, step: 230, loss: 0.33439382910728455, mean loss: 0.33992226192784575
Epoch: 64, step: 231, loss: 0.27816736698150635, mean loss: 0.33992159537384625
Epoch: 64, step: 232, loss: 0.32613125443458557, mean loss: 0.3399214465288405
Epoch: 64, step: 233, loss: 0.32547059655189514, mean loss: 0.33992129055636366
Epoch: 64, step: 234, loss: 0.30196547508239746, mean loss: 0.33992088089197287
Epoch: 64, step: 235, loss: 0.32388225197792053, mean loss: 0.3399207077858455
Epoch: 64, step: 236, loss: 0.3676427900791168, mean loss: 0.339921006989134
Epoch: 64, step: 237, loss: 0.3099620044231415, mean loss: 0.33992068364634725
Epoch: 64, step: 238, loss: 0.3639930188655853, mean loss: 0.3399209434524583
Epoch: 64, step: 239, loss: 0.34314456582069397, mean loss: 0.33992097824375483
Epoch: 64, step: 240, loss: 0.36983099579811096, mean loss: 0.3399213010474022
Epoch: 64, step: 241, loss: 0.3395228087902069, mean loss: 0.33992129674672383
Epoch: 64, step: 242, loss: 0.3576675355434418, mean loss: 0.33992148826874324
Epoch: 64, step: 243, loss: 0.3322739601135254, mean loss: 0.3399214057355234
Epoch: 64, step: 244, loss: 0.34518110752105713, mean loss: 0.33992146249836624
Epoch: 64, step: 245, loss: 0.3356545865535736, mean loss: 0.3399214164506234
Epoch: 64, step: 246, loss: 0.3176381289958954, mean loss: 0.3399211759739773
Epoch: 64, step: 247, loss: 0.3005620837211609, mean loss: 0.33992075122334864
Epoch: 64, step: 248, loss: 0.3621455132961273, mean loss: 0.33992099106322426
Epoch: 64, step: 249, loss: 0.305615097284317, mean loss: 0.33992062085307406
Epoch: 64, step: 250, loss: 0.33906421065330505, mean loss: 0.33992061161127063
Epoch: 64, step: 251, loss: 0.3621421456336975, mean loss: 0.33992085140854716
Epoch: 64, step: 252, loss: 0.3147580027580261, mean loss: 0.33992057987385216
Epoch: 64, step: 253, loss: 0.3400987386703491, mean loss: 0.3399205817963599
Epoch: 64, step: 254, loss: 0.3256169557571411, mean loss: 0.33992042744790096
Epoch: 64, step: 255, loss: 0.32477524876594543, mean loss: 0.33992026402012687
Epoch: 64, step: 256, loss: 0.33616960048675537, mean loss: 0.33992022354810664
Epoch: 64, step: 257, loss: 0.30170151591300964, mean loss: 0.3399198111486458
Epoch: 64, step: 258, loss: 0.32144683599472046, mean loss: 0.33991961181791847
Epoch: 64, step: 259, loss: 0.3289104700088501, mean loss: 0.3399194930261945
Epoch: 64, step: 260, loss: 0.35648292303085327, mean loss: 0.3399196717483155
Epoch: 64, step: 261, loss: 0.31508126854896545, mean loss: 0.3399194037407711
Epoch: 64, step: 262, loss: 0.3694344758987427, mean loss: 0.33991972220635835
Epoch: 64, step: 263, loss: 0.32215234637260437, mean loss: 0.33991953049967044
Epoch: 64, step: 264, loss: 0.3404042422771454, mean loss: 0.3399195357295641
Epoch: 64, step: 265, loss: 0.3127233386039734, mean loss: 0.3399192422939766
Epoch: 64, step: 266, loss: 0.33124274015426636, mean loss: 0.33991914867915896
Epoch: 64, step: 267, loss: 0.37289151549339294, mean loss: 0.3399195044295238
Epoch: 64, step: 268, loss: 0.30587905645370483, mean loss: 0.3399191371592214
Epoch: 64, step: 269, loss: 0.33120471239089966, mean loss: 0.3399190431382822
Epoch: 64, step: 270, loss: 0.36666572093963623, mean loss: 0.33991933170817656
Epoch: 64, step: 271, loss: 0.3103324770927429, mean loss: 0.3399190124990598
Epoch: 64, step: 272, loss: 0.33280032873153687, mean loss: 0.3399189356972412
Epoch: 64, step: 273, loss: 0.2963968813419342, mean loss: 0.3399184661530147
Epoch: 64, step: 274, loss: 0.3197111189365387, mean loss: 0.33991824814536326
Epoch: 64, step: 275, loss: 0.35135558247566223, mean loss: 0.3399183715361017
Epoch: 64, step: 276, loss: 0.29779133200645447, mean loss: 0.33991791705691204
Epoch: 64, step: 277, loss: 0.3488906919956207, mean loss: 0.3399180138568661
Epoch: 64, step: 278, loss: 0.30590489506721497, mean loss: 0.3399176469210142
Epoch: 64, step: 279, loss: 0.3578813970088959, mean loss: 0.33991784071308817
Epoch: 64, step: 280, loss: 0.4163885712623596, mean loss: 0.3399186656667603
Epoch: 64, step: 281, loss: 0.36362361907958984, mean loss: 0.3399189213891428
Epoch: 64, step: 282, loss: 0.2789604067802429, mean loss: 0.33991826379289464
Epoch: 64, step: 283, loss: 0.3572777807712555, mean loss: 0.33991845105845
Epoch: 64, step: 284, loss: 0.32110995054244995, mean loss: 0.339918248164193
Epoch: 64, step: 285, loss: 0.35919684171676636, mean loss: 0.3399184561272742
Epoch: 64, step: 286, loss: 0.37082937359809875, mean loss: 0.3399187895675887
Epoch: 64, step: 287, loss: 0.3134843409061432, mean loss: 0.33991850441863436
Epoch: 64, step: 288, loss: 0.31125524640083313, mean loss: 0.3399181952308018
Epoch: 64, step: 289, loss: 0.33260083198547363, mean loss: 0.3399181162999533
Epoch: 64, step: 290, loss: 0.335694283246994, mean loss: 0.3399180707388516
Epoch: 64, step: 291, loss: 0.36723339557647705, mean loss: 0.3399183653771227
Epoch: 64, step: 292, loss: 0.3426339328289032, mean loss: 0.33991839466842616
Epoch: 64, step: 293, loss: 0.3049190044403076, mean loss: 0.33991801715370035
Epoch: 64, step: 294, loss: 0.3285723924636841, mean loss: 0.33991789477744844
Epoch: 64, step: 295, loss: 0.31048065423965454, mean loss: 0.33991757726471505
Epoch: 64, step: 296, loss: 0.30425146222114563, mean loss: 0.3399171925709284
Epoch: 64, step: 297, loss: 0.3389680087566376, mean loss: 0.339917182333167
Epoch: 64, step: 298, loss: 0.3302989602088928, mean loss: 0.33991707859351183
Epoch: 64, step: 299, loss: 0.31354817748069763, mean loss: 0.3399167941884349
Epoch: 64, step: 300, loss: 0.2965832054615021, mean loss: 0.3399163268136414
Epoch: 64, step: 301, loss: 0.3190084993839264, mean loss: 0.3399161013145212
Epoch: 64, step: 302, loss: 0.34642958641052246, mean loss: 0.3399161715642553
Epoch: 64, step: 303, loss: 0.35022681951522827, mean loss: 0.33991628276623925
Epoch: 64, step: 304, loss: 0.32500746846199036, mean loss: 0.3399161219740314
Epoch: 64, step: 305, loss: 0.3241521120071411, mean loss: 0.3399159519603349
Epoch: 64, step: 306, loss: 0.3385170102119446, mean loss: 0.339915936873013
Epoch: 64, step: 307, loss: 0.37768635153770447, mean loss: 0.3399163442153911
Epoch: 64, step: 308, loss: 0.3267129063606262, mean loss: 0.339916201821885
Epoch: 64, step: 309, loss: 0.33192938566207886, mean loss: 0.3399161156883716
Epoch: 64, step: 310, loss: 0.33897489309310913, mean loss: 0.33991610553790197
Epoch: 64, step: 311, loss: 0.3692389726638794, mean loss: 0.3399164217624202
Epoch: 64, step: 312, loss: 0.3285030126571655, mean loss: 0.3399162986789285
Epoch: 64, step: 313, loss: 0.32092469930648804, mean loss: 0.3399160938735864
Epoch: 64, step: 314, loss: 0.3588279187679291, mean loss: 0.3399162978164415
Epoch: 64, step: 315, loss: 0.3257327675819397, mean loss: 0.33991614486459926
Epoch: 64, step: 316, loss: 0.29585957527160645, mean loss: 0.33991566977407495
Epoch: 64, step: 317, loss: 0.360879510641098, mean loss: 0.339915895838311
Epoch: 64, step: 318, loss: 0.3331622779369354, mean loss: 0.3399158230112457
Epoch: 64, step: 319, loss: 0.32905906438827515, mean loss: 0.33991570593957315
Epoch: 64, step: 320, loss: 0.3885480761528015, mean loss: 0.3399162303512989
Epoch: 64, step: 321, loss: 0.36001700162887573, mean loss: 0.33991644709924773
Epoch: 64, step: 322, loss: 0.29986366629600525, mean loss: 0.339916015212115
Epoch: 64, step: 323, loss: 0.30146411061286926, mean loss: 0.3399156005916212
Epoch: 64, step: 324, loss: 0.29413098096847534, mean loss: 0.33991510690900373
Epoch: 64, step: 325, loss: 0.3039984703063965, mean loss: 0.339914719634235
Epoch: 64, step: 326, loss: 0.299735963344574, mean loss: 0.33991428640740073
Epoch: 64, step: 327, loss: 0.33912909030914307, mean loss: 0.33991427794112694
Epoch: 64, step: 328, loss: 0.3985156714916229, mean loss: 0.3399149097961439
Epoch: 64, step: 329, loss: 0.3482426404953003, mean loss: 0.3399149995868702
Epoch: 64, step: 330, loss: 0.29373544454574585, mean loss: 0.33991450167798865
Epoch: 64, step: 331, loss: 0.31673097610473633, mean loss: 0.3399142517154496
Epoch: 64, step: 332, loss: 0.28837645053863525, mean loss: 0.339913696045834
Epoch: 64, step: 333, loss: 0.3313402235507965, mean loss: 0.33991360360947287
Epoch: 64, step: 334, loss: 0.3526258170604706, mean loss: 0.3399137406669003
Epoch: 64, step: 335, loss: 0.3266734480857849, mean loss: 0.33991359791749776
Epoch: 64, step: 336, loss: 0.32287314534187317, mean loss: 0.33991341419888405
Epoch: 64, step: 337, loss: 0.30922675132751465, mean loss: 0.339913083359644
Epoch: 64, step: 338, loss: 0.32053712010383606, mean loss: 0.3399128744656409
Epoch: 64, step: 339, loss: 0.333138644695282, mean loss: 0.33991280143284763
Epoch: 64, step: 340, loss: 0.3297225832939148, mean loss: 0.3399126915735579
Epoch: 64, step: 341, loss: 0.29766976833343506, mean loss: 0.3399122361635314
Epoch: 64, step: 342, loss: 0.29398152232170105, mean loss: 0.3399117410017267
Epoch: 64, step: 343, loss: 0.31295472383499146, mean loss: 0.33991145039136483
Epoch: 64, step: 344, loss: 0.337048202753067, mean loss: 0.3399114195244311
Epoch: 64, step: 345, loss: 0.3699273467063904, mean loss: 0.33991174310442274
Epoch: 64, step: 346, loss: 0.30660468339920044, mean loss: 0.3399113840489836
Epoch: 64, step: 347, loss: 0.32055899500846863, mean loss: 0.33991117542937854
Epoch: 64, step: 348, loss: 0.3436352014541626, mean loss: 0.33991121557411014
Epoch: 64, step: 349, loss: 0.33163705468177795, mean loss: 0.3399111263802148
Epoch: 64, step: 350, loss: 0.3379793167114258, mean loss: 0.3399111055558951
Epoch: 64, step: 351, loss: 0.3465414345264435, mean loss: 0.3399111770280511
Epoch: 64, step: 352, loss: 0.3425591289997101, mean loss: 0.33991120557155136
Epoch: 64, step: 353, loss: 0.30992555618286133, mean loss: 0.33991088234583844
Epoch: 64, step: 354, loss: 0.31081655621528625, mean loss: 0.33991056873138853
Epoch: 64, step: 355, loss: 0.29979830980300903, mean loss: 0.3399101363567612
Epoch: 64, step: 356, loss: 0.30839669704437256, mean loss: 0.3399097966734556
Epoch: 64, step: 357, loss: 0.34856441617012024, mean loss: 0.339909889960578
Epoch: 64, step: 358, loss: 0.3535664975643158, mean loss: 0.33991003716195345
Epoch: 64, step: 359, loss: 0.3286820650100708, mean loss: 0.33990991613957533
Epoch: 64, step: 360, loss: 0.33529868721961975, mean loss: 0.33990986643729004
Epoch: 64, step: 361, loss: 0.3519037663936615, mean loss: 0.3399099957125488
Epoch: 64, step: 362, loss: 0.3588484525680542, mean loss: 0.33991019983693965
Epoch: 64, step: 363, loss: 0.31416067481040955, mean loss: 0.33990992230379646
Epoch: 64, step: 364, loss: 0.29402241110801697, mean loss: 0.3399094277250444
Epoch: 64, step: 365, loss: 0.33968642354011536, mean loss: 0.33990942532151586
Epoch: 64, step: 366, loss: 0.32797059416770935, mean loss: 0.3399092966467462
Epoch: 64, step: 367, loss: 0.29390949010849, mean loss: 0.3399088008736976
Epoch: 64, step: 368, loss: 0.32795006036758423, mean loss: 0.33990867198712643
Epoch: 64, step: 369, loss: 0.3945089876651764, mean loss: 0.33990926044137254
Epoch: 64, step: 370, loss: 0.3432093560695648, mean loss: 0.3399092960077302
Epoch: 64, step: 371, loss: 0.32534676790237427, mean loss: 0.33990913906364145
Epoch: 64, step: 372, loss: 0.3317270278930664, mean loss: 0.33990905088388773
Epoch: 64, step: 373, loss: 0.36991748213768005, mean loss: 0.33990937428545315
Epoch: 64, step: 374, loss: 0.3040032386779785, mean loss: 0.3399089873283602
Epoch: 64, step: 375, loss: 0.3489522635936737, mean loss: 0.3399090847858594
Epoch: 64, step: 376, loss: 0.32790419459342957, mean loss: 0.3399089554130598
Epoch: 64, step: 377, loss: 0.32452392578125, mean loss: 0.3399087896153829
Epoch: 64, step: 378, loss: 0.2927016317844391, mean loss: 0.3399082808901517
Epoch: 64, step: 379, loss: 0.30107903480529785, mean loss: 0.33990786245351556
Epoch: 64, step: 380, loss: 0.3359103202819824, mean loss: 0.3399078193751599
Epoch: 64, step: 381, loss: 0.3397265672683716, mean loss: 0.3399078174219701
Epoch: 64, step: 382, loss: 0.34638506174087524, mean loss: 0.33990788722061366
Epoch: 64, step: 383, loss: 0.34718504548072815, mean loss: 0.3399079656382673
Epoch: 64, step: 384, loss: 0.3153141736984253, mean loss: 0.3399077006218134
Epoch: 64, step: 385, loss: 0.33300042152404785, mean loss: 0.3399076261915307
Epoch: 64, step: 386, loss: 0.36136722564697266, mean loss: 0.3399078574297391
Epoch: 64, step: 387, loss: 0.30381423234939575, mean loss: 0.3399074685065776
Epoch: 64, step: 388, loss: 0.3317639231681824, mean loss: 0.33990738075758414
Epoch: 64, step: 389, loss: 0.32169678807258606, mean loss: 0.33990718453543595
Epoch: 64, step: 390, loss: 0.3352913558483124, mean loss: 0.3399071347996543
Epoch: 64, step: 391, loss: 0.3162307143211365, mean loss: 0.3399068796878053
Epoch: 64, step: 392, loss: 0.3151049017906189, mean loss: 0.3399066124510298
Epoch: 64, step: 393, loss: 0.30324095487594604, mean loss: 0.3399062173895324
Epoch: 64, step: 394, loss: 0.35377204418182373, mean loss: 0.3399063667880605
Epoch: 64, step: 395, loss: 0.3449893295764923, mean loss: 0.3399064215542846
Epoch: 64, step: 396, loss: 0.37526458501815796, mean loss: 0.3399068025156097
Epoch: 64, step: 397, loss: 0.34754303097724915, mean loss: 0.3399068847901422
Epoch: 64, step: 398, loss: 0.3238872289657593, mean loss: 0.33990671219243895
Epoch: 64, step: 399, loss: 0.33122164011001587, mean loss: 0.3399066186194334
Epoch: 64, step: 400, loss: 0.3327757716178894, mean loss: 0.3399065417924836
Epoch: 64, step: 401, loss: 0.31539198756217957, mean loss: 0.3399062776782576
Epoch: 64, step: 402, loss: 0.35385316610336304, mean loss: 0.3399064279372393
Epoch: 64, step: 403, loss: 0.31409016251564026, mean loss: 0.3399061498046663
Epoch: 64, step: 404, loss: 0.28713464736938477, mean loss: 0.3399055812748893
Epoch: 64, step: 405, loss: 0.36191850900650024, mean loss: 0.33990581842694084
Epoch: 64, step: 406, loss: 0.36084678769111633, mean loss: 0.33990604402802316
Epoch: 64, step: 407, loss: 0.31501904129981995, mean loss: 0.3399057759184531
Epoch: 64, step: 408, loss: 0.32908207178115845, mean loss: 0.3399056593151228
Epoch: 64, step: 409, loss: 0.3301803469657898, mean loss: 0.3399055545458518
Epoch: 64, step: 410, loss: 0.3042648434638977, mean loss: 0.33990517059817404
Epoch: 64, step: 411, loss: 0.3609442114830017, mean loss: 0.3399053972435923
Epoch: 64, step: 412, loss: 0.3588138520717621, mean loss: 0.33990560093483996
Epoch: 64, step: 413, loss: 0.3177087903022766, mean loss: 0.3399053618223695
Epoch: 64, step: 414, loss: 0.4289059638977051, mean loss: 0.3399063205603135
Epoch: 64, step: 415, loss: 0.3230763375759125, mean loss: 0.33990613926525376
Epoch: 64, step: 416, loss: 0.36272841691970825, mean loss: 0.3399063851075475
Epoch: 64, step: 417, loss: 0.3341953754425049, mean loss: 0.33990632358903416
Epoch: 64, step: 418, loss: 0.3368227779865265, mean loss: 0.3399062903736994
Epoch: 64, step: 419, loss: 0.3318375051021576, mean loss: 0.33990620345929906
Epoch: 64, step: 420, loss: 0.29959580302238464, mean loss: 0.339905769253105
Epoch: 64, step: 421, loss: 0.2972693145275116, mean loss: 0.3399053099966074
Epoch: 64, step: 422, loss: 0.3405446708202362, mean loss: 0.3399053168833772
Epoch: 64, step: 423, loss: 0.3583521246910095, mean loss: 0.33990551557798954
Epoch: 64, step: 424, loss: 0.35474586486816406, mean loss: 0.3399056754249245
Epoch: 64, step: 425, loss: 0.3024289309978485, mean loss: 0.3399052717633874
Epoch: 64, step: 426, loss: 0.3420601785182953, mean loss: 0.33990529497361066
Epoch: 64, step: 427, loss: 0.3140585720539093, mean loss: 0.3399050165848842
Epoch: 64, step: 428, loss: 0.3418150544166565, mean loss: 0.3399050371572126
Epoch: 64, step: 429, loss: 0.3367234468460083, mean loss: 0.33990500288982023
Epoch: 64, step: 430, loss: 0.2889208495616913, mean loss: 0.33990445376972667
Epoch: 64, step: 431, loss: 0.3367677628993988, mean loss: 0.3399044199866525
Epoch: 64, step: 432, loss: 0.3091513216495514, mean loss: 0.3399040887703945
Epoch: 64, step: 433, loss: 0.36063113808631897, mean loss: 0.33990431200194343
Epoch: 64, step: 434, loss: 0.33323562145233154, mean loss: 0.33990424018052473
Epoch: 64, step: 435, loss: 0.3338738977909088, mean loss: 0.33990417523477895
Epoch: 64, step: 436, loss: 0.3136042058467865, mean loss: 0.3399038919917024
Epoch: 64, step: 437, loss: 0.3368293046951294, mean loss: 0.3399038588796416
Epoch: 64, step: 438, loss: 0.33107560873031616, mean loss: 0.3399037638039844
Epoch: 64, step: 439, loss: 0.3496866822242737, mean loss: 0.33990386915978715
Epoch: 64, step: 440, loss: 0.3393586277961731, mean loss: 0.339903863287948
Epoch: 64, step: 441, loss: 0.3296110928058624, mean loss: 0.33990375244375065
Epoch: 64, step: 442, loss: 0.2983349859714508, mean loss: 0.33990330478906483
Epoch: 64, step: 443, loss: 0.3113280236721039, mean loss: 0.33990299706473664
Epoch: 64, step: 444, loss: 0.3029782772064209, mean loss: 0.3399025994304245
Epoch: 64, step: 445, loss: 0.306903600692749, mean loss: 0.33990224407517977
Epoch: 64, step: 446, loss: 0.31854507327079773, mean loss: 0.3399020140893856
Epoch: 64, step: 447, loss: 0.3118375241756439, mean loss: 0.33990171187873436
Epoch: 64, step: 448, loss: 0.32093703746795654, mean loss: 0.33990150766105914
Epoch: 64, step: 449, loss: 0.35548263788223267, mean loss: 0.3399016754418424
Epoch: 64, step: 450, loss: 0.3542134761810303, mean loss: 0.33990182955256787
Epoch: 64, step: 451, loss: 0.3112775981426239, mean loss: 0.33990152132765283
Epoch: 64, step: 452, loss: 0.3318302035331726, mean loss: 0.3399014344168667
Epoch: 64, step: 453, loss: 0.3615930676460266, mean loss: 0.33990166798673027
Epoch: 64, step: 454, loss: 0.3018004596233368, mean loss: 0.33990125772724816
Epoch: 64, step: 455, loss: 0.3041616976261139, mean loss: 0.33990087290125
Epoch: 64, step: 456, loss: 0.34759461879730225, mean loss: 0.33990095574282825
Epoch: 64, step: 457, loss: 0.34036508202552795, mean loss: 0.3399009607402041
Epoch: 64, step: 458, loss: 0.32578402757644653, mean loss: 0.3399008087409237
Epoch: 64, step: 459, loss: 0.31665199995040894, mean loss: 0.33990055841997113
Epoch: 64, step: 460, loss: 0.3011951446533203, mean loss: 0.3399001416815562
Epoch: 64, step: 461, loss: 0.33316341042518616, mean loss: 0.33990006914843474
Epoch: 64, step: 462, loss: 0.3339271545410156, mean loss: 0.3399000048398762
Epoch: 64, step: 463, loss: 0.33210310339927673, mean loss: 0.3398999208939089
Epoch: 64, step: 464, loss: 0.3278255760669708, mean loss: 0.33989979089590255
Epoch: 64, step: 465, loss: 0.3072876036167145, mean loss: 0.33989943978172243
Epoch: 64, step: 466, loss: 0.3157591223716736, mean loss: 0.33989917988144563
Epoch: 64, step: 467, loss: 0.39819273352622986, mean loss: 0.3398998074766573
Epoch: 64, step: 468, loss: 0.3266180455684662, mean loss: 0.33989966448519576
Epoch: 64, step: 469, loss: 0.35006311535835266, mean loss: 0.3398997739037397
Epoch: 64, step: 470, loss: 0.4018659293651581, mean loss: 0.3399004410170652
Epoch: 64, step: 471, loss: 0.3368918001651764, mean loss: 0.339900408627081
Epoch: 64, step: 472, loss: 0.3086493909358978, mean loss: 0.33990007219308244
Epoch: 64, step: 473, loss: 0.2970053255558014, mean loss: 0.3398996104130562
Epoch: 64, step: 474, loss: 0.28750959038734436, mean loss: 0.3398990464184817
Epoch: 64, step: 475, loss: 0.31013214588165283, mean loss: 0.33989872597215115
Epoch: 64, step: 476, loss: 0.32636383175849915, mean loss: 0.3398985802680161
Epoch: 64, step: 477, loss: 0.3151293396949768, mean loss: 0.3398983136281839
Epoch: 64, step: 478, loss: 0.3232503831386566, mean loss: 0.3398981344158421
Epoch: 64, step: 479, loss: 0.36140313744544983, mean loss: 0.33989836591131045
Epoch: 64, step: 480, loss: 0.35646969079971313, mean loss: 0.3398985442951645
Epoch: 64, step: 481, loss: 0.3318954110145569, mean loss: 0.33989845814548114
Epoch: 64, step: 482, loss: 0.3955918252468109, mean loss: 0.3398990576499656
Epoch: 64, step: 483, loss: 0.3396977186203003, mean loss: 0.3398990554826994
Epoch: 64, step: 484, loss: 0.3280275762081146, mean loss: 0.339898927696354
Epoch: 64, step: 485, loss: 0.30964985489845276, mean loss: 0.33989860209439926
Epoch: 64, step: 486, loss: 0.3191066384315491, mean loss: 0.33989837829146863
Epoch: 64, step: 487, loss: 0.31716388463974, mean loss: 0.33989813358194426
Epoch: 64, step: 488, loss: 0.3766162395477295, mean loss: 0.33989852880400945
Epoch: 64, step: 489, loss: 0.30590710043907166, mean loss: 0.3398981629349766
Epoch: 64, step: 490, loss: 0.3152727782726288, mean loss: 0.33989789788084007
Epoch: 64, step: 491, loss: 0.3481864035129547, mean loss: 0.3398979870928093
Epoch: 64, step: 492, loss: 0.3269042670726776, mean loss: 0.33989784723854305
Epoch: 64, step: 493, loss: 0.30414867401123047, mean loss: 0.33989746246647085
Epoch: 64, step: 494, loss: 0.33131372928619385, mean loss: 0.3398973700798516
Epoch: 64, step: 495, loss: 0.3131048381328583, mean loss: 0.3398970817152491
Epoch: 64, step: 496, loss: 0.3154943585395813, mean loss: 0.3398968190746803
Epoch: 64, step: 497, loss: 0.3160597085952759, mean loss: 0.33989656252442435
Epoch: 64, step: 498, loss: 0.3113832473754883, mean loss: 0.33989625564916043
Epoch: 64, step: 499, loss: 0.30196142196655273, mean loss: 0.3398958473789628
Epoch: 64, step: 500, loss: 0.37199991941452026, mean loss: 0.33989619289239986
Epoch: 64, step: 501, loss: 0.32310178875923157, mean loss: 0.3398960121480432
Epoch: 64, step: 502, loss: 0.3452640175819397, mean loss: 0.33989606991884824
Epoch: 64, step: 503, loss: 0.3565160930156708, mean loss: 0.33989624878263536
Epoch: 64, step: 504, loss: 0.3106788694858551, mean loss: 0.339895934350168
Epoch: 64, step: 505, loss: 0.3481441140174866, mean loss: 0.33989602311471967
Epoch: 64, step: 506, loss: 0.28755876421928406, mean loss: 0.33989545988216263
Epoch: 64, step: 507, loss: 0.33491671085357666, mean loss: 0.33989540630344206
Epoch: 64, step: 508, loss: 0.3636826276779175, mean loss: 0.3398956622864539
Epoch: 64, step: 509, loss: 0.34840768575668335, mean loss: 0.33989575388647403
Epoch: 64, step: 510, loss: 0.3278142511844635, mean loss: 0.3398956238757914
Epoch: 64, step: 511, loss: 0.4160720109939575, mean loss: 0.3398964436113622
Epoch: 64, step: 512, loss: 0.3342640995979309, mean loss: 0.33989638300225183
Epoch: 64, step: 513, loss: 0.3172018527984619, mean loss: 0.3398961387912306
Epoch: 64, step: 514, loss: 0.2973792552947998, mean loss: 0.33989568128099723
Epoch: 64, step: 515, loss: 0.30335190892219543, mean loss: 0.33989528804968444
Epoch: 64, step: 516, loss: 0.33417829871177673, mean loss: 0.33989522653236187
Epoch: 64, step: 517, loss: 0.34614098072052, mean loss: 0.33989529373870386
Epoch: 64, step: 518, loss: 0.31812381744384766, mean loss: 0.3398950594730742
Epoch: 64, step: 519, loss: 0.31973034143447876, mean loss: 0.33989484249883345
Epoch: 64, step: 520, loss: 0.3264066278934479, mean loss: 0.33989469736595196
Epoch: 64, step: 521, loss: 0.3489607572555542, mean loss: 0.33989479491549995
Epoch: 64, step: 522, loss: 0.31514307856559753, mean loss: 0.33989452859332786
Epoch: 64, step: 523, loss: 0.3224800229072571, mean loss: 0.3398943412196923
Epoch: 64, step: 524, loss: 0.2974407970905304, mean loss: 0.33989388444018565
Epoch: 64, step: 525, loss: 0.3324754238128662, mean loss: 0.33989380462201274
Epoch: 64, step: 526, loss: 0.3311743140220642, mean loss: 0.3398937108065495
Epoch: 64, step: 527, loss: 0.37596026062965393, mean loss: 0.3398940988525753
Epoch: 64, step: 528, loss: 0.32839182019233704, mean loss: 0.339893975098972
Epoch: 64, step: 529, loss: 0.32793453335762024, mean loss: 0.33989384642811216
Epoch: 64, step: 530, loss: 0.32966941595077515, mean loss: 0.33989373642530973
Epoch: 64, step: 531, loss: 0.3300309181213379, mean loss: 0.339893630314169
Epoch: 64, step: 532, loss: 0.33911600708961487, mean loss: 0.3398936219480411
Epoch: 64, step: 533, loss: 0.32392528653144836, mean loss: 0.3398934501531469
Epoch: 64, step: 534, loss: 0.3081371784210205, mean loss: 0.3398931085078528
Epoch: 64, step: 535, loss: 0.40279126167297363, mean loss: 0.33989378518133123
Epoch: 64, step: 536, loss: 0.3745719790458679, mean loss: 0.3398941582536782
Epoch: 64, step: 537, loss: 0.305803120136261, mean loss: 0.3398937915019718
Epoch: 64, step: 538, loss: 0.3765393793582916, mean loss: 0.33989418573130703
Epoch: 64, step: 539, loss: 0.3434287905693054, mean loss: 0.33989422375580075
Epoch: 64, step: 540, loss: 0.31272637844085693, mean loss: 0.33989393149329966
Epoch: 64, step: 541, loss: 0.3643356263637543, mean loss: 0.3398941944259668
Epoch: 64, step: 542, loss: 0.3603006899356842, mean loss: 0.339894413947428
Epoch: 64, step: 543, loss: 0.30822432041168213, mean loss: 0.33989407326225657
Epoch: 64, step: 544, loss: 0.29589328169822693, mean loss: 0.3398935999369743
Epoch: 64, step: 545, loss: 0.31835314631462097, mean loss: 0.3398933682245152
Epoch: 64, step: 546, loss: 0.3084995448589325, mean loss: 0.33989303052216735
Epoch: 64, step: 547, loss: 0.285515695810318, mean loss: 0.33989244559321946
Epoch: 64, step: 548, loss: 0.3506275415420532, mean loss: 0.3398925610678169
Epoch: 64, step: 549, loss: 0.3659186363220215, mean loss: 0.3398928410204367
Epoch: 64, step: 550, loss: 0.33397597074508667, mean loss: 0.33989277737559204
Epoch: 64, step: 551, loss: 0.3034857213497162, mean loss: 0.3398923857671243
Epoch: 64, step: 552, loss: 0.3228025436401367, mean loss: 0.3398922019441067
Epoch: 64, step: 553, loss: 0.3603031039237976, mean loss: 0.3398924214869913
Epoch: 64, step: 554, loss: 0.3210064470767975, mean loss: 0.3398922183486534
Epoch: 64, step: 555, loss: 0.29753297567367554, mean loss: 0.33989176273575195
Epoch: 64, step: 556, loss: 0.3533415198326111, mean loss: 0.33989190739879493
Epoch: 64, step: 557, loss: 0.37428367137908936, mean loss: 0.33989227730612365
Epoch: 64, step: 558, loss: 0.32695600390434265, mean loss: 0.3398921381690072
Epoch: 64, step: 559, loss: 0.3556455075740814, mean loss: 0.3398923076038012
Epoch: 64, step: 560, loss: 0.3247690498828888, mean loss: 0.33989214494790004
Epoch: 64, step: 561, loss: 0.3197934925556183, mean loss: 0.33989192878222224
Epoch: 64, step: 562, loss: 0.3251633942127228, mean loss: 0.3398917703751134
Epoch: 64, step: 563, loss: 0.31294891238212585, mean loss: 0.33989148060464675
Epoch: 64, step: 564, loss: 0.3224104046821594, mean loss: 0.3398912925976784
Epoch: 64, step: 565, loss: 0.3434736132621765, mean loss: 0.3398913311247123
Epoch: 64, step: 566, loss: 0.3081514537334442, mean loss: 0.33989098977331056
Epoch: 64, step: 567, loss: 0.31799671053886414, mean loss: 0.33989075431044347
Epoch: 64, step: 568, loss: 0.33050453662872314, mean loss: 0.33989065336709046
Epoch: 64, step: 569, loss: 0.3160596787929535, mean loss: 0.3398903970814714
Epoch: 64, step: 570, loss: 0.3201429843902588, mean loss: 0.3398901847140148
Epoch: 64, step: 571, loss: 0.3132096529006958, mean loss: 0.3398898977895534
Epoch: 64, step: 572, loss: 0.35367751121520996, mean loss: 0.3398900460609987
Epoch: 64, step: 573, loss: 0.3180338144302368, mean loss: 0.3398898110224824
Epoch: 64, step: 574, loss: 0.32475829124450684, mean loss: 0.3398896483022215
Epoch: 64, step: 575, loss: 0.3449583053588867, mean loss: 0.33988970280859904
Epoch: 64, step: 576, loss: 0.30688658356666565, mean loss: 0.3398893479096363
Epoch: 64, step: 577, loss: 0.31027624011039734, mean loss: 0.33988902946857774
Epoch: 64, step: 578, loss: 0.3516572415828705, mean loss: 0.3398891560152965
Epoch: 64, step: 579, loss: 0.3077436089515686, mean loss: 0.33988881034938545
Epoch: 64, step: 580, loss: 0.3284914791584015, mean loss: 0.33988868779348375
Epoch: 64, step: 581, loss: 0.3240463137626648, mean loss: 0.3398885174417124
Epoch: 64, step: 582, loss: 0.3334908187389374, mean loss: 0.33988844864851353
Epoch: 64, step: 583, loss: 0.361676961183548, mean loss: 0.33988868293359453
Epoch: 64, step: 584, loss: 0.3478180170059204, mean loss: 0.33988876819433445
Epoch: 64, step: 585, loss: 0.373248815536499, mean loss: 0.3398891268968069
Epoch: 64, step: 586, loss: 0.3138749301433563, mean loss: 0.33988884718328416
Epoch: 64, step: 587, loss: 0.31743544340133667, mean loss: 0.3398886057592187
Epoch: 64, step: 588, loss: 0.34012314677238464, mean loss: 0.3398886082810295
Epoch: 64, step: 589, loss: 0.34336057305336, mean loss: 0.3398886456115756
Epoch: 64, step: 590, loss: 0.38239747285842896, mean loss: 0.339889102661338
Epoch: 64, step: 591, loss: 0.3161971867084503, mean loss: 0.3398888479314658
Epoch: 64, step: 592, loss: 0.3214292824268341, mean loss: 0.33988864946072095
Epoch: 64, step: 593, loss: 0.36598217487335205, mean loss: 0.3398889300060968
Epoch: 64, step: 594, loss: 0.36753007769584656, mean loss: 0.3398892271875881
Epoch: 64, step: 595, loss: 0.3672810196876526, mean loss: 0.3398895216849917
Epoch: 64, step: 596, loss: 0.3173990249633789, mean loss: 0.33988927988549356
Epoch: 64, step: 597, loss: 0.34572142362594604, mean loss: 0.3398893425872776
Epoch: 64, step: 598, loss: 0.3409479260444641, mean loss: 0.3398893539680598
Epoch: 64, step: 599, loss: 0.3539969325065613, mean loss: 0.3398895056363592
Epoch: 64, step: 600, loss: 0.33578014373779297, mean loss: 0.3398894614577478
Epoch: 64, step: 601, loss: 0.31175169348716736, mean loss: 0.33988915895965094
Epoch: 64, step: 602, loss: 0.3716157078742981, mean loss: 0.339889500035656
Epoch: 64, step: 603, loss: 0.3225133419036865, mean loss: 0.33988931323541804
Epoch: 64, step: 604, loss: 0.32424092292785645, mean loss: 0.3398891450111428
Epoch: 64, step: 605, loss: 0.3336273729801178, mean loss: 0.3398890776961847
Epoch: 64, step: 606, loss: 0.3329610824584961, mean loss: 0.33988900322003107
Epoch: 64, step: 607, loss: 0.3350606858730316, mean loss: 0.3398889513160348
Epoch: 64, step: 608, loss: 0.30299246311187744, mean loss: 0.3398885546862234
Epoch: 64, step: 609, loss: 0.3267478346824646, mean loss: 0.3398884134276505
Epoch: 64, step: 610, loss: 0.3201751112937927, mean loss: 0.33988820151818194
Epoch: 64, step: 611, loss: 0.3215160667896271, mean loss: 0.3398880040278056
Epoch: 64, step: 612, loss: 0.3213725686073303, mean loss: 0.3398878049991649
Epoch: 64, step: 613, loss: 0.339555948972702, mean loss: 0.3398878014319712
Epoch: 64, step: 614, loss: 0.2917913794517517, mean loss: 0.33988728443847466
Epoch: 64, step: 615, loss: 0.3733227849006653, mean loss: 0.33988764383632125
Epoch: 64, step: 616, loss: 0.3242759108543396, mean loss: 0.33988747602776964
Epoch: 64, step: 617, loss: 0.30760130286216736, mean loss: 0.3398871289914908
Epoch: 64, step: 618, loss: 0.3690255284309387, mean loss: 0.33988744218974354
Epoch: 64, step: 619, loss: 0.36113470792770386, mean loss: 0.3398876705665626
Epoch: 64, step: 620, loss: 0.32973694801330566, mean loss: 0.3398875614624153
Epoch: 64, step: 621, loss: 0.3624171018600464, mean loss: 0.3398878036165931
Epoch: 64, step: 622, loss: 0.31836333870887756, mean loss: 0.3398875722677511
Epoch: 64, step: 623, loss: 0.335371196269989, mean loss: 0.3398875237254468
Epoch: 64, step: 624, loss: 0.29843243956565857, mean loss: 0.3398870781682821
Epoch: 64, step: 625, loss: 0.33316436409950256, mean loss: 0.33988700591366516
Epoch: 64, step: 626, loss: 0.33829134702682495, mean loss: 0.33988698876397216
Epoch: 64, step: 627, loss: 0.30228811502456665, mean loss: 0.33988658466619326
Epoch: 64, step: 628, loss: 0.3431101143360138, mean loss: 0.339886619311039
Epoch: 64, step: 629, loss: 0.3175009787082672, mean loss: 0.33988637872422595
Epoch: 64, step: 630, loss: 0.36677053570747375, mean loss: 0.3398866676551639
Epoch: 64, step: 631, loss: 0.3740045726299286, mean loss: 0.3398870343251082
Epoch: 64, step: 632, loss: 0.3603481650352478, mean loss: 0.33988725422140703
Epoch: 64, step: 633, loss: 0.33980298042297363, mean loss: 0.33988725331572406
Epoch: 64, step: 634, loss: 0.31604209542274475, mean loss: 0.33988699705670594
Epoch: 64, step: 635, loss: 0.36085060238838196, mean loss: 0.3398872223458489
Epoch: 64, step: 636, loss: 0.35276490449905396, mean loss: 0.3398873607366816
Epoch: 64, step: 637, loss: 0.31331732869148254, mean loss: 0.3398870752032059
Epoch: 64, step: 638, loss: 0.31626635789871216, mean loss: 0.3398868213671164
Epoch: 64, step: 639, loss: 0.3199273645877838, mean loss: 0.339886606878456
Epoch: 64, step: 640, loss: 0.30483075976371765, mean loss: 0.33988623016475245
Epoch: 64, step: 641, loss: 0.30266207456588745, mean loss: 0.3398858301544836
Epoch: 64, step: 642, loss: 0.32334235310554504, mean loss: 0.339885652380415
Epoch: 64, step: 643, loss: 0.3889692425727844, mean loss: 0.3398861798206707
Epoch: 64, step: 644, loss: 0.3329518139362335, mean loss: 0.33988610530647156
Epoch: 64, step: 645, loss: 0.3415104150772095, mean loss: 0.339886122760532
Epoch: 64, step: 646, loss: 0.34044545888900757, mean loss: 0.33988612877082747
Epoch: 64, step: 647, loss: 0.31190919876098633, mean loss: 0.33988582815050156
Epoch: 64, step: 648, loss: 0.3271215260028839, mean loss: 0.3398856909958016
Epoch: 64, step: 649, loss: 0.33842140436172485, mean loss: 0.33988567526195
Epoch: 64, step: 650, loss: 0.3397614359855652, mean loss: 0.3398856739270055
Epoch: 64, step: 651, loss: 0.3245936632156372, mean loss: 0.33988550961692354
Epoch: 64, step: 652, loss: 0.376284122467041, mean loss: 0.3398859007096918
Epoch: 64, step: 653, loss: 0.3612341284751892, mean loss: 0.33988613008787777
Epoch: 64, step: 654, loss: 0.3387850224971771, mean loss: 0.33988611825704335
Epoch: 64, step: 655, loss: 0.3149406909942627, mean loss: 0.33988585023414425
Epoch: 64, step: 656, loss: 0.3638102412223816, mean loss: 0.33988610728389
Epoch: 64, step: 657, loss: 0.30820539593696594, mean loss: 0.3398857669019214
Epoch: 64, step: 658, loss: 0.34041041135787964, mean loss: 0.3398857725387138
Epoch: 64, step: 659, loss: 0.37115010619163513, mean loss: 0.3398861084398447
Epoch: 64, step: 660, loss: 0.3265742361545563, mean loss: 0.3398859654198474
Epoch: 64, step: 661, loss: 0.3493229150772095, mean loss: 0.33988606680738964
Epoch: 64, step: 662, loss: 0.3505997657775879, mean loss: 0.33988618191067793
Epoch: 64, step: 663, loss: 0.3812849223613739, mean loss: 0.339886626675831
Epoch: 64, step: 664, loss: 0.4206623136997223, mean loss: 0.3398874944757797
Epoch: 64, step: 665, loss: 0.3697628378868103, mean loss: 0.33988781543303687
Epoch: 64, step: 666, loss: 0.3078828752040863, mean loss: 0.33988747160075566
Epoch: 64, step: 667, loss: 0.32631170749664307, mean loss: 0.3398873257565278
Epoch: 64, step: 668, loss: 0.32933950424194336, mean loss: 0.3398872124426586
Epoch: 64, step: 669, loss: 0.3085448145866394, mean loss: 0.3398868757389883
Epoch: 64, step: 670, loss: 0.3368423581123352, mean loss: 0.3398868430328357
Epoch: 64, step: 671, loss: 0.3298940658569336, mean loss: 0.339886735685195
Epoch: 64, step: 672, loss: 0.33848580718040466, mean loss: 0.3398867206358497
Epoch: 64, step: 673, loss: 0.3331082761287689, mean loss: 0.33988664781981676
Epoch: 64, step: 674, loss: 0.293894499540329, mean loss: 0.3398861537640189
Epoch: 64, step: 675, loss: 0.3538093864917755, mean loss: 0.3398863033282427
Epoch: 64, step: 676, loss: 0.3187599182128906, mean loss: 0.3398860763897499
Epoch: 64, step: 677, loss: 0.31248652935028076, mean loss: 0.33988578206845055
Epoch: 64, step: 678, loss: 0.32231369614601135, mean loss: 0.3398855933141037
Epoch: 64, step: 679, loss: 0.3563765585422516, mean loss: 0.3398857704534569
Epoch: 64, step: 680, loss: 0.32286980748176575, mean loss: 0.3398855876767512
Epoch: 64, step: 681, loss: 0.33176982402801514, mean loss: 0.3398855005023366
Epoch: 64, step: 682, loss: 0.3534131944179535, mean loss: 0.33988564580673214
Epoch: 64, step: 683, loss: 0.34263312816619873, mean loss: 0.3398856753178209
Epoch: 64, step: 684, loss: 0.32539254426956177, mean loss: 0.3398855196467642
Epoch: 64, step: 685, loss: 0.385141521692276, mean loss: 0.33988600573731054
Epoch: 64, step: 686, loss: 0.32871249318122864, mean loss: 0.33988588572493117
Epoch: 64, step: 687, loss: 0.3482617437839508, mean loss: 0.33988597568731793
Epoch: 64, step: 688, loss: 0.318464457988739, mean loss: 0.3398857456081847
Epoch: 64, step: 689, loss: 0.37343665957450867, mean loss: 0.3398861059599769
Epoch: 64, step: 690, loss: 0.2966858446598053, mean loss: 0.33988564197487053
Epoch: 64, step: 691, loss: 0.3026433289051056, mean loss: 0.33988524198439635
Epoch: 64, step: 692, loss: 0.3949214220046997, mean loss: 0.3398858330784906
Epoch: 64, step: 693, loss: 0.3228297233581543, mean loss: 0.3398856498961286
Epoch: 64, step: 694, loss: 0.3712932765483856, mean loss: 0.3398859872099439
Epoch: 64, step: 695, loss: 0.32635438442230225, mean loss: 0.339885841883855
Epoch: 64, step: 696, loss: 0.32701051235198975, mean loss: 0.3398857036074647
Epoch: 64, step: 697, loss: 0.32770493626594543, mean loss: 0.3398855727918264
Epoch: 64, step: 698, loss: 0.29293879866600037, mean loss: 0.33988506861125267
Epoch: 64, step: 699, loss: 0.2990204393863678, mean loss: 0.33988462975402917
Epoch: 64, step: 700, loss: 0.3109520971775055, mean loss: 0.3398843190424236
Epoch: 64, step: 701, loss: 0.3414004147052765, mean loss: 0.33988433532386936
Epoch: 64, step: 702, loss: 0.3835441768169403, mean loss: 0.3398848041845905
Epoch: 64, step: 703, loss: 0.31215134263038635, mean loss: 0.33988450635961676
Epoch: 64, step: 704, loss: 0.3422589898109436, mean loss: 0.3398845318585209
Epoch: 64, step: 705, loss: 0.3333086669445038, mean loss: 0.33988446124293153
Epoch: 64, step: 706, loss: 0.3050740361213684, mean loss: 0.3398840874316806
Epoch: 64, step: 707, loss: 0.3571590185165405, mean loss: 0.33988427293628826
Epoch: 64, step: 708, loss: 0.34302622079849243, mean loss: 0.3398843066753257
Epoch: 64, step: 709, loss: 0.3480069935321808, mean loss: 0.3398843938978721
Epoch: 64, step: 710, loss: 0.3272917568683624, mean loss: 0.3398842586778282
Epoch: 64, step: 711, loss: 0.3281998336315155, mean loss: 0.339884133211534
Epoch: 64, step: 712, loss: 0.3053429424762726, mean loss: 0.33988376231534984
Epoch: 64, step: 713, loss: 0.41295284032821655, mean loss: 0.3398845469076188
Epoch: 64, step: 714, loss: 0.3139941990375519, mean loss: 0.33988426890837187
Epoch: 64, step: 715, loss: 0.3302558362483978, mean loss: 0.3398841655235776
Epoch: 64, step: 716, loss: 0.3664856553077698, mean loss: 0.3398844511526219
Epoch: 64, step: 717, loss: 0.32291164994239807, mean loss: 0.3398842689119664
Epoch: 64, step: 718, loss: 0.30014318227767944, mean loss: 0.3398838422078634
Epoch: 64, step: 719, loss: 0.32123032212257385, mean loss: 0.339883641925265
Epoch: 64, step: 720, loss: 0.3251701593399048, mean loss: 0.33988348394849327
Epoch: 64, step: 721, loss: 0.3940950334072113, mean loss: 0.3398840660046836
Epoch: 64, step: 722, loss: 0.2901739180088043, mean loss: 0.3398835322846738
Epoch: 64, step: 723, loss: 0.38205352425575256, mean loss: 0.3398839850438747
Epoch: 64, step: 724, loss: 0.35676902532577515, mean loss: 0.3398841663285966
Epoch: 64, step: 725, loss: 0.35152411460876465, mean loss: 0.3398842912985165
Epoch: 64, step: 726, loss: 0.3545245826244354, mean loss: 0.33988444847931726
Epoch: 64, step: 727, loss: 0.35246390104293823, mean loss: 0.33988458353313244
Epoch: 64, step: 728, loss: 0.3246622085571289, mean loss: 0.33988442010648606
Epoch: 64, step: 729, loss: 0.2764301896095276, mean loss: 0.3398837388723966
Epoch: 64, step: 730, loss: 0.30247896909713745, mean loss: 0.3398833373053061
Epoch: 64, step: 731, loss: 0.3748883903026581, mean loss: 0.33988371310567755
Epoch: 64, step: 732, loss: 0.28701266646385193, mean loss: 0.3398831455091747
Epoch: 64, step: 733, loss: 0.3153636157512665, mean loss: 0.3398828822828756
Epoch: 64, step: 734, loss: 0.31878039240837097, mean loss: 0.33988265574220644
Epoch: 64, step: 735, loss: 0.33112260699272156, mean loss: 0.3398825617018343
Epoch: 64, step: 736, loss: 0.2902553975582123, mean loss: 0.33988202895287134
Epoch: 64, step: 737, loss: 0.320513516664505, mean loss: 0.33988182103359477
Epoch: 64, step: 738, loss: 0.33760836720466614, mean loss: 0.3398817966285298
Epoch: 64, step: 739, loss: 0.3729248344898224, mean loss: 0.33988215133502064
Epoch: 64, step: 740, loss: 0.3028130829334259, mean loss: 0.3398817534146453
Epoch: 64, step: 741, loss: 0.3352268636226654, mean loss: 0.3398817034469583
Epoch: 64, step: 742, loss: 0.3214744031429291, mean loss: 0.3398815058568134
Epoch: 64, step: 743, loss: 0.31924518942832947, mean loss: 0.3398812843420385
Epoch: 64, step: 744, loss: 0.3728262186050415, mean loss: 0.3398816379764377
Epoch: 64, step: 745, loss: 0.3594772219657898, mean loss: 0.33988184831524526
Epoch: 64, step: 746, loss: 0.31340768933296204, mean loss: 0.33988156414493104
Epoch: 64, step: 747, loss: 0.3388966917991638, mean loss: 0.3398815535735478
Epoch: 64, step: 748, loss: 0.3913343846797943, mean loss: 0.33988210584995104
Epoch: 64, step: 749, loss: 0.29729610681533813, mean loss: 0.33988164875187843
Epoch: 64, step: 750, loss: 0.31922605633735657, mean loss: 0.33988142704684965
Epoch: 64, step: 751, loss: 0.3442825973033905, mean loss: 0.3398814742859259
Epoch: 64, step: 752, loss: 0.3721610903739929, mean loss: 0.3398818207489779
Epoch: 64, step: 753, loss: 0.39675241708755493, mean loss: 0.33988243114498884
Epoch: 64, step: 754, loss: 0.384314626455307, mean loss: 0.33988290803367
Epoch: 64, step: 755, loss: 0.41297057271003723, mean loss: 0.33988369247174877
Epoch: 64, step: 756, loss: 0.3390859067440033, mean loss: 0.33988368390933554
Epoch: 64, step: 757, loss: 0.3493618071079254, mean loss: 0.3398837856343146
Epoch: 64, step: 758, loss: 0.32787609100341797, mean loss: 0.3398836567618206
Epoch: 64, step: 759, loss: 0.3366955816745758, mean loss: 0.3398836225461955
Epoch: 64, step: 760, loss: 0.3543911576271057, mean loss: 0.3398837782448666
Epoch: 64, step: 761, loss: 0.3502763509750366, mean loss: 0.3398838897794856
Epoch: 64, step: 762, loss: 0.36235204339027405, mean loss: 0.3398841309084268
Epoch: 64, step: 763, loss: 0.3249165415763855, mean loss: 0.33988397027750455
Epoch: 64, step: 764, loss: 0.3126372992992401, mean loss: 0.3398836778716388
Epoch: 64, step: 765, loss: 0.3090277314186096, mean loss: 0.33988334673529863
Epoch: 64, step: 766, loss: 0.29934149980545044, mean loss: 0.33988291165758133
Epoch: 64, step: 767, loss: 0.3852519392967224, mean loss: 0.3398833985333072
Epoch: 64, step: 768, loss: 0.34082499146461487, mean loss: 0.3398834086378619
Epoch: 64, step: 769, loss: 0.3444041907787323, mean loss: 0.33988345715139545
Epoch: 64, step: 770, loss: 0.3505139946937561, mean loss: 0.33988357122886914
Epoch: 64, step: 771, loss: 0.3344506323337555, mean loss: 0.3398835129280268
Epoch: 64, step: 772, loss: 0.3308727741241455, mean loss: 0.33988341623486773
Epoch: 64, step: 773, loss: 0.3142220675945282, mean loss: 0.3398831408689632
Epoch: 64, step: 774, loss: 0.30955103039741516, mean loss: 0.3398828153857033
Epoch: 64, step: 775, loss: 0.33529379963874817, mean loss: 0.3398827661431101
Epoch: 64, step: 776, loss: 0.3464633524417877, mean loss: 0.33988283675556274
Epoch: 64, step: 777, loss: 0.30474674701690674, mean loss: 0.33988245973462
Epoch: 64, step: 778, loss: 0.2911585569381714, mean loss: 0.3398819369179153
Epoch: 64, step: 779, loss: 0.2962702512741089, mean loss: 0.33988146896129007
Epoch: 64, step: 780, loss: 0.341253399848938, mean loss: 0.3398814836820524
Epoch: 64, step: 781, loss: 0.3337477743625641, mean loss: 0.33988141786830833
Epoch: 64, step: 782, loss: 0.37737011909484863, mean loss: 0.3398818201119078
Epoch: 64, step: 783, loss: 0.3010934889316559, mean loss: 0.33988140392809685
Epoch: 64, step: 784, loss: 0.3702421188354492, mean loss: 0.33988172968334524
Epoch: 64, step: 785, loss: 0.322254478931427, mean loss: 0.33988154055381203
Epoch: 64, step: 786, loss: 0.33408501744270325, mean loss: 0.33988147836135996
Epoch: 64, step: 787, loss: 0.3128909766674042, mean loss: 0.3398811887761308
Epoch: 64, step: 788, loss: 0.34462711215019226, mean loss: 0.33988123969532374
Epoch: 64, step: 789, loss: 0.3339833617210388, mean loss: 0.3398811764174449
Epoch: 64, step: 790, loss: 0.3005058765411377, mean loss: 0.3398807539674157
Epoch: 64, step: 791, loss: 0.3290731906890869, mean loss: 0.3398806380163892
Epoch: 64, step: 792, loss: 0.32000866532325745, mean loss: 0.3398804248183858
Epoch: 64, step: 793, loss: 0.3220427632331848, mean loss: 0.3398802334477004
Epoch: 64, step: 794, loss: 0.36133208870887756, mean loss: 0.33988046359065843
Epoch: 64, step: 795, loss: 0.31796857714653015, mean loss: 0.339880228514848
Epoch: 64, step: 796, loss: 0.3825090825557709, mean loss: 0.3398806858421955
Epoch: 64, step: 797, loss: 0.344821959733963, mean loss: 0.33988073885219283
Epoch: 64, step: 798, loss: 0.3555115759372711, mean loss: 0.33988090653804903
Epoch: 64, step: 799, loss: 0.34007203578948975, mean loss: 0.33988090858844006
Epoch: 64, step: 800, loss: 0.32613667845726013, mean loss: 0.33988076114505383
Epoch: 64, step: 801, loss: 0.3658757209777832, mean loss: 0.3398810400070744
Epoch: 64, step: 802, loss: 0.3205045163631439, mean loss: 0.3398808321468352
Epoch: 64, step: 803, loss: 0.3276549279689789, mean loss: 0.3398807009957498
Epoch: 64, step: 804, loss: 0.3528378903865814, mean loss: 0.3398808399900686
Epoch: 64, step: 805, loss: 0.3282293677330017, mean loss: 0.33988071500377504
Epoch: 64, step: 806, loss: 0.3345864415168762, mean loss: 0.3398806582122806
Epoch: 64, step: 807, loss: 0.312499076128006, mean loss: 0.33988036449411696
Epoch: 64, step: 808, loss: 0.3187231421470642, mean loss: 0.3398801375461701
Epoch: 64, step: 809, loss: 0.3294253349304199, mean loss: 0.33988002540146134
Epoch: 64, step: 810, loss: 0.350659042596817, mean loss: 0.33988014102265685
Epoch: 64, step: 811, loss: 0.33388280868530273, mean loss: 0.33988007669292397
Epoch: 64, step: 812, loss: 0.3210658133029938, mean loss: 0.3398798748859391
Epoch: 64, step: 813, loss: 0.3399094045162201, mean loss: 0.3398798752026787
Epoch: 64, step: 814, loss: 0.3025517761707306, mean loss: 0.33987947481976927
Epoch: 64, step: 815, loss: 0.3427734971046448, mean loss: 0.33987950586085264
Epoch: 64, step: 816, loss: 0.32443544268608093, mean loss: 0.33987934021067323
Epoch: 64, step: 817, loss: 0.3438071012496948, mean loss: 0.33987938233866344
Epoch: 64, step: 818, loss: 0.33954647183418274, mean loss: 0.3398793787680032
Epoch: 64, step: 819, loss: 0.3509981334209442, mean loss: 0.3398794980218821
Epoch: 64, step: 820, loss: 0.3202853798866272, mean loss: 0.33987928786799326
Epoch: 64, step: 821, loss: 0.3415486216545105, mean loss: 0.3398793057720001
Epoch: 64, step: 822, loss: 0.3599284589290619, mean loss: 0.33987952080168893
Epoch: 64, step: 823, loss: 0.32128196954727173, mean loss: 0.3398793213427523
Epoch: 64, step: 824, loss: 0.29464828968048096, mean loss: 0.33987883624465526
Epoch: 64, step: 825, loss: 0.30606719851493835, mean loss: 0.33987847362225626
Epoch: 64, step: 826, loss: 0.33596935868263245, mean loss: 0.3398784316983055
Epoch: 64, step: 827, loss: 0.3247220814228058, mean loss: 0.3398782691532594
Epoch: 64, step: 828, loss: 0.3564147651195526, mean loss: 0.3398784464978459
Epoch: 64, step: 829, loss: 0.29824554920196533, mean loss: 0.33987800001330715
Epoch: 64, step: 830, loss: 0.31275105476379395, mean loss: 0.3398777090983689
Epoch: 64, step: 831, loss: 0.3691018521785736, mean loss: 0.3398780225007269
Epoch: 64, step: 832, loss: 0.32038500905036926, mean loss: 0.33987781345812645
Epoch: 64, step: 833, loss: 0.31220975518226624, mean loss: 0.3398775167497267
Epoch: 64, step: 834, loss: 0.363524854183197, mean loss: 0.33987777033775723
Epoch: 64, step: 835, loss: 0.30944743752479553, mean loss: 0.33987744401410935
Epoch: 64, step: 836, loss: 0.3164740204811096, mean loss: 0.33987719304713204
Epoch: 64, step: 837, loss: 0.3516681492328644, mean loss: 0.33987731948627875
Epoch: 64, step: 838, loss: 0.33433619141578674, mean loss: 0.33987726006717983
Epoch: 64, step: 839, loss: 0.33578863739967346, mean loss: 0.3398772162241813
Epoch: 64, step: 840, loss: 0.3011478781700134, mean loss: 0.3398768009273344
Epoch: 64, step: 841, loss: 0.31467607617378235, mean loss: 0.3398765307014583
Epoch: 64, step: 842, loss: 0.3181881904602051, mean loss: 0.3398762981411666
Epoch: 64, step: 843, loss: 0.3341292440891266, mean loss: 0.33987623651716864
Epoch: 64, step: 844, loss: 0.32478591799736023, mean loss: 0.33987607470978376
Epoch: 64, step: 845, loss: 0.30283451080322266, mean loss: 0.3398756775323277
Epoch: 64, step: 846, loss: 0.3068554997444153, mean loss: 0.3398753234779033
Epoch: 64, step: 847, loss: 0.3334294259548187, mean loss: 0.3398752543633733
Epoch: 64, step: 848, loss: 0.300136536359787, mean loss: 0.3398748282794404
Epoch: 64, step: 849, loss: 0.3286148011684418, mean loss: 0.3398747075491945
Epoch: 64, step: 850, loss: 0.3323064148426056, mean loss: 0.3398746264026721
Epoch: 64, step: 851, loss: 0.34273719787597656, mean loss: 0.33987465709456505
Epoch: 64, step: 852, loss: 0.37586528062820435, mean loss: 0.33987504297437005
Epoch: 64, step: 853, loss: 0.2922725975513458, mean loss: 0.33987453260184486
Epoch: 64, step: 854, loss: 0.3642129600048065, mean loss: 0.3398747935449826
Epoch: 64, step: 855, loss: 0.33719658851623535, mean loss: 0.3398747648310596
Epoch: 64, step: 856, loss: 0.3310962915420532, mean loss: 0.33987467071514943
Epoch: 64, step: 857, loss: 0.31515154242515564, mean loss: 0.3398744056559873
Epoch: 64, step: 858, loss: 0.3322264850139618, mean loss: 0.3398743236627346
Epoch: 64, step: 859, loss: 0.32956042885780334, mean loss: 0.33987421308879484
Epoch: 64, step: 860, loss: 0.33297014236450195, mean loss: 0.33987413907193403
Epoch: 64, step: 861, loss: 0.36255359649658203, mean loss: 0.339874382210267
Epoch: 64, step: 862, loss: 0.3594506084918976, mean loss: 0.3398745920777214
Epoch: 64, step: 863, loss: 0.35124945640563965, mean loss: 0.33987471402094965
Epoch: 64, step: 864, loss: 0.294599711894989, mean loss: 0.3398742286594921
Epoch: 64, step: 865, loss: 0.35844069719314575, mean loss: 0.3398744276954104
Epoch: 64, step: 866, loss: 0.3444505035877228, mean loss: 0.33987447675125004
Epoch: 64, step: 867, loss: 0.37934431433677673, mean loss: 0.3398748998660134
Epoch: 64, step: 868, loss: 0.3367116451263428, mean loss: 0.339874865956438
Epoch: 64, step: 869, loss: 0.341867595911026, mean loss: 0.33987488731794946
Epoch: 64, step: 870, loss: 0.42832863330841064, mean loss: 0.33987583550736483
Epoch: 64, step: 871, loss: 0.4048837125301361, mean loss: 0.3398765323588036
Epoch: 64, step: 872, loss: 0.3408312499523163, mean loss: 0.3398765425927818
Epoch: 64, step: 873, loss: 0.38585326075553894, mean loss: 0.3398770354292934
Epoch: 64, step: 874, loss: 0.35234156250953674, mean loss: 0.3398771690383991
Epoch: 64, step: 875, loss: 0.30920881032943726, mean loss: 0.3398768403032588
Epoch: 64, step: 876, loss: 0.31494539976119995, mean loss: 0.3398765730651966
Epoch: 64, step: 877, loss: 0.32638952136039734, mean loss: 0.3398764285001473
Epoch: 64, step: 878, loss: 0.3230848014354706, mean loss: 0.33987624851593523
Epoch: 64, step: 879, loss: 0.38026973605155945, mean loss: 0.3398766814764859
Epoch: 64, step: 880, loss: 0.41307762265205383, mean loss: 0.3398774660777183
Epoch: 64, step: 881, loss: 0.37328243255615234, mean loss: 0.3398778241236194
Epoch: 64, step: 882, loss: 0.3624477684497833, mean loss: 0.33987806603343973
Epoch: 64, step: 883, loss: 0.3356074392795563, mean loss: 0.339878020260377
Epoch: 64, step: 884, loss: 0.34968340396881104, mean loss: 0.3398781253544672
Epoch: 64, step: 885, loss: 0.3482227325439453, mean loss: 0.33987821479099795
Epoch: 64, step: 886, loss: 0.3476518988609314, mean loss: 0.339878298107548
Epoch: 64, step: 887, loss: 0.30925679206848145, mean loss: 0.33987796991683766
Epoch: 64, step: 888, loss: 0.2949357032775879, mean loss: 0.33987748824633085
Epoch: 64, step: 889, loss: 0.3279041349887848, mean loss: 0.33987735992282264
Epoch: 64, step: 890, loss: 0.3507010042667389, mean loss: 0.3398774759231693
Epoch: 64, step: 891, loss: 0.37610527873039246, mean loss: 0.33987786418358434
Epoch: 64, step: 892, loss: 0.3213801681995392, mean loss: 0.3398776659423002
Epoch: 64, step: 893, loss: 0.327560156583786, mean loss: 0.339877533935984
Epoch: 64, step: 894, loss: 0.3220154047012329, mean loss: 0.3398773425102225
Epoch: 64, step: 895, loss: 0.33333659172058105, mean loss: 0.3398772724147279
Epoch: 64, step: 896, loss: 0.35137802362442017, mean loss: 0.339877395663913
Epoch: 64, step: 897, loss: 0.3247200548648834, mean loss: 0.33987723323018604
Epoch: 64, step: 898, loss: 0.2914350628852844, mean loss: 0.33987671410496134
Epoch: 64, step: 899, loss: 0.3681524395942688, mean loss: 0.3398770171154364
Epoch: 64, step: 900, loss: 0.3246379792690277, mean loss: 0.3398768538114527
Epoch: 64, step: 901, loss: 0.3331577181816101, mean loss: 0.3398767818088848
Epoch: 64, step: 902, loss: 0.3088197708129883, mean loss: 0.33987644900408626
Epoch: 64, step: 903, loss: 0.34657415747642517, mean loss: 0.3398765207755015
Epoch: 64, step: 904, loss: 0.33373382687568665, mean loss: 0.33987645495222596
Epoch: 64, step: 905, loss: 0.32278183102607727, mean loss: 0.3398762717732979
Epoch: 64, step: 906, loss: 0.30392566323280334, mean loss: 0.33987588654555617
Epoch: 64, step: 907, loss: 0.3044857978820801, mean loss: 0.33987550732811306
Epoch: 64, step: 908, loss: 0.3353460431098938, mean loss: 0.3398754587938059
Epoch: 64, step: 909, loss: 0.31356289982795715, mean loss: 0.33987517685137864
Epoch: 64, step: 910, loss: 0.2885386347770691, mean loss: 0.33987462677967295
Epoch: 64, step: 911, loss: 0.3471698760986328, mean loss: 0.33987470494752525
Epoch: 64, step: 912, loss: 0.3742203712463379, mean loss: 0.339875072953893
Epoch: 64, step: 913, loss: 0.3458824157714844, mean loss: 0.33987513732057917
Epoch: 64, step: 914, loss: 0.3414860963821411, mean loss: 0.33987515458128637
Epoch: 64, step: 915, loss: 0.3717656135559082, mean loss: 0.33987549626965663
Epoch: 64, step: 916, loss: 0.3535782992839813, mean loss: 0.33987564308592755
Epoch: 64, step: 917, loss: 0.35471057891845703, mean loss: 0.3398758020305333
Epoch: 64, step: 918, loss: 0.30956459045410156, mean loss: 0.3398754772733514
Epoch: 64, step: 919, loss: 0.3210535943508148, mean loss: 0.3398752756160817
Epoch: 64, step: 920, loss: 0.3177246153354645, mean loss: 0.33987503829690197
Epoch: 64, step: 921, loss: 0.31869181990623474, mean loss: 0.33987481134519537
Epoch: 64, step: 922, loss: 0.3522510528564453, mean loss: 0.3398749439397326
Epoch: 64, step: 923, loss: 0.32742559909820557, mean loss: 0.3398748105634219
Epoch: 64, step: 924, loss: 0.3708733916282654, mean loss: 0.3398751426637965
Epoch: 64, step: 925, loss: 0.34787502884864807, mean loss: 0.33987522836890444
Epoch: 64, step: 926, loss: 0.34160515666007996, mean loss: 0.33987524690193094
Epoch: 64, step: 927, loss: 0.34067919850349426, mean loss: 0.33987525551471376
Epoch: 64, step: 928, loss: 0.30930131673812866, mean loss: 0.33987492797774044
Epoch: 64, step: 929, loss: 0.3613259196281433, mean loss: 0.33987515777860655
Epoch: 64, step: 930, loss: 0.36454492807388306, mean loss: 0.33987542205887583
Epoch: 64, step: 931, loss: 0.2926650643348694, mean loss: 0.33987491631308886
Epoch: 64, step: 932, loss: 0.31040462851524353, mean loss: 0.33987460061299785
Epoch: 64, step: 933, loss: 0.35651642084121704, mean loss: 0.33987477888638007
Epoch: 64, step: 934, loss: 0.3196773827075958, mean loss: 0.33987456252666054
Epoch: 64, step: 935, loss: 0.31163227558135986, mean loss: 0.33987425999123605
Epoch: 64, step: 936, loss: 0.340390145778656, mean loss: 0.33987426551741934
Epoch: 64, step: 937, loss: 0.3158115744590759, mean loss: 0.33987400775994714
Epoch: 64, step: 938, loss: 0.3505818247795105, mean loss: 0.33987412245993126
Epoch: 64, step: 939, loss: 0.3774346709251404, mean loss: 0.33987452479666874
Epoch: 64, step: 940, loss: 0.30871057510375977, mean loss: 0.3398741909818536
Epoch: 64, step: 941, loss: 0.33628734946250916, mean loss: 0.3398741525615627
Epoch: 64, step: 942, loss: 0.31072187423706055, mean loss: 0.339873840301595
Epoch: 64, step: 943, loss: 0.3609660565853119, mean loss: 0.33987406622507704
Epoch: 64, step: 944, loss: 0.36683157086372375, mean loss: 0.33987435496989166
Epoch: 64, step: 945, loss: 0.3220180571079254, mean loss: 0.3398741637111583
Epoch: 64, step: 946, loss: 0.3069733679294586, mean loss: 0.33987381131464384
Epoch: 64, step: 947, loss: 0.3308238685131073, mean loss: 0.33987371438282
Epoch: 64, step: 948, loss: 0.33755117654800415, mean loss: 0.3398736895069261
Epoch: 64, step: 949, loss: 0.331384539604187, mean loss: 0.33987359858357175
Epoch: 64, step: 950, loss: 0.33685776591300964, mean loss: 0.33987356628273024
Epoch: 64, step: 951, loss: 0.3541739583015442, mean loss: 0.3398737194443276
Epoch: 64, step: 952, loss: 0.3148006200790405, mean loss: 0.33987345090659704
Epoch: 64, step: 953, loss: 0.3438416123390198, mean loss: 0.3398734934059162
Epoch: 64, step: 954, loss: 0.3566875159740448, mean loss: 0.33987367348348385
Epoch: 64, step: 955, loss: 0.3297399878501892, mean loss: 0.33987356495324317
Epoch: 64, step: 956, loss: 0.31116539239883423, mean loss: 0.3398732574963493
Epoch: 64, step: 957, loss: 0.3417931795120239, mean loss: 0.3398732780579833
Epoch: 64, step: 958, loss: 0.33482176065444946, mean loss: 0.339873223958734
Epoch: 64, step: 959, loss: 0.38208457827568054, mean loss: 0.3398736760165895
Epoch: 64, step: 960, loss: 0.32480427622795105, mean loss: 0.33987351463423854
Epoch: 64, step: 961, loss: 0.32277122139930725, mean loss: 0.3398733314830334
Epoch: 64, step: 962, loss: 0.3254844546318054, mean loss: 0.33987317739189027
Epoch: 64, step: 963, loss: 0.3684045970439911, mean loss: 0.33987348293290176
Epoch: 64, step: 964, loss: 0.36141297221183777, mean loss: 0.3398737135953414
Epoch: 64, step: 965, loss: 0.3566255271434784, mean loss: 0.33987389298551884
Epoch: 64, step: 966, loss: 0.349137544631958, mean loss: 0.33987399218614045
Epoch: 64, step: 967, loss: 0.34749528765678406, mean loss: 0.33987407379857376
Epoch: 64, step: 968, loss: 0.36103010177612305, mean loss: 0.3398743003448925
Epoch: 64, step: 969, loss: 0.2904324233531952, mean loss: 0.33987377090924914
Epoch: 64, step: 970, loss: 0.3359431326389313, mean loss: 0.3398737288194693
Epoch: 64, step: 971, loss: 0.315950870513916, mean loss: 0.3398734726531706
Epoch: 64, step: 972, loss: 0.35370802879333496, mean loss: 0.33987362079220346
Epoch: 64, step: 973, loss: 0.3585807681083679, mean loss: 0.33987382110430664
Epoch: 64, step: 974, loss: 0.3448602855205536, mean loss: 0.3398738744977216
Epoch: 64, step: 975, loss: 0.3399013876914978, mean loss: 0.3398738747923207
Epoch: 64, step: 976, loss: 0.36436283588409424, mean loss: 0.33987413700641694
Epoch: 64, step: 977, loss: 0.3476487994194031, mean loss: 0.33987422025226155
Epoch: 64, step: 978, loss: 0.3473567068576813, mean loss: 0.3398743003688267
Epoch: 64, step: 979, loss: 0.29424548149108887, mean loss: 0.3398738118166523
Epoch: 64, step: 980, loss: 0.3399912416934967, mean loss: 0.3398738130739719
Epoch: 64, step: 981, loss: 0.37284165620803833, mean loss: 0.3398741660562963
Epoch: 64, step: 982, loss: 0.3207961320877075, mean loss: 0.3398739617925036
Epoch: 64, step: 983, loss: 0.3159525394439697, mean loss: 0.3398737056744913
Epoch: 64, step: 984, loss: 0.3364008665084839, mean loss: 0.33987366849245726
Epoch: 64, step: 985, loss: 0.34350794553756714, mean loss: 0.3398737074025132
Epoch: 64, step: 986, loss: 0.35898324847221375, mean loss: 0.33987391199488254
Epoch: 64, step: 987, loss: 0.344186931848526, mean loss: 0.33987395817084776
Epoch: 64, step: 988, loss: 0.3423445224761963, mean loss: 0.33987398462086976
Epoch: 64, step: 989, loss: 0.31729656457901, mean loss: 0.3398737429081314
Epoch: 64, step: 990, loss: 0.3381057679653168, mean loss: 0.33987372398048205
Epoch: 64, step: 991, loss: 0.34862375259399414, mean loss: 0.33987381765584834
Epoch: 64, step: 992, loss: 0.33509328961372375, mean loss: 0.33987376647739614
Epoch: 64, step: 993, loss: 0.34858742356300354, mean loss: 0.3398738597613816
Epoch: 64, step: 994, loss: 0.3679221272468567, mean loss: 0.339874160028668
Epoch: 64, step: 995, loss: 0.3114837408065796, mean loss: 0.33987385610177184
Epoch: 64, step: 996, loss: 0.352057546377182, mean loss: 0.33987398652998074
Epoch: 64, step: 997, loss: 0.3205873668193817, mean loss: 0.3398737800660705
Epoch: 64, step: 998, loss: 0.32705703377723694, mean loss: 0.3398736428638408
Epoch: 64, step: 999, loss: 0.3098539710044861, mean loss: 0.3398733215091279
Epoch: 64, step: 1000, loss: 0.3644576370716095, mean loss: 0.3398735846765981
Epoch: 64, step: 1001, loss: 0.33006829023361206, mean loss: 0.339873479715087
Epoch: 64, step: 1002, loss: 0.37479376792907715, mean loss: 0.33987385351793453
Epoch: 64, step: 1003, loss: 0.32043060660362244, mean loss: 0.33987364539069287
Epoch: 64, step: 1004, loss: 0.3740735650062561, mean loss: 0.3398740114745457
Epoch: 64, step: 1005, loss: 0.333738774061203, mean loss: 0.33987394580224783
Epoch: 64, step: 1006, loss: 0.31318897008895874, mean loss: 0.3398736601662084
Epoch: 64, step: 1007, loss: 0.3816990256309509, mean loss: 0.3398741078602213
Epoch: 64, step: 1008, loss: 0.3689965605735779, mean loss: 0.3398744195803467
Epoch: 64, step: 1009, loss: 0.3078092336654663, mean loss: 0.3398740763655466
Epoch: 64, step: 1010, loss: 0.31305983662605286, mean loss: 0.33987378935815327
Epoch: 64, step: 1011, loss: 0.31743699312210083, mean loss: 0.33987354920748925
Epoch: 64, step: 1012, loss: 0.33221638202667236, mean loss: 0.3398734672504183
Epoch: 64, step: 1013, loss: 0.35685551166534424, mean loss: 0.33987364901264044
Epoch: 64, step: 1014, loss: 0.3166747987270355, mean loss: 0.3398734007133577
Epoch: 64, step: 1015, loss: 0.3496711254119873, mean loss: 0.33987350557812246
Epoch: 64, step: 1016, loss: 0.3235325217247009, mean loss: 0.3398733306829157
Epoch: 64, step: 1017, loss: 0.2764286696910858, mean loss: 0.3398726516510751
Epoch: 64, step: 1018, loss: 0.3158605694770813, mean loss: 0.3398723946587042
Epoch: 64, step: 1019, loss: 0.3708607256412506, mean loss: 0.3398727263117179
Epoch: 64, step: 1020, loss: 0.3241117000579834, mean loss: 0.3398725576309356
Epoch: 64, step: 1021, loss: 0.3487556278705597, mean loss: 0.33987265270007494
Epoch: 64, step: 1022, loss: 0.3154434859752655, mean loss: 0.3398723912549961
Epoch: 64, step: 1023, loss: 0.31175971031188965, mean loss: 0.3398720903915442
Epoch: 64, step: 1024, loss: 0.3712932765483856, mean loss: 0.3398724266592014
Epoch: 64, step: 1025, loss: 0.31831708550453186, mean loss: 0.3398721959776968
Epoch: 64, step: 1026, loss: 0.3446948230266571, mean loss: 0.33987224758805873
Epoch: 64, step: 1027, loss: 0.36388659477233887, mean loss: 0.3398725045799168
Epoch: 64, step: 1028, loss: 0.3075709044933319, mean loss: 0.3398721589049199
Epoch: 64, step: 1029, loss: 0.3277820646762848, mean loss: 0.33987202952437684
Epoch: 64, step: 1030, loss: 0.33727914094924927, mean loss: 0.3398720017772199
Epoch: 64, step: 1031, loss: 0.30361855030059814, mean loss: 0.3398716138240109
Epoch: 64, step: 1032, loss: 0.3306734263896942, mean loss: 0.3398715153939856
Epoch: 64, step: 1033, loss: 0.3279918432235718, mean loss: 0.33987138827068786
Epoch: 64, step: 1034, loss: 0.329899400472641, mean loss: 0.33987128156249
Epoch: 64, step: 1035, loss: 0.32197967171669006, mean loss: 0.3398710901100883
Epoch: 64, step: 1036, loss: 0.3307051658630371, mean loss: 0.33987099202951043
Epoch: 64, step: 1037, loss: 0.3231160640716553, mean loss: 0.33987081274421543
Epoch: 64, step: 1038, loss: 0.2990432679653168, mean loss: 0.33987037587572494
Epoch: 64, step: 1039, loss: 0.3555857241153717, mean loss: 0.3398705440334488
Epoch: 64, step: 1040, loss: 0.2968102693557739, mean loss: 0.33987008328385615
Epoch: 64, step: 1041, loss: 0.33888640999794006, mean loss: 0.3398700727585583
Epoch: 64, step: 1042, loss: 0.3291061818599701, mean loss: 0.3398699575862271
Epoch: 64, step: 1043, loss: 0.32098188996315, mean loss: 0.3398697554883497
Epoch: 64, step: 1044, loss: 0.31991297006607056, mean loss: 0.3398695419577281
Epoch: 64, step: 1045, loss: 0.35902708768844604, mean loss: 0.33986974693457145
Epoch: 64, step: 1046, loss: 0.29359331727027893, mean loss: 0.33986925180356065
Epoch: 64, step: 1047, loss: 0.3296626806259155, mean loss: 0.3398691426003254
Epoch: 64, step: 1048, loss: 0.30103984475135803, mean loss: 0.3398687271582043
Epoch: 64, step: 1049, loss: 0.33614233136177063, mean loss: 0.339868687289206
Epoch: 64, step: 1050, loss: 0.3486767113208771, mean loss: 0.3398687815259316
Epoch: 64, step: 1051, loss: 0.29852792620658875, mean loss: 0.3398683392263711
Epoch: 64, step: 1052, loss: 0.3430534601211548, mean loss: 0.3398683733031334
Epoch: 64, step: 1053, loss: 0.3404272496700287, mean loss: 0.3398683792823392
Epoch: 64, step: 1054, loss: 0.374957412481308, mean loss: 0.339868754682551
Epoch: 64, step: 1055, loss: 0.3384135961532593, mean loss: 0.3398687391146962
Epoch: 64, step: 1056, loss: 0.3139122426509857, mean loss: 0.33986846142491983
Epoch: 64, step: 1057, loss: 0.33664846420288086, mean loss: 0.33986842697686775
Epoch: 64, step: 1058, loss: 0.36581873893737793, mean loss: 0.3398687045945405
Epoch: 64, step: 1059, loss: 0.32848429679870605, mean loss: 0.33986858280490684
Epoch: 64, step: 1060, loss: 0.30670851469039917, mean loss: 0.33986822806450956
Epoch: 64, step: 1061, loss: 0.3243272304534912, mean loss: 0.339868061811513
Epoch: 64, step: 1062, loss: 0.34183791279792786, mean loss: 0.3398680828841709
Epoch: 64, step: 1063, loss: 0.3227984607219696, mean loss: 0.33986790028230784
Epoch: 64, step: 1064, loss: 0.3882957696914673, mean loss: 0.3398684183327075
Epoch: 64, step: 1065, loss: 0.41611313819885254, mean loss: 0.3398692339412724
Epoch: 64, step: 1066, loss: 0.3588654398918152, mean loss: 0.33986943714619683
Epoch: 64, step: 1067, loss: 0.3413792848587036, mean loss: 0.33986945329706447
Epoch: 64, step: 1068, loss: 0.4061962366104126, mean loss: 0.3398701627882482
Epoch: 64, step: 1069, loss: 0.3723194897174835, mean loss: 0.33987050989184586
Epoch: 64, step: 1070, loss: 0.30960649251937866, mean loss: 0.33987018616750586
Epoch: 64, step: 1071, loss: 0.3079695999622345, mean loss: 0.33986984494097194
Epoch: 64, step: 1072, loss: 0.3214474618434906, mean loss: 0.33986964788695384
Epoch: 64, step: 1073, loss: 0.3587867319583893, mean loss: 0.3398698502303496
Epoch: 64, step: 1074, loss: 0.34694382548332214, mean loss: 0.33986992589512216
Epoch: 64, step: 1075, loss: 0.3201266825199127, mean loss: 0.3398697147193705
Epoch: 64, step: 1076, loss: 0.32449713349342346, mean loss: 0.33986955029442717
Epoch: 64, step: 1077, loss: 0.31972411274909973, mean loss: 0.33986933482137494
Epoch: 64, step: 1078, loss: 0.32619181275367737, mean loss: 0.3398691885298934
Epoch: 64, step: 1079, loss: 0.3336452543735504, mean loss: 0.3398691219609048
Epoch: 64, step: 1080, loss: 0.3273848295211792, mean loss: 0.33986898843477625
Epoch: 64, step: 1081, loss: 0.3175480365753174, mean loss: 0.3398687497029118
Epoch: 64, step: 1082, loss: 0.32028546929359436, mean loss: 0.3398685402538224
Epoch: 64, step: 1083, loss: 0.32064881920814514, mean loss: 0.3398683346953085
Epoch: 64, step: 1084, loss: 0.3087363839149475, mean loss: 0.33986800173682913
Epoch: 64, step: 1085, loss: 0.35580822825431824, mean loss: 0.3398681722168886
Epoch: 64, step: 1086, loss: 0.35983482003211975, mean loss: 0.3398683857570725
Epoch: 64, step: 1087, loss: 0.3396093249320984, mean loss: 0.339868382986487
Epoch: 64, step: 1088, loss: 0.36161476373672485, mean loss: 0.3398686155556625
Epoch: 64, step: 1089, loss: 0.32989877462387085, mean loss: 0.3398685089331898
Epoch: 64, step: 1090, loss: 0.4103797674179077, mean loss: 0.3398692630078418
Epoch: 64, step: 1091, loss: 0.3081809878349304, mean loss: 0.33986892412480324
Epoch: 64, step: 1092, loss: 0.35274454951286316, mean loss: 0.3398690618187727
Epoch: 64, step: 1093, loss: 0.2977464497089386, mean loss: 0.3398686113577299
Epoch: 64, step: 1094, loss: 0.3122960329055786, mean loss: 0.339868316498532
Epoch: 64, step: 1095, loss: 0.2993784248828888, mean loss: 0.3398678835071339
Epoch: 64, step: 1096, loss: 0.32210293412208557, mean loss: 0.33986769353408863
Epoch: 64, step: 1097, loss: 0.3099217414855957, mean loss: 0.3398673733044754
Epoch: 64, step: 1098, loss: 0.3410782516002655, mean loss: 0.33986738625296814
Epoch: 64, step: 1099, loss: 0.3536546230316162, mean loss: 0.339867533684817
Epoch: 64, step: 1100, loss: 0.3683309555053711, mean loss: 0.3398678380511014
Epoch: 64, step: 1101, loss: 0.32929566502571106, mean loss: 0.3398677250014957
Epoch: 64, step: 1102, loss: 0.32789576053619385, mean loss: 0.33986759698510904
Epoch: 64, step: 1103, loss: 0.347189337015152, mean loss: 0.3398676752757424
Epoch: 64, step: 1104, loss: 0.32304418087005615, mean loss: 0.3398674953857241
Epoch: 64, step: 1105, loss: 0.30475300550460815, mean loss: 0.3398671199180279
Epoch: 64, step: 1106, loss: 0.39488306641578674, mean loss: 0.3398677081791669
Epoch: 64, step: 1107, loss: 0.31728750467300415, mean loss: 0.3398674667416374
Epoch: 64, step: 1108, loss: 0.3417966365814209, mean loss: 0.3398674873689546
Epoch: 64, step: 1109, loss: 0.35935917496681213, mean loss: 0.33986769577824827
Epoch: 64, step: 1110, loss: 0.3455335795879364, mean loss: 0.33986775635844235
Epoch: 64, step: 1111, loss: 0.34263819456100464, mean loss: 0.33986778597992684
Epoch: 64, step: 1112, loss: 0.35888227820396423, mean loss: 0.3398679892804243
Epoch: 64, step: 1113, loss: 0.3325720727443695, mean loss: 0.3398679112742601
Epoch: 64, step: 1114, loss: 0.33471521735191345, mean loss: 0.3398678561834996
Epoch: 64, step: 1115, loss: 0.3140440881252289, mean loss: 0.3398675800879595
Epoch: 64, step: 1116, loss: 0.32361072301864624, mean loss: 0.33986740627917467
Epoch: 64, step: 1117, loss: 0.30536919832229614, mean loss: 0.33986703744850394
Epoch: 64, step: 1118, loss: 0.3102880120277405, mean loss: 0.33986672121366757
Epoch: 64, step: 1119, loss: 0.3166186511516571, mean loss: 0.3398664726669042
Epoch: 64, step: 1120, loss: 0.32783207297325134, mean loss: 0.3398663440076603
Epoch: 64, step: 1121, loss: 0.3333382308483124, mean loss: 0.3398662742166325
Epoch: 64, step: 1122, loss: 0.3161172568798065, mean loss: 0.3398660203223495
Epoch: 64, step: 1123, loss: 0.28489238023757935, mean loss: 0.3398654326204029
Epoch: 64, step: 1124, loss: 0.29067012667655945, mean loss: 0.33986490669801656
Epoch: 64, step: 1125, loss: 0.31452542543411255, mean loss: 0.33986463580920445
Epoch: 64, step: 1126, loss: 0.33104896545410156, mean loss: 0.3398645415673012
Epoch: 64, step: 1127, loss: 0.36348268389701843, mean loss: 0.33986479404893905
Epoch: 64, step: 1128, loss: 0.3164297938346863, mean loss: 0.3398645435277972
Epoch: 64, step: 1129, loss: 0.3100462853908539, mean loss: 0.3398642247727661
Epoch: 64, step: 1130, loss: 0.31888777017593384, mean loss: 0.3398640005383749
Epoch: 64, step: 1131, loss: 0.317006915807724, mean loss: 0.33986375620300985
Epoch: 64, step: 1132, loss: 0.2885152995586395, mean loss: 0.3398632073093109
Epoch: 64, step: 1133, loss: 0.3619394600391388, mean loss: 0.3398634432927714
Epoch: 64, step: 1134, loss: 0.29656893014907837, mean loss: 0.33986298050228125
Epoch: 64, step: 1135, loss: 0.3664160370826721, mean loss: 0.33986326433433806
Epoch: 64, step: 1136, loss: 0.3405478000640869, mean loss: 0.33986327165142816
Epoch: 64, step: 1137, loss: 0.3365497589111328, mean loss: 0.33986323623324466
Epoch: 64, step: 1138, loss: 0.31835317611694336, mean loss: 0.33986300631437216
Epoch: 64, step: 1139, loss: 0.34829509258270264, mean loss: 0.3398630964431321
Epoch: 64, step: 1140, loss: 0.2862764000892639, mean loss: 0.33986252367256065
Epoch: 64, step: 1141, loss: 0.3303399682044983, mean loss: 0.33986242189018534
Epoch: 64, step: 1142, loss: 0.3462660610675812, mean loss: 0.339862490335115
Epoch: 64, step: 1143, loss: 0.32549652457237244, mean loss: 0.33986233678695593
Epoch: 64, step: 1144, loss: 0.338960200548172, mean loss: 0.33986232714473064
Epoch: 64, step: 1145, loss: 0.3313683867454529, mean loss: 0.3398622363606474
Epoch: 64, step: 1146, loss: 0.3258570730686188, mean loss: 0.3398620866736633
Epoch: 64, step: 1147, loss: 0.3279151916503906, mean loss: 0.3398619589867856
Epoch: 64, step: 1148, loss: 0.33081862330436707, mean loss: 0.33986186233380977
Epoch: 64, step: 1149, loss: 0.3168245255947113, mean loss: 0.33986161611898025
Epoch: 64, step: 1150, loss: 0.3740262985229492, mean loss: 0.3398619812550047
Epoch: 64, step: 1151, loss: 0.33027270436286926, mean loss: 0.33986187877042784
Epoch: 64, step: 1152, loss: 0.29850080609321594, mean loss: 0.3398614367322242
Epoch: 64, step: 1153, loss: 0.32207268476486206, mean loss: 0.3398612466205221
Epoch: 64, step: 1154, loss: 0.2952103316783905, mean loss: 0.339860769432986
Epoch: 64, step: 1155, loss: 0.32135647535324097, mean loss: 0.3398605716783791
Epoch: 64, step: 1156, loss: 0.317404568195343, mean loss: 0.33986033169458585
Epoch: 64, step: 1157, loss: 0.3049132525920868, mean loss: 0.33985995822461446
Epoch: 64, step: 1158, loss: 0.345461905002594, mean loss: 0.339860018090463
Epoch: 64, step: 1159, loss: 0.3325396776199341, mean loss: 0.33985993986163865
Epoch: 64, step: 1160, loss: 0.3481290936470032, mean loss: 0.33986002822901296
Epoch: 64, step: 1161, loss: 0.37371137738227844, mean loss: 0.3398603899737516
Epoch: 64, step: 1162, loss: 0.36971554160118103, mean loss: 0.3398607090106256
Epoch: 64, step: 1163, loss: 0.3482603430747986, mean loss: 0.339860798769485
Epoch: 64, step: 1164, loss: 0.318742573261261, mean loss: 0.33986057310160894
Epoch: 64, step: 1165, loss: 0.3483964800834656, mean loss: 0.3398606643147373
Epoch: 64, step: 1166, loss: 0.29851284623146057, mean loss: 0.33986022248429715
Epoch: 64, step: 1167, loss: 0.3352237045764923, mean loss: 0.33986017294038035
Epoch: 64, step: 1168, loss: 0.3138292729854584, mean loss: 0.33985989478789913
Epoch: 64, step: 1169, loss: 0.33857277035713196, mean loss: 0.3398598810345126
Epoch: 64, step: 1170, loss: 0.3287404477596283, mean loss: 0.3398597622206466
Epoch: 64, step: 1171, loss: 0.3327997028827667, mean loss: 0.3398596867829907
Epoch: 64, step: 1172, loss: 0.33332815766334534, mean loss: 0.33985961699349493
Epoch: 64, step: 1173, loss: 0.30977216362953186, mean loss: 0.3398592955119973
Epoch: 64, step: 1174, loss: 0.3196577727794647, mean loss: 0.33985907966300827
Epoch: 64, step: 1175, loss: 0.3127790093421936, mean loss: 0.3398587903212876
Epoch: 64, step: 1176, loss: 0.3120846748352051, mean loss: 0.33985849356709136
Epoch: 64, step: 1177, loss: 0.33279716968536377, mean loss: 0.3398584181207606
Epoch: 64, step: 1178, loss: 0.3835652470588684, mean loss: 0.33985888509900664
Epoch: 64, step: 1179, loss: 0.366692453622818, mean loss: 0.339859171794683
Epoch: 64, step: 1180, loss: 0.3249039947986603, mean loss: 0.3398590120120297
Epoch: 64, step: 1181, loss: 0.3416679799556732, mean loss: 0.3398590313390233
Epoch: 64, step: 1182, loss: 0.3592519164085388, mean loss: 0.3398592385301799
Epoch: 64, step: 1183, loss: 0.31930771470069885, mean loss: 0.3398590189626176
Epoch: 64, step: 1184, loss: 0.30621084570884705, mean loss: 0.33985865947742777
Epoch: 64, step: 1185, loss: 0.30668947100639343, mean loss: 0.33985830511332793
Epoch: 64, step: 1186, loss: 0.3160529136657715, mean loss: 0.3398580507903741
Epoch: 64, step: 1187, loss: 0.3682520091533661, mean loss: 0.3398583541316668
Epoch: 64, step: 1188, loss: 0.333769291639328, mean loss: 0.3398582890810553
Epoch: 64, step: 1189, loss: 0.30294081568717957, mean loss: 0.33985789468888605
Epoch: 64, step: 1190, loss: 0.318146675825119, mean loss: 0.3398576627487655
Epoch: 64, step: 1191, loss: 0.3239760398864746, mean loss: 0.3398574930878085
Epoch: 64, step: 1192, loss: 0.3388688266277313, mean loss: 0.33985748252614817
Epoch: 64, step: 1193, loss: 0.34162381291389465, mean loss: 0.3398575013951834
Epoch: 64, step: 1194, loss: 0.3197607398033142, mean loss: 0.33985728671142196
Epoch: 64, step: 1195, loss: 0.32503488659858704, mean loss: 0.33985712837274623
Epoch: 64, step: 1196, loss: 0.34220731258392334, mean loss: 0.33985715347806505
Epoch: 64, step: 1197, loss: 0.32828396558761597, mean loss: 0.33985702985138644
Epoch: 64, step: 1198, loss: 0.3366442918777466, mean loss: 0.33985699553276255
Epoch: 64, step: 1199, loss: 0.33531835675239563, mean loss: 0.3398569470513194
Epoch: 64, step: 1200, loss: 0.32231613993644714, mean loss: 0.3398567596835645
Epoch: 64, step: 1201, loss: 0.31253060698509216, mean loss: 0.33985646779362133
Epoch: 64, step: 1202, loss: 0.3314289152622223, mean loss: 0.3398563777739402
Epoch: 64, step: 1203, loss: 0.31291118264198303, mean loss: 0.3398560899594226
Epoch: 64, step: 1204, loss: 0.3211890459060669, mean loss: 0.3398558905699261
Epoch: 64, step: 1205, loss: 0.35203874111175537, mean loss: 0.3398560206980001
Epoch: 64, step: 1206, loss: 0.3424942195415497, mean loss: 0.33985604887696086
Epoch: 64, step: 1207, loss: 0.33859893679618835, mean loss: 0.3398560354497191
Epoch: 64, step: 1208, loss: 0.3761482238769531, mean loss: 0.3398564230832403
Epoch: 64, step: 1209, loss: 0.3418966829776764, mean loss: 0.3398564448748356
Epoch: 64, step: 1210, loss: 0.31897470355033875, mean loss: 0.3398562218436445
Epoch: 64, step: 1211, loss: 0.3347361087799072, mean loss: 0.3398561671579408
Epoch: 64, step: 1212, loss: 0.3292468786239624, mean loss: 0.3398560538459484
Epoch: 64, step: 1213, loss: 0.32929977774620056, mean loss: 0.3398559411013569
Epoch: 64, step: 1214, loss: 0.3318513333797455, mean loss: 0.33985585561035797
Epoch: 64, step: 1215, loss: 0.3177322447299957, mean loss: 0.33985561932777425
Epoch: 64, step: 1216, loss: 0.3166038393974304, mean loss: 0.33985537099887386
Epoch: 64, step: 1217, loss: 0.35636672377586365, mean loss: 0.33985554733816065
Epoch: 64, step: 1218, loss: 0.2750679552555084, mean loss: 0.33985485542176097
Epoch: 64, step: 1219, loss: 0.3672090470790863, mean loss: 0.33985514755503937
Epoch: 64, step: 1220, loss: 0.31181174516677856, mean loss: 0.3398548480644279
Epoch: 64, step: 1221, loss: 0.3094172775745392, mean loss: 0.3398545230086761
Epoch: 64, step: 1222, loss: 0.34395453333854675, mean loss: 0.33985456679396137
Epoch: 64, step: 1223, loss: 0.3127928376197815, mean loss: 0.3398542777964264
Epoch: 64, step: 1224, loss: 0.3113529086112976, mean loss: 0.33985397342794266
Epoch: 64, step: 1225, loss: 0.33165472745895386, mean loss: 0.33985388586845044
Epoch: 64, step: 1226, loss: 0.3082472085952759, mean loss: 0.33985354834533316
Epoch: 64, step: 1227, loss: 0.3557169437408447, mean loss: 0.3398537177464202
Epoch: 64, step: 1228, loss: 0.35084742307662964, mean loss: 0.3398538351440958
Epoch: 64, step: 1229, loss: 0.3138262629508972, mean loss: 0.33985355720833565
Epoch: 64, step: 1230, loss: 0.3354506194591522, mean loss: 0.33985351019201104
Epoch: 64, step: 1231, loss: 0.36319002509117126, mean loss: 0.33985375938595963
Epoch: 64, step: 1232, loss: 0.36420273780822754, mean loss: 0.33985401938850557
Epoch: 64, step: 1233, loss: 0.31500688195228577, mean loss: 0.33985375406936585
Epoch: 64, step: 1234, loss: 0.3919636905193329, mean loss: 0.3398543104962748
Epoch: 64, step: 1235, loss: 0.31097009778022766, mean loss: 0.3398540020756034
Epoch: 64, step: 1236, loss: 0.3178146183490753, mean loss: 0.3398537667453553
Epoch: 64, step: 1237, loss: 0.3281310200691223, mean loss: 0.33985364157454917
Epoch: 64, step: 1238, loss: 0.3168639540672302, mean loss: 0.33985339610247073
Epoch: 64, step: 1239, loss: 0.35961103439331055, mean loss: 0.33985360706213474
Epoch: 64, step: 1240, loss: 0.3479927182197571, mean loss: 0.3398536939655286
Epoch: 64, step: 1241, loss: 0.3669491410255432, mean loss: 0.3398539832675323
Epoch: 64, step: 1242, loss: 0.330763578414917, mean loss: 0.3398538862090024
Epoch: 64, step: 1243, loss: 0.30197519063949585, mean loss: 0.33985348178133246
Epoch: 64, step: 1244, loss: 0.35711923241615295, mean loss: 0.3398536661243422
Epoch: 64, step: 1245, loss: 0.3185592591762543, mean loss: 0.33985343877059204
Epoch: 64, step: 1246, loss: 0.3111005425453186, mean loss: 0.33985313178815263
Epoch: 64, step: 1247, loss: 0.3253975808620453, mean loss: 0.3398529774540336
Epoch: 64, step: 1248, loss: 0.30877259373664856, mean loss: 0.33985264562908596
Epoch: 64, step: 1249, loss: 0.3767768442630768, mean loss: 0.3398530398404181
Epoch: 64, step: 1250, loss: 0.32121652364730835, mean loss: 0.3398528408747611
Epoch: 64, step: 1251, loss: 0.31367629766464233, mean loss: 0.33985256141386505
Epoch: 64, step: 1252, loss: 0.3588571548461914, mean loss: 0.33985276430482614
Epoch: 64, step: 1253, loss: 0.33090171217918396, mean loss: 0.33985266874539277
Epoch: 64, step: 1254, loss: 0.34086480736732483, mean loss: 0.3398526795506433
Epoch: 64, step: 1255, loss: 0.34213992953300476, mean loss: 0.3398527039682919
Epoch: 64, step: 1256, loss: 0.33612555265426636, mean loss: 0.33985266417933124
Epoch: 64, step: 1257, loss: 0.33307790756225586, mean loss: 0.3398525918566311
Epoch: 64, step: 1258, loss: 0.35324791073799133, mean loss: 0.33985273485443074
Epoch: 64, step: 1259, loss: 0.36072349548339844, mean loss: 0.3398529576517388
Epoch: 64, step: 1260, loss: 0.3535768985748291, mean loss: 0.3398531041545188
Epoch: 64, step: 1261, loss: 0.3382725715637207, mean loss: 0.3398530872825468
Epoch: 64, step: 1262, loss: 0.3334392011165619, mean loss: 0.33985301881590896
Epoch: 64, step: 1263, loss: 0.33477845788002014, mean loss: 0.3398529646468127
Epoch: 64, step: 1264, loss: 0.31591540575027466, mean loss: 0.33985270912478693
Epoch: 64, step: 1265, loss: 0.3856847286224365, mean loss: 0.3398531983545162
Epoch: 64, step: 1266, loss: 0.32933562994003296, mean loss: 0.33985308608688586
Epoch: 64, step: 1267, loss: 0.31945058703422546, mean loss: 0.3398528683069122
Epoch: 64, step: 1268, loss: 0.35075056552886963, mean loss: 0.33985298462966634
Epoch: 64, step: 1269, loss: 0.30846482515335083, mean loss: 0.3398526495939142
Epoch: 64, step: 1270, loss: 0.3693033456802368, mean loss: 0.339852963945917
Epoch: 64, step: 1271, loss: 0.3484969735145569, mean loss: 0.33985305620970285
Epoch: 64, step: 1272, loss: 0.33369532227516174, mean loss: 0.33985299048444234
Epoch: 64, step: 1273, loss: 0.30904144048690796, mean loss: 0.33985266161743416
Epoch: 64, step: 1274, loss: 0.3464064598083496, mean loss: 0.3398527315686375
Epoch: 64, step: 1275, loss: 0.33063504099845886, mean loss: 0.3398526331857385
Epoch: 64, step: 1276, loss: 0.3336065411567688, mean loss: 0.3398525665202242
Epoch: 64, step: 1277, loss: 0.3309628367424011, mean loss: 0.3398524716397647
Epoch: 64, step: 1278, loss: 0.3614422082901001, mean loss: 0.339852702065472
Epoch: 64, step: 1279, loss: 0.3488510251045227, mean loss: 0.339852798102902
Epoch: 64, step: 1280, loss: 0.34287774562835693, mean loss: 0.33985283038726033
Epoch: 64, step: 1281, loss: 0.31605467200279236, mean loss: 0.33985257639935895
Epoch: 64, step: 1282, loss: 0.2988380491733551, mean loss: 0.3398521386729454
Epoch: 64, step: 1283, loss: 0.3083001375198364, mean loss: 0.3398518019386748
Epoch: 64, step: 1284, loss: 0.3612687289714813, mean loss: 0.33985203050536067
Epoch: 64, step: 1285, loss: 0.3577069342136383, mean loss: 0.33985222105522844
Epoch: 64, step: 1286, loss: 0.33222466707229614, mean loss: 0.3398521396538434
Epoch: 64, step: 1287, loss: 0.324978232383728, mean loss: 0.3398519809209476
Epoch: 64, step: 1288, loss: 0.33998915553092957, mean loss: 0.3398519823848461
Epoch: 64, step: 1289, loss: 0.32629144191741943, mean loss: 0.33985183767116217
Epoch: 64, step: 1290, loss: 0.3664473593235016, mean loss: 0.3398521214869033
Epoch: 64, step: 1291, loss: 0.314195841550827, mean loss: 0.33985184769725957
Epoch: 64, step: 1292, loss: 0.2894692122936249, mean loss: 0.3398513100473497
Epoch: 64, step: 1293, loss: 0.34855106472969055, mean loss: 0.3398514028843434
Epoch: 64, step: 1294, loss: 0.35073357820510864, mean loss: 0.3398515190091881
Epoch: 64, step: 1295, loss: 0.3076382577419281, mean loss: 0.3398511752617356
Epoch: 64, step: 1296, loss: 0.3323642611503601, mean loss: 0.3398510953697877
Epoch: 64, step: 1297, loss: 0.3064083755016327, mean loss: 0.3398507385104084
Epoch: 64, step: 1298, loss: 0.3978545069694519, mean loss: 0.33985135744834216
Epoch: 64, step: 1299, loss: 0.3469753563404083, mean loss: 0.33985143346523244
Epoch: 64, step: 1300, loss: 0.32307979464530945, mean loss: 0.3398512545047576
Epoch: 64, step: 1301, loss: 0.4195021688938141, mean loss: 0.3398521044046102
Epoch: 64, step: 1302, loss: 0.3232273459434509, mean loss: 0.33985192701519656
Epoch: 64, step: 1303, loss: 0.324827641248703, mean loss: 0.33985176670484907
Epoch: 64, step: 1304, loss: 0.3455602526664734, mean loss: 0.3398518276142073
Epoch: 64, step: 1305, loss: 0.3188873529434204, mean loss: 0.339851603926336
Epoch: 64, step: 1306, loss: 0.29920515418052673, mean loss: 0.3398511702393035
Epoch: 64, step: 1307, loss: 0.3289264738559723, mean loss: 0.3398510536768821
Epoch: 64, step: 1308, loss: 0.3148055374622345, mean loss: 0.33985078645344957
Epoch: 64, step: 1309, loss: 0.32706719636917114, mean loss: 0.3398506500602387
Epoch: 64, step: 1310, loss: 0.3271435499191284, mean loss: 0.3398505144845759
Epoch: 64, step: 1311, loss: 0.3483223617076874, mean loss: 0.33985060487215724
Epoch: 64, step: 1312, loss: 0.32801997661590576, mean loss: 0.33985047865051554
Epoch: 64, step: 1313, loss: 0.32952335476875305, mean loss: 0.3398503684710225
Epoch: 64, step: 1314, loss: 0.3240457773208618, mean loss: 0.33985019985454396
Epoch: 64, step: 1315, loss: 0.33766162395477295, mean loss: 0.3398501765052513
Epoch: 64, step: 1316, loss: 0.3459085524082184, mean loss: 0.33985024113964796
Epoch: 64, step: 1317, loss: 0.32438981533050537, mean loss: 0.3398500762002897
Epoch: 64, step: 1318, loss: 0.3299906849861145, mean loss: 0.3398499710166207
Epoch: 64, step: 1319, loss: 0.34052056074142456, mean loss: 0.33984997817064605
Epoch: 64, step: 1320, loss: 0.3759065866470337, mean loss: 0.33985036282780895
Epoch: 64, step: 1321, loss: 0.3631580173969269, mean loss: 0.3398506114746178
Epoch: 64, step: 1322, loss: 0.32148051261901855, mean loss: 0.33985041550390277
Epoch: 64, step: 1323, loss: 0.31687313318252563, mean loss: 0.33985017038674553
Epoch: 64, step: 1324, loss: 0.30671262741088867, mean loss: 0.33984981688568433
Epoch: 64, step: 1325, loss: 0.3169655203819275, mean loss: 0.33984957276569006
Epoch: 64, step: 1326, loss: 0.39736372232437134, mean loss: 0.33985018629576225
Epoch: 64, step: 1327, loss: 0.34405288100242615, mean loss: 0.339850231127375
Epoch: 64, step: 1328, loss: 0.3361670672893524, mean loss: 0.33985019183819865
Epoch: 64, step: 1329, loss: 0.30887332558631897, mean loss: 0.33984986140419343
Epoch: 64, step: 1330, loss: 0.347523957490921, mean loss: 0.3398499432638379
Epoch: 64, step: 1331, loss: 0.33048179745674133, mean loss: 0.33984984333481744
Epoch: 64, step: 1332, loss: 0.3491300642490387, mean loss: 0.3398499423248964
Epoch: 64, step: 1333, loss: 0.31803321838378906, mean loss: 0.33984970961317434
Epoch: 64, step: 1334, loss: 0.336424857378006, mean loss: 0.33984967308180686
Epoch: 64, step: 1335, loss: 0.306294322013855, mean loss: 0.33984931516569766
Epoch: 64, step: 1336, loss: 0.2927142083644867, mean loss: 0.3398488124073134
Epoch: 64, step: 1337, loss: 0.3254544734954834, mean loss: 0.3398486588742491
Epoch: 64, step: 1338, loss: 0.3256594240665436, mean loss: 0.3398485075304828
Epoch: 64, step: 1339, loss: 0.3056979179382324, mean loss: 0.3398481432808391
Epoch: 64, step: 1340, loss: 0.3364071249961853, mean loss: 0.33984810657938447
Epoch: 64, step: 1341, loss: 0.30498063564300537, mean loss: 0.3398477346914289
Epoch: 64, step: 1342, loss: 0.30467915534973145, mean loss: 0.3398473595959251
Epoch: 64, step: 1343, loss: 0.3431977927684784, mean loss: 0.3398473953300673
Epoch: 64, step: 1344, loss: 0.3061227798461914, mean loss: 0.33984703564303875
Epoch: 64, step: 1345, loss: 0.3154291808605194, mean loss: 0.3398467752192553
Epoch: 64, step: 1346, loss: 0.29742762446403503, mean loss: 0.3398463228110479
Epoch: 64, step: 1347, loss: 0.3548632860183716, mean loss: 0.33984648296807196
Epoch: 64, step: 1348, loss: 0.34025824069976807, mean loss: 0.33984648735945183
Epoch: 64, step: 1349, loss: 0.3319433331489563, mean loss: 0.33984640307352504
Epoch: 64, step: 1350, loss: 0.3198198080062866, mean loss: 0.33984618949523987
Epoch: 64, step: 1351, loss: 0.3133857548236847, mean loss: 0.3398459073047839
Epoch: 64, step: 1352, loss: 0.3418738543987274, mean loss: 0.3398459289318365
Epoch: 64, step: 1353, loss: 0.3278229832649231, mean loss: 0.33984580071443576
Epoch: 64, step: 1354, loss: 0.3180060386657715, mean loss: 0.3398455678091447
Epoch: 64, step: 1355, loss: 0.3558683693408966, mean loss: 0.33984573867893025
Epoch: 64, step: 1356, loss: 0.3201248049736023, mean loss: 0.3398455283738989
Epoch: 64, step: 1357, loss: 0.353503942489624, mean loss: 0.33984567402636245
Epoch: 64, step: 1358, loss: 0.35303065180778503, mean loss: 0.3398458146286315
Epoch: 64, step: 1359, loss: 0.34564241766929626, mean loss: 0.33984587644192105
Epoch: 64, step: 1360, loss: 0.3978313207626343, mean loss: 0.33984649477524714
Epoch: 64, step: 1361, loss: 0.319011390209198, mean loss: 0.33984627260048794
Epoch: 64, step: 1362, loss: 0.3302839994430542, mean loss: 0.3398461706344491
Epoch: 64, step: 1363, loss: 0.3293989896774292, mean loss: 0.33984605923350053
Epoch: 64, step: 1364, loss: 0.35989126563072205, mean loss: 0.3398462729783571
Epoch: 64, step: 1365, loss: 0.33941778540611267, mean loss: 0.33984626840938253
Epoch: 64, step: 1366, loss: 0.3392813503742218, mean loss: 0.3398462623857105
Epoch: 64, step: 1367, loss: 0.36141473054885864, mean loss: 0.3398464923659647
Epoch: 64, step: 1368, loss: 0.30390459299087524, mean loss: 0.33984610912877994
Epoch: 64, step: 1369, loss: 0.29926732182502747, mean loss: 0.33984567645452896
Epoch: 64, step: 1370, loss: 0.35418882966041565, mean loss: 0.3398458293878055
Epoch: 64, step: 1371, loss: 0.34170001745224, mean loss: 0.3398458491577981
Epoch: 64, step: 1372, loss: 0.29007717967033386, mean loss: 0.3398453185127386
Epoch: 64, step: 1373, loss: 0.3181489408016205, mean loss: 0.33984508718341017
Epoch: 64, step: 1374, loss: 0.32930806279182434, mean loss: 0.3398449748376159
Epoch: 64, step: 1375, loss: 0.352273166179657, mean loss: 0.3398451073456266
Epoch: 64, step: 1376, loss: 0.3699709475040436, mean loss: 0.33984542854060024
Epoch: 64, step: 1377, loss: 0.3259192705154419, mean loss: 0.33984528006459935
Epoch: 64, step: 1378, loss: 0.3379799425601959, mean loss: 0.3398452601772119
Epoch: 64, step: 1379, loss: 0.33377841114997864, mean loss: 0.3398451954958926
Epoch: 64, step: 1380, loss: 0.35349419713020325, mean loss: 0.33984534101229114
Epoch: 64, step: 1381, loss: 0.3849513828754425, mean loss: 0.33984582189719126
Epoch: 64, step: 1382, loss: 0.28679993748664856, mean loss: 0.3398452563700064
Epoch: 64, step: 1383, loss: 0.33974921703338623, mean loss: 0.33984525534613286
Epoch: 64, step: 1384, loss: 0.32194817066192627, mean loss: 0.3398450645476906
Epoch: 64, step: 1385, loss: 0.34538111090660095, mean loss: 0.3398451235661162
Epoch: 64, step: 1386, loss: 0.36008521914482117, mean loss: 0.3398453393384857
Epoch: 64, step: 1387, loss: 0.32868269085884094, mean loss: 0.33984522033877906
Epoch: 64, step: 1388, loss: 0.3339659869670868, mean loss: 0.3398451576637258
Epoch: 64, step: 1389, loss: 0.31627458333969116, mean loss: 0.33984490639435794
Epoch: 64, step: 1390, loss: 0.33749473094940186, mean loss: 0.3398448813410523
Epoch: 64, step: 1391, loss: 0.3230607211589813, mean loss: 0.3398447024207024
Epoch: 64, step: 1392, loss: 0.32475581765174866, mean loss: 0.3398445415738245
Epoch: 64, step: 1393, loss: 0.3671239912509918, mean loss: 0.33984483236851243
Epoch: 64, step: 1394, loss: 0.31746840476989746, mean loss: 0.3398445938418194
Epoch: 64, step: 1395, loss: 0.3293679654598236, mean loss: 0.3398444821649723
Epoch: 64, step: 1396, loss: 0.3060888350009918, mean loss: 0.3398441223465339
Epoch: 64, step: 1397, loss: 0.3389010429382324, mean loss: 0.3398441122938828
Epoch: 64, step: 1398, loss: 0.3556773066520691, mean loss: 0.3398442810642751
Epoch: 64, step: 1399, loss: 0.30956053733825684, mean loss: 0.3398439582649261
Epoch: 64, step: 1400, loss: 0.3140881657600403, mean loss: 0.33984368373267176
Epoch: 64, step: 1401, loss: 0.2989395558834076, mean loss: 0.339843247738216
Epoch: 64, step: 1402, loss: 0.3414559066295624, mean loss: 0.3398432649272597
Epoch: 64, step: 1403, loss: 0.3565741181373596, mean loss: 0.3398434432565414
Epoch: 64, step: 1404, loss: 0.3512149155139923, mean loss: 0.3398435644604537
Epoch: 64, step: 1405, loss: 0.32471734285354614, mean loss: 0.33984340323790885
Epoch: 64, step: 1406, loss: 0.3375242054462433, mean loss: 0.33984337851904683
Epoch: 64, step: 1407, loss: 0.34881117939949036, mean loss: 0.3398434741001442
Epoch: 64, step: 1408, loss: 0.34452804923057556, mean loss: 0.33984352402900253
Epoch: 64, step: 1409, loss: 0.34118854999542236, mean loss: 0.339843538364325
Epoch: 64, step: 1410, loss: 0.3305460214614868, mean loss: 0.33984343927219907
Epoch: 64, step: 1411, loss: 0.37501296401023865, mean loss: 0.3398438141019379
Epoch: 64, step: 1412, loss: 0.3504135310649872, mean loss: 0.3398439267506602
Epoch: 64, step: 1413, loss: 0.3123127818107605, mean loss: 0.3398436333354951
Epoch: 64, step: 1414, loss: 0.34623050689697266, mean loss: 0.3398437014033358
Epoch: 64, step: 1415, loss: 0.31100645661354065, mean loss: 0.339843394074868
Epoch: 64, step: 1416, loss: 0.3262355923652649, mean loss: 0.3398432490533755
Epoch: 64, step: 1417, loss: 0.3336845636367798, mean loss: 0.33984318341953895
Epoch: 64, step: 1418, loss: 0.3203989863395691, mean loss: 0.33984297620264675
Epoch: 64, step: 1419, loss: 0.33728328347206116, mean loss: 0.33984294892428096
Epoch: 64, step: 1420, loss: 0.34997719526290894, mean loss: 0.33984305692268607
Epoch: 64, step: 1421, loss: 0.3045263886451721, mean loss: 0.33984268056483236
Epoch: 64, step: 1422, loss: 0.31558576226234436, mean loss: 0.33984242206976845
Epoch: 64, step: 1423, loss: 0.36086657643318176, mean loss: 0.3398426461123341
Epoch: 64, step: 1424, loss: 0.42236149311065674, mean loss: 0.3398435254598155
Epoch: 64, step: 1425, loss: 0.34119805693626404, mean loss: 0.3398435398939865
Epoch: 64, step: 1426, loss: 0.32732683420181274, mean loss: 0.3398434065147713
Epoch: 64, step: 1427, loss: 0.33642348647117615, mean loss: 0.339843370072164
Epoch: 64, step: 1428, loss: 0.35784631967544556, mean loss: 0.33984356190923154
Epoch: 64, step: 1429, loss: 0.33828601241111755, mean loss: 0.33984354531236544
Epoch: 64, step: 1430, loss: 0.37035173177719116, mean loss: 0.3398438703966672
Epoch: 64, step: 1431, loss: 0.3309193253517151, mean loss: 0.3398437753009268
Epoch: 64, step: 1432, loss: 0.32997775077819824, mean loss: 0.3398436701743456
Epoch: 64, step: 1433, loss: 0.3561224043369293, mean loss: 0.3398438436291582
Epoch: 64, step: 1434, loss: 0.3222435712814331, mean loss: 0.33984365609495665
Epoch: 64, step: 1435, loss: 0.3560299277305603, mean loss: 0.33984382856087786
Epoch: 64, step: 1436, loss: 0.31535306572914124, mean loss: 0.3398435676127693
Epoch: 64, step: 1437, loss: 0.3382239043712616, mean loss: 0.33984355035550545
Epoch: 64, step: 1438, loss: 0.2981317937374115, mean loss: 0.3398431059278605
Epoch: 64, step: 1439, loss: 0.3136952519416809, mean loss: 0.33984282733241655
Epoch: 64, step: 1440, loss: 0.3142300546169281, mean loss: 0.33984255444096767
Epoch: 64, step: 1441, loss: 0.3417276442050934, mean loss: 0.33984257452545447
Epoch: 64, step: 1442, loss: 0.34810101985931396, mean loss: 0.3398426625132376
Epoch: 64, step: 1443, loss: 0.3483200669288635, mean loss: 0.3398427528329096
Valid: 64, mean loss: 0.18453666319449744
Epoch: 65, step: 0, loss: 0.32062387466430664, mean loss: 0.33984254807397707
Epoch: 65, step: 1, loss: 0.3561563193798065, mean loss: 0.3398427218798975
Epoch: 65, step: 2, loss: 0.3282310664653778, mean loss: 0.33984259817134976
Epoch: 65, step: 3, loss: 0.3208811283111572, mean loss: 0.33984239616131545
Epoch: 65, step: 4, loss: 0.34563931822776794, mean loss: 0.33984245791939427
Epoch: 65, step: 5, loss: 0.297643780708313, mean loss: 0.3398420083564299
Epoch: 65, step: 6, loss: 0.30248504877090454, mean loss: 0.33984161037887034
Epoch: 65, step: 7, loss: 0.3524588644504547, mean loss: 0.33984174479373025
Epoch: 65, step: 8, loss: 0.33094552159309387, mean loss: 0.339841650020981
Epoch: 65, step: 9, loss: 0.33736473321914673, mean loss: 0.33984162363431003
Epoch: 65, step: 10, loss: 0.3679187297821045, mean loss: 0.3398419227373999
Epoch: 65, step: 11, loss: 0.3183317482471466, mean loss: 0.33984169359373095
Epoch: 65, step: 12, loss: 0.32786181569099426, mean loss: 0.3398415659758014
Epoch: 65, step: 13, loss: 0.33527636528015137, mean loss: 0.3398415173446501
Epoch: 65, step: 14, loss: 0.3547598421573639, mean loss: 0.3398416762615589
Epoch: 65, step: 15, loss: 0.3124953806400299, mean loss: 0.33984138495924926
Epoch: 65, step: 16, loss: 0.3245554566383362, mean loss: 0.3398412221299266
Epoch: 65, step: 17, loss: 0.29105183482170105, mean loss: 0.3398407024193735
Epoch: 65, step: 18, loss: 0.35046228766441345, mean loss: 0.3398408155606004
Epoch: 65, step: 19, loss: 0.3332635760307312, mean loss: 0.33984074550052873
Epoch: 65, step: 20, loss: 0.3342495262622833, mean loss: 0.33984068594407707
Epoch: 65, step: 21, loss: 0.3533652424812317, mean loss: 0.3398408300031783
Epoch: 65, step: 22, loss: 0.3564981520175934, mean loss: 0.33984100742957085
Epoch: 65, step: 23, loss: 0.3135907053947449, mean loss: 0.33984072782599584
Epoch: 65, step: 24, loss: 0.34095877408981323, mean loss: 0.33984073973467416
Epoch: 65, step: 25, loss: 0.3130144774913788, mean loss: 0.3398404540023792
Epoch: 65, step: 26, loss: 0.340008407831192, mean loss: 0.33984045579127253
Epoch: 65, step: 27, loss: 0.3131803572177887, mean loss: 0.3398401718348716
Epoch: 65, step: 28, loss: 0.3264358341693878, mean loss: 0.33984002906694705
Epoch: 65, step: 29, loss: 0.42572134733200073, mean loss: 0.33984094376838775
Epoch: 65, step: 30, loss: 0.32398781180381775, mean loss: 0.33984077492225806
Epoch: 65, step: 31, loss: 0.3284723162651062, mean loss: 0.33984065384209516
Epoch: 65, step: 32, loss: 0.35911253094673157, mean loss: 0.3398408590957041
Epoch: 65, step: 33, loss: 0.32325050234794617, mean loss: 0.33984068240329834
Epoch: 65, step: 34, loss: 0.34449708461761475, mean loss: 0.33984073199488696
Epoch: 65, step: 35, loss: 0.3300083875656128, mean loss: 0.33984062727962294
Epoch: 65, step: 36, loss: 0.3575989007949829, mean loss: 0.3398408164046591
Epoch: 65, step: 37, loss: 0.3268607556819916, mean loss: 0.33984067816890623
Epoch: 65, step: 38, loss: 0.29002004861831665, mean loss: 0.33984014759212106
Epoch: 65, step: 39, loss: 0.30720654129981995, mean loss: 0.3398398000563778
Epoch: 65, step: 40, loss: 0.34583789110183716, mean loss: 0.3398398639331315
Epoch: 65, step: 41, loss: 0.3436089754104614, mean loss: 0.3398399040719089
Epoch: 65, step: 42, loss: 0.3247740566730499, mean loss: 0.3398397436313756
Epoch: 65, step: 43, loss: 0.3498890697956085, mean loss: 0.3398398506483947
Epoch: 65, step: 44, loss: 0.3695794641971588, mean loss: 0.33984016734733036
Epoch: 65, step: 45, loss: 0.3583870828151703, mean loss: 0.33984036485244684
Epoch: 65, step: 46, loss: 0.32022517919540405, mean loss: 0.3398401559736023
Epoch: 65, step: 47, loss: 0.33030790090560913, mean loss: 0.3398400544672869
Epoch: 65, step: 48, loss: 0.3171364665031433, mean loss: 0.33983981270570957
Epoch: 65, step: 49, loss: 0.3164498209953308, mean loss: 0.339839563637541
Epoch: 65, step: 50, loss: 0.3445110619068146, mean loss: 0.339839613381429
Epoch: 65, step: 51, loss: 0.32098785042762756, mean loss: 0.3398394126428338
Epoch: 65, step: 52, loss: 0.3359466791152954, mean loss: 0.3398393711924113
Epoch: 65, step: 53, loss: 0.3251535892486572, mean loss: 0.3398392148176222
Epoch: 65, step: 54, loss: 0.3228044807910919, mean loss: 0.33983903343302946
Epoch: 65, step: 55, loss: 0.3390783369541168, mean loss: 0.33983902533327565
Epoch: 65, step: 56, loss: 0.37089091539382935, mean loss: 0.3398393559644719
Epoch: 65, step: 57, loss: 0.3288240134716034, mean loss: 0.33983923867766325
Epoch: 65, step: 58, loss: 0.32188326120376587, mean loss: 0.3398390474918811
Epoch: 65, step: 59, loss: 0.30444926023483276, mean loss: 0.3398386706840951
Epoch: 65, step: 60, loss: 0.30857980251312256, mean loss: 0.3398383378632332
Epoch: 65, step: 61, loss: 0.31526607275009155, mean loss: 0.33983807623906515
Epoch: 65, step: 62, loss: 0.3498842418193817, mean loss: 0.3398381832007846
Epoch: 65, step: 63, loss: 0.3294108808040619, mean loss: 0.3398380721822761
Epoch: 65, step: 64, loss: 0.31920215487480164, mean loss: 0.3398378524759433
Epoch: 65, step: 65, loss: 0.30258387327194214, mean loss: 0.33983745584477404
Epoch: 65, step: 66, loss: 0.31887444853782654, mean loss: 0.33983723266073423
Epoch: 65, step: 67, loss: 0.3367435038089752, mean loss: 0.33983719972349663
Epoch: 65, step: 68, loss: 0.32073312997817993, mean loss: 0.33983699633508896
Epoch: 65, step: 69, loss: 0.2973233759403229, mean loss: 0.3398365437254819
Epoch: 65, step: 70, loss: 0.3326758146286011, mean loss: 0.33983646749155383
Epoch: 65, step: 71, loss: 0.31825485825538635, mean loss: 0.33983623773375843
Epoch: 65, step: 72, loss: 0.3704769015312195, mean loss: 0.33983656393076905
Epoch: 65, step: 73, loss: 0.36221256852149963, mean loss: 0.33983680214062484
Epoch: 65, step: 74, loss: 0.3085784316062927, mean loss: 0.33983646937466394
Epoch: 65, step: 75, loss: 0.34601151943206787, mean loss: 0.3398365351114428
Epoch: 65, step: 76, loss: 0.3536703884601593, mean loss: 0.3398366823787959
Epoch: 65, step: 77, loss: 0.3213346302509308, mean loss: 0.33983648541854417
Epoch: 65, step: 78, loss: 0.33630460500717163, mean loss: 0.33983644782094985
Epoch: 65, step: 79, loss: 0.3194633722305298, mean loss: 0.3398362309476734
Epoch: 65, step: 80, loss: 0.32533514499664307, mean loss: 0.3398360765839137
Epoch: 65, step: 81, loss: 0.32057300209999084, mean loss: 0.3398358715310674
Epoch: 65, step: 82, loss: 0.34454965591430664, mean loss: 0.3398359217081363
Epoch: 65, step: 83, loss: 0.35614901781082153, mean loss: 0.3398360953551612
Epoch: 65, step: 84, loss: 0.38279107213020325, mean loss: 0.3398365525905305
Epoch: 65, step: 85, loss: 0.2871725857257843, mean loss: 0.33983599201353026
Epoch: 65, step: 86, loss: 0.3215477764606476, mean loss: 0.3398357973482876
Epoch: 65, step: 87, loss: 0.3474704921245575, mean loss: 0.3398358786134
Epoch: 65, step: 88, loss: 0.3305884897708893, mean loss: 0.3398357801835195
Epoch: 65, step: 89, loss: 0.32245656847953796, mean loss: 0.3398355951998931
Epoch: 65, step: 90, loss: 0.31970903277397156, mean loss: 0.33983538097585686
Epoch: 65, step: 91, loss: 0.3249039351940155, mean loss: 0.3398352220495351
Epoch: 65, step: 92, loss: 0.3546111285686493, mean loss: 0.33983537931866453
Epoch: 65, step: 93, loss: 0.33230358362197876, mean loss: 0.33983529915394883
Epoch: 65, step: 94, loss: 0.3511464297771454, mean loss: 0.33983541954275864
Epoch: 65, step: 95, loss: 0.29321151971817017, mean loss: 0.3398349233115459
Epoch: 65, step: 96, loss: 0.3413099944591522, mean loss: 0.33983493901097384
Epoch: 65, step: 97, loss: 0.3433127999305725, mean loss: 0.3398349760260329
Epoch: 65, step: 98, loss: 0.3251146972179413, mean loss: 0.3398348193589887
Epoch: 65, step: 99, loss: 0.3587322235107422, mean loss: 0.3398350204807868
Epoch: 65, step: 100, loss: 0.3454565405845642, mean loss: 0.3398350803090145
Epoch: 65, step: 101, loss: 0.3300183117389679, mean loss: 0.3398349758330713
Epoch: 65, step: 102, loss: 0.33590471744537354, mean loss: 0.33983493400534776
Epoch: 65, step: 103, loss: 0.31539076566696167, mean loss: 0.3398346738613741
Epoch: 65, step: 104, loss: 0.3763164281845093, mean loss: 0.33983506210970404
Epoch: 65, step: 105, loss: 0.3165842592716217, mean loss: 0.33983481467123866
Epoch: 65, step: 106, loss: 0.32802632451057434, mean loss: 0.339834689004886
Epoch: 65, step: 107, loss: 0.3266947567462921, mean loss: 0.3398345491707695
Epoch: 65, step: 108, loss: 0.30257949233055115, mean loss: 0.33983415270962974
Epoch: 65, step: 109, loss: 0.2983558177947998, mean loss: 0.3398337113098754
Epoch: 65, step: 110, loss: 0.36890798807144165, mean loss: 0.33983402070614405
Epoch: 65, step: 111, loss: 0.3432566523551941, mean loss: 0.3398340571279681
Epoch: 65, step: 112, loss: 0.3721626102924347, mean loss: 0.3398344011475606
Epoch: 65, step: 113, loss: 0.3260148763656616, mean loss: 0.3398342540906642
Epoch: 65, step: 114, loss: 0.30449604988098145, mean loss: 0.33983387805231136
Epoch: 65, step: 115, loss: 0.29033929109573364, mean loss: 0.3398333513796826
Epoch: 65, step: 116, loss: 0.3032626807689667, mean loss: 0.339832962234779
Epoch: 65, step: 117, loss: 0.337197482585907, mean loss: 0.33983293419119803
Epoch: 65, step: 118, loss: 0.31297844648361206, mean loss: 0.33983264844132083
Epoch: 65, step: 119, loss: 0.33949926495552063, mean loss: 0.3398326448939332
Epoch: 65, step: 120, loss: 0.29887476563453674, mean loss: 0.33983220908372413
Epoch: 65, step: 121, loss: 0.33016225695610046, mean loss: 0.33983210619219034
Epoch: 65, step: 122, loss: 0.2966632843017578, mean loss: 0.3398316468663347
Epoch: 65, step: 123, loss: 0.30723893642425537, mean loss: 0.3398313000763445
Epoch: 65, step: 124, loss: 0.36344894766807556, mean loss: 0.33983155136801435
Epoch: 65, step: 125, loss: 0.309683620929718, mean loss: 0.3398312305975758
Epoch: 65, step: 126, loss: 0.3266596794128418, mean loss: 0.33983109045530946
Epoch: 65, step: 127, loss: 0.33554479479789734, mean loss: 0.3398310448505976
Epoch: 65, step: 128, loss: 0.3487379848957062, mean loss: 0.33983113961636857
Epoch: 65, step: 129, loss: 0.32240042090415955, mean loss: 0.33983095416346176
Epoch: 65, step: 130, loss: 0.3194907605648041, mean loss: 0.3398307377577038
Epoch: 65, step: 131, loss: 0.3509172201156616, mean loss: 0.33983085570904387
Epoch: 65, step: 132, loss: 0.32417166233062744, mean loss: 0.3398306891094739
Epoch: 65, step: 133, loss: 0.34128502011299133, mean loss: 0.33983070458206793
Epoch: 65, step: 134, loss: 0.3188396990299225, mean loss: 0.33983048126161947
Epoch: 65, step: 135, loss: 0.29175370931625366, mean loss: 0.3398299697848338
Epoch: 65, step: 136, loss: 0.3428073823451996, mean loss: 0.33983000146044645
Epoch: 65, step: 137, loss: 0.3366488814353943, mean loss: 0.33982996761802403
Epoch: 65, step: 138, loss: 0.3335682153701782, mean loss: 0.33982990100292976
Epoch: 65, step: 139, loss: 0.3519752323627472, mean loss: 0.33983003020858255
Epoch: 65, step: 140, loss: 0.33318445086479187, mean loss: 0.33982995951168204
Epoch: 65, step: 141, loss: 0.34199488162994385, mean loss: 0.3398299825422784
Epoch: 65, step: 142, loss: 0.32812899351119995, mean loss: 0.3398298580676443
Epoch: 65, step: 143, loss: 0.3040163218975067, mean loss: 0.3398294770887905
Epoch: 65, step: 144, loss: 0.3067858815193176, mean loss: 0.3398291255798754
Epoch: 65, step: 145, loss: 0.3519291281700134, mean loss: 0.3398292542950913
Epoch: 65, step: 146, loss: 0.29703494906425476, mean loss: 0.33982879907042474
Epoch: 65, step: 147, loss: 0.33166980743408203, mean loss: 0.3398287122800278
Epoch: 65, step: 148, loss: 0.29668328166007996, mean loss: 0.3398282533300271
Epoch: 65, step: 149, loss: 0.3877561688423157, mean loss: 0.3398287631472328
Epoch: 65, step: 150, loss: 0.351865291595459, mean loss: 0.3398288911804252
Epoch: 65, step: 151, loss: 0.34995603561401367, mean loss: 0.33982899890225254
Epoch: 65, step: 152, loss: 0.3331416845321655, mean loss: 0.3398289277704477
Epoch: 65, step: 153, loss: 0.3204890787601471, mean loss: 0.3398287220580112
Epoch: 65, step: 154, loss: 0.3586549460887909, mean loss: 0.3398289223050359
Epoch: 65, step: 155, loss: 0.33864036202430725, mean loss: 0.33982890966292945
Epoch: 65, step: 156, loss: 0.35917383432388306, mean loss: 0.33982911542278843
Epoch: 65, step: 157, loss: 0.31185978651046753, mean loss: 0.3398288179337022
Epoch: 65, step: 158, loss: 0.3398287296295166, mean loss: 0.339828817932763
Epoch: 65, step: 159, loss: 0.3241342306137085, mean loss: 0.33982865100458476
Epoch: 65, step: 160, loss: 0.3226573169231415, mean loss: 0.3398284683716189
Epoch: 65, step: 161, loss: 0.3088521659374237, mean loss: 0.3398281389135938
Epoch: 65, step: 162, loss: 0.41135844588279724, mean loss: 0.33982889968815927
Epoch: 65, step: 163, loss: 0.3351300060749054, mean loss: 0.33982884971268906
Epoch: 65, step: 164, loss: 0.3676035404205322, mean loss: 0.33982914510955914
Epoch: 65, step: 165, loss: 0.3147146999835968, mean loss: 0.33982887800849
Epoch: 65, step: 166, loss: 0.3377428948879242, mean loss: 0.3398288558235525
Epoch: 65, step: 167, loss: 0.29781773686408997, mean loss: 0.3398284090298425
Epoch: 65, step: 168, loss: 0.31396758556365967, mean loss: 0.33982813399954903
Epoch: 65, step: 169, loss: 0.34756550192832947, mean loss: 0.33982821628571225
Epoch: 65, step: 170, loss: 0.33398663997650146, mean loss: 0.3398281541617711
Epoch: 65, step: 171, loss: 0.3083641529083252, mean loss: 0.3398278195522631
Epoch: 65, step: 172, loss: 0.33304306864738464, mean loss: 0.33982774739939225
Epoch: 65, step: 173, loss: 0.3954416811466217, mean loss: 0.3398283388230661
Epoch: 65, step: 174, loss: 0.31622833013534546, mean loss: 0.3398280878525904
Epoch: 65, step: 175, loss: 0.288055956363678, mean loss: 0.33982753729608556
Epoch: 65, step: 176, loss: 0.31614938378334045, mean loss: 0.3398272854999467
Epoch: 65, step: 177, loss: 0.3362319767475128, mean loss: 0.3398272472674369
Epoch: 65, step: 178, loss: 0.34886276721954346, mean loss: 0.3398273433501255
Epoch: 65, step: 179, loss: 0.3380981385707855, mean loss: 0.3398273249621546
Epoch: 65, step: 180, loss: 0.3243606984615326, mean loss: 0.33982716049531037
Epoch: 65, step: 181, loss: 0.332277774810791, mean loss: 0.33982708021856506
Epoch: 65, step: 182, loss: 0.33096182346343994, mean loss: 0.33982698595044564
Epoch: 65, step: 183, loss: 0.29189687967300415, mean loss: 0.3398264762942605
Epoch: 65, step: 184, loss: 0.27988195419311523, mean loss: 0.3398258388917181
Epoch: 65, step: 185, loss: 0.3277362287044525, mean loss: 0.3398257103417512
Epoch: 65, step: 186, loss: 0.33728092908859253, mean loss: 0.3398256832831395
Epoch: 65, step: 187, loss: 0.30482882261276245, mean loss: 0.3398253111661283
Epoch: 65, step: 188, loss: 0.28999027609825134, mean loss: 0.33982478128239674
Epoch: 65, step: 189, loss: 0.3204464316368103, mean loss: 0.3398245752393383
Epoch: 65, step: 190, loss: 0.3860180377960205, mean loss: 0.3398250663926759
Epoch: 65, step: 191, loss: 0.333484023809433, mean loss: 0.3398249989720726
Epoch: 65, step: 192, loss: 0.2927123010158539, mean loss: 0.3398244980555898
Epoch: 65, step: 193, loss: 0.3067700266838074, mean loss: 0.3398241466141692
Epoch: 65, step: 194, loss: 0.3222389221191406, mean loss: 0.33982395964670875
Epoch: 65, step: 195, loss: 0.35980749130249023, mean loss: 0.33982417211089666
Epoch: 65, step: 196, loss: 0.30524155497550964, mean loss: 0.3398238044336676
Epoch: 65, step: 197, loss: 0.3786134719848633, mean loss: 0.33982421683524483
Epoch: 65, step: 198, loss: 0.33671560883522034, mean loss: 0.33982418378569085
Epoch: 65, step: 199, loss: 0.35497239232063293, mean loss: 0.33982434483404866
Epoch: 65, step: 200, loss: 0.3450290262699127, mean loss: 0.3398244001670925
Epoch: 65, step: 201, loss: 0.3660390377044678, mean loss: 0.3398246788623949
Epoch: 65, step: 202, loss: 0.3596283495426178, mean loss: 0.33982488939863853
Epoch: 65, step: 203, loss: 0.31499791145324707, mean loss: 0.33982462546155373
Epoch: 65, step: 204, loss: 0.3812974691390991, mean loss: 0.33982506635714377
Epoch: 65, step: 205, loss: 0.31195518374443054, mean loss: 0.3398247700770573
Epoch: 65, step: 206, loss: 0.3349115550518036, mean loss: 0.33982471784604085
Epoch: 65, step: 207, loss: 0.3767850399017334, mean loss: 0.33982511075672306
Epoch: 65, step: 208, loss: 0.34909969568252563, mean loss: 0.33982520935014837
Epoch: 65, step: 209, loss: 0.31269970536231995, mean loss: 0.33982492099568906
Epoch: 65, step: 210, loss: 0.32375696301460266, mean loss: 0.33982475018897945
Epoch: 65, step: 211, loss: 0.34258317947387695, mean loss: 0.339824779511512
Epoch: 65, step: 212, loss: 0.3067498803138733, mean loss: 0.3398244279239237
Epoch: 65, step: 213, loss: 0.2870616614818573, mean loss: 0.33982386705942935
Epoch: 65, step: 214, loss: 0.35332199931144714, mean loss: 0.3398240105421001
Epoch: 65, step: 215, loss: 0.34450703859329224, mean loss: 0.3398240603213004
Epoch: 65, step: 216, loss: 0.3211931884288788, mean loss: 0.3398238622827587
Epoch: 65, step: 217, loss: 0.32622072100639343, mean loss: 0.3398237176884723
Epoch: 65, step: 218, loss: 0.3102928102016449, mean loss: 0.3398234037936872
Epoch: 65, step: 219, loss: 0.3422612249851227, mean loss: 0.33982342970590224
Epoch: 65, step: 220, loss: 0.3487999141216278, mean loss: 0.3398235251182003
Epoch: 65, step: 221, loss: 0.32154878973960876, mean loss: 0.3398233308755675
Epoch: 65, step: 222, loss: 0.3365175426006317, mean loss: 0.3398232957386323
Epoch: 65, step: 223, loss: 0.35329964756965637, mean loss: 0.33982343897607786
Epoch: 65, step: 224, loss: 0.35198071599006653, mean loss: 0.3398235681919679
Epoch: 65, step: 225, loss: 0.32689616084098816, mean loss: 0.33982343079206406
Epoch: 65, step: 226, loss: 0.3580305278301239, mean loss: 0.3398236243054829
Epoch: 65, step: 227, loss: 0.36287039518356323, mean loss: 0.33982386925458247
Epoch: 65, step: 228, loss: 0.32851260900497437, mean loss: 0.3398237490358507
Epoch: 65, step: 229, loss: 0.3276130259037018, mean loss: 0.33982361925879545
Epoch: 65, step: 230, loss: 0.2935313582420349, mean loss: 0.3398231272642262
Epoch: 65, step: 231, loss: 0.32589954137802124, mean loss: 0.339822979285802
Epoch: 65, step: 232, loss: 0.3570645749568939, mean loss: 0.33982316252574196
Epoch: 65, step: 233, loss: 0.365803599357605, mean loss: 0.33982343863725634
Epoch: 65, step: 234, loss: 0.32590898871421814, mean loss: 0.3398232907606431
Epoch: 65, step: 235, loss: 0.33479487895965576, mean loss: 0.33982323732147673
Epoch: 65, step: 236, loss: 0.3328593373298645, mean loss: 0.3398231633138039
Epoch: 65, step: 237, loss: 0.3201562166213989, mean loss: 0.3398229543088655
Epoch: 65, step: 238, loss: 0.3595617115497589, mean loss: 0.339823164074721
Epoch: 65, step: 239, loss: 0.31941378116607666, mean loss: 0.3398229471843607
Epoch: 65, step: 240, loss: 0.3620436191558838, mean loss: 0.339823183320767
Epoch: 65, step: 241, loss: 0.3301140367984772, mean loss: 0.33982308014393203
Epoch: 65, step: 242, loss: 0.33573323488235474, mean loss: 0.3398230366825625
Epoch: 65, step: 243, loss: 0.33110955357551575, mean loss: 0.3398229440883783
Epoch: 65, step: 244, loss: 0.3356522023677826, mean loss: 0.33982289976829205
Epoch: 65, step: 245, loss: 0.31851670145988464, mean loss: 0.33982267336191724
Epoch: 65, step: 246, loss: 0.3305412828922272, mean loss: 0.3398225747359864
Epoch: 65, step: 247, loss: 0.3456725776195526, mean loss: 0.33982263689863873
Epoch: 65, step: 248, loss: 0.3166976273059845, mean loss: 0.33982239117283575
Epoch: 65, step: 249, loss: 0.32449793815612793, mean loss: 0.33982222833729203
Epoch: 65, step: 250, loss: 0.32150548696517944, mean loss: 0.33982203370816927
Epoch: 65, step: 251, loss: 0.3147422671318054, mean loss: 0.33982176721966006
Epoch: 65, step: 252, loss: 0.3479562997817993, mean loss: 0.3398218536533362
Epoch: 65, step: 253, loss: 0.35922884941101074, mean loss: 0.33982205986065667
Epoch: 65, step: 254, loss: 0.3088941276073456, mean loss: 0.3398217312421341
Epoch: 65, step: 255, loss: 0.37537890672683716, mean loss: 0.33982210904373517
Epoch: 65, step: 256, loss: 0.34307828545570374, mean loss: 0.3398221436408474
Epoch: 65, step: 257, loss: 0.35174795985221863, mean loss: 0.3398222703521695
Epoch: 65, step: 258, loss: 0.3476322889328003, mean loss: 0.33982235333242405
Epoch: 65, step: 259, loss: 0.3277133107185364, mean loss: 0.3398222246770627
Epoch: 65, step: 260, loss: 0.3336535394191742, mean loss: 0.33982215913711666
Epoch: 65, step: 261, loss: 0.31472525000572205, mean loss: 0.33982189249478933
Epoch: 65, step: 262, loss: 0.3115061819553375, mean loss: 0.339821591657475
Epoch: 65, step: 263, loss: 0.3358801007270813, mean loss: 0.33982154978196044
Epoch: 65, step: 264, loss: 0.34361183643341064, mean loss: 0.33982159005061013
Epoch: 65, step: 265, loss: 0.2937849462032318, mean loss: 0.33982110095467655
Epoch: 65, step: 266, loss: 0.359976202249527, mean loss: 0.33982131508134894
Epoch: 65, step: 267, loss: 0.3348856568336487, mean loss: 0.33982126264574797
Epoch: 65, step: 268, loss: 0.3620246946811676, mean loss: 0.33982149852876
Epoch: 65, step: 269, loss: 0.3143812119960785, mean loss: 0.3398212282611882
Epoch: 65, step: 270, loss: 0.3639785349369049, mean loss: 0.33982148489616154
Epoch: 65, step: 271, loss: 0.3097214698791504, mean loss: 0.33982116513226596
Epoch: 65, step: 272, loss: 0.3581719398498535, mean loss: 0.3398213600774469
Epoch: 65, step: 273, loss: 0.3429665267467499, mean loss: 0.3398213934890375
Epoch: 65, step: 274, loss: 0.32731014490127563, mean loss: 0.33982126058152606
Epoch: 65, step: 275, loss: 0.319955438375473, mean loss: 0.3398210495483166
Epoch: 65, step: 276, loss: 0.3520997166633606, mean loss: 0.3398211799823342
Epoch: 65, step: 277, loss: 0.3147379457950592, mean loss: 0.33982091353059113
Epoch: 65, step: 278, loss: 0.359284907579422, mean loss: 0.33982112028861966
Epoch: 65, step: 279, loss: 0.3016091287136078, mean loss: 0.33982071438261185
Epoch: 65, step: 280, loss: 0.33666712045669556, mean loss: 0.33982068088398826
Epoch: 65, step: 281, loss: 0.31201404333114624, mean loss: 0.339820385514891
Epoch: 65, step: 282, loss: 0.3420298993587494, mean loss: 0.33982040898465343
Epoch: 65, step: 283, loss: 0.29120874404907227, mean loss: 0.3398198926302927
Epoch: 65, step: 284, loss: 0.31364905834198, mean loss: 0.3398196146459676
Epoch: 65, step: 285, loss: 0.38858136534690857, mean loss: 0.3398201325835401
Epoch: 65, step: 286, loss: 0.31908899545669556, mean loss: 0.33981991238388287
Epoch: 65, step: 287, loss: 0.34840500354766846, mean loss: 0.3398200035710686
Epoch: 65, step: 288, loss: 0.35458630323410034, mean loss: 0.3398201604107553
Epoch: 65, step: 289, loss: 0.3333778977394104, mean loss: 0.3398200919852357
Epoch: 65, step: 290, loss: 0.3224584460258484, mean loss: 0.3398199075830949
Epoch: 65, step: 291, loss: 0.32193464040756226, mean loss: 0.3398197176214671
Epoch: 65, step: 292, loss: 0.3098253905773163, mean loss: 0.3398193990514052
Epoch: 65, step: 293, loss: 0.3114158809185028, mean loss: 0.3398190973805454
Epoch: 65, step: 294, loss: 0.33910420536994934, mean loss: 0.33981908978783115
Epoch: 65, step: 295, loss: 0.33022427558898926, mean loss: 0.3398189878844559
Epoch: 65, step: 296, loss: 0.36654573678970337, mean loss: 0.339819271737477
Epoch: 65, step: 297, loss: 0.3094455897808075, mean loss: 0.3398189491554133
Epoch: 65, step: 298, loss: 0.31037482619285583, mean loss: 0.3398186364490022
Epoch: 65, step: 299, loss: 0.3189835250377655, mean loss: 0.3398184151755165
Epoch: 65, step: 300, loss: 0.32931917905807495, mean loss: 0.3398183036724938
Epoch: 65, step: 301, loss: 0.29844874143600464, mean loss: 0.3398178643279362
Epoch: 65, step: 302, loss: 0.2997949421405792, mean loss: 0.3398174392892035
Epoch: 65, step: 303, loss: 0.3505968749523163, mean loss: 0.33981755376432843
Epoch: 65, step: 304, loss: 0.3811730444431305, mean loss: 0.3398179929454539
Epoch: 65, step: 305, loss: 0.3367105722427368, mean loss: 0.33981795994606234
Epoch: 65, step: 306, loss: 0.3320744037628174, mean loss: 0.3398178777138984
Epoch: 65, step: 307, loss: 0.37725695967674255, mean loss: 0.33981827529144026
Epoch: 65, step: 308, loss: 0.29871249198913574, mean loss: 0.33981783878066385
Epoch: 65, step: 309, loss: 0.3288564682006836, mean loss: 0.33981772238084884
Epoch: 65, step: 310, loss: 0.29887253046035767, mean loss: 0.3398172875846598
Epoch: 65, step: 311, loss: 0.37373802065849304, mean loss: 0.33981764778443335
Epoch: 65, step: 312, loss: 0.34968942403793335, mean loss: 0.33981775261040525
Epoch: 65, step: 313, loss: 0.3344087600708008, mean loss: 0.3398176951742494
Epoch: 65, step: 314, loss: 0.310150682926178, mean loss: 0.33981738015420965
Epoch: 65, step: 315, loss: 0.31348729133605957, mean loss: 0.33981710057035797
Epoch: 65, step: 316, loss: 0.30397966504096985, mean loss: 0.33981672003757896
Epoch: 65, step: 317, loss: 0.32774636149406433, mean loss: 0.3398165918722055
Epoch: 65, step: 318, loss: 0.3340001106262207, mean loss: 0.33981653011235197
Epoch: 65, step: 319, loss: 0.3895561993122101, mean loss: 0.33981705824644837
Epoch: 65, step: 320, loss: 0.3147905468940735, mean loss: 0.3398167925186333
Epoch: 65, step: 321, loss: 0.3157346248626709, mean loss: 0.33981653682043556
Epoch: 65, step: 322, loss: 0.27720898389816284, mean loss: 0.33981587207676717
Epoch: 65, step: 323, loss: 0.3025873005390167, mean loss: 0.33981547680186336
Epoch: 65, step: 324, loss: 0.41653478145599365, mean loss: 0.33981629136155606
Epoch: 65, step: 325, loss: 0.3233150839805603, mean loss: 0.33981611616346524
Epoch: 65, step: 326, loss: 0.30239129066467285, mean loss: 0.3398157188174886
Epoch: 65, step: 327, loss: 0.3091171979904175, mean loss: 0.33981539288933615
Epoch: 65, step: 328, loss: 0.35280653834342957, mean loss: 0.3398155308156912
Epoch: 65, step: 329, loss: 0.31764787435531616, mean loss: 0.33981529546526695
Epoch: 65, step: 330, loss: 0.3879694938659668, mean loss: 0.33981580670517736
Epoch: 65, step: 331, loss: 0.3313254415988922, mean loss: 0.33981571656625786
Epoch: 65, step: 332, loss: 0.30409619212150574, mean loss: 0.3398153373499207
Epoch: 65, step: 333, loss: 0.3396048843860626, mean loss: 0.33981533511567047
Epoch: 65, step: 334, loss: 0.3213750422000885, mean loss: 0.3398151393484544
Epoch: 65, step: 335, loss: 0.3706652820110321, mean loss: 0.33981546685856806
Epoch: 65, step: 336, loss: 0.3407870829105377, mean loss: 0.339815477173292
Epoch: 65, step: 337, loss: 0.32862550020217896, mean loss: 0.33981535838120547
Epoch: 65, step: 338, loss: 0.3432759940624237, mean loss: 0.3398153951187046
Epoch: 65, step: 339, loss: 0.33043596148490906, mean loss: 0.3398152955493455
Epoch: 65, step: 340, loss: 0.3677784502506256, mean loss: 0.3398155923949703
Epoch: 65, step: 341, loss: 0.3274174928665161, mean loss: 0.3398154607831199
Epoch: 65, step: 342, loss: 0.31659749150276184, mean loss: 0.33981521431571143
Epoch: 65, step: 343, loss: 0.33516764640808105, mean loss: 0.3398151649805674
Epoch: 65, step: 344, loss: 0.33770403265953064, mean loss: 0.33981514257058576
Epoch: 65, step: 345, loss: 0.32898297905921936, mean loss: 0.3398150275867895
Epoch: 65, step: 346, loss: 0.3336661458015442, mean loss: 0.3398149623168861
Epoch: 65, step: 347, loss: 0.3176804482936859, mean loss: 0.33981472736323015
Epoch: 65, step: 348, loss: 0.35374683141708374, mean loss: 0.3398148752482948
Epoch: 65, step: 349, loss: 0.2879304885864258, mean loss: 0.3398143245170915
Epoch: 65, step: 350, loss: 0.3124980032444, mean loss: 0.33981403456877046
Epoch: 65, step: 351, loss: 0.3510249853134155, mean loss: 0.33981415356582756
Epoch: 65, step: 352, loss: 0.35599589347839355, mean loss: 0.33981432532280287
Epoch: 65, step: 353, loss: 0.31665265560150146, mean loss: 0.33981407948174186
Epoch: 65, step: 354, loss: 0.35867759585380554, mean loss: 0.33981427969950306
Epoch: 65, step: 355, loss: 0.3000335693359375, mean loss: 0.33981385747068454
Epoch: 65, step: 356, loss: 0.3460862636566162, mean loss: 0.33981392404472305
Epoch: 65, step: 357, loss: 0.3046238124370575, mean loss: 0.3398135505480281
Epoch: 65, step: 358, loss: 0.33863601088523865, mean loss: 0.3398135380501279
Epoch: 65, step: 359, loss: 0.3416695296764374, mean loss: 0.33981355774861677
Epoch: 65, step: 360, loss: 0.32585233449935913, mean loss: 0.3398134095733347
Epoch: 65, step: 361, loss: 0.3197394907474518, mean loss: 0.3398131965241655
Epoch: 65, step: 362, loss: 0.3405167758464813, mean loss: 0.3398132039913372
Epoch: 65, step: 363, loss: 0.3386191129684448, mean loss: 0.33981319131844046
Epoch: 65, step: 364, loss: 0.3448817729949951, mean loss: 0.3398132451107639
Epoch: 65, step: 365, loss: 0.3066042959690094, mean loss: 0.33981289267142506
Epoch: 65, step: 366, loss: 0.34556806087493896, mean loss: 0.33981295374912257
Epoch: 65, step: 367, loss: 0.3547818660736084, mean loss: 0.3398131126075545
Epoch: 65, step: 368, loss: 0.3174467086791992, mean loss: 0.3398128752453419
Epoch: 65, step: 369, loss: 0.36894339323043823, mean loss: 0.3398131843880564
Epoch: 65, step: 370, loss: 0.29509082436561584, mean loss: 0.3398127097845817
Epoch: 65, step: 371, loss: 0.33805468678474426, mean loss: 0.3398126911282548
Epoch: 65, step: 372, loss: 0.3041779100894928, mean loss: 0.3398123129721838
Epoch: 65, step: 373, loss: 0.34725213050842285, mean loss: 0.3398123919226426
Epoch: 65, step: 374, loss: 0.3112684190273285, mean loss: 0.33981208902061155
Epoch: 65, step: 375, loss: 0.3133735954761505, mean loss: 0.33981180846441705
Epoch: 65, step: 376, loss: 0.30459049344062805, mean loss: 0.33981143471190983
Epoch: 65, step: 377, loss: 0.3111593425273895, mean loss: 0.33981113067222113
Epoch: 65, step: 378, loss: 0.2986859679222107, mean loss: 0.33981069428004007
Epoch: 65, step: 379, loss: 0.3659525513648987, mean loss: 0.33981097167665597
Epoch: 65, step: 380, loss: 0.3234626054763794, mean loss: 0.3398107982026245
Epoch: 65, step: 381, loss: 0.3123762011528015, mean loss: 0.33981050709465727
Epoch: 65, step: 382, loss: 0.3768962621688843, mean loss: 0.3398109006066961
Epoch: 65, step: 383, loss: 0.3234439790248871, mean loss: 0.3398107269413001
Epoch: 65, step: 384, loss: 0.344607949256897, mean loss: 0.33981077784291097
Epoch: 65, step: 385, loss: 0.32734888792037964, mean loss: 0.33981064561565544
Epoch: 65, step: 386, loss: 0.34482085704803467, mean loss: 0.33981069877608955
Epoch: 65, step: 387, loss: 0.3326149880886078, mean loss: 0.3398106224274064
Epoch: 65, step: 388, loss: 0.3429550230503082, mean loss: 0.3398106557901012
Epoch: 65, step: 389, loss: 0.38414764404296875, mean loss: 0.3398111262090747
Epoch: 65, step: 390, loss: 0.305854856967926, mean loss: 0.3398107659341785
Epoch: 65, step: 391, loss: 0.30708420276641846, mean loss: 0.33981041871010725
Epoch: 65, step: 392, loss: 0.3703419268131256, mean loss: 0.339810742641527
Epoch: 65, step: 393, loss: 0.3112432658672333, mean loss: 0.3398104395511884
Epoch: 65, step: 394, loss: 0.31758689880371094, mean loss: 0.3398102037701609
Epoch: 65, step: 395, loss: 0.3878893554210663, mean loss: 0.33981071386131323
Epoch: 65, step: 396, loss: 0.3473784625530243, mean loss: 0.339810794149766
Epoch: 65, step: 397, loss: 0.3769601881504059, mean loss: 0.339811188274339
Epoch: 65, step: 398, loss: 0.32378390431404114, mean loss: 0.3398110182398175
Epoch: 65, step: 399, loss: 0.363694429397583, mean loss: 0.3398112716178268
Epoch: 65, step: 400, loss: 0.3942132890224457, mean loss: 0.33981184876020176
Epoch: 65, step: 401, loss: 0.3386692702770233, mean loss: 0.3398118366388964
Epoch: 65, step: 402, loss: 0.32831183075904846, mean loss: 0.33981171463974635
Epoch: 65, step: 403, loss: 0.30572062730789185, mean loss: 0.33981135298431764
Epoch: 65, step: 404, loss: 0.33975130319595337, mean loss: 0.339811352347286
Epoch: 65, step: 405, loss: 0.35746946930885315, mean loss: 0.33981153966951205
Epoch: 65, step: 406, loss: 0.2913200855255127, mean loss: 0.33981102526410883
Epoch: 65, step: 407, loss: 0.34395989775657654, mean loss: 0.33981106927557075
Epoch: 65, step: 408, loss: 0.3160287141799927, mean loss: 0.33981081699374854
Epoch: 65, step: 409, loss: 0.298607736825943, mean loss: 0.33981037991853724
Epoch: 65, step: 410, loss: 0.3318589925765991, mean loss: 0.3398102955724781
Epoch: 65, step: 411, loss: 0.38013848662376404, mean loss: 0.3398107233579399
Epoch: 65, step: 412, loss: 0.2976786196231842, mean loss: 0.33981027644202827
Epoch: 65, step: 413, loss: 0.34731051325798035, mean loss: 0.33981035599987897
Epoch: 65, step: 414, loss: 0.32815274596214294, mean loss: 0.33981023234450863
Epoch: 65, step: 415, loss: 0.327682763338089, mean loss: 0.33981010370658377
Epoch: 65, step: 416, loss: 0.329528272151947, mean loss: 0.33980999464677536
Epoch: 65, step: 417, loss: 0.36569324135780334, mean loss: 0.33981026918852114
Epoch: 65, step: 418, loss: 0.3430774211883545, mean loss: 0.339810303842601
Epoch: 65, step: 419, loss: 0.3050650656223297, mean loss: 0.3398099353101634
Epoch: 65, step: 420, loss: 0.3518344461917877, mean loss: 0.33981006284923154
Epoch: 65, step: 421, loss: 0.2852066159248352, mean loss: 0.33980948369894914
Epoch: 65, step: 422, loss: 0.3268359303474426, mean loss: 0.3398093460966947
Epoch: 65, step: 423, loss: 0.34666430950164795, mean loss: 0.33980941880217397
Epoch: 65, step: 424, loss: 0.39355888962745667, mean loss: 0.3398099888766378
Epoch: 65, step: 425, loss: 0.3413899540901184, mean loss: 0.3398100056337939
Epoch: 65, step: 426, loss: 0.32824569940567017, mean loss: 0.33980988298373366
Epoch: 65, step: 427, loss: 0.3758445382118225, mean loss: 0.339810265160206
Epoch: 65, step: 428, loss: 0.32055485248565674, mean loss: 0.33981006094324884
Epoch: 65, step: 429, loss: 0.35108864307403564, mean loss: 0.33981018055913736
Epoch: 65, step: 430, loss: 0.3346591889858246, mean loss: 0.33981012593047105
Epoch: 65, step: 431, loss: 0.32536810636520386, mean loss: 0.3398099727677471
Epoch: 65, step: 432, loss: 0.30634620785713196, mean loss: 0.33980961787645175
Epoch: 65, step: 433, loss: 0.33200210332870483, mean loss: 0.3398095350767556
Epoch: 65, step: 434, loss: 0.3383448123931885, mean loss: 0.33980951954334787
Epoch: 65, step: 435, loss: 0.320173442363739, mean loss: 0.3398093113046402
Epoch: 65, step: 436, loss: 0.29142817854881287, mean loss: 0.33980879823282717
Epoch: 65, step: 437, loss: 0.35605505108833313, mean loss: 0.3398089705191201
Epoch: 65, step: 438, loss: 0.32647639513015747, mean loss: 0.33980882913294014
Epoch: 65, step: 439, loss: 0.3278205990791321, mean loss: 0.3398087020043075
Epoch: 65, step: 440, loss: 0.35140132904052734, mean loss: 0.3398088249364825
Epoch: 65, step: 441, loss: 0.3322145342826843, mean loss: 0.33980874440488557
Epoch: 65, step: 442, loss: 0.3423309922218323, mean loss: 0.3398087711510953
Epoch: 65, step: 443, loss: 0.36377352476119995, mean loss: 0.3398090252734402
Epoch: 65, step: 444, loss: 0.3274245858192444, mean loss: 0.3398088939501864
Epoch: 65, step: 445, loss: 0.369986891746521, mean loss: 0.3398092139510113
Epoch: 65, step: 446, loss: 0.32494622468948364, mean loss: 0.3398090563488263
Epoch: 65, step: 447, loss: 0.31222406029701233, mean loss: 0.3398087638498225
Epoch: 65, step: 448, loss: 0.3238948583602905, mean loss: 0.3398085951076506
Epoch: 65, step: 449, loss: 0.35583195090293884, mean loss: 0.33980876500857093
Epoch: 65, step: 450, loss: 0.3329637050628662, mean loss: 0.3398086924289148
Epoch: 65, step: 451, loss: 0.30555927753448486, mean loss: 0.33980832927878657
Epoch: 65, step: 452, loss: 0.3555404245853424, mean loss: 0.33980849608606983
Epoch: 65, step: 453, loss: 0.34823375940322876, mean loss: 0.3398085854181236
Epoch: 65, step: 454, loss: 0.3373105525970459, mean loss: 0.3398085589320628
Epoch: 65, step: 455, loss: 0.3317340910434723, mean loss: 0.33980847332126624
Epoch: 65, step: 456, loss: 0.3089909851551056, mean loss: 0.33980814657753855
Epoch: 65, step: 457, loss: 0.30318567156791687, mean loss: 0.339807758290308
Epoch: 65, step: 458, loss: 0.36692917346954346, mean loss: 0.3398080458401673
Epoch: 65, step: 459, loss: 0.3314257860183716, mean loss: 0.33980795696972815
Epoch: 65, step: 460, loss: 0.3131072521209717, mean loss: 0.3398076738863761
Epoch: 65, step: 461, loss: 0.32660964131355286, mean loss: 0.3398075339610928
Epoch: 65, step: 462, loss: 0.3058865964412689, mean loss: 0.3398071743357891
Epoch: 65, step: 463, loss: 0.40151137113571167, mean loss: 0.3398078285086062
Epoch: 65, step: 464, loss: 0.3113778829574585, mean loss: 0.3398075271044657
Epoch: 65, step: 465, loss: 0.30972421169281006, mean loss: 0.339807208175269
Epoch: 65, step: 466, loss: 0.31624147295951843, mean loss: 0.3398069583450484
Epoch: 65, step: 467, loss: 0.3341693580150604, mean loss: 0.3398068985791218
Epoch: 65, step: 468, loss: 0.30658432841300964, mean loss: 0.3398065463802204
Epoch: 65, step: 469, loss: 0.38378944993019104, mean loss: 0.3398070126465572
Epoch: 65, step: 470, loss: 0.3215920329093933, mean loss: 0.339806819550123
Epoch: 65, step: 471, loss: 0.36415284872055054, mean loss: 0.3398070776388858
Epoch: 65, step: 472, loss: 0.2912403345108032, mean loss: 0.3398065627952666
Epoch: 65, step: 473, loss: 0.3730141818523407, mean loss: 0.3398069148170091
Epoch: 65, step: 474, loss: 0.4561903178691864, mean loss: 0.33980814854153396
Epoch: 65, step: 475, loss: 0.3339175581932068, mean loss: 0.33980808609887847
Epoch: 65, step: 476, loss: 0.33870729804039, mean loss: 0.33980807443020067
Epoch: 65, step: 477, loss: 0.36454376578330994, mean loss: 0.3398083366330389
Epoch: 65, step: 478, loss: 0.34039124846458435, mean loss: 0.3398083428119451
Epoch: 65, step: 479, loss: 0.34455347061157227, mean loss: 0.3398083931100986
Epoch: 65, step: 480, loss: 0.3413698673248291, mean loss: 0.3398084096614836
Epoch: 65, step: 481, loss: 0.34028470516204834, mean loss: 0.3398084147100887
Epoch: 65, step: 482, loss: 0.3341233432292938, mean loss: 0.3398083544504883
Epoch: 65, step: 483, loss: 0.37283551692962646, mean loss: 0.33980870452216727
Epoch: 65, step: 484, loss: 0.3142583668231964, mean loss: 0.3398084337040243
Epoch: 65, step: 485, loss: 0.31413277983665466, mean loss: 0.3398081615604902
Epoch: 65, step: 486, loss: 0.3125610649585724, mean loss: 0.3398078727638501
Epoch: 65, step: 487, loss: 0.3439251482486725, mean loss: 0.3398079164030951
Epoch: 65, step: 488, loss: 0.3357824385166168, mean loss: 0.3398078737372705
Epoch: 65, step: 489, loss: 0.32741647958755493, mean loss: 0.3398077424029393
Epoch: 65, step: 490, loss: 0.32458439469337463, mean loss: 0.33980758105491216
Epoch: 65, step: 491, loss: 0.33010709285736084, mean loss: 0.33980747824322616
Epoch: 65, step: 492, loss: 0.30200886726379395, mean loss: 0.33980707763475604
Epoch: 65, step: 493, loss: 0.3165470361709595, mean loss: 0.339806831115886
Epoch: 65, step: 494, loss: 0.31345340609550476, mean loss: 0.3398065518151068
Epoch: 65, step: 495, loss: 0.3383772075176239, mean loss: 0.33980653666668703
Epoch: 65, step: 496, loss: 0.3323214054107666, mean loss: 0.3398064573389079
Epoch: 65, step: 497, loss: 0.3214218020439148, mean loss: 0.3398062624995165
Epoch: 65, step: 498, loss: 0.3361908197402954, mean loss: 0.33980622418369333
Epoch: 65, step: 499, loss: 0.3518011271953583, mean loss: 0.33980635130220765
Epoch: 65, step: 500, loss: 0.31522318720817566, mean loss: 0.33980609077970264
Epoch: 65, step: 501, loss: 0.3022176921367645, mean loss: 0.33980569243716385
Epoch: 65, step: 502, loss: 0.3294895589351654, mean loss: 0.3398055831132392
Epoch: 65, step: 503, loss: 0.32618793845176697, mean loss: 0.33980543880349545
Epoch: 65, step: 504, loss: 0.31068742275238037, mean loss: 0.3398051302355301
Epoch: 65, step: 505, loss: 0.34994781017303467, mean loss: 0.3398052377178854
Epoch: 65, step: 506, loss: 0.3399200141429901, mean loss: 0.33980523893416253
Epoch: 65, step: 507, loss: 0.30222734808921814, mean loss: 0.3398048407282999
Epoch: 65, step: 508, loss: 0.29662013053894043, mean loss: 0.33980438311287336
Epoch: 65, step: 509, loss: 0.32834696769714355, mean loss: 0.3398042617033638
Epoch: 65, step: 510, loss: 0.35492998361587524, mean loss: 0.33980442198270716
Epoch: 65, step: 511, loss: 0.310427725315094, mean loss: 0.3398041106965559
Epoch: 65, step: 512, loss: 0.38314691185951233, mean loss: 0.3398045699677581
Epoch: 65, step: 513, loss: 0.3594946563243866, mean loss: 0.3398047786066455
Epoch: 65, step: 514, loss: 0.3161635398864746, mean loss: 0.33980452810345374
Epoch: 65, step: 515, loss: 0.3144693374633789, mean loss: 0.33980425965394706
Epoch: 65, step: 516, loss: 0.3161323666572571, mean loss: 0.3398040088312572
Epoch: 65, step: 517, loss: 0.30877503752708435, mean loss: 0.3398036800579064
Epoch: 65, step: 518, loss: 0.32752588391304016, mean loss: 0.33980354996756695
Epoch: 65, step: 519, loss: 0.3846641182899475, mean loss: 0.33980402528615483
Epoch: 65, step: 520, loss: 0.30133309960365295, mean loss: 0.33980361767312167
Epoch: 65, step: 521, loss: 0.3311386704444885, mean loss: 0.33980352586592083
Epoch: 65, step: 522, loss: 0.3231789469718933, mean loss: 0.3398033497263735
Epoch: 65, step: 523, loss: 0.33611395955085754, mean loss: 0.3398033106372252
Epoch: 65, step: 524, loss: 0.3248814046382904, mean loss: 0.33980315254106586
Epoch: 65, step: 525, loss: 0.35580140352249146, mean loss: 0.339803322039201
Epoch: 65, step: 526, loss: 0.3142760097980499, mean loss: 0.3398030515855131
Epoch: 65, step: 527, loss: 0.32757729291915894, mean loss: 0.3398029220588925
Epoch: 65, step: 528, loss: 0.33010369539260864, mean loss: 0.3398028193008734
Epoch: 65, step: 529, loss: 0.3240978419780731, mean loss: 0.3398026529169628
Epoch: 65, step: 530, loss: 0.3240232467651367, mean loss: 0.33980248574629873
Epoch: 65, step: 531, loss: 0.3109027147293091, mean loss: 0.3398021795787102
Epoch: 65, step: 532, loss: 0.33979687094688416, mean loss: 0.3398021795224705
Epoch: 65, step: 533, loss: 0.31726211309432983, mean loss: 0.3398019407354032
Epoch: 65, step: 534, loss: 0.32196587324142456, mean loss: 0.33980175178400224
Epoch: 65, step: 535, loss: 0.34344956278800964, mean loss: 0.3398017904277054
Epoch: 65, step: 536, loss: 0.3163228929042816, mean loss: 0.33980154170266624
Epoch: 65, step: 537, loss: 0.41377171874046326, mean loss: 0.3398023253016518
Epoch: 65, step: 538, loss: 0.31554514169692993, mean loss: 0.33980206833723897
Epoch: 65, step: 539, loss: 0.3510679006576538, mean loss: 0.33980218767868303
Epoch: 65, step: 540, loss: 0.3321029841899872, mean loss: 0.339802106120188
Epoch: 65, step: 541, loss: 0.3690929412841797, mean loss: 0.33980241639788517
Epoch: 65, step: 542, loss: 0.3184072971343994, mean loss: 0.33980218976187504
Epoch: 65, step: 543, loss: 0.3235422670841217, mean loss: 0.3398020175242296
Epoch: 65, step: 544, loss: 0.3246926963329315, mean loss: 0.3398018574763382
Epoch: 65, step: 545, loss: 0.33685383200645447, mean loss: 0.3398018262492396
Epoch: 65, step: 546, loss: 0.3282630145549774, mean loss: 0.3398017040251281
Epoch: 65, step: 547, loss: 0.337588906288147, mean loss: 0.33980168058646043
Epoch: 65, step: 548, loss: 0.3410683870315552, mean loss: 0.3398016940036817
Epoch: 65, step: 549, loss: 0.2955975830554962, mean loss: 0.33980122578939354
Epoch: 65, step: 550, loss: 0.3318907916545868, mean loss: 0.3398011420021851
Epoch: 65, step: 551, loss: 0.3260173499584198, mean loss: 0.3398009960059977
Epoch: 65, step: 552, loss: 0.3518466651439667, mean loss: 0.33980112359085507
Epoch: 65, step: 553, loss: 0.3429437279701233, mean loss: 0.3398011568762193
Epoch: 65, step: 554, loss: 0.3567314147949219, mean loss: 0.3398013361936786
Epoch: 65, step: 555, loss: 0.31166619062423706, mean loss: 0.33980103820238927
Epoch: 65, step: 556, loss: 0.32039543986320496, mean loss: 0.3398008326716232
Epoch: 65, step: 557, loss: 0.35100194811820984, mean loss: 0.3398009513048864
Epoch: 65, step: 558, loss: 0.36852434277534485, mean loss: 0.339801255516872
Epoch: 65, step: 559, loss: 0.3595178425312042, mean loss: 0.33980146433478153
Epoch: 65, step: 560, loss: 0.3218090236186981, mean loss: 0.3398012737792831
Epoch: 65, step: 561, loss: 0.30167776346206665, mean loss: 0.33980087002263404
Epoch: 65, step: 562, loss: 0.34332510828971863, mean loss: 0.33980090734657276
Epoch: 65, step: 563, loss: 0.3444279730319977, mean loss: 0.3398009563496407
Epoch: 65, step: 564, loss: 0.3060705363750458, mean loss: 0.33980059913047234
Epoch: 65, step: 565, loss: 0.3264928460121155, mean loss: 0.3398004581973277
Epoch: 65, step: 566, loss: 0.3432866632938385, mean loss: 0.3398004951169068
Epoch: 65, step: 567, loss: 0.3337417244911194, mean loss: 0.33980043095404594
Epoch: 65, step: 568, loss: 0.32827410101890564, mean loss: 0.33980030889059154
Epoch: 65, step: 569, loss: 0.3422357141971588, mean loss: 0.3398003346811804
Epoch: 65, step: 570, loss: 0.35284602642059326, mean loss: 0.3398004728317003
Epoch: 65, step: 571, loss: 0.31801220774650574, mean loss: 0.33980024210202087
Epoch: 65, step: 572, loss: 0.3100804388523102, mean loss: 0.3397999273836147
Epoch: 65, step: 573, loss: 0.3101654052734375, mean loss: 0.33979961357161786
Epoch: 65, step: 574, loss: 0.33124852180480957, mean loss: 0.3397995230215912
Epoch: 65, step: 575, loss: 0.31334254145622253, mean loss: 0.3397992428637958
Epoch: 65, step: 576, loss: 0.33767110109329224, mean loss: 0.3397992203287537
Epoch: 65, step: 577, loss: 0.33075129985809326, mean loss: 0.3397991245207053
Epoch: 65, step: 578, loss: 0.2863123118877411, mean loss: 0.3397985581570988
Epoch: 65, step: 579, loss: 0.36075639724731445, mean loss: 0.3397987800740735
Epoch: 65, step: 580, loss: 0.30337539315223694, mean loss: 0.3397983944006168
Epoch: 65, step: 581, loss: 0.2889905273914337, mean loss: 0.33979785642104193
Epoch: 65, step: 582, loss: 0.35093870759010315, mean loss: 0.33979797438479964
Epoch: 65, step: 583, loss: 0.3931923806667328, mean loss: 0.33979853973999724
Epoch: 65, step: 584, loss: 0.3400532305240631, mean loss: 0.3397985424367073
Epoch: 65, step: 585, loss: 0.3643825054168701, mean loss: 0.33979880273320456
Epoch: 65, step: 586, loss: 0.3600224554538727, mean loss: 0.33979901686020403
Epoch: 65, step: 587, loss: 0.3371364176273346, mean loss: 0.3397989886690382
Epoch: 65, step: 588, loss: 0.2989792227745056, mean loss: 0.339798556480599
Epoch: 65, step: 589, loss: 0.2986499071121216, mean loss: 0.33979812081464483
Epoch: 65, step: 590, loss: 0.31598323583602905, mean loss: 0.33979786867454065
Epoch: 65, step: 591, loss: 0.3713880479335785, mean loss: 0.339798203132035
Epoch: 65, step: 592, loss: 0.33688101172447205, mean loss: 0.3397981722469238
Epoch: 65, step: 593, loss: 0.330976665019989, mean loss: 0.339798078852179
Epoch: 65, step: 594, loss: 0.31318214535713196, mean loss: 0.33979779706790614
Epoch: 65, step: 595, loss: 0.363230437040329, mean loss: 0.33979804514785844
Epoch: 65, step: 596, loss: 0.3723450303077698, mean loss: 0.33979838971718795
Epoch: 65, step: 597, loss: 0.34033674001693726, mean loss: 0.33979839541654955
Epoch: 65, step: 598, loss: 0.3051047921180725, mean loss: 0.3397980281291201
Epoch: 65, step: 599, loss: 0.30054759979248047, mean loss: 0.33979761260478875
Epoch: 65, step: 600, loss: 0.382302850484848, mean loss: 0.3397980625813704
Epoch: 65, step: 601, loss: 0.3305722773075104, mean loss: 0.3397979649147397
Epoch: 65, step: 602, loss: 0.37533038854599, mean loss: 0.3397983410664989
Epoch: 65, step: 603, loss: 0.3216462731361389, mean loss: 0.3397981489079207
Epoch: 65, step: 604, loss: 0.324920117855072, mean loss: 0.33979799141010614
Epoch: 65, step: 605, loss: 0.36979037523269653, mean loss: 0.33979830890405976
Epoch: 65, step: 606, loss: 0.34881192445755005, mean loss: 0.3397984043195546
Epoch: 65, step: 607, loss: 0.3592534363269806, mean loss: 0.3397986102626465
Epoch: 65, step: 608, loss: 0.3111211061477661, mean loss: 0.33979830669741223
Epoch: 65, step: 609, loss: 0.3097425401210785, mean loss: 0.3397979885459718
Epoch: 65, step: 610, loss: 0.3233610689640045, mean loss: 0.3397978145569214
Epoch: 65, step: 611, loss: 0.3254321813583374, mean loss: 0.3397976624945833
Epoch: 65, step: 612, loss: 0.34737318754196167, mean loss: 0.33979774268178015
Epoch: 65, step: 613, loss: 0.34017783403396606, mean loss: 0.3397977467050178
Epoch: 65, step: 614, loss: 0.34026646614074707, mean loss: 0.3397977516663243
Epoch: 65, step: 615, loss: 0.3552230894565582, mean loss: 0.33979791493887807
Epoch: 65, step: 616, loss: 0.29980888962745667, mean loss: 0.33979749167157164
Epoch: 65, step: 617, loss: 0.33955273032188416, mean loss: 0.33979748908090135
Epoch: 65, step: 618, loss: 0.3173484206199646, mean loss: 0.33979725147181933
Epoch: 65, step: 619, loss: 0.3094380497932434, mean loss: 0.3397969301424197
Epoch: 65, step: 620, loss: 0.31637492775917053, mean loss: 0.3397966822406999
Epoch: 65, step: 621, loss: 0.3086784780025482, mean loss: 0.3397963528847989
Epoch: 65, step: 622, loss: 0.38429683446884155, mean loss: 0.3397968238740942
Epoch: 65, step: 623, loss: 0.31709298491477966, mean loss: 0.33979658358114556
Epoch: 65, step: 624, loss: 0.3166412115097046, mean loss: 0.33979633851185337
Epoch: 65, step: 625, loss: 0.34138861298561096, mean loss: 0.3397963553638153
Epoch: 65, step: 626, loss: 0.32921072840690613, mean loss: 0.3397962433311869
Epoch: 65, step: 627, loss: 0.30413833260536194, mean loss: 0.33979586595087696
Epoch: 65, step: 628, loss: 0.35718438029289246, mean loss: 0.3397960499777409
Epoch: 65, step: 629, loss: 0.34185004234313965, mean loss: 0.3397960717154101
Epoch: 65, step: 630, loss: 0.33434489369392395, mean loss: 0.3397960140254923
Epoch: 65, step: 631, loss: 0.3204587399959564, mean loss: 0.3397958093809295
Epoch: 65, step: 632, loss: 0.35200372338294983, mean loss: 0.3397959385747746
Epoch: 65, step: 633, loss: 0.34872564673423767, mean loss: 0.33979603307504086
Epoch: 65, step: 634, loss: 0.33199813961982727, mean loss: 0.33979595055328354
Epoch: 65, step: 635, loss: 0.3158770501613617, mean loss: 0.33979569743251237
Epoch: 65, step: 636, loss: 0.3126920759677887, mean loss: 0.3397954106125978
Epoch: 65, step: 637, loss: 0.37260517477989197, mean loss: 0.3397957578132176
Epoch: 65, step: 638, loss: 0.323244571685791, mean loss: 0.3397955826665374
Epoch: 65, step: 639, loss: 0.34859034419059753, mean loss: 0.33979567573279695
Epoch: 65, step: 640, loss: 0.3236682415008545, mean loss: 0.33979550507392314
Epoch: 65, step: 641, loss: 0.3498762249946594, mean loss: 0.3397956117459504
Epoch: 65, step: 642, loss: 0.36090368032455444, mean loss: 0.3397958351046647
Epoch: 65, step: 643, loss: 0.36176052689552307, mean loss: 0.33979606752542774
Epoch: 65, step: 644, loss: 0.35089924931526184, mean loss: 0.33979618501319864
Epoch: 65, step: 645, loss: 0.3360651433467865, mean loss: 0.33979614553378285
Epoch: 65, step: 646, loss: 0.3198239505290985, mean loss: 0.33979593420345805
Epoch: 65, step: 647, loss: 0.32815590500831604, mean loss: 0.33979581103897255
Epoch: 65, step: 648, loss: 0.3199336528778076, mean loss: 0.3397956008774201
Epoch: 65, step: 649, loss: 0.33827999234199524, mean loss: 0.33979558484093153
Epoch: 65, step: 650, loss: 0.3344113826751709, mean loss: 0.33979552787187856
Epoch: 65, step: 651, loss: 0.37561413645744324, mean loss: 0.33979590685664857
Epoch: 65, step: 652, loss: 0.30859848856925964, mean loss: 0.33979557677064676
Epoch: 65, step: 653, loss: 0.30650827288627625, mean loss: 0.33979522457622174
Epoch: 65, step: 654, loss: 0.3631540834903717, mean loss: 0.3397954717206847
Epoch: 65, step: 655, loss: 0.3477305769920349, mean loss: 0.339795555675838
Epoch: 65, step: 656, loss: 0.3273959159851074, mean loss: 0.33979542448631983
Epoch: 65, step: 657, loss: 0.3050285875797272, mean loss: 0.3397950566533472
Epoch: 65, step: 658, loss: 0.346457839012146, mean loss: 0.33979512714480775
Epoch: 65, step: 659, loss: 0.33654701709747314, mean loss: 0.3397950927805457
Epoch: 65, step: 660, loss: 0.316718727350235, mean loss: 0.3397948486404559
Epoch: 65, step: 661, loss: 0.3134843111038208, mean loss: 0.33979457028687116
Epoch: 65, step: 662, loss: 0.34659910202026367, mean loss: 0.3397946422749771
Epoch: 65, step: 663, loss: 0.30470529198646545, mean loss: 0.3397942710533795
Epoch: 65, step: 664, loss: 0.3250952363014221, mean loss: 0.3397941155491769
Epoch: 65, step: 665, loss: 0.3662146031856537, mean loss: 0.33979439505415576
Epoch: 65, step: 666, loss: 0.38544511795043945, mean loss: 0.3397948779926061
Epoch: 65, step: 667, loss: 0.3412914276123047, mean loss: 0.33979489382441913
Epoch: 65, step: 668, loss: 0.3142284154891968, mean loss: 0.3397946233626737
Epoch: 65, step: 669, loss: 0.3486085832118988, mean loss: 0.33979471660249017
Epoch: 65, step: 670, loss: 0.3382684290409088, mean loss: 0.3397947004565956
Epoch: 65, step: 671, loss: 0.32406461238861084, mean loss: 0.3397945340569842
Epoch: 65, step: 672, loss: 0.3244522213935852, mean loss: 0.33979437176114397
Epoch: 65, step: 673, loss: 0.3251316249370575, mean loss: 0.33979421665560705
Epoch: 65, step: 674, loss: 0.35085880756378174, mean loss: 0.33979433369787615
Epoch: 65, step: 675, loss: 0.3937819302082062, mean loss: 0.3397949047776395
Epoch: 65, step: 676, loss: 0.3150774836540222, mean loss: 0.33979464331999726
Epoch: 65, step: 677, loss: 0.3456982970237732, mean loss: 0.3397947057674121
Epoch: 65, step: 678, loss: 0.36855006217956543, mean loss: 0.33979500993136996
Epoch: 65, step: 679, loss: 0.3400803208351135, mean loss: 0.33979501294925557
Epoch: 65, step: 680, loss: 0.3112717866897583, mean loss: 0.3397947112470707
Epoch: 65, step: 681, loss: 0.3737485110759735, mean loss: 0.3397950703869221
Epoch: 65, step: 682, loss: 0.32195112109184265, mean loss: 0.339794881647943
Epoch: 65, step: 683, loss: 0.2828907072544098, mean loss: 0.339794279767608
Epoch: 65, step: 684, loss: 0.33070072531700134, mean loss: 0.33979418358531965
Epoch: 65, step: 685, loss: 0.3266344368457794, mean loss: 0.3397940443964937
Epoch: 65, step: 686, loss: 0.28481176495552063, mean loss: 0.33979346286265927
Epoch: 65, step: 687, loss: 0.36428195238113403, mean loss: 0.33979372186855594
Epoch: 65, step: 688, loss: 0.31338509917259216, mean loss: 0.3397934425570593
Epoch: 65, step: 689, loss: 0.29218584299087524, mean loss: 0.3397929390393484
Epoch: 65, step: 690, loss: 0.36669644713401794, mean loss: 0.33979322357899466
Epoch: 65, step: 691, loss: 0.33149006962776184, mean loss: 0.3397931357632536
Epoch: 65, step: 692, loss: 0.32046422362327576, mean loss: 0.33979293133915134
Epoch: 65, step: 693, loss: 0.3656328618526459, mean loss: 0.33979320462140816
Epoch: 65, step: 694, loss: 0.30773597955703735, mean loss: 0.33979286558883387
Epoch: 65, step: 695, loss: 0.33975672721862793, mean loss: 0.33979286520664376
Epoch: 65, step: 696, loss: 0.34546229243278503, mean loss: 0.33979292516441767
Epoch: 65, step: 697, loss: 0.32148388028144836, mean loss: 0.3397927315367512
Epoch: 65, step: 698, loss: 0.2947758138179779, mean loss: 0.33979225546448183
Epoch: 65, step: 699, loss: 0.3217012584209442, mean loss: 0.3397920641468312
Epoch: 65, step: 700, loss: 0.3299616277217865, mean loss: 0.33979196018815455
Epoch: 65, step: 701, loss: 0.3165726065635681, mean loss: 0.33979171464180796
Epoch: 65, step: 702, loss: 0.30288776755332947, mean loss: 0.3397913243840212
Epoch: 65, step: 703, loss: 0.29349783062934875, mean loss: 0.33979083483732525
Epoch: 65, step: 704, loss: 0.3254987299442291, mean loss: 0.3397906837020755
Epoch: 65, step: 705, loss: 0.3413502275943756, mean loss: 0.3397907001936675
Epoch: 65, step: 706, loss: 0.3489255905151367, mean loss: 0.3397907967906868
Epoch: 65, step: 707, loss: 0.34957030415534973, mean loss: 0.339790900203124
Epoch: 65, step: 708, loss: 0.3132159113883972, mean loss: 0.3397906191914943
Epoch: 65, step: 709, loss: 0.3445121943950653, mean loss: 0.33979066911827027
Epoch: 65, step: 710, loss: 0.30968448519706726, mean loss: 0.3397903507734931
Epoch: 65, step: 711, loss: 0.33014023303985596, mean loss: 0.3397902487335898
Epoch: 65, step: 712, loss: 0.3314872682094574, mean loss: 0.3397901609391821
Epoch: 65, step: 713, loss: 0.3246081471443176, mean loss: 0.33979000040865787
Epoch: 65, step: 714, loss: 0.2908966541290283, mean loss: 0.3397894834290514
Epoch: 65, step: 715, loss: 0.2844063639640808, mean loss: 0.3397888978352489
Epoch: 65, step: 716, loss: 0.31462424993515015, mean loss: 0.339788631759481
Epoch: 65, step: 717, loss: 0.32130271196365356, mean loss: 0.3397884363026116
Epoch: 65, step: 718, loss: 0.3174511790275574, mean loss: 0.33978820012695654
Epoch: 65, step: 719, loss: 0.3115968406200409, mean loss: 0.3397879020580254
Epoch: 65, step: 720, loss: 0.319450706243515, mean loss: 0.33978768703391043
Epoch: 65, step: 721, loss: 0.3676918148994446, mean loss: 0.3397879820596856
Epoch: 65, step: 722, loss: 0.3497135043144226, mean loss: 0.33978808699949775
Epoch: 65, step: 723, loss: 0.34135618805885315, mean loss: 0.33978810357842293
Epoch: 65, step: 724, loss: 0.3611027002334595, mean loss: 0.33978832892701577
Epoch: 65, step: 725, loss: 0.3228558301925659, mean loss: 0.3397881499100499
Epoch: 65, step: 726, loss: 0.3132823705673218, mean loss: 0.3397878696835987
Epoch: 65, step: 727, loss: 0.3004676103591919, mean loss: 0.33978745398330557
Epoch: 65, step: 728, loss: 0.3575749397277832, mean loss: 0.33978764203356243
Epoch: 65, step: 729, loss: 0.37385743856430054, mean loss: 0.33978800221747757
Epoch: 65, step: 730, loss: 0.31334248185157776, mean loss: 0.339787722639924
Epoch: 65, step: 731, loss: 0.2900601923465729, mean loss: 0.3397871969344701
Epoch: 65, step: 732, loss: 0.3281650245189667, mean loss: 0.3397870740694334
Epoch: 65, step: 733, loss: 0.38635361194610596, mean loss: 0.33978756634735674
Epoch: 65, step: 734, loss: 0.3319179117679596, mean loss: 0.339787483154222
Epoch: 65, step: 735, loss: 0.3107423484325409, mean loss: 0.33978717611021675
Epoch: 65, step: 736, loss: 0.34621164202690125, mean loss: 0.33978724402427235
Epoch: 65, step: 737, loss: 0.3539756238460541, mean loss: 0.33978739401031666
Epoch: 65, step: 738, loss: 0.35986024141311646, mean loss: 0.33978760619910725
Epoch: 65, step: 739, loss: 0.3256312310695648, mean loss: 0.33978745655454984
Epoch: 65, step: 740, loss: 0.33367279171943665, mean loss: 0.3397873919181841
Epoch: 65, step: 741, loss: 0.34628042578697205, mean loss: 0.33978746055345466
Epoch: 65, step: 742, loss: 0.3470427393913269, mean loss: 0.33978753724530203
Epoch: 65, step: 743, loss: 0.3278304636478424, mean loss: 0.3397874108545194
Epoch: 65, step: 744, loss: 0.29535189270973206, mean loss: 0.33978694115927977
Epoch: 65, step: 745, loss: 0.32551848888397217, mean loss: 0.3397867903395403
Epoch: 65, step: 746, loss: 0.33926475048065186, mean loss: 0.33978678482155683
Epoch: 65, step: 747, loss: 0.320536732673645, mean loss: 0.3397865813498404
Epoch: 65, step: 748, loss: 0.36580342054367065, mean loss: 0.33978685634312006
Epoch: 65, step: 749, loss: 0.31139740347862244, mean loss: 0.33978655627491516
Epoch: 65, step: 750, loss: 0.3461434543132782, mean loss: 0.3397866234647561
Epoch: 65, step: 751, loss: 0.32861465215682983, mean loss: 0.3397865053827865
Epoch: 65, step: 752, loss: 0.3184727132320404, mean loss: 0.33978628010938694
Epoch: 65, step: 753, loss: 0.3348635137081146, mean loss: 0.33978622807938713
Epoch: 65, step: 754, loss: 0.31027916073799133, mean loss: 0.339785916214806
Epoch: 65, step: 755, loss: 0.32740890979766846, mean loss: 0.3397857854017679
Epoch: 65, step: 756, loss: 0.32861772179603577, mean loss: 0.3397856673673385
Epoch: 65, step: 757, loss: 0.33286482095718384, mean loss: 0.3397855942222032
Epoch: 65, step: 758, loss: 0.3369891345500946, mean loss: 0.33978556466725474
Epoch: 65, step: 759, loss: 0.3355939984321594, mean loss: 0.3397855203683091
Epoch: 65, step: 760, loss: 0.3167368769645691, mean loss: 0.3397852767792179
Epoch: 65, step: 761, loss: 0.2998432517051697, mean loss: 0.33978485465724756
Epoch: 65, step: 762, loss: 0.3648478388786316, mean loss: 0.3397851195292578
Epoch: 65, step: 763, loss: 0.3188183307647705, mean loss: 0.3397848979492277
Epoch: 65, step: 764, loss: 0.3351348042488098, mean loss: 0.3397848488068901
Epoch: 65, step: 765, loss: 0.302376389503479, mean loss: 0.33978445347728403
Epoch: 65, step: 766, loss: 0.3274552822113037, mean loss: 0.3397843231849651
Epoch: 65, step: 767, loss: 0.34381917119026184, mean loss: 0.3397843658240149
Epoch: 65, step: 768, loss: 0.30942243337631226, mean loss: 0.3397840449717133
Epoch: 65, step: 769, loss: 0.3532153069972992, mean loss: 0.33978418690621637
Epoch: 65, step: 770, loss: 0.2977142333984375, mean loss: 0.3397837423378032
Epoch: 65, step: 771, loss: 0.3823237121105194, mean loss: 0.33978419186829784
Epoch: 65, step: 772, loss: 0.31016358733177185, mean loss: 0.33978387886327277
Epoch: 65, step: 773, loss: 0.35979747772216797, mean loss: 0.3397840903475053
Epoch: 65, step: 774, loss: 0.31419801712036133, mean loss: 0.3397838199816446
Epoch: 65, step: 775, loss: 0.34888172149658203, mean loss: 0.3397839161173806
Epoch: 65, step: 776, loss: 0.28658390045166016, mean loss: 0.339783353969218
Epoch: 65, step: 777, loss: 0.3323136866092682, mean loss: 0.3397832750403801
Epoch: 65, step: 778, loss: 0.3209812343120575, mean loss: 0.33978307636921146
Epoch: 65, step: 779, loss: 0.3314095437526703, mean loss: 0.3397829878914788
Epoch: 65, step: 780, loss: 0.3036780059337616, mean loss: 0.33978260639739105
Epoch: 65, step: 781, loss: 0.31930971145629883, mean loss: 0.33978239007805144
Epoch: 65, step: 782, loss: 0.3095225393772125, mean loss: 0.3397820703518097
Epoch: 65, step: 783, loss: 0.32946592569351196, mean loss: 0.33978196135235217
Epoch: 65, step: 784, loss: 0.3563182055950165, mean loss: 0.33978213607097696
Epoch: 65, step: 785, loss: 0.3109002709388733, mean loss: 0.3397818309142336
Epoch: 65, step: 786, loss: 0.34427645802497864, mean loss: 0.3397818784025545
Epoch: 65, step: 787, loss: 0.39438650012016296, mean loss: 0.33978245532569834
Epoch: 65, step: 788, loss: 0.34151849150657654, mean loss: 0.33978247366753167
Epoch: 65, step: 789, loss: 0.30872443318367004, mean loss: 0.33978214553186886
Epoch: 65, step: 790, loss: 0.3219553530216217, mean loss: 0.33978195718951104
Epoch: 65, step: 791, loss: 0.3195245563983917, mean loss: 0.339781743169725
Epoch: 65, step: 792, loss: 0.31780755519866943, mean loss: 0.3397815110145057
Epoch: 65, step: 793, loss: 0.3543894290924072, mean loss: 0.3397816653441492
Epoch: 65, step: 794, loss: 0.29585492610931396, mean loss: 0.33978120127210615
Epoch: 65, step: 795, loss: 0.3229696750640869, mean loss: 0.3397810236655497
Epoch: 65, step: 796, loss: 0.3192746341228485, mean loss: 0.33978080702663715
Epoch: 65, step: 797, loss: 0.3319338262081146, mean loss: 0.33978072412840543
Epoch: 65, step: 798, loss: 0.29824596643447876, mean loss: 0.33978028534542976
Epoch: 65, step: 799, loss: 0.31514042615890503, mean loss: 0.3397800250468962
Epoch: 65, step: 800, loss: 0.3750024139881134, mean loss: 0.339780397136658
Epoch: 65, step: 801, loss: 0.33106890320777893, mean loss: 0.33978030510929824
Epoch: 65, step: 802, loss: 0.3245445191860199, mean loss: 0.33978014416166374
Epoch: 65, step: 803, loss: 0.3228170871734619, mean loss: 0.3397799649693944
Epoch: 65, step: 804, loss: 0.3345431983470917, mean loss: 0.3397799096504632
Epoch: 65, step: 805, loss: 0.3307937681674957, mean loss: 0.33977981472576496
Epoch: 65, step: 806, loss: 0.3065556287765503, mean loss: 0.33977946376729
Epoch: 65, step: 807, loss: 0.3066800534725189, mean loss: 0.33977911413055645
Epoch: 65, step: 808, loss: 0.3168235719203949, mean loss: 0.3397788716484112
Epoch: 65, step: 809, loss: 0.36462724208831787, mean loss: 0.3397791341219555
Epoch: 65, step: 810, loss: 0.38208773732185364, mean loss: 0.33977958102336353
Epoch: 65, step: 811, loss: 0.3405894935131073, mean loss: 0.3397795895782952
Epoch: 65, step: 812, loss: 0.36041566729545593, mean loss: 0.339779807550449
Epoch: 65, step: 813, loss: 0.3388175964355469, mean loss: 0.3397797973870344
Epoch: 65, step: 814, loss: 0.36218342185020447, mean loss: 0.33978003402420853
Epoch: 65, step: 815, loss: 0.29172682762145996, mean loss: 0.33977952646995613
Epoch: 65, step: 816, loss: 0.3343803584575653, mean loss: 0.33977946944271603
Epoch: 65, step: 817, loss: 0.3350363075733185, mean loss: 0.3397794193448911
Epoch: 65, step: 818, loss: 0.31667831540107727, mean loss: 0.33977917535093316
Epoch: 65, step: 819, loss: 0.3329094648361206, mean loss: 0.33977910279378787
Epoch: 65, step: 820, loss: 0.3344655930995941, mean loss: 0.3397790466736614
Epoch: 65, step: 821, loss: 0.32505595684051514, mean loss: 0.3397788911732512
Epoch: 65, step: 822, loss: 0.3182520270347595, mean loss: 0.33977866381602617
Epoch: 65, step: 823, loss: 0.3102758824825287, mean loss: 0.3397783522239796
Epoch: 65, step: 824, loss: 0.3192594349384308, mean loss: 0.3397781355168213
Epoch: 65, step: 825, loss: 0.3401765525341034, mean loss: 0.3397781397245924
Epoch: 65, step: 826, loss: 0.3325420916080475, mean loss: 0.3397780633038787
Epoch: 65, step: 827, loss: 0.3375716507434845, mean loss: 0.33977804000195494
Epoch: 65, step: 828, loss: 0.35959193110466003, mean loss: 0.33977824925425565
Epoch: 65, step: 829, loss: 0.31279510259628296, mean loss: 0.3397779642912537
Epoch: 65, step: 830, loss: 0.29837730526924133, mean loss: 0.3397775270727321
Epoch: 65, step: 831, loss: 0.34496161341667175, mean loss: 0.33977758181955703
Epoch: 65, step: 832, loss: 0.33697280287742615, mean loss: 0.33977755219984973
Epoch: 65, step: 833, loss: 0.3508448004722595, mean loss: 0.33977766907365664
Epoch: 65, step: 834, loss: 0.3403680622577667, mean loss: 0.33977767530833836
Epoch: 65, step: 835, loss: 0.33421850204467773, mean loss: 0.33977761660286754
Epoch: 65, step: 836, loss: 0.34036141633987427, mean loss: 0.3397776227677908
Epoch: 65, step: 837, loss: 0.3329694867134094, mean loss: 0.3397775508746562
Epoch: 65, step: 838, loss: 0.3405902087688446, mean loss: 0.3397775594561396
Epoch: 65, step: 839, loss: 0.35914164781570435, mean loss: 0.33977776393436937
Epoch: 65, step: 840, loss: 0.3284704089164734, mean loss: 0.33977764453378206
Epoch: 65, step: 841, loss: 0.33548733592033386, mean loss: 0.33977759923052964
Epoch: 65, step: 842, loss: 0.3208070993423462, mean loss: 0.3397773989148069
Epoch: 65, step: 843, loss: 0.295727401971817, mean loss: 0.3397769337813707
Epoch: 65, step: 844, loss: 0.3672600984573364, mean loss: 0.3397772239789809
Epoch: 65, step: 845, loss: 0.384653776884079, mean loss: 0.3397776978301931
Epoch: 65, step: 846, loss: 0.3330298066139221, mean loss: 0.3397776265800087
Epoch: 65, step: 847, loss: 0.30902761220932007, mean loss: 0.33977730189767597
Epoch: 65, step: 848, loss: 0.3438202142715454, mean loss: 0.3397773445854076
Epoch: 65, step: 849, loss: 0.3675342798233032, mean loss: 0.33977763765831687
Epoch: 65, step: 850, loss: 0.3281369209289551, mean loss: 0.33977751475055823
Epoch: 65, step: 851, loss: 0.328693151473999, mean loss: 0.3397773977182574
Epoch: 65, step: 852, loss: 0.2898203134536743, mean loss: 0.33977687026073555
Epoch: 65, step: 853, loss: 0.317335307598114, mean loss: 0.33977663332044516
Epoch: 65, step: 854, loss: 0.31385621428489685, mean loss: 0.33977635965292646
Epoch: 65, step: 855, loss: 0.3428802490234375, mean loss: 0.3397763924234127
Epoch: 65, step: 856, loss: 0.3236500322818756, mean loss: 0.33977622216506265
Epoch: 65, step: 857, loss: 0.37705087661743164, mean loss: 0.33977661569801787
Epoch: 65, step: 858, loss: 0.3227091133594513, mean loss: 0.3397764355071128
Epoch: 65, step: 859, loss: 0.32044461369514465, mean loss: 0.3397762314127102
Epoch: 65, step: 860, loss: 0.30679789185523987, mean loss: 0.3397758832497943
Epoch: 65, step: 861, loss: 0.33547499775886536, mean loss: 0.33977583784444504
Epoch: 65, step: 862, loss: 0.3329937160015106, mean loss: 0.3397757662449197
Epoch: 65, step: 863, loss: 0.2988705337047577, mean loss: 0.3397753344089273
Epoch: 65, step: 864, loss: 0.4251662790775299, mean loss: 0.3397762358704704
Epoch: 65, step: 865, loss: 0.3102717697620392, mean loss: 0.33977592439879306
Epoch: 65, step: 866, loss: 0.33096352219581604, mean loss: 0.3397758313693273
Epoch: 65, step: 867, loss: 0.3120116591453552, mean loss: 0.33977553827570955
Epoch: 65, step: 868, loss: 0.32733413577079773, mean loss: 0.33977540693892244
Epoch: 65, step: 869, loss: 0.32136020064353943, mean loss: 0.33977521254214954
Epoch: 65, step: 870, loss: 0.3474096953868866, mean loss: 0.33977529313332716
Epoch: 65, step: 871, loss: 0.3650270998477936, mean loss: 0.3397755596938
Epoch: 65, step: 872, loss: 0.33354511857032776, mean loss: 0.3397754939253653
Epoch: 65, step: 873, loss: 0.32970714569091797, mean loss: 0.3397753876451678
Epoch: 65, step: 874, loss: 0.3020293414592743, mean loss: 0.3397749892069329
Epoch: 65, step: 875, loss: 0.3695138394832611, mean loss: 0.33977530311980947
Epoch: 65, step: 876, loss: 0.3769955039024353, mean loss: 0.33977569599905183
Epoch: 65, step: 877, loss: 0.3078559935092926, mean loss: 0.33977535907297685
Epoch: 65, step: 878, loss: 0.30010080337524414, mean loss: 0.33977494029553884
Epoch: 65, step: 879, loss: 0.30205100774765015, mean loss: 0.33977454211174585
Epoch: 65, step: 880, loss: 0.30852141976356506, mean loss: 0.33977421223215465
Epoch: 65, step: 881, loss: 0.3409620225429535, mean loss: 0.3397742247694698
Epoch: 65, step: 882, loss: 0.34507235884666443, mean loss: 0.3397742806905835
Epoch: 65, step: 883, loss: 0.39422154426574707, mean loss: 0.33977485536827895
Epoch: 65, step: 884, loss: 0.29789239168167114, mean loss: 0.33977441331367253
Epoch: 65, step: 885, loss: 0.3287220597267151, mean loss: 0.3397742966612166
Epoch: 65, step: 886, loss: 0.3750535547733307, mean loss: 0.33977466901346115
Epoch: 65, step: 887, loss: 0.3172732889652252, mean loss: 0.3397744315268646
Epoch: 65, step: 888, loss: 0.31489816308021545, mean loss: 0.3397741689777248
Epoch: 65, step: 889, loss: 0.3171706199645996, mean loss: 0.3397739304178407
Epoch: 65, step: 890, loss: 0.3245716691017151, mean loss: 0.33977376997350434
Epoch: 65, step: 891, loss: 0.29699063301086426, mean loss: 0.3397733184459697
Epoch: 65, step: 892, loss: 0.33239737153053284, mean loss: 0.33977324060202896
Epoch: 65, step: 893, loss: 0.33009961247444153, mean loss: 0.33977313850999985
Epoch: 65, step: 894, loss: 0.3641510009765625, mean loss: 0.3397733957825709
Epoch: 65, step: 895, loss: 0.3250460922718048, mean loss: 0.33977324035913054
Epoch: 65, step: 896, loss: 0.3209335505962372, mean loss: 0.33977304153804333
Epoch: 65, step: 897, loss: 0.32802924513816833, mean loss: 0.3397729176034267
Epoch: 65, step: 898, loss: 0.2924778163433075, mean loss: 0.33977241849409395
Epoch: 65, step: 899, loss: 0.33742427825927734, mean loss: 0.3397723937142266
Epoch: 65, step: 900, loss: 0.3373963534832001, mean loss: 0.3397723686401958
Epoch: 65, step: 901, loss: 0.32170578837394714, mean loss: 0.33977217798803283
Epoch: 65, step: 902, loss: 0.3411686420440674, mean loss: 0.3397721927244179
Epoch: 65, step: 903, loss: 0.36462000012397766, mean loss: 0.33977245493166325
Epoch: 65, step: 904, loss: 0.31773582100868225, mean loss: 0.3397722223918656
Epoch: 65, step: 905, loss: 0.3022304177284241, mean loss: 0.33977182623918784
Epoch: 65, step: 906, loss: 0.3264244794845581, mean loss: 0.33977168539536295
Epoch: 65, step: 907, loss: 0.3024258315563202, mean loss: 0.3397712913187354
Epoch: 65, step: 908, loss: 0.3754941523075104, mean loss: 0.3397716682654267
Epoch: 65, step: 909, loss: 0.302234947681427, mean loss: 0.33977127218311604
Epoch: 65, step: 910, loss: 0.32102084159851074, mean loss: 0.33977107433324016
Epoch: 65, step: 911, loss: 0.37875500321388245, mean loss: 0.3397714856776128
Epoch: 65, step: 912, loss: 0.3453511893749237, mean loss: 0.33977154455201475
Epoch: 65, step: 913, loss: 0.3228275179862976, mean loss: 0.33977136576852385
Epoch: 65, step: 914, loss: 0.32014644145965576, mean loss: 0.3397711586999477
Epoch: 65, step: 915, loss: 0.38240885734558105, mean loss: 0.3397716085785947
Epoch: 65, step: 916, loss: 0.3471802771091461, mean loss: 0.3397716867480718
Epoch: 65, step: 917, loss: 0.3682759404182434, mean loss: 0.33977198749564685
Epoch: 65, step: 918, loss: 0.35769912600517273, mean loss: 0.3397721766423831
Epoch: 65, step: 919, loss: 0.32132428884506226, mean loss: 0.33977198200334746
Epoch: 65, step: 920, loss: 0.34194687008857727, mean loss: 0.33977200494980386
Epoch: 65, step: 921, loss: 0.30579516291618347, mean loss: 0.3397716464762326
Epoch: 65, step: 922, loss: 0.30974721908569336, mean loss: 0.3397713297060587
Epoch: 65, step: 923, loss: 0.3288555145263672, mean loss: 0.3397712145408918
Epoch: 65, step: 924, loss: 0.3495102524757385, mean loss: 0.3397713172896172
Epoch: 65, step: 925, loss: 0.3400656580924988, mean loss: 0.33977132039493657
Epoch: 65, step: 926, loss: 0.31001317501068115, mean loss: 0.3397710064473975
Epoch: 65, step: 927, loss: 0.3220846354961395, mean loss: 0.33977081985868424
Epoch: 65, step: 928, loss: 0.33980777859687805, mean loss: 0.33977082024858957
Epoch: 65, step: 929, loss: 0.2972370386123657, mean loss: 0.339770371532674
Epoch: 65, step: 930, loss: 0.30604687333106995, mean loss: 0.33977001576579524
Epoch: 65, step: 931, loss: 0.30693382024765015, mean loss: 0.33976966936319253
Epoch: 65, step: 932, loss: 0.31410908699035645, mean loss: 0.3397693986619554
Epoch: 65, step: 933, loss: 0.3400159478187561, mean loss: 0.3397694012628495
Epoch: 65, step: 934, loss: 0.3290090560913086, mean loss: 0.3397692877511118
Epoch: 65, step: 935, loss: 0.34591707587242126, mean loss: 0.33976935260393387
Epoch: 65, step: 936, loss: 0.3220660984516144, mean loss: 0.33976916585483685
Epoch: 65, step: 937, loss: 0.3464202284812927, mean loss: 0.3397692360152055
Epoch: 65, step: 938, loss: 0.299422025680542, mean loss: 0.3397688104072314
Epoch: 65, step: 939, loss: 0.29829928278923035, mean loss: 0.33976837296495693
Epoch: 65, step: 940, loss: 0.33095866441726685, mean loss: 0.33976828003652215
Epoch: 65, step: 941, loss: 0.3274191915988922, mean loss: 0.33976814977462433
Epoch: 65, step: 942, loss: 0.3384574055671692, mean loss: 0.3397681359486462
Epoch: 65, step: 943, loss: 0.3452516198158264, mean loss: 0.3397681937888625
Epoch: 65, step: 944, loss: 0.36014047265052795, mean loss: 0.3397684086749852
Epoch: 65, step: 945, loss: 0.33137083053588867, mean loss: 0.3397683200985434
Epoch: 65, step: 946, loss: 0.2973494529724121, mean loss: 0.3397678726751767
Epoch: 65, step: 947, loss: 0.34656453132629395, mean loss: 0.33976794436383856
Epoch: 65, step: 948, loss: 0.300642192363739, mean loss: 0.33976753168411405
Epoch: 65, step: 949, loss: 0.39858710765838623, mean loss: 0.33976815207833383
Epoch: 65, step: 950, loss: 0.347165584564209, mean loss: 0.3397682301012688
Epoch: 65, step: 951, loss: 0.330545037984848, mean loss: 0.33976813282252644
Epoch: 65, step: 952, loss: 0.30789700150489807, mean loss: 0.33976779667525425
Epoch: 65, step: 953, loss: 0.3465534746646881, mean loss: 0.33976786824356686
Epoch: 65, step: 954, loss: 0.34225085377693176, mean loss: 0.33976789443125377
Epoch: 65, step: 955, loss: 0.3455400764942169, mean loss: 0.33976795530897547
Epoch: 65, step: 956, loss: 0.32201194763183594, mean loss: 0.3397677680428979
Epoch: 65, step: 957, loss: 0.33173900842666626, mean loss: 0.33976768336741836
Epoch: 65, step: 958, loss: 0.3403007686138153, mean loss: 0.3397676889895537
Epoch: 65, step: 959, loss: 0.3599388003349304, mean loss: 0.33976790172010995
Epoch: 65, step: 960, loss: 0.3218858540058136, mean loss: 0.33976771313269033
Epoch: 65, step: 961, loss: 0.342978835105896, mean loss: 0.33976774699742607
Epoch: 65, step: 962, loss: 0.2971210777759552, mean loss: 0.3397672972471627
Epoch: 65, step: 963, loss: 0.33150261640548706, mean loss: 0.3397672100890504
Epoch: 65, step: 964, loss: 0.3135058581829071, mean loss: 0.3397669331436045
Epoch: 65, step: 965, loss: 0.3341844081878662, mean loss: 0.3397668742723566
Epoch: 65, step: 966, loss: 0.34070101380348206, mean loss: 0.33976688412334344
Epoch: 65, step: 967, loss: 0.31191959977149963, mean loss: 0.3397665904623535
Epoch: 65, step: 968, loss: 0.3447675406932831, mean loss: 0.33976664319886063
Epoch: 65, step: 969, loss: 0.34917858242988586, mean loss: 0.3397667424495116
Epoch: 65, step: 970, loss: 0.3480972647666931, mean loss: 0.3397668302954936
Epoch: 65, step: 971, loss: 0.3641192615032196, mean loss: 0.3397670870909973
Epoch: 65, step: 972, loss: 0.3199913203716278, mean loss: 0.33976687855845356
Epoch: 65, step: 973, loss: 0.30171895027160645, mean loss: 0.33976647735289134
Epoch: 65, step: 974, loss: 0.3753807842731476, mean loss: 0.33976685289258574
Epoch: 65, step: 975, loss: 0.3460915982723236, mean loss: 0.3397669195839833
Epoch: 65, step: 976, loss: 0.31426122784614563, mean loss: 0.3397666506415691
Epoch: 65, step: 977, loss: 0.34930068254470825, mean loss: 0.3397667511712292
Epoch: 65, step: 978, loss: 0.28758639097213745, mean loss: 0.3397662009718365
Epoch: 65, step: 979, loss: 0.35687536001205444, mean loss: 0.33976638137207943
Epoch: 65, step: 980, loss: 0.3313116133213043, mean loss: 0.33976629222531746
Epoch: 65, step: 981, loss: 0.33454108238220215, mean loss: 0.33976623713147885
Epoch: 65, step: 982, loss: 0.3784586489200592, mean loss: 0.33976664509423615
Epoch: 65, step: 983, loss: 0.30523577332496643, mean loss: 0.3397662810135166
Epoch: 65, step: 984, loss: 0.3221452534198761, mean loss: 0.3397660952258884
Epoch: 65, step: 985, loss: 0.3306496739387512, mean loss: 0.3397659991077465
Epoch: 65, step: 986, loss: 0.31189024448394775, mean loss: 0.33976570520541305
Epoch: 65, step: 987, loss: 0.3444116413593292, mean loss: 0.3397657541883769
Epoch: 65, step: 988, loss: 0.31061795353889465, mean loss: 0.33976544688096566
Epoch: 65, step: 989, loss: 0.302305668592453, mean loss: 0.3397650519439252
Epoch: 65, step: 990, loss: 0.3314369320869446, mean loss: 0.33976496414179497
Epoch: 65, step: 991, loss: 0.32912975549697876, mean loss: 0.3397648520175525
Epoch: 65, step: 992, loss: 0.3293825387954712, mean loss: 0.3397647425606748
Epoch: 65, step: 993, loss: 0.3260660767555237, mean loss: 0.3397645981422443
Epoch: 65, step: 994, loss: 0.36101284623146057, mean loss: 0.3397648221499201
Epoch: 65, step: 995, loss: 0.3488853871822357, mean loss: 0.33976491830161354
Epoch: 65, step: 996, loss: 0.34862571954727173, mean loss: 0.33976501171381557
Epoch: 65, step: 997, loss: 0.3546479046344757, mean loss: 0.3397651686103654
Epoch: 65, step: 998, loss: 0.362197607755661, mean loss: 0.3397654050922927
Epoch: 65, step: 999, loss: 0.34124529361724854, mean loss: 0.33976542069305726
Epoch: 65, step: 1000, loss: 0.34221675992012024, mean loss: 0.3397654465344381
Epoch: 65, step: 1001, loss: 0.35776838660240173, mean loss: 0.33976563631475126
Epoch: 65, step: 1002, loss: 0.33874472975730896, mean loss: 0.3397656255528467
Epoch: 65, step: 1003, loss: 0.3331628143787384, mean loss: 0.3397655559499291
Epoch: 65, step: 1004, loss: 0.2964376211166382, mean loss: 0.3397650992173635
Epoch: 65, step: 1005, loss: 0.33472323417663574, mean loss: 0.3397650460701343
Epoch: 65, step: 1006, loss: 0.3273237943649292, mean loss: 0.33976491492598826
Epoch: 65, step: 1007, loss: 0.2902619540691376, mean loss: 0.3397643931171501
Epoch: 65, step: 1008, loss: 0.3498012125492096, mean loss: 0.339764498913769
Epoch: 65, step: 1009, loss: 0.34922459721565247, mean loss: 0.3397645986302052
Epoch: 65, step: 1010, loss: 0.3179139196872711, mean loss: 0.33976436831030826
Epoch: 65, step: 1011, loss: 0.29022523760795593, mean loss: 0.33976384614222177
Epoch: 65, step: 1012, loss: 0.3372983932495117, mean loss: 0.33976382015534573
Epoch: 65, step: 1013, loss: 0.33671149611473083, mean loss: 0.3397637879829482
Epoch: 65, step: 1014, loss: 0.2959904372692108, mean loss: 0.3397633266037575
Epoch: 65, step: 1015, loss: 0.3476363718509674, mean loss: 0.33976340958623197
Epoch: 65, step: 1016, loss: 0.3320106863975525, mean loss: 0.3397633278728221
Epoch: 65, step: 1017, loss: 0.33036017417907715, mean loss: 0.33976322876498155
Epoch: 65, step: 1018, loss: 0.36315420269966125, mean loss: 0.33976347529976725
Epoch: 65, step: 1019, loss: 0.34539079666137695, mean loss: 0.3397635346096467
Epoch: 65, step: 1020, loss: 0.33533143997192383, mean loss: 0.3397634878975058
Epoch: 65, step: 1021, loss: 0.33877256512641907, mean loss: 0.3397634774537676
Epoch: 65, step: 1022, loss: 0.34603309631347656, mean loss: 0.3397635435311351
Epoch: 65, step: 1023, loss: 0.3327673375606537, mean loss: 0.33976346979682825
Epoch: 65, step: 1024, loss: 0.3038294315338135, mean loss: 0.3397630910853537
Epoch: 65, step: 1025, loss: 0.3393304944038391, mean loss: 0.33976308652623344
Epoch: 65, step: 1026, loss: 0.3209717273712158, mean loss: 0.3397628884868903
Epoch: 65, step: 1027, loss: 0.32602977752685547, mean loss: 0.33976274375719884
Epoch: 65, step: 1028, loss: 0.3406050503253937, mean loss: 0.33976275263395556
Epoch: 65, step: 1029, loss: 0.3248763978481293, mean loss: 0.33976259575383344
Epoch: 65, step: 1030, loss: 0.31893783807754517, mean loss: 0.3397623762940567
Epoch: 65, step: 1031, loss: 0.35033392906188965, mean loss: 0.3397624877002107
Epoch: 65, step: 1032, loss: 0.3236708343029022, mean loss: 0.3397623181233884
Epoch: 65, step: 1033, loss: 0.3407498896121979, mean loss: 0.33976232853048993
Epoch: 65, step: 1034, loss: 0.36091846227645874, mean loss: 0.3397625514730448
Epoch: 65, step: 1035, loss: 0.30137282609939575, mean loss: 0.3397621469278019
Epoch: 65, step: 1036, loss: 0.34040185809135437, mean loss: 0.3397621536689124
Epoch: 65, step: 1037, loss: 0.34301334619522095, mean loss: 0.3397621879287759
Epoch: 65, step: 1038, loss: 0.3317180871963501, mean loss: 0.3397621031639129
Epoch: 65, step: 1039, loss: 0.2895508408546448, mean loss: 0.33976157406736596
Epoch: 65, step: 1040, loss: 0.3642946779727936, mean loss: 0.3397618325799623
Epoch: 65, step: 1041, loss: 0.3247867822647095, mean loss: 0.3397616747850758
Epoch: 65, step: 1042, loss: 0.3077546954154968, mean loss: 0.33976133752514337
Epoch: 65, step: 1043, loss: 0.3373975455760956, mean loss: 0.3397613126179535
Epoch: 65, step: 1044, loss: 0.3279227018356323, mean loss: 0.3397611878762562
Epoch: 65, step: 1045, loss: 0.3146924078464508, mean loss: 0.3397609237329983
Epoch: 65, step: 1046, loss: 0.3337634801864624, mean loss: 0.33976086054015114
Epoch: 65, step: 1047, loss: 0.320750892162323, mean loss: 0.3397606602412472
Epoch: 65, step: 1048, loss: 0.3552250266075134, mean loss: 0.33976082318012935
Epoch: 65, step: 1049, loss: 0.3350578546524048, mean loss: 0.3397607736282536
Epoch: 65, step: 1050, loss: 0.31121981143951416, mean loss: 0.3397604729153521
Epoch: 65, step: 1051, loss: 0.35287952423095703, mean loss: 0.33976061113866757
Epoch: 65, step: 1052, loss: 0.336599200963974, mean loss: 0.33976057783016217
Epoch: 65, step: 1053, loss: 0.32077810168266296, mean loss: 0.3397603778335742
Epoch: 65, step: 1054, loss: 0.3427733778953552, mean loss: 0.33976040957776704
Epoch: 65, step: 1055, loss: 0.3175519108772278, mean loss: 0.33976017559720845
Epoch: 65, step: 1056, loss: 0.3219674527645111, mean loss: 0.3397599881416122
Epoch: 65, step: 1057, loss: 0.3749171197414398, mean loss: 0.3397603585363908
Epoch: 65, step: 1058, loss: 0.2978956997394562, mean loss: 0.339759917479713
Epoch: 65, step: 1059, loss: 0.3514693081378937, mean loss: 0.3397600408403394
Epoch: 65, step: 1060, loss: 0.3218199908733368, mean loss: 0.3397598518405399
Epoch: 65, step: 1061, loss: 0.32287997007369995, mean loss: 0.339759674011567
Epoch: 65, step: 1062, loss: 0.34685003757476807, mean loss: 0.33975974870751596
Epoch: 65, step: 1063, loss: 0.3129498064517975, mean loss: 0.33975946627164877
Epoch: 65, step: 1064, loss: 0.3558392822742462, mean loss: 0.3397596356666027
Epoch: 65, step: 1065, loss: 0.35077103972435, mean loss: 0.33975975166647693
Epoch: 65, step: 1066, loss: 0.3576679825782776, mean loss: 0.3397599403191354
Epoch: 65, step: 1067, loss: 0.3030009865760803, mean loss: 0.3397595530893008
Epoch: 65, step: 1068, loss: 0.33790332078933716, mean loss: 0.33975953353539945
Epoch: 65, step: 1069, loss: 0.3012194335460663, mean loss: 0.33975912755098997
Epoch: 65, step: 1070, loss: 0.3446465730667114, mean loss: 0.33975917903517866
Epoch: 65, step: 1071, loss: 0.33714714646339417, mean loss: 0.33975915152040415
Epoch: 65, step: 1072, loss: 0.3274856209754944, mean loss: 0.33975902223416493
Epoch: 65, step: 1073, loss: 0.34309229254722595, mean loss: 0.33975905734561407
Epoch: 65, step: 1074, loss: 0.33135485649108887, mean loss: 0.3397589688197716
Epoch: 65, step: 1075, loss: 0.3616369366645813, mean loss: 0.3397591992694202
Epoch: 65, step: 1076, loss: 0.3306798040866852, mean loss: 0.3397591036334176
Epoch: 65, step: 1077, loss: 0.29630517959594727, mean loss: 0.3397586459249759
Epoch: 65, step: 1078, loss: 0.3370552957057953, mean loss: 0.3397586174503741
Epoch: 65, step: 1079, loss: 0.29313570261001587, mean loss: 0.33975812637269515
Epoch: 65, step: 1080, loss: 0.3271103501319885, mean loss: 0.3397579931554735
Epoch: 65, step: 1081, loss: 0.3194844722747803, mean loss: 0.3397577796196213
Epoch: 65, step: 1082, loss: 0.3421112596988678, mean loss: 0.3397578044079688
Epoch: 65, step: 1083, loss: 0.32708674669265747, mean loss: 0.3397576709497438
Epoch: 65, step: 1084, loss: 0.31378573179244995, mean loss: 0.33975739740254113
Epoch: 65, step: 1085, loss: 0.33920466899871826, mean loss: 0.33975739158103835
Epoch: 65, step: 1086, loss: 0.30452197790145874, mean loss: 0.33975702047490886
Epoch: 65, step: 1087, loss: 0.35609176754951477, mean loss: 0.33975719251378356
Epoch: 65, step: 1088, loss: 0.30807220935821533, mean loss: 0.33975685880849804
Epoch: 65, step: 1089, loss: 0.3788718283176422, mean loss: 0.33975727076183676
Epoch: 65, step: 1090, loss: 0.3293747901916504, mean loss: 0.33975716141616824
Epoch: 65, step: 1091, loss: 0.3281742036342621, mean loss: 0.33975703942866103
Epoch: 65, step: 1092, loss: 0.33380866050720215, mean loss: 0.33975697678315303
Epoch: 65, step: 1093, loss: 0.3219061493873596, mean loss: 0.3397567887886779
Epoch: 65, step: 1094, loss: 0.3179440498352051, mean loss: 0.3397565590720863
Epoch: 65, step: 1095, loss: 0.3524227738380432, mean loss: 0.33975669246244355
Epoch: 65, step: 1096, loss: 0.3331071734428406, mean loss: 0.33975662243581023
Epoch: 65, step: 1097, loss: 0.33556872606277466, mean loss: 0.3397565783331925
Epoch: 65, step: 1098, loss: 0.35157740116119385, mean loss: 0.3397567028166309
Epoch: 65, step: 1099, loss: 0.341539591550827, mean loss: 0.33975672159178605
Epoch: 65, step: 1100, loss: 0.3497282564640045, mean loss: 0.339756826598419
Epoch: 65, step: 1101, loss: 0.33393046259880066, mean loss: 0.3397567652437298
Epoch: 65, step: 1102, loss: 0.35449784994125366, mean loss: 0.3397569204735003
Epoch: 65, step: 1103, loss: 0.34458836913108826, mean loss: 0.33975697135013416
Epoch: 65, step: 1104, loss: 0.3300595283508301, mean loss: 0.33975686923416515
Epoch: 65, step: 1105, loss: 0.32240030169487, mean loss: 0.3397566864680432
Epoch: 65, step: 1106, loss: 0.31313082575798035, mean loss: 0.33975640609843366
Epoch: 65, step: 1107, loss: 0.32244977355003357, mean loss: 0.3397562238619693
Epoch: 65, step: 1108, loss: 0.2977546155452728, mean loss: 0.33975578159545794
Epoch: 65, step: 1109, loss: 0.3293444514274597, mean loss: 0.3397556719678896
Epoch: 65, step: 1110, loss: 0.3366812765598297, mean loss: 0.3397556395959507
Epoch: 65, step: 1111, loss: 0.3666934669017792, mean loss: 0.33975592323562664
Epoch: 65, step: 1112, loss: 0.3330552279949188, mean loss: 0.3397558526819404
Epoch: 65, step: 1113, loss: 0.3144228458404541, mean loss: 0.33975558594570904
Epoch: 65, step: 1114, loss: 0.3359646201133728, mean loss: 0.3397555460303015
Epoch: 65, step: 1115, loss: 0.30753037333488464, mean loss: 0.3397552067322399
Epoch: 65, step: 1116, loss: 0.3061327338218689, mean loss: 0.3397548527257656
Epoch: 65, step: 1117, loss: 0.3096526861190796, mean loss: 0.33975453578745773
Epoch: 65, step: 1118, loss: 0.30026865005493164, mean loss: 0.33975412005465644
Epoch: 65, step: 1119, loss: 0.33555343747138977, mean loss: 0.33975407582763406
Epoch: 65, step: 1120, loss: 0.3060336410999298, mean loss: 0.33975372080468497
Epoch: 65, step: 1121, loss: 0.30607911944389343, mean loss: 0.3397533662680216
Epoch: 65, step: 1122, loss: 0.32965710759162903, mean loss: 0.3397532599725932
Epoch: 65, step: 1123, loss: 0.32117706537246704, mean loss: 0.33975306440076425
Epoch: 65, step: 1124, loss: 0.33650243282318115, mean loss: 0.3397530301781862
Epoch: 65, step: 1125, loss: 0.32048845291137695, mean loss: 0.33975282736327383
Epoch: 65, step: 1126, loss: 0.3184758722782135, mean loss: 0.3397526033646731
Epoch: 65, step: 1127, loss: 0.3533884882926941, mean loss: 0.33975274691843704
Epoch: 65, step: 1128, loss: 0.33446359634399414, mean loss: 0.33975269123672047
Epoch: 65, step: 1129, loss: 0.38922402262687683, mean loss: 0.33975321204239883
Epoch: 65, step: 1130, loss: 0.33439186215400696, mean loss: 0.33975315560178987
Epoch: 65, step: 1131, loss: 0.39462727308273315, mean loss: 0.3397537332727251
Epoch: 65, step: 1132, loss: 0.3097854554653168, mean loss: 0.33975341779392343
Epoch: 65, step: 1133, loss: 0.3062800467014313, mean loss: 0.3397530654203936
Epoch: 65, step: 1134, loss: 0.35565513372421265, mean loss: 0.33975323281939673
Epoch: 65, step: 1135, loss: 0.3699662387371063, mean loss: 0.3397535508644293
Epoch: 65, step: 1136, loss: 0.32983434200286865, mean loss: 0.3397534464484071
Epoch: 65, step: 1137, loss: 0.3458106219768524, mean loss: 0.33975351020949185
Epoch: 65, step: 1138, loss: 0.3320423662662506, mean loss: 0.33975342903870115
Epoch: 65, step: 1139, loss: 0.2885873019695282, mean loss: 0.3397528904478899
Epoch: 65, step: 1140, loss: 0.3188464045524597, mean loss: 0.3397526703819338
Epoch: 65, step: 1141, loss: 0.32628050446510315, mean loss: 0.33975252857264643
Epoch: 65, step: 1142, loss: 0.3013858497142792, mean loss: 0.33975212472562205
Epoch: 65, step: 1143, loss: 0.36439892649650574, mean loss: 0.33975238415471737
Epoch: 65, step: 1144, loss: 0.29533636569976807, mean loss: 0.33975191664228693
Epoch: 65, step: 1145, loss: 0.3077360689640045, mean loss: 0.3397515796546474
Epoch: 65, step: 1146, loss: 0.34239983558654785, mean loss: 0.33975160752897177
Epoch: 65, step: 1147, loss: 0.3708088994026184, mean loss: 0.3397519344203059
Epoch: 65, step: 1148, loss: 0.33235007524490356, mean loss: 0.3397518565133794
Epoch: 65, step: 1149, loss: 0.32802972197532654, mean loss: 0.3397517331354767
Epoch: 65, step: 1150, loss: 0.33820444345474243, mean loss: 0.3397517168501026
Epoch: 65, step: 1151, loss: 0.2987060546875, mean loss: 0.33975128484506995
Epoch: 65, step: 1152, loss: 0.35015660524368286, mean loss: 0.33975139435977214
Epoch: 65, step: 1153, loss: 0.32534345984458923, mean loss: 0.3397512427196505
Epoch: 65, step: 1154, loss: 0.37342342734336853, mean loss: 0.33975159710774316
Epoch: 65, step: 1155, loss: 0.3393153250217438, mean loss: 0.33975159251617876
Epoch: 65, step: 1156, loss: 0.3059907555580139, mean loss: 0.3397512372025301
Epoch: 65, step: 1157, loss: 0.306403249502182, mean loss: 0.3397508862375792
Epoch: 65, step: 1158, loss: 0.33855801820755005, mean loss: 0.3397508736835844
Epoch: 65, step: 1159, loss: 0.35557010769844055, mean loss: 0.3397510401667881
Epoch: 65, step: 1160, loss: 0.33536791801452637, mean loss: 0.3397509940388569
Epoch: 65, step: 1161, loss: 0.3100723922252655, mean loss: 0.339750681704852
Epoch: 65, step: 1162, loss: 0.4190143942832947, mean loss: 0.33975151585776847
Epoch: 65, step: 1163, loss: 0.3329613208770752, mean loss: 0.3397514444000843
Epoch: 65, step: 1164, loss: 0.33198389410972595, mean loss: 0.3397513626579081
Epoch: 65, step: 1165, loss: 0.3543679118156433, mean loss: 0.3397515164742232
Epoch: 65, step: 1166, loss: 0.3468444347381592, mean loss: 0.33975159111530695
Epoch: 65, step: 1167, loss: 0.35478487610816956, mean loss: 0.3397517493137852
Epoch: 65, step: 1168, loss: 0.317399799823761, mean loss: 0.3397515141019079
Epoch: 65, step: 1169, loss: 0.3312029242515564, mean loss: 0.33975142414515896
Epoch: 65, step: 1170, loss: 0.3296331465244293, mean loss: 0.33975131767171746
Epoch: 65, step: 1171, loss: 0.3188660144805908, mean loss: 0.33975109790044894
Epoch: 65, step: 1172, loss: 0.36750173568725586, mean loss: 0.3397513899109904
Epoch: 65, step: 1173, loss: 0.31702253222465515, mean loss: 0.339751150745453
Epoch: 65, step: 1174, loss: 0.3490718901157379, mean loss: 0.3397512488223654
Epoch: 65, step: 1175, loss: 0.35696110129356384, mean loss: 0.3397514299100845
Epoch: 65, step: 1176, loss: 0.3498658239841461, mean loss: 0.33975153633594046
Epoch: 65, step: 1177, loss: 0.3727954030036926, mean loss: 0.3397518840270395
Epoch: 65, step: 1178, loss: 0.36015623807907104, mean loss: 0.33975209872157597
Epoch: 65, step: 1179, loss: 0.31621384620666504, mean loss: 0.3397518510547776
Epoch: 65, step: 1180, loss: 0.3525346517562866, mean loss: 0.33975198555252806
Epoch: 65, step: 1181, loss: 0.3817219138145447, mean loss: 0.3397524271460158
Epoch: 65, step: 1182, loss: 0.3306601047515869, mean loss: 0.33975233148066014
Epoch: 65, step: 1183, loss: 0.32765546441078186, mean loss: 0.3397522042041664
Epoch: 65, step: 1184, loss: 0.30222418904304504, mean loss: 0.3397518093594596
Epoch: 65, step: 1185, loss: 0.32254016399383545, mean loss: 0.33975162827192973
Epoch: 65, step: 1186, loss: 0.3075195848941803, mean loss: 0.3397512891550362
Epoch: 65, step: 1187, loss: 0.3452487289905548, mean loss: 0.33975134699360027
Epoch: 65, step: 1188, loss: 0.3515264093875885, mean loss: 0.33975147087772734
Epoch: 65, step: 1189, loss: 0.28816959261894226, mean loss: 0.3397509281962096
Epoch: 65, step: 1190, loss: 0.3211474120616913, mean loss: 0.3397507324747955
Epoch: 65, step: 1191, loss: 0.30514898896217346, mean loss: 0.3397503684451747
Epoch: 65, step: 1192, loss: 0.3271375298500061, mean loss: 0.3397502357524812
Epoch: 65, step: 1193, loss: 0.31784239411354065, mean loss: 0.3397500052746303
Epoch: 65, step: 1194, loss: 0.3578489124774933, mean loss: 0.3397501956792087
Epoch: 65, step: 1195, loss: 0.3503325581550598, mean loss: 0.3397503070068732
Epoch: 65, step: 1196, loss: 0.29821574687957764, mean loss: 0.33974987006314333
Epoch: 65, step: 1197, loss: 0.3369474709033966, mean loss: 0.3397498405822037
Epoch: 65, step: 1198, loss: 0.29028430581092834, mean loss: 0.3397493202155391
Epoch: 65, step: 1199, loss: 0.37779825925827026, mean loss: 0.33974972047788965
Epoch: 65, step: 1200, loss: 0.3103976845741272, mean loss: 0.33974941170735384
Epoch: 65, step: 1201, loss: 0.32018113136291504, mean loss: 0.3397492058597981
Epoch: 65, step: 1202, loss: 0.3061661422252655, mean loss: 0.33974885258814
Epoch: 65, step: 1203, loss: 0.3130730986595154, mean loss: 0.33974857197977165
Epoch: 65, step: 1204, loss: 0.30995413661003113, mean loss: 0.33974825856857543
Epoch: 65, step: 1205, loss: 0.3348981738090515, mean loss: 0.3397482075504958
Epoch: 65, step: 1206, loss: 0.303280770778656, mean loss: 0.3397478239532773
Epoch: 65, step: 1207, loss: 0.3453126549720764, mean loss: 0.339747882488547
Epoch: 65, step: 1208, loss: 0.35193103551864624, mean loss: 0.33974801063918525
Epoch: 65, step: 1209, loss: 0.30807992815971375, mean loss: 0.3397476775363928
Epoch: 65, step: 1210, loss: 0.3246608376502991, mean loss: 0.33974751884615195
Epoch: 65, step: 1211, loss: 0.3214459717273712, mean loss: 0.33974732634418375
Epoch: 65, step: 1212, loss: 0.3613124191761017, mean loss: 0.3397475531708625
Epoch: 65, step: 1213, loss: 0.3264189064502716, mean loss: 0.33974741297852057
Epoch: 65, step: 1214, loss: 0.30713972449302673, mean loss: 0.3397470700104587
Epoch: 65, step: 1215, loss: 0.3855256140232086, mean loss: 0.33974755150467395
Epoch: 65, step: 1216, loss: 0.28273558616638184, mean loss: 0.33974695186474696
Epoch: 65, step: 1217, loss: 0.3368028402328491, mean loss: 0.3397469208995223
Epoch: 65, step: 1218, loss: 0.3552860617637634, mean loss: 0.33974708433351786
Epoch: 65, step: 1219, loss: 0.3097791373729706, mean loss: 0.3397467691468649
Epoch: 65, step: 1220, loss: 0.36178991198539734, mean loss: 0.3397470009822772
Epoch: 65, step: 1221, loss: 0.32431846857070923, mean loss: 0.33974683871673367
Epoch: 65, step: 1222, loss: 0.31068485975265503, mean loss: 0.3397465330682059
Epoch: 65, step: 1223, loss: 0.36034104228019714, mean loss: 0.33974674966099977
Epoch: 65, step: 1224, loss: 0.3825497329235077, mean loss: 0.3397471998159481
Epoch: 65, step: 1225, loss: 0.3257458806037903, mean loss: 0.3397470525669397
Epoch: 65, step: 1226, loss: 0.2948545515537262, mean loss: 0.33974658044666023
Epoch: 65, step: 1227, loss: 0.3598784804344177, mean loss: 0.33974679216527864
Epoch: 65, step: 1228, loss: 0.3042508661746979, mean loss: 0.33974641887366774
Epoch: 65, step: 1229, loss: 0.3443036675453186, mean loss: 0.33974646679930315
Epoch: 65, step: 1230, loss: 0.3200324475765228, mean loss: 0.33974625948189957
Epoch: 65, step: 1231, loss: 0.38443058729171753, mean loss: 0.3397467293881778
Epoch: 65, step: 1232, loss: 0.3286142647266388, mean loss: 0.3397466123189439
Epoch: 65, step: 1233, loss: 0.34421879053115845, mean loss: 0.33974665934797
Epoch: 65, step: 1234, loss: 0.31653258204460144, mean loss: 0.3397464152333761
Epoch: 65, step: 1235, loss: 0.309467613697052, mean loss: 0.3397460968309035
Epoch: 65, step: 1236, loss: 0.30645647644996643, mean loss: 0.33974574677127617
Epoch: 65, step: 1237, loss: 0.32730042934417725, mean loss: 0.33974561590293584
Epoch: 65, step: 1238, loss: 0.29102620482444763, mean loss: 0.3397451036009024
Epoch: 65, step: 1239, loss: 0.31464990973472595, mean loss: 0.33974483971873765
Epoch: 65, step: 1240, loss: 0.3348340690135956, mean loss: 0.33974478808131314
Epoch: 65, step: 1241, loss: 0.30370625853538513, mean loss: 0.33974440913523896
Epoch: 65, step: 1242, loss: 0.3184465765953064, mean loss: 0.33974418519033145
Epoch: 65, step: 1243, loss: 0.328579306602478, mean loss: 0.339744067793812
Epoch: 65, step: 1244, loss: 0.3336271643638611, mean loss: 0.33974400347644246
Epoch: 65, step: 1245, loss: 0.32285410165786743, mean loss: 0.33974382588615565
Epoch: 65, step: 1246, loss: 0.332732617855072, mean loss: 0.3397437521669969
Epoch: 65, step: 1247, loss: 0.32409241795539856, mean loss: 0.33974358760319356
Epoch: 65, step: 1248, loss: 0.34737393260002136, mean loss: 0.33974366783056426
Epoch: 65, step: 1249, loss: 0.34064459800720215, mean loss: 0.33974367730307165
Epoch: 65, step: 1250, loss: 0.3575703501701355, mean loss: 0.33974386473326235
Epoch: 65, step: 1251, loss: 0.4035620391368866, mean loss: 0.33974453571247004
Epoch: 65, step: 1252, loss: 0.3559301793575287, mean loss: 0.33974470588525024
Epoch: 65, step: 1253, loss: 0.3456208109855652, mean loss: 0.3397447676648526
Epoch: 65, step: 1254, loss: 0.3411139249801636, mean loss: 0.3397447820596097
Epoch: 65, step: 1255, loss: 0.35203513503074646, mean loss: 0.33974491127396866
Epoch: 65, step: 1256, loss: 0.31759440898895264, mean loss: 0.33974467839759237
Epoch: 65, step: 1257, loss: 0.3431171178817749, mean loss: 0.3397447138529161
Epoch: 65, step: 1258, loss: 0.3510976731777191, mean loss: 0.33974483320824284
Epoch: 65, step: 1259, loss: 0.28882551193237305, mean loss: 0.3397442978915768
Epoch: 65, step: 1260, loss: 0.3105931282043457, mean loss: 0.3397439914274975
Epoch: 65, step: 1261, loss: 0.28263378143310547, mean loss: 0.3397433910384183
Epoch: 65, step: 1262, loss: 0.2998460531234741, mean loss: 0.3397429716094903
Epoch: 65, step: 1263, loss: 0.3215269148349762, mean loss: 0.33974278011147957
Epoch: 65, step: 1264, loss: 0.32379424571990967, mean loss: 0.33974261245277376
Epoch: 65, step: 1265, loss: 0.3230116665363312, mean loss: 0.3397424365708286
Epoch: 65, step: 1266, loss: 0.3298555314540863, mean loss: 0.33974233263708614
Epoch: 65, step: 1267, loss: 0.3758014142513275, mean loss: 0.33974271169563475
Epoch: 65, step: 1268, loss: 0.3238728642463684, mean loss: 0.3397425448711391
Epoch: 65, step: 1269, loss: 0.31418460607528687, mean loss: 0.3397422762078489
Epoch: 65, step: 1270, loss: 0.3433970510959625, mean loss: 0.33974231462618665
Epoch: 65, step: 1271, loss: 0.3707422614097595, mean loss: 0.33974264048863867
Epoch: 65, step: 1272, loss: 0.3308252990245819, mean loss: 0.33974254675311616
Epoch: 65, step: 1273, loss: 0.3151980936527252, mean loss: 0.33974228875436596
Epoch: 65, step: 1274, loss: 0.3254552483558655, mean loss: 0.3397421385778757
Epoch: 65, step: 1275, loss: 0.34023886919021606, mean loss: 0.33974214379914436
Epoch: 65, step: 1276, loss: 0.3560508191585541, mean loss: 0.3397423152222012
Epoch: 65, step: 1277, loss: 0.32709285616874695, mean loss: 0.3397421822631412
Epoch: 65, step: 1278, loss: 0.2989414930343628, mean loss: 0.33974175340968227
Epoch: 65, step: 1279, loss: 0.36729127168655396, mean loss: 0.3397420429778794
Epoch: 65, step: 1280, loss: 0.3136717677116394, mean loss: 0.3397417689606285
Epoch: 65, step: 1281, loss: 0.346679151058197, mean loss: 0.33974184187671286
Epoch: 65, step: 1282, loss: 0.3532140851020813, mean loss: 0.33974198347665424
Epoch: 65, step: 1283, loss: 0.3674449920654297, mean loss: 0.33974227464591966
Epoch: 65, step: 1284, loss: 0.3094761371612549, mean loss: 0.3397419565405281
Epoch: 65, step: 1285, loss: 0.3540569543838501, mean loss: 0.33974210699349344
Epoch: 65, step: 1286, loss: 0.34589987993240356, mean loss: 0.33974217171201254
Epoch: 65, step: 1287, loss: 0.30569109320640564, mean loss: 0.3397418138371386
Epoch: 65, step: 1288, loss: 0.34379884600639343, mean loss: 0.3397418564758649
Epoch: 65, step: 1289, loss: 0.28850263357162476, mean loss: 0.3397413179659027
Epoch: 65, step: 1290, loss: 0.3213284909725189, mean loss: 0.33974112445425286
Epoch: 65, step: 1291, loss: 0.3735782504081726, mean loss: 0.339741480065548
Epoch: 65, step: 1292, loss: 0.3316524028778076, mean loss: 0.33974139505427997
Epoch: 65, step: 1293, loss: 0.33476701378822327, mean loss: 0.33974134277711593
Epoch: 65, step: 1294, loss: 0.3090519905090332, mean loss: 0.3397410202575188
Epoch: 65, step: 1295, loss: 0.32658079266548157, mean loss: 0.33974088195591307
Epoch: 65, step: 1296, loss: 0.31041333079338074, mean loss: 0.3397405737541921
Epoch: 65, step: 1297, loss: 0.32349300384521484, mean loss: 0.33974040301111313
Epoch: 65, step: 1298, loss: 0.30629557371139526, mean loss: 0.3397400515485158
Epoch: 65, step: 1299, loss: 0.3492750823497772, mean loss: 0.3397401517485032
Epoch: 65, step: 1300, loss: 0.3473498225212097, mean loss: 0.339740231714779
Epoch: 65, step: 1301, loss: 0.33055001497268677, mean loss: 0.33974013514034024
Epoch: 65, step: 1302, loss: 0.3074803650379181, mean loss: 0.3397397961454567
Epoch: 65, step: 1303, loss: 0.32111597061157227, mean loss: 0.3397396004430321
Epoch: 65, step: 1304, loss: 0.33617785573005676, mean loss: 0.33973956301598734
Epoch: 65, step: 1305, loss: 0.3207499384880066, mean loss: 0.3397393634738764
Epoch: 65, step: 1306, loss: 0.31015464663505554, mean loss: 0.33973905260228393
Epoch: 65, step: 1307, loss: 0.33025479316711426, mean loss: 0.3397389529442115
Epoch: 65, step: 1308, loss: 0.35849854350090027, mean loss: 0.339739150062922
Epoch: 65, step: 1309, loss: 0.318732351064682, mean loss: 0.33973892933371114
Epoch: 65, step: 1310, loss: 0.3781556487083435, mean loss: 0.339739332993643
Epoch: 65, step: 1311, loss: 0.32574087381362915, mean loss: 0.339739185907744
Epoch: 65, step: 1312, loss: 0.2990799844264984, mean loss: 0.33973875869412795
Epoch: 65, step: 1313, loss: 0.3041595220565796, mean loss: 0.33973838486055324
Epoch: 65, step: 1314, loss: 0.32852011919021606, mean loss: 0.3397382669906749
Epoch: 65, step: 1315, loss: 0.3365479111671448, mean loss: 0.3397382334700833
Epoch: 65, step: 1316, loss: 0.3160136342048645, mean loss: 0.33973798420188545
Epoch: 65, step: 1317, loss: 0.3387965261936188, mean loss: 0.3397379743103348
Epoch: 65, step: 1318, loss: 0.307169109582901, mean loss: 0.33973763212492913
Epoch: 65, step: 1319, loss: 0.30529913306236267, mean loss: 0.33973727029997575
Epoch: 65, step: 1320, loss: 0.35508671402931213, mean loss: 0.33973743156581376
Epoch: 65, step: 1321, loss: 0.3264460861682892, mean loss: 0.3397372919244383
Epoch: 65, step: 1322, loss: 0.31202635169029236, mean loss: 0.3397370007911452
Epoch: 65, step: 1323, loss: 0.30470743775367737, mean loss: 0.3397366327716983
Epoch: 65, step: 1324, loss: 0.3221595585346222, mean loss: 0.3397364481094696
Epoch: 65, step: 1325, loss: 0.3557288944721222, mean loss: 0.3397366161220593
Epoch: 65, step: 1326, loss: 0.30789074301719666, mean loss: 0.33973628156089963
Epoch: 65, step: 1327, loss: 0.3383009135723114, mean loss: 0.33973626648160404
Epoch: 65, step: 1328, loss: 0.3024967908859253, mean loss: 0.33973587526543836
Epoch: 65, step: 1329, loss: 0.3339916467666626, mean loss: 0.339735814920565
Epoch: 65, step: 1330, loss: 0.343524307012558, mean loss: 0.3397358547194125
Epoch: 65, step: 1331, loss: 0.3045157194137573, mean loss: 0.33973548472891635
Epoch: 65, step: 1332, loss: 0.36874908208847046, mean loss: 0.3397357895160053
Epoch: 65, step: 1333, loss: 0.2857639491558075, mean loss: 0.3397352225491759
Epoch: 65, step: 1334, loss: 0.3085598647594452, mean loss: 0.3397348950597301
Epoch: 65, step: 1335, loss: 0.34209078550338745, mean loss: 0.3397349198075183
Epoch: 65, step: 1336, loss: 0.3231063187122345, mean loss: 0.3397347451318342
Epoch: 65, step: 1337, loss: 0.3159889876842499, mean loss: 0.3397344956963687
Epoch: 65, step: 1338, loss: 0.3380793631076813, mean loss: 0.33973447831033954
Epoch: 65, step: 1339, loss: 0.416464239358902, mean loss: 0.3397352842952245
Epoch: 65, step: 1340, loss: 0.2954161763191223, mean loss: 0.33973481876326606
Epoch: 65, step: 1341, loss: 0.3761145770549774, mean loss: 0.33973520089555626
Epoch: 65, step: 1342, loss: 0.346233606338501, mean loss: 0.3397352691539666
Epoch: 65, step: 1343, loss: 0.3089565634727478, mean loss: 0.3397349458618184
Epoch: 65, step: 1344, loss: 0.34176307916641235, mean loss: 0.3397349671646208
Epoch: 65, step: 1345, loss: 0.34621042013168335, mean loss: 0.3397350351797981
Epoch: 65, step: 1346, loss: 0.33307966589927673, mean loss: 0.33973496527559693
Epoch: 65, step: 1347, loss: 0.3448154926300049, mean loss: 0.33973501863799666
Epoch: 65, step: 1348, loss: 0.34396058320999146, mean loss: 0.33973506301998335
Epoch: 65, step: 1349, loss: 0.31881043314933777, mean loss: 0.3397348432465365
Epoch: 65, step: 1350, loss: 0.32254618406295776, mean loss: 0.3397346627142537
Epoch: 65, step: 1351, loss: 0.300554484128952, mean loss: 0.33973425120962625
Epoch: 65, step: 1352, loss: 0.3447260558605194, mean loss: 0.3397343036373898
Epoch: 65, step: 1353, loss: 0.2877822518348694, mean loss: 0.33973375800280037
Epoch: 65, step: 1354, loss: 0.30908480286598206, mean loss: 0.3397334361107126
Epoch: 65, step: 1355, loss: 0.30023401975631714, mean loss: 0.33973302127059796
Epoch: 65, step: 1356, loss: 0.3034571707248688, mean loss: 0.33973264028977995
Epoch: 65, step: 1357, loss: 0.31328678131103516, mean loss: 0.3397323625496575
Epoch: 65, step: 1358, loss: 0.33642691373825073, mean loss: 0.3397323278354848
Epoch: 65, step: 1359, loss: 0.3645898997783661, mean loss: 0.33973258888959046
Epoch: 65, step: 1360, loss: 0.35482096672058105, mean loss: 0.3397327473460006
Epoch: 65, step: 1361, loss: 0.33934348821640015, mean loss: 0.3397327432580889
Epoch: 65, step: 1362, loss: 0.33040404319763184, mean loss: 0.3397326452912105
Epoch: 65, step: 1363, loss: 0.31801876425743103, mean loss: 0.3397324172617113
Epoch: 65, step: 1364, loss: 0.3187136650085449, mean loss: 0.3397321965344626
Epoch: 65, step: 1365, loss: 0.3250059187412262, mean loss: 0.3397320418889058
Epoch: 65, step: 1366, loss: 0.30443820357322693, mean loss: 0.3397316712604253
Epoch: 65, step: 1367, loss: 0.3642745316028595, mean loss: 0.339731928987778
Epoch: 65, step: 1368, loss: 0.3105762302875519, mean loss: 0.33973162282370295
Epoch: 65, step: 1369, loss: 0.34801241755485535, mean loss: 0.33973170977943884
Epoch: 65, step: 1370, loss: 0.3103775680065155, mean loss: 0.33973140153798626
Epoch: 65, step: 1371, loss: 0.3327106237411499, mean loss: 0.3397313278151011
Epoch: 65, step: 1372, loss: 0.311890184879303, mean loss: 0.3397310354674597
Epoch: 65, step: 1373, loss: 0.3254169523715973, mean loss: 0.3397308851631241
Epoch: 65, step: 1374, loss: 0.3260977864265442, mean loss: 0.33973074201093495
Epoch: 65, step: 1375, loss: 0.3303464949131012, mean loss: 0.3397306434741726
Epoch: 65, step: 1376, loss: 0.30152493715286255, mean loss: 0.3397302423096428
Epoch: 65, step: 1377, loss: 0.3867494761943817, mean loss: 0.3397307360120923
Epoch: 65, step: 1378, loss: 0.3219643235206604, mean loss: 0.3397305494665333
Epoch: 65, step: 1379, loss: 0.3513566255569458, mean loss: 0.3397306715378908
Epoch: 65, step: 1380, loss: 0.37189626693725586, mean loss: 0.3397310092663418
Epoch: 65, step: 1381, loss: 0.36147573590278625, mean loss: 0.3397312375766108
Epoch: 65, step: 1382, loss: 0.40481650829315186, mean loss: 0.33973192093676025
Epoch: 65, step: 1383, loss: 0.3129471242427826, mean loss: 0.3397316397138308
Epoch: 65, step: 1384, loss: 0.3182998597621918, mean loss: 0.33973141469645507
Epoch: 65, step: 1385, loss: 0.2949238717556, mean loss: 0.33973094425630074
Epoch: 65, step: 1386, loss: 0.32030487060546875, mean loss: 0.33973074030159717
Epoch: 65, step: 1387, loss: 0.3440866470336914, mean loss: 0.3397307860338617
Epoch: 65, step: 1388, loss: 0.31285563111305237, mean loss: 0.339730503877042
Epoch: 65, step: 1389, loss: 0.2971685528755188, mean loss: 0.33973005703241205
Epoch: 65, step: 1390, loss: 0.32922565937042236, mean loss: 0.3397299467511797
Epoch: 65, step: 1391, loss: 0.339264452457428, mean loss: 0.3397299418642031
Epoch: 65, step: 1392, loss: 0.470579594373703, mean loss: 0.3397313155705694
Epoch: 65, step: 1393, loss: 0.34672248363494873, mean loss: 0.3397313889655771
Epoch: 65, step: 1394, loss: 0.3344428241252899, mean loss: 0.33973133344550105
Epoch: 65, step: 1395, loss: 0.31923288106918335, mean loss: 0.3397311182522074
Epoch: 65, step: 1396, loss: 0.33057183027267456, mean loss: 0.3397310220987701
Epoch: 65, step: 1397, loss: 0.33812689781188965, mean loss: 0.3397310052589846
Epoch: 65, step: 1398, loss: 0.3431144058704376, mean loss: 0.3397310407768948
Epoch: 65, step: 1399, loss: 0.33950722217559814, mean loss: 0.33973103842733987
Epoch: 65, step: 1400, loss: 0.31302276253700256, mean loss: 0.3397307580578719
Epoch: 65, step: 1401, loss: 0.34947076439857483, mean loss: 0.3397308603022751
Epoch: 65, step: 1402, loss: 0.34928998351097107, mean loss: 0.33973096064682873
Epoch: 65, step: 1403, loss: 0.34459376335144043, mean loss: 0.33973101169237274
Epoch: 65, step: 1404, loss: 0.32035818696022034, mean loss: 0.33973080833516145
Epoch: 65, step: 1405, loss: 0.3066003918647766, mean loss: 0.33973046056768436
Epoch: 65, step: 1406, loss: 0.35068538784980774, mean loss: 0.3397305755595208
Epoch: 65, step: 1407, loss: 0.325504869222641, mean loss: 0.3397304262364917
Epoch: 65, step: 1408, loss: 0.35316020250320435, mean loss: 0.3397305672033987
Epoch: 65, step: 1409, loss: 0.42038848996162415, mean loss: 0.33973141382796845
Epoch: 65, step: 1410, loss: 0.3109409213066101, mean loss: 0.3397311116322056
Epoch: 65, step: 1411, loss: 0.2696353495121002, mean loss: 0.33973037588862803
Epoch: 65, step: 1412, loss: 0.36936262249946594, mean loss: 0.33973068691322694
Epoch: 65, step: 1413, loss: 0.31264933943748474, mean loss: 0.33973040266623955
Epoch: 65, step: 1414, loss: 0.4225502908229828, mean loss: 0.3397312719382223
Epoch: 65, step: 1415, loss: 0.32570213079452515, mean loss: 0.3397311246908447
Epoch: 65, step: 1416, loss: 0.34239310026168823, mean loss: 0.339731152630175
Epoch: 65, step: 1417, loss: 0.33670416474342346, mean loss: 0.33973112086011387
Epoch: 65, step: 1418, loss: 0.30086585879325867, mean loss: 0.3397307129500595
Epoch: 65, step: 1419, loss: 0.32323041558265686, mean loss: 0.339730539773135
Epoch: 65, step: 1420, loss: 0.373602956533432, mean loss: 0.33973089527335815
Epoch: 65, step: 1421, loss: 0.3476324677467346, mean loss: 0.33973097820163917
Epoch: 65, step: 1422, loss: 0.2880745828151703, mean loss: 0.339730436065105
Epoch: 65, step: 1423, loss: 0.31123828887939453, mean loss: 0.33973013704168886
Epoch: 65, step: 1424, loss: 0.35164740681648254, mean loss: 0.33973026211142465
Epoch: 65, step: 1425, loss: 0.3341701328754425, mean loss: 0.33973020375941876
Epoch: 65, step: 1426, loss: 0.35404515266418457, mean loss: 0.33973035398923923
Epoch: 65, step: 1427, loss: 0.32978111505508423, mean loss: 0.3397302495769425
Epoch: 65, step: 1428, loss: 0.3293265998363495, mean loss: 0.3397301403969769
Epoch: 65, step: 1429, loss: 0.32824787497520447, mean loss: 0.3397300198988615
Epoch: 65, step: 1430, loss: 0.3383629024028778, mean loss: 0.3397300055520974
Epoch: 65, step: 1431, loss: 0.35444891452789307, mean loss: 0.33973016001321665
Epoch: 65, step: 1432, loss: 0.3466782569885254, mean loss: 0.3397302329262006
Epoch: 65, step: 1433, loss: 0.331765353679657, mean loss: 0.33973014934403123
Epoch: 65, step: 1434, loss: 0.3237595558166504, mean loss: 0.3397299817529349
Epoch: 65, step: 1435, loss: 0.3513534367084503, mean loss: 0.33973010372505286
Epoch: 65, step: 1436, loss: 0.3557226061820984, mean loss: 0.33973027154253355
Epoch: 65, step: 1437, loss: 0.31742677092552185, mean loss: 0.33973003750298797
Epoch: 65, step: 1438, loss: 0.3105626106262207, mean loss: 0.3397297314407326
Epoch: 65, step: 1439, loss: 0.33018964529037476, mean loss: 0.3397296313348968
Epoch: 65, step: 1440, loss: 0.3192368149757385, mean loss: 0.33972941630235404
Epoch: 65, step: 1441, loss: 0.34804683923721313, mean loss: 0.33972950357673376
Epoch: 65, step: 1442, loss: 0.38896337151527405, mean loss: 0.3397300201802818
Epoch: 65, step: 1443, loss: 0.3292580544948578, mean loss: 0.3397299103006788
Valid: 65, mean loss: 0.18459579100211462
Epoch: 66, step: 0, loss: 0.37551358342170715, mean loss: 0.33973028576548253
Epoch: 66, step: 1, loss: 0.3750568628311157, mean loss: 0.33973065643025774
Epoch: 66, step: 2, loss: 0.35271114110946655, mean loss: 0.33973079262680866
Epoch: 66, step: 3, loss: 0.3518388867378235, mean loss: 0.3397309196685482
Epoch: 66, step: 4, loss: 0.34786486625671387, mean loss: 0.3397310050114496
Epoch: 66, step: 5, loss: 0.36094921827316284, mean loss: 0.33973122763460833
Epoch: 66, step: 6, loss: 0.3210426867008209, mean loss: 0.33973103155502743
Epoch: 66, step: 7, loss: 0.318829745054245, mean loss: 0.3397308122616908
Epoch: 66, step: 8, loss: 0.34815895557403564, mean loss: 0.33973090068764855
Epoch: 66, step: 9, loss: 0.31923964619636536, mean loss: 0.3397306857008209
Epoch: 66, step: 10, loss: 0.36891332268714905, mean loss: 0.3397309918712766
Epoch: 66, step: 11, loss: 0.34207186102867126, mean loss: 0.33973101643031345
Epoch: 66, step: 12, loss: 0.3189827799797058, mean loss: 0.3397307987541754
Epoch: 66, step: 13, loss: 0.362660676240921, mean loss: 0.3397310393160576
Epoch: 66, step: 14, loss: 0.32885703444480896, mean loss: 0.3397309252359175
Epoch: 66, step: 15, loss: 0.3569297790527344, mean loss: 0.3397311056687104
Epoch: 66, step: 16, loss: 0.31652069091796875, mean loss: 0.33973086217132
Epoch: 66, step: 17, loss: 0.3547218143939972, mean loss: 0.33973101943776657
Epoch: 66, step: 18, loss: 0.3423655927181244, mean loss: 0.3397310470761464
Epoch: 66, step: 19, loss: 0.3518252372741699, mean loss: 0.3397311739507026
Epoch: 66, step: 20, loss: 0.3532088100910187, mean loss: 0.33973131533686723
Epoch: 66, step: 21, loss: 0.3125517964363098, mean loss: 0.33973103021508616
Epoch: 66, step: 22, loss: 0.3290378749370575, mean loss: 0.3397309180416696
Epoch: 66, step: 23, loss: 0.3279407322406769, mean loss: 0.3397307943614728
Epoch: 66, step: 24, loss: 0.3356077969074249, mean loss: 0.3397307511112818
Epoch: 66, step: 25, loss: 0.3571145236492157, mean loss: 0.3397309334649222
Epoch: 66, step: 26, loss: 0.3373483419418335, mean loss: 0.33973090847209175
Epoch: 66, step: 27, loss: 0.33565554022789, mean loss: 0.3397308657228759
Epoch: 66, step: 28, loss: 0.3406543433666229, mean loss: 0.33973087540973823
Epoch: 66, step: 29, loss: 0.32342728972435, mean loss: 0.3397307043943011
Epoch: 66, step: 30, loss: 0.31697791814804077, mean loss: 0.3397304657328835
Epoch: 66, step: 31, loss: 0.3574329614639282, mean loss: 0.3397306514182042
Epoch: 66, step: 32, loss: 0.3835383951663971, mean loss: 0.3397311109223185
Epoch: 66, step: 33, loss: 0.3591459393501282, mean loss: 0.3397313145643965
Epoch: 66, step: 34, loss: 0.3298761546611786, mean loss: 0.33973121119473765
Epoch: 66, step: 35, loss: 0.30898913741111755, mean loss: 0.33973088874798096
Epoch: 66, step: 36, loss: 0.328685462474823, mean loss: 0.339730772896183
Epoch: 66, step: 37, loss: 0.321353554725647, mean loss: 0.33973058014568297
Epoch: 66, step: 38, loss: 0.3483206033706665, mean loss: 0.3397306702416861
Epoch: 66, step: 39, loss: 0.3346136510372162, mean loss: 0.3397306165726644
Epoch: 66, step: 40, loss: 0.35188278555870056, mean loss: 0.33973074402737086
Epoch: 66, step: 41, loss: 0.35875123739242554, mean loss: 0.33973094351653
Epoch: 66, step: 42, loss: 0.35116928815841675, mean loss: 0.33973106348196824
Epoch: 66, step: 43, loss: 0.3463587462902069, mean loss: 0.3397311329924227
Epoch: 66, step: 44, loss: 0.35503119230270386, mean loss: 0.3397312934561854
Epoch: 66, step: 45, loss: 0.32417893409729004, mean loss: 0.3397311303480642
Epoch: 66, step: 46, loss: 0.34838002920150757, mean loss: 0.3397312210539703
Epoch: 66, step: 47, loss: 0.33926427364349365, mean loss: 0.3397312161568794
Epoch: 66, step: 48, loss: 0.355501651763916, mean loss: 0.3397313815469102
Epoch: 66, step: 49, loss: 0.34286755323410034, mean loss: 0.33973141443668603
Epoch: 66, step: 50, loss: 0.35211843252182007, mean loss: 0.33973154434091846
Epoch: 66, step: 51, loss: 0.3095681965351105, mean loss: 0.33973122801737504
Epoch: 66, step: 52, loss: 0.3790225088596344, mean loss: 0.33973164006138695
Epoch: 66, step: 53, loss: 0.3131517171859741, mean loss: 0.33973136132312826
Epoch: 66, step: 54, loss: 0.32867226004600525, mean loss: 0.339731245349793
Epoch: 66, step: 55, loss: 0.31008413434028625, mean loss: 0.3397309344530752
Epoch: 66, step: 56, loss: 0.3070569932460785, mean loss: 0.33973059181886195
Epoch: 66, step: 57, loss: 0.29090067744255066, mean loss: 0.33973007977093533
Epoch: 66, step: 58, loss: 0.3288908302783966, mean loss: 0.33972996610788475
Epoch: 66, step: 59, loss: 0.3095557391643524, mean loss: 0.3397296496967973
Epoch: 66, step: 60, loss: 0.30988791584968567, mean loss: 0.33972933677555944
Epoch: 66, step: 61, loss: 0.33748409152030945, mean loss: 0.33972931323210315
Epoch: 66, step: 62, loss: 0.29046884179115295, mean loss: 0.33972879669628425
Epoch: 66, step: 63, loss: 0.3400695025920868, mean loss: 0.33972880026882324
Epoch: 66, step: 64, loss: 0.30764684081077576, mean loss: 0.33972846387062827
Epoch: 66, step: 65, loss: 0.3480162024497986, mean loss: 0.3397285507715256
Epoch: 66, step: 66, loss: 0.3069394826889038, mean loss: 0.3397282069660912
Epoch: 66, step: 67, loss: 0.2979791760444641, mean loss: 0.3397277692167421
Epoch: 66, step: 68, loss: 0.31529101729393005, mean loss: 0.33972751299378673
Epoch: 66, step: 69, loss: 0.3361293375492096, mean loss: 0.339727475266781
Epoch: 66, step: 70, loss: 0.3107558488845825, mean loss: 0.3397271715013668
Epoch: 66, step: 71, loss: 0.3098134696483612, mean loss: 0.33972685786164764
Epoch: 66, step: 72, loss: 0.32143938541412354, mean loss: 0.339726666122838
Epoch: 66, step: 73, loss: 0.3527645170688629, mean loss: 0.33972680281946555
Epoch: 66, step: 74, loss: 0.2850247025489807, mean loss: 0.33972622929594076
Epoch: 66, step: 75, loss: 0.3664773404598236, mean loss: 0.33972650976470953
Epoch: 66, step: 76, loss: 0.33080700039863586, mean loss: 0.33972641625017974
Epoch: 66, step: 77, loss: 0.32720592617988586, mean loss: 0.33972628498337815
Epoch: 66, step: 78, loss: 0.3774721920490265, mean loss: 0.33972668071329926
Epoch: 66, step: 79, loss: 0.3541228175163269, mean loss: 0.3397268316415137
Epoch: 66, step: 80, loss: 0.29980942606925964, mean loss: 0.33972641315427177
Epoch: 66, step: 81, loss: 0.3165014386177063, mean loss: 0.33972616967016994
Epoch: 66, step: 82, loss: 0.3359035849571228, mean loss: 0.33972612959568693
Epoch: 66, step: 83, loss: 0.353211909532547, mean loss: 0.33972627097384706
Epoch: 66, step: 84, loss: 0.29563456773757935, mean loss: 0.3397258087433673
Epoch: 66, step: 85, loss: 0.35505521297454834, mean loss: 0.3397259694457913
Epoch: 66, step: 86, loss: 0.3276726007461548, mean loss: 0.33972584308828696
Epoch: 66, step: 87, loss: 0.3163183033466339, mean loss: 0.339725597705658
Epoch: 66, step: 88, loss: 0.3405345380306244, mean loss: 0.3397256061857386
Epoch: 66, step: 89, loss: 0.3806708753108978, mean loss: 0.3397260354084269
Epoch: 66, step: 90, loss: 0.3126847445964813, mean loss: 0.3397257519418845
Epoch: 66, step: 91, loss: 0.306936651468277, mean loss: 0.3397254082262101
Epoch: 66, step: 92, loss: 0.3589877784252167, mean loss: 0.33972561014419705
Epoch: 66, step: 93, loss: 0.32427430152893066, mean loss: 0.33972544817739886
Epoch: 66, step: 94, loss: 0.3370645344257355, mean loss: 0.3397254202849288
Epoch: 66, step: 95, loss: 0.3247312009334564, mean loss: 0.3397252631128182
Epoch: 66, step: 96, loss: 0.3946323096752167, mean loss: 0.33972583865234673
Epoch: 66, step: 97, loss: 0.34240221977233887, mean loss: 0.339725866706068
Epoch: 66, step: 98, loss: 0.411220908164978, mean loss: 0.33972661610641663
Epoch: 66, step: 99, loss: 0.3405512571334839, mean loss: 0.33972662475009013
Epoch: 66, step: 100, loss: 0.31470075249671936, mean loss: 0.3397263624381332
Epoch: 66, step: 101, loss: 0.3187733292579651, mean loss: 0.33972614281847424
Epoch: 66, step: 102, loss: 0.3178092837333679, mean loss: 0.3397259130988616
Epoch: 66, step: 103, loss: 0.33430710434913635, mean loss: 0.3397258563026941
Epoch: 66, step: 104, loss: 0.33418598771095276, mean loss: 0.3397257982382705
Epoch: 66, step: 105, loss: 0.3500056564807892, mean loss: 0.33972590598230407
Epoch: 66, step: 106, loss: 0.33078959584236145, mean loss: 0.3397258123210895
Epoch: 66, step: 107, loss: 0.3536268174648285, mean loss: 0.33972595801560534
Epoch: 66, step: 108, loss: 0.29388684034347534, mean loss: 0.3397254775871766
Epoch: 66, step: 109, loss: 0.32979047298431396, mean loss: 0.33972537346194753
Epoch: 66, step: 110, loss: 0.31511789560317993, mean loss: 0.33972511556247825
Epoch: 66, step: 111, loss: 0.31517893075942993, mean loss: 0.339724858308089
Epoch: 66, step: 112, loss: 0.3822503685951233, mean loss: 0.33972530398873596
Epoch: 66, step: 113, loss: 0.30463719367980957, mean loss: 0.33972493625822064
Epoch: 66, step: 114, loss: 0.40575167536735535, mean loss: 0.3397256282245912
Epoch: 66, step: 115, loss: 0.3024509847164154, mean loss: 0.3397252375869522
Epoch: 66, step: 116, loss: 0.3339115381240845, mean loss: 0.33972517666011787
Epoch: 66, step: 117, loss: 0.2974066138267517, mean loss: 0.33972473317158447
Epoch: 66, step: 118, loss: 0.3151889443397522, mean loss: 0.339724476045013
Epoch: 66, step: 119, loss: 0.34535855054855347, mean loss: 0.33972453508754424
Epoch: 66, step: 120, loss: 0.3255404829978943, mean loss: 0.33972438644670494
Epoch: 66, step: 121, loss: 0.31262797117233276, mean loss: 0.3397241024945821
Epoch: 66, step: 122, loss: 0.3435295522212982, mean loss: 0.339724142372706
Epoch: 66, step: 123, loss: 0.33042073249816895, mean loss: 0.33972404488130015
Epoch: 66, step: 124, loss: 0.32923078536987305, mean loss: 0.3397239349224877
Epoch: 66, step: 125, loss: 0.3667929768562317, mean loss: 0.33972421857586643
Epoch: 66, step: 126, loss: 0.31669124960899353, mean loss: 0.3397239772185615
Epoch: 66, step: 127, loss: 0.30153754353523254, mean loss: 0.3397235770756987
Epoch: 66, step: 128, loss: 0.3441559970378876, mean loss: 0.3397236235210579
Epoch: 66, step: 129, loss: 0.33268675208091736, mean loss: 0.33972354978558167
Epoch: 66, step: 130, loss: 0.3636776804924011, mean loss: 0.33972380078501274
Epoch: 66, step: 131, loss: 0.30846020579338074, mean loss: 0.3397234731979912
Epoch: 66, step: 132, loss: 0.3722628951072693, mean loss: 0.33972381414984326
Epoch: 66, step: 133, loss: 0.35695216059684753, mean loss: 0.3397239946685721
Epoch: 66, step: 134, loss: 0.36139267683029175, mean loss: 0.33972422171078925
Epoch: 66, step: 135, loss: 0.3321004807949066, mean loss: 0.3397241418308551
Epoch: 66, step: 136, loss: 0.3480868935585022, mean loss: 0.3397242294530691
Epoch: 66, step: 137, loss: 0.3309391736984253, mean loss: 0.3397241374070542
Epoch: 66, step: 138, loss: 0.3098708987236023, mean loss: 0.3397238246210072
Epoch: 66, step: 139, loss: 0.32715466618537903, mean loss: 0.3397236929295605
Epoch: 66, step: 140, loss: 0.3297126889228821, mean loss: 0.3397235880418869
Epoch: 66, step: 141, loss: 0.3212448060512543, mean loss: 0.3397233944373148
Epoch: 66, step: 142, loss: 0.3133527636528015, mean loss: 0.339723118151724
Epoch: 66, step: 143, loss: 0.33582186698913574, mean loss: 0.339723077278671
Epoch: 66, step: 144, loss: 0.3180449604988098, mean loss: 0.33972285016139603
Epoch: 66, step: 145, loss: 0.2987011671066284, mean loss: 0.33972242038996536
Epoch: 66, step: 146, loss: 0.31756195425987244, mean loss: 0.33972218822407785
Epoch: 66, step: 147, loss: 0.30150043964385986, mean loss: 0.3397217877950813
Epoch: 66, step: 148, loss: 0.34469369053840637, mean loss: 0.33972183988252475
Epoch: 66, step: 149, loss: 0.365882933139801, mean loss: 0.33972211395268687
Epoch: 66, step: 150, loss: 0.35548171401023865, mean loss: 0.3397222790524727
Epoch: 66, step: 151, loss: 0.32571542263031006, mean loss: 0.33972213231621284
Epoch: 66, step: 152, loss: 0.36176297068595886, mean loss: 0.3397223632142965
Epoch: 66, step: 153, loss: 0.35148629546165466, mean loss: 0.3397224864510315
Epoch: 66, step: 154, loss: 0.3587453067302704, mean loss: 0.3397226857284205
Epoch: 66, step: 155, loss: 0.33191609382629395, mean loss: 0.33972260394974985
Epoch: 66, step: 156, loss: 0.32615748047828674, mean loss: 0.33972246184854127
Epoch: 66, step: 157, loss: 0.3783029317855835, mean loss: 0.3397228659933312
Epoch: 66, step: 158, loss: 0.35390570759773254, mean loss: 0.33972301456232235
Epoch: 66, step: 159, loss: 0.36426517367362976, mean loss: 0.33972327164519245
Epoch: 66, step: 160, loss: 0.36417466402053833, mean loss: 0.3397235277745841
Epoch: 66, step: 161, loss: 0.29939085245132446, mean loss: 0.33972310529249283
Epoch: 66, step: 162, loss: 0.31296274065971375, mean loss: 0.33972282498238954
Epoch: 66, step: 163, loss: 0.32482075691223145, mean loss: 0.33972266888748787
Epoch: 66, step: 164, loss: 0.3475712835788727, mean loss: 0.3397227510986212
Epoch: 66, step: 165, loss: 0.3214404284954071, mean loss: 0.3397225596005317
Epoch: 66, step: 166, loss: 0.3190523684024811, mean loss: 0.3397223430929933
Epoch: 66, step: 167, loss: 0.35380318760871887, mean loss: 0.33972249057963355
Epoch: 66, step: 168, loss: 0.30076897144317627, mean loss: 0.3397220825740284
Epoch: 66, step: 169, loss: 0.3602759838104248, mean loss: 0.33972229785673613
Epoch: 66, step: 170, loss: 0.3161076307296753, mean loss: 0.33972205051798643
Epoch: 66, step: 171, loss: 0.34526485204696655, mean loss: 0.3397221085723826
Epoch: 66, step: 172, loss: 0.3049534559249878, mean loss: 0.33972174441501857
Epoch: 66, step: 173, loss: 0.3457784354686737, mean loss: 0.33972180785048073
Epoch: 66, step: 174, loss: 0.3116835355758667, mean loss: 0.3397215141914324
Epoch: 66, step: 175, loss: 0.31956690549850464, mean loss: 0.33972130310420273
Epoch: 66, step: 176, loss: 0.33052122592926025, mean loss: 0.33972120674914597
Epoch: 66, step: 177, loss: 0.31201016902923584, mean loss: 0.3397209165265101
Epoch: 66, step: 178, loss: 0.3452054262161255, mean loss: 0.3397209739661558
Epoch: 66, step: 179, loss: 0.32480165362358093, mean loss: 0.33972081771672824
Epoch: 66, step: 180, loss: 0.35666623711586, mean loss: 0.3397209951835492
Epoch: 66, step: 181, loss: 0.3213418424129486, mean loss: 0.33972080270347077
Epoch: 66, step: 182, loss: 0.33703935146331787, mean loss: 0.33972077462162464
Epoch: 66, step: 183, loss: 0.3198813498020172, mean loss: 0.3397205668528493
Epoch: 66, step: 184, loss: 0.32291001081466675, mean loss: 0.33972039080580685
Epoch: 66, step: 185, loss: 0.32693228125572205, mean loss: 0.33972025688487745
Epoch: 66, step: 186, loss: 0.33163872361183167, mean loss: 0.33972017225351664
Epoch: 66, step: 187, loss: 0.30829834938049316, mean loss: 0.3397198432016288
Epoch: 66, step: 188, loss: 0.35717400908470154, mean loss: 0.33972002598116113
Epoch: 66, step: 189, loss: 0.32167598605155945, mean loss: 0.33971983702646313
Epoch: 66, step: 190, loss: 0.3534764051437378, mean loss: 0.339719981081839
Epoch: 66, step: 191, loss: 0.33076056838035583, mean loss: 0.33971988726206953
Epoch: 66, step: 192, loss: 0.34849998354911804, mean loss: 0.33971997920313873
Epoch: 66, step: 193, loss: 0.3583194613456726, mean loss: 0.33972017396619286
Epoch: 66, step: 194, loss: 0.356496661901474, mean loss: 0.3397203496380631
Epoch: 66, step: 195, loss: 0.35561344027519226, mean loss: 0.3397205160578603
Epoch: 66, step: 196, loss: 0.32033848762512207, mean loss: 0.3397203131068081
Epoch: 66, step: 197, loss: 0.34470465779304504, mean loss: 0.3397203652978061
Epoch: 66, step: 198, loss: 0.34059423208236694, mean loss: 0.33972037444795616
Epoch: 66, step: 199, loss: 0.3106915056705475, mean loss: 0.3397200704934749
Epoch: 66, step: 200, loss: 0.31895917654037476, mean loss: 0.33971985311329633
Epoch: 66, step: 201, loss: 0.347789466381073, mean loss: 0.3397199376065561
Epoch: 66, step: 202, loss: 0.36381271481513977, mean loss: 0.3397201898684553
Epoch: 66, step: 203, loss: 0.3710554838180542, mean loss: 0.3397205179592325
Epoch: 66, step: 204, loss: 0.3674200773239136, mean loss: 0.3397208079796428
Epoch: 66, step: 205, loss: 0.3239867091178894, mean loss: 0.33972064324193096
Epoch: 66, step: 206, loss: 0.33822527527809143, mean loss: 0.33972062758543103
Epoch: 66, step: 207, loss: 0.36034372448921204, mean loss: 0.3397208435069582
Epoch: 66, step: 208, loss: 0.3406102657318115, mean loss: 0.3397208528190123
Epoch: 66, step: 209, loss: 0.3680810332298279, mean loss: 0.3397211497407244
Epoch: 66, step: 210, loss: 0.3001238703727722, mean loss: 0.33972073517464196
Epoch: 66, step: 211, loss: 0.3707566559314728, mean loss: 0.33972106010366704
Epoch: 66, step: 212, loss: 0.31300535798072815, mean loss: 0.33972078040788384
Epoch: 66, step: 213, loss: 0.33548545837402344, mean loss: 0.3397207360673194
Epoch: 66, step: 214, loss: 0.3206160068511963, mean loss: 0.33972053605759134
Epoch: 66, step: 215, loss: 0.29796096682548523, mean loss: 0.3397200988761714
Epoch: 66, step: 216, loss: 0.36413541436195374, mean loss: 0.3397203544777196
Epoch: 66, step: 217, loss: 0.3302927017211914, mean loss: 0.33972025578157883
Epoch: 66, step: 218, loss: 0.33081546425819397, mean loss: 0.33972016256013976
Epoch: 66, step: 219, loss: 0.3325670659542084, mean loss: 0.3397200876774233
Epoch: 66, step: 220, loss: 0.35359829664230347, mean loss: 0.3397202329609508
Epoch: 66, step: 221, loss: 0.3358944356441498, mean loss: 0.3397201929111495
Epoch: 66, step: 222, loss: 0.31667354702949524, mean loss: 0.33971995165322366
Epoch: 66, step: 223, loss: 0.29854854941368103, mean loss: 0.339719520665427
Epoch: 66, step: 224, loss: 0.2902904152870178, mean loss: 0.3397190032402956
Epoch: 66, step: 225, loss: 0.4002957344055176, mean loss: 0.33971963735241917
Epoch: 66, step: 226, loss: 0.33939287066459656, mean loss: 0.3397196339318888
Epoch: 66, step: 227, loss: 0.33632612228393555, mean loss: 0.33971959840963817
Epoch: 66, step: 228, loss: 0.31407782435417175, mean loss: 0.33971933000213445
Epoch: 66, step: 229, loss: 0.3568883240222931, mean loss: 0.33971950971819387
Epoch: 66, step: 230, loss: 0.31464219093322754, mean loss: 0.3397192472246702
Epoch: 66, step: 231, loss: 0.3366517722606659, mean loss: 0.33971921511661707
Epoch: 66, step: 232, loss: 0.4022989571094513, mean loss: 0.3397198701480917
Epoch: 66, step: 233, loss: 0.33239322900772095, mean loss: 0.339719793459851
Epoch: 66, step: 234, loss: 0.30821114778518677, mean loss: 0.33971946366107064
Epoch: 66, step: 235, loss: 0.33626481890678406, mean loss: 0.3397194275019252
Epoch: 66, step: 236, loss: 0.33276066184043884, mean loss: 0.3397193546665387
Epoch: 66, step: 237, loss: 0.3017606735229492, mean loss: 0.33971895736816576
Epoch: 66, step: 238, loss: 0.28644371032714844, mean loss: 0.339718399763244
Epoch: 66, step: 239, loss: 0.3152361810207367, mean loss: 0.33971814352299085
Epoch: 66, step: 240, loss: 0.3187011480331421, mean loss: 0.33971792355339026
Epoch: 66, step: 241, loss: 0.29489484429359436, mean loss: 0.33971745442774126
Epoch: 66, step: 242, loss: 0.3522149920463562, mean loss: 0.3397175852276368
Epoch: 66, step: 243, loss: 0.30140969157218933, mean loss: 0.339717184299374
Epoch: 66, step: 244, loss: 0.35406893491744995, mean loss: 0.33971733450241764
Epoch: 66, step: 245, loss: 0.29772520065307617, mean loss: 0.3397168950243031
Epoch: 66, step: 246, loss: 0.3462599217891693, mean loss: 0.3397169635011036
Epoch: 66, step: 247, loss: 0.33060601353645325, mean loss: 0.33971686815040486
Epoch: 66, step: 248, loss: 0.3443097472190857, mean loss: 0.33971691621670386
Epoch: 66, step: 249, loss: 0.29124271869659424, mean loss: 0.33971640892033195
Epoch: 66, step: 250, loss: 0.3355995714664459, mean loss: 0.3397163658368988
Epoch: 66, step: 251, loss: 0.36145198345184326, mean loss: 0.33971659330160653
Epoch: 66, step: 252, loss: 0.3354407846927643, mean loss: 0.33971654855544864
Epoch: 66, step: 253, loss: 0.3337356746196747, mean loss: 0.33971648596650855
Epoch: 66, step: 254, loss: 0.3246504068374634, mean loss: 0.3397163283039218
Epoch: 66, step: 255, loss: 0.2948440909385681, mean loss: 0.3397158587325806
Epoch: 66, step: 256, loss: 0.3210209906101227, mean loss: 0.33971566309975837
Epoch: 66, step: 257, loss: 0.33155104517936707, mean loss: 0.33971557766184457
Epoch: 66, step: 258, loss: 0.3370864987373352, mean loss: 0.33971555015037125
Epoch: 66, step: 259, loss: 0.32026365399360657, mean loss: 0.3397153466020041
Epoch: 66, step: 260, loss: 0.3026052415370941, mean loss: 0.33971495827882026
Epoch: 66, step: 261, loss: 0.3070072531700134, mean loss: 0.33971461602629205
Epoch: 66, step: 262, loss: 0.33738940954208374, mean loss: 0.3397145916956498
Epoch: 66, step: 263, loss: 0.31366515159606934, mean loss: 0.3397143191207283
Epoch: 66, step: 264, loss: 0.32482919096946716, mean loss: 0.3397141633680454
Epoch: 66, step: 265, loss: 0.3398211598396301, mean loss: 0.33971416448760666
Epoch: 66, step: 266, loss: 0.3262842893600464, mean loss: 0.3397140239651142
Epoch: 66, step: 267, loss: 0.33759400248527527, mean loss: 0.3397140017826603
Epoch: 66, step: 268, loss: 0.3185230493545532, mean loss: 0.33971378005735686
Epoch: 66, step: 269, loss: 0.32144924998283386, mean loss: 0.33971358895381326
Epoch: 66, step: 270, loss: 0.32040542364120483, mean loss: 0.33971338693272707
Epoch: 66, step: 271, loss: 0.34388455748558044, mean loss: 0.33971343057517445
Epoch: 66, step: 272, loss: 0.3565237820148468, mean loss: 0.3397136064579856
Epoch: 66, step: 273, loss: 0.30301007628440857, mean loss: 0.33971322244147373
Epoch: 66, step: 274, loss: 0.35159480571746826, mean loss: 0.3397133467531246
Epoch: 66, step: 275, loss: 0.3269582688808441, mean loss: 0.3397132133038897
Epoch: 66, step: 276, loss: 0.3291845917701721, mean loss: 0.3397131031499728
Epoch: 66, step: 277, loss: 0.32193732261657715, mean loss: 0.3397129171758298
Epoch: 66, step: 278, loss: 0.34256982803344727, mean loss: 0.33971294706514965
Epoch: 66, step: 279, loss: 0.33542516827583313, mean loss: 0.3397129022063993
Epoch: 66, step: 280, loss: 0.3690674602985382, mean loss: 0.33971320931063215
Epoch: 66, step: 281, loss: 0.3480297327041626, mean loss: 0.3397132963162961
Epoch: 66, step: 282, loss: 0.3176755905151367, mean loss: 0.3397130657650098
Epoch: 66, step: 283, loss: 0.368129163980484, mean loss: 0.33971336304184596
Epoch: 66, step: 284, loss: 0.31028902530670166, mean loss: 0.33971305522046763
Epoch: 66, step: 285, loss: 0.33858340978622437, mean loss: 0.33971304340285663
Epoch: 66, step: 286, loss: 0.29425182938575745, mean loss: 0.3397125678223729
Epoch: 66, step: 287, loss: 0.2903708815574646, mean loss: 0.3397120516527534
Epoch: 66, step: 288, loss: 0.305477499961853, mean loss: 0.3397116935245255
Epoch: 66, step: 289, loss: 0.3142516314983368, mean loss: 0.33971142718916947
Epoch: 66, step: 290, loss: 0.3241363763809204, mean loss: 0.33971126426170667
Epoch: 66, step: 291, loss: 0.3757133483886719, mean loss: 0.3397116408683024
Epoch: 66, step: 292, loss: 0.3431564271450043, mean loss: 0.33971167690276244
Epoch: 66, step: 293, loss: 0.29766663908958435, mean loss: 0.3397112370919106
Epoch: 66, step: 294, loss: 0.2868283987045288, mean loss: 0.3397106839183587
Epoch: 66, step: 295, loss: 0.37481924891471863, mean loss: 0.3397110511627624
Epoch: 66, step: 296, loss: 0.33358803391456604, mean loss: 0.33971098711513475
Epoch: 66, step: 297, loss: 0.3298931419849396, mean loss: 0.3397108844201584
Epoch: 66, step: 298, loss: 0.3253883123397827, mean loss: 0.33971073460716006
Epoch: 66, step: 299, loss: 0.31665849685668945, mean loss: 0.33971049348505483
Epoch: 66, step: 300, loss: 0.38335102796554565, mean loss: 0.3397109499521275
Epoch: 66, step: 301, loss: 0.32748815417289734, mean loss: 0.3397108221066389
Epoch: 66, step: 302, loss: 0.35771867632865906, mean loss: 0.33971101045952334
Epoch: 66, step: 303, loss: 0.3187573552131653, mean loss: 0.3397107912973691
Epoch: 66, step: 304, loss: 0.34050384163856506, mean loss: 0.3397107995920939
Epoch: 66, step: 305, loss: 0.3017098009586334, mean loss: 0.3397104021336833
Epoch: 66, step: 306, loss: 0.37613344192504883, mean loss: 0.33971078308399016
Epoch: 66, step: 307, loss: 0.30573445558547974, mean loss: 0.3397104277276803
Epoch: 66, step: 308, loss: 0.33141663670539856, mean loss: 0.3397103409843397
Epoch: 66, step: 309, loss: 0.32577288150787354, mean loss: 0.3397101952163614
Epoch: 66, step: 310, loss: 0.3220854699611664, mean loss: 0.3397100108862327
Epoch: 66, step: 311, loss: 0.29738056659698486, mean loss: 0.3397095681837113
Epoch: 66, step: 312, loss: 0.30671507120132446, mean loss: 0.3397092231143514
Epoch: 66, step: 313, loss: 0.36014091968536377, mean loss: 0.33970943679479415
Epoch: 66, step: 314, loss: 0.3213450610637665, mean loss: 0.33970924473698416
Epoch: 66, step: 315, loss: 0.3370882272720337, mean loss: 0.33970921732621795
Epoch: 66, step: 316, loss: 0.3143892288208008, mean loss: 0.339708952530948
Epoch: 66, step: 317, loss: 0.3603097200393677, mean loss: 0.3397091679705697
Epoch: 66, step: 318, loss: 0.3798495829105377, mean loss: 0.3397095877483945
Epoch: 66, step: 319, loss: 0.35354170203208923, mean loss: 0.33970973239946833
Epoch: 66, step: 320, loss: 0.3372308313846588, mean loss: 0.3397097064763205
Epoch: 66, step: 321, loss: 0.3724669814109802, mean loss: 0.3397100490324761
Epoch: 66, step: 322, loss: 0.3423578441143036, mean loss: 0.3397100767212573
Epoch: 66, step: 323, loss: 0.338396281003952, mean loss: 0.33971006298264816
Epoch: 66, step: 324, loss: 0.41272568702697754, mean loss: 0.33971082651279116
Epoch: 66, step: 325, loss: 0.3668877184391022, mean loss: 0.3397111107007231
Epoch: 66, step: 326, loss: 0.34338754415512085, mean loss: 0.3397111491446738
Epoch: 66, step: 327, loss: 0.32695072889328003, mean loss: 0.33971101571213813
Epoch: 66, step: 328, loss: 0.35117509961128235, mean loss: 0.339711135587954
Epoch: 66, step: 329, loss: 0.3259841501712799, mean loss: 0.3397109920512891
Epoch: 66, step: 330, loss: 0.31890690326690674, mean loss: 0.3397107745149396
Epoch: 66, step: 331, loss: 0.33716389536857605, mean loss: 0.3397107478839727
Epoch: 66, step: 332, loss: 0.30704084038734436, mean loss: 0.3397104062807491
Epoch: 66, step: 333, loss: 0.3347444534301758, mean loss: 0.33971035435627506
Epoch: 66, step: 334, loss: 0.33062300086021423, mean loss: 0.3397102593390384
Epoch: 66, step: 335, loss: 0.38335803151130676, mean loss: 0.33971071571474076
Epoch: 66, step: 336, loss: 0.35428524017333984, mean loss: 0.33971086810257084
Epoch: 66, step: 337, loss: 0.308926522731781, mean loss: 0.33971054623199753
Epoch: 66, step: 338, loss: 0.34008851647377014, mean loss: 0.33971055018388363
Epoch: 66, step: 339, loss: 0.319828063249588, mean loss: 0.3397103423037559
Epoch: 66, step: 340, loss: 0.3126937747001648, mean loss: 0.3397100598366368
Epoch: 66, step: 341, loss: 0.3151090443134308, mean loss: 0.33970980262760014
Epoch: 66, step: 342, loss: 0.3031407296657562, mean loss: 0.33970942029388385
Epoch: 66, step: 343, loss: 0.33300456404685974, mean loss: 0.3397093501946006
Epoch: 66, step: 344, loss: 0.3130386471748352, mean loss: 0.3397090713552712
Epoch: 66, step: 345, loss: 0.3608512580394745, mean loss: 0.33970929239224645
Epoch: 66, step: 346, loss: 0.32891613245010376, mean loss: 0.3397091795532804
Epoch: 66, step: 347, loss: 0.3012809455394745, mean loss: 0.3397087778028307
Epoch: 66, step: 348, loss: 0.2958141565322876, mean loss: 0.3397083189084806
Epoch: 66, step: 349, loss: 0.3429411053657532, mean loss: 0.3397083527051483
Epoch: 66, step: 350, loss: 0.32994961738586426, mean loss: 0.3397082506850206
Epoch: 66, step: 351, loss: 0.34316128492355347, mean loss: 0.33970828678348003
Epoch: 66, step: 352, loss: 0.33990150690078735, mean loss: 0.3397082888034066
Epoch: 66, step: 353, loss: 0.30068454146385193, mean loss: 0.33970788085271414
Epoch: 66, step: 354, loss: 0.3915117084980011, mean loss: 0.33970842239953825
Epoch: 66, step: 355, loss: 0.3106963634490967, mean loss: 0.3397081191164633
Epoch: 66, step: 356, loss: 0.2958078384399414, mean loss: 0.33970766020132886
Epoch: 66, step: 357, loss: 0.3250911235809326, mean loss: 0.33970750740777844
Epoch: 66, step: 358, loss: 0.3194117844104767, mean loss: 0.3397072952492323
Epoch: 66, step: 359, loss: 0.3230828046798706, mean loss: 0.33970712146922555
Epoch: 66, step: 360, loss: 0.33172813057899475, mean loss: 0.3397070380636865
Epoch: 66, step: 361, loss: 0.35537630319595337, mean loss: 0.33970720185505576
Epoch: 66, step: 362, loss: 0.3073994815349579, mean loss: 0.3397068641448702
Epoch: 66, step: 363, loss: 0.3105412423610687, mean loss: 0.3397065592819925
Epoch: 66, step: 364, loss: 0.35028156638145447, mean loss: 0.33970666981944037
Epoch: 66, step: 365, loss: 0.365314781665802, mean loss: 0.33970693749072545
Epoch: 66, step: 366, loss: 0.30274346470832825, mean loss: 0.33970655113046183
Epoch: 66, step: 367, loss: 0.4064781963825226, mean loss: 0.33970724905300187
Epoch: 66, step: 368, loss: 0.35230597853660583, mean loss: 0.33970738073832046
Epoch: 66, step: 369, loss: 0.3324377238750458, mean loss: 0.3397073047547004
Epoch: 66, step: 370, loss: 0.3415623903274536, mean loss: 0.33970732414414984
Epoch: 66, step: 371, loss: 0.3115597665309906, mean loss: 0.33970702994751106
Epoch: 66, step: 372, loss: 0.380102276802063, mean loss: 0.3397074521518742
Epoch: 66, step: 373, loss: 0.3675840198993683, mean loss: 0.3397077435100521
Epoch: 66, step: 374, loss: 0.3406413793563843, mean loss: 0.33970775326805386
Epoch: 66, step: 375, loss: 0.29097893834114075, mean loss: 0.3397072439786002
Epoch: 66, step: 376, loss: 0.3197351098060608, mean loss: 0.3397070352419213
Epoch: 66, step: 377, loss: 0.3110455572605133, mean loss: 0.3397067356926019
Epoch: 66, step: 378, loss: 0.3433980941772461, mean loss: 0.339706774271644
Epoch: 66, step: 379, loss: 0.32646191120147705, mean loss: 0.33970663584867805
Epoch: 66, step: 380, loss: 0.29811573028564453, mean loss: 0.33970620118383443
Epoch: 66, step: 381, loss: 0.29730281233787537, mean loss: 0.3397057580323928
Epoch: 66, step: 382, loss: 0.3370329439640045, mean loss: 0.3397057300995067
Epoch: 66, step: 383, loss: 0.3175595700740814, mean loss: 0.3397054986581554
Epoch: 66, step: 384, loss: 0.3043447732925415, mean loss: 0.3397051291201169
Epoch: 66, step: 385, loss: 0.3367127776145935, mean loss: 0.3397050978488085
Epoch: 66, step: 386, loss: 0.3564426600933075, mean loss: 0.33970527276141516
Epoch: 66, step: 387, loss: 0.3408713936805725, mean loss: 0.33970528494760543
Epoch: 66, step: 388, loss: 0.3192693591117859, mean loss: 0.33970507139044
Epoch: 66, step: 389, loss: 0.35251355171203613, mean loss: 0.3397052052387515
Epoch: 66, step: 390, loss: 0.3370373249053955, mean loss: 0.33970517735975747
Epoch: 66, step: 391, loss: 0.3727012574672699, mean loss: 0.3397055221607952
Epoch: 66, step: 392, loss: 0.3274194300174713, mean loss: 0.33970539377545245
Epoch: 66, step: 393, loss: 0.32136625051498413, mean loss: 0.3397052021398565
Epoch: 66, step: 394, loss: 0.3197934031486511, mean loss: 0.3397049940729071
Epoch: 66, step: 395, loss: 0.3486083149909973, mean loss: 0.3397050871065635
Epoch: 66, step: 396, loss: 0.31876569986343384, mean loss: 0.3397048683064753
Epoch: 66, step: 397, loss: 0.3401470482349396, mean loss: 0.33970487292685864
Epoch: 66, step: 398, loss: 0.34742099046707153, mean loss: 0.3397049535525187
Epoch: 66, step: 399, loss: 0.30457958579063416, mean loss: 0.3397045865316234
Epoch: 66, step: 400, loss: 0.3033186197280884, mean loss: 0.3397042063428474
Epoch: 66, step: 401, loss: 0.3518943190574646, mean loss: 0.3397043337132601
Epoch: 66, step: 402, loss: 0.3304148316383362, mean loss: 0.3397042366513725
Epoch: 66, step: 403, loss: 0.33018890023231506, mean loss: 0.33970413723088083
Epoch: 66, step: 404, loss: 0.33285972476005554, mean loss: 0.3397040657181446
Epoch: 66, step: 405, loss: 0.35066327452659607, mean loss: 0.3397041802224682
Epoch: 66, step: 406, loss: 0.324678897857666, mean loss: 0.3397040232365171
Epoch: 66, step: 407, loss: 0.3740467429161072, mean loss: 0.3397043820496197
Epoch: 66, step: 408, loss: 0.3350921869277954, mean loss: 0.3397043338618592
Epoch: 66, step: 409, loss: 0.3105798661708832, mean loss: 0.3397040295754676
Epoch: 66, step: 410, loss: 0.351256787776947, mean loss: 0.33970415027502565
Epoch: 66, step: 411, loss: 0.33608752489089966, mean loss: 0.33970411249006405
Epoch: 66, step: 412, loss: 0.3791021704673767, mean loss: 0.33970452409989277
Epoch: 66, step: 413, loss: 0.34090927243232727, mean loss: 0.3397045366863272
Epoch: 66, step: 414, loss: 0.3436930179595947, mean loss: 0.33970457835497475
Epoch: 66, step: 415, loss: 0.31880998611450195, mean loss: 0.33970436006629695
Epoch: 66, step: 416, loss: 0.3456379771232605, mean loss: 0.33970442205496254
Epoch: 66, step: 417, loss: 0.32189270853996277, mean loss: 0.33970423597743055
Epoch: 66, step: 418, loss: 0.31273484230041504, mean loss: 0.3397039542332972
Epoch: 66, step: 419, loss: 0.32716652750968933, mean loss: 0.33970382325854975
Epoch: 66, step: 420, loss: 0.335525244474411, mean loss: 0.3397037796066429
Epoch: 66, step: 421, loss: 0.35982227325439453, mean loss: 0.3397039897741381
Epoch: 66, step: 422, loss: 0.3490527868270874, mean loss: 0.3397040874351643
Epoch: 66, step: 423, loss: 0.33157339692115784, mean loss: 0.3397040024998213
Epoch: 66, step: 424, loss: 0.3648892045021057, mean loss: 0.3397042655883525
Epoch: 66, step: 425, loss: 0.28421327471733093, mean loss: 0.33970368592689976
Epoch: 66, step: 426, loss: 0.30900678038597107, mean loss: 0.3397033652689568
Epoch: 66, step: 427, loss: 0.32515883445739746, mean loss: 0.3397032133392905
Epoch: 66, step: 428, loss: 0.37315618991851807, mean loss: 0.3397035627796776
Epoch: 66, step: 429, loss: 0.34735170006752014, mean loss: 0.3397036426691347
Epoch: 66, step: 430, loss: 0.30743083357810974, mean loss: 0.339703305563488
Epoch: 66, step: 431, loss: 0.36563223600387573, mean loss: 0.33970357640131743
Epoch: 66, step: 432, loss: 0.3450447916984558, mean loss: 0.3397036321918195
Epoch: 66, step: 433, loss: 0.36986660957336426, mean loss: 0.33970394724934505
Epoch: 66, step: 434, loss: 0.3369113504886627, mean loss: 0.33970391808049266
Epoch: 66, step: 435, loss: 0.3753010034561157, mean loss: 0.33970428989045065
Epoch: 66, step: 436, loss: 0.3796168267726898, mean loss: 0.3397047067707515
Epoch: 66, step: 437, loss: 0.33691373467445374, mean loss: 0.33970467761978224
Epoch: 66, step: 438, loss: 0.30517587065696716, mean loss: 0.3397043169792449
Epoch: 66, step: 439, loss: 0.30914151668548584, mean loss: 0.3397039977655052
Epoch: 66, step: 440, loss: 0.37690845131874084, mean loss: 0.33970438634405814
Epoch: 66, step: 441, loss: 0.32622528076171875, mean loss: 0.33970424556422835
Epoch: 66, step: 442, loss: 0.29609137773513794, mean loss: 0.3397037900630865
Epoch: 66, step: 443, loss: 0.32906603813171387, mean loss: 0.3397036789615289
Epoch: 66, step: 444, loss: 0.3288203477859497, mean loss: 0.33970356529630863
Epoch: 66, step: 445, loss: 0.3483714461326599, mean loss: 0.33970365582247924
Epoch: 66, step: 446, loss: 0.3334706127643585, mean loss: 0.3397035907261037
Epoch: 66, step: 447, loss: 0.27972185611724854, mean loss: 0.3397029642980958
Epoch: 66, step: 448, loss: 0.3192741572856903, mean loss: 0.3397027509490936
Epoch: 66, step: 449, loss: 0.3257901966571808, mean loss: 0.33970260565433524
Epoch: 66, step: 450, loss: 0.333511620759964, mean loss: 0.33970254099990577
Epoch: 66, step: 451, loss: 0.3532346487045288, mean loss: 0.3397026823185459
Epoch: 66, step: 452, loss: 0.3132363557815552, mean loss: 0.33970240592803097
Epoch: 66, step: 453, loss: 0.327664852142334, mean loss: 0.3397022802199566
Epoch: 66, step: 454, loss: 0.3413764238357544, mean loss: 0.3397022977028419
Epoch: 66, step: 455, loss: 0.33075928688049316, mean loss: 0.3397022043130046
Epoch: 66, step: 456, loss: 0.3738096356391907, mean loss: 0.3397025604854686
Epoch: 66, step: 457, loss: 0.31629738211631775, mean loss: 0.3397023160755944
Epoch: 66, step: 458, loss: 0.3418116569519043, mean loss: 0.33970233810227357
Epoch: 66, step: 459, loss: 0.3265957832336426, mean loss: 0.3397022012392053
Epoch: 66, step: 460, loss: 0.33733317255973816, mean loss: 0.33970217650126683
Epoch: 66, step: 461, loss: 0.3458590805530548, mean loss: 0.33970224079239364
Epoch: 66, step: 462, loss: 0.42964673042297363, mean loss: 0.33970317999368044
Epoch: 66, step: 463, loss: 0.32338982820510864, mean loss: 0.3397030096512718
Epoch: 66, step: 464, loss: 0.3244995176792145, mean loss: 0.3397028508995675
Epoch: 66, step: 465, loss: 0.33711621165275574, mean loss: 0.3397028238906999
Epoch: 66, step: 466, loss: 0.330274373292923, mean loss: 0.33970272544283364
Epoch: 66, step: 467, loss: 0.3620781898498535, mean loss: 0.3397029590754654
Epoch: 66, step: 468, loss: 0.3194155693054199, mean loss: 0.33970274724760396
Epoch: 66, step: 469, loss: 0.3246196508407593, mean loss: 0.3397025897612673
Epoch: 66, step: 470, loss: 0.3444981276988983, mean loss: 0.3397026398321411
Epoch: 66, step: 471, loss: 0.3066556751728058, mean loss: 0.3397022947878225
Epoch: 66, step: 472, loss: 0.29405906796455383, mean loss: 0.33970181823054024
Epoch: 66, step: 473, loss: 0.3529822826385498, mean loss: 0.33970195688935967
Epoch: 66, step: 474, loss: 0.35447701811790466, mean loss: 0.3397021111513715
Epoch: 66, step: 475, loss: 0.32705652713775635, mean loss: 0.33970197912397526
Epoch: 66, step: 476, loss: 0.32123973965644836, mean loss: 0.33970178636925913
Epoch: 66, step: 477, loss: 0.33621981739997864, mean loss: 0.3397017500161973
Epoch: 66, step: 478, loss: 0.31359413266181946, mean loss: 0.33970147744572704
Epoch: 66, step: 479, loss: 0.29498177766799927, mean loss: 0.3397010105650395
Epoch: 66, step: 480, loss: 0.3224319815635681, mean loss: 0.33970083027554737
Epoch: 66, step: 481, loss: 0.3418879210948944, mean loss: 0.3397008531086422
Epoch: 66, step: 482, loss: 0.3350315988063812, mean loss: 0.33970080436242084
Epoch: 66, step: 483, loss: 0.33701661229133606, mean loss: 0.33970077634020435
Epoch: 66, step: 484, loss: 0.31637895107269287, mean loss: 0.33970053286939594
Epoch: 66, step: 485, loss: 0.29529693722724915, mean loss: 0.3397000693179225
Epoch: 66, step: 486, loss: 0.30853113532066345, mean loss: 0.3396997439331369
Epoch: 66, step: 487, loss: 0.36510783433914185, mean loss: 0.33970000917543697
Epoch: 66, step: 488, loss: 0.36887624859809875, mean loss: 0.3397003137513394
Epoch: 66, step: 489, loss: 0.3093843162059784, mean loss: 0.33969999728060485
Epoch: 66, step: 490, loss: 0.3242016136646271, mean loss: 0.33969983549362626
Epoch: 66, step: 491, loss: 0.3241887390613556, mean loss: 0.33969967357562936
Epoch: 66, step: 492, loss: 0.32146546244621277, mean loss: 0.3396994832334357
Epoch: 66, step: 493, loss: 0.40175580978393555, mean loss: 0.33970013101654756
Epoch: 66, step: 494, loss: 0.3160908818244934, mean loss: 0.33969988457087286
Epoch: 66, step: 495, loss: 0.3446235656738281, mean loss: 0.33969993596629144
Epoch: 66, step: 496, loss: 0.3399105668067932, mean loss: 0.3396999381649203
Epoch: 66, step: 497, loss: 0.32891717553138733, mean loss: 0.33969982561233647
Epoch: 66, step: 498, loss: 0.30311691761016846, mean loss: 0.3396994437567787
Epoch: 66, step: 499, loss: 0.3310582637786865, mean loss: 0.3396993535603362
Epoch: 66, step: 500, loss: 0.36893412470817566, mean loss: 0.3396996587090356
Epoch: 66, step: 501, loss: 0.31263336539268494, mean loss: 0.3396993761975717
Epoch: 66, step: 502, loss: 0.3259284794330597, mean loss: 0.33969923246176154
Epoch: 66, step: 503, loss: 0.3114769160747528, mean loss: 0.339698937890156
Epoch: 66, step: 504, loss: 0.3456421196460724, mean loss: 0.3396989999217162
Epoch: 66, step: 505, loss: 0.3447623550891876, mean loss: 0.33969905276959395
Epoch: 66, step: 506, loss: 0.33146989345550537, mean loss: 0.33969896688008944
Epoch: 66, step: 507, loss: 0.31074059009552, mean loss: 0.3396986646384414
Epoch: 66, step: 508, loss: 0.3303989768028259, mean loss: 0.33969856757762673
Epoch: 66, step: 509, loss: 0.32187971472740173, mean loss: 0.3396983816042528
Epoch: 66, step: 510, loss: 0.31811290979385376, mean loss: 0.3396981563214494
Epoch: 66, step: 511, loss: 0.3123133182525635, mean loss: 0.33969787051492367
Epoch: 66, step: 512, loss: 0.34668347239494324, mean loss: 0.33969794342058635
Epoch: 66, step: 513, loss: 0.3058103621006012, mean loss: 0.3396975897544556
Epoch: 66, step: 514, loss: 0.3543091416358948, mean loss: 0.33969774224563043
Epoch: 66, step: 515, loss: 0.3315982222557068, mean loss: 0.3396976577171396
Epoch: 66, step: 516, loss: 0.33538833260536194, mean loss: 0.33969761274448107
Epoch: 66, step: 517, loss: 0.342413067817688, mean loss: 0.33969764108301576
Epoch: 66, step: 518, loss: 0.33667856454849243, mean loss: 0.3396976095762112
Epoch: 66, step: 519, loss: 0.3320966958999634, mean loss: 0.33969753025460414
Epoch: 66, step: 520, loss: 0.355905145406723, mean loss: 0.3396976993922525
Epoch: 66, step: 521, loss: 0.30565887689590454, mean loss: 0.3396973441773578
Epoch: 66, step: 522, loss: 0.3893449902534485, mean loss: 0.33969786227399107
Epoch: 66, step: 523, loss: 0.3223147392272949, mean loss: 0.33969768087478575
Epoch: 66, step: 524, loss: 0.3401302099227905, mean loss: 0.33969768538833645
Epoch: 66, step: 525, loss: 0.32042914628982544, mean loss: 0.339697484318326
Epoch: 66, step: 526, loss: 0.30557772517204285, mean loss: 0.33969712827738785
Epoch: 66, step: 527, loss: 0.3247750401496887, mean loss: 0.33969697256647574
Epoch: 66, step: 528, loss: 0.35479700565338135, mean loss: 0.33969713013258646
Epoch: 66, step: 529, loss: 0.3220159709453583, mean loss: 0.3396969456348175
Epoch: 66, step: 530, loss: 0.34784337878227234, mean loss: 0.3396970306395981
Epoch: 66, step: 531, loss: 0.31899693608283997, mean loss: 0.3396968146446217
Epoch: 66, step: 532, loss: 0.34550634026527405, mean loss: 0.3396968752634393
Epoch: 66, step: 533, loss: 0.298162043094635, mean loss: 0.3396964418775989
Epoch: 66, step: 534, loss: 0.317409873008728, mean loss: 0.33969620933584793
Epoch: 66, step: 535, loss: 0.30665746331214905, mean loss: 0.3396958646076966
Epoch: 66, step: 536, loss: 0.3364727199077606, mean loss: 0.3396958309775727
Epoch: 66, step: 537, loss: 0.33295559883117676, mean loss: 0.3396957606510755
Epoch: 66, step: 538, loss: 0.36062049865722656, mean loss: 0.33969597897414555
Epoch: 66, step: 539, loss: 0.33803901076316833, mean loss: 0.3396959616859667
Epoch: 66, step: 540, loss: 0.3673710823059082, mean loss: 0.33969625043468205
Epoch: 66, step: 541, loss: 0.3465527296066284, mean loss: 0.3396963219710964
Epoch: 66, step: 542, loss: 0.30773141980171204, mean loss: 0.33969598847185106
Epoch: 66, step: 543, loss: 0.28997504711151123, mean loss: 0.33969546972402787
Epoch: 66, step: 544, loss: 0.3411925435066223, mean loss: 0.33969548534311395
Epoch: 66, step: 545, loss: 0.3246663212776184, mean loss: 0.3396953285443235
Epoch: 66, step: 546, loss: 0.34105631709098816, mean loss: 0.3396953427433256
Epoch: 66, step: 547, loss: 0.3060798645019531, mean loss: 0.3396949920414285
Epoch: 66, step: 548, loss: 0.3518132269382477, mean loss: 0.3396951184666306
Epoch: 66, step: 549, loss: 0.32795044779777527, mean loss: 0.3396949959399685
Epoch: 66, step: 550, loss: 0.32192373275756836, mean loss: 0.3396948105426164
Epoch: 66, step: 551, loss: 0.3267335593700409, mean loss: 0.33969467532675957
Epoch: 66, step: 552, loss: 0.33747056126594543, mean loss: 0.33969465212434286
Epoch: 66, step: 553, loss: 0.3939286768436432, mean loss: 0.33969521789897533
Epoch: 66, step: 554, loss: 0.34389111399650574, mean loss: 0.3396952616705158
Epoch: 66, step: 555, loss: 0.34659743309020996, mean loss: 0.33969533367313853
Epoch: 66, step: 556, loss: 0.3354087173938751, mean loss: 0.33969528895613915
Epoch: 66, step: 557, loss: 0.3304065465927124, mean loss: 0.33969519205911675
Epoch: 66, step: 558, loss: 0.34280428290367126, mean loss: 0.3396952244917638
Epoch: 66, step: 559, loss: 0.33356261253356934, mean loss: 0.33969516051976223
Epoch: 66, step: 560, loss: 0.29574039578437805, mean loss: 0.33969470201285423
Epoch: 66, step: 561, loss: 0.34285613894462585, mean loss: 0.3396947349905203
Epoch: 66, step: 562, loss: 0.333394855260849, mean loss: 0.3396946692757307
Epoch: 66, step: 563, loss: 0.3256092369556427, mean loss: 0.3396945223504551
Epoch: 66, step: 564, loss: 0.3443313241004944, mean loss: 0.3396945707164728
Epoch: 66, step: 565, loss: 0.31550559401512146, mean loss: 0.33969431840629544
Epoch: 66, step: 566, loss: 0.3344132900238037, mean loss: 0.339694263321563
Epoch: 66, step: 567, loss: 0.31080931425094604, mean loss: 0.3396939620349614
Epoch: 66, step: 568, loss: 0.3314286172389984, mean loss: 0.33969387582356925
Epoch: 66, step: 569, loss: 0.342182993888855, mean loss: 0.33969390178595804
Epoch: 66, step: 570, loss: 0.35077333450317383, mean loss: 0.33969401734718585
Epoch: 66, step: 571, loss: 0.31913429498672485, mean loss: 0.33969380290642526
Epoch: 66, step: 572, loss: 0.35079118609428406, mean loss: 0.3396939186524664
Epoch: 66, step: 573, loss: 0.3380507826805115, mean loss: 0.3396939015146874
Epoch: 66, step: 574, loss: 0.3267635703086853, mean loss: 0.3396937666537564
Epoch: 66, step: 575, loss: 0.3207972049713135, mean loss: 0.3396935695682153
Epoch: 66, step: 576, loss: 0.3285484313964844, mean loss: 0.33969345332893774
Epoch: 66, step: 577, loss: 0.3218819200992584, mean loss: 0.339693267563797
Epoch: 66, step: 578, loss: 0.3096778392791748, mean loss: 0.33969295452156545
Epoch: 66, step: 579, loss: 0.3475744426250458, mean loss: 0.3396930367197226
Epoch: 66, step: 580, loss: 0.34416136145591736, mean loss: 0.3396930833205959
Epoch: 66, step: 581, loss: 0.3954820930957794, mean loss: 0.33969366514703325
Epoch: 66, step: 582, loss: 0.33761537075042725, mean loss: 0.3396936434726207
Epoch: 66, step: 583, loss: 0.30831921100616455, mean loss: 0.339693316273884
Epoch: 66, step: 584, loss: 0.35517218708992004, mean loss: 0.3396934776987692
Epoch: 66, step: 585, loss: 0.30536606907844543, mean loss: 0.3396931197114022
Epoch: 66, step: 586, loss: 0.3531635105609894, mean loss: 0.3396932601874724
Epoch: 66, step: 587, loss: 0.36325207352638245, mean loss: 0.3396935058681688
Epoch: 66, step: 588, loss: 0.3277018070220947, mean loss: 0.3396933808152573
Epoch: 66, step: 589, loss: 0.3277072012424469, mean loss: 0.3396932558212058
Epoch: 66, step: 590, loss: 0.33440104126930237, mean loss: 0.33969320063360947
Epoch: 66, step: 591, loss: 0.3632546663284302, mean loss: 0.3396934463317167
Epoch: 66, step: 592, loss: 0.34688010811805725, mean loss: 0.3396935212731829
Epoch: 66, step: 593, loss: 0.3599643409252167, mean loss: 0.3396937326521444
Epoch: 66, step: 594, loss: 0.3060331344604492, mean loss: 0.3396933816516315
Epoch: 66, step: 595, loss: 0.3190104365348816, mean loss: 0.3396931659796282
Epoch: 66, step: 596, loss: 0.308637797832489, mean loss: 0.33969284215226303
Epoch: 66, step: 597, loss: 0.33860644698143005, mean loss: 0.33969283082408247
Epoch: 66, step: 598, loss: 0.3085698187351227, mean loss: 0.33969250629813347
Epoch: 66, step: 599, loss: 0.3293486535549164, mean loss: 0.3396923984418111
Epoch: 66, step: 600, loss: 0.31546345353126526, mean loss: 0.33969214580696505
Epoch: 66, step: 601, loss: 0.31271007657051086, mean loss: 0.3396918644682664
Epoch: 66, step: 602, loss: 0.31314101815223694, mean loss: 0.33969158762876234
Epoch: 66, step: 603, loss: 0.3359791040420532, mean loss: 0.3396915489199624
Epoch: 66, step: 604, loss: 0.342303067445755, mean loss: 0.3396915761490913
Epoch: 66, step: 605, loss: 0.32178470492362976, mean loss: 0.3396913894441468
Epoch: 66, step: 606, loss: 0.32916459441185, mean loss: 0.339691279688279
Epoch: 66, step: 607, loss: 0.3119001090526581, mean loss: 0.33969098993130764
Epoch: 66, step: 608, loss: 0.33717402815818787, mean loss: 0.3396909636891739
Epoch: 66, step: 609, loss: 0.2881300449371338, mean loss: 0.3396904261146931
Epoch: 66, step: 610, loss: 0.3300507068634033, mean loss: 0.3396903256119641
Epoch: 66, step: 611, loss: 0.3488883972167969, mean loss: 0.33969042150912
Epoch: 66, step: 612, loss: 0.3159099221229553, mean loss: 0.3396901735812304
Epoch: 66, step: 613, loss: 0.34285807609558105, mean loss: 0.33969020660842564
Epoch: 66, step: 614, loss: 0.34427475929260254, mean loss: 0.3396902544045107
Epoch: 66, step: 615, loss: 0.33081358671188354, mean loss: 0.3396901618621036
Epoch: 66, step: 616, loss: 0.3828510046005249, mean loss: 0.339690611824497
Epoch: 66, step: 617, loss: 0.3336572051048279, mean loss: 0.33969054892540484
Epoch: 66, step: 618, loss: 0.3258373439311981, mean loss: 0.3396904045053492
Epoch: 66, step: 619, loss: 0.36593353748321533, mean loss: 0.33969067808790393
Epoch: 66, step: 620, loss: 0.3238065838813782, mean loss: 0.3396905124992231
Epoch: 66, step: 621, loss: 0.312547892332077, mean loss: 0.33969022954548617
Epoch: 66, step: 622, loss: 0.32001930475234985, mean loss: 0.33969002448408747
Epoch: 66, step: 623, loss: 0.4003419280052185, mean loss: 0.3396906567489478
Epoch: 66, step: 624, loss: 0.3231119215488434, mean loss: 0.33969048392597245
Epoch: 66, step: 625, loss: 0.2974488139152527, mean loss: 0.3396900435874964
Epoch: 66, step: 626, loss: 0.3679496645927429, mean loss: 0.3396903381702799
Epoch: 66, step: 627, loss: 0.313138872385025, mean loss: 0.3396900613964632
Epoch: 66, step: 628, loss: 0.32601410150527954, mean loss: 0.33968991883905447
Epoch: 66, step: 629, loss: 0.3341861963272095, mean loss: 0.33968986146916985
Epoch: 66, step: 630, loss: 0.3135766088962555, mean loss: 0.3396895892718219
Epoch: 66, step: 631, loss: 0.33123350143432617, mean loss: 0.3396895011288116
Epoch: 66, step: 632, loss: 0.29622986912727356, mean loss: 0.33968904812702916
Epoch: 66, step: 633, loss: 0.35679975152015686, mean loss: 0.3396892264787083
Epoch: 66, step: 634, loss: 0.3415358066558838, mean loss: 0.3396892457261486
Epoch: 66, step: 635, loss: 0.31892216205596924, mean loss: 0.33968902926707345
Epoch: 66, step: 636, loss: 0.34004679322242737, mean loss: 0.3396890329960731
Epoch: 66, step: 637, loss: 0.3419627845287323, mean loss: 0.3396890566953032
Epoch: 66, step: 638, loss: 0.3184732496738434, mean loss: 0.33968883556601787
Epoch: 66, step: 639, loss: 0.3218776285648346, mean loss: 0.33968864992432063
Epoch: 66, step: 640, loss: 0.32324784994125366, mean loss: 0.3396884785678145
Epoch: 66, step: 641, loss: 0.31239643692970276, mean loss: 0.3396881941157098
Epoch: 66, step: 642, loss: 0.31258654594421387, mean loss: 0.33968791165093054
Epoch: 66, step: 643, loss: 0.3287133574485779, mean loss: 0.33968779727070164
Epoch: 66, step: 644, loss: 0.3443358242511749, mean loss: 0.3396878457133845
Epoch: 66, step: 645, loss: 0.3794664144515991, mean loss: 0.3396882602894005
Epoch: 66, step: 646, loss: 0.31327956914901733, mean loss: 0.3396879850583853
Epoch: 66, step: 647, loss: 0.2954559624195099, mean loss: 0.3396875240776591
Epoch: 66, step: 648, loss: 0.303443044424057, mean loss: 0.33968714634606495
Epoch: 66, step: 649, loss: 0.33651989698410034, mean loss: 0.3396871133380678
Epoch: 66, step: 650, loss: 0.33606135845184326, mean loss: 0.33968707555207556
Epoch: 66, step: 651, loss: 0.3576996326446533, mean loss: 0.33968726326891546
Epoch: 66, step: 652, loss: 0.33479392528533936, mean loss: 0.3396872122738032
Epoch: 66, step: 653, loss: 0.33572453260421753, mean loss: 0.339687170977823
Epoch: 66, step: 654, loss: 0.3396605849266052, mean loss: 0.33968717070076665
Epoch: 66, step: 655, loss: 0.32313215732574463, mean loss: 0.33968699818082737
Epoch: 66, step: 656, loss: 0.3129459023475647, mean loss: 0.3396867195145376
Epoch: 66, step: 657, loss: 0.3560884892940521, mean loss: 0.3396868904339618
Epoch: 66, step: 658, loss: 0.30252012610435486, mean loss: 0.3396865031308936
Epoch: 66, step: 659, loss: 0.3225359618663788, mean loss: 0.33968632441240265
Epoch: 66, step: 660, loss: 0.34049853682518005, mean loss: 0.33968633287603434
Epoch: 66, step: 661, loss: 0.33911949396133423, mean loss: 0.33968632696937034
Epoch: 66, step: 662, loss: 0.3297712802886963, mean loss: 0.33968622365211876
Epoch: 66, step: 663, loss: 0.32806968688964844, mean loss: 0.3396861026061788
Epoch: 66, step: 664, loss: 0.3423936367034912, mean loss: 0.3396861308187693
Epoch: 66, step: 665, loss: 0.3731769025325775, mean loss: 0.3396864797900282
Epoch: 66, step: 666, loss: 0.38561129570007324, mean loss: 0.3396869583180826
Epoch: 66, step: 667, loss: 0.2902509868144989, mean loss: 0.3396864432098062
Epoch: 66, step: 668, loss: 0.37042444944381714, mean loss: 0.3396867634874492
Epoch: 66, step: 669, loss: 0.30773332715034485, mean loss: 0.3396864305489832
Epoch: 66, step: 670, loss: 0.33156272768974304, mean loss: 0.3396863459050357
Epoch: 66, step: 671, loss: 0.3495200574398041, mean loss: 0.3396864483651459
Epoch: 66, step: 672, loss: 0.34733596444129944, mean loss: 0.3396865280667002
Epoch: 66, step: 673, loss: 0.3305433690547943, mean loss: 0.33968643280362937
Epoch: 66, step: 674, loss: 0.3084123134613037, mean loss: 0.3396861069602746
Epoch: 66, step: 675, loss: 0.36198315024375916, mean loss: 0.33968633926953995
Epoch: 66, step: 676, loss: 0.32536301016807556, mean loss: 0.33968619003865985
Epoch: 66, step: 677, loss: 0.3312908709049225, mean loss: 0.33968610257101867
Epoch: 66, step: 678, loss: 0.3647421896457672, mean loss: 0.3396863636181528
Epoch: 66, step: 679, loss: 0.3669785261154175, mean loss: 0.33968664795890224
Epoch: 66, step: 680, loss: 0.2968612611293793, mean loss: 0.3396862017914091
Epoch: 66, step: 681, loss: 0.38354936242103577, mean loss: 0.3396866587659745
Epoch: 66, step: 682, loss: 0.34525781869888306, mean loss: 0.3396867168067501
Epoch: 66, step: 683, loss: 0.2921495735645294, mean loss: 0.3396862215662696
Epoch: 66, step: 684, loss: 0.32718369364738464, mean loss: 0.3396860913166793
Epoch: 66, step: 685, loss: 0.3279293179512024, mean loss: 0.3396859688375318
Epoch: 66, step: 686, loss: 0.31226563453674316, mean loss: 0.3396856831822693
Epoch: 66, step: 687, loss: 0.32869118452072144, mean loss: 0.33968556864669697
Epoch: 66, step: 688, loss: 0.3186493515968323, mean loss: 0.33968534950345686
Epoch: 66, step: 689, loss: 0.39730891585350037, mean loss: 0.33968594978645733
Epoch: 66, step: 690, loss: 0.3130367696285248, mean loss: 0.3396856721763718
Epoch: 66, step: 691, loss: 0.3130682408809662, mean loss: 0.3396853948999093
Epoch: 66, step: 692, loss: 0.3627861738204956, mean loss: 0.33968563554054304
Epoch: 66, step: 693, loss: 0.32043054699897766, mean loss: 0.33968543496252535
Epoch: 66, step: 694, loss: 0.34772682189941406, mean loss: 0.33968551872784514
Epoch: 66, step: 695, loss: 0.37778034806251526, mean loss: 0.33968591554898403
Epoch: 66, step: 696, loss: 0.376230388879776, mean loss: 0.33968629621661595
Epoch: 66, step: 697, loss: 0.3069256842136383, mean loss: 0.33968595496735027
Epoch: 66, step: 698, loss: 0.34991347789764404, mean loss: 0.3396860615007183
Epoch: 66, step: 699, loss: 0.3121355473995209, mean loss: 0.3396857745281536
Epoch: 66, step: 700, loss: 0.3078138530254364, mean loss: 0.339685442546262
Epoch: 66, step: 701, loss: 0.31264618039131165, mean loss: 0.33968516090488377
Epoch: 66, step: 702, loss: 0.32813283801078796, mean loss: 0.33968504057696086
Epoch: 66, step: 703, loss: 0.30657222867012024, mean loss: 0.3396846956805782
Epoch: 66, step: 704, loss: 0.36556562781333923, mean loss: 0.33968496524834924
Epoch: 66, step: 705, loss: 0.3407887816429138, mean loss: 0.33968497674523906
Epoch: 66, step: 706, loss: 0.30429938435554504, mean loss: 0.3396846081875489
Epoch: 66, step: 707, loss: 0.36794513463974, mean loss: 0.33968490253123984
Epoch: 66, step: 708, loss: 0.319339781999588, mean loss: 0.33968469063159573
Epoch: 66, step: 709, loss: 0.3480618894100189, mean loss: 0.3396847778813591
Epoch: 66, step: 710, loss: 0.3454689681529999, mean loss: 0.3396848381239282
Epoch: 66, step: 711, loss: 0.3005618751049042, mean loss: 0.3396844306609739
Epoch: 66, step: 712, loss: 0.3559805154800415, mean loss: 0.3396846003818027
Epoch: 66, step: 713, loss: 0.28416532278060913, mean loss: 0.3396840221644101
Epoch: 66, step: 714, loss: 0.382822722196579, mean loss: 0.3396844714369503
Epoch: 66, step: 715, loss: 0.342358261346817, mean loss: 0.3396844992831272
Epoch: 66, step: 716, loss: 0.32738715410232544, mean loss: 0.33968437121379674
Epoch: 66, step: 717, loss: 0.3202284276485443, mean loss: 0.3396841685941516
Epoch: 66, step: 718, loss: 0.3166652023792267, mean loss: 0.3396839288706873
Epoch: 66, step: 719, loss: 0.32960084080696106, mean loss: 0.3396838238647715
Epoch: 66, step: 720, loss: 0.3568068742752075, mean loss: 0.33968400218344275
Epoch: 66, step: 721, loss: 0.3382858335971832, mean loss: 0.33968398762313007
Epoch: 66, step: 722, loss: 0.30190369486808777, mean loss: 0.3396835941890672
Epoch: 66, step: 723, loss: 0.3515104651451111, mean loss: 0.3396837173497178
Epoch: 66, step: 724, loss: 0.39298215508461, mean loss: 0.3396842723741139
Epoch: 66, step: 725, loss: 0.3216264247894287, mean loss: 0.3396840843302986
Epoch: 66, step: 726, loss: 0.3227989077568054, mean loss: 0.3396839084998212
Epoch: 66, step: 727, loss: 0.383890300989151, mean loss: 0.33968436882963304
Epoch: 66, step: 728, loss: 0.4031628370285034, mean loss: 0.3396850298364557
Epoch: 66, step: 729, loss: 0.3355776071548462, mean loss: 0.3396849870659507
Epoch: 66, step: 730, loss: 0.3083958923816681, mean loss: 0.3396846612566657
Epoch: 66, step: 731, loss: 0.3571409285068512, mean loss: 0.3396848430246199
Epoch: 66, step: 732, loss: 0.33098089694976807, mean loss: 0.3396847523934457
Epoch: 66, step: 733, loss: 0.31459325551986694, mean loss: 0.3396844911271045
Epoch: 66, step: 734, loss: 0.31466561555862427, mean loss: 0.33968423061964853
Epoch: 66, step: 735, loss: 0.34554851055145264, mean loss: 0.33968429168045583
Epoch: 66, step: 736, loss: 0.32904252409935, mean loss: 0.3396841808760329
Epoch: 66, step: 737, loss: 0.3336118161678314, mean loss: 0.3396841176498953
Epoch: 66, step: 738, loss: 0.3282901644706726, mean loss: 0.33968399901602114
Epoch: 66, step: 739, loss: 0.34242498874664307, mean loss: 0.33968402755491717
Epoch: 66, step: 740, loss: 0.3512651026248932, mean loss: 0.3396841481345941
Epoch: 66, step: 741, loss: 0.3177410364151001, mean loss: 0.3396839196699863
Epoch: 66, step: 742, loss: 0.35816648602485657, mean loss: 0.3396841121025074
Epoch: 66, step: 743, loss: 0.3833923041820526, mean loss: 0.3396845671686418
Epoch: 66, step: 744, loss: 0.33618083596229553, mean loss: 0.33968453069006105
Epoch: 66, step: 745, loss: 0.33237478137016296, mean loss: 0.3396844545864762
Epoch: 66, step: 746, loss: 0.31670719385147095, mean loss: 0.33968421536709553
Epoch: 66, step: 747, loss: 0.31424975395202637, mean loss: 0.33968395056822187
Epoch: 66, step: 748, loss: 0.3640483617782593, mean loss: 0.33968420422413276
Epoch: 66, step: 749, loss: 0.3232559263706207, mean loss: 0.3396840331924438
Epoch: 66, step: 750, loss: 0.33595114946365356, mean loss: 0.33968399433050295
Epoch: 66, step: 751, loss: 0.3388485014438629, mean loss: 0.3396839856325259
Epoch: 66, step: 752, loss: 0.3194167912006378, mean loss: 0.3396837746411933
Epoch: 66, step: 753, loss: 0.38814401626586914, mean loss: 0.33968427913058125
Epoch: 66, step: 754, loss: 0.36253035068511963, mean loss: 0.3396845169643246
Epoch: 66, step: 755, loss: 0.3534541428089142, mean loss: 0.33968466030833716
Epoch: 66, step: 756, loss: 0.36810174584388733, mean loss: 0.33968495613167377
Epoch: 66, step: 757, loss: 0.36916834115982056, mean loss: 0.3396852630520484
Epoch: 66, step: 758, loss: 0.32687127590179443, mean loss: 0.33968512966055375
Epoch: 66, step: 759, loss: 0.3535945415496826, mean loss: 0.33968527445373214
Epoch: 66, step: 760, loss: 0.29902294278144836, mean loss: 0.33968485117437264
Epoch: 66, step: 761, loss: 0.3532991409301758, mean loss: 0.33968499289245974
Epoch: 66, step: 762, loss: 0.4149681627750397, mean loss: 0.3396857765452217
Epoch: 66, step: 763, loss: 0.37995612621307373, mean loss: 0.3396861957311074
Epoch: 66, step: 764, loss: 0.3235569894313812, mean loss: 0.3396860278392141
Epoch: 66, step: 765, loss: 0.3426400125026703, mean loss: 0.3396860585874671
Epoch: 66, step: 766, loss: 0.3615919053554535, mean loss: 0.33968628660473316
Epoch: 66, step: 767, loss: 0.3101044297218323, mean loss: 0.33968597869132566
Epoch: 66, step: 768, loss: 0.3083970844745636, mean loss: 0.33968565301299547
Epoch: 66, step: 769, loss: 0.30854344367980957, mean loss: 0.33968532886484576
Epoch: 66, step: 770, loss: 0.3312586843967438, mean loss: 0.3396852411558219
Epoch: 66, step: 771, loss: 0.31505608558654785, mean loss: 0.3396849848050624
Epoch: 66, step: 772, loss: 0.3530781865119934, mean loss: 0.3396851242057692
Epoch: 66, step: 773, loss: 0.3571721911430359, mean loss: 0.33968530621483406
Epoch: 66, step: 774, loss: 0.3686373829841614, mean loss: 0.33968560755099253
Epoch: 66, step: 775, loss: 0.33498436212539673, mean loss: 0.33968555862046146
Epoch: 66, step: 776, loss: 0.3169924318790436, mean loss: 0.33968532243300775
Epoch: 66, step: 777, loss: 0.32231926918029785, mean loss: 0.3396851416910035
Epoch: 66, step: 778, loss: 0.3133223056793213, mean loss: 0.33968486731534897
Epoch: 66, step: 779, loss: 0.31356877088546753, mean loss: 0.33968459551050706
Epoch: 66, step: 780, loss: 0.3081369698047638, mean loss: 0.3396842671801152
Epoch: 66, step: 781, loss: 0.30375951528549194, mean loss: 0.3396838932988849
Epoch: 66, step: 782, loss: 0.33065325021743774, mean loss: 0.33968379931485915
Epoch: 66, step: 783, loss: 0.34060201048851013, mean loss: 0.33968380887079924
Epoch: 66, step: 784, loss: 0.3312945067882538, mean loss: 0.33968372156317733
Epoch: 66, step: 785, loss: 0.3511980473995209, mean loss: 0.3396838413917322
Epoch: 66, step: 786, loss: 0.34341904520988464, mean loss: 0.33968388026325835
Epoch: 66, step: 787, loss: 0.29936668276786804, mean loss: 0.3396834606945378
Epoch: 66, step: 788, loss: 0.3430177867412567, mean loss: 0.3396834953934862
Epoch: 66, step: 789, loss: 0.2963446080684662, mean loss: 0.3396830443883524
Epoch: 66, step: 790, loss: 0.33063995838165283, mean loss: 0.33968295028266526
Epoch: 66, step: 791, loss: 0.30844372510910034, mean loss: 0.3396826251991532
Epoch: 66, step: 792, loss: 0.3699975907802582, mean loss: 0.33968294066129645
Epoch: 66, step: 793, loss: 0.34443801641464233, mean loss: 0.33968299014282316
Epoch: 66, step: 794, loss: 0.31633442640304565, mean loss: 0.3396827471791738
Epoch: 66, step: 795, loss: 0.29239243268966675, mean loss: 0.33968225508433
Epoch: 66, step: 796, loss: 0.33640024065971375, mean loss: 0.3396822209326102
Epoch: 66, step: 797, loss: 0.29580363631248474, mean loss: 0.3396817643491403
Epoch: 66, step: 798, loss: 0.34717637300491333, mean loss: 0.3396818423343089
Epoch: 66, step: 799, loss: 0.37112951278686523, mean loss: 0.3396821695597153
Epoch: 66, step: 800, loss: 0.3357401192188263, mean loss: 0.33968212854155455
Epoch: 66, step: 801, loss: 0.3807399272918701, mean loss: 0.3396825557552431
Epoch: 66, step: 802, loss: 0.32480549812316895, mean loss: 0.3396824009584267
Epoch: 66, step: 803, loss: 0.3231269121170044, mean loss: 0.33968222869920955
Epoch: 66, step: 804, loss: 0.35071972012519836, mean loss: 0.3396823435426834
Epoch: 66, step: 805, loss: 0.3234741687774658, mean loss: 0.33968217490076513
Epoch: 66, step: 806, loss: 0.3052568733692169, mean loss: 0.339681816718023
Epoch: 66, step: 807, loss: 0.37259262800216675, mean loss: 0.3396821591394822
Epoch: 66, step: 808, loss: 0.33696627616882324, mean loss: 0.33968213088229565
Epoch: 66, step: 809, loss: 0.31902316212654114, mean loss: 0.3396819159399485
Epoch: 66, step: 810, loss: 0.3382053077220917, mean loss: 0.3396819005770164
Epoch: 66, step: 811, loss: 0.3218452036380768, mean loss: 0.3396817150023261
Epoch: 66, step: 812, loss: 0.3991394639015198, mean loss: 0.33968233359996125
Epoch: 66, step: 813, loss: 0.3533417284488678, mean loss: 0.3396824757106465
Epoch: 66, step: 814, loss: 0.36171647906303406, mean loss: 0.33968270494735675
Epoch: 66, step: 815, loss: 0.364552766084671, mean loss: 0.33968296368706896
Epoch: 66, step: 816, loss: 0.3543735146522522, mean loss: 0.3396831165210071
Epoch: 66, step: 817, loss: 0.32975924015045166, mean loss: 0.3396830132784989
Epoch: 66, step: 818, loss: 0.3159804940223694, mean loss: 0.3396827666931941
Epoch: 66, step: 819, loss: 0.3145360052585602, mean loss: 0.3396825050856722
Epoch: 66, step: 820, loss: 0.36478644609451294, mean loss: 0.3396827662450065
Epoch: 66, step: 821, loss: 0.31701308488845825, mean loss: 0.3396825304120231
Epoch: 66, step: 822, loss: 0.3146507740020752, mean loss: 0.33968227000905193
Epoch: 66, step: 823, loss: 0.34476813673973083, mean loss: 0.3396823229162874
Epoch: 66, step: 824, loss: 0.33503660559654236, mean loss: 0.33968227458833933
Epoch: 66, step: 825, loss: 0.3268909156322479, mean loss: 0.33968214152520654
Epoch: 66, step: 826, loss: 0.351392537355423, mean loss: 0.3396822633422669
Epoch: 66, step: 827, loss: 0.3129613697528839, mean loss: 0.339681985381821
Epoch: 66, step: 828, loss: 0.31432974338531494, mean loss: 0.3396817216613296
Epoch: 66, step: 829, loss: 0.31294602155685425, mean loss: 0.3396814435526469
Epoch: 66, step: 830, loss: 0.3228021562099457, mean loss: 0.33968126797364506
Epoch: 66, step: 831, loss: 0.34200459718704224, mean loss: 0.3396812921407543
Epoch: 66, step: 832, loss: 0.3301258087158203, mean loss: 0.3396811927463128
Epoch: 66, step: 833, loss: 0.30556270480155945, mean loss: 0.3396808378555522
Epoch: 66, step: 834, loss: 0.3135606050491333, mean loss: 0.3396805661631817
Epoch: 66, step: 835, loss: 0.3305368721485138, mean loss: 0.3396804710550684
Epoch: 66, step: 836, loss: 0.32840242981910706, mean loss: 0.3396803537477673
Epoch: 66, step: 837, loss: 0.35342973470687866, mean loss: 0.33968049675894824
Epoch: 66, step: 838, loss: 0.32746005058288574, mean loss: 0.33968036965197035
Epoch: 66, step: 839, loss: 0.3113776445388794, mean loss: 0.3396800752734848
Epoch: 66, step: 840, loss: 0.34387245774269104, mean loss: 0.33968011887827415
Epoch: 66, step: 841, loss: 0.3420586585998535, mean loss: 0.33968014361710597
Epoch: 66, step: 842, loss: 0.3061455190181732, mean loss: 0.33967979483217664
Epoch: 66, step: 843, loss: 0.3517804741859436, mean loss: 0.3396799206868939
Epoch: 66, step: 844, loss: 0.3487502634525299, mean loss: 0.3396800150232132
Epoch: 66, step: 845, loss: 0.3105500638484955, mean loss: 0.33967971205960246
Epoch: 66, step: 846, loss: 0.3415030241012573, mean loss: 0.339679731022609
Epoch: 66, step: 847, loss: 0.32397356629371643, mean loss: 0.33967956767535956
Epoch: 66, step: 848, loss: 0.3352721333503723, mean loss: 0.3396795218376392
Epoch: 66, step: 849, loss: 0.29143887758255005, mean loss: 0.3396790201357417
Epoch: 66, step: 850, loss: 0.32991525530815125, mean loss: 0.339678918593806
Epoch: 66, step: 851, loss: 0.3043537735939026, mean loss: 0.33967855122052715
Epoch: 66, step: 852, loss: 0.3184732496738434, mean loss: 0.3396783306926244
Epoch: 66, step: 853, loss: 0.3119461238384247, mean loss: 0.3396780422901321
Epoch: 66, step: 854, loss: 0.34302765130996704, mean loss: 0.3396780771241988
Epoch: 66, step: 855, loss: 0.33565202355384827, mean loss: 0.3396780352559212
Epoch: 66, step: 856, loss: 0.3152093291282654, mean loss: 0.33967778080030897
Epoch: 66, step: 857, loss: 0.36061811447143555, mean loss: 0.33967799856131303
Epoch: 66, step: 858, loss: 0.336531400680542, mean loss: 0.33967796583981014
Epoch: 66, step: 859, loss: 0.31875699758529663, mean loss: 0.3396777482847141
Epoch: 66, step: 860, loss: 0.33418428897857666, mean loss: 0.33967769115936386
Epoch: 66, step: 861, loss: 0.2957000136375427, mean loss: 0.33967723384932164
Epoch: 66, step: 862, loss: 0.3133353590965271, mean loss: 0.3396769599312962
Epoch: 66, step: 863, loss: 0.33315375447273254, mean loss: 0.3396768920999442
Epoch: 66, step: 864, loss: 0.31107670068740845, mean loss: 0.33967659470482303
Epoch: 66, step: 865, loss: 0.3129909634590149, mean loss: 0.3396763172208754
Epoch: 66, step: 866, loss: 0.32887566089630127, mean loss: 0.3396762049140851
Epoch: 66, step: 867, loss: 0.3182341456413269, mean loss: 0.33967598195876264
Epoch: 66, step: 868, loss: 0.31949952244758606, mean loss: 0.3396757721653746
Epoch: 66, step: 869, loss: 0.34034067392349243, mean loss: 0.3396757790789038
Epoch: 66, step: 870, loss: 0.3223123252391815, mean loss: 0.3396755985387027
Epoch: 66, step: 871, loss: 0.2932884991168976, mean loss: 0.33967511622399404
Epoch: 66, step: 872, loss: 0.32555919885635376, mean loss: 0.33967496945379566
Epoch: 66, step: 873, loss: 0.337744802236557, mean loss: 0.33967494938509785
Epoch: 66, step: 874, loss: 0.2974626421928406, mean loss: 0.3396745104919175
Epoch: 66, step: 875, loss: 0.35880976915359497, mean loss: 0.33967470944449246
Epoch: 66, step: 876, loss: 0.337246298789978, mean loss: 0.33967468419615177
Epoch: 66, step: 877, loss: 0.31252622604370117, mean loss: 0.3396744019348331
Epoch: 66, step: 878, loss: 0.41241297125816345, mean loss: 0.3396751581866585
Epoch: 66, step: 879, loss: 0.30075475573539734, mean loss: 0.3396747535413698
Epoch: 66, step: 880, loss: 0.34287986159324646, mean loss: 0.33967478686369706
Epoch: 66, step: 881, loss: 0.3338630199432373, mean loss: 0.33967472644152624
Epoch: 66, step: 882, loss: 0.3169289827346802, mean loss: 0.339674489967328
Epoch: 66, step: 883, loss: 0.3725976347923279, mean loss: 0.33967483224645667
Epoch: 66, step: 884, loss: 0.34410473704338074, mean loss: 0.33967487830062915
Epoch: 66, step: 885, loss: 0.31925180554389954, mean loss: 0.33967466598050483
Epoch: 66, step: 886, loss: 0.3030514121055603, mean loss: 0.3396742852457804
Epoch: 66, step: 887, loss: 0.3285311460494995, mean loss: 0.33967416940309914
Epoch: 66, step: 888, loss: 0.35872185230255127, mean loss: 0.3396743674183695
Epoch: 66, step: 889, loss: 0.3119626045227051, mean loss: 0.3396740793363384
Epoch: 66, step: 890, loss: 0.340371310710907, mean loss: 0.33967408658444254
Epoch: 66, step: 891, loss: 0.320808082818985, mean loss: 0.3396738904639826
Epoch: 66, step: 892, loss: 0.32880526781082153, mean loss: 0.3396737774810138
Epoch: 66, step: 893, loss: 0.3347088694572449, mean loss: 0.33967372586967026
Epoch: 66, step: 894, loss: 0.3259032368659973, mean loss: 0.33967358272380593
Epoch: 66, step: 895, loss: 0.3327300250530243, mean loss: 0.33967351054545175
Epoch: 66, step: 896, loss: 0.3306336998939514, mean loss: 0.3396734165775029
Epoch: 66, step: 897, loss: 0.3516656458377838, mean loss: 0.3396735412342591
Epoch: 66, step: 898, loss: 0.30360516905784607, mean loss: 0.33967316631484723
Epoch: 66, step: 899, loss: 0.32484614849090576, mean loss: 0.33967301219425117
Epoch: 66, step: 900, loss: 0.3499976098537445, mean loss: 0.33967311951297324
Epoch: 66, step: 901, loss: 0.3292170464992523, mean loss: 0.3396730108287642
Epoch: 66, step: 902, loss: 0.35936644673347473, mean loss: 0.33967321552734026
Epoch: 66, step: 903, loss: 0.35243865847587585, mean loss: 0.3396733482132182
Epoch: 66, step: 904, loss: 0.33397147059440613, mean loss: 0.33967328894768567
Epoch: 66, step: 905, loss: 0.32359641790390015, mean loss: 0.33967312184581433
Epoch: 66, step: 906, loss: 0.3384547233581543, mean loss: 0.33967310918199745
Epoch: 66, step: 907, loss: 0.32072222232818604, mean loss: 0.33967291221190166
Epoch: 66, step: 908, loss: 0.38565337657928467, mean loss: 0.33967339011472525
Epoch: 66, step: 909, loss: 0.3701609671115875, mean loss: 0.33967370698729055
Epoch: 66, step: 910, loss: 0.3346402645111084, mean loss: 0.33967365467276084
Epoch: 66, step: 911, loss: 0.3331919312477112, mean loss: 0.33967358730638286
Epoch: 66, step: 912, loss: 0.32764241099357605, mean loss: 0.33967346226427686
Epoch: 66, step: 913, loss: 0.2994261682033539, mean loss: 0.33967304397150355
Epoch: 66, step: 914, loss: 0.31113746762275696, mean loss: 0.3396727474024647
Epoch: 66, step: 915, loss: 0.3427417576313019, mean loss: 0.3396727792982268
Epoch: 66, step: 916, loss: 0.31796374917030334, mean loss: 0.3396725536818839
Epoch: 66, step: 917, loss: 0.33069291710853577, mean loss: 0.33967246035981025
Epoch: 66, step: 918, loss: 0.35374224185943604, mean loss: 0.339672606580376
Epoch: 66, step: 919, loss: 0.3111932873725891, mean loss: 0.33967231061139525
Epoch: 66, step: 920, loss: 0.35194289684295654, mean loss: 0.33967243813112746
Epoch: 66, step: 921, loss: 0.3150521516799927, mean loss: 0.33967218227214496
Epoch: 66, step: 922, loss: 0.3010752201080322, mean loss: 0.3396717811688978
Epoch: 66, step: 923, loss: 0.3411354422569275, mean loss: 0.3396717963792429
Epoch: 66, step: 924, loss: 0.3646495044231415, mean loss: 0.3396720559445303
Epoch: 66, step: 925, loss: 0.3208923041820526, mean loss: 0.33967186078967465
Epoch: 66, step: 926, loss: 0.3411804735660553, mean loss: 0.3396718764666683
Epoch: 66, step: 927, loss: 0.30865806341171265, mean loss: 0.3396715541849631
Epoch: 66, step: 928, loss: 0.3283357322216034, mean loss: 0.33967143638938396
Epoch: 66, step: 929, loss: 0.30126136541366577, mean loss: 0.33967103725736225
Epoch: 66, step: 930, loss: 0.3274102210998535, mean loss: 0.339670909852404
Epoch: 66, step: 931, loss: 0.3478905260562897, mean loss: 0.33967099526343736
Epoch: 66, step: 932, loss: 0.31445661187171936, mean loss: 0.3396707332604303
Epoch: 66, step: 933, loss: 0.27707043290138245, mean loss: 0.33967008278660127
Epoch: 66, step: 934, loss: 0.35672396421432495, mean loss: 0.33967025999003675
Epoch: 66, step: 935, loss: 0.3266233503818512, mean loss: 0.3396701244236443
Epoch: 66, step: 936, loss: 0.34232306480407715, mean loss: 0.33967015198923883
Epoch: 66, step: 937, loss: 0.32525208592414856, mean loss: 0.3396700021786981
Epoch: 66, step: 938, loss: 0.3402077853679657, mean loss: 0.3396700077664623
Epoch: 66, step: 939, loss: 0.3217259645462036, mean loss: 0.339669821323222
Epoch: 66, step: 940, loss: 0.38263067603111267, mean loss: 0.33967026769295244
Epoch: 66, step: 941, loss: 0.3424275815486908, mean loss: 0.3396702963415597
Epoch: 66, step: 942, loss: 0.31596797704696655, mean loss: 0.3396700500760211
Epoch: 66, step: 943, loss: 0.33742555975914, mean loss: 0.3396700267561566
Epoch: 66, step: 944, loss: 0.35107576847076416, mean loss: 0.3396701452586004
Epoch: 66, step: 945, loss: 0.3385978639125824, mean loss: 0.339670134118015
Epoch: 66, step: 946, loss: 0.3763575851917267, mean loss: 0.3396705152823777
Epoch: 66, step: 947, loss: 0.3255845308303833, mean loss: 0.3396703689375282
Epoch: 66, step: 948, loss: 0.3612392544746399, mean loss: 0.339670593022861
Epoch: 66, step: 949, loss: 0.3119661211967468, mean loss: 0.3396703051961543
Epoch: 66, step: 950, loss: 0.3558609187602997, mean loss: 0.3396704734015833
Epoch: 66, step: 951, loss: 0.3863637447357178, mean loss: 0.3396709584962406
Epoch: 66, step: 952, loss: 0.3778804838657379, mean loss: 0.33967135544945304
Epoch: 66, step: 953, loss: 0.3258918225765228, mean loss: 0.3396712122973735
Epoch: 66, step: 954, loss: 0.33710119128227234, mean loss: 0.339671185598353
Epoch: 66, step: 955, loss: 0.3528943359851837, mean loss: 0.33967132296746155
Epoch: 66, step: 956, loss: 0.3370841443538666, mean loss: 0.33967129609075536
Epoch: 66, step: 957, loss: 0.2998674511909485, mean loss: 0.3396708825958675
Epoch: 66, step: 958, loss: 0.33488479256629944, mean loss: 0.33967083287697203
Epoch: 66, step: 959, loss: 0.34453892707824707, mean loss: 0.33967088344721846
Epoch: 66, step: 960, loss: 0.3327850103378296, mean loss: 0.33967081191682724
Epoch: 66, step: 961, loss: 0.35671359300613403, mean loss: 0.33967098895525294
Epoch: 66, step: 962, loss: 0.3013724386692047, mean loss: 0.33967059111850423
Epoch: 66, step: 963, loss: 0.3026389181613922, mean loss: 0.33967020644578894
Epoch: 66, step: 964, loss: 0.2923627495765686, mean loss: 0.339669715036749
Epoch: 66, step: 965, loss: 0.3397653102874756, mean loss: 0.33966971602974005
Epoch: 66, step: 966, loss: 0.3218323588371277, mean loss: 0.33966953074697376
Epoch: 66, step: 967, loss: 0.32312723994255066, mean loss: 0.3396693589182925
Epoch: 66, step: 968, loss: 0.36723387241363525, mean loss: 0.3396696452344299
Epoch: 66, step: 969, loss: 0.33907508850097656, mean loss: 0.33966963905875697
Epoch: 66, step: 970, loss: 0.3174728751182556, mean loss: 0.33966940850291233
Epoch: 66, step: 971, loss: 0.32838431000709534, mean loss: 0.33966929128679935
Epoch: 66, step: 972, loss: 0.31532973051071167, mean loss: 0.3396690384791633
Epoch: 66, step: 973, loss: 0.3027811348438263, mean loss: 0.3396686553396752
Epoch: 66, step: 974, loss: 0.3503861725330353, mean loss: 0.33966876665696344
Epoch: 66, step: 975, loss: 0.34012338519096375, mean loss: 0.33966877137880114
Epoch: 66, step: 976, loss: 0.31667304039001465, mean loss: 0.33966853253904056
Epoch: 66, step: 977, loss: 0.3196025490760803, mean loss: 0.33966832413057935
Epoch: 66, step: 978, loss: 0.3151392340660095, mean loss: 0.33966806937023675
Epoch: 66, step: 979, loss: 0.30350443720817566, mean loss: 0.33966769377686545
Epoch: 66, step: 980, loss: 0.3621186316013336, mean loss: 0.3396679269485726
Epoch: 66, step: 981, loss: 0.3196863830089569, mean loss: 0.33966771942573504
Epoch: 66, step: 982, loss: 0.35589173436164856, mean loss: 0.3396678879221565
Epoch: 66, step: 983, loss: 0.3174877166748047, mean loss: 0.3396676575697632
Epoch: 66, step: 984, loss: 0.34384235739707947, mean loss: 0.3396677009257003
Epoch: 66, step: 985, loss: 0.3241800367832184, mean loss: 0.33966754008174826
Epoch: 66, step: 986, loss: 0.3390637934207916, mean loss: 0.33966753381172654
Epoch: 66, step: 987, loss: 0.2990351915359497, mean loss: 0.3396671118416535
Epoch: 66, step: 988, loss: 0.30122917890548706, mean loss: 0.33966671266483967
Epoch: 66, step: 989, loss: 0.30655381083488464, mean loss: 0.33966636879188983
Epoch: 66, step: 990, loss: 0.32899853587150574, mean loss: 0.33966625800905664
Epoch: 66, step: 991, loss: 0.3154948055744171, mean loss: 0.33966600699704746
Epoch: 66, step: 992, loss: 0.3330666124820709, mean loss: 0.33966593846537446
Epoch: 66, step: 993, loss: 0.28394779562950134, mean loss: 0.33966535986412794
Epoch: 66, step: 994, loss: 0.3498626947402954, mean loss: 0.33966546575655543
Epoch: 66, step: 995, loss: 0.348371684551239, mean loss: 0.3396655561638119
Epoch: 66, step: 996, loss: 0.3779221177101135, mean loss: 0.33966595342408484
Epoch: 66, step: 997, loss: 0.3044624924659729, mean loss: 0.33966558787133455
Epoch: 66, step: 998, loss: 0.33242136240005493, mean loss: 0.339665512648076
Epoch: 66, step: 999, loss: 0.3543785810470581, mean loss: 0.33966566542541027
Epoch: 66, step: 1000, loss: 0.3038058280944824, mean loss: 0.33966529306844717
Epoch: 66, step: 1001, loss: 0.37530243396759033, mean loss: 0.3396656631091601
Epoch: 66, step: 1002, loss: 0.3346688151359558, mean loss: 0.3396656112245829
Epoch: 66, step: 1003, loss: 0.40841272473335266, mean loss: 0.3396663250501582
Epoch: 66, step: 1004, loss: 0.3066175878047943, mean loss: 0.33966598189700276
Epoch: 66, step: 1005, loss: 0.32623744010925293, mean loss: 0.33966584246660314
Epoch: 66, step: 1006, loss: 0.31279224157333374, mean loss: 0.3396655634371995
Epoch: 66, step: 1007, loss: 0.35321953892707825, mean loss: 0.3396657041670721
Epoch: 66, step: 1008, loss: 0.3078099191188812, mean loss: 0.3396653734143695
Epoch: 66, step: 1009, loss: 0.33505043387413025, mean loss: 0.3396653254988064
Epoch: 66, step: 1010, loss: 0.3271094858646393, mean loss: 0.33966519513656135
Epoch: 66, step: 1011, loss: 0.31902486085891724, mean loss: 0.3396649808384771
Epoch: 66, step: 1012, loss: 0.346748948097229, mean loss: 0.3396650543869396
Epoch: 66, step: 1013, loss: 0.3415161073207855, mean loss: 0.3396650736050809
Epoch: 66, step: 1014, loss: 0.3460169732570648, mean loss: 0.33966513955156763
Epoch: 66, step: 1015, loss: 0.31569772958755493, mean loss: 0.3396648907204841
Epoch: 66, step: 1016, loss: 0.3523184657096863, mean loss: 0.33966502208929245
Epoch: 66, step: 1017, loss: 0.34671375155448914, mean loss: 0.3396650952681038
Epoch: 66, step: 1018, loss: 0.3733482360839844, mean loss: 0.33966544495759454
Epoch: 66, step: 1019, loss: 0.2960261106491089, mean loss: 0.33966499191023036
Epoch: 66, step: 1020, loss: 0.3214366137981415, mean loss: 0.33966480267194216
Epoch: 66, step: 1021, loss: 0.3455028831958771, mean loss: 0.3396648632794679
Epoch: 66, step: 1022, loss: 0.3535856306552887, mean loss: 0.33966500779520464
Epoch: 66, step: 1023, loss: 0.2991560697555542, mean loss: 0.3396645872639153
Epoch: 66, step: 1024, loss: 0.2829109728336334, mean loss: 0.33966399809954706
Epoch: 66, step: 1025, loss: 0.324686199426651, mean loss: 0.33966384261528804
Epoch: 66, step: 1026, loss: 0.31316155195236206, mean loss: 0.3396635674983406
Epoch: 66, step: 1027, loss: 0.3325662910938263, mean loss: 0.33966349382317135
Epoch: 66, step: 1028, loss: 0.3506738245487213, mean loss: 0.3396636081176574
Epoch: 66, step: 1029, loss: 0.32066017389297485, mean loss: 0.3396634108515392
Epoch: 66, step: 1030, loss: 0.31995582580566406, mean loss: 0.3396632062780712
Epoch: 66, step: 1031, loss: 0.3437976837158203, mean loss: 0.3396632491953341
Epoch: 66, step: 1032, loss: 0.32432302832603455, mean loss: 0.33966308996034783
Epoch: 66, step: 1033, loss: 0.3356793522834778, mean loss: 0.33966304860867275
Epoch: 66, step: 1034, loss: 0.3415628969669342, mean loss: 0.33966306832912196
Epoch: 66, step: 1035, loss: 0.32434919476509094, mean loss: 0.33966290937257676
Epoch: 66, step: 1036, loss: 0.342596173286438, mean loss: 0.33966293981926005
Epoch: 66, step: 1037, loss: 0.37680044770240784, mean loss: 0.339663325295043
Epoch: 66, step: 1038, loss: 0.30944210290908813, mean loss: 0.33966301161140866
Epoch: 66, step: 1039, loss: 0.35981473326683044, mean loss: 0.3396632207756706
Epoch: 66, step: 1040, loss: 0.3128141760826111, mean loss: 0.33966294209961384
Epoch: 66, step: 1041, loss: 0.32011204957962036, mean loss: 0.3396627391758545
Epoch: 66, step: 1042, loss: 0.32526493072509766, mean loss: 0.3396625897388357
Epoch: 66, step: 1043, loss: 0.34376445412635803, mean loss: 0.33966263231226107
Epoch: 66, step: 1044, loss: 0.31899237632751465, mean loss: 0.33966241777701955
Epoch: 66, step: 1045, loss: 0.35650646686553955, mean loss: 0.33966259259849424
Epoch: 66, step: 1046, loss: 0.3268754184246063, mean loss: 0.3396624598840006
Epoch: 66, step: 1047, loss: 0.3436988890171051, mean loss: 0.33966250177653146
Epoch: 66, step: 1048, loss: 0.33795028924942017, mean loss: 0.3396624840063268
Epoch: 66, step: 1049, loss: 0.38275283575057983, mean loss: 0.33966293121507524
Epoch: 66, step: 1050, loss: 0.3252154588699341, mean loss: 0.3396627812750374
Epoch: 66, step: 1051, loss: 0.3313210904598236, mean loss: 0.339662694703461
Epoch: 66, step: 1052, loss: 0.3248223662376404, mean loss: 0.3396625406894458
Epoch: 66, step: 1053, loss: 0.3351222276687622, mean loss: 0.33966249357023387
Epoch: 66, step: 1054, loss: 0.3225323259830475, mean loss: 0.33966231579579054
Epoch: 66, step: 1055, loss: 0.3420908749103546, mean loss: 0.33966234099877013
Epoch: 66, step: 1056, loss: 0.3605150282382965, mean loss: 0.33966255740050155
Epoch: 66, step: 1057, loss: 0.3785582482814789, mean loss: 0.33966296104188387
Epoch: 66, step: 1058, loss: 0.3401745557785034, mean loss: 0.3396629663509209
Epoch: 66, step: 1059, loss: 0.3305475413799286, mean loss: 0.33966287175724513
Epoch: 66, step: 1060, loss: 0.2773115634918213, mean loss: 0.339662224724523
Epoch: 66, step: 1061, loss: 0.35460352897644043, mean loss: 0.3396623797719905
Epoch: 66, step: 1062, loss: 0.29627639055252075, mean loss: 0.339661929555742
Epoch: 66, step: 1063, loss: 0.3761255443096161, mean loss: 0.33966230793461
Epoch: 66, step: 1064, loss: 0.30531278252601624, mean loss: 0.3396619514971103
Epoch: 66, step: 1065, loss: 0.31116899847984314, mean loss: 0.33966165583504726
Epoch: 66, step: 1066, loss: 0.3555286228656769, mean loss: 0.339661820479671
Epoch: 66, step: 1067, loss: 0.31068217754364014, mean loss: 0.3396615197736263
Epoch: 66, step: 1068, loss: 0.3484379053115845, mean loss: 0.3396616108404763
Epoch: 66, step: 1069, loss: 0.3295925259590149, mean loss: 0.3396615063612093
Epoch: 66, step: 1070, loss: 0.34740790724754333, mean loss: 0.3396615867389098
Epoch: 66, step: 1071, loss: 0.31889477372169495, mean loss: 0.3396613712618925
Epoch: 66, step: 1072, loss: 0.3201083838939667, mean loss: 0.3396611683816683
Epoch: 66, step: 1073, loss: 0.29503950476646423, mean loss: 0.33966070539567966
Epoch: 66, step: 1074, loss: 0.32533931732177734, mean loss: 0.33966055680119256
Epoch: 66, step: 1075, loss: 0.32572615146636963, mean loss: 0.33966041222342397
Epoch: 66, step: 1076, loss: 0.3320464789867401, mean loss: 0.33966033322514383
Epoch: 66, step: 1077, loss: 0.35622671246528625, mean loss: 0.3396605051076451
Epoch: 66, step: 1078, loss: 0.3339746594429016, mean loss: 0.33966044611544044
Epoch: 66, step: 1079, loss: 0.32016804814338684, mean loss: 0.3396602438785757
Epoch: 66, step: 1080, loss: 0.3006390929222107, mean loss: 0.33965983903185726
Epoch: 66, step: 1081, loss: 0.3324248194694519, mean loss: 0.33965976396888586
Epoch: 66, step: 1082, loss: 0.35224688053131104, mean loss: 0.339659894558245
Epoch: 66, step: 1083, loss: 0.3173352777957916, mean loss: 0.3396596629462522
Epoch: 66, step: 1084, loss: 0.33595821261405945, mean loss: 0.33965962454508264
Epoch: 66, step: 1085, loss: 0.3020138144493103, mean loss: 0.3396592339878662
Epoch: 66, step: 1086, loss: 0.3719973564147949, mean loss: 0.3396595694768893
Epoch: 66, step: 1087, loss: 0.32785239815711975, mean loss: 0.3396594469856938
Epoch: 66, step: 1088, loss: 0.3997609317302704, mean loss: 0.33966007049035435
Epoch: 66, step: 1089, loss: 0.27914804220199585, mean loss: 0.3396594427331466
Epoch: 66, step: 1090, loss: 0.365203320980072, mean loss: 0.3396597077248811
Epoch: 66, step: 1091, loss: 0.31507664918899536, mean loss: 0.3396594527033186
Epoch: 66, step: 1092, loss: 0.3513154983520508, mean loss: 0.3396595736204182
Epoch: 66, step: 1093, loss: 0.3117813467979431, mean loss: 0.3396592844211939
Epoch: 66, step: 1094, loss: 0.33949753642082214, mean loss: 0.3396592827432927
Epoch: 66, step: 1095, loss: 0.35658565163612366, mean loss: 0.33965945832803224
Epoch: 66, step: 1096, loss: 0.3517882227897644, mean loss: 0.33965958414378583
Epoch: 66, step: 1097, loss: 0.34553128480911255, mean loss: 0.33965964505228013
Epoch: 66, step: 1098, loss: 0.31217828392982483, mean loss: 0.33965935998479135
Epoch: 66, step: 1099, loss: 0.30051788687705994, mean loss: 0.33965895396975976
Epoch: 66, step: 1100, loss: 0.3275166451931, mean loss: 0.33965882801873254
Epoch: 66, step: 1101, loss: 0.3506978452205658, mean loss: 0.33965894252423223
Epoch: 66, step: 1102, loss: 0.3341897130012512, mean loss: 0.3396588857936056
Epoch: 66, step: 1103, loss: 0.33395591378211975, mean loss: 0.339658826639054
Epoch: 66, step: 1104, loss: 0.3114539384841919, mean loss: 0.33965853408453983
Epoch: 66, step: 1105, loss: 0.3091055154800415, mean loss: 0.339658217177387
Epoch: 66, step: 1106, loss: 0.3289949893951416, mean loss: 0.3396581065756114
Epoch: 66, step: 1107, loss: 0.2973286211490631, mean loss: 0.33965766752771875
Epoch: 66, step: 1108, loss: 0.3338465094566345, mean loss: 0.3396576072541242
Epoch: 66, step: 1109, loss: 0.33871394395828247, mean loss: 0.3396575974665073
Epoch: 66, step: 1110, loss: 0.3496403396129608, mean loss: 0.3396577010058129
Epoch: 66, step: 1111, loss: 0.3038601279258728, mean loss: 0.33965732972331747
Epoch: 66, step: 1112, loss: 0.3665623068809509, mean loss: 0.3396576087713812
Epoch: 66, step: 1113, loss: 0.3421850800514221, mean loss: 0.33965763498506824
Epoch: 66, step: 1114, loss: 0.30523574352264404, mean loss: 0.33965727798186907
Epoch: 66, step: 1115, loss: 0.3092733919620514, mean loss: 0.33965696286170705
Epoch: 66, step: 1116, loss: 0.30815815925598145, mean loss: 0.33965663618179703
Epoch: 66, step: 1117, loss: 0.3442365229129791, mean loss: 0.3396566836801556
Epoch: 66, step: 1118, loss: 0.41355884075164795, mean loss: 0.3396574501171786
Epoch: 66, step: 1119, loss: 0.3313847482204437, mean loss: 0.3396573643221287
Epoch: 66, step: 1120, loss: 0.3289136588573456, mean loss: 0.33965725290179716
Epoch: 66, step: 1121, loss: 0.323709636926651, mean loss: 0.33965708751470264
Epoch: 66, step: 1122, loss: 0.34270358085632324, mean loss: 0.3396571191084818
Epoch: 66, step: 1123, loss: 0.3453698754310608, mean loss: 0.33965717835223175
Epoch: 66, step: 1124, loss: 0.29921653866767883, mean loss: 0.3396567589696841
Epoch: 66, step: 1125, loss: 0.4134722352027893, mean loss: 0.33965752445217123
Epoch: 66, step: 1126, loss: 0.3467751443386078, mean loss: 0.33965759826266667
Epoch: 66, step: 1127, loss: 0.41582128405570984, mean loss: 0.3396583880802147
Epoch: 66, step: 1128, loss: 0.3532572388648987, mean loss: 0.3396585290988575
Epoch: 66, step: 1129, loss: 0.31996867060661316, mean loss: 0.339658324919227
Epoch: 66, step: 1130, loss: 0.3318037688732147, mean loss: 0.3396582434700016
Epoch: 66, step: 1131, loss: 0.3216554820537567, mean loss: 0.3396580567890794
Epoch: 66, step: 1132, loss: 0.34333327412605286, mean loss: 0.33965809489911325
Epoch: 66, step: 1133, loss: 0.33306679129600525, mean loss: 0.33965802655153654
Epoch: 66, step: 1134, loss: 0.298107773065567, mean loss: 0.33965759570661397
Epoch: 66, step: 1135, loss: 0.3462580144405365, mean loss: 0.3396576641472894
Epoch: 66, step: 1136, loss: 0.3749719560146332, mean loss: 0.3396580303223795
Epoch: 66, step: 1137, loss: 0.32819291949272156, mean loss: 0.33965791144148916
Epoch: 66, step: 1138, loss: 0.3214498460292816, mean loss: 0.3396577226453566
Epoch: 66, step: 1139, loss: 0.31711992621421814, mean loss: 0.33965748895745035
Epoch: 66, step: 1140, loss: 0.3382326066493988, mean loss: 0.33965747418341014
Epoch: 66, step: 1141, loss: 0.31151440739631653, mean loss: 0.33965718238212456
Epoch: 66, step: 1142, loss: 0.336404412984848, mean loss: 0.3396571486561466
Epoch: 66, step: 1143, loss: 0.3959041237831116, mean loss: 0.33965773184061
Epoch: 66, step: 1144, loss: 0.3100943863391876, mean loss: 0.33965742532270415
Epoch: 66, step: 1145, loss: 0.3373488783836365, mean loss: 0.3396574013875363
Epoch: 66, step: 1146, loss: 0.3336114287376404, mean loss: 0.3396573387031406
Epoch: 66, step: 1147, loss: 0.3154200315475464, mean loss: 0.3396570874143425
Epoch: 66, step: 1148, loss: 0.28657758235931396, mean loss: 0.33965653709962906
Epoch: 66, step: 1149, loss: 0.31137073040008545, mean loss: 0.3396562438426703
Epoch: 66, step: 1150, loss: 0.31720399856567383, mean loss: 0.3396560110683685
Epoch: 66, step: 1151, loss: 0.380416601896286, mean loss: 0.33965643365059073
Epoch: 66, step: 1152, loss: 0.32330015301704407, mean loss: 0.33965626407989463
Epoch: 66, step: 1153, loss: 0.3843541145324707, mean loss: 0.33965672747173825
Epoch: 66, step: 1154, loss: 0.33875077962875366, mean loss: 0.3396567180796873
Epoch: 66, step: 1155, loss: 0.3129505217075348, mean loss: 0.3396564412167765
Epoch: 66, step: 1156, loss: 0.34950631856918335, mean loss: 0.3396565433293127
Epoch: 66, step: 1157, loss: 0.36608415842056274, mean loss: 0.33965681729849323
Epoch: 66, step: 1158, loss: 0.32249096035957336, mean loss: 0.33965663934573476
Epoch: 66, step: 1159, loss: 0.32744887471199036, mean loss: 0.3396565127931905
Epoch: 66, step: 1160, loss: 0.34033316373825073, mean loss: 0.3396565198076615
Epoch: 66, step: 1161, loss: 0.3093770146369934, mean loss: 0.3396562059198132
Epoch: 66, step: 1162, loss: 0.34570765495300293, mean loss: 0.33965626865058157
Epoch: 66, step: 1163, loss: 0.29621464014053345, mean loss: 0.33965581832893593
Epoch: 66, step: 1164, loss: 0.3047601878643036, mean loss: 0.3396554565999819
Epoch: 66, step: 1165, loss: 0.31747332215309143, mean loss: 0.33965522666182035
Epoch: 66, step: 1166, loss: 0.30061137676239014, mean loss: 0.3396548219407135
Epoch: 66, step: 1167, loss: 0.3337516188621521, mean loss: 0.3396547607498697
Epoch: 66, step: 1168, loss: 0.3275159001350403, mean loss: 0.3396546349233627
Epoch: 66, step: 1169, loss: 0.329008549451828, mean loss: 0.3396545245715013
Epoch: 66, step: 1170, loss: 0.3732928931713104, mean loss: 0.33965487324596205
Epoch: 66, step: 1171, loss: 0.3114132881164551, mean loss: 0.3396545805142451
Epoch: 66, step: 1172, loss: 0.3054609000682831, mean loss: 0.3396542260911137
Epoch: 66, step: 1173, loss: 0.30522620677948, mean loss: 0.3396538692427201
Epoch: 66, step: 1174, loss: 0.33458322286605835, mean loss: 0.33965381668572453
Epoch: 66, step: 1175, loss: 0.35755541920661926, mean loss: 0.33965400223301434
Epoch: 66, step: 1176, loss: 0.35023218393325806, mean loss: 0.3396541118730647
Epoch: 66, step: 1177, loss: 0.31685394048690796, mean loss: 0.3396538755577791
Epoch: 66, step: 1178, loss: 0.3256779611110687, mean loss: 0.33965373070413185
Epoch: 66, step: 1179, loss: 0.3146970868110657, mean loss: 0.33965347204317364
Epoch: 66, step: 1180, loss: 0.35388243198394775, mean loss: 0.33965361951645906
Epoch: 66, step: 1181, loss: 0.30245381593704224, mean loss: 0.33965323397033237
Epoch: 66, step: 1182, loss: 0.33320876955986023, mean loss: 0.33965316717932
Epoch: 66, step: 1183, loss: 0.3660498261451721, mean loss: 0.339653440753847
Epoch: 66, step: 1184, loss: 0.3530847132205963, mean loss: 0.339653579953885
Epoch: 66, step: 1185, loss: 0.297697514295578, mean loss: 0.3396531451309432
Epoch: 66, step: 1186, loss: 0.3280635178089142, mean loss: 0.33965302501997613
Epoch: 66, step: 1187, loss: 0.3417740762233734, mean loss: 0.33965304700160365
Epoch: 66, step: 1188, loss: 0.31200531125068665, mean loss: 0.3396527604757857
Epoch: 66, step: 1189, loss: 0.31453579664230347, mean loss: 0.33965250018018356
Epoch: 66, step: 1190, loss: 0.35206687450408936, mean loss: 0.33965262883321556
Epoch: 66, step: 1191, loss: 0.29922646284103394, mean loss: 0.3396522098918502
Epoch: 66, step: 1192, loss: 0.27580225467681885, mean loss: 0.3396515482137129
Epoch: 66, step: 1193, loss: 0.36494842171669006, mean loss: 0.3396518103629129
Epoch: 66, step: 1194, loss: 0.34703174233436584, mean loss: 0.3396518868396844
Epoch: 66, step: 1195, loss: 0.29128894209861755, mean loss: 0.33965138566927255
Epoch: 66, step: 1196, loss: 0.364936888217926, mean loss: 0.33965164769249045
Epoch: 66, step: 1197, loss: 0.33174440264701843, mean loss: 0.3396515657538255
Epoch: 66, step: 1198, loss: 0.2901953458786011, mean loss: 0.3396510532700698
Epoch: 66, step: 1199, loss: 0.3224053680896759, mean loss: 0.3396508745657137
Epoch: 66, step: 1200, loss: 0.3485857844352722, mean loss: 0.3396509671506561
Epoch: 66, step: 1201, loss: 0.31902050971984863, mean loss: 0.3396507533768241
Epoch: 66, step: 1202, loss: 0.338809072971344, mean loss: 0.33965074465538
Epoch: 66, step: 1203, loss: 0.3845679461956024, mean loss: 0.33965121008002397
Epoch: 66, step: 1204, loss: 0.30690810084342957, mean loss: 0.33965087080483475
Epoch: 66, step: 1205, loss: 0.342574805021286, mean loss: 0.3396509011015316
Epoch: 66, step: 1206, loss: 0.35368022322654724, mean loss: 0.33965104646653793
Epoch: 66, step: 1207, loss: 0.3175705075263977, mean loss: 0.3396508176811129
Epoch: 66, step: 1208, loss: 0.31340160965919495, mean loss: 0.33965054570523373
Epoch: 66, step: 1209, loss: 0.3118347227573395, mean loss: 0.3396502575001759
Epoch: 66, step: 1210, loss: 0.2999788522720337, mean loss: 0.3396498464614231
Epoch: 66, step: 1211, loss: 0.30807965993881226, mean loss: 0.339649519363465
Epoch: 66, step: 1212, loss: 0.34695085883140564, mean loss: 0.33964959501168723
Epoch: 66, step: 1213, loss: 0.3425038754940033, mean loss: 0.3396496245842072
Epoch: 66, step: 1214, loss: 0.3200095295906067, mean loss: 0.33964942109997104
Epoch: 66, step: 1215, loss: 0.3608047664165497, mean loss: 0.33964964028092126
Epoch: 66, step: 1216, loss: 0.30496475100517273, mean loss: 0.3396492809302175
Epoch: 66, step: 1217, loss: 0.34494274854660034, mean loss: 0.33964933577230133
Epoch: 66, step: 1218, loss: 0.33354058861732483, mean loss: 0.3396492724843062
Epoch: 66, step: 1219, loss: 0.3524181842803955, mean loss: 0.3396494047717352
Epoch: 66, step: 1220, loss: 0.3552699089050293, mean loss: 0.33964956660031986
Epoch: 66, step: 1221, loss: 0.3517938256263733, mean loss: 0.33964969241366577
Epoch: 66, step: 1222, loss: 0.3082667887210846, mean loss: 0.3396493672931949
Epoch: 66, step: 1223, loss: 0.3204768896102905, mean loss: 0.3396491686723006
Epoch: 66, step: 1224, loss: 0.3473401963710785, mean loss: 0.3396492483481255
Epoch: 66, step: 1225, loss: 0.36801791191101074, mean loss: 0.33964954223255067
Epoch: 66, step: 1226, loss: 0.331879585981369, mean loss: 0.3396494617407268
Epoch: 66, step: 1227, loss: 0.34405791759490967, mean loss: 0.33964950740906324
Epoch: 66, step: 1228, loss: 0.29852065443992615, mean loss: 0.33964908134903227
Epoch: 66, step: 1229, loss: 0.3015352189540863, mean loss: 0.33964868652583635
Epoch: 66, step: 1230, loss: 0.33059531450271606, mean loss: 0.33964859274252435
Epoch: 66, step: 1231, loss: 0.2934357225894928, mean loss: 0.33964811403126477
Epoch: 66, step: 1232, loss: 0.3105311095714569, mean loss: 0.3396478124162937
Epoch: 66, step: 1233, loss: 0.29758304357528687, mean loss: 0.3396473766835373
Epoch: 66, step: 1234, loss: 0.33334940671920776, mean loss: 0.33964731144596527
Epoch: 66, step: 1235, loss: 0.34218695759773254, mean loss: 0.33964733775263767
Epoch: 66, step: 1236, loss: 0.3271179497241974, mean loss: 0.33964720796956077
Epoch: 66, step: 1237, loss: 0.3660562038421631, mean loss: 0.33964748151885404
Epoch: 66, step: 1238, loss: 0.34714072942733765, mean loss: 0.3396475591345062
Epoch: 66, step: 1239, loss: 0.30090615153312683, mean loss: 0.33964715785211064
Epoch: 66, step: 1240, loss: 0.32013997435569763, mean loss: 0.3396469557993529
Epoch: 66, step: 1241, loss: 0.2858772873878479, mean loss: 0.3396463988661976
Epoch: 66, step: 1242, loss: 0.31346774101257324, mean loss: 0.33964612771683145
Epoch: 66, step: 1243, loss: 0.32767653465270996, mean loss: 0.33964600374126425
Epoch: 66, step: 1244, loss: 0.31579428911209106, mean loss: 0.3396457566986783
Epoch: 66, step: 1245, loss: 0.3578438460826874, mean loss: 0.33964594518225555
Epoch: 66, step: 1246, loss: 0.307861864566803, mean loss: 0.3396456159875231
Epoch: 66, step: 1247, loss: 0.3378777801990509, mean loss: 0.3396455976778476
Epoch: 66, step: 1248, loss: 0.3560364544391632, mean loss: 0.33964576743804936
Epoch: 66, step: 1249, loss: 0.33099016547203064, mean loss: 0.33964567779285637
Epoch: 66, step: 1250, loss: 0.34401556849479675, mean loss: 0.3396457230509031
Epoch: 66, step: 1251, loss: 0.3836808204650879, mean loss: 0.3396461791085009
Epoch: 66, step: 1252, loss: 0.28630301356315613, mean loss: 0.33964562665590253
Epoch: 66, step: 1253, loss: 0.3136569559574127, mean loss: 0.3396453575050222
Epoch: 66, step: 1254, loss: 0.3274317979812622, mean loss: 0.33964523101697325
Epoch: 66, step: 1255, loss: 0.3311378061771393, mean loss: 0.3396451429119107
Epoch: 66, step: 1256, loss: 0.3485490679740906, mean loss: 0.3396452351222758
Epoch: 66, step: 1257, loss: 0.3535791337490082, mean loss: 0.3396453794222968
Epoch: 66, step: 1258, loss: 0.3437735140323639, mean loss: 0.339645422172984
Epoch: 66, step: 1259, loss: 0.2971152663230896, mean loss: 0.3396449817380823
Epoch: 66, step: 1260, loss: 0.3055892884731293, mean loss: 0.3396446290668943
Epoch: 66, step: 1261, loss: 0.3147513270378113, mean loss: 0.3396443712815244
Epoch: 66, step: 1262, loss: 0.3324131667613983, mean loss: 0.3396442963987537
Epoch: 66, step: 1263, loss: 0.3622421622276306, mean loss: 0.33964453040863096
Epoch: 66, step: 1264, loss: 0.32170534133911133, mean loss: 0.33964434464312576
Epoch: 66, step: 1265, loss: 0.3125842809677124, mean loss: 0.33964406443122064
Epoch: 66, step: 1266, loss: 0.3491584360599518, mean loss: 0.33964416295325756
Epoch: 66, step: 1267, loss: 0.38918113708496094, mean loss: 0.33964467590705505
Epoch: 66, step: 1268, loss: 0.3233824372291565, mean loss: 0.3396445075138325
Epoch: 66, step: 1269, loss: 0.3268262445926666, mean loss: 0.33964437478387494
Epoch: 66, step: 1270, loss: 0.33166131377220154, mean loss: 0.339644292122099
Epoch: 66, step: 1271, loss: 0.31288832426071167, mean loss: 0.3396440150763748
Epoch: 66, step: 1272, loss: 0.32918334007263184, mean loss: 0.33964390676202455
Epoch: 66, step: 1273, loss: 0.3391658365726471, mean loss: 0.33964390181193044
Epoch: 66, step: 1274, loss: 0.3805326223373413, mean loss: 0.3396443251826479
Epoch: 66, step: 1275, loss: 0.33109602332115173, mean loss: 0.33964423667258514
Epoch: 66, step: 1276, loss: 0.34051060676574707, mean loss: 0.339644245642984
Epoch: 66, step: 1277, loss: 0.30843809247016907, mean loss: 0.33964392253771414
Epoch: 66, step: 1278, loss: 0.30620336532592773, mean loss: 0.33964357630124176
Epoch: 66, step: 1279, loss: 0.35817497968673706, mean loss: 0.33964376816949515
Epoch: 66, step: 1280, loss: 0.29621076583862305, mean loss: 0.33964331848266666
Epoch: 66, step: 1281, loss: 0.31951791048049927, mean loss: 0.3396431101149115
Epoch: 66, step: 1282, loss: 0.39100104570388794, mean loss: 0.33964364184211693
Epoch: 66, step: 1283, loss: 0.32359549403190613, mean loss: 0.3396434756915826
Epoch: 66, step: 1284, loss: 0.3161197304725647, mean loss: 0.3396432321468185
Epoch: 66, step: 1285, loss: 0.3082679212093353, mean loss: 0.33964290731701274
Epoch: 66, step: 1286, loss: 0.31214308738708496, mean loss: 0.3396426226132626
Epoch: 66, step: 1287, loss: 0.31390732526779175, mean loss: 0.3396423561802522
Epoch: 66, step: 1288, loss: 0.3344659209251404, mean loss: 0.33964230259008255
Epoch: 66, step: 1289, loss: 0.3335305452346802, mean loss: 0.33964223931744286
Epoch: 66, step: 1290, loss: 0.34913262724876404, mean loss: 0.3396423375667097
Epoch: 66, step: 1291, loss: 0.2861240804195404, mean loss: 0.3396417835245429
Epoch: 66, step: 1292, loss: 0.31041455268859863, mean loss: 0.3396414809558209
Epoch: 66, step: 1293, loss: 0.3396014869213104, mean loss: 0.33964148054179544
Epoch: 66, step: 1294, loss: 0.34336963295936584, mean loss: 0.3396415191359053
Epoch: 66, step: 1295, loss: 0.3071577548980713, mean loss: 0.33964118286505396
Epoch: 66, step: 1296, loss: 0.40291938185691833, mean loss: 0.33964183791209274
Epoch: 66, step: 1297, loss: 0.319377064704895, mean loss: 0.339641628136175
Epoch: 66, step: 1298, loss: 0.3360181152820587, mean loss: 0.33964159062685484
Epoch: 66, step: 1299, loss: 0.31810083985328674, mean loss: 0.3396413676469495
Epoch: 66, step: 1300, loss: 0.3370141088962555, mean loss: 0.33964134045106165
Epoch: 66, step: 1301, loss: 0.3412807881832123, mean loss: 0.3396413574215162
Epoch: 66, step: 1302, loss: 0.3366725742816925, mean loss: 0.33964132669099834
Epoch: 66, step: 1303, loss: 0.3411751389503479, mean loss: 0.3396413425676572
Epoch: 66, step: 1304, loss: 0.3454046845436096, mean loss: 0.3396414022240244
Epoch: 66, step: 1305, loss: 0.3460117280483246, mean loss: 0.3396414681626004
Epoch: 66, step: 1306, loss: 0.34754931926727295, mean loss: 0.3396415500150924
Epoch: 66, step: 1307, loss: 0.34926944971084595, mean loss: 0.33964164967041155
Epoch: 66, step: 1308, loss: 0.3350204527378082, mean loss: 0.339641601838371
Epoch: 66, step: 1309, loss: 0.30706286430358887, mean loss: 0.3396412646332296
Epoch: 66, step: 1310, loss: 0.3229307532310486, mean loss: 0.3396410916734262
Epoch: 66, step: 1311, loss: 0.3392438590526581, mean loss: 0.33964108756196826
Epoch: 66, step: 1312, loss: 0.32154741883277893, mean loss: 0.3396409002898657
Epoch: 66, step: 1313, loss: 0.3405655026435852, mean loss: 0.3396409098595355
Epoch: 66, step: 1314, loss: 0.3980499804019928, mean loss: 0.3396415143893955
Epoch: 66, step: 1315, loss: 0.3372136056423187, mean loss: 0.33964148926096716
Epoch: 66, step: 1316, loss: 0.3106389045715332, mean loss: 0.33964118909242524
Epoch: 66, step: 1317, loss: 0.3154948949813843, mean loss: 0.3396409391877026
Epoch: 66, step: 1318, loss: 0.3247849941253662, mean loss: 0.33964078543605897
Epoch: 66, step: 1319, loss: 0.4087054133415222, mean loss: 0.3396415002132148
Epoch: 66, step: 1320, loss: 0.297764390707016, mean loss: 0.33964106681492756
Epoch: 66, step: 1321, loss: 0.3158166706562042, mean loss: 0.33964082025193043
Epoch: 66, step: 1322, loss: 0.319755882024765, mean loss: 0.3396406144612278
Epoch: 66, step: 1323, loss: 0.30349376797676086, mean loss: 0.3396402403787001
Epoch: 66, step: 1324, loss: 0.31856200098991394, mean loss: 0.3396400222429501
Epoch: 66, step: 1325, loss: 0.34153053164482117, mean loss: 0.3396400418073649
Epoch: 66, step: 1326, loss: 0.3776637017726898, mean loss: 0.33964043530075694
Epoch: 66, step: 1327, loss: 0.3191487491130829, mean loss: 0.33964022324174764
Epoch: 66, step: 1328, loss: 0.33932259678840637, mean loss: 0.339640219954812
Epoch: 66, step: 1329, loss: 0.3340904414653778, mean loss: 0.33964016252390267
Epoch: 66, step: 1330, loss: 0.3160199820995331, mean loss: 0.3396399180971378
Epoch: 66, step: 1331, loss: 0.31613409519195557, mean loss: 0.3396396748562865
Epoch: 66, step: 1332, loss: 0.3260379433631897, mean loss: 0.3396395341055234
Epoch: 66, step: 1333, loss: 0.3302595615386963, mean loss: 0.33963943704254024
Epoch: 66, step: 1334, loss: 0.3541237413883209, mean loss: 0.3396395869230682
Epoch: 66, step: 1335, loss: 0.3735900819301605, mean loss: 0.33963993823199834
Epoch: 66, step: 1336, loss: 0.3420831263065338, mean loss: 0.3396399635130703
Epoch: 66, step: 1337, loss: 0.3315708041191101, mean loss: 0.3396398800177019
Epoch: 66, step: 1338, loss: 0.40678083896636963, mean loss: 0.3396405747494357
Epoch: 66, step: 1339, loss: 0.3471650183200836, mean loss: 0.33964065260676335
Epoch: 66, step: 1340, loss: 0.3569316864013672, mean loss: 0.33964083151962793
Epoch: 66, step: 1341, loss: 0.3595212697982788, mean loss: 0.3396410372233123
Epoch: 66, step: 1342, loss: 0.34515243768692017, mean loss: 0.3396410942494017
Epoch: 66, step: 1343, loss: 0.3435254991054535, mean loss: 0.3396411344406613
Epoch: 66, step: 1344, loss: 0.34992164373397827, mean loss: 0.33964124081019736
Epoch: 66, step: 1345, loss: 0.39679038524627686, mean loss: 0.33964183211019155
Epoch: 66, step: 1346, loss: 0.3392086327075958, mean loss: 0.33964182762809203
Epoch: 66, step: 1347, loss: 0.3307216465473175, mean loss: 0.33964173533635383
Epoch: 66, step: 1348, loss: 0.3216741383075714, mean loss: 0.3396415494383783
Epoch: 66, step: 1349, loss: 0.3445590138435364, mean loss: 0.3396416003153664
Epoch: 66, step: 1350, loss: 0.3200337886810303, mean loss: 0.3396413974514521
Epoch: 66, step: 1351, loss: 0.3433111608028412, mean loss: 0.3396414354187108
Epoch: 66, step: 1352, loss: 0.3051004707813263, mean loss: 0.3396410780626513
Epoch: 66, step: 1353, loss: 0.3505876660346985, mean loss: 0.33964119131337006
Epoch: 66, step: 1354, loss: 0.3115643560886383, mean loss: 0.33964090084031295
Epoch: 66, step: 1355, loss: 0.3365468978881836, mean loss: 0.33964086883117833
Epoch: 66, step: 1356, loss: 0.30938223004341125, mean loss: 0.3396405557924265
Epoch: 66, step: 1357, loss: 0.3140314817428589, mean loss: 0.3396402908581809
Epoch: 66, step: 1358, loss: 0.31655409932136536, mean loss: 0.3396400520264507
Epoch: 66, step: 1359, loss: 0.3344779908657074, mean loss: 0.33963999862434485
Epoch: 66, step: 1360, loss: 0.3279787600040436, mean loss: 0.33963987798876194
Epoch: 66, step: 1361, loss: 0.33608800172805786, mean loss: 0.339639841244961
Epoch: 66, step: 1362, loss: 0.3109360933303833, mean loss: 0.3396395443106617
Epoch: 66, step: 1363, loss: 0.3361794352531433, mean loss: 0.33963950851692376
Epoch: 66, step: 1364, loss: 0.3801991045475006, mean loss: 0.33963992808882404
Epoch: 66, step: 1365, loss: 0.32576072216033936, mean loss: 0.3396397845157825
Epoch: 66, step: 1366, loss: 0.363831490278244, mean loss: 0.3396400347635896
Epoch: 66, step: 1367, loss: 0.3174422085285187, mean loss: 0.3396398051435731
Epoch: 66, step: 1368, loss: 0.3722374439239502, mean loss: 0.3396401423384339
Epoch: 66, step: 1369, loss: 0.3178597688674927, mean loss: 0.33963991704131713
Epoch: 66, step: 1370, loss: 0.3201166093349457, mean loss: 0.3396397150934743
Epoch: 66, step: 1371, loss: 0.3229449987411499, mean loss: 0.33963954240618527
Epoch: 66, step: 1372, loss: 0.35052964091300964, mean loss: 0.33963965505033544
Epoch: 66, step: 1373, loss: 0.31630364060401917, mean loss: 0.339639413671589
Epoch: 66, step: 1374, loss: 0.32524943351745605, mean loss: 0.33963926482871565
Epoch: 66, step: 1375, loss: 0.31447017192840576, mean loss: 0.33963900449469725
Epoch: 66, step: 1376, loss: 0.3094964921474457, mean loss: 0.3396386927218324
Epoch: 66, step: 1377, loss: 0.3389507532119751, mean loss: 0.3396386856063454
Epoch: 66, step: 1378, loss: 0.3175010085105896, mean loss: 0.33963845663458103
Epoch: 66, step: 1379, loss: 0.33177027106285095, mean loss: 0.33963837525415025
Epoch: 66, step: 1380, loss: 0.2937271296977997, mean loss: 0.3396379004002892
Epoch: 66, step: 1381, loss: 0.32006606459617615, mean loss: 0.3396376979735076
Epoch: 66, step: 1382, loss: 0.2950231730937958, mean loss: 0.33963723654099987
Epoch: 66, step: 1383, loss: 0.33196496963500977, mean loss: 0.3396371571902334
Epoch: 66, step: 1384, loss: 0.3825918734073639, mean loss: 0.3396376014467281
Epoch: 66, step: 1385, loss: 0.34576088190078735, mean loss: 0.3396376647757224
Epoch: 66, step: 1386, loss: 0.3403814733028412, mean loss: 0.3396376724683569
Epoch: 66, step: 1387, loss: 0.3284269869327545, mean loss: 0.33963755652613276
Epoch: 66, step: 1388, loss: 0.3902893364429474, mean loss: 0.3396380803673614
Epoch: 66, step: 1389, loss: 0.3291866183280945, mean loss: 0.3396379722793514
Epoch: 66, step: 1390, loss: 0.3600519299507141, mean loss: 0.3396381833963447
Epoch: 66, step: 1391, loss: 0.3303360641002655, mean loss: 0.339638087196716
Epoch: 66, step: 1392, loss: 0.32316774129867554, mean loss: 0.3396379168672756
Epoch: 66, step: 1393, loss: 0.32738685607910156, mean loss: 0.33963779017323037
Epoch: 66, step: 1394, loss: 0.29939088225364685, mean loss: 0.3396373739651215
Epoch: 66, step: 1395, loss: 0.33147770166397095, mean loss: 0.3396372895838154
Epoch: 66, step: 1396, loss: 0.368283212184906, mean loss: 0.33963758581573233
Epoch: 66, step: 1397, loss: 0.32324671745300293, mean loss: 0.33963741631697986
Epoch: 66, step: 1398, loss: 0.33208462595939636, mean loss: 0.33963733821402176
Epoch: 66, step: 1399, loss: 0.36927756667137146, mean loss: 0.33963764471870056
Epoch: 66, step: 1400, loss: 0.37521177530288696, mean loss: 0.3396380125810715
Epoch: 66, step: 1401, loss: 0.30097755789756775, mean loss: 0.3396376128079997
Epoch: 66, step: 1402, loss: 0.3208318054676056, mean loss: 0.3396374183463026
Epoch: 66, step: 1403, loss: 0.3240344226360321, mean loss: 0.3396372570049895
Epoch: 66, step: 1404, loss: 0.32315748929977417, mean loss: 0.33963708659925984
Epoch: 66, step: 1405, loss: 0.36857736110687256, mean loss: 0.3396373858472643
Epoch: 66, step: 1406, loss: 0.36111006140708923, mean loss: 0.3396376078765635
Epoch: 66, step: 1407, loss: 0.31118685007095337, mean loss: 0.3396373136963397
Epoch: 66, step: 1408, loss: 0.35119539499282837, mean loss: 0.339637433205416
Epoch: 66, step: 1409, loss: 0.31165415048599243, mean loss: 0.3396371438648581
Epoch: 66, step: 1410, loss: 0.3324969410896301, mean loss: 0.33963707003760507
Epoch: 66, step: 1411, loss: 0.3731848895549774, mean loss: 0.3396374169069909
Epoch: 66, step: 1412, loss: 0.3169648051261902, mean loss: 0.3396371824847923
Epoch: 66, step: 1413, loss: 0.3554494082927704, mean loss: 0.3396373459727243
Epoch: 66, step: 1414, loss: 0.35567304491996765, mean loss: 0.3396375117695062
Epoch: 66, step: 1415, loss: 0.3397842049598694, mean loss: 0.33963751328618513
Epoch: 66, step: 1416, loss: 0.308318555355072, mean loss: 0.33963718947896715
Epoch: 66, step: 1417, loss: 0.32882341742515564, mean loss: 0.33963707767635704
Epoch: 66, step: 1418, loss: 0.31077075004577637, mean loss: 0.33963677923309504
Epoch: 66, step: 1419, loss: 0.3197173774242401, mean loss: 0.33963657329246183
Epoch: 66, step: 1420, loss: 0.3607088029384613, mean loss: 0.3396367911495789
Epoch: 66, step: 1421, loss: 0.3266224265098572, mean loss: 0.33963665660080566
Epoch: 66, step: 1422, loss: 0.31868016719818115, mean loss: 0.3396364399447592
Epoch: 66, step: 1423, loss: 0.30623263120651245, mean loss: 0.3396360946072278
Epoch: 66, step: 1424, loss: 0.3479480445384979, mean loss: 0.33963618053750655
Epoch: 66, step: 1425, loss: 0.32421553134918213, mean loss: 0.3396360211179967
Epoch: 66, step: 1426, loss: 0.3358987867832184, mean loss: 0.3396359824826643
Epoch: 66, step: 1427, loss: 0.3320220410823822, mean loss: 0.33963590377095154
Epoch: 66, step: 1428, loss: 0.31006330251693726, mean loss: 0.3396355980572731
Epoch: 66, step: 1429, loss: 0.33553898334503174, mean loss: 0.3396355557079987
Epoch: 66, step: 1430, loss: 0.35259538888931274, mean loss: 0.33963568968053376
Epoch: 66, step: 1431, loss: 0.31609010696411133, mean loss: 0.339635446280117
Epoch: 66, step: 1432, loss: 0.35509976744651794, mean loss: 0.3396356061395417
Epoch: 66, step: 1433, loss: 0.33229005336761475, mean loss: 0.33963553020709764
Epoch: 66, step: 1434, loss: 0.30626797676086426, mean loss: 0.3396351852836082
Epoch: 66, step: 1435, loss: 0.36651554703712463, mean loss: 0.3396354631455242
Epoch: 66, step: 1436, loss: 0.3049010932445526, mean loss: 0.3396351041005494
Epoch: 66, step: 1437, loss: 0.3370869755744934, mean loss: 0.3396350777611257
Epoch: 66, step: 1438, loss: 0.3340124785900116, mean loss: 0.3396350196422006
Epoch: 66, step: 1439, loss: 0.3801172971725464, mean loss: 0.33963543808962404
Epoch: 66, step: 1440, loss: 0.3289160132408142, mean loss: 0.339635327288809
Epoch: 66, step: 1441, loss: 0.37059256434440613, mean loss: 0.3396356472734808
Epoch: 66, step: 1442, loss: 0.34681376814842224, mean loss: 0.3396357214682452
Epoch: 66, step: 1443, loss: 0.3181394338607788, mean loss: 0.3396354992798009
Valid: 66, mean loss: 0.18567362924416858
Epoch: 67, step: 0, loss: 0.30659884214401245, mean loss: 0.33963515781211506
Epoch: 67, step: 1, loss: 0.310593843460083, mean loss: 0.3396348576434913
Epoch: 67, step: 2, loss: 0.3071900010108948, mean loss: 0.339634522299602
Epoch: 67, step: 3, loss: 0.2975151836872101, mean loss: 0.33963408696659997
Epoch: 67, step: 4, loss: 0.37177151441574097, mean loss: 0.3396344191260932
Epoch: 67, step: 5, loss: 0.3379339873790741, mean loss: 0.33963440155129787
Epoch: 67, step: 6, loss: 0.3513370156288147, mean loss: 0.33963452250229864
Epoch: 67, step: 7, loss: 0.2931499779224396, mean loss: 0.3396340420716837
Epoch: 67, step: 8, loss: 0.36108478903770447, mean loss: 0.3396342637687905
Epoch: 67, step: 9, loss: 0.308209627866745, mean loss: 0.3396339389932071
Epoch: 67, step: 10, loss: 0.31046754121780396, mean loss: 0.3396336375597717
Epoch: 67, step: 11, loss: 0.3494682013988495, mean loss: 0.3396337391985051
Epoch: 67, step: 12, loss: 0.3237428069114685, mean loss: 0.33963357496981494
Epoch: 67, step: 13, loss: 0.30697566270828247, mean loss: 0.3396332374621956
Epoch: 67, step: 14, loss: 0.30743494629859924, mean loss: 0.33963290470803165
Epoch: 67, step: 15, loss: 0.3398441672325134, mean loss: 0.3396329068913077
Epoch: 67, step: 16, loss: 0.30554091930389404, mean loss: 0.3396325545739658
Epoch: 67, step: 17, loss: 0.3077598214149475, mean loss: 0.33963222519450237
Epoch: 67, step: 18, loss: 0.34557652473449707, mean loss: 0.33963228662349715
Epoch: 67, step: 19, loss: 0.3439692258834839, mean loss: 0.33963233144140453
Epoch: 67, step: 20, loss: 0.3425721526145935, mean loss: 0.33963236182118706
Epoch: 67, step: 21, loss: 0.3437514305114746, mean loss: 0.33963240438674136
Epoch: 67, step: 22, loss: 0.3211921155452728, mean loss: 0.33963221383080167
Epoch: 67, step: 23, loss: 0.3080899715423584, mean loss: 0.33963188788690996
Epoch: 67, step: 24, loss: 0.310624361038208, mean loss: 0.339631588138769
Epoch: 67, step: 25, loss: 0.3381774425506592, mean loss: 0.33963157311256786
Epoch: 67, step: 26, loss: 0.34504464268684387, mean loss: 0.339631629047154
Epoch: 67, step: 27, loss: 0.3454255759716034, mean loss: 0.33963168891682133
Epoch: 67, step: 28, loss: 0.3457626402378082, mean loss: 0.3396317522681478
Epoch: 67, step: 29, loss: 0.3093629479408264, mean loss: 0.33963143950280517
Epoch: 67, step: 30, loss: 0.31788864731788635, mean loss: 0.3396312148384443
Epoch: 67, step: 31, loss: 0.31587642431259155, mean loss: 0.3396309693870026
Epoch: 67, step: 32, loss: 0.32505035400390625, mean loss: 0.3396308187312398
Epoch: 67, step: 33, loss: 0.3307493031024933, mean loss: 0.3396307269629809
Epoch: 67, step: 34, loss: 0.31599682569503784, mean loss: 0.3396304827682229
Epoch: 67, step: 35, loss: 0.2899765074253082, mean loss: 0.3396299697291323
Epoch: 67, step: 36, loss: 0.3660100996494293, mean loss: 0.3396302422933718
Epoch: 67, step: 37, loss: 0.34276482462882996, mean loss: 0.33963027468010476
Epoch: 67, step: 38, loss: 0.3097264766693115, mean loss: 0.33962996571507836
Epoch: 67, step: 39, loss: 0.3329989016056061, mean loss: 0.33962989720385683
Epoch: 67, step: 40, loss: 0.3289206624031067, mean loss: 0.3396297865586926
Epoch: 67, step: 41, loss: 0.33181342482566833, mean loss: 0.3396297058028115
Epoch: 67, step: 42, loss: 0.3056809902191162, mean loss: 0.3396293550603294
Epoch: 67, step: 43, loss: 0.360266774892807, mean loss: 0.33962956827443624
Epoch: 67, step: 44, loss: 0.29698681831359863, mean loss: 0.3396291277183014
Epoch: 67, step: 45, loss: 0.3692300021648407, mean loss: 0.3396294335314143
Epoch: 67, step: 46, loss: 0.33903947472572327, mean loss: 0.3396294274364837
Epoch: 67, step: 47, loss: 0.3277328312397003, mean loss: 0.33962930453268403
Epoch: 67, step: 48, loss: 0.3495858609676361, mean loss: 0.3396294073928598
Epoch: 67, step: 49, loss: 0.35361403226852417, mean loss: 0.33962955186511
Epoch: 67, step: 50, loss: 0.3400546610355377, mean loss: 0.33962955625677904
Epoch: 67, step: 51, loss: 0.329278826713562, mean loss: 0.33962944932775485
Epoch: 67, step: 52, loss: 0.31030893325805664, mean loss: 0.33962914643299064
Epoch: 67, step: 53, loss: 0.3419121205806732, mean loss: 0.33962917001694704
Epoch: 67, step: 54, loss: 0.3464226722717285, mean loss: 0.3396292401955805
Epoch: 67, step: 55, loss: 0.3449634313583374, mean loss: 0.3396292952985841
Epoch: 67, step: 56, loss: 0.35339704155921936, mean loss: 0.3396294375200216
Epoch: 67, step: 57, loss: 0.3233141601085663, mean loss: 0.3396292689842138
Epoch: 67, step: 58, loss: 0.3142271935939789, mean loss: 0.33962900658505474
Epoch: 67, step: 59, loss: 0.35812923312187195, mean loss: 0.3396291976873039
Epoch: 67, step: 60, loss: 0.32207509875297546, mean loss: 0.33962901636016557
Epoch: 67, step: 61, loss: 0.2975924015045166, mean loss: 0.3396285821424726
Epoch: 67, step: 62, loss: 0.336738258600235, mean loss: 0.339628552287151
Epoch: 67, step: 63, loss: 0.33138614892959595, mean loss: 0.3396284671489103
Epoch: 67, step: 64, loss: 0.32872873544692993, mean loss: 0.33962835456349616
Epoch: 67, step: 65, loss: 0.32370883226394653, mean loss: 0.33962819012940293
Epoch: 67, step: 66, loss: 0.35283342003822327, mean loss: 0.33962832652593145
Epoch: 67, step: 67, loss: 0.326494425535202, mean loss: 0.33962819086755897
Epoch: 67, step: 68, loss: 0.338979572057724, mean loss: 0.33962818416812796
Epoch: 67, step: 69, loss: 0.3288100063800812, mean loss: 0.33962807243087056
Epoch: 67, step: 70, loss: 0.3193158209323883, mean loss: 0.3396278626347407
Epoch: 67, step: 71, loss: 0.38510164618492126, mean loss: 0.33962833230819195
Epoch: 67, step: 72, loss: 0.3373870849609375, mean loss: 0.3396283091598321
Epoch: 67, step: 73, loss: 0.315582811832428, mean loss: 0.3396280608123767
Epoch: 67, step: 74, loss: 0.3007437586784363, mean loss: 0.3396276592104625
Epoch: 67, step: 75, loss: 0.36332276463508606, mean loss: 0.3396279039339342
Epoch: 67, step: 76, loss: 0.31262636184692383, mean loss: 0.3396276250644058
Epoch: 67, step: 77, loss: 0.34514206647872925, mean loss: 0.33962768201647875
Epoch: 67, step: 78, loss: 0.32939717173576355, mean loss: 0.3396275763588597
Epoch: 67, step: 79, loss: 0.2976592481136322, mean loss: 0.33962714292712254
Epoch: 67, step: 80, loss: 0.3236110806465149, mean loss: 0.339626977521487
Epoch: 67, step: 81, loss: 0.3340744376182556, mean loss: 0.33962692017830926
Epoch: 67, step: 82, loss: 0.3268330693244934, mean loss: 0.3396267880527415
Epoch: 67, step: 83, loss: 0.3306959569454193, mean loss: 0.3396266958225789
Epoch: 67, step: 84, loss: 0.33176520466804504, mean loss: 0.33962661463650434
Epoch: 67, step: 85, loss: 0.34099796414375305, mean loss: 0.33962662879836386
Epoch: 67, step: 86, loss: 0.32473406195640564, mean loss: 0.3396264750051399
Epoch: 67, step: 87, loss: 0.2964906692504883, mean loss: 0.33962602955297594
Epoch: 67, step: 88, loss: 0.36761459708213806, mean loss: 0.33962631858059483
Epoch: 67, step: 89, loss: 0.33997926115989685, mean loss: 0.3396263222252651
Epoch: 67, step: 90, loss: 0.3197941184043884, mean loss: 0.3396261174296371
Epoch: 67, step: 91, loss: 0.3299524188041687, mean loss: 0.3396260175360123
Epoch: 67, step: 92, loss: 0.38045552372932434, mean loss: 0.3396264391498555
Epoch: 67, step: 93, loss: 0.3535396158695221, mean loss: 0.33962658281868435
Epoch: 67, step: 94, loss: 0.32873767614364624, mean loss: 0.339626470379926
Epoch: 67, step: 95, loss: 0.3095184862613678, mean loss: 0.33962615948834657
Epoch: 67, step: 96, loss: 0.29748937487602234, mean loss: 0.3396257243932502
Epoch: 67, step: 97, loss: 0.3428220748901367, mean loss: 0.339625757397716
Epoch: 67, step: 98, loss: 0.36182767152786255, mean loss: 0.33962598664502497
Epoch: 67, step: 99, loss: 0.3117174804210663, mean loss: 0.33962569847690355
Epoch: 67, step: 100, loss: 0.33719342947006226, mean loss: 0.3396256733628703
Epoch: 67, step: 101, loss: 0.31994372606277466, mean loss: 0.33962547014193795
Epoch: 67, step: 102, loss: 0.35037165880203247, mean loss: 0.3396255810978254
Epoch: 67, step: 103, loss: 0.2967575192451477, mean loss: 0.3396251384837147
Epoch: 67, step: 104, loss: 0.3484986126422882, mean loss: 0.33962523010167345
Epoch: 67, step: 105, loss: 0.337048202753067, mean loss: 0.339625203494333
Epoch: 67, step: 106, loss: 0.3731496036052704, mean loss: 0.3396255496241158
Epoch: 67, step: 107, loss: 0.3282729685306549, mean loss: 0.33962543241319343
Epoch: 67, step: 108, loss: 0.329611212015152, mean loss: 0.3396253290213849
Epoch: 67, step: 109, loss: 0.33071595430374146, mean loss: 0.3396252370375042
Epoch: 67, step: 110, loss: 0.32253387570381165, mean loss: 0.3396250605814048
Epoch: 67, step: 111, loss: 0.3190365731716156, mean loss: 0.33962484802217074
Epoch: 67, step: 112, loss: 0.3564007878303528, mean loss: 0.33962502121819194
Epoch: 67, step: 113, loss: 0.3289026916027069, mean loss: 0.33962491052122495
Epoch: 67, step: 114, loss: 0.3144785463809967, mean loss: 0.33962465091369537
Epoch: 67, step: 115, loss: 0.37201976776123047, mean loss: 0.33962498535287655
Epoch: 67, step: 116, loss: 0.29523807764053345, mean loss: 0.33962452711814045
Epoch: 67, step: 117, loss: 0.341217041015625, mean loss: 0.33962454355852095
Epoch: 67, step: 118, loss: 0.3523584008216858, mean loss: 0.3396246750156453
Epoch: 67, step: 119, loss: 0.32448306679725647, mean loss: 0.3396245187038786
Epoch: 67, step: 120, loss: 0.34861209988594055, mean loss: 0.3396246114846566
Epoch: 67, step: 121, loss: 0.2872942090034485, mean loss: 0.33962407127197486
Epoch: 67, step: 122, loss: 0.31867143511772156, mean loss: 0.3396238549777676
Epoch: 67, step: 123, loss: 0.40345725417137146, mean loss: 0.33962451392358467
Epoch: 67, step: 124, loss: 0.34571778774261475, mean loss: 0.33962457682319364
Epoch: 67, step: 125, loss: 0.3452824354171753, mean loss: 0.33962463522749814
Epoch: 67, step: 126, loss: 0.38314929604530334, mean loss: 0.3396250845143195
Epoch: 67, step: 127, loss: 0.3196878731250763, mean loss: 0.3396248787129715
Epoch: 67, step: 128, loss: 0.28959885239601135, mean loss: 0.33962436232594134
Epoch: 67, step: 129, loss: 0.3083772659301758, mean loss: 0.33962403978525724
Epoch: 67, step: 130, loss: 0.35747474431991577, mean loss: 0.3396242240429863
Epoch: 67, step: 131, loss: 0.32674285769462585, mean loss: 0.3396240910809059
Epoch: 67, step: 132, loss: 0.31474587321281433, mean loss: 0.3396238342894002
Epoch: 67, step: 133, loss: 0.28603726625442505, mean loss: 0.3396232811776969
Epoch: 67, step: 134, loss: 0.3114743232727051, mean loss: 0.33962299063180235
Epoch: 67, step: 135, loss: 0.3562820553779602, mean loss: 0.33962316258036707
Epoch: 67, step: 136, loss: 0.3134545385837555, mean loss: 0.33962289248051675
Epoch: 67, step: 137, loss: 0.2979356348514557, mean loss: 0.3396224622092946
Epoch: 67, step: 138, loss: 0.3236100673675537, mean loss: 0.33962229694052953
Epoch: 67, step: 139, loss: 0.32287535071372986, mean loss: 0.3396221240920217
Epoch: 67, step: 140, loss: 0.34608131647109985, mean loss: 0.3396221907579216
Epoch: 67, step: 141, loss: 0.30803340673446655, mean loss: 0.33962186473063266
Epoch: 67, step: 142, loss: 0.32201966643333435, mean loss: 0.3396216830605261
Epoch: 67, step: 143, loss: 0.37542280554771423, mean loss: 0.3396220525556597
Epoch: 67, step: 144, loss: 0.34111225605010986, mean loss: 0.3396220679355478
Epoch: 67, step: 145, loss: 0.34299755096435547, mean loss: 0.33962210277241106
Epoch: 67, step: 146, loss: 0.36445292830467224, mean loss: 0.3396223590377037
Epoch: 67, step: 147, loss: 0.31403324007987976, mean loss: 0.3396220949492072
Epoch: 67, step: 148, loss: 0.3911283612251282, mean loss: 0.3396226265060797
Epoch: 67, step: 149, loss: 0.3286622166633606, mean loss: 0.3396225133932204
Epoch: 67, step: 150, loss: 0.3347393870353699, mean loss: 0.3396224629992395
Epoch: 67, step: 151, loss: 0.2969202399253845, mean loss: 0.33962202231582284
Epoch: 67, step: 152, loss: 0.32283157110214233, mean loss: 0.3396218490415407
Epoch: 67, step: 153, loss: 0.377329021692276, mean loss: 0.33962223816841786
Epoch: 67, step: 154, loss: 0.343974769115448, mean loss: 0.3396222830847873
Epoch: 67, step: 155, loss: 0.33682698011398315, mean loss: 0.3396222542386822
Epoch: 67, step: 156, loss: 0.32737284898757935, mean loss: 0.33962212783235385
Epoch: 67, step: 157, loss: 0.32391759753227234, mean loss: 0.33962196577293235
Epoch: 67, step: 158, loss: 0.34696993231773376, mean loss: 0.3396220415978629
Epoch: 67, step: 159, loss: 0.3676196038722992, mean loss: 0.339622330506542
Epoch: 67, step: 160, loss: 0.37126100063323975, mean loss: 0.3396226569846826
Epoch: 67, step: 161, loss: 0.31250566244125366, mean loss: 0.3396223771684145
Epoch: 67, step: 162, loss: 0.3631453514099121, mean loss: 0.3396226198960124
Epoch: 67, step: 163, loss: 0.3241178095340729, mean loss: 0.33962245990746237
Epoch: 67, step: 164, loss: 0.33667242527008057, mean loss: 0.33962242946743226
Epoch: 67, step: 165, loss: 0.3531198501586914, mean loss: 0.3396225687395776
Epoch: 67, step: 166, loss: 0.3148995041847229, mean loss: 0.33962231363908174
Epoch: 67, step: 167, loss: 0.3437102735042572, mean loss: 0.33962235581952527
Epoch: 67, step: 168, loss: 0.3308720886707306, mean loss: 0.3396222655333304
Epoch: 67, step: 169, loss: 0.32154762744903564, mean loss: 0.3396220790392005
Epoch: 67, step: 170, loss: 0.36360740661621094, mean loss: 0.33962232651727575
Epoch: 67, step: 171, loss: 0.3313043713569641, mean loss: 0.3396222406943789
Epoch: 67, step: 172, loss: 0.31096863746643066, mean loss: 0.33962194505562954
Epoch: 67, step: 173, loss: 0.3090328872203827, mean loss: 0.33962162945073243
Epoch: 67, step: 174, loss: 0.31194213032722473, mean loss: 0.33962134386837195
Epoch: 67, step: 175, loss: 0.33006641268730164, mean loss: 0.3396212452866875
Epoch: 67, step: 176, loss: 0.3010879456996918, mean loss: 0.3396208477287862
Epoch: 67, step: 177, loss: 0.35098204016685486, mean loss: 0.33962096494390326
Epoch: 67, step: 178, loss: 0.3245150148868561, mean loss: 0.33962080909517117
Epoch: 67, step: 179, loss: 0.2964213192462921, mean loss: 0.339620363408787
Epoch: 67, step: 180, loss: 0.34170278906822205, mean loss: 0.33962038489281815
Epoch: 67, step: 181, loss: 0.3109845817089081, mean loss: 0.3396200894651571
Epoch: 67, step: 182, loss: 0.3223653733730316, mean loss: 0.33961991145486015
Epoch: 67, step: 183, loss: 0.333783358335495, mean loss: 0.33961985124199834
Epoch: 67, step: 184, loss: 0.3388752341270447, mean loss: 0.3396198435602273
Epoch: 67, step: 185, loss: 0.35302719473838806, mean loss: 0.33961998187445325
Epoch: 67, step: 186, loss: 0.3684750497341156, mean loss: 0.33962027954885216
Epoch: 67, step: 187, loss: 0.3327687382698059, mean loss: 0.33962020886777106
Epoch: 67, step: 188, loss: 0.34596163034439087, mean loss: 0.33962027428573816
Epoch: 67, step: 189, loss: 0.2717093527317047, mean loss: 0.33961957372536394
Epoch: 67, step: 190, loss: 0.33209332823753357, mean loss: 0.33961949608637976
Epoch: 67, step: 191, loss: 0.3171412944793701, mean loss: 0.3396192642089132
Epoch: 67, step: 192, loss: 0.3662043809890747, mean loss: 0.33961953844908793
Epoch: 67, step: 193, loss: 0.3176380395889282, mean loss: 0.3396193117001158
Epoch: 67, step: 194, loss: 0.3408586382865906, mean loss: 0.3396193244841908
Epoch: 67, step: 195, loss: 0.29841509461402893, mean loss: 0.339618899452937
Epoch: 67, step: 196, loss: 0.3093721866607666, mean loss: 0.33961858745424917
Epoch: 67, step: 197, loss: 0.3435661494731903, mean loss: 0.33961862817343325
Epoch: 67, step: 198, loss: 0.3336926996707916, mean loss: 0.3396185670479884
Epoch: 67, step: 199, loss: 0.33706504106521606, mean loss: 0.3396185407088583
Epoch: 67, step: 200, loss: 0.3323320746421814, mean loss: 0.3396184655511355
Epoch: 67, step: 201, loss: 0.322486013174057, mean loss: 0.33961828883682527
Epoch: 67, step: 202, loss: 0.3153229355812073, mean loss: 0.3396180382426771
Epoch: 67, step: 203, loss: 0.30021652579307556, mean loss: 0.33961763184041155
Epoch: 67, step: 204, loss: 0.3585071861743927, mean loss: 0.33961782667248824
Epoch: 67, step: 205, loss: 0.34019723534584045, mean loss: 0.33961783264860756
Epoch: 67, step: 206, loss: 0.33213406801223755, mean loss: 0.3396177554605859
Epoch: 67, step: 207, loss: 0.3205793499946594, mean loss: 0.33961755909929353
Epoch: 67, step: 208, loss: 0.3120265603065491, mean loss: 0.3396172745298577
Epoch: 67, step: 209, loss: 0.32506343722343445, mean loss: 0.3396171244253041
Epoch: 67, step: 210, loss: 0.37813329696655273, mean loss: 0.3396175216671542
Epoch: 67, step: 211, loss: 0.33076974749565125, mean loss: 0.33961743041535786
Epoch: 67, step: 212, loss: 0.34952524304389954, mean loss: 0.33961753259884014
Epoch: 67, step: 213, loss: 0.3325756788253784, mean loss: 0.3396174599739585
Epoch: 67, step: 214, loss: 0.2988816797733307, mean loss: 0.33961703985721087
Epoch: 67, step: 215, loss: 0.3614632189273834, mean loss: 0.339617265159169
Epoch: 67, step: 216, loss: 0.3319452702999115, mean loss: 0.3396171860378896
Epoch: 67, step: 217, loss: 0.3237573504447937, mean loss: 0.3396170224770993
Epoch: 67, step: 218, loss: 0.3403482437133789, mean loss: 0.339617030018028
Epoch: 67, step: 219, loss: 0.3363017439842224, mean loss: 0.3396169958285425
Epoch: 67, step: 220, loss: 0.30791133642196655, mean loss: 0.33961666886157976
Epoch: 67, step: 221, loss: 0.3865402936935425, mean loss: 0.33961715275994864
Epoch: 67, step: 222, loss: 0.3311472535133362, mean loss: 0.33961706541528636
Epoch: 67, step: 223, loss: 0.28452712297439575, mean loss: 0.3396164973137473
Epoch: 67, step: 224, loss: 0.31974130868911743, mean loss: 0.33961629235784596
Epoch: 67, step: 225, loss: 0.33898961544036865, mean loss: 0.339616285895527
Epoch: 67, step: 226, loss: 0.3479325771331787, mean loss: 0.33961637165259057
Epoch: 67, step: 227, loss: 0.3702861964702606, mean loss: 0.339616687914602
Epoch: 67, step: 228, loss: 0.3027169704437256, mean loss: 0.33961630741492194
Epoch: 67, step: 229, loss: 0.3529965281486511, mean loss: 0.33961644538663444
Epoch: 67, step: 230, loss: 0.3451632559299469, mean loss: 0.33961650258263093
Epoch: 67, step: 231, loss: 0.3659634292125702, mean loss: 0.3396167742564465
Epoch: 67, step: 232, loss: 0.30614256858825684, mean loss: 0.3396164290939335
Epoch: 67, step: 233, loss: 0.3332694470882416, mean loss: 0.3396163636489849
Epoch: 67, step: 234, loss: 0.3779758810997009, mean loss: 0.3396167591772471
Epoch: 67, step: 235, loss: 0.3131471276283264, mean loss: 0.3396164862494286
Epoch: 67, step: 236, loss: 0.32647767663002014, mean loss: 0.33961635077683366
Epoch: 67, step: 237, loss: 0.3256950080394745, mean loss: 0.33961620723711927
Epoch: 67, step: 238, loss: 0.3510057330131531, mean loss: 0.3396163246706493
Epoch: 67, step: 239, loss: 0.3312324285507202, mean loss: 0.3396162382280366
Epoch: 67, step: 240, loss: 0.3260277509689331, mean loss: 0.3396160981246511
Epoch: 67, step: 241, loss: 0.3210502862930298, mean loss: 0.33961590670479513
Epoch: 67, step: 242, loss: 0.3100724518299103, mean loss: 0.33961560210483355
Epoch: 67, step: 243, loss: 0.3649252951145172, mean loss: 0.3396158630510251
Epoch: 67, step: 244, loss: 0.3988712728023529, mean loss: 0.33961647397562533
Epoch: 67, step: 245, loss: 0.3198951780796051, mean loss: 0.3396162706507197
Epoch: 67, step: 246, loss: 0.31502214074134827, mean loss: 0.3396160170899185
Epoch: 67, step: 247, loss: 0.349060595035553, mean loss: 0.33961611446071677
Epoch: 67, step: 248, loss: 0.30064624547958374, mean loss: 0.3396157126970645
Epoch: 67, step: 249, loss: 0.3435402512550354, mean loss: 0.3396157531570591
Epoch: 67, step: 250, loss: 0.36933499574661255, mean loss: 0.33961605954416196
Epoch: 67, step: 251, loss: 0.3268524408340454, mean loss: 0.3396159279604639
Epoch: 67, step: 252, loss: 0.3097885549068451, mean loss: 0.3396156204649427
Epoch: 67, step: 253, loss: 0.3245134949684143, mean loss: 0.33961546477613735
Epoch: 67, step: 254, loss: 0.33655476570129395, mean loss: 0.3396154332235145
Epoch: 67, step: 255, loss: 0.2869192361831665, mean loss: 0.33961488998615275
Epoch: 67, step: 256, loss: 0.32019636034965515, mean loss: 0.3396146898054442
Epoch: 67, step: 257, loss: 0.32984960079193115, mean loss: 0.3396145891406501
Epoch: 67, step: 258, loss: 0.3525625169277191, mean loss: 0.33961472261480957
Epoch: 67, step: 259, loss: 0.3068850636482239, mean loss: 0.33961438522347104
Epoch: 67, step: 260, loss: 0.32376813888549805, mean loss: 0.33961422187526275
Epoch: 67, step: 261, loss: 0.31759199500083923, mean loss: 0.33961399486539906
Epoch: 67, step: 262, loss: 0.322321355342865, mean loss: 0.3396138166109792
Epoch: 67, step: 263, loss: 0.32024192810058594, mean loss: 0.33961361692549175
Epoch: 67, step: 264, loss: 0.3645472824573517, mean loss: 0.3396138739391449
Epoch: 67, step: 265, loss: 0.3187410533428192, mean loss: 0.33961365878648037
Epoch: 67, step: 266, loss: 0.3151797354221344, mean loss: 0.3396134069293102
Epoch: 67, step: 267, loss: 0.3779738247394562, mean loss: 0.3396138023323139
Epoch: 67, step: 268, loss: 0.2970713973045349, mean loss: 0.3396133638276701
Epoch: 67, step: 269, loss: 0.3294169306755066, mean loss: 0.33961325872930537
Epoch: 67, step: 270, loss: 0.331938773393631, mean loss: 0.33961317962639426
Epoch: 67, step: 271, loss: 0.3576412796974182, mean loss: 0.33961336544478293
Epoch: 67, step: 272, loss: 0.3833995461463928, mean loss: 0.3396138167510022
Epoch: 67, step: 273, loss: 0.31322020292282104, mean loss: 0.3396135447135898
Epoch: 67, step: 274, loss: 0.3793911933898926, mean loss: 0.33961395469523
Epoch: 67, step: 275, loss: 0.35239821672439575, mean loss: 0.33961408645914437
Epoch: 67, step: 276, loss: 0.31272345781326294, mean loss: 0.33961380930759943
Epoch: 67, step: 277, loss: 0.30097445845603943, mean loss: 0.3396134110705202
Epoch: 67, step: 278, loss: 0.3428948223590851, mean loss: 0.3396134448900888
Epoch: 67, step: 279, loss: 0.3254276514053345, mean loss: 0.33961329868699813
Epoch: 67, step: 280, loss: 0.30302247405052185, mean loss: 0.33961292157474676
Epoch: 67, step: 281, loss: 0.33460763096809387, mean loss: 0.3396128699897668
Epoch: 67, step: 282, loss: 0.3683858811855316, mean loss: 0.33961316652397955
Epoch: 67, step: 283, loss: 0.31011301279067993, mean loss: 0.33961286249898026
Epoch: 67, step: 284, loss: 0.3014846444129944, mean loss: 0.33961246955824786
Epoch: 67, step: 285, loss: 0.3259108066558838, mean loss: 0.3396123283534856
Epoch: 67, step: 286, loss: 0.3432490825653076, mean loss: 0.3396123658322738
Epoch: 67, step: 287, loss: 0.3371192514896393, mean loss: 0.3396123401395995
Epoch: 67, step: 288, loss: 0.3301292359828949, mean loss: 0.3396122424129163
Epoch: 67, step: 289, loss: 0.4027766287326813, mean loss: 0.3396128933371555
Epoch: 67, step: 290, loss: 0.33981993794441223, mean loss: 0.3396128954707781
Epoch: 67, step: 291, loss: 0.4007398188114166, mean loss: 0.3396135253854869
Epoch: 67, step: 292, loss: 0.3182779848575592, mean loss: 0.3396133055243918
Epoch: 67, step: 293, loss: 0.3094348609447479, mean loss: 0.339612994541059
Epoch: 67, step: 294, loss: 0.33560606837272644, mean loss: 0.3396129532508457
Epoch: 67, step: 295, loss: 0.3408592641353607, mean loss: 0.33961296609358593
Epoch: 67, step: 296, loss: 0.3048762083053589, mean loss: 0.3396126081487378
Epoch: 67, step: 297, loss: 0.3250667154788971, mean loss: 0.33961245826216163
Epoch: 67, step: 298, loss: 0.3684193789958954, mean loss: 0.33961275509689876
Epoch: 67, step: 299, loss: 0.3291406035423279, mean loss: 0.3396126471899707
Epoch: 67, step: 300, loss: 0.37141287326812744, mean loss: 0.339612974861828
Epoch: 67, step: 301, loss: 0.3489369750022888, mean loss: 0.339613070936018
Epoch: 67, step: 302, loss: 0.32043230533599854, mean loss: 0.3396128733000781
Epoch: 67, step: 303, loss: 0.33268609642982483, mean loss: 0.3396128019282685
Epoch: 67, step: 304, loss: 0.3076941967010498, mean loss: 0.3396124730501789
Epoch: 67, step: 305, loss: 0.34672239422798157, mean loss: 0.3396125463075529
Epoch: 67, step: 306, loss: 0.31306377053260803, mean loss: 0.33961227276393563
Epoch: 67, step: 307, loss: 0.3010483682155609, mean loss: 0.3396118754272996
Epoch: 67, step: 308, loss: 0.33065658807754517, mean loss: 0.3396117831589691
Epoch: 67, step: 309, loss: 0.3276921510696411, mean loss: 0.3396116603495965
Epoch: 67, step: 310, loss: 0.3355409502983093, mean loss: 0.33961161840902376
Epoch: 67, step: 311, loss: 0.3644399344921112, mean loss: 0.3396118742128161
Epoch: 67, step: 312, loss: 0.3064671754837036, mean loss: 0.3396115327296382
Epoch: 67, step: 313, loss: 0.3711616098880768, mean loss: 0.3396118577804012
Epoch: 67, step: 314, loss: 0.31253334879875183, mean loss: 0.33961157880170717
Epoch: 67, step: 315, loss: 0.3332132399082184, mean loss: 0.33961151288294333
Epoch: 67, step: 316, loss: 0.3295271098613739, mean loss: 0.3396114089896448
Epoch: 67, step: 317, loss: 0.31238576769828796, mean loss: 0.3396111285037765
Epoch: 67, step: 318, loss: 0.30540549755096436, mean loss: 0.3396107761118106
Epoch: 67, step: 319, loss: 0.3227374255657196, mean loss: 0.3396106022816035
Epoch: 67, step: 320, loss: 0.35465288162231445, mean loss: 0.33961075724641554
Epoch: 67, step: 321, loss: 0.31412044167518616, mean loss: 0.33961049464916027
Epoch: 67, step: 322, loss: 0.3142312169075012, mean loss: 0.3396102331984928
Epoch: 67, step: 323, loss: 0.3483527600765228, mean loss: 0.33961032326078555
Epoch: 67, step: 324, loss: 0.3472856879234314, mean loss: 0.33961040232875156
Epoch: 67, step: 325, loss: 0.3160168528556824, mean loss: 0.33961015928170013
Epoch: 67, step: 326, loss: 0.3206075131893158, mean loss: 0.33960996352948697
Epoch: 67, step: 327, loss: 0.3671118915081024, mean loss: 0.33961024683254826
Epoch: 67, step: 328, loss: 0.35568875074386597, mean loss: 0.339610412458844
Epoch: 67, step: 329, loss: 0.32688361406326294, mean loss: 0.33961028136015636
Epoch: 67, step: 330, loss: 0.33101686835289, mean loss: 0.33961019284036315
Epoch: 67, step: 331, loss: 0.3443523049354553, mean loss: 0.3396102416878301
Epoch: 67, step: 332, loss: 0.3507283627986908, mean loss: 0.3396103562120018
Epoch: 67, step: 333, loss: 0.2970830500125885, mean loss: 0.3396099181564797
Epoch: 67, step: 334, loss: 0.3418163061141968, mean loss: 0.3396099408833006
Epoch: 67, step: 335, loss: 0.317930668592453, mean loss: 0.33960971757902503
Epoch: 67, step: 336, loss: 0.3008456230163574, mean loss: 0.33960931829906865
Epoch: 67, step: 337, loss: 0.31351858377456665, mean loss: 0.33960904956068694
Epoch: 67, step: 338, loss: 0.3405536711215973, mean loss: 0.339609059290327
Epoch: 67, step: 339, loss: 0.32860881090164185, mean loss: 0.3396089459884937
Epoch: 67, step: 340, loss: 0.3559367060661316, mean loss: 0.33960911416161405
Epoch: 67, step: 341, loss: 0.4021596312522888, mean loss: 0.33960975841454527
Epoch: 67, step: 342, loss: 0.28676342964172363, mean loss: 0.3396092141176612
Epoch: 67, step: 343, loss: 0.3190181851387024, mean loss: 0.3396090020401576
Epoch: 67, step: 344, loss: 0.3038967549800873, mean loss: 0.33960863422530935
Epoch: 67, step: 345, loss: 0.34425094723701477, mean loss: 0.33960868203787253
Epoch: 67, step: 346, loss: 0.3208690583705902, mean loss: 0.3396084890348995
Epoch: 67, step: 347, loss: 0.39405208826065063, mean loss: 0.33960904975417966
Epoch: 67, step: 348, loss: 0.3028317391872406, mean loss: 0.3396086709854168
Epoch: 67, step: 349, loss: 0.3331651985645294, mean loss: 0.3396086046249107
Epoch: 67, step: 350, loss: 0.370059609413147, mean loss: 0.33960891823272116
Epoch: 67, step: 351, loss: 0.31082314252853394, mean loss: 0.33960862177777057
Epoch: 67, step: 352, loss: 0.31886717677116394, mean loss: 0.339608408170856
Epoch: 67, step: 353, loss: 0.36736708879470825, mean loss: 0.3396086940422142
Epoch: 67, step: 354, loss: 0.3217986822128296, mean loss: 0.33960851062860364
Epoch: 67, step: 355, loss: 0.3564758002758026, mean loss: 0.339608684331949
Epoch: 67, step: 356, loss: 0.3951334059238434, mean loss: 0.3396092561327996
Epoch: 67, step: 357, loss: 0.35818374156951904, mean loss: 0.33960944741331195
Epoch: 67, step: 358, loss: 0.33026260137557983, mean loss: 0.3396093511602505
Epoch: 67, step: 359, loss: 0.3309474289417267, mean loss: 0.33960926196139746
Epoch: 67, step: 360, loss: 0.3513891100883484, mean loss: 0.33960938326681844
Epoch: 67, step: 361, loss: 0.3273748457431793, mean loss: 0.3396092572804368
Epoch: 67, step: 362, loss: 0.34352344274520874, mean loss: 0.3396092975867405
Epoch: 67, step: 363, loss: 0.29554179310798645, mean loss: 0.33960884380652306
Epoch: 67, step: 364, loss: 0.31030914187431335, mean loss: 0.3396085420992137
Epoch: 67, step: 365, loss: 0.3378061354160309, mean loss: 0.33960852353951393
Epoch: 67, step: 366, loss: 0.34358638525009155, mean loss: 0.33960856449983634
Epoch: 67, step: 367, loss: 0.3558018207550049, mean loss: 0.33960873124122043
Epoch: 67, step: 368, loss: 0.35071879625320435, mean loss: 0.339608845639987
Epoch: 67, step: 369, loss: 0.35347723960876465, mean loss: 0.33960898843940596
Epoch: 67, step: 370, loss: 0.31999897956848145, mean loss: 0.33960878652207904
Epoch: 67, step: 371, loss: 0.3130617141723633, mean loss: 0.3396085131790771
Epoch: 67, step: 372, loss: 0.312110960483551, mean loss: 0.3396082300523311
Epoch: 67, step: 373, loss: 0.30635181069374084, mean loss: 0.33960788763331834
Epoch: 67, step: 374, loss: 0.31022846698760986, mean loss: 0.3396075851362719
Epoch: 67, step: 375, loss: 0.327273428440094, mean loss: 0.33960745814236
Epoch: 67, step: 376, loss: 0.33305439352989197, mean loss: 0.3396073906719393
Epoch: 67, step: 377, loss: 0.31245094537734985, mean loss: 0.3396071110717777
Epoch: 67, step: 378, loss: 0.34513044357299805, mean loss: 0.339607167938895
Epoch: 67, step: 379, loss: 0.34110817313194275, mean loss: 0.33960718339278256
Epoch: 67, step: 380, loss: 0.30222728848457336, mean loss: 0.3396067985448493
Epoch: 67, step: 381, loss: 0.3694474399089813, mean loss: 0.33960710576858416
Epoch: 67, step: 382, loss: 0.32314953207969666, mean loss: 0.33960693633170314
Epoch: 67, step: 383, loss: 0.33375483751296997, mean loss: 0.33960687608277573
Epoch: 67, step: 384, loss: 0.3218420445919037, mean loss: 0.33960669319095227
Epoch: 67, step: 385, loss: 0.3666914701461792, mean loss: 0.33960697203025625
Epoch: 67, step: 386, loss: 0.32943660020828247, mean loss: 0.3396068673267835
Epoch: 67, step: 387, loss: 0.35578829050064087, mean loss: 0.33960703391201635
Epoch: 67, step: 388, loss: 0.33805739879608154, mean loss: 0.3396070179589283
Epoch: 67, step: 389, loss: 0.31964999437332153, mean loss: 0.3396068125087071
Epoch: 67, step: 390, loss: 0.32527998089790344, mean loss: 0.33960666502076087
Epoch: 67, step: 391, loss: 0.3704605996608734, mean loss: 0.3396069826441358
Epoch: 67, step: 392, loss: 0.3261827528476715, mean loss: 0.339606844450893
Epoch: 67, step: 393, loss: 0.34936729073524475, mean loss: 0.3396069449269619
Epoch: 67, step: 394, loss: 0.3282068371772766, mean loss: 0.33960682757308414
Epoch: 67, step: 395, loss: 0.3438442349433899, mean loss: 0.339606871192941
Epoch: 67, step: 396, loss: 0.3660525381565094, mean loss: 0.3396071434217429
Epoch: 67, step: 397, loss: 0.34411221742630005, mean loss: 0.3396071897960044
Epoch: 67, step: 398, loss: 0.3375341296195984, mean loss: 0.3396071684565891
Epoch: 67, step: 399, loss: 0.32665833830833435, mean loss: 0.3396070351668647
Epoch: 67, step: 400, loss: 0.33907121419906616, mean loss: 0.3396070296514094
Epoch: 67, step: 401, loss: 0.32150280475616455, mean loss: 0.3396068432980908
Epoch: 67, step: 402, loss: 0.35339075326919556, mean loss: 0.3396069851793887
Epoch: 67, step: 403, loss: 0.3359455466270447, mean loss: 0.33960694749165654
Epoch: 67, step: 404, loss: 0.3057626783847809, mean loss: 0.3396065991311416
Epoch: 67, step: 405, loss: 0.33532801270484924, mean loss: 0.3396065550919211
Epoch: 67, step: 406, loss: 0.3379599153995514, mean loss: 0.33960653814333697
Epoch: 67, step: 407, loss: 0.3620932102203369, mean loss: 0.3396067695924711
Epoch: 67, step: 408, loss: 0.303787499666214, mean loss: 0.3396064009183671
Epoch: 67, step: 409, loss: 0.33339065313339233, mean loss: 0.3396063369427008
Epoch: 67, step: 410, loss: 0.3233107328414917, mean loss: 0.33960616922170633
Epoch: 67, step: 411, loss: 0.33138158917427063, mean loss: 0.33960608457184993
Epoch: 67, step: 412, loss: 0.36145150661468506, mean loss: 0.33960630940920283
Epoch: 67, step: 413, loss: 0.2907750904560089, mean loss: 0.339605806833927
Epoch: 67, step: 414, loss: 0.3808462619781494, mean loss: 0.33960623128001394
Epoch: 67, step: 415, loss: 0.3410968482494354, mean loss: 0.33960624662126143
Epoch: 67, step: 416, loss: 0.3598476052284241, mean loss: 0.3396064549407037
Epoch: 67, step: 417, loss: 0.3611573576927185, mean loss: 0.3396066767353927
Epoch: 67, step: 418, loss: 0.3048524856567383, mean loss: 0.3396063190605537
Epoch: 67, step: 419, loss: 0.34909728169441223, mean loss: 0.3396064167363589
Epoch: 67, step: 420, loss: 0.31708070635795593, mean loss: 0.339606184916433
Epoch: 67, step: 421, loss: 0.3337789475917816, mean loss: 0.3396061249469226
Epoch: 67, step: 422, loss: 0.3710833787918091, mean loss: 0.3396064488836305
Epoch: 67, step: 423, loss: 0.3349136412143707, mean loss: 0.3396064005898044
Epoch: 67, step: 424, loss: 0.31552204489707947, mean loss: 0.33960615273951994
Epoch: 67, step: 425, loss: 0.32610204815864563, mean loss: 0.3396060137712303
Epoch: 67, step: 426, loss: 0.3466750681400299, mean loss: 0.3396060865168374
Epoch: 67, step: 427, loss: 0.34771642088890076, mean loss: 0.33960616997709886
Epoch: 67, step: 428, loss: 0.3458126485347748, mean loss: 0.33960623384487165
Epoch: 67, step: 429, loss: 0.3908797800540924, mean loss: 0.3396067614699124
Epoch: 67, step: 430, loss: 0.30837762355804443, mean loss: 0.3396064401130564
Epoch: 67, step: 431, loss: 0.3910294771194458, mean loss: 0.33960696926552614
Epoch: 67, step: 432, loss: 0.3353005051612854, mean loss: 0.3396069249516777
Epoch: 67, step: 433, loss: 0.3536299467086792, mean loss: 0.33960706924817047
Epoch: 67, step: 434, loss: 0.34499669075012207, mean loss: 0.3396071247066509
Epoch: 67, step: 435, loss: 0.3247133493423462, mean loss: 0.3396069714532824
Epoch: 67, step: 436, loss: 0.3069581687450409, mean loss: 0.3396066355084071
Epoch: 67, step: 437, loss: 0.3645854890346527, mean loss: 0.33960689252951637
Epoch: 67, step: 438, loss: 0.3519580662250519, mean loss: 0.33960701961620177
Epoch: 67, step: 439, loss: 0.3085659444332123, mean loss: 0.3396067002241453
Epoch: 67, step: 440, loss: 0.34456920623779297, mean loss: 0.33960675128451234
Epoch: 67, step: 441, loss: 0.30734899640083313, mean loss: 0.3396064193804596
Epoch: 67, step: 442, loss: 0.29084184765815735, mean loss: 0.3396059176408775
Epoch: 67, step: 443, loss: 0.28086698055267334, mean loss: 0.3396053132810836
Epoch: 67, step: 444, loss: 0.3829951882362366, mean loss: 0.33960575971112444
Epoch: 67, step: 445, loss: 0.329071968793869, mean loss: 0.33960565133209986
Epoch: 67, step: 446, loss: 0.33084094524383545, mean loss: 0.3396055611555878
Epoch: 67, step: 447, loss: 0.32452672719955444, mean loss: 0.33960540601716693
Epoch: 67, step: 448, loss: 0.3509902358055115, mean loss: 0.3396055231486606
Epoch: 67, step: 449, loss: 0.3672778904438019, mean loss: 0.33960580784965544
Epoch: 67, step: 450, loss: 0.31634265184402466, mean loss: 0.33960556851431245
Epoch: 67, step: 451, loss: 0.35727396607398987, mean loss: 0.33960575028794987
Epoch: 67, step: 452, loss: 0.3715812563896179, mean loss: 0.33960607925067765
Epoch: 67, step: 453, loss: 0.32716265320777893, mean loss: 0.3396059512345253
Epoch: 67, step: 454, loss: 0.31438973546028137, mean loss: 0.33960569181644384
Epoch: 67, step: 455, loss: 0.35375022888183594, mean loss: 0.3396058373303843
Epoch: 67, step: 456, loss: 0.327778160572052, mean loss: 0.3396057156527262
Epoch: 67, step: 457, loss: 0.3031364381313324, mean loss: 0.33960534047755675
Epoch: 67, step: 458, loss: 0.3594990074634552, mean loss: 0.3396055451301742
Epoch: 67, step: 459, loss: 0.31509140133857727, mean loss: 0.33960529294780456
Epoch: 67, step: 460, loss: 0.36601540446281433, mean loss: 0.33960556463161484
Epoch: 67, step: 461, loss: 0.31704941391944885, mean loss: 0.3396053325963231
Epoch: 67, step: 462, loss: 0.3236163258552551, mean loss: 0.33960516811898267
Epoch: 67, step: 463, loss: 0.3368327021598816, mean loss: 0.3396051395991913
Epoch: 67, step: 464, loss: 0.37966346740722656, mean loss: 0.33960555166679346
Epoch: 67, step: 465, loss: 0.37703123688697815, mean loss: 0.3396059366492571
Epoch: 67, step: 466, loss: 0.305127888917923, mean loss: 0.339605581991563
Epoch: 67, step: 467, loss: 0.33696359395980835, mean loss: 0.33960555481508964
Epoch: 67, step: 468, loss: 0.3031732439994812, mean loss: 0.33960518006262025
Epoch: 67, step: 469, loss: 0.30393555760383606, mean loss: 0.3396048131591409
Epoch: 67, step: 470, loss: 0.3362700045108795, mean loss: 0.33960477885711504
Epoch: 67, step: 471, loss: 0.3691990375518799, mean loss: 0.3396050832621623
Epoch: 67, step: 472, loss: 0.3568693995475769, mean loss: 0.33960526084021936
Epoch: 67, step: 473, loss: 0.3780146837234497, mean loss: 0.339605655909472
Epoch: 67, step: 474, loss: 0.28831422328948975, mean loss: 0.33960512834467127
Epoch: 67, step: 475, loss: 0.33522552251815796, mean loss: 0.3396050832981208
Epoch: 67, step: 476, loss: 0.34621375799179077, mean loss: 0.3396051512711184
Epoch: 67, step: 477, loss: 0.34954163432121277, mean loss: 0.33960525347097287
Epoch: 67, step: 478, loss: 0.3667675852775574, mean loss: 0.33960553284122813
Epoch: 67, step: 479, loss: 0.35970091819763184, mean loss: 0.3396057395243375
Epoch: 67, step: 480, loss: 0.33287131786346436, mean loss: 0.33960567026082905
Epoch: 67, step: 481, loss: 0.31040310859680176, mean loss: 0.339605369915651
Epoch: 67, step: 482, loss: 0.35322508215904236, mean loss: 0.33960550999147293
Epoch: 67, step: 483, loss: 0.31355100870132446, mean loss: 0.3396052420292661
Epoch: 67, step: 484, loss: 0.31677618622779846, mean loss: 0.33960500724214854
Epoch: 67, step: 485, loss: 0.3635891079902649, mean loss: 0.3396052539058747
Epoch: 67, step: 486, loss: 0.3619418740272522, mean loss: 0.3396054836237759
Epoch: 67, step: 487, loss: 0.3419908583164215, mean loss: 0.33960550815558194
Epoch: 67, step: 488, loss: 0.29847267270088196, mean loss: 0.33960508513928717
Epoch: 67, step: 489, loss: 0.3528037369251251, mean loss: 0.3396052208748205
Epoch: 67, step: 490, loss: 0.3290659487247467, mean loss: 0.3396051124895826
Epoch: 67, step: 491, loss: 0.3568134307861328, mean loss: 0.33960528945706814
Epoch: 67, step: 492, loss: 0.33162721991539, mean loss: 0.33960520741277056
Epoch: 67, step: 493, loss: 0.3389774262905121, mean loss: 0.3396052009569066
Epoch: 67, step: 494, loss: 0.29417094588279724, mean loss: 0.33960473373299255
Epoch: 67, step: 495, loss: 0.3295484781265259, mean loss: 0.339604630320385
Epoch: 67, step: 496, loss: 0.33211731910705566, mean loss: 0.33960455332607975
Epoch: 67, step: 497, loss: 0.3087337911128998, mean loss: 0.33960423587587907
Epoch: 67, step: 498, loss: 0.30931612849235535, mean loss: 0.3396039244204369
Epoch: 67, step: 499, loss: 0.33898040652275085, mean loss: 0.33960391800880996
Epoch: 67, step: 500, loss: 0.3135996162891388, mean loss: 0.33960365060964165
Epoch: 67, step: 501, loss: 0.3162214756011963, mean loss: 0.33960341017596546
Epoch: 67, step: 502, loss: 0.3227827250957489, mean loss: 0.3396032372144013
Epoch: 67, step: 503, loss: 0.3986263871192932, mean loss: 0.33960384412376976
Epoch: 67, step: 504, loss: 0.3317052125930786, mean loss: 0.3396037629064137
Epoch: 67, step: 505, loss: 0.3058217465877533, mean loss: 0.3396034155477825
Epoch: 67, step: 506, loss: 0.45372867584228516, mean loss: 0.3396045890119776
Epoch: 67, step: 507, loss: 0.3097657561302185, mean loss: 0.3396042822048615
Epoch: 67, step: 508, loss: 0.3225509226322174, mean loss: 0.3396041068616001
Epoch: 67, step: 509, loss: 0.3676125705242157, mean loss: 0.33960439484267785
Epoch: 67, step: 510, loss: 0.3100667893886566, mean loss: 0.33960409114219303
Epoch: 67, step: 511, loss: 0.3174758553504944, mean loss: 0.33960386362588835
Epoch: 67, step: 512, loss: 0.3200649917125702, mean loss: 0.3396036627347612
Epoch: 67, step: 513, loss: 0.329757422208786, mean loss: 0.33960356150056364
Epoch: 67, step: 514, loss: 0.30891644954681396, mean loss: 0.3396032459940303
Epoch: 67, step: 515, loss: 0.3203285336494446, mean loss: 0.3396030478250022
Epoch: 67, step: 516, loss: 0.34302064776420593, mean loss: 0.3396030829619985
Epoch: 67, step: 517, loss: 0.3103439509868622, mean loss: 0.33960278214637973
Epoch: 67, step: 518, loss: 0.3313208222389221, mean loss: 0.3396026969997225
Epoch: 67, step: 519, loss: 0.3473402261734009, mean loss: 0.33960277654828086
Epoch: 67, step: 520, loss: 0.3107476830482483, mean loss: 0.3396024798957657
Epoch: 67, step: 521, loss: 0.3272467851638794, mean loss: 0.33960235287104346
Epoch: 67, step: 522, loss: 0.31299975514411926, mean loss: 0.3396020793815376
Epoch: 67, step: 523, loss: 0.3429512083530426, mean loss: 0.3396021138120928
Epoch: 67, step: 524, loss: 0.325167715549469, mean loss: 0.3396019654214987
Epoch: 67, step: 525, loss: 0.3111487925052643, mean loss: 0.3396016729160716
Epoch: 67, step: 526, loss: 0.3376617729663849, mean loss: 0.33960165297364087
Epoch: 67, step: 527, loss: 0.30790984630584717, mean loss: 0.3396013271809822
Epoch: 67, step: 528, loss: 0.336660236120224, mean loss: 0.33960129694679464
Epoch: 67, step: 529, loss: 0.33644115924835205, mean loss: 0.3396012644611586
Epoch: 67, step: 530, loss: 0.29498961567878723, mean loss: 0.3396008058663048
Epoch: 67, step: 531, loss: 0.39430367946624756, mean loss: 0.33960136819025216
Epoch: 67, step: 532, loss: 0.32880476117134094, mean loss: 0.33960125720653467
Epoch: 67, step: 533, loss: 0.332184761762619, mean loss: 0.33960118096945646
Epoch: 67, step: 534, loss: 0.3560052216053009, mean loss: 0.3396013495913188
Epoch: 67, step: 535, loss: 0.36214348673820496, mean loss: 0.3396015813060627
Epoch: 67, step: 536, loss: 0.33249154686927795, mean loss: 0.3396015082214717
Epoch: 67, step: 537, loss: 0.33415544033050537, mean loss: 0.3396014522414963
Epoch: 67, step: 538, loss: 0.34725603461265564, mean loss: 0.3396015309219199
Epoch: 67, step: 539, loss: 0.3543739914894104, mean loss: 0.33960168276449626
Epoch: 67, step: 540, loss: 0.3158362805843353, mean loss: 0.3396014384881425
Epoch: 67, step: 541, loss: 0.2968194782733917, mean loss: 0.33960099875168226
Epoch: 67, step: 542, loss: 0.30571356415748596, mean loss: 0.33960065044161664
Epoch: 67, step: 543, loss: 0.3294789493083954, mean loss: 0.3396005464073576
Epoch: 67, step: 544, loss: 0.29930180311203003, mean loss: 0.33960013220753543
Epoch: 67, step: 545, loss: 0.3453352749347687, mean loss: 0.33960019115405554
Epoch: 67, step: 546, loss: 0.3047342300415039, mean loss: 0.3395998328009941
Epoch: 67, step: 547, loss: 0.31461095809936523, mean loss: 0.33959957596746854
Epoch: 67, step: 548, loss: 0.28944915533065796, mean loss: 0.33959906053101485
Epoch: 67, step: 549, loss: 0.3057829737663269, mean loss: 0.3395987129792999
Epoch: 67, step: 550, loss: 0.3283294141292572, mean loss: 0.33959859715797747
Epoch: 67, step: 551, loss: 0.3735223114490509, mean loss: 0.3395989458086896
Epoch: 67, step: 552, loss: 0.3184404671192169, mean loss: 0.33959872835482285
Epoch: 67, step: 553, loss: 0.32855111360549927, mean loss: 0.33959861481538123
Epoch: 67, step: 554, loss: 0.32073700428009033, mean loss: 0.33959842097130105
Epoch: 67, step: 555, loss: 0.32854998111724854, mean loss: 0.33959830742571345
Epoch: 67, step: 556, loss: 0.36568671464920044, mean loss: 0.3395985755353401
Epoch: 67, step: 557, loss: 0.3361242413520813, mean loss: 0.3395985398300991
Epoch: 67, step: 558, loss: 0.3330322802066803, mean loss: 0.3395984723502711
Epoch: 67, step: 559, loss: 0.3589160144329071, mean loss: 0.33959867086983864
Epoch: 67, step: 560, loss: 0.33828461170196533, mean loss: 0.33959865736585476
Epoch: 67, step: 561, loss: 0.32520174980163574, mean loss: 0.3395985094169537
Epoch: 67, step: 562, loss: 0.33746886253356934, mean loss: 0.3395984875319984
Epoch: 67, step: 563, loss: 0.31895264983177185, mean loss: 0.3395982753707264
Epoch: 67, step: 564, loss: 0.31467312574386597, mean loss: 0.33959801923691463
Epoch: 67, step: 565, loss: 0.3133179545402527, mean loss: 0.339597749182609
Epoch: 67, step: 566, loss: 0.3457377851009369, mean loss: 0.33959781227705405
Epoch: 67, step: 567, loss: 0.3301880955696106, mean loss: 0.3395977155846632
Epoch: 67, step: 568, loss: 0.31797143816947937, mean loss: 0.33959749335959033
Epoch: 67, step: 569, loss: 0.31538093090057373, mean loss: 0.3395972445200903
Epoch: 67, step: 570, loss: 0.33918875455856323, mean loss: 0.33959724032265753
Epoch: 67, step: 571, loss: 0.30620232224464417, mean loss: 0.3395968971771779
Epoch: 67, step: 572, loss: 0.30995795130729675, mean loss: 0.33959659262887004
Epoch: 67, step: 573, loss: 0.2990686595439911, mean loss: 0.3395961761975073
Epoch: 67, step: 574, loss: 0.3181183934211731, mean loss: 0.33959595551192656
Epoch: 67, step: 575, loss: 0.35045167803764343, mean loss: 0.3395960670540182
Epoch: 67, step: 576, loss: 0.3240399956703186, mean loss: 0.33959590721768235
Epoch: 67, step: 577, loss: 0.3150911331176758, mean loss: 0.33959565543733483
Epoch: 67, step: 578, loss: 0.3283229470252991, mean loss: 0.339595539614301
Epoch: 67, step: 579, loss: 0.3668651580810547, mean loss: 0.3395958197969665
Epoch: 67, step: 580, loss: 0.35140183568000793, mean loss: 0.3395959410970506
Epoch: 67, step: 581, loss: 0.3224976360797882, mean loss: 0.3395957654235171
Epoch: 67, step: 582, loss: 0.32952138781547546, mean loss: 0.33959566191715623
Epoch: 67, step: 583, loss: 0.3048473000526428, mean loss: 0.3395953049085479
Epoch: 67, step: 584, loss: 0.36414363980293274, mean loss: 0.3395955571183318
Epoch: 67, step: 585, loss: 0.32382962107658386, mean loss: 0.3395953951406463
Epoch: 67, step: 586, loss: 0.35658887028694153, mean loss: 0.33959556972815486
Epoch: 67, step: 587, loss: 0.37964481115341187, mean loss: 0.3395959811816913
Epoch: 67, step: 588, loss: 0.3264802098274231, mean loss: 0.3395958464356918
Epoch: 67, step: 589, loss: 0.3220116198062897, mean loss: 0.3395956657844905
Epoch: 67, step: 590, loss: 0.364146888256073, mean loss: 0.3395959180083933
Epoch: 67, step: 591, loss: 0.34588515758514404, mean loss: 0.33959598261944296
Epoch: 67, step: 592, loss: 0.32707589864730835, mean loss: 0.33959585399857434
Epoch: 67, step: 593, loss: 0.34633868932724, mean loss: 0.33959592326811194
Epoch: 67, step: 594, loss: 0.3017761707305908, mean loss: 0.33959553474759646
Epoch: 67, step: 595, loss: 0.33116477727890015, mean loss: 0.3395954481397165
Epoch: 67, step: 596, loss: 0.3635483384132385, mean loss: 0.3395956942015612
Epoch: 67, step: 597, loss: 0.32495301961898804, mean loss: 0.3395955437826988
Epoch: 67, step: 598, loss: 0.30449923872947693, mean loss: 0.3395951832548443
Epoch: 67, step: 599, loss: 0.3303208351135254, mean loss: 0.3395950879848013
Epoch: 67, step: 600, loss: 0.3270701467990875, mean loss: 0.3395949593246077
Epoch: 67, step: 601, loss: 0.34738752245903015, mean loss: 0.3395950393714812
Epoch: 67, step: 602, loss: 0.3239269554615021, mean loss: 0.33959487842722885
Epoch: 67, step: 603, loss: 0.3494061231613159, mean loss: 0.33959497920836057
Epoch: 67, step: 604, loss: 0.32061484456062317, mean loss: 0.3395947842463702
Epoch: 67, step: 605, loss: 0.2912381589412689, mean loss: 0.3395942875371923
Epoch: 67, step: 606, loss: 0.29923200607299805, mean loss: 0.3395938729485069
Epoch: 67, step: 607, loss: 0.32656198740005493, mean loss: 0.33959373909044427
Epoch: 67, step: 608, loss: 0.37966471910476685, mean loss: 0.33959415067851717
Epoch: 67, step: 609, loss: 0.3200712203979492, mean loss: 0.3395939501512849
Epoch: 67, step: 610, loss: 0.33101341128349304, mean loss: 0.3395938620183042
Epoch: 67, step: 611, loss: 0.34741443395614624, mean loss: 0.33959394234463885
Epoch: 67, step: 612, loss: 0.3033443093299866, mean loss: 0.3395935700227336
Epoch: 67, step: 613, loss: 0.3277647793292999, mean loss: 0.33959344852984424
Epoch: 67, step: 614, loss: 0.3862822949886322, mean loss: 0.3395939280636143
Epoch: 67, step: 615, loss: 0.31758683919906616, mean loss: 0.3395937020346009
Epoch: 67, step: 616, loss: 0.305646151304245, mean loss: 0.33959335337182955
Epoch: 67, step: 617, loss: 0.31442195177078247, mean loss: 0.33959309484830386
Epoch: 67, step: 618, loss: 0.31335100531578064, mean loss: 0.3395928253310184
Epoch: 67, step: 619, loss: 0.31295621395111084, mean loss: 0.3395925517646375
Epoch: 67, step: 620, loss: 0.3076648414134979, mean loss: 0.33959222386037274
Epoch: 67, step: 621, loss: 0.31754839420318604, mean loss: 0.3395919974679556
Epoch: 67, step: 622, loss: 0.3029308319091797, mean loss: 0.33959162095784934
Epoch: 67, step: 623, loss: 0.34516873955726624, mean loss: 0.3395916782342594
Epoch: 67, step: 624, loss: 0.3239377737045288, mean loss: 0.3395915174719893
Epoch: 67, step: 625, loss: 0.3452111780643463, mean loss: 0.33959157518411565
Epoch: 67, step: 626, loss: 0.3326268494129181, mean loss: 0.3395915036593324
Epoch: 67, step: 627, loss: 0.3594296872615814, mean loss: 0.3395917073869819
Epoch: 67, step: 628, loss: 0.32266050577163696, mean loss: 0.3395915335142849
Epoch: 67, step: 629, loss: 0.3375649154186249, mean loss: 0.3395915127024168
Epoch: 67, step: 630, loss: 0.3410489857196808, mean loss: 0.3395915276694324
Epoch: 67, step: 631, loss: 0.31822070479393005, mean loss: 0.33959130821140326
Epoch: 67, step: 632, loss: 0.3659040927886963, mean loss: 0.3395915784159049
Epoch: 67, step: 633, loss: 0.32535117864608765, mean loss: 0.33959143218354404
Epoch: 67, step: 634, loss: 0.30794844031333923, mean loss: 0.33959110725011754
Epoch: 67, step: 635, loss: 0.34159937500953674, mean loss: 0.33959112787227064
Epoch: 67, step: 636, loss: 0.3138050138950348, mean loss: 0.33959086308699593
Epoch: 67, step: 637, loss: 0.3024440407752991, mean loss: 0.3395904816479563
Epoch: 67, step: 638, loss: 0.32503148913383484, mean loss: 0.3395903321516938
Epoch: 67, step: 639, loss: 0.3299340009689331, mean loss: 0.3395902329985006
Epoch: 67, step: 640, loss: 0.3049579858779907, mean loss: 0.33958987739112073
Epoch: 67, step: 641, loss: 0.30820706486701965, mean loss: 0.3395895551525693
Epoch: 67, step: 642, loss: 0.3492693305015564, mean loss: 0.3395896545434303
Epoch: 67, step: 643, loss: 0.3361271321773529, mean loss: 0.33958961899099926
Epoch: 67, step: 644, loss: 0.33947718143463135, mean loss: 0.3395896178365266
Epoch: 67, step: 645, loss: 0.34536296129226685, mean loss: 0.3395896771147517
Epoch: 67, step: 646, loss: 0.35144859552383423, mean loss: 0.33958979887581137
Epoch: 67, step: 647, loss: 0.3421863615512848, mean loss: 0.3395898255356606
Epoch: 67, step: 648, loss: 0.3181944787502289, mean loss: 0.3395896058641431
Epoch: 67, step: 649, loss: 0.37340497970581055, mean loss: 0.3395899530517018
Epoch: 67, step: 650, loss: 0.35142919421195984, mean loss: 0.33959007460573376
Epoch: 67, step: 651, loss: 0.31549298763275146, mean loss: 0.33958982720237674
Epoch: 67, step: 652, loss: 0.3384974002838135, mean loss: 0.33958981598660976
Epoch: 67, step: 653, loss: 0.34260842204093933, mean loss: 0.339589846977822
Epoch: 67, step: 654, loss: 0.33016520738601685, mean loss: 0.33958975021858884
Epoch: 67, step: 655, loss: 0.3692801594734192, mean loss: 0.3395900550357345
Epoch: 67, step: 656, loss: 0.32054319977760315, mean loss: 0.33958985949284387
Epoch: 67, step: 657, loss: 0.3192203640937805, mean loss: 0.33958965037332967
Epoch: 67, step: 658, loss: 0.3082515299320221, mean loss: 0.33958932864983504
Epoch: 67, step: 659, loss: 0.3621121942996979, mean loss: 0.3395895598717639
Epoch: 67, step: 660, loss: 0.31048277020454407, mean loss: 0.33958926106169846
Epoch: 67, step: 661, loss: 0.32175204157829285, mean loss: 0.33958907794682847
Epoch: 67, step: 662, loss: 0.3434465229511261, mean loss: 0.3395891175465144
Epoch: 67, step: 663, loss: 0.3593331277370453, mean loss: 0.33958932023211974
Epoch: 67, step: 664, loss: 0.3234829604625702, mean loss: 0.3395891548911512
Epoch: 67, step: 665, loss: 0.33802899718284607, mean loss: 0.339589138875407
Epoch: 67, step: 666, loss: 0.29007309675216675, mean loss: 0.33958863057543137
Epoch: 67, step: 667, loss: 0.2972008287906647, mean loss: 0.3395881954538724
Epoch: 67, step: 668, loss: 0.3216785788536072, mean loss: 0.3395880116089932
Epoch: 67, step: 669, loss: 0.3432646095752716, mean loss: 0.339588049349431
Epoch: 67, step: 670, loss: 0.3185599744319916, mean loss: 0.3395878334975446
Epoch: 67, step: 671, loss: 0.326260507106781, mean loss: 0.3395876966947691
Epoch: 67, step: 672, loss: 0.33770567178726196, mean loss: 0.33958767737629664
Epoch: 67, step: 673, loss: 0.32131528854370117, mean loss: 0.33958748981713305
Epoch: 67, step: 674, loss: 0.3238981366157532, mean loss: 0.3395873287735068
Epoch: 67, step: 675, loss: 0.2960651218891144, mean loss: 0.33958688204367754
Epoch: 67, step: 676, loss: 0.3284662961959839, mean loss: 0.3395867678985829
Epoch: 67, step: 677, loss: 0.3137608468532562, mean loss: 0.3395865028161506
Epoch: 67, step: 678, loss: 0.32108601927757263, mean loss: 0.3395863129254269
Epoch: 67, step: 679, loss: 0.35132884979248047, mean loss: 0.33958643345070577
Epoch: 67, step: 680, loss: 0.3315295875072479, mean loss: 0.33958635075616983
Epoch: 67, step: 681, loss: 0.3034006655216217, mean loss: 0.33958597935428914
Epoch: 67, step: 682, loss: 0.3063434064388275, mean loss: 0.3395856381633651
Epoch: 67, step: 683, loss: 0.36137136816978455, mean loss: 0.339585861762696
Epoch: 67, step: 684, loss: 0.32803842425346375, mean loss: 0.3395857432459973
Epoch: 67, step: 685, loss: 0.3415469229221344, mean loss: 0.3395857633742859
Epoch: 67, step: 686, loss: 0.34251686930656433, mean loss: 0.339585793456966
Epoch: 67, step: 687, loss: 0.33606207370758057, mean loss: 0.3395857572925119
Epoch: 67, step: 688, loss: 0.30313271284103394, mean loss: 0.3395853831733944
Epoch: 67, step: 689, loss: 0.3435641825199127, mean loss: 0.33958542400755914
Epoch: 67, step: 690, loss: 0.40241312980651855, mean loss: 0.33958606879769243
Epoch: 67, step: 691, loss: 0.31835588812828064, mean loss: 0.33958585091816995
Epoch: 67, step: 692, loss: 0.3009233772754669, mean loss: 0.339585454139877
Epoch: 67, step: 693, loss: 0.32885071635246277, mean loss: 0.339585343974468
Epoch: 67, step: 694, loss: 0.3631134331226349, mean loss: 0.33958558542936107
Epoch: 67, step: 695, loss: 0.3470298945903778, mean loss: 0.3395856618251285
Epoch: 67, step: 696, loss: 0.35217806696891785, mean loss: 0.33958579105089837
Epoch: 67, step: 697, loss: 0.3077258765697479, mean loss: 0.339585464101465
Epoch: 67, step: 698, loss: 0.3266758322715759, mean loss: 0.3395853316229708
Epoch: 67, step: 699, loss: 0.29308608174324036, mean loss: 0.3395848544530968
Epoch: 67, step: 700, loss: 0.3105964958667755, mean loss: 0.33958455698099765
Epoch: 67, step: 701, loss: 0.3023495376110077, mean loss: 0.33958417488741766
Epoch: 67, step: 702, loss: 0.34922653436660767, mean loss: 0.3395842738331389
Epoch: 67, step: 703, loss: 0.3301261067390442, mean loss: 0.33958417677851616
Epoch: 67, step: 704, loss: 0.3274538218975067, mean loss: 0.33958405230461713
Epoch: 67, step: 705, loss: 0.33524367213249207, mean loss: 0.33958400776688474
Epoch: 67, step: 706, loss: 0.3318594992160797, mean loss: 0.3395839285045734
Epoch: 67, step: 707, loss: 0.32329750061035156, mean loss: 0.33958376138887103
Epoch: 67, step: 708, loss: 0.3202439844608307, mean loss: 0.33958356294466563
Epoch: 67, step: 709, loss: 0.3814511001110077, mean loss: 0.3395839925403598
Epoch: 67, step: 710, loss: 0.33145323395729065, mean loss: 0.3395839091128818
Epoch: 67, step: 711, loss: 0.35389477014541626, mean loss: 0.339584055951185
Epoch: 67, step: 712, loss: 0.32613688707351685, mean loss: 0.33958391797631426
Epoch: 67, step: 713, loss: 0.31410324573516846, mean loss: 0.33958365653419076
Epoch: 67, step: 714, loss: 0.2994745671749115, mean loss: 0.3395832450027444
Epoch: 67, step: 715, loss: 0.31962016224861145, mean loss: 0.3395830401775499
Epoch: 67, step: 716, loss: 0.33421581983566284, mean loss: 0.3395829851093681
Epoch: 67, step: 717, loss: 0.3365228474140167, mean loss: 0.3395829537123917
Epoch: 67, step: 718, loss: 0.3599798083305359, mean loss: 0.33958316298173025
Epoch: 67, step: 719, loss: 0.35844480991363525, mean loss: 0.33958335649803234
Epoch: 67, step: 720, loss: 0.3656913936138153, mean loss: 0.3395836243579377
Epoch: 67, step: 721, loss: 0.34537801146507263, mean loss: 0.33958368380584075
Epoch: 67, step: 722, loss: 0.31363242864608765, mean loss: 0.3395834175599301
Epoch: 67, step: 723, loss: 0.29777586460113525, mean loss: 0.3395829886413385
Epoch: 67, step: 724, loss: 0.3480283319950104, mean loss: 0.33958307528423815
Epoch: 67, step: 725, loss: 0.3170856535434723, mean loss: 0.3395828444799032
Epoch: 67, step: 726, loss: 0.30177634954452515, mean loss: 0.33958245662152997
Epoch: 67, step: 727, loss: 0.3305724859237671, mean loss: 0.33958236418882143
Epoch: 67, step: 728, loss: 0.32746610045433044, mean loss: 0.33958223989012803
Epoch: 67, step: 729, loss: 0.3386082947254181, mean loss: 0.33958222989869236
Epoch: 67, step: 730, loss: 0.3076581358909607, mean loss: 0.3395819024015493
Epoch: 67, step: 731, loss: 0.32006868720054626, mean loss: 0.3395817022249469
Epoch: 67, step: 732, loss: 0.3427284359931946, mean loss: 0.33958173450542994
Epoch: 67, step: 733, loss: 0.38317441940307617, mean loss: 0.339582181692448
Epoch: 67, step: 734, loss: 0.33409032225608826, mean loss: 0.3395821253558618
Epoch: 67, step: 735, loss: 0.3411765396595001, mean loss: 0.339582141711513
Epoch: 67, step: 736, loss: 0.30681112408638, mean loss: 0.33958180554679407
Epoch: 67, step: 737, loss: 0.3281760811805725, mean loss: 0.3395816885482059
Epoch: 67, step: 738, loss: 0.32638871669769287, mean loss: 0.33958155321763006
Epoch: 67, step: 739, loss: 0.30914735794067383, mean loss: 0.3395812410336148
Epoch: 67, step: 740, loss: 0.3455982506275177, mean loss: 0.339581302753497
Epoch: 67, step: 741, loss: 0.3342972993850708, mean loss: 0.3395812485530317
Epoch: 67, step: 742, loss: 0.3656824231147766, mean loss: 0.3395815162820996
Epoch: 67, step: 743, loss: 0.3627258241176605, mean loss: 0.3395817536790946
Epoch: 67, step: 744, loss: 0.335616797208786, mean loss: 0.33958171300995454
Epoch: 67, step: 745, loss: 0.3184400796890259, mean loss: 0.3395814961593451
Epoch: 67, step: 746, loss: 0.31163251399993896, mean loss: 0.33958120948841675
Epoch: 67, step: 747, loss: 0.31007033586502075, mean loss: 0.3395809068003719
Epoch: 67, step: 748, loss: 0.3764878213405609, mean loss: 0.33958128534447624
Epoch: 67, step: 749, loss: 0.3387565314769745, mean loss: 0.33958127688528866
Epoch: 67, step: 750, loss: 0.3058079779148102, mean loss: 0.3395809304889259
Epoch: 67, step: 751, loss: 0.3444851040840149, mean loss: 0.33958098078814225
Epoch: 67, step: 752, loss: 0.31518521904945374, mean loss: 0.3395807305777676
Epoch: 67, step: 753, loss: 0.3474670946598053, mean loss: 0.3395808114618939
Epoch: 67, step: 754, loss: 0.299268901348114, mean loss: 0.3395803980191269
Epoch: 67, step: 755, loss: 0.3565233647823334, mean loss: 0.3395805717860161
Epoch: 67, step: 756, loss: 0.3177359402179718, mean loss: 0.33958034775000184
Epoch: 67, step: 757, loss: 0.3629039227962494, mean loss: 0.33958058695143606
Epoch: 67, step: 758, loss: 0.2994830012321472, mean loss: 0.33958017572367066
Epoch: 67, step: 759, loss: 0.3031913936138153, mean loss: 0.33957980253601316
Epoch: 67, step: 760, loss: 0.36511874198913574, mean loss: 0.3395800644496771
Epoch: 67, step: 761, loss: 0.3325909674167633, mean loss: 0.33957999277398193
Epoch: 67, step: 762, loss: 0.35957950353622437, mean loss: 0.33958019787402977
Epoch: 67, step: 763, loss: 0.3082062602043152, mean loss: 0.33957987612965296
Epoch: 67, step: 764, loss: 0.37197136878967285, mean loss: 0.3395802083058003
Epoch: 67, step: 765, loss: 0.3341122269630432, mean loss: 0.339580152231992
Epoch: 67, step: 766, loss: 0.38072624802589417, mean loss: 0.3395805741783161
Epoch: 67, step: 767, loss: 0.3385930359363556, mean loss: 0.3395805640513806
Epoch: 67, step: 768, loss: 0.37674176692962646, mean loss: 0.33958094512547926
Epoch: 67, step: 769, loss: 0.281707227230072, mean loss: 0.33958035165844863
Epoch: 67, step: 770, loss: 0.33247819542884827, mean loss: 0.33958027883001285
Epoch: 67, step: 771, loss: 0.3880442678928375, mean loss: 0.33958077579462587
Epoch: 67, step: 772, loss: 0.32046547532081604, mean loss: 0.33958057978248
Epoch: 67, step: 773, loss: 0.3232913911342621, mean loss: 0.33958041275156753
Epoch: 67, step: 774, loss: 0.35796135663986206, mean loss: 0.3395806012296075
Epoch: 67, step: 775, loss: 0.3096993863582611, mean loss: 0.33958029483102997
Epoch: 67, step: 776, loss: 0.32198813557624817, mean loss: 0.33958011444488023
Epoch: 67, step: 777, loss: 0.3677269518375397, mean loss: 0.3395804030534297
Epoch: 67, step: 778, loss: 0.3369887173175812, mean loss: 0.3395803764793965
Epoch: 67, step: 779, loss: 0.3581989109516144, mean loss: 0.3395805673839005
Epoch: 67, step: 780, loss: 0.3484419286251068, mean loss: 0.33958065824263217
Epoch: 67, step: 781, loss: 0.3112553656101227, mean loss: 0.3395803678161723
Epoch: 67, step: 782, loss: 0.3158600926399231, mean loss: 0.3395801246086262
Epoch: 67, step: 783, loss: 0.3265492022037506, mean loss: 0.3395799910019904
Epoch: 67, step: 784, loss: 0.4041668474674225, mean loss: 0.33958065320715647
Epoch: 67, step: 785, loss: 0.32295525074005127, mean loss: 0.3395804827496497
Epoch: 67, step: 786, loss: 0.3436535894870758, mean loss: 0.33958052451011245
Epoch: 67, step: 787, loss: 0.36006081104278564, mean loss: 0.3395807344868034
Epoch: 67, step: 788, loss: 0.35310497879981995, mean loss: 0.33958087314438273
Epoch: 67, step: 789, loss: 0.3272249102592468, mean loss: 0.3395807464659304
Epoch: 67, step: 790, loss: 0.2968362867832184, mean loss: 0.3395803082365075
Epoch: 67, step: 791, loss: 0.33919039368629456, mean loss: 0.33958030423902386
Epoch: 67, step: 792, loss: 0.291608989238739, mean loss: 0.3395798124323477
Epoch: 67, step: 793, loss: 0.3503810167312622, mean loss: 0.3395799231662295
Epoch: 67, step: 794, loss: 0.3794487416744232, mean loss: 0.3395803318969278
Epoch: 67, step: 795, loss: 0.3431079387664795, mean loss: 0.3395803680611908
Epoch: 67, step: 796, loss: 0.3230358362197876, mean loss: 0.3395801984519659
Epoch: 67, step: 797, loss: 0.3063049614429474, mean loss: 0.3395798573284241
Epoch: 67, step: 798, loss: 0.2993825376033783, mean loss: 0.33957944524686623
Epoch: 67, step: 799, loss: 0.3701559007167816, mean loss: 0.3395797586972237
Epoch: 67, step: 800, loss: 0.33542537689208984, mean loss: 0.33957971610958254
Epoch: 67, step: 801, loss: 0.33138689398765564, mean loss: 0.3395796321237074
Epoch: 67, step: 802, loss: 0.3240853250026703, mean loss: 0.3395794732908187
Epoch: 67, step: 803, loss: 0.3251997232437134, mean loss: 0.33957932588481937
Epoch: 67, step: 804, loss: 0.33558979630470276, mean loss: 0.3395792849887979
Epoch: 67, step: 805, loss: 0.320078045129776, mean loss: 0.33957908508679635
Epoch: 67, step: 806, loss: 0.33513376116752625, mean loss: 0.3395790395194352
Epoch: 67, step: 807, loss: 0.32128944993019104, mean loss: 0.3395788520415805
Epoch: 67, step: 808, loss: 0.3120752274990082, mean loss: 0.33957857011794057
Epoch: 67, step: 809, loss: 0.3801918625831604, mean loss: 0.33957898641688544
Epoch: 67, step: 810, loss: 0.3191651701927185, mean loss: 0.3395787771710319
Epoch: 67, step: 811, loss: 0.32109907269477844, mean loss: 0.3395785877521668
Epoch: 67, step: 812, loss: 0.31682419776916504, mean loss: 0.3395783545197278
Epoch: 67, step: 813, loss: 0.3389081656932831, mean loss: 0.33957834765036443
Epoch: 67, step: 814, loss: 0.34676381945610046, mean loss: 0.3395784212999222
Epoch: 67, step: 815, loss: 0.3355564475059509, mean loss: 0.33957838007596874
Epoch: 67, step: 816, loss: 0.3291459083557129, mean loss: 0.3395782731475444
Epoch: 67, step: 817, loss: 0.38016730546951294, mean loss: 0.3395786891637009
Epoch: 67, step: 818, loss: 0.3260795772075653, mean loss: 0.3395785508063469
Epoch: 67, step: 819, loss: 0.3148353397846222, mean loss: 0.33957829720669314
Epoch: 67, step: 820, loss: 0.3390108644962311, mean loss: 0.3395782913909862
Epoch: 67, step: 821, loss: 0.3186277747154236, mean loss: 0.3395780766680522
Epoch: 67, step: 822, loss: 0.32909727096557617, mean loss: 0.33957796925083084
Epoch: 67, step: 823, loss: 0.3540944755077362, mean loss: 0.33957811802820814
Epoch: 67, step: 824, loss: 0.31445077061653137, mean loss: 0.33957786050463695
Epoch: 67, step: 825, loss: 0.34870854020118713, mean loss: 0.3395779540816113
Epoch: 67, step: 826, loss: 0.3571650981903076, mean loss: 0.3395781343239286
Epoch: 67, step: 827, loss: 0.2965537905693054, mean loss: 0.3395776933923086
Epoch: 67, step: 828, loss: 0.3336649239063263, mean loss: 0.33957763279637426
Epoch: 67, step: 829, loss: 0.3488837778568268, mean loss: 0.3395777281677188
Epoch: 67, step: 830, loss: 0.31688663363456726, mean loss: 0.33957749562696177
Epoch: 67, step: 831, loss: 0.3118150234222412, mean loss: 0.3395772111171011
Epoch: 67, step: 832, loss: 0.357269287109375, mean loss: 0.33957739242366686
Epoch: 67, step: 833, loss: 0.3424797058105469, mean loss: 0.3395774221659696
Epoch: 67, step: 834, loss: 0.3303280174732208, mean loss: 0.3395773273809692
Epoch: 67, step: 835, loss: 0.3489457368850708, mean loss: 0.33957742338450975
Epoch: 67, step: 836, loss: 0.31531840562820435, mean loss: 0.33957717479079397
Epoch: 67, step: 837, loss: 0.3639216721057892, mean loss: 0.33957742425790316
Epoch: 67, step: 838, loss: 0.3577457666397095, mean loss: 0.3395776104337502
Epoch: 67, step: 839, loss: 0.3288015127182007, mean loss: 0.3395775000093362
Epoch: 67, step: 840, loss: 0.339480996131897, mean loss: 0.3395774990204555
Epoch: 67, step: 841, loss: 0.3340732157230377, mean loss: 0.3395774426183313
Epoch: 67, step: 842, loss: 0.3630099892616272, mean loss: 0.3395776827280406
Epoch: 67, step: 843, loss: 0.3226991295814514, mean loss: 0.33957750977786905
Epoch: 67, step: 844, loss: 0.30883312225341797, mean loss: 0.3395771947513044
Epoch: 67, step: 845, loss: 0.314279168844223, mean loss: 0.3395769355342838
Epoch: 67, step: 846, loss: 0.33924752473831177, mean loss: 0.33957693215900026
Epoch: 67, step: 847, loss: 0.3328673839569092, mean loss: 0.3395768634108118
Epoch: 67, step: 848, loss: 0.3101397454738617, mean loss: 0.3395765617917258
Epoch: 67, step: 849, loss: 0.311076819896698, mean loss: 0.33957626978018973
Epoch: 67, step: 850, loss: 0.3647899925708771, mean loss: 0.3395765281201603
Epoch: 67, step: 851, loss: 0.3590496778488159, mean loss: 0.339576727640137
Epoch: 67, step: 852, loss: 0.3419307470321655, mean loss: 0.33957675175894103
Epoch: 67, step: 853, loss: 0.3093816041946411, mean loss: 0.33957644238876866
Epoch: 67, step: 854, loss: 0.3269750475883484, mean loss: 0.33957631328008553
Epoch: 67, step: 855, loss: 0.35311853885650635, mean loss: 0.33957645202671044
Epoch: 67, step: 856, loss: 0.32026901841163635, mean loss: 0.3395762542147785
Epoch: 67, step: 857, loss: 0.33938613533973694, mean loss: 0.3395762522669589
Epoch: 67, step: 858, loss: 0.326080322265625, mean loss: 0.33957611399890436
Epoch: 67, step: 859, loss: 0.29864785075187683, mean loss: 0.33957569468631477
Epoch: 67, step: 860, loss: 0.3278070092201233, mean loss: 0.33957557411663913
Epoch: 67, step: 861, loss: 0.32935237884521484, mean loss: 0.339575469381517
Epoch: 67, step: 862, loss: 0.32089143991470337, mean loss: 0.33957527796836207
Epoch: 67, step: 863, loss: 0.3256666362285614, mean loss: 0.339575135479306
Epoch: 67, step: 864, loss: 0.3096397817134857, mean loss: 0.33957482880546375
Epoch: 67, step: 865, loss: 0.31223902106285095, mean loss: 0.33957454876563603
Epoch: 67, step: 866, loss: 0.31166890263557434, mean loss: 0.33957426289106624
Epoch: 67, step: 867, loss: 0.32879766821861267, mean loss: 0.3395741524932352
Epoch: 67, step: 868, loss: 0.311504989862442, mean loss: 0.33957386494944025
Epoch: 67, step: 869, loss: 0.3436731994152069, mean loss: 0.33957390694307327
Epoch: 67, step: 870, loss: 0.29656901955604553, mean loss: 0.3395734664049876
Epoch: 67, step: 871, loss: 0.3264063894748688, mean loss: 0.339573331524052
Epoch: 67, step: 872, loss: 0.39996182918548584, mean loss: 0.33957395012555847
Epoch: 67, step: 873, loss: 0.3349321782588959, mean loss: 0.3395739025771384
Epoch: 67, step: 874, loss: 0.3453771471977234, mean loss: 0.33957396202260326
Epoch: 67, step: 875, loss: 0.388500452041626, mean loss: 0.3395744631953683
Epoch: 67, step: 876, loss: 0.35342368483543396, mean loss: 0.3395746050567936
Epoch: 67, step: 877, loss: 0.3213130831718445, mean loss: 0.3395744180008671
Epoch: 67, step: 878, loss: 0.3307972252368927, mean loss: 0.3395743280954847
Epoch: 67, step: 879, loss: 0.4029497504234314, mean loss: 0.33957497724759605
Epoch: 67, step: 880, loss: 0.3821975588798523, mean loss: 0.33957541382465445
Epoch: 67, step: 881, loss: 0.31543055176734924, mean loss: 0.3395751665147901
Epoch: 67, step: 882, loss: 0.3309222459793091, mean loss: 0.3395750778859679
Epoch: 67, step: 883, loss: 0.3563809096813202, mean loss: 0.33957525002042993
Epoch: 67, step: 884, loss: 0.30822065472602844, mean loss: 0.3395749288729153
Epoch: 67, step: 885, loss: 0.32025623321533203, mean loss: 0.3395747310043894
Epoch: 67, step: 886, loss: 0.32929491996765137, mean loss: 0.33957462571621366
Epoch: 67, step: 887, loss: 0.3103187382221222, mean loss: 0.33957432607379184
Epoch: 67, step: 888, loss: 0.3427843749523163, mean loss: 0.33957435895117316
Epoch: 67, step: 889, loss: 0.32409289479255676, mean loss: 0.3395742003913485
Epoch: 67, step: 890, loss: 0.3668046295642853, mean loss: 0.3395744792802062
Epoch: 67, step: 891, loss: 0.3126397728919983, mean loss: 0.3395742034229101
Epoch: 67, step: 892, loss: 0.3529980182647705, mean loss: 0.33957434090424315
Epoch: 67, step: 893, loss: 0.35100314021110535, mean loss: 0.3395744579522277
Epoch: 67, step: 894, loss: 0.32357537746429443, mean loss: 0.3395742940994119
Epoch: 67, step: 895, loss: 0.4240834414958954, mean loss: 0.33957515958164736
Epoch: 67, step: 896, loss: 0.35730403661727905, mean loss: 0.3395753411462644
Epoch: 67, step: 897, loss: 0.3221539855003357, mean loss: 0.3395751627328563
Epoch: 67, step: 898, loss: 0.3162863254547119, mean loss: 0.33957492423257185
Epoch: 67, step: 899, loss: 0.3487846851348877, mean loss: 0.3395750185484913
Epoch: 67, step: 900, loss: 0.3564409017562866, mean loss: 0.33957519126795804
Epoch: 67, step: 901, loss: 0.3180059492588043, mean loss: 0.33957497038478335
Epoch: 67, step: 902, loss: 0.3253008723258972, mean loss: 0.3395748242101609
Epoch: 67, step: 903, loss: 0.31640109419822693, mean loss: 0.33957458690083786
Epoch: 67, step: 904, loss: 0.3284724950790405, mean loss: 0.33957447321163403
Epoch: 67, step: 905, loss: 0.3293699622154236, mean loss: 0.3395743687150338
Epoch: 67, step: 906, loss: 0.30818110704421997, mean loss: 0.3395740472439195
Epoch: 67, step: 907, loss: 0.3346201777458191, mean loss: 0.339573996516166
Epoch: 67, step: 908, loss: 0.28478118777275085, mean loss: 0.3395734354421135
Epoch: 67, step: 909, loss: 0.3326740860939026, mean loss: 0.33957336479404215
Epoch: 67, step: 910, loss: 0.3176470696926117, mean loss: 0.33957314027510277
Epoch: 67, step: 911, loss: 0.30567631125450134, mean loss: 0.33957279318490186
Epoch: 67, step: 912, loss: 0.3419255316257477, mean loss: 0.3395728172757717
Epoch: 67, step: 913, loss: 0.33369046449661255, mean loss: 0.3395727570440257
Epoch: 67, step: 914, loss: 0.3122590482234955, mean loss: 0.33957247737097834
Epoch: 67, step: 915, loss: 0.3220071494579315, mean loss: 0.3395722975162938
Epoch: 67, step: 916, loss: 0.3714362680912018, mean loss: 0.3395726237741198
Epoch: 67, step: 917, loss: 0.3885565400123596, mean loss: 0.3395731253193478
Epoch: 67, step: 918, loss: 0.31074485182762146, mean loss: 0.33957283015031947
Epoch: 67, step: 919, loss: 0.3236162066459656, mean loss: 0.3395726667741522
Epoch: 67, step: 920, loss: 0.3292575776576996, mean loss: 0.3395725611614285
Epoch: 67, step: 921, loss: 0.34794875979423523, mean loss: 0.3395726469216274
Epoch: 67, step: 922, loss: 0.30300816893577576, mean loss: 0.3395722725579167
Epoch: 67, step: 923, loss: 0.3311946988105774, mean loss: 0.3395721867853949
Epoch: 67, step: 924, loss: 0.2970145642757416, mean loss: 0.3395717510700743
Epoch: 67, step: 925, loss: 0.32144832611083984, mean loss: 0.33957156551992834
Epoch: 67, step: 926, loss: 0.30468323826789856, mean loss: 0.33957120833203736
Epoch: 67, step: 927, loss: 0.28575828671455383, mean loss: 0.33957065739914066
Epoch: 67, step: 928, loss: 0.3280656933784485, mean loss: 0.3395705396133362
Epoch: 67, step: 929, loss: 0.3411567211151123, mean loss: 0.33957055585221807
Epoch: 67, step: 930, loss: 0.3198850154876709, mean loss: 0.3395703543192339
Epoch: 67, step: 931, loss: 0.3261180520057678, mean loss: 0.3395702166011512
Epoch: 67, step: 932, loss: 0.33015376329421997, mean loss: 0.339570120201101
Epoch: 67, step: 933, loss: 0.30485352873802185, mean loss: 0.3395697647969174
Epoch: 67, step: 934, loss: 0.3962308168411255, mean loss: 0.339570344847203
Epoch: 67, step: 935, loss: 0.32821834087371826, mean loss: 0.33957022863570496
Epoch: 67, step: 936, loss: 0.3331381678581238, mean loss: 0.33957016279078733
Epoch: 67, step: 937, loss: 0.3238956928253174, mean loss: 0.3395700023330967
Epoch: 67, step: 938, loss: 0.3062064051628113, mean loss: 0.3395696607974044
Epoch: 67, step: 939, loss: 0.31658005714416504, mean loss: 0.3395694254603758
Epoch: 67, step: 940, loss: 0.3400135338306427, mean loss: 0.3395694300065209
Epoch: 67, step: 941, loss: 0.34411928057670593, mean loss: 0.33956947658089465
Epoch: 67, step: 942, loss: 0.30909377336502075, mean loss: 0.33956916462070164
Epoch: 67, step: 943, loss: 0.3949914872646332, mean loss: 0.33956973193760215
Epoch: 67, step: 944, loss: 0.3084615170955658, mean loss: 0.3395694135093131
Epoch: 67, step: 945, loss: 0.3359605371952057, mean loss: 0.3395693765686994
Epoch: 67, step: 946, loss: 0.3073534667491913, mean loss: 0.33956904680863165
Epoch: 67, step: 947, loss: 0.326579213142395, mean loss: 0.33956891384685567
Epoch: 67, step: 948, loss: 0.34333154559135437, mean loss: 0.3395689523601339
Epoch: 67, step: 949, loss: 0.3273589313030243, mean loss: 0.3395688273829485
Epoch: 67, step: 950, loss: 0.3274461627006531, mean loss: 0.3395687033011802
Epoch: 67, step: 951, loss: 0.29923850297927856, mean loss: 0.33956829050486165
Epoch: 67, step: 952, loss: 0.33031466603279114, mean loss: 0.33956819579114866
Epoch: 67, step: 953, loss: 0.3260440230369568, mean loss: 0.3395680573684679
Epoch: 67, step: 954, loss: 0.3501664996147156, mean loss: 0.3395681658445868
Epoch: 67, step: 955, loss: 0.31055864691734314, mean loss: 0.33956786893229124
Epoch: 67, step: 956, loss: 0.30280202627182007, mean loss: 0.33956749263790853
Epoch: 67, step: 957, loss: 0.31839290261268616, mean loss: 0.33956727592051117
Epoch: 67, step: 958, loss: 0.31396812200546265, mean loss: 0.3395670139213308
Epoch: 67, step: 959, loss: 0.3077700138092041, mean loss: 0.33956668849250093
Epoch: 67, step: 960, loss: 0.3397665023803711, mean loss: 0.3395666905374905
Epoch: 67, step: 961, loss: 0.32269367575645447, mean loss: 0.33956651785286474
Epoch: 67, step: 962, loss: 0.3177127242088318, mean loss: 0.3395662941954091
Epoch: 67, step: 963, loss: 0.34899768233299255, mean loss: 0.339566390717721
Epoch: 67, step: 964, loss: 0.3246884346008301, mean loss: 0.3395662384559327
Epoch: 67, step: 965, loss: 0.32847651839256287, mean loss: 0.33956612496431365
Epoch: 67, step: 966, loss: 0.35750463604927063, mean loss: 0.3395663085442255
Epoch: 67, step: 967, loss: 0.3050728142261505, mean loss: 0.3395659555468216
Epoch: 67, step: 968, loss: 0.30908507108688354, mean loss: 0.3395656436166103
Epoch: 67, step: 969, loss: 0.3368366062641144, mean loss: 0.339565615688927
Epoch: 67, step: 970, loss: 0.32881104946136475, mean loss: 0.33956550563288646
Epoch: 67, step: 971, loss: 0.32930031418800354, mean loss: 0.33956540058590073
Epoch: 67, step: 972, loss: 0.312800794839859, mean loss: 0.3395651266979366
Epoch: 67, step: 973, loss: 0.3297497630119324, mean loss: 0.33956502625623786
Epoch: 67, step: 974, loss: 0.2947797477245331, mean loss: 0.3395645679682347
Epoch: 67, step: 975, loss: 0.2977205812931061, mean loss: 0.33956413978286903
Epoch: 67, step: 976, loss: 0.3428102433681488, mean loss: 0.3395641729995852
Epoch: 67, step: 977, loss: 0.3253203332424164, mean loss: 0.33956402724676854
Epoch: 67, step: 978, loss: 0.2947459816932678, mean loss: 0.33956356864223186
Epoch: 67, step: 979, loss: 0.3063933849334717, mean loss: 0.3395632292289244
Epoch: 67, step: 980, loss: 0.31868574023246765, mean loss: 0.3395630156025802
Epoch: 67, step: 981, loss: 0.3107021450996399, mean loss: 0.33956272029028606
Epoch: 67, step: 982, loss: 0.32170525193214417, mean loss: 0.33956253756967175
Epoch: 67, step: 983, loss: 0.31910863518714905, mean loss: 0.33956232828405003
Epoch: 67, step: 984, loss: 0.3504689037799835, mean loss: 0.3395624398796779
Epoch: 67, step: 985, loss: 0.34855374693870544, mean loss: 0.33956253187741725
Epoch: 67, step: 986, loss: 0.321125864982605, mean loss: 0.339562343238067
Epoch: 67, step: 987, loss: 0.3562564551830292, mean loss: 0.3395625140462845
Epoch: 67, step: 988, loss: 0.2993207275867462, mean loss: 0.339562102310847
Epoch: 67, step: 989, loss: 0.46386784315109253, mean loss: 0.33956337413696214
Epoch: 67, step: 990, loss: 0.3191109299659729, mean loss: 0.33956316488124877
Epoch: 67, step: 991, loss: 0.3354516327381134, mean loss: 0.33956312281523543
Epoch: 67, step: 992, loss: 0.3371499180793762, mean loss: 0.3395630981254457
Epoch: 67, step: 993, loss: 0.3210445046424866, mean loss: 0.33956290866141303
Epoch: 67, step: 994, loss: 0.30563461780548096, mean loss: 0.33956256154406594
Epoch: 67, step: 995, loss: 0.3332984745502472, mean loss: 0.33956249745740086
Epoch: 67, step: 996, loss: 0.364987850189209, mean loss: 0.33956275757661647
Epoch: 67, step: 997, loss: 0.3219951391220093, mean loss: 0.33956257784938
Epoch: 67, step: 998, loss: 0.34626489877700806, mean loss: 0.3395626464174274
Epoch: 67, step: 999, loss: 0.3311540186405182, mean loss: 0.33956256039389976
Epoch: 67, step: 1000, loss: 0.3644036054611206, mean loss: 0.33956281452483783
Epoch: 67, step: 1001, loss: 0.340724378824234, mean loss: 0.3395628264078486
Epoch: 67, step: 1002, loss: 0.3568912744522095, mean loss: 0.3395630036791608
Epoch: 67, step: 1003, loss: 0.33483850955963135, mean loss: 0.339562955347729
Epoch: 67, step: 1004, loss: 0.32744887471199036, mean loss: 0.3395628314223187
Epoch: 67, step: 1005, loss: 0.340160995721817, mean loss: 0.33956283754139616
Epoch: 67, step: 1006, loss: 0.34418973326683044, mean loss: 0.3395628848729467
Epoch: 67, step: 1007, loss: 0.37959498167037964, mean loss: 0.33956329438332766
Epoch: 67, step: 1008, loss: 0.3166310489177704, mean loss: 0.3395630597991499
Epoch: 67, step: 1009, loss: 0.32306748628616333, mean loss: 0.33956289106028953
Epoch: 67, step: 1010, loss: 0.3468617796897888, mean loss: 0.33956296572235267
Epoch: 67, step: 1011, loss: 0.32856419682502747, mean loss: 0.33956285321448754
Epoch: 67, step: 1012, loss: 0.3391043245792389, mean loss: 0.33956284852418533
Epoch: 67, step: 1013, loss: 0.3310488760471344, mean loss: 0.33956276143541386
Epoch: 67, step: 1014, loss: 0.3050188422203064, mean loss: 0.33956240809192795
Epoch: 67, step: 1015, loss: 0.356284499168396, mean loss: 0.33956257913741583
Epoch: 67, step: 1016, loss: 0.30991843342781067, mean loss: 0.33956227591902777
Epoch: 67, step: 1017, loss: 0.31858184933662415, mean loss: 0.3395620613206338
Epoch: 67, step: 1018, loss: 0.3263879418373108, mean loss: 0.3395619265704678
Epoch: 67, step: 1019, loss: 0.309969425201416, mean loss: 0.3395616238896175
Epoch: 67, step: 1020, loss: 0.343765527009964, mean loss: 0.3395616668879413
Epoch: 67, step: 1021, loss: 0.2962256669998169, mean loss: 0.3395612236435935
Epoch: 67, step: 1022, loss: 0.32305923104286194, mean loss: 0.33956105486151494
Epoch: 67, step: 1023, loss: 0.29519155621528625, mean loss: 0.3395606010557357
Epoch: 67, step: 1024, loss: 0.3134162127971649, mean loss: 0.3395603336568806
Epoch: 67, step: 1025, loss: 0.3144838511943817, mean loss: 0.3395600771829462
Epoch: 67, step: 1026, loss: 0.31774815917015076, mean loss: 0.33955985410017436
Epoch: 67, step: 1027, loss: 0.3584897220134735, mean loss: 0.3395600477046163
Epoch: 67, step: 1028, loss: 0.35242345929145813, mean loss: 0.3395601792632813
Epoch: 67, step: 1029, loss: 0.3534417748451233, mean loss: 0.33956032123382257
Epoch: 67, step: 1030, loss: 0.3430633842945099, mean loss: 0.339560357060156
Epoch: 67, step: 1031, loss: 0.3167160153388977, mean loss: 0.33956012343015274
Epoch: 67, step: 1032, loss: 0.33257123827934265, mean loss: 0.33956005195527367
Epoch: 67, step: 1033, loss: 0.32177770137786865, mean loss: 0.3395598700981775
Epoch: 67, step: 1034, loss: 0.3052380084991455, mean loss: 0.339559519097885
Epoch: 67, step: 1035, loss: 0.2968429625034332, mean loss: 0.33955908225181003
Epoch: 67, step: 1036, loss: 0.31114625930786133, mean loss: 0.33955879168758296
Epoch: 67, step: 1037, loss: 0.3952281177043915, mean loss: 0.33955936098508993
Epoch: 67, step: 1038, loss: 0.2881680428981781, mean loss: 0.33955883544163235
Epoch: 67, step: 1039, loss: 0.3480187654495239, mean loss: 0.33955892195459925
Epoch: 67, step: 1040, loss: 0.34357750415802, mean loss: 0.3395589630490189
Epoch: 67, step: 1041, loss: 0.3993415832519531, mean loss: 0.33955957438576295
Epoch: 67, step: 1042, loss: 0.3271366357803345, mean loss: 0.3395594473501604
Epoch: 67, step: 1043, loss: 0.4253079891204834, mean loss: 0.3395603241963418
Epoch: 67, step: 1044, loss: 0.314165323972702, mean loss: 0.33956006451517623
Epoch: 67, step: 1045, loss: 0.30046772956848145, mean loss: 0.33955966477352595
Epoch: 67, step: 1046, loss: 0.32521960139274597, mean loss: 0.3395595181396144
Epoch: 67, step: 1047, loss: 0.3223477303981781, mean loss: 0.33955934214276645
Epoch: 67, step: 1048, loss: 0.3451531231403351, mean loss: 0.3395593993406457
Epoch: 67, step: 1049, loss: 0.34029290080070496, mean loss: 0.33955940684081404
Epoch: 67, step: 1050, loss: 0.35175782442092896, mean loss: 0.3395595315702855
Epoch: 67, step: 1051, loss: 0.3397674858570099, mean loss: 0.33955953369660746
Epoch: 67, step: 1052, loss: 0.3163538873195648, mean loss: 0.3395592964224858
Epoch: 67, step: 1053, loss: 0.30321747064590454, mean loss: 0.3395589248367741
Epoch: 67, step: 1054, loss: 0.333757609128952, mean loss: 0.33955886552043707
Epoch: 67, step: 1055, loss: 0.31627246737480164, mean loss: 0.33955862742794446
Epoch: 67, step: 1056, loss: 0.3180227279663086, mean loss: 0.3395584072357308
Epoch: 67, step: 1057, loss: 0.3456639349460602, mean loss: 0.3395584696606097
Epoch: 67, step: 1058, loss: 0.3199159801006317, mean loss: 0.33955826883153245
Epoch: 67, step: 1059, loss: 0.29761379957199097, mean loss: 0.33955783998655803
Epoch: 67, step: 1060, loss: 0.29773908853530884, mean loss: 0.339557412431308
Epoch: 67, step: 1061, loss: 0.31802529096603394, mean loss: 0.3395571922889763
Epoch: 67, step: 1062, loss: 0.3229222595691681, mean loss: 0.3395570222167685
Epoch: 67, step: 1063, loss: 0.37627413868904114, mean loss: 0.3395573976013478
Epoch: 67, step: 1064, loss: 0.374414324760437, mean loss: 0.3395577539642766
Epoch: 67, step: 1065, loss: 0.33779436349868774, mean loss: 0.33955773593627997
Epoch: 67, step: 1066, loss: 0.3443286716938019, mean loss: 0.3395577847113733
Epoch: 67, step: 1067, loss: 0.34490957856178284, mean loss: 0.33955783942424084
Epoch: 67, step: 1068, loss: 0.3105204105377197, mean loss: 0.3395575425696155
Epoch: 67, step: 1069, loss: 0.32657748460769653, mean loss: 0.33955740987360905
Epoch: 67, step: 1070, loss: 0.3104793131351471, mean loss: 0.33955711260930727
Epoch: 67, step: 1071, loss: 0.3184399902820587, mean loss: 0.33955689673195777
Epoch: 67, step: 1072, loss: 0.3208952248096466, mean loss: 0.33955670595828014
Epoch: 67, step: 1073, loss: 0.3576483130455017, mean loss: 0.3395568909024347
Epoch: 67, step: 1074, loss: 0.3359093964099884, mean loss: 0.3395568536157588
Epoch: 67, step: 1075, loss: 0.33467915654182434, mean loss: 0.33955680375379166
Epoch: 67, step: 1076, loss: 0.3084064722061157, mean loss: 0.33955648532464217
Epoch: 67, step: 1077, loss: 0.29517555236816406, mean loss: 0.3395560316524798
Epoch: 67, step: 1078, loss: 0.3080722987651825, mean loss: 0.3395557098217696
Epoch: 67, step: 1079, loss: 0.3374508023262024, mean loss: 0.33955568830535815
Epoch: 67, step: 1080, loss: 0.3755289912223816, mean loss: 0.33955605602150485
Epoch: 67, step: 1081, loss: 0.3570212125778198, mean loss: 0.3395562345470753
Epoch: 67, step: 1082, loss: 0.334689736366272, mean loss: 0.3395561848031477
Epoch: 67, step: 1083, loss: 0.3261953294277191, mean loss: 0.33955604823376984
Epoch: 67, step: 1084, loss: 0.35306814312934875, mean loss: 0.3395561863476465
Epoch: 67, step: 1085, loss: 0.3212619125843048, mean loss: 0.33955599935464037
Epoch: 67, step: 1086, loss: 0.3184641897678375, mean loss: 0.33955578376911794
Epoch: 67, step: 1087, loss: 0.2939208447933197, mean loss: 0.3395553173258969
Epoch: 67, step: 1088, loss: 0.31893572211265564, mean loss: 0.3395551065713233
Epoch: 67, step: 1089, loss: 0.34704864025115967, mean loss: 0.3395551831625627
Epoch: 67, step: 1090, loss: 0.33903297781944275, mean loss: 0.3395551778251682
Epoch: 67, step: 1091, loss: 0.32440119981765747, mean loss: 0.33955502293986556
Epoch: 67, step: 1092, loss: 0.3534103333950043, mean loss: 0.33955516455034024
Epoch: 67, step: 1093, loss: 0.33809608221054077, mean loss: 0.3395551496377021
Epoch: 67, step: 1094, loss: 0.35643401741981506, mean loss: 0.3395553221474144
Epoch: 67, step: 1095, loss: 0.32715269923210144, mean loss: 0.33955519538825785
Epoch: 67, step: 1096, loss: 0.34571608901023865, mean loss: 0.33955525835410816
Epoch: 67, step: 1097, loss: 0.35845598578453064, mean loss: 0.33955545152222366
Epoch: 67, step: 1098, loss: 0.32563358545303345, mean loss: 0.3395553092402317
Epoch: 67, step: 1099, loss: 0.34749916195869446, mean loss: 0.3395553904258739
Epoch: 67, step: 1100, loss: 0.32512179017066956, mean loss: 0.3395552429169545
Epoch: 67, step: 1101, loss: 0.3551165461540222, mean loss: 0.3395554019491797
Epoch: 67, step: 1102, loss: 0.3271891474723816, mean loss: 0.33955527557076276
Epoch: 67, step: 1103, loss: 0.35457196831703186, mean loss: 0.3395554290340823
Epoch: 67, step: 1104, loss: 0.32297182083129883, mean loss: 0.3395552595593784
Epoch: 67, step: 1105, loss: 0.321254700422287, mean loss: 0.3395550725403588
Epoch: 67, step: 1106, loss: 0.30186697840690613, mean loss: 0.3395546873981164
Epoch: 67, step: 1107, loss: 0.35322773456573486, mean loss: 0.33955482712431784
Epoch: 67, step: 1108, loss: 0.32581377029418945, mean loss: 0.339554686704554
Epoch: 67, step: 1109, loss: 0.3400512635707855, mean loss: 0.3395546917790177
Epoch: 67, step: 1110, loss: 0.34815463423728943, mean loss: 0.33955477965997355
Epoch: 67, step: 1111, loss: 0.332522988319397, mean loss: 0.3395547078043498
Epoch: 67, step: 1112, loss: 0.3402676284313202, mean loss: 0.33955471508938295
Epoch: 67, step: 1113, loss: 0.3029603660106659, mean loss: 0.3395543411510915
Epoch: 67, step: 1114, loss: 0.33039551973342896, mean loss: 0.33955424756289765
Epoch: 67, step: 1115, loss: 0.3564264178276062, mean loss: 0.33955441996715524
Epoch: 67, step: 1116, loss: 0.32489851117134094, mean loss: 0.33955427021076845
Epoch: 67, step: 1117, loss: 0.303625226020813, mean loss: 0.33955390308588146
Epoch: 67, step: 1118, loss: 0.35243791341781616, mean loss: 0.33955403473404
Epoch: 67, step: 1119, loss: 0.314816415309906, mean loss: 0.3395537819688928
Epoch: 67, step: 1120, loss: 0.30528560280799866, mean loss: 0.3395534318255465
Epoch: 67, step: 1121, loss: 0.29969727993011475, mean loss: 0.33955302458990844
Epoch: 67, step: 1122, loss: 0.3276146948337555, mean loss: 0.3395529026096512
Epoch: 67, step: 1123, loss: 0.3383099138736725, mean loss: 0.3395528899095047
Epoch: 67, step: 1124, loss: 0.34604716300964355, mean loss: 0.33955295626358706
Epoch: 67, step: 1125, loss: 0.3697081506252289, mean loss: 0.33955326436578337
Epoch: 67, step: 1126, loss: 0.33107519149780273, mean loss: 0.33955317774434923
Epoch: 67, step: 1127, loss: 0.39334383606910706, mean loss: 0.33955372732400435
Epoch: 67, step: 1128, loss: 0.3366861045360565, mean loss: 0.33955369802577506
Epoch: 67, step: 1129, loss: 0.31841787695884705, mean loss: 0.33955348208530767
Epoch: 67, step: 1130, loss: 0.329563170671463, mean loss: 0.33955338001733176
Epoch: 67, step: 1131, loss: 0.3259222209453583, mean loss: 0.33955324075334453
Epoch: 67, step: 1132, loss: 0.3008873164653778, mean loss: 0.3395528457234175
Epoch: 67, step: 1133, loss: 0.36018070578575134, mean loss: 0.3395530564655362
Epoch: 67, step: 1134, loss: 0.3817838430404663, mean loss: 0.3395534879070181
Epoch: 67, step: 1135, loss: 0.31808868050575256, mean loss: 0.3395532686188055
Epoch: 67, step: 1136, loss: 0.32883358001708984, mean loss: 0.3395531591057177
Epoch: 67, step: 1137, loss: 0.354488730430603, mean loss: 0.33955331168699926
Epoch: 67, step: 1138, loss: 0.35074302554130554, mean loss: 0.3395534259995623
Epoch: 67, step: 1139, loss: 0.31999635696411133, mean loss: 0.3395532262093016
Epoch: 67, step: 1140, loss: 0.35169169306755066, mean loss: 0.33955335021166
Epoch: 67, step: 1141, loss: 0.32520195841789246, mean loss: 0.33955320360432734
Epoch: 67, step: 1142, loss: 0.283648282289505, mean loss: 0.33955263251075063
Epoch: 67, step: 1143, loss: 0.31100696325302124, mean loss: 0.3395523409070521
Epoch: 67, step: 1144, loss: 0.37002748250961304, mean loss: 0.3395526522177853
Epoch: 67, step: 1145, loss: 0.28844475746154785, mean loss: 0.339552130143963
Epoch: 67, step: 1146, loss: 0.35449299216270447, mean loss: 0.33955228276526156
Epoch: 67, step: 1147, loss: 0.321744441986084, mean loss: 0.3395521008595578
Epoch: 67, step: 1148, loss: 0.3226017951965332, mean loss: 0.3395519277152769
Epoch: 67, step: 1149, loss: 0.3406387269496918, mean loss: 0.3395519388166195
Epoch: 67, step: 1150, loss: 0.31833043694496155, mean loss: 0.3395517220472769
Epoch: 67, step: 1151, loss: 0.32735466957092285, mean loss: 0.33955159746042834
Epoch: 67, step: 1152, loss: 0.33971038460731506, mean loss: 0.33955159908234384
Epoch: 67, step: 1153, loss: 0.3155834376811981, mean loss: 0.33955135426445043
Epoch: 67, step: 1154, loss: 0.36703428626060486, mean loss: 0.3395516349803835
Epoch: 67, step: 1155, loss: 0.31391027569770813, mean loss: 0.3395513730773021
Epoch: 67, step: 1156, loss: 0.3174063265323639, mean loss: 0.33955114688817445
Epoch: 67, step: 1157, loss: 0.3430761992931366, mean loss: 0.3395511828926318
Epoch: 67, step: 1158, loss: 0.33747756481170654, mean loss: 0.33955116171316474
Epoch: 67, step: 1159, loss: 0.34731826186180115, mean loss: 0.33955124104376233
Epoch: 67, step: 1160, loss: 0.31842556595802307, mean loss: 0.3395510252752928
Epoch: 67, step: 1161, loss: 0.35292983055114746, mean loss: 0.33955116191920326
Epoch: 67, step: 1162, loss: 0.324660062789917, mean loss: 0.3395510098310913
Epoch: 67, step: 1163, loss: 0.29189106822013855, mean loss: 0.33955052306806316
Epoch: 67, step: 1164, loss: 0.3739425241947174, mean loss: 0.3395508743186747
Epoch: 67, step: 1165, loss: 0.3070564866065979, mean loss: 0.33955054245206
Epoch: 67, step: 1166, loss: 0.3416672348976135, mean loss: 0.3395505640697125
Epoch: 67, step: 1167, loss: 0.3466707468032837, mean loss: 0.33955063678696745
Epoch: 67, step: 1168, loss: 0.31323716044425964, mean loss: 0.3395503680545069
Epoch: 67, step: 1169, loss: 0.3489760160446167, mean loss: 0.339550464315133
Epoch: 67, step: 1170, loss: 0.32647430896759033, mean loss: 0.33955033077460106
Epoch: 67, step: 1171, loss: 0.3362458646297455, mean loss: 0.33955029702801054
Epoch: 67, step: 1172, loss: 0.3400006890296936, mean loss: 0.33955030162755506
Epoch: 67, step: 1173, loss: 0.31410911679267883, mean loss: 0.33955004181684006
Epoch: 67, step: 1174, loss: 0.3454960584640503, mean loss: 0.33955010253818896
Epoch: 67, step: 1175, loss: 0.3831193149089813, mean loss: 0.3395505474670355
Epoch: 67, step: 1176, loss: 0.3780843913555145, mean loss: 0.3395509409706749
Epoch: 67, step: 1177, loss: 0.319441020488739, mean loss: 0.3395507356123382
Epoch: 67, step: 1178, loss: 0.3250330090522766, mean loss: 0.33955058736183974
Epoch: 67, step: 1179, loss: 0.306320458650589, mean loss: 0.3395502480295884
Epoch: 67, step: 1180, loss: 0.32668018341064453, mean loss: 0.3395501166071842
Epoch: 67, step: 1181, loss: 0.313663125038147, mean loss: 0.33954985226539347
Epoch: 67, step: 1182, loss: 0.33090952038764954, mean loss: 0.3395497640366214
Epoch: 67, step: 1183, loss: 0.3392426371574402, mean loss: 0.3395497609004976
Epoch: 67, step: 1184, loss: 0.3885246813297272, mean loss: 0.3395502609864791
Epoch: 67, step: 1185, loss: 0.33446580171585083, mean loss: 0.339550209069277
Epoch: 67, step: 1186, loss: 0.32887929677963257, mean loss: 0.33955010011014813
Epoch: 67, step: 1187, loss: 0.332322359085083, mean loss: 0.3395500263094923
Epoch: 67, step: 1188, loss: 0.3432498574256897, mean loss: 0.3395500640871567
Epoch: 67, step: 1189, loss: 0.3157743811607361, mean loss: 0.33954982132456274
Epoch: 67, step: 1190, loss: 0.36171507835388184, mean loss: 0.33955004764152563
Epoch: 67, step: 1191, loss: 0.37664279341697693, mean loss: 0.33955042637080657
Epoch: 67, step: 1192, loss: 0.3491514325141907, mean loss: 0.33955052439927413
Epoch: 67, step: 1193, loss: 0.3279281258583069, mean loss: 0.33955040573313966
Epoch: 67, step: 1194, loss: 0.31331607699394226, mean loss: 0.33955013788011557
Epoch: 67, step: 1195, loss: 0.3451182246208191, mean loss: 0.33955019472981274
Epoch: 67, step: 1196, loss: 0.39851418137550354, mean loss: 0.3395507967410093
Epoch: 67, step: 1197, loss: 0.402664452791214, mean loss: 0.33955144111296987
Epoch: 67, step: 1198, loss: 0.3012028634548187, mean loss: 0.3395510495892105
Epoch: 67, step: 1199, loss: 0.3172963857650757, mean loss: 0.33955082238024425
Epoch: 67, step: 1200, loss: 0.3262854814529419, mean loss: 0.3395506869491431
Epoch: 67, step: 1201, loss: 0.3376520574092865, mean loss: 0.33955066756548263
Epoch: 67, step: 1202, loss: 0.3480027914047241, mean loss: 0.3395507538547889
Epoch: 67, step: 1203, loss: 0.29622387886047363, mean loss: 0.3395503115271693
Epoch: 67, step: 1204, loss: 0.30691322684288025, mean loss: 0.3395499783358971
Epoch: 67, step: 1205, loss: 0.34070348739624023, mean loss: 0.33954999011192527
Epoch: 67, step: 1206, loss: 0.3198283016681671, mean loss: 0.3395497887777571
Epoch: 67, step: 1207, loss: 0.370015025138855, mean loss: 0.3395500997871528
Epoch: 67, step: 1208, loss: 0.3179263472557068, mean loss: 0.3395498790397582
Epoch: 67, step: 1209, loss: 0.368192583322525, mean loss: 0.3395501714375642
Epoch: 67, step: 1210, loss: 0.32183122634887695, mean loss: 0.3395499905563273
Epoch: 67, step: 1211, loss: 0.3357725441455841, mean loss: 0.33954995199521654
Epoch: 67, step: 1212, loss: 0.3553079664707184, mean loss: 0.33955011285529835
Epoch: 67, step: 1213, loss: 0.3254299461841583, mean loss: 0.33954996871607424
Epoch: 67, step: 1214, loss: 0.3494439125061035, mean loss: 0.33955006971281576
Epoch: 67, step: 1215, loss: 0.4104548990726471, mean loss: 0.3395507934973627
Epoch: 67, step: 1216, loss: 0.30388838052749634, mean loss: 0.33955042946517805
Epoch: 67, step: 1217, loss: 0.3226330876350403, mean loss: 0.3395502567793296
Epoch: 67, step: 1218, loss: 0.3357485830783844, mean loss: 0.3395502179736736
Epoch: 67, step: 1219, loss: 0.3471512496471405, mean loss: 0.33955029556055577
Epoch: 67, step: 1220, loss: 0.309455931186676, mean loss: 0.339549988378035
Epoch: 67, step: 1221, loss: 0.3180558979511261, mean loss: 0.33954976898342004
Epoch: 67, step: 1222, loss: 0.3278215229511261, mean loss: 0.3395496492720153
Epoch: 67, step: 1223, loss: 0.32241490483283997, mean loss: 0.3395494743777145
Epoch: 67, step: 1224, loss: 0.3372439444065094, mean loss: 0.33954945084541505
Epoch: 67, step: 1225, loss: 0.3422712981700897, mean loss: 0.3395494786267379
Epoch: 67, step: 1226, loss: 0.3270891308784485, mean loss: 0.3395493514478887
Epoch: 67, step: 1227, loss: 0.3522176444530487, mean loss: 0.33954948074785
Epoch: 67, step: 1228, loss: 0.2985150218009949, mean loss: 0.3395490619305873
Epoch: 67, step: 1229, loss: 0.33158326148986816, mean loss: 0.3395489806286579
Epoch: 67, step: 1230, loss: 0.3257882297039032, mean loss: 0.33954884018273657
Epoch: 67, step: 1231, loss: 0.34351566433906555, mean loss: 0.3395488806687965
Epoch: 67, step: 1232, loss: 0.3395674526691437, mean loss: 0.33954888085834345
Epoch: 67, step: 1233, loss: 0.33341431617736816, mean loss: 0.33954881824924504
Epoch: 67, step: 1234, loss: 0.3311750590801239, mean loss: 0.339548732787898
Epoch: 67, step: 1235, loss: 0.31936585903167725, mean loss: 0.339548526806577
Epoch: 67, step: 1236, loss: 0.3309776484966278, mean loss: 0.3395484393352466
Epoch: 67, step: 1237, loss: 0.3190211057662964, mean loss: 0.33954822984273164
Epoch: 67, step: 1238, loss: 0.3021973669528961, mean loss: 0.33954784866091275
Epoch: 67, step: 1239, loss: 0.3502524793148041, mean loss: 0.33954795790521464
Epoch: 67, step: 1240, loss: 0.32781463861465454, mean loss: 0.33954783816402645
Epoch: 67, step: 1241, loss: 0.2920896112918854, mean loss: 0.3395473538469852
Epoch: 67, step: 1242, loss: 0.356555312871933, mean loss: 0.3395475274135273
Epoch: 67, step: 1243, loss: 0.33115318417549133, mean loss: 0.3395474417499707
Epoch: 67, step: 1244, loss: 0.318739652633667, mean loss: 0.33954722941042487
Epoch: 67, step: 1245, loss: 0.3406866192817688, mean loss: 0.339547241037564
Epoch: 67, step: 1246, loss: 0.33642905950546265, mean loss: 0.33954720921776166
Epoch: 67, step: 1247, loss: 0.3488258421421051, mean loss: 0.3395473039015541
Epoch: 67, step: 1248, loss: 0.3179164528846741, mean loss: 0.33954708317182747
Epoch: 67, step: 1249, loss: 0.3365558385848999, mean loss: 0.3395470526483006
Epoch: 67, step: 1250, loss: 0.3171427547931671, mean loss: 0.33954682403068354
Epoch: 67, step: 1251, loss: 0.29790198802948, mean loss: 0.3395463990833774
Epoch: 67, step: 1252, loss: 0.3183569014072418, mean loss: 0.3395461828662197
Epoch: 67, step: 1253, loss: 0.3307844400405884, mean loss: 0.3395460934625052
Epoch: 67, step: 1254, loss: 0.32285869121551514, mean loss: 0.3395459231881029
Epoch: 67, step: 1255, loss: 0.31067249178886414, mean loss: 0.33954562857327697
Epoch: 67, step: 1256, loss: 0.3858397901058197, mean loss: 0.3395461009385801
Epoch: 67, step: 1257, loss: 0.3244665861129761, mean loss: 0.33954594707540003
Epoch: 67, step: 1258, loss: 0.30134400725364685, mean loss: 0.33954555728752955
Epoch: 67, step: 1259, loss: 0.3475792109966278, mean loss: 0.33954563925689646
Epoch: 67, step: 1260, loss: 0.31928524374961853, mean loss: 0.33954543253715125
Epoch: 67, step: 1261, loss: 0.34620949625968933, mean loss: 0.33954550053086335
Epoch: 67, step: 1262, loss: 0.3330356776714325, mean loss: 0.3395454341115547
Epoch: 67, step: 1263, loss: 0.3116530179977417, mean loss: 0.33954514952991044
Epoch: 67, step: 1264, loss: 0.41688793897628784, mean loss: 0.33954593863737015
Epoch: 67, step: 1265, loss: 0.33390963077545166, mean loss: 0.33954588113223966
Epoch: 67, step: 1266, loss: 0.33182889223098755, mean loss: 0.3395458023995059
Epoch: 67, step: 1267, loss: 0.2977675199508667, mean loss: 0.3395453761600914
Epoch: 67, step: 1268, loss: 0.3245554566383362, mean loss: 0.3395452232282579
Epoch: 67, step: 1269, loss: 0.3231571912765503, mean loss: 0.3395450560341512
Epoch: 67, step: 1270, loss: 0.35748931765556335, mean loss: 0.3395452391033686
Epoch: 67, step: 1271, loss: 0.3472554087638855, mean loss: 0.33954531776251634
Epoch: 67, step: 1272, loss: 0.3035215139389038, mean loss: 0.3395449502514338
Epoch: 67, step: 1273, loss: 0.33552464842796326, mean loss: 0.3395449092371531
Epoch: 67, step: 1274, loss: 0.29864948987960815, mean loss: 0.33954449203487036
Epoch: 67, step: 1275, loss: 0.3293927311897278, mean loss: 0.3395443884708366
Epoch: 67, step: 1276, loss: 0.3356647193431854, mean loss: 0.33954434889247265
Epoch: 67, step: 1277, loss: 0.2848254442214966, mean loss: 0.33954379068439855
Epoch: 67, step: 1278, loss: 0.30632632970809937, mean loss: 0.3395434518240746
Epoch: 67, step: 1279, loss: 0.401510089635849, mean loss: 0.33954408395609614
Epoch: 67, step: 1280, loss: 0.33219748735427856, mean loss: 0.33954400901300175
Epoch: 67, step: 1281, loss: 0.3182569444179535, mean loss: 0.33954379186453093
Epoch: 67, step: 1282, loss: 0.34531107544898987, mean loss: 0.33954385069575355
Epoch: 67, step: 1283, loss: 0.3520425856113434, mean loss: 0.3395439781922334
Epoch: 67, step: 1284, loss: 0.33249714970588684, mean loss: 0.3395439063100255
Epoch: 67, step: 1285, loss: 0.3141453266143799, mean loss: 0.3395436472307296
Epoch: 67, step: 1286, loss: 0.30513033270835876, mean loss: 0.33954329619982715
Epoch: 67, step: 1287, loss: 0.30333778262138367, mean loss: 0.33954292689147536
Epoch: 67, step: 1288, loss: 0.31575286388397217, mean loss: 0.33954268422734846
Epoch: 67, step: 1289, loss: 0.3243972063064575, mean loss: 0.339542529741558
Epoch: 67, step: 1290, loss: 0.3337056040763855, mean loss: 0.33954247020478523
Epoch: 67, step: 1291, loss: 0.33984437584877014, mean loss: 0.3395424732841982
Epoch: 67, step: 1292, loss: 0.34621667861938477, mean loss: 0.3395425413598536
Epoch: 67, step: 1293, loss: 0.3115995228290558, mean loss: 0.3395422563491589
Epoch: 67, step: 1294, loss: 0.3258543610572815, mean loss: 0.33954211673801593
Epoch: 67, step: 1295, loss: 0.36817121505737305, mean loss: 0.33954240874056907
Epoch: 67, step: 1296, loss: 0.3254344165325165, mean loss: 0.33954226484753824
Epoch: 67, step: 1297, loss: 0.34321197867393494, mean loss: 0.3395423022760292
Epoch: 67, step: 1298, loss: 0.3463868796825409, mean loss: 0.3395423720851759
Epoch: 67, step: 1299, loss: 0.37998318672180176, mean loss: 0.33954278454452885
Epoch: 67, step: 1300, loss: 0.3193347454071045, mean loss: 0.3395425784430986
Epoch: 67, step: 1301, loss: 0.3592347204685211, mean loss: 0.3395427792808551
Epoch: 67, step: 1302, loss: 0.3368600904941559, mean loss: 0.33954275192071814
Epoch: 67, step: 1303, loss: 0.3281742334365845, mean loss: 0.33954263597694867
Epoch: 67, step: 1304, loss: 0.3612150549888611, mean loss: 0.3395428570045461
Epoch: 67, step: 1305, loss: 0.3348425626754761, mean loss: 0.33954280906877266
Epoch: 67, step: 1306, loss: 0.3187660574913025, mean loss: 0.33954259718002067
Epoch: 67, step: 1307, loss: 0.37617337703704834, mean loss: 0.33954297075002005
Epoch: 67, step: 1308, loss: 0.3235487639904022, mean loss: 0.3395428076386995
Epoch: 67, step: 1309, loss: 0.3029581308364868, mean loss: 0.3395424345464806
Epoch: 67, step: 1310, loss: 0.30770397186279297, mean loss: 0.33954210985968303
Epoch: 67, step: 1311, loss: 0.34077945351600647, mean loss: 0.33954212247791327
Epoch: 67, step: 1312, loss: 0.34308308362960815, mean loss: 0.33954215858769343
Epoch: 67, step: 1313, loss: 0.31445229053497314, mean loss: 0.3395419027305005
Epoch: 67, step: 1314, loss: 0.35487082600593567, mean loss: 0.3395420590475954
Epoch: 67, step: 1315, loss: 0.3058466911315918, mean loss: 0.3395417154417062
Epoch: 67, step: 1316, loss: 0.36905041337013245, mean loss: 0.33954201635128584
Epoch: 67, step: 1317, loss: 0.3216223418712616, mean loss: 0.3395418336205282
Epoch: 67, step: 1318, loss: 0.2913022041320801, mean loss: 0.33954134171571326
Epoch: 67, step: 1319, loss: 0.35328173637390137, mean loss: 0.3395414818266022
Epoch: 67, step: 1320, loss: 0.3269643783569336, mean loss: 0.3395413535791084
Epoch: 67, step: 1321, loss: 0.3383937478065491, mean loss: 0.3395413418772039
Epoch: 67, step: 1322, loss: 0.35406914353370667, mean loss: 0.33954149001275524
Epoch: 67, step: 1323, loss: 0.3701452910900116, mean loss: 0.3395418020671752
Epoch: 67, step: 1324, loss: 0.33884865045547485, mean loss: 0.3395417949994643
Epoch: 67, step: 1325, loss: 0.28735965490341187, mean loss: 0.3395412629304134
Epoch: 67, step: 1326, loss: 0.3423840403556824, mean loss: 0.33954129191616333
Epoch: 67, step: 1327, loss: 0.30474984645843506, mean loss: 0.33954093717651795
Epoch: 67, step: 1328, loss: 0.35925766825675964, mean loss: 0.3395411382096968
Epoch: 67, step: 1329, loss: 0.29273417592048645, mean loss: 0.3395406609674784
Epoch: 67, step: 1330, loss: 0.3554244935512543, mean loss: 0.3395408229168517
Epoch: 67, step: 1331, loss: 0.3352801501750946, mean loss: 0.33954077947606115
Epoch: 67, step: 1332, loss: 0.3693758547306061, mean loss: 0.3395410836641838
Epoch: 67, step: 1333, loss: 0.3160824775695801, mean loss: 0.33954084449077687
Epoch: 67, step: 1334, loss: 0.31715455651283264, mean loss: 0.3395406162525707
Epoch: 67, step: 1335, loss: 0.31232818961143494, mean loss: 0.3395403388125536
Epoch: 67, step: 1336, loss: 0.36124467849731445, mean loss: 0.33954056009348016
Epoch: 67, step: 1337, loss: 0.337656706571579, mean loss: 0.3395405408873394
Epoch: 67, step: 1338, loss: 0.33587026596069336, mean loss: 0.33954050346877296
Epoch: 67, step: 1339, loss: 0.31784534454345703, mean loss: 0.33954028228821137
Epoch: 67, step: 1340, loss: 0.31875744462013245, mean loss: 0.3395400704108585
Epoch: 67, step: 1341, loss: 0.3147249221801758, mean loss: 0.339539817427392
Epoch: 67, step: 1342, loss: 0.3202114403247833, mean loss: 0.3395396203820249
Epoch: 67, step: 1343, loss: 0.34574559330940247, mean loss: 0.33953968364888587
Epoch: 67, step: 1344, loss: 0.3419785499572754, mean loss: 0.33953970851168247
Epoch: 67, step: 1345, loss: 0.2644708752632141, mean loss: 0.3395389432372187
Epoch: 67, step: 1346, loss: 0.29864177107810974, mean loss: 0.33953852632328674
Epoch: 67, step: 1347, loss: 0.34610748291015625, mean loss: 0.33953859328785807
Epoch: 67, step: 1348, loss: 0.3175337612628937, mean loss: 0.3395383689707839
Epoch: 67, step: 1349, loss: 0.361007958650589, mean loss: 0.339538587829371
Epoch: 67, step: 1350, loss: 0.3594503402709961, mean loss: 0.3395387908054711
Epoch: 67, step: 1351, loss: 0.3611034154891968, mean loss: 0.3395390106283527
Epoch: 67, step: 1352, loss: 0.40692010521888733, mean loss: 0.33953969748266194
Epoch: 67, step: 1353, loss: 0.36585843563079834, mean loss: 0.339539965761985
Epoch: 67, step: 1354, loss: 0.29636386036872864, mean loss: 0.3395395256520455
Epoch: 67, step: 1355, loss: 0.3452112674713135, mean loss: 0.33953958346560886
Epoch: 67, step: 1356, loss: 0.3185240924358368, mean loss: 0.33953936925133815
Epoch: 67, step: 1357, loss: 0.36150482296943665, mean loss: 0.3395395931464487
Epoch: 67, step: 1358, loss: 0.29462578892707825, mean loss: 0.33953913534217156
Epoch: 67, step: 1359, loss: 0.308513343334198, mean loss: 0.3395388191009679
Epoch: 67, step: 1360, loss: 0.3042982220649719, mean loss: 0.33953845990255554
Epoch: 67, step: 1361, loss: 0.3095982074737549, mean loss: 0.3395381547323137
Epoch: 67, step: 1362, loss: 0.30649057030677795, mean loss: 0.3395378178935859
Epoch: 67, step: 1363, loss: 0.3416590988636017, mean loss: 0.33953783951460037
Epoch: 67, step: 1364, loss: 0.32708680629730225, mean loss: 0.3395377126095703
Epoch: 67, step: 1365, loss: 0.3165028393268585, mean loss: 0.3395374778329504
Epoch: 67, step: 1366, loss: 0.3365299105644226, mean loss: 0.33953744717945944
Epoch: 67, step: 1367, loss: 0.33004453778266907, mean loss: 0.33953735042755967
Epoch: 67, step: 1368, loss: 0.34303832054138184, mean loss: 0.3395373861091451
Epoch: 67, step: 1369, loss: 0.3325098156929016, mean loss: 0.33953731448548363
Epoch: 67, step: 1370, loss: 0.3109632432460785, mean loss: 0.3395370232669506
Epoch: 67, step: 1371, loss: 0.3137674033641815, mean loss: 0.3395367606332378
Epoch: 67, step: 1372, loss: 0.30213814973831177, mean loss: 0.3395363794853602
Epoch: 67, step: 1373, loss: 0.33839085698127747, mean loss: 0.3395363678108886
Epoch: 67, step: 1374, loss: 0.33659717440605164, mean loss: 0.33953633785671467
Epoch: 67, step: 1375, loss: 0.33171147108078003, mean loss: 0.33953625811203675
Epoch: 67, step: 1376, loss: 0.3202388882637024, mean loss: 0.3395360614509427
Epoch: 67, step: 1377, loss: 0.28938165307044983, mean loss: 0.3395355503284229
Epoch: 67, step: 1378, loss: 0.34116989374160767, mean loss: 0.3395355669838125
Epoch: 67, step: 1379, loss: 0.33027148246765137, mean loss: 0.3395354725756465
Epoch: 67, step: 1380, loss: 0.3505822420120239, mean loss: 0.33953558514959953
Epoch: 67, step: 1381, loss: 0.31378012895584106, mean loss: 0.3395353226869867
Epoch: 67, step: 1382, loss: 0.3074839413166046, mean loss: 0.3395349960686768
Epoch: 67, step: 1383, loss: 0.344536691904068, mean loss: 0.33953504703773724
Epoch: 67, step: 1384, loss: 0.32598480582237244, mean loss: 0.33953490895736455
Epoch: 67, step: 1385, loss: 0.32628193497657776, mean loss: 0.33953477390759607
Epoch: 67, step: 1386, loss: 0.33006009459495544, mean loss: 0.3395346773601939
Epoch: 67, step: 1387, loss: 0.35495442152023315, mean loss: 0.33953483448646926
Epoch: 67, step: 1388, loss: 0.3120541274547577, mean loss: 0.3395345544625534
Epoch: 67, step: 1389, loss: 0.3216346204280853, mean loss: 0.339534372067008
Epoch: 67, step: 1390, loss: 0.3237040042877197, mean loss: 0.3395342107614335
Epoch: 67, step: 1391, loss: 0.3051892817020416, mean loss: 0.3395338608029144
Epoch: 67, step: 1392, loss: 0.3003922700881958, mean loss: 0.3395334619727546
Epoch: 67, step: 1393, loss: 0.365464985370636, mean loss: 0.33953372619728023
Epoch: 67, step: 1394, loss: 0.2900564968585968, mean loss: 0.3395332220632173
Epoch: 67, step: 1395, loss: 0.35350310802459717, mean loss: 0.33953336440392035
Epoch: 67, step: 1396, loss: 0.30099421739578247, mean loss: 0.3395329717283178
Epoch: 67, step: 1397, loss: 0.3014470040798187, mean loss: 0.33953258367411643
Epoch: 67, step: 1398, loss: 0.3316417336463928, mean loss: 0.339532503275836
Epoch: 67, step: 1399, loss: 0.30097466707229614, mean loss: 0.3395321104218175
Epoch: 67, step: 1400, loss: 0.34673818945884705, mean loss: 0.3395321838416082
Epoch: 67, step: 1401, loss: 0.2938061058521271, mean loss: 0.3395317179620566
Epoch: 67, step: 1402, loss: 0.34297114610671997, mean loss: 0.3395317530042686
Epoch: 67, step: 1403, loss: 0.308611661195755, mean loss: 0.3395314379817341
Epoch: 67, step: 1404, loss: 0.2996044456958771, mean loss: 0.33953103119852535
Epoch: 67, step: 1405, loss: 0.333987295627594, mean loss: 0.33953097471854926
Epoch: 67, step: 1406, loss: 0.3396527171134949, mean loss: 0.3395309759588569
Epoch: 67, step: 1407, loss: 0.3626711666584015, mean loss: 0.3395312117079777
Epoch: 67, step: 1408, loss: 0.3820701539516449, mean loss: 0.33953164508453
Epoch: 67, step: 1409, loss: 0.34348824620246887, mean loss: 0.33953168539302364
Epoch: 67, step: 1410, loss: 0.3465387523174286, mean loss: 0.3395317567778882
Epoch: 67, step: 1411, loss: 0.31582605838775635, mean loss: 0.33953151527729336
Epoch: 67, step: 1412, loss: 0.3463788330554962, mean loss: 0.3395315850332838
Epoch: 67, step: 1413, loss: 0.30849510431289673, mean loss: 0.3395312688571594
Epoch: 67, step: 1414, loss: 0.2957615256309509, mean loss: 0.3395308229687572
Epoch: 67, step: 1415, loss: 0.3414332866668701, mean loss: 0.3395308423492195
Epoch: 67, step: 1416, loss: 0.36558783054351807, mean loss: 0.3395311077899386
Epoch: 67, step: 1417, loss: 0.2949686646461487, mean loss: 0.33953065384006653
Epoch: 67, step: 1418, loss: 0.32499873638153076, mean loss: 0.33953050580745414
Epoch: 67, step: 1419, loss: 0.346940815448761, mean loss: 0.3395305812934541
Epoch: 67, step: 1420, loss: 0.3115667998790741, mean loss: 0.3395302964399727
Epoch: 67, step: 1421, loss: 0.3030971884727478, mean loss: 0.339529925317349
Epoch: 67, step: 1422, loss: 0.3759813606739044, mean loss: 0.33953029662288076
Epoch: 67, step: 1423, loss: 0.3419071137905121, mean loss: 0.33953032083362483
Epoch: 67, step: 1424, loss: 0.268983393907547, mean loss: 0.3395296022355691
Epoch: 67, step: 1425, loss: 0.3275700807571411, mean loss: 0.3395294804159277
Epoch: 67, step: 1426, loss: 0.3735702931880951, mean loss: 0.3395298271519885
Epoch: 67, step: 1427, loss: 0.33943071961402893, mean loss: 0.33952982614250005
Epoch: 67, step: 1428, loss: 0.31444066762924194, mean loss: 0.33952957059223354
Epoch: 67, step: 1429, loss: 0.34529855847358704, mean loss: 0.33952962935272857
Epoch: 67, step: 1430, loss: 0.30177998542785645, mean loss: 0.33952924485457797
Epoch: 67, step: 1431, loss: 0.377361923456192, mean loss: 0.3395296301945515
Epoch: 67, step: 1432, loss: 0.3364582359790802, mean loss: 0.339529598911572
Epoch: 67, step: 1433, loss: 0.38916078209877014, mean loss: 0.33953010441342757
Epoch: 67, step: 1434, loss: 0.33157601952552795, mean loss: 0.33953002340057514
Epoch: 67, step: 1435, loss: 0.3563961386680603, mean loss: 0.33953019518126515
Epoch: 67, step: 1436, loss: 0.2858645021915436, mean loss: 0.3395296486039571
Epoch: 67, step: 1437, loss: 0.33834463357925415, mean loss: 0.3395296365348737
Epoch: 67, step: 1438, loss: 0.30723080039024353, mean loss: 0.3395293075826077
Epoch: 67, step: 1439, loss: 0.32341304421424866, mean loss: 0.3395291434458153
Epoch: 67, step: 1440, loss: 0.3249085247516632, mean loss: 0.33952899454299834
Epoch: 67, step: 1441, loss: 0.3273322880268097, mean loss: 0.3395288703276351
Epoch: 67, step: 1442, loss: 0.3201000690460205, mean loss: 0.3395286724602004
Epoch: 67, step: 1443, loss: 0.31352314352989197, mean loss: 0.3395284076165377
Valid: 67, mean loss: 0.1860281949241956
Epoch: 68, step: 0, loss: 0.2907933294773102, mean loss: 0.33952791129726706
Epoch: 68, step: 1, loss: 0.3296968936920166, mean loss: 0.33952781117895425
Epoch: 68, step: 2, loss: 0.30836087465286255, mean loss: 0.33952749378054775
Epoch: 68, step: 3, loss: 0.35754701495170593, mean loss: 0.3395276772862015
Epoch: 68, step: 4, loss: 0.3184138834476471, mean loss: 0.3395274622715489
Epoch: 68, step: 5, loss: 0.3261103332042694, mean loss: 0.3395273256381239
Epoch: 68, step: 6, loss: 0.3057714104652405, mean loss: 0.339526981888033
Epoch: 68, step: 7, loss: 0.36525818705558777, mean loss: 0.33952724391659883
Epoch: 68, step: 8, loss: 0.30866676568984985, mean loss: 0.33952692965830994
Epoch: 68, step: 9, loss: 0.3335320055484772, mean loss: 0.3395268686114462
Epoch: 68, step: 10, loss: 0.35078713297843933, mean loss: 0.3395269832745865
Epoch: 68, step: 11, loss: 0.3236357271671295, mean loss: 0.3395268214557593
Epoch: 68, step: 12, loss: 0.3275308907032013, mean loss: 0.33952669930382456
Epoch: 68, step: 13, loss: 0.3405481278896332, mean loss: 0.33952670970470217
Epoch: 68, step: 14, loss: 0.32923784852027893, mean loss: 0.3395266049376165
Epoch: 68, step: 15, loss: 0.3354696035385132, mean loss: 0.33952656362732203
Epoch: 68, step: 16, loss: 0.30479976534843445, mean loss: 0.33952621002634575
Epoch: 68, step: 17, loss: 0.3148946464061737, mean loss: 0.33952595922129924
Epoch: 68, step: 18, loss: 0.37949660420417786, mean loss: 0.33952636620875465
Epoch: 68, step: 19, loss: 0.32267042994499207, mean loss: 0.33952619458068206
Epoch: 68, step: 20, loss: 0.3251664340496063, mean loss: 0.33952604837029715
Epoch: 68, step: 21, loss: 0.35579895973205566, mean loss: 0.33952621405860395
Epoch: 68, step: 22, loss: 0.33810752630233765, mean loss: 0.3395261996138882
Epoch: 68, step: 23, loss: 0.3172743320465088, mean loss: 0.3395259730533729
Epoch: 68, step: 24, loss: 0.31111714243888855, mean loss: 0.3395256838078185
Epoch: 68, step: 25, loss: 0.3651445508003235, mean loss: 0.3395259446445999
Epoch: 68, step: 26, loss: 0.3583395481109619, mean loss: 0.3395261361920955
Epoch: 68, step: 27, loss: 0.32325637340545654, mean loss: 0.3395259705459665
Epoch: 68, step: 28, loss: 0.3325219452381134, mean loss: 0.3395258992371292
Epoch: 68, step: 29, loss: 0.3559756278991699, mean loss: 0.3395260667121212
Epoch: 68, step: 30, loss: 0.307647168636322, mean loss: 0.3395257421557742
Epoch: 68, step: 31, loss: 0.33488157391548157, mean loss: 0.3395256948743741
Epoch: 68, step: 32, loss: 0.3039536476135254, mean loss: 0.3395253327257637
Epoch: 68, step: 33, loss: 0.35176411271095276, mean loss: 0.3395254573239351
Epoch: 68, step: 34, loss: 0.36133694648742676, mean loss: 0.3395256793758064
Epoch: 68, step: 35, loss: 0.31510499119758606, mean loss: 0.3395254307635148
Epoch: 68, step: 36, loss: 0.3341364860534668, mean loss: 0.3395253759024788
Epoch: 68, step: 37, loss: 0.3489799499511719, mean loss: 0.3395254721518328
Epoch: 68, step: 38, loss: 0.31655052304267883, mean loss: 0.33952523826488157
Epoch: 68, step: 39, loss: 0.3147745430469513, mean loss: 0.3395249863032477
Epoch: 68, step: 40, loss: 0.3638874292373657, mean loss: 0.33952523430995557
Epoch: 68, step: 41, loss: 0.3265230357646942, mean loss: 0.3395251019505022
Epoch: 68, step: 42, loss: 0.30003565549850464, mean loss: 0.33952469996092155
Epoch: 68, step: 43, loss: 0.32041677832603455, mean loss: 0.3395245054505421
Epoch: 68, step: 44, loss: 0.40637776255607605, mean loss: 0.3395251859808627
Epoch: 68, step: 45, loss: 0.2826996445655823, mean loss: 0.33952460753320074
Epoch: 68, step: 46, loss: 0.3650783598423004, mean loss: 0.33952486765140544
Epoch: 68, step: 47, loss: 0.3062632381916046, mean loss: 0.339524529076187
Epoch: 68, step: 48, loss: 0.3363792300224304, mean loss: 0.33952449706003235
Epoch: 68, step: 49, loss: 0.3535522520542145, mean loss: 0.3395246398477911
Epoch: 68, step: 50, loss: 0.35467296838760376, mean loss: 0.3395247940402378
Epoch: 68, step: 51, loss: 0.311967134475708, mean loss: 0.33952451353802326
Epoch: 68, step: 52, loss: 0.3235940635204315, mean loss: 0.3395243513877864
Epoch: 68, step: 53, loss: 0.32803934812545776, mean loss: 0.3395242344873196
Epoch: 68, step: 54, loss: 0.3911401629447937, mean loss: 0.3395247598563228
Epoch: 68, step: 55, loss: 0.3777059018611908, mean loss: 0.339525148476366
Epoch: 68, step: 56, loss: 0.33058032393455505, mean loss: 0.3395250574339682
Epoch: 68, step: 57, loss: 0.29412731528282166, mean loss: 0.3395245953704349
Epoch: 68, step: 58, loss: 0.32801553606987, mean loss: 0.33952447823107446
Epoch: 68, step: 59, loss: 0.3152428865432739, mean loss: 0.3395242310952229
Epoch: 68, step: 60, loss: 0.31689032912254333, mean loss: 0.3395240007317534
Epoch: 68, step: 61, loss: 0.31646305322647095, mean loss: 0.3395237660242859
Epoch: 68, step: 62, loss: 0.3241786062717438, mean loss: 0.33952360984740176
Epoch: 68, step: 63, loss: 0.3478431701660156, mean loss: 0.33952369451968967
Epoch: 68, step: 64, loss: 0.31362348794937134, mean loss: 0.339523430923136
Epoch: 68, step: 65, loss: 0.3301659822463989, mean loss: 0.3395233356896825
Epoch: 68, step: 66, loss: 0.34666842222213745, mean loss: 0.3395234084065485
Epoch: 68, step: 67, loss: 0.3199121952056885, mean loss: 0.33952320882163906
Epoch: 68, step: 68, loss: 0.33081570267677307, mean loss: 0.3395231202055437
Epoch: 68, step: 69, loss: 0.31639838218688965, mean loss: 0.339522884867997
Epoch: 68, step: 70, loss: 0.33086472749710083, mean loss: 0.33952279675591646
Epoch: 68, step: 71, loss: 0.32615435123443604, mean loss: 0.3395226607096989
Epoch: 68, step: 72, loss: 0.3070763051509857, mean loss: 0.3395223305173053
Epoch: 68, step: 73, loss: 0.32647767663002014, mean loss: 0.33952219776890924
Epoch: 68, step: 74, loss: 0.34317296743392944, mean loss: 0.339522234920442
Epoch: 68, step: 75, loss: 0.3260052502155304, mean loss: 0.33952209736818995
Epoch: 68, step: 76, loss: 0.3362060487270355, mean loss: 0.3395220636235844
Epoch: 68, step: 77, loss: 0.33293285965919495, mean loss: 0.33952199657154447
Epoch: 68, step: 78, loss: 0.30320560932159424, mean loss: 0.3395216270180928
Epoch: 68, step: 79, loss: 0.3109569549560547, mean loss: 0.3395213363486034
Epoch: 68, step: 80, loss: 0.3168336749076843, mean loss: 0.3395211054849741
Epoch: 68, step: 81, loss: 0.31188639998435974, mean loss: 0.3395208242843971
Epoch: 68, step: 82, loss: 0.3047577440738678, mean loss: 0.3395204705517061
Epoch: 68, step: 83, loss: 0.3525296151638031, mean loss: 0.3395206029252725
Epoch: 68, step: 84, loss: 0.32275524735450745, mean loss: 0.3395204323324016
Epoch: 68, step: 85, loss: 0.3269776403903961, mean loss: 0.33952030470676875
Epoch: 68, step: 86, loss: 0.28125593066215515, mean loss: 0.3395197118601378
Epoch: 68, step: 87, loss: 0.32185545563697815, mean loss: 0.339519532126151
Epoch: 68, step: 88, loss: 0.3030964136123657, mean loss: 0.3395191615243204
Epoch: 68, step: 89, loss: 0.3100466728210449, mean loss: 0.33951886164755046
Epoch: 68, step: 90, loss: 0.3244085907936096, mean loss: 0.33951870790508376
Epoch: 68, step: 91, loss: 0.3141684830188751, mean loss: 0.3395184499767853
Epoch: 68, step: 92, loss: 0.4213900566101074, mean loss: 0.3395192829788368
Epoch: 68, step: 93, loss: 0.38364264369010925, mean loss: 0.3395197319070739
Epoch: 68, step: 94, loss: 0.342512845993042, mean loss: 0.3395197623598712
Epoch: 68, step: 95, loss: 0.3442150056362152, mean loss: 0.3395198101301308
Epoch: 68, step: 96, loss: 0.3374841809272766, mean loss: 0.3395197894194795
Epoch: 68, step: 97, loss: 0.309481680393219, mean loss: 0.33951948381251007
Epoch: 68, step: 98, loss: 0.30876579880714417, mean loss: 0.3395191709284718
Epoch: 68, step: 99, loss: 0.30906185507774353, mean loss: 0.3395188610628077
Epoch: 68, step: 100, loss: 0.3436087369918823, mean loss: 0.33951890267183304
Epoch: 68, step: 101, loss: 0.32508453726768494, mean loss: 0.33951875582293684
Epoch: 68, step: 102, loss: 0.2860560715198517, mean loss: 0.33951821192259296
Epoch: 68, step: 103, loss: 0.3486733138561249, mean loss: 0.33951830506068537
Epoch: 68, step: 104, loss: 0.3472086787223816, mean loss: 0.33951838329678274
Epoch: 68, step: 105, loss: 0.3348482549190521, mean loss: 0.33951833578688045
Epoch: 68, step: 106, loss: 0.4258258044719696, mean loss: 0.3395192137965111
Epoch: 68, step: 107, loss: 0.3280424177646637, mean loss: 0.33951909704375394
Epoch: 68, step: 108, loss: 0.3919413387775421, mean loss: 0.3395196303266476
Epoch: 68, step: 109, loss: 0.30254891514778137, mean loss: 0.33951925423343304
Epoch: 68, step: 110, loss: 0.31313231587409973, mean loss: 0.33951898580888484
Epoch: 68, step: 111, loss: 0.34201887249946594, mean loss: 0.3395190112390473
Epoch: 68, step: 112, loss: 0.3284221589565277, mean loss: 0.3395188983571768
Epoch: 68, step: 113, loss: 0.32379797101020813, mean loss: 0.3395187384388875
Epoch: 68, step: 114, loss: 0.3619774580001831, mean loss: 0.3395189668938252
Epoch: 68, step: 115, loss: 0.36413273215293884, mean loss: 0.33951921726780554
Epoch: 68, step: 116, loss: 0.3007148206233978, mean loss: 0.33951882254914656
Epoch: 68, step: 117, loss: 0.32200565934181213, mean loss: 0.3395186444069107
Epoch: 68, step: 118, loss: 0.31888678669929504, mean loss: 0.33951843454374475
Epoch: 68, step: 119, loss: 0.3398587107658386, mean loss: 0.3395184380049318
Epoch: 68, step: 120, loss: 0.3096606433391571, mean loss: 0.3395181343035427
Epoch: 68, step: 121, loss: 0.35095369815826416, mean loss: 0.33951825062028146
Epoch: 68, step: 122, loss: 0.30508583784103394, mean loss: 0.33951790039485524
Epoch: 68, step: 123, loss: 0.3614138066768646, mean loss: 0.33951812310434587
Epoch: 68, step: 124, loss: 0.3414839506149292, mean loss: 0.33951814309913325
Epoch: 68, step: 125, loss: 0.34722939133644104, mean loss: 0.3395182215308369
Epoch: 68, step: 126, loss: 0.3242097496986389, mean loss: 0.33951806582876676
Epoch: 68, step: 127, loss: 0.3281373381614685, mean loss: 0.33951795007685803
Epoch: 68, step: 128, loss: 0.3549312353134155, mean loss: 0.3395181068417937
Epoch: 68, step: 129, loss: 0.30758488178253174, mean loss: 0.33951778205969957
Epoch: 68, step: 130, loss: 0.3099227249622345, mean loss: 0.3395174810613869
Epoch: 68, step: 131, loss: 0.32699671387672424, mean loss: 0.33951735371946445
Epoch: 68, step: 132, loss: 0.3034471869468689, mean loss: 0.3395169868731205
Epoch: 68, step: 133, loss: 0.3352883756160736, mean loss: 0.3395169438670869
Epoch: 68, step: 134, loss: 0.3550514578819275, mean loss: 0.33951710185537104
Epoch: 68, step: 135, loss: 0.30788370966911316, mean loss: 0.33951678014240844
Epoch: 68, step: 136, loss: 0.28958553075790405, mean loss: 0.33951627234461346
Epoch: 68, step: 137, loss: 0.374830424785614, mean loss: 0.33951663148376166
Epoch: 68, step: 138, loss: 0.36132296919822693, mean loss: 0.3395168532483904
Epoch: 68, step: 139, loss: 0.3377484381198883, mean loss: 0.3395168352642639
Epoch: 68, step: 140, loss: 0.3158213794231415, mean loss: 0.3395165942927097
Epoch: 68, step: 141, loss: 0.3219337463378906, mean loss: 0.3395164154852987
Epoch: 68, step: 142, loss: 0.3467784821987152, mean loss: 0.3395164893355729
Epoch: 68, step: 143, loss: 0.3858497440814972, mean loss: 0.33951696050843677
Epoch: 68, step: 144, loss: 0.3174487352371216, mean loss: 0.3395167360941749
Epoch: 68, step: 145, loss: 0.2937072813510895, mean loss: 0.3395162702574206
Epoch: 68, step: 146, loss: 0.3548717498779297, mean loss: 0.33951642640584206
Epoch: 68, step: 147, loss: 0.3474208414554596, mean loss: 0.33951650678427453
Epoch: 68, step: 148, loss: 0.35181924700737, mean loss: 0.3395166318871332
Epoch: 68, step: 149, loss: 0.3384973704814911, mean loss: 0.3395166215226765
Epoch: 68, step: 150, loss: 0.3633885085582733, mean loss: 0.3395168642637667
Epoch: 68, step: 151, loss: 0.35894256830215454, mean loss: 0.3395170617918725
Epoch: 68, step: 152, loss: 0.33910003304481506, mean loss: 0.3395170575514053
Epoch: 68, step: 153, loss: 0.3698996603488922, mean loss: 0.33951736648723185
Epoch: 68, step: 154, loss: 0.39342832565307617, mean loss: 0.3395179146580878
Epoch: 68, step: 155, loss: 0.3219105005264282, mean loss: 0.339517735626342
Epoch: 68, step: 156, loss: 0.3408797085285187, mean loss: 0.33951774947470753
Epoch: 68, step: 157, loss: 0.3227280080318451, mean loss: 0.3395175787605088
Epoch: 68, step: 158, loss: 0.3705283999443054, mean loss: 0.33951789406814353
Epoch: 68, step: 159, loss: 0.3432375490665436, mean loss: 0.33951793188796414
Epoch: 68, step: 160, loss: 0.34502652287483215, mean loss: 0.3395179878963318
Epoch: 68, step: 161, loss: 0.34212246537208557, mean loss: 0.339518014376978
Epoch: 68, step: 162, loss: 0.2840055823326111, mean loss: 0.33951744996813205
Epoch: 68, step: 163, loss: 0.32201310992240906, mean loss: 0.3395172719989177
Epoch: 68, step: 164, loss: 0.31796813011169434, mean loss: 0.3395170529078323
Epoch: 68, step: 165, loss: 0.31897544860839844, mean loss: 0.3395168440625498
Epoch: 68, step: 166, loss: 0.2880934476852417, mean loss: 0.33951632124921927
Epoch: 68, step: 167, loss: 0.4010600447654724, mean loss: 0.339516946947913
Epoch: 68, step: 168, loss: 0.35927197337150574, mean loss: 0.3395171477899787
Epoch: 68, step: 169, loss: 0.3092931807041168, mean loss: 0.3395168405171794
Epoch: 68, step: 170, loss: 0.30555737018585205, mean loss: 0.33951649527079275
Epoch: 68, step: 171, loss: 0.3647992014884949, mean loss: 0.3395167523029002
Epoch: 68, step: 172, loss: 0.32104140520095825, mean loss: 0.3395165644785002
Epoch: 68, step: 173, loss: 0.31966790556907654, mean loss: 0.3395163626947649
Epoch: 68, step: 174, loss: 0.3084335923194885, mean loss: 0.3395160467069806
Epoch: 68, step: 175, loss: 0.3378012180328369, mean loss: 0.3395160292741907
Epoch: 68, step: 176, loss: 0.3434269428253174, mean loss: 0.3395160690317724
Epoch: 68, step: 177, loss: 0.30784499645233154, mean loss: 0.3395157470731206
Epoch: 68, step: 178, loss: 0.35629332065582275, mean loss: 0.3395159176271821
Epoch: 68, step: 179, loss: 0.3415782153606415, mean loss: 0.33951593859145784
Epoch: 68, step: 180, loss: 0.31413206458091736, mean loss: 0.3395156805544557
Epoch: 68, step: 181, loss: 0.30836471915245056, mean loss: 0.33951536389597475
Epoch: 68, step: 182, loss: 0.3128582239151001, mean loss: 0.33951509292123544
Epoch: 68, step: 183, loss: 0.3153463900089264, mean loss: 0.3395148472444148
Epoch: 68, step: 184, loss: 0.32438647747039795, mean loss: 0.3395146934648751
Epoch: 68, step: 185, loss: 0.32090505957603455, mean loss: 0.3395145043002866
Epoch: 68, step: 186, loss: 0.3309936225414276, mean loss: 0.33951441768747537
Epoch: 68, step: 187, loss: 0.31057897210121155, mean loss: 0.3395141235682887
Epoch: 68, step: 188, loss: 0.31581994891166687, mean loss: 0.33951388272732697
Epoch: 68, step: 189, loss: 0.3109593093395233, mean loss: 0.33951359248548
Epoch: 68, step: 190, loss: 0.3186436593532562, mean loss: 0.33951338035601525
Epoch: 68, step: 191, loss: 0.32946375012397766, mean loss: 0.33951327820901744
Epoch: 68, step: 192, loss: 0.3022248148918152, mean loss: 0.33951289920344424
Epoch: 68, step: 193, loss: 0.3447439670562744, mean loss: 0.3395129523722676
Epoch: 68, step: 194, loss: 0.3512956202030182, mean loss: 0.3395130721306486
Epoch: 68, step: 195, loss: 0.3236005902290344, mean loss: 0.33951291039871073
Epoch: 68, step: 196, loss: 0.33089402318000793, mean loss: 0.3395128227986008
Epoch: 68, step: 197, loss: 0.31574833393096924, mean loss: 0.3395125812650215
Epoch: 68, step: 198, loss: 0.35566583275794983, mean loss: 0.3395127454390973
Epoch: 68, step: 199, loss: 0.36627110838890076, mean loss: 0.33951301739579043
Epoch: 68, step: 200, loss: 0.2809099853038788, mean loss: 0.33951242179415114
Epoch: 68, step: 201, loss: 0.3171433210372925, mean loss: 0.33951219445202907
Epoch: 68, step: 202, loss: 0.36107632517814636, mean loss: 0.3395124136108352
Epoch: 68, step: 203, loss: 0.35214725136756897, mean loss: 0.33951254201887776
Epoch: 68, step: 204, loss: 0.3511003851890564, mean loss: 0.33951265978510203
Epoch: 68, step: 205, loss: 0.3807286322116852, mean loss: 0.33951307865512403
Epoch: 68, step: 206, loss: 0.32173141837120056, mean loss: 0.3395128979453578
Epoch: 68, step: 207, loss: 0.32617834210395813, mean loss: 0.33951276243157896
Epoch: 68, step: 208, loss: 0.3222997784614563, mean loss: 0.3395125875046578
Epoch: 68, step: 209, loss: 0.3041831851005554, mean loss: 0.33951222847331286
Epoch: 68, step: 210, loss: 0.32262125611305237, mean loss: 0.33951205682232294
Epoch: 68, step: 211, loss: 0.3228939175605774, mean loss: 0.3395118879456588
Epoch: 68, step: 212, loss: 0.33411267399787903, mean loss: 0.33951183307838634
Epoch: 68, step: 213, loss: 0.3610176742076874, mean loss: 0.33951205162035664
Epoch: 68, step: 214, loss: 0.34027016162872314, mean loss: 0.3395120593241786
Epoch: 68, step: 215, loss: 0.31635284423828125, mean loss: 0.33951182398543495
Epoch: 68, step: 216, loss: 0.3496716022491455, mean loss: 0.33951192722577134
Epoch: 68, step: 217, loss: 0.32687127590179443, mean loss: 0.3395117987769214
Epoch: 68, step: 218, loss: 0.3876171410083771, mean loss: 0.33951228759770596
Epoch: 68, step: 219, loss: 0.3306717872619629, mean loss: 0.3395121977661779
Epoch: 68, step: 220, loss: 0.3030701279640198, mean loss: 0.3395118274688615
Epoch: 68, step: 221, loss: 0.3442961573600769, mean loss: 0.33951187608318356
Epoch: 68, step: 222, loss: 0.3227669298648834, mean loss: 0.33951170593690283
Epoch: 68, step: 223, loss: 0.32607051730155945, mean loss: 0.3395115693616647
Epoch: 68, step: 224, loss: 0.3090832829475403, mean loss: 0.3395112601845265
Epoch: 68, step: 225, loss: 0.3497685492038727, mean loss: 0.3395113644062036
Epoch: 68, step: 226, loss: 0.29521459341049194, mean loss: 0.33951091432267305
Epoch: 68, step: 227, loss: 0.34808096289634705, mean loss: 0.3395110013989642
Epoch: 68, step: 228, loss: 0.35329681634902954, mean loss: 0.33951114146881667
Epoch: 68, step: 229, loss: 0.31109291315078735, mean loss: 0.33951085273023873
Epoch: 68, step: 230, loss: 0.3242490887641907, mean loss: 0.33951069766725583
Epoch: 68, step: 231, loss: 0.33966803550720215, mean loss: 0.3395106992658277
Epoch: 68, step: 232, loss: 0.32458919286727905, mean loss: 0.3395105476630195
Epoch: 68, step: 233, loss: 0.3036455810070038, mean loss: 0.3395101832779317
Epoch: 68, step: 234, loss: 0.3410429060459137, mean loss: 0.33951019885010975
Epoch: 68, step: 235, loss: 0.34408068656921387, mean loss: 0.3395102452849425
Epoch: 68, step: 236, loss: 0.30847030878067017, mean loss: 0.33950992993137286
Epoch: 68, step: 237, loss: 0.2896522283554077, mean loss: 0.3395094234018435
Epoch: 68, step: 238, loss: 0.33431434631347656, mean loss: 0.3395093706229721
Epoch: 68, step: 239, loss: 0.3274555802345276, mean loss: 0.33950924816492606
Epoch: 68, step: 240, loss: 0.3135252594947815, mean loss: 0.3395089841885292
Epoch: 68, step: 241, loss: 0.3149147033691406, mean loss: 0.3395087343329832
Epoch: 68, step: 242, loss: 0.3426240384578705, mean loss: 0.3395087659813209
Epoch: 68, step: 243, loss: 0.308001309633255, mean loss: 0.33950844590069645
Epoch: 68, step: 244, loss: 0.3072372078895569, mean loss: 0.3395081180642324
Epoch: 68, step: 245, loss: 0.351578027009964, mean loss: 0.3395082406785576
Epoch: 68, step: 246, loss: 0.34509706497192383, mean loss: 0.3395082974530504
Epoch: 68, step: 247, loss: 0.3276809751987457, mean loss: 0.33950817730552646
Epoch: 68, step: 248, loss: 0.33633947372436523, mean loss: 0.3395081451166663
Epoch: 68, step: 249, loss: 0.3265584111213684, mean loss: 0.3395080135698266
Epoch: 68, step: 250, loss: 0.3338899314403534, mean loss: 0.3395079565004349
Epoch: 68, step: 251, loss: 0.3319494426250458, mean loss: 0.339507879720602
Epoch: 68, step: 252, loss: 0.3705696165561676, mean loss: 0.3395081952443649
Epoch: 68, step: 253, loss: 0.3575887084007263, mean loss: 0.33950837890356034
Epoch: 68, step: 254, loss: 0.32264941930770874, mean loss: 0.33950820765446593
Epoch: 68, step: 255, loss: 0.3218415081501007, mean loss: 0.3395080282023744
Epoch: 68, step: 256, loss: 0.3428545892238617, mean loss: 0.33950806219521357
Epoch: 68, step: 257, loss: 0.3107827305793762, mean loss: 0.33950777041937186
Epoch: 68, step: 258, loss: 0.32698649168014526, mean loss: 0.3395076432365221
Epoch: 68, step: 259, loss: 0.3326484262943268, mean loss: 0.3395075735658507
Epoch: 68, step: 260, loss: 0.3116106688976288, mean loss: 0.3395072902133407
Epoch: 68, step: 261, loss: 0.33556315302848816, mean loss: 0.3395072501526303
Epoch: 68, step: 262, loss: 0.3797462284564972, mean loss: 0.3395076588568942
Epoch: 68, step: 263, loss: 0.31691184639930725, mean loss: 0.33950742935526446
Epoch: 68, step: 264, loss: 0.3003689646720886, mean loss: 0.3395070318369094
Epoch: 68, step: 265, loss: 0.3248167335987091, mean loss: 0.3395068826332059
Epoch: 68, step: 266, loss: 0.31823304295539856, mean loss: 0.3395066665652012
Epoch: 68, step: 267, loss: 0.35409411787986755, mean loss: 0.33950681472131855
Epoch: 68, step: 268, loss: 0.32772502303123474, mean loss: 0.33950669506184233
Epoch: 68, step: 269, loss: 0.3122418224811554, mean loss: 0.3395064181542782
Epoch: 68, step: 270, loss: 0.3344508707523346, mean loss: 0.33950636680963703
Epoch: 68, step: 271, loss: 0.3106096684932709, mean loss: 0.33950607333488164
Epoch: 68, step: 272, loss: 0.32940059900283813, mean loss: 0.33950597070476607
Epoch: 68, step: 273, loss: 0.3469165563583374, mean loss: 0.33950604596511635
Epoch: 68, step: 274, loss: 0.3295084238052368, mean loss: 0.3395059444323982
Epoch: 68, step: 275, loss: 0.32694241404533386, mean loss: 0.33950581684241576
Epoch: 68, step: 276, loss: 0.29119428992271423, mean loss: 0.33950532621565077
Epoch: 68, step: 277, loss: 0.33601516485214233, mean loss: 0.3395052907717454
Epoch: 68, step: 278, loss: 0.3730238974094391, mean loss: 0.33950563116238464
Epoch: 68, step: 279, loss: 0.35264843702316284, mean loss: 0.33950576462982573
Epoch: 68, step: 280, loss: 0.3416309952735901, mean loss: 0.3395057862116872
Epoch: 68, step: 281, loss: 0.348168283700943, mean loss: 0.33950587417904393
Epoch: 68, step: 282, loss: 0.33186131715774536, mean loss: 0.3395057965496251
Epoch: 68, step: 283, loss: 0.35891208052635193, mean loss: 0.3395059936157526
Epoch: 68, step: 284, loss: 0.3241002857685089, mean loss: 0.3395058371760982
Epoch: 68, step: 285, loss: 0.3306221067905426, mean loss: 0.33950574696579355
Epoch: 68, step: 286, loss: 0.3262105882167816, mean loss: 0.33950561196077983
Epoch: 68, step: 287, loss: 0.30540189146995544, mean loss: 0.33950526565980005
Epoch: 68, step: 288, loss: 0.35902661085128784, mean loss: 0.3395054638842818
Epoch: 68, step: 289, loss: 0.3448857367038727, mean loss: 0.33950551851632443
Epoch: 68, step: 290, loss: 0.3420731723308563, mean loss: 0.3395055445883756
Epoch: 68, step: 291, loss: 0.35991883277893066, mean loss: 0.33950575186354914
Epoch: 68, step: 292, loss: 0.3172536790370941, mean loss: 0.3395055259197727
Epoch: 68, step: 293, loss: 0.3205251693725586, mean loss: 0.3395053331984057
Epoch: 68, step: 294, loss: 0.3155096769332886, mean loss: 0.3395050895555263
Epoch: 68, step: 295, loss: 0.39881017804145813, mean loss: 0.3395056917110019
Epoch: 68, step: 296, loss: 0.3503459692001343, mean loss: 0.3395058017768721
Epoch: 68, step: 297, loss: 0.36626046895980835, mean loss: 0.33950607342543726
Epoch: 68, step: 298, loss: 0.33226609230041504, mean loss: 0.33950599991637426
Epoch: 68, step: 299, loss: 0.33106178045272827, mean loss: 0.3395059141812946
Epoch: 68, step: 300, loss: 0.32753974199295044, mean loss: 0.33950579268867903
Epoch: 68, step: 301, loss: 0.3578075170516968, mean loss: 0.339505978504306
Epoch: 68, step: 302, loss: 0.3743351995944977, mean loss: 0.3395063321184092
Epoch: 68, step: 303, loss: 0.33433201909065247, mean loss: 0.33950627958517915
Epoch: 68, step: 304, loss: 0.3124677240848541, mean loss: 0.33950600507371687
Epoch: 68, step: 305, loss: 0.3322325646877289, mean loss: 0.33950593123018313
Epoch: 68, step: 306, loss: 0.3396141827106476, mean loss: 0.33950593232919407
Epoch: 68, step: 307, loss: 0.35103246569633484, mean loss: 0.3395060493498374
Epoch: 68, step: 308, loss: 0.35207808017730713, mean loss: 0.3395061769833724
Epoch: 68, step: 309, loss: 0.33199915289878845, mean loss: 0.33950610077147736
Epoch: 68, step: 310, loss: 0.3088493347167969, mean loss: 0.33950578954475275
Epoch: 68, step: 311, loss: 0.3689613342285156, mean loss: 0.3395060885736722
Epoch: 68, step: 312, loss: 0.41350170969963074, mean loss: 0.33950683976012086
Epoch: 68, step: 313, loss: 0.3412536680698395, mean loss: 0.3395068574933382
Epoch: 68, step: 314, loss: 0.359935462474823, mean loss: 0.3395070648756053
Epoch: 68, step: 315, loss: 0.3625718355178833, mean loss: 0.3395072990166968
Epoch: 68, step: 316, loss: 0.32889991998672485, mean loss: 0.3395071913374083
Epoch: 68, step: 317, loss: 0.3772987127304077, mean loss: 0.3395075749687289
Epoch: 68, step: 318, loss: 0.3394237458705902, mean loss: 0.3395075741177671
Epoch: 68, step: 319, loss: 0.32175934314727783, mean loss: 0.3395073939546299
Epoch: 68, step: 320, loss: 0.2937529683113098, mean loss: 0.3395069295039925
Epoch: 68, step: 321, loss: 0.30712664127349854, mean loss: 0.3395066008168188
Epoch: 68, step: 322, loss: 0.33577606081962585, mean loss: 0.339506562949083
Epoch: 68, step: 323, loss: 0.30202069878578186, mean loss: 0.3395061824437421
Epoch: 68, step: 324, loss: 0.31475958228111267, mean loss: 0.33950593125257544
Epoch: 68, step: 325, loss: 0.3413662612438202, mean loss: 0.3395059501357236
Epoch: 68, step: 326, loss: 0.3099903166294098, mean loss: 0.3395056505424116
Epoch: 68, step: 327, loss: 0.3866494596004486, mean loss: 0.33950612906260097
Epoch: 68, step: 328, loss: 0.33538201451301575, mean loss: 0.33950608720234227
Epoch: 68, step: 329, loss: 0.32437288761138916, mean loss: 0.3395059336001053
Epoch: 68, step: 330, loss: 0.3475766181945801, mean loss: 0.3395060155168617
Epoch: 68, step: 331, loss: 0.30703091621398926, mean loss: 0.33950568590073466
Epoch: 68, step: 332, loss: 0.29184287786483765, mean loss: 0.3395052021371413
Epoch: 68, step: 333, loss: 0.3281235694885254, mean loss: 0.3395050866180636
Epoch: 68, step: 334, loss: 0.39590033888816833, mean loss: 0.33950565900179874
Epoch: 68, step: 335, loss: 0.33774396777153015, mean loss: 0.33950564112169124
Epoch: 68, step: 336, loss: 0.3274346888065338, mean loss: 0.33950551861002143
Epoch: 68, step: 337, loss: 0.29200154542922974, mean loss: 0.3395050364830227
Epoch: 68, step: 338, loss: 0.31135493516921997, mean loss: 0.3395047507851072
Epoch: 68, step: 339, loss: 0.31828275322914124, mean loss: 0.33950453540332715
Epoch: 68, step: 340, loss: 0.3819716274738312, mean loss: 0.3395049663969239
Epoch: 68, step: 341, loss: 0.3416706323623657, mean loss: 0.3395049883757938
Epoch: 68, step: 342, loss: 0.36357754468917847, mean loss: 0.3395052326804197
Epoch: 68, step: 343, loss: 0.29740577936172485, mean loss: 0.33950480543095435
Epoch: 68, step: 344, loss: 0.32555386424064636, mean loss: 0.33950466385021627
Epoch: 68, step: 345, loss: 0.3168022036552429, mean loss: 0.33950443345726944
Epoch: 68, step: 346, loss: 0.31714728474617004, mean loss: 0.3395042065709735
Epoch: 68, step: 347, loss: 0.3444664776325226, mean loss: 0.33950425692891
Epoch: 68, step: 348, loss: 0.35475605726242065, mean loss: 0.33950441170509793
Epoch: 68, step: 349, loss: 0.3489091992378235, mean loss: 0.33950450714447944
Epoch: 68, step: 350, loss: 0.3492403030395508, mean loss: 0.33950460594191706
Epoch: 68, step: 351, loss: 0.3168236315250397, mean loss: 0.3395043757810304
Epoch: 68, step: 352, loss: 0.3056730329990387, mean loss: 0.3395040324724629
Epoch: 68, step: 353, loss: 0.34903109073638916, mean loss: 0.3395041291487183
Epoch: 68, step: 354, loss: 0.30875957012176514, mean loss: 0.3395038171700784
Epoch: 68, step: 355, loss: 0.33331507444381714, mean loss: 0.33950375437080565
Epoch: 68, step: 356, loss: 0.3501230776309967, mean loss: 0.3395038621275892
Epoch: 68, step: 357, loss: 0.3269505202770233, mean loss: 0.3395037347471544
Epoch: 68, step: 358, loss: 0.34290850162506104, mean loss: 0.33950376929542764
Epoch: 68, step: 359, loss: 0.325757771730423, mean loss: 0.3395036298157868
Epoch: 68, step: 360, loss: 0.3736836612224579, mean loss: 0.33950397663456866
Epoch: 68, step: 361, loss: 0.35164594650268555, mean loss: 0.3395040998357565
Epoch: 68, step: 362, loss: 0.34023115038871765, mean loss: 0.33950410721286123
Epoch: 68, step: 363, loss: 0.3436054587364197, mean loss: 0.3395041488272888
Epoch: 68, step: 364, loss: 0.31614571809768677, mean loss: 0.33950391182300976
Epoch: 68, step: 365, loss: 0.32057392597198486, mean loss: 0.33950371975350907
Epoch: 68, step: 366, loss: 0.3229253590106964, mean loss: 0.3395035515460319
Epoch: 68, step: 367, loss: 0.318477600812912, mean loss: 0.33950333821455125
Epoch: 68, step: 368, loss: 0.3202763795852661, mean loss: 0.33950314313781066
Epoch: 68, step: 369, loss: 0.3459304869174957, mean loss: 0.3395032083489851
Epoch: 68, step: 370, loss: 0.3667120933532715, mean loss: 0.3395034844047566
Epoch: 68, step: 371, loss: 0.3712359070777893, mean loss: 0.33950380635214783
Epoch: 68, step: 372, loss: 0.35582417249679565, mean loss: 0.3395039719318784
Epoch: 68, step: 373, loss: 0.3314002752304077, mean loss: 0.33950388971593476
Epoch: 68, step: 374, loss: 0.31144770979881287, mean loss: 0.33950360507523436
Epoch: 68, step: 375, loss: 0.3176528513431549, mean loss: 0.33950338339321046
Epoch: 68, step: 376, loss: 0.31712308526039124, mean loss: 0.3395031563411136
Epoch: 68, step: 377, loss: 0.3213837444782257, mean loss: 0.33950297251832917
Epoch: 68, step: 378, loss: 0.340080201625824, mean loss: 0.3395029783743021
Epoch: 68, step: 379, loss: 0.3458796441555023, mean loss: 0.33950304306473933
Epoch: 68, step: 380, loss: 0.3507137596607208, mean loss: 0.3395031567948337
Epoch: 68, step: 381, loss: 0.3252868056297302, mean loss: 0.3395030125747436
Epoch: 68, step: 382, loss: 0.3412851095199585, mean loss: 0.3395030306533329
Epoch: 68, step: 383, loss: 0.3072715997695923, mean loss: 0.3395027036829661
Epoch: 68, step: 384, loss: 0.336137980222702, mean loss: 0.3395026695500197
Epoch: 68, step: 385, loss: 0.3340052664279938, mean loss: 0.3395026137829812
Epoch: 68, step: 386, loss: 0.31770259141921997, mean loss: 0.33950239264032034
Epoch: 68, step: 387, loss: 0.3026721179485321, mean loss: 0.3395020190323401
Epoch: 68, step: 388, loss: 0.372531920671463, mean loss: 0.3395023540857646
Epoch: 68, step: 389, loss: 0.34763669967651367, mean loss: 0.33950243659926194
Epoch: 68, step: 390, loss: 0.31428423523902893, mean loss: 0.339502180792466
Epoch: 68, step: 391, loss: 0.3164677917957306, mean loss: 0.33950194714005794
Epoch: 68, step: 392, loss: 0.3258538246154785, mean loss: 0.33950180869990454
Epoch: 68, step: 393, loss: 0.3190672695636749, mean loss: 0.3395016014236266
Epoch: 68, step: 394, loss: 0.3043065071105957, mean loss: 0.33950124442834007
Epoch: 68, step: 395, loss: 0.35285648703575134, mean loss: 0.3395013798935347
Epoch: 68, step: 396, loss: 0.3163159191608429, mean loss: 0.3395011447206378
Epoch: 68, step: 397, loss: 0.3174125552177429, mean loss: 0.3395009206757093
Epoch: 68, step: 398, loss: 0.33150920271873474, mean loss: 0.33950083961640415
Epoch: 68, step: 399, loss: 0.3391435444355011, mean loss: 0.33950083599242675
Epoch: 68, step: 400, loss: 0.36274468898773193, mean loss: 0.3395010717480382
Epoch: 68, step: 401, loss: 0.3028343915939331, mean loss: 0.33950069985238374
Epoch: 68, step: 402, loss: 0.37354400753974915, mean loss: 0.3395010451367053
Epoch: 68, step: 403, loss: 0.30400270223617554, mean loss: 0.33950068509833764
Epoch: 68, step: 404, loss: 0.38210752606391907, mean loss: 0.3395011172295482
Epoch: 68, step: 405, loss: 0.3185671865940094, mean loss: 0.3395009049135718
Epoch: 68, step: 406, loss: 0.3245388865470886, mean loss: 0.3395007531674246
Epoch: 68, step: 407, loss: 0.3285423219203949, mean loss: 0.3395006420271483
Epoch: 68, step: 408, loss: 0.330663800239563, mean loss: 0.3395005524049154
Epoch: 68, step: 409, loss: 0.35147663950920105, mean loss: 0.33950067386378135
Epoch: 68, step: 410, loss: 0.40028125047683716, mean loss: 0.33950129028089454
Epoch: 68, step: 411, loss: 0.33549681305885315, mean loss: 0.3395012496691828
Epoch: 68, step: 412, loss: 0.3258717656135559, mean loss: 0.3395011114461307
Epoch: 68, step: 413, loss: 0.32796287536621094, mean loss: 0.3395009944326013
Epoch: 68, step: 414, loss: 0.3291124701499939, mean loss: 0.33950088907979387
Epoch: 68, step: 415, loss: 0.33547136187553406, mean loss: 0.33950084821569354
Epoch: 68, step: 416, loss: 0.3422177731990814, mean loss: 0.3395008757681987
Epoch: 68, step: 417, loss: 0.3403606414794922, mean loss: 0.33950088448704785
Epoch: 68, step: 418, loss: 0.3274590075016022, mean loss: 0.33950076237210136
Epoch: 68, step: 419, loss: 0.361686646938324, mean loss: 0.3395009873536915
Epoch: 68, step: 420, loss: 0.31366562843322754, mean loss: 0.3395007253663377
Epoch: 68, step: 421, loss: 0.3405657708644867, mean loss: 0.3395007361664827
Epoch: 68, step: 422, loss: 0.3124428987503052, mean loss: 0.33950046178796606
Epoch: 68, step: 423, loss: 0.3387472927570343, mean loss: 0.3395004541505742
Epoch: 68, step: 424, loss: 0.3183225989341736, mean loss: 0.33950023940205
Epoch: 68, step: 425, loss: 0.28917425870895386, mean loss: 0.33949972908972675
Epoch: 68, step: 426, loss: 0.3479306101799011, mean loss: 0.3394998145791465
Epoch: 68, step: 427, loss: 0.316559374332428, mean loss: 0.3394995819646642
Epoch: 68, step: 428, loss: 0.3227814733982086, mean loss: 0.33949941244591497
Epoch: 68, step: 429, loss: 0.31215617060661316, mean loss: 0.3394991351929507
Epoch: 68, step: 430, loss: 0.3423992991447449, mean loss: 0.3394991645995187
Epoch: 68, step: 431, loss: 0.3631024956703186, mean loss: 0.33949940392596123
Epoch: 68, step: 432, loss: 0.34415507316589355, mean loss: 0.33949945113173297
Epoch: 68, step: 433, loss: 0.33271676301956177, mean loss: 0.3394993823599272
Epoch: 68, step: 434, loss: 0.3365360498428345, mean loss: 0.33949935231407247
Epoch: 68, step: 435, loss: 0.3321506083011627, mean loss: 0.33949927780435907
Epoch: 68, step: 436, loss: 0.37024012207984924, mean loss: 0.33949958948595654
Epoch: 68, step: 437, loss: 0.35845521092414856, mean loss: 0.33949978167516304
Epoch: 68, step: 438, loss: 0.36945024132728577, mean loss: 0.3395000853368886
Epoch: 68, step: 439, loss: 0.30896613001823425, mean loss: 0.3394997757623558
Epoch: 68, step: 440, loss: 0.3051312565803528, mean loss: 0.3394994273138732
Epoch: 68, step: 441, loss: 0.31127017736434937, mean loss: 0.33949914111185414
Epoch: 68, step: 442, loss: 0.35138776898384094, mean loss: 0.3394992616433883
Epoch: 68, step: 443, loss: 0.35450297594070435, mean loss: 0.33949941375533826
Epoch: 68, step: 444, loss: 0.3902670741081238, mean loss: 0.33949992844719173
Epoch: 68, step: 445, loss: 0.3457372784614563, mean loss: 0.3394999916819493
Epoch: 68, step: 446, loss: 0.33019232749938965, mean loss: 0.3394998973210557
Epoch: 68, step: 447, loss: 0.32906800508499146, mean loss: 0.33949979156383514
Epoch: 68, step: 448, loss: 0.3350522220134735, mean loss: 0.3394997464753876
Epoch: 68, step: 449, loss: 0.35639140009880066, mean loss: 0.33949991771739024
Epoch: 68, step: 450, loss: 0.3629104793071747, mean loss: 0.33950015504352177
Epoch: 68, step: 451, loss: 0.35206830501556396, mean loss: 0.3395002824526898
Epoch: 68, step: 452, loss: 0.3806098997592926, mean loss: 0.3395006991957311
Epoch: 68, step: 453, loss: 0.3136352300643921, mean loss: 0.3395004369907848
Epoch: 68, step: 454, loss: 0.35102367401123047, mean loss: 0.33950055380363287
Epoch: 68, step: 455, loss: 0.32094696164131165, mean loss: 0.33950036572488657
Epoch: 68, step: 456, loss: 0.3729609251022339, mean loss: 0.33950070491291057
Epoch: 68, step: 457, loss: 0.3362473249435425, mean loss: 0.33950067193389416
Epoch: 68, step: 458, loss: 0.31990107893943787, mean loss: 0.339500473257824
Epoch: 68, step: 459, loss: 0.335039883852005, mean loss: 0.3395004280424264
Epoch: 68, step: 460, loss: 0.2962356209754944, mean loss: 0.3394999894870143
Epoch: 68, step: 461, loss: 0.32527992129325867, mean loss: 0.339499845346197
Epoch: 68, step: 462, loss: 0.3053032159805298, mean loss: 0.3394994987177507
Epoch: 68, step: 463, loss: 0.28646236658096313, mean loss: 0.33949896112113076
Epoch: 68, step: 464, loss: 0.3335575461387634, mean loss: 0.3394989008981868
Epoch: 68, step: 465, loss: 0.3825404644012451, mean loss: 0.3394993371685704
Epoch: 68, step: 466, loss: 0.355729341506958, mean loss: 0.33949950167464016
Epoch: 68, step: 467, loss: 0.30275896191596985, mean loss: 0.3394991292791429
Epoch: 68, step: 468, loss: 0.34253746271133423, mean loss: 0.3394991600748315
Epoch: 68, step: 469, loss: 0.3134446144104004, mean loss: 0.3394988959960001
Epoch: 68, step: 470, loss: 0.33904626965522766, mean loss: 0.33949889140840045
Epoch: 68, step: 471, loss: 0.3271941840648651, mean loss: 0.3394987666951581
Epoch: 68, step: 472, loss: 0.3656178414821625, mean loss: 0.3394990314199824
Epoch: 68, step: 473, loss: 0.32254403829574585, mean loss: 0.3394988595776748
Epoch: 68, step: 474, loss: 0.33157217502593994, mean loss: 0.3394987792399271
Epoch: 68, step: 475, loss: 0.32809942960739136, mean loss: 0.3394986637075394
Epoch: 68, step: 476, loss: 0.32098203897476196, mean loss: 0.3394984760434835
Epoch: 68, step: 477, loss: 0.33807137608528137, mean loss: 0.3394984615801212
Epoch: 68, step: 478, loss: 0.32345515489578247, mean loss: 0.3394982989861809
Epoch: 68, step: 479, loss: 0.3467313349246979, mean loss: 0.33949837229001517
Epoch: 68, step: 480, loss: 0.3101971745491028, mean loss: 0.3394980753374776
Epoch: 68, step: 481, loss: 0.3973660171031952, mean loss: 0.33949866179329946
Epoch: 68, step: 482, loss: 0.32858628034591675, mean loss: 0.33949855120417916
Epoch: 68, step: 483, loss: 0.2895069718360901, mean loss: 0.3394980445806905
Epoch: 68, step: 484, loss: 0.31938812136650085, mean loss: 0.3394978407852446
Epoch: 68, step: 485, loss: 0.37122929096221924, mean loss: 0.33949816235084357
Epoch: 68, step: 486, loss: 0.3388606309890747, mean loss: 0.33949815589018467
Epoch: 68, step: 487, loss: 0.35036948323249817, mean loss: 0.33949826605766886
Epoch: 68, step: 488, loss: 0.35638806223869324, mean loss: 0.33949843721317174
Epoch: 68, step: 489, loss: 0.3409298062324524, mean loss: 0.33949845171803605
Epoch: 68, step: 490, loss: 0.3456161618232727, mean loss: 0.33949851371159223
Epoch: 68, step: 491, loss: 0.31793415546417236, mean loss: 0.3394982951922958
Epoch: 68, step: 492, loss: 0.31011253595352173, mean loss: 0.33949799741898434
Epoch: 68, step: 493, loss: 0.3174925446510315, mean loss: 0.33949777443443974
Epoch: 68, step: 494, loss: 0.30514398217201233, mean loss: 0.33949742632585134
Epoch: 68, step: 495, loss: 0.3185800313949585, mean loss: 0.3394972143710551
Epoch: 68, step: 496, loss: 0.36066874861717224, mean loss: 0.3394974288988571
Epoch: 68, step: 497, loss: 0.29449039697647095, mean loss: 0.3394969728543549
Epoch: 68, step: 498, loss: 0.3186110258102417, mean loss: 0.3394967612246516
Epoch: 68, step: 499, loss: 0.3378337621688843, mean loss: 0.3394967443742579
Epoch: 68, step: 500, loss: 0.3458847403526306, mean loss: 0.3394968091001856
Epoch: 68, step: 501, loss: 0.2929845452308655, mean loss: 0.3394963378226624
Epoch: 68, step: 502, loss: 0.4107840359210968, mean loss: 0.339497060125698
Epoch: 68, step: 503, loss: 0.3000803291797638, mean loss: 0.33949666075053647
Epoch: 68, step: 504, loss: 0.3243233561515808, mean loss: 0.3394965070143074
Epoch: 68, step: 505, loss: 0.29445791244506836, mean loss: 0.3394960506869799
Epoch: 68, step: 506, loss: 0.31541505455970764, mean loss: 0.33949580670278423
Epoch: 68, step: 507, loss: 0.3326336741447449, mean loss: 0.33949573717763165
Epoch: 68, step: 508, loss: 0.32397153973579407, mean loss: 0.33949557989252366
Epoch: 68, step: 509, loss: 0.35532888770103455, mean loss: 0.33949574030779195
Epoch: 68, step: 510, loss: 0.3222159743309021, mean loss: 0.33949556523949637
Epoch: 68, step: 511, loss: 0.3412463665008545, mean loss: 0.33949558297739213
Epoch: 68, step: 512, loss: 0.440159410238266, mean loss: 0.339496602822661
Epoch: 68, step: 513, loss: 0.34303268790245056, mean loss: 0.33949663864707974
Epoch: 68, step: 514, loss: 0.3575558066368103, mean loss: 0.33949682160439776
Epoch: 68, step: 515, loss: 0.3069673180580139, mean loss: 0.33949649205153937
Epoch: 68, step: 516, loss: 0.3333664834499359, mean loss: 0.33949642994971885
Epoch: 68, step: 517, loss: 0.3315666913986206, mean loss: 0.33949634961602876
Epoch: 68, step: 518, loss: 0.32540273666381836, mean loss: 0.33949620683950993
Epoch: 68, step: 519, loss: 0.3578585386276245, mean loss: 0.3394963928587557
Epoch: 68, step: 520, loss: 0.3407853841781616, mean loss: 0.339496405916725
Epoch: 68, step: 521, loss: 0.3274518549442291, mean loss: 0.3394962839021073
Epoch: 68, step: 522, loss: 0.3254658877849579, mean loss: 0.3394961417717713
Epoch: 68, step: 523, loss: 0.3433244526386261, mean loss: 0.3394961805528287
Epoch: 68, step: 524, loss: 0.3754143714904785, mean loss: 0.339496544402935
Epoch: 68, step: 525, loss: 0.33464011549949646, mean loss: 0.33949649520796643
Epoch: 68, step: 526, loss: 0.342781126499176, mean loss: 0.3394965284805005
Epoch: 68, step: 527, loss: 0.32208508253097534, mean loss: 0.3394963521084791
Epoch: 68, step: 528, loss: 0.3654961585998535, mean loss: 0.3394966154750019
Epoch: 68, step: 529, loss: 0.3085057735443115, mean loss: 0.33949630155468086
Epoch: 68, step: 530, loss: 0.3135603368282318, mean loss: 0.33949603884016927
Epoch: 68, step: 531, loss: 0.3476627767086029, mean loss: 0.33949612156309245
Epoch: 68, step: 532, loss: 0.3189598619937897, mean loss: 0.33949591354830827
Epoch: 68, step: 533, loss: 0.33560681343078613, mean loss: 0.33949587415544197
Epoch: 68, step: 534, loss: 0.3294844329357147, mean loss: 0.33949577275014026
Epoch: 68, step: 535, loss: 0.344730406999588, mean loss: 0.3394958257709069
Epoch: 68, step: 536, loss: 0.34293222427368164, mean loss: 0.339495860577281
Epoch: 68, step: 537, loss: 0.32079771161079407, mean loss: 0.3394956711905802
Epoch: 68, step: 538, loss: 0.33628302812576294, mean loss: 0.3394956386512252
Epoch: 68, step: 539, loss: 0.31638142466545105, mean loss: 0.3394954045405621
Epoch: 68, step: 540, loss: 0.3458293080329895, mean loss: 0.3394954686924008
Epoch: 68, step: 541, loss: 0.3170261085033417, mean loss: 0.33949524111770324
Epoch: 68, step: 542, loss: 0.33324307203292847, mean loss: 0.33949517779497995
Epoch: 68, step: 543, loss: 0.3077180087566376, mean loss: 0.3394948559552352
Epoch: 68, step: 544, loss: 0.3139013648033142, mean loss: 0.3394945967465176
Epoch: 68, step: 545, loss: 0.33411329984664917, mean loss: 0.33949454224574893
Epoch: 68, step: 546, loss: 0.2862021028995514, mean loss: 0.3394940025153552
Epoch: 68, step: 547, loss: 0.32253310084342957, mean loss: 0.33949383074199413
Epoch: 68, step: 548, loss: 0.3338286876678467, mean loss: 0.33949377336822767
Epoch: 68, step: 549, loss: 0.36462703347206116, mean loss: 0.3394940279028746
Epoch: 68, step: 550, loss: 0.35801830887794495, mean loss: 0.3394942155038283
Epoch: 68, step: 551, loss: 0.3315710127353668, mean loss: 0.33949413526398825
Epoch: 68, step: 552, loss: 0.304166316986084, mean loss: 0.3394937774958149
Epoch: 68, step: 553, loss: 0.2979244589805603, mean loss: 0.33949335652363866
Epoch: 68, step: 554, loss: 0.3838713765144348, mean loss: 0.3394938059349625
Epoch: 68, step: 555, loss: 0.3558502793312073, mean loss: 0.3394939715734908
Epoch: 68, step: 556, loss: 0.37257876992225647, mean loss: 0.33949430661281627
Epoch: 68, step: 557, loss: 0.3088742792606354, mean loss: 0.3394939965365899
Epoch: 68, step: 558, loss: 0.3433719277381897, mean loss: 0.3394940358063816
Epoch: 68, step: 559, loss: 0.32531094551086426, mean loss: 0.3394938921830596
Epoch: 68, step: 560, loss: 0.3188003897666931, mean loss: 0.33949368263497076
Epoch: 68, step: 561, loss: 0.33883628249168396, mean loss: 0.33949367597802377
Epoch: 68, step: 562, loss: 0.38083329796791077, mean loss: 0.3394940945859119
Epoch: 68, step: 563, loss: 0.3143516182899475, mean loss: 0.3394938399940259
Epoch: 68, step: 564, loss: 0.30158933997154236, mean loss: 0.3394934561781949
Epoch: 68, step: 565, loss: 0.361747145652771, mean loss: 0.3394936815137573
Epoch: 68, step: 566, loss: 0.34594470262527466, mean loss: 0.3394937468346001
Epoch: 68, step: 567, loss: 0.3533346951007843, mean loss: 0.3394938869819094
Epoch: 68, step: 568, loss: 0.36106598377227783, mean loss: 0.33949410540919134
Epoch: 68, step: 569, loss: 0.3219672441482544, mean loss: 0.33949392794355415
Epoch: 68, step: 570, loss: 0.30902808904647827, mean loss: 0.33949361946933915
Epoch: 68, step: 571, loss: 0.3353162407875061, mean loss: 0.3394935771727667
Epoch: 68, step: 572, loss: 0.35140836238861084, mean loss: 0.33949369781049477
Epoch: 68, step: 573, loss: 0.31519007682800293, mean loss: 0.33949345173774725
Epoch: 68, step: 574, loss: 0.3119414150714874, mean loss: 0.3394931727778045
Epoch: 68, step: 575, loss: 0.3313480019569397, mean loss: 0.3394930903100941
Epoch: 68, step: 576, loss: 0.3644045293331146, mean loss: 0.3394933425293028
Epoch: 68, step: 577, loss: 0.3372860252857208, mean loss: 0.3394933201812493
Epoch: 68, step: 578, loss: 0.33156776428222656, mean loss: 0.3394932399395194
Epoch: 68, step: 579, loss: 0.3621366322040558, mean loss: 0.339493469188621
Epoch: 68, step: 580, loss: 0.2979297339916229, mean loss: 0.33949304838804595
Epoch: 68, step: 581, loss: 0.3227345943450928, mean loss: 0.33949287872341716
Epoch: 68, step: 582, loss: 0.34823355078697205, mean loss: 0.3394929672141493
Epoch: 68, step: 583, loss: 0.3097171187400818, mean loss: 0.33949266576593845
Epoch: 68, step: 584, loss: 0.33646371960639954, mean loss: 0.33949263510145017
Epoch: 68, step: 585, loss: 0.32849642634391785, mean loss: 0.3394925237790023
Epoch: 68, step: 586, loss: 0.39511868357658386, mean loss: 0.33949308691650926
Epoch: 68, step: 587, loss: 0.31970930099487305, mean loss: 0.3394928866352183
Epoch: 68, step: 588, loss: 0.28429219126701355, mean loss: 0.33949232781626154
Epoch: 68, step: 589, loss: 0.32980087399482727, mean loss: 0.33949222970674947
Epoch: 68, step: 590, loss: 0.3035220801830292, mean loss: 0.3394918655737557
Epoch: 68, step: 591, loss: 0.336924284696579, mean loss: 0.3394918395818858
Epoch: 68, step: 592, loss: 0.31256669759750366, mean loss: 0.33949156701882477
Epoch: 68, step: 593, loss: 0.37156081199645996, mean loss: 0.33949189165232524
Epoch: 68, step: 594, loss: 0.3270559310913086, mean loss: 0.33949176576571505
Epoch: 68, step: 595, loss: 0.2824433445930481, mean loss: 0.3394911882824056
Epoch: 68, step: 596, loss: 0.3358883559703827, mean loss: 0.3394911518124311
Epoch: 68, step: 597, loss: 0.31321701407432556, mean loss: 0.33949088585294396
Epoch: 68, step: 598, loss: 0.3163551986217499, mean loss: 0.3394906516647362
Epoch: 68, step: 599, loss: 0.35605114698410034, mean loss: 0.33949081929465885
Epoch: 68, step: 600, loss: 0.36101293563842773, mean loss: 0.3394910371452793
Epoch: 68, step: 601, loss: 0.3749984800815582, mean loss: 0.33949139655418
Epoch: 68, step: 602, loss: 0.32544076442718506, mean loss: 0.3394912543341068
Epoch: 68, step: 603, loss: 0.3110664486885071, mean loss: 0.33949096662199657
Epoch: 68, step: 604, loss: 0.38432735204696655, mean loss: 0.3394914204453457
Epoch: 68, step: 605, loss: 0.3327285349369049, mean loss: 0.33949135199370184
Epoch: 68, step: 606, loss: 0.29990309476852417, mean loss: 0.3394909512987836
Epoch: 68, step: 607, loss: 0.3288271129131317, mean loss: 0.3394908433651967
Epoch: 68, step: 608, loss: 0.3511817455291748, mean loss: 0.33949096169296833
Epoch: 68, step: 609, loss: 0.3351985216140747, mean loss: 0.339490918248098
Epoch: 68, step: 610, loss: 0.38452979922294617, mean loss: 0.33949137409337576
Epoch: 68, step: 611, loss: 0.3420678973197937, mean loss: 0.33949140017049034
Epoch: 68, step: 612, loss: 0.32559138536453247, mean loss: 0.3394912594892009
Epoch: 68, step: 613, loss: 0.2920922338962555, mean loss: 0.339490779771111
Epoch: 68, step: 614, loss: 0.33621543645858765, mean loss: 0.33949074662221146
Epoch: 68, step: 615, loss: 0.32892608642578125, mean loss: 0.33949063970111
Epoch: 68, step: 616, loss: 0.3604290783405304, mean loss: 0.3394908516093232
Epoch: 68, step: 617, loss: 0.2882022261619568, mean loss: 0.33949033254621774
Epoch: 68, step: 618, loss: 0.30147141218185425, mean loss: 0.33948994778216957
Epoch: 68, step: 619, loss: 0.3469979166984558, mean loss: 0.33949002376452914
Epoch: 68, step: 620, loss: 0.28742825984954834, mean loss: 0.339489496892924
Epoch: 68, step: 621, loss: 0.31470805406570435, mean loss: 0.3394892461041408
Epoch: 68, step: 622, loss: 0.33199697732925415, mean loss: 0.33948917028297215
Epoch: 68, step: 623, loss: 0.35979539155960083, mean loss: 0.339489375778249
Epoch: 68, step: 624, loss: 0.37442347407341003, mean loss: 0.33948972930141097
Epoch: 68, step: 625, loss: 0.3414907455444336, mean loss: 0.33948974955092265
Epoch: 68, step: 626, loss: 0.3376266062259674, mean loss: 0.3394897306968225
Epoch: 68, step: 627, loss: 0.43478015065193176, mean loss: 0.3394906949795583
Epoch: 68, step: 628, loss: 0.35307812690734863, mean loss: 0.3394908324749482
Epoch: 68, step: 629, loss: 0.29618459939956665, mean loss: 0.33949039425033145
Epoch: 68, step: 630, loss: 0.3444419801235199, mean loss: 0.3394904443559331
Epoch: 68, step: 631, loss: 0.34387385845184326, mean loss: 0.33949048871169785
Epoch: 68, step: 632, loss: 0.3629746437072754, mean loss: 0.3394907263454443
Epoch: 68, step: 633, loss: 0.32481881976127625, mean loss: 0.33949057788343445
Epoch: 68, step: 634, loss: 0.33521899580955505, mean loss: 0.33949053466060997
Epoch: 68, step: 635, loss: 0.34548938274383545, mean loss: 0.3394905953604934
Epoch: 68, step: 636, loss: 0.349445641040802, mean loss: 0.3394906960904986
Epoch: 68, step: 637, loss: 0.37053951621055603, mean loss: 0.33949101025441764
Epoch: 68, step: 638, loss: 0.356212854385376, mean loss: 0.33949117945076424
Epoch: 68, step: 639, loss: 0.2914278507232666, mean loss: 0.3394906931373361
Epoch: 68, step: 640, loss: 0.33325543999671936, mean loss: 0.3394906300485587
Epoch: 68, step: 641, loss: 0.31218332052230835, mean loss: 0.3394903537538673
Epoch: 68, step: 642, loss: 0.3279646933078766, mean loss: 0.33949023713869614
Epoch: 68, step: 643, loss: 0.330131471157074, mean loss: 0.33949014244884645
Epoch: 68, step: 644, loss: 0.305457204580307, mean loss: 0.3394897981148636
Epoch: 68, step: 645, loss: 0.3572775721549988, mean loss: 0.3394899780838435
Epoch: 68, step: 646, loss: 0.3387652337551117, mean loss: 0.339489970751269
Epoch: 68, step: 647, loss: 0.3408811688423157, mean loss: 0.3394899848265229
Epoch: 68, step: 648, loss: 0.30319759249687195, mean loss: 0.33948961764698876
Epoch: 68, step: 649, loss: 0.3460078537464142, mean loss: 0.33948968359300463
Epoch: 68, step: 650, loss: 0.31402096152305603, mean loss: 0.33948942592456005
Epoch: 68, step: 651, loss: 0.30402976274490356, mean loss: 0.339489067180851
Epoch: 68, step: 652, loss: 0.3114686906337738, mean loss: 0.33948878370291535
Epoch: 68, step: 653, loss: 0.35039156675338745, mean loss: 0.3394888940036159
Epoch: 68, step: 654, loss: 0.35725244879722595, mean loss: 0.3394890737111922
Epoch: 68, step: 655, loss: 0.32468900084495544, mean loss: 0.33948892398562497
Epoch: 68, step: 656, loss: 0.32455992698669434, mean loss: 0.33948877295731916
Epoch: 68, step: 657, loss: 0.3003953993320465, mean loss: 0.3394883774755425
Epoch: 68, step: 658, loss: 0.33092719316482544, mean loss: 0.33948829086858545
Epoch: 68, step: 659, loss: 0.3404217064380646, mean loss: 0.3394883003111417
Epoch: 68, step: 660, loss: 0.3018527925014496, mean loss: 0.33948791958918273
Epoch: 68, step: 661, loss: 0.34876328706741333, mean loss: 0.33948801341813734
Epoch: 68, step: 662, loss: 0.30513834953308105, mean loss: 0.3394876659429071
Epoch: 68, step: 663, loss: 0.3318053185939789, mean loss: 0.33948758823040254
Epoch: 68, step: 664, loss: 0.3217082619667053, mean loss: 0.33948740838146657
Epoch: 68, step: 665, loss: 0.31946253776550293, mean loss: 0.33948720581950276
Epoch: 68, step: 666, loss: 0.3423892855644226, mean loss: 0.33948723517524926
Epoch: 68, step: 667, loss: 0.35615378618240356, mean loss: 0.33948740376265574
Epoch: 68, step: 668, loss: 0.3419108986854553, mean loss: 0.3394874282768213
Epoch: 68, step: 669, loss: 0.33786529302597046, mean loss: 0.3394874118687449
Epoch: 68, step: 670, loss: 0.3120824992656708, mean loss: 0.33948713466784464
Epoch: 68, step: 671, loss: 0.3306354880332947, mean loss: 0.33948704513427697
Epoch: 68, step: 672, loss: 0.364868700504303, mean loss: 0.3394873018647212
Epoch: 68, step: 673, loss: 0.3335053026676178, mean loss: 0.3394872413585897
Epoch: 68, step: 674, loss: 0.3180480897426605, mean loss: 0.3394870245101811
Epoch: 68, step: 675, loss: 0.2979169189929962, mean loss: 0.33948660404951114
Epoch: 68, step: 676, loss: 0.32197660207748413, mean loss: 0.33948642694645587
Epoch: 68, step: 677, loss: 0.34980469942092896, mean loss: 0.3394865313084714
Epoch: 68, step: 678, loss: 0.32536882162094116, mean loss: 0.3394863885192846
Epoch: 68, step: 679, loss: 0.3004419505596161, mean loss: 0.33948599362044607
Epoch: 68, step: 680, loss: 0.3830191493034363, mean loss: 0.33948643391411254
Epoch: 68, step: 681, loss: 0.3212135136127472, mean loss: 0.33948624910394704
Epoch: 68, step: 682, loss: 0.32669705152511597, mean loss: 0.33948611975681603
Epoch: 68, step: 683, loss: 0.34278592467308044, mean loss: 0.33948615312997954
Epoch: 68, step: 684, loss: 0.3358525037765503, mean loss: 0.3394861163807926
Epoch: 68, step: 685, loss: 0.3556179106235504, mean loss: 0.33948627952926086
Epoch: 68, step: 686, loss: 0.36825376749038696, mean loss: 0.3394865704655361
Epoch: 68, step: 687, loss: 0.3191757798194885, mean loss: 0.33948636505705465
Epoch: 68, step: 688, loss: 0.328670471906662, mean loss: 0.3394862556741282
Epoch: 68, step: 689, loss: 0.34004732966423035, mean loss: 0.3394862613483054
Epoch: 68, step: 690, loss: 0.33279240131378174, mean loss: 0.3394861936535547
Epoch: 68, step: 691, loss: 0.3360665738582611, mean loss: 0.3394861590714201
Epoch: 68, step: 692, loss: 0.3476129174232483, mean loss: 0.3394862412553545
Epoch: 68, step: 693, loss: 0.3445035517215729, mean loss: 0.33948629199368413
Epoch: 68, step: 694, loss: 0.3625658452510834, mean loss: 0.339486525386883
Epoch: 68, step: 695, loss: 0.32541805505752563, mean loss: 0.33948638312017393
Epoch: 68, step: 696, loss: 0.33520862460136414, mean loss: 0.33948633986199034
Epoch: 68, step: 697, loss: 0.3453141748905182, mean loss: 0.3394863987944914
Epoch: 68, step: 698, loss: 0.3414325714111328, mean loss: 0.3394864184744685
Epoch: 68, step: 699, loss: 0.3292301595211029, mean loss: 0.33948631476275315
Epoch: 68, step: 700, loss: 0.35325753688812256, mean loss: 0.3394864540165135
Epoch: 68, step: 701, loss: 0.360072523355484, mean loss: 0.3394866621794894
Epoch: 68, step: 702, loss: 0.3461263179779053, mean loss: 0.3394867293179271
Epoch: 68, step: 703, loss: 0.33009999990463257, mean loss: 0.33948663440276966
Epoch: 68, step: 704, loss: 0.35826027393341064, mean loss: 0.3394868242329923
Epoch: 68, step: 705, loss: 0.36279723048210144, mean loss: 0.33948705993448525
Epoch: 68, step: 706, loss: 0.28974854946136475, mean loss: 0.3394865570122062
Epoch: 68, step: 707, loss: 0.32425984740257263, mean loss: 0.3394864030515428
Epoch: 68, step: 708, loss: 0.3296080529689789, mean loss: 0.33948630317034767
Epoch: 68, step: 709, loss: 0.32723724842071533, mean loss: 0.33948617931992253
Epoch: 68, step: 710, loss: 0.30722764134407043, mean loss: 0.33948585315653035
Epoch: 68, step: 711, loss: 0.34133636951446533, mean loss: 0.33948587186675805
Epoch: 68, step: 712, loss: 0.35918277502059937, mean loss: 0.33948607101647904
Epoch: 68, step: 713, loss: 0.3177716135978699, mean loss: 0.3394858514700671
Epoch: 68, step: 714, loss: 0.29585710167884827, mean loss: 0.3394854103612498
Epoch: 68, step: 715, loss: 0.36861762404441833, mean loss: 0.339485704899747
Epoch: 68, step: 716, loss: 0.31677597761154175, mean loss: 0.3394854752975138
Epoch: 68, step: 717, loss: 0.3167486786842346, mean loss: 0.33948524542392555
Epoch: 68, step: 718, loss: 0.33105888962745667, mean loss: 0.3394851602326344
Epoch: 68, step: 719, loss: 0.35063523054122925, mean loss: 0.3394852729598092
Epoch: 68, step: 720, loss: 0.3141772150993347, mean loss: 0.3394850170980129
Epoch: 68, step: 721, loss: 0.3608369827270508, mean loss: 0.33948523296195154
Epoch: 68, step: 722, loss: 0.3463233411312103, mean loss: 0.3394853020931063
Epoch: 68, step: 723, loss: 0.33568868041038513, mean loss: 0.33948526371082555
Epoch: 68, step: 724, loss: 0.3081703186035156, mean loss: 0.33948494713283484
Epoch: 68, step: 725, loss: 0.35236048698425293, mean loss: 0.3394850772966053
Epoch: 68, step: 726, loss: 0.33362069725990295, mean loss: 0.3394850180119377
Epoch: 68, step: 727, loss: 0.35933154821395874, mean loss: 0.3394852186440667
Epoch: 68, step: 728, loss: 0.32490280270576477, mean loss: 0.33948507122930205
Epoch: 68, step: 729, loss: 0.2969134449958801, mean loss: 0.3394846408738075
Epoch: 68, step: 730, loss: 0.32235655188560486, mean loss: 0.33948446772813873
Epoch: 68, step: 731, loss: 0.3092254102230072, mean loss: 0.33948416184627483
Epoch: 68, step: 732, loss: 0.36587512493133545, mean loss: 0.3394844286237637
Epoch: 68, step: 733, loss: 0.3803066611289978, mean loss: 0.3394848412779952
Epoch: 68, step: 734, loss: 0.3035964071750641, mean loss: 0.3394844785010577
Epoch: 68, step: 735, loss: 0.31580254435539246, mean loss: 0.3394842391155031
Epoch: 68, step: 736, loss: 0.3075372874736786, mean loss: 0.33948391618742696
Epoch: 68, step: 737, loss: 0.31292757391929626, mean loss: 0.33948364775174245
Epoch: 68, step: 738, loss: 0.3121687173843384, mean loss: 0.339483371650921
Epoch: 68, step: 739, loss: 0.38182562589645386, mean loss: 0.3394837996444342
Epoch: 68, step: 740, loss: 0.32205161452293396, mean loss: 0.33948362344250843
Epoch: 68, step: 741, loss: 0.3452471196651459, mean loss: 0.3394836816984793
Epoch: 68, step: 742, loss: 0.36186468601226807, mean loss: 0.3394839079177578
Epoch: 68, step: 743, loss: 0.3712323307991028, mean loss: 0.3394842288163476
Epoch: 68, step: 744, loss: 0.3218720555305481, mean loss: 0.3394840508023257
Epoch: 68, step: 745, loss: 0.32606327533721924, mean loss: 0.3394839151539857
Epoch: 68, step: 746, loss: 0.3216562271118164, mean loss: 0.3394837349653033
Epoch: 68, step: 747, loss: 0.33016759157180786, mean loss: 0.3394836408057784
Epoch: 68, step: 748, loss: 0.3733178675174713, mean loss: 0.3394839827694407
Epoch: 68, step: 749, loss: 0.3372268080711365, mean loss: 0.339483959956331
Epoch: 68, step: 750, loss: 0.31403040885925293, mean loss: 0.3394837027016379
Epoch: 68, step: 751, loss: 0.3500913083553314, mean loss: 0.33948380990981275
Epoch: 68, step: 752, loss: 0.29697006940841675, mean loss: 0.33948338023938474
Epoch: 68, step: 753, loss: 0.3543095588684082, mean loss: 0.33948353008049637
Epoch: 68, step: 754, loss: 0.2910657823085785, mean loss: 0.33948304075037244
Epoch: 68, step: 755, loss: 0.34308934211730957, mean loss: 0.33948307719680254
Epoch: 68, step: 756, loss: 0.2950863242149353, mean loss: 0.3394826285136124
Epoch: 68, step: 757, loss: 0.3471047878265381, mean loss: 0.3394827055440248
Epoch: 68, step: 758, loss: 0.33561116456985474, mean loss: 0.33948266641818503
Epoch: 68, step: 759, loss: 0.3671390116214752, mean loss: 0.3394829459107188
Epoch: 68, step: 760, loss: 0.3455056846141815, mean loss: 0.33948300677535864
Epoch: 68, step: 761, loss: 0.31055787205696106, mean loss: 0.3394827144664604
Epoch: 68, step: 762, loss: 0.37546685338020325, mean loss: 0.3394830781079026
Epoch: 68, step: 763, loss: 0.3266349136829376, mean loss: 0.3394829482707586
Epoch: 68, step: 764, loss: 0.30182045698165894, mean loss: 0.3394825676762449
Epoch: 68, step: 765, loss: 0.300776869058609, mean loss: 0.33948217654365714
Epoch: 68, step: 766, loss: 0.3425789475440979, mean loss: 0.33948220783713223
Epoch: 68, step: 767, loss: 0.34918949007987976, mean loss: 0.33948230593012174
Epoch: 68, step: 768, loss: 0.37158697843551636, mean loss: 0.33948263034754383
Epoch: 68, step: 769, loss: 0.3018541634082794, mean loss: 0.33948225011607175
Epoch: 68, step: 770, loss: 0.34549564123153687, mean loss: 0.33948231088010594
Epoch: 68, step: 771, loss: 0.35863158106803894, mean loss: 0.3394825043774402
Epoch: 68, step: 772, loss: 0.3810632824897766, mean loss: 0.33948292453384005
Epoch: 68, step: 773, loss: 0.37569132447242737, mean loss: 0.33948329040090486
Epoch: 68, step: 774, loss: 0.3751237392425537, mean loss: 0.33948365052548013
Epoch: 68, step: 775, loss: 0.36101219058036804, mean loss: 0.3394838680557935
Epoch: 68, step: 776, loss: 0.3089848458766937, mean loss: 0.33948355988836554
Epoch: 68, step: 777, loss: 0.3141966760158539, mean loss: 0.3394833043878717
Epoch: 68, step: 778, loss: 0.3424552381038666, mean loss: 0.3394833344162004
Epoch: 68, step: 779, loss: 0.3243362009525299, mean loss: 0.3394831813715669
Epoch: 68, step: 780, loss: 0.32366862893104553, mean loss: 0.3394830215850348
Epoch: 68, step: 781, loss: 0.3239020109176636, mean loss: 0.33948286415974466
Epoch: 68, step: 782, loss: 0.34485432505607605, mean loss: 0.3394829184306302
Epoch: 68, step: 783, loss: 0.3107609748840332, mean loss: 0.339482628239639
Epoch: 68, step: 784, loss: 0.33830156922340393, mean loss: 0.3394826163069777
Epoch: 68, step: 785, loss: 0.31929299235343933, mean loss: 0.3394824123260531
Epoch: 68, step: 786, loss: 0.3579005002975464, mean loss: 0.3394825984068174
Epoch: 68, step: 787, loss: 0.336710661649704, mean loss: 0.33948257040179863
Epoch: 68, step: 788, loss: 0.3423222005367279, mean loss: 0.3394825990904372
Epoch: 68, step: 789, loss: 0.3755551874637604, mean loss: 0.3394829635262778
Epoch: 68, step: 790, loss: 0.3333112895488739, mean loss: 0.33948290117542995
Epoch: 68, step: 791, loss: 0.3511809706687927, mean loss: 0.3394830193568481
Epoch: 68, step: 792, loss: 0.3729146718978882, mean loss: 0.33948335710148153
Epoch: 68, step: 793, loss: 0.3465142548084259, mean loss: 0.3394834281306948
Epoch: 68, step: 794, loss: 0.3208768665790558, mean loss: 0.3394832401609457
Epoch: 68, step: 795, loss: 0.29319533705711365, mean loss: 0.3394827725496888
Epoch: 68, step: 796, loss: 0.35137274861335754, mean loss: 0.3394828926638031
Epoch: 68, step: 797, loss: 0.3516935706138611, mean loss: 0.33948301601644426
Epoch: 68, step: 798, loss: 0.34845003485679626, mean loss: 0.3394831066006271
Epoch: 68, step: 799, loss: 0.33379241824150085, mean loss: 0.3394830491142811
Epoch: 68, step: 800, loss: 0.35075047612190247, mean loss: 0.339483162934723
Epoch: 68, step: 801, loss: 0.34249183535575867, mean loss: 0.3394831933271955
Epoch: 68, step: 802, loss: 0.3119344711303711, mean loss: 0.3394829150432196
Epoch: 68, step: 803, loss: 0.3492897152900696, mean loss: 0.3394830141058105
Epoch: 68, step: 804, loss: 0.31848961114883423, mean loss: 0.3394828020448091
Epoch: 68, step: 805, loss: 0.29569700360298157, mean loss: 0.33948235975508156
Epoch: 68, step: 806, loss: 0.28413793444633484, mean loss: 0.33948180071483564
Epoch: 68, step: 807, loss: 0.33308976888656616, mean loss: 0.33948173614885757
Epoch: 68, step: 808, loss: 0.3219646215438843, mean loss: 0.33948155921009326
Epoch: 68, step: 809, loss: 0.34030190110206604, mean loss: 0.3394815674962076
Epoch: 68, step: 810, loss: 0.35658079385757446, mean loss: 0.33948174021043204
Epoch: 68, step: 811, loss: 0.34310969710350037, mean loss: 0.33948177685498065
Epoch: 68, step: 812, loss: 0.3448258340358734, mean loss: 0.33948183083263006
Epoch: 68, step: 813, loss: 0.3398973047733307, mean loss: 0.3394818350290822
Epoch: 68, step: 814, loss: 0.33267873525619507, mean loss: 0.33948176631576116
Epoch: 68, step: 815, loss: 0.378949373960495, mean loss: 0.33948216494625205
Epoch: 68, step: 816, loss: 0.36190909147262573, mean loss: 0.33948239146027126
Epoch: 68, step: 817, loss: 0.3255678713321686, mean loss: 0.3394822509237585
Epoch: 68, step: 818, loss: 0.30312788486480713, mean loss: 0.33948188374873695
Epoch: 68, step: 819, loss: 0.30569714307785034, mean loss: 0.33948154253009
Epoch: 68, step: 820, loss: 0.349586546421051, mean loss: 0.3394816445874349
Epoch: 68, step: 821, loss: 0.34428468346595764, mean loss: 0.3394816930961193
Epoch: 68, step: 822, loss: 0.38293328881263733, mean loss: 0.33948213193463583
Epoch: 68, step: 823, loss: 0.297323614358902, mean loss: 0.339481706159836
Epoch: 68, step: 824, loss: 0.3067775368690491, mean loss: 0.33948137587140786
Epoch: 68, step: 825, loss: 0.3312093913555145, mean loss: 0.33948129233119784
Epoch: 68, step: 826, loss: 0.3565346300601959, mean loss: 0.3394814645540816
Epoch: 68, step: 827, loss: 0.38267266750335693, mean loss: 0.33948190074074036
Epoch: 68, step: 828, loss: 0.31344664096832275, mean loss: 0.33948163781409074
Epoch: 68, step: 829, loss: 0.32744014263153076, mean loss: 0.33948151620984945
Epoch: 68, step: 830, loss: 0.30815622210502625, mean loss: 0.33948119986623126
Epoch: 68, step: 831, loss: 0.3066194951534271, mean loss: 0.33948086801026994
Epoch: 68, step: 832, loss: 0.3478134870529175, mean loss: 0.3394809521568899
Epoch: 68, step: 833, loss: 0.34339115023612976, mean loss: 0.33948099164346995
Epoch: 68, step: 834, loss: 0.3668121099472046, mean loss: 0.3394812676401002
Epoch: 68, step: 835, loss: 0.3385688364505768, mean loss: 0.3394812584262295
Epoch: 68, step: 836, loss: 0.3087421953678131, mean loss: 0.3394809480215697
Epoch: 68, step: 837, loss: 0.3306241035461426, mean loss: 0.339480858585596
Epoch: 68, step: 838, loss: 0.34095296263694763, mean loss: 0.3394808734506792
Epoch: 68, step: 839, loss: 0.33693215250968933, mean loss: 0.339480847714342
Epoch: 68, step: 840, loss: 0.3986629843711853, mean loss: 0.33948144531450214
Epoch: 68, step: 841, loss: 0.3166097104549408, mean loss: 0.3394812143661929
Epoch: 68, step: 842, loss: 0.3370603621006012, mean loss: 0.33948118992178167
Epoch: 68, step: 843, loss: 0.3427863121032715, mean loss: 0.3394812232947186
Epoch: 68, step: 844, loss: 0.3649005591869354, mean loss: 0.33948147995976186
Epoch: 68, step: 845, loss: 0.35070255398750305, mean loss: 0.3394815932604548
Epoch: 68, step: 846, loss: 0.3315252363681793, mean loss: 0.33948151292486084
Epoch: 68, step: 847, loss: 0.3056987524032593, mean loss: 0.3394811718226746
Epoch: 68, step: 848, loss: 0.36843371391296387, mean loss: 0.33948146415152924
Epoch: 68, step: 849, loss: 0.33818161487579346, mean loss: 0.3394814510273064
Epoch: 68, step: 850, loss: 0.31925168633461, mean loss: 0.3394812467749646
Epoch: 68, step: 851, loss: 0.374199241399765, mean loss: 0.3394815973059874
Epoch: 68, step: 852, loss: 0.3908829987049103, mean loss: 0.33948211627616665
Epoch: 68, step: 853, loss: 0.31213387846946716, mean loss: 0.3394818401596369
Epoch: 68, step: 854, loss: 0.308649480342865, mean loss: 0.33948152886944316
Epoch: 68, step: 855, loss: 0.3401825428009033, mean loss: 0.33948153594696046
Epoch: 68, step: 856, loss: 0.31504589319229126, mean loss: 0.33948128924439147
Epoch: 68, step: 857, loss: 0.3710392117500305, mean loss: 0.33948160785037335
Epoch: 68, step: 858, loss: 0.34323596954345703, mean loss: 0.3394816457536928
Epoch: 68, step: 859, loss: 0.3494373559951782, mean loss: 0.33948174626362937
Epoch: 68, step: 860, loss: 0.31898191571235657, mean loss: 0.3394815393054297
Epoch: 68, step: 861, loss: 0.33841970562934875, mean loss: 0.33948152858568414
Epoch: 68, step: 862, loss: 0.31636276841163635, mean loss: 0.33948129519251696
Epoch: 68, step: 863, loss: 0.3149062395095825, mean loss: 0.33948104709996646
Epoch: 68, step: 864, loss: 0.30922722816467285, mean loss: 0.3394807416816827
Epoch: 68, step: 865, loss: 0.32334285974502563, mean loss: 0.33948057876821847
Epoch: 68, step: 866, loss: 0.32782694697380066, mean loss: 0.3394804611248767
Epoch: 68, step: 867, loss: 0.3573264181613922, mean loss: 0.3394806412778853
Epoch: 68, step: 868, loss: 0.34296050667762756, mean loss: 0.339480676406396
Epoch: 68, step: 869, loss: 0.35314953327178955, mean loss: 0.33948081438924377
Epoch: 68, step: 870, loss: 0.34502893686294556, mean loss: 0.3394808703952447
Epoch: 68, step: 871, loss: 0.3084897994995117, mean loss: 0.33948055755636386
Epoch: 68, step: 872, loss: 0.321859210729599, mean loss: 0.33948037967974926
Epoch: 68, step: 873, loss: 0.3361230790615082, mean loss: 0.3394803457902148
Epoch: 68, step: 874, loss: 0.37788212299346924, mean loss: 0.33948073342461577
Epoch: 68, step: 875, loss: 0.36905860900878906, mean loss: 0.33948103198596336
Epoch: 68, step: 876, loss: 0.3287809491157532, mean loss: 0.3394809239795954
Epoch: 68, step: 877, loss: 0.3264409303665161, mean loss: 0.33948079235555567
Epoch: 68, step: 878, loss: 0.30426764488220215, mean loss: 0.33948043692210417
Epoch: 68, step: 879, loss: 0.3231434226036072, mean loss: 0.33948027202168507
Epoch: 68, step: 880, loss: 0.3130074739456177, mean loss: 0.33948000481671425
Epoch: 68, step: 881, loss: 0.3487071096897125, mean loss: 0.33948009795017886
Epoch: 68, step: 882, loss: 0.3098379671573639, mean loss: 0.3394797987613745
Epoch: 68, step: 883, loss: 0.3627404570579529, mean loss: 0.3394800335372869
Epoch: 68, step: 884, loss: 0.31545060873031616, mean loss: 0.33947979100446085
Epoch: 68, step: 885, loss: 0.3137541711330414, mean loss: 0.33947953135428754
Epoch: 68, step: 886, loss: 0.35482078790664673, mean loss: 0.33947968619291685
Epoch: 68, step: 887, loss: 0.32889989018440247, mean loss: 0.33947957941257767
Epoch: 68, step: 888, loss: 0.33281752467155457, mean loss: 0.3394795121741087
Epoch: 68, step: 889, loss: 0.33615750074386597, mean loss: 0.33947947864620825
Epoch: 68, step: 890, loss: 0.34124213457107544, mean loss: 0.339479496435899
Epoch: 68, step: 891, loss: 0.35376039147377014, mean loss: 0.33947964056507257
Epoch: 68, step: 892, loss: 0.321058452129364, mean loss: 0.33947945465208434
Epoch: 68, step: 893, loss: 0.33682575821876526, mean loss: 0.3394794278703348
Epoch: 68, step: 894, loss: 0.3038414716720581, mean loss: 0.339479068207047
Epoch: 68, step: 895, loss: 0.32870179414749146, mean loss: 0.33947895944237255
Epoch: 68, step: 896, loss: 0.3110334575176239, mean loss: 0.3394786723721435
Epoch: 68, step: 897, loss: 0.36267465353012085, mean loss: 0.3394789064621744
Epoch: 68, step: 898, loss: 0.31858083605766296, mean loss: 0.3394786955644096
Epoch: 68, step: 899, loss: 0.31317344307899475, mean loss: 0.3394784301014814
Epoch: 68, step: 900, loss: 0.3143479526042938, mean loss: 0.3394781764965093
Epoch: 68, step: 901, loss: 0.3634689748287201, mean loss: 0.3394784185979315
Epoch: 68, step: 902, loss: 0.3199581205844879, mean loss: 0.33947822161223074
Epoch: 68, step: 903, loss: 0.3293524980545044, mean loss: 0.33947811943127937
Epoch: 68, step: 904, loss: 0.3468780517578125, mean loss: 0.3394781941049055
Epoch: 68, step: 905, loss: 0.32735851407051086, mean loss: 0.33947807180495965
Epoch: 68, step: 906, loss: 0.30408975481987, mean loss: 0.339477714704313
Epoch: 68, step: 907, loss: 0.33013296127319336, mean loss: 0.33947762040811286
Epoch: 68, step: 908, loss: 0.30694764852523804, mean loss: 0.3394772921574203
Epoch: 68, step: 909, loss: 0.33111372590065, mean loss: 0.33947720776390394
Epoch: 68, step: 910, loss: 0.3594161868095398, mean loss: 0.3394774089584091
Epoch: 68, step: 911, loss: 0.29888594150543213, mean loss: 0.339476999373857
Epoch: 68, step: 912, loss: 0.3884090185165405, mean loss: 0.3394774931130139
Epoch: 68, step: 913, loss: 0.310000479221344, mean loss: 0.3394771956838583
Epoch: 68, step: 914, loss: 0.3368492126464844, mean loss: 0.33947716916723447
Epoch: 68, step: 915, loss: 0.3707713186740875, mean loss: 0.3394774849252914
Epoch: 68, step: 916, loss: 0.387994647026062, mean loss: 0.3394779744586547
Epoch: 68, step: 917, loss: 0.33036789298057556, mean loss: 0.33947788253976174
Epoch: 68, step: 918, loss: 0.3173106610774994, mean loss: 0.3394776588792048
Epoch: 68, step: 919, loss: 0.31051674485206604, mean loss: 0.33947736667529377
Epoch: 68, step: 920, loss: 0.303180068731308, mean loss: 0.33947700045393087
Epoch: 68, step: 921, loss: 0.3509580194950104, mean loss: 0.3394771162904327
Epoch: 68, step: 922, loss: 0.3309890329837799, mean loss: 0.3394770306516968
Epoch: 68, step: 923, loss: 0.3379361927509308, mean loss: 0.3394770151058929
Epoch: 68, step: 924, loss: 0.3390691876411438, mean loss: 0.3394770109912863
Epoch: 68, step: 925, loss: 0.338172048330307, mean loss: 0.3394769978255378
Epoch: 68, step: 926, loss: 0.315705806016922, mean loss: 0.33947675800076343
Epoch: 68, step: 927, loss: 0.309338241815567, mean loss: 0.3394764539398657
Epoch: 68, step: 928, loss: 0.30309465527534485, mean loss: 0.3394760868955596
Epoch: 68, step: 929, loss: 0.3222901225090027, mean loss: 0.33947591351362233
Epoch: 68, step: 930, loss: 0.3227161169052124, mean loss: 0.3394757444328176
Epoch: 68, step: 931, loss: 0.32824888825416565, mean loss: 0.33947563117209184
Epoch: 68, step: 932, loss: 0.35723990201950073, mean loss: 0.3394758103828948
Epoch: 68, step: 933, loss: 0.32289060950279236, mean loss: 0.3394756430685587
Epoch: 68, step: 934, loss: 0.35075098276138306, mean loss: 0.3394757568149617
Epoch: 68, step: 935, loss: 0.3265348970890045, mean loss: 0.33947562626799493
Epoch: 68, step: 936, loss: 0.3259958028793335, mean loss: 0.33947549028535223
Epoch: 68, step: 937, loss: 0.30016475915908813, mean loss: 0.33947509372799195
Epoch: 68, step: 938, loss: 0.3481370210647583, mean loss: 0.3394751811065853
Epoch: 68, step: 939, loss: 0.34909141063690186, mean loss: 0.33947527811087785
Epoch: 68, step: 940, loss: 0.34825316071510315, mean loss: 0.33947536665740224
Epoch: 68, step: 941, loss: 0.3642588257789612, mean loss: 0.3394756166569899
Epoch: 68, step: 942, loss: 0.3442399203777313, mean loss: 0.33947566471573526
Epoch: 68, step: 943, loss: 0.3371524512767792, mean loss: 0.33947564128112584
Epoch: 68, step: 944, loss: 0.36824169754981995, mean loss: 0.33947593144580973
Epoch: 68, step: 945, loss: 0.3066753149032593, mean loss: 0.3394756005876469
Epoch: 68, step: 946, loss: 0.37108519673347473, mean loss: 0.339475919428831
Epoch: 68, step: 947, loss: 0.3341604173183441, mean loss: 0.3394758658127113
Epoch: 68, step: 948, loss: 0.35327088832855225, mean loss: 0.33947600495819613
Epoch: 68, step: 949, loss: 0.34091225266456604, mean loss: 0.3394760194449697
Epoch: 68, step: 950, loss: 0.321664035320282, mean loss: 0.3394758397854463
Epoch: 68, step: 951, loss: 0.3866264820098877, mean loss: 0.3394763153628108
Epoch: 68, step: 952, loss: 0.3269611597061157, mean loss: 0.33947618913198063
Epoch: 68, step: 953, loss: 0.3340556025505066, mean loss: 0.3394761344592094
Epoch: 68, step: 954, loss: 0.3114852011203766, mean loss: 0.3394758521417077
Epoch: 68, step: 955, loss: 0.32615700364112854, mean loss: 0.33947571780870556
Epoch: 68, step: 956, loss: 0.3683031499385834, mean loss: 0.33947600855729737
Epoch: 68, step: 957, loss: 0.32194989919662476, mean loss: 0.3394758317937133
Epoch: 68, step: 958, loss: 0.31020402908325195, mean loss: 0.33947553656923035
Epoch: 68, step: 959, loss: 0.33281129598617554, mean loss: 0.3394754693568636
Epoch: 68, step: 960, loss: 0.32623764872550964, mean loss: 0.33947533584783585
Epoch: 68, step: 961, loss: 0.32665959000587463, mean loss: 0.33947520659691466
Epoch: 68, step: 962, loss: 0.3109397292137146, mean loss: 0.3394749188103443
Epoch: 68, step: 963, loss: 0.34881994128227234, mean loss: 0.33947501305600236
Epoch: 68, step: 964, loss: 0.32403939962387085, mean loss: 0.33947485738758326
Epoch: 68, step: 965, loss: 0.3001112937927246, mean loss: 0.33947446040939094
Epoch: 68, step: 966, loss: 0.35350462794303894, mean loss: 0.3394746019010108
Epoch: 68, step: 967, loss: 0.2918984591960907, mean loss: 0.3394741221093337
Epoch: 68, step: 968, loss: 0.3208584785461426, mean loss: 0.33947393437783074
Epoch: 68, step: 969, loss: 0.38836875557899475, mean loss: 0.33947442745805506
Epoch: 68, step: 970, loss: 0.34543177485466003, mean loss: 0.33947448753436776
Epoch: 68, step: 971, loss: 0.3680715560913086, mean loss: 0.3394747759159231
Epoch: 68, step: 972, loss: 0.33093544840812683, mean loss: 0.33947468980361023
Epoch: 68, step: 973, loss: 0.325258731842041, mean loss: 0.33947454644844854
Epoch: 68, step: 974, loss: 0.3587227761745453, mean loss: 0.3394747405475917
Epoch: 68, step: 975, loss: 0.35773932933807373, mean loss: 0.3394749247258426
Epoch: 68, step: 976, loss: 0.35260915756225586, mean loss: 0.33947505716877174
Epoch: 68, step: 977, loss: 0.283429354429245, mean loss: 0.339474492021018
Epoch: 68, step: 978, loss: 0.35891789197921753, mean loss: 0.3394746880803494
Epoch: 68, step: 979, loss: 0.33856505155563354, mean loss: 0.33947467890803745
Epoch: 68, step: 980, loss: 0.3489420711994171, mean loss: 0.33947477437144274
Epoch: 68, step: 981, loss: 0.2999459505081177, mean loss: 0.3394743757909291
Epoch: 68, step: 982, loss: 0.29712551832199097, mean loss: 0.3394739487795102
Epoch: 68, step: 983, loss: 0.351611852645874, mean loss: 0.33947407116702194
Epoch: 68, step: 984, loss: 0.32185816764831543, mean loss: 0.33947389354616714
Epoch: 68, step: 985, loss: 0.30456608533859253, mean loss: 0.3394735415748811
Epoch: 68, step: 986, loss: 0.32820984721183777, mean loss: 0.3394734280055331
Epoch: 68, step: 987, loss: 0.3409386873245239, mean loss: 0.33947344277927094
Epoch: 68, step: 988, loss: 0.3137326240539551, mean loss: 0.33947318324550213
Epoch: 68, step: 989, loss: 0.3156856894493103, mean loss: 0.3394729434086991
Epoch: 68, step: 990, loss: 0.34581080079078674, mean loss: 0.33947300730934116
Epoch: 68, step: 991, loss: 0.33503615856170654, mean loss: 0.3394729625758282
Epoch: 68, step: 992, loss: 0.32638829946517944, mean loss: 0.3394728306540345
Epoch: 68, step: 993, loss: 0.3311331570148468, mean loss: 0.33947274657287746
Epoch: 68, step: 994, loss: 0.3238585293292999, mean loss: 0.33947258915086403
Epoch: 68, step: 995, loss: 0.37461352348327637, mean loss: 0.3394729434370109
Epoch: 68, step: 996, loss: 0.3169984817504883, mean loss: 0.3394727168548124
Epoch: 68, step: 997, loss: 0.32254743576049805, mean loss: 0.33947254621985834
Epoch: 68, step: 998, loss: 0.3128531873226166, mean loss: 0.3394722778551993
Epoch: 68, step: 999, loss: 0.33100268244743347, mean loss: 0.33947219246932736
Epoch: 68, step: 1000, loss: 0.33870673179626465, mean loss: 0.3394721847524454
Epoch: 68, step: 1001, loss: 0.3731856644153595, mean loss: 0.3394725246266279
Epoch: 68, step: 1002, loss: 0.31065165996551514, mean loss: 0.3394722340790735
Epoch: 68, step: 1003, loss: 0.29852187633514404, mean loss: 0.3394718212564018
Epoch: 68, step: 1004, loss: 0.35407570004463196, mean loss: 0.3394719684773741
Epoch: 68, step: 1005, loss: 0.327717661857605, mean loss: 0.339471849983991
Epoch: 68, step: 1006, loss: 0.333477258682251, mean loss: 0.339471789554034
Epoch: 68, step: 1007, loss: 0.30791929364204407, mean loss: 0.3394714714845188
Epoch: 68, step: 1008, loss: 0.32756340503692627, mean loss: 0.33947135144473645
Epoch: 68, step: 1009, loss: 0.3223302960395813, mean loss: 0.3394711786553229
Epoch: 68, step: 1010, loss: 0.32452186942100525, mean loss: 0.3394710279611984
Epoch: 68, step: 1011, loss: 0.31344273686408997, mean loss: 0.33947076558981115
Epoch: 68, step: 1012, loss: 0.32437849044799805, mean loss: 0.3394706134576087
Epoch: 68, step: 1013, loss: 0.3551003634929657, mean loss: 0.3394707710060436
Epoch: 68, step: 1014, loss: 0.3422148823738098, mean loss: 0.33947079866650476
Epoch: 68, step: 1015, loss: 0.34683433175086975, mean loss: 0.3394708728896832
Epoch: 68, step: 1016, loss: 0.31531208753585815, mean loss: 0.33947062937563355
Epoch: 68, step: 1017, loss: 0.36542457342147827, mean loss: 0.3394708909817624
Epoch: 68, step: 1018, loss: 0.3336535394191742, mean loss: 0.33947083234560754
Epoch: 68, step: 1019, loss: 0.3346821367740631, mean loss: 0.3394707840783055
Epoch: 68, step: 1020, loss: 0.35459908843040466, mean loss: 0.3394709365613909
Epoch: 68, step: 1021, loss: 0.35462450981140137, mean loss: 0.3394710892976302
Epoch: 68, step: 1022, loss: 0.2987643778324127, mean loss: 0.33947067900975575
Epoch: 68, step: 1023, loss: 0.3107386827468872, mean loss: 0.33947038941940477
Epoch: 68, step: 1024, loss: 0.31388115882873535, mean loss: 0.3394701315076498
Epoch: 68, step: 1025, loss: 0.3195246458053589, mean loss: 0.3394699304807625
Epoch: 68, step: 1026, loss: 0.33903422951698303, mean loss: 0.3394699260894568
Epoch: 68, step: 1027, loss: 0.29002463817596436, mean loss: 0.3394694277495262
Epoch: 68, step: 1028, loss: 0.3243693709373474, mean loss: 0.3394692755634284
Epoch: 68, step: 1029, loss: 0.3331209123134613, mean loss: 0.33946921158202054
Epoch: 68, step: 1030, loss: 0.302401065826416, mean loss: 0.3394688379978137
Epoch: 68, step: 1031, loss: 0.31456053256988525, mean loss: 0.3394685869667584
Epoch: 68, step: 1032, loss: 0.33595842123031616, mean loss: 0.3394685515909384
Epoch: 68, step: 1033, loss: 0.3343580961227417, mean loss: 0.33946850008774904
Epoch: 68, step: 1034, loss: 0.34427833557128906, mean loss: 0.33946854856080055
Epoch: 68, step: 1035, loss: 0.3227880895137787, mean loss: 0.33946838045846
Epoch: 68, step: 1036, loss: 0.3071022927761078, mean loss: 0.3394680542827686
Epoch: 68, step: 1037, loss: 0.3020497262477875, mean loss: 0.3394676771959195
Epoch: 68, step: 1038, loss: 0.374725878238678, mean loss: 0.3394680325102975
Epoch: 68, step: 1039, loss: 0.3786163926124573, mean loss: 0.33946842702376195
Epoch: 68, step: 1040, loss: 0.3512243628501892, mean loss: 0.33946854549176986
Epoch: 68, step: 1041, loss: 0.3106192946434021, mean loss: 0.3394682547723506
Epoch: 68, step: 1042, loss: 0.39268943667411804, mean loss: 0.33946879108697653
Epoch: 68, step: 1043, loss: 0.374360591173172, mean loss: 0.3394691426912339
Epoch: 68, step: 1044, loss: 0.31984925270080566, mean loss: 0.33946894498382646
Epoch: 68, step: 1045, loss: 0.336769163608551, mean loss: 0.33946891777870974
Epoch: 68, step: 1046, loss: 0.32601895928382874, mean loss: 0.3394687822477341
Epoch: 68, step: 1047, loss: 0.3769458532333374, mean loss: 0.33946915988851384
Epoch: 68, step: 1048, loss: 0.31419801712036133, mean loss: 0.33946890524433687
Epoch: 68, step: 1049, loss: 0.3220292329788208, mean loss: 0.3394687295155903
Epoch: 68, step: 1050, loss: 0.3336729407310486, mean loss: 0.33946867111561463
Epoch: 68, step: 1051, loss: 0.32040107250213623, mean loss: 0.3394684789871372
Epoch: 68, step: 1052, loss: 0.32058051228523254, mean loss: 0.3394682886705802
Epoch: 68, step: 1053, loss: 0.3723047971725464, mean loss: 0.3394686195303479
Epoch: 68, step: 1054, loss: 0.37175464630126953, mean loss: 0.3394689448401988
Epoch: 68, step: 1055, loss: 0.3331179618835449, mean loss: 0.3394688808491566
Epoch: 68, step: 1056, loss: 0.35017314553260803, mean loss: 0.3394689887017766
Epoch: 68, step: 1057, loss: 0.34332016110420227, mean loss: 0.33946902750452124
Epoch: 68, step: 1058, loss: 0.3258655071258545, mean loss: 0.3394688904427246
Epoch: 68, step: 1059, loss: 0.34284985065460205, mean loss: 0.33946892450712846
Epoch: 68, step: 1060, loss: 0.3685794472694397, mean loss: 0.3394692178032783
Epoch: 68, step: 1061, loss: 0.3331303298473358, mean loss: 0.3394691539379635
Epoch: 68, step: 1062, loss: 0.379810631275177, mean loss: 0.33946956038073556
Epoch: 68, step: 1063, loss: 0.34015554189682007, mean loss: 0.3394695672919703
Epoch: 68, step: 1064, loss: 0.3598181903362274, mean loss: 0.33946977230142095
Epoch: 68, step: 1065, loss: 0.39435258507728577, mean loss: 0.3394703252322958
Epoch: 68, step: 1066, loss: 0.31480827927589417, mean loss: 0.3394700767707361
Epoch: 68, step: 1067, loss: 0.3328688144683838, mean loss: 0.33947001026597784
Epoch: 68, step: 1068, loss: 0.3383544385433197, mean loss: 0.3394699990272061
Epoch: 68, step: 1069, loss: 0.2996058464050293, mean loss: 0.3394695974218322
Epoch: 68, step: 1070, loss: 0.33113643527030945, mean loss: 0.33946951347149673
Epoch: 68, step: 1071, loss: 0.3457995653152466, mean loss: 0.3394695772413614
Epoch: 68, step: 1072, loss: 0.31805017590522766, mean loss: 0.3394693614613651
Epoch: 68, step: 1073, loss: 0.3206324279308319, mean loss: 0.3394691716991753
Epoch: 68, step: 1074, loss: 0.3257852792739868, mean loss: 0.33946903384981525
Epoch: 68, step: 1075, loss: 0.31179511547088623, mean loss: 0.33946875506996294
Epoch: 68, step: 1076, loss: 0.34824201464653015, mean loss: 0.33946884344860656
Epoch: 68, step: 1077, loss: 0.33748048543930054, mean loss: 0.33946882341880896
Epoch: 68, step: 1078, loss: 0.31450310349464417, mean loss: 0.3394685719282435
Epoch: 68, step: 1079, loss: 0.29760944843292236, mean loss: 0.33946815026731697
Epoch: 68, step: 1080, loss: 0.3192487955093384, mean loss: 0.3394679465930575
Epoch: 68, step: 1081, loss: 0.33365803956985474, mean loss: 0.3394678880691034
Epoch: 68, step: 1082, loss: 0.3165486752986908, mean loss: 0.3394676572031979
Epoch: 68, step: 1083, loss: 0.3837534189224243, mean loss: 0.33946810329048704
Epoch: 68, step: 1084, loss: 0.3120735287666321, mean loss: 0.33946782734968983
Epoch: 68, step: 1085, loss: 0.3388323485851288, mean loss: 0.33946782094868694
Epoch: 68, step: 1086, loss: 0.3855534791946411, mean loss: 0.3394682851521766
Epoch: 68, step: 1087, loss: 0.32339319586753845, mean loss: 0.33946812323548353
Epoch: 68, step: 1088, loss: 0.3555079400539398, mean loss: 0.3394682847952666
Epoch: 68, step: 1089, loss: 0.3090382218360901, mean loss: 0.3394679782939576
Epoch: 68, step: 1090, loss: 0.3191654682159424, mean loss: 0.33946777380265414
Epoch: 68, step: 1091, loss: 0.3162165582180023, mean loss: 0.3394675396137054
Epoch: 68, step: 1092, loss: 0.3002447783946991, mean loss: 0.3394671445614697
Epoch: 68, step: 1093, loss: 0.34031030535697937, mean loss: 0.3394671530537123
Epoch: 68, step: 1094, loss: 0.339915931224823, mean loss: 0.33946715757372165
Epoch: 68, step: 1095, loss: 0.3098856806755066, mean loss: 0.33946685963764783
Epoch: 68, step: 1096, loss: 0.2933633029460907, mean loss: 0.3394663953006448
Epoch: 68, step: 1097, loss: 0.32249006628990173, mean loss: 0.3394662243234164
Epoch: 68, step: 1098, loss: 0.30841490626335144, mean loss: 0.33946591159297695
Epoch: 68, step: 1099, loss: 0.32219961285591125, mean loss: 0.33946573769881894
Epoch: 68, step: 1100, loss: 0.3192107379436493, mean loss: 0.3394655337065964
Epoch: 68, step: 1101, loss: 0.34303247928619385, mean loss: 0.33946556962966906
Epoch: 68, step: 1102, loss: 0.3500978350639343, mean loss: 0.33946567670722017
Epoch: 68, step: 1103, loss: 0.3562013506889343, mean loss: 0.3394658452505047
Epoch: 68, step: 1104, loss: 0.328486829996109, mean loss: 0.33946573468306307
Epoch: 68, step: 1105, loss: 0.3173268139362335, mean loss: 0.3394655117287161
Epoch: 68, step: 1106, loss: 0.31432512402534485, mean loss: 0.33946525855005666
Epoch: 68, step: 1107, loss: 0.36935508251190186, mean loss: 0.3394655595553332
Epoch: 68, step: 1108, loss: 0.40446561574935913, mean loss: 0.3394662141313817
Epoch: 68, step: 1109, loss: 0.3815290629863739, mean loss: 0.3394666377164944
Epoch: 68, step: 1110, loss: 0.33148375153541565, mean loss: 0.33946655732732
Epoch: 68, step: 1111, loss: 0.30880263447761536, mean loss: 0.33946624853892426
Epoch: 68, step: 1112, loss: 0.34088581800460815, mean loss: 0.33946626283396947
Epoch: 68, step: 1113, loss: 0.318222314119339, mean loss: 0.33946604890984894
Epoch: 68, step: 1114, loss: 0.35438674688339233, mean loss: 0.3394661991580487
Epoch: 68, step: 1115, loss: 0.29723846912384033, mean loss: 0.3394657739382272
Epoch: 68, step: 1116, loss: 0.3686278462409973, mean loss: 0.33946606758807063
Epoch: 68, step: 1117, loss: 0.2996154725551605, mean loss: 0.33946566631332453
Epoch: 68, step: 1118, loss: 0.3207464814186096, mean loss: 0.3394654778227757
Epoch: 68, step: 1119, loss: 0.3213229775428772, mean loss: 0.3394652951409217
Epoch: 68, step: 1120, loss: 0.3147256672382355, mean loss: 0.33946504603327315
Epoch: 68, step: 1121, loss: 0.35621416568756104, mean loss: 0.33946521468139584
Epoch: 68, step: 1122, loss: 0.32738199830055237, mean loss: 0.33946509301582284
Epoch: 68, step: 1123, loss: 0.34545692801475525, mean loss: 0.33946515334683697
Epoch: 68, step: 1124, loss: 0.3850034475326538, mean loss: 0.33946561186143354
Epoch: 68, step: 1125, loss: 0.3409331142902374, mean loss: 0.33946562663722873
Epoch: 68, step: 1126, loss: 0.33386296033859253, mean loss: 0.33946557022640805
Epoch: 68, step: 1127, loss: 0.3252425193786621, mean loss: 0.33946542702211036
Epoch: 68, step: 1128, loss: 0.33207598328590393, mean loss: 0.33946535262249966
Epoch: 68, step: 1129, loss: 0.33851730823516846, mean loss: 0.3394653430773396
Epoch: 68, step: 1130, loss: 0.3314274549484253, mean loss: 0.3394652621505842
Epoch: 68, step: 1131, loss: 0.4111862778663635, mean loss: 0.33946598424207985
Epoch: 68, step: 1132, loss: 0.32976046204566956, mean loss: 0.339465886527283
Epoch: 68, step: 1133, loss: 0.29066455364227295, mean loss: 0.3394653952024246
Epoch: 68, step: 1134, loss: 0.30317285656929016, mean loss: 0.3394650298180011
Epoch: 68, step: 1135, loss: 0.3724234402179718, mean loss: 0.33946536163189445
Epoch: 68, step: 1136, loss: 0.3802904486656189, mean loss: 0.33946577264063343
Epoch: 68, step: 1137, loss: 0.3610071539878845, mean loss: 0.3394659895074546
Epoch: 68, step: 1138, loss: 0.30925023555755615, mean loss: 0.3394656853148667
Epoch: 68, step: 1139, loss: 0.31754207611083984, mean loss: 0.33946546460442895
Epoch: 68, step: 1140, loss: 0.2802371084690094, mean loss: 0.33946486834380923
Epoch: 68, step: 1141, loss: 0.35111236572265625, mean loss: 0.3394649855997073
Epoch: 68, step: 1142, loss: 0.282133549451828, mean loss: 0.33946440844728215
Epoch: 68, step: 1143, loss: 0.3409396708011627, mean loss: 0.3394644232985179
Epoch: 68, step: 1144, loss: 0.32029032707214355, mean loss: 0.33946423027782846
Epoch: 68, step: 1145, loss: 0.33197614550590515, mean loss: 0.33946415489796605
Epoch: 68, step: 1146, loss: 0.33457186818122864, mean loss: 0.33946410564956697
Epoch: 68, step: 1147, loss: 0.32238641381263733, mean loss: 0.33946393373803246
Epoch: 68, step: 1148, loss: 0.3219957649707794, mean loss: 0.33946375789755606
Epoch: 68, step: 1149, loss: 0.32884907722473145, mean loss: 0.3394636510476771
Epoch: 68, step: 1150, loss: 0.3482019901275635, mean loss: 0.33946373900897364
Epoch: 68, step: 1151, loss: 0.3480316400527954, mean loss: 0.3394638252537498
Epoch: 68, step: 1152, loss: 0.3476312458515167, mean loss: 0.33946390746644894
Epoch: 68, step: 1153, loss: 0.31736117601394653, mean loss: 0.33946368498409984
Epoch: 68, step: 1154, loss: 0.3036072552204132, mean loss: 0.33946332406298735
Epoch: 68, step: 1155, loss: 0.32848480343818665, mean loss: 0.3394632135572839
Epoch: 68, step: 1156, loss: 0.3524528443813324, mean loss: 0.3394633443047582
Epoch: 68, step: 1157, loss: 0.3635796904563904, mean loss: 0.3394635870460381
Epoch: 68, step: 1158, loss: 0.31102871894836426, mean loss: 0.33946330083987913
Epoch: 68, step: 1159, loss: 0.33239778876304626, mean loss: 0.339463229723927
Epoch: 68, step: 1160, loss: 0.34172138571739197, mean loss: 0.33946325245254105
Epoch: 68, step: 1161, loss: 0.34501913189888, mean loss: 0.339463308372579
Epoch: 68, step: 1162, loss: 0.33074361085891724, mean loss: 0.3394632206095322
Epoch: 68, step: 1163, loss: 0.32230105996131897, mean loss: 0.3394630478755187
Epoch: 68, step: 1164, loss: 0.3620396852493286, mean loss: 0.33946327510296487
Epoch: 68, step: 1165, loss: 0.3741746246814728, mean loss: 0.3394636244593285
Epoch: 68, step: 1166, loss: 0.3367118239402771, mean loss: 0.33946359676379495
Epoch: 68, step: 1167, loss: 0.32325679063796997, mean loss: 0.339463433651817
Epoch: 68, step: 1168, loss: 0.3426513671875, mean loss: 0.3394634657361714
Epoch: 68, step: 1169, loss: 0.3312031626701355, mean loss: 0.33946338260274955
Epoch: 68, step: 1170, loss: 0.28793662786483765, mean loss: 0.3394628640319059
Epoch: 68, step: 1171, loss: 0.3279692828655243, mean loss: 0.3394627483604236
Epoch: 68, step: 1172, loss: 0.3507435619831085, mean loss: 0.3394628618894693
Epoch: 68, step: 1173, loss: 0.30812352895736694, mean loss: 0.33946254649654883
Epoch: 68, step: 1174, loss: 0.30962759256362915, mean loss: 0.33946224624642624
Epoch: 68, step: 1175, loss: 0.32826030254364014, mean loss: 0.3394621335145236
Epoch: 68, step: 1176, loss: 0.325053870677948, mean loss: 0.3394619885169606
Epoch: 68, step: 1177, loss: 0.31409597396850586, mean loss: 0.33946173324862455
Epoch: 68, step: 1178, loss: 0.38625043630599976, mean loss: 0.3394622040972933
Epoch: 68, step: 1179, loss: 0.3087717294692993, mean loss: 0.33946189525300485
Epoch: 68, step: 1180, loss: 0.3638608455657959, mean loss: 0.3394621407819746
Epoch: 68, step: 1181, loss: 0.35459908843040466, mean loss: 0.3394622931049932
Epoch: 68, step: 1182, loss: 0.31776562333106995, mean loss: 0.33946207477372503
Epoch: 68, step: 1183, loss: 0.30168211460113525, mean loss: 0.3394616946018508
Epoch: 68, step: 1184, loss: 0.33435767889022827, mean loss: 0.3394616432417201
Epoch: 68, step: 1185, loss: 0.3714689612388611, mean loss: 0.3394619653182159
Epoch: 68, step: 1186, loss: 0.2951667904853821, mean loss: 0.3394615195985484
Epoch: 68, step: 1187, loss: 0.3237525522708893, mean loss: 0.339461361528843
Epoch: 68, step: 1188, loss: 0.36781787872314453, mean loss: 0.3394616468602161
Epoch: 68, step: 1189, loss: 0.3378777801990509, mean loss: 0.33946163092305787
Epoch: 68, step: 1190, loss: 0.30641716718673706, mean loss: 0.33946129842691936
Epoch: 68, step: 1191, loss: 0.3622327446937561, mean loss: 0.33946152755279746
Epoch: 68, step: 1192, loss: 0.3032127320766449, mean loss: 0.3394611628217467
Epoch: 68, step: 1193, loss: 0.3330380618572235, mean loss: 0.33946109819392223
Epoch: 68, step: 1194, loss: 0.3304278552532196, mean loss: 0.3394610073043397
Epoch: 68, step: 1195, loss: 0.32211756706237793, mean loss: 0.33946083280198286
Epoch: 68, step: 1196, loss: 0.3116367757320404, mean loss: 0.3394605528509111
Epoch: 68, step: 1197, loss: 0.3407500982284546, mean loss: 0.33946056582550993
Epoch: 68, step: 1198, loss: 0.3605403006076813, mean loss: 0.3394607779144796
Epoch: 68, step: 1199, loss: 0.32039278745651245, mean loss: 0.33946058606814933
Epoch: 68, step: 1200, loss: 0.3126975893974304, mean loss: 0.3394603168037477
Epoch: 68, step: 1201, loss: 0.3099345564842224, mean loss: 0.3394600197459744
Epoch: 68, step: 1202, loss: 0.35493215918540955, mean loss: 0.33946017540913087
Epoch: 68, step: 1203, loss: 0.33998745679855347, mean loss: 0.3394601807139861
Epoch: 68, step: 1204, loss: 0.2871381342411041, mean loss: 0.33945965431936176
Epoch: 68, step: 1205, loss: 0.3105860650539398, mean loss: 0.3394593638347517
Epoch: 68, step: 1206, loss: 0.31194090843200684, mean loss: 0.33945908698633875
Epoch: 68, step: 1207, loss: 0.35936880111694336, mean loss: 0.3394592872852737
Epoch: 68, step: 1208, loss: 0.3243744671344757, mean loss: 0.3394591355280464
Epoch: 68, step: 1209, loss: 0.31923815608024597, mean loss: 0.33945893210176276
Epoch: 68, step: 1210, loss: 0.35079526901245117, mean loss: 0.33945904614597583
Epoch: 68, step: 1211, loss: 0.308052659034729, mean loss: 0.3394587301990611
Epoch: 68, step: 1212, loss: 0.3290686309337616, mean loss: 0.33945862567615714
Epoch: 68, step: 1213, loss: 0.3382023870944977, mean loss: 0.33945861303870484
Epoch: 68, step: 1214, loss: 0.3209230303764343, mean loss: 0.33945842657716124
Epoch: 68, step: 1215, loss: 0.310077428817749, mean loss: 0.3394581310174703
Epoch: 68, step: 1216, loss: 0.35514193773269653, mean loss: 0.339458288787961
Epoch: 68, step: 1217, loss: 0.2922632396221161, mean loss: 0.3394578140364354
Epoch: 68, step: 1218, loss: 0.31084808707237244, mean loss: 0.3394575262440687
Epoch: 68, step: 1219, loss: 0.35414910316467285, mean loss: 0.3394576740288122
Epoch: 68, step: 1220, loss: 0.30458107590675354, mean loss: 0.3394573232034863
Epoch: 68, step: 1221, loss: 0.34904494881629944, mean loss: 0.33945741964488907
Epoch: 68, step: 1222, loss: 0.3492593467235565, mean loss: 0.3394575182409468
Epoch: 68, step: 1223, loss: 0.3187949061393738, mean loss: 0.3394573104010407
Epoch: 68, step: 1224, loss: 0.32817015051841736, mean loss: 0.3394571968675416
Epoch: 68, step: 1225, loss: 0.3305034935474396, mean loss: 0.33945710680635227
Epoch: 68, step: 1226, loss: 0.31884074211120605, mean loss: 0.3394568994378946
Epoch: 68, step: 1227, loss: 0.30168578028678894, mean loss: 0.33945651952319783
Epoch: 68, step: 1228, loss: 0.3374917507171631, mean loss: 0.33945649976108716
Epoch: 68, step: 1229, loss: 0.3191989064216614, mean loss: 0.3394562960074578
Epoch: 68, step: 1230, loss: 0.33945661783218384, mean loss: 0.3394562960106947
Epoch: 68, step: 1231, loss: 0.3857225775718689, mean loss: 0.33945676135388714
Epoch: 68, step: 1232, loss: 0.3347840905189514, mean loss: 0.33945671435694635
Epoch: 68, step: 1233, loss: 0.3412401080131531, mean loss: 0.3394567322938407
Epoch: 68, step: 1234, loss: 0.32582423090934753, mean loss: 0.3394565951831828
Epoch: 68, step: 1235, loss: 0.30791088938713074, mean loss: 0.3394562779113298
Epoch: 68, step: 1236, loss: 0.3088700771331787, mean loss: 0.3394559702928204
Epoch: 68, step: 1237, loss: 0.3346582055091858, mean loss: 0.3394559220401322
Epoch: 68, step: 1238, loss: 0.3322124481201172, mean loss: 0.33945584919088073
Epoch: 68, step: 1239, loss: 0.36678579449653625, mean loss: 0.33945612405154235
Epoch: 68, step: 1240, loss: 0.32631319761276245, mean loss: 0.33945599187282466
Epoch: 68, step: 1241, loss: 0.3739866316318512, mean loss: 0.3394563391447815
Epoch: 68, step: 1242, loss: 0.3214680552482605, mean loss: 0.33945615823982955
Epoch: 68, step: 1243, loss: 0.32245174050331116, mean loss: 0.3394559872311633
Epoch: 68, step: 1244, loss: 0.3208713233470917, mean loss: 0.3394558003322838
Epoch: 68, step: 1245, loss: 0.30870842933654785, mean loss: 0.3394554911208053
Epoch: 68, step: 1246, loss: 0.3641606569290161, mean loss: 0.3394557395662423
Epoch: 68, step: 1247, loss: 0.3204525411128998, mean loss: 0.3394555484640857
Epoch: 68, step: 1248, loss: 0.30400216579437256, mean loss: 0.33945519193727414
Epoch: 68, step: 1249, loss: 0.34471988677978516, mean loss: 0.33945524487964096
Epoch: 68, step: 1250, loss: 0.38664931058883667, mean loss: 0.33945571946373143
Epoch: 68, step: 1251, loss: 0.3240574598312378, mean loss: 0.3394555646202051
Epoch: 68, step: 1252, loss: 0.35660138726234436, mean loss: 0.3394557370353355
Epoch: 68, step: 1253, loss: 0.29112568497657776, mean loss: 0.33945525104241414
Epoch: 68, step: 1254, loss: 0.3275194764137268, mean loss: 0.33945513102094915
Epoch: 68, step: 1255, loss: 0.3090282380580902, mean loss: 0.33945482506313235
Epoch: 68, step: 1256, loss: 0.3125367760658264, mean loss: 0.3394545543912402
Epoch: 68, step: 1257, loss: 0.3426060378551483, mean loss: 0.33945458608036505
Epoch: 68, step: 1258, loss: 0.3069463074207306, mean loss: 0.33945425920302186
Epoch: 68, step: 1259, loss: 0.33446213603019714, mean loss: 0.33945420900671436
Epoch: 68, step: 1260, loss: 0.3460465967655182, mean loss: 0.3394542752931789
Epoch: 68, step: 1261, loss: 0.30754852294921875, mean loss: 0.33945395448403753
Epoch: 68, step: 1262, loss: 0.30881935358047485, mean loss: 0.33945364645929366
Epoch: 68, step: 1263, loss: 0.2960771918296814, mean loss: 0.33945321032216136
Epoch: 68, step: 1264, loss: 0.3204857409000397, mean loss: 0.3394530196119105
Epoch: 68, step: 1265, loss: 0.29236114025115967, mean loss: 0.33945254612682774
Epoch: 68, step: 1266, loss: 0.32944583892822266, mean loss: 0.3394524455154482
Epoch: 68, step: 1267, loss: 0.32172471284866333, mean loss: 0.3394522672756265
Epoch: 68, step: 1268, loss: 0.3222472071647644, mean loss: 0.3394520942926471
Epoch: 68, step: 1269, loss: 0.30719950795173645, mean loss: 0.3394517700222087
Epoch: 68, step: 1270, loss: 0.30617618560791016, mean loss: 0.33945143546981826
Epoch: 68, step: 1271, loss: 0.3177292048931122, mean loss: 0.3394512170769266
Epoch: 68, step: 1272, loss: 0.30993321537971497, mean loss: 0.3394509203092023
Epoch: 68, step: 1273, loss: 0.3569542169570923, mean loss: 0.3394510962818628
Epoch: 68, step: 1274, loss: 0.34485170245170593, mean loss: 0.3394511505773193
Epoch: 68, step: 1275, loss: 0.33792850375175476, mean loss: 0.33945113526941295
Epoch: 68, step: 1276, loss: 0.3257739543914795, mean loss: 0.33945099776746884
Epoch: 68, step: 1277, loss: 0.4420693516731262, mean loss: 0.33945202941875974
Epoch: 68, step: 1278, loss: 0.3497661054134369, mean loss: 0.33945213310803596
Epoch: 68, step: 1279, loss: 0.3205018639564514, mean loss: 0.33945194259945916
Epoch: 68, step: 1280, loss: 0.33951452374458313, mean loss: 0.33945194322858613
Epoch: 68, step: 1281, loss: 0.34267738461494446, mean loss: 0.33945197565355534
Epoch: 68, step: 1282, loss: 0.34503066539764404, mean loss: 0.33945203173487976
Epoch: 68, step: 1283, loss: 0.3401380181312561, mean loss: 0.33945203863087875
Epoch: 68, step: 1284, loss: 0.29368290305137634, mean loss: 0.3394515785332122
Epoch: 68, step: 1285, loss: 0.3352772891521454, mean loss: 0.3394515365712771
Epoch: 68, step: 1286, loss: 0.3231654167175293, mean loss: 0.33945137285712784
Epoch: 68, step: 1287, loss: 0.3390887677669525, mean loss: 0.33945136921212293
Epoch: 68, step: 1288, loss: 0.3225111663341522, mean loss: 0.3394511989263108
Epoch: 68, step: 1289, loss: 0.3129982650279999, mean loss: 0.33945093301957496
Epoch: 68, step: 1290, loss: 0.3023532032966614, mean loss: 0.33945056011435776
Epoch: 68, step: 1291, loss: 0.37858736515045166, mean loss: 0.3394509535123417
Epoch: 68, step: 1292, loss: 0.335424542427063, mean loss: 0.33945091303979724
Epoch: 68, step: 1293, loss: 0.32784152030944824, mean loss: 0.3394507963460642
Epoch: 68, step: 1294, loss: 0.3868906497955322, mean loss: 0.33945127319081225
Epoch: 68, step: 1295, loss: 0.3389560282230377, mean loss: 0.3394512682128755
Epoch: 68, step: 1296, loss: 0.37957674264907837, mean loss: 0.33945167152856304
Epoch: 68, step: 1297, loss: 0.32416850328445435, mean loss: 0.33945151791344347
Epoch: 68, step: 1298, loss: 0.3661552369594574, mean loss: 0.33945178631680706
Epoch: 68, step: 1299, loss: 0.30244070291519165, mean loss: 0.33945141431621
Epoch: 68, step: 1300, loss: 0.34141942858695984, mean loss: 0.33945143409663947
Epoch: 68, step: 1301, loss: 0.3289031982421875, mean loss: 0.33945132807782574
Epoch: 68, step: 1302, loss: 0.2925305664539337, mean loss: 0.33945085648868434
Epoch: 68, step: 1303, loss: 0.3311809003353119, mean loss: 0.3394507733702057
Epoch: 68, step: 1304, loss: 0.32433223724365234, mean loss: 0.3394506214205376
Epoch: 68, step: 1305, loss: 0.32752180099487305, mean loss: 0.3394505015304853
Epoch: 68, step: 1306, loss: 0.338180810213089, mean loss: 0.3394504887696403
Epoch: 68, step: 1307, loss: 0.35107630491256714, mean loss: 0.33945060561201357
Epoch: 68, step: 1308, loss: 0.3861795663833618, mean loss: 0.33945107524509033
Epoch: 68, step: 1309, loss: 0.32131391763687134, mean loss: 0.3394508929657632
Epoch: 68, step: 1310, loss: 0.34382960200309753, mean loss: 0.33945093697156237
Epoch: 68, step: 1311, loss: 0.3224911689758301, mean loss: 0.33945076652848477
Epoch: 68, step: 1312, loss: 0.32344308495521545, mean loss: 0.339450605655347
Epoch: 68, step: 1313, loss: 0.3207855820655823, mean loss: 0.3394504180784814
Epoch: 68, step: 1314, loss: 0.34293437004089355, mean loss: 0.33945045309061084
Epoch: 68, step: 1315, loss: 0.33779144287109375, mean loss: 0.33945043641848177
Epoch: 68, step: 1316, loss: 0.3273153305053711, mean loss: 0.339450314468649
Epoch: 68, step: 1317, loss: 0.32357871532440186, mean loss: 0.33945015497111963
Epoch: 68, step: 1318, loss: 0.333035409450531, mean loss: 0.33945009050844194
Epoch: 68, step: 1319, loss: 0.32801541686058044, mean loss: 0.3394499756009569
Epoch: 68, step: 1320, loss: 0.3514983355998993, mean loss: 0.3394500966741835
Epoch: 68, step: 1321, loss: 0.3473484218120575, mean loss: 0.3394501760431682
Epoch: 68, step: 1322, loss: 0.3303525447845459, mean loss: 0.33945008462347004
Epoch: 68, step: 1323, loss: 0.3250868618488312, mean loss: 0.3394499402926813
Epoch: 68, step: 1324, loss: 0.3295828402042389, mean loss: 0.3394498411427864
Epoch: 68, step: 1325, loss: 0.30859288573265076, mean loss: 0.33944953107872355
Epoch: 68, step: 1326, loss: 0.35505959391593933, mean loss: 0.33944968793382496
Epoch: 68, step: 1327, loss: 0.3723061978816986, mean loss: 0.33945001808364356
Epoch: 68, step: 1328, loss: 0.3109387457370758, mean loss: 0.339449731598657
Epoch: 68, step: 1329, loss: 0.339481383562088, mean loss: 0.33944973191669686
Epoch: 68, step: 1330, loss: 0.34072935581207275, mean loss: 0.3394497447742664
Epoch: 68, step: 1331, loss: 0.34191787242889404, mean loss: 0.33944976957358775
Epoch: 68, step: 1332, loss: 0.31841784715652466, mean loss: 0.33944955825057926
Epoch: 68, step: 1333, loss: 0.32558098435401917, mean loss: 0.3394494189043391
Epoch: 68, step: 1334, loss: 0.31438806653022766, mean loss: 0.3394491670997798
Epoch: 68, step: 1335, loss: 0.31652653217315674, mean loss: 0.33944893678635113
Epoch: 68, step: 1336, loss: 0.33817002177238464, mean loss: 0.339448923936679
Epoch: 68, step: 1337, loss: 0.31215792894363403, mean loss: 0.33944864973799527
Epoch: 68, step: 1338, loss: 0.3282971978187561, mean loss: 0.33944853769800853
Epoch: 68, step: 1339, loss: 0.3011283278465271, mean loss: 0.3394481526940917
Epoch: 68, step: 1340, loss: 0.3899807333946228, mean loss: 0.3394486603908425
Epoch: 68, step: 1341, loss: 0.3264259397983551, mean loss: 0.33944852955393656
Epoch: 68, step: 1342, loss: 0.31851276755332947, mean loss: 0.33944831921825563
Epoch: 68, step: 1343, loss: 0.31833404302597046, mean loss: 0.3394481070912243
Epoch: 68, step: 1344, loss: 0.3075754642486572, mean loss: 0.3394477868822282
Epoch: 68, step: 1345, loss: 0.33833447098731995, mean loss: 0.3394477756973953
Epoch: 68, step: 1346, loss: 0.3272334933280945, mean loss: 0.3394476529888854
Epoch: 68, step: 1347, loss: 0.3275637924671173, mean loss: 0.33944753360109636
Epoch: 68, step: 1348, loss: 0.29147249460220337, mean loss: 0.33944705163849803
Epoch: 68, step: 1349, loss: 0.3467944860458374, mean loss: 0.33944712545090294
Epoch: 68, step: 1350, loss: 0.3678719699382782, mean loss: 0.33944741100432696
Epoch: 68, step: 1351, loss: 0.350120484828949, mean loss: 0.33944751822398683
Epoch: 68, step: 1352, loss: 0.33802321553230286, mean loss: 0.33944750391585793
Epoch: 68, step: 1353, loss: 0.33992353081703186, mean loss: 0.33944750869783713
Epoch: 68, step: 1354, loss: 0.32572072744369507, mean loss: 0.33944737080537174
Epoch: 68, step: 1355, loss: 0.3264329731464386, mean loss: 0.3394472400704734
Epoch: 68, step: 1356, loss: 0.3467029333114624, mean loss: 0.3394473129561201
Epoch: 68, step: 1357, loss: 0.317827433347702, mean loss: 0.33944709578003157
Epoch: 68, step: 1358, loss: 0.37540164589881897, mean loss: 0.3394474569471732
Epoch: 68, step: 1359, loss: 0.346834272146225, mean loss: 0.33944753114774373
Epoch: 68, step: 1360, loss: 0.32152059674263, mean loss: 0.3394473510734677
Epoch: 68, step: 1361, loss: 0.3351404666900635, mean loss: 0.33944730781167626
Epoch: 68, step: 1362, loss: 0.33394259214401245, mean loss: 0.3394472525184648
Epoch: 68, step: 1363, loss: 0.35147786140441895, mean loss: 0.33944737336109493
Epoch: 68, step: 1364, loss: 0.3416198194026947, mean loss: 0.33944739518222294
Epoch: 68, step: 1365, loss: 0.31952187418937683, mean loss: 0.33944719504239496
Epoch: 68, step: 1366, loss: 0.32633060216903687, mean loss: 0.33944706329546226
Epoch: 68, step: 1367, loss: 0.3551194965839386, mean loss: 0.3394472207124298
Epoch: 68, step: 1368, loss: 0.3393650949001312, mean loss: 0.33944721988755044
Epoch: 68, step: 1369, loss: 0.3369500935077667, mean loss: 0.3394471948064313
Epoch: 68, step: 1370, loss: 0.3706415295600891, mean loss: 0.3394475081189546
Epoch: 68, step: 1371, loss: 0.30524230003356934, mean loss: 0.33944716456899593
Epoch: 68, step: 1372, loss: 0.37181714177131653, mean loss: 0.3394474896830139
Epoch: 68, step: 1373, loss: 0.34917160868644714, mean loss: 0.3394475873480703
Epoch: 68, step: 1374, loss: 0.35933127999305725, mean loss: 0.3394477870497048
Epoch: 68, step: 1375, loss: 0.3181900084018707, mean loss: 0.33944757354959787
Epoch: 68, step: 1376, loss: 0.3513577878475189, mean loss: 0.3394476931672931
Epoch: 68, step: 1377, loss: 0.31623539328575134, mean loss: 0.33944746004185494
Epoch: 68, step: 1378, loss: 0.3709166646003723, mean loss: 0.33944777608974597
Epoch: 68, step: 1379, loss: 0.3551892638206482, mean loss: 0.33944793418125496
Epoch: 68, step: 1380, loss: 0.32623517513275146, mean loss: 0.3394478014870603
Epoch: 68, step: 1381, loss: 0.31826531887054443, mean loss: 0.3394475887559998
Epoch: 68, step: 1382, loss: 0.3932892680168152, mean loss: 0.3394481294708304
Epoch: 68, step: 1383, loss: 0.3094068467617035, mean loss: 0.33944782777882926
Epoch: 68, step: 1384, loss: 0.39479148387908936, mean loss: 0.3394483835663716
Epoch: 68, step: 1385, loss: 0.35616669058799744, mean loss: 0.3394485514579442
Epoch: 68, step: 1386, loss: 0.2920645475387573, mean loss: 0.33944807561460455
Epoch: 68, step: 1387, loss: 0.30157020688056946, mean loss: 0.3394476952383369
Epoch: 68, step: 1388, loss: 0.36152341961860657, mean loss: 0.3394479169244455
Epoch: 68, step: 1389, loss: 0.31177374720573425, mean loss: 0.33944763902111236
Epoch: 68, step: 1390, loss: 0.3240204155445099, mean loss: 0.3394474841028685
Epoch: 68, step: 1391, loss: 0.3668009042739868, mean loss: 0.33944775877972594
Epoch: 68, step: 1392, loss: 0.39242133498191833, mean loss: 0.33944829072305277
Epoch: 68, step: 1393, loss: 0.3882204294204712, mean loss: 0.3394487804720004
Epoch: 68, step: 1394, loss: 0.3341387212276459, mean loss: 0.339448727151193
Epoch: 68, step: 1395, loss: 0.3408217430114746, mean loss: 0.3394487409381539
Epoch: 68, step: 1396, loss: 0.2886628806591034, mean loss: 0.3394482309836381
Epoch: 68, step: 1397, loss: 0.31250330805778503, mean loss: 0.3394479604251189
Epoch: 68, step: 1398, loss: 0.32934802770614624, mean loss: 0.339447859011008
Epoch: 68, step: 1399, loss: 0.3438878655433655, mean loss: 0.3394479035929677
Epoch: 68, step: 1400, loss: 0.3880854845046997, mean loss: 0.3394483919564161
Epoch: 68, step: 1401, loss: 0.31784507632255554, mean loss: 0.3394481750425896
Epoch: 68, step: 1402, loss: 0.3536086082458496, mean loss: 0.3394483172227513
Epoch: 68, step: 1403, loss: 0.2861393988132477, mean loss: 0.3394477819711508
Epoch: 68, step: 1404, loss: 0.3374132215976715, mean loss: 0.3394477615432225
Epoch: 68, step: 1405, loss: 0.3359110951423645, mean loss: 0.3394477260338106
Epoch: 68, step: 1406, loss: 0.380857914686203, mean loss: 0.3394481418029313
Epoch: 68, step: 1407, loss: 0.3361463248729706, mean loss: 0.3394481086521589
Epoch: 68, step: 1408, loss: 0.323078989982605, mean loss: 0.33944794430522796
Epoch: 68, step: 1409, loss: 0.3096133768558502, mean loss: 0.33944764476739286
Epoch: 68, step: 1410, loss: 0.303618460893631, mean loss: 0.339447285047466
Epoch: 68, step: 1411, loss: 0.32956981658935547, mean loss: 0.3394471858800786
Epoch: 68, step: 1412, loss: 0.30145490169525146, mean loss: 0.3394468044505903
Epoch: 68, step: 1413, loss: 0.31946897506713867, mean loss: 0.33944660388205644
Epoch: 68, step: 1414, loss: 0.34838560223579407, mean loss: 0.3394466936247287
Epoch: 68, step: 1415, loss: 0.3160141706466675, mean loss: 0.3394464583773291
Epoch: 68, step: 1416, loss: 0.3501541316509247, mean loss: 0.33944656587437533
Epoch: 68, step: 1417, loss: 0.356225848197937, mean loss: 0.3394467343241527
Epoch: 68, step: 1418, loss: 0.3645920753479004, mean loss: 0.33944698675953655
Epoch: 68, step: 1419, loss: 0.36617136001586914, mean loss: 0.33944725504421364
Epoch: 68, step: 1420, loss: 0.2916956841945648, mean loss: 0.33944677567333986
Epoch: 68, step: 1421, loss: 0.3010219931602478, mean loss: 0.3394463899365708
Epoch: 68, step: 1422, loss: 0.3391900658607483, mean loss: 0.3394463873634234
Epoch: 68, step: 1423, loss: 0.3594423234462738, mean loss: 0.3394465880935881
Epoch: 68, step: 1424, loss: 0.3097924292087555, mean loss: 0.3394462904118783
Epoch: 68, step: 1425, loss: 0.3341370224952698, mean loss: 0.3394462371156074
Epoch: 68, step: 1426, loss: 0.3004347085952759, mean loss: 0.33944584550829837
Epoch: 68, step: 1427, loss: 0.29829567670822144, mean loss: 0.3394454324369392
Epoch: 68, step: 1428, loss: 0.2885473370552063, mean loss: 0.3394449215196087
Epoch: 68, step: 1429, loss: 0.3017100691795349, mean loss: 0.3394445427392957
Epoch: 68, step: 1430, loss: 0.3809843063354492, mean loss: 0.3394449597089071
Epoch: 68, step: 1431, loss: 0.3533709943294525, mean loss: 0.3394450994948484
Epoch: 68, step: 1432, loss: 0.2940882444381714, mean loss: 0.3394446442190135
Epoch: 68, step: 1433, loss: 0.31828126311302185, mean loss: 0.3394444317907206
Epoch: 68, step: 1434, loss: 0.32228317856788635, mean loss: 0.33944425953567703
Epoch: 68, step: 1435, loss: 0.3562014400959015, mean loss: 0.33944442773317735
Epoch: 68, step: 1436, loss: 0.30991387367248535, mean loss: 0.3394441313279734
Epoch: 68, step: 1437, loss: 0.37948015332221985, mean loss: 0.33944453317502743
Epoch: 68, step: 1438, loss: 0.2916398048400879, mean loss: 0.33944405335721634
Epoch: 68, step: 1439, loss: 0.3472408950328827, mean loss: 0.33944413161361664
Epoch: 68, step: 1440, loss: 0.36568987369537354, mean loss: 0.3394443950378042
Epoch: 68, step: 1441, loss: 0.34088966250419617, mean loss: 0.33944440954356997
Epoch: 68, step: 1442, loss: 0.330506294965744, mean loss: 0.33944431983498785
Epoch: 68, step: 1443, loss: 0.33057788014411926, mean loss: 0.33944423084667347
Valid: 68, mean loss: 0.18526800721883774
Epoch: 69, step: 0, loss: 0.2897234261035919, mean loss: 0.3394437318271853
Epoch: 69, step: 1, loss: 0.3082525134086609, mean loss: 0.33944341878177675
Epoch: 69, step: 2, loss: 0.3091750741004944, mean loss: 0.3394431150016838
Epoch: 69, step: 3, loss: 0.3748072683811188, mean loss: 0.33944346992092683
Epoch: 69, step: 4, loss: 0.3762292265892029, mean loss: 0.3394438391038602
Epoch: 69, step: 5, loss: 0.34735649824142456, mean loss: 0.33944391851474254
Epoch: 69, step: 6, loss: 0.3577350676059723, mean loss: 0.339444102081567
Epoch: 69, step: 7, loss: 0.3350469768047333, mean loss: 0.3394440579532173
Epoch: 69, step: 8, loss: 0.33532705903053284, mean loss: 0.33944401663655394
Epoch: 69, step: 9, loss: 0.34990668296813965, mean loss: 0.33944412163491144
Epoch: 69, step: 10, loss: 0.3035213053226471, mean loss: 0.33944376113418073
Epoch: 69, step: 11, loss: 0.34761756658554077, mean loss: 0.33944384316096954
Epoch: 69, step: 12, loss: 0.31588104367256165, mean loss: 0.3394436067030072
Epoch: 69, step: 13, loss: 0.31090372800827026, mean loss: 0.3394433203018161
Epoch: 69, step: 14, loss: 0.3832075595855713, mean loss: 0.3394437594769301
Epoch: 69, step: 15, loss: 0.31996676325798035, mean loss: 0.3394435640268015
Epoch: 69, step: 16, loss: 0.32280218601226807, mean loss: 0.33944339703355475
Epoch: 69, step: 17, loss: 0.35098105669021606, mean loss: 0.33944351281074037
Epoch: 69, step: 18, loss: 0.355275422334671, mean loss: 0.3394436716779274
Epoch: 69, step: 19, loss: 0.34745755791664124, mean loss: 0.33944375209341904
Epoch: 69, step: 20, loss: 0.371483713388443, mean loss: 0.3394440735957851
Epoch: 69, step: 21, loss: 0.3074852228164673, mean loss: 0.33944375291053375
Epoch: 69, step: 22, loss: 0.2973831295967102, mean loss: 0.3394433308651258
Epoch: 69, step: 23, loss: 0.32333439588546753, mean loss: 0.33944316922620366
Epoch: 69, step: 24, loss: 0.3535667359828949, mean loss: 0.33944331094228875
Epoch: 69, step: 25, loss: 0.32193511724472046, mean loss: 0.33944313526656783
Epoch: 69, step: 26, loss: 0.3475549817085266, mean loss: 0.33944321665932586
Epoch: 69, step: 27, loss: 0.3265398144721985, mean loss: 0.33944308719028804
Epoch: 69, step: 28, loss: 0.3273414671421051, mean loss: 0.33944296576732064
Epoch: 69, step: 29, loss: 0.3293338418006897, mean loss: 0.3394428643373047
Epoch: 69, step: 30, loss: 0.3506254255771637, mean loss: 0.33944297653654054
Epoch: 69, step: 31, loss: 0.34606432914733887, mean loss: 0.33944304297062783
Epoch: 69, step: 32, loss: 0.34484368562698364, mean loss: 0.3394430971564093
Epoch: 69, step: 33, loss: 0.3281809985637665, mean loss: 0.3394429841625436
Epoch: 69, step: 34, loss: 0.3227478563785553, mean loss: 0.339442816660183
Epoch: 69, step: 35, loss: 0.3619726896286011, mean loss: 0.3394430427003243
Epoch: 69, step: 36, loss: 0.36472049355506897, mean loss: 0.3394432963041173
Epoch: 69, step: 37, loss: 0.3629123866558075, mean loss: 0.3394435317626155
Epoch: 69, step: 38, loss: 0.31348341703414917, mean loss: 0.3394432713150135
Epoch: 69, step: 39, loss: 0.280220627784729, mean loss: 0.3394426771635274
Epoch: 69, step: 40, loss: 0.30202120542526245, mean loss: 0.3394423017361797
Epoch: 69, step: 41, loss: 0.29620999097824097, mean loss: 0.33944186801649473
Epoch: 69, step: 42, loss: 0.33678850531578064, mean loss: 0.3394418413974205
Epoch: 69, step: 43, loss: 0.3628968596458435, mean loss: 0.3394420767005731
Epoch: 69, step: 44, loss: 0.2916707396507263, mean loss: 0.3394415974584201
Epoch: 69, step: 45, loss: 0.31692376732826233, mean loss: 0.33944137156176746
Epoch: 69, step: 46, loss: 0.33976081013679504, mean loss: 0.3394413747663116
Epoch: 69, step: 47, loss: 0.29855266213417053, mean loss: 0.33944096458300604
Epoch: 69, step: 48, loss: 0.33628740906715393, mean loss: 0.3394409329478
Epoch: 69, step: 49, loss: 0.35917600989341736, mean loss: 0.3394411309202028
Epoch: 69, step: 50, loss: 0.32284781336784363, mean loss: 0.3394409644660257
Epoch: 69, step: 51, loss: 0.32791846990585327, mean loss: 0.33944084888045306
Epoch: 69, step: 52, loss: 0.34506043791770935, mean loss: 0.3394409052516579
Epoch: 69, step: 53, loss: 0.3492469787597656, mean loss: 0.33944100361732654
Epoch: 69, step: 54, loss: 0.3364739716053009, mean loss: 0.33944097385504096
Epoch: 69, step: 55, loss: 0.34878605604171753, mean loss: 0.3394410675945806
Epoch: 69, step: 56, loss: 0.3813333511352539, mean loss: 0.3394414878074696
Epoch: 69, step: 57, loss: 0.3218342661857605, mean loss: 0.33944131119481863
Epoch: 69, step: 58, loss: 0.32881686091423035, mean loss: 0.3394412046252787
Epoch: 69, step: 59, loss: 0.327021986246109, mean loss: 0.33944108005439944
Epoch: 69, step: 60, loss: 0.30660372972488403, mean loss: 0.33944075068290047
Epoch: 69, step: 61, loss: 0.3485088050365448, mean loss: 0.3394408416381288
Epoch: 69, step: 62, loss: 0.3329560458660126, mean loss: 0.3394407765943894
Epoch: 69, step: 63, loss: 0.33417436480522156, mean loss: 0.3394407237718038
Epoch: 69, step: 64, loss: 0.34821420907974243, mean loss: 0.3394408117697708
Epoch: 69, step: 65, loss: 0.3162759840488434, mean loss: 0.3394405794291185
Epoch: 69, step: 66, loss: 0.34491872787475586, mean loss: 0.33944063437378863
Epoch: 69, step: 67, loss: 0.3174574375152588, mean loss: 0.3394404138891856
Epoch: 69, step: 68, loss: 0.330636203289032, mean loss: 0.33944032558658693
Epoch: 69, step: 69, loss: 0.30169013142585754, mean loss: 0.339439946971517
Epoch: 69, step: 70, loss: 0.3779202401638031, mean loss: 0.33944033290523473
Epoch: 69, step: 71, loss: 0.32159295678138733, mean loss: 0.3394401539088039
Epoch: 69, step: 72, loss: 0.35982745885849, mean loss: 0.33944035837685543
Epoch: 69, step: 73, loss: 0.32792940735816956, mean loss: 0.33944024293255676
Epoch: 69, step: 74, loss: 0.32214367389678955, mean loss: 0.3394400694655467
Epoch: 69, step: 75, loss: 0.3496195077896118, mean loss: 0.33944017155394457
Epoch: 69, step: 76, loss: 0.2974320948123932, mean loss: 0.33943975026407525
Epoch: 69, step: 77, loss: 0.3247848153114319, mean loss: 0.33943960329439243
Epoch: 69, step: 78, loss: 0.3394815921783447, mean loss: 0.3394396037154814
Epoch: 69, step: 79, loss: 0.36114516854286194, mean loss: 0.3394398213893234
Epoch: 69, step: 80, loss: 0.33429282903671265, mean loss: 0.33943976977332657
Epoch: 69, step: 81, loss: 0.34964561462402344, mean loss: 0.3394398721203938
Epoch: 69, step: 82, loss: 0.3338490426540375, mean loss: 0.3394398160545541
Epoch: 69, step: 83, loss: 0.36693382263183594, mean loss: 0.3394400917666136
Epoch: 69, step: 84, loss: 0.30224525928497314, mean loss: 0.33943971877764956
Epoch: 69, step: 85, loss: 0.30363041162490845, mean loss: 0.33943935968630407
Epoch: 69, step: 86, loss: 0.36889517307281494, mean loss: 0.33943965506263035
Epoch: 69, step: 87, loss: 0.31601375341415405, mean loss: 0.33943942015526957
Epoch: 69, step: 88, loss: 0.3458617329597473, mean loss: 0.3394394845554982
Epoch: 69, step: 89, loss: 0.3129080832004547, mean loss: 0.33943921851252695
Epoch: 69, step: 90, loss: 0.33174076676368713, mean loss: 0.3394391413172664
Epoch: 69, step: 91, loss: 0.3241012394428253, mean loss: 0.33943898751991886
Epoch: 69, step: 92, loss: 0.3491603136062622, mean loss: 0.33943908499734354
Epoch: 69, step: 93, loss: 0.3432812988758087, mean loss: 0.339439123523503
Epoch: 69, step: 94, loss: 0.33193862438201904, mean loss: 0.3394390483162039
Epoch: 69, step: 95, loss: 0.3299364745616913, mean loss: 0.33943895303511307
Epoch: 69, step: 96, loss: 0.3635907471179962, mean loss: 0.33943919519963317
Epoch: 69, step: 97, loss: 0.3525694012641907, mean loss: 0.3394393268518888
Epoch: 69, step: 98, loss: 0.2896278202533722, mean loss: 0.3394388274133106
Epoch: 69, step: 99, loss: 0.2976212799549103, mean loss: 0.3394384081309305
Epoch: 69, step: 100, loss: 0.3411611318588257, mean loss: 0.3394384254035949
Epoch: 69, step: 101, loss: 0.3275075852870941, mean loss: 0.33943830578178463
Epoch: 69, step: 102, loss: 0.32614222168922424, mean loss: 0.3394381724730078
Epoch: 69, step: 103, loss: 0.34475913643836975, mean loss: 0.33943822582135313
Epoch: 69, step: 104, loss: 0.3583011329174042, mean loss: 0.339438414940242
Epoch: 69, step: 105, loss: 0.29412132501602173, mean loss: 0.33943796059713754
Epoch: 69, step: 106, loss: 0.3414627015590668, mean loss: 0.33943798089671706
Epoch: 69, step: 107, loss: 0.34109222888946533, mean loss: 0.33943799748165443
Epoch: 69, step: 108, loss: 0.3233983516693115, mean loss: 0.3394378366751397
Epoch: 69, step: 109, loss: 0.32195693254470825, mean loss: 0.3394376614209528
Epoch: 69, step: 110, loss: 0.33141690492630005, mean loss: 0.339437581009948
Epoch: 69, step: 111, loss: 0.32507267594337463, mean loss: 0.3394374369979872
Epoch: 69, step: 112, loss: 0.313058465719223, mean loss: 0.3394371725444961
Epoch: 69, step: 113, loss: 0.3018034100532532, mean loss: 0.33943679526366916
Epoch: 69, step: 114, loss: 0.32312873005867004, mean loss: 0.33943663177593264
Epoch: 69, step: 115, loss: 0.36456653475761414, mean loss: 0.33943688369973346
Epoch: 69, step: 116, loss: 0.3178485333919525, mean loss: 0.33943666728167776
Epoch: 69, step: 117, loss: 0.33866870403289795, mean loss: 0.3394366595831068
Epoch: 69, step: 118, loss: 0.35694757103919983, mean loss: 0.3394368351222924
Epoch: 69, step: 119, loss: 0.3458101749420166, mean loss: 0.3394368990115805
Epoch: 69, step: 120, loss: 0.35591790080070496, mean loss: 0.33943706422306225
Epoch: 69, step: 121, loss: 0.31110596656799316, mean loss: 0.33943678022480994
Epoch: 69, step: 122, loss: 0.3352910876274109, mean loss: 0.3394367386677314
Epoch: 69, step: 123, loss: 0.31402286887168884, mean loss: 0.3394364839176332
Epoch: 69, step: 124, loss: 0.36353787779808044, mean loss: 0.3394367255089753
Epoch: 69, step: 125, loss: 0.33415359258651733, mean loss: 0.33943667255160753
Epoch: 69, step: 126, loss: 0.330764502286911, mean loss: 0.3394365856238862
Epoch: 69, step: 127, loss: 0.33521077036857605, mean loss: 0.33943654326576844
Epoch: 69, step: 128, loss: 0.3302355408668518, mean loss: 0.3394364510390116
Epoch: 69, step: 129, loss: 0.3387168049812317, mean loss: 0.3394364438256718
Epoch: 69, step: 130, loss: 0.34850212931632996, mean loss: 0.3394365346942505
Epoch: 69, step: 131, loss: 0.30031946301460266, mean loss: 0.3394361426139073
Epoch: 69, step: 132, loss: 0.3031816780567169, mean loss: 0.3394357792298446
Epoch: 69, step: 133, loss: 0.34320080280303955, mean loss: 0.33943581696687547
Epoch: 69, step: 134, loss: 0.37795713543891907, mean loss: 0.3394362030642231
Epoch: 69, step: 135, loss: 0.3375268280506134, mean loss: 0.3394361839268398
Epoch: 69, step: 136, loss: 0.3489258885383606, mean loss: 0.3394362790397923
Epoch: 69, step: 137, loss: 0.33484092354774475, mean loss: 0.3394362329821471
Epoch: 69, step: 138, loss: 0.31597816944122314, mean loss: 0.339435997872515
Epoch: 69, step: 139, loss: 0.37172794342041016, mean loss: 0.339436321516934
Epoch: 69, step: 140, loss: 0.3522627055644989, mean loss: 0.3394364500674421
Epoch: 69, step: 141, loss: 0.3259992301464081, mean loss: 0.3394363153962729
Epoch: 69, step: 142, loss: 0.3273470997810364, mean loss: 0.3394361942363533
Epoch: 69, step: 143, loss: 0.3418857157230377, mean loss: 0.33943621878557645
Epoch: 69, step: 144, loss: 0.3138871490955353, mean loss: 0.33943596273412685
Epoch: 69, step: 145, loss: 0.3518509268760681, mean loss: 0.3394360871550058
Epoch: 69, step: 146, loss: 0.32055583596229553, mean loss: 0.33943589794190143
Epoch: 69, step: 147, loss: 0.31419819593429565, mean loss: 0.33943564501856693
Epoch: 69, step: 148, loss: 0.31257012486457825, mean loss: 0.33943537578451216
Epoch: 69, step: 149, loss: 0.31829914450645447, mean loss: 0.339435163968914
Epoch: 69, step: 150, loss: 0.374394953250885, mean loss: 0.3394355143130398
Epoch: 69, step: 151, loss: 0.32631781697273254, mean loss: 0.3394353828573804
Epoch: 69, step: 152, loss: 0.31302568316459656, mean loss: 0.33943511820196054
Epoch: 69, step: 153, loss: 0.32018381357192993, mean loss: 0.33943492528378605
Epoch: 69, step: 154, loss: 0.3317115008831024, mean loss: 0.3394348478877844
Epoch: 69, step: 155, loss: 0.3708251416683197, mean loss: 0.3394351624450012
Epoch: 69, step: 156, loss: 0.32585373520851135, mean loss: 0.3394350263490101
Epoch: 69, step: 157, loss: 0.3246844708919525, mean loss: 0.33943487853896687
Epoch: 69, step: 158, loss: 0.3244014084339142, mean loss: 0.3394347278954466
Epoch: 69, step: 159, loss: 0.3390781283378601, mean loss: 0.33943472432216154
Epoch: 69, step: 160, loss: 0.33070170879364014, mean loss: 0.3394346368143654
Epoch: 69, step: 161, loss: 0.3550906479358673, mean loss: 0.3394347936913682
Epoch: 69, step: 162, loss: 0.3482539653778076, mean loss: 0.33943488206070743
Epoch: 69, step: 163, loss: 0.3055568337440491, mean loss: 0.33943454260130546
Epoch: 69, step: 164, loss: 0.33366212248802185, mean loss: 0.3394344847620041
Epoch: 69, step: 165, loss: 0.33621159195899963, mean loss: 0.33943445246913617
Epoch: 69, step: 166, loss: 0.32444053888320923, mean loss: 0.33943430223403714
Epoch: 69, step: 167, loss: 0.33054476976394653, mean loss: 0.3394342131641354
Epoch: 69, step: 168, loss: 0.34773918986320496, mean loss: 0.33943429637616584
Epoch: 69, step: 169, loss: 0.3317042291164398, mean loss: 0.33943421892523845
Epoch: 69, step: 170, loss: 0.2993038296699524, mean loss: 0.3394338168453317
Epoch: 69, step: 171, loss: 0.3243650496006012, mean loss: 0.33943366586778234
Epoch: 69, step: 172, loss: 0.33129173517227173, mean loss: 0.3394335842926669
Epoch: 69, step: 173, loss: 0.31151124835014343, mean loss: 0.33943330453777315
Epoch: 69, step: 174, loss: 0.3213551640510559, mean loss: 0.3394331234140444
Epoch: 69, step: 175, loss: 0.36062636971473694, mean loss: 0.3394333357456909
Epoch: 69, step: 176, loss: 0.35421451926231384, mean loss: 0.33943348383445204
Epoch: 69, step: 177, loss: 0.3770262598991394, mean loss: 0.3394338604627413
Epoch: 69, step: 178, loss: 0.3480500876903534, mean loss: 0.33943394678470923
Epoch: 69, step: 179, loss: 0.3516237735748291, mean loss: 0.3394340689076834
Epoch: 69, step: 180, loss: 0.3349587917327881, mean loss: 0.33943402407286394
Epoch: 69, step: 181, loss: 0.3331473767757416, mean loss: 0.3394339610917654
Epoch: 69, step: 182, loss: 0.3816000521183014, mean loss: 0.3394343835172658
Epoch: 69, step: 183, loss: 0.3101573884487152, mean loss: 0.3394340902193789
Epoch: 69, step: 184, loss: 0.3265970051288605, mean loss: 0.33943396161833217
Epoch: 69, step: 185, loss: 0.37601274251937866, mean loss: 0.3394343280584045
Epoch: 69, step: 186, loss: 0.32286542654037476, mean loss: 0.3394341620755998
Epoch: 69, step: 187, loss: 0.3619655668735504, mean loss: 0.33943438778689966
Epoch: 69, step: 188, loss: 0.3146834075450897, mean loss: 0.33943413984319576
Epoch: 69, step: 189, loss: 0.3610052466392517, mean loss: 0.3394343559302552
Epoch: 69, step: 190, loss: 0.32620352506637573, mean loss: 0.33943422339265655
Epoch: 69, step: 191, loss: 0.31645768880844116, mean loss: 0.3394339932314334
Epoch: 69, step: 192, loss: 0.3290536403656006, mean loss: 0.33943388925009665
Epoch: 69, step: 193, loss: 0.33868566155433655, mean loss: 0.33943388175507816
Epoch: 69, step: 194, loss: 0.33984673023223877, mean loss: 0.3394338858905519
Epoch: 69, step: 195, loss: 0.34437111020088196, mean loss: 0.33943393534587996
Epoch: 69, step: 196, loss: 0.323804646730423, mean loss: 0.33943377879154807
Epoch: 69, step: 197, loss: 0.3961969017982483, mean loss: 0.33943434736661277
Epoch: 69, step: 198, loss: 0.312608540058136, mean loss: 0.3394340786651823
Epoch: 69, step: 199, loss: 0.356078565120697, mean loss: 0.33943424538346484
Epoch: 69, step: 200, loss: 0.35464730858802795, mean loss: 0.3394343977624747
Epoch: 69, step: 201, loss: 0.31389641761779785, mean loss: 0.33943414196828664
Epoch: 69, step: 202, loss: 0.355117529630661, mean loss: 0.339434299055073
Epoch: 69, step: 203, loss: 0.3008250892162323, mean loss: 0.33943391234423725
Epoch: 69, step: 204, loss: 0.35396909713745117, mean loss: 0.33943405792756265
Epoch: 69, step: 205, loss: 0.30720993876457214, mean loss: 0.3394337351764242
Epoch: 69, step: 206, loss: 0.36371201276779175, mean loss: 0.33943397834096845
Epoch: 69, step: 207, loss: 0.31098634004592896, mean loss: 0.33943369342010893
Epoch: 69, step: 208, loss: 0.31759583950042725, mean loss: 0.3394334747025575
Epoch: 69, step: 209, loss: 0.3693597912788391, mean loss: 0.3394337744272994
Epoch: 69, step: 210, loss: 0.34890836477279663, mean loss: 0.3394338693183862
Epoch: 69, step: 211, loss: 0.3376668691635132, mean loss: 0.33943385162148537
Epoch: 69, step: 212, loss: 0.33665746450424194, mean loss: 0.33943382381562737
Epoch: 69, step: 213, loss: 0.36429518461227417, mean loss: 0.339434072802716
Epoch: 69, step: 214, loss: 0.33468446135520935, mean loss: 0.3394340252357267
Epoch: 69, step: 215, loss: 0.3077283203601837, mean loss: 0.339433707708738
Epoch: 69, step: 216, loss: 0.33964771032333374, mean loss: 0.3394337098519146
Epoch: 69, step: 217, loss: 0.3379635214805603, mean loss: 0.3394336951285348
Epoch: 69, step: 218, loss: 0.34497708082199097, mean loss: 0.3394337506428875
Epoch: 69, step: 219, loss: 0.3130723536014557, mean loss: 0.33943348664876555
Epoch: 69, step: 220, loss: 0.336551308631897, mean loss: 0.3394334577857112
Epoch: 69, step: 221, loss: 0.31551453471183777, mean loss: 0.33943321825634876
Epoch: 69, step: 222, loss: 0.33420026302337646, mean loss: 0.33943316585290756
Epoch: 69, step: 223, loss: 0.3209342956542969, mean loss: 0.3394329806048583
Epoch: 69, step: 224, loss: 0.34102940559387207, mean loss: 0.3394329965913294
Epoch: 69, step: 225, loss: 0.31902408599853516, mean loss: 0.3394327922201913
Epoch: 69, step: 226, loss: 0.3595542907714844, mean loss: 0.3394329937112195
Epoch: 69, step: 227, loss: 0.4195586144924164, mean loss: 0.3394337960586198
Epoch: 69, step: 228, loss: 0.31819865107536316, mean loss: 0.339433583420108
Epoch: 69, step: 229, loss: 0.29261282086372375, mean loss: 0.33943311458424236
Epoch: 69, step: 230, loss: 0.33712461590766907, mean loss: 0.3394330914685117
Epoch: 69, step: 231, loss: 0.3366142511367798, mean loss: 0.3394330632428505
Epoch: 69, step: 232, loss: 0.33461540937423706, mean loss: 0.3394330150031178
Epoch: 69, step: 233, loss: 0.39120063185691833, mean loss: 0.33943353335314136
Epoch: 69, step: 234, loss: 0.39912149310112, mean loss: 0.33943413100370806
Epoch: 69, step: 235, loss: 0.32797130942344666, mean loss: 0.3394340162285801
Epoch: 69, step: 236, loss: 0.3398873805999756, mean loss: 0.33943402076798884
Epoch: 69, step: 237, loss: 0.3695530891418457, mean loss: 0.3394343223386516
Epoch: 69, step: 238, loss: 0.3700234889984131, mean loss: 0.33943462861316137
Epoch: 69, step: 239, loss: 0.38187888264656067, mean loss: 0.3394350535826639
Epoch: 69, step: 240, loss: 0.3242206573486328, mean loss: 0.339434901251334
Epoch: 69, step: 241, loss: 0.3047679662704468, mean loss: 0.33943455415853097
Epoch: 69, step: 242, loss: 0.33184003829956055, mean loss: 0.3394344781213674
Epoch: 69, step: 243, loss: 0.32376793026924133, mean loss: 0.33943432126766443
Epoch: 69, step: 244, loss: 0.32519981265068054, mean loss: 0.3394341787529858
Epoch: 69, step: 245, loss: 0.35901978611946106, mean loss: 0.3394343748404427
Epoch: 69, step: 246, loss: 0.36705365777015686, mean loss: 0.3394346513567961
Epoch: 69, step: 247, loss: 0.33907145261764526, mean loss: 0.33943464772059073
Epoch: 69, step: 248, loss: 0.326703816652298, mean loss: 0.3394345202657069
Epoch: 69, step: 249, loss: 0.3569354712963104, mean loss: 0.33943469547495575
Epoch: 69, step: 250, loss: 0.3272094130516052, mean loss: 0.3394345730838295
Epoch: 69, step: 251, loss: 0.3279050886631012, mean loss: 0.3394344576597103
Epoch: 69, step: 252, loss: 0.3370096683502197, mean loss: 0.33943443338487217
Epoch: 69, step: 253, loss: 0.3554753363132477, mean loss: 0.3394345939705457
Epoch: 69, step: 254, loss: 0.30358171463012695, mean loss: 0.3394342350505295
Epoch: 69, step: 255, loss: 0.36737462878227234, mean loss: 0.33943451475654934
Epoch: 69, step: 256, loss: 0.3115485906600952, mean loss: 0.33943423559860936
Epoch: 69, step: 257, loss: 0.30206725001335144, mean loss: 0.33943386153224314
Epoch: 69, step: 258, loss: 0.32421234250068665, mean loss: 0.3394337091570589
Epoch: 69, step: 259, loss: 0.31770315766334534, mean loss: 0.33943349162531095
Epoch: 69, step: 260, loss: 0.3141460716724396, mean loss: 0.3394332384903824
Epoch: 69, step: 261, loss: 0.3895929753780365, mean loss: 0.339433740599903
Epoch: 69, step: 262, loss: 0.3380906879901886, mean loss: 0.33943372715579834
Epoch: 69, step: 263, loss: 0.35440224409103394, mean loss: 0.3394338769908027
Epoch: 69, step: 264, loss: 0.34598639607429504, mean loss: 0.33943394258092774
Epoch: 69, step: 265, loss: 0.3322245180606842, mean loss: 0.33943387041596085
Epoch: 69, step: 266, loss: 0.3078761696815491, mean loss: 0.3394335545325466
Epoch: 69, step: 267, loss: 0.31681370735168457, mean loss: 0.33943332811671556
Epoch: 69, step: 268, loss: 0.32489216327667236, mean loss: 0.3394331825667947
Epoch: 69, step: 269, loss: 0.3054964244365692, mean loss: 0.33943284287990777
Epoch: 69, step: 270, loss: 0.3337372839450836, mean loss: 0.33943278587130044
Epoch: 69, step: 271, loss: 0.31919214129447937, mean loss: 0.33943258327846926
Epoch: 69, step: 272, loss: 0.32351335883140564, mean loss: 0.3394324239412279
Epoch: 69, step: 273, loss: 0.33092203736305237, mean loss: 0.33943233876069967
Epoch: 69, step: 274, loss: 0.3567465841770172, mean loss: 0.3394325120573879
Epoch: 69, step: 275, loss: 0.34224578738212585, mean loss: 0.33943254021491975
Epoch: 69, step: 276, loss: 0.309332013130188, mean loss: 0.3394322389475463
Epoch: 69, step: 277, loss: 0.33420923352241516, mean loss: 0.33943218667253555
Epoch: 69, step: 278, loss: 0.31905847787857056, mean loss: 0.3394319827621238
Epoch: 69, step: 279, loss: 0.3040710985660553, mean loss: 0.33943162885600064
Epoch: 69, step: 280, loss: 0.32699134945869446, mean loss: 0.3394315043498666
Epoch: 69, step: 281, loss: 0.3463086783885956, mean loss: 0.33943157317804606
Epoch: 69, step: 282, loss: 0.33401763439178467, mean loss: 0.33943151899476975
Epoch: 69, step: 283, loss: 0.31416428089141846, mean loss: 0.339431266120089
Epoch: 69, step: 284, loss: 0.3164841830730438, mean loss: 0.33943103646783324
Epoch: 69, step: 285, loss: 0.317217081785202, mean loss: 0.3394308141548823
Epoch: 69, step: 286, loss: 0.30029016733169556, mean loss: 0.33943042244679883
Epoch: 69, step: 287, loss: 0.3105347454547882, mean loss: 0.33943013327025473
Epoch: 69, step: 288, loss: 0.30279749631881714, mean loss: 0.3394297666689342
Epoch: 69, step: 289, loss: 0.33389270305633545, mean loss: 0.3394297112572935
Epoch: 69, step: 290, loss: 0.30834752321243286, mean loss: 0.33942940020834733
Epoch: 69, step: 291, loss: 0.3040107488632202, mean loss: 0.33942904576663585
Epoch: 69, step: 292, loss: 0.3462735414505005, mean loss: 0.33942911426022315
Epoch: 69, step: 293, loss: 0.2977033257484436, mean loss: 0.33942869671005294
Epoch: 69, step: 294, loss: 0.34011808037757874, mean loss: 0.33942870360864963
Epoch: 69, step: 295, loss: 0.3351019024848938, mean loss: 0.3394286603111961
Epoch: 69, step: 296, loss: 0.31760257482528687, mean loss: 0.33942844190400845
Epoch: 69, step: 297, loss: 0.3715594410896301, mean loss: 0.339428763426205
Epoch: 69, step: 298, loss: 0.3056071996688843, mean loss: 0.33942842499058423
Epoch: 69, step: 299, loss: 0.3277794122695923, mean loss: 0.3394283084258556
Epoch: 69, step: 300, loss: 0.3367287516593933, mean loss: 0.33942828141326997
Epoch: 69, step: 301, loss: 0.3264564275741577, mean loss: 0.3394281516142562
Epoch: 69, step: 302, loss: 0.30361294746398926, mean loss: 0.3394277932436086
Epoch: 69, step: 303, loss: 0.35891175270080566, mean loss: 0.3394279882001771
Epoch: 69, step: 304, loss: 0.3079236149787903, mean loss: 0.33942767297045934
Epoch: 69, step: 305, loss: 0.3330419659614563, mean loss: 0.3394276090763306
Epoch: 69, step: 306, loss: 0.36608439683914185, mean loss: 0.3394278757962386
Epoch: 69, step: 307, loss: 0.4019359052181244, mean loss: 0.3394285012267739
Epoch: 69, step: 308, loss: 0.3403606414794922, mean loss: 0.33942851055330603
Epoch: 69, step: 309, loss: 0.28345999121665955, mean loss: 0.33942795056571934
Epoch: 69, step: 310, loss: 0.32131877541542053, mean loss: 0.33942776937793834
Epoch: 69, step: 311, loss: 0.2785378694534302, mean loss: 0.33942716016214686
Epoch: 69, step: 312, loss: 0.3327682614326477, mean loss: 0.3394270935391818
Epoch: 69, step: 313, loss: 0.30881479382514954, mean loss: 0.3394267872630466
Epoch: 69, step: 314, loss: 0.32292747497558594, mean loss: 0.33942662218903746
Epoch: 69, step: 315, loss: 0.3959294259548187, mean loss: 0.3394271874884188
Epoch: 69, step: 316, loss: 0.3492484390735626, mean loss: 0.3394272857471163
Epoch: 69, step: 317, loss: 0.3321192264556885, mean loss: 0.33942721263289083
Epoch: 69, step: 318, loss: 0.3085917830467224, mean loss: 0.33942690413977306
Epoch: 69, step: 319, loss: 0.3249616026878357, mean loss: 0.3394267594230832
Epoch: 69, step: 320, loss: 0.29863324761390686, mean loss: 0.33942635131247756
Epoch: 69, step: 321, loss: 0.3340461552143097, mean loss: 0.33942629748791026
Epoch: 69, step: 322, loss: 0.31400349736213684, mean loss: 0.33942604315563274
Epoch: 69, step: 323, loss: 0.2998599410057068, mean loss: 0.3394256473362835
Epoch: 69, step: 324, loss: 0.337674617767334, mean loss: 0.33942562981915614
Epoch: 69, step: 325, loss: 0.32123228907585144, mean loss: 0.33942544781658773
Epoch: 69, step: 326, loss: 0.30675050616264343, mean loss: 0.3394251209462292
Epoch: 69, step: 327, loss: 0.30057376623153687, mean loss: 0.33942473229276676
Epoch: 69, step: 328, loss: 0.37488266825675964, mean loss: 0.3394250869962726
Epoch: 69, step: 329, loss: 0.3255371153354645, mean loss: 0.33942494806932083
Epoch: 69, step: 330, loss: 0.32841378450393677, mean loss: 0.3394248379213363
Epoch: 69, step: 331, loss: 0.30778050422668457, mean loss: 0.3394245213767051
Epoch: 69, step: 332, loss: 0.321625292301178, mean loss: 0.3394243433292196
Epoch: 69, step: 333, loss: 0.29688340425491333, mean loss: 0.33942391779216774
Epoch: 69, step: 334, loss: 0.3486289083957672, mean loss: 0.33942400986877597
Epoch: 69, step: 335, loss: 0.3124755620956421, mean loss: 0.33942374030882144
Epoch: 69, step: 336, loss: 0.3126722574234009, mean loss: 0.33942347272174406
Epoch: 69, step: 337, loss: 0.3529917001724243, mean loss: 0.33942360843930514
Epoch: 69, step: 338, loss: 0.3513062000274658, mean loss: 0.3394237272949349
Epoch: 69, step: 339, loss: 0.3010375499725342, mean loss: 0.33942334334101276
Epoch: 69, step: 340, loss: 0.323541522026062, mean loss: 0.339423184486263
Epoch: 69, step: 341, loss: 0.32240545749664307, mean loss: 0.33942301427154586
Epoch: 69, step: 342, loss: 0.329546719789505, mean loss: 0.33942291548785647
Epoch: 69, step: 343, loss: 0.32233181595802307, mean loss: 0.33942274454267213
Epoch: 69, step: 344, loss: 0.33564358949661255, mean loss: 0.33942270674393993
Epoch: 69, step: 345, loss: 0.2965767979621887, mean loss: 0.3394222782077156
Epoch: 69, step: 346, loss: 0.31797996163368225, mean loss: 0.3394220637480917
Epoch: 69, step: 347, loss: 0.3245854675769806, mean loss: 0.3394219153583876
Epoch: 69, step: 348, loss: 0.3311784565448761, mean loss: 0.33942183291143246
Epoch: 69, step: 349, loss: 0.31601423025131226, mean loss: 0.3394215988026306
Epoch: 69, step: 350, loss: 0.2958660423755646, mean loss: 0.33942116319043675
Epoch: 69, step: 351, loss: 0.3196081221103668, mean loss: 0.33942096503624747
Epoch: 69, step: 352, loss: 0.36722248792648315, mean loss: 0.3394212430820614
Epoch: 69, step: 353, loss: 0.3594052791595459, mean loss: 0.3394214429424082
Epoch: 69, step: 354, loss: 0.3231215178966522, mean loss: 0.33942127992848653
Epoch: 69, step: 355, loss: 0.3336794376373291, mean loss: 0.3394212225054698
Epoch: 69, step: 356, loss: 0.36524298787117004, mean loss: 0.33942148074119993
Epoch: 69, step: 357, loss: 0.3511882722377777, mean loss: 0.3394215984161754
Epoch: 69, step: 358, loss: 0.34652552008628845, mean loss: 0.33942166945894425
Epoch: 69, step: 359, loss: 0.3242224454879761, mean loss: 0.3394215174606246
Epoch: 69, step: 360, loss: 0.3075995445251465, mean loss: 0.3394211992313484
Epoch: 69, step: 361, loss: 0.32616162300109863, mean loss: 0.33942106663293414
Epoch: 69, step: 362, loss: 0.3833601474761963, mean loss: 0.33942150602813653
Epoch: 69, step: 363, loss: 0.32851460576057434, mean loss: 0.33942139695913387
Epoch: 69, step: 364, loss: 0.3073074519634247, mean loss: 0.33942107582289527
Epoch: 69, step: 365, loss: 0.3317273259162903, mean loss: 0.33942099888693494
Epoch: 69, step: 366, loss: 0.3309690058231354, mean loss: 0.3394209143695398
Epoch: 69, step: 367, loss: 0.3366204500198364, mean loss: 0.33942088636601647
Epoch: 69, step: 368, loss: 0.35484567284584045, mean loss: 0.3394210406061693
Epoch: 69, step: 369, loss: 0.3276994228363037, mean loss: 0.3394209233970241
Epoch: 69, step: 370, loss: 0.38431572914123535, mean loss: 0.3394213723136574
Epoch: 69, step: 371, loss: 0.3033725917339325, mean loss: 0.3394210118546883
Epoch: 69, step: 372, loss: 0.3247378468513489, mean loss: 0.33942086503625196
Epoch: 69, step: 373, loss: 0.3324684798717499, mean loss: 0.339420795519352
Epoch: 69, step: 374, loss: 0.3597685992717743, mean loss: 0.3394209989750094
Epoch: 69, step: 375, loss: 0.3550504446029663, mean loss: 0.3394211552507126
Epoch: 69, step: 376, loss: 0.330817312002182, mean loss: 0.33942106922346366
Epoch: 69, step: 377, loss: 0.33180487155914307, mean loss: 0.3394209930721482
Epoch: 69, step: 378, loss: 0.32107236981391907, mean loss: 0.3394208096134344
Epoch: 69, step: 379, loss: 0.2851145565509796, mean loss: 0.3394202666377799
Epoch: 69, step: 380, loss: 0.34561827778816223, mean loss: 0.3394203286073566
Epoch: 69, step: 381, loss: 0.3568868935108185, mean loss: 0.33942050324157147
Epoch: 69, step: 382, loss: 0.3213653266429901, mean loss: 0.33942032272410383
Epoch: 69, step: 383, loss: 0.3157349228858948, mean loss: 0.33942008591746675
Epoch: 69, step: 384, loss: 0.30314362049102783, mean loss: 0.33941972322897707
Epoch: 69, step: 385, loss: 0.32131245732307434, mean loss: 0.33941954219614523
Epoch: 69, step: 386, loss: 0.37021973729133606, mean loss: 0.33941985012727205
Epoch: 69, step: 387, loss: 0.40456274151802063, mean loss: 0.3394205013998805
Epoch: 69, step: 388, loss: 0.33022648096084595, mean loss: 0.3394204094826554
Epoch: 69, step: 389, loss: 0.3272612392902374, mean loss: 0.33942028792255907
Epoch: 69, step: 390, loss: 0.30262377858161926, mean loss: 0.3394199200567894
Epoch: 69, step: 391, loss: 0.2939746081829071, mean loss: 0.3394194657308819
Epoch: 69, step: 392, loss: 0.3332599401473999, mean loss: 0.3394194041534835
Epoch: 69, step: 393, loss: 0.37973496317863464, mean loss: 0.33941980718816334
Epoch: 69, step: 394, loss: 0.3386234939098358, mean loss: 0.3394197992274984
Epoch: 69, step: 395, loss: 0.3382943272590637, mean loss: 0.33941978797637906
Epoch: 69, step: 396, loss: 0.3231707513332367, mean loss: 0.33941962553961674
Epoch: 69, step: 397, loss: 0.32296276092529297, mean loss: 0.3394194610269049
Epoch: 69, step: 398, loss: 0.3078489899635315, mean loss: 0.3394191454326523
Epoch: 69, step: 399, loss: 0.31941139698028564, mean loss: 0.3394189454271697
Epoch: 69, step: 400, loss: 0.31777510046958923, mean loss: 0.33941872906877274
Epoch: 69, step: 401, loss: 0.3257748782634735, mean loss: 0.3394185926820916
Epoch: 69, step: 402, loss: 0.3042115569114685, mean loss: 0.33941824074898785
Epoch: 69, step: 403, loss: 0.3295775353908539, mean loss: 0.3394181423812814
Epoch: 69, step: 404, loss: 0.32533860206604004, mean loss: 0.33941800164358066
Epoch: 69, step: 405, loss: 0.3183061182498932, mean loss: 0.3394177906133794
Epoch: 69, step: 406, loss: 0.3070550560951233, mean loss: 0.33941746712513415
Epoch: 69, step: 407, loss: 0.3099687397480011, mean loss: 0.3394171727673778
Epoch: 69, step: 408, loss: 0.3076004087924957, mean loss: 0.3394168547428491
Epoch: 69, step: 409, loss: 0.30236372351646423, mean loss: 0.33941648438190286
Epoch: 69, step: 410, loss: 0.32251396775245667, mean loss: 0.3394163154361411
Epoch: 69, step: 411, loss: 0.320172518491745, mean loss: 0.33941612309049757
Epoch: 69, step: 412, loss: 0.3314274251461029, mean loss: 0.3394160432426436
Epoch: 69, step: 413, loss: 0.3067963421344757, mean loss: 0.3394157172086495
Epoch: 69, step: 414, loss: 0.2807081639766693, mean loss: 0.3394151304323731
Epoch: 69, step: 415, loss: 0.32113832235336304, mean loss: 0.3394149477592823
Epoch: 69, step: 416, loss: 0.32570940256118774, mean loss: 0.33941481077643126
Epoch: 69, step: 417, loss: 0.28428763151168823, mean loss: 0.3394142598021647
Epoch: 69, step: 418, loss: 0.3300473690032959, mean loss: 0.3394141661847463
Epoch: 69, step: 419, loss: 0.31137487292289734, mean loss: 0.33941388594874583
Epoch: 69, step: 420, loss: 0.29129743576049805, mean loss: 0.3394134050583515
Epoch: 69, step: 421, loss: 0.32846271991729736, mean loss: 0.33941329561497724
Epoch: 69, step: 422, loss: 0.34228914976119995, mean loss: 0.3394133243565612
Epoch: 69, step: 423, loss: 0.3272703289985657, mean loss: 0.3394132029994219
Epoch: 69, step: 424, loss: 0.3248170018196106, mean loss: 0.33941305712639264
Epoch: 69, step: 425, loss: 0.31390970945358276, mean loss: 0.33941280225093867
Epoch: 69, step: 426, loss: 0.32621583342552185, mean loss: 0.339412670364339
Epoch: 69, step: 427, loss: 0.3295414447784424, mean loss: 0.33941257171521855
Epoch: 69, step: 428, loss: 0.32339659333229065, mean loss: 0.33941241165947095
Epoch: 69, step: 429, loss: 0.3289366364479065, mean loss: 0.33941230697081337
Epoch: 69, step: 430, loss: 0.3490384817123413, mean loss: 0.3394124031681086
Epoch: 69, step: 431, loss: 0.36249032616615295, mean loss: 0.33941263379051534
Epoch: 69, step: 432, loss: 0.3224569857120514, mean loss: 0.33941246435094785
Epoch: 69, step: 433, loss: 0.31700757145881653, mean loss: 0.33941224045874346
Epoch: 69, step: 434, loss: 0.3249961733818054, mean loss: 0.33941209640035414
Epoch: 69, step: 435, loss: 0.3487096130847931, mean loss: 0.33941218930862704
Epoch: 69, step: 436, loss: 0.35543081164360046, mean loss: 0.33941234937799974
Epoch: 69, step: 437, loss: 0.3435579240322113, mean loss: 0.3394123908030917
Epoch: 69, step: 438, loss: 0.3393345773220062, mean loss: 0.3394123900255401
Epoch: 69, step: 439, loss: 0.3134656548500061, mean loss: 0.33941213075523374
Epoch: 69, step: 440, loss: 0.34924939274787903, mean loss: 0.33941222905216506
Epoch: 69, step: 441, loss: 0.38421934843063354, mean loss: 0.3394126767741357
Epoch: 69, step: 442, loss: 0.3102289140224457, mean loss: 0.33941238516687794
Epoch: 69, step: 443, loss: 0.3499319851398468, mean loss: 0.3394124902787881
Epoch: 69, step: 444, loss: 0.3266202211380005, mean loss: 0.33941236245963025
Epoch: 69, step: 445, loss: 0.3113362789154053, mean loss: 0.33941208192883005
Epoch: 69, step: 446, loss: 0.3270552456378937, mean loss: 0.3394119584629438
Epoch: 69, step: 447, loss: 0.3578230142593384, mean loss: 0.3394121424189787
Epoch: 69, step: 448, loss: 0.3314386010169983, mean loss: 0.3394120627512822
Epoch: 69, step: 449, loss: 0.3243085741996765, mean loss: 0.3394119118461751
Epoch: 69, step: 450, loss: 0.32497698068618774, mean loss: 0.3394117676223382
Epoch: 69, step: 451, loss: 0.36076951026916504, mean loss: 0.3394119810119818
Epoch: 69, step: 452, loss: 0.34057673811912537, mean loss: 0.33941199264919575
Epoch: 69, step: 453, loss: 0.3484978675842285, mean loss: 0.33941208342624574
Epoch: 69, step: 454, loss: 0.2942214012145996, mean loss: 0.33941163193028495
Epoch: 69, step: 455, loss: 0.34970828890800476, mean loss: 0.33941173480221254
Epoch: 69, step: 456, loss: 0.3618651032447815, mean loss: 0.3394119591272747
Epoch: 69, step: 457, loss: 0.32243630290031433, mean loss: 0.33941178953013373
Epoch: 69, step: 458, loss: 0.31622934341430664, mean loss: 0.33941155792569677
Epoch: 69, step: 459, loss: 0.33645251393318176, mean loss: 0.3394115283636364
Epoch: 69, step: 460, loss: 0.3186092674732208, mean loss: 0.3394113205426139
Epoch: 69, step: 461, loss: 0.34304842352867126, mean loss: 0.3394113568780351
Epoch: 69, step: 462, loss: 0.29614123702049255, mean loss: 0.339410924604787
Epoch: 69, step: 463, loss: 0.36168283224105835, mean loss: 0.3394111471013668
Epoch: 69, step: 464, loss: 0.3380777835845947, mean loss: 0.339411133781185
Epoch: 69, step: 465, loss: 0.3252103924751282, mean loss: 0.3394109919184719
Epoch: 69, step: 466, loss: 0.36494848132133484, mean loss: 0.33941124703060044
Epoch: 69, step: 467, loss: 0.31423941254615784, mean loss: 0.3394109955737707
Epoch: 69, step: 468, loss: 0.34099361300468445, mean loss: 0.33941101138334495
Epoch: 69, step: 469, loss: 0.3419000804424286, mean loss: 0.3394110362476793
Epoch: 69, step: 470, loss: 0.3020905554294586, mean loss: 0.33941066344177345
Epoch: 69, step: 471, loss: 0.33398962020874023, mean loss: 0.33941060928982525
Epoch: 69, step: 472, loss: 0.29288628697395325, mean loss: 0.33941014455316504
Epoch: 69, step: 473, loss: 0.3520124554634094, mean loss: 0.33941027043780103
Epoch: 69, step: 474, loss: 0.32542741298675537, mean loss: 0.33941013076426413
Epoch: 69, step: 475, loss: 0.3182496428489685, mean loss: 0.3394099193961173
Epoch: 69, step: 476, loss: 0.3384690582752228, mean loss: 0.3394099099981258
Epoch: 69, step: 477, loss: 0.301972895860672, mean loss: 0.3394095360542804
Epoch: 69, step: 478, loss: 0.40956395864486694, mean loss: 0.3394102367926572
Epoch: 69, step: 479, loss: 0.34709709882736206, mean loss: 0.33941031357221324
Epoch: 69, step: 480, loss: 0.34722083806991577, mean loss: 0.33941039158618186
Epoch: 69, step: 481, loss: 0.3639962375164032, mean loss: 0.33941063715487013
Epoch: 69, step: 482, loss: 0.3188518285751343, mean loss: 0.3394104318111434
Epoch: 69, step: 483, loss: 0.3245369791984558, mean loss: 0.33941028325488476
Epoch: 69, step: 484, loss: 0.3091890513896942, mean loss: 0.3394099814078011
Epoch: 69, step: 485, loss: 0.3173225522041321, mean loss: 0.33940976080264734
Epoch: 69, step: 486, loss: 0.35682687163352966, mean loss: 0.33940993475978837
Epoch: 69, step: 487, loss: 0.31877368688583374, mean loss: 0.3394097286528822
Epoch: 69, step: 488, loss: 0.33014097809791565, mean loss: 0.3394096360810914
Epoch: 69, step: 489, loss: 0.30834293365478516, mean loss: 0.33940932580501504
Epoch: 69, step: 490, loss: 0.3114044964313507, mean loss: 0.3394090461119315
Epoch: 69, step: 491, loss: 0.35901105403900146, mean loss: 0.33940924188142585
Epoch: 69, step: 492, loss: 0.3164243698120117, mean loss: 0.33940901232882803
Epoch: 69, step: 493, loss: 0.3002380430698395, mean loss: 0.33940862112769693
Epoch: 69, step: 494, loss: 0.31638476252555847, mean loss: 0.33940839119032884
Epoch: 69, step: 495, loss: 0.33372780680656433, mean loss: 0.33940833445936985
Epoch: 69, step: 496, loss: 0.32868316769599915, mean loss: 0.33940822735015747
Epoch: 69, step: 497, loss: 0.3361223340034485, mean loss: 0.33940819453519605
Epoch: 69, step: 498, loss: 0.32876139879226685, mean loss: 0.3394080882107766
Epoch: 69, step: 499, loss: 0.3543470799922943, mean loss: 0.33940823739780007
Epoch: 69, step: 500, loss: 0.31758809089660645, mean loss: 0.3394080194948621
Epoch: 69, step: 501, loss: 0.2879919409751892, mean loss: 0.33940750604264097
Epoch: 69, step: 502, loss: 0.3398645222187042, mean loss: 0.339407510606459
Epoch: 69, step: 503, loss: 0.3256593644618988, mean loss: 0.33940737331720255
Epoch: 69, step: 504, loss: 0.3232273459434509, mean loss: 0.339407211744746
Epoch: 69, step: 505, loss: 0.3182470202445984, mean loss: 0.33940700044287964
Epoch: 69, step: 506, loss: 0.3150451183319092, mean loss: 0.33940675717193597
Epoch: 69, step: 507, loss: 0.3124176859855652, mean loss: 0.33940648766930787
Epoch: 69, step: 508, loss: 0.32107192277908325, mean loss: 0.33940630458912524
Epoch: 69, step: 509, loss: 0.3550749719142914, mean loss: 0.33940646104736943
Epoch: 69, step: 510, loss: 0.3164317011833191, mean loss: 0.339406231637004
Epoch: 69, step: 511, loss: 0.3648606538772583, mean loss: 0.33940648580505767
Epoch: 69, step: 512, loss: 0.3483654856681824, mean loss: 0.3394065752617658
Epoch: 69, step: 513, loss: 0.31824713945388794, mean loss: 0.3394063639843239
Epoch: 69, step: 514, loss: 0.3361648917198181, mean loss: 0.33940633161847367
Epoch: 69, step: 515, loss: 0.2920362949371338, mean loss: 0.33940585863703865
Epoch: 69, step: 516, loss: 0.28533637523651123, mean loss: 0.33940531876820396
Epoch: 69, step: 517, loss: 0.33801838755607605, mean loss: 0.33940530492021775
Epoch: 69, step: 518, loss: 0.2981070876121521, mean loss: 0.3394048925771764
Epoch: 69, step: 519, loss: 0.30458319187164307, mean loss: 0.33940454490254174
Epoch: 69, step: 520, loss: 0.3297426104545593, mean loss: 0.33940444843465184
Epoch: 69, step: 521, loss: 0.33581164479255676, mean loss: 0.3394044125632922
Epoch: 69, step: 522, loss: 0.3743501901626587, mean loss: 0.3394047614663124
Epoch: 69, step: 523, loss: 0.3196181058883667, mean loss: 0.33940456391583734
Epoch: 69, step: 524, loss: 0.32492944598197937, mean loss: 0.3394044193973328
Epoch: 69, step: 525, loss: 0.3272969424724579, mean loss: 0.33940429851838744
Epoch: 69, step: 526, loss: 0.3199838101863861, mean loss: 0.33940410462954296
Epoch: 69, step: 527, loss: 0.33160051703453064, mean loss: 0.3394040267214363
Epoch: 69, step: 528, loss: 0.3321375846862793, mean loss: 0.33940395417671476
Epoch: 69, step: 529, loss: 0.3383433222770691, mean loss: 0.3394039435879731
Epoch: 69, step: 530, loss: 0.39621374011039734, mean loss: 0.33940451073879646
Epoch: 69, step: 531, loss: 0.31641367077827454, mean loss: 0.33940428121599514
Epoch: 69, step: 532, loss: 0.32443928718566895, mean loss: 0.33940413181853657
Epoch: 69, step: 533, loss: 0.32831069827079773, mean loss: 0.3394040210724694
Epoch: 69, step: 534, loss: 0.3381529748439789, mean loss: 0.3394040085833635
Epoch: 69, step: 535, loss: 0.3460965156555176, mean loss: 0.33940407539352074
Epoch: 69, step: 536, loss: 0.32557082176208496, mean loss: 0.33940393729988644
Epoch: 69, step: 537, loss: 0.33886751532554626, mean loss: 0.33940393194498425
Epoch: 69, step: 538, loss: 0.317298024892807, mean loss: 0.3394037112720913
Epoch: 69, step: 539, loss: 0.314123272895813, mean loss: 0.3394034589118615
Epoch: 69, step: 540, loss: 0.3091450035572052, mean loss: 0.33940315686193634
Epoch: 69, step: 541, loss: 0.317507803440094, mean loss: 0.3394029382974469
Epoch: 69, step: 542, loss: 0.29596421122550964, mean loss: 0.33940250468634003
Epoch: 69, step: 543, loss: 0.3284401595592499, mean loss: 0.33940239525985644
Epoch: 69, step: 544, loss: 0.3375588655471802, mean loss: 0.3394023768578669
Epoch: 69, step: 545, loss: 0.3086514174938202, mean loss: 0.33940206990692395
Epoch: 69, step: 546, loss: 0.32825058698654175, mean loss: 0.33940195859579414
Epoch: 69, step: 547, loss: 0.32446882128715515, mean loss: 0.33940180953868615
Epoch: 69, step: 548, loss: 0.3449523448944092, mean loss: 0.3394018649415444
Epoch: 69, step: 549, loss: 0.34156155586242676, mean loss: 0.33940188649835795
Epoch: 69, step: 550, loss: 0.288501501083374, mean loss: 0.3394013784445644
Epoch: 69, step: 551, loss: 0.31088805198669434, mean loss: 0.3394010938463445
Epoch: 69, step: 552, loss: 0.30864018201828003, mean loss: 0.3394007868175107
Epoch: 69, step: 553, loss: 0.36071449518203735, mean loss: 0.3394009995504018
Epoch: 69, step: 554, loss: 0.3163697123527527, mean loss: 0.33940076967658883
Epoch: 69, step: 555, loss: 0.30625253915786743, mean loss: 0.33940043882951004
Epoch: 69, step: 556, loss: 0.30398908257484436, mean loss: 0.33940008539807015
Epoch: 69, step: 557, loss: 0.37061408162117004, mean loss: 0.33940039693365337
Epoch: 69, step: 558, loss: 0.3292711675167084, mean loss: 0.33940029583849474
Epoch: 69, step: 559, loss: 0.36503300070762634, mean loss: 0.3394005516641252
Epoch: 69, step: 560, loss: 0.3426249921321869, mean loss: 0.3394005838451333
Epoch: 69, step: 561, loss: 0.3261338770389557, mean loss: 0.3394004514402269
Epoch: 69, step: 562, loss: 0.3259505033493042, mean loss: 0.3394003172078684
Epoch: 69, step: 563, loss: 0.37068265676498413, mean loss: 0.339400629406866
Epoch: 69, step: 564, loss: 0.2972789704799652, mean loss: 0.3394002090352237
Epoch: 69, step: 565, loss: 0.31549516320228577, mean loss: 0.33939997046667386
Epoch: 69, step: 566, loss: 0.3205011487007141, mean loss: 0.3393997818613251
Epoch: 69, step: 567, loss: 0.3761823773384094, mean loss: 0.3394001489384425
Epoch: 69, step: 568, loss: 0.36493033170700073, mean loss: 0.33940040371797214
Epoch: 69, step: 569, loss: 0.3142932057380676, mean loss: 0.33940015316213734
Epoch: 69, step: 570, loss: 0.3189331293106079, mean loss: 0.33939994891469105
Epoch: 69, step: 571, loss: 0.32107818126678467, mean loss: 0.3393997660773163
Epoch: 69, step: 572, loss: 0.3243563175201416, mean loss: 0.3393996159565831
Epoch: 69, step: 573, loss: 0.3498077690601349, mean loss: 0.33939971982000094
Epoch: 69, step: 574, loss: 0.3121572434902191, mean loss: 0.3393994479688436
Epoch: 69, step: 575, loss: 0.3963259756565094, mean loss: 0.33940001602983116
Epoch: 69, step: 576, loss: 0.32636743783950806, mean loss: 0.33939988598105314
Epoch: 69, step: 577, loss: 0.31228721141815186, mean loss: 0.33939961543327973
Epoch: 69, step: 578, loss: 0.3126956820487976, mean loss: 0.3393993489668487
Epoch: 69, step: 579, loss: 0.3471927344799042, mean loss: 0.33939942673272955
Epoch: 69, step: 580, loss: 0.29761460423469543, mean loss: 0.33939900978927184
Epoch: 69, step: 581, loss: 0.3461174964904785, mean loss: 0.3393990768279944
Epoch: 69, step: 582, loss: 0.30056971311569214, mean loss: 0.3393986893828621
Epoch: 69, step: 583, loss: 0.345575213432312, mean loss: 0.3393987510125174
Epoch: 69, step: 584, loss: 0.32917386293411255, mean loss: 0.3393986489891083
Epoch: 69, step: 585, loss: 0.3217555582523346, mean loss: 0.33939847294901
Epoch: 69, step: 586, loss: 0.3139340281486511, mean loss: 0.3393982188711556
Epoch: 69, step: 587, loss: 0.3198222517967224, mean loss: 0.3393980235490065
Epoch: 69, step: 588, loss: 0.33389073610305786, mean loss: 0.33939796859976784
Epoch: 69, step: 589, loss: 0.3587881922721863, mean loss: 0.33939816206477363
Epoch: 69, step: 590, loss: 0.32078731060028076, mean loss: 0.3393979763777685
Epoch: 69, step: 591, loss: 0.32772600650787354, mean loss: 0.3393978599235853
Epoch: 69, step: 592, loss: 0.33788061141967773, mean loss: 0.33939784478576585
Epoch: 69, step: 593, loss: 0.31162571907043457, mean loss: 0.3393975677018018
Epoch: 69, step: 594, loss: 0.3191272020339966, mean loss: 0.3393973654653114
Epoch: 69, step: 595, loss: 0.36369168758392334, mean loss: 0.3393976078462089
Epoch: 69, step: 596, loss: 0.31734684109687805, mean loss: 0.33939738785113
Epoch: 69, step: 597, loss: 0.2996622622013092, mean loss: 0.3393969914275048
Epoch: 69, step: 598, loss: 0.33036506175994873, mean loss: 0.33939690131996086
Epoch: 69, step: 599, loss: 0.36298641562461853, mean loss: 0.3393971366597021
Epoch: 69, step: 600, loss: 0.3219361901283264, mean loss: 0.33939696246308276
Epoch: 69, step: 601, loss: 0.36269035935401917, mean loss: 0.3393971948439851
Epoch: 69, step: 602, loss: 0.33991602063179016, mean loss: 0.3393972000198726
Epoch: 69, step: 603, loss: 0.37744513154029846, mean loss: 0.33939757958822375
Epoch: 69, step: 604, loss: 0.3371235728263855, mean loss: 0.3393975569028279
Epoch: 69, step: 605, loss: 0.3408217430114746, mean loss: 0.3393975711103069
Epoch: 69, step: 606, loss: 0.3962169885635376, mean loss: 0.3393981379271166
Epoch: 69, step: 607, loss: 0.30537739396095276, mean loss: 0.33939779854776253
Epoch: 69, step: 608, loss: 0.315010666847229, mean loss: 0.33939755527247
Epoch: 69, step: 609, loss: 0.3204575181007385, mean loss: 0.33939736633687984
Epoch: 69, step: 610, loss: 0.35149073600769043, mean loss: 0.3393974869726063
Epoch: 69, step: 611, loss: 0.3239247798919678, mean loss: 0.33939733262830935
Epoch: 69, step: 612, loss: 0.3161620795726776, mean loss: 0.33939710085289954
Epoch: 69, step: 613, loss: 0.3143436014652252, mean loss: 0.3393968509426812
Epoch: 69, step: 614, loss: 0.350042462348938, mean loss: 0.3393969571322594
Epoch: 69, step: 615, loss: 0.3362572193145752, mean loss: 0.33939692581380376
Epoch: 69, step: 616, loss: 0.3205859065055847, mean loss: 0.33939673817832844
Epoch: 69, step: 617, loss: 0.3355858623981476, mean loss: 0.33939670016612167
Epoch: 69, step: 618, loss: 0.34873801469802856, mean loss: 0.33939679334166933
Epoch: 69, step: 619, loss: 0.33642372488975525, mean loss: 0.339396763686901
Epoch: 69, step: 620, loss: 0.32411155104637146, mean loss: 0.3393966112265976
Epoch: 69, step: 621, loss: 0.38601812720298767, mean loss: 0.3393970762420176
Epoch: 69, step: 622, loss: 0.287695974111557, mean loss: 0.3393965605665956
Epoch: 69, step: 623, loss: 0.29538610577583313, mean loss: 0.33939612160335214
Epoch: 69, step: 624, loss: 0.3284449279308319, mean loss: 0.3393960123764975
Epoch: 69, step: 625, loss: 0.30179592967033386, mean loss: 0.33939563735821837
Epoch: 69, step: 626, loss: 0.3601002097129822, mean loss: 0.33939584386084004
Epoch: 69, step: 627, loss: 0.35086479783058167, mean loss: 0.3393959582483966
Epoch: 69, step: 628, loss: 0.2901760935783386, mean loss: 0.339395467350629
Epoch: 69, step: 629, loss: 0.3184738755226135, mean loss: 0.3393952586897486
Epoch: 69, step: 630, loss: 0.34220999479293823, mean loss: 0.3393952867621563
Epoch: 69, step: 631, loss: 0.337091326713562, mean loss: 0.3393952637841369
Epoch: 69, step: 632, loss: 0.32273080945014954, mean loss: 0.3393950975866648
Epoch: 69, step: 633, loss: 0.3313009738922119, mean loss: 0.33939501686338075
Epoch: 69, step: 634, loss: 0.3071500062942505, mean loss: 0.33939469528475313
Epoch: 69, step: 635, loss: 0.3299221098423004, mean loss: 0.3393946008158541
Epoch: 69, step: 636, loss: 0.3155517876148224, mean loss: 0.33939436303685877
Epoch: 69, step: 637, loss: 0.3293250799179077, mean loss: 0.33939426261917205
Epoch: 69, step: 638, loss: 0.41683751344680786, mean loss: 0.3393950349278315
Epoch: 69, step: 639, loss: 0.31924471259117126, mean loss: 0.3393948339792263
Epoch: 69, step: 640, loss: 0.3289373815059662, mean loss: 0.33939472969357287
Epoch: 69, step: 641, loss: 0.31950634717941284, mean loss: 0.339394531361112
Epoch: 69, step: 642, loss: 0.30483439564704895, mean loss: 0.3393941867212999
Epoch: 69, step: 643, loss: 0.33758875727653503, mean loss: 0.33939416871741634
Epoch: 69, step: 644, loss: 0.4074757397174835, mean loss: 0.3393948476253949
Epoch: 69, step: 645, loss: 0.2968745827674866, mean loss: 0.3393944236184459
Epoch: 69, step: 646, loss: 0.3410249948501587, mean loss: 0.3393944398781433
Epoch: 69, step: 647, loss: 0.36760780215263367, mean loss: 0.33939472121277564
Epoch: 69, step: 648, loss: 0.32489094138145447, mean loss: 0.3393945765871603
Epoch: 69, step: 649, loss: 0.3117194175720215, mean loss: 0.33939430062482245
Epoch: 69, step: 650, loss: 0.34848588705062866, mean loss: 0.3393943912805049
Epoch: 69, step: 651, loss: 0.3638916015625, mean loss: 0.33939463554911414
Epoch: 69, step: 652, loss: 0.3606199324131012, mean loss: 0.33939484719043933
Epoch: 69, step: 653, loss: 0.32776767015457153, mean loss: 0.33939473125488206
Epoch: 69, step: 654, loss: 0.3618558943271637, mean loss: 0.33939495521478946
Epoch: 69, step: 655, loss: 0.3312215209007263, mean loss: 0.33939487371841576
Epoch: 69, step: 656, loss: 0.31036242842674255, mean loss: 0.33939458424212837
Epoch: 69, step: 657, loss: 0.3049410283565521, mean loss: 0.33939424071653473
Epoch: 69, step: 658, loss: 0.3103564381599426, mean loss: 0.33939395119260474
Epoch: 69, step: 659, loss: 0.3267543613910675, mean loss: 0.33939382516973443
Epoch: 69, step: 660, loss: 0.325344443321228, mean loss: 0.33939368509194695
Epoch: 69, step: 661, loss: 0.33073532581329346, mean loss: 0.33939359876560665
Epoch: 69, step: 662, loss: 0.37863874435424805, mean loss: 0.3393939900471308
Epoch: 69, step: 663, loss: 0.3416058123111725, mean loss: 0.33939401209919723
Epoch: 69, step: 664, loss: 0.31248337030410767, mean loss: 0.3393937438003588
Epoch: 69, step: 665, loss: 0.3618868589401245, mean loss: 0.3393939680542634
Epoch: 69, step: 666, loss: 0.3389087915420532, mean loss: 0.33939396321715476
Epoch: 69, step: 667, loss: 0.29497358202934265, mean loss: 0.3393935203596298
Epoch: 69, step: 668, loss: 0.36012545228004456, mean loss: 0.33939372704854776
Epoch: 69, step: 669, loss: 0.3209998905658722, mean loss: 0.33939354367131724
Epoch: 69, step: 670, loss: 0.3434709310531616, mean loss: 0.3393935843203984
Epoch: 69, step: 671, loss: 0.3114616572856903, mean loss: 0.3393933058587898
Epoch: 69, step: 672, loss: 0.3254536986351013, mean loss: 0.33939316689212456
Epoch: 69, step: 673, loss: 0.33424994349479675, mean loss: 0.3393931156188378
Epoch: 69, step: 674, loss: 0.3343922793865204, mean loss: 0.33939306576551925
Epoch: 69, step: 675, loss: 0.3176509141921997, mean loss: 0.33939284902024874
Epoch: 69, step: 676, loss: 0.3439628481864929, mean loss: 0.33939289457764577
Epoch: 69, step: 677, loss: 0.3277447521686554, mean loss: 0.3393927784608285
Epoch: 69, step: 678, loss: 0.30261901021003723, mean loss: 0.33939241187788227
Epoch: 69, step: 679, loss: 0.39334526658058167, mean loss: 0.33939294970688966
Epoch: 69, step: 680, loss: 0.3191593885421753, mean loss: 0.33939274801065505
Epoch: 69, step: 681, loss: 0.3275464177131653, mean loss: 0.3393926299228712
Epoch: 69, step: 682, loss: 0.36028605699539185, mean loss: 0.339392838192761
Epoch: 69, step: 683, loss: 0.3564608693122864, mean loss: 0.3393930083286374
Epoch: 69, step: 684, loss: 0.3633081316947937, mean loss: 0.33939324671465193
Epoch: 69, step: 685, loss: 0.3858342170715332, mean loss: 0.339393709633756
Epoch: 69, step: 686, loss: 0.34279099106788635, mean loss: 0.3393937434971914
Epoch: 69, step: 687, loss: 0.30910179018974304, mean loss: 0.339393441555948
Epoch: 69, step: 688, loss: 0.3382916748523712, mean loss: 0.33939343057397237
Epoch: 69, step: 689, loss: 0.3310418725013733, mean loss: 0.3393933473297677
Epoch: 69, step: 690, loss: 0.3483843207359314, mean loss: 0.33939343694645524
Epoch: 69, step: 691, loss: 0.30375564098358154, mean loss: 0.3393930817335938
Epoch: 69, step: 692, loss: 0.3059636056423187, mean loss: 0.3393927485350561
Epoch: 69, step: 693, loss: 0.3388644754886627, mean loss: 0.33939274326970126
Epoch: 69, step: 694, loss: 0.3033320903778076, mean loss: 0.33939238385284215
Epoch: 69, step: 695, loss: 0.3257221281528473, mean loss: 0.3393922476026358
Epoch: 69, step: 696, loss: 0.3126385807991028, mean loss: 0.33939198095390805
Epoch: 69, step: 697, loss: 0.3368745446205139, mean loss: 0.3393919558633472
Epoch: 69, step: 698, loss: 0.2950804531574249, mean loss: 0.33939151422779923
Epoch: 69, step: 699, loss: 0.3495804965496063, mean loss: 0.3393916157764191
Epoch: 69, step: 700, loss: 0.3602032959461212, mean loss: 0.3393918231942228
Epoch: 69, step: 701, loss: 0.29661497473716736, mean loss: 0.33939139686672515
Epoch: 69, step: 702, loss: 0.3234541714191437, mean loss: 0.33939123803291726
Epoch: 69, step: 703, loss: 0.3614078760147095, mean loss: 0.3393914574532679
Epoch: 69, step: 704, loss: 0.3600154221057892, mean loss: 0.3393916629920272
Epoch: 69, step: 705, loss: 0.3345738351345062, mean loss: 0.3393916149779568
Epoch: 69, step: 706, loss: 0.32028841972351074, mean loss: 0.33939142459900407
Epoch: 69, step: 707, loss: 0.337066113948822, mean loss: 0.339391401425614
Epoch: 69, step: 708, loss: 0.3119608759880066, mean loss: 0.33939112806345906
Epoch: 69, step: 709, loss: 0.296628475189209, mean loss: 0.3393907019114164
Epoch: 69, step: 710, loss: 0.29585081338882446, mean loss: 0.3393902680181408
Epoch: 69, step: 711, loss: 0.33928173780441284, mean loss: 0.33939026693660246
Epoch: 69, step: 712, loss: 0.3075181245803833, mean loss: 0.33938994932364813
Epoch: 69, step: 713, loss: 0.37605395913124084, mean loss: 0.33939031468498154
Epoch: 69, step: 714, loss: 0.40071162581443787, mean loss: 0.33939092575324326
Epoch: 69, step: 715, loss: 0.38546717166900635, mean loss: 0.33939138489950754
Epoch: 69, step: 716, loss: 0.34814566373825073, mean loss: 0.3393914721343569
Epoch: 69, step: 717, loss: 0.3284447193145752, mean loss: 0.3393913630529768
Epoch: 69, step: 718, loss: 0.3218359351158142, mean loss: 0.33939118811971053
Epoch: 69, step: 719, loss: 0.33693569898605347, mean loss: 0.3393911636519245
Epoch: 69, step: 720, loss: 0.3189657926559448, mean loss: 0.33939096012480635
Epoch: 69, step: 721, loss: 0.3288354277610779, mean loss: 0.3393908549460228
Epoch: 69, step: 722, loss: 0.32117605209350586, mean loss: 0.3393906734495665
Epoch: 69, step: 723, loss: 0.36578938364982605, mean loss: 0.33939093648972396
Epoch: 69, step: 724, loss: 0.3272295594215393, mean loss: 0.3393908153133998
Epoch: 69, step: 725, loss: 0.29002630710601807, mean loss: 0.3393903234488673
Epoch: 69, step: 726, loss: 0.3384280204772949, mean loss: 0.3393903138606429
Epoch: 69, step: 727, loss: 0.3382687270641327, mean loss: 0.3393903026854526
Epoch: 69, step: 728, loss: 0.33023756742477417, mean loss: 0.3393902114909599
Epoch: 69, step: 729, loss: 0.30036914348602295, mean loss: 0.33938982270324286
Epoch: 69, step: 730, loss: 0.33239999413490295, mean loss: 0.33938975306054586
Epoch: 69, step: 731, loss: 0.3282056748867035, mean loss: 0.33938964162982915
Epoch: 69, step: 732, loss: 0.3512692153453827, mean loss: 0.33938975998882165
Epoch: 69, step: 733, loss: 0.3383720815181732, mean loss: 0.3393897498495522
Epoch: 69, step: 734, loss: 0.33763355016708374, mean loss: 0.33938973235246955
Epoch: 69, step: 735, loss: 0.36925479769706726, mean loss: 0.3393900298962601
Epoch: 69, step: 736, loss: 0.32234713435173035, mean loss: 0.3393898601006423
Epoch: 69, step: 737, loss: 0.2859627306461334, mean loss: 0.3393893278200771
Epoch: 69, step: 738, loss: 0.36061179637908936, mean loss: 0.33938953925189336
Epoch: 69, step: 739, loss: 0.3094923794269562, mean loss: 0.3393892414002174
Epoch: 69, step: 740, loss: 0.37286749482154846, mean loss: 0.3393895749253618
Epoch: 69, step: 741, loss: 0.3326514661312103, mean loss: 0.33938950779801524
Epoch: 69, step: 742, loss: 0.29401499032974243, mean loss: 0.3393890557660417
Epoch: 69, step: 743, loss: 0.31200048327445984, mean loss: 0.33938878291714264
Epoch: 69, step: 744, loss: 0.31752005219459534, mean loss: 0.33938856505987164
Epoch: 69, step: 745, loss: 0.34737643599510193, mean loss: 0.3393886446346055
Epoch: 69, step: 746, loss: 0.3207986354827881, mean loss: 0.3393884594437948
Epoch: 69, step: 747, loss: 0.35580408573150635, mean loss: 0.339388622972109
Epoch: 69, step: 748, loss: 0.3689398169517517, mean loss: 0.3393889173506912
Epoch: 69, step: 749, loss: 0.3576916754245758, mean loss: 0.33938909967450204
Epoch: 69, step: 750, loss: 0.3411538600921631, mean loss: 0.3393891172540733
Epoch: 69, step: 751, loss: 0.3492527902126312, mean loss: 0.3393892155095715
Epoch: 69, step: 752, loss: 0.3653484880924225, mean loss: 0.3393894740963946
Epoch: 69, step: 753, loss: 0.3807474672794342, mean loss: 0.3393898860696308
Epoch: 69, step: 754, loss: 0.287313312292099, mean loss: 0.3393893673321565
Epoch: 69, step: 755, loss: 0.35945603251457214, mean loss: 0.33938956721526653
Epoch: 69, step: 756, loss: 0.33597686886787415, mean loss: 0.3393895332218771
Epoch: 69, step: 757, loss: 0.3579259216785431, mean loss: 0.3393897178582942
Epoch: 69, step: 758, loss: 0.31718602776527405, mean loss: 0.3393894966949883
Epoch: 69, step: 759, loss: 0.31493112444877625, mean loss: 0.33938925307599704
Epoch: 69, step: 760, loss: 0.317615807056427, mean loss: 0.33938903620252453
Epoch: 69, step: 761, loss: 0.28244709968566895, mean loss: 0.3393884690404644
Epoch: 69, step: 762, loss: 0.3094483017921448, mean loss: 0.339388170828657
Epoch: 69, step: 763, loss: 0.33751773834228516, mean loss: 0.3393881521988514
Epoch: 69, step: 764, loss: 0.3402099609375, mean loss: 0.33938816038411584
Epoch: 69, step: 765, loss: 0.35598450899124146, mean loss: 0.3393883256831
Epoch: 69, step: 766, loss: 0.3631134629249573, mean loss: 0.3393885619821871
Epoch: 69, step: 767, loss: 0.32334837317466736, mean loss: 0.33938840222571515
Epoch: 69, step: 768, loss: 0.33205753564834595, mean loss: 0.33938832921275186
Epoch: 69, step: 769, loss: 0.30400437116622925, mean loss: 0.3393879768039511
Epoch: 69, step: 770, loss: 0.3860340714454651, mean loss: 0.339388441374097
Epoch: 69, step: 771, loss: 0.3240918517112732, mean loss: 0.33938828902976526
Epoch: 69, step: 772, loss: 0.3167251944541931, mean loss: 0.3393880633219644
Epoch: 69, step: 773, loss: 0.30066078901290894, mean loss: 0.3393876776305561
Epoch: 69, step: 774, loss: 0.32469451427459717, mean loss: 0.3393875313003397
Epoch: 69, step: 775, loss: 0.32714077830314636, mean loss: 0.3393874093353057
Epoch: 69, step: 776, loss: 0.32204729318618774, mean loss: 0.3393872366473455
Epoch: 69, step: 777, loss: 0.36715853214263916, mean loss: 0.3393875132153091
Epoch: 69, step: 778, loss: 0.32165879011154175, mean loss: 0.33938733666077936
Epoch: 69, step: 779, loss: 0.3212713897228241, mean loss: 0.33938715625181126
Epoch: 69, step: 780, loss: 0.3232385516166687, mean loss: 0.3393869954363653
Epoch: 69, step: 781, loss: 0.3430979251861572, mean loss: 0.3393870323911916
Epoch: 69, step: 782, loss: 0.3676876425743103, mean loss: 0.33938731421644563
Epoch: 69, step: 783, loss: 0.3123331665992737, mean loss: 0.3393870448064913
Epoch: 69, step: 784, loss: 0.3220890164375305, mean loss: 0.33938687255140154
Epoch: 69, step: 785, loss: 0.36909985542297363, mean loss: 0.3393871684326116
Epoch: 69, step: 786, loss: 0.2940755784511566, mean loss: 0.3393867172253186
Epoch: 69, step: 787, loss: 0.32589805126190186, mean loss: 0.3393865829081637
Epoch: 69, step: 788, loss: 0.3388529121875763, mean loss: 0.3393865775940415
Epoch: 69, step: 789, loss: 0.32471540570259094, mean loss: 0.33938643150466336
Epoch: 69, step: 790, loss: 0.3298082649707794, mean loss: 0.33938633613024677
Epoch: 69, step: 791, loss: 0.34728455543518066, mean loss: 0.3393864147758367
Epoch: 69, step: 792, loss: 0.31449154019355774, mean loss: 0.33938616689051887
Epoch: 69, step: 793, loss: 0.3422507047653198, mean loss: 0.3393861954132499
Epoch: 69, step: 794, loss: 0.3730374276638031, mean loss: 0.3393865304814285
Epoch: 69, step: 795, loss: 0.3187272548675537, mean loss: 0.3393863247773142
Epoch: 69, step: 796, loss: 0.33514106273651123, mean loss: 0.3393862825077211
Epoch: 69, step: 797, loss: 0.36493605375289917, mean loss: 0.33938653690136517
Epoch: 69, step: 798, loss: 0.3124699294567108, mean loss: 0.3393862689010919
Epoch: 69, step: 799, loss: 0.3056369423866272, mean loss: 0.33938593287290963
Epoch: 69, step: 800, loss: 0.35658860206604004, mean loss: 0.3393861041511158
Epoch: 69, step: 801, loss: 0.3099159896373749, mean loss: 0.3393858107351327
Epoch: 69, step: 802, loss: 0.3039899468421936, mean loss: 0.33938545832358047
Epoch: 69, step: 803, loss: 0.33316749334335327, mean loss: 0.3393853964163226
Epoch: 69, step: 804, loss: 0.3519543409347534, mean loss: 0.339385521553911
Epoch: 69, step: 805, loss: 0.3011261522769928, mean loss: 0.33938514064384073
Epoch: 69, step: 806, loss: 0.3220626711845398, mean loss: 0.339384968183147
Epoch: 69, step: 807, loss: 0.36470702290534973, mean loss: 0.3393852202843648
Epoch: 69, step: 808, loss: 0.41118234395980835, mean loss: 0.3393859350747842
Epoch: 69, step: 809, loss: 0.3494490087032318, mean loss: 0.3393860352587002
Epoch: 69, step: 810, loss: 0.34450480341911316, mean loss: 0.3393860862185911
Epoch: 69, step: 811, loss: 0.32335686683654785, mean loss: 0.33938592664130357
Epoch: 69, step: 812, loss: 0.37470871210098267, mean loss: 0.33938627829025436
Epoch: 69, step: 813, loss: 0.3311406075954437, mean loss: 0.3393861962029403
Epoch: 69, step: 814, loss: 0.3786303400993347, mean loss: 0.33938658688241485
Epoch: 69, step: 815, loss: 0.3127284348011017, mean loss: 0.33938632150042064
Epoch: 69, step: 816, loss: 0.32135361433029175, mean loss: 0.33938614198654676
Epoch: 69, step: 817, loss: 0.33835092186927795, mean loss: 0.3393861316811322
Epoch: 69, step: 818, loss: 0.3611312508583069, mean loss: 0.33938634814740243
Epoch: 69, step: 819, loss: 0.360284686088562, mean loss: 0.3393865561821434
Epoch: 69, step: 820, loss: 0.3202521502971649, mean loss: 0.3393863657085489
Epoch: 69, step: 821, loss: 0.3538191020488739, mean loss: 0.33938650937790665
Epoch: 69, step: 822, loss: 0.3202234208583832, mean loss: 0.3393863186225884
Epoch: 69, step: 823, loss: 0.31564414501190186, mean loss: 0.33938608228799144
Epoch: 69, step: 824, loss: 0.3571546971797943, mean loss: 0.3393862591587661
Epoch: 69, step: 825, loss: 0.3283061981201172, mean loss: 0.3393861488677004
Epoch: 69, step: 826, loss: 0.34063994884490967, mean loss: 0.33938616134791677
Epoch: 69, step: 827, loss: 0.34287896752357483, mean loss: 0.3393861961146608
Epoch: 69, step: 828, loss: 0.33087602257728577, mean loss: 0.3393861114068169
Epoch: 69, step: 829, loss: 0.31164392828941345, mean loss: 0.339385835271775
Epoch: 69, step: 830, loss: 0.35166507959365845, mean loss: 0.339385957493443
Epoch: 69, step: 831, loss: 0.3255414068698883, mean loss: 0.3393858196928436
Epoch: 69, step: 832, loss: 0.32494109869003296, mean loss: 0.3393856759199285
Epoch: 69, step: 833, loss: 0.32902687788009644, mean loss: 0.3393855728165341
Epoch: 69, step: 834, loss: 0.30708804726600647, mean loss: 0.3393852513553607
Epoch: 69, step: 835, loss: 0.32734236121177673, mean loss: 0.3393851314922133
Epoch: 69, step: 836, loss: 0.3387010395526886, mean loss: 0.3393851246834991
Epoch: 69, step: 837, loss: 0.35332536697387695, mean loss: 0.33938526342827174
Epoch: 69, step: 838, loss: 0.32772526144981384, mean loss: 0.3393851473794837
Epoch: 69, step: 839, loss: 0.31830090284347534, mean loss: 0.3393849375358938
Epoch: 69, step: 840, loss: 0.3309914171695709, mean loss: 0.3393848539991604
Epoch: 69, step: 841, loss: 0.35642582178115845, mean loss: 0.33938502359815503
Epoch: 69, step: 842, loss: 0.3076300024986267, mean loss: 0.33938470756175837
Epoch: 69, step: 843, loss: 0.32004326581954956, mean loss: 0.3393845150712952
Epoch: 69, step: 844, loss: 0.32900911569595337, mean loss: 0.33938441181396917
Epoch: 69, step: 845, loss: 0.317026287317276, mean loss: 0.3393841893052164
Epoch: 69, step: 846, loss: 0.3238941431045532, mean loss: 0.33938403514932736
Epoch: 69, step: 847, loss: 0.3276582360267639, mean loss: 0.3393839184561312
Epoch: 69, step: 848, loss: 0.328009694814682, mean loss: 0.33938380526288203
Epoch: 69, step: 849, loss: 0.36652103066444397, mean loss: 0.3393840753226456
Epoch: 69, step: 850, loss: 0.3381209969520569, mean loss: 0.3393840627530757
Epoch: 69, step: 851, loss: 0.3342289626598358, mean loss: 0.339384011452422
Epoch: 69, step: 852, loss: 0.313442200422287, mean loss: 0.3393837532966932
Epoch: 69, step: 853, loss: 0.31658458709716797, mean loss: 0.33938352641674296
Epoch: 69, step: 854, loss: 0.3425176739692688, mean loss: 0.33938355760508376
Epoch: 69, step: 855, loss: 0.3023653030395508, mean loss: 0.33938318923491934
Epoch: 69, step: 856, loss: 0.36178284883499146, mean loss: 0.3393834121326296
Epoch: 69, step: 857, loss: 0.32171276211738586, mean loss: 0.3393832362947685
Epoch: 69, step: 858, loss: 0.3568418323993683, mean loss: 0.33938341002078576
Epoch: 69, step: 859, loss: 0.3109363317489624, mean loss: 0.33938312695401424
Epoch: 69, step: 860, loss: 0.3065674901008606, mean loss: 0.33938280042051716
Epoch: 69, step: 861, loss: 0.365023672580719, mean loss: 0.33938305555865084
Epoch: 69, step: 862, loss: 0.3015950620174408, mean loss: 0.33938267955497375
Epoch: 69, step: 863, loss: 0.3124973773956299, mean loss: 0.3393824120395294
Epoch: 69, step: 864, loss: 0.31948891282081604, mean loss: 0.33938221409623315
Epoch: 69, step: 865, loss: 0.32188349962234497, mean loss: 0.33938203998313615
Epoch: 69, step: 866, loss: 0.32261934876441956, mean loss: 0.33938187319516744
Epoch: 69, step: 867, loss: 0.3200620710849762, mean loss: 0.3393816809659814
Epoch: 69, step: 868, loss: 0.3223463296890259, mean loss: 0.33938151146843126
Epoch: 69, step: 869, loss: 0.3555402159690857, mean loss: 0.3393816722419622
Epoch: 69, step: 870, loss: 0.3224789500236511, mean loss: 0.3393815040673851
Epoch: 69, step: 871, loss: 0.3361077904701233, mean loss: 0.33938147149571324
Epoch: 69, step: 872, loss: 0.3001205325126648, mean loss: 0.33938108087458496
Epoch: 69, step: 873, loss: 0.3160478472709656, mean loss: 0.33938084872620566
Epoch: 69, step: 874, loss: 0.3275785744190216, mean loss: 0.33938073130349267
Epoch: 69, step: 875, loss: 0.34813976287841797, mean loss: 0.3393808184476304
Epoch: 69, step: 876, loss: 0.2960253953933716, mean loss: 0.3393803871061815
Epoch: 69, step: 877, loss: 0.3308659791946411, mean loss: 0.339380302397505
Epoch: 69, step: 878, loss: 0.3249494135379791, mean loss: 0.3393801588279994
Epoch: 69, step: 879, loss: 0.3571579158306122, mean loss: 0.3393803356929463
Epoch: 69, step: 880, loss: 0.31708869338035583, mean loss: 0.3393801139230734
Epoch: 69, step: 881, loss: 0.33540353178977966, mean loss: 0.3393800743621775
Epoch: 69, step: 882, loss: 0.3043545186519623, mean loss: 0.33937972591506094
Epoch: 69, step: 883, loss: 0.38340863585472107, mean loss: 0.33938016392650083
Epoch: 69, step: 884, loss: 0.3308287262916565, mean loss: 0.3393800788553452
Epoch: 69, step: 885, loss: 0.32249972224235535, mean loss: 0.33937991092835795
Epoch: 69, step: 886, loss: 0.32046785950660706, mean loss: 0.33937972279179796
Epoch: 69, step: 887, loss: 0.3024168908596039, mean loss: 0.3393793550902348
Epoch: 69, step: 888, loss: 0.3235803246498108, mean loss: 0.3393791979250476
Epoch: 69, step: 889, loss: 0.32712486386299133, mean loss: 0.33937907602291223
Epoch: 69, step: 890, loss: 0.308097243309021, mean loss: 0.33937876484449536
Epoch: 69, step: 891, loss: 0.3191070556640625, mean loss: 0.33937856319212806
Epoch: 69, step: 892, loss: 0.3259297013282776, mean loss: 0.3393784294112105
Epoch: 69, step: 893, loss: 0.3168705403804779, mean loss: 0.33937820551894915
Epoch: 69, step: 894, loss: 0.32571545243263245, mean loss: 0.3393780696130785
Epoch: 69, step: 895, loss: 0.32206329703330994, mean loss: 0.339377897381624
Epoch: 69, step: 896, loss: 0.3053017258644104, mean loss: 0.33937755842653944
Epoch: 69, step: 897, loss: 0.37687039375305176, mean loss: 0.3393779313634098
Epoch: 69, step: 898, loss: 0.3819647431373596, mean loss: 0.3393783549652577
Epoch: 69, step: 899, loss: 0.3608795702457428, mean loss: 0.33937856883108963
Epoch: 69, step: 900, loss: 0.33849161863327026, mean loss: 0.3393785600089625
Epoch: 69, step: 901, loss: 0.3245726525783539, mean loss: 0.33937841274218344
Epoch: 69, step: 902, loss: 0.3486008942127228, mean loss: 0.33937850447257134
Epoch: 69, step: 903, loss: 0.3099389374256134, mean loss: 0.339378211658099
Epoch: 69, step: 904, loss: 0.30611106753349304, mean loss: 0.339377880776726
Epoch: 69, step: 905, loss: 0.31852060556411743, mean loss: 0.33937767332834406
Epoch: 69, step: 906, loss: 0.3509674072265625, mean loss: 0.33937778859975926
Epoch: 69, step: 907, loss: 0.32362282276153564, mean loss: 0.3393776319025338
Epoch: 69, step: 908, loss: 0.3695768117904663, mean loss: 0.33937793225739865
Epoch: 69, step: 909, loss: 0.30930742621421814, mean loss: 0.33937763318527203
Epoch: 69, step: 910, loss: 0.3237656056880951, mean loss: 0.3393774779143291
Epoch: 69, step: 911, loss: 0.32923057675361633, mean loss: 0.33937737699833714
Epoch: 69, step: 912, loss: 0.3580465018749237, mean loss: 0.3393775626702471
Epoch: 69, step: 913, loss: 0.3328092396259308, mean loss: 0.33937749734629835
Epoch: 69, step: 914, loss: 0.3006414771080017, mean loss: 0.3393771121087548
Epoch: 69, step: 915, loss: 0.340232789516449, mean loss: 0.3393771206185548
Epoch: 69, step: 916, loss: 0.31872305274009705, mean loss: 0.3393769152137645
Epoch: 69, step: 917, loss: 0.35934141278266907, mean loss: 0.3393771137588007
Epoch: 69, step: 918, loss: 0.35898637771606445, mean loss: 0.3393773087691329
Epoch: 69, step: 919, loss: 0.3152572214603424, mean loss: 0.33937706890192154
Epoch: 69, step: 920, loss: 0.3496875464916229, mean loss: 0.33937717143558493
Epoch: 69, step: 921, loss: 0.31523817777633667, mean loss: 0.33937693138512987
Epoch: 69, step: 922, loss: 0.4031069278717041, mean loss: 0.33937756514239165
Epoch: 69, step: 923, loss: 0.3345334827899933, mean loss: 0.33937751697132607
Epoch: 69, step: 924, loss: 0.32726380228996277, mean loss: 0.33937739650996745
Epoch: 69, step: 925, loss: 0.36762556433677673, mean loss: 0.33937767741297087
Epoch: 69, step: 926, loss: 0.3249216675758362, mean loss: 0.3393775336621894
Epoch: 69, step: 927, loss: 0.34855231642723083, mean loss: 0.3393776248954614
Epoch: 69, step: 928, loss: 0.3313509225845337, mean loss: 0.33937754507939905
Epoch: 69, step: 929, loss: 0.31297585368156433, mean loss: 0.3393772825484105
Epoch: 69, step: 930, loss: 0.35357043147087097, mean loss: 0.3393774236796854
Epoch: 69, step: 931, loss: 0.30032673478126526, mean loss: 0.339377035378348
Epoch: 69, step: 932, loss: 0.32471051812171936, mean loss: 0.3393768895429787
Epoch: 69, step: 933, loss: 0.3226321339607239, mean loss: 0.33937672304446437
Epoch: 69, step: 934, loss: 0.3607857823371887, mean loss: 0.3393769359195406
Epoch: 69, step: 935, loss: 0.3859272301197052, mean loss: 0.33937739877494966
Epoch: 69, step: 936, loss: 0.3415091037750244, mean loss: 0.3393774199705489
Epoch: 69, step: 937, loss: 0.3317416310310364, mean loss: 0.3393773440484523
Epoch: 69, step: 938, loss: 0.31284284591674805, mean loss: 0.33937708022048185
Epoch: 69, step: 939, loss: 0.3272269666194916, mean loss: 0.33937695941518436
Epoch: 69, step: 940, loss: 0.3228299915790558, mean loss: 0.33937679489478867
Epoch: 69, step: 941, loss: 0.38518983125686646, mean loss: 0.3393772503923762
Epoch: 69, step: 942, loss: 0.3312482535839081, mean loss: 0.33937716957036757
Epoch: 69, step: 943, loss: 0.3717099726200104, mean loss: 0.3393774910339095
Epoch: 69, step: 944, loss: 0.33727309107780457, mean loss: 0.33937747011146935
Epoch: 69, step: 945, loss: 0.3264525234699249, mean loss: 0.33937734160988214
Epoch: 69, step: 946, loss: 0.2940199077129364, mean loss: 0.33937689066455445
Epoch: 69, step: 947, loss: 0.40155312418937683, mean loss: 0.3393775088168801
Epoch: 69, step: 948, loss: 0.32245221734046936, mean loss: 0.33937734054833635
Epoch: 69, step: 949, loss: 0.30354544520378113, mean loss: 0.3393769843168991
Epoch: 69, step: 950, loss: 0.2880820333957672, mean loss: 0.339376474360832
Epoch: 69, step: 951, loss: 0.3568755090236664, mean loss: 0.3393766483282502
Epoch: 69, step: 952, loss: 0.318845272064209, mean loss: 0.3393764442167046
Epoch: 69, step: 953, loss: 0.31584712862968445, mean loss: 0.33937621030363585
Epoch: 69, step: 954, loss: 0.34278613328933716, mean loss: 0.33937624420252327
Epoch: 69, step: 955, loss: 0.31451719999313354, mean loss: 0.33937599707507565
Epoch: 69, step: 956, loss: 0.3162834942340851, mean loss: 0.33937576751136006
Epoch: 69, step: 957, loss: 0.31628862023353577, mean loss: 0.33937553800316594
Epoch: 69, step: 958, loss: 0.34506744146347046, mean loss: 0.33937559458553546
Epoch: 69, step: 959, loss: 0.3321666717529297, mean loss: 0.3393755229234134
Epoch: 69, step: 960, loss: 0.3507477939128876, mean loss: 0.33937563597122783
Epoch: 69, step: 961, loss: 0.31882426142692566, mean loss: 0.339375431679149
Epoch: 69, step: 962, loss: 0.29608941078186035, mean loss: 0.3393750013963341
Epoch: 69, step: 963, loss: 0.3190208077430725, mean loss: 0.3393747990683654
Epoch: 69, step: 964, loss: 0.3003901541233063, mean loss: 0.3393744115508959
Epoch: 69, step: 965, loss: 0.3637917637825012, mean loss: 0.3393746542632896
Epoch: 69, step: 966, loss: 0.31266075372695923, mean loss: 0.33937438872547726
Epoch: 69, step: 967, loss: 0.3377526104450226, mean loss: 0.33937437260506176
Epoch: 69, step: 968, loss: 0.3083620071411133, mean loss: 0.3393740643463722
Epoch: 69, step: 969, loss: 0.34991851449012756, mean loss: 0.33937416915572893
Epoch: 69, step: 970, loss: 0.3488145172595978, mean loss: 0.33937426298963813
Epoch: 69, step: 971, loss: 0.3521212041378021, mean loss: 0.3393743896887192
Epoch: 69, step: 972, loss: 0.3595876693725586, mean loss: 0.33937459059797864
Epoch: 69, step: 973, loss: 0.3794237971305847, mean loss: 0.33937498866185434
Epoch: 69, step: 974, loss: 0.32473233342170715, mean loss: 0.339374843124535
Epoch: 69, step: 975, loss: 0.307778537273407, mean loss: 0.33937452908340815
Epoch: 69, step: 976, loss: 0.40073320269584656, mean loss: 0.3393751389317738
Epoch: 69, step: 977, loss: 0.3139961361885071, mean loss: 0.33937488669050775
Epoch: 69, step: 978, loss: 0.3206467032432556, mean loss: 0.3393747005534164
Epoch: 69, step: 979, loss: 0.3255656659603119, mean loss: 0.33937456330849913
Epoch: 69, step: 980, loss: 0.3113536238670349, mean loss: 0.33937428481739484
Epoch: 69, step: 981, loss: 0.31980738043785095, mean loss: 0.3393740903501586
Epoch: 69, step: 982, loss: 0.35499799251556396, mean loss: 0.33937424562801033
Epoch: 69, step: 983, loss: 0.3230792284011841, mean loss: 0.3393740836819039
Epoch: 69, step: 984, loss: 0.3200501799583435, mean loss: 0.339373891635475
Epoch: 69, step: 985, loss: 0.3244045674800873, mean loss: 0.3393737428675698
Epoch: 69, step: 986, loss: 0.3120783865451813, mean loss: 0.3393734716039788
Epoch: 69, step: 987, loss: 0.32612577080726624, mean loss: 0.339373339948501
Epoch: 69, step: 988, loss: 0.32454198598861694, mean loss: 0.3393731925561635
Epoch: 69, step: 989, loss: 0.30842339992523193, mean loss: 0.33937288498364115
Epoch: 69, step: 990, loss: 0.31696611642837524, mean loss: 0.3393726623121061
Epoch: 69, step: 991, loss: 0.3122185170650482, mean loss: 0.33937239246529166
Epoch: 69, step: 992, loss: 0.3862590789794922, mean loss: 0.33937285840141856
Epoch: 69, step: 993, loss: 0.3301570415496826, mean loss: 0.33937276682021167
Epoch: 69, step: 994, loss: 0.32075393199920654, mean loss: 0.33937258179934515
Epoch: 69, step: 995, loss: 0.2958541810512543, mean loss: 0.33937214934842747
Epoch: 69, step: 996, loss: 0.31310734152793884, mean loss: 0.3393718883524538
Epoch: 69, step: 997, loss: 0.34767550230026245, mean loss: 0.33937197086546084
Epoch: 69, step: 998, loss: 0.31792864203453064, mean loss: 0.339371757785232
Epoch: 69, step: 999, loss: 0.3426576554775238, mean loss: 0.3393717904365465
Epoch: 69, step: 1000, loss: 0.3267074227333069, mean loss: 0.3393716645944834
Epoch: 69, step: 1001, loss: 0.3406588137149811, mean loss: 0.3393716773843751
Epoch: 69, step: 1002, loss: 0.32006990909576416, mean loss: 0.33937148559224395
Epoch: 69, step: 1003, loss: 0.3315514624118805, mean loss: 0.3393714078893109
Epoch: 69, step: 1004, loss: 0.3599872887134552, mean loss: 0.3393716127350579
Epoch: 69, step: 1005, loss: 0.3371277153491974, mean loss: 0.33937159043922327
Epoch: 69, step: 1006, loss: 0.32754185795783997, mean loss: 0.3393714728976905
Epoch: 69, step: 1007, loss: 0.30082079768180847, mean loss: 0.33937108985771575
Epoch: 69, step: 1008, loss: 0.32432428002357483, mean loss: 0.3393709403539169
Epoch: 69, step: 1009, loss: 0.3007503151893616, mean loss: 0.3393705566265441
Epoch: 69, step: 1010, loss: 0.2902928292751312, mean loss: 0.3393700690041872
Epoch: 69, step: 1011, loss: 0.38375309109687805, mean loss: 0.33937050997690493
Epoch: 69, step: 1012, loss: 0.2905268669128418, mean loss: 0.3393700246899864
Epoch: 69, step: 1013, loss: 0.35398009419441223, mean loss: 0.3393701698471598
Epoch: 69, step: 1014, loss: 0.3123708665370941, mean loss: 0.339369901600413
Epoch: 69, step: 1015, loss: 0.34839320182800293, mean loss: 0.3393699912489071
Epoch: 69, step: 1016, loss: 0.355194628238678, mean loss: 0.33937014846863217
Epoch: 69, step: 1017, loss: 0.3346739113330841, mean loss: 0.3393701018113991
Epoch: 69, step: 1018, loss: 0.3443436920642853, mean loss: 0.3393701512236514
Epoch: 69, step: 1019, loss: 0.3414160907268524, mean loss: 0.3393701715497075
Epoch: 69, step: 1020, loss: 0.30095213651657104, mean loss: 0.3393697898769472
Epoch: 69, step: 1021, loss: 0.31966257095336914, mean loss: 0.33936959409301626
Epoch: 69, step: 1022, loss: 0.3685072660446167, mean loss: 0.33936988356213427
Epoch: 69, step: 1023, loss: 0.3309255540370941, mean loss: 0.3393697996725105
Epoch: 69, step: 1024, loss: 0.35875576734542847, mean loss: 0.3393699922591893
Epoch: 69, step: 1025, loss: 0.3699066638946533, mean loss: 0.3393702956176725
Epoch: 69, step: 1026, loss: 0.33040326833724976, mean loss: 0.33937020653799793
Epoch: 69, step: 1027, loss: 0.30806848406791687, mean loss: 0.33936989558549785
Epoch: 69, step: 1028, loss: 0.3364257216453552, mean loss: 0.3393698663382526
Epoch: 69, step: 1029, loss: 0.3133791983127594, mean loss: 0.3393696081510988
Epoch: 69, step: 1030, loss: 0.37547120451927185, mean loss: 0.3393699667750408
Epoch: 69, step: 1031, loss: 0.3314101994037628, mean loss: 0.33936988770555127
Epoch: 69, step: 1032, loss: 0.3042362928390503, mean loss: 0.33936953870442016
Epoch: 69, step: 1033, loss: 0.3232265114784241, mean loss: 0.33936937834853237
Epoch: 69, step: 1034, loss: 0.32425668835639954, mean loss: 0.33936922822893495
Epoch: 69, step: 1035, loss: 0.3604968190193176, mean loss: 0.33936943809454595
Epoch: 69, step: 1036, loss: 0.35684847831726074, mean loss: 0.3393696117164726
Epoch: 69, step: 1037, loss: 0.3164052963256836, mean loss: 0.33936938361075125
Epoch: 69, step: 1038, loss: 0.36259227991104126, mean loss: 0.33936961428267876
Epoch: 69, step: 1039, loss: 0.3551703095436096, mean loss: 0.3393697712286764
Epoch: 69, step: 1040, loss: 0.3698352873325348, mean loss: 0.33937007383519135
Epoch: 69, step: 1041, loss: 0.35007262229919434, mean loss: 0.33937018013992987
Epoch: 69, step: 1042, loss: 0.3015221953392029, mean loss: 0.33936980421262825
Epoch: 69, step: 1043, loss: 0.3585958480834961, mean loss: 0.33936999517452604
Epoch: 69, step: 1044, loss: 0.3549030125141144, mean loss: 0.33937014945405586
Epoch: 69, step: 1045, loss: 0.33911967277526855, mean loss: 0.3393701469662559
Epoch: 69, step: 1046, loss: 0.3151014447212219, mean loss: 0.3393699059255415
Epoch: 69, step: 1047, loss: 0.30071479082107544, mean loss: 0.3393695220004382
Epoch: 69, step: 1048, loss: 0.3047189712524414, mean loss: 0.33936917785234516
Epoch: 69, step: 1049, loss: 0.3095923960208893, mean loss: 0.33936888211329674
Epoch: 69, step: 1050, loss: 0.3703233003616333, mean loss: 0.33936918954542056
Epoch: 69, step: 1051, loss: 0.3149030804634094, mean loss: 0.3393689465560963
Epoch: 69, step: 1052, loss: 0.3350851237773895, mean loss: 0.33936890401100417
Epoch: 69, step: 1053, loss: 0.34335148334503174, mean loss: 0.33936894356388264
Epoch: 69, step: 1054, loss: 0.3425876200199127, mean loss: 0.339368975529763
Epoch: 69, step: 1055, loss: 0.36203715205192566, mean loss: 0.33936920065367077
Epoch: 69, step: 1056, loss: 0.36058568954467773, mean loss: 0.33936941135837606
Epoch: 69, step: 1057, loss: 0.33315324783325195, mean loss: 0.3393693496251693
Epoch: 69, step: 1058, loss: 0.31162357330322266, mean loss: 0.3393690740824281
Epoch: 69, step: 1059, loss: 0.3267814815044403, mean loss: 0.3393689490765433
Epoch: 69, step: 1060, loss: 0.3351735770702362, mean loss: 0.3393689074132166
Epoch: 69, step: 1061, loss: 0.3028481900691986, mean loss: 0.33936854473751954
Epoch: 69, step: 1062, loss: 0.38775908946990967, mean loss: 0.33936902528394736
Epoch: 69, step: 1063, loss: 0.3580697774887085, mean loss: 0.3393692109915164
Epoch: 69, step: 1064, loss: 0.31252050399780273, mean loss: 0.3393689443734392
Epoch: 69, step: 1065, loss: 0.33562353253364563, mean loss: 0.3393689071804158
Epoch: 69, step: 1066, loss: 0.39809057116508484, mean loss: 0.33936949029774083
Epoch: 69, step: 1067, loss: 0.31323933601379395, mean loss: 0.3393692308229009
Epoch: 69, step: 1068, loss: 0.32654574513435364, mean loss: 0.33936910348577076
Epoch: 69, step: 1069, loss: 0.33655720949172974, mean loss: 0.3393690755639588
Epoch: 69, step: 1070, loss: 0.314281165599823, mean loss: 0.33936882644612226
Epoch: 69, step: 1071, loss: 0.33778855204582214, mean loss: 0.3393688107544751
Epoch: 69, step: 1072, loss: 0.3481995463371277, mean loss: 0.33936889844013957
Epoch: 69, step: 1073, loss: 0.33369216322898865, mean loss: 0.33936884207299417
Epoch: 69, step: 1074, loss: 0.33565154671669006, mean loss: 0.3393688051624744
Epoch: 69, step: 1075, loss: 0.2988203465938568, mean loss: 0.3393684025445285
Epoch: 69, step: 1076, loss: 0.32013118267059326, mean loss: 0.33936821153423313
Epoch: 69, step: 1077, loss: 0.29287707805633545, mean loss: 0.33936774991883234
Epoch: 69, step: 1078, loss: 0.32747405767440796, mean loss: 0.3393676318262717
Epoch: 69, step: 1079, loss: 0.3534970283508301, mean loss: 0.3393677721157642
Epoch: 69, step: 1080, loss: 0.3046916425228119, mean loss: 0.339367427823047
Epoch: 69, step: 1081, loss: 0.32303258776664734, mean loss: 0.339367265639127
Epoch: 69, step: 1082, loss: 0.347965270280838, mean loss: 0.33936735100539
Epoch: 69, step: 1083, loss: 0.3524845242500305, mean loss: 0.33936748123943733
Epoch: 69, step: 1084, loss: 0.3427179157733917, mean loss: 0.3393675145039456
Epoch: 69, step: 1085, loss: 0.3531816899776459, mean loss: 0.33936765165546634
Epoch: 69, step: 1086, loss: 0.3322795331478119, mean loss: 0.33936758128307365
Epoch: 69, step: 1087, loss: 0.3134523630142212, mean loss: 0.33936732399366626
Epoch: 69, step: 1088, loss: 0.30748558044433594, mean loss: 0.33936700747101994
Epoch: 69, step: 1089, loss: 0.36594507098197937, mean loss: 0.3393672713359953
Epoch: 69, step: 1090, loss: 0.3508581519126892, mean loss: 0.3393673854154435
Epoch: 69, step: 1091, loss: 0.33988696336746216, mean loss: 0.3393673905736711
Epoch: 69, step: 1092, loss: 0.3103680908679962, mean loss: 0.3393671026794231
Epoch: 69, step: 1093, loss: 0.2986384332180023, mean loss: 0.33936669834437433
Epoch: 69, step: 1094, loss: 0.33751049637794495, mean loss: 0.3393666799170583
Epoch: 69, step: 1095, loss: 0.3303661048412323, mean loss: 0.339366590565362
Epoch: 69, step: 1096, loss: 0.31232526898384094, mean loss: 0.3393663221198518
Epoch: 69, step: 1097, loss: 0.2998402714729309, mean loss: 0.3393659297394177
Epoch: 69, step: 1098, loss: 0.3300437033176422, mean loss: 0.33936583719733776
Epoch: 69, step: 1099, loss: 0.306081086397171, mean loss: 0.3393655067816889
Epoch: 69, step: 1100, loss: 0.34278908371925354, mean loss: 0.33936554076698666
Epoch: 69, step: 1101, loss: 0.3412915766239166, mean loss: 0.3393655598862451
Epoch: 69, step: 1102, loss: 0.3447321653366089, mean loss: 0.3393656131586168
Epoch: 69, step: 1103, loss: 0.29079484939575195, mean loss: 0.3393651310188137
Epoch: 69, step: 1104, loss: 0.35029271245002747, mean loss: 0.33936523949085023
Epoch: 69, step: 1105, loss: 0.3079454302787781, mean loss: 0.33936492760693676
Epoch: 69, step: 1106, loss: 0.3164423406124115, mean loss: 0.339364700071654
Epoch: 69, step: 1107, loss: 0.3850955367088318, mean loss: 0.33936515400277284
Epoch: 69, step: 1108, loss: 0.31288233399391174, mean loss: 0.33936489113295293
Epoch: 69, step: 1109, loss: 0.3314879536628723, mean loss: 0.33936481294684656
Epoch: 69, step: 1110, loss: 0.3391445577144623, mean loss: 0.3393648107606253
Epoch: 69, step: 1111, loss: 0.32943540811538696, mean loss: 0.3393647122038039
Epoch: 69, step: 1112, loss: 0.29710569977760315, mean loss: 0.3393642927553485
Epoch: 69, step: 1113, loss: 0.31185659766197205, mean loss: 0.3393640197261168
Epoch: 69, step: 1114, loss: 0.2739724814891815, mean loss: 0.339363370685033
Epoch: 69, step: 1115, loss: 0.3272635042667389, mean loss: 0.3393632505894873
Epoch: 69, step: 1116, loss: 0.35697489976882935, mean loss: 0.33936342538973324
Epoch: 69, step: 1117, loss: 0.35444968938827515, mean loss: 0.3393635751233815
Epoch: 69, step: 1118, loss: 0.30961719155311584, mean loss: 0.3393632798885686
Epoch: 69, step: 1119, loss: 0.28841638565063477, mean loss: 0.3393627742423119
Epoch: 69, step: 1120, loss: 0.29919981956481934, mean loss: 0.3393623756302584
Epoch: 69, step: 1121, loss: 0.3086366057395935, mean loss: 0.3393620706840517
Epoch: 69, step: 1122, loss: 0.32638970017433167, mean loss: 0.3393619419375327
Epoch: 69, step: 1123, loss: 0.3031595051288605, mean loss: 0.339361582643797
Epoch: 69, step: 1124, loss: 0.30022144317626953, mean loss: 0.33936119419847127
Epoch: 69, step: 1125, loss: 0.33808889985084534, mean loss: 0.33936118157174344
Epoch: 69, step: 1126, loss: 0.3155944347381592, mean loss: 0.33936094570394637
Epoch: 69, step: 1127, loss: 0.33855780959129333, mean loss: 0.3393609377334796
Epoch: 69, step: 1128, loss: 0.34640395641326904, mean loss: 0.3393610076289659
Epoch: 69, step: 1129, loss: 0.3397451341152191, mean loss: 0.33936101144103037
Epoch: 69, step: 1130, loss: 0.3178993761539459, mean loss: 0.3393607984582554
Epoch: 69, step: 1131, loss: 0.37297365069389343, mean loss: 0.33936113202498525
Epoch: 69, step: 1132, loss: 0.3149797320365906, mean loss: 0.33936089007160686
Epoch: 69, step: 1133, loss: 0.30457645654678345, mean loss: 0.3393605448852069
Epoch: 69, step: 1134, loss: 0.34352344274520874, mean loss: 0.3393605861956817
Epoch: 69, step: 1135, loss: 0.3340553641319275, mean loss: 0.3393605335498866
Epoch: 69, step: 1136, loss: 0.3453967571258545, mean loss: 0.3393605934491014
Epoch: 69, step: 1137, loss: 0.33282241225242615, mean loss: 0.33936052856945786
Epoch: 69, step: 1138, loss: 0.3351539373397827, mean loss: 0.3393604868270492
Epoch: 69, step: 1139, loss: 0.3360026478767395, mean loss: 0.3393604535072216
Epoch: 69, step: 1140, loss: 0.3202970623970032, mean loss: 0.3393602643431156
Epoch: 69, step: 1141, loss: 0.3395959436893463, mean loss: 0.33936026668171476
Epoch: 69, step: 1142, loss: 0.36411985754966736, mean loss: 0.3393605123637603
Epoch: 69, step: 1143, loss: 0.3330536186695099, mean loss: 0.33936044978295365
Epoch: 69, step: 1144, loss: 0.32610124349594116, mean loss: 0.3393603182184099
Epoch: 69, step: 1145, loss: 0.33200252056121826, mean loss: 0.33936024521134855
Epoch: 69, step: 1146, loss: 0.33854684233665466, mean loss: 0.33936023714051444
Epoch: 69, step: 1147, loss: 0.333984911441803, mean loss: 0.3393601838054047
Epoch: 69, step: 1148, loss: 0.3265826106071472, mean loss: 0.3393600570248997
Epoch: 69, step: 1149, loss: 0.32234445214271545, mean loss: 0.3393598881958472
Epoch: 69, step: 1150, loss: 0.3639060854911804, mean loss: 0.3393601317411189
Epoch: 69, step: 1151, loss: 0.3188570737838745, mean loss: 0.33935992831354855
Epoch: 69, step: 1152, loss: 0.3311200439929962, mean loss: 0.3393598465597429
Epoch: 69, step: 1153, loss: 0.2943567633628845, mean loss: 0.33935940005628823
Epoch: 69, step: 1154, loss: 0.3871326148509979, mean loss: 0.3393598740392311
Epoch: 69, step: 1155, loss: 0.3448967933654785, mean loss: 0.3393599289733462
Epoch: 69, step: 1156, loss: 0.3411552906036377, mean loss: 0.33935994678571046
Epoch: 69, step: 1157, loss: 0.3730994164943695, mean loss: 0.3393602815225967
Epoch: 69, step: 1158, loss: 0.3419865071773529, mean loss: 0.339360307577715
Epoch: 69, step: 1159, loss: 0.3137006461620331, mean loss: 0.33936005300747996
Epoch: 69, step: 1160, loss: 0.33346009254455566, mean loss: 0.3393599944743841
Epoch: 69, step: 1161, loss: 0.38727685809135437, mean loss: 0.3393604698495266
Epoch: 69, step: 1162, loss: 0.3353176414966583, mean loss: 0.3393604297417046
Epoch: 69, step: 1163, loss: 0.3352389335632324, mean loss: 0.3393603888538457
Epoch: 69, step: 1164, loss: 0.3107500672340393, mean loss: 0.3393601050241057
Epoch: 69, step: 1165, loss: 0.318533331155777, mean loss: 0.339359898413385
Epoch: 69, step: 1166, loss: 0.35423070192337036, mean loss: 0.339360045936807
Epoch: 69, step: 1167, loss: 0.2779502272605896, mean loss: 0.33935943673659
Epoch: 69, step: 1168, loss: 0.3618907630443573, mean loss: 0.3393596602505656
Epoch: 69, step: 1169, loss: 0.32316240668296814, mean loss: 0.33935949957309036
Epoch: 69, step: 1170, loss: 0.3405758738517761, mean loss: 0.33935951163945755
Epoch: 69, step: 1171, loss: 0.3757320046424866, mean loss: 0.3393598724490461
Epoch: 69, step: 1172, loss: 0.3365316390991211, mean loss: 0.3393598443936805
Epoch: 69, step: 1173, loss: 0.3362765908241272, mean loss: 0.3393598138088817
Epoch: 69, step: 1174, loss: 0.3401208519935608, mean loss: 0.3393598213580399
Epoch: 69, step: 1175, loss: 0.3226251006126404, mean loss: 0.3393596553587467
Epoch: 69, step: 1176, loss: 0.3415659964084625, mean loss: 0.3393596772442282
Epoch: 69, step: 1177, loss: 0.3355311155319214, mean loss: 0.3393596392677397
Epoch: 69, step: 1178, loss: 0.3977186977863312, mean loss: 0.3393602181405118
Epoch: 69, step: 1179, loss: 0.3653687834739685, mean loss: 0.33936047612104403
Epoch: 69, step: 1180, loss: 0.36470353603363037, mean loss: 0.3393607274978943
Epoch: 69, step: 1181, loss: 0.3782895505428314, mean loss: 0.3393611136275839
Epoch: 69, step: 1182, loss: 0.3967760503292084, mean loss: 0.33936168311286646
Epoch: 69, step: 1183, loss: 0.3425467610359192, mean loss: 0.33936171470459353
Epoch: 69, step: 1184, loss: 0.37499356269836426, mean loss: 0.3393620681215205
Epoch: 69, step: 1185, loss: 0.31932365894317627, mean loss: 0.3393618693711567
Epoch: 69, step: 1186, loss: 0.2919916808605194, mean loss: 0.3393613995360148
Epoch: 69, step: 1187, loss: 0.32073095440864563, mean loss: 0.339361214754166
Epoch: 69, step: 1188, loss: 0.3570898175239563, mean loss: 0.3393613905895517
Epoch: 69, step: 1189, loss: 0.31196752190589905, mean loss: 0.3393611188950614
Epoch: 69, step: 1190, loss: 0.34400153160095215, mean loss: 0.339361164918574
Epoch: 69, step: 1191, loss: 0.34070536494255066, mean loss: 0.33936117825018847
Epoch: 69, step: 1192, loss: 0.3564944863319397, mean loss: 0.33936134817459596
Epoch: 69, step: 1193, loss: 0.31007447838783264, mean loss: 0.3393610577166986
Epoch: 69, step: 1194, loss: 0.2985292077064514, mean loss: 0.33936065276336075
Epoch: 69, step: 1195, loss: 0.3195505142211914, mean loss: 0.33936045629657896
Epoch: 69, step: 1196, loss: 0.31312990188598633, mean loss: 0.3393601961579893
Epoch: 69, step: 1197, loss: 0.31446051597595215, mean loss: 0.33935994922064494
Epoch: 69, step: 1198, loss: 0.3502238094806671, mean loss: 0.33936005695962707
Epoch: 69, step: 1199, loss: 0.34040018916130066, mean loss: 0.33936006727471496
Epoch: 69, step: 1200, loss: 0.35722815990448, mean loss: 0.33936024447249585
Epoch: 69, step: 1201, loss: 0.33788618445396423, mean loss: 0.33936022985439535
Epoch: 69, step: 1202, loss: 0.3450028896331787, mean loss: 0.3393602858115129
Epoch: 69, step: 1203, loss: 0.3305024802684784, mean loss: 0.3393601979713151
Epoch: 69, step: 1204, loss: 0.32621875405311584, mean loss: 0.3393600676528542
Epoch: 69, step: 1205, loss: 0.3810371160507202, mean loss: 0.3393604809434315
Epoch: 69, step: 1206, loss: 0.3051271140575409, mean loss: 0.33936014147151095
Epoch: 69, step: 1207, loss: 0.3482668995857239, mean loss: 0.3393602297936532
Epoch: 69, step: 1208, loss: 0.3317706882953644, mean loss: 0.3393601545341808
Epoch: 69, step: 1209, loss: 0.3074744939804077, mean loss: 0.3393598383524725
Epoch: 69, step: 1210, loss: 0.3153013288974762, mean loss: 0.3393595997880189
Epoch: 69, step: 1211, loss: 0.33559513092041016, mean loss: 0.33935956245987287
Epoch: 69, step: 1212, loss: 0.31456565856933594, mean loss: 0.33935931660811536
Epoch: 69, step: 1213, loss: 0.3326994478702545, mean loss: 0.3393592505707456
Epoch: 69, step: 1214, loss: 0.39263302087783813, mean loss: 0.3393597788131062
Epoch: 69, step: 1215, loss: 0.36940571665763855, mean loss: 0.33936007673419694
Epoch: 69, step: 1216, loss: 0.3237404525279999, mean loss: 0.33935992185903996
Epoch: 69, step: 1217, loss: 0.38278263807296753, mean loss: 0.33936035240930285
Epoch: 69, step: 1218, loss: 0.32717975974082947, mean loss: 0.339360231635988
Epoch: 69, step: 1219, loss: 0.295464426279068, mean loss: 0.3393597964035243
Epoch: 69, step: 1220, loss: 0.3045758605003357, mean loss: 0.33935945151981867
Epoch: 69, step: 1221, loss: 0.3461735248565674, mean loss: 0.33935951908087814
Epoch: 69, step: 1222, loss: 0.31679683923721313, mean loss: 0.33935929537570714
Epoch: 69, step: 1223, loss: 0.3376854658126831, mean loss: 0.33935927878013344
Epoch: 69, step: 1224, loss: 0.3812873363494873, mean loss: 0.3393596944815202
Epoch: 69, step: 1225, loss: 0.33982717990875244, mean loss: 0.3393596991164216
Epoch: 69, step: 1226, loss: 0.2973688244819641, mean loss: 0.33935928280048183
Epoch: 69, step: 1227, loss: 0.3019792139530182, mean loss: 0.3393589122017663
Epoch: 69, step: 1228, loss: 0.32847359776496887, mean loss: 0.3393588042821268
Epoch: 69, step: 1229, loss: 0.2896459400653839, mean loss: 0.3393583114216563
Epoch: 69, step: 1230, loss: 0.30011114478111267, mean loss: 0.3393579223234712
Epoch: 69, step: 1231, loss: 0.33992668986320496, mean loss: 0.3393579279622024
Epoch: 69, step: 1232, loss: 0.340270072221756, mean loss: 0.3393579370050625
Epoch: 69, step: 1233, loss: 0.3484279215335846, mean loss: 0.339358026922625
Epoch: 69, step: 1234, loss: 0.3277371823787689, mean loss: 0.3393579117176152
Epoch: 69, step: 1235, loss: 0.3457087278366089, mean loss: 0.33935797467677253
Epoch: 69, step: 1236, loss: 0.30645015835762024, mean loss: 0.33935764844659877
Epoch: 69, step: 1237, loss: 0.31585362553596497, mean loss: 0.33935741544282266
Epoch: 69, step: 1238, loss: 0.3286965787410736, mean loss: 0.33935730975918743
Epoch: 69, step: 1239, loss: 0.31860384345054626, mean loss: 0.3393571040267406
Epoch: 69, step: 1240, loss: 0.2962188124656677, mean loss: 0.33935667639416267
Epoch: 69, step: 1241, loss: 0.32454487681388855, mean loss: 0.3393565295653241
Epoch: 69, step: 1242, loss: 0.3543808162212372, mean loss: 0.3393566784990631
Epoch: 69, step: 1243, loss: 0.31406691670417786, mean loss: 0.3393564278075306
Epoch: 69, step: 1244, loss: 0.3324814736843109, mean loss: 0.33935635965838334
Epoch: 69, step: 1245, loss: 0.3153402805328369, mean loss: 0.33935612159729095
Epoch: 69, step: 1246, loss: 0.32422125339508057, mean loss: 0.3393559715733206
Epoch: 69, step: 1247, loss: 0.328389436006546, mean loss: 0.3393558628689119
Epoch: 69, step: 1248, loss: 0.3017592430114746, mean loss: 0.3393554902008259
Epoch: 69, step: 1249, loss: 0.29244616627693176, mean loss: 0.3393550252272525
Epoch: 69, step: 1250, loss: 0.330339252948761, mean loss: 0.3393549358621978
Epoch: 69, step: 1251, loss: 0.3068435490131378, mean loss: 0.3393546136099294
Epoch: 69, step: 1252, loss: 0.2970135509967804, mean loss: 0.33935419393025557
Epoch: 69, step: 1253, loss: 0.3411969244480133, mean loss: 0.3393542121950045
Epoch: 69, step: 1254, loss: 0.33761507272720337, mean loss: 0.33935419495719865
Epoch: 69, step: 1255, loss: 0.3127889931201935, mean loss: 0.3393539316538462
Epoch: 69, step: 1256, loss: 0.302389919757843, mean loss: 0.3393535652853975
Epoch: 69, step: 1257, loss: 0.36847203969955444, mean loss: 0.3393538538900164
Epoch: 69, step: 1258, loss: 0.3316988945007324, mean loss: 0.3393537780194639
Epoch: 69, step: 1259, loss: 0.2705007493495941, mean loss: 0.33935309560362314
Epoch: 69, step: 1260, loss: 0.3461025357246399, mean loss: 0.339353162497982
Epoch: 69, step: 1261, loss: 0.3308064341545105, mean loss: 0.339353077791364
Epoch: 69, step: 1262, loss: 0.3462749719619751, mean loss: 0.33935314639357184
Epoch: 69, step: 1263, loss: 0.36655130982398987, mean loss: 0.33935341594920543
Epoch: 69, step: 1264, loss: 0.3242877423763275, mean loss: 0.33935326663776577
Epoch: 69, step: 1265, loss: 0.3559741675853729, mean loss: 0.3393534313609719
Epoch: 69, step: 1266, loss: 0.3325694501399994, mean loss: 0.339353364128271
Epoch: 69, step: 1267, loss: 0.34844204783439636, mean loss: 0.33935345420085195
Epoch: 69, step: 1268, loss: 0.29556113481521606, mean loss: 0.33935302020531766
Epoch: 69, step: 1269, loss: 0.3379829227924347, mean loss: 0.33935300662735984
Epoch: 69, step: 1270, loss: 0.3467489778995514, mean loss: 0.3393530799222876
Epoch: 69, step: 1271, loss: 0.36184191703796387, mean loss: 0.33935330278704673
Epoch: 69, step: 1272, loss: 0.34220629930496216, mean loss: 0.33935333106001064
Epoch: 69, step: 1273, loss: 0.2952907681465149, mean loss: 0.33935289440791555
Epoch: 69, step: 1274, loss: 0.3220296800136566, mean loss: 0.3393527227396693
Epoch: 69, step: 1275, loss: 0.3556658923625946, mean loss: 0.33935288439705025
Epoch: 69, step: 1276, loss: 0.31769341230392456, mean loss: 0.3393526697619478
Epoch: 69, step: 1277, loss: 0.3044945299625397, mean loss: 0.33935232433772716
Epoch: 69, step: 1278, loss: 0.4129016399383545, mean loss: 0.3393530531621398
Epoch: 69, step: 1279, loss: 0.3018367886543274, mean loss: 0.339352681404792
Epoch: 69, step: 1280, loss: 0.3013664484024048, mean loss: 0.3393523049941476
Epoch: 69, step: 1281, loss: 0.3862995207309723, mean loss: 0.3393527701957542
Epoch: 69, step: 1282, loss: 0.3607567846775055, mean loss: 0.3393529822867825
Epoch: 69, step: 1283, loss: 0.3368666172027588, mean loss: 0.339352957649792
Epoch: 69, step: 1284, loss: 0.35508567094802856, mean loss: 0.33935311354116543
Epoch: 69, step: 1285, loss: 0.33203768730163574, mean loss: 0.3393530410552234
Epoch: 69, step: 1286, loss: 0.29525402188301086, mean loss: 0.3393526040981455
Epoch: 69, step: 1287, loss: 0.33306655287742615, mean loss: 0.33935254181314667
Epoch: 69, step: 1288, loss: 0.3685736656188965, mean loss: 0.3393528313462039
Epoch: 69, step: 1289, loss: 0.3537790775299072, mean loss: 0.339352974285052
Epoch: 69, step: 1290, loss: 0.2935298979282379, mean loss: 0.3393525202630722
Epoch: 69, step: 1291, loss: 0.33953559398651123, mean loss: 0.3393525220769764
Epoch: 69, step: 1292, loss: 0.33558711409568787, mean loss: 0.3393524847694832
Epoch: 69, step: 1293, loss: 0.3852168321609497, mean loss: 0.33935293918687537
Epoch: 69, step: 1294, loss: 0.36083683371543884, mean loss: 0.3393531520441197
Epoch: 69, step: 1295, loss: 0.3363359868526459, mean loss: 0.339353122151071
Epoch: 69, step: 1296, loss: 0.29576557874679565, mean loss: 0.339352690304763
Epoch: 69, step: 1297, loss: 0.3266680836677551, mean loss: 0.3393525646324758
Epoch: 69, step: 1298, loss: 0.34500619769096375, mean loss: 0.3393526206450885
Epoch: 69, step: 1299, loss: 0.3271443545818329, mean loss: 0.33935249969452513
Epoch: 69, step: 1300, loss: 0.3248059153556824, mean loss: 0.3393523555790438
Epoch: 69, step: 1301, loss: 0.41981515288352966, mean loss: 0.3393531527297433
Epoch: 69, step: 1302, loss: 0.33891913294792175, mean loss: 0.3393531484299208
Epoch: 69, step: 1303, loss: 0.32463231682777405, mean loss: 0.33935300259247675
Epoch: 69, step: 1304, loss: 0.313458651304245, mean loss: 0.3393527460629071
Epoch: 69, step: 1305, loss: 0.32608211040496826, mean loss: 0.3393526145949784
Epoch: 69, step: 1306, loss: 0.31735655665397644, mean loss: 0.33935239668925
Epoch: 69, step: 1307, loss: 0.3305767774581909, mean loss: 0.339352309753729
Epoch: 69, step: 1308, loss: 0.3052334487438202, mean loss: 0.3393519717591675
Epoch: 69, step: 1309, loss: 0.35297784209251404, mean loss: 0.33935210674094324
Epoch: 69, step: 1310, loss: 0.3194265365600586, mean loss: 0.3393519093544911
Epoch: 69, step: 1311, loss: 0.333726167678833, mean loss: 0.3393518536253863
Epoch: 69, step: 1312, loss: 0.3800737261772156, mean loss: 0.33935225701593547
Epoch: 69, step: 1313, loss: 0.3902263939380646, mean loss: 0.3393527609697435
Epoch: 69, step: 1314, loss: 0.3475929796695709, mean loss: 0.33935284259566795
Epoch: 69, step: 1315, loss: 0.33708876371383667, mean loss: 0.33935282016838686
Epoch: 69, step: 1316, loss: 0.32570981979370117, mean loss: 0.33935268502628735
Epoch: 69, step: 1317, loss: 0.32030346989631653, mean loss: 0.339352496334258
Epoch: 69, step: 1318, loss: 0.3394941985607147, mean loss: 0.33935249773787574
Epoch: 69, step: 1319, loss: 0.3297269642353058, mean loss: 0.3393524023940279
Epoch: 69, step: 1320, loss: 0.31607624888420105, mean loss: 0.33935217183890537
Epoch: 69, step: 1321, loss: 0.3432162404060364, mean loss: 0.33935221011292593
Epoch: 69, step: 1322, loss: 0.3531422019004822, mean loss: 0.3393523467029455
Epoch: 69, step: 1323, loss: 0.34374532103538513, mean loss: 0.3393523902149734
Epoch: 69, step: 1324, loss: 0.3012760579586029, mean loss: 0.33935201307595675
Epoch: 69, step: 1325, loss: 0.3500194549560547, mean loss: 0.3393521187339457
Epoch: 69, step: 1326, loss: 0.34043383598327637, mean loss: 0.3393521294479424
Epoch: 69, step: 1327, loss: 0.3117336928844452, mean loss: 0.33935185590057343
Epoch: 69, step: 1328, loss: 0.32991594076156616, mean loss: 0.33935176244328485
Epoch: 69, step: 1329, loss: 0.30309486389160156, mean loss: 0.3393514033432061
Epoch: 69, step: 1330, loss: 0.3138717710971832, mean loss: 0.33935115098716656
Epoch: 69, step: 1331, loss: 0.30910295248031616, mean loss: 0.33935085140513555
Epoch: 69, step: 1332, loss: 0.33839869499206543, mean loss: 0.3393508419749499
Epoch: 69, step: 1333, loss: 0.3226112425327301, mean loss: 0.33935067618709763
Epoch: 69, step: 1334, loss: 0.38024500012397766, mean loss: 0.3393510811976842
Epoch: 69, step: 1335, loss: 0.3387715816497803, mean loss: 0.33935107545847387
Epoch: 69, step: 1336, loss: 0.31922468543052673, mean loss: 0.3393508761340007
Epoch: 69, step: 1337, loss: 0.3072294592857361, mean loss: 0.33935055801827935
Epoch: 69, step: 1338, loss: 0.291544109582901, mean loss: 0.33935008456991655
Epoch: 69, step: 1339, loss: 0.30871400237083435, mean loss: 0.3393497811702751
Epoch: 69, step: 1340, loss: 0.34929749369621277, mean loss: 0.33934987968491237
Epoch: 69, step: 1341, loss: 0.3705975115299225, mean loss: 0.3393501891348108
Epoch: 69, step: 1342, loss: 0.33851104974746704, mean loss: 0.3393501808247722
Epoch: 69, step: 1343, loss: 0.35066357254981995, mean loss: 0.339350292860737
Epoch: 69, step: 1344, loss: 0.306266725063324, mean loss: 0.339349965239028
Epoch: 69, step: 1345, loss: 0.30462926626205444, mean loss: 0.3393496214084545
Epoch: 69, step: 1346, loss: 0.34566596150398254, mean loss: 0.3393496839570032
Epoch: 69, step: 1347, loss: 0.328149676322937, mean loss: 0.3393495730482688
Epoch: 69, step: 1348, loss: 0.3092527687549591, mean loss: 0.3393492750158452
Epoch: 69, step: 1349, loss: 0.3381626605987549, mean loss: 0.33934926326555886
Epoch: 69, step: 1350, loss: 0.3654744327068329, mean loss: 0.33934952196390067
Epoch: 69, step: 1351, loss: 0.31112128496170044, mean loss: 0.3393492424431952
Epoch: 69, step: 1352, loss: 0.32821977138519287, mean loss: 0.33934913223840996
Epoch: 69, step: 1353, loss: 0.36013367772102356, mean loss: 0.339349338046366
Epoch: 69, step: 1354, loss: 0.30701780319213867, mean loss: 0.339349017903632
Epoch: 69, step: 1355, loss: 0.3452654480934143, mean loss: 0.33934907648678897
Epoch: 69, step: 1356, loss: 0.3191641867160797, mean loss: 0.3393488766225432
Epoch: 69, step: 1357, loss: 0.3134949207305908, mean loss: 0.33934862062757426
Epoch: 69, step: 1358, loss: 0.3115399181842804, mean loss: 0.33934834528025565
Epoch: 69, step: 1359, loss: 0.31584784388542175, mean loss: 0.33934811259280867
Epoch: 69, step: 1360, loss: 0.29966843128204346, mean loss: 0.3393477197130072
Epoch: 69, step: 1361, loss: 0.37139785289764404, mean loss: 0.3393480370473424
Epoch: 69, step: 1362, loss: 0.37853315472602844, mean loss: 0.3393484250226459
Epoch: 69, step: 1363, loss: 0.31719261407852173, mean loss: 0.3393482056581811
Epoch: 69, step: 1364, loss: 0.2946069836616516, mean loss: 0.339347762680171
Epoch: 69, step: 1365, loss: 0.32780569791793823, mean loss: 0.33934764840456494
Epoch: 69, step: 1366, loss: 0.30832144618034363, mean loss: 0.3393473412235681
Epoch: 69, step: 1367, loss: 0.36274054646492004, mean loss: 0.339347572830289
Epoch: 69, step: 1368, loss: 0.382142573595047, mean loss: 0.339347996522193
Epoch: 69, step: 1369, loss: 0.36315155029296875, mean loss: 0.3393482321869433
Epoch: 69, step: 1370, loss: 0.3669925928115845, mean loss: 0.3393485058745157
Epoch: 69, step: 1371, loss: 0.2961359918117523, mean loss: 0.33934807806172795
Epoch: 69, step: 1372, loss: 0.32057154178619385, mean loss: 0.3393478921719926
Epoch: 69, step: 1373, loss: 0.3374418616294861, mean loss: 0.3393478733022714
Epoch: 69, step: 1374, loss: 0.37854522466659546, mean loss: 0.33934826135259627
Epoch: 69, step: 1375, loss: 0.28640493750572205, mean loss: 0.33934773722354383
Epoch: 69, step: 1376, loss: 0.33448928594589233, mean loss: 0.33934768912625657
Epoch: 69, step: 1377, loss: 0.3198293447494507, mean loss: 0.33934749590210567
Epoch: 69, step: 1378, loss: 0.326193630695343, mean loss: 0.33934736568515567
Epoch: 69, step: 1379, loss: 0.34029990434646606, mean loss: 0.3393473751147377
Epoch: 69, step: 1380, loss: 0.3130589425563812, mean loss: 0.3393471148770296
Epoch: 69, step: 1381, loss: 0.3394431173801422, mean loss: 0.3393471158273801
Epoch: 69, step: 1382, loss: 0.30499762296676636, mean loss: 0.3393467757973574
Epoch: 69, step: 1383, loss: 0.3650292158126831, mean loss: 0.3393470300285989
Epoch: 69, step: 1384, loss: 0.30996882915496826, mean loss: 0.33934673921578895
Epoch: 69, step: 1385, loss: 0.32150667905807495, mean loss: 0.33934656261999635
Epoch: 69, step: 1386, loss: 0.3673658072948456, mean loss: 0.3393468399751004
Epoch: 69, step: 1387, loss: 0.3581943213939667, mean loss: 0.33934702653949517
Epoch: 69, step: 1388, loss: 0.32086700201034546, mean loss: 0.3393468436142338
Epoch: 69, step: 1389, loss: 0.35672247409820557, mean loss: 0.3393470156059041
Epoch: 69, step: 1390, loss: 0.3825293481349945, mean loss: 0.3393474430394865
Epoch: 69, step: 1391, loss: 0.37717390060424805, mean loss: 0.3393478174550699
Epoch: 69, step: 1392, loss: 0.29522979259490967, mean loss: 0.3393473807683279
Epoch: 69, step: 1393, loss: 0.37583333253860474, mean loss: 0.33934774190810585
Epoch: 69, step: 1394, loss: 0.3308507800102234, mean loss: 0.33934765780558385
Epoch: 69, step: 1395, loss: 0.29615750908851624, mean loss: 0.33934723031579134
Epoch: 69, step: 1396, loss: 0.3120161294937134, mean loss: 0.3393469597992193
Epoch: 69, step: 1397, loss: 0.3507474958896637, mean loss: 0.339347072637829
Epoch: 69, step: 1398, loss: 0.3174230754375458, mean loss: 0.3393468556437457
Epoch: 69, step: 1399, loss: 0.3852780759334564, mean loss: 0.3393473102462665
Epoch: 69, step: 1400, loss: 0.36926206946372986, mean loss: 0.3393476063235374
Epoch: 69, step: 1401, loss: 0.3227023482322693, mean loss: 0.3393474415809842
Epoch: 69, step: 1402, loss: 0.3579961657524109, mean loss: 0.33934762615054814
Epoch: 69, step: 1403, loss: 0.3305951654911041, mean loss: 0.3393475395268282
Epoch: 69, step: 1404, loss: 0.29965612292289734, mean loss: 0.33934714670196897
Epoch: 69, step: 1405, loss: 0.3337882161140442, mean loss: 0.3393470916859302
Epoch: 69, step: 1406, loss: 0.3518918454647064, mean loss: 0.3393472158385561
Epoch: 69, step: 1407, loss: 0.3638855814933777, mean loss: 0.33934745868687616
Epoch: 69, step: 1408, loss: 0.30446386337280273, mean loss: 0.33934711345855895
Epoch: 69, step: 1409, loss: 0.3304041624069214, mean loss: 0.3393470249547978
Epoch: 69, step: 1410, loss: 0.33314386010169983, mean loss: 0.3393469635658911
Epoch: 69, step: 1411, loss: 0.34501463174819946, mean loss: 0.33934701965476155
Epoch: 69, step: 1412, loss: 0.34478452801704407, mean loss: 0.33934707346537185
Epoch: 69, step: 1413, loss: 0.3189270496368408, mean loss: 0.3393468713869569
Epoch: 69, step: 1414, loss: 0.3669685423374176, mean loss: 0.3393471447308224
Epoch: 69, step: 1415, loss: 0.34918412566185, mean loss: 0.3393472420765546
Epoch: 69, step: 1416, loss: 0.3230226933956146, mean loss: 0.3393470805321306
Epoch: 69, step: 1417, loss: 0.35452190041542053, mean loss: 0.33934723069758554
Epoch: 69, step: 1418, loss: 0.35816022753715515, mean loss: 0.3393474168635035
Epoch: 69, step: 1419, loss: 0.3259205222129822, mean loss: 0.3393472839976207
Epoch: 69, step: 1420, loss: 0.32328546047210693, mean loss: 0.3393471250593628
Epoch: 69, step: 1421, loss: 0.33884185552597046, mean loss: 0.33934712005956535
Epoch: 69, step: 1422, loss: 0.335720032453537, mean loss: 0.3393470841687728
Epoch: 69, step: 1423, loss: 0.32926568388938904, mean loss: 0.3393469844121898
Epoch: 69, step: 1424, loss: 0.2900165915489197, mean loss: 0.3393464962872666
Epoch: 69, step: 1425, loss: 0.3374060392379761, mean loss: 0.3393464770866071
Epoch: 69, step: 1426, loss: 0.34338632225990295, mean loss: 0.3393465170601402
Epoch: 69, step: 1427, loss: 0.3240230679512024, mean loss: 0.3393463654388991
Epoch: 69, step: 1428, loss: 0.2997492551803589, mean loss: 0.33934597364045
Epoch: 69, step: 1429, loss: 0.36884501576423645, mean loss: 0.3393462655194412
Epoch: 69, step: 1430, loss: 0.4164787530899048, mean loss: 0.3393470287011679
Epoch: 69, step: 1431, loss: 0.3439960777759552, mean loss: 0.339347074700387
Epoch: 69, step: 1432, loss: 0.2930828928947449, mean loss: 0.33934661695190027
Epoch: 69, step: 1433, loss: 0.30138832330703735, mean loss: 0.33934624138750286
Epoch: 69, step: 1434, loss: 0.3356478810310364, mean loss: 0.33934620479579647
Epoch: 69, step: 1435, loss: 0.3384687006473541, mean loss: 0.3393461961138257
Epoch: 69, step: 1436, loss: 0.2896639406681061, mean loss: 0.3393457045655839
Epoch: 69, step: 1437, loss: 0.2961360216140747, mean loss: 0.3393452770601626
Epoch: 69, step: 1438, loss: 0.3605451285839081, mean loss: 0.3393454868039323
Epoch: 69, step: 1439, loss: 0.312370628118515, mean loss: 0.33934521992694183
Epoch: 69, step: 1440, loss: 0.3099993169307709, mean loss: 0.3393449295947892
Epoch: 69, step: 1441, loss: 0.3683639466762543, mean loss: 0.33934521669007284
Epoch: 69, step: 1442, loss: 0.34949836134910583, mean loss: 0.3393453171376896
Epoch: 69, step: 1443, loss: 0.3235085904598236, mean loss: 0.33934516046251473
Valid: 69, mean loss: 0.1847439830501874
Epoch: 70, step: 0, loss: 0.3399142026901245, mean loss: 0.3393451660920814
Epoch: 70, step: 1, loss: 0.3112677037715912, mean loss: 0.3393448883229205
Epoch: 70, step: 2, loss: 0.3145778477191925, mean loss: 0.3393446433060472
Epoch: 70, step: 3, loss: 0.38677358627319336, mean loss: 0.33934511250931343
Epoch: 70, step: 4, loss: 0.3526650369167328, mean loss: 0.3393452442788579
Epoch: 70, step: 5, loss: 0.31946781277656555, mean loss: 0.3393450476400405
Epoch: 70, step: 6, loss: 0.32849234342575073, mean loss: 0.33934494028000195
Epoch: 70, step: 7, loss: 0.35393208265304565, mean loss: 0.3393450845814262
Epoch: 70, step: 8, loss: 0.311441570520401, mean loss: 0.3393448085522434
Epoch: 70, step: 9, loss: 0.3487342596054077, mean loss: 0.3393449014343391
Epoch: 70, step: 10, loss: 0.3013851046562195, mean loss: 0.33934452593308995
Epoch: 70, step: 11, loss: 0.35316193103790283, mean loss: 0.33934466261457913
Epoch: 70, step: 12, loss: 0.36120283603668213, mean loss: 0.33934487883304554
Epoch: 70, step: 13, loss: 0.34343045949935913, mean loss: 0.33934491924672655
Epoch: 70, step: 14, loss: 0.3020927906036377, mean loss: 0.3393445507603658
Epoch: 70, step: 15, loss: 0.2982984185218811, mean loss: 0.33934414474892877
Epoch: 70, step: 16, loss: 0.29142752289772034, mean loss: 0.3393436707821261
Epoch: 70, step: 17, loss: 0.3381201922893524, mean loss: 0.3393436586802201
Epoch: 70, step: 18, loss: 0.3334525525569916, mean loss: 0.33934360040955347
Epoch: 70, step: 19, loss: 0.3073314428329468, mean loss: 0.33934328377100176
Epoch: 70, step: 20, loss: 0.30193638801574707, mean loss: 0.33934291377569253
Epoch: 70, step: 21, loss: 0.3107849061489105, mean loss: 0.33934263130840575
Epoch: 70, step: 22, loss: 0.39039307832717896, mean loss: 0.3393431362434425
Epoch: 70, step: 23, loss: 0.2972337603569031, mean loss: 0.33934271974779556
Epoch: 70, step: 24, loss: 0.32028740644454956, mean loss: 0.33934253127726194
Epoch: 70, step: 25, loss: 0.30559006333351135, mean loss: 0.33934219744476984
Epoch: 70, step: 26, loss: 0.30830392241477966, mean loss: 0.3393418904603372
Epoch: 70, step: 27, loss: 0.3720319867134094, mean loss: 0.3393422137789297
Epoch: 70, step: 28, loss: 0.3670942783355713, mean loss: 0.3393424882556287
Epoch: 70, step: 29, loss: 0.3878590166568756, mean loss: 0.339342968094699
Epoch: 70, step: 30, loss: 0.329596608877182, mean loss: 0.33934287170202937
Epoch: 70, step: 31, loss: 0.34240084886550903, mean loss: 0.33934290194549366
Epoch: 70, step: 32, loss: 0.3034369647502899, mean loss: 0.33934254683846293
Epoch: 70, step: 33, loss: 0.3273909091949463, mean loss: 0.3393424286388304
Epoch: 70, step: 34, loss: 0.3827104866504669, mean loss: 0.3393428575371938
Epoch: 70, step: 35, loss: 0.32699066400527954, mean loss: 0.3393427353785489
Epoch: 70, step: 36, loss: 0.3407233655452728, mean loss: 0.33934274903233774
Epoch: 70, step: 37, loss: 0.3198774456977844, mean loss: 0.33934255653146417
Epoch: 70, step: 38, loss: 0.3292582035064697, mean loss: 0.33934245680388553
Epoch: 70, step: 39, loss: 0.3331877291202545, mean loss: 0.33934239593830323
Epoch: 70, step: 40, loss: 0.3448602855205536, mean loss: 0.33934245050550077
Epoch: 70, step: 41, loss: 0.29810649156570435, mean loss: 0.3393420427212507
Epoch: 70, step: 42, loss: 0.34703242778778076, mean loss: 0.33934211877106196
Epoch: 70, step: 43, loss: 0.3702869117259979, mean loss: 0.33934242477945714
Epoch: 70, step: 44, loss: 0.35347381234169006, mean loss: 0.33934256452123773
Epoch: 70, step: 45, loss: 0.324256956577301, mean loss: 0.339342415344884
Epoch: 70, step: 46, loss: 0.304913192987442, mean loss: 0.3393420748895916
Epoch: 70, step: 47, loss: 0.3472730815410614, mean loss: 0.3393421533150193
Epoch: 70, step: 48, loss: 0.34510934352874756, mean loss: 0.3393422103430747
Epoch: 70, step: 49, loss: 0.31195196509361267, mean loss: 0.3393419395011361
Epoch: 70, step: 50, loss: 0.30855637788772583, mean loss: 0.3393416350884277
Epoch: 70, step: 51, loss: 0.34283754229545593, mean loss: 0.33934166965619267
Epoch: 70, step: 52, loss: 0.34641575813293457, mean loss: 0.33934173960456243
Epoch: 70, step: 53, loss: 0.3418247699737549, mean loss: 0.33934176415644773
Epoch: 70, step: 54, loss: 0.35107505321502686, mean loss: 0.3393418801725555
Epoch: 70, step: 55, loss: 0.288244366645813, mean loss: 0.3393413749368973
Epoch: 70, step: 56, loss: 0.3188624978065491, mean loss: 0.3393411724503975
Epoch: 70, step: 57, loss: 0.35625991225242615, mean loss: 0.3393413397341069
Epoch: 70, step: 58, loss: 0.3295672535896301, mean loss: 0.33934124309397656
Epoch: 70, step: 59, loss: 0.3260384500026703, mean loss: 0.33934111156547064
Epoch: 70, step: 60, loss: 0.3394601047039032, mean loss: 0.3393411127419781
Epoch: 70, step: 61, loss: 0.3850497901439667, mean loss: 0.33934156466775967
Epoch: 70, step: 62, loss: 0.32965123653411865, mean loss: 0.339341468859566
Epoch: 70, step: 63, loss: 0.35761788487434387, mean loss: 0.3393416495565526
Epoch: 70, step: 64, loss: 0.32038500905036926, mean loss: 0.3393414621361116
Epoch: 70, step: 65, loss: 0.3399486839771271, mean loss: 0.3393414681395308
Epoch: 70, step: 66, loss: 0.33966901898384094, mean loss: 0.3393414713778952
Epoch: 70, step: 67, loss: 0.3593433201313019, mean loss: 0.33934166912623187
Epoch: 70, step: 68, loss: 0.34637755155563354, mean loss: 0.3393417386858165
Epoch: 70, step: 69, loss: 0.31609779596328735, mean loss: 0.33934150888905207
Epoch: 70, step: 70, loss: 0.31865018606185913, mean loss: 0.3393413043302951
Epoch: 70, step: 71, loss: 0.31804969906806946, mean loss: 0.339341093839101
Epoch: 70, step: 72, loss: 0.32132166624069214, mean loss: 0.3393409156987829
Epoch: 70, step: 73, loss: 0.3408743441104889, mean loss: 0.33934093085812816
Epoch: 70, step: 74, loss: 0.31000882387161255, mean loss: 0.33934064088623367
Epoch: 70, step: 75, loss: 0.3683302104473114, mean loss: 0.3393409274690321
Epoch: 70, step: 76, loss: 0.3295861780643463, mean loss: 0.3393408310372537
Epoch: 70, step: 77, loss: 0.3530299663543701, mean loss: 0.33934096636155153
Epoch: 70, step: 78, loss: 0.385769784450531, mean loss: 0.33934142533028483
Epoch: 70, step: 79, loss: 0.3212237060070038, mean loss: 0.3393412462306474
Epoch: 70, step: 80, loss: 0.3306109309196472, mean loss: 0.33934115992945113
Epoch: 70, step: 81, loss: 0.2928289771080017, mean loss: 0.33934070015025714
Epoch: 70, step: 82, loss: 0.3757440745830536, mean loss: 0.339341059998961
Epoch: 70, step: 83, loss: 0.3295018672943115, mean loss: 0.33934096273913833
Epoch: 70, step: 84, loss: 0.3467784523963928, mean loss: 0.33934103625754547
Epoch: 70, step: 85, loss: 0.35156935453414917, mean loss: 0.3393411571313398
Epoch: 70, step: 86, loss: 0.3850487172603607, mean loss: 0.33934160893439935
Epoch: 70, step: 87, loss: 0.3057568371295929, mean loss: 0.33934127696409444
Epoch: 70, step: 88, loss: 0.31392133235931396, mean loss: 0.3393410257019034
Epoch: 70, step: 89, loss: 0.3297456204891205, mean loss: 0.3393409308575304
Epoch: 70, step: 90, loss: 0.334663063287735, mean loss: 0.33934088462029277
Epoch: 70, step: 91, loss: 0.38227301836013794, mean loss: 0.33934130896827186
Epoch: 70, step: 92, loss: 0.297650009393692, mean loss: 0.33934089688896635
Epoch: 70, step: 93, loss: 0.3442959785461426, mean loss: 0.33934094586480656
Epoch: 70, step: 94, loss: 0.3420839309692383, mean loss: 0.3393409729760999
Epoch: 70, step: 95, loss: 0.3440084755420685, mean loss: 0.33934101910860726
Epoch: 70, step: 96, loss: 0.31029799580574036, mean loss: 0.33934073205697196
Epoch: 70, step: 97, loss: 0.3768482506275177, mean loss: 0.33934110276521456
Epoch: 70, step: 98, loss: 0.3700477182865143, mean loss: 0.3393414062532459
Epoch: 70, step: 99, loss: 0.3149990737438202, mean loss: 0.33934116566881706
Epoch: 70, step: 100, loss: 0.36678269505500793, mean loss: 0.3393414368810939
Epoch: 70, step: 101, loss: 0.3427616059780121, mean loss: 0.3393414706832435
Epoch: 70, step: 102, loss: 0.3101133406162262, mean loss: 0.3393411818192044
Epoch: 70, step: 103, loss: 0.34865620732307434, mean loss: 0.33934127387946594
Epoch: 70, step: 104, loss: 0.3037801682949066, mean loss: 0.33934092243305014
Epoch: 70, step: 105, loss: 0.33374032378196716, mean loss: 0.3393408670835092
Epoch: 70, step: 106, loss: 0.32622629404067993, mean loss: 0.3393407374762173
Epoch: 70, step: 107, loss: 0.3091696798801422, mean loss: 0.33934043930788116
Epoch: 70, step: 108, loss: 0.2923639416694641, mean loss: 0.339339975062779
Epoch: 70, step: 109, loss: 0.3277255892753601, mean loss: 0.33933986028477936
Epoch: 70, step: 110, loss: 0.36495548486709595, mean loss: 0.3393401134261119
Epoch: 70, step: 111, loss: 0.36287277936935425, mean loss: 0.33934034598072044
Epoch: 70, step: 112, loss: 0.3030770719051361, mean loss: 0.33933998762318507
Epoch: 70, step: 113, loss: 0.3338531255722046, mean loss: 0.33933993340196594
Epoch: 70, step: 114, loss: 0.29154643416404724, mean loss: 0.3393394611108524
Epoch: 70, step: 115, loss: 0.2895892262458801, mean loss: 0.3393389694883094
Epoch: 70, step: 116, loss: 0.33401691913604736, mean loss: 0.33933891689732
Epoch: 70, step: 117, loss: 0.279611736536026, mean loss: 0.3393383266961267
Epoch: 70, step: 118, loss: 0.3218703866004944, mean loss: 0.33933815408631735
Epoch: 70, step: 119, loss: 0.3122422397136688, mean loss: 0.3393378863401279
Epoch: 70, step: 120, loss: 0.312343567609787, mean loss: 0.33933761960048375
Epoch: 70, step: 121, loss: 0.30630892515182495, mean loss: 0.33933729323643513
Epoch: 70, step: 122, loss: 0.3259558081626892, mean loss: 0.33933716101224143
Epoch: 70, step: 123, loss: 0.3205246925354004, mean loss: 0.33933697512563143
Epoch: 70, step: 124, loss: 0.3688820004463196, mean loss: 0.3393372670580984
Epoch: 70, step: 125, loss: 0.3501662313938141, mean loss: 0.339337374057331
Epoch: 70, step: 126, loss: 0.32429200410842896, mean loss: 0.33933722539795025
Epoch: 70, step: 127, loss: 0.3563019931316376, mean loss: 0.3393373930207442
Epoch: 70, step: 128, loss: 0.30802303552627563, mean loss: 0.33933708361785025
Epoch: 70, step: 129, loss: 0.32045018672943115, mean loss: 0.3393368970068742
Epoch: 70, step: 130, loss: 0.35393062233924866, mean loss: 0.3393370411979733
Epoch: 70, step: 131, loss: 0.32739898562431335, mean loss: 0.33933692324698356
Epoch: 70, step: 132, loss: 0.40033963322639465, mean loss: 0.33933752596313643
Epoch: 70, step: 133, loss: 0.3800789713859558, mean loss: 0.33933792849090355
Epoch: 70, step: 134, loss: 0.3145785331726074, mean loss: 0.33933768386910523
Epoch: 70, step: 135, loss: 0.29220688343048096, mean loss: 0.33933721822335317
Epoch: 70, step: 136, loss: 0.3402913212776184, mean loss: 0.3393372276496655
Epoch: 70, step: 137, loss: 0.3220396637916565, mean loss: 0.3393370567555177
Epoch: 70, step: 138, loss: 0.4096699655056, mean loss: 0.3393377516142769
Epoch: 70, step: 139, loss: 0.3405960500240326, mean loss: 0.33933776404559884
Epoch: 70, step: 140, loss: 0.3008604645729065, mean loss: 0.3393373839140108
Epoch: 70, step: 141, loss: 0.33995115756988525, mean loss: 0.3393373899776497
Epoch: 70, step: 142, loss: 0.3654812276363373, mean loss: 0.33933764825726653
Epoch: 70, step: 143, loss: 0.39373576641082764, mean loss: 0.3393381856606309
Epoch: 70, step: 144, loss: 0.34005406498908997, mean loss: 0.33933819273279026
Epoch: 70, step: 145, loss: 0.33709362149238586, mean loss: 0.3393381705589294
Epoch: 70, step: 146, loss: 0.36923351883888245, mean loss: 0.33933846588871575
Epoch: 70, step: 147, loss: 0.32729223370552063, mean loss: 0.33933834688772607
Epoch: 70, step: 148, loss: 0.32578325271606445, mean loss: 0.33933821298247985
Epoch: 70, step: 149, loss: 0.3645448386669159, mean loss: 0.3393384619859935
Epoch: 70, step: 150, loss: 0.3778354823589325, mean loss: 0.3393388422748415
Epoch: 70, step: 151, loss: 0.3084026873111725, mean loss: 0.339338536678242
Epoch: 70, step: 152, loss: 0.3017047941684723, mean loss: 0.33933816492454005
Epoch: 70, step: 153, loss: 0.3337031602859497, mean loss: 0.3393381092613771
Epoch: 70, step: 154, loss: 0.3228367269039154, mean loss: 0.3393379462606129
Epoch: 70, step: 155, loss: 0.3548178970813751, mean loss: 0.3393380991701591
Epoch: 70, step: 156, loss: 0.3338257968425751, mean loss: 0.33933804472067597
Epoch: 70, step: 157, loss: 0.3158082664012909, mean loss: 0.33933781230025756
Epoch: 70, step: 158, loss: 0.3691312372684479, mean loss: 0.3393381065882787
Epoch: 70, step: 159, loss: 0.3456926643848419, mean loss: 0.33933816935554256
Epoch: 70, step: 160, loss: 0.3374263346195221, mean loss: 0.3393381504715456
Epoch: 70, step: 161, loss: 0.37689757347106934, mean loss: 0.3393385214581223
Epoch: 70, step: 162, loss: 0.3203074634075165, mean loss: 0.3393383334840594
Epoch: 70, step: 163, loss: 0.3207146227359772, mean loss: 0.3393381495352748
Epoch: 70, step: 164, loss: 0.3315267264842987, mean loss: 0.33933807238160746
Epoch: 70, step: 165, loss: 0.3362754285335541, mean loss: 0.33933804213207813
Epoch: 70, step: 166, loss: 0.30677542090415955, mean loss: 0.3393377205164132
Epoch: 70, step: 167, loss: 0.35150620341300964, mean loss: 0.3393378407013343
Epoch: 70, step: 168, loss: 0.32931214570999146, mean loss: 0.33933774168114655
Epoch: 70, step: 169, loss: 0.316864550113678, mean loss: 0.33933751972369897
Epoch: 70, step: 170, loss: 0.31224632263183594, mean loss: 0.3393372521589629
Epoch: 70, step: 171, loss: 0.3465045094490051, mean loss: 0.33933732294529095
Epoch: 70, step: 172, loss: 0.32891151309013367, mean loss: 0.3393372199773803
Epoch: 70, step: 173, loss: 0.31094908714294434, mean loss: 0.3393369396118359
Epoch: 70, step: 174, loss: 0.32654136419296265, mean loss: 0.33933681324202286
Epoch: 70, step: 175, loss: 0.3555344343185425, mean loss: 0.3393369732090478
Epoch: 70, step: 176, loss: 0.3973635137081146, mean loss: 0.3393375462710633
Epoch: 70, step: 177, loss: 0.3195517063140869, mean loss: 0.339337350870799
Epoch: 70, step: 178, loss: 0.3479097783565521, mean loss: 0.3393374355292243
Epoch: 70, step: 179, loss: 0.3548433184623718, mean loss: 0.3393375886586232
Epoch: 70, step: 180, loss: 0.3216584622859955, mean loss: 0.3393374140689354
Epoch: 70, step: 181, loss: 0.302174836397171, mean loss: 0.33933704707462686
Epoch: 70, step: 182, loss: 0.3438930809497833, mean loss: 0.33933709206671553
Epoch: 70, step: 183, loss: 0.37392085790634155, mean loss: 0.3393374335875506
Epoch: 70, step: 184, loss: 0.3373831510543823, mean loss: 0.3393374142888538
Epoch: 70, step: 185, loss: 0.30703550577163696, mean loss: 0.3393370953080654
Epoch: 70, step: 186, loss: 0.35192546248435974, mean loss: 0.3393372196167462
Epoch: 70, step: 187, loss: 0.3709544837474823, mean loss: 0.33933753183051685
Epoch: 70, step: 188, loss: 0.3132413923740387, mean loss: 0.33933727413922476
Epoch: 70, step: 189, loss: 0.3510214388370514, mean loss: 0.3393373895155919
Epoch: 70, step: 190, loss: 0.3253965377807617, mean loss: 0.3393372518567188
Epoch: 70, step: 191, loss: 0.3094712495803833, mean loss: 0.33933695694793575
Epoch: 70, step: 192, loss: 0.35391315817832947, mean loss: 0.3393371008777219
Epoch: 70, step: 193, loss: 0.36344093084335327, mean loss: 0.33933733888382384
Epoch: 70, step: 194, loss: 0.35955342650413513, mean loss: 0.3393375384995989
Epoch: 70, step: 195, loss: 0.3181071877479553, mean loss: 0.3393373288709529
Epoch: 70, step: 196, loss: 0.3508356511592865, mean loss: 0.33933744240435426
Epoch: 70, step: 197, loss: 0.34046822786331177, mean loss: 0.33933745356951805
Epoch: 70, step: 198, loss: 0.32955172657966614, mean loss: 0.3393373569480369
Epoch: 70, step: 199, loss: 0.3782792091369629, mean loss: 0.3393377414449977
Epoch: 70, step: 200, loss: 0.32031992077827454, mean loss: 0.33933755367216106
Epoch: 70, step: 201, loss: 0.32755813002586365, mean loss: 0.339337437368932
Epoch: 70, step: 202, loss: 0.33519136905670166, mean loss: 0.3393373964334511
Epoch: 70, step: 203, loss: 0.34354132413864136, mean loss: 0.3393374379397868
Epoch: 70, step: 204, loss: 0.3189689517021179, mean loss: 0.3393372368390687
Epoch: 70, step: 205, loss: 0.35089272260665894, mean loss: 0.33933735092675865
Epoch: 70, step: 206, loss: 0.31764209270477295, mean loss: 0.3393371367308774
Epoch: 70, step: 207, loss: 0.3439531922340393, mean loss: 0.3393371823044449
Epoch: 70, step: 208, loss: 0.3217533528804779, mean loss: 0.33933700870386213
Epoch: 70, step: 209, loss: 0.34141626954078674, mean loss: 0.33933702923166187
Epoch: 70, step: 210, loss: 0.36848074197769165, mean loss: 0.3393373169542902
Epoch: 70, step: 211, loss: 0.29317158460617065, mean loss: 0.3393368611854995
Epoch: 70, step: 212, loss: 0.3211023807525635, mean loss: 0.33933668116831733
Epoch: 70, step: 213, loss: 0.35512420535087585, mean loss: 0.33933683702675105
Epoch: 70, step: 214, loss: 0.3355705738067627, mean loss: 0.33933679984561455
Epoch: 70, step: 215, loss: 0.31469103693962097, mean loss: 0.3393365565412106
Epoch: 70, step: 216, loss: 0.3499414026737213, mean loss: 0.33933666123183454
Epoch: 70, step: 217, loss: 0.34192731976509094, mean loss: 0.33933668680646123
Epoch: 70, step: 218, loss: 0.30155104398727417, mean loss: 0.3393363137954461
Epoch: 70, step: 219, loss: 0.35912466049194336, mean loss: 0.33933650913944113
Epoch: 70, step: 220, loss: 0.3255867660045624, mean loss: 0.3393363734078774
Epoch: 70, step: 221, loss: 0.35317474603652954, mean loss: 0.33933651001300497
Epoch: 70, step: 222, loss: 0.30400633811950684, mean loss: 0.33933616125559507
Epoch: 70, step: 223, loss: 0.3187607228755951, mean loss: 0.33933595814971196
Epoch: 70, step: 224, loss: 0.2978520393371582, mean loss: 0.33933554865443716
Epoch: 70, step: 225, loss: 0.33310186862945557, mean loss: 0.3393354871212602
Epoch: 70, step: 226, loss: 0.31297996640205383, mean loss: 0.33933522696627866
Epoch: 70, step: 227, loss: 0.4024015963077545, mean loss: 0.33933584948739587
Epoch: 70, step: 228, loss: 0.3279346823692322, mean loss: 0.3393357369488542
Epoch: 70, step: 229, loss: 0.31589096784591675, mean loss: 0.33933550553271463
Epoch: 70, step: 230, loss: 0.30074813961982727, mean loss: 0.33933512465239646
Epoch: 70, step: 231, loss: 0.3412955701351166, mean loss: 0.3393351440029717
Epoch: 70, step: 232, loss: 0.34379416704177856, mean loss: 0.33933518801532
Epoch: 70, step: 233, loss: 0.3560846447944641, mean loss: 0.3393353533375536
Epoch: 70, step: 234, loss: 0.32616424560546875, mean loss: 0.33933522333599675
Epoch: 70, step: 235, loss: 0.32952624559402466, mean loss: 0.3393351265203137
Epoch: 70, step: 236, loss: 0.33040371537208557, mean loss: 0.33933503836717904
Epoch: 70, step: 237, loss: 0.3450627326965332, mean loss: 0.3393350948990325
Epoch: 70, step: 238, loss: 0.35924696922302246, mean loss: 0.33933529142559044
Epoch: 70, step: 239, loss: 0.32604268193244934, mean loss: 0.33933516023126065
Epoch: 70, step: 240, loss: 0.4170398414134979, mean loss: 0.339335927147114
Epoch: 70, step: 241, loss: 0.4087343215942383, mean loss: 0.33933661207629473
Epoch: 70, step: 242, loss: 0.3144339621067047, mean loss: 0.3393363663013969
Epoch: 70, step: 243, loss: 0.3313369154930115, mean loss: 0.3393362873521765
Epoch: 70, step: 244, loss: 0.30994269251823425, mean loss: 0.3393359972599502
Epoch: 70, step: 245, loss: 0.34397533535957336, mean loss: 0.3393360430462054
Epoch: 70, step: 246, loss: 0.3222759962081909, mean loss: 0.33933587467995713
Epoch: 70, step: 247, loss: 0.3426647484302521, mean loss: 0.339335907532414
Epoch: 70, step: 248, loss: 0.3560452163219452, mean loss: 0.33933607243396036
Epoch: 70, step: 249, loss: 0.3284730315208435, mean loss: 0.33933596522937226
Epoch: 70, step: 250, loss: 0.3705316483974457, mean loss: 0.33933627308859765
Epoch: 70, step: 251, loss: 0.3088061511516571, mean loss: 0.33933597180053526
Epoch: 70, step: 252, loss: 0.30740103125572205, mean loss: 0.339335656652059
Epoch: 70, step: 253, loss: 0.3102339804172516, mean loss: 0.33933536946635395
Epoch: 70, step: 254, loss: 0.30659642815589905, mean loss: 0.33933504639001005
Epoch: 70, step: 255, loss: 0.3332922160625458, mean loss: 0.3393349867583853
Epoch: 70, step: 256, loss: 0.3131200075149536, mean loss: 0.33933472806729276
Epoch: 70, step: 257, loss: 0.34107792377471924, mean loss: 0.3393347452690898
Epoch: 70, step: 258, loss: 0.30930376052856445, mean loss: 0.3393344489272595
Epoch: 70, step: 259, loss: 0.319345623254776, mean loss: 0.3393342516820881
Epoch: 70, step: 260, loss: 0.3201676607131958, mean loss: 0.3393340625524074
Epoch: 70, step: 261, loss: 0.30701836943626404, mean loss: 0.33933374367481356
Epoch: 70, step: 262, loss: 0.31935667991638184, mean loss: 0.3393335465515415
Epoch: 70, step: 263, loss: 0.3280610740184784, mean loss: 0.33933343532174465
Epoch: 70, step: 264, loss: 0.31549811363220215, mean loss: 0.3393332001318321
Epoch: 70, step: 265, loss: 0.3139875829219818, mean loss: 0.33933295004187086
Epoch: 70, step: 266, loss: 0.3739865720272064, mean loss: 0.339333291972288
Epoch: 70, step: 267, loss: 0.3086768090724945, mean loss: 0.3393329894849878
Epoch: 70, step: 268, loss: 0.34113699197769165, mean loss: 0.339333007284892
Epoch: 70, step: 269, loss: 0.30277955532073975, mean loss: 0.3393326466193571
Epoch: 70, step: 270, loss: 0.336856484413147, mean loss: 0.3393326221878053
Epoch: 70, step: 271, loss: 0.3106447160243988, mean loss: 0.33933233913560934
Epoch: 70, step: 272, loss: 0.3476339876651764, mean loss: 0.3393324210438758
Epoch: 70, step: 273, loss: 0.3126814663410187, mean loss: 0.3393321580946611
Epoch: 70, step: 274, loss: 0.29743191599845886, mean loss: 0.33933174469382155
Epoch: 70, step: 275, loss: 0.322070837020874, mean loss: 0.33933157439401024
Epoch: 70, step: 276, loss: 0.31276535987854004, mean loss: 0.339331312288635
Epoch: 70, step: 277, loss: 0.32979312539100647, mean loss: 0.33933121818469747
Epoch: 70, step: 278, loss: 0.31016114354133606, mean loss: 0.33933093039501283
Epoch: 70, step: 279, loss: 0.3492984473705292, mean loss: 0.3393310287327888
Epoch: 70, step: 280, loss: 0.3084726631641388, mean loss: 0.33933072429256456
Epoch: 70, step: 281, loss: 0.301957905292511, mean loss: 0.3393303555861558
Epoch: 70, step: 282, loss: 0.3761539161205292, mean loss: 0.33933071887019967
Epoch: 70, step: 283, loss: 0.3299095332622528, mean loss: 0.3393306259261011
Epoch: 70, step: 284, loss: 0.32223063707351685, mean loss: 0.33933045722892896
Epoch: 70, step: 285, loss: 0.31918248534202576, mean loss: 0.33933025846433446
Epoch: 70, step: 286, loss: 0.3253304362297058, mean loss: 0.3393301203540793
Epoch: 70, step: 287, loss: 0.3343949615955353, mean loss: 0.33933007166851026
Epoch: 70, step: 288, loss: 0.33051055669784546, mean loss: 0.3393299846644462
Epoch: 70, step: 289, loss: 0.32010418176651, mean loss: 0.33932979500475496
Epoch: 70, step: 290, loss: 0.3484382927417755, mean loss: 0.33932988485784643
Epoch: 70, step: 291, loss: 0.3259812593460083, mean loss: 0.33932975317823555
Epoch: 70, step: 292, loss: 0.3473876416683197, mean loss: 0.3393298326657568
Epoch: 70, step: 293, loss: 0.3614530861377716, mean loss: 0.3393300508997564
Epoch: 70, step: 294, loss: 0.32336583733558655, mean loss: 0.33932989342292713
Epoch: 70, step: 295, loss: 0.3256186544895172, mean loss: 0.3393297581715961
Epoch: 70, step: 296, loss: 0.3423590064048767, mean loss: 0.33932978805261677
Epoch: 70, step: 297, loss: 0.33722203969955444, mean loss: 0.339329767261633
Epoch: 70, step: 298, loss: 0.3145013153553009, mean loss: 0.3393295223543849
Epoch: 70, step: 299, loss: 0.34050068259239197, mean loss: 0.33932953390656717
Epoch: 70, step: 300, loss: 0.33038535714149475, mean loss: 0.3393294456831647
Epoch: 70, step: 301, loss: 0.3546263873577118, mean loss: 0.33932959656736184
Epoch: 70, step: 302, loss: 0.3064252436161041, mean loss: 0.3393292720124271
Epoch: 70, step: 303, loss: 0.3357618451118469, mean loss: 0.33932923682515
Epoch: 70, step: 304, loss: 0.32266655564308167, mean loss: 0.3393290724745934
Epoch: 70, step: 305, loss: 0.3359226882457733, mean loss: 0.33932903887642174
Epoch: 70, step: 306, loss: 0.306753545999527, mean loss: 0.3393287175779034
Epoch: 70, step: 307, loss: 0.3163563013076782, mean loss: 0.3393284909986606
Epoch: 70, step: 308, loss: 0.3190072774887085, mean loss: 0.33932829057047303
Epoch: 70, step: 309, loss: 0.3233047425746918, mean loss: 0.3393281325317316
Epoch: 70, step: 310, loss: 0.31870660185813904, mean loss: 0.33932792914552695
Epoch: 70, step: 311, loss: 0.3343871831893921, mean loss: 0.3393278804163772
Epoch: 70, step: 312, loss: 0.318302184343338, mean loss: 0.33932767304805717
Epoch: 70, step: 313, loss: 0.31400203704833984, mean loss: 0.33932742327355375
Epoch: 70, step: 314, loss: 0.28704634308815, mean loss: 0.33932690765562207
Epoch: 70, step: 315, loss: 0.3365325331687927, mean loss: 0.3393268800966011
Epoch: 70, step: 316, loss: 0.3861580491065979, mean loss: 0.3393273419561138
Epoch: 70, step: 317, loss: 0.31799015402793884, mean loss: 0.3393271315260469
Epoch: 70, step: 318, loss: 0.3377377688884735, mean loss: 0.33932711585170455
Epoch: 70, step: 319, loss: 0.3281843960285187, mean loss: 0.3393270059629489
Epoch: 70, step: 320, loss: 0.37767350673675537, mean loss: 0.33932738412983854
Epoch: 70, step: 321, loss: 0.32895129919052124, mean loss: 0.33932728180360294
Epoch: 70, step: 322, loss: 0.2953791320323944, mean loss: 0.33932684840271965
Epoch: 70, step: 323, loss: 0.3218810558319092, mean loss: 0.3393266763602699
Epoch: 70, step: 324, loss: 0.33375683426856995, mean loss: 0.3393266214335691
Epoch: 70, step: 325, loss: 0.3293318748474121, mean loss: 0.3393265228718806
Epoch: 70, step: 326, loss: 0.3366990089416504, mean loss: 0.3393264969613031
Epoch: 70, step: 327, loss: 0.3005639314651489, mean loss: 0.33932611471763896
Epoch: 70, step: 328, loss: 0.2984190881252289, mean loss: 0.3393257113310895
Epoch: 70, step: 329, loss: 0.3313435912132263, mean loss: 0.33932563261971865
Epoch: 70, step: 330, loss: 0.3340207636356354, mean loss: 0.3393255803091312
Epoch: 70, step: 331, loss: 0.3149283528327942, mean loss: 0.3393253397337804
Epoch: 70, step: 332, loss: 0.3337327837944031, mean loss: 0.33932528458743877
Epoch: 70, step: 333, loss: 0.3021705448627472, mean loss: 0.33932491822047045
Epoch: 70, step: 334, loss: 0.30658093094825745, mean loss: 0.3393245953492258
Epoch: 70, step: 335, loss: 0.3378898501396179, mean loss: 0.3393245812020971
Epoch: 70, step: 336, loss: 0.32339805364608765, mean loss: 0.3393244241620786
Epoch: 70, step: 337, loss: 0.37956714630126953, mean loss: 0.33932482096266764
Epoch: 70, step: 338, loss: 0.31243640184402466, mean loss: 0.33932455584055915
Epoch: 70, step: 339, loss: 0.31589698791503906, mean loss: 0.3393243248450166
Epoch: 70, step: 340, loss: 0.35740017890930176, mean loss: 0.3393245030709665
Epoch: 70, step: 341, loss: 0.3222944736480713, mean loss: 0.3393243351583891
Epoch: 70, step: 342, loss: 0.327693909406662, mean loss: 0.3393242204859208
Epoch: 70, step: 343, loss: 0.3482319712638855, mean loss: 0.3393243083127742
Epoch: 70, step: 344, loss: 0.36548885703086853, mean loss: 0.3393245662821971
Epoch: 70, step: 345, loss: 0.34676653146743774, mean loss: 0.339324639655545
Epoch: 70, step: 346, loss: 0.31442445516586304, mean loss: 0.33932439415696486
Epoch: 70, step: 347, loss: 0.4004264175891876, mean loss: 0.3393249965746743
Epoch: 70, step: 348, loss: 0.34110546112060547, mean loss: 0.33932501412847593
Epoch: 70, step: 349, loss: 0.3606034219264984, mean loss: 0.33932522391264036
Epoch: 70, step: 350, loss: 0.336971640586853, mean loss: 0.3393252007088533
Epoch: 70, step: 351, loss: 0.30857205390930176, mean loss: 0.3393248975190631
Epoch: 70, step: 352, loss: 0.3475937843322754, mean loss: 0.3393249790397399
Epoch: 70, step: 353, loss: 0.30837079882621765, mean loss: 0.33932467387401427
Epoch: 70, step: 354, loss: 0.34639406204223633, mean loss: 0.33932474356779024
Epoch: 70, step: 355, loss: 0.3044392168521881, mean loss: 0.3393243996511658
Epoch: 70, step: 356, loss: 0.3378954529762268, mean loss: 0.33932438556412975
Epoch: 70, step: 357, loss: 0.31934696435928345, mean loss: 0.3393241886219463
Epoch: 70, step: 358, loss: 0.3238121271133423, mean loss: 0.3393240357018514
Epoch: 70, step: 359, loss: 0.37865033745765686, mean loss: 0.3393244233822709
Epoch: 70, step: 360, loss: 0.31315046548843384, mean loss: 0.33932416536078164
Epoch: 70, step: 361, loss: 0.3373391330242157, mean loss: 0.339324145792631
Epoch: 70, step: 362, loss: 0.3116973042488098, mean loss: 0.3393238734540611
Epoch: 70, step: 363, loss: 0.3422415554523468, mean loss: 0.33932390221556497
Epoch: 70, step: 364, loss: 0.3553772270679474, mean loss: 0.33932406046215036
Epoch: 70, step: 365, loss: 0.36903300881385803, mean loss: 0.33932435331695343
Epoch: 70, step: 366, loss: 0.30066630244255066, mean loss: 0.3393239722504766
Epoch: 70, step: 367, loss: 0.3091703951358795, mean loss: 0.3393236750186227
Epoch: 70, step: 368, loss: 0.3158664107322693, mean loss: 0.33932344379639
Epoch: 70, step: 369, loss: 0.2913482189178467, mean loss: 0.3393229709011226
Epoch: 70, step: 370, loss: 0.36676299571990967, mean loss: 0.33932324137676917
Epoch: 70, step: 371, loss: 0.3268420398235321, mean loss: 0.33932311835108653
Epoch: 70, step: 372, loss: 0.30970391631126404, mean loss: 0.33932282640109945
Epoch: 70, step: 373, loss: 0.33554139733314514, mean loss: 0.33932278912874875
Epoch: 70, step: 374, loss: 0.32170674204826355, mean loss: 0.33932261549465403
Epoch: 70, step: 375, loss: 0.28993546962738037, mean loss: 0.3393221287107687
Epoch: 70, step: 376, loss: 0.345093697309494, mean loss: 0.3393221855976134
Epoch: 70, step: 377, loss: 0.3133942484855652, mean loss: 0.3393219300442109
Epoch: 70, step: 378, loss: 0.3229857385158539, mean loss: 0.3393217690314715
Epoch: 70, step: 379, loss: 0.3829934597015381, mean loss: 0.33932219946406234
Epoch: 70, step: 380, loss: 0.3226962387561798, mean loss: 0.3393220355985307
Epoch: 70, step: 381, loss: 0.3318299651145935, mean loss: 0.33932196175738344
Epoch: 70, step: 382, loss: 0.3144797086715698, mean loss: 0.3393217169168693
Epoch: 70, step: 383, loss: 0.3269067704677582, mean loss: 0.339321594558728
Epoch: 70, step: 384, loss: 0.3228299617767334, mean loss: 0.3393214320235407
Epoch: 70, step: 385, loss: 0.3653751611709595, mean loss: 0.33932168879654
Epoch: 70, step: 386, loss: 0.3259788155555725, mean loss: 0.3393215572969072
Epoch: 70, step: 387, loss: 0.34186461567878723, mean loss: 0.3393215823595711
Epoch: 70, step: 388, loss: 0.3483576774597168, mean loss: 0.339321671412337
Epoch: 70, step: 389, loss: 0.36937782168388367, mean loss: 0.33932196761959305
Epoch: 70, step: 390, loss: 0.33660033345222473, mean loss: 0.3393219407977999
Epoch: 70, step: 391, loss: 0.3242267072200775, mean loss: 0.3393217920352489
Epoch: 70, step: 392, loss: 0.3392571210861206, mean loss: 0.3393217913979272
Epoch: 70, step: 393, loss: 0.29988893866539, mean loss: 0.33932140279737205
Epoch: 70, step: 394, loss: 0.33164674043655396, mean loss: 0.33932132716630664
Epoch: 70, step: 395, loss: 0.34158357977867126, mean loss: 0.3393213494597811
Epoch: 70, step: 396, loss: 0.3219328820705414, mean loss: 0.33932117810600254
Epoch: 70, step: 397, loss: 0.33843111991882324, mean loss: 0.3393211693350553
Epoch: 70, step: 398, loss: 0.312846302986145, mean loss: 0.3393209084449564
Epoch: 70, step: 399, loss: 0.39887094497680664, mean loss: 0.33932149526045235
Epoch: 70, step: 400, loss: 0.3921397626399994, mean loss: 0.33932201573489956
Epoch: 70, step: 401, loss: 0.36508414149284363, mean loss: 0.3393222695939658
Epoch: 70, step: 402, loss: 0.36022108793258667, mean loss: 0.33932247552814526
Epoch: 70, step: 403, loss: 0.35026589035987854, mean loss: 0.3393225833620386
Epoch: 70, step: 404, loss: 0.31075340509414673, mean loss: 0.3393223018506993
Epoch: 70, step: 405, loss: 0.33634066581726074, mean loss: 0.33932227247092245
Epoch: 70, step: 406, loss: 0.34257814288139343, mean loss: 0.3393223045525724
Epoch: 70, step: 407, loss: 0.35759028792381287, mean loss: 0.33932248455398506
Epoch: 70, step: 408, loss: 0.32029616832733154, mean loss: 0.3393222970822765
Epoch: 70, step: 409, loss: 0.310650497674942, mean loss: 0.3393220145736608
Epoch: 70, step: 410, loss: 0.29347044229507446, mean loss: 0.33932156279397313
Epoch: 70, step: 411, loss: 0.3404856324195862, mean loss: 0.3393215742635434
Epoch: 70, step: 412, loss: 0.3342162072658539, mean loss: 0.33932152396089205
Epoch: 70, step: 413, loss: 0.326383113861084, mean loss: 0.33932139648133564
Epoch: 70, step: 414, loss: 0.3073626458644867, mean loss: 0.3393210816012862
Epoch: 70, step: 415, loss: 0.31658992171287537, mean loss: 0.33932085764014597
Epoch: 70, step: 416, loss: 0.3310070037841797, mean loss: 0.3393207757278347
Epoch: 70, step: 417, loss: 0.2949172556400299, mean loss: 0.3393203382461101
Epoch: 70, step: 418, loss: 0.3370172679424286, mean loss: 0.3393203155555387
Epoch: 70, step: 419, loss: 0.31693994998931885, mean loss: 0.33932009505932625
Epoch: 70, step: 420, loss: 0.35164257884025574, mean loss: 0.33932021646191124
Epoch: 70, step: 421, loss: 0.3598850667476654, mean loss: 0.33932041906728144
Epoch: 70, step: 422, loss: 0.3374282419681549, mean loss: 0.3393204004256935
Epoch: 70, step: 423, loss: 0.31036314368247986, mean loss: 0.33932011514376625
Epoch: 70, step: 424, loss: 0.293091356754303, mean loss: 0.3393196597104537
Epoch: 70, step: 425, loss: 0.32532796263694763, mean loss: 0.3393195218693697
Epoch: 70, step: 426, loss: 0.349872887134552, mean loss: 0.3393196258362416
Epoch: 70, step: 427, loss: 0.3661124110221863, mean loss: 0.3393198897837648
Epoch: 70, step: 428, loss: 0.3074164390563965, mean loss: 0.33931957549192143
Epoch: 70, step: 429, loss: 0.3355882465839386, mean loss: 0.33931953873368176
Epoch: 70, step: 430, loss: 0.3317946493625641, mean loss: 0.33931946460487433
Epoch: 70, step: 431, loss: 0.3292885422706604, mean loss: 0.33931936578973587
Epoch: 70, step: 432, loss: 0.31814631819725037, mean loss: 0.3393191572149958
Epoch: 70, step: 433, loss: 0.3213111460208893, mean loss: 0.33931897982063447
Epoch: 70, step: 434, loss: 0.3382696509361267, mean loss: 0.33931896948394646
Epoch: 70, step: 435, loss: 0.31317850947380066, mean loss: 0.3393187119830598
Epoch: 70, step: 436, loss: 0.33660680055618286, mean loss: 0.33931868526919484
Epoch: 70, step: 437, loss: 0.33227309584617615, mean loss: 0.33931861586682854
Epoch: 70, step: 438, loss: 0.3269496560096741, mean loss: 0.3393184940279623
Epoch: 70, step: 439, loss: 0.30617812275886536, mean loss: 0.33931816758616495
Epoch: 70, step: 440, loss: 0.31924617290496826, mean loss: 0.3393179698734289
Epoch: 70, step: 441, loss: 0.2865210771560669, mean loss: 0.3393174498197192
Epoch: 70, step: 442, loss: 0.3105897009372711, mean loss: 0.3393171668518313
Epoch: 70, step: 443, loss: 0.30213552713394165, mean loss: 0.33931680061685515
Epoch: 70, step: 444, loss: 0.3239261209964752, mean loss: 0.3393166490218823
Epoch: 70, step: 445, loss: 0.3066360652446747, mean loss: 0.33931632712814297
Epoch: 70, step: 446, loss: 0.34453442692756653, mean loss: 0.33931637852432134
Epoch: 70, step: 447, loss: 0.3072144091129303, mean loss: 0.339316062335985
Epoch: 70, step: 448, loss: 0.3083805739879608, mean loss: 0.33931575763990457
Epoch: 70, step: 449, loss: 0.35717326402664185, mean loss: 0.3393159335239427
Epoch: 70, step: 450, loss: 0.29952919483184814, mean loss: 0.33931554165605315
Epoch: 70, step: 451, loss: 0.3574756681919098, mean loss: 0.33931572051716624
Epoch: 70, step: 452, loss: 0.31673863530158997, mean loss: 0.3393154981551242
Epoch: 70, step: 453, loss: 0.3142688572406769, mean loss: 0.33931525147282154
Epoch: 70, step: 454, loss: 0.34970229864120483, mean loss: 0.3393153537729857
Epoch: 70, step: 455, loss: 0.33293989300727844, mean loss: 0.3393152909828348
Epoch: 70, step: 456, loss: 0.326137512922287, mean loss: 0.33931516119981914
Epoch: 70, step: 457, loss: 0.3590523898601532, mean loss: 0.3393153555825001
Epoch: 70, step: 458, loss: 0.3018783926963806, mean loss: 0.33931498688709355
Epoch: 70, step: 459, loss: 0.34171372652053833, mean loss: 0.3393150105106866
Epoch: 70, step: 460, loss: 0.3379966914653778, mean loss: 0.339314997527566
Epoch: 70, step: 461, loss: 0.32322150468826294, mean loss: 0.3393148390365688
Epoch: 70, step: 462, loss: 0.32779788970947266, mean loss: 0.3393147256171373
Epoch: 70, step: 463, loss: 0.306427001953125, mean loss: 0.3393144017405551
Epoch: 70, step: 464, loss: 0.3328354060649872, mean loss: 0.33931433793637295
Epoch: 70, step: 465, loss: 0.33572468161582947, mean loss: 0.33931430258632156
Epoch: 70, step: 466, loss: 0.3573893904685974, mean loss: 0.33931448058358277
Epoch: 70, step: 467, loss: 0.34172672033309937, mean loss: 0.3393145043382579
Epoch: 70, step: 468, loss: 0.35054004192352295, mean loss: 0.3393146148813217
Epoch: 70, step: 469, loss: 0.2869213819503784, mean loss: 0.33931409894599
Epoch: 70, step: 470, loss: 0.3095945715904236, mean loss: 0.3393138062898138
Epoch: 70, step: 471, loss: 0.34949710965156555, mean loss: 0.3393139065665524
Epoch: 70, step: 472, loss: 0.32336410880088806, mean loss: 0.33931374950769877
Epoch: 70, step: 473, loss: 0.2927279472351074, mean loss: 0.33931329077833045
Epoch: 70, step: 474, loss: 0.3660224378108978, mean loss: 0.3393135537801229
Epoch: 70, step: 475, loss: 0.312034010887146, mean loss: 0.3393132851643553
Epoch: 70, step: 476, loss: 0.3691045343875885, mean loss: 0.3393135785094642
Epoch: 70, step: 477, loss: 0.3725138008594513, mean loss: 0.33931390541844575
Epoch: 70, step: 478, loss: 0.27905264496803284, mean loss: 0.33931331205635623
Epoch: 70, step: 479, loss: 0.30876424908638, mean loss: 0.3393130112581781
Epoch: 70, step: 480, loss: 0.36456605792045593, mean loss: 0.339313259907233
Epoch: 70, step: 481, loss: 0.3141342103481293, mean loss: 0.3393130119892168
Epoch: 70, step: 482, loss: 0.3742513060569763, mean loss: 0.33931335599534174
Epoch: 70, step: 483, loss: 0.3384958505630493, mean loss: 0.33931334794617635
Epoch: 70, step: 484, loss: 0.3368079960346222, mean loss: 0.33931332327870317
Epoch: 70, step: 485, loss: 0.34070494771003723, mean loss: 0.33931333698037924
Epoch: 70, step: 486, loss: 0.4134332835674286, mean loss: 0.33931406674444226
Epoch: 70, step: 487, loss: 0.32769542932510376, mean loss: 0.33931395235174555
Epoch: 70, step: 488, loss: 0.3243561387062073, mean loss: 0.3393138050842363
Epoch: 70, step: 489, loss: 0.35126736760139465, mean loss: 0.33931392277216105
Epoch: 70, step: 490, loss: 0.31477296352386475, mean loss: 0.339313681158322
Epoch: 70, step: 491, loss: 0.2979154586791992, mean loss: 0.3393132735831785
Epoch: 70, step: 492, loss: 0.3666399419307709, mean loss: 0.33931354261794505
Epoch: 70, step: 493, loss: 0.3297058939933777, mean loss: 0.3393134480302688
Epoch: 70, step: 494, loss: 0.3479384779930115, mean loss: 0.33931353294318994
Epoch: 70, step: 495, loss: 0.31629258394241333, mean loss: 0.33931330630550977
Epoch: 70, step: 496, loss: 0.3359423577785492, mean loss: 0.33931327311936993
Epoch: 70, step: 497, loss: 0.35203638672828674, mean loss: 0.33931339837398816
Epoch: 70, step: 498, loss: 0.3137325942516327, mean loss: 0.3393131465423682
Epoch: 70, step: 499, loss: 0.3610812723636627, mean loss: 0.33931336083775926
Epoch: 70, step: 500, loss: 0.31374678015708923, mean loss: 0.33931310915111823
Epoch: 70, step: 501, loss: 0.3224996328353882, mean loss: 0.33931294363482284
Epoch: 70, step: 502, loss: 0.3157937228679657, mean loss: 0.3393127121076897
Epoch: 70, step: 503, loss: 0.3888339698314667, mean loss: 0.3393131995984139
Epoch: 70, step: 504, loss: 0.3271324336528778, mean loss: 0.33931307969128244
Epoch: 70, step: 505, loss: 0.331513911485672, mean loss: 0.33931300291723676
Epoch: 70, step: 506, loss: 0.36301693320274353, mean loss: 0.33931323625349324
Epoch: 70, step: 507, loss: 0.33069440722465515, mean loss: 0.33931315141247825
Epoch: 70, step: 508, loss: 0.3102148771286011, mean loss: 0.33931286498112956
Epoch: 70, step: 509, loss: 0.33707576990127563, mean loss: 0.3393128429603098
Epoch: 70, step: 510, loss: 0.2894364297389984, mean loss: 0.3393123520072409
Epoch: 70, step: 511, loss: 0.39459365606307983, mean loss: 0.3393128961574108
Epoch: 70, step: 512, loss: 0.3567665219306946, mean loss: 0.33931306795690264
Epoch: 70, step: 513, loss: 0.3323265016078949, mean loss: 0.33931299918742464
Epoch: 70, step: 514, loss: 0.2916885018348694, mean loss: 0.33931253041930265
Epoch: 70, step: 515, loss: 0.3171364367008209, mean loss: 0.3393123121420701
Epoch: 70, step: 516, loss: 0.3342530131340027, mean loss: 0.3393122623443496
Epoch: 70, step: 517, loss: 0.32604068517684937, mean loss: 0.33931213171601865
Epoch: 70, step: 518, loss: 0.30214229226112366, mean loss: 0.33931176586754125
Epoch: 70, step: 519, loss: 0.3193168342113495, mean loss: 0.3393115690670328
Epoch: 70, step: 520, loss: 0.3249199688434601, mean loss: 0.3393114274188185
Epoch: 70, step: 521, loss: 0.33562883734703064, mean loss: 0.3393113911735667
Epoch: 70, step: 522, loss: 0.3193618655204773, mean loss: 0.3393111948257654
Epoch: 70, step: 523, loss: 0.3403153121471405, mean loss: 0.3393112047084208
Epoch: 70, step: 524, loss: 0.3045506775379181, mean loss: 0.3393108625940842
Epoch: 70, step: 525, loss: 0.32831859588623047, mean loss: 0.33931075440887165
Epoch: 70, step: 526, loss: 0.3496473431587219, mean loss: 0.3393108561399409
Epoch: 70, step: 527, loss: 0.31127846240997314, mean loss: 0.3393105802522772
Epoch: 70, step: 528, loss: 0.35353726148605347, mean loss: 0.3393107202662645
Epoch: 70, step: 529, loss: 0.3356502652168274, mean loss: 0.33931068424170935
Epoch: 70, step: 530, loss: 0.32270893454551697, mean loss: 0.3393105208563505
Epoch: 70, step: 531, loss: 0.31679102778434753, mean loss: 0.3393102992339725
Epoch: 70, step: 532, loss: 0.3171517848968506, mean loss: 0.3393100811662613
Epoch: 70, step: 533, loss: 0.3343948721885681, mean loss: 0.33931003279488553
Epoch: 70, step: 534, loss: 0.2967968285083771, mean loss: 0.33930961441960344
Epoch: 70, step: 535, loss: 0.34976616501808167, mean loss: 0.33930971732220344
Epoch: 70, step: 536, loss: 0.30865681171417236, mean loss: 0.33930941567084977
Epoch: 70, step: 537, loss: 0.3145180940628052, mean loss: 0.33930917170500113
Epoch: 70, step: 538, loss: 0.3542650043964386, mean loss: 0.3393093188805558
Epoch: 70, step: 539, loss: 0.348502516746521, mean loss: 0.33930940934697845
Epoch: 70, step: 540, loss: 0.33470281958580017, mean loss: 0.3393093640158977
Epoch: 70, step: 541, loss: 0.34908831119537354, mean loss: 0.3393094602445409
Epoch: 70, step: 542, loss: 0.2975148856639862, mean loss: 0.3393090489737205
Epoch: 70, step: 543, loss: 0.3343835473060608, mean loss: 0.33930900050582247
Epoch: 70, step: 544, loss: 0.3211071491241455, mean loss: 0.33930882139781376
Epoch: 70, step: 545, loss: 0.3106164038181305, mean loss: 0.33930853906437963
Epoch: 70, step: 546, loss: 0.3255918622016907, mean loss: 0.3393084040935858
Epoch: 70, step: 547, loss: 0.3823036849498749, mean loss: 0.3393088271588912
Epoch: 70, step: 548, loss: 0.3308829963207245, mean loss: 0.33930874425114993
Epoch: 70, step: 549, loss: 0.37821438908576965, mean loss: 0.3393091270676887
Epoch: 70, step: 550, loss: 0.36104056239128113, mean loss: 0.3393093408945262
Epoch: 70, step: 551, loss: 0.32134395837783813, mean loss: 0.3393091641255704
Epoch: 70, step: 552, loss: 0.3210412561893463, mean loss: 0.3393089843817083
Epoch: 70, step: 553, loss: 0.35853955149650574, mean loss: 0.33930917359562407
Epoch: 70, step: 554, loss: 0.33801373839378357, mean loss: 0.33930916084966845
Epoch: 70, step: 555, loss: 0.3638911843299866, mean loss: 0.33930940271301885
Epoch: 70, step: 556, loss: 0.3150472939014435, mean loss: 0.33930916399966826
Epoch: 70, step: 557, loss: 0.3606892228126526, mean loss: 0.3393093743546419
Epoch: 70, step: 558, loss: 0.4095537066459656, mean loss: 0.3393100654705747
Epoch: 70, step: 559, loss: 0.3291015625, mean loss: 0.3393099650327257
Epoch: 70, step: 560, loss: 0.28525346517562866, mean loss: 0.33930943319518125
Epoch: 70, step: 561, loss: 0.3251291811466217, mean loss: 0.3393092936834435
Epoch: 70, step: 562, loss: 0.35244715213775635, mean loss: 0.3393094229383696
Epoch: 70, step: 563, loss: 0.3557325005531311, mean loss: 0.3393095845128611
Epoch: 70, step: 564, loss: 0.3152502477169037, mean loss: 0.3393093478132025
Epoch: 70, step: 565, loss: 0.379848837852478, mean loss: 0.3393097466433585
Epoch: 70, step: 566, loss: 0.3424992263317108, mean loss: 0.3393097780213597
Epoch: 70, step: 567, loss: 0.37258023023605347, mean loss: 0.3393101053318057
Epoch: 70, step: 568, loss: 0.33802035450935364, mean loss: 0.3393100926435272
Epoch: 70, step: 569, loss: 0.30047255754470825, mean loss: 0.3393097105723506
Epoch: 70, step: 570, loss: 0.37284690141677856, mean loss: 0.33931004049719976
Epoch: 70, step: 571, loss: 0.3448432683944702, mean loss: 0.33931009493024483
Epoch: 70, step: 572, loss: 0.3404059410095215, mean loss: 0.3393101057105079
Epoch: 70, step: 573, loss: 0.31201204657554626, mean loss: 0.3393098371715509
Epoch: 70, step: 574, loss: 0.31677472591400146, mean loss: 0.3393096154892799
Epoch: 70, step: 575, loss: 0.38549697399139404, mean loss: 0.33931006983883627
Epoch: 70, step: 576, loss: 0.32711702585220337, mean loss: 0.33930994989585167
Epoch: 70, step: 577, loss: 0.3061801493167877, mean loss: 0.33930962400117953
Epoch: 70, step: 578, loss: 0.3199697732925415, mean loss: 0.33930943375879363
Epoch: 70, step: 579, loss: 0.31134214997291565, mean loss: 0.33930915865271666
Epoch: 70, step: 580, loss: 0.2975788116455078, mean loss: 0.3393087481674076
Epoch: 70, step: 581, loss: 0.3227866590023041, mean loss: 0.3393085856475952
Epoch: 70, step: 582, loss: 0.3019406497478485, mean loss: 0.3393082180808708
Epoch: 70, step: 583, loss: 0.3898121118545532, mean loss: 0.3393087148535118
Epoch: 70, step: 584, loss: 0.3683725893497467, mean loss: 0.3393090007323737
Epoch: 70, step: 585, loss: 0.3111291527748108, mean loss: 0.33930872355172376
Epoch: 70, step: 586, loss: 0.3683667778968811, mean loss: 0.33930900936771463
Epoch: 70, step: 587, loss: 0.30201825499534607, mean loss: 0.3393086425782197
Epoch: 70, step: 588, loss: 0.3293662369251251, mean loss: 0.3393085447863101
Epoch: 70, step: 589, loss: 0.3555575907230377, mean loss: 0.3393087046077514
Epoch: 70, step: 590, loss: 0.34211182594299316, mean loss: 0.3393087321782616
Epoch: 70, step: 591, loss: 0.36711087822914124, mean loss: 0.3393090056276483
Epoch: 70, step: 592, loss: 0.3354642391204834, mean loss: 0.33930896781262854
Epoch: 70, step: 593, loss: 0.300050288438797, mean loss: 0.33930858168953537
Epoch: 70, step: 594, loss: 0.30603110790252686, mean loss: 0.33930825439694834
Epoch: 70, step: 595, loss: 0.30916768312454224, mean loss: 0.3393079579595268
Epoch: 70, step: 596, loss: 0.31475991010665894, mean loss: 0.33930771652785735
Epoch: 70, step: 597, loss: 0.3287636637687683, mean loss: 0.33930761282742306
Epoch: 70, step: 598, loss: 0.2845364809036255, mean loss: 0.3393070741603244
Epoch: 70, step: 599, loss: 0.32446253299713135, mean loss: 0.3393069281675907
Epoch: 70, step: 600, loss: 0.3125168979167938, mean loss: 0.3393066646962416
Epoch: 70, step: 601, loss: 0.32761242985725403, mean loss: 0.33930654968832635
Epoch: 70, step: 602, loss: 0.3278751075267792, mean loss: 0.3393064372659729
Epoch: 70, step: 603, loss: 0.3362668454647064, mean loss: 0.3393064073734451
Epoch: 70, step: 604, loss: 0.32511961460113525, mean loss: 0.3393062678563799
Epoch: 70, step: 605, loss: 0.3143913447856903, mean loss: 0.3393060228381565
Epoch: 70, step: 606, loss: 0.343810498714447, mean loss: 0.33930606713561706
Epoch: 70, step: 607, loss: 0.2930064797401428, mean loss: 0.33930561182537994
Epoch: 70, step: 608, loss: 0.36117151379585266, mean loss: 0.3393058268525901
Epoch: 70, step: 609, loss: 0.3645651936531067, mean loss: 0.3393060752483694
Epoch: 70, step: 610, loss: 0.31751930713653564, mean loss: 0.3393058610035679
Epoch: 70, step: 611, loss: 0.3313010036945343, mean loss: 0.3393057822868812
Epoch: 70, step: 612, loss: 0.31841278076171875, mean loss: 0.3393055768351635
Epoch: 70, step: 613, loss: 0.40873944759368896, mean loss: 0.3393062596077042
Epoch: 70, step: 614, loss: 0.3311973214149475, mean loss: 0.33930617986987843
Epoch: 70, step: 615, loss: 0.33000579476356506, mean loss: 0.33930608841706705
Epoch: 70, step: 616, loss: 0.3803431987762451, mean loss: 0.33930649194038004
Epoch: 70, step: 617, loss: 0.37261179089546204, mean loss: 0.3393068194325525
Epoch: 70, step: 618, loss: 0.35916969180107117, mean loss: 0.33930701474295244
Epoch: 70, step: 619, loss: 0.29578059911727905, mean loss: 0.3393065867545982
Epoch: 70, step: 620, loss: 0.3227665424346924, mean loss: 0.33930642412055995
Epoch: 70, step: 621, loss: 0.31515631079673767, mean loss: 0.3393061866609886
Epoch: 70, step: 622, loss: 0.31541213393211365, mean loss: 0.33930595172148115
Epoch: 70, step: 623, loss: 0.3399317264556885, mean loss: 0.33930595787438306
Epoch: 70, step: 624, loss: 0.3623599112033844, mean loss: 0.3393061845491122
Epoch: 70, step: 625, loss: 0.31445541977882385, mean loss: 0.33930594020989163
Epoch: 70, step: 626, loss: 0.2986730933189392, mean loss: 0.33930554070103885
Epoch: 70, step: 627, loss: 0.34803691506385803, mean loss: 0.3393056265485077
Epoch: 70, step: 628, loss: 0.3222053349018097, mean loss: 0.3393054584189258
Epoch: 70, step: 629, loss: 0.29580000042915344, mean loss: 0.3393050306787037
Epoch: 70, step: 630, loss: 0.3093000650405884, mean loss: 0.33930473567653446
Epoch: 70, step: 631, loss: 0.3836026191711426, mean loss: 0.339305171199221
Epoch: 70, step: 632, loss: 0.3839395344257355, mean loss: 0.3393056100257547
Epoch: 70, step: 633, loss: 0.3128892481327057, mean loss: 0.3393053503136021
Epoch: 70, step: 634, loss: 0.3286730647087097, mean loss: 0.33930524578343835
Epoch: 70, step: 635, loss: 0.33305129408836365, mean loss: 0.3393051842989945
Epoch: 70, step: 636, loss: 0.3487420976161957, mean loss: 0.3393052770751609
Epoch: 70, step: 637, loss: 0.35734280943870544, mean loss: 0.33930545440397547
Epoch: 70, step: 638, loss: 0.3056233823299408, mean loss: 0.3393051232753557
Epoch: 70, step: 639, loss: 0.33209171891212463, mean loss: 0.33930505236103836
Epoch: 70, step: 640, loss: 0.33598917722702026, mean loss: 0.3393050197632942
Epoch: 70, step: 641, loss: 0.31841278076171875, mean loss: 0.33930481437764504
Epoch: 70, step: 642, loss: 0.3713180422782898, mean loss: 0.3393051290874737
Epoch: 70, step: 643, loss: 0.29832807183265686, mean loss: 0.3393047262616189
Epoch: 70, step: 644, loss: 0.33415961265563965, mean loss: 0.33930467568296463
Epoch: 70, step: 645, loss: 0.3460933268070221, mean loss: 0.3393047424176355
Epoch: 70, step: 646, loss: 0.27453842759132385, mean loss: 0.33930410574974174
Epoch: 70, step: 647, loss: 0.33220627903938293, mean loss: 0.3393040359771451
Epoch: 70, step: 648, loss: 0.3588409423828125, mean loss: 0.3393042280256898
Epoch: 70, step: 649, loss: 0.3129512071609497, mean loss: 0.3393039689770231
Epoch: 70, step: 650, loss: 0.37244483828544617, mean loss: 0.33930429474664403
Epoch: 70, step: 651, loss: 0.426203191280365, mean loss: 0.33930514894096375
Epoch: 70, step: 652, loss: 0.34251588582992554, mean loss: 0.33930518050139047
Epoch: 70, step: 653, loss: 0.3117293417453766, mean loss: 0.3393049094431527
Epoch: 70, step: 654, loss: 0.3027428984642029, mean loss: 0.33930455005836896
Epoch: 70, step: 655, loss: 0.3362624943256378, mean loss: 0.3393045201569011
Epoch: 70, step: 656, loss: 0.3701295554637909, mean loss: 0.339304823144362
Epoch: 70, step: 657, loss: 0.3187010884284973, mean loss: 0.3393046206267706
Epoch: 70, step: 658, loss: 0.3164680302143097, mean loss: 0.33930439616426933
Epoch: 70, step: 659, loss: 0.3362836539745331, mean loss: 0.3393043664734674
Epoch: 70, step: 660, loss: 0.36418649554252625, mean loss: 0.33930461103690857
Epoch: 70, step: 661, loss: 0.34848669171333313, mean loss: 0.33930470128558343
Epoch: 70, step: 662, loss: 0.35908782482147217, mean loss: 0.33930489572769285
Epoch: 70, step: 663, loss: 0.3196541666984558, mean loss: 0.3393047025887458
Epoch: 70, step: 664, loss: 0.34332042932510376, mean loss: 0.3393047420572871
Epoch: 70, step: 665, loss: 0.34860682487487793, mean loss: 0.33930483348184254
Epoch: 70, step: 666, loss: 0.3175390362739563, mean loss: 0.33930461956106645
Epoch: 70, step: 667, loss: 0.3527158796787262, mean loss: 0.33930475136965355
Epoch: 70, step: 668, loss: 0.35709595680236816, mean loss: 0.3393049262235139
Epoch: 70, step: 669, loss: 0.31178998947143555, mean loss: 0.3393046558064451
Epoch: 70, step: 670, loss: 0.33389219641685486, mean loss: 0.3393046026132638
Epoch: 70, step: 671, loss: 0.3190915882587433, mean loss: 0.33930440396346473
Epoch: 70, step: 672, loss: 0.38248470425605774, mean loss: 0.3393048283273684
Epoch: 70, step: 673, loss: 0.322976678609848, mean loss: 0.3393046678604608
Epoch: 70, step: 674, loss: 0.3255431652069092, mean loss: 0.3393045326189233
Epoch: 70, step: 675, loss: 0.29891112446784973, mean loss: 0.33930413565551915
Epoch: 70, step: 676, loss: 0.34126344323158264, mean loss: 0.3393041549102886
Epoch: 70, step: 677, loss: 0.314896821975708, mean loss: 0.33930391505363916
Epoch: 70, step: 678, loss: 0.3452945947647095, mean loss: 0.339303973924891
Epoch: 70, step: 679, loss: 0.3794472813606262, mean loss: 0.33930436841494044
Epoch: 70, step: 680, loss: 0.3144609034061432, mean loss: 0.3393041242795152
Epoch: 70, step: 681, loss: 0.3685820400714874, mean loss: 0.33930441198922795
Epoch: 70, step: 682, loss: 0.32075178623199463, mean loss: 0.33930422967713264
Epoch: 70, step: 683, loss: 0.339358925819397, mean loss: 0.3393042302146129
Epoch: 70, step: 684, loss: 0.3720993101596832, mean loss: 0.3393045524774729
Epoch: 70, step: 685, loss: 0.3511260449886322, mean loss: 0.339304668640951
Epoch: 70, step: 686, loss: 0.35407328605651855, mean loss: 0.3393048137628217
Epoch: 70, step: 687, loss: 0.39953991770744324, mean loss: 0.33930540564930806
Epoch: 70, step: 688, loss: 0.3265666663646698, mean loss: 0.339305280476227
Epoch: 70, step: 689, loss: 0.2966327667236328, mean loss: 0.3393048611727608
Epoch: 70, step: 690, loss: 0.33183467388153076, mean loss: 0.339304787770836
Epoch: 70, step: 691, loss: 0.3076772689819336, mean loss: 0.3393044770024637
Epoch: 70, step: 692, loss: 0.3019612431526184, mean loss: 0.3393041100757361
Epoch: 70, step: 693, loss: 0.3472602665424347, mean loss: 0.33930418825048075
Epoch: 70, step: 694, loss: 0.3423902690410614, mean loss: 0.3393042185730628
Epoch: 70, step: 695, loss: 0.2960701882839203, mean loss: 0.3393037937771356
Epoch: 70, step: 696, loss: 0.3328112065792084, mean loss: 0.3393037299848525
Epoch: 70, step: 697, loss: 0.3359578549861908, mean loss: 0.3393036971106066
Epoch: 70, step: 698, loss: 0.3640654385089874, mean loss: 0.33930394039990397
Epoch: 70, step: 699, loss: 0.3279592990875244, mean loss: 0.33930382893752126
Epoch: 70, step: 700, loss: 0.3087198734283447, mean loss: 0.33930352844965506
Epoch: 70, step: 701, loss: 0.3253711462020874, mean loss: 0.3393033915651151
Epoch: 70, step: 702, loss: 0.31461018323898315, mean loss: 0.3393031489587041
Epoch: 70, step: 703, loss: 0.33830127120018005, mean loss: 0.3393031391155288
Epoch: 70, step: 704, loss: 0.3645590841770172, mean loss: 0.3393033872458531
Epoch: 70, step: 705, loss: 0.33504340052604675, mean loss: 0.3393033453934695
Epoch: 70, step: 706, loss: 0.3343184292316437, mean loss: 0.3393032964194732
Epoch: 70, step: 707, loss: 0.3589504361152649, mean loss: 0.3393034894396691
Epoch: 70, step: 708, loss: 0.3676813244819641, mean loss: 0.3393037682304524
Epoch: 70, step: 709, loss: 0.34624093770980835, mean loss: 0.33930383638223033
Epoch: 70, step: 710, loss: 0.3323120176792145, mean loss: 0.33930376769424514
Epoch: 70, step: 711, loss: 0.33669525384902954, mean loss: 0.3393037420683232
Epoch: 70, step: 712, loss: 0.3224623501300812, mean loss: 0.3393035766208765
Epoch: 70, step: 713, loss: 0.3199211359024048, mean loss: 0.3393033862123974
Epoch: 70, step: 714, loss: 0.3143835961818695, mean loss: 0.3393031414087231
Epoch: 70, step: 715, loss: 0.348747193813324, mean loss: 0.3393032341830207
Epoch: 70, step: 716, loss: 0.3557009994983673, mean loss: 0.3393033952660125
Epoch: 70, step: 717, loss: 0.32381460070610046, mean loss: 0.3393032431137643
Epoch: 70, step: 718, loss: 0.30323565006256104, mean loss: 0.33930288881172743
Epoch: 70, step: 719, loss: 0.31469210982322693, mean loss: 0.33930264705554875
Epoch: 70, step: 720, loss: 0.35397985577583313, mean loss: 0.3393027912310354
Epoch: 70, step: 721, loss: 0.32656973600387573, mean loss: 0.3393026661543647
Epoch: 70, step: 722, loss: 0.37506964802742004, mean loss: 0.339303017489609
Epoch: 70, step: 723, loss: 0.34312352538108826, mean loss: 0.3393030550176815
Epoch: 70, step: 724, loss: 0.3933207392692566, mean loss: 0.33930358561720264
Epoch: 70, step: 725, loss: 0.34068742394447327, mean loss: 0.33930359921009823
Epoch: 70, step: 726, loss: 0.3515072464942932, mean loss: 0.33930371908051266
Epoch: 70, step: 727, loss: 0.32742512226104736, mean loss: 0.3393036024040548
Epoch: 70, step: 728, loss: 0.3212180733680725, mean loss: 0.33930342476230374
Epoch: 70, step: 729, loss: 0.3405645787715912, mean loss: 0.3393034371496332
Epoch: 70, step: 730, loss: 0.34841984510421753, mean loss: 0.3393035266920987
Epoch: 70, step: 731, loss: 0.3596433103084564, mean loss: 0.33930372646996
Epoch: 70, step: 732, loss: 0.33600693941116333, mean loss: 0.3393036940891534
Epoch: 70, step: 733, loss: 0.33934083580970764, mean loss: 0.33930369445395314
Epoch: 70, step: 734, loss: 0.33415889739990234, mean loss: 0.3393036439231173
Epoch: 70, step: 735, loss: 0.3343575596809387, mean loss: 0.33930359534446325
Epoch: 70, step: 736, loss: 0.3084087073802948, mean loss: 0.3393032919090059
Epoch: 70, step: 737, loss: 0.36187782883644104, mean loss: 0.3393035136236038
Epoch: 70, step: 738, loss: 0.39715439081192017, mean loss: 0.3393040817972962
Epoch: 70, step: 739, loss: 0.359345018863678, mean loss: 0.3393042786244133
Epoch: 70, step: 740, loss: 0.30724218487739563, mean loss: 0.33930396373756533
Epoch: 70, step: 741, loss: 0.38162580132484436, mean loss: 0.3393043793828835
Epoch: 70, step: 742, loss: 0.2882014214992523, mean loss: 0.33930387750258256
Epoch: 70, step: 743, loss: 0.38072821497917175, mean loss: 0.3393042843255072
Epoch: 70, step: 744, loss: 0.3099389672279358, mean loss: 0.3393039959354547
Epoch: 70, step: 745, loss: 0.31034374237060547, mean loss: 0.33930371152623146
Epoch: 70, step: 746, loss: 0.33573511242866516, mean loss: 0.3393036764805255
Epoch: 70, step: 747, loss: 0.31835028529167175, mean loss: 0.33930347070813294
Epoch: 70, step: 748, loss: 0.32168543338775635, mean loss: 0.3393032976922208
Epoch: 70, step: 749, loss: 0.3121959865093231, mean loss: 0.33930303149059865
Epoch: 70, step: 750, loss: 0.3684675991535187, mean loss: 0.33930331789226087
Epoch: 70, step: 751, loss: 0.3266766369342804, mean loss: 0.33930319389704366
Epoch: 70, step: 752, loss: 0.34294191002845764, mean loss: 0.3393032296292339
Epoch: 70, step: 753, loss: 0.3312424421310425, mean loss: 0.33930315047308274
Epoch: 70, step: 754, loss: 0.3900527358055115, mean loss: 0.33930364882419317
Epoch: 70, step: 755, loss: 0.36175408959388733, mean loss: 0.33930386928101364
Epoch: 70, step: 756, loss: 0.33365586400032043, mean loss: 0.33930381381978364
Epoch: 70, step: 757, loss: 0.324261337518692, mean loss: 0.3393036661099278
Epoch: 70, step: 758, loss: 0.3349621593952179, mean loss: 0.33930362347884624
Epoch: 70, step: 759, loss: 0.319490522146225, mean loss: 0.33930342892757626
Epoch: 70, step: 760, loss: 0.3476408123970032, mean loss: 0.3393035107942456
Epoch: 70, step: 761, loss: 0.33962804079055786, mean loss: 0.33930351398084835
Epoch: 70, step: 762, loss: 0.3112437427043915, mean loss: 0.339303238460967
Epoch: 70, step: 763, loss: 0.34731924533843994, mean loss: 0.3393033171696477
Epoch: 70, step: 764, loss: 0.3534160256385803, mean loss: 0.3393034557401074
Epoch: 70, step: 765, loss: 0.3143776059150696, mean loss: 0.3393032109995204
Epoch: 70, step: 766, loss: 0.3377353250980377, mean loss: 0.33930319560499816
Epoch: 70, step: 767, loss: 0.3269749879837036, mean loss: 0.33930307455983655
Epoch: 70, step: 768, loss: 0.3693915009498596, mean loss: 0.33930336998174926
Epoch: 70, step: 769, loss: 0.3630512058734894, mean loss: 0.3393036031465592
Epoch: 70, step: 770, loss: 0.30468401312828064, mean loss: 0.3393032632422871
Epoch: 70, step: 771, loss: 0.34605494141578674, mean loss: 0.3393033295313946
Epoch: 70, step: 772, loss: 0.3673461973667145, mean loss: 0.339303604858266
Epoch: 70, step: 773, loss: 0.3584721088409424, mean loss: 0.33930379305415403
Epoch: 70, step: 774, loss: 0.34506872296333313, mean loss: 0.3393038496535346
Epoch: 70, step: 775, loss: 0.292184978723526, mean loss: 0.3393033870507333
Epoch: 70, step: 776, loss: 0.35109078884124756, mean loss: 0.3393035027757379
Epoch: 70, step: 777, loss: 0.3176749646663666, mean loss: 0.3393032904356359
Epoch: 70, step: 778, loss: 0.32533109188079834, mean loss: 0.33930315326367705
Epoch: 70, step: 779, loss: 0.3086480498313904, mean loss: 0.33930285231037416
Epoch: 70, step: 780, loss: 0.32136642932891846, mean loss: 0.339302676223128
Epoch: 70, step: 781, loss: 0.33588650822639465, mean loss: 0.339302642685911
Epoch: 70, step: 782, loss: 0.3059491813182831, mean loss: 0.3393023152514022
Epoch: 70, step: 783, loss: 0.3541639447212219, mean loss: 0.33930246114818097
Epoch: 70, step: 784, loss: 0.3231317400932312, mean loss: 0.33930230240159426
Epoch: 70, step: 785, loss: 0.29829299449920654, mean loss: 0.33930189982067516
Epoch: 70, step: 786, loss: 0.3486882150173187, mean loss: 0.33930199196352023
Epoch: 70, step: 787, loss: 0.3450373709201813, mean loss: 0.3393020482655872
Epoch: 70, step: 788, loss: 0.32485780119895935, mean loss: 0.33930190647321595
Epoch: 70, step: 789, loss: 0.3402121365070343, mean loss: 0.33930191540842786
Epoch: 70, step: 790, loss: 0.33584555983543396, mean loss: 0.339301881479679
Epoch: 70, step: 791, loss: 0.32333430647850037, mean loss: 0.33930172473813075
Epoch: 70, step: 792, loss: 0.3456685543060303, mean loss: 0.33930178723584425
Epoch: 70, step: 793, loss: 0.31088685989379883, mean loss: 0.3393015083135742
Epoch: 70, step: 794, loss: 0.3201250731945038, mean loss: 0.33930132007862823
Epoch: 70, step: 795, loss: 0.3531835377216339, mean loss: 0.3393014563444577
Epoch: 70, step: 796, loss: 0.3104516863822937, mean loss: 0.3393011731620911
Epoch: 70, step: 797, loss: 0.3111262917518616, mean loss: 0.3393008966069819
Epoch: 70, step: 798, loss: 0.35888686776161194, mean loss: 0.33930108885436516
Epoch: 70, step: 799, loss: 0.34390318393707275, mean loss: 0.3393011340260876
Epoch: 70, step: 800, loss: 0.29430538415908813, mean loss: 0.33930069237602656
Epoch: 70, step: 801, loss: 0.3774935007095337, mean loss: 0.3393010672490005
Epoch: 70, step: 802, loss: 0.3254092037677765, mean loss: 0.3393009308978577
Epoch: 70, step: 803, loss: 0.37723466753959656, mean loss: 0.33930130322066243
Epoch: 70, step: 804, loss: 0.3695109188556671, mean loss: 0.33930159972766183
Epoch: 70, step: 805, loss: 0.3045511841773987, mean loss: 0.3393012586561157
Epoch: 70, step: 806, loss: 0.3089475631713867, mean loss: 0.33930096074082244
Epoch: 70, step: 807, loss: 0.31422555446624756, mean loss: 0.3393007146332703
Epoch: 70, step: 808, loss: 0.3526157736778259, mean loss: 0.3393008453152776
Epoch: 70, step: 809, loss: 0.36226969957351685, mean loss: 0.33930107074323185
Epoch: 70, step: 810, loss: 0.3044905662536621, mean loss: 0.3393007290986853
Epoch: 70, step: 811, loss: 0.33373144268989563, mean loss: 0.3393006744399642
Epoch: 70, step: 812, loss: 0.3690553903579712, mean loss: 0.33930096645919927
Epoch: 70, step: 813, loss: 0.3264290392398834, mean loss: 0.33930084013255374
Epoch: 70, step: 814, loss: 0.349844366312027, mean loss: 0.33930094360697527
Epoch: 70, step: 815, loss: 0.3628644645214081, mean loss: 0.3393011748576712
Epoch: 70, step: 816, loss: 0.35022062063217163, mean loss: 0.33930128201927334
Epoch: 70, step: 817, loss: 0.33114564418792725, mean loss: 0.3393012019820024
Epoch: 70, step: 818, loss: 0.2997804582118988, mean loss: 0.3393008141396902
Epoch: 70, step: 819, loss: 0.2922234833240509, mean loss: 0.33930035214429455
Epoch: 70, step: 820, loss: 0.36158302426338196, mean loss: 0.3393005708141027
Epoch: 70, step: 821, loss: 0.3221454918384552, mean loss: 0.339300402465307
Epoch: 70, step: 822, loss: 0.308938205242157, mean loss: 0.33930010451336035
Epoch: 70, step: 823, loss: 0.3264358341693878, mean loss: 0.33929997827424957
Epoch: 70, step: 824, loss: 0.34352967143058777, mean loss: 0.3393000197804873
Epoch: 70, step: 825, loss: 0.34335246682167053, mean loss: 0.3393000595470078
Epoch: 70, step: 826, loss: 0.3482706546783447, mean loss: 0.33930014757427907
Epoch: 70, step: 827, loss: 0.34272611141204834, mean loss: 0.3393001811924821
Epoch: 70, step: 828, loss: 0.3378591537475586, mean loss: 0.33930016705214666
Epoch: 70, step: 829, loss: 0.3329874575138092, mean loss: 0.33930010510818104
Epoch: 70, step: 830, loss: 0.3224693238735199, mean loss: 0.3392999399564189
Epoch: 70, step: 831, loss: 0.359831303358078, mean loss: 0.33930014141810544
Epoch: 70, step: 832, loss: 0.3596588373184204, mean loss: 0.33930034118355146
Epoch: 70, step: 833, loss: 0.3314790427684784, mean loss: 0.33930026443944944
Epoch: 70, step: 834, loss: 0.31289854645729065, mean loss: 0.3393000053831969
Epoch: 70, step: 835, loss: 0.35309740900993347, mean loss: 0.3393001407633494
Epoch: 70, step: 836, loss: 0.29768455028533936, mean loss: 0.3392997324350972
Epoch: 70, step: 837, loss: 0.33313465118408203, mean loss: 0.33929967194449445
Epoch: 70, step: 838, loss: 0.31518593430519104, mean loss: 0.33929943534741597
Epoch: 70, step: 839, loss: 0.31977421045303345, mean loss: 0.3392992437733884
Epoch: 70, step: 840, loss: 0.316898912191391, mean loss: 0.3392990239920717
Epoch: 70, step: 841, loss: 0.3697933256626129, mean loss: 0.3392993231846078
Epoch: 70, step: 842, loss: 0.3323611617088318, mean loss: 0.33929925511202874
Epoch: 70, step: 843, loss: 0.34760740399360657, mean loss: 0.33929933662520406
Epoch: 70, step: 844, loss: 0.342783123254776, mean loss: 0.33929937080510725
Epoch: 70, step: 845, loss: 0.31928667426109314, mean loss: 0.3392991744597533
Epoch: 70, step: 846, loss: 0.35306504368782043, mean loss: 0.3392993095159134
Epoch: 70, step: 847, loss: 0.332097589969635, mean loss: 0.3392992388609457
Epoch: 70, step: 848, loss: 0.3058721721172333, mean loss: 0.3392989109163299
Epoch: 70, step: 849, loss: 0.3411366641521454, mean loss: 0.3392989289458917
Epoch: 70, step: 850, loss: 0.35193759202957153, mean loss: 0.3392990529382305
Epoch: 70, step: 851, loss: 0.3404369652271271, mean loss: 0.3392990641016756
Epoch: 70, step: 852, loss: 0.34412118792533875, mean loss: 0.3392991114084734
Epoch: 70, step: 853, loss: 0.33415091037750244, mean loss: 0.3392990609032344
Epoch: 70, step: 854, loss: 0.3541595935821533, mean loss: 0.3392992066876331
Epoch: 70, step: 855, loss: 0.33887502551078796, mean loss: 0.3392992025263831
Epoch: 70, step: 856, loss: 0.3456993103027344, mean loss: 0.3392992653113167
Epoch: 70, step: 857, loss: 0.34207257628440857, mean loss: 0.3392992925171769
Epoch: 70, step: 858, loss: 0.37365442514419556, mean loss: 0.33929962953375176
Epoch: 70, step: 859, loss: 0.29080766439437866, mean loss: 0.33929915384251047
Epoch: 70, step: 860, loss: 0.3367486894130707, mean loss: 0.33929912882348545
Epoch: 70, step: 861, loss: 0.35123157501220703, mean loss: 0.3392992458748106
Epoch: 70, step: 862, loss: 0.36038491129875183, mean loss: 0.3392994527126065
Epoch: 70, step: 863, loss: 0.34746253490448, mean loss: 0.3392995327867863
Epoch: 70, step: 864, loss: 0.3440597355365753, mean loss: 0.3392995794806188
Epoch: 70, step: 865, loss: 0.37119489908218384, mean loss: 0.33929989234546487
Epoch: 70, step: 866, loss: 0.33841580152511597, mean loss: 0.33929988367340175
Epoch: 70, step: 867, loss: 0.3207520544528961, mean loss: 0.33929970173918805
Epoch: 70, step: 868, loss: 0.32937851548194885, mean loss: 0.33929960442399854
Epoch: 70, step: 869, loss: 0.3060391843318939, mean loss: 0.33929927818152583
Epoch: 70, step: 870, loss: 0.3714808523654938, mean loss: 0.3392995938387944
Epoch: 70, step: 871, loss: 0.3025633990764618, mean loss: 0.33929923351045593
Epoch: 70, step: 872, loss: 0.315371572971344, mean loss: 0.33929899881740583
Epoch: 70, step: 873, loss: 0.3370364010334015, mean loss: 0.3392989766250663
Epoch: 70, step: 874, loss: 0.3222000300884247, mean loss: 0.33929880891434555
Epoch: 70, step: 875, loss: 0.33764490485191345, mean loss: 0.3392987926926022
Epoch: 70, step: 876, loss: 0.36188995838165283, mean loss: 0.339299014268028
Epoch: 70, step: 877, loss: 0.30239179730415344, mean loss: 0.33929865228351513
Epoch: 70, step: 878, loss: 0.3395576477050781, mean loss: 0.33929865482370697
Epoch: 70, step: 879, loss: 0.3317907154560089, mean loss: 0.3392985811875813
Epoch: 70, step: 880, loss: 0.2909386456012726, mean loss: 0.3392981068892164
Epoch: 70, step: 881, loss: 0.33216896653175354, mean loss: 0.339298036969635
Epoch: 70, step: 882, loss: 0.31202366948127747, mean loss: 0.33929776947684365
Epoch: 70, step: 883, loss: 0.36143961548805237, mean loss: 0.3392979866304078
Epoch: 70, step: 884, loss: 0.38696154952049255, mean loss: 0.33929845408063963
Epoch: 70, step: 885, loss: 0.3749389946460724, mean loss: 0.3392988036142152
Epoch: 70, step: 886, loss: 0.36111459136009216, mean loss: 0.3392990175637062
Epoch: 70, step: 887, loss: 0.3053947389125824, mean loss: 0.33929868506450395
Epoch: 70, step: 888, loss: 0.3130165636539459, mean loss: 0.33929842731831233
Epoch: 70, step: 889, loss: 0.3347628116607666, mean loss: 0.33929838283840985
Epoch: 70, step: 890, loss: 0.3071863651275635, mean loss: 0.33929806792517264
Epoch: 70, step: 891, loss: 0.32699260115623474, mean loss: 0.3392979472502151
Epoch: 70, step: 892, loss: 0.3152408301830292, mean loss: 0.3392977113336777
Epoch: 70, step: 893, loss: 0.3305940330028534, mean loss: 0.3392976259817416
Epoch: 70, step: 894, loss: 0.2929147779941559, mean loss: 0.33929717113645613
Epoch: 70, step: 895, loss: 0.3288606107234955, mean loss: 0.33929706879315563
Epoch: 70, step: 896, loss: 0.3523300290107727, mean loss: 0.3392971965960937
Epoch: 70, step: 897, loss: 0.3303621709346771, mean loss: 0.3392971089789051
Epoch: 70, step: 898, loss: 0.3174484670162201, mean loss: 0.3392968947324233
Epoch: 70, step: 899, loss: 0.3383863568305969, mean loss: 0.33929688580383044
Epoch: 70, step: 900, loss: 0.3188364803791046, mean loss: 0.3392966851742482
Epoch: 70, step: 901, loss: 0.321414977312088, mean loss: 0.33929650983244414
Epoch: 70, step: 902, loss: 0.33547303080558777, mean loss: 0.3392964723411071
Epoch: 70, step: 903, loss: 0.3304600119590759, mean loss: 0.3392963856955511
Epoch: 70, step: 904, loss: 0.3406224846839905, mean loss: 0.33929639869843375
Epoch: 70, step: 905, loss: 0.31124261021614075, mean loss: 0.3392961236235364
Epoch: 70, step: 906, loss: 0.3262799382209778, mean loss: 0.3392959959976095
Epoch: 70, step: 907, loss: 0.3583293855190277, mean loss: 0.3392961826214233
Epoch: 70, step: 908, loss: 0.31262174248695374, mean loss: 0.3392959210790988
Epoch: 70, step: 909, loss: 0.344323992729187, mean loss: 0.3392959703787522
Epoch: 70, step: 910, loss: 0.3331036865711212, mean loss: 0.3392959096647303
Epoch: 70, step: 911, loss: 0.30841758847236633, mean loss: 0.33929560691234584
Epoch: 70, step: 912, loss: 0.32656750082969666, mean loss: 0.3392954821184278
Epoch: 70, step: 913, loss: 0.3103703260421753, mean loss: 0.33929519852178414
Epoch: 70, step: 914, loss: 0.36189916729927063, mean loss: 0.3392954201401848
Epoch: 70, step: 915, loss: 0.33611592650413513, mean loss: 0.33929538896745615
Epoch: 70, step: 916, loss: 0.3609755039215088, mean loss: 0.3392956015238544
Epoch: 70, step: 917, loss: 0.3699450194835663, mean loss: 0.33929590201423615
Epoch: 70, step: 918, loss: 0.3451944589614868, mean loss: 0.3392959598437928
Epoch: 70, step: 919, loss: 0.3465560972690582, mean loss: 0.3392960310216107
Epoch: 70, step: 920, loss: 0.34059375524520874, mean loss: 0.33929604374427247
Epoch: 70, step: 921, loss: 0.30917680263519287, mean loss: 0.3392957484633847
Epoch: 70, step: 922, loss: 0.3709072768688202, mean loss: 0.33929605837121496
Epoch: 70, step: 923, loss: 0.346322238445282, mean loss: 0.3392961272526321
Epoch: 70, step: 924, loss: 0.3246479332447052, mean loss: 0.33929598364992625
Epoch: 70, step: 925, loss: 0.31404292583465576, mean loss: 0.3392957360854907
Epoch: 70, step: 926, loss: 0.3275241255760193, mean loss: 0.33929562068546415
Epoch: 70, step: 927, loss: 0.3246088922023773, mean loss: 0.3392954767092223
Epoch: 70, step: 928, loss: 0.3162643313407898, mean loss: 0.3392952509336008
Epoch: 70, step: 929, loss: 0.33029651641845703, mean loss: 0.33929516271936183
Epoch: 70, step: 930, loss: 0.34875234961509705, mean loss: 0.33929525542688255
Epoch: 70, step: 931, loss: 0.3477667570114136, mean loss: 0.33929533847104976
Epoch: 70, step: 932, loss: 0.3291974663734436, mean loss: 0.3392952394849196
Epoch: 70, step: 933, loss: 0.3697534501552582, mean loss: 0.33929553805384804
Epoch: 70, step: 934, loss: 0.32283034920692444, mean loss: 0.3392953766541632
Epoch: 70, step: 935, loss: 0.3581524193286896, mean loss: 0.33929556149813545
Epoch: 70, step: 936, loss: 0.33560311794281006, mean loss: 0.33929552530374085
Epoch: 70, step: 937, loss: 0.34041351079940796, mean loss: 0.33929553626244907
Epoch: 70, step: 938, loss: 0.31418177485466003, mean loss: 0.3392952900949567
Epoch: 70, step: 939, loss: 0.31795838475227356, mean loss: 0.3392950809506189
Epoch: 70, step: 940, loss: 0.35587644577026367, mean loss: 0.33929524347955725
Epoch: 70, step: 941, loss: 0.35375455021858215, mean loss: 0.33929538520689784
Epoch: 70, step: 942, loss: 0.3367384970188141, mean loss: 0.33929536014501777
Epoch: 70, step: 943, loss: 0.3570004105567932, mean loss: 0.3392955336831109
Epoch: 70, step: 944, loss: 0.31649044156074524, mean loss: 0.3392953101585618
Epoch: 70, step: 945, loss: 0.2965298295021057, mean loss: 0.339294890995989
Epoch: 70, step: 946, loss: 0.33451223373413086, mean loss: 0.33929484411960076
Epoch: 70, step: 947, loss: 0.321354478597641, mean loss: 0.33929466828193344
Epoch: 70, step: 948, loss: 0.28841155767440796, mean loss: 0.3392941695696986
Epoch: 70, step: 949, loss: 0.3607543110847473, mean loss: 0.3392943799013806
Epoch: 70, step: 950, loss: 0.3248859941959381, mean loss: 0.33929423868561576
Epoch: 70, step: 951, loss: 0.32479703426361084, mean loss: 0.3392940966007363
Epoch: 70, step: 952, loss: 0.33515989780426025, mean loss: 0.33929405608248436
Epoch: 70, step: 953, loss: 0.4006415605545044, mean loss: 0.3392946573281914
Epoch: 70, step: 954, loss: 0.35179048776626587, mean loss: 0.3392947797943103
Epoch: 70, step: 955, loss: 0.3256230354309082, mean loss: 0.3392946458048912
Epoch: 70, step: 956, loss: 0.33680468797683716, mean loss: 0.33929462140239186
Epoch: 70, step: 957, loss: 0.3313077390193939, mean loss: 0.33929454312878415
Epoch: 70, step: 958, loss: 0.3480106592178345, mean loss: 0.33929462854824227
Epoch: 70, step: 959, loss: 0.3582385778427124, mean loss: 0.33929481420043056
Epoch: 70, step: 960, loss: 0.3225105106830597, mean loss: 0.33929464971455214
Epoch: 70, step: 961, loss: 0.29884010553359985, mean loss: 0.339294253264618
Epoch: 70, step: 962, loss: 0.32320693135261536, mean loss: 0.339294095612237
Epoch: 70, step: 963, loss: 0.3153117895126343, mean loss: 0.33929386059296984
Epoch: 70, step: 964, loss: 0.3276767432689667, mean loss: 0.33929374674988766
Epoch: 70, step: 965, loss: 0.3493303656578064, mean loss: 0.3392938451037566
Epoch: 70, step: 966, loss: 0.35572123527526855, mean loss: 0.339294006082425
Epoch: 70, step: 967, loss: 0.3317600190639496, mean loss: 0.3392939322545497
Epoch: 70, step: 968, loss: 0.3258349299430847, mean loss: 0.33929380036690443
Epoch: 70, step: 969, loss: 0.34048622846603394, mean loss: 0.33929381205164816
Epoch: 70, step: 970, loss: 0.32185041904449463, mean loss: 0.33929364112345534
Epoch: 70, step: 971, loss: 0.32690903544425964, mean loss: 0.3392935197676203
Epoch: 70, step: 972, loss: 0.3332640826702118, mean loss: 0.33929346068619104
Epoch: 70, step: 973, loss: 0.2950390577316284, mean loss: 0.339293027049068
Epoch: 70, step: 974, loss: 0.3324441611766815, mean loss: 0.3392929599395107
Epoch: 70, step: 975, loss: 0.3738850951194763, mean loss: 0.33929329889199933
Epoch: 70, step: 976, loss: 0.31781744956970215, mean loss: 0.33929308846205014
Epoch: 70, step: 977, loss: 0.3269980549812317, mean loss: 0.33929296799100933
Epoch: 70, step: 978, loss: 0.3130226135253906, mean loss: 0.3392927105874049
Epoch: 70, step: 979, loss: 0.35283228754997253, mean loss: 0.3392928432503185
Epoch: 70, step: 980, loss: 0.31444865465164185, mean loss: 0.33929259982541965
Epoch: 70, step: 981, loss: 0.34967198967933655, mean loss: 0.33929270152232793
Epoch: 70, step: 982, loss: 0.3321053981781006, mean loss: 0.33929263110206453
Epoch: 70, step: 983, loss: 0.3755166828632355, mean loss: 0.3392929860171351
Epoch: 70, step: 984, loss: 0.3056439757347107, mean loss: 0.339292656334969
Epoch: 70, step: 985, loss: 0.33816370368003845, mean loss: 0.33929264527396286
Epoch: 70, step: 986, loss: 0.3409622013568878, mean loss: 0.33929266163141514
Epoch: 70, step: 987, loss: 0.33262670040130615, mean loss: 0.3392925963223934
Epoch: 70, step: 988, loss: 0.3185533583164215, mean loss: 0.3392923931339816
Epoch: 70, step: 989, loss: 0.2972773611545563, mean loss: 0.3392919815043942
Epoch: 70, step: 990, loss: 0.3054806888103485, mean loss: 0.3392916502517104
Epoch: 70, step: 991, loss: 0.33073270320892334, mean loss: 0.3392915663996545
Epoch: 70, step: 992, loss: 0.28919678926467896, mean loss: 0.3392910756256287
Epoch: 70, step: 993, loss: 0.3206349015235901, mean loss: 0.33929089285455966
Epoch: 70, step: 994, loss: 0.31678542494773865, mean loss: 0.3392906723748349
Epoch: 70, step: 995, loss: 0.3555545210838318, mean loss: 0.33929083170561497
Epoch: 70, step: 996, loss: 0.3496812880039215, mean loss: 0.3392909334959918
Epoch: 70, step: 997, loss: 0.31864386796951294, mean loss: 0.33929073122845593
Epoch: 70, step: 998, loss: 0.34298598766326904, mean loss: 0.33929076742842296
Epoch: 70, step: 999, loss: 0.3075172007083893, mean loss: 0.3392904561669935
Epoch: 70, step: 1000, loss: 0.3805050551891327, mean loss: 0.3392908599110695
Epoch: 70, step: 1001, loss: 0.3398793339729309, mean loss: 0.33929086567578864
Epoch: 70, step: 1002, loss: 0.30031925439834595, mean loss: 0.3392904839118194
Epoch: 70, step: 1003, loss: 0.3061596155166626, mean loss: 0.33929015936665663
Epoch: 70, step: 1004, loss: 0.30833521485328674, mean loss: 0.33928985613949775
Epoch: 70, step: 1005, loss: 0.35358038544654846, mean loss: 0.3392899961246995
Epoch: 70, step: 1006, loss: 0.3218497633934021, mean loss: 0.33928982528773954
Epoch: 70, step: 1007, loss: 0.35299238562583923, mean loss: 0.3392899595107661
Epoch: 70, step: 1008, loss: 0.30769339203834534, mean loss: 0.3392896500105509
Epoch: 70, step: 1009, loss: 0.3008193373680115, mean loss: 0.3392892731831178
Epoch: 70, step: 1010, loss: 0.3109631836414337, mean loss: 0.33928899572389476
Epoch: 70, step: 1011, loss: 0.3747069537639618, mean loss: 0.33928934264586746
Epoch: 70, step: 1012, loss: 0.3896670937538147, mean loss: 0.3392898360954782
Epoch: 70, step: 1013, loss: 0.3370879590511322, mean loss: 0.33928981452832396
Epoch: 70, step: 1014, loss: 0.3125293552875519, mean loss: 0.3392895524150056
Epoch: 70, step: 1015, loss: 0.32463338971138, mean loss: 0.3392894088622444
Epoch: 70, step: 1016, loss: 0.3449042737483978, mean loss: 0.3392894638576398
Epoch: 70, step: 1017, loss: 0.3828375041484833, mean loss: 0.33928989038940627
Epoch: 70, step: 1018, loss: 0.32129284739494324, mean loss: 0.33928971411889436
Epoch: 70, step: 1019, loss: 0.33613234758377075, mean loss: 0.33928968319463837
Epoch: 70, step: 1020, loss: 0.32522374391555786, mean loss: 0.3392895454296872
Epoch: 70, step: 1021, loss: 0.33497121930122375, mean loss: 0.33928950313545075
Epoch: 70, step: 1022, loss: 0.37899696826934814, mean loss: 0.33928989203161575
Epoch: 70, step: 1023, loss: 0.3169325888156891, mean loss: 0.33928967306562796
Epoch: 70, step: 1024, loss: 0.3329260051250458, mean loss: 0.33928961074088443
Epoch: 70, step: 1025, loss: 0.27261021733283997, mean loss: 0.33928895769999157
Epoch: 70, step: 1026, loss: 0.3483501672744751, mean loss: 0.33928904644228713
Epoch: 70, step: 1027, loss: 0.31817108392715454, mean loss: 0.3392888396224247
Epoch: 70, step: 1028, loss: 0.3436059355735779, mean loss: 0.33928888190171397
Epoch: 70, step: 1029, loss: 0.3306385576725006, mean loss: 0.33928879718597377
Epoch: 70, step: 1030, loss: 0.32443228363990784, mean loss: 0.3392886516922116
Epoch: 70, step: 1031, loss: 0.30850663781166077, mean loss: 0.3392883502387695
Epoch: 70, step: 1032, loss: 0.2971527576446533, mean loss: 0.33928793760186143
Epoch: 70, step: 1033, loss: 0.34040987491607666, mean loss: 0.33928794858896716
Epoch: 70, step: 1034, loss: 0.316817969083786, mean loss: 0.3392877285431413
Epoch: 70, step: 1035, loss: 0.3270951509475708, mean loss: 0.33928760914385425
Epoch: 70, step: 1036, loss: 0.37415504455566406, mean loss: 0.33928795058979777
Epoch: 70, step: 1037, loss: 0.33166027069091797, mean loss: 0.3392878758950339
Epoch: 70, step: 1038, loss: 0.3175714313983917, mean loss: 0.3392876632368166
Epoch: 70, step: 1039, loss: 0.33966895937919617, mean loss: 0.33928766697062135
Epoch: 70, step: 1040, loss: 0.316577672958374, mean loss: 0.33928744458742877
Epoch: 70, step: 1041, loss: 0.30267325043678284, mean loss: 0.3392870860535756
Epoch: 70, step: 1042, loss: 0.3270518183708191, mean loss: 0.3392869662444466
Epoch: 70, step: 1043, loss: 0.3347432315349579, mean loss: 0.3392869217521166
Epoch: 70, step: 1044, loss: 0.3437243700027466, mean loss: 0.3392869652032623
Epoch: 70, step: 1045, loss: 0.3647304177284241, mean loss: 0.33928721434111675
Epoch: 70, step: 1046, loss: 0.3343602120876312, mean loss: 0.33928716609724147
Epoch: 70, step: 1047, loss: 0.3169305920600891, mean loss: 0.33928694718985036
Epoch: 70, step: 1048, loss: 0.30285710096359253, mean loss: 0.33928659048562115
Epoch: 70, step: 1049, loss: 0.2987482249736786, mean loss: 0.33928619355655515
Epoch: 70, step: 1050, loss: 0.34662485122680664, mean loss: 0.33928626541189455
Epoch: 70, step: 1051, loss: 0.30818232893943787, mean loss: 0.3392859608654598
Epoch: 70, step: 1052, loss: 0.3232363164424896, mean loss: 0.33928580372090883
Epoch: 70, step: 1053, loss: 0.3095952272415161, mean loss: 0.33928551301872856
Epoch: 70, step: 1054, loss: 0.35269811749458313, mean loss: 0.3392856443410419
Epoch: 70, step: 1055, loss: 0.3359065055847168, mean loss: 0.3392856112563435
Epoch: 70, step: 1056, loss: 0.3465563654899597, mean loss: 0.3392856824426348
Epoch: 70, step: 1057, loss: 0.33226847648620605, mean loss: 0.3392856137394493
Epoch: 70, step: 1058, loss: 0.30742204189300537, mean loss: 0.33928530177661587
Epoch: 70, step: 1059, loss: 0.3308296501636505, mean loss: 0.339285218991697
Epoch: 70, step: 1060, loss: 0.3092816472053528, mean loss: 0.3392849252450939
Epoch: 70, step: 1061, loss: 0.3212578594684601, mean loss: 0.33928474875485704
Epoch: 70, step: 1062, loss: 0.32837846875190735, mean loss: 0.3392846419802371
Epoch: 70, step: 1063, loss: 0.32885751128196716, mean loss: 0.3392845398975822
Epoch: 70, step: 1064, loss: 0.3086296617984772, mean loss: 0.3392842397861906
Epoch: 70, step: 1065, loss: 0.3210143744945526, mean loss: 0.3392840609258799
Epoch: 70, step: 1066, loss: 0.3600040674209595, mean loss: 0.33928426377086307
Epoch: 70, step: 1067, loss: 0.39010635018348694, mean loss: 0.33928476130470037
Epoch: 70, step: 1068, loss: 0.3244158625602722, mean loss: 0.3392846157438163
Epoch: 70, step: 1069, loss: 0.36306580901145935, mean loss: 0.33928484855040725
Epoch: 70, step: 1070, loss: 0.39153802394866943, mean loss: 0.33928536007917737
Epoch: 70, step: 1071, loss: 0.3390875458717346, mean loss: 0.3392853581427081
Epoch: 70, step: 1072, loss: 0.35329365730285645, mean loss: 0.3392854952732785
Epoch: 70, step: 1073, loss: 0.32053354382514954, mean loss: 0.33928531170776516
Epoch: 70, step: 1074, loss: 0.32889115810394287, mean loss: 0.3392852099589168
Epoch: 70, step: 1075, loss: 0.3171240985393524, mean loss: 0.3392849930249
Epoch: 70, step: 1076, loss: 0.29779499769210815, mean loss: 0.3392845868853762
Epoch: 70, step: 1077, loss: 0.29043346643447876, mean loss: 0.3392841086935513
Epoch: 70, step: 1078, loss: 0.3126211166381836, mean loss: 0.3392838476985136
Epoch: 70, step: 1079, loss: 0.31854048371315, mean loss: 0.3392836446507064
Epoch: 70, step: 1080, loss: 0.28334078192710876, mean loss: 0.33928309705560916
Epoch: 70, step: 1081, loss: 0.29346463084220886, mean loss: 0.33928264856726503
Epoch: 70, step: 1082, loss: 0.32071104645729065, mean loss: 0.33928246678323254
Epoch: 70, step: 1083, loss: 0.35348767042160034, mean loss: 0.3392826058263753
Epoch: 70, step: 1084, loss: 0.31258687376976013, mean loss: 0.3392823445262035
Epoch: 70, step: 1085, loss: 0.3608182668685913, mean loss: 0.3392825553196411
Epoch: 70, step: 1086, loss: 0.3223954737186432, mean loss: 0.33928239003063776
Epoch: 70, step: 1087, loss: 0.34300899505615234, mean loss: 0.33928242650590423
Epoch: 70, step: 1088, loss: 0.36291369795799255, mean loss: 0.33928265780181055
Epoch: 70, step: 1089, loss: 0.3323309123516083, mean loss: 0.339282589760845
Epoch: 70, step: 1090, loss: 0.30816423892974854, mean loss: 0.3392822851895789
Epoch: 70, step: 1091, loss: 0.32161250710487366, mean loss: 0.3392821122480873
Epoch: 70, step: 1092, loss: 0.31925708055496216, mean loss: 0.339281916256664
Epoch: 70, step: 1093, loss: 0.2838912308216095, mean loss: 0.33928137413552323
Epoch: 70, step: 1094, loss: 0.3406185507774353, mean loss: 0.3392813872226448
Epoch: 70, step: 1095, loss: 0.31992265582084656, mean loss: 0.3392811977580797
Epoch: 70, step: 1096, loss: 0.36229488253593445, mean loss: 0.33928142299159386
Epoch: 70, step: 1097, loss: 0.30913203954696655, mean loss: 0.3392811279243245
Epoch: 70, step: 1098, loss: 0.31482064723968506, mean loss: 0.33928088853579375
Epoch: 70, step: 1099, loss: 0.30274152755737305, mean loss: 0.3392805309378198
Epoch: 70, step: 1100, loss: 0.34200987219810486, mean loss: 0.33928055764866877
Epoch: 70, step: 1101, loss: 0.29945191740989685, mean loss: 0.3392801678672959
Epoch: 70, step: 1102, loss: 0.37517407536506653, mean loss: 0.3392805191381286
Epoch: 70, step: 1103, loss: 0.3344866931438446, mean loss: 0.3392804722244631
Epoch: 70, step: 1104, loss: 0.3188636302947998, mean loss: 0.3392802724217335
Epoch: 70, step: 1105, loss: 0.2916054427623749, mean loss: 0.33927980587220946
Epoch: 70, step: 1106, loss: 0.3238087594509125, mean loss: 0.33927965447284925
Epoch: 70, step: 1107, loss: 0.3379037380218506, mean loss: 0.33927964100828933
Epoch: 70, step: 1108, loss: 0.4076872169971466, mean loss: 0.33928031043039925
Epoch: 70, step: 1109, loss: 0.3249838948249817, mean loss: 0.3392801705300606
Epoch: 70, step: 1110, loss: 0.32569751143455505, mean loss: 0.3392800376156249
Epoch: 70, step: 1111, loss: 0.33679935336112976, mean loss: 0.3392800133408847
Epoch: 70, step: 1112, loss: 0.41641128063201904, mean loss: 0.3392807681016539
Epoch: 70, step: 1113, loss: 0.3525553345680237, mean loss: 0.3392808979974058
Epoch: 70, step: 1114, loss: 0.3311065435409546, mean loss: 0.3392808180095937
Epoch: 70, step: 1115, loss: 0.3495400547981262, mean loss: 0.3392809183974444
Epoch: 70, step: 1116, loss: 0.32723546028137207, mean loss: 0.33928080053235915
Epoch: 70, step: 1117, loss: 0.3010057806968689, mean loss: 0.3392804260140727
Epoch: 70, step: 1118, loss: 0.35426297783851624, mean loss: 0.33928057261581857
Epoch: 70, step: 1119, loss: 0.3587670922279358, mean loss: 0.3392807632862649
Epoch: 70, step: 1120, loss: 0.34319832921028137, mean loss: 0.3392808016182374
Epoch: 70, step: 1121, loss: 0.3289784789085388, mean loss: 0.33928070081470413
Epoch: 70, step: 1122, loss: 0.34690698981285095, mean loss: 0.3392807754337368
Epoch: 70, step: 1123, loss: 0.3603607416152954, mean loss: 0.33928098168756426
Epoch: 70, step: 1124, loss: 0.35742175579071045, mean loss: 0.33928115918156265
Epoch: 70, step: 1125, loss: 0.3185093402862549, mean loss: 0.339280955946734
Epoch: 70, step: 1126, loss: 0.3362807035446167, mean loss: 0.3392809265920675
Epoch: 70, step: 1127, loss: 0.31787070631980896, mean loss: 0.33928071711511587
Epoch: 70, step: 1128, loss: 0.35375261306762695, mean loss: 0.33928085870632557
Epoch: 70, step: 1129, loss: 0.34521371126174927, mean loss: 0.3392809167520408
Epoch: 70, step: 1130, loss: 0.32833221554756165, mean loss: 0.33928080963342144
Epoch: 70, step: 1131, loss: 0.33358055353164673, mean loss: 0.33928075386446965
Epoch: 70, step: 1132, loss: 0.3097856044769287, mean loss: 0.33928046529893113
Epoch: 70, step: 1133, loss: 0.3546842038631439, mean loss: 0.33928061599979953
Epoch: 70, step: 1134, loss: 0.29615336656570435, mean loss: 0.33928019407298415
Epoch: 70, step: 1135, loss: 0.3258163034915924, mean loss: 0.33928006235299335
Epoch: 70, step: 1136, loss: 0.37025365233421326, mean loss: 0.3392803653709843
Epoch: 70, step: 1137, loss: 0.3144080936908722, mean loss: 0.3392801220452327
Epoch: 70, step: 1138, loss: 0.3148905634880066, mean loss: 0.33927988344420396
Epoch: 70, step: 1139, loss: 0.32135647535324097, mean loss: 0.33927970810270436
Epoch: 70, step: 1140, loss: 0.29996734857559204, mean loss: 0.3392793235206759
Epoch: 70, step: 1141, loss: 0.33964934945106506, mean loss: 0.3392793271405027
Epoch: 70, step: 1142, loss: 0.37643179297447205, mean loss: 0.3392796905857727
Epoch: 70, step: 1143, loss: 0.34486493468284607, mean loss: 0.3392797452230799
Epoch: 70, step: 1144, loss: 0.3398315906524658, mean loss: 0.33927975062142113
Epoch: 70, step: 1145, loss: 0.31554216146469116, mean loss: 0.3392795184144566
Epoch: 70, step: 1146, loss: 0.36896106600761414, mean loss: 0.3392798087638515
Epoch: 70, step: 1147, loss: 0.3327488601207733, mean loss: 0.3392797448777475
Epoch: 70, step: 1148, loss: 0.32869163155555725, mean loss: 0.33927964130524535
Epoch: 70, step: 1149, loss: 0.34997430443763733, mean loss: 0.3392797459189902
Epoch: 70, step: 1150, loss: 0.323579341173172, mean loss: 0.33927959234126187
Epoch: 70, step: 1151, loss: 0.32755640149116516, mean loss: 0.3392794776688418
Epoch: 70, step: 1152, loss: 0.355928897857666, mean loss: 0.33927964052643367
Epoch: 70, step: 1153, loss: 0.3337398171424866, mean loss: 0.3392795863387526
Epoch: 70, step: 1154, loss: 0.3168971538543701, mean loss: 0.33927936740754033
Epoch: 70, step: 1155, loss: 0.2910535931587219, mean loss: 0.3392788956972402
Epoch: 70, step: 1156, loss: 0.362493634223938, mean loss: 0.339279122765117
Epoch: 70, step: 1157, loss: 0.35197940468788147, mean loss: 0.3392792469878319
Epoch: 70, step: 1158, loss: 0.32354018092155457, mean loss: 0.33927909304397424
Epoch: 70, step: 1159, loss: 0.34102869033813477, mean loss: 0.3392791101566238
Epoch: 70, step: 1160, loss: 0.3552096486091614, mean loss: 0.3392792659702255
Epoch: 70, step: 1161, loss: 0.2967665195465088, mean loss: 0.33927885016511194
Epoch: 70, step: 1162, loss: 0.3900474011898041, mean loss: 0.3392793467130519
Epoch: 70, step: 1163, loss: 0.33718228340148926, mean loss: 0.3392793262026717
Epoch: 70, step: 1164, loss: 0.35757437348365784, mean loss: 0.3392795051360893
Epoch: 70, step: 1165, loss: 0.3401316702365875, mean loss: 0.33927951347054836
Epoch: 70, step: 1166, loss: 0.33579063415527344, mean loss: 0.33927947934847813
Epoch: 70, step: 1167, loss: 0.3008078932762146, mean loss: 0.33927910309088805
Epoch: 70, step: 1168, loss: 0.33644798398017883, mean loss: 0.3392790754024108
Epoch: 70, step: 1169, loss: 0.37447625398635864, mean loss: 0.33927941962909625
Epoch: 70, step: 1170, loss: 0.3360494375228882, mean loss: 0.33927938804033814
Epoch: 70, step: 1171, loss: 0.3691706359386444, mean loss: 0.33927968036956296
Epoch: 70, step: 1172, loss: 0.37078675627708435, mean loss: 0.3392799884981842
Epoch: 70, step: 1173, loss: 0.32625749707221985, mean loss: 0.3392798611438369
Epoch: 70, step: 1174, loss: 0.3124055862426758, mean loss: 0.3392795983275942
Epoch: 70, step: 1175, loss: 0.33561620116233826, mean loss: 0.3392795625018513
Epoch: 70, step: 1176, loss: 0.3305723965167999, mean loss: 0.3392794773520231
Epoch: 70, step: 1177, loss: 0.3552708923816681, mean loss: 0.3392796337350447
Epoch: 70, step: 1178, loss: 0.31025975942611694, mean loss: 0.33927934994707193
Epoch: 70, step: 1179, loss: 0.3136906325817108, mean loss: 0.3392790997151399
Epoch: 70, step: 1180, loss: 0.3550180196762085, mean loss: 0.33927925362445005
Epoch: 70, step: 1181, loss: 0.338979572057724, mean loss: 0.3392792506939229
Epoch: 70, step: 1182, loss: 0.3302183747291565, mean loss: 0.33927916209026404
Epoch: 70, step: 1183, loss: 0.32667264342308044, mean loss: 0.3392790388160066
Epoch: 70, step: 1184, loss: 0.3129864037036896, mean loss: 0.3392787817130377
Epoch: 70, step: 1185, loss: 0.3047693967819214, mean loss: 0.33927844426574405
Epoch: 70, step: 1186, loss: 0.3061372935771942, mean loss: 0.3392781202007897
Epoch: 70, step: 1187, loss: 0.3303077816963196, mean loss: 0.33927803248675886
Epoch: 70, step: 1188, loss: 0.31976765394210815, mean loss: 0.3392778417116604
Epoch: 70, step: 1189, loss: 0.3120463788509369, mean loss: 0.33927757544136744
Epoch: 70, step: 1190, loss: 0.34209388494491577, mean loss: 0.339277602979081
Epoch: 70, step: 1191, loss: 0.3108692765235901, mean loss: 0.3392773252068026
Epoch: 70, step: 1192, loss: 0.30427291989326477, mean loss: 0.3392769829424189
Epoch: 70, step: 1193, loss: 0.3062196373939514, mean loss: 0.33927665971906257
Epoch: 70, step: 1194, loss: 0.30332884192466736, mean loss: 0.3392763082370993
Epoch: 70, step: 1195, loss: 0.36438697576522827, mean loss: 0.33927655375576965
Epoch: 70, step: 1196, loss: 0.30891647934913635, mean loss: 0.3392762569141102
Epoch: 70, step: 1197, loss: 0.3709205985069275, mean loss: 0.33927656630949915
Epoch: 70, step: 1198, loss: 0.30154478549957275, mean loss: 0.3392761973991577
Epoch: 70, step: 1199, loss: 0.2988617718219757, mean loss: 0.3392758022639839
Epoch: 70, step: 1200, loss: 0.42899802327156067, mean loss: 0.3392766794769659
Epoch: 70, step: 1201, loss: 0.32624998688697815, mean loss: 0.3392765521164079
Epoch: 70, step: 1202, loss: 0.34256795048713684, mean loss: 0.3392765842957375
Epoch: 70, step: 1203, loss: 0.3200361132621765, mean loss: 0.3392763961874211
Epoch: 70, step: 1204, loss: 0.3412204086780548, mean loss: 0.33927641519326257
Epoch: 70, step: 1205, loss: 0.3441050052642822, mean loss: 0.33927646240001685
Epoch: 70, step: 1206, loss: 0.30334192514419556, mean loss: 0.3392761110891244
Epoch: 70, step: 1207, loss: 0.3364239037036896, mean loss: 0.33927608320503844
Epoch: 70, step: 1208, loss: 0.3449806869029999, mean loss: 0.33927613897451214
Epoch: 70, step: 1209, loss: 0.3425288796424866, mean loss: 0.339276170773717
Epoch: 70, step: 1210, loss: 0.32482418417930603, mean loss: 0.3392760294906462
Epoch: 70, step: 1211, loss: 0.35212552547454834, mean loss: 0.3392761551064909
Epoch: 70, step: 1212, loss: 0.3146691918373108, mean loss: 0.33927591455275535
Epoch: 70, step: 1213, loss: 0.3216927647590637, mean loss: 0.3392757426643768
Epoch: 70, step: 1214, loss: 0.3556099236011505, mean loss: 0.33927590234159405
Epoch: 70, step: 1215, loss: 0.3560243546962738, mean loss: 0.3392760660669827
Epoch: 70, step: 1216, loss: 0.31577906012535095, mean loss: 0.3392758363729942
Epoch: 70, step: 1217, loss: 0.33509254455566406, mean loss: 0.3392757954798016
Epoch: 70, step: 1218, loss: 0.36644217371940613, mean loss: 0.339276061038392
Epoch: 70, step: 1219, loss: 0.3317217230796814, mean loss: 0.33927598719344615
Epoch: 70, step: 1220, loss: 0.32234805822372437, mean loss: 0.3392758217216622
Epoch: 70, step: 1221, loss: 0.35771143436431885, mean loss: 0.3392760019294064
Epoch: 70, step: 1222, loss: 0.3108097314834595, mean loss: 0.3392757236749031
Epoch: 70, step: 1223, loss: 0.4044192433357239, mean loss: 0.3392763604390537
Epoch: 70, step: 1224, loss: 0.363450288772583, mean loss: 0.33927659673178945
Epoch: 70, step: 1225, loss: 0.35506120324134827, mean loss: 0.3392767510199691
Epoch: 70, step: 1226, loss: 0.3129897117614746, mean loss: 0.3392764940772452
Epoch: 70, step: 1227, loss: 0.3136112093925476, mean loss: 0.33927624321431477
Epoch: 70, step: 1228, loss: 0.3415333032608032, mean loss: 0.33927626527552196
Epoch: 70, step: 1229, loss: 0.343912810087204, mean loss: 0.3392763105941107
Epoch: 70, step: 1230, loss: 0.3119596242904663, mean loss: 0.33927604359753843
Epoch: 70, step: 1231, loss: 0.3426341712474823, mean loss: 0.33927607641996055
Epoch: 70, step: 1232, loss: 0.30304527282714844, mean loss: 0.33927572230265785
Epoch: 70, step: 1233, loss: 0.3435627818107605, mean loss: 0.3392757642036637
Epoch: 70, step: 1234, loss: 0.3293185234069824, mean loss: 0.33927566688420124
Epoch: 70, step: 1235, loss: 0.3446693420410156, mean loss: 0.33927571960005365
Epoch: 70, step: 1236, loss: 0.32062867283821106, mean loss: 0.33927553735226723
Epoch: 70, step: 1237, loss: 0.3444105386734009, mean loss: 0.33927558753895304
Epoch: 70, step: 1238, loss: 0.28759098052978516, mean loss: 0.33927508240689536
Epoch: 70, step: 1239, loss: 0.32788264751434326, mean loss: 0.339274971065663
Epoch: 70, step: 1240, loss: 0.3068583607673645, mean loss: 0.33927465425278686
Epoch: 70, step: 1241, loss: 0.30243420600891113, mean loss: 0.339274294208532
Epoch: 70, step: 1242, loss: 0.3454411029815674, mean loss: 0.33927435447659265
Epoch: 70, step: 1243, loss: 0.31439369916915894, mean loss: 0.3392741113209761
Epoch: 70, step: 1244, loss: 0.33760783076286316, mean loss: 0.33927409503677813
Epoch: 70, step: 1245, loss: 0.33244261145591736, mean loss: 0.33927402827482533
Epoch: 70, step: 1246, loss: 0.31270912289619446, mean loss: 0.33927376866684916
Epoch: 70, step: 1247, loss: 0.36529314517974854, mean loss: 0.33927402294110953
Epoch: 70, step: 1248, loss: 0.3649805188179016, mean loss: 0.33927427415529005
Epoch: 70, step: 1249, loss: 0.32375019788742065, mean loss: 0.33927412244927746
Epoch: 70, step: 1250, loss: 0.33389517664909363, mean loss: 0.3392740698850907
Epoch: 70, step: 1251, loss: 0.3435669243335724, mean loss: 0.339274111835355
Epoch: 70, step: 1252, loss: 0.3281245529651642, mean loss: 0.3392740028816561
Epoch: 70, step: 1253, loss: 0.2995195686817169, mean loss: 0.33927361440437387
Epoch: 70, step: 1254, loss: 0.32519668340682983, mean loss: 0.3392734768470279
Epoch: 70, step: 1255, loss: 0.34323373436927795, mean loss: 0.33927351554560436
Epoch: 70, step: 1256, loss: 0.353807657957077, mean loss: 0.3392736575679659
Epoch: 70, step: 1257, loss: 0.3525581359863281, mean loss: 0.33927378737779623
Epoch: 70, step: 1258, loss: 0.3380429744720459, mean loss: 0.3392737753509745
Epoch: 70, step: 1259, loss: 0.36062994599342346, mean loss: 0.3392739840296011
Epoch: 70, step: 1260, loss: 0.3565705120563507, mean loss: 0.3392741530383857
Epoch: 70, step: 1261, loss: 0.37689754366874695, mean loss: 0.33927452066253444
Epoch: 70, step: 1262, loss: 0.31415385007858276, mean loss: 0.33927427520685516
Epoch: 70, step: 1263, loss: 0.31981754302978516, mean loss: 0.339274085095738
Epoch: 70, step: 1264, loss: 0.3430989384651184, mean loss: 0.3392741224678946
Epoch: 70, step: 1265, loss: 0.44745588302612305, mean loss: 0.33927517948781294
Epoch: 70, step: 1266, loss: 0.373523473739624, mean loss: 0.33927551411700824
Epoch: 70, step: 1267, loss: 0.3261505365371704, mean loss: 0.3392753858782778
Epoch: 70, step: 1268, loss: 0.3425256609916687, mean loss: 0.3392754176350621
Epoch: 70, step: 1269, loss: 0.3073214292526245, mean loss: 0.3392751054319514
Epoch: 70, step: 1270, loss: 0.32926157116889954, mean loss: 0.33927500759671514
Epoch: 70, step: 1271, loss: 0.3304552733898163, mean loss: 0.3392749214261058
Epoch: 70, step: 1272, loss: 0.3256889879703522, mean loss: 0.3392747886900506
Epoch: 70, step: 1273, loss: 0.3272048830986023, mean loss: 0.33927467076690554
Epoch: 70, step: 1274, loss: 0.29910579323768616, mean loss: 0.33927427832024903
Epoch: 70, step: 1275, loss: 0.3255990147590637, mean loss: 0.33927414471534495
Epoch: 70, step: 1276, loss: 0.32406917214393616, mean loss: 0.33927399616690596
Epoch: 70, step: 1277, loss: 0.3356412649154663, mean loss: 0.3392739606764582
Epoch: 70, step: 1278, loss: 0.35333219170570374, mean loss: 0.3392740980188612
Epoch: 70, step: 1279, loss: 0.34052976965904236, mean loss: 0.33927411028607146
Epoch: 70, step: 1280, loss: 0.32674258947372437, mean loss: 0.3392739878613119
Epoch: 70, step: 1281, loss: 0.3226885497570038, mean loss: 0.3392738258340156
Epoch: 70, step: 1282, loss: 0.31561678647994995, mean loss: 0.3392735947247344
Epoch: 70, step: 1283, loss: 0.3114563226699829, mean loss: 0.33927332297615037
Epoch: 70, step: 1284, loss: 0.2835490107536316, mean loss: 0.3392727786073503
Epoch: 70, step: 1285, loss: 0.3391607701778412, mean loss: 0.33927277751315466
Epoch: 70, step: 1286, loss: 0.35638338327407837, mean loss: 0.33927294466278063
Epoch: 70, step: 1287, loss: 0.32675087451934814, mean loss: 0.3392728223387131
Epoch: 70, step: 1288, loss: 0.2995125353336334, mean loss: 0.3392724339370778
Epoch: 70, step: 1289, loss: 0.3219345211982727, mean loss: 0.339272264571905
Epoch: 70, step: 1290, loss: 0.34748727083206177, mean loss: 0.33927234481930185
Epoch: 70, step: 1291, loss: 0.35260576009750366, mean loss: 0.33927247506404923
Epoch: 70, step: 1292, loss: 0.3276488482952118, mean loss: 0.33927236152213125
Epoch: 70, step: 1293, loss: 0.3026200532913208, mean loss: 0.33927200349852926
Epoch: 70, step: 1294, loss: 0.3173827826976776, mean loss: 0.3392717896844067
Epoch: 70, step: 1295, loss: 0.30548208951950073, mean loss: 0.3392714596295094
Epoch: 70, step: 1296, loss: 0.3388459086418152, mean loss: 0.3392714554728044
Epoch: 70, step: 1297, loss: 0.3039417564868927, mean loss: 0.33927111038207214
Epoch: 70, step: 1298, loss: 0.35739704966545105, mean loss: 0.3392712874295065
Epoch: 70, step: 1299, loss: 0.3364536166191101, mean loss: 0.3392712599078147
Epoch: 70, step: 1300, loss: 0.32745832204818726, mean loss: 0.33927114452568463
Epoch: 70, step: 1301, loss: 0.31976836919784546, mean loss: 0.3392709540354097
Epoch: 70, step: 1302, loss: 0.33022356033325195, mean loss: 0.3392708656672851
Epoch: 70, step: 1303, loss: 0.3219071924686432, mean loss: 0.339270696073665
Epoch: 70, step: 1304, loss: 0.379998117685318, mean loss: 0.33927109386066123
Epoch: 70, step: 1305, loss: 0.331795334815979, mean loss: 0.3392710208452192
Epoch: 70, step: 1306, loss: 0.3722611963748932, mean loss: 0.33927134305580775
Epoch: 70, step: 1307, loss: 0.33240097761154175, mean loss: 0.33927127595453177
Epoch: 70, step: 1308, loss: 0.3402283489704132, mean loss: 0.33927128530195205
Epoch: 70, step: 1309, loss: 0.3611660599708557, mean loss: 0.33927149913899346
Epoch: 70, step: 1310, loss: 0.33345258235931396, mean loss: 0.3392714423086394
Epoch: 70, step: 1311, loss: 0.37253710627555847, mean loss: 0.33927176719402075
Epoch: 70, step: 1312, loss: 0.29661616683006287, mean loss: 0.3392713506069458
Epoch: 70, step: 1313, loss: 0.33298277854919434, mean loss: 0.3392712891915107
Epoch: 70, step: 1314, loss: 0.3324175775051117, mean loss: 0.33927122225746426
Epoch: 70, step: 1315, loss: 0.3369320034980774, mean loss: 0.33927119941263867
Epoch: 70, step: 1316, loss: 0.3470290005207062, mean loss: 0.3392712751746347
Epoch: 70, step: 1317, loss: 0.34178072214126587, mean loss: 0.3392712996814314
Epoch: 70, step: 1318, loss: 0.33153319358825684, mean loss: 0.3392712241132511
Epoch: 70, step: 1319, loss: 0.35631728172302246, mean loss: 0.33927139057865746
Epoch: 70, step: 1320, loss: 0.3491351902484894, mean loss: 0.3392714869038854
Epoch: 70, step: 1321, loss: 0.3217543363571167, mean loss: 0.33927131584130316
Epoch: 70, step: 1322, loss: 0.3054670989513397, mean loss: 0.33927098573166875
Epoch: 70, step: 1323, loss: 0.3589979410171509, mean loss: 0.3392711783701915
Epoch: 70, step: 1324, loss: 0.3036031126976013, mean loss: 0.3392708300662447
Epoch: 70, step: 1325, loss: 0.3442973792552948, mean loss: 0.3392708791507631
Epoch: 70, step: 1326, loss: 0.285608172416687, mean loss: 0.33927035513671394
Epoch: 70, step: 1327, loss: 0.3653849959373474, mean loss: 0.3392706101425807
Epoch: 70, step: 1328, loss: 0.3419256806373596, mean loss: 0.3392706360687248
Epoch: 70, step: 1329, loss: 0.3916552662849426, mean loss: 0.33927114758742627
Epoch: 70, step: 1330, loss: 0.31642386317253113, mean loss: 0.3392709244933796
Epoch: 70, step: 1331, loss: 0.3682212829589844, mean loss: 0.3392712071785968
Epoch: 70, step: 1332, loss: 0.305093377828598, mean loss: 0.3392708734530996
Epoch: 70, step: 1333, loss: 0.3173302412033081, mean loss: 0.33927065921840266
Epoch: 70, step: 1334, loss: 0.34068402647972107, mean loss: 0.33927067301879577
Epoch: 70, step: 1335, loss: 0.32250458002090454, mean loss: 0.33927050931299785
Epoch: 70, step: 1336, loss: 0.2897287607192993, mean loss: 0.3392700255871653
Epoch: 70, step: 1337, loss: 0.3095425069332123, mean loss: 0.3392697353303876
Epoch: 70, step: 1338, loss: 0.332199364900589, mean loss: 0.3392696662966104
Epoch: 70, step: 1339, loss: 0.3381476104259491, mean loss: 0.33926965534117326
Epoch: 70, step: 1340, loss: 0.36921530961990356, mean loss: 0.33926994771924296
Epoch: 70, step: 1341, loss: 0.3542390763759613, mean loss: 0.33927009387074025
Epoch: 70, step: 1342, loss: 0.3023161292076111, mean loss: 0.3392697330732176
Epoch: 70, step: 1343, loss: 0.3293696641921997, mean loss: 0.3392696364155116
Epoch: 70, step: 1344, loss: 0.35365819931030273, mean loss: 0.3392697768945245
Epoch: 70, step: 1345, loss: 0.31214433908462524, mean loss: 0.33926951206491274
Epoch: 70, step: 1346, loss: 0.33676743507385254, mean loss: 0.3392694876370081
Epoch: 70, step: 1347, loss: 0.31115853786468506, mean loss: 0.339269213191058
Epoch: 70, step: 1348, loss: 0.3544655740261078, mean loss: 0.3392693615510033
Epoch: 70, step: 1349, loss: 0.3312700390815735, mean loss: 0.33926928345549934
Epoch: 70, step: 1350, loss: 0.33856722712516785, mean loss: 0.3392692766015554
Epoch: 70, step: 1351, loss: 0.3455774188041687, mean loss: 0.3392693381852617
Epoch: 70, step: 1352, loss: 0.31556442379951477, mean loss: 0.3392691067665355
Epoch: 70, step: 1353, loss: 0.37926000356674194, mean loss: 0.3392694971730099
Epoch: 70, step: 1354, loss: 0.3476892411708832, mean loss: 0.33926957936897806
Epoch: 70, step: 1355, loss: 0.32443732023239136, mean loss: 0.33926943457360204
Epoch: 70, step: 1356, loss: 0.3320084810256958, mean loss: 0.33926936369146427
Epoch: 70, step: 1357, loss: 0.31806138157844543, mean loss: 0.33926915665909235
Epoch: 70, step: 1358, loss: 0.32723259925842285, mean loss: 0.33926903915933737
Epoch: 70, step: 1359, loss: 0.3504991829395294, mean loss: 0.3392691487858874
Epoch: 70, step: 1360, loss: 0.3176119029521942, mean loss: 0.3392689373739934
Epoch: 70, step: 1361, loss: 0.3593778610229492, mean loss: 0.33926913366968897
Epoch: 70, step: 1362, loss: 0.3355131447315216, mean loss: 0.3392690970055056
Epoch: 70, step: 1363, loss: 0.3395916819572449, mean loss: 0.33926910015439626
Epoch: 70, step: 1364, loss: 0.303987056016922, mean loss: 0.3392687557545316
Epoch: 70, step: 1365, loss: 0.3250676095485687, mean loss: 0.33926861713373424
Epoch: 70, step: 1366, loss: 0.3442305028438568, mean loss: 0.3392686655674191
Epoch: 70, step: 1367, loss: 0.32411062717437744, mean loss: 0.3392685176090559
Epoch: 70, step: 1368, loss: 0.3449641466140747, mean loss: 0.3392685732038299
Epoch: 70, step: 1369, loss: 0.3196242153644562, mean loss: 0.3392683814580238
Epoch: 70, step: 1370, loss: 0.4065811038017273, mean loss: 0.3392690384815994
Epoch: 70, step: 1371, loss: 0.3426711857318878, mean loss: 0.3392690716888306
Epoch: 70, step: 1372, loss: 0.3363231420516968, mean loss: 0.33926904293486887
Epoch: 70, step: 1373, loss: 0.3391549289226532, mean loss: 0.3392690418210616
Epoch: 70, step: 1374, loss: 0.30727481842041016, mean loss: 0.3392687295452
Epoch: 70, step: 1375, loss: 0.3406851589679718, mean loss: 0.33926874336995816
Epoch: 70, step: 1376, loss: 0.31182464957237244, mean loss: 0.33926847551033124
Epoch: 70, step: 1377, loss: 0.35893142223358154, mean loss: 0.33926866742259504
Epoch: 70, step: 1378, loss: 0.3140921890735626, mean loss: 0.33926842170012705
Epoch: 70, step: 1379, loss: 0.3597424030303955, mean loss: 0.3392686215242665
Epoch: 70, step: 1380, loss: 0.37684231996536255, mean loss: 0.33926898823646373
Epoch: 70, step: 1381, loss: 0.3294229805469513, mean loss: 0.33926889214222694
Epoch: 70, step: 1382, loss: 0.31638965010643005, mean loss: 0.3392686688495063
Epoch: 70, step: 1383, loss: 0.3062199056148529, mean loss: 0.3392683463092655
Epoch: 70, step: 1384, loss: 0.34807920455932617, mean loss: 0.3392684322982203
Epoch: 70, step: 1385, loss: 0.3443824350833893, mean loss: 0.3392684822074857
Epoch: 70, step: 1386, loss: 0.30658796429634094, mean loss: 0.3392681632704824
Epoch: 70, step: 1387, loss: 0.38101693987846375, mean loss: 0.33926857070281846
Epoch: 70, step: 1388, loss: 0.3426472842693329, mean loss: 0.33926860367585
Epoch: 70, step: 1389, loss: 0.3501812219619751, mean loss: 0.3392687101715881
Epoch: 70, step: 1390, loss: 0.33649536967277527, mean loss: 0.3392686831069503
Epoch: 70, step: 1391, loss: 0.3199097514152527, mean loss: 0.3392684941877168
Epoch: 70, step: 1392, loss: 0.337049275636673, mean loss: 0.33926847253109943
Epoch: 70, step: 1393, loss: 0.33063995838165283, mean loss: 0.33926838832911504
Epoch: 70, step: 1394, loss: 0.29461607336997986, mean loss: 0.33926795259049625
Epoch: 70, step: 1395, loss: 0.31654784083366394, mean loss: 0.3392677308789564
Epoch: 70, step: 1396, loss: 0.3265171945095062, mean loss: 0.3392676064555602
Epoch: 70, step: 1397, loss: 0.30353596806526184, mean loss: 0.3392672577793722
Epoch: 70, step: 1398, loss: 0.30030369758605957, mean loss: 0.33926687756918095
Epoch: 70, step: 1399, loss: 0.3106536567211151, mean loss: 0.3392665983613272
Epoch: 70, step: 1400, loss: 0.33823108673095703, mean loss: 0.3392665882569017
Epoch: 70, step: 1401, loss: 0.3613385558128357, mean loss: 0.3392668036309923
Epoch: 70, step: 1402, loss: 0.3326578438282013, mean loss: 0.33926673914264005
Epoch: 70, step: 1403, loss: 0.32273069024086, mean loss: 0.33926657779014696
Epoch: 70, step: 1404, loss: 0.3553757667541504, mean loss: 0.33926673497596893
Epoch: 70, step: 1405, loss: 0.33978956937789917, mean loss: 0.33926674007748914
Epoch: 70, step: 1406, loss: 0.33411210775375366, mean loss: 0.33926668978201435
Epoch: 70, step: 1407, loss: 0.3337230980396271, mean loss: 0.33926663569186
Epoch: 70, step: 1408, loss: 0.3438091576099396, mean loss: 0.33926668001390353
Epoch: 70, step: 1409, loss: 0.33757317066192627, mean loss: 0.33926666349024903
Epoch: 70, step: 1410, loss: 0.3757324814796448, mean loss: 0.3392670192855675
Epoch: 70, step: 1411, loss: 0.31571197509765625, mean loss: 0.3392667894623209
Epoch: 70, step: 1412, loss: 0.3952500820159912, mean loss: 0.3392673356780874
Epoch: 70, step: 1413, loss: 0.3302161991596222, mean loss: 0.3392672473691472
Epoch: 70, step: 1414, loss: 0.30600839853286743, mean loss: 0.3392669228767443
Epoch: 70, step: 1415, loss: 0.32400771975517273, mean loss: 0.33926677400066013
Epoch: 70, step: 1416, loss: 0.3730129301548004, mean loss: 0.33926710324108816
Epoch: 70, step: 1417, loss: 0.3671949505805969, mean loss: 0.33926737571320803
Epoch: 70, step: 1418, loss: 0.34794268012046814, mean loss: 0.3392674603511499
Epoch: 70, step: 1419, loss: 0.3067312240600586, mean loss: 0.33926714292445437
Epoch: 70, step: 1420, loss: 0.3146061897277832, mean loss: 0.3392669023321363
Epoch: 70, step: 1421, loss: 0.32010143995285034, mean loss: 0.33926671535566383
Epoch: 70, step: 1422, loss: 0.34680691361427307, mean loss: 0.33926678891642065
Epoch: 70, step: 1423, loss: 0.3228211998939514, mean loss: 0.3392666284779107
Epoch: 70, step: 1424, loss: 0.27847978472709656, mean loss: 0.33926603546446016
Epoch: 70, step: 1425, loss: 0.34907636046409607, mean loss: 0.33926613116934573
Epoch: 70, step: 1426, loss: 0.34463605284690857, mean loss: 0.33926618355524796
Epoch: 70, step: 1427, loss: 0.29684779047966003, mean loss: 0.33926576974956374
Epoch: 70, step: 1428, loss: 0.34116464853286743, mean loss: 0.3392657882735839
Epoch: 70, step: 1429, loss: 0.3294762969017029, mean loss: 0.33926569277566787
Epoch: 70, step: 1430, loss: 0.33886122703552246, mean loss: 0.33926568883008407
Epoch: 70, step: 1431, loss: 0.31841182708740234, mean loss: 0.3392654854015904
Epoch: 70, step: 1432, loss: 0.3424103856086731, mean loss: 0.3392655160796528
Epoch: 70, step: 1433, loss: 0.2808760702610016, mean loss: 0.3392649465043185
Epoch: 70, step: 1434, loss: 0.3254287838935852, mean loss: 0.33926481153711746
Epoch: 70, step: 1435, loss: 0.3964647054672241, mean loss: 0.3392653694977668
Epoch: 70, step: 1436, loss: 0.3299632668495178, mean loss: 0.3392652787605949
Epoch: 70, step: 1437, loss: 0.33363696932792664, mean loss: 0.3392652238599001
Epoch: 70, step: 1438, loss: 0.34986168146133423, mean loss: 0.33926532722081465
Epoch: 70, step: 1439, loss: 0.3443927764892578, mean loss: 0.3392653772349511
Epoch: 70, step: 1440, loss: 0.33909618854522705, mean loss: 0.33926537558466785
Epoch: 70, step: 1441, loss: 0.3698233366012573, mean loss: 0.3392656736471424
Epoch: 70, step: 1442, loss: 0.3433481752872467, mean loss: 0.3392657134674914
Epoch: 70, step: 1443, loss: 0.357707679271698, mean loss: 0.33926589334699087
Valid: 70, mean loss: 0.18363048136234283
Epoch: 71, step: 0, loss: 0.31972774863243103, mean loss: 0.33926570277742524
Epoch: 71, step: 1, loss: 0.35382241010665894, mean loss: 0.3392658447580675
Epoch: 71, step: 2, loss: 0.35622596740722656, mean loss: 0.33926601017910435
Epoch: 71, step: 3, loss: 0.29237744212150574, mean loss: 0.33926555285458754
Epoch: 71, step: 4, loss: 0.3573140799999237, mean loss: 0.3392657288879746
Epoch: 71, step: 5, loss: 0.31053778529167175, mean loss: 0.3392654486973612
Epoch: 71, step: 6, loss: 0.30401739478111267, mean loss: 0.3392651049178807
Epoch: 71, step: 7, loss: 0.31131672859191895, mean loss: 0.3392648323358934
Epoch: 71, step: 8, loss: 0.3291252553462982, mean loss: 0.33926473344502905
Epoch: 71, step: 9, loss: 0.2973647713661194, mean loss: 0.3392643248004616
Epoch: 71, step: 10, loss: 0.33464083075523376, mean loss: 0.33926427970859985
Epoch: 71, step: 11, loss: 0.3217011094093323, mean loss: 0.33926410842075655
Epoch: 71, step: 12, loss: 0.34613651037216187, mean loss: 0.3392641754443866
Epoch: 71, step: 13, loss: 0.2967929244041443, mean loss: 0.339263761244275
Epoch: 71, step: 14, loss: 0.32058748602867126, mean loss: 0.3392635791060133
Epoch: 71, step: 15, loss: 0.36100637912750244, mean loss: 0.3392637911481434
Epoch: 71, step: 16, loss: 0.3437750041484833, mean loss: 0.3392638351423799
Epoch: 71, step: 17, loss: 0.31081971526145935, mean loss: 0.33926355775243355
Epoch: 71, step: 18, loss: 0.30154505372047424, mean loss: 0.33926318992133797
Epoch: 71, step: 19, loss: 0.3411564230918884, mean loss: 0.33926320838398005
Epoch: 71, step: 20, loss: 0.3119683265686035, mean loss: 0.3392629422093073
Epoch: 71, step: 21, loss: 0.32496124505996704, mean loss: 0.3392628027431443
Epoch: 71, step: 22, loss: 0.31980177760124207, mean loss: 0.3392626129665039
Epoch: 71, step: 23, loss: 0.33543193340301514, mean loss: 0.3392625756115134
Epoch: 71, step: 24, loss: 0.36602210998535156, mean loss: 0.3392628365553975
Epoch: 71, step: 25, loss: 0.3443717658519745, mean loss: 0.33926288637430824
Epoch: 71, step: 26, loss: 0.29839351773262024, mean loss: 0.3392624878470521
Epoch: 71, step: 27, loss: 0.36809295415878296, mean loss: 0.339262768977272
Epoch: 71, step: 28, loss: 0.33132627606391907, mean loss: 0.3392626915880887
Epoch: 71, step: 29, loss: 0.3137805163860321, mean loss: 0.3392624431124056
Epoch: 71, step: 30, loss: 0.33416980504989624, mean loss: 0.3392623934547774
Epoch: 71, step: 31, loss: 0.3675307035446167, mean loss: 0.33926266909257613
Epoch: 71, step: 32, loss: 0.3172719180583954, mean loss: 0.3392624546679046
Epoch: 71, step: 33, loss: 0.35355812311172485, mean loss: 0.3392625940589657
Epoch: 71, step: 34, loss: 0.3249758780002594, mean loss: 0.3392624547565538
Epoch: 71, step: 35, loss: 0.3129141628742218, mean loss: 0.3392621978504317
Epoch: 71, step: 36, loss: 0.33545196056365967, mean loss: 0.33926216069949433
Epoch: 71, step: 37, loss: 0.3607481122016907, mean loss: 0.33926237019181604
Epoch: 71, step: 38, loss: 0.330603688955307, mean loss: 0.33926228576876644
Epoch: 71, step: 39, loss: 0.3310322165489197, mean loss: 0.3392622055255113
Epoch: 71, step: 40, loss: 0.313464492559433, mean loss: 0.3392619540000107
Epoch: 71, step: 41, loss: 0.3155832588672638, mean loss: 0.3392617231370041
Epoch: 71, step: 42, loss: 0.3685872256755829, mean loss: 0.33926200905257675
Epoch: 71, step: 43, loss: 0.3317703902721405, mean loss: 0.33926193601206917
Epoch: 71, step: 44, loss: 0.32709285616874695, mean loss: 0.3392618173692059
Epoch: 71, step: 45, loss: 0.3395237922668457, mean loss: 0.3392618199233143
Epoch: 71, step: 46, loss: 0.33552995324134827, mean loss: 0.3392617835400609
Epoch: 71, step: 47, loss: 0.3451947271823883, mean loss: 0.33926184138180765
Epoch: 71, step: 48, loss: 0.3335304856300354, mean loss: 0.3392617855059363
Epoch: 71, step: 49, loss: 0.33010581135749817, mean loss: 0.33926169624380215
Epoch: 71, step: 50, loss: 0.37159979343414307, mean loss: 0.33926201150675306
Epoch: 71, step: 51, loss: 0.32693836092948914, mean loss: 0.3392618913650964
Epoch: 71, step: 52, loss: 0.40281403064727783, mean loss: 0.33926251092054527
Epoch: 71, step: 53, loss: 0.341819167137146, mean loss: 0.33926253584456617
Epoch: 71, step: 54, loss: 0.3149215877056122, mean loss: 0.3392622985547882
Epoch: 71, step: 55, loss: 0.3357568681240082, mean loss: 0.33926226438213825
Epoch: 71, step: 56, loss: 0.32325389981269836, mean loss: 0.3392621083262939
Epoch: 71, step: 57, loss: 0.33075711131095886, mean loss: 0.33926202541704065
Epoch: 71, step: 58, loss: 0.3516865074634552, mean loss: 0.3392621465334249
Epoch: 71, step: 59, loss: 0.3100210726261139, mean loss: 0.33926186148825305
Epoch: 71, step: 60, loss: 0.33786827325820923, mean loss: 0.3392618479035357
Epoch: 71, step: 61, loss: 0.3066137433052063, mean loss: 0.3392615296524625
Epoch: 71, step: 62, loss: 0.38238653540611267, mean loss: 0.3392619500274199
Epoch: 71, step: 63, loss: 0.33779969811439514, mean loss: 0.33926193577378483
Epoch: 71, step: 64, loss: 0.39555761218070984, mean loss: 0.33926248452342084
Epoch: 71, step: 65, loss: 0.31666019558906555, mean loss: 0.33926226420673367
Epoch: 71, step: 66, loss: 0.3607165515422821, mean loss: 0.3392624733311923
Epoch: 71, step: 67, loss: 0.3301427364349365, mean loss: 0.33926238443793655
Epoch: 71, step: 68, loss: 0.33551153540611267, mean loss: 0.3392623478774594
Epoch: 71, step: 69, loss: 0.31982195377349854, mean loss: 0.3392621583888528
Epoch: 71, step: 70, loss: 0.3325129747390747, mean loss: 0.3392620926041299
Epoch: 71, step: 71, loss: 0.36907950043678284, mean loss: 0.3392623832334705
Epoch: 71, step: 72, loss: 0.3283369839191437, mean loss: 0.3392622767449834
Epoch: 71, step: 73, loss: 0.32670193910598755, mean loss: 0.3392621543221521
Epoch: 71, step: 74, loss: 0.3405516445636749, mean loss: 0.3392621668904056
Epoch: 71, step: 75, loss: 0.32820382714271545, mean loss: 0.33926205910931645
Epoch: 71, step: 76, loss: 0.3295385539531708, mean loss: 0.3392619643392347
Epoch: 71, step: 77, loss: 0.2894570231437683, mean loss: 0.3392614789204203
Epoch: 71, step: 78, loss: 0.36939263343811035, mean loss: 0.3392617725878035
Epoch: 71, step: 79, loss: 0.3147055506706238, mean loss: 0.33926153325773917
Epoch: 71, step: 80, loss: 0.30273520946502686, mean loss: 0.33926117726803307
Epoch: 71, step: 81, loss: 0.35353392362594604, mean loss: 0.3392613163704867
Epoch: 71, step: 82, loss: 0.2886098325252533, mean loss: 0.3392608227249864
Epoch: 71, step: 83, loss: 0.32488396763801575, mean loss: 0.33926068261061826
Epoch: 71, step: 84, loss: 0.2824060022830963, mean loss: 0.33926012852003823
Epoch: 71, step: 85, loss: 0.3547307550907135, mean loss: 0.3392602792911772
Epoch: 71, step: 86, loss: 0.34441760182380676, mean loss: 0.33926032955209007
Epoch: 71, step: 87, loss: 0.36562442779541016, mean loss: 0.33926058648206164
Epoch: 71, step: 88, loss: 0.3311903774738312, mean loss: 0.33926050783501877
Epoch: 71, step: 89, loss: 0.3356238603591919, mean loss: 0.33926047239494744
Epoch: 71, step: 90, loss: 0.30248647928237915, mean loss: 0.33926011402635503
Epoch: 71, step: 91, loss: 0.3307337462902069, mean loss: 0.3392600309363132
Epoch: 71, step: 92, loss: 0.3377196192741394, mean loss: 0.3392600159250415
Epoch: 71, step: 93, loss: 0.3409871459007263, mean loss: 0.33926003275571426
Epoch: 71, step: 94, loss: 0.33779773116111755, mean loss: 0.33926001850590093
Epoch: 71, step: 95, loss: 0.37758514285087585, mean loss: 0.3392603919723241
Epoch: 71, step: 96, loss: 0.301868736743927, mean loss: 0.33926002760581797
Epoch: 71, step: 97, loss: 0.3574059307575226, mean loss: 0.33926020442855725
Epoch: 71, step: 98, loss: 0.32682499289512634, mean loss: 0.3392600832548288
Epoch: 71, step: 99, loss: 0.32717055082321167, mean loss: 0.3392599654506852
Epoch: 71, step: 100, loss: 0.3284090757369995, mean loss: 0.3392598597172897
Epoch: 71, step: 101, loss: 0.3014068901538849, mean loss: 0.33925949087343377
Epoch: 71, step: 102, loss: 0.343023419380188, mean loss: 0.33925952754924527
Epoch: 71, step: 103, loss: 0.32582226395606995, mean loss: 0.3392593966174957
Epoch: 71, step: 104, loss: 0.32261210680007935, mean loss: 0.33925923440905736
Epoch: 71, step: 105, loss: 0.36065560579299927, mean loss: 0.33925944288972953
Epoch: 71, step: 106, loss: 0.31954464316368103, mean loss: 0.3392592507957255
Epoch: 71, step: 107, loss: 0.3468121588230133, mean loss: 0.3392593243878608
Epoch: 71, step: 108, loss: 0.35754650831222534, mean loss: 0.33925950256821136
Epoch: 71, step: 109, loss: 0.3054610788822174, mean loss: 0.3392591732580053
Epoch: 71, step: 110, loss: 0.31554263830184937, mean loss: 0.3392589421815211
Epoch: 71, step: 111, loss: 0.3402796983718872, mean loss: 0.3392589521269222
Epoch: 71, step: 112, loss: 0.3276897370815277, mean loss: 0.33925883940719104
Epoch: 71, step: 113, loss: 0.31206074357032776, mean loss: 0.3392585744166823
Epoch: 71, step: 114, loss: 0.31613653898239136, mean loss: 0.3392583491413441
Epoch: 71, step: 115, loss: 0.3305618464946747, mean loss: 0.33925826441314216
Epoch: 71, step: 116, loss: 0.3235688805580139, mean loss: 0.339258111556254
Epoch: 71, step: 117, loss: 0.3571440577507019, mean loss: 0.3392582858118823
Epoch: 71, step: 118, loss: 0.32410928606987, mean loss: 0.3392581382226678
Epoch: 71, step: 119, loss: 0.33927008509635925, mean loss: 0.33925813833905916
Epoch: 71, step: 120, loss: 0.35061848163604736, mean loss: 0.3392582490151106
Epoch: 71, step: 121, loss: 0.3194642961025238, mean loss: 0.3392580561780501
Epoch: 71, step: 122, loss: 0.31902164220809937, mean loss: 0.3392578590323569
Epoch: 71, step: 123, loss: 0.3679700195789337, mean loss: 0.3392581387471155
Epoch: 71, step: 124, loss: 0.31675058603286743, mean loss: 0.3392579194799749
Epoch: 71, step: 125, loss: 0.34200066328048706, mean loss: 0.3392579461993495
Epoch: 71, step: 126, loss: 0.31125321984291077, mean loss: 0.33925767338441
Epoch: 71, step: 127, loss: 0.32519689202308655, mean loss: 0.3392575364091795
Epoch: 71, step: 128, loss: 0.31754204630851746, mean loss: 0.3392573248665056
Epoch: 71, step: 129, loss: 0.30399662256240845, mean loss: 0.3392569813757278
Epoch: 71, step: 130, loss: 0.3412577509880066, mean loss: 0.3392570008659583
Epoch: 71, step: 131, loss: 0.3236456513404846, mean loss: 0.3392568487915591
Epoch: 71, step: 132, loss: 0.3502713739871979, mean loss: 0.3392569560859978
Epoch: 71, step: 133, loss: 0.29086923599243164, mean loss: 0.3392564847372467
Epoch: 71, step: 134, loss: 0.33447661995887756, mean loss: 0.3392564381766453
Epoch: 71, step: 135, loss: 0.3481459319591522, mean loss: 0.3392565247682465
Epoch: 71, step: 136, loss: 0.2861845791339874, mean loss: 0.33925600780517745
Epoch: 71, step: 137, loss: 0.31289228796958923, mean loss: 0.3392557510040258
Epoch: 71, step: 138, loss: 0.3409205675125122, mean loss: 0.33925576722035017
Epoch: 71, step: 139, loss: 0.32101354002952576, mean loss: 0.3392555895317038
Epoch: 71, step: 140, loss: 0.35695263743400574, mean loss: 0.33925576190834533
Epoch: 71, step: 141, loss: 0.28786417841911316, mean loss: 0.3392552613377232
Epoch: 71, step: 142, loss: 0.30489373207092285, mean loss: 0.33925492664858975
Epoch: 71, step: 143, loss: 0.28968918323516846, mean loss: 0.3392544438716445
Epoch: 71, step: 144, loss: 0.35372063517570496, mean loss: 0.33925458477290293
Epoch: 71, step: 145, loss: 0.30270305275917053, mean loss: 0.33925422876304595
Epoch: 71, step: 146, loss: 0.37284260988235474, mean loss: 0.3392545559087942
Epoch: 71, step: 147, loss: 0.3313272297382355, mean loss: 0.3392544786985892
Epoch: 71, step: 148, loss: 0.34475192427635193, mean loss: 0.33925453224183405
Epoch: 71, step: 149, loss: 0.3005792498588562, mean loss: 0.33925415556144384
Epoch: 71, step: 150, loss: 0.35228973627090454, mean loss: 0.33925428252108064
Epoch: 71, step: 151, loss: 0.3201851546764374, mean loss: 0.3392540967997062
Epoch: 71, step: 152, loss: 0.3378072679042816, mean loss: 0.3392540827086352
Epoch: 71, step: 153, loss: 0.32110652327537537, mean loss: 0.3392539059662032
Epoch: 71, step: 154, loss: 0.30522623658180237, mean loss: 0.3392535745676759
Epoch: 71, step: 155, loss: 0.40631723403930664, mean loss: 0.3392542277003159
Epoch: 71, step: 156, loss: 0.3207923471927643, mean loss: 0.33925404790190616
Epoch: 71, step: 157, loss: 0.32618364691734314, mean loss: 0.33925392061181653
Epoch: 71, step: 158, loss: 0.36392343044281006, mean loss: 0.3392541608610285
Epoch: 71, step: 159, loss: 0.349301278591156, mean loss: 0.33925425870604553
Epoch: 71, step: 160, loss: 0.36657047271728516, mean loss: 0.3392545247255616
Epoch: 71, step: 161, loss: 0.3024980127811432, mean loss: 0.3392541667749944
Epoch: 71, step: 162, loss: 0.3179169297218323, mean loss: 0.3392539589859164
Epoch: 71, step: 163, loss: 0.3453333377838135, mean loss: 0.33925401818834316
Epoch: 71, step: 164, loss: 0.3188057243824005, mean loss: 0.33925381905996715
Epoch: 71, step: 165, loss: 0.289604127407074, mean loss: 0.33925333556895876
Epoch: 71, step: 166, loss: 0.3281141221523285, mean loss: 0.33925322709583633
Epoch: 71, step: 167, loss: 0.33421653509140015, mean loss: 0.33925317804925037
Epoch: 71, step: 168, loss: 0.32464027404785156, mean loss: 0.33925303575226806
Epoch: 71, step: 169, loss: 0.31886613368988037, mean loss: 0.33925283723139965
Epoch: 71, step: 170, loss: 0.3357881009578705, mean loss: 0.33925280349327924
Epoch: 71, step: 171, loss: 0.3042135536670685, mean loss: 0.3392524622993688
Epoch: 71, step: 172, loss: 0.35668888688087463, mean loss: 0.33925263208450934
Epoch: 71, step: 173, loss: 0.3352894186973572, mean loss: 0.3392525934935593
Epoch: 71, step: 174, loss: 0.3590855598449707, mean loss: 0.3392527866109835
Epoch: 71, step: 175, loss: 0.35502323508262634, mean loss: 0.3392529401693912
Epoch: 71, step: 176, loss: 0.314921498298645, mean loss: 0.3392527032540557
Epoch: 71, step: 177, loss: 0.3018147647380829, mean loss: 0.33925233872426547
Epoch: 71, step: 178, loss: 0.36521244049072266, mean loss: 0.33925259149294573
Epoch: 71, step: 179, loss: 0.3174639344215393, mean loss: 0.3392523793429119
Epoch: 71, step: 180, loss: 0.3330164849758148, mean loss: 0.3392523186263512
Epoch: 71, step: 181, loss: 0.3084809184074402, mean loss: 0.33925201901970486
Epoch: 71, step: 182, loss: 0.3289405405521393, mean loss: 0.33925191862266796
Epoch: 71, step: 183, loss: 0.3211159408092499, mean loss: 0.3392517420446233
Epoch: 71, step: 184, loss: 0.3020395040512085, mean loss: 0.3392513797371527
Epoch: 71, step: 185, loss: 0.31790322065353394, mean loss: 0.33925117188826664
Epoch: 71, step: 186, loss: 0.3309375047683716, mean loss: 0.33925109094594186
Epoch: 71, step: 187, loss: 0.3483494222164154, mean loss: 0.33925117952693795
Epoch: 71, step: 188, loss: 0.34551548957824707, mean loss: 0.33925124051542094
Epoch: 71, step: 189, loss: 0.3328770399093628, mean loss: 0.33925117845766245
Epoch: 71, step: 190, loss: 0.31564363837242126, mean loss: 0.3392509486222919
Epoch: 71, step: 191, loss: 0.3362371027469635, mean loss: 0.3392509192807494
Epoch: 71, step: 192, loss: 0.3523733913898468, mean loss: 0.33925104703440373
Epoch: 71, step: 193, loss: 0.31499120593070984, mean loss: 0.33925081085533965
Epoch: 71, step: 194, loss: 0.3061991333961487, mean loss: 0.3392504890874344
Epoch: 71, step: 195, loss: 0.32267993688583374, mean loss: 0.3392503277697533
Epoch: 71, step: 196, loss: 0.33969011902809143, mean loss: 0.33925033205116856
Epoch: 71, step: 197, loss: 0.3733859360218048, mean loss: 0.3392506643617152
Epoch: 71, step: 198, loss: 0.31581395864486694, mean loss: 0.33925043620730266
Epoch: 71, step: 199, loss: 0.3391433656215668, mean loss: 0.33925043516498943
Epoch: 71, step: 200, loss: 0.3037438690662384, mean loss: 0.33925008951820335
Epoch: 71, step: 201, loss: 0.4308423399925232, mean loss: 0.339250981135228
Epoch: 71, step: 202, loss: 0.34679102897644043, mean loss: 0.3392510545341187
Epoch: 71, step: 203, loss: 0.30950021743774414, mean loss: 0.3392507649262504
Epoch: 71, step: 204, loss: 0.3382929861545563, mean loss: 0.33925075560289697
Epoch: 71, step: 205, loss: 0.32977351546287537, mean loss: 0.33925066334902626
Epoch: 71, step: 206, loss: 0.30963048338890076, mean loss: 0.33925037502145267
Epoch: 71, step: 207, loss: 0.3494015336036682, mean loss: 0.33925047383349355
Epoch: 71, step: 208, loss: 0.29290077090263367, mean loss: 0.33925002266684867
Epoch: 71, step: 209, loss: 0.3296003043651581, mean loss: 0.3392499287376889
Epoch: 71, step: 210, loss: 0.33893126249313354, mean loss: 0.3392499256358614
Epoch: 71, step: 211, loss: 0.3057039678096771, mean loss: 0.33924959911002994
Epoch: 71, step: 212, loss: 0.3052961528301239, mean loss: 0.33924926862105054
Epoch: 71, step: 213, loss: 0.3325861990451813, mean loss: 0.33924920376608375
Epoch: 71, step: 214, loss: 0.33378368616104126, mean loss: 0.33924915056800314
Epoch: 71, step: 215, loss: 0.3330147862434387, mean loss: 0.33924908988701885
Epoch: 71, step: 216, loss: 0.34191301465034485, mean loss: 0.33924911581556505
Epoch: 71, step: 217, loss: 0.35102176666259766, mean loss: 0.3392492304001638
Epoch: 71, step: 218, loss: 0.3132968544960022, mean loss: 0.3392489778050877
Epoch: 71, step: 219, loss: 0.35571399331092834, mean loss: 0.33924913805790546
Epoch: 71, step: 220, loss: 0.31769227981567383, mean loss: 0.33924892824858877
Epoch: 71, step: 221, loss: 0.32127389311790466, mean loss: 0.33924875330226356
Epoch: 71, step: 222, loss: 0.32501423358917236, mean loss: 0.3392486147627469
Epoch: 71, step: 223, loss: 0.3308168947696686, mean loss: 0.3392485327006144
Epoch: 71, step: 224, loss: 0.30274659395217896, mean loss: 0.3392481774471448
Epoch: 71, step: 225, loss: 0.31673476099967957, mean loss: 0.33924795833846894
Epoch: 71, step: 226, loss: 0.33190369606018066, mean loss: 0.33924788686215945
Epoch: 71, step: 227, loss: 0.3347843289375305, mean loss: 0.33924784342205194
Epoch: 71, step: 228, loss: 0.37035590410232544, mean loss: 0.3392481461680611
Epoch: 71, step: 229, loss: 0.2973781228065491, mean loss: 0.33924773868977937
Epoch: 71, step: 230, loss: 0.30453118681907654, mean loss: 0.339247400832236
Epoch: 71, step: 231, loss: 0.36331799626350403, mean loss: 0.33924763508225964
Epoch: 71, step: 232, loss: 0.3108222186565399, mean loss: 0.33924735845471676
Epoch: 71, step: 233, loss: 0.32180941104888916, mean loss: 0.3392471887555458
Epoch: 71, step: 234, loss: 0.285398930311203, mean loss: 0.339246664730804
Epoch: 71, step: 235, loss: 0.3046443462371826, mean loss: 0.33924632800135196
Epoch: 71, step: 236, loss: 0.3449832499027252, mean loss: 0.33924638382916505
Epoch: 71, step: 237, loss: 0.34081506729125977, mean loss: 0.3392463990943746
Epoch: 71, step: 238, loss: 0.3298948109149933, mean loss: 0.33924630809286455
Epoch: 71, step: 239, loss: 0.3153068423271179, mean loss: 0.3392460751371041
Epoch: 71, step: 240, loss: 0.33434250950813293, mean loss: 0.3392460274208035
Epoch: 71, step: 241, loss: 0.2948809862136841, mean loss: 0.33924559571147156
Epoch: 71, step: 242, loss: 0.3620469272136688, mean loss: 0.33924581758553135
Epoch: 71, step: 243, loss: 0.36778393387794495, mean loss: 0.3392460952801084
Epoch: 71, step: 244, loss: 0.34654077887535095, mean loss: 0.3392461662614704
Epoch: 71, step: 245, loss: 0.32317492365837097, mean loss: 0.33924600988078923
Epoch: 71, step: 246, loss: 0.3588593602180481, mean loss: 0.33924620072597256
Epoch: 71, step: 247, loss: 0.33260130882263184, mean loss: 0.3392461360693355
Epoch: 71, step: 248, loss: 0.3125162720680237, mean loss: 0.3392458759828926
Epoch: 71, step: 249, loss: 0.32910656929016113, mean loss: 0.33924577732655253
Epoch: 71, step: 250, loss: 0.31305786967277527, mean loss: 0.3392455225184022
Epoch: 71, step: 251, loss: 0.33594244718551636, mean loss: 0.339245490379816
Epoch: 71, step: 252, loss: 0.28646260499954224, mean loss: 0.3392449768127204
Epoch: 71, step: 253, loss: 0.365418940782547, mean loss: 0.3392452314777652
Epoch: 71, step: 254, loss: 0.3787163197994232, mean loss: 0.33924561551621973
Epoch: 71, step: 255, loss: 0.32509878277778625, mean loss: 0.3392454778743367
Epoch: 71, step: 256, loss: 0.3475008010864258, mean loss: 0.33924555819388225
Epoch: 71, step: 257, loss: 0.3601120710372925, mean loss: 0.33924576121107247
Epoch: 71, step: 258, loss: 0.36815106868743896, mean loss: 0.33924604243761264
Epoch: 71, step: 259, loss: 0.32014888525009155, mean loss: 0.33924585663868295
Epoch: 71, step: 260, loss: 0.33144402503967285, mean loss: 0.3392457807343039
Epoch: 71, step: 261, loss: 0.35359716415405273, mean loss: 0.3392459203582159
Epoch: 71, step: 262, loss: 0.31165650486946106, mean loss: 0.33924565194474443
Epoch: 71, step: 263, loss: 0.32532599568367004, mean loss: 0.33924551652372
Epoch: 71, step: 264, loss: 0.3224965035915375, mean loss: 0.3392453535781428
Epoch: 71, step: 265, loss: 0.3970455527305603, mean loss: 0.33924591589158914
Epoch: 71, step: 266, loss: 0.36460721492767334, mean loss: 0.33924616261843327
Epoch: 71, step: 267, loss: 0.34941765666007996, mean loss: 0.33924626157062837
Epoch: 71, step: 268, loss: 0.30982112884521484, mean loss: 0.33924597531443657
Epoch: 71, step: 269, loss: 0.33550596237182617, mean loss: 0.33924593893086413
Epoch: 71, step: 270, loss: 0.32587870955467224, mean loss: 0.33924580889312517
Epoch: 71, step: 271, loss: 0.333749383687973, mean loss: 0.3392457554238734
Epoch: 71, step: 272, loss: 0.38261929154396057, mean loss: 0.33924617735774426
Epoch: 71, step: 273, loss: 0.3479442894458771, mean loss: 0.33924626197137575
Epoch: 71, step: 274, loss: 0.32373446226119995, mean loss: 0.3392461110769146
Epoch: 71, step: 275, loss: 0.33906030654907227, mean loss: 0.33924610926947757
Epoch: 71, step: 276, loss: 0.33126652240753174, mean loss: 0.3392460316477924
Epoch: 71, step: 277, loss: 0.30348700284957886, mean loss: 0.3392456838040851
Epoch: 71, step: 278, loss: 0.3513651490211487, mean loss: 0.33924580169427526
Epoch: 71, step: 279, loss: 0.2862664461135864, mean loss: 0.3392452863509464
Epoch: 71, step: 280, loss: 0.364628404378891, mean loss: 0.3392455332564279
Epoch: 71, step: 281, loss: 0.3136977553367615, mean loss: 0.33924528475169163
Epoch: 71, step: 282, loss: 0.34765833616256714, mean loss: 0.3392453665851408
Epoch: 71, step: 283, loss: 0.37861889600753784, mean loss: 0.3392457495663234
Epoch: 71, step: 284, loss: 0.33717241883277893, mean loss: 0.3392457293995021
Epoch: 71, step: 285, loss: 0.3411722481250763, mean loss: 0.3392457481381338
Epoch: 71, step: 286, loss: 0.33786001801490784, mean loss: 0.33924573465971103
Epoch: 71, step: 287, loss: 0.3876359760761261, mean loss: 0.3392462053269621
Epoch: 71, step: 288, loss: 0.3461613953113556, mean loss: 0.33924627258684154
Epoch: 71, step: 289, loss: 0.3277156949043274, mean loss: 0.3392461604369623
Epoch: 71, step: 290, loss: 0.30423495173454285, mean loss: 0.33924581991068986
Epoch: 71, step: 291, loss: 0.3713100552558899, mean loss: 0.3392461317710554
Epoch: 71, step: 292, loss: 0.35219606757164, mean loss: 0.339246257722365
Epoch: 71, step: 293, loss: 0.37086349725723267, mean loss: 0.33924656522921726
Epoch: 71, step: 294, loss: 0.3487246036529541, mean loss: 0.33924665741099713
Epoch: 71, step: 295, loss: 0.3036433160305023, mean loss: 0.3392463111423589
Epoch: 71, step: 296, loss: 0.33014675974845886, mean loss: 0.3392462226434006
Epoch: 71, step: 297, loss: 0.33235418796539307, mean loss: 0.3392461556146064
Epoch: 71, step: 298, loss: 0.33355993032455444, mean loss: 0.33924610031350366
Epoch: 71, step: 299, loss: 0.33004823327064514, mean loss: 0.3392460108609727
Epoch: 71, step: 300, loss: 0.3176025450229645, mean loss: 0.3392458003726106
Epoch: 71, step: 301, loss: 0.31870222091674805, mean loss: 0.339245600582874
Epoch: 71, step: 302, loss: 0.3102746903896332, mean loss: 0.3392453188386804
Epoch: 71, step: 303, loss: 0.32122671604156494, mean loss: 0.33924514360817126
Epoch: 71, step: 304, loss: 0.33081814646720886, mean loss: 0.33924506165660956
Epoch: 71, step: 305, loss: 0.333890825510025, mean loss: 0.3392450095877955
Epoch: 71, step: 306, loss: 0.3554244041442871, mean loss: 0.3392451669274553
Epoch: 71, step: 307, loss: 0.3413185775279999, mean loss: 0.3392451870905427
Epoch: 71, step: 308, loss: 0.3550633490085602, mean loss: 0.33924534091433384
Epoch: 71, step: 309, loss: 0.3149658739566803, mean loss: 0.33924510481083736
Epoch: 71, step: 310, loss: 0.3291231095790863, mean loss: 0.3392450063813607
Epoch: 71, step: 311, loss: 0.31919142603874207, mean loss: 0.3392448113759118
Epoch: 71, step: 312, loss: 0.300394207239151, mean loss: 0.3392444335877214
Epoch: 71, step: 313, loss: 0.32619693875312805, mean loss: 0.33924430671346445
Epoch: 71, step: 314, loss: 0.30452460050582886, mean loss: 0.3392439691012142
Epoch: 71, step: 315, loss: 0.3374611437320709, mean loss: 0.3392439517653004
Epoch: 71, step: 316, loss: 0.3207637071609497, mean loss: 0.3392437720680532
Epoch: 71, step: 317, loss: 0.32519590854644775, mean loss: 0.3392436354714922
Epoch: 71, step: 318, loss: 0.31574568152427673, mean loss: 0.3392434069877457
Epoch: 71, step: 319, loss: 0.3233185112476349, mean loss: 0.33924325214258466
Epoch: 71, step: 320, loss: 0.3266024887561798, mean loss: 0.33924312923176364
Epoch: 71, step: 321, loss: 0.32448461651802063, mean loss: 0.3392429857306774
Epoch: 71, step: 322, loss: 0.3073105216026306, mean loss: 0.33924267524554774
Epoch: 71, step: 323, loss: 0.3220692574977875, mean loss: 0.33924250826692154
Epoch: 71, step: 324, loss: 0.3512097895145416, mean loss: 0.3392426246247009
Epoch: 71, step: 325, loss: 0.3505611717700958, mean loss: 0.33924273467377375
Epoch: 71, step: 326, loss: 0.3599294424057007, mean loss: 0.33924293580655546
Epoch: 71, step: 327, loss: 0.3432857394218445, mean loss: 0.33924297511355594
Epoch: 71, step: 328, loss: 0.3522680699825287, mean loss: 0.33924310175152345
Epoch: 71, step: 329, loss: 0.35207870602607727, mean loss: 0.3392432265459337
Epoch: 71, step: 330, loss: 0.29278939962387085, mean loss: 0.33924277490209603
Epoch: 71, step: 331, loss: 0.31372714042663574, mean loss: 0.3392425268306712
Epoch: 71, step: 332, loss: 0.28742650151252747, mean loss: 0.3392420230630587
Epoch: 71, step: 333, loss: 0.32330530881881714, mean loss: 0.3392418681240725
Epoch: 71, step: 334, loss: 0.3001532256603241, mean loss: 0.33924148810246557
Epoch: 71, step: 335, loss: 0.3221327066421509, mean loss: 0.33924132177171057
Epoch: 71, step: 336, loss: 0.3507068455219269, mean loss: 0.3392414332379004
Epoch: 71, step: 337, loss: 0.34333816170692444, mean loss: 0.3392414730653242
Epoch: 71, step: 338, loss: 0.31726211309432983, mean loss: 0.3392412593892699
Epoch: 71, step: 339, loss: 0.30580461025238037, mean loss: 0.3392409343324071
Epoch: 71, step: 340, loss: 0.349220335483551, mean loss: 0.3392410313469519
Epoch: 71, step: 341, loss: 0.34698617458343506, mean loss: 0.33924110664047197
Epoch: 71, step: 342, loss: 0.38789355754852295, mean loss: 0.33924157960508555
Epoch: 71, step: 343, loss: 0.3492661118507385, mean loss: 0.33924167705552927
Epoch: 71, step: 344, loss: 0.3133887052536011, mean loss: 0.33924142573616384
Epoch: 71, step: 345, loss: 0.3013363480567932, mean loss: 0.33924105726063475
Epoch: 71, step: 346, loss: 0.3511451780796051, mean loss: 0.3392411729795528
Epoch: 71, step: 347, loss: 0.3034461438655853, mean loss: 0.33924082502258573
Epoch: 71, step: 348, loss: 0.33746716380119324, mean loss: 0.3392408077813152
Epoch: 71, step: 349, loss: 0.32471150159835815, mean loss: 0.33924066654731844
Epoch: 71, step: 350, loss: 0.3399864137172699, mean loss: 0.3392406737963796
Epoch: 71, step: 351, loss: 0.32692670822143555, mean loss: 0.33924055409921433
Epoch: 71, step: 352, loss: 0.3170066177845001, mean loss: 0.33924033797766806
Epoch: 71, step: 353, loss: 0.3691387474536896, mean loss: 0.3392406285977178
Epoch: 71, step: 354, loss: 0.30318018794059753, mean loss: 0.33924027808458435
Epoch: 71, step: 355, loss: 0.4141852855682373, mean loss: 0.3392410065547193
Epoch: 71, step: 356, loss: 0.29302117228507996, mean loss: 0.3392405572994217
Epoch: 71, step: 357, loss: 0.35327571630477905, mean loss: 0.3392406937193883
Epoch: 71, step: 358, loss: 0.3234163522720337, mean loss: 0.33924053991029013
Epoch: 71, step: 359, loss: 0.3068619668483734, mean loss: 0.33924022520078173
Epoch: 71, step: 360, loss: 0.36160388588905334, mean loss: 0.3392404425663908
Epoch: 71, step: 361, loss: 0.3592860698699951, mean loss: 0.33924063739977245
Epoch: 71, step: 362, loss: 0.3321785628795624, mean loss: 0.339240568760639
Epoch: 71, step: 363, loss: 0.3427405059337616, mean loss: 0.3392406027776009
Epoch: 71, step: 364, loss: 0.335208535194397, mean loss: 0.3392405635890814
Epoch: 71, step: 365, loss: 0.33251819014549255, mean loss: 0.33924049825354397
Epoch: 71, step: 366, loss: 0.303727924823761, mean loss: 0.33924015310602446
Epoch: 71, step: 367, loss: 0.3150605261325836, mean loss: 0.33923991810595666
Epoch: 71, step: 368, loss: 0.35270339250564575, mean loss: 0.33924004895523113
Epoch: 71, step: 369, loss: 0.33355095982551575, mean loss: 0.3392399936644549
Epoch: 71, step: 370, loss: 0.35336026549339294, mean loss: 0.3392401308943672
Epoch: 71, step: 371, loss: 0.3691830635070801, mean loss: 0.339240421896278
Epoch: 71, step: 372, loss: 0.290854275226593, mean loss: 0.3392399516576251
Epoch: 71, step: 373, loss: 0.3249143362045288, mean loss: 0.33923981243611007
Epoch: 71, step: 374, loss: 0.3097599744796753, mean loss: 0.3392395259431611
Epoch: 71, step: 375, loss: 0.32605886459350586, mean loss: 0.33923939785121404
Epoch: 71, step: 376, loss: 0.335143119096756, mean loss: 0.3392393580432554
Epoch: 71, step: 377, loss: 0.3239782750606537, mean loss: 0.33923920973629357
Epoch: 71, step: 378, loss: 0.32666656374931335, mean loss: 0.3392390875567071
Epoch: 71, step: 379, loss: 0.3230866491794586, mean loss: 0.33923893059061855
Epoch: 71, step: 380, loss: 0.30613377690315247, mean loss: 0.33923860888464036
Epoch: 71, step: 381, loss: 0.3476788401603699, mean loss: 0.33923869090348546
Epoch: 71, step: 382, loss: 0.32341915369033813, mean loss: 0.3392385371769439
Epoch: 71, step: 383, loss: 0.32156842947006226, mean loss: 0.33923836546913005
Epoch: 71, step: 384, loss: 0.3855958878993988, mean loss: 0.3392388159401523
Epoch: 71, step: 385, loss: 0.34045740962028503, mean loss: 0.3392388277815057
Epoch: 71, step: 386, loss: 0.31624695658683777, mean loss: 0.3392386043664073
Epoch: 71, step: 387, loss: 0.3267679214477539, mean loss: 0.33923848318828503
Epoch: 71, step: 388, loss: 0.3347187340259552, mean loss: 0.3392384392701293
Epoch: 71, step: 389, loss: 0.3503641188144684, mean loss: 0.3392385473766993
Epoch: 71, step: 390, loss: 0.3144650161266327, mean loss: 0.3392383066583273
Epoch: 71, step: 391, loss: 0.29097023606300354, mean loss: 0.33923783765379356
Epoch: 71, step: 392, loss: 0.32756003737449646, mean loss: 0.33923772418565634
Epoch: 71, step: 393, loss: 0.32628658413887024, mean loss: 0.3392375983462498
Epoch: 71, step: 394, loss: 0.32851341366767883, mean loss: 0.33923749414600807
Epoch: 71, step: 395, loss: 0.31934666633605957, mean loss: 0.3392373008810663
Epoch: 71, step: 396, loss: 0.3377218246459961, mean loss: 0.33923728615641113
Epoch: 71, step: 397, loss: 0.36096274852752686, mean loss: 0.33923749724308233
Epoch: 71, step: 398, loss: 0.36039310693740845, mean loss: 0.33923770279101323
Epoch: 71, step: 399, loss: 0.3003910779953003, mean loss: 0.339237325360824
Epoch: 71, step: 400, loss: 0.35794445872306824, mean loss: 0.3392375071158239
Epoch: 71, step: 401, loss: 0.3450773060321808, mean loss: 0.3392375638536639
Epoch: 71, step: 402, loss: 0.37474575638771057, mean loss: 0.3392379088379006
Epoch: 71, step: 403, loss: 0.3072569668292999, mean loss: 0.3392375981261214
Epoch: 71, step: 404, loss: 0.3380645215511322, mean loss: 0.3392375867291723
Epoch: 71, step: 405, loss: 0.28694838285446167, mean loss: 0.339237078721751
Epoch: 71, step: 406, loss: 0.32488909363746643, mean loss: 0.3392369393275444
Epoch: 71, step: 407, loss: 0.3355002701282501, mean loss: 0.33923690302523607
Epoch: 71, step: 408, loss: 0.319024920463562, mean loss: 0.339236706664666
Epoch: 71, step: 409, loss: 0.34748634696006775, mean loss: 0.3392367868096161
Epoch: 71, step: 410, loss: 0.34278541803359985, mean loss: 0.3392368212841022
Epoch: 71, step: 411, loss: 0.30528250336647034, mean loss: 0.33923649142556955
Epoch: 71, step: 412, loss: 0.3527381420135498, mean loss: 0.3392366225897825
Epoch: 71, step: 413, loss: 0.30006083846092224, mean loss: 0.3392362420132789
Epoch: 71, step: 414, loss: 0.31891319155693054, mean loss: 0.33923604458518597
Epoch: 71, step: 415, loss: 0.3357054889202118, mean loss: 0.3392360102879675
Epoch: 71, step: 416, loss: 0.3276806175708771, mean loss: 0.33923589803538867
Epoch: 71, step: 417, loss: 0.37440863251686096, mean loss: 0.33923623971064737
Epoch: 71, step: 418, loss: 0.3229609429836273, mean loss: 0.3392360816105655
Epoch: 71, step: 419, loss: 0.3318725824356079, mean loss: 0.3392360100813926
Epoch: 71, step: 420, loss: 0.3284977078437805, mean loss: 0.33923590577033097
Epoch: 71, step: 421, loss: 0.3506876528263092, mean loss: 0.3392360170106614
Epoch: 71, step: 422, loss: 0.31809261441230774, mean loss: 0.33923581162922634
Epoch: 71, step: 423, loss: 0.3313182294368744, mean loss: 0.3392357347206687
Epoch: 71, step: 424, loss: 0.3881915807723999, mean loss: 0.33923621025560396
Epoch: 71, step: 425, loss: 0.30678460001945496, mean loss: 0.33923589503840884
Epoch: 71, step: 426, loss: 0.34509697556495667, mean loss: 0.3392359519691868
Epoch: 71, step: 427, loss: 0.34249135851860046, mean loss: 0.3392359835898115
Epoch: 71, step: 428, loss: 0.31266066431999207, mean loss: 0.3392357254592153
Epoch: 71, step: 429, loss: 0.367715448141098, mean loss: 0.33923600208491883
Epoch: 71, step: 430, loss: 0.3249080777168274, mean loss: 0.33923586291805596
Epoch: 71, step: 431, loss: 0.3262821137905121, mean loss: 0.3392357370997537
Epoch: 71, step: 432, loss: 0.32857879996299744, mean loss: 0.33923563359113224
Epoch: 71, step: 433, loss: 0.28021931648254395, mean loss: 0.33923506038344453
Epoch: 71, step: 434, loss: 0.3038599193096161, mean loss: 0.3392347167987062
Epoch: 71, step: 435, loss: 0.3092631995677948, mean loss: 0.339234425700054
Epoch: 71, step: 436, loss: 0.3503231704235077, mean loss: 0.3392345333985488
Epoch: 71, step: 437, loss: 0.3331744968891144, mean loss: 0.33923447454152866
Epoch: 71, step: 438, loss: 0.374798059463501, mean loss: 0.3392348199431285
Epoch: 71, step: 439, loss: 0.36855843663215637, mean loss: 0.3392351047379761
Epoch: 71, step: 440, loss: 0.33553993701934814, mean loss: 0.33923506885036653
Epoch: 71, step: 441, loss: 0.3198244869709015, mean loss: 0.33923488033588717
Epoch: 71, step: 442, loss: 0.3369966447353363, mean loss: 0.33923485859848
Epoch: 71, step: 443, loss: 0.317974328994751, mean loss: 0.339234652121423
Epoch: 71, step: 444, loss: 0.3507698178291321, mean loss: 0.3392347641470395
Epoch: 71, step: 445, loss: 0.32148370146751404, mean loss: 0.3392345917564143
Epoch: 71, step: 446, loss: 0.3476007878780365, mean loss: 0.33923467300449506
Epoch: 71, step: 447, loss: 0.3463095724582672, mean loss: 0.3392347417115169
Epoch: 71, step: 448, loss: 0.3336140513420105, mean loss: 0.339234687127399
Epoch: 71, step: 449, loss: 0.3176902234554291, mean loss: 0.3392344779050354
Epoch: 71, step: 450, loss: 0.3264729678630829, mean loss: 0.3392343539768
Epoch: 71, step: 451, loss: 0.3291528522968292, mean loss: 0.3392342560753309
Epoch: 71, step: 452, loss: 0.31891369819641113, mean loss: 0.339234058744297
Epoch: 71, step: 453, loss: 0.39377903938293457, mean loss: 0.33923458842035054
Epoch: 71, step: 454, loss: 0.3093724548816681, mean loss: 0.3392342984376012
Epoch: 71, step: 455, loss: 0.35245007276535034, mean loss: 0.33923442677100896
Epoch: 71, step: 456, loss: 0.3400769829750061, mean loss: 0.3392344349526755
Epoch: 71, step: 457, loss: 0.29768404364585876, mean loss: 0.33923403148030845
Epoch: 71, step: 458, loss: 0.3239090144634247, mean loss: 0.3392338826691744
Epoch: 71, step: 459, loss: 0.34577882289886475, mean loss: 0.33923394622215575
Epoch: 71, step: 460, loss: 0.34225714206695557, mean loss: 0.3392339755778468
Epoch: 71, step: 461, loss: 0.308976411819458, mean loss: 0.3392336817751575
Epoch: 71, step: 462, loss: 0.33411163091659546, mean loss: 0.33923363204023116
Epoch: 71, step: 463, loss: 0.3314509391784668, mean loss: 0.33923355647130216
Epoch: 71, step: 464, loss: 0.2983454465866089, mean loss: 0.3392331594569619
Epoch: 71, step: 465, loss: 0.32347428798675537, mean loss: 0.3392330064433541
Epoch: 71, step: 466, loss: 0.30938661098480225, mean loss: 0.3392327166472024
Epoch: 71, step: 467, loss: 0.3507337272167206, mean loss: 0.3392328283161725
Epoch: 71, step: 468, loss: 0.3024682104587555, mean loss: 0.3392324713538755
Epoch: 71, step: 469, loss: 0.3494443893432617, mean loss: 0.33923257050448613
Epoch: 71, step: 470, loss: 0.3395618498325348, mean loss: 0.339232573701528
Epoch: 71, step: 471, loss: 0.32204049825668335, mean loss: 0.3392324067816918
Epoch: 71, step: 472, loss: 0.32828861474990845, mean loss: 0.339232300528189
Epoch: 71, step: 473, loss: 0.31820210814476013, mean loss: 0.3392320963475992
Epoch: 71, step: 474, loss: 0.36601048707962036, mean loss: 0.3392323563344994
Epoch: 71, step: 475, loss: 0.3333529233932495, mean loss: 0.33923229925262616
Epoch: 71, step: 476, loss: 0.31994208693504333, mean loss: 0.3392321119708297
Epoch: 71, step: 477, loss: 0.3683922290802002, mean loss: 0.33923239507326564
Epoch: 71, step: 478, loss: 0.3473941385746002, mean loss: 0.3392324743111859
Epoch: 71, step: 479, loss: 0.3479807376861572, mean loss: 0.33923255924248347
Epoch: 71, step: 480, loss: 0.30547094345092773, mean loss: 0.3392322314757169
Epoch: 71, step: 481, loss: 0.308204710483551, mean loss: 0.3392319302551958
Epoch: 71, step: 482, loss: 0.33267781138420105, mean loss: 0.339231866627298
Epoch: 71, step: 483, loss: 0.33615532517433167, mean loss: 0.33923183676028323
Epoch: 71, step: 484, loss: 0.41348421573638916, mean loss: 0.33923255759418103
Epoch: 71, step: 485, loss: 0.37446510791778564, mean loss: 0.3392328996245696
Epoch: 71, step: 486, loss: 0.30437445640563965, mean loss: 0.33923256122922135
Epoch: 71, step: 487, loss: 0.33052709698677063, mean loss: 0.3392324767199968
Epoch: 71, step: 488, loss: 0.37339019775390625, mean loss: 0.3392328083065056
Epoch: 71, step: 489, loss: 0.33121055364608765, mean loss: 0.339232730431123
Epoch: 71, step: 490, loss: 0.3196695148944855, mean loss: 0.33923254052464785
Epoch: 71, step: 491, loss: 0.3502512276172638, mean loss: 0.33923264748557713
Epoch: 71, step: 492, loss: 0.3732004165649414, mean loss: 0.33923297721532153
Epoch: 71, step: 493, loss: 0.32042166590690613, mean loss: 0.3392327946131422
Epoch: 71, step: 494, loss: 0.344856321811676, mean loss: 0.3392328492004241
Epoch: 71, step: 495, loss: 0.394724577665329, mean loss: 0.3392333878504772
Epoch: 71, step: 496, loss: 0.33237382769584656, mean loss: 0.33923332126638117
Epoch: 71, step: 497, loss: 0.3259037435054779, mean loss: 0.33923319188064066
Epoch: 71, step: 498, loss: 0.31193724274635315, mean loss: 0.3392329269305894
Epoch: 71, step: 499, loss: 0.34109050035476685, mean loss: 0.33923294496108153
Epoch: 71, step: 500, loss: 0.31198135018348694, mean loss: 0.33923268044669397
Epoch: 71, step: 501, loss: 0.3226950466632843, mean loss: 0.339232519927662
Epoch: 71, step: 502, loss: 0.295694500207901, mean loss: 0.33923209733921705
Epoch: 71, step: 503, loss: 0.3337715268135071, mean loss: 0.3392320443383772
Epoch: 71, step: 504, loss: 0.33312079310417175, mean loss: 0.33923198502254154
Epoch: 71, step: 505, loss: 0.35634106397628784, mean loss: 0.33923215108173743
Epoch: 71, step: 506, loss: 0.34204649925231934, mean loss: 0.33923217839728487
Epoch: 71, step: 507, loss: 0.3614404499530792, mean loss: 0.33923239394460564
Epoch: 71, step: 508, loss: 0.3340979516506195, mean loss: 0.33923234411161723
Epoch: 71, step: 509, loss: 0.3563116788864136, mean loss: 0.3392325098756832
Epoch: 71, step: 510, loss: 0.33946651220321655, mean loss: 0.33923251214677874
Epoch: 71, step: 511, loss: 0.3073469400405884, mean loss: 0.33923220268627846
Epoch: 71, step: 512, loss: 0.3146388828754425, mean loss: 0.3392319640019242
Epoch: 71, step: 513, loss: 0.33036330342292786, mean loss: 0.33923187793017806
Epoch: 71, step: 514, loss: 0.3748369812965393, mean loss: 0.339232223479954
Epoch: 71, step: 515, loss: 0.33775943517684937, mean loss: 0.33923220918658925
Epoch: 71, step: 516, loss: 0.33136433362960815, mean loss: 0.3392321328298424
Epoch: 71, step: 517, loss: 0.33232739567756653, mean loss: 0.3392320658208834
Epoch: 71, step: 518, loss: 0.33802300691604614, mean loss: 0.3392320540873459
Epoch: 71, step: 519, loss: 0.3242321014404297, mean loss: 0.33923190851892226
Epoch: 71, step: 520, loss: 0.31902846693992615, mean loss: 0.33923171245466316
Epoch: 71, step: 521, loss: 0.3690716028213501, mean loss: 0.33923200203301035
Epoch: 71, step: 522, loss: 0.381602942943573, mean loss: 0.33923241321374253
Epoch: 71, step: 523, loss: 0.3422504961490631, mean loss: 0.3392324425018698
Epoch: 71, step: 524, loss: 0.3221159279346466, mean loss: 0.3392322764011355
Epoch: 71, step: 525, loss: 0.43495872616767883, mean loss: 0.33923320533320506
Epoch: 71, step: 526, loss: 0.2743634283542633, mean loss: 0.3392325758412353
Epoch: 71, step: 527, loss: 0.3229135572910309, mean loss: 0.33923241748410926
Epoch: 71, step: 528, loss: 0.29931479692459106, mean loss: 0.33923203013371134
Epoch: 71, step: 529, loss: 0.3138144910335541, mean loss: 0.339231783490795
Epoch: 71, step: 530, loss: 0.35260069370269775, mean loss: 0.33923191321676865
Epoch: 71, step: 531, loss: 0.369620680809021, mean loss: 0.3392322080930261
Epoch: 71, step: 532, loss: 0.3560805320739746, mean loss: 0.33923237157851455
Epoch: 71, step: 533, loss: 0.3473142385482788, mean loss: 0.33923244999908325
Epoch: 71, step: 534, loss: 0.3190333843231201, mean loss: 0.3392322540039186
Epoch: 71, step: 535, loss: 0.3533863127231598, mean loss: 0.33923239134196165
Epoch: 71, step: 536, loss: 0.2896784245967865, mean loss: 0.33923191052024687
Epoch: 71, step: 537, loss: 0.2926025092601776, mean loss: 0.33923145807995597
Epoch: 71, step: 538, loss: 0.32383161783218384, mean loss: 0.33923130865833767
Epoch: 71, step: 539, loss: 0.34545353055000305, mean loss: 0.339231369030746
Epoch: 71, step: 540, loss: 0.32423511147499084, mean loss: 0.3392312235278347
Epoch: 71, step: 541, loss: 0.3610686957836151, mean loss: 0.33923143540636164
Epoch: 71, step: 542, loss: 0.2845967710018158, mean loss: 0.3392309053175417
Epoch: 71, step: 543, loss: 0.32798126339912415, mean loss: 0.33923079616977597
Epoch: 71, step: 544, loss: 0.3057822287082672, mean loss: 0.33923047164380343
Epoch: 71, step: 545, loss: 0.30174514651298523, mean loss: 0.33923010795577463
Epoch: 71, step: 546, loss: 0.3482784628868103, mean loss: 0.339230195743367
Epoch: 71, step: 547, loss: 0.31791794300079346, mean loss: 0.33922998897283047
Epoch: 71, step: 548, loss: 0.3023452162742615, mean loss: 0.33922963112186366
Epoch: 71, step: 549, loss: 0.334492564201355, mean loss: 0.33922958516394097
Epoch: 71, step: 550, loss: 0.3269476294517517, mean loss: 0.33922946600841625
Epoch: 71, step: 551, loss: 0.2918892204761505, mean loss: 0.3392290067332646
Epoch: 71, step: 552, loss: 0.3085242509841919, mean loss: 0.33922870885152817
Epoch: 71, step: 553, loss: 0.35440999269485474, mean loss: 0.3392288561311013
Epoch: 71, step: 554, loss: 0.3171650767326355, mean loss: 0.33922864208382303
Epoch: 71, step: 555, loss: 0.3207246959209442, mean loss: 0.3392284625732859
Epoch: 71, step: 556, loss: 0.3027495741844177, mean loss: 0.33922810868761943
Epoch: 71, step: 557, loss: 0.3428696393966675, mean loss: 0.33922814401416246
Epoch: 71, step: 558, loss: 0.3337477743625641, mean loss: 0.33922809084953154
Epoch: 71, step: 559, loss: 0.3254842758178711, mean loss: 0.3392279575231663
Epoch: 71, step: 560, loss: 0.3386370539665222, mean loss: 0.33922795179096904
Epoch: 71, step: 561, loss: 0.3357583284378052, mean loss: 0.33922791813340786
Epoch: 71, step: 562, loss: 0.29055649042129517, mean loss: 0.339227445994072
Epoch: 71, step: 563, loss: 0.3643149435520172, mean loss: 0.3392276893540902
Epoch: 71, step: 564, loss: 0.3428945243358612, mean loss: 0.3392277249236949
Epoch: 71, step: 565, loss: 0.30058765411376953, mean loss: 0.33922735010488797
Epoch: 71, step: 566, loss: 0.3457587957382202, mean loss: 0.33922741346100665
Epoch: 71, step: 567, loss: 0.32854416966438293, mean loss: 0.33922730983275423
Epoch: 71, step: 568, loss: 0.37578442692756653, mean loss: 0.3392276644360454
Epoch: 71, step: 569, loss: 0.3418501317501068, mean loss: 0.3392276898736782
Epoch: 71, step: 570, loss: 0.3120756447315216, mean loss: 0.3392274265045027
Epoch: 71, step: 571, loss: 0.3502214252948761, mean loss: 0.3392275331429639
Epoch: 71, step: 572, loss: 0.3127499222755432, mean loss: 0.33922727632064253
Epoch: 71, step: 573, loss: 0.3287889063358307, mean loss: 0.3392271750735768
Epoch: 71, step: 574, loss: 0.3059992492198944, mean loss: 0.3392268527821302
Epoch: 71, step: 575, loss: 0.3004544675350189, mean loss: 0.33922647671631795
Epoch: 71, step: 576, loss: 0.31207388639450073, mean loss: 0.33922621335718156
Epoch: 71, step: 577, loss: 0.34357044100761414, mean loss: 0.33922625549242286
Epoch: 71, step: 578, loss: 0.2994747757911682, mean loss: 0.33922586994127785
Epoch: 71, step: 579, loss: 0.3653506338596344, mean loss: 0.3392261233239198
Epoch: 71, step: 580, loss: 0.3066578805446625, mean loss: 0.339225807449396
Epoch: 71, step: 581, loss: 0.30702096223831177, mean loss: 0.3392254951024403
Epoch: 71, step: 582, loss: 0.32107025384902954, mean loss: 0.3392253190208818
Epoch: 71, step: 583, loss: 0.3639809489250183, mean loss: 0.339225559115054
Epoch: 71, step: 584, loss: 0.3063262701034546, mean loss: 0.3392252400421407
Epoch: 71, step: 585, loss: 0.30538031458854675, mean loss: 0.3392249118011801
Epoch: 71, step: 586, loss: 0.3638589084148407, mean loss: 0.33922515070873227
Epoch: 71, step: 587, loss: 0.34387317299842834, mean loss: 0.33922519578614607
Epoch: 71, step: 588, loss: 0.30516478419303894, mean loss: 0.33922486546492964
Epoch: 71, step: 589, loss: 0.32383930683135986, mean loss: 0.33922471625571815
Epoch: 71, step: 590, loss: 0.333161860704422, mean loss: 0.33922465745869007
Epoch: 71, step: 591, loss: 0.3874583840370178, mean loss: 0.3392251252204979
Epoch: 71, step: 592, loss: 0.35973912477493286, mean loss: 0.3392253241595628
Epoch: 71, step: 593, loss: 0.3640029728412628, mean loss: 0.33922556444398144
Epoch: 71, step: 594, loss: 0.322507381439209, mean loss: 0.33922540231883475
Epoch: 71, step: 595, loss: 0.3284112215042114, mean loss: 0.3392252974489665
Epoch: 71, step: 596, loss: 0.38409438729286194, mean loss: 0.3392257325600481
Epoch: 71, step: 597, loss: 0.30919989943504333, mean loss: 0.33922544139198385
Epoch: 71, step: 598, loss: 0.3310002088546753, mean loss: 0.3392253616306063
Epoch: 71, step: 599, loss: 0.3205433785915375, mean loss: 0.33922518047022615
Epoch: 71, step: 600, loss: 0.30356651544570923, mean loss: 0.339224834689232
Epoch: 71, step: 601, loss: 0.3463962972164154, mean loss: 0.33922490423001245
Epoch: 71, step: 602, loss: 0.3101678788661957, mean loss: 0.33922462247038243
Epoch: 71, step: 603, loss: 0.3322848677635193, mean loss: 0.33922455517774897
Epoch: 71, step: 604, loss: 0.3245111405849457, mean loss: 0.3392244125077474
Epoch: 71, step: 605, loss: 0.32894977927207947, mean loss: 0.3392243128797707
Epoch: 71, step: 606, loss: 0.31317687034606934, mean loss: 0.3392240603132045
Epoch: 71, step: 607, loss: 0.29654625058174133, mean loss: 0.3392236464958662
Epoch: 71, step: 608, loss: 0.34701135754585266, mean loss: 0.33922372200720646
Epoch: 71, step: 609, loss: 0.3158884048461914, mean loss: 0.3392234957450896
Epoch: 71, step: 610, loss: 0.3349173367023468, mean loss: 0.3392234539924446
Epoch: 71, step: 611, loss: 0.3348245322704315, mean loss: 0.33922341134078343
Epoch: 71, step: 612, loss: 0.33154818415641785, mean loss: 0.33922333692299755
Epoch: 71, step: 613, loss: 0.37581050395965576, mean loss: 0.3392236916629289
Epoch: 71, step: 614, loss: 0.3137749433517456, mean loss: 0.3392234449206848
Epoch: 71, step: 615, loss: 0.35644569993019104, mean loss: 0.3392236119000818
Epoch: 71, step: 616, loss: 0.3449612259864807, mean loss: 0.33922366752892086
Epoch: 71, step: 617, loss: 0.3171921968460083, mean loss: 0.33922345392562947
Epoch: 71, step: 618, loss: 0.31156685948371887, mean loss: 0.33922318578727356
Epoch: 71, step: 619, loss: 0.3219967484474182, mean loss: 0.3392230187738037
Epoch: 71, step: 620, loss: 0.3556276261806488, mean loss: 0.33922317781793965
Epoch: 71, step: 621, loss: 0.35158249735832214, mean loss: 0.3392232976414863
Epoch: 71, step: 622, loss: 0.37261828780174255, mean loss: 0.33922362140262485
Epoch: 71, step: 623, loss: 0.3253605365753174, mean loss: 0.3392234870026866
Epoch: 71, step: 624, loss: 0.3563089370727539, mean loss: 0.3392236526412296
Epoch: 71, step: 625, loss: 0.31035465002059937, mean loss: 0.33922337276723424
Epoch: 71, step: 626, loss: 0.33617135882377625, mean loss: 0.3392233431794072
Epoch: 71, step: 627, loss: 0.3096020519733429, mean loss: 0.33922305601782815
Epoch: 71, step: 628, loss: 0.3622007668018341, mean loss: 0.3392232787715123
Epoch: 71, step: 629, loss: 0.35596737265586853, mean loss: 0.3392234410928366
Epoch: 71, step: 630, loss: 0.30288249254226685, mean loss: 0.3392230887982454
Epoch: 71, step: 631, loss: 0.3578539490699768, mean loss: 0.3392232694068409
Epoch: 71, step: 632, loss: 0.29496562480926514, mean loss: 0.3392228403749323
Epoch: 71, step: 633, loss: 0.3051295578479767, mean loss: 0.3392225098791634
Epoch: 71, step: 634, loss: 0.3025772273540497, mean loss: 0.33922215464808786
Epoch: 71, step: 635, loss: 0.31000810861587524, mean loss: 0.33922187145648225
Epoch: 71, step: 636, loss: 0.33701589703559875, mean loss: 0.33922185007268
Epoch: 71, step: 637, loss: 0.35095903277397156, mean loss: 0.3392219638469642
Epoch: 71, step: 638, loss: 0.32404783368110657, mean loss: 0.3392218167580838
Epoch: 71, step: 639, loss: 0.3086058795452118, mean loss: 0.3392215199885013
Epoch: 71, step: 640, loss: 0.32111504673957825, mean loss: 0.33922134447865543
Epoch: 71, step: 641, loss: 0.3098614811897278, mean loss: 0.3392210598900963
Epoch: 71, step: 642, loss: 0.3519391119480133, mean loss: 0.3392211831664546
Epoch: 71, step: 643, loss: 0.3354418873786926, mean loss: 0.3392211465340125
Epoch: 71, step: 644, loss: 0.34955787658691406, mean loss: 0.3392212467262219
Epoch: 71, step: 645, loss: 0.3474155068397522, mean loss: 0.33922132615105577
Epoch: 71, step: 646, loss: 0.3370678126811981, mean loss: 0.33922130527781164
Epoch: 71, step: 647, loss: 0.31221169233322144, mean loss: 0.3392210434857271
Epoch: 71, step: 648, loss: 0.3309304416179657, mean loss: 0.33922096312941424
Epoch: 71, step: 649, loss: 0.356080025434494, mean loss: 0.33922112653358877
Epoch: 71, step: 650, loss: 0.3283262848854065, mean loss: 0.3392210209378374
Epoch: 71, step: 651, loss: 0.34538647532463074, mean loss: 0.33922108069450935
Epoch: 71, step: 652, loss: 0.30844321846961975, mean loss: 0.3392207823929283
Epoch: 71, step: 653, loss: 0.334769606590271, mean loss: 0.33922073925218316
Epoch: 71, step: 654, loss: 0.3284376263618469, mean loss: 0.3392206347433888
Epoch: 71, step: 655, loss: 0.3312838673591614, mean loss: 0.3392205578218208
Epoch: 71, step: 656, loss: 0.28521499037742615, mean loss: 0.3392200344156952
Epoch: 71, step: 657, loss: 0.3427928686141968, mean loss: 0.33922006904222113
Epoch: 71, step: 658, loss: 0.4126248061656952, mean loss: 0.3392207804456221
Epoch: 71, step: 659, loss: 0.3330162465572357, mean loss: 0.33922072031484707
Epoch: 71, step: 660, loss: 0.3280334770679474, mean loss: 0.3392206118955686
Epoch: 71, step: 661, loss: 0.33616942167282104, mean loss: 0.33922058232576047
Epoch: 71, step: 662, loss: 0.3184655010700226, mean loss: 0.3392203811852946
Epoch: 71, step: 663, loss: 0.33883073925971985, mean loss: 0.3392203774092554
Epoch: 71, step: 664, loss: 0.30461233854293823, mean loss: 0.33922004202429323
Epoch: 71, step: 665, loss: 0.3264872431755066, mean loss: 0.33921991863250284
Epoch: 71, step: 666, loss: 0.3223389983177185, mean loss: 0.3392197550434271
Epoch: 71, step: 667, loss: 0.3632628321647644, mean loss: 0.3392199880370421
Epoch: 71, step: 668, loss: 0.32448554039001465, mean loss: 0.33921984525170157
Epoch: 71, step: 669, loss: 0.35337162017822266, mean loss: 0.3392199823892767
Epoch: 71, step: 670, loss: 0.3384200930595398, mean loss: 0.33921997463803555
Epoch: 71, step: 671, loss: 0.30435341596603394, mean loss: 0.3392196367706892
Epoch: 71, step: 672, loss: 0.3814341127872467, mean loss: 0.33922004583758086
Epoch: 71, step: 673, loss: 0.3742575943470001, mean loss: 0.33922038535528964
Epoch: 71, step: 674, loss: 0.3130201995372772, mean loss: 0.33922013147506
Epoch: 71, step: 675, loss: 0.3475290536880493, mean loss: 0.33922021198787217
Epoch: 71, step: 676, loss: 0.31722724437713623, mean loss: 0.3392199988797859
Epoch: 71, step: 677, loss: 0.31076326966285706, mean loss: 0.33921972314162946
Epoch: 71, step: 678, loss: 0.28571566939353943, mean loss: 0.339219204706567
Epoch: 71, step: 679, loss: 0.35815685987472534, mean loss: 0.33921938820386527
Epoch: 71, step: 680, loss: 0.30085012316703796, mean loss: 0.3392190164266739
Epoch: 71, step: 681, loss: 0.32411989569664, mean loss: 0.3392188701258704
Epoch: 71, step: 682, loss: 0.36145684123039246, mean loss: 0.3392190855954713
Epoch: 71, step: 683, loss: 0.33241361379623413, mean loss: 0.3392190196560887
Epoch: 71, step: 684, loss: 0.3214246928691864, mean loss: 0.33921884724547735
Epoch: 71, step: 685, loss: 0.3383716642856598, mean loss: 0.3392188390371355
Epoch: 71, step: 686, loss: 0.3185025155544281, mean loss: 0.33921863831896126
Epoch: 71, step: 687, loss: 0.34977251291275024, mean loss: 0.3392187405732979
Epoch: 71, step: 688, loss: 0.34589245915412903, mean loss: 0.33921880523296855
Epoch: 71, step: 689, loss: 0.34480661153793335, mean loss: 0.3392188593710342
Epoch: 71, step: 690, loss: 0.3515104651451111, mean loss: 0.3392189784584321
Epoch: 71, step: 691, loss: 0.3393448293209076, mean loss: 0.3392189796777281
Epoch: 71, step: 692, loss: 0.2958565354347229, mean loss: 0.33921855956820895
Epoch: 71, step: 693, loss: 0.3528327941894531, mean loss: 0.33921869146608163
Epoch: 71, step: 694, loss: 0.2998826205730438, mean loss: 0.3392183103727665
Epoch: 71, step: 695, loss: 0.29655441641807556, mean loss: 0.339217897043044
Epoch: 71, step: 696, loss: 0.33934399485588074, mean loss: 0.33921789826467347
Epoch: 71, step: 697, loss: 0.3175320625305176, mean loss: 0.3392176881753928
Epoch: 71, step: 698, loss: 0.3056885004043579, mean loss: 0.33921736335255515
Epoch: 71, step: 699, loss: 0.3111993670463562, mean loss: 0.33921709192346594
Epoch: 71, step: 700, loss: 0.36033082008361816, mean loss: 0.3392172964643055
Epoch: 71, step: 701, loss: 0.3355136513710022, mean loss: 0.33921726058531093
Epoch: 71, step: 702, loss: 0.36173292994499207, mean loss: 0.33921747870333585
Epoch: 71, step: 703, loss: 0.33990707993507385, mean loss: 0.33921748538370583
Epoch: 71, step: 704, loss: 0.3173617720603943, mean loss: 0.3392172736630331
Epoch: 71, step: 705, loss: 0.2906370162963867, mean loss: 0.33921680306090807
Epoch: 71, step: 706, loss: 0.2873733937740326, mean loss: 0.3392163008531479
Epoch: 71, step: 707, loss: 0.29570868611335754, mean loss: 0.3392158793984174
Epoch: 71, step: 708, loss: 0.3143087923526764, mean loss: 0.3392156381278252
Epoch: 71, step: 709, loss: 0.33694228529930115, mean loss: 0.3392156161064676
Epoch: 71, step: 710, loss: 0.3228406608104706, mean loss: 0.33921545748821513
Epoch: 71, step: 711, loss: 0.3085537254810333, mean loss: 0.33921516048201567
Epoch: 71, step: 712, loss: 0.32572683691978455, mean loss: 0.33921502982804896
Epoch: 71, step: 713, loss: 0.34493768215179443, mean loss: 0.3392150852596955
Epoch: 71, step: 714, loss: 0.33907049894332886, mean loss: 0.3392150838591946
Epoch: 71, step: 715, loss: 0.3324982225894928, mean loss: 0.3392150187985469
Epoch: 71, step: 716, loss: 0.2825031280517578, mean loss: 0.33921446948295764
Epoch: 71, step: 717, loss: 0.32169896364212036, mean loss: 0.3392142998281094
Epoch: 71, step: 718, loss: 0.33522558212280273, mean loss: 0.3392142611938417
Epoch: 71, step: 719, loss: 0.3830757439136505, mean loss: 0.33921468602707866
Epoch: 71, step: 720, loss: 0.34459003806114197, mean loss: 0.33921473809112085
Epoch: 71, step: 721, loss: 0.335769385099411, mean loss: 0.3392147047207918
Epoch: 71, step: 722, loss: 0.35276564955711365, mean loss: 0.33921483596862306
Epoch: 71, step: 723, loss: 0.3474878668785095, mean loss: 0.33921491609638255
Epoch: 71, step: 724, loss: 0.3195931315422058, mean loss: 0.33921472605304503
Epoch: 71, step: 725, loss: 0.30802100896835327, mean loss: 0.33921442393471973
Epoch: 71, step: 726, loss: 0.3132786452770233, mean loss: 0.33921417274317045
Epoch: 71, step: 727, loss: 0.3708856403827667, mean loss: 0.3392144794826781
Epoch: 71, step: 728, loss: 0.3343181610107422, mean loss: 0.33921443206208524
Epoch: 71, step: 729, loss: 0.31462857127189636, mean loss: 0.33921419395159275
Epoch: 71, step: 730, loss: 0.32892054319381714, mean loss: 0.33921409426004506
Epoch: 71, step: 731, loss: 0.3255856931209564, mean loss: 0.3392139622735151
Epoch: 71, step: 732, loss: 0.33845049142837524, mean loss: 0.33921395487962563
Epoch: 71, step: 733, loss: 0.2978628873825073, mean loss: 0.33921355441605383
Epoch: 71, step: 734, loss: 0.3285331726074219, mean loss: 0.33921345098311523
Epoch: 71, step: 735, loss: 0.28233402967453003, mean loss: 0.33921290014618605
Epoch: 71, step: 736, loss: 0.30320456624031067, mean loss: 0.33921255143434026
Epoch: 71, step: 737, loss: 0.3249892294406891, mean loss: 0.3392124136942036
Epoch: 71, step: 738, loss: 0.3079834282398224, mean loss: 0.33921211127237333
Epoch: 71, step: 739, loss: 0.3222208321094513, mean loss: 0.339211946730237
Epoch: 71, step: 740, loss: 0.3366204798221588, mean loss: 0.33921192163492975
Epoch: 71, step: 741, loss: 0.3105037212371826, mean loss: 0.33921164363248557
Epoch: 71, step: 742, loss: 0.3472462296485901, mean loss: 0.3392117214364889
Epoch: 71, step: 743, loss: 0.3401110768318176, mean loss: 0.33921173014543454
Epoch: 71, step: 744, loss: 0.3303917348384857, mean loss: 0.3392116447374679
Epoch: 71, step: 745, loss: 0.34243738651275635, mean loss: 0.3392116759734684
Epoch: 71, step: 746, loss: 0.3223545551300049, mean loss: 0.3392115127415752
Epoch: 71, step: 747, loss: 0.3225228190422058, mean loss: 0.3392113511421707
Epoch: 71, step: 748, loss: 0.3289216160774231, mean loss: 0.33921125150591475
Epoch: 71, step: 749, loss: 0.3276076912879944, mean loss: 0.33921113914888185
Epoch: 71, step: 750, loss: 0.34426233172416687, mean loss: 0.3392111880590012
Epoch: 71, step: 751, loss: 0.33680862188339233, mean loss: 0.33921116479545327
Epoch: 71, step: 752, loss: 0.3843502700328827, mean loss: 0.3392116018637767
Epoch: 71, step: 753, loss: 0.32878127694129944, mean loss: 0.33921150087106844
Epoch: 71, step: 754, loss: 0.37799832224845886, mean loss: 0.33921187642487294
Epoch: 71, step: 755, loss: 0.30391600728034973, mean loss: 0.339211534675559
Epoch: 71, step: 756, loss: 0.2986408770084381, mean loss: 0.3392111418573478
Epoch: 71, step: 757, loss: 0.37612342834472656, mean loss: 0.3392114992505672
Epoch: 71, step: 758, loss: 0.3290958106517792, mean loss: 0.3392114013090996
Epoch: 71, step: 759, loss: 0.3403841555118561, mean loss: 0.33921141266375476
Epoch: 71, step: 760, loss: 0.30888956785202026, mean loss: 0.3392111190892298
Epoch: 71, step: 761, loss: 0.32476842403411865, mean loss: 0.33921097925716104
Epoch: 71, step: 762, loss: 0.33564478158950806, mean loss: 0.3392109447300892
Epoch: 71, step: 763, loss: 0.3117780387401581, mean loss: 0.3392106791338342
Epoch: 71, step: 764, loss: 0.35775837302207947, mean loss: 0.3392108587046877
Epoch: 71, step: 765, loss: 0.3620084524154663, mean loss: 0.33921107941912
Epoch: 71, step: 766, loss: 0.3530043959617615, mean loss: 0.33921121295753615
Epoch: 71, step: 767, loss: 0.33852192759513855, mean loss: 0.33921120628436335
Epoch: 71, step: 768, loss: 0.32132792472839355, mean loss: 0.3392110331527711
Epoch: 71, step: 769, loss: 0.3030482828617096, mean loss: 0.3392106830574094
Epoch: 71, step: 770, loss: 0.341899573802948, mean loss: 0.33921070908858947
Epoch: 71, step: 771, loss: 0.3696759343147278, mean loss: 0.33921100401990556
Epoch: 71, step: 772, loss: 0.3500685393810272, mean loss: 0.3392111091297864
Epoch: 71, step: 773, loss: 0.3149803578853607, mean loss: 0.33921087455843707
Epoch: 71, step: 774, loss: 0.3538637161254883, mean loss: 0.3392110164072601
Epoch: 71, step: 775, loss: 0.33844873309135437, mean loss: 0.3392110090279444
Epoch: 71, step: 776, loss: 0.3249779939651489, mean loss: 0.3392108712459765
Epoch: 71, step: 777, loss: 0.33279314637184143, mean loss: 0.3392108091201234
Epoch: 71, step: 778, loss: 0.3502509593963623, mean loss: 0.33921091599165937
Epoch: 71, step: 779, loss: 0.3447999656200409, mean loss: 0.33921097009459467
Epoch: 71, step: 780, loss: 0.3161469101905823, mean loss: 0.339210746832798
Epoch: 71, step: 781, loss: 0.3533231019973755, mean loss: 0.33921088344011185
Epoch: 71, step: 782, loss: 0.32848381996154785, mean loss: 0.3392107796033585
Epoch: 71, step: 783, loss: 0.33684852719306946, mean loss: 0.33921075673724543
Epoch: 71, step: 784, loss: 0.3988546133041382, mean loss: 0.33921133407181037
Epoch: 71, step: 785, loss: 0.32891032099723816, mean loss: 0.33921123436207196
Epoch: 71, step: 786, loss: 0.3156159222126007, mean loss: 0.33921100597097953
Epoch: 71, step: 787, loss: 0.33936628699302673, mean loss: 0.3392110074740094
Epoch: 71, step: 788, loss: 0.34808799624443054, mean loss: 0.3392110933972598
Epoch: 71, step: 789, loss: 0.3183179199695587, mean loss: 0.3392108911674223
Epoch: 71, step: 790, loss: 0.328887939453125, mean loss: 0.33921079125016235
Epoch: 71, step: 791, loss: 0.3383839726448059, mean loss: 0.33921078324734955
Epoch: 71, step: 792, loss: 0.3046838045120239, mean loss: 0.3392104490624745
Epoch: 71, step: 793, loss: 0.368594765663147, mean loss: 0.33921073346903097
Epoch: 71, step: 794, loss: 0.3826136589050293, mean loss: 0.3392111535556117
Epoch: 71, step: 795, loss: 0.3305840492248535, mean loss: 0.33921107005673123
Epoch: 71, step: 796, loss: 0.3682565987110138, mean loss: 0.33921135117604534
Epoch: 71, step: 797, loss: 0.34787195920944214, mean loss: 0.3392114349975745
Epoch: 71, step: 798, loss: 0.34960103034973145, mean loss: 0.3392115355521011
Epoch: 71, step: 799, loss: 0.307381272315979, mean loss: 0.3392112274894706
Epoch: 71, step: 800, loss: 0.32340356707572937, mean loss: 0.33921107449977383
Epoch: 71, step: 801, loss: 0.3312031030654907, mean loss: 0.33921099699777596
Epoch: 71, step: 802, loss: 0.3265836238861084, mean loss: 0.33921087478990086
Epoch: 71, step: 803, loss: 0.34701037406921387, mean loss: 0.33921095027282205
Epoch: 71, step: 804, loss: 0.35442084074020386, mean loss: 0.3392110974714833
Epoch: 71, step: 805, loss: 0.31675440073013306, mean loss: 0.339210880141601
Epoch: 71, step: 806, loss: 0.35426145792007446, mean loss: 0.33921102579564266
Epoch: 71, step: 807, loss: 0.3356456756591797, mean loss: 0.33921099129180904
Epoch: 71, step: 808, loss: 0.30185621976852417, mean loss: 0.339210629792854
Epoch: 71, step: 809, loss: 0.31168732047080994, mean loss: 0.3392103634399661
Epoch: 71, step: 810, loss: 0.3522334098815918, mean loss: 0.33921048946741506
Epoch: 71, step: 811, loss: 0.35302427411079407, mean loss: 0.3392106231457522
Epoch: 71, step: 812, loss: 0.3655640780925751, mean loss: 0.3392108781701379
Epoch: 71, step: 813, loss: 0.3260348439216614, mean loss: 0.3392107506658873
Epoch: 71, step: 814, loss: 0.323182076215744, mean loss: 0.33921059555818883
Epoch: 71, step: 815, loss: 0.35026654601097107, mean loss: 0.33921070254435537
Epoch: 71, step: 816, loss: 0.31230831146240234, mean loss: 0.33921044221794977
Epoch: 71, step: 817, loss: 0.2828226387500763, mean loss: 0.3392098965752927
Epoch: 71, step: 818, loss: 0.3781689703464508, mean loss: 0.3392102735633207
Epoch: 71, step: 819, loss: 0.35113659501075745, mean loss: 0.339210388967422
Epoch: 71, step: 820, loss: 0.3348807990550995, mean loss: 0.3392103470728948
Epoch: 71, step: 821, loss: 0.35383540391921997, mean loss: 0.33921048858835595
Epoch: 71, step: 822, loss: 0.329108864068985, mean loss: 0.33921039084362686
Epoch: 71, step: 823, loss: 0.3212142884731293, mean loss: 0.33921021671251284
Epoch: 71, step: 824, loss: 0.3474632501602173, mean loss: 0.3392102965684713
Epoch: 71, step: 825, loss: 0.3332693874835968, mean loss: 0.33921023908507425
Epoch: 71, step: 826, loss: 0.42525234818458557, mean loss: 0.33921107160831154
Epoch: 71, step: 827, loss: 0.31421759724617004, mean loss: 0.33921082977966416
Epoch: 71, step: 828, loss: 0.32689327001571655, mean loss: 0.33921071060015545
Epoch: 71, step: 829, loss: 0.3151443600654602, mean loss: 0.3392104777465597
Epoch: 71, step: 830, loss: 0.35757631063461304, mean loss: 0.3392106554431674
Epoch: 71, step: 831, loss: 0.3611760437488556, mean loss: 0.3392108679648237
Epoch: 71, step: 832, loss: 0.3362559974193573, mean loss: 0.33921083937585006
Epoch: 71, step: 833, loss: 0.31044143438339233, mean loss: 0.3392105610286975
Epoch: 71, step: 834, loss: 0.34086140990257263, mean loss: 0.33921057700068713
Epoch: 71, step: 835, loss: 0.3302861154079437, mean loss: 0.339210490657212
Epoch: 71, step: 836, loss: 0.3717518746852875, mean loss: 0.3392108054895378
Epoch: 71, step: 837, loss: 0.3165561556816101, mean loss: 0.3392105863117954
Epoch: 71, step: 838, loss: 0.32145535945892334, mean loss: 0.3392104145363356
Epoch: 71, step: 839, loss: 0.31740596890449524, mean loss: 0.3392102035881754
Epoch: 71, step: 840, loss: 0.30628862977027893, mean loss: 0.339209885089904
Epoch: 71, step: 841, loss: 0.3203960657119751, mean loss: 0.3392097030782234
Epoch: 71, step: 842, loss: 0.34554460644721985, mean loss: 0.33920976436377265
Epoch: 71, step: 843, loss: 0.35345223546028137, mean loss: 0.33920990214791374
Epoch: 71, step: 844, loss: 0.3546154499053955, mean loss: 0.3392100511824188
Epoch: 71, step: 845, loss: 0.34953394532203674, mean loss: 0.3392101510556329
Epoch: 71, step: 846, loss: 0.3573748767375946, mean loss: 0.3392103267792467
Epoch: 71, step: 847, loss: 0.4153282046318054, mean loss: 0.339211063128334
Epoch: 71, step: 848, loss: 0.3405521810054779, mean loss: 0.3392110761019139
Epoch: 71, step: 849, loss: 0.3425349295139313, mean loss: 0.33921110825558326
Epoch: 71, step: 850, loss: 0.32729700207710266, mean loss: 0.33921099300425384
Epoch: 71, step: 851, loss: 0.36971569061279297, mean loss: 0.3392112880891634
Epoch: 71, step: 852, loss: 0.3380609154701233, mean loss: 0.3392112769612276
Epoch: 71, step: 853, loss: 0.33136090636253357, mean loss: 0.3392112010227243
Epoch: 71, step: 854, loss: 0.3791980445384979, mean loss: 0.33921158782123767
Epoch: 71, step: 855, loss: 0.34409981966018677, mean loss: 0.33921163510535296
Epoch: 71, step: 856, loss: 0.3521747887134552, mean loss: 0.33921176049738444
Epoch: 71, step: 857, loss: 0.3402521312236786, mean loss: 0.33921177056074875
Epoch: 71, step: 858, loss: 0.34058794379234314, mean loss: 0.33921178387215617
Epoch: 71, step: 859, loss: 0.36771321296691895, mean loss: 0.3392120595572631
Epoch: 71, step: 860, loss: 0.316468745470047, mean loss: 0.3392118395706684
Epoch: 71, step: 861, loss: 0.3363904058933258, mean loss: 0.3392118122803808
Epoch: 71, step: 862, loss: 0.3113028109073639, mean loss: 0.33921154233346895
Epoch: 71, step: 863, loss: 0.31549739837646484, mean loss: 0.3392113129630976
Epoch: 71, step: 864, loss: 0.36574921011924744, mean loss: 0.3392115696431811
Epoch: 71, step: 865, loss: 0.3540972173213959, mean loss: 0.33921171361888164
Epoch: 71, step: 866, loss: 0.3551170229911804, mean loss: 0.33921186745537973
Epoch: 71, step: 867, loss: 0.3345465064048767, mean loss: 0.33921182233234265
Epoch: 71, step: 868, loss: 0.2975499629974365, mean loss: 0.33921141938572796
Epoch: 71, step: 869, loss: 0.33022812008857727, mean loss: 0.33921133250158286
Epoch: 71, step: 870, loss: 0.33875274658203125, mean loss: 0.33921132806630144
Epoch: 71, step: 871, loss: 0.34124600887298584, mean loss: 0.3392113477448268
Epoch: 71, step: 872, loss: 0.3141244351863861, mean loss: 0.3392111051177433
Epoch: 71, step: 873, loss: 0.35676905512809753, mean loss: 0.3392112749271207
Epoch: 71, step: 874, loss: 0.34741148352622986, mean loss: 0.3392113542335802
Epoch: 71, step: 875, loss: 0.31018635630607605, mean loss: 0.3392110735276041
Epoch: 71, step: 876, loss: 0.3076506555080414, mean loss: 0.3392107683040761
Epoch: 71, step: 877, loss: 0.29917919635772705, mean loss: 0.33921038115903107
Epoch: 71, step: 878, loss: 0.39005181193351746, mean loss: 0.3392108728413882
Epoch: 71, step: 879, loss: 0.2924928367137909, mean loss: 0.3392104210403348
Epoch: 71, step: 880, loss: 0.38215917348861694, mean loss: 0.3392108363853611
Epoch: 71, step: 881, loss: 0.3562968969345093, mean loss: 0.3392110016181382
Epoch: 71, step: 882, loss: 0.34455931186676025, mean loss: 0.3392110533391073
Epoch: 71, step: 883, loss: 0.35260576009750366, mean loss: 0.339211182871704
Epoch: 71, step: 884, loss: 0.3073289692401886, mean loss: 0.3392108745599165
Epoch: 71, step: 885, loss: 0.3697870373725891, mean loss: 0.3392111702388916
Epoch: 71, step: 886, loss: 0.34319525957107544, mean loss: 0.3392112087656376
Epoch: 71, step: 887, loss: 0.3526415526866913, mean loss: 0.33921133863783737
Epoch: 71, step: 888, loss: 0.33146560192108154, mean loss: 0.3392112637368412
Epoch: 71, step: 889, loss: 0.3517736494541168, mean loss: 0.3392113852134857
Epoch: 71, step: 890, loss: 0.31045761704444885, mean loss: 0.33921110717095637
Epoch: 71, step: 891, loss: 0.29289352893829346, mean loss: 0.3392106592946294
Epoch: 71, step: 892, loss: 0.3415410816669464, mean loss: 0.3392106818288585
Epoch: 71, step: 893, loss: 0.3157860338687897, mean loss: 0.33921045532430455
Epoch: 71, step: 894, loss: 0.3434639573097229, mean loss: 0.33921049645312984
Epoch: 71, step: 895, loss: 0.29735851287841797, mean loss: 0.3392100917733428
Epoch: 71, step: 896, loss: 0.3386991620063782, mean loss: 0.3392100868330525
Epoch: 71, step: 897, loss: 0.3625635802745819, mean loss: 0.3392103126408443
Epoch: 71, step: 898, loss: 0.3605744540691376, mean loss: 0.33921051921135015
Epoch: 71, step: 899, loss: 0.3477669358253479, mean loss: 0.33921060194279173
Epoch: 71, step: 900, loss: 0.3490281105041504, mean loss: 0.3392106968667324
Epoch: 71, step: 901, loss: 0.32449328899383545, mean loss: 0.33921055456781457
Epoch: 71, step: 902, loss: 0.31311649084091187, mean loss: 0.33921030227330995
Epoch: 71, step: 903, loss: 0.32116463780403137, mean loss: 0.3392101277976895
Epoch: 71, step: 904, loss: 0.3250027298927307, mean loss: 0.3392099904339143
Epoch: 71, step: 905, loss: 0.2976280450820923, mean loss: 0.339209588404084
Epoch: 71, step: 906, loss: 0.31595996022224426, mean loss: 0.3392093636201393
Epoch: 71, step: 907, loss: 0.32340165972709656, mean loss: 0.3392092107882895
Epoch: 71, step: 908, loss: 0.37535491585731506, mean loss: 0.3392095602483754
Epoch: 71, step: 909, loss: 0.376175194978714, mean loss: 0.3392099176321634
Epoch: 71, step: 910, loss: 0.28799498081207275, mean loss: 0.3392094224908977
Epoch: 71, step: 911, loss: 0.3432644009590149, mean loss: 0.33920946169367494
Epoch: 71, step: 912, loss: 0.3200668692588806, mean loss: 0.33920927662844264
Epoch: 71, step: 913, loss: 0.32547727227211, mean loss: 0.33920914387254675
Epoch: 71, step: 914, loss: 0.3487859070301056, mean loss: 0.3392092364562256
Epoch: 71, step: 915, loss: 0.30014246702194214, mean loss: 0.33920885878057366
Epoch: 71, step: 916, loss: 0.32875195145606995, mean loss: 0.3392087576900262
Epoch: 71, step: 917, loss: 0.35330769419670105, mean loss: 0.33920889398801446
Epoch: 71, step: 918, loss: 0.2762697637081146, mean loss: 0.3392082855453912
Epoch: 71, step: 919, loss: 0.33916372060775757, mean loss: 0.33920828511457896
Epoch: 71, step: 920, loss: 0.29860925674438477, mean loss: 0.3392078926448765
Epoch: 71, step: 921, loss: 0.3251388669013977, mean loss: 0.3392077566413022
Epoch: 71, step: 922, loss: 0.35303130745887756, mean loss: 0.3392078902706082
Epoch: 71, step: 923, loss: 0.3417045772075653, mean loss: 0.33920791440531295
Epoch: 71, step: 924, loss: 0.32984909415245056, mean loss: 0.33920782393735044
Epoch: 71, step: 925, loss: 0.3527683615684509, mean loss: 0.33920795502036283
Epoch: 71, step: 926, loss: 0.38229840993881226, mean loss: 0.3392083715504584
Epoch: 71, step: 927, loss: 0.38307926058769226, mean loss: 0.3392087956204526
Epoch: 71, step: 928, loss: 0.3772508502006531, mean loss: 0.33920916334352086
Epoch: 71, step: 929, loss: 0.32693666219711304, mean loss: 0.3392090447159072
Epoch: 71, step: 930, loss: 0.3162969946861267, mean loss: 0.33920882324715235
Epoch: 71, step: 931, loss: 0.34897544980049133, mean loss: 0.3392089176508269
Epoch: 71, step: 932, loss: 0.3655886650085449, mean loss: 0.33920917263354783
Epoch: 71, step: 933, loss: 0.34850603342056274, mean loss: 0.33920926249475514
Epoch: 71, step: 934, loss: 0.3272576630115509, mean loss: 0.3392091469746024
Epoch: 71, step: 935, loss: 0.34595292806625366, mean loss: 0.3392092121570989
Epoch: 71, step: 936, loss: 0.34266507625579834, mean loss: 0.3392092455596767
Epoch: 71, step: 937, loss: 0.3129655718803406, mean loss: 0.3392089919044827
Epoch: 71, step: 938, loss: 0.30776897072792053, mean loss: 0.33920868802752985
Epoch: 71, step: 939, loss: 0.2936723232269287, mean loss: 0.33920824790956805
Epoch: 71, step: 940, loss: 0.38004016876220703, mean loss: 0.3392086425543354
Epoch: 71, step: 941, loss: 0.36151379346847534, mean loss: 0.3392088581338583
Epoch: 71, step: 942, loss: 0.3096652030944824, mean loss: 0.33920857259687515
Epoch: 71, step: 943, loss: 0.35255154967308044, mean loss: 0.339208701554399
Epoch: 71, step: 944, loss: 0.3441963195800781, mean loss: 0.339208749758383
Epoch: 71, step: 945, loss: 0.3197554349899292, mean loss: 0.33920856174915553
Epoch: 71, step: 946, loss: 0.3199675381183624, mean loss: 0.33920837579344204
Epoch: 71, step: 947, loss: 0.34092146158218384, mean loss: 0.3392083923494745
Epoch: 71, step: 948, loss: 0.30737897753715515, mean loss: 0.3392080847386503
Epoch: 71, step: 949, loss: 0.3525696098804474, mean loss: 0.3392082138679498
Epoch: 71, step: 950, loss: 0.36416029930114746, mean loss: 0.33920845500914754
Epoch: 71, step: 951, loss: 0.3388933837413788, mean loss: 0.3392084519642746
Epoch: 71, step: 952, loss: 0.31995055079460144, mean loss: 0.3392082658562393
Epoch: 71, step: 953, loss: 0.33075881004333496, mean loss: 0.33920818420162857
Epoch: 71, step: 954, loss: 0.33401092886924744, mean loss: 0.3392081339764106
Epoch: 71, step: 955, loss: 0.33636507391929626, mean loss: 0.33920810650192224
Epoch: 71, step: 956, loss: 0.3680972754955292, mean loss: 0.33920838567557726
Epoch: 71, step: 957, loss: 0.3346399962902069, mean loss: 0.3392083415288717
Epoch: 71, step: 958, loss: 0.33979174494743347, mean loss: 0.3392083471665457
Epoch: 71, step: 959, loss: 0.30875271558761597, mean loss: 0.3392080528637397
Epoch: 71, step: 960, loss: 0.3044167757034302, mean loss: 0.3392077166674102
Epoch: 71, step: 961, loss: 0.3716071546077728, mean loss: 0.33920802974780695
Epoch: 71, step: 962, loss: 0.33978697657585144, mean loss: 0.3392080353421988
Epoch: 71, step: 963, loss: 0.3046685457229614, mean loss: 0.3392077015886272
Epoch: 71, step: 964, loss: 0.30018481612205505, mean loss: 0.33920732451584196
Epoch: 71, step: 965, loss: 0.3017684519290924, mean loss: 0.33920696275265144
Epoch: 71, step: 966, loss: 0.33550384640693665, mean loss: 0.3392069269706381
Epoch: 71, step: 967, loss: 0.3100447654724121, mean loss: 0.33920664518884336
Epoch: 71, step: 968, loss: 0.33748409152030945, mean loss: 0.339206628544687
Epoch: 71, step: 969, loss: 0.35886043310165405, mean loss: 0.33920681844752737
Epoch: 71, step: 970, loss: 0.3524130880832672, mean loss: 0.33920694605049984
Epoch: 71, step: 971, loss: 0.3267691731452942, mean loss: 0.3392068258741365
Epoch: 71, step: 972, loss: 0.33222854137420654, mean loss: 0.3392067584491435
Epoch: 71, step: 973, loss: 0.32508519291877747, mean loss: 0.3392066220062602
Epoch: 71, step: 974, loss: 0.3494309186935425, mean loss: 0.33920672079268993
Epoch: 71, step: 975, loss: 0.32881060242652893, mean loss: 0.33920662034710186
Epoch: 71, step: 976, loss: 0.3245529234409332, mean loss: 0.33920647876685717
Epoch: 71, step: 977, loss: 0.3214751183986664, mean loss: 0.3392063074526761
Epoch: 71, step: 978, loss: 0.35199084877967834, mean loss: 0.33920643097123426
Epoch: 71, step: 979, loss: 0.3015730381011963, mean loss: 0.3392060673776256
Epoch: 71, step: 980, loss: 0.30273693799972534, mean loss: 0.33920571503590896
Epoch: 71, step: 981, loss: 0.3239584267139435, mean loss: 0.3392055677276532
Epoch: 71, step: 982, loss: 0.31959015130996704, mean loss: 0.3392053782195386
Epoch: 71, step: 983, loss: 0.31877225637435913, mean loss: 0.33920518081332995
Epoch: 71, step: 984, loss: 0.34382182359695435, mean loss: 0.3392052254146959
Epoch: 71, step: 985, loss: 0.31226229667663574, mean loss: 0.3392049651216929
Epoch: 71, step: 986, loss: 0.37136510014533997, mean loss: 0.3392052758146147
Epoch: 71, step: 987, loss: 0.3583052158355713, mean loss: 0.33920546033370447
Epoch: 71, step: 988, loss: 0.3403349220752716, mean loss: 0.3392054712450078
Epoch: 71, step: 989, loss: 0.3526948094367981, mean loss: 0.3392056015591507
Epoch: 71, step: 990, loss: 0.31151625514030457, mean loss: 0.33920533406800046
Epoch: 71, step: 991, loss: 0.29411157965660095, mean loss: 0.33920489844689444
Epoch: 71, step: 992, loss: 0.3133450746536255, mean loss: 0.33920464863455646
Epoch: 71, step: 993, loss: 0.31043243408203125, mean loss: 0.3392043706904834
Epoch: 71, step: 994, loss: 0.3508170247077942, mean loss: 0.33920448286944593
Epoch: 71, step: 995, loss: 0.33939942717552185, mean loss: 0.3392044847526019
Epoch: 71, step: 996, loss: 0.31133535504341125, mean loss: 0.33920421554027097
Epoch: 71, step: 997, loss: 0.30433592200279236, mean loss: 0.3392038787201406
Epoch: 71, step: 998, loss: 0.36353829503059387, mean loss: 0.33920411378303783
Epoch: 71, step: 999, loss: 0.3223043978214264, mean loss: 0.3392039505386118
Epoch: 71, step: 1000, loss: 0.32863694429397583, mean loss: 0.3392038484665882
Epoch: 71, step: 1001, loss: 0.2971118688583374, mean loss: 0.33920344188293183
Epoch: 71, step: 1002, loss: 0.3488897383213043, mean loss: 0.3392035354459293
Epoch: 71, step: 1003, loss: 0.322550505399704, mean loss: 0.3392033745906047
Epoch: 71, step: 1004, loss: 0.3074539303779602, mean loss: 0.339203067918617
Epoch: 71, step: 1005, loss: 0.3460793197154999, mean loss: 0.33920313433658084
Epoch: 71, step: 1006, loss: 0.3310299813747406, mean loss: 0.33920305539256446
Epoch: 71, step: 1007, loss: 0.3188163638114929, mean loss: 0.33920285848057996
Epoch: 71, step: 1008, loss: 0.3062094748020172, mean loss: 0.3392025398055326
Epoch: 71, step: 1009, loss: 0.30603301525115967, mean loss: 0.3392022194322779
Epoch: 71, step: 1010, loss: 0.3231676518917084, mean loss: 0.33920206456129187
Epoch: 71, step: 1011, loss: 0.3465093970298767, mean loss: 0.33920213513898917
Epoch: 71, step: 1012, loss: 0.33073902130126953, mean loss: 0.3392020533989944
Epoch: 71, step: 1013, loss: 0.3156905770301819, mean loss: 0.3392018263183441
Epoch: 71, step: 1014, loss: 0.32845231890678406, mean loss: 0.33920172249749003
Epoch: 71, step: 1015, loss: 0.3411012887954712, mean loss: 0.33920174084369725
Epoch: 71, step: 1016, loss: 0.33442384004592896, mean loss: 0.33920169469868416
Epoch: 71, step: 1017, loss: 0.3079504668712616, mean loss: 0.33920139287693235
Epoch: 71, step: 1018, loss: 0.3132176101207733, mean loss: 0.33920114193014933
Epoch: 71, step: 1019, loss: 0.3100864589214325, mean loss: 0.33920086074840045
Epoch: 71, step: 1020, loss: 0.32557329535484314, mean loss: 0.3392007291383237
Epoch: 71, step: 1021, loss: 0.35420531034469604, mean loss: 0.3392008740457195
Epoch: 71, step: 1022, loss: 0.3356361389160156, mean loss: 0.3392008396194674
Epoch: 71, step: 1023, loss: 0.3307127058506012, mean loss: 0.33920075764652957
Epoch: 71, step: 1024, loss: 0.3475945293903351, mean loss: 0.3392008387073968
Epoch: 71, step: 1025, loss: 0.3311511278152466, mean loss: 0.33920076096996665
Epoch: 71, step: 1026, loss: 0.3262427747249603, mean loss: 0.33920063583369325
Epoch: 71, step: 1027, loss: 0.29889827966690063, mean loss: 0.3392002466344874
Epoch: 71, step: 1028, loss: 0.3729698359966278, mean loss: 0.33920057274371995
Epoch: 71, step: 1029, loss: 0.33883488178253174, mean loss: 0.33920056921231645
Epoch: 71, step: 1030, loss: 0.3257398307323456, mean loss: 0.33920043922594706
Epoch: 71, step: 1031, loss: 0.36314457654953003, mean loss: 0.3392006704451649
Epoch: 71, step: 1032, loss: 0.30809491872787476, mean loss: 0.3392003700719239
Epoch: 71, step: 1033, loss: 0.35147547721862793, mean loss: 0.3392004886055683
Epoch: 71, step: 1034, loss: 0.3357580602169037, mean loss: 0.33920045536433974
Epoch: 71, step: 1035, loss: 0.32770755887031555, mean loss: 0.3392003443861967
Epoch: 71, step: 1036, loss: 0.37066322565078735, mean loss: 0.33920064819633045
Epoch: 71, step: 1037, loss: 0.3233879804611206, mean loss: 0.33920049550839726
Epoch: 71, step: 1038, loss: 0.34001949429512024, mean loss: 0.33920050341661534
Epoch: 71, step: 1039, loss: 0.2786380350589752, mean loss: 0.3391999186335985
Epoch: 71, step: 1040, loss: 0.32509541511535645, mean loss: 0.33919978244373206
Epoch: 71, step: 1041, loss: 0.34073349833488464, mean loss: 0.33919979725279964
Epoch: 71, step: 1042, loss: 0.35513928532600403, mean loss: 0.3391999511578859
Epoch: 71, step: 1043, loss: 0.3132777214050293, mean loss: 0.33919970086600276
Epoch: 71, step: 1044, loss: 0.3317033350467682, mean loss: 0.3391996284856011
Epoch: 71, step: 1045, loss: 0.32994595170021057, mean loss: 0.3391995391385239
Epoch: 71, step: 1046, loss: 0.3952905535697937, mean loss: 0.33920008070918006
Epoch: 71, step: 1047, loss: 0.31598836183547974, mean loss: 0.3391998565972688
Epoch: 71, step: 1048, loss: 0.2836897671222687, mean loss: 0.3391993206459159
Epoch: 71, step: 1049, loss: 0.3179507851600647, mean loss: 0.3391991154927357
Epoch: 71, step: 1050, loss: 0.2986815571784973, mean loss: 0.3391987243022137
Epoch: 71, step: 1051, loss: 0.329191118478775, mean loss: 0.3391986276813187
Epoch: 71, step: 1052, loss: 0.3267962336540222, mean loss: 0.33919850794050727
Epoch: 71, step: 1053, loss: 0.3659115135669708, mean loss: 0.33919876584281883
Epoch: 71, step: 1054, loss: 0.3117752969264984, mean loss: 0.3391985010838531
Epoch: 71, step: 1055, loss: 0.3451528549194336, mean loss: 0.33919855856940856
Epoch: 71, step: 1056, loss: 0.32582905888557434, mean loss: 0.33919842949651213
Epoch: 71, step: 1057, loss: 0.34514161944389343, mean loss: 0.3391984868731794
Epoch: 71, step: 1058, loss: 0.31503692269325256, mean loss: 0.339198253615172
Epoch: 71, step: 1059, loss: 0.34277480840682983, mean loss: 0.33919828814323416
Epoch: 71, step: 1060, loss: 0.3660259544849396, mean loss: 0.3391985471350413
Epoch: 71, step: 1061, loss: 0.3153717815876007, mean loss: 0.33919831711587317
Epoch: 71, step: 1062, loss: 0.31931477785110474, mean loss: 0.3391981251657321
Epoch: 71, step: 1063, loss: 0.30910637974739075, mean loss: 0.339197834671221
Epoch: 71, step: 1064, loss: 0.35584232211112976, mean loss: 0.3391979953493571
Epoch: 71, step: 1065, loss: 0.35680490732192993, mean loss: 0.3391981653166509
Epoch: 71, step: 1066, loss: 0.32704636454582214, mean loss: 0.33919804801108605
Epoch: 71, step: 1067, loss: 0.37628382444381714, mean loss: 0.3391984060095457
Epoch: 71, step: 1068, loss: 0.3564041256904602, mean loss: 0.3391985720991433
Epoch: 71, step: 1069, loss: 0.33597636222839355, mean loss: 0.33919854099493
Epoch: 71, step: 1070, loss: 0.31785041093826294, mean loss: 0.339198334921953
Epoch: 71, step: 1071, loss: 0.33281418681144714, mean loss: 0.33919827329652236
Epoch: 71, step: 1072, loss: 0.3635171055793762, mean loss: 0.3391985080410833
Epoch: 71, step: 1073, loss: 0.3131972551345825, mean loss: 0.33919825705889345
Epoch: 71, step: 1074, loss: 0.33048638701438904, mean loss: 0.33919817296667204
Epoch: 71, step: 1075, loss: 0.31735557317733765, mean loss: 0.33919796213076675
Epoch: 71, step: 1076, loss: 0.3544621169567108, mean loss: 0.3391981094667464
Epoch: 71, step: 1077, loss: 0.33830055594444275, mean loss: 0.3391981008032696
Epoch: 71, step: 1078, loss: 0.3372350335121155, mean loss: 0.3391980818552923
Epoch: 71, step: 1079, loss: 0.3257350027561188, mean loss: 0.33919795190780866
Epoch: 71, step: 1080, loss: 0.3510449528694153, mean loss: 0.3391980662555811
Epoch: 71, step: 1081, loss: 0.34708207845687866, mean loss: 0.33919814235167783
Epoch: 71, step: 1082, loss: 0.3338885009288788, mean loss: 0.33919809110377547
Epoch: 71, step: 1083, loss: 0.30162712931632996, mean loss: 0.3391977284777062
Epoch: 71, step: 1084, loss: 0.3086063861846924, mean loss: 0.3391974332201292
Epoch: 71, step: 1085, loss: 0.35807737708091736, mean loss: 0.3391976154413806
Epoch: 71, step: 1086, loss: 0.29440608620643616, mean loss: 0.3391971831366134
Epoch: 71, step: 1087, loss: 0.3181726336479187, mean loss: 0.3391969802204503
Epoch: 71, step: 1088, loss: 0.3007601797580719, mean loss: 0.3391966092554125
Epoch: 71, step: 1089, loss: 0.37839168310165405, mean loss: 0.3391969875351223
Epoch: 71, step: 1090, loss: 0.33749786019325256, mean loss: 0.33919697113665354
Epoch: 71, step: 1091, loss: 0.34900370240211487, mean loss: 0.33919706578160475
Epoch: 71, step: 1092, loss: 0.36059314012527466, mean loss: 0.3391972722735351
Epoch: 71, step: 1093, loss: 0.3544367253780365, mean loss: 0.33919741934694997
Epoch: 71, step: 1094, loss: 0.2934412956237793, mean loss: 0.3391969777665089
Epoch: 71, step: 1095, loss: 0.3297729194164276, mean loss: 0.33919688681825233
Epoch: 71, step: 1096, loss: 0.32035374641418457, mean loss: 0.33919670497151855
Epoch: 71, step: 1097, loss: 0.3715870976448059, mean loss: 0.339197017553718
Epoch: 71, step: 1098, loss: 0.33637329936027527, mean loss: 0.33919699030380057
Epoch: 71, step: 1099, loss: 0.36971554160118103, mean loss: 0.3391972848161847
Epoch: 71, step: 1100, loss: 0.3298669755458832, mean loss: 0.33919719477701205
Epoch: 71, step: 1101, loss: 0.33693844079971313, mean loss: 0.3391971729798378
Epoch: 71, step: 1102, loss: 0.30092915892601013, mean loss: 0.3391968036937053
Epoch: 71, step: 1103, loss: 0.360870361328125, mean loss: 0.3391970128414032
Epoch: 71, step: 1104, loss: 0.3079359233379364, mean loss: 0.3391967111778775
Epoch: 71, step: 1105, loss: 0.31309574842453003, mean loss: 0.339196459311017
Epoch: 71, step: 1106, loss: 0.30090153217315674, mean loss: 0.33919608977943727
Epoch: 71, step: 1107, loss: 0.32940614223480225, mean loss: 0.33919599531105354
Epoch: 71, step: 1108, loss: 0.29490602016448975, mean loss: 0.33919556793777333
Epoch: 71, step: 1109, loss: 0.34832075238227844, mean loss: 0.3391956559898069
Epoch: 71, step: 1110, loss: 0.3382473289966583, mean loss: 0.33919564683916287
Epoch: 71, step: 1111, loss: 0.31104668974876404, mean loss: 0.339195375225466
Epoch: 71, step: 1112, loss: 0.35602474212646484, mean loss: 0.3391955376130969
Epoch: 71, step: 1113, loss: 0.3255799412727356, mean loss: 0.3391954062366101
Epoch: 71, step: 1114, loss: 0.32450076937675476, mean loss: 0.3391952644498613
Epoch: 71, step: 1115, loss: 0.3177421987056732, mean loss: 0.33919505745385836
Epoch: 71, step: 1116, loss: 0.340324729681015, mean loss: 0.33919506835371677
Epoch: 71, step: 1117, loss: 0.36080074310302734, mean loss: 0.33919527681818823
Epoch: 71, step: 1118, loss: 0.28666970133781433, mean loss: 0.33919477002491244
Epoch: 71, step: 1119, loss: 0.3393971621990204, mean loss: 0.3391947719776755
Epoch: 71, step: 1120, loss: 0.3526042103767395, mean loss: 0.33919490135621183
Epoch: 71, step: 1121, loss: 0.32775482535362244, mean loss: 0.3391947909797766
Epoch: 71, step: 1122, loss: 0.31056392192840576, mean loss: 0.33919451474535545
Epoch: 71, step: 1123, loss: 0.40196019411087036, mean loss: 0.3391951203111104
Epoch: 71, step: 1124, loss: 0.4044778347015381, mean loss: 0.3391957501552419
Epoch: 71, step: 1125, loss: 0.3103426992893219, mean loss: 0.33919547178523834
Epoch: 71, step: 1126, loss: 0.34840863943099976, mean loss: 0.3391955606716711
Epoch: 71, step: 1127, loss: 0.32451826333999634, mean loss: 0.3391954190699912
Epoch: 71, step: 1128, loss: 0.3797592520713806, mean loss: 0.33919581041257657
Epoch: 71, step: 1129, loss: 0.32169079780578613, mean loss: 0.3391956415332993
Epoch: 71, step: 1130, loss: 0.3547804653644562, mean loss: 0.33919579188614124
Epoch: 71, step: 1131, loss: 0.31120598316192627, mean loss: 0.3391955218602023
Epoch: 71, step: 1132, loss: 0.3512514531612396, mean loss: 0.3391956381662048
Epoch: 71, step: 1133, loss: 0.34484899044036865, mean loss: 0.33919569270470906
Epoch: 71, step: 1134, loss: 0.31609073281288147, mean loss: 0.33919546981079834
Epoch: 71, step: 1135, loss: 0.34319111704826355, mean loss: 0.3391955083564981
Epoch: 71, step: 1136, loss: 0.34168383479118347, mean loss: 0.3391955323609591
Epoch: 71, step: 1137, loss: 0.32131868600845337, mean loss: 0.33919535990773275
Epoch: 71, step: 1138, loss: 0.3108028173446655, mean loss: 0.339195086014998
Epoch: 71, step: 1139, loss: 0.3291431963443756, mean loss: 0.33919498904893775
Epoch: 71, step: 1140, loss: 0.2969357967376709, mean loss: 0.33919458139744196
Epoch: 71, step: 1141, loss: 0.32272785902023315, mean loss: 0.33919442255343935
Epoch: 71, step: 1142, loss: 0.32924672961235046, mean loss: 0.3391943265952951
Epoch: 71, step: 1143, loss: 0.32228127121925354, mean loss: 0.33919416344894926
Epoch: 71, step: 1144, loss: 0.32125282287597656, mean loss: 0.3391939903852506
Epoch: 71, step: 1145, loss: 0.3162963092327118, mean loss: 0.33919376951439933
Epoch: 71, step: 1146, loss: 0.3431314527988434, mean loss: 0.33919380749689476
Epoch: 71, step: 1147, loss: 0.33467957377433777, mean loss: 0.339193763953472
Epoch: 71, step: 1148, loss: 0.3229042589664459, mean loss: 0.3391936068295826
Epoch: 71, step: 1149, loss: 0.3084293007850647, mean loss: 0.3391933100887793
Epoch: 71, step: 1150, loss: 0.31973323225975037, mean loss: 0.33919312238607535
Epoch: 71, step: 1151, loss: 0.3082035779953003, mean loss: 0.33919282347847485
Epoch: 71, step: 1152, loss: 0.31243422627449036, mean loss: 0.339192565382685
Epoch: 71, step: 1153, loss: 0.36096128821372986, mean loss: 0.3391927753474107
Epoch: 71, step: 1154, loss: 0.30893608927726746, mean loss: 0.33919248351699116
Epoch: 71, step: 1155, loss: 0.3108849823474884, mean loss: 0.339192210489395
Epoch: 71, step: 1156, loss: 0.28179818391799927, mean loss: 0.33919165692580505
Epoch: 71, step: 1157, loss: 0.35195493698120117, mean loss: 0.33919178002605443
Epoch: 71, step: 1158, loss: 0.2804173231124878, mean loss: 0.3391912131591919
Epoch: 71, step: 1159, loss: 0.3299199938774109, mean loss: 0.3391911237411594
Epoch: 71, step: 1160, loss: 0.3651401698589325, mean loss: 0.33919137400924176
Epoch: 71, step: 1161, loss: 0.34154626727104187, mean loss: 0.3391913967210183
Epoch: 71, step: 1162, loss: 0.3641534745693207, mean loss: 0.33919163746554604
Epoch: 71, step: 1163, loss: 0.37245628237724304, mean loss: 0.3391919582803454
Epoch: 71, step: 1164, loss: 0.30669474601745605, mean loss: 0.33919164486993286
Epoch: 71, step: 1165, loss: 0.36091145873069763, mean loss: 0.3391918543386749
Epoch: 71, step: 1166, loss: 0.35278481245040894, mean loss: 0.33919198542968676
Epoch: 71, step: 1167, loss: 0.3128255605697632, mean loss: 0.3391917311533216
Epoch: 71, step: 1168, loss: 0.3178297281265259, mean loss: 0.33919152514131473
Epoch: 71, step: 1169, loss: 0.3468741774559021, mean loss: 0.33919159923096615
Epoch: 71, step: 1170, loss: 0.35549989342689514, mean loss: 0.33919175650271693
Epoch: 71, step: 1171, loss: 0.3411427140235901, mean loss: 0.33919177531691924
Epoch: 71, step: 1172, loss: 0.35089433193206787, mean loss: 0.33919188817029605
Epoch: 71, step: 1173, loss: 0.3467075526714325, mean loss: 0.3391919606467614
Epoch: 71, step: 1174, loss: 0.32836490869522095, mean loss: 0.33919185623831044
Epoch: 71, step: 1175, loss: 0.31331226229667664, mean loss: 0.3391916066761702
Epoch: 71, step: 1176, loss: 0.3830569386482239, mean loss: 0.3391920296743281
Epoch: 71, step: 1177, loss: 0.3428024649620056, mean loss: 0.33919206448981176
Epoch: 71, step: 1178, loss: 0.33909517526626587, mean loss: 0.33919206355551645
Epoch: 71, step: 1179, loss: 0.3419455885887146, mean loss: 0.3391920901072891
Epoch: 71, step: 1180, loss: 0.3596271276473999, mean loss: 0.3391922871569737
Epoch: 71, step: 1181, loss: 0.314799427986145, mean loss: 0.33919205194532565
Epoch: 71, step: 1182, loss: 0.34235909581184387, mean loss: 0.3391920824837065
Epoch: 71, step: 1183, loss: 0.348488450050354, mean loss: 0.33919217212353725
Epoch: 71, step: 1184, loss: 0.2913241684436798, mean loss: 0.33919171056278863
Epoch: 71, step: 1185, loss: 0.35629504919052124, mean loss: 0.339191875477827
Epoch: 71, step: 1186, loss: 0.3111822009086609, mean loss: 0.33919160540353815
Epoch: 71, step: 1187, loss: 0.3156750202178955, mean loss: 0.33919137865460663
Epoch: 71, step: 1188, loss: 0.3013136088848114, mean loss: 0.339191013437423
Epoch: 71, step: 1189, loss: 0.3453653156757355, mean loss: 0.33919107296942674
Epoch: 71, step: 1190, loss: 0.3240758180618286, mean loss: 0.33919092723105804
Epoch: 71, step: 1191, loss: 0.3132146894931793, mean loss: 0.33919067677560527
Epoch: 71, step: 1192, loss: 0.32721617817878723, mean loss: 0.33919056132202874
Epoch: 71, step: 1193, loss: 0.34371858835220337, mean loss: 0.33919060497912806
Epoch: 71, step: 1194, loss: 0.3313767611980438, mean loss: 0.3391905296424609
Epoch: 71, step: 1195, loss: 0.3423382639884949, mean loss: 0.33919055999084446
Epoch: 71, step: 1196, loss: 0.3644487261772156, mean loss: 0.33919080351111697
Epoch: 71, step: 1197, loss: 0.32124635577201843, mean loss: 0.339190630505894
Epoch: 71, step: 1198, loss: 0.3229652941226959, mean loss: 0.3391904740764002
Epoch: 71, step: 1199, loss: 0.3866039216518402, mean loss: 0.3391909311880385
Epoch: 71, step: 1200, loss: 0.32226860523223877, mean loss: 0.33919076804197
Epoch: 71, step: 1201, loss: 0.3290318250656128, mean loss: 0.3391906701017913
Epoch: 71, step: 1202, loss: 0.3394854962825775, mean loss: 0.3391906729441196
Epoch: 71, step: 1203, loss: 0.3216082751750946, mean loss: 0.33919050343928225
Epoch: 71, step: 1204, loss: 0.31728509068489075, mean loss: 0.33919029226002906
Epoch: 71, step: 1205, loss: 0.31888818740844727, mean loss: 0.33919009653936144
Epoch: 71, step: 1206, loss: 0.3451027572154999, mean loss: 0.3391901535393005
Epoch: 71, step: 1207, loss: 0.3469642400741577, mean loss: 0.33919022848325736
Epoch: 71, step: 1208, loss: 0.325528621673584, mean loss: 0.33919009678353973
Epoch: 71, step: 1209, loss: 0.34974831342697144, mean loss: 0.33919019856517973
Epoch: 71, step: 1210, loss: 0.3292066752910614, mean loss: 0.33919010232453506
Epoch: 71, step: 1211, loss: 0.3448825180530548, mean loss: 0.33919015719859735
Epoch: 71, step: 1212, loss: 0.32083770632743835, mean loss: 0.3391899802853372
Epoch: 71, step: 1213, loss: 0.33327314257621765, mean loss: 0.3391899232489792
Epoch: 71, step: 1214, loss: 0.3384639024734497, mean loss: 0.33918991625044653
Epoch: 71, step: 1215, loss: 0.32904699444770813, mean loss: 0.33918981847792096
Epoch: 71, step: 1216, loss: 0.3357961177825928, mean loss: 0.33918978576471503
Epoch: 71, step: 1217, loss: 0.3801403045654297, mean loss: 0.33919018049894806
Epoch: 71, step: 1218, loss: 0.3434031009674072, mean loss: 0.3391902211081503
Epoch: 71, step: 1219, loss: 0.33907049894332886, mean loss: 0.33919021995413495
Epoch: 71, step: 1220, loss: 0.31412261724472046, mean loss: 0.33918997832704245
Epoch: 71, step: 1221, loss: 0.303437203168869, mean loss: 0.3391896337086942
Epoch: 71, step: 1222, loss: 0.3058345913887024, mean loss: 0.3391893122050139
Epoch: 71, step: 1223, loss: 0.3189554810523987, mean loss: 0.33918911717637573
Epoch: 71, step: 1224, loss: 0.34024903178215027, mean loss: 0.3391891273925186
Epoch: 71, step: 1225, loss: 0.38582590222358704, mean loss: 0.3391895769036013
Epoch: 71, step: 1226, loss: 0.3420115113258362, mean loss: 0.33918960410270704
Epoch: 71, step: 1227, loss: 0.3330182731151581, mean loss: 0.33918954462114537
Epoch: 71, step: 1228, loss: 0.32476183772087097, mean loss: 0.33918940556293115
Epoch: 71, step: 1229, loss: 0.32268843054771423, mean loss: 0.33918924652352045
Epoch: 71, step: 1230, loss: 0.30787399411201477, mean loss: 0.33918894470430777
Epoch: 71, step: 1231, loss: 0.3448142111301422, mean loss: 0.3391889989206078
Epoch: 71, step: 1232, loss: 0.321770578622818, mean loss: 0.339188831043546
Epoch: 71, step: 1233, loss: 0.3439794182777405, mean loss: 0.33918887721432067
Epoch: 71, step: 1234, loss: 0.31446272134780884, mean loss: 0.3391886389105989
Epoch: 71, step: 1235, loss: 0.30184048414230347, mean loss: 0.339188278963078
Epoch: 71, step: 1236, loss: 0.3485772907733917, mean loss: 0.3391883694499836
Epoch: 71, step: 1237, loss: 0.3773486018180847, mean loss: 0.3391887372169153
Epoch: 71, step: 1238, loss: 0.3227657675743103, mean loss: 0.33918857894306387
Epoch: 71, step: 1239, loss: 0.3300074338912964, mean loss: 0.33918849046203914
Epoch: 71, step: 1240, loss: 0.3234555423259735, mean loss: 0.3391883388410866
Epoch: 71, step: 1241, loss: 0.35855549573898315, mean loss: 0.339188525483695
Epoch: 71, step: 1242, loss: 0.306404709815979, mean loss: 0.3391882095468782
Epoch: 71, step: 1243, loss: 0.31545770168304443, mean loss: 0.3391879808587676
Epoch: 71, step: 1244, loss: 0.38431692123413086, mean loss: 0.3391884157568622
Epoch: 71, step: 1245, loss: 0.30446651577949524, mean loss: 0.3391880811524488
Epoch: 71, step: 1246, loss: 0.347716748714447, mean loss: 0.339188163339838
Epoch: 71, step: 1247, loss: 0.3287062644958496, mean loss: 0.3391880623309064
Epoch: 71, step: 1248, loss: 0.30686870217323303, mean loss: 0.33918775088804404
Epoch: 71, step: 1249, loss: 0.31383538246154785, mean loss: 0.33918750658438007
Epoch: 71, step: 1250, loss: 0.3402338922023773, mean loss: 0.3391875166675949
Epoch: 71, step: 1251, loss: 0.36931413412094116, mean loss: 0.3391878069718796
Epoch: 71, step: 1252, loss: 0.31845197081565857, mean loss: 0.3391876071603977
Epoch: 71, step: 1253, loss: 0.31857770681381226, mean loss: 0.3391874085643528
Epoch: 71, step: 1254, loss: 0.3664231300354004, mean loss: 0.33918767100397423
Epoch: 71, step: 1255, loss: 0.32865238189697266, mean loss: 0.3391875694883729
Epoch: 71, step: 1256, loss: 0.31022608280181885, mean loss: 0.3391872904248961
Epoch: 71, step: 1257, loss: 0.3093029856681824, mean loss: 0.3391870024722188
Epoch: 71, step: 1258, loss: 0.3512265980243683, mean loss: 0.3391871184796145
Epoch: 71, step: 1259, loss: 0.32584279775619507, mean loss: 0.3391869899017921
Epoch: 71, step: 1260, loss: 0.3536375164985657, mean loss: 0.3391871291370052
Epoch: 71, step: 1261, loss: 0.3450147211551666, mean loss: 0.3391871852870834
Epoch: 71, step: 1262, loss: 0.33013397455215454, mean loss: 0.339187098058329
Epoch: 71, step: 1263, loss: 0.30086323618888855, mean loss: 0.33918672880695244
Epoch: 71, step: 1264, loss: 0.30408233404159546, mean loss: 0.33918639057848154
Epoch: 71, step: 1265, loss: 0.34339913725852966, mean loss: 0.33918643116762
Epoch: 71, step: 1266, loss: 0.3172963559627533, mean loss: 0.339186220262289
Epoch: 71, step: 1267, loss: 0.3225274682044983, mean loss: 0.33918605976097815
Epoch: 71, step: 1268, loss: 0.32503390312194824, mean loss: 0.33918592341116033
Epoch: 71, step: 1269, loss: 0.3501231074333191, mean loss: 0.3391860287851128
Epoch: 71, step: 1270, loss: 0.3310227692127228, mean loss: 0.33918595013720515
Epoch: 71, step: 1271, loss: 0.3137757182121277, mean loss: 0.33918570532784903
Epoch: 71, step: 1272, loss: 0.3363919258117676, mean loss: 0.3391856784120469
Epoch: 71, step: 1273, loss: 0.3007754385471344, mean loss: 0.3391853083640704
Epoch: 71, step: 1274, loss: 0.3305065631866455, mean loss: 0.33918522475300306
Epoch: 71, step: 1275, loss: 0.3363184630870819, mean loss: 0.33918519713487527
Epoch: 71, step: 1276, loss: 0.3130233585834503, mean loss: 0.33918494509646957
Epoch: 71, step: 1277, loss: 0.34907102584838867, mean loss: 0.33918504033626024
Epoch: 71, step: 1278, loss: 0.2952163517475128, mean loss: 0.33918461675805356
Epoch: 71, step: 1279, loss: 0.3191594183444977, mean loss: 0.339184423844501
Epoch: 71, step: 1280, loss: 0.329789400100708, mean loss: 0.3391843333380346
Epoch: 71, step: 1281, loss: 0.30441412329673767, mean loss: 0.3391839983842743
Epoch: 71, step: 1282, loss: 0.29012784361839294, mean loss: 0.3391835258134962
Epoch: 71, step: 1283, loss: 0.35156795382499695, mean loss: 0.3391836451147833
Epoch: 71, step: 1284, loss: 0.3292787969112396, mean loss: 0.33918354970062653
Epoch: 71, step: 1285, loss: 0.3318559229373932, mean loss: 0.33918347911372004
Epoch: 71, step: 1286, loss: 0.3413068950176239, mean loss: 0.33918349956835303
Epoch: 71, step: 1287, loss: 0.3038259446620941, mean loss: 0.3391831589761777
Epoch: 71, step: 1288, loss: 0.31299492716789246, mean loss: 0.33918290671266726
Epoch: 71, step: 1289, loss: 0.3397344946861267, mean loss: 0.3391829120259003
Epoch: 71, step: 1290, loss: 0.370837539434433, mean loss: 0.33918321693971243
Epoch: 71, step: 1291, loss: 0.3343561291694641, mean loss: 0.3391831704431438
Epoch: 71, step: 1292, loss: 0.31413811445236206, mean loss: 0.339182929200804
Epoch: 71, step: 1293, loss: 0.29118695855140686, mean loss: 0.3391824668920459
Epoch: 71, step: 1294, loss: 0.31813478469848633, mean loss: 0.3391822641576505
Epoch: 71, step: 1295, loss: 0.3336055278778076, mean loss: 0.33918221044221725
Epoch: 71, step: 1296, loss: 0.36186182498931885, mean loss: 0.33918242889141875
Epoch: 71, step: 1297, loss: 0.34180134534835815, mean loss: 0.3391824541164814
Epoch: 71, step: 1298, loss: 0.32671651244163513, mean loss: 0.33918233404730913
Epoch: 71, step: 1299, loss: 0.35350632667541504, mean loss: 0.3391824720114853
Epoch: 71, step: 1300, loss: 0.36212027072906494, mean loss: 0.3391826929389952
Epoch: 71, step: 1301, loss: 0.3319646120071411, mean loss: 0.339182623418057
Epoch: 71, step: 1302, loss: 0.3048737943172455, mean loss: 0.3391822929757915
Epoch: 71, step: 1303, loss: 0.30342918634414673, mean loss: 0.33918194862641915
Epoch: 71, step: 1304, loss: 0.3480668067932129, mean loss: 0.33918203419844783
Epoch: 71, step: 1305, loss: 0.3298148810863495, mean loss: 0.33918194398219903
Epoch: 71, step: 1306, loss: 0.32888731360435486, mean loss: 0.33918184483425307
Epoch: 71, step: 1307, loss: 0.2914436459541321, mean loss: 0.33918138507041456
Epoch: 71, step: 1308, loss: 0.34293171763420105, mean loss: 0.3391814211893032
Epoch: 71, step: 1309, loss: 0.38621774315834045, mean loss: 0.33918187418468015
Epoch: 71, step: 1310, loss: 0.3435530662536621, mean loss: 0.3391819162821624
Epoch: 71, step: 1311, loss: 0.3210596740245819, mean loss: 0.33918174175461646
Epoch: 71, step: 1312, loss: 0.30644193291664124, mean loss: 0.3391814264545901
Epoch: 71, step: 1313, loss: 0.3040253221988678, mean loss: 0.33918108788774315
Epoch: 71, step: 1314, loss: 0.3401920199394226, mean loss: 0.33918109762331505
Epoch: 71, step: 1315, loss: 0.3265731930732727, mean loss: 0.33918097620666876
Epoch: 71, step: 1316, loss: 0.3172857165336609, mean loss: 0.3391807653529629
Epoch: 71, step: 1317, loss: 0.3134559690952301, mean loss: 0.3391805176227934
Epoch: 71, step: 1318, loss: 0.38032105565071106, mean loss: 0.3391809138029695
Epoch: 71, step: 1319, loss: 0.359225332736969, mean loss: 0.33918110682730346
Epoch: 71, step: 1320, loss: 0.3298726975917816, mean loss: 0.3391810171897741
Epoch: 71, step: 1321, loss: 0.34941616654396057, mean loss: 0.3391811157506176
Epoch: 71, step: 1322, loss: 0.339496910572052, mean loss: 0.33918111879157997
Epoch: 71, step: 1323, loss: 0.31925177574157715, mean loss: 0.3391809268827993
Epoch: 71, step: 1324, loss: 0.3472653329372406, mean loss: 0.3391810047305018
Epoch: 71, step: 1325, loss: 0.3507033586502075, mean loss: 0.3391811156823932
Epoch: 71, step: 1326, loss: 0.31333115696907043, mean loss: 0.3391808667684808
Epoch: 71, step: 1327, loss: 0.32018402218818665, mean loss: 0.3391806838462012
Epoch: 71, step: 1328, loss: 0.3033280074596405, mean loss: 0.33918033862096564
Epoch: 71, step: 1329, loss: 0.32538312673568726, mean loss: 0.33918020576896296
Epoch: 71, step: 1330, loss: 0.31660303473472595, mean loss: 0.3391799883776863
Epoch: 71, step: 1331, loss: 0.3603624403476715, mean loss: 0.339180192337515
Epoch: 71, step: 1332, loss: 0.3674454689025879, mean loss: 0.3391804644932346
Epoch: 71, step: 1333, loss: 0.30701377987861633, mean loss: 0.3391801547753061
Epoch: 71, step: 1334, loss: 0.2950976490974426, mean loss: 0.3391797303296088
Epoch: 71, step: 1335, loss: 0.31764572858810425, mean loss: 0.33917952299279247
Epoch: 71, step: 1336, loss: 0.33078065514564514, mean loss: 0.3391794421263667
Epoch: 71, step: 1337, loss: 0.32608985900878906, mean loss: 0.3391793160977603
Epoch: 71, step: 1338, loss: 0.29911696910858154, mean loss: 0.33917893037476954
Epoch: 71, step: 1339, loss: 0.31302133202552795, mean loss: 0.3391786785300654
Epoch: 71, step: 1340, loss: 0.32339778542518616, mean loss: 0.33917852659348324
Epoch: 71, step: 1341, loss: 0.32180172204971313, mean loss: 0.3391783592932643
Epoch: 71, step: 1342, loss: 0.34480294585227966, mean loss: 0.3391784134450792
Epoch: 71, step: 1343, loss: 0.29420962929725647, mean loss: 0.3391779805034211
Epoch: 71, step: 1344, loss: 0.3653291165828705, mean loss: 0.3391782322737864
Epoch: 71, step: 1345, loss: 0.31973132491111755, mean loss: 0.3391780450502631
Epoch: 71, step: 1346, loss: 0.3153546154499054, mean loss: 0.3391778156943351
Epoch: 71, step: 1347, loss: 0.31617945432662964, mean loss: 0.33917759428373967
Epoch: 71, step: 1348, loss: 0.2942303419113159, mean loss: 0.33917716157021094
Epoch: 71, step: 1349, loss: 0.3235834836959839, mean loss: 0.33917701144912316
Epoch: 71, step: 1350, loss: 0.34590378403663635, mean loss: 0.33917707620746335
Epoch: 71, step: 1351, loss: 0.3390945792198181, mean loss: 0.3391770754132762
Epoch: 71, step: 1352, loss: 0.3831421434879303, mean loss: 0.33917749865487995
Epoch: 71, step: 1353, loss: 0.353588342666626, mean loss: 0.339177637383427
Epoch: 71, step: 1354, loss: 0.32669728994369507, mean loss: 0.3391775172403043
Epoch: 71, step: 1355, loss: 0.33432716131210327, mean loss: 0.33917747054839126
Epoch: 71, step: 1356, loss: 0.32697364687919617, mean loss: 0.33917735306950997
Epoch: 71, step: 1357, loss: 0.3158027231693268, mean loss: 0.33917712805815187
Epoch: 71, step: 1358, loss: 0.3092857897281647, mean loss: 0.33917684031772916
Epoch: 71, step: 1359, loss: 0.3414023220539093, mean loss: 0.3391768617404866
Epoch: 71, step: 1360, loss: 0.34991151094436646, mean loss: 0.3391769650725288
Epoch: 71, step: 1361, loss: 0.3200163245201111, mean loss: 0.33917678063342677
Epoch: 71, step: 1362, loss: 0.3272685110569, mean loss: 0.3391766660062879
Epoch: 71, step: 1363, loss: 0.30293911695480347, mean loss: 0.3391763171926708
Epoch: 71, step: 1364, loss: 0.3684186041355133, mean loss: 0.3391765986689285
Epoch: 71, step: 1365, loss: 0.28904032707214355, mean loss: 0.33917611607896225
Epoch: 71, step: 1366, loss: 0.3451303243637085, mean loss: 0.33917617339103245
Epoch: 71, step: 1367, loss: 0.3354259431362152, mean loss: 0.3391761372936404
Epoch: 71, step: 1368, loss: 0.3059239387512207, mean loss: 0.33917581723166756
Epoch: 71, step: 1369, loss: 0.3526149392127991, mean loss: 0.33917594658583605
Epoch: 71, step: 1370, loss: 0.303062379360199, mean loss: 0.3391755989890583
Epoch: 71, step: 1371, loss: 0.3249174952507019, mean loss: 0.3391754617546726
Epoch: 71, step: 1372, loss: 0.3379121720790863, mean loss: 0.33917544959561435
Epoch: 71, step: 1373, loss: 0.3597364127635956, mean loss: 0.33917564749127327
Epoch: 71, step: 1374, loss: 0.28742945194244385, mean loss: 0.33917514944802407
Epoch: 71, step: 1375, loss: 0.3180829584598541, mean loss: 0.3391749464432985
Epoch: 71, step: 1376, loss: 0.3263093829154968, mean loss: 0.3391748226180848
Epoch: 71, step: 1377, loss: 0.357498437166214, mean loss: 0.3391749989728667
Epoch: 71, step: 1378, loss: 0.3341802954673767, mean loss: 0.33917495090203614
Epoch: 71, step: 1379, loss: 0.3137400150299072, mean loss: 0.3391747061093826
Epoch: 71, step: 1380, loss: 0.3402010202407837, mean loss: 0.33917471598681037
Epoch: 71, step: 1381, loss: 0.33077237010002136, mean loss: 0.3391746351219336
Epoch: 71, step: 1382, loss: 0.34671542048454285, mean loss: 0.3391747076943817
Epoch: 71, step: 1383, loss: 0.3239215612411499, mean loss: 0.3391745608996551
Epoch: 71, step: 1384, loss: 0.3336426317691803, mean loss: 0.3391745076614454
Epoch: 71, step: 1385, loss: 0.36483779549598694, mean loss: 0.33917475463755775
Epoch: 71, step: 1386, loss: 0.3515169620513916, mean loss: 0.3391748734142745
Epoch: 71, step: 1387, loss: 0.314561665058136, mean loss: 0.33917463654838453
Epoch: 71, step: 1388, loss: 0.3467140197753906, mean loss: 0.3391747091031489
Epoch: 71, step: 1389, loss: 0.31851503252983093, mean loss: 0.33917451028800777
Epoch: 71, step: 1390, loss: 0.2876521646976471, mean loss: 0.33917401447560735
Epoch: 71, step: 1391, loss: 0.31430134177207947, mean loss: 0.3391737751219688
Epoch: 71, step: 1392, loss: 0.28783077001571655, mean loss: 0.3391732810449159
Epoch: 71, step: 1393, loss: 0.33406761288642883, mean loss: 0.33917323191321436
Epoch: 71, step: 1394, loss: 0.3019067943096161, mean loss: 0.3391728733027812
Epoch: 71, step: 1395, loss: 0.31324058771133423, mean loss: 0.33917262376192675
Epoch: 71, step: 1396, loss: 0.3177371323108673, mean loss: 0.3391724174947483
Epoch: 71, step: 1397, loss: 0.3134641647338867, mean loss: 0.33917217011447504
Epoch: 71, step: 1398, loss: 0.2949078381061554, mean loss: 0.3391717441805431
Epoch: 71, step: 1399, loss: 0.35031798481941223, mean loss: 0.3391718514343116
Epoch: 71, step: 1400, loss: 0.35626280307769775, mean loss: 0.3391720158889822
Epoch: 71, step: 1401, loss: 0.33387547731399536, mean loss: 0.3391719649244635
Epoch: 71, step: 1402, loss: 0.3339046537876129, mean loss: 0.3391719142416656
Epoch: 71, step: 1403, loss: 0.3084567189216614, mean loss: 0.3391716186986424
Epoch: 71, step: 1404, loss: 0.3148350417613983, mean loss: 0.339171384533232
Epoch: 71, step: 1405, loss: 0.29070696234703064, mean loss: 0.33917091821530465
Epoch: 71, step: 1406, loss: 0.4348745048046112, mean loss: 0.3391718390530392
Epoch: 71, step: 1407, loss: 0.3378441631793976, mean loss: 0.3391718262785725
Epoch: 71, step: 1408, loss: 0.3566257655620575, mean loss: 0.33917199421310035
Epoch: 71, step: 1409, loss: 0.3710438907146454, mean loss: 0.33917230086825173
Epoch: 71, step: 1410, loss: 0.3629096746444702, mean loss: 0.33917252925497204
Epoch: 71, step: 1411, loss: 0.3056607246398926, mean loss: 0.3391722068276647
Epoch: 71, step: 1412, loss: 0.36576399207115173, mean loss: 0.3391724626728906
Epoch: 71, step: 1413, loss: 0.31784680485725403, mean loss: 0.33917225749617164
Epoch: 71, step: 1414, loss: 0.2906687557697296, mean loss: 0.3391717908426371
Epoch: 71, step: 1415, loss: 0.3591497838497162, mean loss: 0.3391719830496123
Epoch: 71, step: 1416, loss: 0.3102715313434601, mean loss: 0.3391717050029156
Epoch: 71, step: 1417, loss: 0.3384641408920288, mean loss: 0.33917169819561815
Epoch: 71, step: 1418, loss: 0.38846060633659363, mean loss: 0.3391721723873207
Epoch: 71, step: 1419, loss: 0.32678496837615967, mean loss: 0.3391720532154204
Epoch: 71, step: 1420, loss: 0.3588517904281616, mean loss: 0.33917224254378836
Epoch: 71, step: 1421, loss: 0.32211095094680786, mean loss: 0.3391720784076831
Epoch: 71, step: 1422, loss: 0.3261556029319763, mean loss: 0.3391719531854499
Epoch: 71, step: 1423, loss: 0.3548499345779419, mean loss: 0.3391721040106836
Epoch: 71, step: 1424, loss: 0.3218104839324951, mean loss: 0.3391719369901247
Epoch: 71, step: 1425, loss: 0.32314160466194153, mean loss: 0.3391717827781735
Epoch: 71, step: 1426, loss: 0.39987900853157043, mean loss: 0.3391723667766512
Epoch: 71, step: 1427, loss: 0.37347909808158875, mean loss: 0.3391726968013867
Epoch: 71, step: 1428, loss: 0.34266483783721924, mean loss: 0.3391727303948475
Epoch: 71, step: 1429, loss: 0.343516081571579, mean loss: 0.33917277217631986
Epoch: 71, step: 1430, loss: 0.3434959053993225, mean loss: 0.33917281376290276
Epoch: 71, step: 1431, loss: 0.3597061336040497, mean loss: 0.3391730112822363
Epoch: 71, step: 1432, loss: 0.3724389672279358, mean loss: 0.3391733312795039
Epoch: 71, step: 1433, loss: 0.41434311866760254, mean loss: 0.3391740543579335
Epoch: 71, step: 1434, loss: 0.31900593638420105, mean loss: 0.3391738603572412
Epoch: 71, step: 1435, loss: 0.3510814905166626, mean loss: 0.33917397489773904
Epoch: 71, step: 1436, loss: 0.30995768308639526, mean loss: 0.3391736938664695
Epoch: 71, step: 1437, loss: 0.3052982687950134, mean loss: 0.33917336802216996
Epoch: 71, step: 1438, loss: 0.36002546548843384, mean loss: 0.33917356859446457
Epoch: 71, step: 1439, loss: 0.3279273509979248, mean loss: 0.339173460420312
Epoch: 71, step: 1440, loss: 0.3200986981391907, mean loss: 0.3391732769473905
Epoch: 71, step: 1441, loss: 0.3559824228286743, mean loss: 0.3391734386266499
Epoch: 71, step: 1442, loss: 0.31871306896209717, mean loss: 0.33917324182988107
Epoch: 71, step: 1443, loss: 0.34687402844429016, mean loss: 0.3391733158986966
Valid: 71, mean loss: 0.1849007954200109
Epoch: 72, step: 0, loss: 0.32742542028427124, mean loss: 0.3391732029044809
Epoch: 72, step: 1, loss: 0.3115202486515045, mean loss: 0.3391729369339677
Epoch: 72, step: 2, loss: 0.34057044982910156, mean loss: 0.3391729503753398
Epoch: 72, step: 3, loss: 0.3276577591896057, mean loss: 0.33917283962252953
Epoch: 72, step: 4, loss: 0.29374960064888, mean loss: 0.3391724027471968
Epoch: 72, step: 5, loss: 0.3039678633213043, mean loss: 0.33917206415736256
Epoch: 72, step: 6, loss: 0.33125314116477966, mean loss: 0.33917198799556414
Epoch: 72, step: 7, loss: 0.36259621381759644, mean loss: 0.3391722132804936
Epoch: 72, step: 8, loss: 0.31893786787986755, mean loss: 0.33917201867644264
Epoch: 72, step: 9, loss: 0.3428521156311035, mean loss: 0.33917205406947726
Epoch: 72, step: 10, loss: 0.34509527683258057, mean loss: 0.33917211103504497
Epoch: 72, step: 11, loss: 0.372076153755188, mean loss: 0.3391724274809261
Epoch: 72, step: 12, loss: 0.3786619305610657, mean loss: 0.33917280725706866
Epoch: 72, step: 13, loss: 0.32746803760528564, mean loss: 0.3391726946917242
Epoch: 72, step: 14, loss: 0.29015955328941345, mean loss: 0.3391722233344696
Epoch: 72, step: 15, loss: 0.34831660985946655, mean loss: 0.3391723112747924
Epoch: 72, step: 16, loss: 0.3419875204563141, mean loss: 0.33917233834801624
Epoch: 72, step: 17, loss: 0.3273610472679138, mean loss: 0.3391722247626194
Epoch: 72, step: 18, loss: 0.3076575994491577, mean loss: 0.33917192169949306
Epoch: 72, step: 19, loss: 0.3390330374240875, mean loss: 0.33917192036391325
Epoch: 72, step: 20, loss: 0.29831093549728394, mean loss: 0.3391715274282675
Epoch: 72, step: 21, loss: 0.29933053255081177, mean loss: 0.3391711443049395
Epoch: 72, step: 22, loss: 0.33976009488105774, mean loss: 0.3391711499684159
Epoch: 72, step: 23, loss: 0.33603769540786743, mean loss: 0.3391711198367273
Epoch: 72, step: 24, loss: 0.3317035138607025, mean loss: 0.3391710480279904
Epoch: 72, step: 25, loss: 0.33932262659072876, mean loss: 0.3391710494855607
Epoch: 72, step: 26, loss: 0.3386806845664978, mean loss: 0.3391710447702867
Epoch: 72, step: 27, loss: 0.33860740065574646, mean loss: 0.3391710393504233
Epoch: 72, step: 28, loss: 0.3052937388420105, mean loss: 0.33917071359775247
Epoch: 72, step: 29, loss: 0.3535262942314148, mean loss: 0.3391708516348362
Epoch: 72, step: 30, loss: 0.32639843225479126, mean loss: 0.3391707288219305
Epoch: 72, step: 31, loss: 0.3127916157245636, mean loss: 0.33917047517661225
Epoch: 72, step: 32, loss: 0.3446235656738281, mean loss: 0.33917052760967054
Epoch: 72, step: 33, loss: 0.3333202600479126, mean loss: 0.33917047135817957
Epoch: 72, step: 34, loss: 0.2879958748817444, mean loss: 0.33916997930894566
Epoch: 72, step: 35, loss: 0.3103041648864746, mean loss: 0.3391697017637126
Epoch: 72, step: 36, loss: 0.3874179422855377, mean loss: 0.3391701656667992
Epoch: 72, step: 37, loss: 0.3403691053390503, mean loss: 0.33917017719440024
Epoch: 72, step: 38, loss: 0.3430767059326172, mean loss: 0.3391702147546485
Epoch: 72, step: 39, loss: 0.303920179605484, mean loss: 0.33916987583807334
Epoch: 72, step: 40, loss: 0.35581329464912415, mean loss: 0.3391700358570987
Epoch: 72, step: 41, loss: 0.3122241497039795, mean loss: 0.33916977678695015
Epoch: 72, step: 42, loss: 0.30498597025871277, mean loss: 0.33916944813126443
Epoch: 72, step: 43, loss: 0.340733140707016, mean loss: 0.3391694631650353
Epoch: 72, step: 44, loss: 0.3224323093891144, mean loss: 0.33916930225097863
Epoch: 72, step: 45, loss: 0.3729231357574463, mean loss: 0.3391696267633857
Epoch: 72, step: 46, loss: 0.37760990858078003, mean loss: 0.33916999632817746
Epoch: 72, step: 47, loss: 0.32215580344200134, mean loss: 0.33916983275533397
Epoch: 72, step: 48, loss: 0.3757225573062897, mean loss: 0.33917018416639705
Epoch: 72, step: 49, loss: 0.3428414463996887, mean loss: 0.33917021946088677
Epoch: 72, step: 50, loss: 0.31535306572914124, mean loss: 0.3391699904916241
Epoch: 72, step: 51, loss: 0.3521921932697296, mean loss: 0.3391701156810375
Epoch: 72, step: 52, loss: 0.4021437168121338, mean loss: 0.33917072107419016
Epoch: 72, step: 53, loss: 0.34993842244148254, mean loss: 0.3391708245878831
Epoch: 72, step: 54, loss: 0.3391283452510834, mean loss: 0.33917082417951827
Epoch: 72, step: 55, loss: 0.3131018579006195, mean loss: 0.339170573574213
Epoch: 72, step: 56, loss: 0.31475913524627686, mean loss: 0.3391703389052553
Epoch: 72, step: 57, loss: 0.2916705012321472, mean loss: 0.3391698822902006
Epoch: 72, step: 58, loss: 0.3069365620613098, mean loss: 0.3391695724348724
Epoch: 72, step: 59, loss: 0.31578487157821655, mean loss: 0.33916934764250056
Epoch: 72, step: 60, loss: 0.2995423376560211, mean loss: 0.3391689667197772
Epoch: 72, step: 61, loss: 0.31813737750053406, mean loss: 0.3391687645512756
Epoch: 72, step: 62, loss: 0.2920762598514557, mean loss: 0.33916831187366314
Epoch: 72, step: 63, loss: 0.3036651313304901, mean loss: 0.3391679706019338
Epoch: 72, step: 64, loss: 0.3527906835079193, mean loss: 0.3391681015480077
Epoch: 72, step: 65, loss: 0.3161344528198242, mean loss: 0.3391678801429985
Epoch: 72, step: 66, loss: 0.389680951833725, mean loss: 0.33916836568220826
Epoch: 72, step: 67, loss: 0.34212982654571533, mean loss: 0.33916839414794
Epoch: 72, step: 68, loss: 0.30197611451148987, mean loss: 0.3391680366570508
Epoch: 72, step: 69, loss: 0.36021679639816284, mean loss: 0.3391682389750475
Epoch: 72, step: 70, loss: 0.3115958273410797, mean loss: 0.33916797395508735
Epoch: 72, step: 71, loss: 0.3389209806919098, mean loss: 0.3391679715810652
Epoch: 72, step: 72, loss: 0.31617599725723267, mean loss: 0.3391677505915099
Epoch: 72, step: 73, loss: 0.3140552043914795, mean loss: 0.3391675092221956
Epoch: 72, step: 74, loss: 0.3498252034187317, mean loss: 0.33916761165767123
Epoch: 72, step: 75, loss: 0.30612778663635254, mean loss: 0.33916729410139673
Epoch: 72, step: 76, loss: 0.29991331696510315, mean loss: 0.3391669168225545
Epoch: 72, step: 77, loss: 0.3295454680919647, mean loss: 0.33916682434952594
Epoch: 72, step: 78, loss: 0.41083791851997375, mean loss: 0.3391675131833623
Epoch: 72, step: 79, loss: 0.3451366722583771, mean loss: 0.3391675705526445
Epoch: 72, step: 80, loss: 0.3089018762111664, mean loss: 0.33916727967340166
Epoch: 72, step: 81, loss: 0.3164609968662262, mean loss: 0.33916706144867503
Epoch: 72, step: 82, loss: 0.2974582016468048, mean loss: 0.3391666605985169
Epoch: 72, step: 83, loss: 0.33523499965667725, mean loss: 0.33916662281297755
Epoch: 72, step: 84, loss: 0.3439622223377228, mean loss: 0.33916666890102426
Epoch: 72, step: 85, loss: 0.3152879774570465, mean loss: 0.3391664394173769
Epoch: 72, step: 86, loss: 0.312461793422699, mean loss: 0.3391661827776576
Epoch: 72, step: 87, loss: 0.33512771129608154, mean loss: 0.33916614396709904
Epoch: 72, step: 88, loss: 0.3457750380039215, mean loss: 0.3391662074793475
Epoch: 72, step: 89, loss: 0.33935821056365967, mean loss: 0.339166209324502
Epoch: 72, step: 90, loss: 0.4002252519130707, mean loss: 0.3391667960977997
Epoch: 72, step: 91, loss: 0.3578585386276245, mean loss: 0.3391669757224636
Epoch: 72, step: 92, loss: 0.345141738653183, mean loss: 0.3391670331384305
Epoch: 72, step: 93, loss: 0.3316328823566437, mean loss: 0.33916696073783487
Epoch: 72, step: 94, loss: 0.29911527037620544, mean loss: 0.33916657585857557
Epoch: 72, step: 95, loss: 0.33069053292274475, mean loss: 0.339166494408286
Epoch: 72, step: 96, loss: 0.3149982988834381, mean loss: 0.3391662621669414
Epoch: 72, step: 97, loss: 0.327370822429657, mean loss: 0.33916614882118257
Epoch: 72, step: 98, loss: 0.34768855571746826, mean loss: 0.3391662307146444
Epoch: 72, step: 99, loss: 0.3066372275352478, mean loss: 0.3391659181401433
Epoch: 72, step: 100, loss: 0.34200724959373474, mean loss: 0.339165945442524
Epoch: 72, step: 101, loss: 0.33436909317970276, mean loss: 0.3391658993499684
Epoch: 72, step: 102, loss: 0.30916672945022583, mean loss: 0.3391656110932023
Epoch: 72, step: 103, loss: 0.29150015115737915, mean loss: 0.33916515308855233
Epoch: 72, step: 104, loss: 0.304372638463974, mean loss: 0.3391648187798015
Epoch: 72, step: 105, loss: 0.30601799488067627, mean loss: 0.3391645002869608
Epoch: 72, step: 106, loss: 0.4046490788459778, mean loss: 0.33916512949261596
Epoch: 72, step: 107, loss: 0.3123912811279297, mean loss: 0.3391648722397588
Epoch: 72, step: 108, loss: 0.36847034096717834, mean loss: 0.3391651538146382
Epoch: 72, step: 109, loss: 0.3725476562976837, mean loss: 0.3391654745596802
Epoch: 72, step: 110, loss: 0.3171924352645874, mean loss: 0.33916526344082537
Epoch: 72, step: 111, loss: 0.30464693903923035, mean loss: 0.3391649317889768
Epoch: 72, step: 112, loss: 0.33739951252937317, mean loss: 0.33916491482700234
Epoch: 72, step: 113, loss: 0.3562142550945282, mean loss: 0.33916507863381107
Epoch: 72, step: 114, loss: 0.3301929831504822, mean loss: 0.3391649924324575
Epoch: 72, step: 115, loss: 0.3198821246623993, mean loss: 0.33916480716990255
Epoch: 72, step: 116, loss: 0.3515932559967041, mean loss: 0.33916492657662617
Epoch: 72, step: 117, loss: 0.31813734769821167, mean loss: 0.33916472455542374
Epoch: 72, step: 118, loss: 0.309500515460968, mean loss: 0.33916443956105274
Epoch: 72, step: 119, loss: 0.31308847665786743, mean loss: 0.33916418904261736
Epoch: 72, step: 120, loss: 0.33249178528785706, mean loss: 0.33916412493974624
Epoch: 72, step: 121, loss: 0.34408557415008545, mean loss: 0.33916417222045725
Epoch: 72, step: 122, loss: 0.2973722517490387, mean loss: 0.33916377072637544
Epoch: 72, step: 123, loss: 0.34712985157966614, mean loss: 0.3391638472556078
Epoch: 72, step: 124, loss: 0.31093332171440125, mean loss: 0.3391635760507665
Epoch: 72, step: 125, loss: 0.35063254833221436, mean loss: 0.3391636862297613
Epoch: 72, step: 126, loss: 0.3169318735599518, mean loss: 0.33916347265742186
Epoch: 72, step: 127, loss: 0.32536420226097107, mean loss: 0.3391633400944954
Epoch: 72, step: 128, loss: 0.32933610677719116, mean loss: 0.33916324568991774
Epoch: 72, step: 129, loss: 0.3352585434913635, mean loss: 0.33916320818005014
Epoch: 72, step: 130, loss: 0.31819668412208557, mean loss: 0.3391630067705836
Epoch: 72, step: 131, loss: 0.2919156551361084, mean loss: 0.33916255290553426
Epoch: 72, step: 132, loss: 0.29173949360847473, mean loss: 0.3391620973569872
Epoch: 72, step: 133, loss: 0.32407838106155396, mean loss: 0.33916195246336084
Epoch: 72, step: 134, loss: 0.3421159088611603, mean loss: 0.33916198083868526
Epoch: 72, step: 135, loss: 0.3024865984916687, mean loss: 0.3391616285430737
Epoch: 72, step: 136, loss: 0.3625815808773041, mean loss: 0.3391618535077952
Epoch: 72, step: 137, loss: 0.32758939266204834, mean loss: 0.3391617423474313
Epoch: 72, step: 138, loss: 0.3320368230342865, mean loss: 0.33916167390900437
Epoch: 72, step: 139, loss: 0.3169519305229187, mean loss: 0.3391614605753183
Epoch: 72, step: 140, loss: 0.332710325717926, mean loss: 0.33916139861011974
Epoch: 72, step: 141, loss: 0.32607755064964294, mean loss: 0.33916127293681303
Epoch: 72, step: 142, loss: 0.3174898028373718, mean loss: 0.3391610647794608
Epoch: 72, step: 143, loss: 0.36226049065589905, mean loss: 0.3391612866503871
Epoch: 72, step: 144, loss: 0.33265671133995056, mean loss: 0.3391612241742764
Epoch: 72, step: 145, loss: 0.30807825922966003, mean loss: 0.3391609256268674
Epoch: 72, step: 146, loss: 0.3054729998111725, mean loss: 0.33916060206229154
Epoch: 72, step: 147, loss: 0.3462848663330078, mean loss: 0.33916067048851106
Epoch: 72, step: 148, loss: 0.3272888660430908, mean loss: 0.3391605564648219
Epoch: 72, step: 149, loss: 0.3516106903553009, mean loss: 0.3391606760419737
Epoch: 72, step: 150, loss: 0.317149817943573, mean loss: 0.33916046464099886
Epoch: 72, step: 151, loss: 0.3183991312980652, mean loss: 0.3391602652428684
Epoch: 72, step: 152, loss: 0.4025438129901886, mean loss: 0.33916087399180234
Epoch: 72, step: 153, loss: 0.37623274326324463, mean loss: 0.3391612300344184
Epoch: 72, step: 154, loss: 0.3871046304702759, mean loss: 0.33916169048408307
Epoch: 72, step: 155, loss: 0.33039095997810364, mean loss: 0.3391616062505682
Epoch: 72, step: 156, loss: 0.32589465379714966, mean loss: 0.33916147883685915
Epoch: 72, step: 157, loss: 0.3274744749069214, mean loss: 0.3391613665978033
Epoch: 72, step: 158, loss: 0.3369489014148712, mean loss: 0.33916134535004644
Epoch: 72, step: 159, loss: 0.3461759686470032, mean loss: 0.33916141271543615
Epoch: 72, step: 160, loss: 0.3267683684825897, mean loss: 0.33916129369917525
Epoch: 72, step: 161, loss: 0.35507646203041077, mean loss: 0.3391614465385907
Epoch: 72, step: 162, loss: 0.3287551999092102, mean loss: 0.3391613466044056
Epoch: 72, step: 163, loss: 0.3073771297931671, mean loss: 0.33916104137434366
Epoch: 72, step: 164, loss: 0.3829141855239868, mean loss: 0.33916146154032517
Epoch: 72, step: 165, loss: 0.31151285767555237, mean loss: 0.3391611960304642
Epoch: 72, step: 166, loss: 0.3460489511489868, mean loss: 0.3391612621730207
Epoch: 72, step: 167, loss: 0.35500046610832214, mean loss: 0.339161414274157
Epoch: 72, step: 168, loss: 0.3228928744792938, mean loss: 0.33916125805168285
Epoch: 72, step: 169, loss: 0.35313236713409424, mean loss: 0.33916139221125075
Epoch: 72, step: 170, loss: 0.3411523997783661, mean loss: 0.33916141133000133
Epoch: 72, step: 171, loss: 0.28718888759613037, mean loss: 0.3391609122660131
Epoch: 72, step: 172, loss: 0.3408834636211395, mean loss: 0.33916092880658166
Epoch: 72, step: 173, loss: 0.3074750304222107, mean loss: 0.3391606245499092
Epoch: 72, step: 174, loss: 0.3331540524959564, mean loss: 0.33916056687371343
Epoch: 72, step: 175, loss: 0.2944539189338684, mean loss: 0.3391601375964825
Epoch: 72, step: 176, loss: 0.33561381697654724, mean loss: 0.33916010354472176
Epoch: 72, step: 177, loss: 0.31223195791244507, mean loss: 0.3391598449832251
Epoch: 72, step: 178, loss: 0.31347084045410156, mean loss: 0.33915959832221204
Epoch: 72, step: 179, loss: 0.3331640660762787, mean loss: 0.3391595407547864
Epoch: 72, step: 180, loss: 0.32506969571113586, mean loss: 0.33915940546932954
Epoch: 72, step: 181, loss: 0.34160491824150085, mean loss: 0.33915942895000906
Epoch: 72, step: 182, loss: 0.32339709997177124, mean loss: 0.33915927760888914
Epoch: 72, step: 183, loss: 0.31201690435409546, mean loss: 0.3391590170054129
Epoch: 72, step: 184, loss: 0.33608338236808777, mean loss: 0.33915898747544604
Epoch: 72, step: 185, loss: 0.33256813883781433, mean loss: 0.3391589241956043
Epoch: 72, step: 186, loss: 0.3186989724636078, mean loss: 0.33915872775806666
Epoch: 72, step: 187, loss: 0.3594532012939453, mean loss: 0.33915892260496494
Epoch: 72, step: 188, loss: 0.3439647853374481, mean loss: 0.33915896874552903
Epoch: 72, step: 189, loss: 0.31954407691955566, mean loss: 0.3391587804268994
Epoch: 72, step: 190, loss: 0.3240775763988495, mean loss: 0.3391586356366842
Epoch: 72, step: 191, loss: 0.34240955114364624, mean loss: 0.33915866684747054
Epoch: 72, step: 192, loss: 0.31067386269569397, mean loss: 0.339158393378474
Epoch: 72, step: 193, loss: 0.3441395163536072, mean loss: 0.3391584411993969
Epoch: 72, step: 194, loss: 0.3156675398349762, mean loss: 0.3391582156788055
Epoch: 72, step: 195, loss: 0.3519643545150757, mean loss: 0.3391583386208856
Epoch: 72, step: 196, loss: 0.37843725085258484, mean loss: 0.33915871570447637
Epoch: 72, step: 197, loss: 0.339923620223999, mean loss: 0.33915872304760675
Epoch: 72, step: 198, loss: 0.33160942792892456, mean loss: 0.33915865057460554
Epoch: 72, step: 199, loss: 0.3381962180137634, mean loss: 0.3391586413353712
Epoch: 72, step: 200, loss: 0.38162070512771606, mean loss: 0.3391590489620528
Epoch: 72, step: 201, loss: 0.3125150799751282, mean loss: 0.3391587931881353
Epoch: 72, step: 202, loss: 0.3164123296737671, mean loss: 0.33915857483116923
Epoch: 72, step: 203, loss: 0.3396121561527252, mean loss: 0.339158579185327
Epoch: 72, step: 204, loss: 0.2988697588443756, mean loss: 0.3391581924361661
Epoch: 72, step: 205, loss: 0.312118262052536, mean loss: 0.3391579328711078
Epoch: 72, step: 206, loss: 0.3261740207672119, mean loss: 0.33915780823552244
Epoch: 72, step: 207, loss: 0.3337063193321228, mean loss: 0.3391577559059177
Epoch: 72, step: 208, loss: 0.3408416509628296, mean loss: 0.33915777206970676
Epoch: 72, step: 209, loss: 0.3292589485645294, mean loss: 0.3391576770513391
Epoch: 72, step: 210, loss: 0.3097977042198181, mean loss: 0.33915739522896765
Epoch: 72, step: 211, loss: 0.3114300072193146, mean loss: 0.3391571290801098
Epoch: 72, step: 212, loss: 0.33356207609176636, mean loss: 0.33915707537499096
Epoch: 72, step: 213, loss: 0.3178540766239166, mean loss: 0.3391568708963022
Epoch: 72, step: 214, loss: 0.30542707443237305, mean loss: 0.33915654714102095
Epoch: 72, step: 215, loss: 0.3043175935745239, mean loss: 0.33915621274271057
Epoch: 72, step: 216, loss: 0.338326096534729, mean loss: 0.3391562047749973
Epoch: 72, step: 217, loss: 0.3177010416984558, mean loss: 0.3391559988436526
Epoch: 72, step: 218, loss: 0.35411179065704346, mean loss: 0.33915614239123354
Epoch: 72, step: 219, loss: 0.3455270528793335, mean loss: 0.3391562035394511
Epoch: 72, step: 220, loss: 0.31044453382492065, mean loss: 0.3391559279665047
Epoch: 72, step: 221, loss: 0.28677165508270264, mean loss: 0.3391554251901069
Epoch: 72, step: 222, loss: 0.3506716787815094, mean loss: 0.3391555357203215
Epoch: 72, step: 223, loss: 0.3453886806964874, mean loss: 0.33915559554396413
Epoch: 72, step: 224, loss: 0.31680604815483093, mean loss: 0.3391553810425352
Epoch: 72, step: 225, loss: 0.31974291801452637, mean loss: 0.3391551947317781
Epoch: 72, step: 226, loss: 0.3714275658130646, mean loss: 0.33915550446229376
Epoch: 72, step: 227, loss: 0.29001691937446594, mean loss: 0.3391550328646788
Epoch: 72, step: 228, loss: 0.3227570950984955, mean loss: 0.33915487549030365
Epoch: 72, step: 229, loss: 0.332841694355011, mean loss: 0.33915481490198973
Epoch: 72, step: 230, loss: 0.3638555407524109, mean loss: 0.33915505195537654
Epoch: 72, step: 231, loss: 0.3326125144958496, mean loss: 0.3391549891671092
Epoch: 72, step: 232, loss: 0.3402552604675293, mean loss: 0.33915499972623336
Epoch: 72, step: 233, loss: 0.2961973547935486, mean loss: 0.3391545874726784
Epoch: 72, step: 234, loss: 0.3283974528312683, mean loss: 0.33915448424019334
Epoch: 72, step: 235, loss: 0.34283533692359924, mean loss: 0.33915451956371917
Epoch: 72, step: 236, loss: 0.3356669247150421, mean loss: 0.33915448609512505
Epoch: 72, step: 237, loss: 0.327934592962265, mean loss: 0.3391543784248073
Epoch: 72, step: 238, loss: 0.345485657453537, mean loss: 0.33915443918156096
Epoch: 72, step: 239, loss: 0.3296102285385132, mean loss: 0.33915434759348095
Epoch: 72, step: 240, loss: 0.30579811334609985, mean loss: 0.33915402750371665
Epoch: 72, step: 241, loss: 0.31328412890434265, mean loss: 0.3391537792559612
Epoch: 72, step: 242, loss: 0.3758142292499542, mean loss: 0.33915413104655906
Epoch: 72, step: 243, loss: 0.3620995283126831, mean loss: 0.33915435122655047
Epoch: 72, step: 244, loss: 0.3175365626811981, mean loss: 0.3391541437880491
Epoch: 72, step: 245, loss: 0.3244618773460388, mean loss: 0.3391540028063533
Epoch: 72, step: 246, loss: 0.34095197916030884, mean loss: 0.33915402005892115
Epoch: 72, step: 247, loss: 0.3323887884616852, mean loss: 0.33915395514344177
Epoch: 72, step: 248, loss: 0.31159108877182007, mean loss: 0.3391536906677193
Epoch: 72, step: 249, loss: 0.3405403792858124, mean loss: 0.33915370397337297
Epoch: 72, step: 250, loss: 0.30743324756622314, mean loss: 0.33915339960990365
Epoch: 72, step: 251, loss: 0.3518180251121521, mean loss: 0.33915352112809116
Epoch: 72, step: 252, loss: 0.3506629765033722, mean loss: 0.3391536315612608
Epoch: 72, step: 253, loss: 0.3154987096786499, mean loss: 0.33915340459457544
Epoch: 72, step: 254, loss: 0.36766156554222107, mean loss: 0.3391536781249953
Epoch: 72, step: 255, loss: 0.33177846670150757, mean loss: 0.33915360736191363
Epoch: 72, step: 256, loss: 0.28956133127212524, mean loss: 0.339153131542522
Epoch: 72, step: 257, loss: 0.3482060730457306, mean loss: 0.3391532184012857
Epoch: 72, step: 258, loss: 0.3313766419887543, mean loss: 0.3391531437893674
Epoch: 72, step: 259, loss: 0.33099931478500366, mean loss: 0.3391530655586712
Epoch: 72, step: 260, loss: 0.2958310544490814, mean loss: 0.33915264991608507
Epoch: 72, step: 261, loss: 0.35950785875320435, mean loss: 0.33915284520735284
Epoch: 72, step: 262, loss: 0.3475436270236969, mean loss: 0.33915292570914035
Epoch: 72, step: 263, loss: 0.31363895535469055, mean loss: 0.33915268092855133
Epoch: 72, step: 264, loss: 0.3146286904811859, mean loss: 0.3391524456480696
Epoch: 72, step: 265, loss: 0.315152645111084, mean loss: 0.33915221539881757
Epoch: 72, step: 266, loss: 0.33878812193870544, mean loss: 0.33915221190581174
Epoch: 72, step: 267, loss: 0.3651275038719177, mean loss: 0.33915246110274916
Epoch: 72, step: 268, loss: 0.3432951271533966, mean loss: 0.3391525008455089
Epoch: 72, step: 269, loss: 0.3142310678958893, mean loss: 0.33915226176347596
Epoch: 72, step: 270, loss: 0.3380763530731201, mean loss: 0.3391522514419198
Epoch: 72, step: 271, loss: 0.32971683144569397, mean loss: 0.3391521609256113
Epoch: 72, step: 272, loss: 0.285862535238266, mean loss: 0.33915164971000816
Epoch: 72, step: 273, loss: 0.32978102564811707, mean loss: 0.33915155981702777
Epoch: 72, step: 274, loss: 0.35479170083999634, mean loss: 0.33915170985243565
Epoch: 72, step: 275, loss: 0.3213200569152832, mean loss: 0.3391515387955601
Epoch: 72, step: 276, loss: 0.3285446763038635, mean loss: 0.3391514370461957
Epoch: 72, step: 277, loss: 0.31340163946151733, mean loss: 0.33915119003626165
Epoch: 72, step: 278, loss: 0.30271998047828674, mean loss: 0.33915084056616124
Epoch: 72, step: 279, loss: 0.33593255281448364, mean loss: 0.33915080969470324
Epoch: 72, step: 280, loss: 0.35453560948371887, mean loss: 0.339150957272136
Epoch: 72, step: 281, loss: 0.34467989206314087, mean loss: 0.33915101030748174
Epoch: 72, step: 282, loss: 0.36022064089775085, mean loss: 0.33915121241231133
Epoch: 72, step: 283, loss: 0.31840094923973083, mean loss: 0.339151013372838
Epoch: 72, step: 284, loss: 0.3274146318435669, mean loss: 0.33915090079687826
Epoch: 72, step: 285, loss: 0.33667171001434326, mean loss: 0.33915087701658414
Epoch: 72, step: 286, loss: 0.35283899307250977, mean loss: 0.33915100831116046
Epoch: 72, step: 287, loss: 0.34153157472610474, mean loss: 0.3391510311450157
Epoch: 72, step: 288, loss: 0.3097063899040222, mean loss: 0.33915074872137757
Epoch: 72, step: 289, loss: 0.30509576201438904, mean loss: 0.3391504220799044
Epoch: 72, step: 290, loss: 0.32957473397254944, mean loss: 0.3391503302347102
Epoch: 72, step: 291, loss: 0.3391382396221161, mean loss: 0.33915033011874424
Epoch: 72, step: 292, loss: 0.3431589603424072, mean loss: 0.33915036856677583
Epoch: 72, step: 293, loss: 0.34902408719062805, mean loss: 0.33915046326780424
Epoch: 72, step: 294, loss: 0.316373735666275, mean loss: 0.339150244813246
Epoch: 72, step: 295, loss: 0.33525580167770386, mean loss: 0.3391502074614934
Epoch: 72, step: 296, loss: 0.34463828802108765, mean loss: 0.3391502600973785
Epoch: 72, step: 297, loss: 0.3065465986728668, mean loss: 0.3391499474004166
Epoch: 72, step: 298, loss: 0.3434290885925293, mean loss: 0.3391499884406421
Epoch: 72, step: 299, loss: 0.34294939041137695, mean loss: 0.33915002487945334
Epoch: 72, step: 300, loss: 0.32923266291618347, mean loss: 0.3391499297662177
Epoch: 72, step: 301, loss: 0.3234761357307434, mean loss: 0.3391497794469117
Epoch: 72, step: 302, loss: 0.35523930191993713, mean loss: 0.3391499337517757
Epoch: 72, step: 303, loss: 0.3151690661907196, mean loss: 0.33914970376800674
Epoch: 72, step: 304, loss: 0.3483811020851135, mean loss: 0.33914979229905806
Epoch: 72, step: 305, loss: 0.3417981266975403, mean loss: 0.33914981769689834
Epoch: 72, step: 306, loss: 0.33670881390571594, mean loss: 0.3391497942876076
Epoch: 72, step: 307, loss: 0.36810049414634705, mean loss: 0.33915007192292024
Epoch: 72, step: 308, loss: 0.3294420838356018, mean loss: 0.3391499788248441
Epoch: 72, step: 309, loss: 0.333412230014801, mean loss: 0.33914992380126474
Epoch: 72, step: 310, loss: 0.3231375217437744, mean loss: 0.339149770247797
Epoch: 72, step: 311, loss: 0.3744422197341919, mean loss: 0.33915010868709017
Epoch: 72, step: 312, loss: 0.32312461733818054, mean loss: 0.33914995501104805
Epoch: 72, step: 313, loss: 0.3750283718109131, mean loss: 0.3391502990629151
Epoch: 72, step: 314, loss: 0.3344530165195465, mean loss: 0.3391502540193074
Epoch: 72, step: 315, loss: 0.3531229794025421, mean loss: 0.33915038800654784
Epoch: 72, step: 316, loss: 0.32670849561691284, mean loss: 0.3391502686999132
Epoch: 72, step: 317, loss: 0.3534945547580719, mean loss: 0.3391504062474849
Epoch: 72, step: 318, loss: 0.3221369683742523, mean loss: 0.33915024310694125
Epoch: 72, step: 319, loss: 0.3214993178844452, mean loss: 0.3391500738552035
Epoch: 72, step: 320, loss: 0.3663783669471741, mean loss: 0.33915033494019897
Epoch: 72, step: 321, loss: 0.3302125632762909, mean loss: 0.3391502492390611
Epoch: 72, step: 322, loss: 0.29904329776763916, mean loss: 0.339149864671347
Epoch: 72, step: 323, loss: 0.3480475842952728, mean loss: 0.3391499499868038
Epoch: 72, step: 324, loss: 0.32759225368499756, mean loss: 0.33914983916732117
Epoch: 72, step: 325, loss: 0.3666028678417206, mean loss: 0.3391501023946274
Epoch: 72, step: 326, loss: 0.34844544529914856, mean loss: 0.33915019152011666
Epoch: 72, step: 327, loss: 0.38665851950645447, mean loss: 0.33915064703449865
Epoch: 72, step: 328, loss: 0.32104289531707764, mean loss: 0.33915047341731197
Epoch: 72, step: 329, loss: 0.35082221031188965, mean loss: 0.33915058532489306
Epoch: 72, step: 330, loss: 0.3186638355255127, mean loss: 0.3391503889016311
Epoch: 72, step: 331, loss: 0.37265026569366455, mean loss: 0.339150710089328
Epoch: 72, step: 332, loss: 0.3565167188644409, mean loss: 0.3391508765882952
Epoch: 72, step: 333, loss: 0.2721214294433594, mean loss: 0.33915023394053057
Epoch: 72, step: 334, loss: 0.30048149824142456, mean loss: 0.33914986320588536
Epoch: 72, step: 335, loss: 0.32647478580474854, mean loss: 0.339149741685355
Epoch: 72, step: 336, loss: 0.35724323987960815, mean loss: 0.3391499151525732
Epoch: 72, step: 337, loss: 0.31301864981651306, mean loss: 0.33914966462752827
Epoch: 72, step: 338, loss: 0.3483540117740631, mean loss: 0.33914975287038013
Epoch: 72, step: 339, loss: 0.3329958915710449, mean loss: 0.3391496938733588
Epoch: 72, step: 340, loss: 0.35547879338264465, mean loss: 0.3391498504188104
Epoch: 72, step: 341, loss: 0.36423882842063904, mean loss: 0.33915009094203924
Epoch: 72, step: 342, loss: 0.34353169798851013, mean loss: 0.3391501329472644
Epoch: 72, step: 343, loss: 0.3564758002758026, mean loss: 0.3391502990419355
Epoch: 72, step: 344, loss: 0.30466869473457336, mean loss: 0.33914996848290346
Epoch: 72, step: 345, loss: 0.29224279522895813, mean loss: 0.3391495188100575
Epoch: 72, step: 346, loss: 0.36140817403793335, mean loss: 0.33914973218929567
Epoch: 72, step: 347, loss: 0.3037561774253845, mean loss: 0.33914939289757856
Epoch: 72, step: 348, loss: 0.32749202847480774, mean loss: 0.33914928114815684
Epoch: 72, step: 349, loss: 0.28760430216789246, mean loss: 0.33914878703420737
Epoch: 72, step: 350, loss: 0.32755059003829956, mean loss: 0.33914867585410596
Epoch: 72, step: 351, loss: 0.3480568826198578, mean loss: 0.3391487612471923
Epoch: 72, step: 352, loss: 0.32468488812446594, mean loss: 0.33914862259943085
Epoch: 72, step: 353, loss: 0.37341222167015076, mean loss: 0.33914895104021103
Epoch: 72, step: 354, loss: 0.33407583832740784, mean loss: 0.33914890241131124
Epoch: 72, step: 355, loss: 0.29264217615127563, mean loss: 0.33914845662006227
Epoch: 72, step: 356, loss: 0.337679922580719, mean loss: 0.3391484425435318
Epoch: 72, step: 357, loss: 0.35928767919540405, mean loss: 0.3391486355849276
Epoch: 72, step: 358, loss: 0.3649745583534241, mean loss: 0.33914888313276054
Epoch: 72, step: 359, loss: 0.27940893173217773, mean loss: 0.3391483105160958
Epoch: 72, step: 360, loss: 0.3410257399082184, mean loss: 0.3391483285113741
Epoch: 72, step: 361, loss: 0.34358373284339905, mean loss: 0.33914837102459494
Epoch: 72, step: 362, loss: 0.3241547644138336, mean loss: 0.3391482273126914
Epoch: 72, step: 363, loss: 0.32440605759620667, mean loss: 0.33914808601213436
Epoch: 72, step: 364, loss: 0.32132890820503235, mean loss: 0.3391479152207471
Epoch: 72, step: 365, loss: 0.3325537145137787, mean loss: 0.3391478520179493
Epoch: 72, step: 366, loss: 0.3021904528141022, mean loss: 0.33914749779933423
Epoch: 72, step: 367, loss: 0.3499508202075958, mean loss: 0.3391476013429089
Epoch: 72, step: 368, loss: 0.31048035621643066, mean loss: 0.33914732658663715
Epoch: 72, step: 369, loss: 0.306810200214386, mean loss: 0.3391470166599913
Epoch: 72, step: 370, loss: 0.3424023687839508, mean loss: 0.3391470478597548
Epoch: 72, step: 371, loss: 0.34796836972236633, mean loss: 0.33914713240376343
Epoch: 72, step: 372, loss: 0.3508160710334778, mean loss: 0.3391472442384078
Epoch: 72, step: 373, loss: 0.35969698429107666, mean loss: 0.3391474411844128
Epoch: 72, step: 374, loss: 0.35519516468048096, mean loss: 0.3391475949822095
Epoch: 72, step: 375, loss: 0.31264060735702515, mean loss: 0.3391473409475968
Epoch: 72, step: 376, loss: 0.2951289713382721, mean loss: 0.33914691909346284
Epoch: 72, step: 377, loss: 0.3145640194416046, mean loss: 0.33914668350321836
Epoch: 72, step: 378, loss: 0.3628625273704529, mean loss: 0.3391469107818547
Epoch: 72, step: 379, loss: 0.35512906312942505, mean loss: 0.33914706394389277
Epoch: 72, step: 380, loss: 0.32036253809928894, mean loss: 0.3391468839275453
Epoch: 72, step: 381, loss: 0.33766475319862366, mean loss: 0.33914686972408836
Epoch: 72, step: 382, loss: 0.3488256633281708, mean loss: 0.3391469624763725
Epoch: 72, step: 383, loss: 0.34189143776893616, mean loss: 0.33914698877654204
Epoch: 72, step: 384, loss: 0.3337271809577942, mean loss: 0.3391469368392923
Epoch: 72, step: 385, loss: 0.33545127511024475, mean loss: 0.33914690142462944
Epoch: 72, step: 386, loss: 0.3283025026321411, mean loss: 0.3391467975062854
Epoch: 72, step: 387, loss: 0.3335684537887573, mean loss: 0.33914674405134543
Epoch: 72, step: 388, loss: 0.35853812098503113, mean loss: 0.3391469298690379
Epoch: 72, step: 389, loss: 0.32057276368141174, mean loss: 0.3391467518839655
Epoch: 72, step: 390, loss: 0.3276943862438202, mean loss: 0.3391466421438794
Epoch: 72, step: 391, loss: 0.3213597536087036, mean loss: 0.33914647170608203
Epoch: 72, step: 392, loss: 0.30944812297821045, mean loss: 0.3391461871328341
Epoch: 72, step: 393, loss: 0.3429567217826843, mean loss: 0.33914622364549823
Epoch: 72, step: 394, loss: 0.31302011013031006, mean loss: 0.33914597330664714
Epoch: 72, step: 395, loss: 0.3312116861343384, mean loss: 0.3391458972815123
Epoch: 72, step: 396, loss: 0.3068598508834839, mean loss: 0.3391455879244826
Epoch: 72, step: 397, loss: 0.3383798897266388, mean loss: 0.33914558058781935
Epoch: 72, step: 398, loss: 0.35182273387908936, mean loss: 0.3391457020548855
Epoch: 72, step: 399, loss: 0.3462826907634735, mean loss: 0.3391457704378066
Epoch: 72, step: 400, loss: 0.3020545542240143, mean loss: 0.3391454150524315
Epoch: 72, step: 401, loss: 0.3665681779384613, mean loss: 0.3391456777980757
Epoch: 72, step: 402, loss: 0.33163338899612427, mean loss: 0.33914560582129283
Epoch: 72, step: 403, loss: 0.3094903826713562, mean loss: 0.3391453216912278
Epoch: 72, step: 404, loss: 0.32379087805747986, mean loss: 0.3391451745799669
Epoch: 72, step: 405, loss: 0.2986302077770233, mean loss: 0.3391447864089013
Epoch: 72, step: 406, loss: 0.31648939847946167, mean loss: 0.3391445693512924
Epoch: 72, step: 407, loss: 0.3443453311920166, mean loss: 0.3391446191784734
Epoch: 72, step: 408, loss: 0.322022408246994, mean loss: 0.339144455136482
Epoch: 72, step: 409, loss: 0.3552016317844391, mean loss: 0.33914460897327375
Epoch: 72, step: 410, loss: 0.306372731924057, mean loss: 0.33914429500325055
Epoch: 72, step: 411, loss: 0.32852357625961304, mean loss: 0.33914419325273565
Epoch: 72, step: 412, loss: 0.32853615283966064, mean loss: 0.33914409162465764
Epoch: 72, step: 413, loss: 0.3070112466812134, mean loss: 0.33914378378571086
Epoch: 72, step: 414, loss: 0.3154139816761017, mean loss: 0.3391435564517378
Epoch: 72, step: 415, loss: 0.3539733588695526, mean loss: 0.33914369852142684
Epoch: 72, step: 416, loss: 0.32541024684906006, mean loss: 0.3391435669560518
Epoch: 72, step: 417, loss: 0.3528240919113159, mean loss: 0.3391436980131376
Epoch: 72, step: 418, loss: 0.3355662524700165, mean loss: 0.3391436637421504
Epoch: 72, step: 419, loss: 0.32798388600349426, mean loss: 0.33914355683543945
Epoch: 72, step: 420, loss: 0.3872010111808777, mean loss: 0.3391440172043897
Epoch: 72, step: 421, loss: 0.3039347231388092, mean loss: 0.339143679918308
Epoch: 72, step: 422, loss: 0.36635392904281616, mean loss: 0.33914394057534863
Epoch: 72, step: 423, loss: 0.3336947560310364, mean loss: 0.33914388837609444
Epoch: 72, step: 424, loss: 0.33205750584602356, mean loss: 0.3391438204943157
Epoch: 72, step: 425, loss: 0.38989365100860596, mean loss: 0.3391443066317423
Epoch: 72, step: 426, loss: 0.3142036199569702, mean loss: 0.33914406772483413
Epoch: 72, step: 427, loss: 0.30450454354286194, mean loss: 0.3391437359159125
Epoch: 72, step: 428, loss: 0.3342319428920746, mean loss: 0.3391436888667346
Epoch: 72, step: 429, loss: 0.3337426483631134, mean loss: 0.3391436371316391
Epoch: 72, step: 430, loss: 0.32359567284584045, mean loss: 0.3391434882033516
Epoch: 72, step: 431, loss: 0.36660200357437134, mean loss: 0.339143751215951
Epoch: 72, step: 432, loss: 0.33797261118888855, mean loss: 0.33914373999824204
Epoch: 72, step: 433, loss: 0.3466162085533142, mean loss: 0.3391438115722402
Epoch: 72, step: 434, loss: 0.3338095247745514, mean loss: 0.3391437604790073
Epoch: 72, step: 435, loss: 0.35824888944625854, mean loss: 0.3391439434713157
Epoch: 72, step: 436, loss: 0.37005484104156494, mean loss: 0.3391442395385306
Epoch: 72, step: 437, loss: 0.36607763171195984, mean loss: 0.33914449750638853
Epoch: 72, step: 438, loss: 0.33043041825294495, mean loss: 0.3391444140437926
Epoch: 72, step: 439, loss: 0.34410804510116577, mean loss: 0.3391444615845084
Epoch: 72, step: 440, loss: 0.31066611409187317, mean loss: 0.3391441888269157
Epoch: 72, step: 441, loss: 0.3435728847980499, mean loss: 0.33914423124331233
Epoch: 72, step: 442, loss: 0.3257104456424713, mean loss: 0.33914410258076144
Epoch: 72, step: 443, loss: 0.3120398223400116, mean loss: 0.3391438429910568
Epoch: 72, step: 444, loss: 0.31172844767570496, mean loss: 0.33914358042417997
Epoch: 72, step: 445, loss: 0.31445473432540894, mean loss: 0.33914334397268786
Epoch: 72, step: 446, loss: 0.3476807475090027, mean loss: 0.3391434257368361
Epoch: 72, step: 447, loss: 0.31262463331222534, mean loss: 0.3391431717643374
Epoch: 72, step: 448, loss: 0.34803980588912964, mean loss: 0.3391432569672653
Epoch: 72, step: 449, loss: 0.33495521545410156, mean loss: 0.3391432168588404
Epoch: 72, step: 450, loss: 0.3574436902999878, mean loss: 0.33914339211883565
Epoch: 72, step: 451, loss: 0.3146818280220032, mean loss: 0.3391431578575438
Epoch: 72, step: 452, loss: 0.3307282030582428, mean loss: 0.33914307727073845
Epoch: 72, step: 453, loss: 0.34629857540130615, mean loss: 0.3391431457955525
Epoch: 72, step: 454, loss: 0.3329008221626282, mean loss: 0.3391430860163503
Epoch: 72, step: 455, loss: 0.36530670523643494, mean loss: 0.33914333656813167
Epoch: 72, step: 456, loss: 0.3480699956417084, mean loss: 0.33914342205205866
Epoch: 72, step: 457, loss: 0.35722389817237854, mean loss: 0.3391435951935763
Epoch: 72, step: 458, loss: 0.3657805621623993, mean loss: 0.33914385027096977
Epoch: 72, step: 459, loss: 0.31750714778900146, mean loss: 0.3391436430784306
Epoch: 72, step: 460, loss: 0.32282570004463196, mean loss: 0.33914348681969947
Epoch: 72, step: 461, loss: 0.3773970901966095, mean loss: 0.33914385312826384
Epoch: 72, step: 462, loss: 0.3011937439441681, mean loss: 0.3391434897293767
Epoch: 72, step: 463, loss: 0.38944771885871887, mean loss: 0.33914397142300634
Epoch: 72, step: 464, loss: 0.30797824263572693, mean loss: 0.3391436729950306
Epoch: 72, step: 465, loss: 0.3067900836467743, mean loss: 0.33914336319564203
Epoch: 72, step: 466, loss: 0.3026583790779114, mean loss: 0.33914301383973533
Epoch: 72, step: 467, loss: 0.31391701102256775, mean loss: 0.3391427722946473
Epoch: 72, step: 468, loss: 0.31379106640815735, mean loss: 0.33914252954824625
Epoch: 72, step: 469, loss: 0.35764503479003906, mean loss: 0.33914270671082347
Epoch: 72, step: 470, loss: 0.31144407391548157, mean loss: 0.3391424414973228
Epoch: 72, step: 471, loss: 0.3341262638568878, mean loss: 0.3391423934680463
Epoch: 72, step: 472, loss: 0.33554017543792725, mean loss: 0.3391423589775873
Epoch: 72, step: 473, loss: 0.3226967453956604, mean loss: 0.3391422015158997
Epoch: 72, step: 474, loss: 0.3288329839706421, mean loss: 0.3391421028092602
Epoch: 72, step: 475, loss: 0.3427080810070038, mean loss: 0.33914213695174994
Epoch: 72, step: 476, loss: 0.323872447013855, mean loss: 0.3391419907533686
Epoch: 72, step: 477, loss: 0.3159264922142029, mean loss: 0.3391417684806292
Epoch: 72, step: 478, loss: 0.33247581124305725, mean loss: 0.33914170465919596
Epoch: 72, step: 479, loss: 0.33740872144699097, mean loss: 0.33914168806736833
Epoch: 72, step: 480, loss: 0.2833561301231384, mean loss: 0.33914115397361977
Epoch: 72, step: 481, loss: 0.31733599305152893, mean loss: 0.3391409452119068
Epoch: 72, step: 482, loss: 0.3046196401119232, mean loss: 0.3391406147095172
Epoch: 72, step: 483, loss: 0.30781278014183044, mean loss: 0.3391403147838617
Epoch: 72, step: 484, loss: 0.36021456122398376, mean loss: 0.33914051654203464
Epoch: 72, step: 485, loss: 0.3320426344871521, mean loss: 0.33914044858980635
Epoch: 72, step: 486, loss: 0.3614514172077179, mean loss: 0.3391406621838767
Epoch: 72, step: 487, loss: 0.37993574142456055, mean loss: 0.33914105273185136
Epoch: 72, step: 488, loss: 0.35593312978744507, mean loss: 0.3391412134877323
Epoch: 72, step: 489, loss: 0.3177432119846344, mean loss: 0.3391410086398365
Epoch: 72, step: 490, loss: 0.3209797143936157, mean loss: 0.3391408347793338
Epoch: 72, step: 491, loss: 0.35463911294937134, mean loss: 0.3391409831450065
Epoch: 72, step: 492, loss: 0.36542773246765137, mean loss: 0.33914123478676106
Epoch: 72, step: 493, loss: 0.3187880218029022, mean loss: 0.33914103994832234
Epoch: 72, step: 494, loss: 0.3003014922142029, mean loss: 0.3391406681463663
Epoch: 72, step: 495, loss: 0.3687839210033417, mean loss: 0.3391409519116142
Epoch: 72, step: 496, loss: 0.34192341566085815, mean loss: 0.3391409785469825
Epoch: 72, step: 497, loss: 0.31267470121383667, mean loss: 0.3391407251987416
Epoch: 72, step: 498, loss: 0.3762868642807007, mean loss: 0.3391410807764751
Epoch: 72, step: 499, loss: 0.3848456144332886, mean loss: 0.3391415182744042
Epoch: 72, step: 500, loss: 0.41025781631469727, mean loss: 0.33914219901508363
Epoch: 72, step: 501, loss: 0.34756582975387573, mean loss: 0.33914227964713817
Epoch: 72, step: 502, loss: 0.3160304129123688, mean loss: 0.339142058419556
Epoch: 72, step: 503, loss: 0.31875374913215637, mean loss: 0.33914186326382734
Epoch: 72, step: 504, loss: 0.33091118931770325, mean loss: 0.3391417844810419
Epoch: 72, step: 505, loss: 0.36583608388900757, mean loss: 0.3391420399924553
Epoch: 72, step: 506, loss: 0.35238340497016907, mean loss: 0.3391421667344029
Epoch: 72, step: 507, loss: 0.31581175327301025, mean loss: 0.3391419434255716
Epoch: 72, step: 508, loss: 0.3413192927837372, mean loss: 0.3391419642660375
Epoch: 72, step: 509, loss: 0.36179012060165405, mean loss: 0.33914218104044297
Epoch: 72, step: 510, loss: 0.2874321937561035, mean loss: 0.33914168610856876
Epoch: 72, step: 511, loss: 0.33484822511672974, mean loss: 0.33914164501495286
Epoch: 72, step: 512, loss: 0.3281715214252472, mean loss: 0.33914154001860336
Epoch: 72, step: 513, loss: 0.37637898325920105, mean loss: 0.3391418964191627
Epoch: 72, step: 514, loss: 0.3678577244281769, mean loss: 0.3391421712564856
Epoch: 72, step: 515, loss: 0.33899131417274475, mean loss: 0.3391421698126561
Epoch: 72, step: 516, loss: 0.32147708535194397, mean loss: 0.3391420007445175
Epoch: 72, step: 517, loss: 0.33327367901802063, mean loss: 0.33914194458080443
Epoch: 72, step: 518, loss: 0.3189448416233063, mean loss: 0.3391417512830453
Epoch: 72, step: 519, loss: 0.2946709394454956, mean loss: 0.3391413256761638
Epoch: 72, step: 520, loss: 0.31972047686576843, mean loss: 0.3391411398111559
Epoch: 72, step: 521, loss: 0.30404558777809143, mean loss: 0.3391408039364116
Epoch: 72, step: 522, loss: 0.3365057110786438, mean loss: 0.3391407787180401
Epoch: 72, step: 523, loss: 0.30163541436195374, mean loss: 0.339140419787554
Epoch: 72, step: 524, loss: 0.365911602973938, mean loss: 0.3391406759882869
Epoch: 72, step: 525, loss: 0.36751896142959595, mean loss: 0.33914094756642
Epoch: 72, step: 526, loss: 0.30392715334892273, mean loss: 0.3391406105761887
Epoch: 72, step: 527, loss: 0.31396567821502686, mean loss: 0.33914036965852334
Epoch: 72, step: 528, loss: 0.3093629777431488, mean loss: 0.3391400846992239
Epoch: 72, step: 529, loss: 0.3124051094055176, mean loss: 0.33913982885724325
Epoch: 72, step: 530, loss: 0.31444889307022095, mean loss: 0.33913959257808474
Epoch: 72, step: 531, loss: 0.34947532415390015, mean loss: 0.339139691484607
Epoch: 72, step: 532, loss: 0.3336460292339325, mean loss: 0.3391396389141794
Epoch: 72, step: 533, loss: 0.3455623686313629, mean loss: 0.33913970037453156
Epoch: 72, step: 534, loss: 0.3451431691646576, mean loss: 0.33913975782234446
Epoch: 72, step: 535, loss: 0.3195078372955322, mean loss: 0.339139569964267
Epoch: 72, step: 536, loss: 0.3821778893470764, mean loss: 0.33913998179450844
Epoch: 72, step: 537, loss: 0.3540620505809784, mean loss: 0.3391401245812268
Epoch: 72, step: 538, loss: 0.33653271198272705, mean loss: 0.3391400996315813
Epoch: 72, step: 539, loss: 0.33072629570961, mean loss: 0.3391400191228746
Epoch: 72, step: 540, loss: 0.3499504625797272, mean loss: 0.33914012256318554
Epoch: 72, step: 541, loss: 0.3460509479045868, mean loss: 0.33914018868915763
Epoch: 72, step: 542, loss: 0.3382909893989563, mean loss: 0.33914018056370393
Epoch: 72, step: 543, loss: 0.32550352811813354, mean loss: 0.3391400500844054
Epoch: 72, step: 544, loss: 0.31827038526535034, mean loss: 0.33913985039953537
Epoch: 72, step: 545, loss: 0.37348079681396484, mean loss: 0.3391401789770122
Epoch: 72, step: 546, loss: 0.36232301592826843, mean loss: 0.3391404007905026
Epoch: 72, step: 547, loss: 0.3052978515625, mean loss: 0.3391400769879343
Epoch: 72, step: 548, loss: 0.3454836308956146, mean loss: 0.3391401376819258
Epoch: 72, step: 549, loss: 0.3198230266571045, mean loss: 0.3391399528610239
Epoch: 72, step: 550, loss: 0.33979731798171997, mean loss: 0.3391399591504557
Epoch: 72, step: 551, loss: 0.3116609454154968, mean loss: 0.33913969624370355
Epoch: 72, step: 552, loss: 0.32380297780036926, mean loss: 0.3391395495103347
Epoch: 72, step: 553, loss: 0.3604080080986023, mean loss: 0.33913975299341564
Epoch: 72, step: 554, loss: 0.3590085208415985, mean loss: 0.3391399430833274
Epoch: 72, step: 555, loss: 0.3180796802043915, mean loss: 0.3391397415959859
Epoch: 72, step: 556, loss: 0.310953289270401, mean loss: 0.33913947193368194
Epoch: 72, step: 557, loss: 0.3488423526287079, mean loss: 0.33913956476111906
Epoch: 72, step: 558, loss: 0.3174663186073303, mean loss: 0.33913935741520695
Epoch: 72, step: 559, loss: 0.31713101267814636, mean loss: 0.3391391468654525
Epoch: 72, step: 560, loss: 0.3039287328720093, mean loss: 0.3391388100171712
Epoch: 72, step: 561, loss: 0.29474106431007385, mean loss: 0.33913838528029466
Epoch: 72, step: 562, loss: 0.32033973932266235, mean loss: 0.33913820544229484
Epoch: 72, step: 563, loss: 0.3511330783367157, mean loss: 0.3391383201906293
Epoch: 72, step: 564, loss: 0.31278225779533386, mean loss: 0.3391380680591264
Epoch: 72, step: 565, loss: 0.3442395031452179, mean loss: 0.33913811686080897
Epoch: 72, step: 566, loss: 0.30713656544685364, mean loss: 0.3391378107283996
Epoch: 72, step: 567, loss: 0.28937047719955444, mean loss: 0.33913733464998136
Epoch: 72, step: 568, loss: 0.33903825283050537, mean loss: 0.3391373337021656
Epoch: 72, step: 569, loss: 0.35408350825309753, mean loss: 0.339137476675769
Epoch: 72, step: 570, loss: 0.318764328956604, mean loss: 0.33913728179015007
Epoch: 72, step: 571, loss: 0.3145080506801605, mean loss: 0.33913704619390833
Epoch: 72, step: 572, loss: 0.3413170874118805, mean loss: 0.339137067047365
Epoch: 72, step: 573, loss: 0.39248132705688477, mean loss: 0.33913757731366956
Epoch: 72, step: 574, loss: 0.31672802567481995, mean loss: 0.33913736295640373
Epoch: 72, step: 575, loss: 0.37972965836524963, mean loss: 0.33913775123593587
Epoch: 72, step: 576, loss: 0.3398492634296417, mean loss: 0.3391377580417343
Epoch: 72, step: 577, loss: 0.3345111906528473, mean loss: 0.33913771378784235
Epoch: 72, step: 578, loss: 0.2944830358028412, mean loss: 0.3391372866624539
Epoch: 72, step: 579, loss: 0.30515608191490173, mean loss: 0.33913696163275703
Epoch: 72, step: 580, loss: 0.33857935667037964, mean loss: 0.3391369562993252
Epoch: 72, step: 581, loss: 0.34748464822769165, mean loss: 0.33913703614334173
Epoch: 72, step: 582, loss: 0.325194776058197, mean loss: 0.3391369027896666
Epoch: 72, step: 583, loss: 0.324871301651001, mean loss: 0.3391367663446332
Epoch: 72, step: 584, loss: 0.33243536949157715, mean loss: 0.3391367022489415
Epoch: 72, step: 585, loss: 0.32937726378440857, mean loss: 0.3391366089054208
Epoch: 72, step: 586, loss: 0.34997260570526123, mean loss: 0.33913671254462313
Epoch: 72, step: 587, loss: 0.3446459472179413, mean loss: 0.33913676523633546
Epoch: 72, step: 588, loss: 0.31498774886131287, mean loss: 0.3391365342712506
Epoch: 72, step: 589, loss: 0.3138788044452667, mean loss: 0.339136292704562
Epoch: 72, step: 590, loss: 0.32616379857063293, mean loss: 0.3391361686359105
Epoch: 72, step: 591, loss: 0.36169904470443726, mean loss: 0.3391363844247023
Epoch: 72, step: 592, loss: 0.3330245912075043, mean loss: 0.33913632597276305
Epoch: 72, step: 593, loss: 0.32659557461738586, mean loss: 0.3391362060367313
Epoch: 72, step: 594, loss: 0.3278895318508148, mean loss: 0.33913609847789894
Epoch: 72, step: 595, loss: 0.336532324552536, mean loss: 0.3391360735766526
Epoch: 72, step: 596, loss: 0.32344716787338257, mean loss: 0.3391359235369098
Epoch: 72, step: 597, loss: 0.3156927227973938, mean loss: 0.3391356993416576
Epoch: 72, step: 598, loss: 0.3153665363788605, mean loss: 0.33913547203129235
Epoch: 72, step: 599, loss: 0.2957385778427124, mean loss: 0.3391350570200634
Epoch: 72, step: 600, loss: 0.29613474011421204, mean loss: 0.339134645805297
Epoch: 72, step: 601, loss: 0.3965676426887512, mean loss: 0.3391351950354479
Epoch: 72, step: 602, loss: 0.3488623797893524, mean loss: 0.3391352880553555
Epoch: 72, step: 603, loss: 0.34514120221138, mean loss: 0.33913534548864693
Epoch: 72, step: 604, loss: 0.3159458041191101, mean loss: 0.33913512373407007
Epoch: 72, step: 605, loss: 0.30582669377326965, mean loss: 0.33913480521866507
Epoch: 72, step: 606, loss: 0.32496896386146545, mean loss: 0.33913466975759543
Epoch: 72, step: 607, loss: 0.3859698176383972, mean loss: 0.33913511761511417
Epoch: 72, step: 608, loss: 0.32170164585113525, mean loss: 0.3391349509104682
Epoch: 72, step: 609, loss: 0.394211083650589, mean loss: 0.3391354775617021
Epoch: 72, step: 610, loss: 0.323179692029953, mean loss: 0.3391353249901004
Epoch: 72, step: 611, loss: 0.3354216516017914, mean loss: 0.339135289479741
Epoch: 72, step: 612, loss: 0.31064245104789734, mean loss: 0.33913501703217946
Epoch: 72, step: 613, loss: 0.3372126817703247, mean loss: 0.3391349986510502
Epoch: 72, step: 614, loss: 0.30877938866615295, mean loss: 0.3391347083972806
Epoch: 72, step: 615, loss: 0.3131921887397766, mean loss: 0.33913446034289696
Epoch: 72, step: 616, loss: 0.3621838390827179, mean loss: 0.3391346807318508
Epoch: 72, step: 617, loss: 0.3345481753349304, mean loss: 0.3391346368779373
Epoch: 72, step: 618, loss: 0.3277447521686554, mean loss: 0.3391345279744913
Epoch: 72, step: 619, loss: 0.33966466784477234, mean loss: 0.3391345330433316
Epoch: 72, step: 620, loss: 0.2933901250362396, mean loss: 0.33913409567029995
Epoch: 72, step: 621, loss: 0.3113609552383423, mean loss: 0.33913383012731846
Epoch: 72, step: 622, loss: 0.3267311155796051, mean loss: 0.3391337115443185
Epoch: 72, step: 623, loss: 0.40392300486564636, mean loss: 0.33913433099220475
Epoch: 72, step: 624, loss: 0.32699981331825256, mean loss: 0.33913421497566754
Epoch: 72, step: 625, loss: 0.3347663879394531, mean loss: 0.3391341732158435
Epoch: 72, step: 626, loss: 0.34765100479125977, mean loss: 0.3391342546425998
Epoch: 72, step: 627, loss: 0.3561398983001709, mean loss: 0.33913441722667237
Epoch: 72, step: 628, loss: 0.32149291038513184, mean loss: 0.33913424856498187
Epoch: 72, step: 629, loss: 0.3022797107696533, mean loss: 0.33913389622040746
Epoch: 72, step: 630, loss: 0.29669615626335144, mean loss: 0.33913349050199754
Epoch: 72, step: 631, loss: 0.3231058120727539, mean loss: 0.33913333727371425
Epoch: 72, step: 632, loss: 0.3593571186065674, mean loss: 0.33913353061585566
Epoch: 72, step: 633, loss: 0.3325277864933014, mean loss: 0.3391334674646337
Epoch: 72, step: 634, loss: 0.2889479994773865, mean loss: 0.33913298769380507
Epoch: 72, step: 635, loss: 0.3233315348625183, mean loss: 0.33913283663406707
Epoch: 72, step: 636, loss: 0.3246520459651947, mean loss: 0.339132698201003
Epoch: 72, step: 637, loss: 0.3291793167591095, mean loss: 0.33913260304985066
Epoch: 72, step: 638, loss: 0.3232446014881134, mean loss: 0.3391324511670745
Epoch: 72, step: 639, loss: 0.3023441731929779, mean loss: 0.3391320994895931
Epoch: 72, step: 640, loss: 0.3597377836704254, mean loss: 0.33913229646771337
Epoch: 72, step: 641, loss: 0.3393775224685669, mean loss: 0.3391322988119061
Epoch: 72, step: 642, loss: 0.35690557956695557, mean loss: 0.33913246871068115
Epoch: 72, step: 643, loss: 0.3946003317832947, mean loss: 0.33913299893535015
Epoch: 72, step: 644, loss: 0.34270286560058594, mean loss: 0.3391330330598535
Epoch: 72, step: 645, loss: 0.3447439968585968, mean loss: 0.33913308669477615
Epoch: 72, step: 646, loss: 0.3536089360713959, mean loss: 0.33913322506737453
Epoch: 72, step: 647, loss: 0.3214297890663147, mean loss: 0.3391330558443494
Epoch: 72, step: 648, loss: 0.3215104043483734, mean loss: 0.33913288739513464
Epoch: 72, step: 649, loss: 0.3367769718170166, mean loss: 0.3391328648759164
Epoch: 72, step: 650, loss: 0.3513626456260681, mean loss: 0.3391329817741925
Epoch: 72, step: 651, loss: 0.298252135515213, mean loss: 0.3391325910186366
Epoch: 72, step: 652, loss: 0.34087949991226196, mean loss: 0.3391326077161341
Epoch: 72, step: 653, loss: 0.3369509279727936, mean loss: 0.3391325868631611
Epoch: 72, step: 654, loss: 0.34500500559806824, mean loss: 0.33913264299248963
Epoch: 72, step: 655, loss: 0.35729455947875977, mean loss: 0.3391328165847484
Epoch: 72, step: 656, loss: 0.3261842131614685, mean loss: 0.3391326928227085
Epoch: 72, step: 657, loss: 0.31200137734413147, mean loss: 0.3391324335055648
Epoch: 72, step: 658, loss: 0.3209789991378784, mean loss: 0.33913225999935354
Epoch: 72, step: 659, loss: 0.2930397093296051, mean loss: 0.3391318194619193
Epoch: 72, step: 660, loss: 0.3244668245315552, mean loss: 0.3391316793000623
Epoch: 72, step: 661, loss: 0.30699023604393005, mean loss: 0.33913137210859473
Epoch: 72, step: 662, loss: 0.33535730838775635, mean loss: 0.33913133603836965
Epoch: 72, step: 663, loss: 0.3432386517524719, mean loss: 0.33913137529324117
Epoch: 72, step: 664, loss: 0.33670270442962646, mean loss: 0.33913135208191336
Epoch: 72, step: 665, loss: 0.2918681204319, mean loss: 0.3391309003813987
Epoch: 72, step: 666, loss: 0.36629506945610046, mean loss: 0.33913115999022053
Epoch: 72, step: 667, loss: 0.33495113253593445, mean loss: 0.3391311200419479
Epoch: 72, step: 668, loss: 0.3476397395133972, mean loss: 0.33913120135753866
Epoch: 72, step: 669, loss: 0.3336441218852997, mean loss: 0.3391311489188503
Epoch: 72, step: 670, loss: 0.34111928939819336, mean loss: 0.33913116791884534
Epoch: 72, step: 671, loss: 0.3737565279006958, mean loss: 0.33913149881869226
Epoch: 72, step: 672, loss: 0.29798567295074463, mean loss: 0.3391311056092823
Epoch: 72, step: 673, loss: 0.31198400259017944, mean loss: 0.3391308461809168
Epoch: 72, step: 674, loss: 0.3508591651916504, mean loss: 0.3391309582602629
Epoch: 72, step: 675, loss: 0.32778996229171753, mean loss: 0.3391308498833281
Epoch: 72, step: 676, loss: 0.32130900025367737, mean loss: 0.3391306795756246
Epoch: 72, step: 677, loss: 0.3319181501865387, mean loss: 0.3391306106524991
Epoch: 72, step: 678, loss: 0.3697090446949005, mean loss: 0.3391309028580477
Epoch: 72, step: 679, loss: 0.335697203874588, mean loss: 0.33913087004615466
Epoch: 72, step: 680, loss: 0.3139033317565918, mean loss: 0.3391306289780289
Epoch: 72, step: 681, loss: 0.32902586460113525, mean loss: 0.3391305324203187
Epoch: 72, step: 682, loss: 0.32158029079437256, mean loss: 0.339130364717749
Epoch: 72, step: 683, loss: 0.36461225152015686, mean loss: 0.33913060820938606
Epoch: 72, step: 684, loss: 0.36562901735305786, mean loss: 0.33913086141196164
Epoch: 72, step: 685, loss: 0.322002649307251, mean loss: 0.3391306977468164
Epoch: 72, step: 686, loss: 0.3304003179073334, mean loss: 0.3391306143262456
Epoch: 72, step: 687, loss: 0.3518439531326294, mean loss: 0.3391307358036459
Epoch: 72, step: 688, loss: 0.3178230822086334, mean loss: 0.3391305322085343
Epoch: 72, step: 689, loss: 0.3283206820487976, mean loss: 0.33913042892115863
Epoch: 72, step: 690, loss: 0.2783121168613434, mean loss: 0.3391298478119176
Epoch: 72, step: 691, loss: 0.2965298891067505, mean loss: 0.3391294407800171
Epoch: 72, step: 692, loss: 0.30977746844291687, mean loss: 0.3391291603319769
Epoch: 72, step: 693, loss: 0.3317726254463196, mean loss: 0.33912909004347785
Epoch: 72, step: 694, loss: 0.35020026564598083, mean loss: 0.3391291958227466
Epoch: 72, step: 695, loss: 0.37709280848503113, mean loss: 0.33912955854166293
Epoch: 72, step: 696, loss: 0.365496426820755, mean loss: 0.3391298104584286
Epoch: 72, step: 697, loss: 0.37767502665519714, mean loss: 0.33913017872717105
Epoch: 72, step: 698, loss: 0.3106441795825958, mean loss: 0.3391299065688103
Epoch: 72, step: 699, loss: 0.34477153420448303, mean loss: 0.33912996046902466
Epoch: 72, step: 700, loss: 0.3272039294242859, mean loss: 0.33912984652859296
Epoch: 72, step: 701, loss: 0.320559024810791, mean loss: 0.3391296691060104
Epoch: 72, step: 702, loss: 0.31205320358276367, mean loss: 0.3391294104243744
Epoch: 72, step: 703, loss: 0.33539336919784546, mean loss: 0.3391293747315317
Epoch: 72, step: 704, loss: 0.3656773269176483, mean loss: 0.3391296283590401
Epoch: 72, step: 705, loss: 0.32715436816215515, mean loss: 0.33912951395374175
Epoch: 72, step: 706, loss: 0.37568989396095276, mean loss: 0.3391298632289269
Epoch: 72, step: 707, loss: 0.3371768593788147, mean loss: 0.3391298445713182
Epoch: 72, step: 708, loss: 0.2985379993915558, mean loss: 0.3391294567894255
Epoch: 72, step: 709, loss: 0.32574379444122314, mean loss: 0.33912932891477804
Epoch: 72, step: 710, loss: 0.3398120105266571, mean loss: 0.33912933543644536
Epoch: 72, step: 711, loss: 0.34423306584358215, mean loss: 0.33912938419198996
Epoch: 72, step: 712, loss: 0.33806097507476807, mean loss: 0.33912937398565723
Epoch: 72, step: 713, loss: 0.31881117820739746, mean loss: 0.33912917989120184
Epoch: 72, step: 714, loss: 0.3494315445423126, mean loss: 0.33912927830607964
Epoch: 72, step: 715, loss: 0.33863240480422974, mean loss: 0.3391292735596666
Epoch: 72, step: 716, loss: 0.34734201431274414, mean loss: 0.339129352011601
Epoch: 72, step: 717, loss: 0.37193357944488525, mean loss: 0.3391296653699052
Epoch: 72, step: 718, loss: 0.31221136450767517, mean loss: 0.339129408238639
Epoch: 72, step: 719, loss: 0.3273879885673523, mean loss: 0.33912929608233006
Epoch: 72, step: 720, loss: 0.3523842692375183, mean loss: 0.33912942269518487
Epoch: 72, step: 721, loss: 0.32838597893714905, mean loss: 0.3391293200736952
Epoch: 72, step: 722, loss: 0.32880276441574097, mean loss: 0.33912922143526725
Epoch: 72, step: 723, loss: 0.31570369005203247, mean loss: 0.33912899767861554
Epoch: 72, step: 724, loss: 0.3396966755390167, mean loss: 0.33912900310092514
Epoch: 72, step: 725, loss: 0.32125163078308105, mean loss: 0.33912883234259783
Epoch: 72, step: 726, loss: 0.3122192323207855, mean loss: 0.33912857531408624
Epoch: 72, step: 727, loss: 0.31130993366241455, mean loss: 0.3391283096053519
Epoch: 72, step: 728, loss: 0.32513684034347534, mean loss: 0.3391281759676234
Epoch: 72, step: 729, loss: 0.28916680812835693, mean loss: 0.33912769877256865
Epoch: 72, step: 730, loss: 0.3226955831050873, mean loss: 0.3391275418263164
Epoch: 72, step: 731, loss: 0.34602054953575134, mean loss: 0.33912760766211114
Epoch: 72, step: 732, loss: 0.3215528726577759, mean loss: 0.3391274398056914
Epoch: 72, step: 733, loss: 0.315755158662796, mean loss: 0.339127216578999
Epoch: 72, step: 734, loss: 0.33053645491600037, mean loss: 0.3391271345301402
Epoch: 72, step: 735, loss: 0.3451460003852844, mean loss: 0.33912719201472397
Epoch: 72, step: 736, loss: 0.30780550837516785, mean loss: 0.3391268928725279
Epoch: 72, step: 737, loss: 0.3523271679878235, mean loss: 0.33912701894242947
Epoch: 72, step: 738, loss: 0.3071785569190979, mean loss: 0.3391267138199255
Epoch: 72, step: 739, loss: 0.3047516644001007, mean loss: 0.33912638552553137
Epoch: 72, step: 740, loss: 0.43511471152305603, mean loss: 0.3391273022406752
Epoch: 72, step: 741, loss: 0.34705498814582825, mean loss: 0.33912737795155196
Epoch: 72, step: 742, loss: 0.34784072637557983, mean loss: 0.33912746116485737
Epoch: 72, step: 743, loss: 0.31456857919692993, mean loss: 0.33912722662744077
Epoch: 72, step: 744, loss: 0.30467841029167175, mean loss: 0.33912689764425497
Epoch: 72, step: 745, loss: 0.3435281217098236, mean loss: 0.33912693967515883
Epoch: 72, step: 746, loss: 0.33431702852249146, mean loss: 0.33912689374180494
Epoch: 72, step: 747, loss: 0.3473290205001831, mean loss: 0.3391269720691547
Epoch: 72, step: 748, loss: 0.3261673152446747, mean loss: 0.339126848310292
Epoch: 72, step: 749, loss: 0.32650038599967957, mean loss: 0.3391267277344377
Epoch: 72, step: 750, loss: 0.34310054779052734, mean loss: 0.33912676568189765
Epoch: 72, step: 751, loss: 0.3014124631881714, mean loss: 0.3391264055376798
Epoch: 72, step: 752, loss: 0.3660458028316498, mean loss: 0.33912666259593266
Epoch: 72, step: 753, loss: 0.3351639211177826, mean loss: 0.33912662475535016
Epoch: 72, step: 754, loss: 0.33768272399902344, mean loss: 0.3391266109675408
Epoch: 72, step: 755, loss: 0.3323217034339905, mean loss: 0.33912654598809455
Epoch: 72, step: 756, loss: 0.32143720984458923, mean loss: 0.33912637707583726
Epoch: 72, step: 757, loss: 0.32312899827957153, mean loss: 0.33912622432123196
Epoch: 72, step: 758, loss: 0.3149353861808777, mean loss: 0.33912599333172455
Epoch: 72, step: 759, loss: 0.36447635293006897, mean loss: 0.3391262353907689
Epoch: 72, step: 760, loss: 0.3066466450691223, mean loss: 0.3391259252609069
Epoch: 72, step: 761, loss: 0.3003440201282501, mean loss: 0.33912555495721997
Epoch: 72, step: 762, loss: 0.3045254051685333, mean loss: 0.3391252245856033
Epoch: 72, step: 763, loss: 0.3096313774585724, mean loss: 0.3391249429730386
Epoch: 72, step: 764, loss: 0.30751076340675354, mean loss: 0.33912464111803997
Epoch: 72, step: 765, loss: 0.30997562408447266, mean loss: 0.3391243628032899
Epoch: 72, step: 766, loss: 0.30215567350387573, mean loss: 0.33912400982969654
Epoch: 72, step: 767, loss: 0.3153114914894104, mean loss: 0.3391237824721658
Epoch: 72, step: 768, loss: 0.32578951120376587, mean loss: 0.33912365516022
Epoch: 72, step: 769, loss: 0.3466656506061554, mean loss: 0.33912372716842565
Epoch: 72, step: 770, loss: 0.31646013259887695, mean loss: 0.33912351078680497
Epoch: 72, step: 771, loss: 0.351428359746933, mean loss: 0.3391236282667454
Epoch: 72, step: 772, loss: 0.3145740330219269, mean loss: 0.33912339388292967
Epoch: 72, step: 773, loss: 0.339516282081604, mean loss: 0.3391233976339388
Epoch: 72, step: 774, loss: 0.309885174036026, mean loss: 0.3391231184914319
Epoch: 72, step: 775, loss: 0.33631080389022827, mean loss: 0.33912309164202187
Epoch: 72, step: 776, loss: 0.30727383494377136, mean loss: 0.3391227875773248
Epoch: 72, step: 777, loss: 0.342246949672699, mean loss: 0.33912281740340017
Epoch: 72, step: 778, loss: 0.3622682988643646, mean loss: 0.3391230383689788
Epoch: 72, step: 779, loss: 0.37693411111831665, mean loss: 0.3391233993407658
Epoch: 72, step: 780, loss: 0.35902202129364014, mean loss: 0.33912358930555736
Epoch: 72, step: 781, loss: 0.3096850514411926, mean loss: 0.33912330826939635
Epoch: 72, step: 782, loss: 0.3441270887851715, mean loss: 0.3391233560377281
Epoch: 72, step: 783, loss: 0.36681580543518066, mean loss: 0.3391236203997393
Epoch: 72, step: 784, loss: 0.3529587984085083, mean loss: 0.33912375247402843
Epoch: 72, step: 785, loss: 0.36502397060394287, mean loss: 0.33912399972203927
Epoch: 72, step: 786, loss: 0.38394346833229065, mean loss: 0.3391244275724389
Epoch: 72, step: 787, loss: 0.3194391429424286, mean loss: 0.3391242396568576
Epoch: 72, step: 788, loss: 0.3296135663986206, mean loss: 0.3391241488689078
Epoch: 72, step: 789, loss: 0.2969246506690979, mean loss: 0.3391237460405014
Epoch: 72, step: 790, loss: 0.2970151901245117, mean loss: 0.33912334408404976
Epoch: 72, step: 791, loss: 0.313546359539032, mean loss: 0.3391230999356673
Epoch: 72, step: 792, loss: 0.36226513981819153, mean loss: 0.3391233208388649
Epoch: 72, step: 793, loss: 0.33395588397979736, mean loss: 0.33912327151337607
Epoch: 72, step: 794, loss: 0.35196053981781006, mean loss: 0.3391233940496561
Epoch: 72, step: 795, loss: 0.3167373239994049, mean loss: 0.3391231803687156
Epoch: 72, step: 796, loss: 0.29778656363487244, mean loss: 0.3391227858035771
Epoch: 72, step: 797, loss: 0.35475340485572815, mean loss: 0.33912293499910856
Epoch: 72, step: 798, loss: 0.35891392827033997, mean loss: 0.3391231239039476
Epoch: 72, step: 799, loss: 0.34372711181640625, mean loss: 0.3391231678485482
Epoch: 72, step: 800, loss: 0.29176053404808044, mean loss: 0.3391227157812974
Epoch: 72, step: 801, loss: 0.3314996063709259, mean loss: 0.3391226430208754
Epoch: 72, step: 802, loss: 0.3630206882953644, mean loss: 0.33912287111877726
Epoch: 72, step: 803, loss: 0.32725638151168823, mean loss: 0.33912275785865426
Epoch: 72, step: 804, loss: 0.3240881860256195, mean loss: 0.3391226143620298
Epoch: 72, step: 805, loss: 0.28115060925483704, mean loss: 0.33912206105677173
Epoch: 72, step: 806, loss: 0.3162798583507538, mean loss: 0.3391218430448156
Epoch: 72, step: 807, loss: 0.3074364960193634, mean loss: 0.3391215406344637
Epoch: 72, step: 808, loss: 0.33270344138145447, mean loss: 0.3391214793796153
Epoch: 72, step: 809, loss: 0.3302425742149353, mean loss: 0.3391213946394488
Epoch: 72, step: 810, loss: 0.3243411183357239, mean loss: 0.3391212535780118
Epoch: 72, step: 811, loss: 0.3499586284160614, mean loss: 0.3391213570078156
Epoch: 72, step: 812, loss: 0.3377154767513275, mean loss: 0.3391213435904951
Epoch: 72, step: 813, loss: 0.3415166139602661, mean loss: 0.3391213664500547
Epoch: 72, step: 814, loss: 0.31170618534088135, mean loss: 0.3391211048123739
Epoch: 72, step: 815, loss: 0.3370276093482971, mean loss: 0.3391210848332219
Epoch: 72, step: 816, loss: 0.3055352568626404, mean loss: 0.33912076431188803
Epoch: 72, step: 817, loss: 0.3090140223503113, mean loss: 0.3391204769954339
Epoch: 72, step: 818, loss: 0.3372620642185211, mean loss: 0.3391204592602876
Epoch: 72, step: 819, loss: 0.32880935072898865, mean loss: 0.3391203608605803
Epoch: 72, step: 820, loss: 0.2912662625312805, mean loss: 0.3391199041895716
Epoch: 72, step: 821, loss: 0.3704278767108917, mean loss: 0.3391202029582759
Epoch: 72, step: 822, loss: 0.3762316107749939, mean loss: 0.3391205571051761
Epoch: 72, step: 823, loss: 0.3458024561405182, mean loss: 0.3391206208686221
Epoch: 72, step: 824, loss: 0.35718220472335815, mean loss: 0.33912079322349176
Epoch: 72, step: 825, loss: 0.2943614423274994, mean loss: 0.33912036610599555
Epoch: 72, step: 826, loss: 0.33355164527893066, mean loss: 0.33912031296681117
Epoch: 72, step: 827, loss: 0.31569716334342957, mean loss: 0.3391200894549441
Epoch: 72, step: 828, loss: 0.3581337630748749, mean loss: 0.3391202708883212
Epoch: 72, step: 829, loss: 0.34851014614105225, mean loss: 0.3391203604880774
Epoch: 72, step: 830, loss: 0.36663952469825745, mean loss: 0.3391206230780278
Epoch: 72, step: 831, loss: 0.3326663672924042, mean loss: 0.3391205614916176
Epoch: 72, step: 832, loss: 0.302049845457077, mean loss: 0.3391202077667864
Epoch: 72, step: 833, loss: 0.3364565670490265, mean loss: 0.3391201823508524
Epoch: 72, step: 834, loss: 0.3506039083003998, mean loss: 0.3391202919252534
Epoch: 72, step: 835, loss: 0.3969442546367645, mean loss: 0.33912084365956424
Epoch: 72, step: 836, loss: 0.3735266625881195, mean loss: 0.3391211719437008
Epoch: 72, step: 837, loss: 0.3635849952697754, mean loss: 0.3391214053637657
Epoch: 72, step: 838, loss: 0.3482297658920288, mean loss: 0.33912149226979804
Epoch: 72, step: 839, loss: 0.32217153906822205, mean loss: 0.33912133054594873
Epoch: 72, step: 840, loss: 0.3117576539516449, mean loss: 0.33912106946458553
Epoch: 72, step: 841, loss: 0.3280258774757385, mean loss: 0.33912096360453414
Epoch: 72, step: 842, loss: 0.3200504183769226, mean loss: 0.3391207816527807
Epoch: 72, step: 843, loss: 0.3382734954357147, mean loss: 0.3391207735689142
Epoch: 72, step: 844, loss: 0.3568846881389618, mean loss: 0.3391209430508923
Epoch: 72, step: 845, loss: 0.35184621810913086, mean loss: 0.339121064459054
Epoch: 72, step: 846, loss: 0.3755093514919281, mean loss: 0.3391214116258434
Epoch: 72, step: 847, loss: 0.31935304403305054, mean loss: 0.33912122302517567
Epoch: 72, step: 848, loss: 0.32246071100234985, mean loss: 0.33912106407660797
Epoch: 72, step: 849, loss: 0.31838321685791016, mean loss: 0.33912086623036763
Epoch: 72, step: 850, loss: 0.32441189885139465, mean loss: 0.33912072590306647
Epoch: 72, step: 851, loss: 0.31297436356544495, mean loss: 0.3391204764624794
Epoch: 72, step: 852, loss: 0.37866100668907166, mean loss: 0.33912085368202727
Epoch: 72, step: 853, loss: 0.3715157210826874, mean loss: 0.33912116272848125
Epoch: 72, step: 854, loss: 0.31479111313819885, mean loss: 0.3391209306224588
Epoch: 72, step: 855, loss: 0.3350927233695984, mean loss: 0.3391208921941671
Epoch: 72, step: 856, loss: 0.30950409173965454, mean loss: 0.3391206096585081
Epoch: 72, step: 857, loss: 0.31626754999160767, mean loss: 0.33912039164904795
Epoch: 72, step: 858, loss: 0.3600999116897583, mean loss: 0.3391205917837465
Epoch: 72, step: 859, loss: 0.3238472044467926, mean loss: 0.339120446084245
Epoch: 72, step: 860, loss: 0.3475492596626282, mean loss: 0.33912052648960594
Epoch: 72, step: 861, loss: 0.31209251284599304, mean loss: 0.3391202686625179
Epoch: 72, step: 862, loss: 0.3086946904659271, mean loss: 0.33911997842796704
Epoch: 72, step: 863, loss: 0.34705448150634766, mean loss: 0.3391200541157635
Epoch: 72, step: 864, loss: 0.3793950378894806, mean loss: 0.33912043829807037
Epoch: 72, step: 865, loss: 0.34126797318458557, mean loss: 0.33912045878316954
Epoch: 72, step: 866, loss: 0.35625553131103516, mean loss: 0.33912062223118333
Epoch: 72, step: 867, loss: 0.33639612793922424, mean loss: 0.33912059624302765
Epoch: 72, step: 868, loss: 0.29090893268585205, mean loss: 0.33912013637042965
Epoch: 72, step: 869, loss: 0.34753328561782837, mean loss: 0.3391202166194734
Epoch: 72, step: 870, loss: 0.33767372369766235, mean loss: 0.3391202028221945
Epoch: 72, step: 871, loss: 0.2982819974422455, mean loss: 0.3391198132933374
Epoch: 72, step: 872, loss: 0.31821155548095703, mean loss: 0.33911961386508116
Epoch: 72, step: 873, loss: 0.32379215955734253, mean loss: 0.33911946766933604
Epoch: 72, step: 874, loss: 0.3725614845752716, mean loss: 0.33911978664167475
Epoch: 72, step: 875, loss: 0.31156787276268005, mean loss: 0.3391195238520647
Epoch: 72, step: 876, loss: 0.32161638140678406, mean loss: 0.3391193569090302
Epoch: 72, step: 877, loss: 0.3312579393386841, mean loss: 0.3391192819284151
Epoch: 72, step: 878, loss: 0.34741219878196716, mean loss: 0.33911936102382895
Epoch: 72, step: 879, loss: 0.3329630494117737, mean loss: 0.3391193023072906
Epoch: 72, step: 880, loss: 0.32915982604026794, mean loss: 0.3391192073185328
Epoch: 72, step: 881, loss: 0.3147902190685272, mean loss: 0.3391189752824026
Epoch: 72, step: 882, loss: 0.3381173014640808, mean loss: 0.33911896572909533
Epoch: 72, step: 883, loss: 0.30608612298965454, mean loss: 0.3391186506865331
Epoch: 72, step: 884, loss: 0.3492642045021057, mean loss: 0.3391187474463188
Epoch: 72, step: 885, loss: 0.3279457092285156, mean loss: 0.3391186408882646
Epoch: 72, step: 886, loss: 0.311390221118927, mean loss: 0.33911837644288984
Epoch: 72, step: 887, loss: 0.32090139389038086, mean loss: 0.33911820270955506
Epoch: 72, step: 888, loss: 0.3580654263496399, mean loss: 0.3391183834053945
Epoch: 72, step: 889, loss: 0.32099390029907227, mean loss: 0.3391182105575135
Epoch: 72, step: 890, loss: 0.3587644696235657, mean loss: 0.33911839791633885
Epoch: 72, step: 891, loss: 0.3021654486656189, mean loss: 0.33911804551361857
Epoch: 72, step: 892, loss: 0.3054729998111725, mean loss: 0.3391177246598626
Epoch: 72, step: 893, loss: 0.3270174264907837, mean loss: 0.33911760926726886
Epoch: 72, step: 894, loss: 0.2952022850513458, mean loss: 0.33911719047966776
Epoch: 72, step: 895, loss: 0.34575730562210083, mean loss: 0.33911725380087565
Epoch: 72, step: 896, loss: 0.31641703844070435, mean loss: 0.33911703733002874
Epoch: 72, step: 897, loss: 0.3464619815349579, mean loss: 0.33911710737126427
Epoch: 72, step: 898, loss: 0.29618901014328003, mean loss: 0.3391166980137235
Epoch: 72, step: 899, loss: 0.3684265613555908, mean loss: 0.33911697750664166
Epoch: 72, step: 900, loss: 0.3350363075733185, mean loss: 0.33911693859457104
Epoch: 72, step: 901, loss: 0.3110053241252899, mean loss: 0.3391166705330237
Epoch: 72, step: 902, loss: 0.38172444701194763, mean loss: 0.33911707682052433
Epoch: 72, step: 903, loss: 0.3857343792915344, mean loss: 0.33911752133671996
Epoch: 72, step: 904, loss: 0.31671154499053955, mean loss: 0.3391173076880559
Epoch: 72, step: 905, loss: 0.355394184589386, mean loss: 0.33911746289217615
Epoch: 72, step: 906, loss: 0.3814515769481659, mean loss: 0.3391178665547655
Epoch: 72, step: 907, loss: 0.3066767454147339, mean loss: 0.33911755722640496
Epoch: 72, step: 908, loss: 0.33712083101272583, mean loss: 0.3391175381876623
Epoch: 72, step: 909, loss: 0.34688693284988403, mean loss: 0.3391176122679715
Epoch: 72, step: 910, loss: 0.3121062219142914, mean loss: 0.3391173547198412
Epoch: 72, step: 911, loss: 0.3385065197944641, mean loss: 0.3391173488957096
Epoch: 72, step: 912, loss: 0.35536596179008484, mean loss: 0.3391175038199847
Epoch: 72, step: 913, loss: 0.32431796193122864, mean loss: 0.33911736271338977
Epoch: 72, step: 914, loss: 0.31457263231277466, mean loss: 0.33911712869328736
Epoch: 72, step: 915, loss: 0.33442801237106323, mean loss: 0.3391170839856454
Epoch: 72, step: 916, loss: 0.32297006249427795, mean loss: 0.3391169300358767
Epoch: 72, step: 917, loss: 0.32744261622428894, mean loss: 0.3391168187310904
Epoch: 72, step: 918, loss: 0.30306732654571533, mean loss: 0.3391164750327085
Epoch: 72, step: 919, loss: 0.3041445314884186, mean loss: 0.33911614161092957
Epoch: 72, step: 920, loss: 0.3221864104270935, mean loss: 0.33911598020476513
Epoch: 72, step: 921, loss: 0.36014804244041443, mean loss: 0.3391161807201835
Epoch: 72, step: 922, loss: 0.3597254455089569, mean loss: 0.33911637720286353
Epoch: 72, step: 923, loss: 0.3593802750110626, mean loss: 0.33911657039107435
Epoch: 72, step: 924, loss: 0.3420654833316803, mean loss: 0.3391165985046085
Epoch: 72, step: 925, loss: 0.3229365348815918, mean loss: 0.3391164442530439
Epoch: 72, step: 926, loss: 0.3568545877933502, mean loss: 0.33911661335684806
Epoch: 72, step: 927, loss: 0.32823681831359863, mean loss: 0.3391165096370204
Epoch: 72, step: 928, loss: 0.3680230379104614, mean loss: 0.3391167852076113
Epoch: 72, step: 929, loss: 0.3822709918022156, mean loss: 0.3391171965996931
Epoch: 72, step: 930, loss: 0.34558331966400146, mean loss: 0.33911725824111066
Epoch: 72, step: 931, loss: 0.3696626126766205, mean loss: 0.33911754942656763
Epoch: 72, step: 932, loss: 0.32892993092536926, mean loss: 0.3391174523100625
Epoch: 72, step: 933, loss: 0.3543267548084259, mean loss: 0.3391175972958826
Epoch: 72, step: 934, loss: 0.3032853603363037, mean loss: 0.33911725572093276
Epoch: 72, step: 935, loss: 0.3882239758968353, mean loss: 0.3391177238319693
Epoch: 72, step: 936, loss: 0.31250452995300293, mean loss: 0.3391174701434523
Epoch: 72, step: 937, loss: 0.3692023754119873, mean loss: 0.33911775692309565
Epoch: 72, step: 938, loss: 0.32050105929374695, mean loss: 0.3391175794640354
Epoch: 72, step: 939, loss: 0.3379412293434143, mean loss: 0.3391175682508761
Epoch: 72, step: 940, loss: 0.31059736013412476, mean loss: 0.3391172963942373
Epoch: 72, step: 941, loss: 0.3041355609893799, mean loss: 0.33911696294904237
Epoch: 72, step: 942, loss: 0.36738672852516174, mean loss: 0.33911723241330805
Epoch: 72, step: 943, loss: 0.34466755390167236, mean loss: 0.33911728531785174
Epoch: 72, step: 944, loss: 0.3403208553791046, mean loss: 0.3391172967899292
Epoch: 72, step: 945, loss: 0.3171398639678955, mean loss: 0.3391170873094707
Epoch: 72, step: 946, loss: 0.3524419665336609, mean loss: 0.3391172143158971
Epoch: 72, step: 947, loss: 0.301581472158432, mean loss: 0.3391168565464229
Epoch: 72, step: 948, loss: 0.32161664962768555, mean loss: 0.33911668974593373
Epoch: 72, step: 949, loss: 0.3223438262939453, mean loss: 0.339116529879529
Epoch: 72, step: 950, loss: 0.36694809794425964, mean loss: 0.33911679514671667
Epoch: 72, step: 951, loss: 0.2991659939289093, mean loss: 0.33911641437278206
Epoch: 72, step: 952, loss: 0.33518943190574646, mean loss: 0.3391163769447889
Epoch: 72, step: 953, loss: 0.35106831789016724, mean loss: 0.33911649085741874
Epoch: 72, step: 954, loss: 0.35344675183296204, mean loss: 0.3391166274362525
Epoch: 72, step: 955, loss: 0.3269152045249939, mean loss: 0.33911651114805424
Epoch: 72, step: 956, loss: 0.322407603263855, mean loss: 0.3391163519018509
Epoch: 72, step: 957, loss: 0.29601725935935974, mean loss: 0.33911594114481697
Epoch: 72, step: 958, loss: 0.38115251064300537, mean loss: 0.3391163417716289
Epoch: 72, step: 959, loss: 0.37975022196769714, mean loss: 0.3391167290265103
Epoch: 72, step: 960, loss: 0.3684259057044983, mean loss: 0.3391170083504024
Epoch: 72, step: 961, loss: 0.31765323877334595, mean loss: 0.3391168037971805
Epoch: 72, step: 962, loss: 0.318165123462677, mean loss: 0.3391166041261554
Epoch: 72, step: 963, loss: 0.36154794692993164, mean loss: 0.33911681789643333
Epoch: 72, step: 964, loss: 0.33915388584136963, mean loss: 0.3391168182496868
Epoch: 72, step: 965, loss: 0.3210182189941406, mean loss: 0.33911664577366135
Epoch: 72, step: 966, loss: 0.31328514218330383, mean loss: 0.3391163996069525
Epoch: 72, step: 967, loss: 0.29381829500198364, mean loss: 0.3391159679333171
Epoch: 72, step: 968, loss: 0.34173163771629333, mean loss: 0.3391159928594136
Epoch: 72, step: 969, loss: 0.3191898465156555, mean loss: 0.3391158029744687
Epoch: 72, step: 970, loss: 0.38135573267936707, mean loss: 0.3391162054933578
Epoch: 72, step: 971, loss: 0.29752445220947266, mean loss: 0.33911580915494266
Epoch: 72, step: 972, loss: 0.2815207839012146, mean loss: 0.33911526032250106
Epoch: 72, step: 973, loss: 0.3427020311355591, mean loss: 0.33911529450110267
Epoch: 72, step: 974, loss: 0.32295921444892883, mean loss: 0.3391151405501002
Epoch: 72, step: 975, loss: 0.3230048418045044, mean loss: 0.33911498703680987
Epoch: 72, step: 976, loss: 0.33819112181663513, mean loss: 0.33911497823348224
Epoch: 72, step: 977, loss: 0.3746751546859741, mean loss: 0.3391153170760913
Epoch: 72, step: 978, loss: 0.3215788006782532, mean loss: 0.33911514997730435
Epoch: 72, step: 979, loss: 0.349404901266098, mean loss: 0.33911524802349186
Epoch: 72, step: 980, loss: 0.3333781063556671, mean loss: 0.33911519335749535
Epoch: 72, step: 981, loss: 0.3306923508644104, mean loss: 0.33911511310173076
Epoch: 72, step: 982, loss: 0.34726160764694214, mean loss: 0.3391151907236166
Epoch: 72, step: 983, loss: 0.33124756813049316, mean loss: 0.3391151157596084
Epoch: 72, step: 984, loss: 0.34446439146995544, mean loss: 0.33911516672790576
Epoch: 72, step: 985, loss: 0.35758814215660095, mean loss: 0.33911534273811433
Epoch: 72, step: 986, loss: 0.34237906336784363, mean loss: 0.33911537383449497
Epoch: 72, step: 987, loss: 0.36871224641799927, mean loss: 0.3391156558276405
Epoch: 72, step: 988, loss: 0.30132022500038147, mean loss: 0.3391152957236853
Epoch: 72, step: 989, loss: 0.35235920548439026, mean loss: 0.3391154219066324
Epoch: 72, step: 990, loss: 0.40007928013801575, mean loss: 0.33911600274160825
Epoch: 72, step: 991, loss: 0.3432033956050873, mean loss: 0.3391160416839945
Epoch: 72, step: 992, loss: 0.3127819299697876, mean loss: 0.33911579078974124
Epoch: 72, step: 993, loss: 0.2982346713542938, mean loss: 0.3391154013047902
Epoch: 72, step: 994, loss: 0.33987143635749817, mean loss: 0.33911540850766214
Epoch: 72, step: 995, loss: 0.29318103194236755, mean loss: 0.3391149708873679
Epoch: 72, step: 996, loss: 0.33413687348365784, mean loss: 0.3391149234611077
Epoch: 72, step: 997, loss: 0.33076947927474976, mean loss: 0.33911484395494207
Epoch: 72, step: 998, loss: 0.36797645688056946, mean loss: 0.33911511891386176
Epoch: 72, step: 999, loss: 0.36459997296333313, mean loss: 0.3391153617007497
Epoch: 72, step: 1000, loss: 0.38099992275238037, mean loss: 0.33911576071913657
Epoch: 72, step: 1001, loss: 0.333676815032959, mean loss: 0.33911570890484977
Epoch: 72, step: 1002, loss: 0.35661596059799194, mean loss: 0.33911587561995865
Epoch: 72, step: 1003, loss: 0.32204511761665344, mean loss: 0.33911571299794513
Epoch: 72, step: 1004, loss: 0.3269205689430237, mean loss: 0.3391155968238427
Epoch: 72, step: 1005, loss: 0.34497833251953125, mean loss: 0.3391156526732501
Epoch: 72, step: 1006, loss: 0.326835036277771, mean loss: 0.33911553568714486
Epoch: 72, step: 1007, loss: 0.3285457193851471, mean loss: 0.3391154349992133
Epoch: 72, step: 1008, loss: 0.3265930116176605, mean loss: 0.33911531571190867
Epoch: 72, step: 1009, loss: 0.3076183497905731, mean loss: 0.3391150156779404
Epoch: 72, step: 1010, loss: 0.32254138588905334, mean loss: 0.339114857802272
Epoch: 72, step: 1011, loss: 0.31223198771476746, mean loss: 0.3391146017261614
Epoch: 72, step: 1012, loss: 0.33891791105270386, mean loss: 0.33911459985257786
Epoch: 72, step: 1013, loss: 0.31737756729125977, mean loss: 0.33911439279772504
Epoch: 72, step: 1014, loss: 0.3045842945575714, mean loss: 0.33911406388639426
Epoch: 72, step: 1015, loss: 0.32336723804473877, mean loss: 0.3391139138937683
Epoch: 72, step: 1016, loss: 0.37075069546699524, mean loss: 0.33911421523949936
Epoch: 72, step: 1017, loss: 0.3423890173435211, mean loss: 0.33911424643224986
Epoch: 72, step: 1018, loss: 0.32747888565063477, mean loss: 0.33911413560556863
Epoch: 72, step: 1019, loss: 0.36949071288108826, mean loss: 0.33911442493937133
Epoch: 72, step: 1020, loss: 0.3125777542591095, mean loss: 0.33911417218269513
Epoch: 72, step: 1021, loss: 0.32693883776664734, mean loss: 0.3391140562160848
Epoch: 72, step: 1022, loss: 0.3289893567562103, mean loss: 0.3391139597821099
Epoch: 72, step: 1023, loss: 0.3305850327014923, mean loss: 0.3391138785480437
Epoch: 72, step: 1024, loss: 0.32084354758262634, mean loss: 0.33911370453329065
Epoch: 72, step: 1025, loss: 0.3003568947315216, mean loss: 0.339113335399723
Epoch: 72, step: 1026, loss: 0.3221525549888611, mean loss: 0.33911317386078865
Epoch: 72, step: 1027, loss: 0.3158490061759949, mean loss: 0.3391129522888461
Epoch: 72, step: 1028, loss: 0.37196290493011475, mean loss: 0.33911326515447693
Epoch: 72, step: 1029, loss: 0.3007884621620178, mean loss: 0.3391129001494007
Epoch: 72, step: 1030, loss: 0.3191135823726654, mean loss: 0.3391127096778936
Epoch: 72, step: 1031, loss: 0.3413931429386139, mean loss: 0.3391127313963056
Epoch: 72, step: 1032, loss: 0.3618389070034027, mean loss: 0.33911294783401197
Epoch: 72, step: 1033, loss: 0.3557111322879791, mean loss: 0.3391131059089482
Epoch: 72, step: 1034, loss: 0.33731719851493835, mean loss: 0.33911308880555696
Epoch: 72, step: 1035, loss: 0.34603920578956604, mean loss: 0.3391131547660631
Epoch: 72, step: 1036, loss: 0.367869108915329, mean loss: 0.3391134286192524
Epoch: 72, step: 1037, loss: 0.2753832936286926, mean loss: 0.3391128217002669
Epoch: 72, step: 1038, loss: 0.34309378266334534, mean loss: 0.33911285961165344
Epoch: 72, step: 1039, loss: 0.33959561586380005, mean loss: 0.33911286420898173
Epoch: 72, step: 1040, loss: 0.4044336974620819, mean loss: 0.339113486258837
Epoch: 72, step: 1041, loss: 0.34480130672454834, mean loss: 0.3391135404233972
Epoch: 72, step: 1042, loss: 0.3036481738090515, mean loss: 0.33911320269338213
Epoch: 72, step: 1043, loss: 0.3367805480957031, mean loss: 0.3391131804801627
Epoch: 72, step: 1044, loss: 0.3201524615287781, mean loss: 0.33911299992424154
Epoch: 72, step: 1045, loss: 0.298526406288147, mean loss: 0.33911261343678617
Epoch: 72, step: 1046, loss: 0.3149893581867218, mean loss: 0.3391123837243141
Epoch: 72, step: 1047, loss: 0.3674044907093048, mean loss: 0.3391126531318995
Epoch: 72, step: 1048, loss: 0.35207489132881165, mean loss: 0.33911277656180316
Epoch: 72, step: 1049, loss: 0.3119376003742218, mean loss: 0.33911251779496143
Epoch: 72, step: 1050, loss: 0.3102353811264038, mean loss: 0.3391122428243688
Epoch: 72, step: 1051, loss: 0.3642643690109253, mean loss: 0.339112482322809
Epoch: 72, step: 1052, loss: 0.33651503920555115, mean loss: 0.33911245759020203
Epoch: 72, step: 1053, loss: 0.3303246796131134, mean loss: 0.33911237391461047
Epoch: 72, step: 1054, loss: 0.3155785799026489, mean loss: 0.33911214983232363
Epoch: 72, step: 1055, loss: 0.3763439655303955, mean loss: 0.3391125043400142
Epoch: 72, step: 1056, loss: 0.34415677189826965, mean loss: 0.3391125523692221
Epoch: 72, step: 1057, loss: 0.2996649146080017, mean loss: 0.3391121767704393
Epoch: 72, step: 1058, loss: 0.31687694787979126, mean loss: 0.3391119650607943
Epoch: 72, step: 1059, loss: 0.31544703245162964, mean loss: 0.33911173974056913
Epoch: 72, step: 1060, loss: 0.3481829762458801, mean loss: 0.3391118261094435
Epoch: 72, step: 1061, loss: 0.3553217351436615, mean loss: 0.33911198044543356
Epoch: 72, step: 1062, loss: 0.37167155742645264, mean loss: 0.3391122904451192
Epoch: 72, step: 1063, loss: 0.3418201208114624, mean loss: 0.33911231622612276
Epoch: 72, step: 1064, loss: 0.32970255613327026, mean loss: 0.3391122266375164
Epoch: 72, step: 1065, loss: 0.3269294202327728, mean loss: 0.3391121106483471
Epoch: 72, step: 1066, loss: 0.32992956042289734, mean loss: 0.3391120232246291
Epoch: 72, step: 1067, loss: 0.31033509969711304, mean loss: 0.339111749252624
Epoch: 72, step: 1068, loss: 0.34371939301490784, mean loss: 0.3391117931194877
Epoch: 72, step: 1069, loss: 0.33758285641670227, mean loss: 0.33911177856345365
Epoch: 72, step: 1070, loss: 0.31360113620758057, mean loss: 0.3391115356951632
Epoch: 72, step: 1071, loss: 0.30817389488220215, mean loss: 0.33911124116316765
Epoch: 72, step: 1072, loss: 0.2818525731563568, mean loss: 0.3391106960553716
Epoch: 72, step: 1073, loss: 0.4112533628940582, mean loss: 0.33911138285366976
Epoch: 72, step: 1074, loss: 0.3513311743736267, mean loss: 0.33911149918499617
Epoch: 72, step: 1075, loss: 0.30780041217803955, mean loss: 0.33911120110907556
Epoch: 72, step: 1076, loss: 0.3233293294906616, mean loss: 0.33911105086992455
Epoch: 72, step: 1077, loss: 0.4021387994289398, mean loss: 0.33911165087133877
Epoch: 72, step: 1078, loss: 0.302143931388855, mean loss: 0.3391112989553442
Epoch: 72, step: 1079, loss: 0.33218008279800415, mean loss: 0.3391112329739247
Epoch: 72, step: 1080, loss: 0.34222304821014404, mean loss: 0.3391112625964364
Epoch: 72, step: 1081, loss: 0.3442661166191101, mean loss: 0.3391113116669174
Epoch: 72, step: 1082, loss: 0.3468879461288452, mean loss: 0.33911138569414667
Epoch: 72, step: 1083, loss: 0.3429020345211029, mean loss: 0.3391114217776941
Epoch: 72, step: 1084, loss: 0.35113054513931274, mean loss: 0.3391115361877858
Epoch: 72, step: 1085, loss: 0.3584827184677124, mean loss: 0.33911172058040556
Epoch: 72, step: 1086, loss: 0.3557734191417694, mean loss: 0.33911187918017294
Epoch: 72, step: 1087, loss: 0.31542983651161194, mean loss: 0.33911165375713503
Epoch: 72, step: 1088, loss: 0.38830310106277466, mean loss: 0.33911212199292423
Epoch: 72, step: 1089, loss: 0.3142782151699066, mean loss: 0.3391118856100993
Epoch: 72, step: 1090, loss: 0.362006813287735, mean loss: 0.33911210353457677
Epoch: 72, step: 1091, loss: 0.33996790647506714, mean loss: 0.3391121116804262
Epoch: 72, step: 1092, loss: 0.3776862621307373, mean loss: 0.3391124788399854
Epoch: 72, step: 1093, loss: 0.34863343834877014, mean loss: 0.33911256946227997
Epoch: 72, step: 1094, loss: 0.35481706261634827, mean loss: 0.3391127189391953
Epoch: 72, step: 1095, loss: 0.34193235635757446, mean loss: 0.339112745776527
Epoch: 72, step: 1096, loss: 0.3293277621269226, mean loss: 0.3391126526438601
Epoch: 72, step: 1097, loss: 0.32576510310173035, mean loss: 0.33911252560419414
Epoch: 72, step: 1098, loss: 0.3229377269744873, mean loss: 0.33911237165672603
Epoch: 72, step: 1099, loss: 0.3444904386997223, mean loss: 0.33911242284326276
Epoch: 72, step: 1100, loss: 0.3472382128238678, mean loss: 0.3391125001809169
Epoch: 72, step: 1101, loss: 0.35142195224761963, mean loss: 0.33911261733569054
Epoch: 72, step: 1102, loss: 0.3145269751548767, mean loss: 0.3391123833449397
Epoch: 72, step: 1103, loss: 0.33714956045150757, mean loss: 0.339112364664198
Epoch: 72, step: 1104, loss: 0.3143766522407532, mean loss: 0.33911212924965356
Epoch: 72, step: 1105, loss: 0.30844414234161377, mean loss: 0.3391118373792869
Epoch: 72, step: 1106, loss: 0.3262869119644165, mean loss: 0.3391117153243222
Epoch: 72, step: 1107, loss: 0.35808059573173523, mean loss: 0.3391118958496601
Epoch: 72, step: 1108, loss: 0.320211797952652, mean loss: 0.3391117159806317
Epoch: 72, step: 1109, loss: 0.3272063732147217, mean loss: 0.33911160268058066
Epoch: 72, step: 1110, loss: 0.32301512360572815, mean loss: 0.33911144949603306
Epoch: 72, step: 1111, loss: 0.37844541668891907, mean loss: 0.3391118238200452
Epoch: 72, step: 1112, loss: 0.3485296070575714, mean loss: 0.3391119134440803
Epoch: 72, step: 1113, loss: 0.3573041558265686, mean loss: 0.3391120865683298
Epoch: 72, step: 1114, loss: 0.3134540617465973, mean loss: 0.33911184239919856
Epoch: 72, step: 1115, loss: 0.29952195286750793, mean loss: 0.3391114656540277
Epoch: 72, step: 1116, loss: 0.3410821855068207, mean loss: 0.33911148440760674
Epoch: 72, step: 1117, loss: 0.3015388548374176, mean loss: 0.33911112686588313
Epoch: 72, step: 1118, loss: 0.35346123576164246, mean loss: 0.3391112634204417
Epoch: 72, step: 1119, loss: 0.32889729738235474, mean loss: 0.3391111662260328
Epoch: 72, step: 1120, loss: 0.30598756670951843, mean loss: 0.33911085103034616
Epoch: 72, step: 1121, loss: 0.36767566204071045, mean loss: 0.3391111228431829
Epoch: 72, step: 1122, loss: 0.3225432336330414, mean loss: 0.33911096519039424
Epoch: 72, step: 1123, loss: 0.37226802110671997, mean loss: 0.33911128069543667
Epoch: 72, step: 1124, loss: 0.2876257598400116, mean loss: 0.3391107907910581
Epoch: 72, step: 1125, loss: 0.36032915115356445, mean loss: 0.33911099268993306
Epoch: 72, step: 1126, loss: 0.33518505096435547, mean loss: 0.33911095533381025
Epoch: 72, step: 1127, loss: 0.33570796251296997, mean loss: 0.3391109229539592
Epoch: 72, step: 1128, loss: 0.4288817048072815, mean loss: 0.3391117771246953
Epoch: 72, step: 1129, loss: 0.3443596661090851, mean loss: 0.339111827057986
Epoch: 72, step: 1130, loss: 0.32472750544548035, mean loss: 0.33911169019349047
Epoch: 72, step: 1131, loss: 0.3426815867424011, mean loss: 0.339111724160156
Epoch: 72, step: 1132, loss: 0.3002641499042511, mean loss: 0.33911135453879887
Epoch: 72, step: 1133, loss: 0.3227693736553192, mean loss: 0.3391111990519301
Epoch: 72, step: 1134, loss: 0.32994645833969116, mean loss: 0.33911111185422205
Epoch: 72, step: 1135, loss: 0.3132820725440979, mean loss: 0.3391108661067785
Epoch: 72, step: 1136, loss: 0.4024222791194916, mean loss: 0.33911146847025325
Epoch: 72, step: 1137, loss: 0.3769637942314148, mean loss: 0.3391118286050292
Epoch: 72, step: 1138, loss: 0.3161897659301758, mean loss: 0.33911161052190747
Epoch: 72, step: 1139, loss: 0.34736698865890503, mean loss: 0.3391116890637705
Epoch: 72, step: 1140, loss: 0.33602505922317505, mean loss: 0.3391116596977805
Epoch: 72, step: 1141, loss: 0.3885946273803711, mean loss: 0.33911213047094846
Epoch: 72, step: 1142, loss: 0.3196043074131012, mean loss: 0.33911194487835533
Epoch: 72, step: 1143, loss: 0.31053951382637024, mean loss: 0.3391116730499147
Epoch: 72, step: 1144, loss: 0.31430113315582275, mean loss: 0.33911143701307916
Epoch: 72, step: 1145, loss: 0.30855754017829895, mean loss: 0.33911114633917433
Epoch: 72, step: 1146, loss: 0.3455817997455597, mean loss: 0.33911120789702437
Epoch: 72, step: 1147, loss: 0.31924062967300415, mean loss: 0.33911101886226064
Epoch: 72, step: 1148, loss: 0.3280651867389679, mean loss: 0.33911091378095004
Epoch: 72, step: 1149, loss: 0.3072222173213959, mean loss: 0.3391106104199989
Epoch: 72, step: 1150, loss: 0.35961899161338806, mean loss: 0.33911080551680534
Epoch: 72, step: 1151, loss: 0.35870158672332764, mean loss: 0.3391109918826844
Epoch: 72, step: 1152, loss: 0.3061083257198334, mean loss: 0.3391106779333673
Epoch: 72, step: 1153, loss: 0.3240494728088379, mean loss: 0.33911053465978874
Epoch: 72, step: 1154, loss: 0.3396082818508148, mean loss: 0.3391105393946916
Epoch: 72, step: 1155, loss: 0.3759748637676239, mean loss: 0.33911089006936507
Epoch: 72, step: 1156, loss: 0.3411343991756439, mean loss: 0.3391109093179654
Epoch: 72, step: 1157, loss: 0.32582366466522217, mean loss: 0.33911078292445046
Epoch: 72, step: 1158, loss: 0.3094134032726288, mean loss: 0.3391105004339423
Epoch: 72, step: 1159, loss: 0.3242779076099396, mean loss: 0.3391103593431499
Epoch: 72, step: 1160, loss: 0.31710389256477356, mean loss: 0.3391101500149267
Epoch: 72, step: 1161, loss: 0.3854195177555084, mean loss: 0.339110590511148
Epoch: 72, step: 1162, loss: 0.3539358079433441, mean loss: 0.33911073152775995
Epoch: 72, step: 1163, loss: 0.36596912145614624, mean loss: 0.3391109870007836
Epoch: 72, step: 1164, loss: 0.33107706904411316, mean loss: 0.3391109105840738
Epoch: 72, step: 1165, loss: 0.299755722284317, mean loss: 0.3391105362504776
Epoch: 72, step: 1166, loss: 0.33792516589164734, mean loss: 0.3391105249757322
Epoch: 72, step: 1167, loss: 0.3660464286804199, mean loss: 0.33911078117630766
Epoch: 72, step: 1168, loss: 0.346721351146698, mean loss: 0.3391108535634784
Epoch: 72, step: 1169, loss: 0.34455910325050354, mean loss: 0.3391109053834644
Epoch: 72, step: 1170, loss: 0.30418628454208374, mean loss: 0.33911057320776516
Epoch: 72, step: 1171, loss: 0.3077124059200287, mean loss: 0.3391102745757765
Epoch: 72, step: 1172, loss: 0.30301350355148315, mean loss: 0.33910993125803157
Epoch: 72, step: 1173, loss: 0.3009342551231384, mean loss: 0.33910956817119536
Epoch: 72, step: 1174, loss: 0.3791029751300812, mean loss: 0.3391099485427556
Epoch: 72, step: 1175, loss: 0.3392924964427948, mean loss: 0.339109950278926
Epoch: 72, step: 1176, loss: 0.31753334403038025, mean loss: 0.33910974507082053
Epoch: 72, step: 1177, loss: 0.31671223044395447, mean loss: 0.33910953205734756
Epoch: 72, step: 1178, loss: 0.35759925842285156, mean loss: 0.3391097079037946
Epoch: 72, step: 1179, loss: 0.3474753201007843, mean loss: 0.3391097874641495
Epoch: 72, step: 1180, loss: 0.3556367754936218, mean loss: 0.3391099446409941
Epoch: 72, step: 1181, loss: 0.320742130279541, mean loss: 0.33910976995897446
Epoch: 72, step: 1182, loss: 0.3385845422744751, mean loss: 0.3391097649639893
Epoch: 72, step: 1183, loss: 0.33894577622413635, mean loss: 0.3391097634044494
Epoch: 72, step: 1184, loss: 0.35505446791648865, mean loss: 0.3391099150378266
Epoch: 72, step: 1185, loss: 0.31672802567481995, mean loss: 0.3391097021891536
Epoch: 72, step: 1186, loss: 0.3358985185623169, mean loss: 0.3391096716515317
Epoch: 72, step: 1187, loss: 0.3504026234149933, mean loss: 0.3391097790438989
Epoch: 72, step: 1188, loss: 0.32535773515701294, mean loss: 0.33910964826759404
Epoch: 72, step: 1189, loss: 0.4038848876953125, mean loss: 0.3391102642477328
Epoch: 72, step: 1190, loss: 0.36589592695236206, mean loss: 0.3391105189635698
Epoch: 72, step: 1191, loss: 0.3174600303173065, mean loss: 0.3391103130821639
Epoch: 72, step: 1192, loss: 0.35099315643310547, mean loss: 0.339110426078839
Epoch: 72, step: 1193, loss: 0.3029060363769531, mean loss: 0.33911008180629093
Epoch: 72, step: 1194, loss: 0.33983421325683594, mean loss: 0.3391100886920915
Epoch: 72, step: 1195, loss: 0.3304632604122162, mean loss: 0.33911000646976946
Epoch: 72, step: 1196, loss: 0.35935062170028687, mean loss: 0.3391101989350881
Epoch: 72, step: 1197, loss: 0.3318987190723419, mean loss: 0.3391101303627371
Epoch: 72, step: 1198, loss: 0.3606933653354645, mean loss: 0.33911033559094533
Epoch: 72, step: 1199, loss: 0.3484577536582947, mean loss: 0.33911042447176526
Epoch: 72, step: 1200, loss: 0.3058411180973053, mean loss: 0.33911010813038733
Epoch: 72, step: 1201, loss: 0.31241676211357117, mean loss: 0.33910985431897706
Epoch: 72, step: 1202, loss: 0.3170434534549713, mean loss: 0.3391096445044762
Epoch: 72, step: 1203, loss: 0.3364804983139038, mean loss: 0.3391096195059387
Epoch: 72, step: 1204, loss: 0.356668621301651, mean loss: 0.33910978645945145
Epoch: 72, step: 1205, loss: 0.2917175590991974, mean loss: 0.33910933585162667
Epoch: 72, step: 1206, loss: 0.3110829293727875, mean loss: 0.3391090693775931
Epoch: 72, step: 1207, loss: 0.3294353485107422, mean loss: 0.3391089774010883
Epoch: 72, step: 1208, loss: 0.3407764434814453, mean loss: 0.3391089932549925
Epoch: 72, step: 1209, loss: 0.3742589056491852, mean loss: 0.3391093274495236
Epoch: 72, step: 1210, loss: 0.3095461428165436, mean loss: 0.33910904637455014
Epoch: 72, step: 1211, loss: 0.355196475982666, mean loss: 0.339109199325963
Epoch: 72, step: 1212, loss: 0.34492623805999756, mean loss: 0.33910925463099656
Epoch: 72, step: 1213, loss: 0.33420321345329285, mean loss: 0.3391092079876433
Epoch: 72, step: 1214, loss: 0.3243575990200043, mean loss: 0.33910906774056
Epoch: 72, step: 1215, loss: 0.3153204917907715, mean loss: 0.339108841579015
Epoch: 72, step: 1216, loss: 0.34322690963745117, mean loss: 0.33910888072973094
Epoch: 72, step: 1217, loss: 0.328819215297699, mean loss: 0.3391087829062047
Epoch: 72, step: 1218, loss: 0.3521263003349304, mean loss: 0.3391089066621577
Epoch: 72, step: 1219, loss: 0.31818121671676636, mean loss: 0.33910870770704926
Epoch: 72, step: 1220, loss: 0.32042959332466125, mean loss: 0.33910853013035985
Epoch: 72, step: 1221, loss: 0.3234713673591614, mean loss: 0.33910838147399736
Epoch: 72, step: 1222, loss: 0.37085413932800293, mean loss: 0.3391086832655751
Epoch: 72, step: 1223, loss: 0.2995143532752991, mean loss: 0.3391083068649934
Epoch: 72, step: 1224, loss: 0.32352182269096375, mean loss: 0.3391081586946382
Epoch: 72, step: 1225, loss: 0.3066346049308777, mean loss: 0.3391078499930605
Epoch: 72, step: 1226, loss: 0.34174516797065735, mean loss: 0.33910787506381457
Epoch: 72, step: 1227, loss: 0.3053761422634125, mean loss: 0.3391075544077744
Epoch: 72, step: 1228, loss: 0.3488577902317047, mean loss: 0.3391076470932676
Epoch: 72, step: 1229, loss: 0.32221519947052, mean loss: 0.3391074865156176
Epoch: 72, step: 1230, loss: 0.3585498631000519, mean loss: 0.33910767133084
Epoch: 72, step: 1231, loss: 0.35851380228996277, mean loss: 0.3391078557997655
Epoch: 72, step: 1232, loss: 0.3389663100242615, mean loss: 0.3391078544542861
Epoch: 72, step: 1233, loss: 0.31584545969963074, mean loss: 0.3391076333330645
Epoch: 72, step: 1234, loss: 0.3253827691078186, mean loss: 0.339107502872296
Epoch: 72, step: 1235, loss: 0.29332658648490906, mean loss: 0.3391070677090286
Epoch: 72, step: 1236, loss: 0.3406960964202881, mean loss: 0.3391070828131464
Epoch: 72, step: 1237, loss: 0.3616310954093933, mean loss: 0.3391072969075193
Epoch: 72, step: 1238, loss: 0.3283851444721222, mean loss: 0.3391071949926996
Epoch: 72, step: 1239, loss: 0.37163081765174866, mean loss: 0.33910750412910234
Epoch: 72, step: 1240, loss: 0.3103630840778351, mean loss: 0.339107230916544
Epoch: 72, step: 1241, loss: 0.3253364861011505, mean loss: 0.3391071000283697
Epoch: 72, step: 1242, loss: 0.33971142768859863, mean loss: 0.3391071057723286
Epoch: 72, step: 1243, loss: 0.32454559206962585, mean loss: 0.33910696737068524
Epoch: 72, step: 1244, loss: 0.3038012683391571, mean loss: 0.3391066318066482
Epoch: 72, step: 1245, loss: 0.3094397187232971, mean loss: 0.33910634983929516
Epoch: 72, step: 1246, loss: 0.3807976245880127, mean loss: 0.3391067460876889
Epoch: 72, step: 1247, loss: 0.36625930666923523, mean loss: 0.33910700415262757
Epoch: 72, step: 1248, loss: 0.32350078225135803, mean loss: 0.3391068558284794
Epoch: 72, step: 1249, loss: 0.33947479724884033, mean loss: 0.33910685932542306
Epoch: 72, step: 1250, loss: 0.31173375248908997, mean loss: 0.33910659917177366
Epoch: 72, step: 1251, loss: 0.29867321252822876, mean loss: 0.3391062148970479
Epoch: 72, step: 1252, loss: 0.34538185596466064, mean loss: 0.33910627453952485
Epoch: 72, step: 1253, loss: 0.3472195565700531, mean loss: 0.33910635164585273
Epoch: 72, step: 1254, loss: 0.35864078998565674, mean loss: 0.33910653729384166
Epoch: 72, step: 1255, loss: 0.28248995542526245, mean loss: 0.3391059992361565
Epoch: 72, step: 1256, loss: 0.3449600636959076, mean loss: 0.3391060548699361
Epoch: 72, step: 1257, loss: 0.3265362083911896, mean loss: 0.3391059354142267
Epoch: 72, step: 1258, loss: 0.3152781128883362, mean loss: 0.3391057089721298
Epoch: 72, step: 1259, loss: 0.32143792510032654, mean loss: 0.33910554107210444
Epoch: 72, step: 1260, loss: 0.34174463152885437, mean loss: 0.3391055661516021
Epoch: 72, step: 1261, loss: 0.29373136162757874, mean loss: 0.339105134960834
Epoch: 72, step: 1262, loss: 0.3380163908004761, mean loss: 0.3391051246146037
Epoch: 72, step: 1263, loss: 0.3209112286567688, mean loss: 0.3391049517214157
Epoch: 72, step: 1264, loss: 0.3271920382976532, mean loss: 0.3391048385163049
Epoch: 72, step: 1265, loss: 0.3097492456436157, mean loss: 0.33910455956090196
Epoch: 72, step: 1266, loss: 0.3530011773109436, mean loss: 0.33910469161409484
Epoch: 72, step: 1267, loss: 0.2887246310710907, mean loss: 0.3391042128800063
Epoch: 72, step: 1268, loss: 0.33366256952285767, mean loss: 0.33910416117154485
Epoch: 72, step: 1269, loss: 0.34116873145103455, mean loss: 0.3391041807896512
Epoch: 72, step: 1270, loss: 0.3171882629394531, mean loss: 0.3391039725406385
Epoch: 72, step: 1271, loss: 0.3219625651836395, mean loss: 0.3391038096614352
Epoch: 72, step: 1272, loss: 0.33112579584121704, mean loss: 0.33910373385434656
Epoch: 72, step: 1273, loss: 0.3152337968349457, mean loss: 0.33910350704435605
Epoch: 72, step: 1274, loss: 0.3233706057071686, mean loss: 0.3391033575531658
Epoch: 72, step: 1275, loss: 0.35702309012413025, mean loss: 0.33910352782161407
Epoch: 72, step: 1276, loss: 0.30915164947509766, mean loss: 0.33910324322967766
Epoch: 72, step: 1277, loss: 0.4338934123516083, mean loss: 0.33910414388309085
Epoch: 72, step: 1278, loss: 0.3668610453605652, mean loss: 0.3391044076141376
Epoch: 72, step: 1279, loss: 0.3121020495891571, mean loss: 0.33910415105479186
Epoch: 72, step: 1280, loss: 0.33927860856056213, mean loss: 0.3391041527123611
Epoch: 72, step: 1281, loss: 0.318732887506485, mean loss: 0.33910395916114777
Epoch: 72, step: 1282, loss: 0.3425816297531128, mean loss: 0.3391039922028347
Epoch: 72, step: 1283, loss: 0.31474369764328003, mean loss: 0.33910376075550297
Epoch: 72, step: 1284, loss: 0.34258654713630676, mean loss: 0.33910379384516676
Epoch: 72, step: 1285, loss: 0.3538998067378998, mean loss: 0.3391039344195192
Epoch: 72, step: 1286, loss: 0.36802923679351807, mean loss: 0.33910420923118967
Epoch: 72, step: 1287, loss: 0.3134787082672119, mean loss: 0.33910396577237534
Epoch: 72, step: 1288, loss: 0.29832738637924194, mean loss: 0.33910357837220817
Epoch: 72, step: 1289, loss: 0.35225099325180054, mean loss: 0.33910370327876993
Epoch: 72, step: 1290, loss: 0.3122677803039551, mean loss: 0.3391034483274311
Epoch: 72, step: 1291, loss: 0.324004590511322, mean loss: 0.33910330488397855
Epoch: 72, step: 1292, loss: 0.3373640775680542, mean loss: 0.3391032883609803
Epoch: 72, step: 1293, loss: 0.33201274275779724, mean loss: 0.3391032210000561
Epoch: 72, step: 1294, loss: 0.339124858379364, mean loss: 0.3391032212056115
Epoch: 72, step: 1295, loss: 0.3509489595890045, mean loss: 0.33910333373922585
Epoch: 72, step: 1296, loss: 0.32110199332237244, mean loss: 0.33910316272948454
Epoch: 72, step: 1297, loss: 0.35583487153053284, mean loss: 0.3391033216764266
Epoch: 72, step: 1298, loss: 0.3432399034500122, mean loss: 0.33910336097251914
Epoch: 72, step: 1299, loss: 0.33146166801452637, mean loss: 0.3391032883797753
Epoch: 72, step: 1300, loss: 0.30002132058143616, mean loss: 0.33910291712168605
Epoch: 72, step: 1301, loss: 0.33626559376716614, mean loss: 0.33910289016886613
Epoch: 72, step: 1302, loss: 0.358395516872406, mean loss: 0.3391030734351665
Epoch: 72, step: 1303, loss: 0.33514949679374695, mean loss: 0.3391030358793431
Epoch: 72, step: 1304, loss: 0.3347487449645996, mean loss: 0.33910299451744674
Epoch: 72, step: 1305, loss: 0.3284686207771301, mean loss: 0.33910289350130085
Epoch: 72, step: 1306, loss: 0.3489570915699005, mean loss: 0.339102987105652
Epoch: 72, step: 1307, loss: 0.3883846402168274, mean loss: 0.3391034552242461
Epoch: 72, step: 1308, loss: 0.31220123171806335, mean loss: 0.339103199686726
Epoch: 72, step: 1309, loss: 0.30672532320022583, mean loss: 0.3391028921402634
Epoch: 72, step: 1310, loss: 0.4138135015964508, mean loss: 0.3391036017842518
Epoch: 72, step: 1311, loss: 0.3688488006591797, mean loss: 0.33910388431843563
Epoch: 72, step: 1312, loss: 0.3542827367782593, mean loss: 0.3391040284930964
Epoch: 72, step: 1313, loss: 0.38844913244247437, mean loss: 0.3391044971876876
Epoch: 72, step: 1314, loss: 0.33550167083740234, mean loss: 0.3391044629672878
Epoch: 72, step: 1315, loss: 0.3681887686252594, mean loss: 0.3391047392134948
Epoch: 72, step: 1316, loss: 0.33049774169921875, mean loss: 0.33910465746398144
Epoch: 72, step: 1317, loss: 0.35302427411079407, mean loss: 0.33910478967165053
Epoch: 72, step: 1318, loss: 0.3276902437210083, mean loss: 0.3391046812580197
Epoch: 72, step: 1319, loss: 0.32416683435440063, mean loss: 0.33910453938195684
Epoch: 72, step: 1320, loss: 0.32483577728271484, mean loss: 0.33910440386198704
Epoch: 72, step: 1321, loss: 0.31928956508636475, mean loss: 0.3391042156690079
Epoch: 72, step: 1322, loss: 0.3282903730869293, mean loss: 0.33910411296466864
Epoch: 72, step: 1323, loss: 0.3164232671260834, mean loss: 0.33910389755565523
Epoch: 72, step: 1324, loss: 0.38206303119659424, mean loss: 0.3391043055517579
Epoch: 72, step: 1325, loss: 0.33638590574264526, mean loss: 0.33910427973452417
Epoch: 72, step: 1326, loss: 0.3408661186695099, mean loss: 0.3391042964669325
Epoch: 72, step: 1327, loss: 0.32075703144073486, mean loss: 0.3391041222222791
Epoch: 72, step: 1328, loss: 0.3355710208415985, mean loss: 0.3391040886686035
Epoch: 72, step: 1329, loss: 0.32726356387138367, mean loss: 0.3391039762208381
Epoch: 72, step: 1330, loss: 0.36008670926094055, mean loss: 0.33910417548895117
Epoch: 72, step: 1331, loss: 0.36794355511665344, mean loss: 0.33910444936720024
Epoch: 72, step: 1332, loss: 0.3414975106716156, mean loss: 0.3391044720931127
Epoch: 72, step: 1333, loss: 0.358697772026062, mean loss: 0.33910465816080304
Epoch: 72, step: 1334, loss: 0.3335058391094208, mean loss: 0.3391046049921464
Epoch: 72, step: 1335, loss: 0.3504336178302765, mean loss: 0.3391047125760258
Epoch: 72, step: 1336, loss: 0.3309028446674347, mean loss: 0.3391046346892407
Epoch: 72, step: 1337, loss: 0.3727375864982605, mean loss: 0.33910495407229396
Epoch: 72, step: 1338, loss: 0.3123925030231476, mean loss: 0.3391047004096595
Epoch: 72, step: 1339, loss: 0.34413883090019226, mean loss: 0.3391047482135347
Epoch: 72, step: 1340, loss: 0.3579476773738861, mean loss: 0.33910492714343776
Epoch: 72, step: 1341, loss: 0.34623047709465027, mean loss: 0.33910499480605244
Epoch: 72, step: 1342, loss: 0.33800598978996277, mean loss: 0.3391049843702479
Epoch: 72, step: 1343, loss: 0.3150821924209595, mean loss: 0.3391047562595677
Epoch: 72, step: 1344, loss: 0.34704089164733887, mean loss: 0.3391048316171721
Epoch: 72, step: 1345, loss: 0.3255738317966461, mean loss: 0.3391047031347308
Epoch: 72, step: 1346, loss: 0.3467216193675995, mean loss: 0.3391047754598149
Epoch: 72, step: 1347, loss: 0.3511088788509369, mean loss: 0.33910488944157824
Epoch: 72, step: 1348, loss: 0.29926660656929016, mean loss: 0.33910451117137613
Epoch: 72, step: 1349, loss: 0.33371248841285706, mean loss: 0.33910445997383387
Epoch: 72, step: 1350, loss: 0.2974240481853485, mean loss: 0.3391040642198694
Epoch: 72, step: 1351, loss: 0.33325982093811035, mean loss: 0.339104008729523
Epoch: 72, step: 1352, loss: 0.31103840470314026, mean loss: 0.3391037422527138
Epoch: 72, step: 1353, loss: 0.3977782726287842, mean loss: 0.33910429934933534
Epoch: 72, step: 1354, loss: 0.34163686633110046, mean loss: 0.3391043233950517
Epoch: 72, step: 1355, loss: 0.3169788420200348, mean loss: 0.3391041133243995
Epoch: 72, step: 1356, loss: 0.3613283038139343, mean loss: 0.33910432433024323
Epoch: 72, step: 1357, loss: 0.3181856572628021, mean loss: 0.3391041257214755
Epoch: 72, step: 1358, loss: 0.3122918903827667, mean loss: 0.3391038711596316
Epoch: 72, step: 1359, loss: 0.3265605866909027, mean loss: 0.3391037520717872
Epoch: 72, step: 1360, loss: 0.34683871269226074, mean loss: 0.3391038255079788
Epoch: 72, step: 1361, loss: 0.34482380747795105, mean loss: 0.3391038798133236
Epoch: 72, step: 1362, loss: 0.2986179292201996, mean loss: 0.3391034954445187
Epoch: 72, step: 1363, loss: 0.34255191683769226, mean loss: 0.33910352818311085
Epoch: 72, step: 1364, loss: 0.3612901270389557, mean loss: 0.33910373881604505
Epoch: 72, step: 1365, loss: 0.31425514817237854, mean loss: 0.3391035029131966
Epoch: 72, step: 1366, loss: 0.31171536445617676, mean loss: 0.339103242903338
Epoch: 72, step: 1367, loss: 0.34834638237953186, mean loss: 0.33910333065244064
Epoch: 72, step: 1368, loss: 0.33953186869621277, mean loss: 0.33910333472069815
Epoch: 72, step: 1369, loss: 0.3062112033367157, mean loss: 0.33910302246746205
Epoch: 72, step: 1370, loss: 0.3386949598789215, mean loss: 0.33910301859365855
Epoch: 72, step: 1371, loss: 0.3317527770996094, mean loss: 0.3391029488173011
Epoch: 72, step: 1372, loss: 0.3276675343513489, mean loss: 0.3391028402611409
Epoch: 72, step: 1373, loss: 0.33116668462753296, mean loss: 0.33910276492408986
Epoch: 72, step: 1374, loss: 0.3276009261608124, mean loss: 0.33910265573943815
Epoch: 72, step: 1375, loss: 0.30450940132141113, mean loss: 0.3391023273557199
Epoch: 72, step: 1376, loss: 0.3642308712005615, mean loss: 0.3391025658914249
Epoch: 72, step: 1377, loss: 0.31131091713905334, mean loss: 0.3391023020783826
Epoch: 72, step: 1378, loss: 0.2814868986606598, mean loss: 0.3391017551676645
Epoch: 72, step: 1379, loss: 0.3101016879081726, mean loss: 0.3391014798889002
Epoch: 72, step: 1380, loss: 0.39568039774894714, mean loss: 0.339102016950646
Epoch: 72, step: 1381, loss: 0.3386014699935913, mean loss: 0.3391020121993697
Epoch: 72, step: 1382, loss: 0.3344992995262146, mean loss: 0.339101968510058
Epoch: 72, step: 1383, loss: 0.3536146283149719, mean loss: 0.3391021062640618
Epoch: 72, step: 1384, loss: 0.3151974081993103, mean loss: 0.33910187936309016
Epoch: 72, step: 1385, loss: 0.34032174944877625, mean loss: 0.3391018909418635
Epoch: 72, step: 1386, loss: 0.3439464569091797, mean loss: 0.3391019369251198
Epoch: 72, step: 1387, loss: 0.310170978307724, mean loss: 0.3391016623232118
Epoch: 72, step: 1388, loss: 0.3237944543361664, mean loss: 0.33910151703426106
Epoch: 72, step: 1389, loss: 0.28712671995162964, mean loss: 0.3391010237181666
Epoch: 72, step: 1390, loss: 0.3338099420070648, mean loss: 0.33910097349861523
Epoch: 72, step: 1391, loss: 0.3214159607887268, mean loss: 0.33910080564541945
Epoch: 72, step: 1392, loss: 0.380713552236557, mean loss: 0.33910120059940235
Epoch: 72, step: 1393, loss: 0.3060644567012787, mean loss: 0.3391008870447631
Epoch: 72, step: 1394, loss: 0.3085985779762268, mean loss: 0.3391005975474152
Epoch: 72, step: 1395, loss: 0.32498684525489807, mean loss: 0.3391004635950947
Epoch: 72, step: 1396, loss: 0.34705814719200134, mean loss: 0.33910053912001853
Epoch: 72, step: 1397, loss: 0.3084666132926941, mean loss: 0.33910024838177444
Epoch: 72, step: 1398, loss: 0.3425302803516388, mean loss: 0.3391002809349644
Epoch: 72, step: 1399, loss: 0.34846821427345276, mean loss: 0.33910036984177994
Epoch: 72, step: 1400, loss: 0.350668728351593, mean loss: 0.33910047963079293
Epoch: 72, step: 1401, loss: 0.34472575783729553, mean loss: 0.33910053301674914
Epoch: 72, step: 1402, loss: 0.3545706272125244, mean loss: 0.3391006798322315
Epoch: 72, step: 1403, loss: 0.37255561351776123, mean loss: 0.33910099732581317
Epoch: 72, step: 1404, loss: 0.294979989528656, mean loss: 0.3391005786131657
Epoch: 72, step: 1405, loss: 0.354214608669281, mean loss: 0.3391007220454171
Epoch: 72, step: 1406, loss: 0.3312062919139862, mean loss: 0.33910064712793064
Epoch: 72, step: 1407, loss: 0.31038129329681396, mean loss: 0.33910037458623393
Epoch: 72, step: 1408, loss: 0.31842878460884094, mean loss: 0.33910017841828477
Epoch: 72, step: 1409, loss: 0.36900395154953003, mean loss: 0.3391004621945296
Epoch: 72, step: 1410, loss: 0.3326832950115204, mean loss: 0.3391004012984575
Epoch: 72, step: 1411, loss: 0.35925716161727905, mean loss: 0.3391005925753631
Epoch: 72, step: 1412, loss: 0.28005450963974, mean loss: 0.33910003226484287
Epoch: 72, step: 1413, loss: 0.3477848470211029, mean loss: 0.3391001146775391
Epoch: 72, step: 1414, loss: 0.33339953422546387, mean loss: 0.33910006058361075
Epoch: 72, step: 1415, loss: 0.31817054748535156, mean loss: 0.3390998619812319
Epoch: 72, step: 1416, loss: 0.29802563786506653, mean loss: 0.339099472227243
Epoch: 72, step: 1417, loss: 0.31540849804878235, mean loss: 0.33909924742533215
Epoch: 72, step: 1418, loss: 0.33202847838401794, mean loss: 0.3390991803319616
Epoch: 72, step: 1419, loss: 0.3569226861000061, mean loss: 0.3390993494546869
Epoch: 72, step: 1420, loss: 0.3477913439273834, mean loss: 0.3390994319300351
Epoch: 72, step: 1421, loss: 0.32932668924331665, mean loss: 0.33909933920071844
Epoch: 72, step: 1422, loss: 0.3144081234931946, mean loss: 0.3390991049187047
Epoch: 72, step: 1423, loss: 0.34181323647499084, mean loss: 0.33909913067143316
Epoch: 72, step: 1424, loss: 0.30598872900009155, mean loss: 0.33909881651013524
Epoch: 72, step: 1425, loss: 0.29238903522491455, mean loss: 0.3390983733181007
Epoch: 72, step: 1426, loss: 0.29020625352859497, mean loss: 0.3390979094239901
Epoch: 72, step: 1427, loss: 0.3449726998806, mean loss: 0.33909796516415536
Epoch: 72, step: 1428, loss: 0.33425936102867126, mean loss: 0.3390979192557886
Epoch: 72, step: 1429, loss: 0.3337286412715912, mean loss: 0.33909786831290556
Epoch: 72, step: 1430, loss: 0.3174727261066437, mean loss: 0.3390976631388317
Epoch: 72, step: 1431, loss: 0.32896921038627625, mean loss: 0.33909756704345456
Epoch: 72, step: 1432, loss: 0.4108557105064392, mean loss: 0.33909824785429565
Epoch: 72, step: 1433, loss: 0.35864099860191345, mean loss: 0.3390984332658699
Epoch: 72, step: 1434, loss: 0.3311275541782379, mean loss: 0.33909835764298357
Epoch: 72, step: 1435, loss: 0.30943208932876587, mean loss: 0.33909807619001864
Epoch: 72, step: 1436, loss: 0.3309420943260193, mean loss: 0.33909799881245717
Epoch: 72, step: 1437, loss: 0.33076900243759155, mean loss: 0.3390979197942194
Epoch: 72, step: 1438, loss: 0.28698471188545227, mean loss: 0.3390974253943417
Epoch: 72, step: 1439, loss: 0.31790807843208313, mean loss: 0.33909722437215206
Epoch: 72, step: 1440, loss: 0.3142886459827423, mean loss: 0.3390969890167423
Epoch: 72, step: 1441, loss: 0.3052820861339569, mean loss: 0.33909666822267265
Epoch: 72, step: 1442, loss: 0.38202548027038574, mean loss: 0.33909707547440204
Epoch: 72, step: 1443, loss: 0.4078257977962494, mean loss: 0.3390977274753348
Valid: 72, mean loss: 0.18588196982940036
Epoch: 73, step: 0, loss: 0.34709155559539795, mean loss: 0.33909780330875305
Epoch: 73, step: 1, loss: 0.3078305125236511, mean loss: 0.33909750669453875
Epoch: 73, step: 2, loss: 0.30802860856056213, mean loss: 0.33909721196515363
Epoch: 73, step: 3, loss: 0.3247494101524353, mean loss: 0.33909707585866306
Epoch: 73, step: 4, loss: 0.321527361869812, mean loss: 0.33909690918996643
Epoch: 73, step: 5, loss: 0.3214471936225891, mean loss: 0.3390967417639522
Epoch: 73, step: 6, loss: 0.4051150977611542, mean loss: 0.3390973680111752
Epoch: 73, step: 7, loss: 0.30599987506866455, mean loss: 0.3390970540527902
Epoch: 73, step: 8, loss: 0.3226560056209564, mean loss: 0.3390968980966863
Epoch: 73, step: 9, loss: 0.3830241560935974, mean loss: 0.3390973147768669
Epoch: 73, step: 10, loss: 0.32856643199920654, mean loss: 0.33909721488516603
Epoch: 73, step: 11, loss: 0.35736775398254395, mean loss: 0.33909738819047697
Epoch: 73, step: 12, loss: 0.3225199580192566, mean loss: 0.33909723094665273
Epoch: 73, step: 13, loss: 0.3785736560821533, mean loss: 0.3390976053934224
Epoch: 73, step: 14, loss: 0.32738208770751953, mean loss: 0.33909749426896957
Epoch: 73, step: 15, loss: 0.33012324571609497, mean loss: 0.33909740914690945
Epoch: 73, step: 16, loss: 0.3081188499927521, mean loss: 0.339097115313532
Epoch: 73, step: 17, loss: 0.32850000262260437, mean loss: 0.33909701480027493
Epoch: 73, step: 18, loss: 0.32487425208091736, mean loss: 0.33909687989912896
Epoch: 73, step: 19, loss: 0.3392108976840973, mean loss: 0.3390968809805633
Epoch: 73, step: 20, loss: 0.3045543432235718, mean loss: 0.3390965533550783
Epoch: 73, step: 21, loss: 0.31997549533843994, mean loss: 0.3390963719993675
Epoch: 73, step: 22, loss: 0.3209092915058136, mean loss: 0.33909619950370196
Epoch: 73, step: 23, loss: 0.3006746768951416, mean loss: 0.339095835097592
Epoch: 73, step: 24, loss: 0.3397255837917328, mean loss: 0.3390958410703406
Epoch: 73, step: 25, loss: 0.34403514862060547, mean loss: 0.33909588791595174
Epoch: 73, step: 26, loss: 0.2980841398239136, mean loss: 0.3390954989541056
Epoch: 73, step: 27, loss: 0.33793237805366516, mean loss: 0.3390954879229893
Epoch: 73, step: 28, loss: 0.32458850741386414, mean loss: 0.3390953503391224
Epoch: 73, step: 29, loss: 0.30153825879096985, mean loss: 0.3390949941519148
Epoch: 73, step: 30, loss: 0.3014911711215973, mean loss: 0.33909463752489327
Epoch: 73, step: 31, loss: 0.3226434886455536, mean loss: 0.33909448150701765
Epoch: 73, step: 32, loss: 0.36403942108154297, mean loss: 0.339094718075272
Epoch: 73, step: 33, loss: 0.3519171178340912, mean loss: 0.3390948396768477
Epoch: 73, step: 34, loss: 0.3398611545562744, mean loss: 0.33909484694414677
Epoch: 73, step: 35, loss: 0.33160844445228577, mean loss: 0.33909477594799237
Epoch: 73, step: 36, loss: 0.31820541620254517, mean loss: 0.33909457784881886
Epoch: 73, step: 37, loss: 0.3576597273349762, mean loss: 0.33909475390523885
Epoch: 73, step: 38, loss: 0.30919599533081055, mean loss: 0.33909447037299567
Epoch: 73, step: 39, loss: 0.3646239638328552, mean loss: 0.3390947124688636
Epoch: 73, step: 40, loss: 0.31837624311447144, mean loss: 0.3390945159977404
Epoch: 73, step: 41, loss: 0.32514840364456177, mean loss: 0.3390943837494392
Epoch: 73, step: 42, loss: 0.3161776661872864, mean loss: 0.33909416643667484
Epoch: 73, step: 43, loss: 0.33051320910453796, mean loss: 0.33909408506665006
Epoch: 73, step: 44, loss: 0.33286455273628235, mean loss: 0.3390940259948736
Epoch: 73, step: 45, loss: 0.340314656496048, mean loss: 0.33909403756943884
Epoch: 73, step: 46, loss: 0.30830565094947815, mean loss: 0.33909374562293243
Epoch: 73, step: 47, loss: 0.3286387622356415, mean loss: 0.33909364648597634
Epoch: 73, step: 48, loss: 0.29618096351623535, mean loss: 0.33909323958026744
Epoch: 73, step: 49, loss: 0.31309160590171814, mean loss: 0.33909299303048
Epoch: 73, step: 50, loss: 0.3653141260147095, mean loss: 0.3390932416592217
Epoch: 73, step: 51, loss: 0.40222394466400146, mean loss: 0.3390938402587723
Epoch: 73, step: 52, loss: 0.37934941053390503, mean loss: 0.33909422195478783
Epoch: 73, step: 53, loss: 0.33886364102363586, mean loss: 0.339094219768482
Epoch: 73, step: 54, loss: 0.37739884853363037, mean loss: 0.3390945829591365
Epoch: 73, step: 55, loss: 0.30342385172843933, mean loss: 0.3390942447453539
Epoch: 73, step: 56, loss: 0.3303171992301941, mean loss: 0.3390941615261566
Epoch: 73, step: 57, loss: 0.3396289646625519, mean loss: 0.33909416659682257
Epoch: 73, step: 58, loss: 0.34365200996398926, mean loss: 0.33909420981100813
Epoch: 73, step: 59, loss: 0.305548757314682, mean loss: 0.3390938917602222
Epoch: 73, step: 60, loss: 0.32968756556510925, mean loss: 0.3390938025779083
Epoch: 73, step: 61, loss: 0.34788697957992554, mean loss: 0.3390938859461033
Epoch: 73, step: 62, loss: 0.306225061416626, mean loss: 0.33909357431941894
Epoch: 73, step: 63, loss: 0.3019656836986542, mean loss: 0.33909322231620853
Epoch: 73, step: 64, loss: 0.3130851089954376, mean loss: 0.3390929757400514
Epoch: 73, step: 65, loss: 0.32094240188598633, mean loss: 0.3390928036608135
Epoch: 73, step: 66, loss: 0.35454103350639343, mean loss: 0.3390929501186852
Epoch: 73, step: 67, loss: 0.32920876145362854, mean loss: 0.33909285641192877
Epoch: 73, step: 68, loss: 0.35003721714019775, mean loss: 0.33909296016863116
Epoch: 73, step: 69, loss: 0.33455702662467957, mean loss: 0.33909291716666357
Epoch: 73, step: 70, loss: 0.3551098704338074, mean loss: 0.33909306901059355
Epoch: 73, step: 71, loss: 0.3283827602863312, mean loss: 0.3390929674756809
Epoch: 73, step: 72, loss: 0.3212909996509552, mean loss: 0.33909279871265463
Epoch: 73, step: 73, loss: 0.3007911741733551, mean loss: 0.33909243561589736
Epoch: 73, step: 74, loss: 0.33088424801826477, mean loss: 0.33909235780358304
Epoch: 73, step: 75, loss: 0.35785770416259766, mean loss: 0.3390925356943987
Epoch: 73, step: 76, loss: 0.3170325756072998, mean loss: 0.33909232657344685
Epoch: 73, step: 77, loss: 0.3519952893257141, mean loss: 0.3390924488880051
Epoch: 73, step: 78, loss: 0.3623291850090027, mean loss: 0.3390926691602191
Epoch: 73, step: 79, loss: 0.36529719829559326, mean loss: 0.33909291756321774
Epoch: 73, step: 80, loss: 0.29891905188560486, mean loss: 0.3390925367430147
Epoch: 73, step: 81, loss: 0.33879464864730835, mean loss: 0.33909253391927024
Epoch: 73, step: 82, loss: 0.3553776443004608, mean loss: 0.33909268828782213
Epoch: 73, step: 83, loss: 0.3278529644012451, mean loss: 0.33909258174611545
Epoch: 73, step: 84, loss: 0.3123810589313507, mean loss: 0.3390923285491258
Epoch: 73, step: 85, loss: 0.34887224435806274, mean loss: 0.33909242125150696
Epoch: 73, step: 86, loss: 0.3018245995044708, mean loss: 0.33909206799866337
Epoch: 73, step: 87, loss: 0.3486711084842682, mean loss: 0.33909215879525567
Epoch: 73, step: 88, loss: 0.33428627252578735, mean loss: 0.33909211324226307
Epoch: 73, step: 89, loss: 0.3819916546344757, mean loss: 0.33909251986527866
Epoch: 73, step: 90, loss: 0.30087801814079285, mean loss: 0.33909215765281336
Epoch: 73, step: 91, loss: 0.3238586187362671, mean loss: 0.339092013264554
Epoch: 73, step: 92, loss: 0.30969417095184326, mean loss: 0.3390917346252259
Epoch: 73, step: 93, loss: 0.300662636756897, mean loss: 0.33909137038908893
Epoch: 73, step: 94, loss: 0.3332502841949463, mean loss: 0.33909131502701634
Epoch: 73, step: 95, loss: 0.3289700150489807, mean loss: 0.33909121909779794
Epoch: 73, step: 96, loss: 0.3600008487701416, mean loss: 0.3390914172764336
Epoch: 73, step: 97, loss: 0.3322983980178833, mean loss: 0.3390913528937281
Epoch: 73, step: 98, loss: 0.36456695199012756, mean loss: 0.33909159434342623
Epoch: 73, step: 99, loss: 0.2859684228897095, mean loss: 0.3390910908635239
Epoch: 73, step: 100, loss: 0.3374721109867096, mean loss: 0.3390910755196338
Epoch: 73, step: 101, loss: 0.3389291763305664, mean loss: 0.33909107398524796
Epoch: 73, step: 102, loss: 0.318636417388916, mean loss: 0.3390908801298094
Epoch: 73, step: 103, loss: 0.342625230550766, mean loss: 0.33909091362568133
Epoch: 73, step: 104, loss: 0.3297663629055023, mean loss: 0.33909082525555406
Epoch: 73, step: 105, loss: 0.3344959318637848, mean loss: 0.33909078170949186
Epoch: 73, step: 106, loss: 0.3386651277542114, mean loss: 0.3390907776755837
Epoch: 73, step: 107, loss: 0.34883010387420654, mean loss: 0.33909086997397453
Epoch: 73, step: 108, loss: 0.37781643867492676, mean loss: 0.3390912369679255
Epoch: 73, step: 109, loss: 0.3223457336425781, mean loss: 0.33909107827586765
Epoch: 73, step: 110, loss: 0.3670429587364197, mean loss: 0.33909134316485356
Epoch: 73, step: 111, loss: 0.34313690662384033, mean loss: 0.33909138150270524
Epoch: 73, step: 112, loss: 0.3484090268611908, mean loss: 0.3390914698006949
Epoch: 73, step: 113, loss: 0.3271960914134979, mean loss: 0.3390913570760736
Epoch: 73, step: 114, loss: 0.3133682310581207, mean loss: 0.33909111331735764
Epoch: 73, step: 115, loss: 0.32244324684143066, mean loss: 0.33909095555954477
Epoch: 73, step: 116, loss: 0.33680909872055054, mean loss: 0.33909093393651374
Epoch: 73, step: 117, loss: 0.35954928398132324, mean loss: 0.33909112779939676
Epoch: 73, step: 118, loss: 0.33009615540504456, mean loss: 0.3390910425640404
Epoch: 73, step: 119, loss: 0.325837641954422, mean loss: 0.33909091697748267
Epoch: 73, step: 120, loss: 0.2988857626914978, mean loss: 0.33909053600513955
Epoch: 73, step: 121, loss: 0.3201935291290283, mean loss: 0.3390903569442978
Epoch: 73, step: 122, loss: 0.296562522649765, mean loss: 0.3390899539705517
Epoch: 73, step: 123, loss: 0.37959766387939453, mean loss: 0.33909033779891273
Epoch: 73, step: 124, loss: 0.3234959542751312, mean loss: 0.33909019003667273
Epoch: 73, step: 125, loss: 0.32835620641708374, mean loss: 0.3390900883293861
Epoch: 73, step: 126, loss: 0.3767987787723541, mean loss: 0.33909044562565044
Epoch: 73, step: 127, loss: 0.30933481454849243, mean loss: 0.3390901636886495
Epoch: 73, step: 128, loss: 0.3182185888290405, mean loss: 0.33908996593067053
Epoch: 73, step: 129, loss: 0.32286086678504944, mean loss: 0.33908981216156303
Epoch: 73, step: 130, loss: 0.35675033926963806, mean loss: 0.3390899794917233
Epoch: 73, step: 131, loss: 0.3038652241230011, mean loss: 0.3390896457469783
Epoch: 73, step: 132, loss: 0.3115854859352112, mean loss: 0.3390893851551946
Epoch: 73, step: 133, loss: 0.3247447907924652, mean loss: 0.33908924924673417
Epoch: 73, step: 134, loss: 0.3316253125667572, mean loss: 0.3390891785300233
Epoch: 73, step: 135, loss: 0.3208577632904053, mean loss: 0.3390890057989887
Epoch: 73, step: 136, loss: 0.33752694725990295, mean loss: 0.33908899099962025
Epoch: 73, step: 137, loss: 0.33737751841545105, mean loss: 0.33908897478481603
Epoch: 73, step: 138, loss: 0.34600111842155457, mean loss: 0.3390890402711083
Epoch: 73, step: 139, loss: 0.3627558946609497, mean loss: 0.3390892644909657
Epoch: 73, step: 140, loss: 0.396658331155777, mean loss: 0.3390898098953281
Epoch: 73, step: 141, loss: 0.33567923307418823, mean loss: 0.3390897775841242
Epoch: 73, step: 142, loss: 0.33922824263572693, mean loss: 0.33908977889590525
Epoch: 73, step: 143, loss: 0.3361179828643799, mean loss: 0.33908975074216663
Epoch: 73, step: 144, loss: 0.3880957067012787, mean loss: 0.33909021500276476
Epoch: 73, step: 145, loss: 0.3363448679447174, mean loss: 0.33909018899481597
Epoch: 73, step: 146, loss: 0.3307632505893707, mean loss: 0.3390901101106052
Epoch: 73, step: 147, loss: 0.32701364159584045, mean loss: 0.3390899957067731
Epoch: 73, step: 148, loss: 0.3403189480304718, mean loss: 0.33909000734887884
Epoch: 73, step: 149, loss: 0.32242700457572937, mean loss: 0.33908984949848975
Epoch: 73, step: 150, loss: 0.36244478821754456, mean loss: 0.3390900707402006
Epoch: 73, step: 151, loss: 0.32705095410346985, mean loss: 0.33908995669453507
Epoch: 73, step: 152, loss: 0.3054085075855255, mean loss: 0.33908963763566985
Epoch: 73, step: 153, loss: 0.349970281124115, mean loss: 0.33908974070525183
Epoch: 73, step: 154, loss: 0.3385718762874603, mean loss: 0.33908973579969975
Epoch: 73, step: 155, loss: 0.35351017117500305, mean loss: 0.33908987239824645
Epoch: 73, step: 156, loss: 0.3406355381011963, mean loss: 0.33908988703953036
Epoch: 73, step: 157, loss: 0.3342606723308563, mean loss: 0.339089841295335
Epoch: 73, step: 158, loss: 0.36447077989578247, mean loss: 0.3390900817111556
Epoch: 73, step: 159, loss: 0.2939987778663635, mean loss: 0.33908965459692225
Epoch: 73, step: 160, loss: 0.34639132022857666, mean loss: 0.3390897237591667
Epoch: 73, step: 161, loss: 0.3271200656890869, mean loss: 0.33908961038221713
Epoch: 73, step: 162, loss: 0.29717496037483215, mean loss: 0.3390892133691931
Epoch: 73, step: 163, loss: 0.29912716150283813, mean loss: 0.33908883485464564
Epoch: 73, step: 164, loss: 0.32323023676872253, mean loss: 0.33908868464581143
Epoch: 73, step: 165, loss: 0.31574931740760803, mean loss: 0.33908846358302147
Epoch: 73, step: 166, loss: 0.314546138048172, mean loss: 0.33908823112840897
Epoch: 73, step: 167, loss: 0.2894584834575653, mean loss: 0.33908776106070987
Epoch: 73, step: 168, loss: 0.34962907433509827, mean loss: 0.33908786090171605
Epoch: 73, step: 169, loss: 0.33083590865135193, mean loss: 0.33908778274490664
Epoch: 73, step: 170, loss: 0.32982248067855835, mean loss: 0.3390876949911767
Epoch: 73, step: 171, loss: 0.3204425871372223, mean loss: 0.33908751840089923
Epoch: 73, step: 172, loss: 0.3201521933078766, mean loss: 0.33908733906363453
Epoch: 73, step: 173, loss: 0.3238523304462433, mean loss: 0.33908719477359023
Epoch: 73, step: 174, loss: 0.32549527287483215, mean loss: 0.3390870660463615
Epoch: 73, step: 175, loss: 0.32390475273132324, mean loss: 0.33908692225811554
Epoch: 73, step: 176, loss: 0.30977216362953186, mean loss: 0.3390866446273147
Epoch: 73, step: 177, loss: 0.2735641300678253, mean loss: 0.3390860240901941
Epoch: 73, step: 178, loss: 0.3864840567111969, mean loss: 0.3390864729734571
Epoch: 73, step: 179, loss: 0.2977624535560608, mean loss: 0.3390860816178675
Epoch: 73, step: 180, loss: 0.3624436557292938, mean loss: 0.33908630282167945
Epoch: 73, step: 181, loss: 0.30039021372795105, mean loss: 0.3390859363606202
Epoch: 73, step: 182, loss: 0.31432217359542847, mean loss: 0.33908570184418696
Epoch: 73, step: 183, loss: 0.3812582790851593, mean loss: 0.33908610122084176
Epoch: 73, step: 184, loss: 0.3431999683380127, mean loss: 0.3390861401790235
Epoch: 73, step: 185, loss: 0.32039326429367065, mean loss: 0.3390859631598007
Epoch: 73, step: 186, loss: 0.29269981384277344, mean loss: 0.3390855238928634
Epoch: 73, step: 187, loss: 0.33997347950935364, mean loss: 0.339085532301534
Epoch: 73, step: 188, loss: 0.35027164220809937, mean loss: 0.33908563822960197
Epoch: 73, step: 189, loss: 0.3710620105266571, mean loss: 0.33908594103042294
Epoch: 73, step: 190, loss: 0.3094295859336853, mean loss: 0.33908566020170505
Epoch: 73, step: 191, loss: 0.3336559534072876, mean loss: 0.33908560878597466
Epoch: 73, step: 192, loss: 0.3373023569583893, mean loss: 0.33908559189991977
Epoch: 73, step: 193, loss: 0.3493470251560211, mean loss: 0.3390856890670623
Epoch: 73, step: 194, loss: 0.3159762918949127, mean loss: 0.33908547024257935
Epoch: 73, step: 195, loss: 0.302203893661499, mean loss: 0.33908512101168226
Epoch: 73, step: 196, loss: 0.29348304867744446, mean loss: 0.3390846892106773
Epoch: 73, step: 197, loss: 0.30267688632011414, mean loss: 0.3390843444724623
Epoch: 73, step: 198, loss: 0.3184053301811218, mean loss: 0.3390841486688595
Epoch: 73, step: 199, loss: 0.34162938594818115, mean loss: 0.33908417276874664
Epoch: 73, step: 200, loss: 0.30707818269729614, mean loss: 0.3390838697190267
Epoch: 73, step: 201, loss: 0.3034740090370178, mean loss: 0.3390835325491375
Epoch: 73, step: 202, loss: 0.3164978623390198, mean loss: 0.33908331870006103
Epoch: 73, step: 203, loss: 0.3297867476940155, mean loss: 0.3390832306776875
Epoch: 73, step: 204, loss: 0.31940367817878723, mean loss: 0.339083044348285
Epoch: 73, step: 205, loss: 0.35364124178886414, mean loss: 0.33908318218650807
Epoch: 73, step: 206, loss: 0.3218379020690918, mean loss: 0.3390830189083089
Epoch: 73, step: 207, loss: 0.32875126600265503, mean loss: 0.3390829210882662
Epoch: 73, step: 208, loss: 0.3016795217990875, mean loss: 0.3390825669598326
Epoch: 73, step: 209, loss: 0.32766789197921753, mean loss: 0.3390824588888343
Epoch: 73, step: 210, loss: 0.3238579332828522, mean loss: 0.3390823147485845
Epoch: 73, step: 211, loss: 0.30291715264320374, mean loss: 0.33908197235327564
Epoch: 73, step: 212, loss: 0.3331962525844574, mean loss: 0.3390819166304849
Epoch: 73, step: 213, loss: 0.33891454339027405, mean loss: 0.3390819150459012
Epoch: 73, step: 214, loss: 0.3575621247291565, mean loss: 0.3390820900031534
Epoch: 73, step: 215, loss: 0.3097856342792511, mean loss: 0.3390818126481365
Epoch: 73, step: 216, loss: 0.37802761793136597, mean loss: 0.3390821813518569
Epoch: 73, step: 217, loss: 0.305025190114975, mean loss: 0.33908185893406617
Epoch: 73, step: 218, loss: 0.35637199878692627, mean loss: 0.33908202261839987
Epoch: 73, step: 219, loss: 0.3855438232421875, mean loss: 0.3390824624642858
Epoch: 73, step: 220, loss: 0.3466302156448364, mean loss: 0.3390825339168923
Epoch: 73, step: 221, loss: 0.32104602456092834, mean loss: 0.33908236317158913
Epoch: 73, step: 222, loss: 0.35185328125953674, mean loss: 0.33908248406824354
Epoch: 73, step: 223, loss: 0.31853142380714417, mean loss: 0.33908228952225294
Epoch: 73, step: 224, loss: 0.322539746761322, mean loss: 0.3390821329242545
Epoch: 73, step: 225, loss: 0.32716408371925354, mean loss: 0.33908202010453803
Epoch: 73, step: 226, loss: 0.31381386518478394, mean loss: 0.3390817809111064
Epoch: 73, step: 227, loss: 0.3146660327911377, mean loss: 0.3390815497889167
Epoch: 73, step: 228, loss: 0.31323808431625366, mean loss: 0.33908130515411133
Epoch: 73, step: 229, loss: 0.3065268099308014, mean loss: 0.3390809969954697
Epoch: 73, step: 230, loss: 0.3702625036239624, mean loss: 0.33908129215470056
Epoch: 73, step: 231, loss: 0.3264981210231781, mean loss: 0.3390811730455119
Epoch: 73, step: 232, loss: 0.3277839720249176, mean loss: 0.3390810661100107
Epoch: 73, step: 233, loss: 0.27664849162101746, mean loss: 0.3390804751498751
Epoch: 73, step: 234, loss: 0.31789809465408325, mean loss: 0.3390802746483891
Epoch: 73, step: 235, loss: 0.32887497544288635, mean loss: 0.33908017805120594
Epoch: 73, step: 236, loss: 0.3095850646495819, mean loss: 0.3390798988709638
Epoch: 73, step: 237, loss: 0.3219391405582428, mean loss: 0.33907973662999535
Epoch: 73, step: 238, loss: 0.35023707151412964, mean loss: 0.339079842235573
Epoch: 73, step: 239, loss: 0.3280890882015228, mean loss: 0.3390797382076887
Epoch: 73, step: 240, loss: 0.3437385857105255, mean loss: 0.3390797823034314
Epoch: 73, step: 241, loss: 0.2930185794830322, mean loss: 0.3390793463407341
Epoch: 73, step: 242, loss: 0.35964861512184143, mean loss: 0.3390795410240788
Epoch: 73, step: 243, loss: 0.33689650893211365, mean loss: 0.33907952036238337
Epoch: 73, step: 244, loss: 0.4025166928768158, mean loss: 0.33908012076910055
Epoch: 73, step: 245, loss: 0.32848647236824036, mean loss: 0.3390800205055294
Epoch: 73, step: 246, loss: 0.3428654670715332, mean loss: 0.3390800563325443
Epoch: 73, step: 247, loss: 0.3491196036338806, mean loss: 0.3390801513500277
Epoch: 73, step: 248, loss: 0.3181508481502533, mean loss: 0.3390799532702897
Epoch: 73, step: 249, loss: 0.3230884373188019, mean loss: 0.339079801924338
Epoch: 73, step: 250, loss: 0.33984890580177307, mean loss: 0.33907980920317615
Epoch: 73, step: 251, loss: 0.3483400344848633, mean loss: 0.33907989684158923
Epoch: 73, step: 252, loss: 0.3450568914413452, mean loss: 0.3390799534070991
Epoch: 73, step: 253, loss: 0.3438933789730072, mean loss: 0.3390799989603099
Epoch: 73, step: 254, loss: 0.3154218792915344, mean loss: 0.33907977506713916
Epoch: 73, step: 255, loss: 0.2883036136627197, mean loss: 0.3390792945417066
Epoch: 73, step: 256, loss: 0.3273102045059204, mean loss: 0.33907918316476504
Epoch: 73, step: 257, loss: 0.32873332500457764, mean loss: 0.339079085257524
Epoch: 73, step: 258, loss: 0.3414105474948883, mean loss: 0.3390791073209306
Epoch: 73, step: 259, loss: 0.31275108456611633, mean loss: 0.3390788581724073
Epoch: 73, step: 260, loss: 0.3080593943595886, mean loss: 0.33907856463040686
Epoch: 73, step: 261, loss: 0.3101734519004822, mean loss: 0.33907829109942733
Epoch: 73, step: 262, loss: 0.3511508107185364, mean loss: 0.33907840534139205
Epoch: 73, step: 263, loss: 0.2966308891773224, mean loss: 0.3390780036653619
Epoch: 73, step: 264, loss: 0.3503136932849884, mean loss: 0.3390781099864121
Epoch: 73, step: 265, loss: 0.3446967601776123, mean loss: 0.3390781631540552
Epoch: 73, step: 266, loss: 0.2929894030094147, mean loss: 0.3390777270337272
Epoch: 73, step: 267, loss: 0.32156792283058167, mean loss: 0.33907756134670786
Epoch: 73, step: 268, loss: 0.29098978638648987, mean loss: 0.3390771063190779
Epoch: 73, step: 269, loss: 0.3319951593875885, mean loss: 0.3390770393072222
Epoch: 73, step: 270, loss: 0.32685530185699463, mean loss: 0.3390769236619675
Epoch: 73, step: 271, loss: 0.33107489347457886, mean loss: 0.3390768479453956
Epoch: 73, step: 272, loss: 0.34824901819229126, mean loss: 0.33907693473321077
Epoch: 73, step: 273, loss: 0.3328617811203003, mean loss: 0.3390768759254821
Epoch: 73, step: 274, loss: 0.35036367177963257, mean loss: 0.33907698272003445
Epoch: 73, step: 275, loss: 0.3235865831375122, mean loss: 0.33907683615278383
Epoch: 73, step: 276, loss: 0.3295189142227173, mean loss: 0.33907674571837787
Epoch: 73, step: 277, loss: 0.337994247674942, mean loss: 0.33907673547617856
Epoch: 73, step: 278, loss: 0.3272683620452881, mean loss: 0.339076623750739
Epoch: 73, step: 279, loss: 0.31740501523017883, mean loss: 0.33907641870581107
Epoch: 73, step: 280, loss: 0.31046393513679504, mean loss: 0.33907614799267427
Epoch: 73, step: 281, loss: 0.31181129813194275, mean loss: 0.3390758900324319
Epoch: 73, step: 282, loss: 0.3732563257217407, mean loss: 0.33907621341987393
Epoch: 73, step: 283, loss: 0.30601662397384644, mean loss: 0.3390759006399253
Epoch: 73, step: 284, loss: 0.3082481622695923, mean loss: 0.33907560897849337
Epoch: 73, step: 285, loss: 0.33688265085220337, mean loss: 0.3390755882310987
Epoch: 73, step: 286, loss: 0.3302180767059326, mean loss: 0.3390755044317106
Epoch: 73, step: 287, loss: 0.35092487931251526, mean loss: 0.3390756165355411
Epoch: 73, step: 288, loss: 0.30079859495162964, mean loss: 0.33907525441009684
Epoch: 73, step: 289, loss: 0.32467180490493774, mean loss: 0.339075118145414
Epoch: 73, step: 290, loss: 0.34185492992401123, mean loss: 0.3390751444437384
Epoch: 73, step: 291, loss: 0.3211154639720917, mean loss: 0.33907497453833774
Epoch: 73, step: 292, loss: 0.321139395236969, mean loss: 0.3390748048625485
Epoch: 73, step: 293, loss: 0.29908329248428345, mean loss: 0.3390744265348057
Epoch: 73, step: 294, loss: 0.3396187126636505, mean loss: 0.3390744316838131
Epoch: 73, step: 295, loss: 0.314980685710907, mean loss: 0.3390742037564474
Epoch: 73, step: 296, loss: 0.3178066909313202, mean loss: 0.3390740025672126
Epoch: 73, step: 297, loss: 0.32811835408210754, mean loss: 0.3390738989284983
Epoch: 73, step: 298, loss: 0.29976367950439453, mean loss: 0.33907352706351335
Epoch: 73, step: 299, loss: 0.2963666021823883, mean loss: 0.3390731230703538
Epoch: 73, step: 300, loss: 0.315231055021286, mean loss: 0.3390728975345347
Epoch: 73, step: 301, loss: 0.3642274737358093, mean loss: 0.3390731354838716
Epoch: 73, step: 302, loss: 0.3441132605075836, mean loss: 0.3390731831604078
Epoch: 73, step: 303, loss: 0.3543629050254822, mean loss: 0.3390733277905666
Epoch: 73, step: 304, loss: 0.332553505897522, mean loss: 0.3390732661181592
Epoch: 73, step: 305, loss: 0.31258514523506165, mean loss: 0.3390730155636568
Epoch: 73, step: 306, loss: 0.2992522716522217, mean loss: 0.3390726388977414
Epoch: 73, step: 307, loss: 0.3248363733291626, mean loss: 0.33907250423764335
Epoch: 73, step: 308, loss: 0.3697648346424103, mean loss: 0.33907279455205963
Epoch: 73, step: 309, loss: 0.3097711205482483, mean loss: 0.33907251739428734
Epoch: 73, step: 310, loss: 0.35858187079429626, mean loss: 0.33907270192701344
Epoch: 73, step: 311, loss: 0.2981395721435547, mean loss: 0.3390723147573095
Epoch: 73, step: 312, loss: 0.3103382885456085, mean loss: 0.3390720429764988
Epoch: 73, step: 313, loss: 0.2944496273994446, mean loss: 0.3390716209193361
Epoch: 73, step: 314, loss: 0.3376169204711914, mean loss: 0.33907160716031104
Epoch: 73, step: 315, loss: 0.3510165512561798, mean loss: 0.33907172013836884
Epoch: 73, step: 316, loss: 0.337375670671463, mean loss: 0.33907170409689047
Epoch: 73, step: 317, loss: 0.33116415143013, mean loss: 0.33907162930683404
Epoch: 73, step: 318, loss: 0.3475041091442108, mean loss: 0.33907170906092543
Epoch: 73, step: 319, loss: 0.3398960828781128, mean loss: 0.3390717168577496
Epoch: 73, step: 320, loss: 0.3471129834651947, mean loss: 0.33907179291032175
Epoch: 73, step: 321, loss: 0.3497104346752167, mean loss: 0.3390718935273585
Epoch: 73, step: 322, loss: 0.29307547211647034, mean loss: 0.33907145851131454
Epoch: 73, step: 323, loss: 0.3170127272605896, mean loss: 0.33907124989049237
Epoch: 73, step: 324, loss: 0.33485084772109985, mean loss: 0.33907120997634527
Epoch: 73, step: 325, loss: 0.30448776483535767, mean loss: 0.33907088290901716
Epoch: 73, step: 326, loss: 0.34997037053108215, mean loss: 0.3390709859881802
Epoch: 73, step: 327, loss: 0.3072887361049652, mean loss: 0.3390706854183875
Epoch: 73, step: 328, loss: 0.3611448109149933, mean loss: 0.33907089417492936
Epoch: 73, step: 329, loss: 0.3207594156265259, mean loss: 0.33907072100363933
Epoch: 73, step: 330, loss: 0.29941684007644653, mean loss: 0.33907034600121905
Epoch: 73, step: 331, loss: 0.3281659781932831, mean loss: 0.339070242880779
Epoch: 73, step: 332, loss: 0.3185073137283325, mean loss: 0.3390700484230822
Epoch: 73, step: 333, loss: 0.32345351576805115, mean loss: 0.3390699007434285
Epoch: 73, step: 334, loss: 0.31986865401268005, mean loss: 0.33906971916620426
Epoch: 73, step: 335, loss: 0.3068639636039734, mean loss: 0.3390694146142925
Epoch: 73, step: 336, loss: 0.34928128123283386, mean loss: 0.3390695111813203
Epoch: 73, step: 337, loss: 0.3260338604450226, mean loss: 0.3390693879127554
Epoch: 73, step: 338, loss: 0.30998435616493225, mean loss: 0.339069112879595
Epoch: 73, step: 339, loss: 0.3007929027080536, mean loss: 0.33906875093646227
Epoch: 73, step: 340, loss: 0.3199552893638611, mean loss: 0.33906857019963615
Epoch: 73, step: 341, loss: 0.331866055727005, mean loss: 0.3390685020933284
Epoch: 73, step: 342, loss: 0.2985493242740631, mean loss: 0.3390681189513699
Epoch: 73, step: 343, loss: 0.3040027320384979, mean loss: 0.33906778738259924
Epoch: 73, step: 344, loss: 0.28903892636299133, mean loss: 0.33906731432775633
Epoch: 73, step: 345, loss: 0.32455703616142273, mean loss: 0.3390671771251034
Epoch: 73, step: 346, loss: 0.3100910186767578, mean loss: 0.3390669031421947
Epoch: 73, step: 347, loss: 0.31187736988067627, mean loss: 0.33906664605507986
Epoch: 73, step: 348, loss: 0.352939635515213, mean loss: 0.3390667772280969
Epoch: 73, step: 349, loss: 0.29664361476898193, mean loss: 0.3390663761089572
Epoch: 73, step: 350, loss: 0.3460964262485504, mean loss: 0.3390664425788015
Epoch: 73, step: 351, loss: 0.3516584038734436, mean loss: 0.33906656163595983
Epoch: 73, step: 352, loss: 0.337446004152298, mean loss: 0.3390665463137125
Epoch: 73, step: 353, loss: 0.31386950612068176, mean loss: 0.33906630807987376
Epoch: 73, step: 354, loss: 0.3207300305366516, mean loss: 0.3390661347150478
Epoch: 73, step: 355, loss: 0.3779744505882263, mean loss: 0.3390665025797694
Epoch: 73, step: 356, loss: 0.3213087320327759, mean loss: 0.33906633468775427
Epoch: 73, step: 357, loss: 0.31858375668525696, mean loss: 0.3390661410356979
Epoch: 73, step: 358, loss: 0.353656530380249, mean loss: 0.33906627897888975
Epoch: 73, step: 359, loss: 0.32258233428001404, mean loss: 0.3390661231347656
Epoch: 73, step: 360, loss: 0.35517340898513794, mean loss: 0.33906627541640505
Epoch: 73, step: 361, loss: 0.33302900195121765, mean loss: 0.3390662183393023
Epoch: 73, step: 362, loss: 0.33095335960388184, mean loss: 0.3390661416400942
Epoch: 73, step: 363, loss: 0.3364764451980591, mean loss: 0.3390661171572584
Epoch: 73, step: 364, loss: 0.35841143131256104, mean loss: 0.33906630004497645
Epoch: 73, step: 365, loss: 0.3401029109954834, mean loss: 0.3390663098448493
Epoch: 73, step: 366, loss: 0.2978805601596832, mean loss: 0.3390659204882692
Epoch: 73, step: 367, loss: 0.3226970136165619, mean loss: 0.339065765743451
Epoch: 73, step: 368, loss: 0.3325687348842621, mean loss: 0.3390657043238117
Epoch: 73, step: 369, loss: 0.3063737750053406, mean loss: 0.33906539527379076
Epoch: 73, step: 370, loss: 0.32199180126190186, mean loss: 0.3390652338717317
Epoch: 73, step: 371, loss: 0.3359670042991638, mean loss: 0.3390652045834691
Epoch: 73, step: 372, loss: 0.300841748714447, mean loss: 0.3390648432519394
Epoch: 73, step: 373, loss: 0.39041876792907715, mean loss: 0.3390653287029885
Epoch: 73, step: 374, loss: 0.34717339277267456, mean loss: 0.3390654053481724
Epoch: 73, step: 375, loss: 0.33565497398376465, mean loss: 0.3390653731098149
Epoch: 73, step: 376, loss: 0.34379827976226807, mean loss: 0.3390654178489338
Epoch: 73, step: 377, loss: 0.3493019640445709, mean loss: 0.3390655146118244
Epoch: 73, step: 378, loss: 0.3460456132888794, mean loss: 0.3390655805919047
Epoch: 73, step: 379, loss: 0.37406814098358154, mean loss: 0.3390659114539774
Epoch: 73, step: 380, loss: 0.3005833625793457, mean loss: 0.3390655477007151
Epoch: 73, step: 381, loss: 0.3487773537635803, mean loss: 0.3390656394999293
Epoch: 73, step: 382, loss: 0.3137027323246002, mean loss: 0.339065399763579
Epoch: 73, step: 383, loss: 0.3161538243293762, mean loss: 0.33906518319985796
Epoch: 73, step: 384, loss: 0.341661274433136, mean loss: 0.3390652077382781
Epoch: 73, step: 385, loss: 0.33182257413864136, mean loss: 0.3390651392810899
Epoch: 73, step: 386, loss: 0.32039734721183777, mean loss: 0.3390649628352627
Epoch: 73, step: 387, loss: 0.34575846791267395, mean loss: 0.33906502610090616
Epoch: 73, step: 388, loss: 0.35392308235168457, mean loss: 0.3390651665348931
Epoch: 73, step: 389, loss: 0.3378486931324005, mean loss: 0.3390651550372522
Epoch: 73, step: 390, loss: 0.31112509965896606, mean loss: 0.339064890961041
Epoch: 73, step: 391, loss: 0.30437523126602173, mean loss: 0.33906456309385546
Epoch: 73, step: 392, loss: 0.33242008090019226, mean loss: 0.3390645002945341
Epoch: 73, step: 393, loss: 0.3284241259098053, mean loss: 0.33906439972959085
Epoch: 73, step: 394, loss: 0.33895331621170044, mean loss: 0.3390643986797216
Epoch: 73, step: 395, loss: 0.3411749005317688, mean loss: 0.339064418626246
Epoch: 73, step: 396, loss: 0.3274381160736084, mean loss: 0.33906430874615495
Epoch: 73, step: 397, loss: 0.3335700035095215, mean loss: 0.3390642568200115
Epoch: 73, step: 398, loss: 0.33374813199043274, mean loss: 0.33906420657830855
Epoch: 73, step: 399, loss: 0.3528122007846832, mean loss: 0.33906433650680634
Epoch: 73, step: 400, loss: 0.35241323709487915, mean loss: 0.33906446266238827
Epoch: 73, step: 401, loss: 0.29818233847618103, mean loss: 0.33906407630402186
Epoch: 73, step: 402, loss: 0.34811535477638245, mean loss: 0.33906416184273064
Epoch: 73, step: 403, loss: 0.3192049562931061, mean loss: 0.33906397416595635
Epoch: 73, step: 404, loss: 0.31638479232788086, mean loss: 0.3390637598413975
Epoch: 73, step: 405, loss: 0.3251134753227234, mean loss: 0.33906362800858536
Epoch: 73, step: 406, loss: 0.324564665555954, mean loss: 0.33906349099195837
Epoch: 73, step: 407, loss: 0.3441406786441803, mean loss: 0.33906353897142966
Epoch: 73, step: 408, loss: 0.3607898950576782, mean loss: 0.3390637442837598
Epoch: 73, step: 409, loss: 0.31435108184814453, mean loss: 0.33906351075327995
Epoch: 73, step: 410, loss: 0.35998210310935974, mean loss: 0.3390637084285713
Epoch: 73, step: 411, loss: 0.3304509222507477, mean loss: 0.339063627040737
Epoch: 73, step: 412, loss: 0.31287258863449097, mean loss: 0.33906337954687066
Epoch: 73, step: 413, loss: 0.33460304141044617, mean loss: 0.3390633373990229
Epoch: 73, step: 414, loss: 0.3174166679382324, mean loss: 0.3390631328513228
Epoch: 73, step: 415, loss: 0.3521963953971863, mean loss: 0.339063256951396
Epoch: 73, step: 416, loss: 0.30125701427459717, mean loss: 0.33906289971242864
Epoch: 73, step: 417, loss: 0.33278876543045044, mean loss: 0.3390628404274028
Epoch: 73, step: 418, loss: 0.3008134961128235, mean loss: 0.33906247900830716
Epoch: 73, step: 419, loss: 0.3457665741443634, mean loss: 0.33906254235488603
Epoch: 73, step: 420, loss: 0.32770559191703796, mean loss: 0.3390624350447801
Epoch: 73, step: 421, loss: 0.35992130637168884, mean loss: 0.3390626321352362
Epoch: 73, step: 422, loss: 0.29901957511901855, mean loss: 0.33906225378160065
Epoch: 73, step: 423, loss: 0.30643874406814575, mean loss: 0.3390619455357324
Epoch: 73, step: 424, loss: 0.33135226368904114, mean loss: 0.3390618726908686
Epoch: 73, step: 425, loss: 0.3223904073238373, mean loss: 0.33906171517215733
Epoch: 73, step: 426, loss: 0.3402555286884308, mean loss: 0.3390617264516811
Epoch: 73, step: 427, loss: 0.4058801829814911, mean loss: 0.33906235776740795
Epoch: 73, step: 428, loss: 0.3429863750934601, mean loss: 0.3390623948420513
Epoch: 73, step: 429, loss: 0.30190175771713257, mean loss: 0.3390620437466721
Epoch: 73, step: 430, loss: 0.3126472234725952, mean loss: 0.3390617941806141
Epoch: 73, step: 431, loss: 0.34602323174476624, mean loss: 0.3390618599513481
Epoch: 73, step: 432, loss: 0.36014655232429504, mean loss: 0.3390620591548284
Epoch: 73, step: 433, loss: 0.36037561297416687, mean loss: 0.33906226051863825
Epoch: 73, step: 434, loss: 0.3204331398010254, mean loss: 0.339062084518178
Epoch: 73, step: 435, loss: 0.3084835708141327, mean loss: 0.3390617956273751
Epoch: 73, step: 436, loss: 0.3250599801540375, mean loss: 0.3390616633463382
Epoch: 73, step: 437, loss: 0.33565253019332886, mean loss: 0.33906163113912846
Epoch: 73, step: 438, loss: 0.31594279408454895, mean loss: 0.3390614127298829
Epoch: 73, step: 439, loss: 0.33380424976348877, mean loss: 0.33906136306466195
Epoch: 73, step: 440, loss: 0.32310551404953003, mean loss: 0.33906121232874503
Epoch: 73, step: 441, loss: 0.30491358041763306, mean loss: 0.33906088973694964
Epoch: 73, step: 442, loss: 0.3328014016151428, mean loss: 0.3390608306042859
Epoch: 73, step: 443, loss: 0.3543001711368561, mean loss: 0.3390609745672217
Epoch: 73, step: 444, loss: 0.3353247344493866, mean loss: 0.3390609392720582
Epoch: 73, step: 445, loss: 0.3287612795829773, mean loss: 0.3390608419751162
Epoch: 73, step: 446, loss: 0.33330851793289185, mean loss: 0.33906078763562647
Epoch: 73, step: 447, loss: 0.3272261917591095, mean loss: 0.3390606758408421
Epoch: 73, step: 448, loss: 0.3229856789112091, mean loss: 0.33906052399080355
Epoch: 73, step: 449, loss: 0.33068639039993286, mean loss: 0.3390604448865585
Epoch: 73, step: 450, loss: 0.33338120579719543, mean loss: 0.33906039123949494
Epoch: 73, step: 451, loss: 0.30228543281555176, mean loss: 0.33906004386023075
Epoch: 73, step: 452, loss: 0.35501253604888916, mean loss: 0.3390601945473529
Epoch: 73, step: 453, loss: 0.3560936748981476, mean loss: 0.3390603554439614
Epoch: 73, step: 454, loss: 0.34211990237236023, mean loss: 0.33906038434387287
Epoch: 73, step: 455, loss: 0.32796692848205566, mean loss: 0.339060279558141
Epoch: 73, step: 456, loss: 0.36740389466285706, mean loss: 0.3390605472816021
Epoch: 73, step: 457, loss: 0.34601038694381714, mean loss: 0.3390606129266353
Epoch: 73, step: 458, loss: 0.32025760412216187, mean loss: 0.3390604353236203
Epoch: 73, step: 459, loss: 0.30754944682121277, mean loss: 0.3390601376907381
Epoch: 73, step: 460, loss: 0.37512049078941345, mean loss: 0.339060478290826
Epoch: 73, step: 461, loss: 0.32617273926734924, mean loss: 0.3390603565636878
Epoch: 73, step: 462, loss: 0.3310401737689972, mean loss: 0.3390602808122565
Epoch: 73, step: 463, loss: 0.35198062658309937, mean loss: 0.3390604028450663
Epoch: 73, step: 464, loss: 0.33164864778518677, mean loss: 0.3390603328416183
Epoch: 73, step: 465, loss: 0.3006981313228607, mean loss: 0.33905997051704173
Epoch: 73, step: 466, loss: 0.3727147877216339, mean loss: 0.3390602883781587
Epoch: 73, step: 467, loss: 0.35549044609069824, mean loss: 0.33906044355531884
Epoch: 73, step: 468, loss: 0.33557164669036865, mean loss: 0.33906041060514963
Epoch: 73, step: 469, loss: 0.31376317143440247, mean loss: 0.3390601716859833
Epoch: 73, step: 470, loss: 0.3731416165828705, mean loss: 0.33906049356432916
Epoch: 73, step: 471, loss: 0.32887768745422363, mean loss: 0.33906039739487853
Epoch: 73, step: 472, loss: 0.3523028790950775, mean loss: 0.33906052245963464
Epoch: 73, step: 473, loss: 0.29921501874923706, mean loss: 0.33906014615395014
Epoch: 73, step: 474, loss: 0.3153107762336731, mean loss: 0.33905992186418915
Epoch: 73, step: 475, loss: 0.3245895802974701, mean loss: 0.33905978520714053
Epoch: 73, step: 476, loss: 0.3183920383453369, mean loss: 0.33905959002400665
Epoch: 73, step: 477, loss: 0.3718340992927551, mean loss: 0.3390598995386848
Epoch: 73, step: 478, loss: 0.32491499185562134, mean loss: 0.33905976595879905
Epoch: 73, step: 479, loss: 0.32788750529289246, mean loss: 0.33905966045261665
Epoch: 73, step: 480, loss: 0.3546115458011627, mean loss: 0.3390598073167658
Epoch: 73, step: 481, loss: 0.33932965993881226, mean loss: 0.3390598098650936
Epoch: 73, step: 482, loss: 0.33415502309799194, mean loss: 0.33905976354763984
Epoch: 73, step: 483, loss: 0.3036184310913086, mean loss: 0.339059428867081
Epoch: 73, step: 484, loss: 0.3361792266368866, mean loss: 0.33905940166893345
Epoch: 73, step: 485, loss: 0.36101147532463074, mean loss: 0.33905960896344
Epoch: 73, step: 486, loss: 0.34390440583229065, mean loss: 0.3390596547126621
Epoch: 73, step: 487, loss: 0.34286192059516907, mean loss: 0.33905969061696695
Epoch: 73, step: 488, loss: 0.3215998411178589, mean loss: 0.3390595257474237
Epoch: 73, step: 489, loss: 0.3398142158985138, mean loss: 0.3390595328737306
Epoch: 73, step: 490, loss: 0.3366519808769226, mean loss: 0.33905951014017255
Epoch: 73, step: 491, loss: 0.32968223094940186, mean loss: 0.33905942159508273
Epoch: 73, step: 492, loss: 0.33320069313049316, mean loss: 0.3390593662744797
Epoch: 73, step: 493, loss: 0.3146803677082062, mean loss: 0.33905913607979227
Epoch: 73, step: 494, loss: 0.31799939274787903, mean loss: 0.3390589372285045
Epoch: 73, step: 495, loss: 0.3124544620513916, mean loss: 0.33905868602486383
Epoch: 73, step: 496, loss: 0.35866960883140564, mean loss: 0.33905887119253425
Epoch: 73, step: 497, loss: 0.33587831258773804, mean loss: 0.33905884116176654
Epoch: 73, step: 498, loss: 0.3528212904930115, mean loss: 0.3390589711052977
Epoch: 73, step: 499, loss: 0.32152777910232544, mean loss: 0.3390588055792761
Epoch: 73, step: 500, loss: 0.30376532673835754, mean loss: 0.33905847234842773
Epoch: 73, step: 501, loss: 0.3500593602657318, mean loss: 0.33905857621465807
Epoch: 73, step: 502, loss: 0.33348554372787476, mean loss: 0.33905852359668626
Epoch: 73, step: 503, loss: 0.33282965421676636, mean loss: 0.3390584647871638
Epoch: 73, step: 504, loss: 0.29799655079841614, mean loss: 0.3390580771070559
Epoch: 73, step: 505, loss: 0.3259778916835785, mean loss: 0.33905795361354746
Epoch: 73, step: 506, loss: 0.3117351830005646, mean loss: 0.3390576956544408
Epoch: 73, step: 507, loss: 0.34004828333854675, mean loss: 0.33905770500666593
Epoch: 73, step: 508, loss: 0.3136565089225769, mean loss: 0.3390574651940123
Epoch: 73, step: 509, loss: 0.3237581253051758, mean loss: 0.3390573207543313
Epoch: 73, step: 510, loss: 0.3765430748462677, mean loss: 0.33905767465059644
Epoch: 73, step: 511, loss: 0.4037322700023651, mean loss: 0.3390582852260595
Epoch: 73, step: 512, loss: 0.3182631731033325, mean loss: 0.33905808890685135
Epoch: 73, step: 513, loss: 0.311413437128067, mean loss: 0.33905782792605554
Epoch: 73, step: 514, loss: 0.3039504587650299, mean loss: 0.3390574964962108
Epoch: 73, step: 515, loss: 0.3056299686431885, mean loss: 0.3390571809278261
Epoch: 73, step: 516, loss: 0.2968367338180542, mean loss: 0.33905678235475256
Epoch: 73, step: 517, loss: 0.3107459247112274, mean loss: 0.3390565150946974
Epoch: 73, step: 518, loss: 0.34180930256843567, mean loss: 0.3390565410813064
Epoch: 73, step: 519, loss: 0.324036568403244, mean loss: 0.3390563992924921
Epoch: 73, step: 520, loss: 0.346468061208725, mean loss: 0.33905646925805444
Epoch: 73, step: 521, loss: 0.34345924854278564, mean loss: 0.339056510819586
Epoch: 73, step: 522, loss: 0.3272804617881775, mean loss: 0.3390563996566178
Epoch: 73, step: 523, loss: 0.349286824464798, mean loss: 0.33905649622836687
Epoch: 73, step: 524, loss: 0.33193108439445496, mean loss: 0.33905642896752475
Epoch: 73, step: 525, loss: 0.30621451139450073, mean loss: 0.33905611895678667
Epoch: 73, step: 526, loss: 0.28677481412887573, mean loss: 0.3390556254529323
Epoch: 73, step: 527, loss: 0.3403612971305847, mean loss: 0.3390556377775658
Epoch: 73, step: 528, loss: 0.3246462941169739, mean loss: 0.33905550176465615
Epoch: 73, step: 529, loss: 0.315141499042511, mean loss: 0.3390552760373457
Epoch: 73, step: 530, loss: 0.36125123500823975, mean loss: 0.3390554855458453
Epoch: 73, step: 531, loss: 0.3237379789352417, mean loss: 0.3390553409646835
Epoch: 73, step: 532, loss: 0.36552953720092773, mean loss: 0.3390555908509097
Epoch: 73, step: 533, loss: 0.32019129395484924, mean loss: 0.33905541279513696
Epoch: 73, step: 534, loss: 0.3375590145587921, mean loss: 0.33905539867111045
Epoch: 73, step: 535, loss: 0.37534722685813904, mean loss: 0.3390557412148884
Epoch: 73, step: 536, loss: 0.31066077947616577, mean loss: 0.33905547320894464
Epoch: 73, step: 537, loss: 0.3270406126976013, mean loss: 0.33905535980771284
Epoch: 73, step: 538, loss: 0.33782586455345154, mean loss: 0.3390553482033367
Epoch: 73, step: 539, loss: 0.3374071419239044, mean loss: 0.3390553326471766
Epoch: 73, step: 540, loss: 0.3197733163833618, mean loss: 0.33905515066067066
Epoch: 73, step: 541, loss: 0.36223098635673523, mean loss: 0.33905536939555275
Epoch: 73, step: 542, loss: 0.3235025405883789, mean loss: 0.3390552226084374
Epoch: 73, step: 543, loss: 0.3306926190853119, mean loss: 0.3390551436831899
Epoch: 73, step: 544, loss: 0.3056330978870392, mean loss: 0.3390548282529135
Epoch: 73, step: 545, loss: 0.3366585671901703, mean loss: 0.33905480563771634
Epoch: 73, step: 546, loss: 0.35740792751312256, mean loss: 0.33905497884737174
Epoch: 73, step: 547, loss: 0.34232762455940247, mean loss: 0.33905500973304287
Epoch: 73, step: 548, loss: 0.32066109776496887, mean loss: 0.33905483614170295
Epoch: 73, step: 549, loss: 0.3675175905227661, mean loss: 0.33905510475454886
Epoch: 73, step: 550, loss: 0.34844136238098145, mean loss: 0.3390551933350687
Epoch: 73, step: 551, loss: 0.3240799009799957, mean loss: 0.33905505201072883
Epoch: 73, step: 552, loss: 0.34099748730659485, mean loss: 0.3390550703416428
Epoch: 73, step: 553, loss: 0.3410349190235138, mean loss: 0.33905508902545345
Epoch: 73, step: 554, loss: 0.36118248105049133, mean loss: 0.33905529783944294
Epoch: 73, step: 555, loss: 0.34270918369293213, mean loss: 0.3390553323204736
Epoch: 73, step: 556, loss: 0.37960121035575867, mean loss: 0.3390557149406553
Epoch: 73, step: 557, loss: 0.32785284519195557, mean loss: 0.3390556092232848
Epoch: 73, step: 558, loss: 0.2951239347457886, mean loss: 0.33905519466010736
Epoch: 73, step: 559, loss: 0.27333876490592957, mean loss: 0.33905457452998095
Epoch: 73, step: 560, loss: 0.32621872425079346, mean loss: 0.3390544534062015
Epoch: 73, step: 561, loss: 0.2818106710910797, mean loss: 0.3390539132380252
Epoch: 73, step: 562, loss: 0.317640095949173, mean loss: 0.3390537111732242
Epoch: 73, step: 563, loss: 0.3535662293434143, mean loss: 0.3390538481147786
Epoch: 73, step: 564, loss: 0.31147921085357666, mean loss: 0.33905358792023393
Epoch: 73, step: 565, loss: 0.3136616051197052, mean loss: 0.33905334832349876
Epoch: 73, step: 566, loss: 0.33918917179107666, mean loss: 0.33905334960510614
Epoch: 73, step: 567, loss: 0.3030918836593628, mean loss: 0.3390530102819702
Epoch: 73, step: 568, loss: 0.34753525257110596, mean loss: 0.3390530903174699
Epoch: 73, step: 569, loss: 0.31177493929862976, mean loss: 0.3390528329327157
Epoch: 73, step: 570, loss: 0.3304625451564789, mean loss: 0.33905275187926587
Epoch: 73, step: 571, loss: 0.34241941571235657, mean loss: 0.33905278364504027
Epoch: 73, step: 572, loss: 0.3463307023048401, mean loss: 0.3390528523143676
Epoch: 73, step: 573, loss: 0.3268948197364807, mean loss: 0.3390527376007962
Epoch: 73, step: 574, loss: 0.3582562506198883, mean loss: 0.33905291878823446
Epoch: 73, step: 575, loss: 0.3441922664642334, mean loss: 0.33905296727813594
Epoch: 73, step: 576, loss: 0.30525726079940796, mean loss: 0.33905264841762706
Epoch: 73, step: 577, loss: 0.325101763010025, mean loss: 0.3390525167930832
Epoch: 73, step: 578, loss: 0.33293408155441284, mean loss: 0.33905245906709475
Epoch: 73, step: 579, loss: 0.37316885590553284, mean loss: 0.3390527809441877
Epoch: 73, step: 580, loss: 0.3567335903644562, mean loss: 0.33905294775529243
Epoch: 73, step: 581, loss: 0.3217032849788666, mean loss: 0.3390527840699633
Epoch: 73, step: 582, loss: 0.33015698194503784, mean loss: 0.33905270014334293
Epoch: 73, step: 583, loss: 0.33342984318733215, mean loss: 0.3390526470955208
Epoch: 73, step: 584, loss: 0.3450910747051239, mean loss: 0.3390527040634313
Epoch: 73, step: 585, loss: 0.3278658390045166, mean loss: 0.3390525985249772
Epoch: 73, step: 586, loss: 0.3492259085178375, mean loss: 0.33905269450050524
Epoch: 73, step: 587, loss: 0.3112087547779083, mean loss: 0.3390524318218286
Epoch: 73, step: 588, loss: 0.3608856201171875, mean loss: 0.3390526377933599
Epoch: 73, step: 589, loss: 0.27408525347709656, mean loss: 0.3390520249050718
Epoch: 73, step: 590, loss: 0.39376315474510193, mean loss: 0.33905254103319876
Epoch: 73, step: 591, loss: 0.3531426191329956, mean loss: 0.339052673953448
Epoch: 73, step: 592, loss: 0.3980296552181244, mean loss: 0.3390532303138203
Epoch: 73, step: 593, loss: 0.3635331392288208, mean loss: 0.3390534612432857
Epoch: 73, step: 594, loss: 0.30337852239608765, mean loss: 0.3390531247094828
Epoch: 73, step: 595, loss: 0.3340764343738556, mean loss: 0.3390530777631171
Epoch: 73, step: 596, loss: 0.2816941738128662, mean loss: 0.3390525366873221
Epoch: 73, step: 597, loss: 0.3455422520637512, mean loss: 0.3390525979052768
Epoch: 73, step: 598, loss: 0.33522626757621765, mean loss: 0.33905256181156646
Epoch: 73, step: 599, loss: 0.3424011766910553, mean loss: 0.339052593398697
Epoch: 73, step: 600, loss: 0.36739397048950195, mean loss: 0.33905286073739216
Epoch: 73, step: 601, loss: 0.32544052600860596, mean loss: 0.33905273233609867
Epoch: 73, step: 602, loss: 0.3137732744216919, mean loss: 0.3390524938843898
Epoch: 73, step: 603, loss: 0.3332401514053345, mean loss: 0.33905243905924565
Epoch: 73, step: 604, loss: 0.3502887785434723, mean loss: 0.3390525450454505
Epoch: 73, step: 605, loss: 0.3532256484031677, mean loss: 0.3390526787312714
Epoch: 73, step: 606, loss: 0.29512810707092285, mean loss: 0.3390522644227827
Epoch: 73, step: 607, loss: 0.322150319814682, mean loss: 0.3390521050005547
Epoch: 73, step: 608, loss: 0.3197333812713623, mean loss: 0.33905192278454344
Epoch: 73, step: 609, loss: 0.33994805812835693, mean loss: 0.3390519312368962
Epoch: 73, step: 610, loss: 0.3402709662914276, mean loss: 0.3390519427347321
Epoch: 73, step: 611, loss: 0.315123051404953, mean loss: 0.3390517170415746
Epoch: 73, step: 612, loss: 0.3291521966457367, mean loss: 0.3390516236718939
Epoch: 73, step: 613, loss: 0.3386639952659607, mean loss: 0.3390516200159189
Epoch: 73, step: 614, loss: 0.3028458058834076, mean loss: 0.33905127853861466
Epoch: 73, step: 615, loss: 0.37320640683174133, mean loss: 0.33905160067171436
Epoch: 73, step: 616, loss: 0.30583158135414124, mean loss: 0.3390512873610228
Epoch: 73, step: 617, loss: 0.3875788748264313, mean loss: 0.3390517450389202
Epoch: 73, step: 618, loss: 0.3434411883354187, mean loss: 0.33905178643665573
Epoch: 73, step: 619, loss: 0.3335443437099457, mean loss: 0.33905173449532927
Epoch: 73, step: 620, loss: 0.37305504083633423, mean loss: 0.3390520551814019
Epoch: 73, step: 621, loss: 0.3202154040336609, mean loss: 0.339051877534127
Epoch: 73, step: 622, loss: 0.3093636631965637, mean loss: 0.33905159754908115
Epoch: 73, step: 623, loss: 0.3638266324996948, mean loss: 0.33905183119647403
Epoch: 73, step: 624, loss: 0.33968526124954224, mean loss: 0.3390518371701441
Epoch: 73, step: 625, loss: 0.3374139368534088, mean loss: 0.33905182172379167
Epoch: 73, step: 626, loss: 0.33200085163116455, mean loss: 0.3390517552296707
Epoch: 73, step: 627, loss: 0.32253962755203247, mean loss: 0.33905159951364205
Epoch: 73, step: 628, loss: 0.3665492534637451, mean loss: 0.339051858825172
Epoch: 73, step: 629, loss: 0.3231062889099121, mean loss: 0.33905170845484783
Epoch: 73, step: 630, loss: 0.3218802213668823, mean loss: 0.339051546525375
Epoch: 73, step: 631, loss: 0.3280494511127472, mean loss: 0.3390514427750882
Epoch: 73, step: 632, loss: 0.32928380370140076, mean loss: 0.33905135066665243
Epoch: 73, step: 633, loss: 0.3417493999004364, mean loss: 0.3390513761089061
Epoch: 73, step: 634, loss: 0.2756693363189697, mean loss: 0.33905077843014303
Epoch: 73, step: 635, loss: 0.3116340935230255, mean loss: 0.3390505198992428
Epoch: 73, step: 636, loss: 0.3502919673919678, mean loss: 0.3390506259016331
Epoch: 73, step: 637, loss: 0.30653396248817444, mean loss: 0.33905031928528784
Epoch: 73, step: 638, loss: 0.32019999623298645, mean loss: 0.3390501415375716
Epoch: 73, step: 639, loss: 0.3422037363052368, mean loss: 0.33905017127387804
Epoch: 73, step: 640, loss: 0.3029307723045349, mean loss: 0.3390498306951205
Epoch: 73, step: 641, loss: 0.3058058023452759, mean loss: 0.33904951723190035
Epoch: 73, step: 642, loss: 0.3226553499698639, mean loss: 0.33904936265015256
Epoch: 73, step: 643, loss: 0.30929261445999146, mean loss: 0.33904908207434176
Epoch: 73, step: 644, loss: 0.324485182762146, mean loss: 0.33904894475290787
Epoch: 73, step: 645, loss: 0.29303890466690063, mean loss: 0.3390485109332989
Epoch: 73, step: 646, loss: 0.343034565448761, mean loss: 0.33904854851666777
Epoch: 73, step: 647, loss: 0.40214651823043823, mean loss: 0.3390491434437818
Epoch: 73, step: 648, loss: 0.3339167535305023, mean loss: 0.33904909505285663
Epoch: 73, step: 649, loss: 0.33743050694465637, mean loss: 0.3390490797920836
Epoch: 73, step: 650, loss: 0.3299795389175415, mean loss: 0.3390489942811997
Epoch: 73, step: 651, loss: 0.34147748351097107, mean loss: 0.3390490171776512
Epoch: 73, step: 652, loss: 0.3657881021499634, mean loss: 0.3390492692785796
Epoch: 73, step: 653, loss: 0.31636980175971985, mean loss: 0.3390490554544746
Epoch: 73, step: 654, loss: 0.32383882999420166, mean loss: 0.3390489120524225
Epoch: 73, step: 655, loss: 0.34896382689476013, mean loss: 0.3390490055293886
Epoch: 73, step: 656, loss: 0.3200644254684448, mean loss: 0.3390488265460847
Epoch: 73, step: 657, loss: 0.33814239501953125, mean loss: 0.3390488180004872
Epoch: 73, step: 658, loss: 0.34103867411613464, mean loss: 0.33904883676014924
Epoch: 73, step: 659, loss: 0.30935138463974, mean loss: 0.3390485567856779
Epoch: 73, step: 660, loss: 0.34224840998649597, mean loss: 0.3390485869521972
Epoch: 73, step: 661, loss: 0.3261217176914215, mean loss: 0.33904846508567704
Epoch: 73, step: 662, loss: 0.2984274625778198, mean loss: 0.3390480821396247
Epoch: 73, step: 663, loss: 0.34888288378715515, mean loss: 0.3390481748542976
Epoch: 73, step: 664, loss: 0.31496691703796387, mean loss: 0.3390479478375285
Epoch: 73, step: 665, loss: 0.3279551863670349, mean loss: 0.3390478432657844
Epoch: 73, step: 666, loss: 0.31910404562950134, mean loss: 0.33904765525687
Epoch: 73, step: 667, loss: 0.2951629161834717, mean loss: 0.33904724156212
Epoch: 73, step: 668, loss: 0.33737286925315857, mean loss: 0.3390472257782161
Epoch: 73, step: 669, loss: 0.3698568642139435, mean loss: 0.33904751621050844
Epoch: 73, step: 670, loss: 0.3677661418914795, mean loss: 0.33904778692896176
Epoch: 73, step: 671, loss: 0.3285354673862457, mean loss: 0.33904768783466344
Epoch: 73, step: 672, loss: 0.41055142879486084, mean loss: 0.33904836185776716
Epoch: 73, step: 673, loss: 0.29846087098121643, mean loss: 0.3390479792673134
Epoch: 73, step: 674, loss: 0.363553524017334, mean loss: 0.33904821026210774
Epoch: 73, step: 675, loss: 0.33174028992652893, mean loss: 0.339048141376651
Epoch: 73, step: 676, loss: 0.33973851799964905, mean loss: 0.33904814788417414
Epoch: 73, step: 677, loss: 0.329096257686615, mean loss: 0.33904805407806426
Epoch: 73, step: 678, loss: 0.32469016313552856, mean loss: 0.3390479187424473
Epoch: 73, step: 679, loss: 0.40120649337768555, mean loss: 0.3390485046355837
Epoch: 73, step: 680, loss: 0.2947273254394531, mean loss: 0.33904808687777505
Epoch: 73, step: 681, loss: 0.3394603133201599, mean loss: 0.33904809076325815
Epoch: 73, step: 682, loss: 0.30786046385765076, mean loss: 0.339047796803817
Epoch: 73, step: 683, loss: 0.3167147934436798, mean loss: 0.33904758630574583
Epoch: 73, step: 684, loss: 0.35243090987205505, mean loss: 0.3390477124480832
Epoch: 73, step: 685, loss: 0.33119267225265503, mean loss: 0.3390476384123785
Epoch: 73, step: 686, loss: 0.3477582633495331, mean loss: 0.3390477205114081
Epoch: 73, step: 687, loss: 0.3076466917991638, mean loss: 0.33904742455449277
Epoch: 73, step: 688, loss: 0.3368183970451355, mean loss: 0.3390474035459489
Epoch: 73, step: 689, loss: 0.3589930832386017, mean loss: 0.3390475915318464
Epoch: 73, step: 690, loss: 0.3542151153087616, mean loss: 0.3390477344827882
Epoch: 73, step: 691, loss: 0.3013027310371399, mean loss: 0.33904737874687396
Epoch: 73, step: 692, loss: 0.36892497539520264, mean loss: 0.33904766033206457
Epoch: 73, step: 693, loss: 0.3359174430370331, mean loss: 0.3390476308312136
Epoch: 73, step: 694, loss: 0.33959686756134033, mean loss: 0.33904763600746707
Epoch: 73, step: 695, loss: 0.3566160500049591, mean loss: 0.3390478015785267
Epoch: 73, step: 696, loss: 0.33042773604393005, mean loss: 0.33904772034069075
Epoch: 73, step: 697, loss: 0.3075145483016968, mean loss: 0.33904742316632414
Epoch: 73, step: 698, loss: 0.3204163908958435, mean loss: 0.33904724758573146
Epoch: 73, step: 699, loss: 0.33602872490882874, mean loss: 0.3390472191391592
Epoch: 73, step: 700, loss: 0.32738617062568665, mean loss: 0.33904710924641734
Epoch: 73, step: 701, loss: 0.3135799765586853, mean loss: 0.3390468692485595
Epoch: 73, step: 702, loss: 0.38123902678489685, mean loss: 0.3390472668564145
Epoch: 73, step: 703, loss: 0.3106653690338135, mean loss: 0.3390469993953547
Epoch: 73, step: 704, loss: 0.323557585477829, mean loss: 0.3390468534299211
Epoch: 73, step: 705, loss: 0.32129350304603577, mean loss: 0.3390466861317211
Epoch: 73, step: 706, loss: 0.3196181654930115, mean loss: 0.3390465030493265
Epoch: 73, step: 707, loss: 0.32399922609329224, mean loss: 0.33904636125440607
Epoch: 73, step: 708, loss: 0.3211640417575836, mean loss: 0.3390461927456331
Epoch: 73, step: 709, loss: 0.3150232136249542, mean loss: 0.3390459663742952
Epoch: 73, step: 710, loss: 0.3343568742275238, mean loss: 0.3390459221888486
Epoch: 73, step: 711, loss: 0.3587735593318939, mean loss: 0.339046108081174
Epoch: 73, step: 712, loss: 0.3541091978549957, mean loss: 0.3390462500184157
Epoch: 73, step: 713, loss: 0.32341352105140686, mean loss: 0.3390461027149371
Epoch: 73, step: 714, loss: 0.33420780301094055, mean loss: 0.33904605712522196
Epoch: 73, step: 715, loss: 0.2951950430870056, mean loss: 0.3390456439353565
Epoch: 73, step: 716, loss: 0.3163950741291046, mean loss: 0.33904543051046976
Epoch: 73, step: 717, loss: 0.34689921140670776, mean loss: 0.3390455045119858
Epoch: 73, step: 718, loss: 0.3098466098308563, mean loss: 0.33904522939072357
Epoch: 73, step: 719, loss: 0.3208267092704773, mean loss: 0.3390450577316564
Epoch: 73, step: 720, loss: 0.37744054198265076, mean loss: 0.33904541949928996
Epoch: 73, step: 721, loss: 0.3176531493663788, mean loss: 0.33904521794022185
Epoch: 73, step: 722, loss: 0.3858843445777893, mean loss: 0.33904565925672103
Epoch: 73, step: 723, loss: 0.35047605633735657, mean loss: 0.33904576695248007
Epoch: 73, step: 724, loss: 0.3805793523788452, mean loss: 0.3390461582729944
Epoch: 73, step: 725, loss: 0.32609793543815613, mean loss: 0.33904603627877145
Epoch: 73, step: 726, loss: 0.36082255840301514, mean loss: 0.33904624144861595
Epoch: 73, step: 727, loss: 0.29872313141822815, mean loss: 0.3390458615436788
Epoch: 73, step: 728, loss: 0.35574254393577576, mean loss: 0.3390460188503029
Epoch: 73, step: 729, loss: 0.34922492504119873, mean loss: 0.3390461147492514
Epoch: 73, step: 730, loss: 0.3676888644695282, mean loss: 0.33904638459982767
Epoch: 73, step: 731, loss: 0.2867027223110199, mean loss: 0.33904589146161646
Epoch: 73, step: 732, loss: 0.3063020706176758, mean loss: 0.33904558297962634
Epoch: 73, step: 733, loss: 0.34114229679107666, mean loss: 0.3390456027327382
Epoch: 73, step: 734, loss: 0.33853664994239807, mean loss: 0.33904559793794614
Epoch: 73, step: 735, loss: 0.3637775778770447, mean loss: 0.33904583093319746
Epoch: 73, step: 736, loss: 0.39041978120803833, mean loss: 0.33904631491279474
Epoch: 73, step: 737, loss: 0.31014758348464966, mean loss: 0.3390460426685043
Epoch: 73, step: 738, loss: 0.3430017828941345, mean loss: 0.33904607993372293
Epoch: 73, step: 739, loss: 0.33727309107780457, mean loss: 0.33904606323136355
Epoch: 73, step: 740, loss: 0.3690272271633148, mean loss: 0.33904634566486924
Epoch: 73, step: 741, loss: 0.3038690388202667, mean loss: 0.3390460142849227
Epoch: 73, step: 742, loss: 0.32186371088027954, mean loss: 0.3390458524244036
Epoch: 73, step: 743, loss: 0.33036163449287415, mean loss: 0.33904577061821334
Epoch: 73, step: 744, loss: 0.376336008310318, mean loss: 0.33904612189262473
Epoch: 73, step: 745, loss: 0.32416826486587524, mean loss: 0.33904598174438316
Epoch: 73, step: 746, loss: 0.34887441992759705, mean loss: 0.33904607432662476
Epoch: 73, step: 747, loss: 0.2932073175907135, mean loss: 0.339045642537281
Epoch: 73, step: 748, loss: 0.32898613810539246, mean loss: 0.3390455477802192
Epoch: 73, step: 749, loss: 0.35822752118110657, mean loss: 0.3390457284660899
Epoch: 73, step: 750, loss: 0.30388960242271423, mean loss: 0.3390453973137483
Epoch: 73, step: 751, loss: 0.3293421268463135, mean loss: 0.3390453059148704
Epoch: 73, step: 752, loss: 0.33632755279541016, mean loss: 0.33904528031553804
Epoch: 73, step: 753, loss: 0.3753304183483124, mean loss: 0.3390456220929247
Epoch: 73, step: 754, loss: 0.3089894950389862, mean loss: 0.33904533899057604
Epoch: 73, step: 755, loss: 0.36049583554267883, mean loss: 0.339045541033532
Epoch: 73, step: 756, loss: 0.3446168899536133, mean loss: 0.33904559350976254
Epoch: 73, step: 757, loss: 0.32476431131362915, mean loss: 0.3390454589964142
Epoch: 73, step: 758, loss: 0.33985191583633423, mean loss: 0.33904546659224394
Epoch: 73, step: 759, loss: 0.3408530354499817, mean loss: 0.33904548361715503
Epoch: 73, step: 760, loss: 0.33720624446868896, mean loss: 0.3390454662941148
Epoch: 73, step: 761, loss: 0.31848394870758057, mean loss: 0.3390452726354264
Epoch: 73, step: 762, loss: 0.3122018873691559, mean loss: 0.3390450198133377
Epoch: 73, step: 763, loss: 0.3158054053783417, mean loss: 0.3390448009351125
Epoch: 73, step: 764, loss: 0.34471067786216736, mean loss: 0.3390448542976762
Epoch: 73, step: 765, loss: 0.32787641882896423, mean loss: 0.3390447491117105
Epoch: 73, step: 766, loss: 0.34749549627304077, mean loss: 0.33904482870133895
Epoch: 73, step: 767, loss: 0.2902933657169342, mean loss: 0.33904436956154815
Epoch: 73, step: 768, loss: 0.31527847051620483, mean loss: 0.3390441457371441
Epoch: 73, step: 769, loss: 0.32715365290641785, mean loss: 0.33904403375495473
Epoch: 73, step: 770, loss: 0.38431262969970703, mean loss: 0.3390444600811646
Epoch: 73, step: 771, loss: 0.2749972641468048, mean loss: 0.3390438569093503
Epoch: 73, step: 772, loss: 0.30481773614883423, mean loss: 0.33904353458396763
Epoch: 73, step: 773, loss: 0.3222333490848541, mean loss: 0.33904337627509923
Epoch: 73, step: 774, loss: 0.29833555221557617, mean loss: 0.3390429929153277
Epoch: 73, step: 775, loss: 0.3371971547603607, mean loss: 0.33904297553258994
Epoch: 73, step: 776, loss: 0.2907193899154663, mean loss: 0.3390425204611078
Epoch: 73, step: 777, loss: 0.3309704065322876, mean loss: 0.33904244444534426
Epoch: 73, step: 778, loss: 0.336024671792984, mean loss: 0.3390424160269976
Epoch: 73, step: 779, loss: 0.3274150788784027, mean loss: 0.3390423065334656
Epoch: 73, step: 780, loss: 0.344890832901001, mean loss: 0.3390423616079655
Epoch: 73, step: 781, loss: 0.3241606652736664, mean loss: 0.3390422214710808
Epoch: 73, step: 782, loss: 0.3682955801486969, mean loss: 0.3390424969394049
Epoch: 73, step: 783, loss: 0.3225283622741699, mean loss: 0.3390423414332214
Epoch: 73, step: 784, loss: 0.3070579767227173, mean loss: 0.339042040253671
Epoch: 73, step: 785, loss: 0.324578195810318, mean loss: 0.33904190405671397
Epoch: 73, step: 786, loss: 0.3431017994880676, mean loss: 0.3390419422858445
Epoch: 73, step: 787, loss: 0.37736669182777405, mean loss: 0.33904230315919237
Epoch: 73, step: 788, loss: 0.37114229798316956, mean loss: 0.33904260541618453
Epoch: 73, step: 789, loss: 0.3225036859512329, mean loss: 0.33904244968541236
Epoch: 73, step: 790, loss: 0.2951577603816986, mean loss: 0.3390420364702555
Epoch: 73, step: 791, loss: 0.3441449701786041, mean loss: 0.339042084518669
Epoch: 73, step: 792, loss: 0.2735825181007385, mean loss: 0.33904146816758934
Epoch: 73, step: 793, loss: 0.35081249475479126, mean loss: 0.33904157899961945
Epoch: 73, step: 794, loss: 0.31166180968284607, mean loss: 0.3390413212033413
Epoch: 73, step: 795, loss: 0.33482784032821655, mean loss: 0.3390412815313686
Epoch: 73, step: 796, loss: 0.32551002502441406, mean loss: 0.33904115412920394
Epoch: 73, step: 797, loss: 0.3162994086742401, mean loss: 0.3390409400086366
Epoch: 73, step: 798, loss: 0.330242395401001, mean loss: 0.33904085716839777
Epoch: 73, step: 799, loss: 0.3657588064670563, mean loss: 0.3390411087214172
Epoch: 73, step: 800, loss: 0.3227643370628357, mean loss: 0.3390409554749063
Epoch: 73, step: 801, loss: 0.29249411821365356, mean loss: 0.3390405172385414
Epoch: 73, step: 802, loss: 0.3018142580986023, mean loss: 0.3390401667582972
Epoch: 73, step: 803, loss: 0.3095259964466095, mean loss: 0.33903988888895253
Epoch: 73, step: 804, loss: 0.32507944107055664, mean loss: 0.3390397574556808
Epoch: 73, step: 805, loss: 0.29398712515830994, mean loss: 0.3390393333031615
Epoch: 73, step: 806, loss: 0.338276743888855, mean loss: 0.33903932612375465
Epoch: 73, step: 807, loss: 0.32958006858825684, mean loss: 0.3390392370703039
Epoch: 73, step: 808, loss: 0.31095725297927856, mean loss: 0.33903897269711886
Epoch: 73, step: 809, loss: 0.3340272307395935, mean loss: 0.339038925515349
Epoch: 73, step: 810, loss: 0.3144795298576355, mean loss: 0.3390386943093422
Epoch: 73, step: 811, loss: 0.30540233850479126, mean loss: 0.3390383776543885
Epoch: 73, step: 812, loss: 0.32398802042007446, mean loss: 0.3390382359706301
Epoch: 73, step: 813, loss: 0.34263789653778076, mean loss: 0.3390382698574428
Epoch: 73, step: 814, loss: 0.3365783393383026, mean loss: 0.33903824670014265
Epoch: 73, step: 815, loss: 0.4186951220035553, mean loss: 0.3390389965671768
Epoch: 73, step: 816, loss: 0.3644622564315796, mean loss: 0.33903923589221857
Epoch: 73, step: 817, loss: 0.3264163136482239, mean loss: 0.3390391170658772
Epoch: 73, step: 818, loss: 0.3643434941768646, mean loss: 0.3390393552673166
Epoch: 73, step: 819, loss: 0.28508806228637695, mean loss: 0.33903884740440354
Epoch: 73, step: 820, loss: 0.3379879891872406, mean loss: 0.33903883751239056
Epoch: 73, step: 821, loss: 0.28990817070007324, mean loss: 0.3390383750364712
Epoch: 73, step: 822, loss: 0.32263997197151184, mean loss: 0.3390382206767681
Epoch: 73, step: 823, loss: 0.31581634283065796, mean loss: 0.3390380020891156
Epoch: 73, step: 824, loss: 0.3167073428630829, mean loss: 0.33903779189248706
Epoch: 73, step: 825, loss: 0.32059943675994873, mean loss: 0.33903761833542523
Epoch: 73, step: 826, loss: 0.3374118208885193, mean loss: 0.33903760303221786
Epoch: 73, step: 827, loss: 0.3855200707912445, mean loss: 0.339038040555446
Epoch: 73, step: 828, loss: 0.37872710824012756, mean loss: 0.3390384141312565
Epoch: 73, step: 829, loss: 0.3116965591907501, mean loss: 0.3390381567767739
Epoch: 73, step: 830, loss: 0.3136530816555023, mean loss: 0.3390379178426783
Epoch: 73, step: 831, loss: 0.33372339606285095, mean loss: 0.339037867820825
Epoch: 73, step: 832, loss: 0.3299216032028198, mean loss: 0.3390377820166496
Epoch: 73, step: 833, loss: 0.30555257201194763, mean loss: 0.3390374668498668
Epoch: 73, step: 834, loss: 0.3177289664745331, mean loss: 0.33903726629361225
Epoch: 73, step: 835, loss: 0.3307107090950012, mean loss: 0.3390371879245399
Epoch: 73, step: 836, loss: 0.3103271424770355, mean loss: 0.33903691770980426
Epoch: 73, step: 837, loss: 0.3163469731807709, mean loss: 0.3390367041573852
Epoch: 73, step: 838, loss: 0.3598000705242157, mean loss: 0.3390368995754647
Epoch: 73, step: 839, loss: 0.30245518684387207, mean loss: 0.3390365552834727
Epoch: 73, step: 840, loss: 0.29607442021369934, mean loss: 0.33903615094538275
Epoch: 73, step: 841, loss: 0.3273774981498718, mean loss: 0.33903604122101666
Epoch: 73, step: 842, loss: 0.36262571811676025, mean loss: 0.33903626323105757
Epoch: 73, step: 843, loss: 0.3192317485809326, mean loss: 0.33903607684615084
Epoch: 73, step: 844, loss: 0.32824602723121643, mean loss: 0.33903597529943286
Epoch: 73, step: 845, loss: 0.3698970079421997, mean loss: 0.33903626573434265
Epoch: 73, step: 846, loss: 0.37692520022392273, mean loss: 0.33903662230587533
Epoch: 73, step: 847, loss: 0.3347300589084625, mean loss: 0.33903658177732837
Epoch: 73, step: 848, loss: 0.32952940464019775, mean loss: 0.33903649230727695
Epoch: 73, step: 849, loss: 0.3185150921344757, mean loss: 0.33903629918649836
Epoch: 73, step: 850, loss: 0.35866445302963257, mean loss: 0.3390364838994638
Epoch: 73, step: 851, loss: 0.31928175687789917, mean loss: 0.3390362979971166
Epoch: 73, step: 852, loss: 0.32145604491233826, mean loss: 0.339036132559267
Epoch: 73, step: 853, loss: 0.31181615591049194, mean loss: 0.3390358764098246
Epoch: 73, step: 854, loss: 0.3019789755344391, mean loss: 0.33903552769478723
Epoch: 73, step: 855, loss: 0.3250102698802948, mean loss: 0.33903539571471975
Epoch: 73, step: 856, loss: 0.3203090727329254, mean loss: 0.33903521949848564
Epoch: 73, step: 857, loss: 0.3187206983566284, mean loss: 0.33903502833897553
Epoch: 73, step: 858, loss: 0.3098351061344147, mean loss: 0.3390347535704855
Epoch: 73, step: 859, loss: 0.30074161291122437, mean loss: 0.3390343932390656
Epoch: 73, step: 860, loss: 0.3061296343803406, mean loss: 0.3390340836142422
Epoch: 73, step: 861, loss: 0.37018465995788574, mean loss: 0.33903437672992753
Epoch: 73, step: 862, loss: 0.3366490304470062, mean loss: 0.33903435428489076
Epoch: 73, step: 863, loss: 0.28923916816711426, mean loss: 0.3390338857389715
Epoch: 73, step: 864, loss: 0.3772329092025757, mean loss: 0.3390342451678551
Epoch: 73, step: 865, loss: 0.34855329990386963, mean loss: 0.3390343347353548
Epoch: 73, step: 866, loss: 0.32028937339782715, mean loss: 0.3390341583603293
Epoch: 73, step: 867, loss: 0.38785532116889954, mean loss: 0.3390346177239237
Epoch: 73, step: 868, loss: 0.35763195157051086, mean loss: 0.33903479270660025
Epoch: 73, step: 869, loss: 0.3053969144821167, mean loss: 0.3390344762101265
Epoch: 73, step: 870, loss: 0.3266298472881317, mean loss: 0.33903435949692756
Epoch: 73, step: 871, loss: 0.4006146490573883, mean loss: 0.3390349388907174
Epoch: 73, step: 872, loss: 0.3298431932926178, mean loss: 0.33903485240865877
Epoch: 73, step: 873, loss: 0.36084792017936707, mean loss: 0.33903505763858344
Epoch: 73, step: 874, loss: 0.3377350866794586, mean loss: 0.3390350454078218
Epoch: 73, step: 875, loss: 0.32564473152160645, mean loss: 0.3390349194263951
Epoch: 73, step: 876, loss: 0.3227882385253906, mean loss: 0.33903476657256354
Epoch: 73, step: 877, loss: 0.33967024087905884, mean loss: 0.33903477255124737
Epoch: 73, step: 878, loss: 0.3219667673110962, mean loss: 0.3390346119731623
Epoch: 73, step: 879, loss: 0.3609192371368408, mean loss: 0.3390348178647173
Epoch: 73, step: 880, loss: 0.31590089201927185, mean loss: 0.3390346002217319
Epoch: 73, step: 881, loss: 0.31999123096466064, mean loss: 0.3390344210642135
Epoch: 73, step: 882, loss: 0.36427852511405945, mean loss: 0.3390346585551966
Epoch: 73, step: 883, loss: 0.3180154263973236, mean loss: 0.3390344608127401
Epoch: 73, step: 884, loss: 0.3632670044898987, mean loss: 0.3390346887828961
Epoch: 73, step: 885, loss: 0.34103888273239136, mean loss: 0.3390347076373802
Epoch: 73, step: 886, loss: 0.327334463596344, mean loss: 0.3390345975681976
Epoch: 73, step: 887, loss: 0.3588100075721741, mean loss: 0.3390347836021581
Epoch: 73, step: 888, loss: 0.30864110589027405, mean loss: 0.339034497681257
Epoch: 73, step: 889, loss: 0.37716424465179443, mean loss: 0.33903485637391534
Epoch: 73, step: 890, loss: 0.3253653347492218, mean loss: 0.33903472778373794
Epoch: 73, step: 891, loss: 0.348888635635376, mean loss: 0.3390348204792889
Epoch: 73, step: 892, loss: 0.3408062160015106, mean loss: 0.33903483714262106
Epoch: 73, step: 893, loss: 0.3379823565483093, mean loss: 0.33903482724213946
Epoch: 73, step: 894, loss: 0.32080796360969543, mean loss: 0.3390346557871682
Epoch: 73, step: 895, loss: 0.2954705059528351, mean loss: 0.33903424599533843
Epoch: 73, step: 896, loss: 0.2938019633293152, mean loss: 0.33903382051600306
Epoch: 73, step: 897, loss: 0.3345354199409485, mean loss: 0.33903377820201025
Epoch: 73, step: 898, loss: 0.306185781955719, mean loss: 0.3390334692217895
Epoch: 73, step: 899, loss: 0.32077714800834656, mean loss: 0.33903329749779587
Epoch: 73, step: 900, loss: 0.298993319272995, mean loss: 0.33903292087425757
Epoch: 73, step: 901, loss: 0.34316039085388184, mean loss: 0.33903295969764846
Epoch: 73, step: 902, loss: 0.32476526498794556, mean loss: 0.3390328254955631
Epoch: 73, step: 903, loss: 0.34737855195999146, mean loss: 0.33903290399481495
Epoch: 73, step: 904, loss: 0.38515692949295044, mean loss: 0.33903333782971906
Epoch: 73, step: 905, loss: 0.3234643042087555, mean loss: 0.33903319139135846
Epoch: 73, step: 906, loss: 0.32969096302986145, mean loss: 0.33903310352156696
Epoch: 73, step: 907, loss: 0.3154149055480957, mean loss: 0.3390328813789976
Epoch: 73, step: 908, loss: 0.31994131207466125, mean loss: 0.3390327018136314
Epoch: 73, step: 909, loss: 0.3557029366493225, mean loss: 0.3390328586037109
Epoch: 73, step: 910, loss: 0.3421310782432556, mean loss: 0.33903288774340445
Epoch: 73, step: 911, loss: 0.37348422408103943, mean loss: 0.3390332117656039
Epoch: 73, step: 912, loss: 0.3326968848705292, mean loss: 0.3390331521716524
Epoch: 73, step: 913, loss: 0.3057733178138733, mean loss: 0.33903283936166845
Epoch: 73, step: 914, loss: 0.34143680334091187, mean loss: 0.33903286197082677
Epoch: 73, step: 915, loss: 0.3494165241718292, mean loss: 0.33903295962772056
Epoch: 73, step: 916, loss: 0.3231607973575592, mean loss: 0.33903281035365357
Epoch: 73, step: 917, loss: 0.324763685464859, mean loss: 0.3390326761570497
Epoch: 73, step: 918, loss: 0.32907381653785706, mean loss: 0.33903258249800744
Epoch: 73, step: 919, loss: 0.3507542014122009, mean loss: 0.33903269273405034
Epoch: 73, step: 920, loss: 0.33617812395095825, mean loss: 0.33903266588849174
Epoch: 73, step: 921, loss: 0.3121294677257538, mean loss: 0.3390324128819448
Epoch: 73, step: 922, loss: 0.33851417899131775, mean loss: 0.3390324080083482
Epoch: 73, step: 923, loss: 0.33808720111846924, mean loss: 0.33903239911947813
Epoch: 73, step: 924, loss: 0.2972080707550049, mean loss: 0.3390320058007992
Epoch: 73, step: 925, loss: 0.3387836813926697, mean loss: 0.3390320034655624
Epoch: 73, step: 926, loss: 0.33531635999679565, mean loss: 0.33903196852406897
Epoch: 73, step: 927, loss: 0.34745222330093384, mean loss: 0.33903204770645357
Epoch: 73, step: 928, loss: 0.2971948981285095, mean loss: 0.33903165428200227
Epoch: 73, step: 929, loss: 0.3093199133872986, mean loss: 0.33903137488401375
Epoch: 73, step: 930, loss: 0.3049861192703247, mean loss: 0.3390310547383002
Epoch: 73, step: 931, loss: 0.3348388969898224, mean loss: 0.3390310153175736
Epoch: 73, step: 932, loss: 0.35198476910591125, mean loss: 0.339031137126345
Epoch: 73, step: 933, loss: 0.31448134779930115, mean loss: 0.33903090627808247
Epoch: 73, step: 934, loss: 0.3339058458805084, mean loss: 0.33903085808621625
Epoch: 73, step: 935, loss: 0.38481396436691284, mean loss: 0.3390312885889646
Epoch: 73, step: 936, loss: 0.3303660452365875, mean loss: 0.33903120710965257
Epoch: 73, step: 937, loss: 0.3547283709049225, mean loss: 0.33903135470874796
Epoch: 73, step: 938, loss: 0.3483932912349701, mean loss: 0.3390314427374127
Epoch: 73, step: 939, loss: 0.30719488859176636, mean loss: 0.33903114338663276
Epoch: 73, step: 940, loss: 0.3393392860889435, mean loss: 0.3390311462839906
Epoch: 73, step: 941, loss: 0.3575020134449005, mean loss: 0.33903131995745056
Epoch: 73, step: 942, loss: 0.34005075693130493, mean loss: 0.339031329542679
Epoch: 73, step: 943, loss: 0.327218621969223, mean loss: 0.33903121847506107
Epoch: 73, step: 944, loss: 0.35734882950782776, mean loss: 0.33903139070266275
Epoch: 73, step: 945, loss: 0.3372941315174103, mean loss: 0.33903137436859115
Epoch: 73, step: 946, loss: 0.3620719611644745, mean loss: 0.33903159099893554
Epoch: 73, step: 947, loss: 0.3219849169254303, mean loss: 0.33903143072558023
Epoch: 73, step: 948, loss: 0.3474733233451843, mean loss: 0.33903151009576876
Epoch: 73, step: 949, loss: 0.35725975036621094, mean loss: 0.33903168147502327
Epoch: 73, step: 950, loss: 0.3467077910900116, mean loss: 0.339031753644007
Epoch: 73, step: 951, loss: 0.3389512598514557, mean loss: 0.33903175288723036
Epoch: 73, step: 952, loss: 0.30273059010505676, mean loss: 0.33903141159862243
Epoch: 73, step: 953, loss: 0.34705108404159546, mean loss: 0.3390314869955767
Epoch: 73, step: 954, loss: 0.3214821517467499, mean loss: 0.3390313220070441
Epoch: 73, step: 955, loss: 0.3146025836467743, mean loss: 0.3390310923445671
Epoch: 73, step: 956, loss: 0.3167212903499603, mean loss: 0.3390308826048685
Epoch: 73, step: 957, loss: 0.29844528436660767, mean loss: 0.33903050105369587
Epoch: 73, step: 958, loss: 0.34045708179473877, mean loss: 0.33903051446506494
Epoch: 73, step: 959, loss: 0.3150378167629242, mean loss: 0.3390302889104293
Epoch: 73, step: 960, loss: 0.3220020532608032, mean loss: 0.33903012882999867
Epoch: 73, step: 961, loss: 0.33521243929862976, mean loss: 0.33903009294068803
Epoch: 73, step: 962, loss: 0.3401104211807251, mean loss: 0.3390301030965352
Epoch: 73, step: 963, loss: 0.30858972668647766, mean loss: 0.339029816938225
Epoch: 73, step: 964, loss: 0.3530653417110443, mean loss: 0.33902994887957294
Epoch: 73, step: 965, loss: 0.33508774638175964, mean loss: 0.3390299118211351
Epoch: 73, step: 966, loss: 0.3026616871356964, mean loss: 0.339029569947037
Epoch: 73, step: 967, loss: 0.30538952350616455, mean loss: 0.33902925372174614
Epoch: 73, step: 968, loss: 0.34108102321624756, mean loss: 0.33902927300873814
Epoch: 73, step: 969, loss: 0.3190097212791443, mean loss: 0.3390290848232206
Epoch: 73, step: 970, loss: 0.3355903923511505, mean loss: 0.3390290524995178
Epoch: 73, step: 971, loss: 0.3456893563270569, mean loss: 0.33902911510577277
Epoch: 73, step: 972, loss: 0.29322490096092224, mean loss: 0.33902868455434026
Epoch: 73, step: 973, loss: 0.3720114827156067, mean loss: 0.3390289945838381
Epoch: 73, step: 974, loss: 0.36395135521888733, mean loss: 0.339029228845173
Epoch: 73, step: 975, loss: 0.35482800006866455, mean loss: 0.33902937734661326
Epoch: 73, step: 976, loss: 0.37325966358184814, mean loss: 0.339029699093093
Epoch: 73, step: 977, loss: 0.3488921821117401, mean loss: 0.3390297917943151
Epoch: 73, step: 978, loss: 0.2873580753803253, mean loss: 0.3390293061168009
Epoch: 73, step: 979, loss: 0.3536521792411804, mean loss: 0.3390294435601531
Epoch: 73, step: 980, loss: 0.2967921197414398, mean loss: 0.33902904656670596
Epoch: 73, step: 981, loss: 0.3169305622577667, mean loss: 0.3390288388624716
Epoch: 73, step: 982, loss: 0.33968260884284973, mean loss: 0.33902884500721503
Epoch: 73, step: 983, loss: 0.3414335250854492, mean loss: 0.33902886760844136
Epoch: 73, step: 984, loss: 0.33359986543655396, mean loss: 0.3390288165825462
Epoch: 73, step: 985, loss: 0.36305293440818787, mean loss: 0.3390290423773715
Epoch: 73, step: 986, loss: 0.3126213550567627, mean loss: 0.3390287941824889
Epoch: 73, step: 987, loss: 0.30526962876319885, mean loss: 0.3390284768970996
Epoch: 73, step: 988, loss: 0.3337436318397522, mean loss: 0.33902842722797
Epoch: 73, step: 989, loss: 0.3500474989414215, mean loss: 0.33902853078872747
Epoch: 73, step: 990, loss: 0.3225560188293457, mean loss: 0.33902837597625074
Epoch: 73, step: 991, loss: 0.34736138582229614, mean loss: 0.33902845429106826
Epoch: 73, step: 992, loss: 0.29978448152542114, mean loss: 0.3390280854740694
Epoch: 73, step: 993, loss: 0.3587910532951355, mean loss: 0.33902827120577456
Epoch: 73, step: 994, loss: 0.3169456124305725, mean loss: 0.33902806367564237
Epoch: 73, step: 995, loss: 0.29593852162361145, mean loss: 0.3390276587291905
Epoch: 73, step: 996, loss: 0.3098302483558655, mean loss: 0.33902738434064844
Epoch: 73, step: 997, loss: 0.30287209153175354, mean loss: 0.3390270445671985
Epoch: 73, step: 998, loss: 0.3927149772644043, mean loss: 0.3390275491008717
Epoch: 73, step: 999, loss: 0.3712652921676636, mean loss: 0.33902785205301117
Epoch: 73, step: 1000, loss: 0.3537808358669281, mean loss: 0.3390279906919351
Epoch: 73, step: 1001, loss: 0.32653602957725525, mean loss: 0.3390278733017316
Epoch: 73, step: 1002, loss: 0.3230205774307251, mean loss: 0.33902772287842786
Epoch: 73, step: 1003, loss: 0.3095570206642151, mean loss: 0.3390274459397888
Epoch: 73, step: 1004, loss: 0.31234967708587646, mean loss: 0.3390271952489325
Epoch: 73, step: 1005, loss: 0.3392470180988312, mean loss: 0.33902719731458725
Epoch: 73, step: 1006, loss: 0.30859997868537903, mean loss: 0.3390269113955443
Epoch: 73, step: 1007, loss: 0.29699480533599854, mean loss: 0.3390265164311949
Epoch: 73, step: 1008, loss: 0.32990890741348267, mean loss: 0.33902643075629035
Epoch: 73, step: 1009, loss: 0.3390097916126251, mean loss: 0.33902643059993975
Epoch: 73, step: 1010, loss: 0.3386313021183014, mean loss: 0.3390264268871288
Epoch: 73, step: 1011, loss: 0.30270472168922424, mean loss: 0.3390260855947023
Epoch: 73, step: 1012, loss: 0.33973997831344604, mean loss: 0.33902609230264424
Epoch: 73, step: 1013, loss: 0.3321720361709595, mean loss: 0.3390260279005608
Epoch: 73, step: 1014, loss: 0.3061463534832001, mean loss: 0.3390257189594611
Epoch: 73, step: 1015, loss: 0.33766499161720276, mean loss: 0.3390257061740349
Epoch: 73, step: 1016, loss: 0.30992814898490906, mean loss: 0.3390254327752696
Epoch: 73, step: 1017, loss: 0.33148351311683655, mean loss: 0.3390253619125461
Epoch: 73, step: 1018, loss: 0.3249271512031555, mean loss: 0.3390252294491594
Epoch: 73, step: 1019, loss: 0.3293527066707611, mean loss: 0.3390251385693227
Epoch: 73, step: 1020, loss: 0.3288654386997223, mean loss: 0.3390250431130275
Epoch: 73, step: 1021, loss: 0.3467710614204407, mean loss: 0.33902511589069545
Epoch: 73, step: 1022, loss: 0.3376263380050659, mean loss: 0.3390251027486098
Epoch: 73, step: 1023, loss: 0.33319899439811707, mean loss: 0.3390250480104728
Epoch: 73, step: 1024, loss: 0.3107016980648041, mean loss: 0.3390247819061111
Epoch: 73, step: 1025, loss: 0.332474023103714, mean loss: 0.33902472036080955
Epoch: 73, step: 1026, loss: 0.3088169991970062, mean loss: 0.33902443655768133
Epoch: 73, step: 1027, loss: 0.32692527770996094, mean loss: 0.3390243228865159
Epoch: 73, step: 1028, loss: 0.3010997176170349, mean loss: 0.33902396658955075
Epoch: 73, step: 1029, loss: 0.3369270861148834, mean loss: 0.3390239468898037
Epoch: 73, step: 1030, loss: 0.35467615723609924, mean loss: 0.33902409393761657
Epoch: 73, step: 1031, loss: 0.33638522028923035, mean loss: 0.3390240691464245
Epoch: 73, step: 1032, loss: 0.3210606276988983, mean loss: 0.3390239003884608
Epoch: 73, step: 1033, loss: 0.3157169818878174, mean loss: 0.33902368143313605
Epoch: 73, step: 1034, loss: 0.3256431818008423, mean loss: 0.3390235557320864
Epoch: 73, step: 1035, loss: 0.3451991677284241, mean loss: 0.3390236137473802
Epoch: 73, step: 1036, loss: 0.3408488929271698, mean loss: 0.3390236308943631
Epoch: 73, step: 1037, loss: 0.3173353672027588, mean loss: 0.33902342715304146
Epoch: 73, step: 1038, loss: 0.31788381934165955, mean loss: 0.3390232285677035
Epoch: 73, step: 1039, loss: 0.3346322774887085, mean loss: 0.3390231873195252
Epoch: 73, step: 1040, loss: 0.33341503143310547, mean loss: 0.33902313463753514
Epoch: 73, step: 1041, loss: 0.3463928699493408, mean loss: 0.3390232038668296
Epoch: 73, step: 1042, loss: 0.34397003054618835, mean loss: 0.3390232503355411
Epoch: 73, step: 1043, loss: 0.30356818437576294, mean loss: 0.3390229172865259
Epoch: 73, step: 1044, loss: 0.3103450834751129, mean loss: 0.3390226479023256
Epoch: 73, step: 1045, loss: 0.32851743698120117, mean loss: 0.3390225492229317
Epoch: 73, step: 1046, loss: 0.3101804852485657, mean loss: 0.339022278301131
Epoch: 73, step: 1047, loss: 0.33000311255455017, mean loss: 0.33902219358230945
Epoch: 73, step: 1048, loss: 0.35070425271987915, mean loss: 0.3390223033131887
Epoch: 73, step: 1049, loss: 0.3145354986190796, mean loss: 0.3390220733080724
Epoch: 73, step: 1050, loss: 0.33018505573272705, mean loss: 0.33902199030254393
Epoch: 73, step: 1051, loss: 0.3040907084941864, mean loss: 0.33902166219837904
Epoch: 73, step: 1052, loss: 0.37747013568878174, mean loss: 0.33902202333559306
Epoch: 73, step: 1053, loss: 0.3451502323150635, mean loss: 0.33902208089583746
Epoch: 73, step: 1054, loss: 0.33559975028038025, mean loss: 0.3390220487513174
Epoch: 73, step: 1055, loss: 0.3697061538696289, mean loss: 0.3390223369515759
Epoch: 73, step: 1056, loss: 0.33195170760154724, mean loss: 0.3390222705413593
Epoch: 73, step: 1057, loss: 0.38202908635139465, mean loss: 0.33902267447501017
Epoch: 73, step: 1058, loss: 0.3363254964351654, mean loss: 0.3390226491424967
Epoch: 73, step: 1059, loss: 0.36037755012512207, mean loss: 0.33902284971073043
Epoch: 73, step: 1060, loss: 0.3199167549610138, mean loss: 0.33902267026528654
Epoch: 73, step: 1061, loss: 0.3433338701725006, mean loss: 0.3390227107559219
Epoch: 73, step: 1062, loss: 0.33089905977249146, mean loss: 0.33902263445959896
Epoch: 73, step: 1063, loss: 0.30662527680397034, mean loss: 0.3390223301904899
Epoch: 73, step: 1064, loss: 0.34371769428253174, mean loss: 0.339022374287939
Epoch: 73, step: 1065, loss: 0.3153612017631531, mean loss: 0.3390221520714011
Epoch: 73, step: 1066, loss: 0.3314148485660553, mean loss: 0.3390220806272336
Epoch: 73, step: 1067, loss: 0.35828694701194763, mean loss: 0.33902226155197424
Epoch: 73, step: 1068, loss: 0.32962945103645325, mean loss: 0.3390221733408331
Epoch: 73, step: 1069, loss: 0.32588890194892883, mean loss: 0.339022050002885
Epoch: 73, step: 1070, loss: 0.31556710600852966, mean loss: 0.3390218297335087
Epoch: 73, step: 1071, loss: 0.3342016935348511, mean loss: 0.3390217844672133
Epoch: 73, step: 1072, loss: 0.3052905797958374, mean loss: 0.3390214676976714
Epoch: 73, step: 1073, loss: 0.3766454756259918, mean loss: 0.33902182102118744
Epoch: 73, step: 1074, loss: 0.33678552508354187, mean loss: 0.33902180002054005
Epoch: 73, step: 1075, loss: 0.3354332149028778, mean loss: 0.33902176632110803
Epoch: 73, step: 1076, loss: 0.33063364028930664, mean loss: 0.3390216875512254
Epoch: 73, step: 1077, loss: 0.3499240279197693, mean loss: 0.3390217899302316
Epoch: 73, step: 1078, loss: 0.33696281909942627, mean loss: 0.33902177059553823
Epoch: 73, step: 1079, loss: 0.35095304250717163, mean loss: 0.3390218826346765
Epoch: 73, step: 1080, loss: 0.3143366277217865, mean loss: 0.33902165083300956
Epoch: 73, step: 1081, loss: 0.3501393496990204, mean loss: 0.33902175523042977
Epoch: 73, step: 1082, loss: 0.3130626678466797, mean loss: 0.3390215114716863
Epoch: 73, step: 1083, loss: 0.3036070466041565, mean loss: 0.3390211789290099
Epoch: 73, step: 1084, loss: 0.344868004322052, mean loss: 0.33902123383032534
Epoch: 73, step: 1085, loss: 0.38806530833244324, mean loss: 0.33902169434671536
Epoch: 73, step: 1086, loss: 0.31440678238868713, mean loss: 0.33902146321861126
Epoch: 73, step: 1087, loss: 0.320538192987442, mean loss: 0.3390212896667781
Epoch: 73, step: 1088, loss: 0.3276195228099823, mean loss: 0.3390211826089396
Epoch: 73, step: 1089, loss: 0.39016759395599365, mean loss: 0.3390216628479149
Epoch: 73, step: 1090, loss: 0.31592780351638794, mean loss: 0.3390214460102734
Epoch: 73, step: 1091, loss: 0.3181232810020447, mean loss: 0.33902124979074166
Epoch: 73, step: 1092, loss: 0.32261669635772705, mean loss: 0.33902109576460737
Epoch: 73, step: 1093, loss: 0.33899199962615967, mean loss: 0.33902109549141957
Epoch: 73, step: 1094, loss: 0.31363391876220703, mean loss: 0.33902085712984026
Epoch: 73, step: 1095, loss: 0.30626600980758667, mean loss: 0.33902054959568956
Epoch: 73, step: 1096, loss: 0.33676058053970337, mean loss: 0.33902052837711594
Epoch: 73, step: 1097, loss: 0.3848513960838318, mean loss: 0.3390209586734985
Epoch: 73, step: 1098, loss: 0.33099764585494995, mean loss: 0.33902088334500835
Epoch: 73, step: 1099, loss: 0.3469689190387726, mean loss: 0.3390209579660435
Epoch: 73, step: 1100, loss: 0.34593677520751953, mean loss: 0.33902102289536895
Epoch: 73, step: 1101, loss: 0.3226873278617859, mean loss: 0.3390208695474989
Epoch: 73, step: 1102, loss: 0.3253917694091797, mean loss: 0.3390207415927494
Epoch: 73, step: 1103, loss: 0.3393906354904175, mean loss: 0.33902074506540986
Epoch: 73, step: 1104, loss: 0.35263797640800476, mean loss: 0.3390208729063305
Epoch: 73, step: 1105, loss: 0.33573535084724426, mean loss: 0.3390208420615713
Epoch: 73, step: 1106, loss: 0.3221305310726166, mean loss: 0.3390206834953907
Epoch: 73, step: 1107, loss: 0.3755953311920166, mean loss: 0.3390210268548321
Epoch: 73, step: 1108, loss: 0.3318414092063904, mean loss: 0.33902095945387223
Epoch: 73, step: 1109, loss: 0.3571135103702545, mean loss: 0.33902112930189343
Epoch: 73, step: 1110, loss: 0.3428983986377716, mean loss: 0.3390211657003176
Epoch: 73, step: 1111, loss: 0.34038347005844116, mean loss: 0.33902117848902585
Epoch: 73, step: 1112, loss: 0.34217745065689087, mean loss: 0.33902120811842895
Epoch: 73, step: 1113, loss: 0.44376128911972046, mean loss: 0.33902219135332934
Epoch: 73, step: 1114, loss: 0.35849300026893616, mean loss: 0.33902237413148806
Epoch: 73, step: 1115, loss: 0.3125510811805725, mean loss: 0.33902212564007783
Epoch: 73, step: 1116, loss: 0.2994838356971741, mean loss: 0.33902175448959354
Epoch: 73, step: 1117, loss: 0.32376864552497864, mean loss: 0.3390216113082459
Epoch: 73, step: 1118, loss: 0.3262858986854553, mean loss: 0.3390214917588882
Epoch: 73, step: 1119, loss: 0.29983651638031006, mean loss: 0.3390211239353668
Epoch: 73, step: 1120, loss: 0.3319101929664612, mean loss: 0.33902105718674463
Epoch: 73, step: 1121, loss: 0.34321412444114685, mean loss: 0.33902109654570284
Epoch: 73, step: 1122, loss: 0.30785173177719116, mean loss: 0.33902080397176215
Epoch: 73, step: 1123, loss: 0.3394434452056885, mean loss: 0.33902080793888345
Epoch: 73, step: 1124, loss: 0.3325556218624115, mean loss: 0.3390207472539939
Epoch: 73, step: 1125, loss: 0.34496983885765076, mean loss: 0.3390208030940848
Epoch: 73, step: 1126, loss: 0.3671415448188782, mean loss: 0.33902106704195106
Epoch: 73, step: 1127, loss: 0.31646472215652466, mean loss: 0.33902085532480364
Epoch: 73, step: 1128, loss: 0.28837889432907104, mean loss: 0.33902037999642304
Epoch: 73, step: 1129, loss: 0.33032092452049255, mean loss: 0.3390202983435962
Epoch: 73, step: 1130, loss: 0.30220600962638855, mean loss: 0.33901995280903535
Epoch: 73, step: 1131, loss: 0.30760928988456726, mean loss: 0.3390196579950343
Epoch: 73, step: 1132, loss: 0.3114510774612427, mean loss: 0.3390193992444544
Epoch: 73, step: 1133, loss: 0.3125086724758148, mean loss: 0.3390191504249138
Epoch: 73, step: 1134, loss: 0.2994237244129181, mean loss: 0.3390187788008792
Epoch: 73, step: 1135, loss: 0.32806459069252014, mean loss: 0.3390186759909897
Epoch: 73, step: 1136, loss: 0.3379133641719818, mean loss: 0.3390186656172479
Epoch: 73, step: 1137, loss: 0.3361800014972687, mean loss: 0.3390186389756325
Epoch: 73, step: 1138, loss: 0.3652777075767517, mean loss: 0.33901888542164055
Epoch: 73, step: 1139, loss: 0.31742793321609497, mean loss: 0.3390186827886331
Epoch: 73, step: 1140, loss: 0.3432955741882324, mean loss: 0.3390187229272627
Epoch: 73, step: 1141, loss: 0.2971344590187073, mean loss: 0.3390183298470976
Epoch: 73, step: 1142, loss: 0.35036319494247437, mean loss: 0.3390184363166682
Epoch: 73, step: 1143, loss: 0.3383268713951111, mean loss: 0.33901842982651353
Epoch: 73, step: 1144, loss: 0.3635505437850952, mean loss: 0.3390186600517823
Epoch: 73, step: 1145, loss: 0.3661479651927948, mean loss: 0.33901891464838824
Epoch: 73, step: 1146, loss: 0.3164975643157959, mean loss: 0.3390187032973965
Epoch: 73, step: 1147, loss: 0.3302876055240631, mean loss: 0.33901862136141886
Epoch: 73, step: 1148, loss: 0.34442850947380066, mean loss: 0.33901867212941195
Epoch: 73, step: 1149, loss: 0.30934497714042664, mean loss: 0.3390183936652785
Epoch: 73, step: 1150, loss: 0.35618311166763306, mean loss: 0.33901855474105524
Epoch: 73, step: 1151, loss: 0.3329150974750519, mean loss: 0.33901849746601614
Epoch: 73, step: 1152, loss: 0.3397309184074402, mean loss: 0.3390185041513344
Epoch: 73, step: 1153, loss: 0.3473566472530365, mean loss: 0.33901858239526866
Epoch: 73, step: 1154, loss: 0.3413068950176239, mean loss: 0.3390186038682633
Epoch: 73, step: 1155, loss: 0.3238993287086487, mean loss: 0.33901846199382485
Epoch: 73, step: 1156, loss: 0.32167983055114746, mean loss: 0.3390182992951841
Epoch: 73, step: 1157, loss: 0.34871384501457214, mean loss: 0.3390183902733742
Epoch: 73, step: 1158, loss: 0.3335452377796173, mean loss: 0.3390183389165089
Epoch: 73, step: 1159, loss: 0.4368751049041748, mean loss: 0.33901925713861214
Epoch: 73, step: 1160, loss: 0.3722059428691864, mean loss: 0.3390195685372378
Epoch: 73, step: 1161, loss: 0.35651734471321106, mean loss: 0.3390197327215245
Epoch: 73, step: 1162, loss: 0.2922397553920746, mean loss: 0.33901929378202345
Epoch: 73, step: 1163, loss: 0.30186817049980164, mean loss: 0.3390189451939428
Epoch: 73, step: 1164, loss: 0.3342706263065338, mean loss: 0.33901890064100093
Epoch: 73, step: 1165, loss: 0.3711285889148712, mean loss: 0.3390192019197665
Epoch: 73, step: 1166, loss: 0.29970160126686096, mean loss: 0.339018833014066
Epoch: 73, step: 1167, loss: 0.3124959170818329, mean loss: 0.33901858415953484
Epoch: 73, step: 1168, loss: 0.3042331039905548, mean loss: 0.33901825778353756
Epoch: 73, step: 1169, loss: 0.33879560232162476, mean loss: 0.3390182556944844
Epoch: 73, step: 1170, loss: 0.3668151795864105, mean loss: 0.3390185164952115
Epoch: 73, step: 1171, loss: 0.32459425926208496, mean loss: 0.3390183811629174
Epoch: 73, step: 1172, loss: 0.34693506360054016, mean loss: 0.33901845543868264
Epoch: 73, step: 1173, loss: 0.32845762372016907, mean loss: 0.33901835635595395
Epoch: 73, step: 1174, loss: 0.348022997379303, mean loss: 0.3390184408375608
Epoch: 73, step: 1175, loss: 0.3581889271736145, mean loss: 0.33901862069351396
Epoch: 73, step: 1176, loss: 0.3263574242591858, mean loss: 0.3390185019083069
Epoch: 73, step: 1177, loss: 0.29990246891975403, mean loss: 0.3390181349317332
Epoch: 73, step: 1178, loss: 0.34432780742645264, mean loss: 0.3390181847452493
Epoch: 73, step: 1179, loss: 0.35911059379577637, mean loss: 0.33901837324353296
Epoch: 73, step: 1180, loss: 0.34125128388404846, mean loss: 0.33901839419153745
Epoch: 73, step: 1181, loss: 0.35350528359413147, mean loss: 0.33901853009871236
Epoch: 73, step: 1182, loss: 0.30098164081573486, mean loss: 0.33901817326312644
Epoch: 73, step: 1183, loss: 0.3376760482788086, mean loss: 0.33901816067236334
Epoch: 73, step: 1184, loss: 0.3441029191017151, mean loss: 0.3390182083731282
Epoch: 73, step: 1185, loss: 0.39905399084091187, mean loss: 0.33901877157114757
Epoch: 73, step: 1186, loss: 0.33157065510749817, mean loss: 0.3390187017007317
Epoch: 73, step: 1187, loss: 0.36507266759872437, mean loss: 0.3390189461094174
Epoch: 73, step: 1188, loss: 0.3392961919307709, mean loss: 0.3390189487101981
Epoch: 73, step: 1189, loss: 0.3634762465953827, mean loss: 0.33901917813645543
Epoch: 73, step: 1190, loss: 0.34759965538978577, mean loss: 0.33901925862647214
Epoch: 73, step: 1191, loss: 0.32827579975128174, mean loss: 0.33901915784733744
Epoch: 73, step: 1192, loss: 0.299568235874176, mean loss: 0.33901878778099936
Epoch: 73, step: 1193, loss: 0.3437069356441498, mean loss: 0.33901883175739717
Epoch: 73, step: 1194, loss: 0.3236532509326935, mean loss: 0.3390186876244526
Epoch: 73, step: 1195, loss: 0.325729638338089, mean loss: 0.33901856297105615
Epoch: 73, step: 1196, loss: 0.32880765199661255, mean loss: 0.3390184671919852
Epoch: 73, step: 1197, loss: 0.3194843828678131, mean loss: 0.33901828396260403
Epoch: 73, step: 1198, loss: 0.29981687664985657, mean loss: 0.3390179162575144
Epoch: 73, step: 1199, loss: 0.34467533230781555, mean loss: 0.3390179693229859
Epoch: 73, step: 1200, loss: 0.36575770378112793, mean loss: 0.3390182201341858
Epoch: 73, step: 1201, loss: 0.29474642872810364, mean loss: 0.33901780488111016
Epoch: 73, step: 1202, loss: 0.37282487750053406, mean loss: 0.33901812197600883
Epoch: 73, step: 1203, loss: 0.31465429067611694, mean loss: 0.33901789345654365
Epoch: 73, step: 1204, loss: 0.32677096128463745, mean loss: 0.3390177785880689
Epoch: 73, step: 1205, loss: 0.3340810239315033, mean loss: 0.3390177322848682
Epoch: 73, step: 1206, loss: 0.3191355764865875, mean loss: 0.339017545806325
Epoch: 73, step: 1207, loss: 0.34302598237991333, mean loss: 0.3390175834018659
Epoch: 73, step: 1208, loss: 0.33700522780418396, mean loss: 0.3390175645279518
Epoch: 73, step: 1209, loss: 0.3498077988624573, mean loss: 0.3390176657287765
Epoch: 73, step: 1210, loss: 0.3264627456665039, mean loss: 0.3390175479781968
Epoch: 73, step: 1211, loss: 0.3461461365222931, mean loss: 0.3390176148354573
Epoch: 73, step: 1212, loss: 0.3140231966972351, mean loss: 0.33901738042121915
Epoch: 73, step: 1213, loss: 0.34456050395965576, mean loss: 0.33901743240782223
Epoch: 73, step: 1214, loss: 0.36003807187080383, mean loss: 0.33901762954962933
Epoch: 73, step: 1215, loss: 0.32592010498046875, mean loss: 0.3390175067158092
Epoch: 73, step: 1216, loss: 0.3071518838405609, mean loss: 0.33901720787006484
Epoch: 73, step: 1217, loss: 0.37426263093948364, mean loss: 0.3390175384095291
Epoch: 73, step: 1218, loss: 0.3114869296550751, mean loss: 0.3390172802237411
Epoch: 73, step: 1219, loss: 0.34961998462677, mean loss: 0.3390173796564105
Epoch: 73, step: 1220, loss: 0.325657457113266, mean loss: 0.3390172543675924
Epoch: 73, step: 1221, loss: 0.3419831693172455, mean loss: 0.3390172821815631
Epoch: 73, step: 1222, loss: 0.30215004086494446, mean loss: 0.33901693644853625
Epoch: 73, step: 1223, loss: 0.2882883548736572, mean loss: 0.3390164607313153
Epoch: 73, step: 1224, loss: 0.3439048230648041, mean loss: 0.33901650657246174
Epoch: 73, step: 1225, loss: 0.3355565071105957, mean loss: 0.33901647412624686
Epoch: 73, step: 1226, loss: 0.3503429889678955, mean loss: 0.33901658033987264
Epoch: 73, step: 1227, loss: 0.3554288148880005, mean loss: 0.33901673424304735
Epoch: 73, step: 1228, loss: 0.30300605297088623, mean loss: 0.33901639656165583
Epoch: 73, step: 1229, loss: 0.32710719108581543, mean loss: 0.33901628488702973
Epoch: 73, step: 1230, loss: 0.30878907442092896, mean loss: 0.3390160014440427
Epoch: 73, step: 1231, loss: 0.3156871199607849, mean loss: 0.3390157826892934
Epoch: 73, step: 1232, loss: 0.36224550008773804, mean loss: 0.33901600051213926
Epoch: 73, step: 1233, loss: 0.31724032759666443, mean loss: 0.33901579632564455
Epoch: 73, step: 1234, loss: 0.30891549587249756, mean loss: 0.33901551408328934
Epoch: 73, step: 1235, loss: 0.32461413741111755, mean loss: 0.33901537904675166
Epoch: 73, step: 1236, loss: 0.33976367115974426, mean loss: 0.3390153860631523
Epoch: 73, step: 1237, loss: 0.33276432752609253, mean loss: 0.33901532745032026
Epoch: 73, step: 1238, loss: 0.3335719406604767, mean loss: 0.3390152764110727
Epoch: 73, step: 1239, loss: 0.35047459602355957, mean loss: 0.3390153838569679
Epoch: 73, step: 1240, loss: 0.3490733504295349, mean loss: 0.3390154781624874
Epoch: 73, step: 1241, loss: 0.327480286359787, mean loss: 0.3390153700072208
Epoch: 73, step: 1242, loss: 0.3219294250011444, mean loss: 0.3390152098089647
Epoch: 73, step: 1243, loss: 0.3795431852340698, mean loss: 0.3390155897967331
Epoch: 73, step: 1244, loss: 0.3173626661300659, mean loss: 0.3390153867821755
Epoch: 73, step: 1245, loss: 0.36465269327163696, mean loss: 0.33901562715145384
Epoch: 73, step: 1246, loss: 0.31870153546333313, mean loss: 0.3390154366931551
Epoch: 73, step: 1247, loss: 0.33898845314979553, mean loss: 0.33901543644016857
Epoch: 73, step: 1248, loss: 0.28455764055252075, mean loss: 0.33901492587120813
Epoch: 73, step: 1249, loss: 0.3136250674724579, mean loss: 0.33901468783087135
Epoch: 73, step: 1250, loss: 0.3355967104434967, mean loss: 0.3390146557862318
Epoch: 73, step: 1251, loss: 0.33498454093933105, mean loss: 0.3390146180029605
Epoch: 73, step: 1252, loss: 0.33713778853416443, mean loss: 0.33901460040740933
Epoch: 73, step: 1253, loss: 0.32177916169166565, mean loss: 0.3390144388241615
Epoch: 73, step: 1254, loss: 0.3348195254802704, mean loss: 0.33901439949697176
Epoch: 73, step: 1255, loss: 0.32416942715644836, mean loss: 0.3390142603270957
Epoch: 73, step: 1256, loss: 0.3418886661529541, mean loss: 0.33901428727406085
Epoch: 73, step: 1257, loss: 0.332376629114151, mean loss: 0.3390142250479602
Epoch: 73, step: 1258, loss: 0.3119601309299469, mean loss: 0.3390139714261312
Epoch: 73, step: 1259, loss: 0.31313639879226685, mean loss: 0.33901372883601727
Epoch: 73, step: 1260, loss: 0.33422091603279114, mean loss: 0.33901368390606496
Epoch: 73, step: 1261, loss: 0.29692184925079346, mean loss: 0.3390132893222427
Epoch: 73, step: 1262, loss: 0.34384188055992126, mean loss: 0.33901333458674926
Epoch: 73, step: 1263, loss: 0.3362587094306946, mean loss: 0.3390133087643979
Epoch: 73, step: 1264, loss: 0.3005741834640503, mean loss: 0.33901294843250535
Epoch: 73, step: 1265, loss: 0.3440842628479004, mean loss: 0.339012995971027
Epoch: 73, step: 1266, loss: 0.3254661560058594, mean loss: 0.3390128689840852
Epoch: 73, step: 1267, loss: 0.3089500963687897, mean loss: 0.33901258718081734
Epoch: 73, step: 1268, loss: 0.31714457273483276, mean loss: 0.33901238219572677
Epoch: 73, step: 1269, loss: 0.33540579676628113, mean loss: 0.3390123483888481
Epoch: 73, step: 1270, loss: 0.31767117977142334, mean loss: 0.33901214834602383
Epoch: 73, step: 1271, loss: 0.34695664048194885, mean loss: 0.33901222281353666
Epoch: 73, step: 1272, loss: 0.32547712326049805, mean loss: 0.33901209594378406
Epoch: 73, step: 1273, loss: 0.3282919228076935, mean loss: 0.3390119954603735
Epoch: 73, step: 1274, loss: 0.3533896207809448, mean loss: 0.33901213022492144
Epoch: 73, step: 1275, loss: 0.3156309127807617, mean loss: 0.3390119110698389
Epoch: 73, step: 1276, loss: 0.355823278427124, mean loss: 0.33901206864341593
Epoch: 73, step: 1277, loss: 0.31297022104263306, mean loss: 0.33901182455448914
Epoch: 73, step: 1278, loss: 0.3447839021682739, mean loss: 0.339011878655375
Epoch: 73, step: 1279, loss: 0.33684539794921875, mean loss: 0.3390118583494411
Epoch: 73, step: 1280, loss: 0.31105703115463257, mean loss: 0.3390115963376203
Epoch: 73, step: 1281, loss: 0.31517094373703003, mean loss: 0.33901137288876093
Epoch: 73, step: 1282, loss: 0.3214268684387207, mean loss: 0.3390112080778096
Epoch: 73, step: 1283, loss: 0.33029529452323914, mean loss: 0.33901112638858455
Epoch: 73, step: 1284, loss: 0.30761009454727173, mean loss: 0.33901083208760285
Epoch: 73, step: 1285, loss: 0.303808331489563, mean loss: 0.33901050216107564
Epoch: 73, step: 1286, loss: 0.3074496388435364, mean loss: 0.33901020636764445
Epoch: 73, step: 1287, loss: 0.3507695198059082, mean loss: 0.33901031657676756
Epoch: 73, step: 1288, loss: 0.31054022908210754, mean loss: 0.33901004975558036
Epoch: 73, step: 1289, loss: 0.37095460295677185, mean loss: 0.33901034913659667
Epoch: 73, step: 1290, loss: 0.344746470451355, mean loss: 0.33901040289442275
Epoch: 73, step: 1291, loss: 0.3441784381866455, mean loss: 0.33901045132780194
Epoch: 73, step: 1292, loss: 0.30208030343055725, mean loss: 0.33901010523204356
Epoch: 73, step: 1293, loss: 0.31628280878067017, mean loss: 0.3390098922421793
Epoch: 73, step: 1294, loss: 0.3615838587284088, mean loss: 0.3390101037931224
Epoch: 73, step: 1295, loss: 0.36318740248680115, mean loss: 0.3390103303675001
Epoch: 73, step: 1296, loss: 0.3829483091831207, mean loss: 0.3390107421226362
Epoch: 73, step: 1297, loss: 0.30604052543640137, mean loss: 0.33901043315237395
Epoch: 73, step: 1298, loss: 0.3625815510749817, mean loss: 0.33901065403979813
Epoch: 73, step: 1299, loss: 0.2905694246292114, mean loss: 0.3390102000961984
Epoch: 73, step: 1300, loss: 0.3755028545856476, mean loss: 0.339010542066291
Epoch: 73, step: 1301, loss: 0.35071951150894165, mean loss: 0.33901065178919
Epoch: 73, step: 1302, loss: 0.32883450388908386, mean loss: 0.3390105564310126
Epoch: 73, step: 1303, loss: 0.2870488166809082, mean loss: 0.33901006951490115
Epoch: 73, step: 1304, loss: 0.3248036205768585, mean loss: 0.3390099363922596
Epoch: 73, step: 1305, loss: 0.32058185338974, mean loss: 0.3390097637120838
Epoch: 73, step: 1306, loss: 0.324424684047699, mean loss: 0.3390096270440147
Epoch: 73, step: 1307, loss: 0.3281654715538025, mean loss: 0.33900952543086355
Epoch: 73, step: 1308, loss: 0.31446322798728943, mean loss: 0.3390092954264835
Epoch: 73, step: 1309, loss: 0.33556848764419556, mean loss: 0.3390092631856355
Epoch: 73, step: 1310, loss: 0.38236770033836365, mean loss: 0.3390096694564221
Epoch: 73, step: 1311, loss: 0.31266316771507263, mean loss: 0.3390094225906586
Epoch: 73, step: 1312, loss: 0.34058547019958496, mean loss: 0.339009437358029
Epoch: 73, step: 1313, loss: 0.3800964057445526, mean loss: 0.3390098223342146
Epoch: 73, step: 1314, loss: 0.33798351883888245, mean loss: 0.33900981271805847
Epoch: 73, step: 1315, loss: 0.3305754065513611, mean loss: 0.33900973369094123
Epoch: 73, step: 1316, loss: 0.3055093288421631, mean loss: 0.3390094198080711
Epoch: 73, step: 1317, loss: 0.3703845739364624, mean loss: 0.3390097137755978
Epoch: 73, step: 1318, loss: 0.3084094822406769, mean loss: 0.3390094270713457
Epoch: 73, step: 1319, loss: 0.3289499878883362, mean loss: 0.33900933282183116
Epoch: 73, step: 1320, loss: 0.30614370107650757, mean loss: 0.33900902489802365
Epoch: 73, step: 1321, loss: 0.3280744254589081, mean loss: 0.3390089224508237
Epoch: 73, step: 1322, loss: 0.3525073528289795, mean loss: 0.3390090489175907
Epoch: 73, step: 1323, loss: 0.3424232006072998, mean loss: 0.33900908090447135
Epoch: 73, step: 1324, loss: 0.3261955678462982, mean loss: 0.33900896085694276
Epoch: 73, step: 1325, loss: 0.35175466537475586, mean loss: 0.3390090802680664
Epoch: 73, step: 1326, loss: 0.3427262306213379, mean loss: 0.3390091150927355
Epoch: 73, step: 1327, loss: 0.376835435628891, mean loss: 0.3390094694708556
Epoch: 73, step: 1328, loss: 0.3036135137081146, mean loss: 0.33900913786485826
Epoch: 73, step: 1329, loss: 0.3213973045349121, mean loss: 0.33900897287044807
Epoch: 73, step: 1330, loss: 0.3161994516849518, mean loss: 0.3390087591841062
Epoch: 73, step: 1331, loss: 0.3133430480957031, mean loss: 0.339008518742385
Epoch: 73, step: 1332, loss: 0.3572826087474823, mean loss: 0.3390086899362583
Epoch: 73, step: 1333, loss: 0.3768194615840912, mean loss: 0.33900904414879696
Epoch: 73, step: 1334, loss: 0.28802838921546936, mean loss: 0.33900856656483735
Epoch: 73, step: 1335, loss: 0.33767059445381165, mean loss: 0.33900855403090596
Epoch: 73, step: 1336, loss: 0.30731743574142456, mean loss: 0.33900825715582245
Epoch: 73, step: 1337, loss: 0.3289089798927307, mean loss: 0.3390081625490097
Epoch: 73, step: 1338, loss: 0.3285144865512848, mean loss: 0.33900806424851604
Epoch: 73, step: 1339, loss: 0.29485657811164856, mean loss: 0.33900765065920496
Epoch: 73, step: 1340, loss: 0.31441670656204224, mean loss: 0.33900742030554654
Epoch: 73, step: 1341, loss: 0.38245683908462524, mean loss: 0.3390078273106122
Epoch: 73, step: 1342, loss: 0.36255568265914917, mean loss: 0.3390080478890895
Epoch: 73, step: 1343, loss: 0.327960729598999, mean loss: 0.33900794440714666
Epoch: 73, step: 1344, loss: 0.35103288292884827, mean loss: 0.33900805704555464
Epoch: 73, step: 1345, loss: 0.3335896134376526, mean loss: 0.33900800629110434
Epoch: 73, step: 1346, loss: 0.2964673340320587, mean loss: 0.3390076078172308
Epoch: 73, step: 1347, loss: 0.32223111391067505, mean loss: 0.3390074506750998
Epoch: 73, step: 1348, loss: 0.343665212392807, mean loss: 0.33900749430303245
Epoch: 73, step: 1349, loss: 0.3530268371105194, mean loss: 0.3390076256170094
Epoch: 73, step: 1350, loss: 0.3180460035800934, mean loss: 0.3390074292791205
Epoch: 73, step: 1351, loss: 0.3369918763637543, mean loss: 0.3390074104005386
Epoch: 73, step: 1352, loss: 0.3159681260585785, mean loss: 0.33900719460618334
Epoch: 73, step: 1353, loss: 0.34620288014411926, mean loss: 0.339007262002972
Epoch: 73, step: 1354, loss: 0.32066255807876587, mean loss: 0.33900709018299086
Epoch: 73, step: 1355, loss: 0.36812373995780945, mean loss: 0.33900736289250843
Epoch: 73, step: 1356, loss: 0.30477437376976013, mean loss: 0.3390070422658366
Epoch: 73, step: 1357, loss: 0.3293885588645935, mean loss: 0.33900695217982557
Epoch: 73, step: 1358, loss: 0.3605217933654785, mean loss: 0.33900715368436507
Epoch: 73, step: 1359, loss: 0.34459128975868225, mean loss: 0.33900720598399486
Epoch: 73, step: 1360, loss: 0.3498959243297577, mean loss: 0.33900730796406797
Epoch: 73, step: 1361, loss: 0.32243672013282776, mean loss: 0.3390071527709701
Epoch: 73, step: 1362, loss: 0.3135228753089905, mean loss: 0.33900691409827083
Epoch: 73, step: 1363, loss: 0.3252542018890381, mean loss: 0.3390067852986135
Epoch: 73, step: 1364, loss: 0.37615451216697693, mean loss: 0.33900713319869374
Epoch: 73, step: 1365, loss: 0.3134218156337738, mean loss: 0.3390068935864369
Epoch: 73, step: 1366, loss: 0.33576858043670654, mean loss: 0.3390068632591895
Epoch: 73, step: 1367, loss: 0.3054969310760498, mean loss: 0.33900654943701136
Epoch: 73, step: 1368, loss: 0.2987612187862396, mean loss: 0.3390061725410219
Epoch: 73, step: 1369, loss: 0.33632904291152954, mean loss: 0.3390061474700396
Epoch: 73, step: 1370, loss: 0.3313457667827606, mean loss: 0.3390060757322097
Epoch: 73, step: 1371, loss: 0.299617737531662, mean loss: 0.339005706872285
Epoch: 73, step: 1372, loss: 0.3832046389579773, mean loss: 0.33900612077809655
Epoch: 73, step: 1373, loss: 0.3220585584640503, mean loss: 0.33900596207225203
Epoch: 73, step: 1374, loss: 0.3322248160839081, mean loss: 0.3390058985706461
Epoch: 73, step: 1375, loss: 0.31733018159866333, mean loss: 0.3390056955916881
Epoch: 73, step: 1376, loss: 0.3275785744190216, mean loss: 0.33900558858515023
Epoch: 73, step: 1377, loss: 0.3446969985961914, mean loss: 0.33900564188049637
Epoch: 73, step: 1378, loss: 0.3341000974178314, mean loss: 0.3390055959445611
Epoch: 73, step: 1379, loss: 0.3307282328605652, mean loss: 0.3390055184353555
Epoch: 73, step: 1380, loss: 0.3648067116737366, mean loss: 0.33900576003539706
Epoch: 73, step: 1381, loss: 0.345058798789978, mean loss: 0.33900581671497415
Epoch: 73, step: 1382, loss: 0.33844655752182007, mean loss: 0.3390058114782197
Epoch: 73, step: 1383, loss: 0.36122509837150574, mean loss: 0.3390060195317694
Epoch: 73, step: 1384, loss: 0.33480843901634216, mean loss: 0.339005980227477
Epoch: 73, step: 1385, loss: 0.3370257318019867, mean loss: 0.33900596168547786
Epoch: 73, step: 1386, loss: 0.30686429142951965, mean loss: 0.33900566073069127
Epoch: 73, step: 1387, loss: 0.3565855622291565, mean loss: 0.3390058253365105
Epoch: 73, step: 1388, loss: 0.30894529819488525, mean loss: 0.339005543873536
Epoch: 73, step: 1389, loss: 0.3293326795101166, mean loss: 0.339005453305341
Epoch: 73, step: 1390, loss: 0.3452606499195099, mean loss: 0.3390055118729525
Epoch: 73, step: 1391, loss: 0.3700290322303772, mean loss: 0.3390058023444738
Epoch: 73, step: 1392, loss: 0.29754358530044556, mean loss: 0.33900541413964214
Epoch: 73, step: 1393, loss: 0.3345196545124054, mean loss: 0.339005372140507
Epoch: 73, step: 1394, loss: 0.30923551321029663, mean loss: 0.3390050934147781
Epoch: 73, step: 1395, loss: 0.33192235231399536, mean loss: 0.33900502710194474
Epoch: 73, step: 1396, loss: 0.3324279487133026, mean loss: 0.33900496552400294
Epoch: 73, step: 1397, loss: 0.32391589879989624, mean loss: 0.3390048242538342
Epoch: 73, step: 1398, loss: 0.36687809228897095, mean loss: 0.3390050852126122
Epoch: 73, step: 1399, loss: 0.32718852162361145, mean loss: 0.3390049745830613
Epoch: 73, step: 1400, loss: 0.33698272705078125, mean loss: 0.33900495565046385
Epoch: 73, step: 1401, loss: 0.4139314591884613, mean loss: 0.3390056571175331
Epoch: 73, step: 1402, loss: 0.38260623812675476, mean loss: 0.3390060653053439
Epoch: 73, step: 1403, loss: 0.34930720925331116, mean loss: 0.3390061617435549
Epoch: 73, step: 1404, loss: 0.3241022527217865, mean loss: 0.3390060222160544
Epoch: 73, step: 1405, loss: 0.32431039214134216, mean loss: 0.33900588463970893
Epoch: 73, step: 1406, loss: 0.3585653603076935, mean loss: 0.3390060677482914
Epoch: 73, step: 1407, loss: 0.3249160349369049, mean loss: 0.3390059358438464
Epoch: 73, step: 1408, loss: 0.3219284117221832, mean loss: 0.3390057759733704
Epoch: 73, step: 1409, loss: 0.3161320984363556, mean loss: 0.3390055618444687
Epoch: 73, step: 1410, loss: 0.3705812692642212, mean loss: 0.33900585743350303
Epoch: 73, step: 1411, loss: 0.31691795587539673, mean loss: 0.33900565066441035
Epoch: 73, step: 1412, loss: 0.35809800028800964, mean loss: 0.33900582938989243
Epoch: 73, step: 1413, loss: 0.3185911476612091, mean loss: 0.33900563828771013
Epoch: 73, step: 1414, loss: 0.33273154497146606, mean loss: 0.33900557955636584
Epoch: 73, step: 1415, loss: 0.3337100148200989, mean loss: 0.3390055299854225
Epoch: 73, step: 1416, loss: 0.3361622989177704, mean loss: 0.3390055033706356
Epoch: 73, step: 1417, loss: 0.35780584812164307, mean loss: 0.3390056793543925
Epoch: 73, step: 1418, loss: 0.3757738471031189, mean loss: 0.33900602352572623
Epoch: 73, step: 1419, loss: 0.30623480677604675, mean loss: 0.33900571677103897
Epoch: 73, step: 1420, loss: 0.3067190945148468, mean loss: 0.3390054145552231
Epoch: 73, step: 1421, loss: 0.3355551064014435, mean loss: 0.3390053822592485
Epoch: 73, step: 1422, loss: 0.3396158814430237, mean loss: 0.33900538797366025
Epoch: 73, step: 1423, loss: 0.3152480721473694, mean loss: 0.33900516560183963
Epoch: 73, step: 1424, loss: 0.31041640043258667, mean loss: 0.3390048980094777
Epoch: 73, step: 1425, loss: 0.3556579351425171, mean loss: 0.3390050538813317
Epoch: 73, step: 1426, loss: 0.33338046073913574, mean loss: 0.3390050012358264
Epoch: 73, step: 1427, loss: 0.29806989431381226, mean loss: 0.33900461809180804
Epoch: 73, step: 1428, loss: 0.3565675616264343, mean loss: 0.3390047824757387
Epoch: 73, step: 1429, loss: 0.3261271119117737, mean loss: 0.3390046619456984
Epoch: 73, step: 1430, loss: 0.3006119132041931, mean loss: 0.33900430260770953
Epoch: 73, step: 1431, loss: 0.32396912574768066, mean loss: 0.3390041618868749
Epoch: 73, step: 1432, loss: 0.3431677520275116, mean loss: 0.33900420085538197
Epoch: 73, step: 1433, loss: 0.33528217673301697, mean loss: 0.33900416601997285
Epoch: 73, step: 1434, loss: 0.3434124290943146, mean loss: 0.3390042072776879
Epoch: 73, step: 1435, loss: 0.32193008065223694, mean loss: 0.3390040474794078
Epoch: 73, step: 1436, loss: 0.34250199794769287, mean loss: 0.3390040802167331
Epoch: 73, step: 1437, loss: 0.3302513360977173, mean loss: 0.33900399830055045
Epoch: 73, step: 1438, loss: 0.3403051793575287, mean loss: 0.33900401047807854
Epoch: 73, step: 1439, loss: 0.311004638671875, mean loss: 0.3390037484392603
Epoch: 73, step: 1440, loss: 0.3037698566913605, mean loss: 0.3390034186975427
Epoch: 73, step: 1441, loss: 0.34963738918304443, mean loss: 0.3390035182162363
Epoch: 73, step: 1442, loss: 0.327804833650589, mean loss: 0.3390034134136106
Epoch: 73, step: 1443, loss: 0.2967664897441864, mean loss: 0.3390030181440547
Valid: 73, mean loss: 0.18487513562043506
Epoch: 74, step: 0, loss: 0.3442559242248535, mean loss: 0.33900306730233243
Epoch: 74, step: 1, loss: 0.31527724862098694, mean loss: 0.3390028452710509
Epoch: 74, step: 2, loss: 0.39480060338974, mean loss: 0.33900336743350906
Epoch: 74, step: 3, loss: 0.3105587959289551, mean loss: 0.3390031012481122
Epoch: 74, step: 4, loss: 0.38518378138542175, mean loss: 0.33900353340465333
Epoch: 74, step: 5, loss: 0.35390809178352356, mean loss: 0.33900367287947486
Epoch: 74, step: 6, loss: 0.31000322103500366, mean loss: 0.3390034014997471
Epoch: 74, step: 7, loss: 0.3666374087333679, mean loss: 0.33900366009017263
Epoch: 74, step: 8, loss: 0.3265743553638458, mean loss: 0.3390035437817019
Epoch: 74, step: 9, loss: 0.3238937556743622, mean loss: 0.33900340239166105
Epoch: 74, step: 10, loss: 0.333587646484375, mean loss: 0.33900335171412815
Epoch: 74, step: 11, loss: 0.3483181893825531, mean loss: 0.33900343887621287
Epoch: 74, step: 12, loss: 0.309793084859848, mean loss: 0.33900316554761417
Epoch: 74, step: 13, loss: 0.3204704225063324, mean loss: 0.3390029921337184
Epoch: 74, step: 14, loss: 0.30460307002067566, mean loss: 0.339002670251055
Epoch: 74, step: 15, loss: 0.32117530703544617, mean loss: 0.33900250344063493
Epoch: 74, step: 16, loss: 0.3227861821651459, mean loss: 0.3390023517061344
Epoch: 74, step: 17, loss: 0.3248694837093353, mean loss: 0.3390022194675357
Epoch: 74, step: 18, loss: 0.30653116106987, mean loss: 0.3390019156447671
Epoch: 74, step: 19, loss: 0.34796738624572754, mean loss: 0.33900199953142646
Epoch: 74, step: 20, loss: 0.35887548327445984, mean loss: 0.33900218547867184
Epoch: 74, step: 21, loss: 0.3500071167945862, mean loss: 0.3390022884458991
Epoch: 74, step: 22, loss: 0.32163625955581665, mean loss: 0.3390021259628211
Epoch: 74, step: 23, loss: 0.32051554322242737, mean loss: 0.33900195299703945
Epoch: 74, step: 24, loss: 0.35447701811790466, mean loss: 0.33900209778484197
Epoch: 74, step: 25, loss: 0.3314034342765808, mean loss: 0.33900202669089247
Epoch: 74, step: 26, loss: 0.31555071473121643, mean loss: 0.3390018072798359
Epoch: 74, step: 27, loss: 0.35769012570381165, mean loss: 0.3390019821265709
Epoch: 74, step: 28, loss: 0.3119926452636719, mean loss: 0.3390017294312735
Epoch: 74, step: 29, loss: 0.344539076089859, mean loss: 0.3390017812373721
Epoch: 74, step: 30, loss: 0.3436935544013977, mean loss: 0.33900182513207555
Epoch: 74, step: 31, loss: 0.2955540716648102, mean loss: 0.33900141865283123
Epoch: 74, step: 32, loss: 0.30983880162239075, mean loss: 0.3390011458219784
Epoch: 74, step: 33, loss: 0.3617843985557556, mean loss: 0.3390013589686968
Epoch: 74, step: 34, loss: 0.33714377880096436, mean loss: 0.33900134159043144
Epoch: 74, step: 35, loss: 0.33160802721977234, mean loss: 0.33900127242422284
Epoch: 74, step: 36, loss: 0.3215339183807373, mean loss: 0.33900110901451364
Epoch: 74, step: 37, loss: 0.33576351404190063, mean loss: 0.33900107872661184
Epoch: 74, step: 38, loss: 0.4150225818157196, mean loss: 0.3390017899058353
Epoch: 74, step: 39, loss: 0.2910345196723938, mean loss: 0.3390013411774429
Epoch: 74, step: 40, loss: 0.3295048177242279, mean loss: 0.33900125233937023
Epoch: 74, step: 41, loss: 0.3647022247314453, mean loss: 0.33900149276456426
Epoch: 74, step: 42, loss: 0.32907137274742126, mean loss: 0.33900139987202066
Epoch: 74, step: 43, loss: 0.344461590051651, mean loss: 0.33900145094957146
Epoch: 74, step: 44, loss: 0.3324722349643707, mean loss: 0.3390013898723506
Epoch: 74, step: 45, loss: 0.3204098343849182, mean loss: 0.3390012159602116
Epoch: 74, step: 46, loss: 0.38693907856941223, mean loss: 0.3390016643841343
Epoch: 74, step: 47, loss: 0.31852278113365173, mean loss: 0.3390014728208322
Epoch: 74, step: 48, loss: 0.310041218996048, mean loss: 0.3390012019237383
Epoch: 74, step: 49, loss: 0.33992183208465576, mean loss: 0.3390012105353238
Epoch: 74, step: 50, loss: 0.31529751420021057, mean loss: 0.3390009888127393
Epoch: 74, step: 51, loss: 0.31524527072906494, mean loss: 0.3390007666056259
Epoch: 74, step: 52, loss: 0.2989233434200287, mean loss: 0.3390003917314508
Epoch: 74, step: 53, loss: 0.31859421730041504, mean loss: 0.3390002008589933
Epoch: 74, step: 54, loss: 0.3165218234062195, mean loss: 0.33899999060581587
Epoch: 74, step: 55, loss: 0.3111083507537842, mean loss: 0.33899972972172565
Epoch: 74, step: 56, loss: 0.3191051781177521, mean loss: 0.33899954364003676
Epoch: 74, step: 57, loss: 0.32981064915657043, mean loss: 0.33899945769343964
Epoch: 74, step: 58, loss: 0.40241214632987976, mean loss: 0.33900005080655415
Epoch: 74, step: 59, loss: 0.3116135001182556, mean loss: 0.33899979465639246
Epoch: 74, step: 60, loss: 0.3336917459964752, mean loss: 0.3389997450099503
Epoch: 74, step: 61, loss: 0.31202593445777893, mean loss: 0.33899949272492297
Epoch: 74, step: 62, loss: 0.3279474675655365, mean loss: 0.33899938935671753
Epoch: 74, step: 63, loss: 0.30841460824012756, mean loss: 0.3389991033037703
Epoch: 74, step: 64, loss: 0.3299274146556854, mean loss: 0.338999018458991
Epoch: 74, step: 65, loss: 0.34448349475860596, mean loss: 0.33899906975317085
Epoch: 74, step: 66, loss: 0.3431990444660187, mean loss: 0.33899910903353814
Epoch: 74, step: 67, loss: 0.35196635127067566, mean loss: 0.3389992303088574
Epoch: 74, step: 68, loss: 0.364884614944458, mean loss: 0.3389994723980287
Epoch: 74, step: 69, loss: 0.3089539706707001, mean loss: 0.3389991914046152
Epoch: 74, step: 70, loss: 0.32079628109931946, mean loss: 0.3389990211678153
Epoch: 74, step: 71, loss: 0.3281750977039337, mean loss: 0.3389989199415372
Epoch: 74, step: 72, loss: 0.3077922463417053, mean loss: 0.33899862809672804
Epoch: 74, step: 73, loss: 0.36732205748558044, mean loss: 0.33899889297496044
Epoch: 74, step: 74, loss: 0.29643312096595764, mean loss: 0.33899849490730927
Epoch: 74, step: 75, loss: 0.35139086842536926, mean loss: 0.3389986107975341
Epoch: 74, step: 76, loss: 0.32443761825561523, mean loss: 0.33899847462822674
Epoch: 74, step: 77, loss: 0.3046777844429016, mean loss: 0.33899815367614244
Epoch: 74, step: 78, loss: 0.3199171721935272, mean loss: 0.33899797524081743
Epoch: 74, step: 79, loss: 0.31680962443351746, mean loss: 0.3389977677489456
Epoch: 74, step: 80, loss: 0.3771311342716217, mean loss: 0.3389981243455073
Epoch: 74, step: 81, loss: 0.3328695297241211, mean loss: 0.3389980670357145
Epoch: 74, step: 82, loss: 0.3425968289375305, mean loss: 0.33899810068818836
Epoch: 74, step: 83, loss: 0.35279515385627747, mean loss: 0.33899822970495636
Epoch: 74, step: 84, loss: 0.321370929479599, mean loss: 0.3389980648729441
Epoch: 74, step: 85, loss: 0.3168572783470154, mean loss: 0.3389978578374807
Epoch: 74, step: 86, loss: 0.3439657688140869, mean loss: 0.33899790429130167
Epoch: 74, step: 87, loss: 0.3538837134838104, mean loss: 0.3389980434838622
Epoch: 74, step: 88, loss: 0.321659117937088, mean loss: 0.33899788135449155
Epoch: 74, step: 89, loss: 0.31332162022590637, mean loss: 0.33899764126826926
Epoch: 74, step: 90, loss: 0.3319563865661621, mean loss: 0.33899757542953884
Epoch: 74, step: 91, loss: 0.3165946900844574, mean loss: 0.33899736595497787
Epoch: 74, step: 92, loss: 0.29520902037620544, mean loss: 0.3389969565229535
Epoch: 74, step: 93, loss: 0.3598651885986328, mean loss: 0.338997151644338
Epoch: 74, step: 94, loss: 0.36160317063331604, mean loss: 0.33899736301233824
Epoch: 74, step: 95, loss: 0.3326404392719269, mean loss: 0.3389973035751726
Epoch: 74, step: 96, loss: 0.3312091529369354, mean loss: 0.3389972307567324
Epoch: 74, step: 97, loss: 0.3550960123538971, mean loss: 0.33899738127734497
Epoch: 74, step: 98, loss: 0.382146954536438, mean loss: 0.3389977847140544
Epoch: 74, step: 99, loss: 0.3918150067329407, mean loss: 0.33899827853601877
Epoch: 74, step: 100, loss: 0.31282109022140503, mean loss: 0.33899803379104354
Epoch: 74, step: 101, loss: 0.39101940393447876, mean loss: 0.33899852016298526
Epoch: 74, step: 102, loss: 0.3059654235839844, mean loss: 0.33899821132411634
Epoch: 74, step: 103, loss: 0.3333079218864441, mean loss: 0.3389981581239533
Epoch: 74, step: 104, loss: 0.3563719093799591, mean loss: 0.33899832055466406
Epoch: 74, step: 105, loss: 0.3627112805843353, mean loss: 0.3389985422498458
Epoch: 74, step: 106, loss: 0.38295692205429077, mean loss: 0.3389989532179358
Epoch: 74, step: 107, loss: 0.35135331749916077, mean loss: 0.33899906871814406
Epoch: 74, step: 108, loss: 0.3075791895389557, mean loss: 0.3389987749783303
Epoch: 74, step: 109, loss: 0.34257733821868896, mean loss: 0.3389988084334772
Epoch: 74, step: 110, loss: 0.3238583505153656, mean loss: 0.33899866689021696
Epoch: 74, step: 111, loss: 0.3287467658519745, mean loss: 0.33899857104939507
Epoch: 74, step: 112, loss: 0.37508654594421387, mean loss: 0.3389989084179308
Epoch: 74, step: 113, loss: 0.32427525520324707, mean loss: 0.3389987707751037
Epoch: 74, step: 114, loss: 0.317684531211853, mean loss: 0.3389985715226001
Epoch: 74, step: 115, loss: 0.30931374430656433, mean loss: 0.3389982940216913
Epoch: 74, step: 116, loss: 0.3663371801376343, mean loss: 0.338998549589789
Epoch: 74, step: 117, loss: 0.38193345069885254, mean loss: 0.3389989509480733
Epoch: 74, step: 118, loss: 0.32121163606643677, mean loss: 0.3389987846726362
Epoch: 74, step: 119, loss: 0.32779988646507263, mean loss: 0.33899867998655514
Epoch: 74, step: 120, loss: 0.3055562376976013, mean loss: 0.33899836737316824
Epoch: 74, step: 121, loss: 0.3808779716491699, mean loss: 0.33899875885183
Epoch: 74, step: 122, loss: 0.2974039316177368, mean loss: 0.3389983700388178
Epoch: 74, step: 123, loss: 0.29197731614112854, mean loss: 0.33899793050756055
Epoch: 74, step: 124, loss: 0.334968626499176, mean loss: 0.3389978928438258
Epoch: 74, step: 125, loss: 0.3395859897136688, mean loss: 0.338997898340983
Epoch: 74, step: 126, loss: 0.3237415552139282, mean loss: 0.33899775573568003
Epoch: 74, step: 127, loss: 0.3642846345901489, mean loss: 0.3389979920969944
Epoch: 74, step: 128, loss: 0.33132031559944153, mean loss: 0.33899792033294807
Epoch: 74, step: 129, loss: 0.31974348425865173, mean loss: 0.3389977403613997
Epoch: 74, step: 130, loss: 0.3322584331035614, mean loss: 0.3389976773695665
Epoch: 74, step: 131, loss: 0.3034832775592804, mean loss: 0.3389973454220601
Epoch: 74, step: 132, loss: 0.31749188899993896, mean loss: 0.3389971444158219
Epoch: 74, step: 133, loss: 0.31788188219070435, mean loss: 0.338996947058478
Epoch: 74, step: 134, loss: 0.3493611812591553, mean loss: 0.33899704392862784
Epoch: 74, step: 135, loss: 0.30234694480895996, mean loss: 0.3389967013787258
Epoch: 74, step: 136, loss: 0.3322111666202545, mean loss: 0.3389966379583641
Epoch: 74, step: 137, loss: 0.33677053451538086, mean loss: 0.33899661715249235
Epoch: 74, step: 138, loss: 0.3539695143699646, mean loss: 0.3389967570926505
Epoch: 74, step: 139, loss: 0.3221215307712555, mean loss: 0.33899659937435894
Epoch: 74, step: 140, loss: 0.3238109052181244, mean loss: 0.3389964574480044
Epoch: 74, step: 141, loss: 0.3593078553676605, mean loss: 0.3389966472777014
Epoch: 74, step: 142, loss: 0.3176267147064209, mean loss: 0.33899644755683883
Epoch: 74, step: 143, loss: 0.3121096193790436, mean loss: 0.3389961962780708
Epoch: 74, step: 144, loss: 0.3883960247039795, mean loss: 0.3389966579543956
Epoch: 74, step: 145, loss: 0.3296702206134796, mean loss: 0.338996570793059
Epoch: 74, step: 146, loss: 0.3617843985557556, mean loss: 0.33899678375744097
Epoch: 74, step: 147, loss: 0.3302461504936218, mean loss: 0.3389967019788788
Epoch: 74, step: 148, loss: 0.3287268579006195, mean loss: 0.33899660600351245
Epoch: 74, step: 149, loss: 0.3142451047897339, mean loss: 0.3389963746940418
Epoch: 74, step: 150, loss: 0.3267872929573059, mean loss: 0.3389962605979384
Epoch: 74, step: 151, loss: 0.3410601317882538, mean loss: 0.3389962798850122
Epoch: 74, step: 152, loss: 0.3376544415950775, mean loss: 0.33899626734552213
Epoch: 74, step: 153, loss: 0.33993881940841675, mean loss: 0.33899627615359673
Epoch: 74, step: 154, loss: 0.3154260516166687, mean loss: 0.33899605589376797
Epoch: 74, step: 155, loss: 0.3104880452156067, mean loss: 0.3389957894936383
Epoch: 74, step: 156, loss: 0.38903799653053284, mean loss: 0.3389962571210017
Epoch: 74, step: 157, loss: 0.3579944372177124, mean loss: 0.3389964346508585
Epoch: 74, step: 158, loss: 0.30237823724746704, mean loss: 0.3389960924726834
Epoch: 74, step: 159, loss: 0.2929798364639282, mean loss: 0.33899566247851426
Epoch: 74, step: 160, loss: 0.30870524048805237, mean loss: 0.33899537943542773
Epoch: 74, step: 161, loss: 0.2938726246356964, mean loss: 0.3389949577983685
Epoch: 74, step: 162, loss: 0.32181766629219055, mean loss: 0.3389947972914351
Epoch: 74, step: 163, loss: 0.32467228174209595, mean loss: 0.33899466346116464
Epoch: 74, step: 164, loss: 0.33524078130722046, mean loss: 0.33899462838503797
Epoch: 74, step: 165, loss: 0.2998766601085663, mean loss: 0.3389942628717017
Epoch: 74, step: 166, loss: 0.329155832529068, mean loss: 0.33899417094351486
Epoch: 74, step: 167, loss: 0.32629328966140747, mean loss: 0.3389940522703081
Epoch: 74, step: 168, loss: 0.33496811985969543, mean loss: 0.3389940146535605
Epoch: 74, step: 169, loss: 0.30032849311828613, mean loss: 0.3389936533813319
Epoch: 74, step: 170, loss: 0.31817254424095154, mean loss: 0.3389934588406166
Epoch: 74, step: 171, loss: 0.29670450091362, mean loss: 0.33899306372010674
Epoch: 74, step: 172, loss: 0.38501501083374023, mean loss: 0.33899349371522125
Epoch: 74, step: 173, loss: 0.33129122853279114, mean loss: 0.33899342175161123
Epoch: 74, step: 174, loss: 0.32908445596694946, mean loss: 0.3389933291712767
Epoch: 74, step: 175, loss: 0.31456658244132996, mean loss: 0.33899310095217655
Epoch: 74, step: 176, loss: 0.3166538178920746, mean loss: 0.33899289223819995
Epoch: 74, step: 177, loss: 0.31827136874198914, mean loss: 0.3389926986406188
Epoch: 74, step: 178, loss: 0.3080386519432068, mean loss: 0.33899240944505943
Epoch: 74, step: 179, loss: 0.3074679374694824, mean loss: 0.3389921149229176
Epoch: 74, step: 180, loss: 0.3068377673625946, mean loss: 0.3389918145188745
Epoch: 74, step: 181, loss: 0.3493865728378296, mean loss: 0.33899191163165987
Epoch: 74, step: 182, loss: 0.378301203250885, mean loss: 0.33899227887436223
Epoch: 74, step: 183, loss: 0.36318865418434143, mean loss: 0.3389925049242063
Epoch: 74, step: 184, loss: 0.3409198522567749, mean loss: 0.3389925229298988
Epoch: 74, step: 185, loss: 0.34858939051628113, mean loss: 0.3389926125850583
Epoch: 74, step: 186, loss: 0.3187371790409088, mean loss: 0.3389924233579856
Epoch: 74, step: 187, loss: 0.3321177065372467, mean loss: 0.3389923591347052
Epoch: 74, step: 188, loss: 0.3164661228656769, mean loss: 0.33899214869763417
Epoch: 74, step: 189, loss: 0.3392537236213684, mean loss: 0.3389921511412091
Epoch: 74, step: 190, loss: 0.35021135210990906, mean loss: 0.3389922559475182
Epoch: 74, step: 191, loss: 0.31099191308021545, mean loss: 0.3389919943794098
Epoch: 74, step: 192, loss: 0.3063494563102722, mean loss: 0.33899168944860175
Epoch: 74, step: 193, loss: 0.3260853886604309, mean loss: 0.3389915688853062
Epoch: 74, step: 194, loss: 0.3204895853996277, mean loss: 0.33899139605195117
Epoch: 74, step: 195, loss: 0.3457087278366089, mean loss: 0.3389914588002584
Epoch: 74, step: 196, loss: 0.3196282386779785, mean loss: 0.3389912779251767
Epoch: 74, step: 197, loss: 0.3157665729522705, mean loss: 0.33899106098134485
Epoch: 74, step: 198, loss: 0.31793516874313354, mean loss: 0.33899086429840397
Epoch: 74, step: 199, loss: 0.3496481776237488, mean loss: 0.3389909638473627
Epoch: 74, step: 200, loss: 0.2990705966949463, mean loss: 0.33899059095846096
Epoch: 74, step: 201, loss: 0.31106874346733093, mean loss: 0.3389903301479891
Epoch: 74, step: 202, loss: 0.3505000174045563, mean loss: 0.3389904376558797
Epoch: 74, step: 203, loss: 0.35419216752052307, mean loss: 0.33899057964849943
Epoch: 74, step: 204, loss: 0.3407343327999115, mean loss: 0.33899059593597247
Epoch: 74, step: 205, loss: 0.3490753173828125, mean loss: 0.33899069013112526
Epoch: 74, step: 206, loss: 0.35070186853408813, mean loss: 0.33899079951698596
Epoch: 74, step: 207, loss: 0.31445828080177307, mean loss: 0.3389905703781651
Epoch: 74, step: 208, loss: 0.32630372047424316, mean loss: 0.3389904518814584
Epoch: 74, step: 209, loss: 0.3255283236503601, mean loss: 0.33899032614473307
Epoch: 74, step: 210, loss: 0.3284105062484741, mean loss: 0.3389902273297864
Epoch: 74, step: 211, loss: 0.3310178220272064, mean loss: 0.3389901528686467
Epoch: 74, step: 212, loss: 0.3460423946380615, mean loss: 0.33899021873497376
Epoch: 74, step: 213, loss: 0.32647818326950073, mean loss: 0.33899010187651235
Epoch: 74, step: 214, loss: 0.3781713545322418, mean loss: 0.33899046781362563
Epoch: 74, step: 215, loss: 0.3083954155445099, mean loss: 0.3389901820708332
Epoch: 74, step: 216, loss: 0.328662246465683, mean loss: 0.3389900856138776
Epoch: 74, step: 217, loss: 0.324282705783844, mean loss: 0.33898994825672435
Epoch: 74, step: 218, loss: 0.3700312077999115, mean loss: 0.33899023815875134
Epoch: 74, step: 219, loss: 0.3388568162918091, mean loss: 0.3389902369127031
Epoch: 74, step: 220, loss: 0.3340282440185547, mean loss: 0.33899019057228547
Epoch: 74, step: 221, loss: 0.3396686911582947, mean loss: 0.3389901969087933
Epoch: 74, step: 222, loss: 0.3154338598251343, mean loss: 0.338989976918533
Epoch: 74, step: 223, loss: 0.3053401708602905, mean loss: 0.3389896626693169
Epoch: 74, step: 224, loss: 0.29204314947128296, mean loss: 0.33898922424874556
Epoch: 74, step: 225, loss: 0.3665851652622223, mean loss: 0.3389894819572401
Epoch: 74, step: 226, loss: 0.30885064601898193, mean loss: 0.33898920050419956
Epoch: 74, step: 227, loss: 0.32089176774024963, mean loss: 0.33898903150198856
Epoch: 74, step: 228, loss: 0.3265605568885803, mean loss: 0.3389889154402188
Epoch: 74, step: 229, loss: 0.3225420415401459, mean loss: 0.3389887618545596
Epoch: 74, step: 230, loss: 0.29135721921920776, mean loss: 0.33898831706160965
Epoch: 74, step: 231, loss: 0.33986929059028625, mean loss: 0.3389883252882413
Epoch: 74, step: 232, loss: 0.3833668529987335, mean loss: 0.3389887396961423
Epoch: 74, step: 233, loss: 0.32819241285324097, mean loss: 0.3389886388806895
Epoch: 74, step: 234, loss: 0.38924720883369446, mean loss: 0.33898910818782035
Epoch: 74, step: 235, loss: 0.3754976987838745, mean loss: 0.3389894490964839
Epoch: 74, step: 236, loss: 0.33324098587036133, mean loss: 0.3389893954191826
Epoch: 74, step: 237, loss: 0.3517422080039978, mean loss: 0.33898951449973413
Epoch: 74, step: 238, loss: 0.3614172637462616, mean loss: 0.33898972391893434
Epoch: 74, step: 239, loss: 0.32069867849349976, mean loss: 0.3389895531278177
Epoch: 74, step: 240, loss: 0.34970709681510925, mean loss: 0.3389896532010568
Epoch: 74, step: 241, loss: 0.31129467487335205, mean loss: 0.3389893946063274
Epoch: 74, step: 242, loss: 0.31654390692710876, mean loss: 0.3389891850293222
Epoch: 74, step: 243, loss: 0.3257436454296112, mean loss: 0.3389890613548161
Epoch: 74, step: 244, loss: 0.3106599748134613, mean loss: 0.3389887968466739
Epoch: 74, step: 245, loss: 0.3314146101474762, mean loss: 0.338988726127297
Epoch: 74, step: 246, loss: 0.3006652593612671, mean loss: 0.3389883683084986
Epoch: 74, step: 247, loss: 0.3792983293533325, mean loss: 0.3389887446712959
Epoch: 74, step: 248, loss: 0.3288656771183014, mean loss: 0.33898865015593665
Epoch: 74, step: 249, loss: 0.35655152797698975, mean loss: 0.3389888141325376
Epoch: 74, step: 250, loss: 0.35058262944221497, mean loss: 0.33898892237770656
Epoch: 74, step: 251, loss: 0.3917895555496216, mean loss: 0.3389894153439945
Epoch: 74, step: 252, loss: 0.28491273522377014, mean loss: 0.33898891046877283
Epoch: 74, step: 253, loss: 0.36154836416244507, mean loss: 0.33898912108826396
Epoch: 74, step: 254, loss: 0.32509902119636536, mean loss: 0.3389889914087736
Epoch: 74, step: 255, loss: 0.3345412313938141, mean loss: 0.33898894988438777
Epoch: 74, step: 256, loss: 0.3188721239566803, mean loss: 0.33898876207500955
Epoch: 74, step: 257, loss: 0.33204731345176697, mean loss: 0.3389886972707018
Epoch: 74, step: 258, loss: 0.3366963267326355, mean loss: 0.3389886758696792
Epoch: 74, step: 259, loss: 0.3199070990085602, mean loss: 0.3389884977303082
Epoch: 74, step: 260, loss: 0.3310956358909607, mean loss: 0.3389884240458152
Epoch: 74, step: 261, loss: 0.3412717878818512, mean loss: 0.3389884453621564
Epoch: 74, step: 262, loss: 0.3361193835735321, mean loss: 0.3389884185782825
Epoch: 74, step: 263, loss: 0.30967968702316284, mean loss: 0.3389881449717519
Epoch: 74, step: 264, loss: 0.3034270703792572, mean loss: 0.33898781300066694
Epoch: 74, step: 265, loss: 0.3799651265144348, mean loss: 0.33898819553005877
Epoch: 74, step: 266, loss: 0.3506566882133484, mean loss: 0.3389883044561781
Epoch: 74, step: 267, loss: 0.3312767744064331, mean loss: 0.33898823246922793
Epoch: 74, step: 268, loss: 0.3068941831588745, mean loss: 0.3389879328748353
Epoch: 74, step: 269, loss: 0.3172836899757385, mean loss: 0.3389877302700251
Epoch: 74, step: 270, loss: 0.32252079248428345, mean loss: 0.3389875765558561
Epoch: 74, step: 271, loss: 0.3424687683582306, mean loss: 0.33898760905148567
Epoch: 74, step: 272, loss: 0.3259095251560211, mean loss: 0.33898748697358055
Epoch: 74, step: 273, loss: 0.29746130108833313, mean loss: 0.3389870993493307
Epoch: 74, step: 274, loss: 0.33221572637557983, mean loss: 0.33898703614285475
Epoch: 74, step: 275, loss: 0.35849085450172424, mean loss: 0.3389872181969409
Epoch: 74, step: 276, loss: 0.3173671066761017, mean loss: 0.3389870163906672
Epoch: 74, step: 277, loss: 0.32412704825401306, mean loss: 0.33898687768616503
Epoch: 74, step: 278, loss: 0.3409200608730316, mean loss: 0.33898689573053137
Epoch: 74, step: 279, loss: 0.3326302170753479, mean loss: 0.3389868363977333
Epoch: 74, step: 280, loss: 0.338341623544693, mean loss: 0.33898683037541744
Epoch: 74, step: 281, loss: 0.3093372881412506, mean loss: 0.33898655363381097
Epoch: 74, step: 282, loss: 0.3669195771217346, mean loss: 0.33898681435141603
Epoch: 74, step: 283, loss: 0.33457934856414795, mean loss: 0.3389867732139717
Epoch: 74, step: 284, loss: 0.32532382011413574, mean loss: 0.3389866456908657
Epoch: 74, step: 285, loss: 0.34102863073349, mean loss: 0.3389866647495452
Epoch: 74, step: 286, loss: 0.3427480161190033, mean loss: 0.3389866998554445
Epoch: 74, step: 287, loss: 0.31245285272598267, mean loss: 0.3389864522088462
Epoch: 74, step: 288, loss: 0.33682703971862793, mean loss: 0.3389864320547327
Epoch: 74, step: 289, loss: 0.3002035915851593, mean loss: 0.3389860700921726
Epoch: 74, step: 290, loss: 0.32087406516075134, mean loss: 0.3389859010533294
Epoch: 74, step: 291, loss: 0.34619709849357605, mean loss: 0.33898596835460837
Epoch: 74, step: 292, loss: 0.34370186924934387, mean loss: 0.33898601236716003
Epoch: 74, step: 293, loss: 0.3275490403175354, mean loss: 0.33898590562920344
Epoch: 74, step: 294, loss: 0.3513792157173157, mean loss: 0.3389860212913073
Epoch: 74, step: 295, loss: 0.3411235511302948, mean loss: 0.3389860412398835
Epoch: 74, step: 296, loss: 0.32472968101501465, mean loss: 0.3389859081931165
Epoch: 74, step: 297, loss: 0.36747148633003235, mean loss: 0.33898617403086534
Epoch: 74, step: 298, loss: 0.32393214106559753, mean loss: 0.3389860335424797
Epoch: 74, step: 299, loss: 0.3116525113582611, mean loss: 0.338985778460896
Epoch: 74, step: 300, loss: 0.33652177453041077, mean loss: 0.33898575546656123
Epoch: 74, step: 301, loss: 0.3345728814601898, mean loss: 0.3389857142855574
Epoch: 74, step: 302, loss: 0.3492267429828644, mean loss: 0.33898580985409293
Epoch: 74, step: 303, loss: 0.2834123969078064, mean loss: 0.3389852912518818
Epoch: 74, step: 304, loss: 0.35119256377220154, mean loss: 0.3389854051671357
Epoch: 74, step: 305, loss: 0.33470869064331055, mean loss: 0.3389853652582639
Epoch: 74, step: 306, loss: 0.33424702286720276, mean loss: 0.33898532104204754
Epoch: 74, step: 307, loss: 0.341418594121933, mean loss: 0.3389853437481156
Epoch: 74, step: 308, loss: 0.3371571898460388, mean loss: 0.33898532668887144
Epoch: 74, step: 309, loss: 0.31762951612472534, mean loss: 0.33898512741101683
Epoch: 74, step: 310, loss: 0.36736005544662476, mean loss: 0.3389853921840163
Epoch: 74, step: 311, loss: 0.35469961166381836, mean loss: 0.33898553881565524
Epoch: 74, step: 312, loss: 0.3468463718891144, mean loss: 0.33898561216553325
Epoch: 74, step: 313, loss: 0.3097132444381714, mean loss: 0.3389853390259632
Epoch: 74, step: 314, loss: 0.3251439929008484, mean loss: 0.33898520987398995
Epoch: 74, step: 315, loss: 0.3875959813594818, mean loss: 0.33898566345115083
Epoch: 74, step: 316, loss: 0.3534184694290161, mean loss: 0.3389857981194533
Epoch: 74, step: 317, loss: 0.3354414701461792, mean loss: 0.33898576504867145
Epoch: 74, step: 318, loss: 0.2990707755088806, mean loss: 0.33898539262049754
Epoch: 74, step: 319, loss: 0.32162222266197205, mean loss: 0.3389852306143585
Epoch: 74, step: 320, loss: 0.31725865602493286, mean loss: 0.3389850278975947
Epoch: 74, step: 321, loss: 0.325493723154068, mean loss: 0.3389849020200383
Epoch: 74, step: 322, loss: 0.31288886070251465, mean loss: 0.3389846585391202
Epoch: 74, step: 323, loss: 0.33906933665275574, mean loss: 0.3389846593291754
Epoch: 74, step: 324, loss: 0.346820592880249, mean loss: 0.3389847324385283
Epoch: 74, step: 325, loss: 0.3434366285800934, mean loss: 0.3389847739743845
Epoch: 74, step: 326, loss: 0.3055976927280426, mean loss: 0.33898446247833336
Epoch: 74, step: 327, loss: 0.3103558123111725, mean loss: 0.33898419538016417
Epoch: 74, step: 328, loss: 0.3304615020751953, mean loss: 0.3389841158663021
Epoch: 74, step: 329, loss: 0.31091251969337463, mean loss: 0.33898385397019465
Epoch: 74, step: 330, loss: 0.3154551088809967, mean loss: 0.3389836344590124
Epoch: 74, step: 331, loss: 0.31458914279937744, mean loss: 0.33898340687297984
Epoch: 74, step: 332, loss: 0.3200414478778839, mean loss: 0.338983230157468
Epoch: 74, step: 333, loss: 0.34946000576019287, mean loss: 0.33898332789770125
Epoch: 74, step: 334, loss: 0.3041447401046753, mean loss: 0.3389830028835882
Epoch: 74, step: 335, loss: 0.36170175671577454, mean loss: 0.33898321482807875
Epoch: 74, step: 336, loss: 0.2970521152019501, mean loss: 0.3389828236542183
Epoch: 74, step: 337, loss: 0.30999743938446045, mean loss: 0.3389825532530366
Epoch: 74, step: 338, loss: 0.31649503111839294, mean loss: 0.33898234347159034
Epoch: 74, step: 339, loss: 0.3152129054069519, mean loss: 0.33898212173348385
Epoch: 74, step: 340, loss: 0.36868733167648315, mean loss: 0.33898239884207776
Epoch: 74, step: 341, loss: 0.3451947569847107, mean loss: 0.33898245679426103
Epoch: 74, step: 342, loss: 0.377890408039093, mean loss: 0.33898281974495315
Epoch: 74, step: 343, loss: 0.3085121810436249, mean loss: 0.3389825355039205
Epoch: 74, step: 344, loss: 0.3803131878376007, mean loss: 0.338982921047454
Epoch: 74, step: 345, loss: 0.3142381012439728, mean loss: 0.3389826902232175
Epoch: 74, step: 346, loss: 0.3662651777267456, mean loss: 0.3389829447169117
Epoch: 74, step: 347, loss: 0.3384871184825897, mean loss: 0.33898294009183955
Epoch: 74, step: 348, loss: 0.36034438014030457, mean loss: 0.3389831393497104
Epoch: 74, step: 349, loss: 0.3222643733024597, mean loss: 0.33898298339980043
Epoch: 74, step: 350, loss: 0.3405379056930542, mean loss: 0.3389829979037255
Epoch: 74, step: 351, loss: 0.3210808038711548, mean loss: 0.33898283091810844
Epoch: 74, step: 352, loss: 0.2930593490600586, mean loss: 0.3389824025633821
Epoch: 74, step: 353, loss: 0.33397215604782104, mean loss: 0.3389823558303673
Epoch: 74, step: 354, loss: 0.30529823899269104, mean loss: 0.33898204164509865
Epoch: 74, step: 355, loss: 0.34710362553596497, mean loss: 0.33898211739766265
Epoch: 74, step: 356, loss: 0.3585512936115265, mean loss: 0.3389822999238135
Epoch: 74, step: 357, loss: 0.32469069957733154, mean loss: 0.33898216662405467
Epoch: 74, step: 358, loss: 0.3808389902114868, mean loss: 0.3389825570248716
Epoch: 74, step: 359, loss: 0.3304596543312073, mean loss: 0.3389824775320469
Epoch: 74, step: 360, loss: 0.3451765477657318, mean loss: 0.33898253530339134
Epoch: 74, step: 361, loss: 0.30075207352638245, mean loss: 0.3389821787358208
Epoch: 74, step: 362, loss: 0.3060741424560547, mean loss: 0.3389818718122692
Epoch: 74, step: 363, loss: 0.33332473039627075, mean loss: 0.33898181905027125
Epoch: 74, step: 364, loss: 0.31939229369163513, mean loss: 0.33898163634795214
Epoch: 74, step: 365, loss: 0.31071898341178894, mean loss: 0.3389813727578966
Epoch: 74, step: 366, loss: 0.32499656081199646, mean loss: 0.3389812423305447
Epoch: 74, step: 367, loss: 0.34568706154823303, mean loss: 0.3389813048708269
Epoch: 74, step: 368, loss: 0.30598780512809753, mean loss: 0.33898099716740193
Epoch: 74, step: 369, loss: 0.3297383785247803, mean loss: 0.33898091096985056
Epoch: 74, step: 370, loss: 0.3963128626346588, mean loss: 0.3389814456481654
Epoch: 74, step: 371, loss: 0.28971898555755615, mean loss: 0.3389809862302886
Epoch: 74, step: 372, loss: 0.3160526156425476, mean loss: 0.33898077240407937
Epoch: 74, step: 373, loss: 0.3841799199581146, mean loss: 0.33898119391995696
Epoch: 74, step: 374, loss: 0.3348987102508545, mean loss: 0.3389811558480965
Epoch: 74, step: 375, loss: 0.33500829339027405, mean loss: 0.3389811187988719
Epoch: 74, step: 376, loss: 0.33506593108177185, mean loss: 0.3389810822878378
Epoch: 74, step: 377, loss: 0.33626165986061096, mean loss: 0.33898105692813446
Epoch: 74, step: 378, loss: 0.34721389412879944, mean loss: 0.3389811337019229
Epoch: 74, step: 379, loss: 0.3262268304824829, mean loss: 0.3389810147651552
Epoch: 74, step: 380, loss: 0.3586324453353882, mean loss: 0.33898119801748944
Epoch: 74, step: 381, loss: 0.31224754452705383, mean loss: 0.33898094872476214
Epoch: 74, step: 382, loss: 0.33829718828201294, mean loss: 0.33898094234871945
Epoch: 74, step: 383, loss: 0.36310818791389465, mean loss: 0.33898116733235956
Epoch: 74, step: 384, loss: 0.31854477524757385, mean loss: 0.33898097676725775
Epoch: 74, step: 385, loss: 0.3538421094417572, mean loss: 0.338981115342934
Epoch: 74, step: 386, loss: 0.30438899993896484, mean loss: 0.3389807927846747
Epoch: 74, step: 387, loss: 0.309219092130661, mean loss: 0.33898051527077505
Epoch: 74, step: 388, loss: 0.3234770596027374, mean loss: 0.3389803707096704
Epoch: 74, step: 389, loss: 0.3170856833457947, mean loss: 0.33898016655578717
Epoch: 74, step: 390, loss: 0.33844220638275146, mean loss: 0.3389801615397012
Epoch: 74, step: 391, loss: 0.33506932854652405, mean loss: 0.33898012507437786
Epoch: 74, step: 392, loss: 0.3447777032852173, mean loss: 0.3389801791315552
Epoch: 74, step: 393, loss: 0.33171510696411133, mean loss: 0.33898011139195455
Epoch: 74, step: 394, loss: 0.306092232465744, mean loss: 0.33897980474792394
Epoch: 74, step: 395, loss: 0.34982749819755554, mean loss: 0.3389799058900327
Epoch: 74, step: 396, loss: 0.3102417290210724, mean loss: 0.33897963794249864
Epoch: 74, step: 397, loss: 0.3207447826862335, mean loss: 0.3389794679268791
Epoch: 74, step: 398, loss: 0.3714941143989563, mean loss: 0.33897977107961297
Epoch: 74, step: 399, loss: 0.3262493908405304, mean loss: 0.338979652388069
Epoch: 74, step: 400, loss: 0.3150394856929779, mean loss: 0.3389794291842996
Epoch: 74, step: 401, loss: 0.33202505111694336, mean loss: 0.33897936434645004
Epoch: 74, step: 402, loss: 0.29568302631378174, mean loss: 0.3389789606848642
Epoch: 74, step: 403, loss: 0.3261192739009857, mean loss: 0.33897884079220353
Epoch: 74, step: 404, loss: 0.3160058856010437, mean loss: 0.3389786266141221
Epoch: 74, step: 405, loss: 0.31642991304397583, mean loss: 0.33897841639322773
Epoch: 74, step: 406, loss: 0.34228068590164185, mean loss: 0.3389784471798877
Epoch: 74, step: 407, loss: 0.341878205537796, mean loss: 0.33897847421373273
Epoch: 74, step: 408, loss: 0.35260438919067383, mean loss: 0.33897860124412454
Epoch: 74, step: 409, loss: 0.3619777262210846, mean loss: 0.33897881565619337
Epoch: 74, step: 410, loss: 0.37725144624710083, mean loss: 0.3389791724540025
Epoch: 74, step: 411, loss: 0.29597288370132446, mean loss: 0.3389787715302531
Epoch: 74, step: 412, loss: 0.31367895007133484, mean loss: 0.3389785356762649
Epoch: 74, step: 413, loss: 0.28719550371170044, mean loss: 0.3389780529408126
Epoch: 74, step: 414, loss: 0.323411762714386, mean loss: 0.3389779078289909
Epoch: 74, step: 415, loss: 0.35933247208595276, mean loss: 0.33897809757621533
Epoch: 74, step: 416, loss: 0.3395058810710907, mean loss: 0.33897810249621846
Epoch: 74, step: 417, loss: 0.3045010268688202, mean loss: 0.33897778110356386
Epoch: 74, step: 418, loss: 0.37462732195854187, mean loss: 0.3389781134227515
Epoch: 74, step: 419, loss: 0.37254661321640015, mean loss: 0.3389784263398979
Epoch: 74, step: 420, loss: 0.4118421971797943, mean loss: 0.3389791055513863
Epoch: 74, step: 421, loss: 0.4042363464832306, mean loss: 0.33897971385169884
Epoch: 74, step: 422, loss: 0.3241403102874756, mean loss: 0.3389795755263643
Epoch: 74, step: 423, loss: 0.3038991093635559, mean loss: 0.338979248527239
Epoch: 74, step: 424, loss: 0.347964882850647, mean loss: 0.33897933228516747
Epoch: 74, step: 425, loss: 0.3493906259536743, mean loss: 0.3389794293312112
Epoch: 74, step: 426, loss: 0.3208822011947632, mean loss: 0.338979260644391
Epoch: 74, step: 427, loss: 0.34429824352264404, mean loss: 0.3389793102229197
Epoch: 74, step: 428, loss: 0.3377844989299774, mean loss: 0.33897929908612245
Epoch: 74, step: 429, loss: 0.2944556474685669, mean loss: 0.3389788840864802
Epoch: 74, step: 430, loss: 0.3277912139892578, mean loss: 0.3389787798085146
Epoch: 74, step: 431, loss: 0.3380904495716095, mean loss: 0.33897877152864886
Epoch: 74, step: 432, loss: 0.33661821484565735, mean loss: 0.338978749526797
Epoch: 74, step: 433, loss: 0.3476162850856781, mean loss: 0.33897883003323337
Epoch: 74, step: 434, loss: 0.312800794839859, mean loss: 0.33897858604226305
Epoch: 74, step: 435, loss: 0.32936838269233704, mean loss: 0.33897849647171396
Epoch: 74, step: 436, loss: 0.3698662519454956, mean loss: 0.3389787843540127
Epoch: 74, step: 437, loss: 0.3240848779678345, mean loss: 0.33897864554004
Epoch: 74, step: 438, loss: 0.3340584635734558, mean loss: 0.33897859968345795
Epoch: 74, step: 439, loss: 0.3670421540737152, mean loss: 0.33897886123611964
Epoch: 74, step: 440, loss: 0.3649653494358063, mean loss: 0.33897910342824245
Epoch: 74, step: 441, loss: 0.30094099044799805, mean loss: 0.3389787489191837
Epoch: 74, step: 442, loss: 0.32981565594673157, mean loss: 0.33897866352143563
Epoch: 74, step: 443, loss: 0.33263275027275085, mean loss: 0.33897860437965327
Epoch: 74, step: 444, loss: 0.33662840723991394, mean loss: 0.33897858247680857
Epoch: 74, step: 445, loss: 0.30789270997047424, mean loss: 0.33897829277230623
Epoch: 74, step: 446, loss: 0.35465100407600403, mean loss: 0.33897843883263357
Epoch: 74, step: 447, loss: 0.31757548451423645, mean loss: 0.33897823937171584
Epoch: 74, step: 448, loss: 0.2904191315174103, mean loss: 0.3389777868382099
Epoch: 74, step: 449, loss: 0.3183230757713318, mean loss: 0.3389775943539959
Epoch: 74, step: 450, loss: 0.3498366177082062, mean loss: 0.33897769554984847
Epoch: 74, step: 451, loss: 0.33577725291252136, mean loss: 0.3389776657250205
Epoch: 74, step: 452, loss: 0.36298176646232605, mean loss: 0.33897788941642326
Epoch: 74, step: 453, loss: 0.35931962728500366, mean loss: 0.338978078976929
Epoch: 74, step: 454, loss: 0.3677004873752594, mean loss: 0.3389783466326996
Epoch: 74, step: 455, loss: 0.3235630393028259, mean loss: 0.3389782029832724
Epoch: 74, step: 456, loss: 0.34908273816108704, mean loss: 0.3389782971427422
Epoch: 74, step: 457, loss: 0.3291211426258087, mean loss: 0.33897820528935385
Epoch: 74, step: 458, loss: 0.3008047640323639, mean loss: 0.3389778495754158
Epoch: 74, step: 459, loss: 0.3275730311870575, mean loss: 0.3389777433021817
Epoch: 74, step: 460, loss: 0.2841293215751648, mean loss: 0.3389772322142672
Epoch: 74, step: 461, loss: 0.31305867433547974, mean loss: 0.3389769907025182
Epoch: 74, step: 462, loss: 0.35163918137550354, mean loss: 0.3389771086889947
Epoch: 74, step: 463, loss: 0.29540592432022095, mean loss: 0.3389767026958493
Epoch: 74, step: 464, loss: 0.3188052177429199, mean loss: 0.33897651474116236
Epoch: 74, step: 465, loss: 0.33901312947273254, mean loss: 0.3389765150823294
Epoch: 74, step: 466, loss: 0.3537156581878662, mean loss: 0.3389766524167601
Epoch: 74, step: 467, loss: 0.31288695335388184, mean loss: 0.3389764093238912
Epoch: 74, step: 468, loss: 0.2978261709213257, mean loss: 0.33897602590680853
Epoch: 74, step: 469, loss: 0.3013305068016052, mean loss: 0.3389756751481936
Epoch: 74, step: 470, loss: 0.312193900346756, mean loss: 0.33897542561382854
Epoch: 74, step: 471, loss: 0.3286333978176117, mean loss: 0.3389753292547443
Epoch: 74, step: 472, loss: 0.33830803632736206, mean loss: 0.3389753230374784
Epoch: 74, step: 473, loss: 0.2969871163368225, mean loss: 0.33897493183085675
Epoch: 74, step: 474, loss: 0.2955268919467926, mean loss: 0.33897452702665404
Epoch: 74, step: 475, loss: 0.3106934726238251, mean loss: 0.33897426353529636
Epoch: 74, step: 476, loss: 0.3452131152153015, mean loss: 0.3389743216614242
Epoch: 74, step: 477, loss: 0.36031943559646606, mean loss: 0.33897452052771015
Epoch: 74, step: 478, loss: 0.3301471173763275, mean loss: 0.3389744382861007
Epoch: 74, step: 479, loss: 0.35331544280052185, mean loss: 0.33897457189462454
Epoch: 74, step: 480, loss: 0.31262093782424927, mean loss: 0.33897432637225977
Epoch: 74, step: 481, loss: 0.33838289976119995, mean loss: 0.3389743208623135
Epoch: 74, step: 482, loss: 0.36662787199020386, mean loss: 0.33897457849049273
Epoch: 74, step: 483, loss: 0.30597424507141113, mean loss: 0.33897427105306566
Epoch: 74, step: 484, loss: 0.3537246584892273, mean loss: 0.3389744084692201
Epoch: 74, step: 485, loss: 0.3366696834564209, mean loss: 0.3389743869983605
Epoch: 74, step: 486, loss: 0.35335519909858704, mean loss: 0.33897452096901626
Epoch: 74, step: 487, loss: 0.27696356177330017, mean loss: 0.33897394328457003
Epoch: 74, step: 488, loss: 0.31995388865470886, mean loss: 0.3389737660983515
Epoch: 74, step: 489, loss: 0.31105688214302063, mean loss: 0.33897350603385024
Epoch: 74, step: 490, loss: 0.36975690722465515, mean loss: 0.3389737927992111
Epoch: 74, step: 491, loss: 0.3681093752384186, mean loss: 0.3389740642116495
Epoch: 74, step: 492, loss: 0.3583916425704956, mean loss: 0.3389742450943625
Epoch: 74, step: 493, loss: 0.3054056167602539, mean loss: 0.3389739323917232
Epoch: 74, step: 494, loss: 0.33027684688568115, mean loss: 0.3389738513763111
Epoch: 74, step: 495, loss: 0.3330850601196289, mean loss: 0.33897379652133625
Epoch: 74, step: 496, loss: 0.3636579215526581, mean loss: 0.3389740264555256
Epoch: 74, step: 497, loss: 0.3672146201133728, mean loss: 0.33897428951599523
Epoch: 74, step: 498, loss: 0.30162519216537476, mean loss: 0.3389739416132674
Epoch: 74, step: 499, loss: 0.37074822187423706, mean loss: 0.3389742375844312
Epoch: 74, step: 500, loss: 0.33245497941970825, mean loss: 0.33897417685939074
Epoch: 74, step: 501, loss: 0.30544960498809814, mean loss: 0.3389738645904227
Epoch: 74, step: 502, loss: 0.3662491738796234, mean loss: 0.33897411864745836
Epoch: 74, step: 503, loss: 0.31075519323349, mean loss: 0.3389738558035182
Epoch: 74, step: 504, loss: 0.3001975417137146, mean loss: 0.33897349462660953
Epoch: 74, step: 505, loss: 0.33106186985969543, mean loss: 0.33897342093550126
Epoch: 74, step: 506, loss: 0.29712700843811035, mean loss: 0.33897303116982314
Epoch: 74, step: 507, loss: 0.31000036001205444, mean loss: 0.3389727613152056
Epoch: 74, step: 508, loss: 0.3298589587211609, mean loss: 0.3389726764290454
Epoch: 74, step: 509, loss: 0.3531203866004944, mean loss: 0.33897280819990555
Epoch: 74, step: 510, loss: 0.3559475243091583, mean loss: 0.3389729662998442
Epoch: 74, step: 511, loss: 0.3020875155925751, mean loss: 0.3389726227575345
Epoch: 74, step: 512, loss: 0.3382073938846588, mean loss: 0.33897261563044123
Epoch: 74, step: 513, loss: 0.3561016023159027, mean loss: 0.3389727751627751
Epoch: 74, step: 514, loss: 0.30092161893844604, mean loss: 0.3389724207732637
Epoch: 74, step: 515, loss: 0.3350975215435028, mean loss: 0.33897238468471896
Epoch: 74, step: 516, loss: 0.3173505663871765, mean loss: 0.3389721833136266
Epoch: 74, step: 517, loss: 0.3547477126121521, mean loss: 0.33897233023494183
Epoch: 74, step: 518, loss: 0.32141631841659546, mean loss: 0.33897216673308556
Epoch: 74, step: 519, loss: 0.3512877821922302, mean loss: 0.338972281429251
Epoch: 74, step: 520, loss: 0.3204949200153351, mean loss: 0.3389721093499285
Epoch: 74, step: 521, loss: 0.3997785449028015, mean loss: 0.33897267563385586
Epoch: 74, step: 522, loss: 0.36948084831237793, mean loss: 0.33897295975060754
Epoch: 74, step: 523, loss: 0.34646308422088623, mean loss: 0.33897302950404834
Epoch: 74, step: 524, loss: 0.31614863872528076, mean loss: 0.33897281694884046
Epoch: 74, step: 525, loss: 0.30382707715034485, mean loss: 0.3389724896524612
Epoch: 74, step: 526, loss: 0.2938075661659241, mean loss: 0.33897206905587246
Epoch: 74, step: 527, loss: 0.31987473368644714, mean loss: 0.3389718912143377
Epoch: 74, step: 528, loss: 0.3233455717563629, mean loss: 0.33897174569755734
Epoch: 74, step: 529, loss: 0.33188724517822266, mean loss: 0.3389716797252656
Epoch: 74, step: 530, loss: 0.3642685115337372, mean loss: 0.3389719152922505
Epoch: 74, step: 531, loss: 0.30555763840675354, mean loss: 0.3389716041375881
Epoch: 74, step: 532, loss: 0.31587517261505127, mean loss: 0.33897138906498736
Epoch: 74, step: 533, loss: 0.372111052274704, mean loss: 0.33897169765669244
Epoch: 74, step: 534, loss: 0.36355865001678467, mean loss: 0.33897192660467096
Epoch: 74, step: 535, loss: 0.32381004095077515, mean loss: 0.3389717854220349
Epoch: 74, step: 536, loss: 0.37912556529045105, mean loss: 0.3389721593177252
Epoch: 74, step: 537, loss: 0.3608075678348541, mean loss: 0.33897236263828795
Epoch: 74, step: 538, loss: 0.3247881829738617, mean loss: 0.33897223056342723
Epoch: 74, step: 539, loss: 0.30986592173576355, mean loss: 0.33897195954487136
Epoch: 74, step: 540, loss: 0.3934009373188019, mean loss: 0.3389724663465304
Epoch: 74, step: 541, loss: 0.37541550397872925, mean loss: 0.3389728056734977
Epoch: 74, step: 542, loss: 0.31936678290367126, mean loss: 0.3389726231203755
Epoch: 74, step: 543, loss: 0.33694425225257874, mean loss: 0.3389726042342408
Epoch: 74, step: 544, loss: 0.31180158257484436, mean loss: 0.33897235124756786
Epoch: 74, step: 545, loss: 0.3273952305316925, mean loss: 0.3389722434551551
Epoch: 74, step: 546, loss: 0.33429720997810364, mean loss: 0.3389721999271952
Epoch: 74, step: 547, loss: 0.31084075570106506, mean loss: 0.3389719380054397
Epoch: 74, step: 548, loss: 0.32865026593208313, mean loss: 0.3389718419049595
Epoch: 74, step: 549, loss: 0.3272824287414551, mean loss: 0.338971733071066
Epoch: 74, step: 550, loss: 0.37071314454078674, mean loss: 0.33897202859567305
Epoch: 74, step: 551, loss: 0.3272835910320282, mean loss: 0.33897191977288926
Epoch: 74, step: 552, loss: 0.35985687375068665, mean loss: 0.3389721142161294
Epoch: 74, step: 553, loss: 0.3449818789958954, mean loss: 0.33897217016776127
Epoch: 74, step: 554, loss: 0.3362756371498108, mean loss: 0.33897214506294876
Epoch: 74, step: 555, loss: 0.31817254424095154, mean loss: 0.33897195141977277
Epoch: 74, step: 556, loss: 0.3151598572731018, mean loss: 0.3389717297325082
Epoch: 74, step: 557, loss: 0.3500855267047882, mean loss: 0.33897183319943963
Epoch: 74, step: 558, loss: 0.34540024399757385, mean loss: 0.33897189304593034
Epoch: 74, step: 559, loss: 0.3244972229003906, mean loss: 0.3389717582925403
Epoch: 74, step: 560, loss: 0.34379148483276367, mean loss: 0.33897180316184905
Epoch: 74, step: 561, loss: 0.3647463321685791, mean loss: 0.3389720431079382
Epoch: 74, step: 562, loss: 0.3145814836025238, mean loss: 0.3389718160479255
Epoch: 74, step: 563, loss: 0.37178754806518555, mean loss: 0.33897212153789025
Epoch: 74, step: 564, loss: 0.3313133716583252, mean loss: 0.3389720502413106
Epoch: 74, step: 565, loss: 0.3351222574710846, mean loss: 0.33897201440328145
Epoch: 74, step: 566, loss: 0.30921471118927, mean loss: 0.33897173739274167
Epoch: 74, step: 567, loss: 0.32225102186203003, mean loss: 0.3389715817411598
Epoch: 74, step: 568, loss: 0.33585798740386963, mean loss: 0.33897155275727026
Epoch: 74, step: 569, loss: 0.3293568789958954, mean loss: 0.33897146325683497
Epoch: 74, step: 570, loss: 0.31685736775398254, mean loss: 0.3389712574045306
Epoch: 74, step: 571, loss: 0.3460817039012909, mean loss: 0.3389713235925495
Epoch: 74, step: 572, loss: 0.37295565009117126, mean loss: 0.33897163993475227
Epoch: 74, step: 573, loss: 0.33529260754585266, mean loss: 0.33897160568889556
Epoch: 74, step: 574, loss: 0.3208991587162018, mean loss: 0.3389714374651336
Epoch: 74, step: 575, loss: 0.354638010263443, mean loss: 0.3389715832929391
Epoch: 74, step: 576, loss: 0.3068940341472626, mean loss: 0.33897128471104016
Epoch: 74, step: 577, loss: 0.3639431595802307, mean loss: 0.3389715171502574
Epoch: 74, step: 578, loss: 0.3484604060649872, mean loss: 0.3389716054723956
Epoch: 74, step: 579, loss: 0.3665253818035126, mean loss: 0.33897186193928125
Epoch: 74, step: 580, loss: 0.3495894968509674, mean loss: 0.3389719607658951
Epoch: 74, step: 581, loss: 0.30114424228668213, mean loss: 0.3389716086770766
Epoch: 74, step: 582, loss: 0.2996388077735901, mean loss: 0.33897124258281935
Epoch: 74, step: 583, loss: 0.3228156566619873, mean loss: 0.3389710922143726
Epoch: 74, step: 584, loss: 0.316407710313797, mean loss: 0.3389708822071882
Epoch: 74, step: 585, loss: 0.355759859085083, mean loss: 0.33897103846802545
Epoch: 74, step: 586, loss: 0.37134864926338196, mean loss: 0.33897133981488653
Epoch: 74, step: 587, loss: 0.3330819606781006, mean loss: 0.3389712850014103
Epoch: 74, step: 588, loss: 0.3096480071544647, mean loss: 0.3389710120871021
Epoch: 74, step: 589, loss: 0.3351192772388458, mean loss: 0.3389709762390031
Epoch: 74, step: 590, loss: 0.31134098768234253, mean loss: 0.33897071908907284
Epoch: 74, step: 591, loss: 0.3137848675251007, mean loss: 0.33897048468869717
Epoch: 74, step: 592, loss: 0.31606632471084595, mean loss: 0.3389702715256154
Epoch: 74, step: 593, loss: 0.33180752396583557, mean loss: 0.3389702048644003
Epoch: 74, step: 594, loss: 0.3257102966308594, mean loss: 0.3389700814601674
Epoch: 74, step: 595, loss: 0.32992836833000183, mean loss: 0.33896999731363564
Epoch: 74, step: 596, loss: 0.3201445937156677, mean loss: 0.33896982211700455
Epoch: 74, step: 597, loss: 0.343068391084671, mean loss: 0.33896986025954895
Epoch: 74, step: 598, loss: 0.3714029788970947, mean loss: 0.3389701620893255
Epoch: 74, step: 599, loss: 0.36910906434059143, mean loss: 0.33897044256600667
Epoch: 74, step: 600, loss: 0.3267744481563568, mean loss: 0.33897032906949726
Epoch: 74, step: 601, loss: 0.3681640923023224, mean loss: 0.338970600745531
Epoch: 74, step: 602, loss: 0.3306915760040283, mean loss: 0.3389705237019633
Epoch: 74, step: 603, loss: 0.34990671277046204, mean loss: 0.3389706254718225
Epoch: 74, step: 604, loss: 0.3029724955558777, mean loss: 0.3389702904839672
Epoch: 74, step: 605, loss: 0.2949857711791992, mean loss: 0.3389698811809642
Epoch: 74, step: 606, loss: 0.36075958609580994, mean loss: 0.33897008394568245
Epoch: 74, step: 607, loss: 0.34035027027130127, mean loss: 0.33897009678892603
Epoch: 74, step: 608, loss: 0.3390040993690491, mean loss: 0.3389700971053321
Epoch: 74, step: 609, loss: 0.3393879532814026, mean loss: 0.3389701009935961
Epoch: 74, step: 610, loss: 0.3391318917274475, mean loss: 0.3389701024990883
Epoch: 74, step: 611, loss: 0.3391335904598236, mean loss: 0.33897010402035943
Epoch: 74, step: 612, loss: 0.2893490493297577, mean loss: 0.33896964229600457
Epoch: 74, step: 613, loss: 0.3186483085155487, mean loss: 0.33896945320757266
Epoch: 74, step: 614, loss: 0.35530775785446167, mean loss: 0.3389696052328134
Epoch: 74, step: 615, loss: 0.3379182815551758, mean loss: 0.3389695954505103
Epoch: 74, step: 616, loss: 0.303619921207428, mean loss: 0.33896926653371967
Epoch: 74, step: 617, loss: 0.3644757866859436, mean loss: 0.33896950386107466
Epoch: 74, step: 618, loss: 0.30010154843330383, mean loss: 0.33896914221459473
Epoch: 74, step: 619, loss: 0.32264357805252075, mean loss: 0.33896899031496913
Epoch: 74, step: 620, loss: 0.3710184097290039, mean loss: 0.3389692885129037
Epoch: 74, step: 621, loss: 0.3350399136543274, mean loss: 0.3389692519530974
Epoch: 74, step: 622, loss: 0.33934327960014343, mean loss: 0.3389692554331042
Epoch: 74, step: 623, loss: 0.3474622666835785, mean loss: 0.3389693344525613
Epoch: 74, step: 624, loss: 0.34130242466926575, mean loss: 0.3389693561595627
Epoch: 74, step: 625, loss: 0.3274993896484375, mean loss: 0.3389692494443312
Epoch: 74, step: 626, loss: 0.3442385792732239, mean loss: 0.3389692984691056
Epoch: 74, step: 627, loss: 0.32150039076805115, mean loss: 0.33896913594344874
Epoch: 74, step: 628, loss: 0.32022741436958313, mean loss: 0.3389689615775226
Epoch: 74, step: 629, loss: 0.33223485946655273, mean loss: 0.3389688989265531
Epoch: 74, step: 630, loss: 0.3080783486366272, mean loss: 0.3389686115378429
Epoch: 74, step: 631, loss: 0.3330276310443878, mean loss: 0.3389685562667383
Epoch: 74, step: 632, loss: 0.3252255916595459, mean loss: 0.33896842841212427
Epoch: 74, step: 633, loss: 0.31598031520843506, mean loss: 0.3389682145493165
Epoch: 74, step: 634, loss: 0.305239200592041, mean loss: 0.33896790076477684
Epoch: 74, step: 635, loss: 0.3399363160133362, mean loss: 0.33896790977396124
Epoch: 74, step: 636, loss: 0.30540040135383606, mean loss: 0.3389675974977347
Epoch: 74, step: 637, loss: 0.3258496820926666, mean loss: 0.33896747546380346
Epoch: 74, step: 638, loss: 0.3468323051929474, mean loss: 0.3389675486284133
Epoch: 74, step: 639, loss: 0.3525545597076416, mean loss: 0.3389676750239171
Epoch: 74, step: 640, loss: 0.3708546757698059, mean loss: 0.33896797165545794
Epoch: 74, step: 641, loss: 0.3417271673679352, mean loss: 0.33896799732287236
Epoch: 74, step: 642, loss: 0.3259907066822052, mean loss: 0.33896787660276667
Epoch: 74, step: 643, loss: 0.35730424523353577, mean loss: 0.33896804717363765
Epoch: 74, step: 644, loss: 0.32322731614112854, mean loss: 0.33896790074959476
Epoch: 74, step: 645, loss: 0.31840723752975464, mean loss: 0.3389677094911696
Epoch: 74, step: 646, loss: 0.30624258518218994, mean loss: 0.3389674050799038
Epoch: 74, step: 647, loss: 0.30709460377693176, mean loss: 0.3389671085997607
Epoch: 74, step: 648, loss: 0.3057475984096527, mean loss: 0.3389667995954336
Epoch: 74, step: 649, loss: 0.3564789891242981, mean loss: 0.3389669624904304
Epoch: 74, step: 650, loss: 0.31866490840911865, mean loss: 0.3389667736464102
Epoch: 74, step: 651, loss: 0.33886072039604187, mean loss: 0.33896677265994174
Epoch: 74, step: 652, loss: 0.32410576939582825, mean loss: 0.33896663442962366
Epoch: 74, step: 653, loss: 0.34741613268852234, mean loss: 0.33896671302229653
Epoch: 74, step: 654, loss: 0.32580095529556274, mean loss: 0.3389665905626624
Epoch: 74, step: 655, loss: 0.34203189611434937, mean loss: 0.33896661907395
Epoch: 74, step: 656, loss: 0.3043125867843628, mean loss: 0.33896629674983764
Epoch: 74, step: 657, loss: 0.3966907262802124, mean loss: 0.33896683365135305
Epoch: 74, step: 658, loss: 0.3270123302936554, mean loss: 0.3389667224621854
Epoch: 74, step: 659, loss: 0.3145825266838074, mean loss: 0.3389664956662129
Epoch: 74, step: 660, loss: 0.3683972954750061, mean loss: 0.33896676939780707
Epoch: 74, step: 661, loss: 0.3060505986213684, mean loss: 0.3389664632521312
Epoch: 74, step: 662, loss: 0.31105443835258484, mean loss: 0.3389662036512709
Epoch: 74, step: 663, loss: 0.3234332799911499, mean loss: 0.33896605918583506
Epoch: 74, step: 664, loss: 0.2993473410606384, mean loss: 0.33896569071160093
Epoch: 74, step: 665, loss: 0.30171528458595276, mean loss: 0.3389653442670954
Epoch: 74, step: 666, loss: 0.34585583209991455, mean loss: 0.3389654083509457
Epoch: 74, step: 667, loss: 0.3221830725669861, mean loss: 0.33896525227103996
Epoch: 74, step: 668, loss: 0.318219393491745, mean loss: 0.3389650593311769
Epoch: 74, step: 669, loss: 0.3240821361541748, mean loss: 0.3389649209188563
Epoch: 74, step: 670, loss: 0.3535393476486206, mean loss: 0.3389650564608758
Epoch: 74, step: 671, loss: 0.3709966242313385, mean loss: 0.33896535435135805
Epoch: 74, step: 672, loss: 0.3486938178539276, mean loss: 0.3389654448242863
Epoch: 74, step: 673, loss: 0.3213955760002136, mean loss: 0.3389652814292447
Epoch: 74, step: 674, loss: 0.30540475249290466, mean loss: 0.3389649693282791
Epoch: 74, step: 675, loss: 0.34769678115844727, mean loss: 0.3389650505302639
Epoch: 74, step: 676, loss: 0.3173326551914215, mean loss: 0.3389648493604338
Epoch: 74, step: 677, loss: 0.3049854338169098, mean loss: 0.33896453337278765
Epoch: 74, step: 678, loss: 0.32285627722740173, mean loss: 0.33896438357731506
Epoch: 74, step: 679, loss: 0.3748822510242462, mean loss: 0.33896471758515845
Epoch: 74, step: 680, loss: 0.3476879894733429, mean loss: 0.33896479870395374
Epoch: 74, step: 681, loss: 0.3134687542915344, mean loss: 0.3389645616152557
Epoch: 74, step: 682, loss: 0.3379001319408417, mean loss: 0.3389645517171752
Epoch: 74, step: 683, loss: 0.34543144702911377, mean loss: 0.3389646118519652
Epoch: 74, step: 684, loss: 0.32164403796195984, mean loss: 0.33896445079177523
Epoch: 74, step: 685, loss: 0.35216426849365234, mean loss: 0.33896457353282244
Epoch: 74, step: 686, loss: 0.32658976316452026, mean loss: 0.33896445846433476
Epoch: 74, step: 687, loss: 0.34934547543525696, mean loss: 0.33896455499242534
Epoch: 74, step: 688, loss: 0.35093286633491516, mean loss: 0.33896466627896904
Epoch: 74, step: 689, loss: 0.31637120246887207, mean loss: 0.3389644561971082
Epoch: 74, step: 690, loss: 0.3345218002796173, mean loss: 0.33896441488813706
Epoch: 74, step: 691, loss: 0.3397555947303772, mean loss: 0.3389644222446648
Epoch: 74, step: 692, loss: 0.3582400977611542, mean loss: 0.3389646014715801
Epoch: 74, step: 693, loss: 0.34769207239151, mean loss: 0.3389646826196128
Epoch: 74, step: 694, loss: 0.3248932361602783, mean loss: 0.3389645517845071
Epoch: 74, step: 695, loss: 0.3272647261619568, mean loss: 0.3389644430015405
Epoch: 74, step: 696, loss: 0.3512192368507385, mean loss: 0.3389645569434468
Epoch: 74, step: 697, loss: 0.33291661739349365, mean loss: 0.33896450071179063
Epoch: 74, step: 698, loss: 0.3483109474182129, mean loss: 0.33896458761102083
Epoch: 74, step: 699, loss: 0.36009061336517334, mean loss: 0.3389647840298701
Epoch: 74, step: 700, loss: 0.3344782292842865, mean loss: 0.3389647423165949
Epoch: 74, step: 701, loss: 0.3587793707847595, mean loss: 0.3389649265393256
Epoch: 74, step: 702, loss: 0.3343040943145752, mean loss: 0.3389648832065294
Epoch: 74, step: 703, loss: 0.33525389432907104, mean loss: 0.3389648487049593
Epoch: 74, step: 704, loss: 0.35399967432022095, mean loss: 0.3389649884844855
Epoch: 74, step: 705, loss: 0.34341397881507874, mean loss: 0.33896502984658666
Epoch: 74, step: 706, loss: 0.3051574230194092, mean loss: 0.33896471554141827
Epoch: 74, step: 707, loss: 0.30598291754722595, mean loss: 0.33896440891654384
Epoch: 74, step: 708, loss: 0.3463171422481537, mean loss: 0.33896447727273155
Epoch: 74, step: 709, loss: 0.3108711540699005, mean loss: 0.33896421609984045
Epoch: 74, step: 710, loss: 0.3593406677246094, mean loss: 0.3389644055301641
Epoch: 74, step: 711, loss: 0.3317023515701294, mean loss: 0.3389643380188786
Epoch: 74, step: 712, loss: 0.33233144879341125, mean loss: 0.3389642763571617
Epoch: 74, step: 713, loss: 0.3061790466308594, mean loss: 0.3389639715767422
Epoch: 74, step: 714, loss: 0.33053070306777954, mean loss: 0.3389638931795114
Epoch: 74, step: 715, loss: 0.31417199969291687, mean loss: 0.33896366271160633
Epoch: 74, step: 716, loss: 0.33938899636268616, mean loss: 0.3389636666655135
Epoch: 74, step: 717, loss: 0.31110265851020813, mean loss: 0.33896340767162875
Epoch: 74, step: 718, loss: 0.32308077812194824, mean loss: 0.33896326002924393
Epoch: 74, step: 719, loss: 0.37390801310539246, mean loss: 0.33896358486706163
Epoch: 74, step: 720, loss: 0.3068388104438782, mean loss: 0.3389632862458468
Epoch: 74, step: 721, loss: 0.31685692071914673, mean loss: 0.33896308075433806
Epoch: 74, step: 722, loss: 0.3276810348033905, mean loss: 0.33896297588214225
Epoch: 74, step: 723, loss: 0.3409176766872406, mean loss: 0.3389629940518839
Epoch: 74, step: 724, loss: 0.313493549823761, mean loss: 0.3389627573052072
Epoch: 74, step: 725, loss: 0.324730783700943, mean loss: 0.3389626250156643
Epoch: 74, step: 726, loss: 0.34467145800590515, mean loss: 0.3389626780801168
Epoch: 74, step: 727, loss: 0.32239070534706116, mean loss: 0.33896252404259514
Epoch: 74, step: 728, loss: 0.3051551878452301, mean loss: 0.3389622098042143
Epoch: 74, step: 729, loss: 0.3668551445007324, mean loss: 0.3389624690659649
Epoch: 74, step: 730, loss: 0.34240013360977173, mean loss: 0.33896250101838055
Epoch: 74, step: 731, loss: 0.3522217571735382, mean loss: 0.3389626242594126
Epoch: 74, step: 732, loss: 0.3361280858516693, mean loss: 0.3389625979134255
Epoch: 74, step: 733, loss: 0.37414440512657166, mean loss: 0.33896292491228425
Epoch: 74, step: 734, loss: 0.3286382257938385, mean loss: 0.3389628289498049
Epoch: 74, step: 735, loss: 0.3719201982021332, mean loss: 0.3389631352678327
Epoch: 74, step: 736, loss: 0.34797707200050354, mean loss: 0.3389632190459292
Epoch: 74, step: 737, loss: 0.2985653579235077, mean loss: 0.33896284358018647
Epoch: 74, step: 738, loss: 0.31452396512031555, mean loss: 0.3389626164425085
Epoch: 74, step: 739, loss: 0.3336281478404999, mean loss: 0.3389625668638197
Epoch: 74, step: 740, loss: 0.3204275369644165, mean loss: 0.33896239460037464
Epoch: 74, step: 741, loss: 0.34526997804641724, mean loss: 0.33896245322212826
Epoch: 74, step: 742, loss: 0.3401356637477875, mean loss: 0.33896246412567316
Epoch: 74, step: 743, loss: 0.4014158248901367, mean loss: 0.3389630445472416
Epoch: 74, step: 744, loss: 0.32792454957962036, mean loss: 0.3389629419599518
Epoch: 74, step: 745, loss: 0.33104491233825684, mean loss: 0.33896286837368367
Epoch: 74, step: 746, loss: 0.30412840843200684, mean loss: 0.33896254464237563
Epoch: 74, step: 747, loss: 0.3155614137649536, mean loss: 0.3389623271678312
Epoch: 74, step: 748, loss: 0.33434978127479553, mean loss: 0.3389622843022962
Epoch: 74, step: 749, loss: 0.33927416801452637, mean loss: 0.33896228720068206
Epoch: 74, step: 750, loss: 0.33538445830345154, mean loss: 0.33896225395164714
Epoch: 74, step: 751, loss: 0.30537790060043335, mean loss: 0.3389619418526085
Epoch: 74, step: 752, loss: 0.31920868158340454, mean loss: 0.33896175828747666
Epoch: 74, step: 753, loss: 0.3231348991394043, mean loss: 0.3389616112113764
Epoch: 74, step: 754, loss: 0.31649214029312134, mean loss: 0.33896140240864325
Epoch: 74, step: 755, loss: 0.3635632395744324, mean loss: 0.3389616310247564
Epoch: 74, step: 756, loss: 0.3642481565475464, mean loss: 0.3389618660012511
Epoch: 74, step: 757, loss: 0.32011908292770386, mean loss: 0.3389616909052313
Epoch: 74, step: 758, loss: 0.29473552107810974, mean loss: 0.33896127993863906
Epoch: 74, step: 759, loss: 0.32365256547927856, mean loss: 0.338961137685494
Epoch: 74, step: 760, loss: 0.321367084980011, mean loss: 0.3389609741978229
Epoch: 74, step: 761, loss: 0.335880845785141, mean loss: 0.33896094557688206
Epoch: 74, step: 762, loss: 0.2967907786369324, mean loss: 0.3389605537300247
Epoch: 74, step: 763, loss: 0.3227043151855469, mean loss: 0.33896040267781746
Epoch: 74, step: 764, loss: 0.2869432270526886, mean loss: 0.3389599193411487
Epoch: 74, step: 765, loss: 0.30804216861724854, mean loss: 0.3389596320601957
Epoch: 74, step: 766, loss: 0.3326479494571686, mean loss: 0.33895957341397137
Epoch: 74, step: 767, loss: 0.3284730613231659, mean loss: 0.3389594759774136
Epoch: 74, step: 768, loss: 0.3416057229042053, mean loss: 0.3389595005650738
Epoch: 74, step: 769, loss: 0.3211444914340973, mean loss: 0.3389593350380717
Epoch: 74, step: 770, loss: 0.34001001715660095, mean loss: 0.33895934480032575
Epoch: 74, step: 771, loss: 0.28755074739456177, mean loss: 0.33895886714955265
Epoch: 74, step: 772, loss: 0.3364725410938263, mean loss: 0.3389588440486592
Epoch: 74, step: 773, loss: 0.3157373070716858, mean loss: 0.33895862829527285
Epoch: 74, step: 774, loss: 0.30874139070510864, mean loss: 0.338958347546812
Epoch: 74, step: 775, loss: 0.35122591257095337, mean loss: 0.33895846152374287
Epoch: 74, step: 776, loss: 0.30617061257362366, mean loss: 0.3389581568973834
Epoch: 74, step: 777, loss: 0.33040639758110046, mean loss: 0.33895807744517203
Epoch: 74, step: 778, loss: 0.34876763820648193, mean loss: 0.3389581685824486
Epoch: 74, step: 779, loss: 0.32737624645233154, mean loss: 0.338958060979768
Epoch: 74, step: 780, loss: 0.33138564229011536, mean loss: 0.3389579906283211
Epoch: 74, step: 781, loss: 0.32257673144340515, mean loss: 0.3389578384398822
Epoch: 74, step: 782, loss: 0.3087186813354492, mean loss: 0.33895755750864814
Epoch: 74, step: 783, loss: 0.3364919424057007, mean loss: 0.3389575346025249
Epoch: 74, step: 784, loss: 0.34985947608947754, mean loss: 0.3389576358830917
Epoch: 74, step: 785, loss: 0.3274793326854706, mean loss: 0.3389575292490344
Epoch: 74, step: 786, loss: 0.3422631025314331, mean loss: 0.3389575599577036
Epoch: 74, step: 787, loss: 0.30654698610305786, mean loss: 0.3389572588673144
Epoch: 74, step: 788, loss: 0.34078308939933777, mean loss: 0.33895727582890606
Epoch: 74, step: 789, loss: 0.33202511072158813, mean loss: 0.33895721143111046
Epoch: 74, step: 790, loss: 0.31001007556915283, mean loss: 0.338956942523144
Epoch: 74, step: 791, loss: 0.33407914638519287, mean loss: 0.3389568972106799
Epoch: 74, step: 792, loss: 0.30729585886001587, mean loss: 0.3389566030970481
Epoch: 74, step: 793, loss: 0.35840094089508057, mean loss: 0.33895678372257343
Epoch: 74, step: 794, loss: 0.35903164744377136, mean loss: 0.33895697020355103
Epoch: 74, step: 795, loss: 0.32246288657188416, mean loss: 0.3389568169868562
Epoch: 74, step: 796, loss: 0.3558167517185211, mean loss: 0.338956973600557
Epoch: 74, step: 797, loss: 0.3379168212413788, mean loss: 0.33895696393856245
Epoch: 74, step: 798, loss: 0.3356229066848755, mean loss: 0.33895693296873053
Epoch: 74, step: 799, loss: 0.3493555188179016, mean loss: 0.3389570295595926
Epoch: 74, step: 800, loss: 0.3048771917819977, mean loss: 0.33895671300016983
Epoch: 74, step: 801, loss: 0.36659330129623413, mean loss: 0.3389569697074122
Epoch: 74, step: 802, loss: 0.34321603178977966, mean loss: 0.33895700926808137
Epoch: 74, step: 803, loss: 0.3166891038417816, mean loss: 0.3389568024326232
Epoch: 74, step: 804, loss: 0.3240007162094116, mean loss: 0.33895666351429415
Epoch: 74, step: 805, loss: 0.36155959963798523, mean loss: 0.33895687345778513
Epoch: 74, step: 806, loss: 0.3521328568458557, mean loss: 0.3389569958395076
Epoch: 74, step: 807, loss: 0.3508445620536804, mean loss: 0.338957106253074
Epoch: 74, step: 808, loss: 0.3097524642944336, mean loss: 0.3389568349983305
Epoch: 74, step: 809, loss: 0.33311882615089417, mean loss: 0.33895678077500235
Epoch: 74, step: 810, loss: 0.3432156443595886, mean loss: 0.3389568203308884
Epoch: 74, step: 811, loss: 0.33359405398368835, mean loss: 0.33895677052252987
Epoch: 74, step: 812, loss: 0.32800915837287903, mean loss: 0.33895666884412523
Epoch: 74, step: 813, loss: 0.3555978238582611, mean loss: 0.33895682340115146
Epoch: 74, step: 814, loss: 0.31782934069633484, mean loss: 0.33895662717855946
Epoch: 74, step: 815, loss: 0.3076450228691101, mean loss: 0.3389563363731104
Epoch: 74, step: 816, loss: 0.3036624491214752, mean loss: 0.3389560085853897
Epoch: 74, step: 817, loss: 0.3096509277820587, mean loss: 0.33895573642051424
Epoch: 74, step: 818, loss: 0.3114490509033203, mean loss: 0.3389554809602355
Epoch: 74, step: 819, loss: 0.3165740668773651, mean loss: 0.3389552731013432
Epoch: 74, step: 820, loss: 0.35093048214912415, mean loss: 0.33895538431552125
Epoch: 74, step: 821, loss: 0.34222251176834106, mean loss: 0.3389554146571644
Epoch: 74, step: 822, loss: 0.3360759913921356, mean loss: 0.33895538791635826
Epoch: 74, step: 823, loss: 0.30841249227523804, mean loss: 0.3389551042713393
Epoch: 74, step: 824, loss: 0.3378922641277313, mean loss: 0.338955094401073
Epoch: 74, step: 825, loss: 0.32043683528900146, mean loss: 0.33895492242934966
Epoch: 74, step: 826, loss: 0.3366695046424866, mean loss: 0.33895490120577876
Epoch: 74, step: 827, loss: 0.33112746477127075, mean loss: 0.338954828516833
Epoch: 74, step: 828, loss: 0.32004860043525696, mean loss: 0.33895465294708715
Epoch: 74, step: 829, loss: 0.30403536558151245, mean loss: 0.3389543286775687
Epoch: 74, step: 830, loss: 0.33029884099960327, mean loss: 0.33895424830122173
Epoch: 74, step: 831, loss: 0.32269152998924255, mean loss: 0.3389540972842253
Epoch: 74, step: 832, loss: 0.3012487292289734, mean loss: 0.33895374715219645
Epoch: 74, step: 833, loss: 0.3711880147457123, mean loss: 0.33895404647680966
Epoch: 74, step: 834, loss: 0.3737655282020569, mean loss: 0.33895436973020804
Epoch: 74, step: 835, loss: 0.3448445498943329, mean loss: 0.33895442442489443
Epoch: 74, step: 836, loss: 0.316520631313324, mean loss: 0.3389542161124404
Epoch: 74, step: 837, loss: 0.3512144088745117, mean loss: 0.33895432995529856
Epoch: 74, step: 838, loss: 0.29897505044937134, mean loss: 0.3389539587284124
Epoch: 74, step: 839, loss: 0.34062981605529785, mean loss: 0.3389539742894112
Epoch: 74, step: 840, loss: 0.33527347445487976, mean loss: 0.3389539401148304
Epoch: 74, step: 841, loss: 0.3450993001461029, mean loss: 0.3389539971758717
Epoch: 74, step: 842, loss: 0.31996801495552063, mean loss: 0.3389538208884204
Epoch: 74, step: 843, loss: 0.3295958936214447, mean loss: 0.33895373399958784
Epoch: 74, step: 844, loss: 0.3456495702266693, mean loss: 0.3389537961701919
Epoch: 74, step: 845, loss: 0.3659706115722656, mean loss: 0.3389540470180443
Epoch: 74, step: 846, loss: 0.3648836016654968, mean loss: 0.3389542877685772
Epoch: 74, step: 847, loss: 0.3197551369667053, mean loss: 0.33895410951010213
Epoch: 74, step: 848, loss: 0.29624447226524353, mean loss: 0.33895371296734883
Epoch: 74, step: 849, loss: 0.3514367341995239, mean loss: 0.3389538288663817
Epoch: 74, step: 850, loss: 0.333418607711792, mean loss: 0.3389537774749108
Epoch: 74, step: 851, loss: 0.3227595388889313, mean loss: 0.3389536271217468
Epoch: 74, step: 852, loss: 0.3695865571498871, mean loss: 0.3389539115263001
Epoch: 74, step: 853, loss: 0.33330869674682617, mean loss: 0.338953859115059
Epoch: 74, step: 854, loss: 0.33555513620376587, mean loss: 0.338953827560966
Epoch: 74, step: 855, loss: 0.2989785373210907, mean loss: 0.3389534564297063
Epoch: 74, step: 856, loss: 0.3400910794734955, mean loss: 0.3389534669913195
Epoch: 74, step: 857, loss: 0.351087361574173, mean loss: 0.338953579640507
Epoch: 74, step: 858, loss: 0.35764238238334656, mean loss: 0.33895375314283016
Epoch: 74, step: 859, loss: 0.28363195061683655, mean loss: 0.3389532395533678
Epoch: 74, step: 860, loss: 0.3818255364894867, mean loss: 0.33895363756201025
Epoch: 74, step: 861, loss: 0.31443169713020325, mean loss: 0.3389534099125883
Epoch: 74, step: 862, loss: 0.31084051728248596, mean loss: 0.33895314892898626
Epoch: 74, step: 863, loss: 0.321650892496109, mean loss: 0.33895298830647946
Epoch: 74, step: 864, loss: 0.3180781900882721, mean loss: 0.3389527945206975
Epoch: 74, step: 865, loss: 0.32634294033050537, mean loss: 0.3389526774614692
Epoch: 74, step: 866, loss: 0.3771427273750305, mean loss: 0.3389530319823228
Epoch: 74, step: 867, loss: 0.29825377464294434, mean loss: 0.33895265417183174
Epoch: 74, step: 868, loss: 0.32785189151763916, mean loss: 0.3389525511246036
Epoch: 74, step: 869, loss: 0.29081279039382935, mean loss: 0.33895210425234684
Epoch: 74, step: 870, loss: 0.3613429069519043, mean loss: 0.3389523120999867
Epoch: 74, step: 871, loss: 0.31339773535728455, mean loss: 0.33895207488610785
Epoch: 74, step: 872, loss: 0.33409154415130615, mean loss: 0.33895202976798056
Epoch: 74, step: 873, loss: 0.3372775912284851, mean loss: 0.3389520142250627
Epoch: 74, step: 874, loss: 0.33714762330055237, mean loss: 0.33895199747602184
Epoch: 74, step: 875, loss: 0.31790709495544434, mean loss: 0.3389518021310684
Epoch: 74, step: 876, loss: 0.29731494188308716, mean loss: 0.33895141564911535
Epoch: 74, step: 877, loss: 0.3181018829345703, mean loss: 0.3389512221212345
Epoch: 74, step: 878, loss: 0.37250587344169617, mean loss: 0.3389515335766698
Epoch: 74, step: 879, loss: 0.3234546184539795, mean loss: 0.33895138973510225
Epoch: 74, step: 880, loss: 0.33820438385009766, mean loss: 0.3389513828014965
Epoch: 74, step: 881, loss: 0.31633830070495605, mean loss: 0.33895117291193017
Epoch: 74, step: 882, loss: 0.318814218044281, mean loss: 0.33895098600695733
Epoch: 74, step: 883, loss: 0.3133450150489807, mean loss: 0.3389507483424784
Epoch: 74, step: 884, loss: 0.36843782663345337, mean loss: 0.33895102202731786
Epoch: 74, step: 885, loss: 0.33090388774871826, mean loss: 0.33895094733839176
Epoch: 74, step: 886, loss: 0.32119062542915344, mean loss: 0.3389507824987093
Epoch: 74, step: 887, loss: 0.34180399775505066, mean loss: 0.3389508089801399
Epoch: 74, step: 888, loss: 0.3199552297592163, mean loss: 0.33895063267888026
Epoch: 74, step: 889, loss: 0.36543095111846924, mean loss: 0.33895087844501953
Epoch: 74, step: 890, loss: 0.32663920521736145, mean loss: 0.3389507641803697
Epoch: 74, step: 891, loss: 0.39130616188049316, mean loss: 0.33895125008635124
Epoch: 74, step: 892, loss: 0.3383040130138397, mean loss: 0.3389512440794549
Epoch: 74, step: 893, loss: 0.32601577043533325, mean loss: 0.33895112402865546
Epoch: 74, step: 894, loss: 0.35410258173942566, mean loss: 0.33895126464412734
Epoch: 74, step: 895, loss: 0.36283591389656067, mean loss: 0.3389514863072914
Epoch: 74, step: 896, loss: 0.3207956552505493, mean loss: 0.33895131781239046
Epoch: 74, step: 897, loss: 0.353457510471344, mean loss: 0.33895145243563096
Epoch: 74, step: 898, loss: 0.3441506028175354, mean loss: 0.3389515006853677
Epoch: 74, step: 899, loss: 0.33551743626594543, mean loss: 0.33895146881647487
Epoch: 74, step: 900, loss: 0.31731095910072327, mean loss: 0.33895126798952424
Epoch: 74, step: 901, loss: 0.34141942858695984, mean loss: 0.3389512908941865
Epoch: 74, step: 902, loss: 0.34096622467041016, mean loss: 0.33895130959270614
Epoch: 74, step: 903, loss: 0.3319507837295532, mean loss: 0.33895124462865767
Epoch: 74, step: 904, loss: 0.32687634229660034, mean loss: 0.33895113257603815
Epoch: 74, step: 905, loss: 0.3375270962715149, mean loss: 0.33895111936139566
Epoch: 74, step: 906, loss: 0.32314860820770264, mean loss: 0.33895097272005165
Epoch: 74, step: 907, loss: 0.3656201958656311, mean loss: 0.3389512201980883
Epoch: 74, step: 908, loss: 0.3630640506744385, mean loss: 0.3389514439519089
Epoch: 74, step: 909, loss: 0.30473238229751587, mean loss: 0.3389511264207613
Epoch: 74, step: 910, loss: 0.35625067353248596, mean loss: 0.3389512869480759
Epoch: 74, step: 911, loss: 0.3119121193885803, mean loss: 0.33895103604643945
Epoch: 74, step: 912, loss: 0.3316417634487152, mean loss: 0.3389509682229225
Epoch: 74, step: 913, loss: 0.33366596698760986, mean loss: 0.3389509191832896
Epoch: 74, step: 914, loss: 0.34340012073516846, mean loss: 0.33895096046713735
Epoch: 74, step: 915, loss: 0.3411063253879547, mean loss: 0.3389509804664407
Epoch: 74, step: 916, loss: 0.3581044673919678, mean loss: 0.3389511581870843
Epoch: 74, step: 917, loss: 0.32558438181877136, mean loss: 0.3389510341611006
Epoch: 74, step: 918, loss: 0.29938724637031555, mean loss: 0.33895066706494853
Epoch: 74, step: 919, loss: 0.35266801714897156, mean loss: 0.33895079434143016
Epoch: 74, step: 920, loss: 0.3346652686595917, mean loss: 0.3389507545785338
Epoch: 74, step: 921, loss: 0.364606648683548, mean loss: 0.3389509926224213
Epoch: 74, step: 922, loss: 0.31109702587127686, mean loss: 0.33895073418648525
Epoch: 74, step: 923, loss: 0.34163036942481995, mean loss: 0.33895075904856764
Epoch: 74, step: 924, loss: 0.32220396399497986, mean loss: 0.33895060367057844
Epoch: 74, step: 925, loss: 0.3584306240081787, mean loss: 0.33895078440595483
Epoch: 74, step: 926, loss: 0.3071023225784302, mean loss: 0.33895048891908003
Epoch: 74, step: 927, loss: 0.29550912976264954, mean loss: 0.33895008587819125
Epoch: 74, step: 928, loss: 0.29315823316574097, mean loss: 0.3389496610338
Epoch: 74, step: 929, loss: 0.34138238430023193, mean loss: 0.33894968360373734
Epoch: 74, step: 930, loss: 0.3281504809856415, mean loss: 0.33894958341352316
Epoch: 74, step: 931, loss: 0.3081304728984833, mean loss: 0.33894929749013175
Epoch: 74, step: 932, loss: 0.33239132165908813, mean loss: 0.3389492366492683
Epoch: 74, step: 933, loss: 0.3084699511528015, mean loss: 0.33894895388384016
Epoch: 74, step: 934, loss: 0.32741618156433105, mean loss: 0.338948846891862
Epoch: 74, step: 935, loss: 0.3100256621837616, mean loss: 0.33894857856782395
Epoch: 74, step: 936, loss: 0.3278792202472687, mean loss: 0.3389484758769412
Epoch: 74, step: 937, loss: 0.33831509947776794, mean loss: 0.33894847000113737
Epoch: 74, step: 938, loss: 0.3986304998397827, mean loss: 0.33894902366345786
Epoch: 74, step: 939, loss: 0.32550835609436035, mean loss: 0.33894889897731395
Epoch: 74, step: 940, loss: 0.3307468891143799, mean loss: 0.33894882288976175
Epoch: 74, step: 941, loss: 0.37623053789138794, mean loss: 0.3389491687376903
Epoch: 74, step: 942, loss: 0.3405173420906067, mean loss: 0.33894918328488793
Epoch: 74, step: 943, loss: 0.3188413381576538, mean loss: 0.3389489967557124
Epoch: 74, step: 944, loss: 0.313555508852005, mean loss: 0.33894876119678524
Epoch: 74, step: 945, loss: 0.33414119482040405, mean loss: 0.33894871660052195
Epoch: 74, step: 946, loss: 0.30492353439331055, mean loss: 0.33894840097681755
Epoch: 74, step: 947, loss: 0.309234619140625, mean loss: 0.3389481253489945
Epoch: 74, step: 948, loss: 0.35525450110435486, mean loss: 0.33894827660706
Epoch: 74, step: 949, loss: 0.3327494263648987, mean loss: 0.3389482191070114
Epoch: 74, step: 950, loss: 0.3934120833873749, mean loss: 0.3389487243048583
Epoch: 74, step: 951, loss: 0.36071574687957764, mean loss: 0.33894892621030664
Epoch: 74, step: 952, loss: 0.31258636713027954, mean loss: 0.33894868168008113
Epoch: 74, step: 953, loss: 0.3271732032299042, mean loss: 0.3389485724557193
Epoch: 74, step: 954, loss: 0.3063679337501526, mean loss: 0.3389482702542862
Epoch: 74, step: 955, loss: 0.32727834582328796, mean loss: 0.33894816201100686
Epoch: 74, step: 956, loss: 0.3389759659767151, mean loss: 0.3389481622688975
Epoch: 74, step: 957, loss: 0.31373298168182373, mean loss: 0.33894792839221555
Epoch: 74, step: 958, loss: 0.32418790459632874, mean loss: 0.33894779149082155
Epoch: 74, step: 959, loss: 0.3049226403236389, mean loss: 0.3389474759054616
Epoch: 74, step: 960, loss: 0.3357873260974884, mean loss: 0.3389474465951505
Epoch: 74, step: 961, loss: 0.29504817724227905, mean loss: 0.33894703943429283
Epoch: 74, step: 962, loss: 0.29979363083839417, mean loss: 0.3389466762941358
Epoch: 74, step: 963, loss: 0.33170169591903687, mean loss: 0.33894660909899227
Epoch: 74, step: 964, loss: 0.3518066108226776, mean loss: 0.3389467283707642
Epoch: 74, step: 965, loss: 0.3267371356487274, mean loss: 0.3389466151323461
Epoch: 74, step: 966, loss: 0.3234652876853943, mean loss: 0.3389464715514084
Epoch: 74, step: 967, loss: 0.3459847867488861, mean loss: 0.3389465368273692
Epoch: 74, step: 968, loss: 0.3624071478843689, mean loss: 0.33894675440781025
Epoch: 74, step: 969, loss: 0.3443838059902191, mean loss: 0.33894680483211964
Epoch: 74, step: 970, loss: 0.3394533097743988, mean loss: 0.33894680952950473
Epoch: 74, step: 971, loss: 0.3252478837966919, mean loss: 0.3389466824852701
Epoch: 74, step: 972, loss: 0.3367021381855011, mean loss: 0.3389466616694942
Epoch: 74, step: 973, loss: 0.3272280693054199, mean loss: 0.3389465529929444
Epoch: 74, step: 974, loss: 0.36518657207489014, mean loss: 0.33894679633687225
Epoch: 74, step: 975, loss: 0.33712238073349, mean loss: 0.33894677941781665
Epoch: 74, step: 976, loss: 0.33977919816970825, mean loss: 0.33894678713733434
Epoch: 74, step: 977, loss: 0.33742469549179077, mean loss: 0.33894677302219767
Epoch: 74, step: 978, loss: 0.32296621799468994, mean loss: 0.3389466248276873
Epoch: 74, step: 979, loss: 0.34707584977149963, mean loss: 0.33894670021276224
Epoch: 74, step: 980, loss: 0.33030498027801514, mean loss: 0.3389466200758896
Epoch: 74, step: 981, loss: 0.3523043096065521, mean loss: 0.33894674394400226
Epoch: 74, step: 982, loss: 0.35862070322036743, mean loss: 0.33894692638226
Epoch: 74, step: 983, loss: 0.3507707715034485, mean loss: 0.3389470360247407
Epoch: 74, step: 984, loss: 0.3397795855998993, mean loss: 0.3389470437448988
Epoch: 74, step: 985, loss: 0.35756081342697144, mean loss: 0.33894721634712877
Epoch: 74, step: 986, loss: 0.3328736126422882, mean loss: 0.33894716002818637
Epoch: 74, step: 987, loss: 0.36561310291290283, mean loss: 0.3389474072922241
Epoch: 74, step: 988, loss: 0.35169264674186707, mean loss: 0.33894752547331225
Epoch: 74, step: 989, loss: 0.2929869294166565, mean loss: 0.3389470993045526
Epoch: 74, step: 990, loss: 0.31330791115760803, mean loss: 0.3389468615678687
Epoch: 74, step: 991, loss: 0.39494752883911133, mean loss: 0.33894738082336967
Epoch: 74, step: 992, loss: 0.3137715756893158, mean loss: 0.3389471473876852
Epoch: 74, step: 993, loss: 0.36095884442329407, mean loss: 0.33894735148316074
Epoch: 74, step: 994, loss: 0.3674374222755432, mean loss: 0.3389476156445574
Epoch: 74, step: 995, loss: 0.36047545075416565, mean loss: 0.3389478152498972
Epoch: 74, step: 996, loss: 0.3489854633808136, mean loss: 0.3389479083177593
Epoch: 74, step: 997, loss: 0.33416983485221863, mean loss: 0.3389478640164495
Epoch: 74, step: 998, loss: 0.3545491099357605, mean loss: 0.3389480086666365
Epoch: 74, step: 999, loss: 0.3254050612449646, mean loss: 0.33894788310155505
Epoch: 74, step: 1000, loss: 0.3560951352119446, mean loss: 0.338948042082911
Epoch: 74, step: 1001, loss: 0.34906667470932007, mean loss: 0.3389481358973024
Epoch: 74, step: 1002, loss: 0.32963091135025024, mean loss: 0.33894804951392643
Epoch: 74, step: 1003, loss: 0.322561651468277, mean loss: 0.33894789759108157
Epoch: 74, step: 1004, loss: 0.3509265184402466, mean loss: 0.3389480086471709
Epoch: 74, step: 1005, loss: 0.3171522617340088, mean loss: 0.33894780657649803
Epoch: 74, step: 1006, loss: 0.31501758098602295, mean loss: 0.3389475847189047
Epoch: 74, step: 1007, loss: 0.32378125190734863, mean loss: 0.33894744411283767
Epoch: 74, step: 1008, loss: 0.32914379239082336, mean loss: 0.3389473532246745
Epoch: 74, step: 1009, loss: 0.3669227063655853, mean loss: 0.3389476125775117
Epoch: 74, step: 1010, loss: 0.34777772426605225, mean loss: 0.33894769443861555
Epoch: 74, step: 1011, loss: 0.3946349024772644, mean loss: 0.3389482106918884
Epoch: 74, step: 1012, loss: 0.36625340580940247, mean loss: 0.33894846382481
Epoch: 74, step: 1013, loss: 0.33714374899864197, mean loss: 0.338948447094349
Epoch: 74, step: 1014, loss: 0.3104974329471588, mean loss: 0.3389481833439977
Epoch: 74, step: 1015, loss: 0.37343665957450867, mean loss: 0.338948503060664
Epoch: 74, step: 1016, loss: 0.3304048180580139, mean loss: 0.3389484238593346
Epoch: 74, step: 1017, loss: 0.37467053532600403, mean loss: 0.3389487550059637
Epoch: 74, step: 1018, loss: 0.30719149112701416, mean loss: 0.33894846061649553
Epoch: 74, step: 1019, loss: 0.315584659576416, mean loss: 0.33894824403633833
Epoch: 74, step: 1020, loss: 0.3715226650238037, mean loss: 0.3389485459952451
Epoch: 74, step: 1021, loss: 0.33540618419647217, mean loss: 0.33894851315850544
Epoch: 74, step: 1022, loss: 0.3270457684993744, mean loss: 0.33894840282429156
Epoch: 74, step: 1023, loss: 0.34896260499954224, mean loss: 0.3389484956515271
Epoch: 74, step: 1024, loss: 0.3175309896469116, mean loss: 0.3389482971225368
Epoch: 74, step: 1025, loss: 0.2929936945438385, mean loss: 0.3389478711515446
Epoch: 74, step: 1026, loss: 0.298307865858078, mean loss: 0.3389474944471028
Epoch: 74, step: 1027, loss: 0.3935179114341736, mean loss: 0.33894800027203503
Epoch: 74, step: 1028, loss: 0.3527175188064575, mean loss: 0.3389481279034809
Epoch: 74, step: 1029, loss: 0.36657437682151794, mean loss: 0.3389483839723769
Epoch: 74, step: 1030, loss: 0.32146796584129333, mean loss: 0.3389482219471271
Epoch: 74, step: 1031, loss: 0.36517220735549927, mean loss: 0.33894846501387604
Epoch: 74, step: 1032, loss: 0.3365882337093353, mean loss: 0.3389484431373983
Epoch: 74, step: 1033, loss: 0.3198494613170624, mean loss: 0.3389482661146731
Epoch: 74, step: 1034, loss: 0.32490283250808716, mean loss: 0.33894813593297485
Epoch: 74, step: 1035, loss: 0.31203463673591614, mean loss: 0.33894788648445967
Epoch: 74, step: 1036, loss: 0.3164365291595459, mean loss: 0.3389476778392526
Epoch: 74, step: 1037, loss: 0.3772062659263611, mean loss: 0.3389480324334663
Epoch: 74, step: 1038, loss: 0.32439368963241577, mean loss: 0.3389478975398864
Epoch: 74, step: 1039, loss: 0.32713037729263306, mean loss: 0.33894778801293224
Epoch: 74, step: 1040, loss: 0.34891486167907715, mean loss: 0.3389478803887505
Epoch: 74, step: 1041, loss: 0.35055720806121826, mean loss: 0.3389479879841431
Epoch: 74, step: 1042, loss: 0.3915182650089264, mean loss: 0.338948475201606
Epoch: 74, step: 1043, loss: 0.3289321959018707, mean loss: 0.3389483823723261
Epoch: 74, step: 1044, loss: 0.3474331200122833, mean loss: 0.33894846100679327
Epoch: 74, step: 1045, loss: 0.322693794965744, mean loss: 0.33894831036393175
Epoch: 74, step: 1046, loss: 0.3134033977985382, mean loss: 0.3389480736243363
Epoch: 74, step: 1047, loss: 0.3431369662284851, mean loss: 0.3389481124448861
Epoch: 74, step: 1048, loss: 0.3054775893688202, mean loss: 0.3389478022597874
Epoch: 74, step: 1049, loss: 0.3743768334388733, mean loss: 0.3389481305921431
Epoch: 74, step: 1050, loss: 0.32234323024749756, mean loss: 0.3389479767105567
Epoch: 74, step: 1051, loss: 0.3473587930202484, mean loss: 0.33894805465488254
Epoch: 74, step: 1052, loss: 0.31905314326286316, mean loss: 0.3389478702873933
Epoch: 74, step: 1053, loss: 0.33503472805023193, mean loss: 0.3389478340243756
Epoch: 74, step: 1054, loss: 0.31627872586250305, mean loss: 0.33894762395211087
Epoch: 74, step: 1055, loss: 0.3515031039714813, mean loss: 0.3389477403013586
Epoch: 74, step: 1056, loss: 0.31504037976264954, mean loss: 0.33894751875844403
Epoch: 74, step: 1057, loss: 0.3530210852622986, mean loss: 0.3389476491730937
Epoch: 74, step: 1058, loss: 0.2926616370677948, mean loss: 0.3389472202613381
Epoch: 74, step: 1059, loss: 0.31310421228408813, mean loss: 0.33894698078797014
Epoch: 74, step: 1060, loss: 0.3182843029499054, mean loss: 0.33894678931973216
Epoch: 74, step: 1061, loss: 0.34670892357826233, mean loss: 0.3389468612459563
Epoch: 74, step: 1062, loss: 0.3666648864746094, mean loss: 0.3389471180869688
Epoch: 74, step: 1063, loss: 0.3095099925994873, mean loss: 0.3389468453189417
Epoch: 74, step: 1064, loss: 0.3013591766357422, mean loss: 0.33894649703020563
Epoch: 74, step: 1065, loss: 0.3576051592826843, mean loss: 0.338946669920462
Epoch: 74, step: 1066, loss: 0.3423669636249542, mean loss: 0.3389467016124434
Epoch: 74, step: 1067, loss: 0.337926983833313, mean loss: 0.33894669216396317
Epoch: 74, step: 1068, loss: 0.3474617600440979, mean loss: 0.33894677106197457
Epoch: 74, step: 1069, loss: 0.3368111252784729, mean loss: 0.3389467512739181
Epoch: 74, step: 1070, loss: 0.3205040991306305, mean loss: 0.3389465803931177
Epoch: 74, step: 1071, loss: 0.28701332211494446, mean loss: 0.3389460992088256
Epoch: 74, step: 1072, loss: 0.3397265672683716, mean loss: 0.3389461064401357
Epoch: 74, step: 1073, loss: 0.3571012318134308, mean loss: 0.3389462746521747
Epoch: 74, step: 1074, loss: 0.32212895154953003, mean loss: 0.33894611883667125
Epoch: 74, step: 1075, loss: 0.3235038220882416, mean loss: 0.3389459757623583
Epoch: 74, step: 1076, loss: 0.3883313536643982, mean loss: 0.33894643331823
Epoch: 74, step: 1077, loss: 0.3465930223464966, mean loss: 0.33894650416327443
Epoch: 74, step: 1078, loss: 0.32063931226730347, mean loss: 0.3389463345501564
Epoch: 74, step: 1079, loss: 0.30805349349975586, mean loss: 0.3389460483357233
Epoch: 74, step: 1080, loss: 0.3513031303882599, mean loss: 0.3389461628199322
Epoch: 74, step: 1081, loss: 0.34935852885246277, mean loss: 0.3389462592861075
Epoch: 74, step: 1082, loss: 0.3325660824775696, mean loss: 0.3389462001770106
Epoch: 74, step: 1083, loss: 0.33300694823265076, mean loss: 0.33894614515336835
Epoch: 74, step: 1084, loss: 0.3417440354824066, mean loss: 0.3389461710739206
Epoch: 74, step: 1085, loss: 0.34621766209602356, mean loss: 0.3389462384387186
Epoch: 74, step: 1086, loss: 0.3556824326515198, mean loss: 0.33894639348530997
Epoch: 74, step: 1087, loss: 0.33585864305496216, mean loss: 0.3389463648801959
Epoch: 74, step: 1088, loss: 0.3723604381084442, mean loss: 0.3389466744274026
Epoch: 74, step: 1089, loss: 0.3481953740119934, mean loss: 0.33894676010634933
Epoch: 74, step: 1090, loss: 0.33293843269348145, mean loss: 0.3389467044463735
Epoch: 74, step: 1091, loss: 0.33622583746910095, mean loss: 0.33894667924102484
Epoch: 74, step: 1092, loss: 0.35015547275543213, mean loss: 0.3389467830751828
Epoch: 74, step: 1093, loss: 0.29950907826423645, mean loss: 0.33894641774211365
Epoch: 74, step: 1094, loss: 0.35618624091148376, mean loss: 0.3389465774425626
Epoch: 74, step: 1095, loss: 0.35227298736572266, mean loss: 0.3389467008901127
Epoch: 74, step: 1096, loss: 0.31805703043937683, mean loss: 0.33894650738302673
Epoch: 74, step: 1097, loss: 0.3235985040664673, mean loss: 0.3389463652113303
Epoch: 74, step: 1098, loss: 0.34028542041778564, mean loss: 0.3389463776151579
Epoch: 74, step: 1099, loss: 0.30893293023109436, mean loss: 0.3389460995996017
Epoch: 74, step: 1100, loss: 0.34627261757850647, mean loss: 0.33894616746475154
Epoch: 74, step: 1101, loss: 0.32608237862586975, mean loss: 0.3389460483092574
Epoch: 74, step: 1102, loss: 0.315411776304245, mean loss: 0.33894583031657494
Epoch: 74, step: 1103, loss: 0.3254335820674896, mean loss: 0.3389457051568098
Epoch: 74, step: 1104, loss: 0.3133152723312378, mean loss: 0.33894546775225787
Epoch: 74, step: 1105, loss: 0.36531445384025574, mean loss: 0.3389457119954739
Epoch: 74, step: 1106, loss: 0.31926530599594116, mean loss: 0.3389455297070418
Epoch: 74, step: 1107, loss: 0.3599831163883209, mean loss: 0.33894572456446354
Epoch: 74, step: 1108, loss: 0.30945974588394165, mean loss: 0.33894545145763555
Epoch: 74, step: 1109, loss: 0.32608333230018616, mean loss: 0.33894533232643537
Epoch: 74, step: 1110, loss: 0.34791579842567444, mean loss: 0.3389454154116938
Epoch: 74, step: 1111, loss: 0.34757915139198303, mean loss: 0.33894549537738716
Epoch: 74, step: 1112, loss: 0.3263792097568512, mean loss: 0.338945378989483
Epoch: 74, step: 1113, loss: 0.3538276255130768, mean loss: 0.33894551682634994
Epoch: 74, step: 1114, loss: 0.3360505998134613, mean loss: 0.33894549001436325
Epoch: 74, step: 1115, loss: 0.3426162600517273, mean loss: 0.33894552401178885
Epoch: 74, step: 1116, loss: 0.3132845461368561, mean loss: 0.33894528635072657
Epoch: 74, step: 1117, loss: 0.31144586205482483, mean loss: 0.3389450316651143
Epoch: 74, step: 1118, loss: 0.36710506677627563, mean loss: 0.33894529246655086
Epoch: 74, step: 1119, loss: 0.32018566131591797, mean loss: 0.33894511872765376
Epoch: 74, step: 1120, loss: 0.3280109763145447, mean loss: 0.338945017464029
Epoch: 74, step: 1121, loss: 0.34114208817481995, mean loss: 0.33894503781142116
Epoch: 74, step: 1122, loss: 0.3030986487865448, mean loss: 0.33894470583586084
Epoch: 74, step: 1123, loss: 0.32495829463005066, mean loss: 0.33894457630806674
Epoch: 74, step: 1124, loss: 0.3422480821609497, mean loss: 0.33894460690146605
Epoch: 74, step: 1125, loss: 0.33421239256858826, mean loss: 0.33894456307736265
Epoch: 74, step: 1126, loss: 0.322966068983078, mean loss: 0.3389444151050513
Epoch: 74, step: 1127, loss: 0.3362482190132141, mean loss: 0.3389443901365736
Epoch: 74, step: 1128, loss: 0.2885930836200714, mean loss: 0.33894392385601135
Epoch: 74, step: 1129, loss: 0.3223646879196167, mean loss: 0.33894377032466527
Epoch: 74, step: 1130, loss: 0.35180899500846863, mean loss: 0.3389438894614566
Epoch: 74, step: 1131, loss: 0.3268435001373291, mean loss: 0.33894377740836434
Epoch: 74, step: 1132, loss: 0.3440443277359009, mean loss: 0.3389438246404929
Epoch: 74, step: 1133, loss: 0.32987794280052185, mean loss: 0.3389437406893693
Epoch: 74, step: 1134, loss: 0.3286179006099701, mean loss: 0.33894364507177077
Epoch: 74, step: 1135, loss: 0.34168434143066406, mean loss: 0.3389436704504688
Epoch: 74, step: 1136, loss: 0.3405957520008087, mean loss: 0.33894368574851175
Epoch: 74, step: 1137, loss: 0.38913533091545105, mean loss: 0.33894415051178717
Epoch: 74, step: 1138, loss: 0.3550631105899811, mean loss: 0.3389442997683276
Epoch: 74, step: 1139, loss: 0.3524736166000366, mean loss: 0.3389444250444196
Epoch: 74, step: 1140, loss: 0.3356751501560211, mean loss: 0.3389443947725149
Epoch: 74, step: 1141, loss: 0.33587512373924255, mean loss: 0.3389443663528124
Epoch: 74, step: 1142, loss: 0.32760047912597656, mean loss: 0.338944261315847
Epoch: 74, step: 1143, loss: 0.3991609513759613, mean loss: 0.338944818877792
Epoch: 74, step: 1144, loss: 0.3361144959926605, mean loss: 0.33894479267134126
Epoch: 74, step: 1145, loss: 0.3530142605304718, mean loss: 0.3389449229417794
Epoch: 74, step: 1146, loss: 0.34524402022361755, mean loss: 0.33894498126513417
Epoch: 74, step: 1147, loss: 0.3586815893650055, mean loss: 0.33894516400473734
Epoch: 74, step: 1148, loss: 0.3604949116706848, mean loss: 0.33894536353020066
Epoch: 74, step: 1149, loss: 0.28239449858665466, mean loss: 0.33894483994016916
Epoch: 74, step: 1150, loss: 0.3205505311489105, mean loss: 0.33894466963353354
Epoch: 74, step: 1151, loss: 0.3552069067955017, mean loss: 0.3389448201986506
Epoch: 74, step: 1152, loss: 0.32031741738319397, mean loss: 0.3389446477370704
Epoch: 74, step: 1153, loss: 0.3250342309474945, mean loss: 0.33894451894883976
Epoch: 74, step: 1154, loss: 0.3011159896850586, mean loss: 0.3389441687203513
Epoch: 74, step: 1155, loss: 0.3139125108718872, mean loss: 0.3389439369714915
Epoch: 74, step: 1156, loss: 0.31544074416160583, mean loss: 0.338943719375528
Epoch: 74, step: 1157, loss: 0.32657289505004883, mean loss: 0.33894360484570474
Epoch: 74, step: 1158, loss: 0.3243599832057953, mean loss: 0.3389434698309231
Epoch: 74, step: 1159, loss: 0.3468022048473358, mean loss: 0.3389435425862095
Epoch: 74, step: 1160, loss: 0.333120733499527, mean loss: 0.33894348867979585
Epoch: 74, step: 1161, loss: 0.3411169648170471, mean loss: 0.3389435088012213
Epoch: 74, step: 1162, loss: 0.33752667903900146, mean loss: 0.33894349568473475
Epoch: 74, step: 1163, loss: 0.37938445806503296, mean loss: 0.33894387006875976
Epoch: 74, step: 1164, loss: 0.3095482587814331, mean loss: 0.33894359794008766
Epoch: 74, step: 1165, loss: 0.3849041163921356, mean loss: 0.3389440234137731
Epoch: 74, step: 1166, loss: 0.34883663058280945, mean loss: 0.3389441149924848
Epoch: 74, step: 1167, loss: 0.36271148920059204, mean loss: 0.33894433501187127
Epoch: 74, step: 1168, loss: 0.3779936730861664, mean loss: 0.3389446964961395
Epoch: 74, step: 1169, loss: 0.3283802270889282, mean loss: 0.33894459870052174
Epoch: 74, step: 1170, loss: 0.33627545833587646, mean loss: 0.3389445739924361
Epoch: 74, step: 1171, loss: 0.3308849632740021, mean loss: 0.3389444993857534
Epoch: 74, step: 1172, loss: 0.3410479724407196, mean loss: 0.33894451885712734
Epoch: 74, step: 1173, loss: 0.32045233249664307, mean loss: 0.33894434768072856
Epoch: 74, step: 1174, loss: 0.35727354884147644, mean loss: 0.33894451734685366
Epoch: 74, step: 1175, loss: 0.3351507782936096, mean loss: 0.3389444822300452
Epoch: 74, step: 1176, loss: 0.32364264130592346, mean loss: 0.338944340589612
Epoch: 74, step: 1177, loss: 0.3195265531539917, mean loss: 0.33894416085186796
Epoch: 74, step: 1178, loss: 0.34265992045402527, mean loss: 0.33894419524590325
Epoch: 74, step: 1179, loss: 0.3292316794395447, mean loss: 0.3389441053451682
Epoch: 74, step: 1180, loss: 0.32515865564346313, mean loss: 0.33894397774583
Epoch: 74, step: 1181, loss: 0.32295697927474976, mean loss: 0.33894382977013193
Epoch: 74, step: 1182, loss: 0.3284566104412079, mean loss: 0.3389437327013019
Epoch: 74, step: 1183, loss: 0.34646886587142944, mean loss: 0.3389438023526641
Epoch: 74, step: 1184, loss: 0.31577226519584656, mean loss: 0.3389435878828132
Epoch: 74, step: 1185, loss: 0.41398122906684875, mean loss: 0.3389442824056949
Epoch: 74, step: 1186, loss: 0.31730350852012634, mean loss: 0.3389440821079071
Epoch: 74, step: 1187, loss: 0.3453926146030426, mean loss: 0.3389441417922255
Epoch: 74, step: 1188, loss: 0.3451698422431946, mean loss: 0.3389441994135911
Epoch: 74, step: 1189, loss: 0.3192579448223114, mean loss: 0.33894401721106077
Epoch: 74, step: 1190, loss: 0.30939650535583496, mean loss: 0.3389437437419977
Epoch: 74, step: 1191, loss: 0.30874499678611755, mean loss: 0.33894346424818983
Epoch: 74, step: 1192, loss: 0.29717493057250977, mean loss: 0.338943077677896
Epoch: 74, step: 1193, loss: 0.32866549491882324, mean loss: 0.33894298255912914
Epoch: 74, step: 1194, loss: 0.33796027302742004, mean loss: 0.3389429734642616
Epoch: 74, step: 1195, loss: 0.2961600720882416, mean loss: 0.3389425775169272
Epoch: 74, step: 1196, loss: 0.31995344161987305, mean loss: 0.33894240177783713
Epoch: 74, step: 1197, loss: 0.39314159750938416, mean loss: 0.3389429033714452
Epoch: 74, step: 1198, loss: 0.3438773453235626, mean loss: 0.3389429490374667
Epoch: 74, step: 1199, loss: 0.33516356348991394, mean loss: 0.33894291406129184
Epoch: 74, step: 1200, loss: 0.2798319160938263, mean loss: 0.3389423670259497
Epoch: 74, step: 1201, loss: 0.3581359386444092, mean loss: 0.3389425446488154
Epoch: 74, step: 1202, loss: 0.4304007589817047, mean loss: 0.3389433910217629
Epoch: 74, step: 1203, loss: 0.34183740615844727, mean loss: 0.3389434178033207
Epoch: 74, step: 1204, loss: 0.3429839015007019, mean loss: 0.3389434551940879
Epoch: 74, step: 1205, loss: 0.3339253067970276, mean loss: 0.33894340875640955
Epoch: 74, step: 1206, loss: 0.3490474224090576, mean loss: 0.3389435022575492
Epoch: 74, step: 1207, loss: 0.3263181447982788, mean loss: 0.33894338542532515
Epoch: 74, step: 1208, loss: 0.33343663811683655, mean loss: 0.33894333446759317
Epoch: 74, step: 1209, loss: 0.32450181245803833, mean loss: 0.3389432008314633
Epoch: 74, step: 1210, loss: 0.30398866534233093, mean loss: 0.33894287737901724
Epoch: 74, step: 1211, loss: 0.3362863063812256, mean loss: 0.33894285279661546
Epoch: 74, step: 1212, loss: 0.3439456820487976, mean loss: 0.3389428990895325
Epoch: 74, step: 1213, loss: 0.36218875646591187, mean loss: 0.338943114189536
Epoch: 74, step: 1214, loss: 0.40136104822158813, mean loss: 0.33894369175367467
Epoch: 74, step: 1215, loss: 0.38225221633911133, mean loss: 0.33894409249137347
Epoch: 74, step: 1216, loss: 0.3351290822029114, mean loss: 0.3389440571910645
Epoch: 74, step: 1217, loss: 0.3272705674171448, mean loss: 0.3389439491772057
Epoch: 74, step: 1218, loss: 0.3229995369911194, mean loss: 0.33894380164621163
Epoch: 74, step: 1219, loss: 0.3401179015636444, mean loss: 0.3389438125098624
Epoch: 74, step: 1220, loss: 0.3090120553970337, mean loss: 0.33894353556141715
Epoch: 74, step: 1221, loss: 0.35562095046043396, mean loss: 0.33894368987048007
Epoch: 74, step: 1222, loss: 0.32342448830604553, mean loss: 0.33894354627920364
Epoch: 74, step: 1223, loss: 0.33592653274536133, mean loss: 0.33894351836457065
Epoch: 74, step: 1224, loss: 0.3200218379497528, mean loss: 0.33894334329512815
Epoch: 74, step: 1225, loss: 0.35425397753715515, mean loss: 0.3389434849527052
Epoch: 74, step: 1226, loss: 0.33231160044670105, mean loss: 0.33894342359352286
Epoch: 74, step: 1227, loss: 0.33638259768486023, mean loss: 0.3389433999005997
Epoch: 74, step: 1228, loss: 0.336417555809021, mean loss: 0.3389433765315467
Epoch: 74, step: 1229, loss: 0.335528701543808, mean loss: 0.3389433449393425
Epoch: 74, step: 1230, loss: 0.33118075132369995, mean loss: 0.33894327312132905
Epoch: 74, step: 1231, loss: 0.3217551112174988, mean loss: 0.3389431141012537
Epoch: 74, step: 1232, loss: 0.31067705154418945, mean loss: 0.3389428525939536
Epoch: 74, step: 1233, loss: 0.3426675796508789, mean loss: 0.3389428870534509
Epoch: 74, step: 1234, loss: 0.3358931541442871, mean loss: 0.33894285883895653
Epoch: 74, step: 1235, loss: 0.3182542622089386, mean loss: 0.3389426674409194
Epoch: 74, step: 1236, loss: 0.3294084966182709, mean loss: 0.33894257923751286
Epoch: 74, step: 1237, loss: 0.32686567306518555, mean loss: 0.33894246751155055
Epoch: 74, step: 1238, loss: 0.3104539215564728, mean loss: 0.3389422039605449
Epoch: 74, step: 1239, loss: 0.3170028328895569, mean loss: 0.33894200099863075
Epoch: 74, step: 1240, loss: 0.3246409296989441, mean loss: 0.33894186870012755
Epoch: 74, step: 1241, loss: 0.32050925493240356, mean loss: 0.3389416981825068
Epoch: 74, step: 1242, loss: 0.32227903604507446, mean loss: 0.3389415440398955
Epoch: 74, step: 1243, loss: 0.3193701505661011, mean loss: 0.3389413629909272
Epoch: 74, step: 1244, loss: 0.37871816754341125, mean loss: 0.3389417309505627
Epoch: 74, step: 1245, loss: 0.32895898818969727, mean loss: 0.3389416386049746
Epoch: 74, step: 1246, loss: 0.33007800579071045, mean loss: 0.3389415566124969
Epoch: 74, step: 1247, loss: 0.31994014978408813, mean loss: 0.3389413808428045
Epoch: 74, step: 1248, loss: 0.32597222924232483, mean loss: 0.3389412608747031
Epoch: 74, step: 1249, loss: 0.3359932005405426, mean loss: 0.33894123360461326
Epoch: 74, step: 1250, loss: 0.3066464066505432, mean loss: 0.33894093487440197
Epoch: 74, step: 1251, loss: 0.3482957184314728, mean loss: 0.3389410214062364
Epoch: 74, step: 1252, loss: 0.314296692609787, mean loss: 0.33894079344807565
Epoch: 74, step: 1253, loss: 0.34131479263305664, mean loss: 0.33894081540718385
Epoch: 74, step: 1254, loss: 0.32300257682800293, mean loss: 0.3389406679824206
Epoch: 74, step: 1255, loss: 0.32510632276535034, mean loss: 0.33894054001933405
Epoch: 74, step: 1256, loss: 0.353992223739624, mean loss: 0.33894067924110866
Epoch: 74, step: 1257, loss: 0.35983213782310486, mean loss: 0.33894087247656923
Epoch: 74, step: 1258, loss: 0.34523138403892517, mean loss: 0.338940930660092
Epoch: 74, step: 1259, loss: 0.34433528780937195, mean loss: 0.33894098055425337
Epoch: 74, step: 1260, loss: 0.32178547978401184, mean loss: 0.33894082187892227
Epoch: 74, step: 1261, loss: 0.30548742413520813, mean loss: 0.33894051246330464
Epoch: 74, step: 1262, loss: 0.3269207179546356, mean loss: 0.338940401291406
Epoch: 74, step: 1263, loss: 0.34676700830459595, mean loss: 0.3389404736795582
Epoch: 74, step: 1264, loss: 0.29285669326782227, mean loss: 0.3389400474554166
Epoch: 74, step: 1265, loss: 0.32343775033950806, mean loss: 0.33893990407759234
Epoch: 74, step: 1266, loss: 0.3080207407474518, mean loss: 0.3389396181147229
Epoch: 74, step: 1267, loss: 0.36764824390411377, mean loss: 0.3389398836304806
Epoch: 74, step: 1268, loss: 0.32277432084083557, mean loss: 0.3389397341223854
Epoch: 74, step: 1269, loss: 0.31851866841316223, mean loss: 0.33893954525878456
Epoch: 74, step: 1270, loss: 0.32575616240501404, mean loss: 0.33893942333379956
Epoch: 74, step: 1271, loss: 0.3050854802131653, mean loss: 0.3389391102424345
Epoch: 74, step: 1272, loss: 0.3225529193878174, mean loss: 0.3389389586994548
Epoch: 74, step: 1273, loss: 0.32155075669288635, mean loss: 0.3389387978911499
Epoch: 74, step: 1274, loss: 0.29828858375549316, mean loss: 0.33893842195627333
Epoch: 74, step: 1275, loss: 0.330718457698822, mean loss: 0.3389383459384039
Epoch: 74, step: 1276, loss: 0.3649142384529114, mean loss: 0.3389385861600986
Epoch: 74, step: 1277, loss: 0.3275654911994934, mean loss: 0.33893848098415985
Epoch: 74, step: 1278, loss: 0.32241353392601013, mean loss: 0.338938328166413
Epoch: 74, step: 1279, loss: 0.31101539731025696, mean loss: 0.33893806994592346
Epoch: 74, step: 1280, loss: 0.3241962194442749, mean loss: 0.3389379336202394
Epoch: 74, step: 1281, loss: 0.3184830844402313, mean loss: 0.3389377444651858
Epoch: 74, step: 1282, loss: 0.3469809591770172, mean loss: 0.33893781884366825
Epoch: 74, step: 1283, loss: 0.325246125459671, mean loss: 0.33893769223285464
Epoch: 74, step: 1284, loss: 0.2878565788269043, mean loss: 0.3389372198762701
Epoch: 74, step: 1285, loss: 0.34419429302215576, mean loss: 0.33893726848895667
Epoch: 74, step: 1286, loss: 0.31878599524497986, mean loss: 0.3389370821498201
Epoch: 74, step: 1287, loss: 0.34349942207336426, mean loss: 0.3389371243374581
Epoch: 74, step: 1288, loss: 0.3227382004261017, mean loss: 0.3389369745485274
Epoch: 74, step: 1289, loss: 0.347562700510025, mean loss: 0.33893705430853666
Epoch: 74, step: 1290, loss: 0.3245190680027008, mean loss: 0.3389369209901246
Epoch: 74, step: 1291, loss: 0.35821956396102905, mean loss: 0.3389370992887799
Epoch: 74, step: 1292, loss: 0.3103466033935547, mean loss: 0.33893683492668786
Epoch: 74, step: 1293, loss: 0.31588831543922424, mean loss: 0.33893662181046513
Epoch: 74, step: 1294, loss: 0.3127169907093048, mean loss: 0.3389363793750637
Epoch: 74, step: 1295, loss: 0.3441312909126282, mean loss: 0.33893642740849383
Epoch: 74, step: 1296, loss: 0.3379474878311157, mean loss: 0.33893641826459975
Epoch: 74, step: 1297, loss: 0.30706846714019775, mean loss: 0.33893612361113223
Epoch: 74, step: 1298, loss: 0.33156049251556396, mean loss: 0.3389360554161242
Epoch: 74, step: 1299, loss: 0.32172760367393494, mean loss: 0.3389358963084303
Epoch: 74, step: 1300, loss: 0.33783647418022156, mean loss: 0.3389358861433728
Epoch: 74, step: 1301, loss: 0.33613696694374084, mean loss: 0.3389358602653129
Epoch: 74, step: 1302, loss: 0.32094600796699524, mean loss: 0.33893569393747797
Epoch: 74, step: 1303, loss: 0.2845468521118164, mean loss: 0.33893519108206166
Epoch: 74, step: 1304, loss: 0.3256516754627228, mean loss: 0.33893506826962816
Epoch: 74, step: 1305, loss: 0.3596808612346649, mean loss: 0.33893526007259933
Epoch: 74, step: 1306, loss: 0.3465266525745392, mean loss: 0.3389353302573437
Epoch: 74, step: 1307, loss: 0.3479834198951721, mean loss: 0.33893541390892495
Epoch: 74, step: 1308, loss: 0.3228294551372528, mean loss: 0.33893526500716586
Epoch: 74, step: 1309, loss: 0.31012800335884094, mean loss: 0.3389349986826124
Epoch: 74, step: 1310, loss: 0.30446112155914307, mean loss: 0.33893467997286614
Epoch: 74, step: 1311, loss: 0.34471994638442993, mean loss: 0.33893473345695024
Epoch: 74, step: 1312, loss: 0.29730409383773804, mean loss: 0.3389343485903099
Epoch: 74, step: 1313, loss: 0.30442723631858826, mean loss: 0.3389340295821536
Epoch: 74, step: 1314, loss: 0.31419655680656433, mean loss: 0.33893380089357
Epoch: 74, step: 1315, loss: 0.33909064531326294, mean loss: 0.33893380234352394
Epoch: 74, step: 1316, loss: 0.33088573813438416, mean loss: 0.33893372794358856
Epoch: 74, step: 1317, loss: 0.3336646556854248, mean loss: 0.33893367923435846
Epoch: 74, step: 1318, loss: 0.3764745891094208, mean loss: 0.33893402627304464
Epoch: 74, step: 1319, loss: 0.3252372443675995, mean loss: 0.3389338996573267
Epoch: 74, step: 1320, loss: 0.33222511410713196, mean loss: 0.3389338376405805
Epoch: 74, step: 1321, loss: 0.3105374276638031, mean loss: 0.3389335751434926
Epoch: 74, step: 1322, loss: 0.315784752368927, mean loss: 0.33893336115720346
Epoch: 74, step: 1323, loss: 0.30737361311912537, mean loss: 0.338933069423537
Epoch: 74, step: 1324, loss: 0.306132048368454, mean loss: 0.33893276621852825
Epoch: 74, step: 1325, loss: 0.29518717527389526, mean loss: 0.33893236184819914
Epoch: 74, step: 1326, loss: 0.3578079640865326, mean loss: 0.3389325363266499
Epoch: 74, step: 1327, loss: 0.3356156349182129, mean loss: 0.338932505666835
Epoch: 74, step: 1328, loss: 0.3129918575286865, mean loss: 0.3389322658863836
Epoch: 74, step: 1329, loss: 0.31140848994255066, mean loss: 0.3389320114747597
Epoch: 74, step: 1330, loss: 0.3359927237033844, mean loss: 0.3389319843061741
Epoch: 74, step: 1331, loss: 0.312428742647171, mean loss: 0.33893173933222454
Epoch: 74, step: 1332, loss: 0.33695587515830994, mean loss: 0.33893172106914626
Epoch: 74, step: 1333, loss: 0.33324432373046875, mean loss: 0.33893166850054157
Epoch: 74, step: 1334, loss: 0.3178410232067108, mean loss: 0.3389314735615421
Epoch: 74, step: 1335, loss: 0.33412495255470276, mean loss: 0.33893142913569724
Epoch: 74, step: 1336, loss: 0.3562033772468567, mean loss: 0.3389315887758598
Epoch: 74, step: 1337, loss: 0.35502496361732483, mean loss: 0.33893173752139877
Epoch: 74, step: 1338, loss: 0.3145352303981781, mean loss: 0.3389315120349426
Epoch: 74, step: 1339, loss: 0.288923978805542, mean loss: 0.3389310498410239
Epoch: 74, step: 1340, loss: 0.36048194766044617, mean loss: 0.33893124902305133
Epoch: 74, step: 1341, loss: 0.3472922146320343, mean loss: 0.3389313262977293
Epoch: 74, step: 1342, loss: 0.3334425687789917, mean loss: 0.33893127556937214
Epoch: 74, step: 1343, loss: 0.3148978650569916, mean loss: 0.3389310534491271
Epoch: 74, step: 1344, loss: 0.3038865029811859, mean loss: 0.33893072956533243
Epoch: 74, step: 1345, loss: 0.3334865868091583, mean loss: 0.3389306792507102
Epoch: 74, step: 1346, loss: 0.3147258162498474, mean loss: 0.3389304555520789
Epoch: 74, step: 1347, loss: 0.3178424835205078, mean loss: 0.3389302606612058
Epoch: 74, step: 1348, loss: 0.33812659978866577, mean loss: 0.33893025323399933
Epoch: 74, step: 1349, loss: 0.352243572473526, mean loss: 0.3389303762707925
Epoch: 74, step: 1350, loss: 0.39711153507232666, mean loss: 0.33893091395466507
Epoch: 74, step: 1351, loss: 0.34109053015708923, mean loss: 0.33893093391267376
Epoch: 74, step: 1352, loss: 0.3470063805580139, mean loss: 0.3389310085409084
Epoch: 74, step: 1353, loss: 0.32628628611564636, mean loss: 0.33893089168736046
Epoch: 74, step: 1354, loss: 0.3064063489437103, mean loss: 0.3389305911214037
Epoch: 74, step: 1355, loss: 0.313783198595047, mean loss: 0.3389303587313497
Epoch: 74, step: 1356, loss: 0.31920191645622253, mean loss: 0.3389301764201461
Epoch: 74, step: 1357, loss: 0.3164103329181671, mean loss: 0.33892996831543226
Epoch: 74, step: 1358, loss: 0.33303138613700867, mean loss: 0.33892991380744186
Epoch: 74, step: 1359, loss: 0.3147904574871063, mean loss: 0.3389296907400921
Epoch: 74, step: 1360, loss: 0.3233024477958679, mean loss: 0.3389295463335484
Epoch: 74, step: 1361, loss: 0.36645448207855225, mean loss: 0.3389298006806602
Epoch: 74, step: 1362, loss: 0.3348848521709442, mean loss: 0.3389297633032264
Epoch: 74, step: 1363, loss: 0.3608429729938507, mean loss: 0.33892996579084134
Epoch: 74, step: 1364, loss: 0.3128373920917511, mean loss: 0.33892972468630805
Epoch: 74, step: 1365, loss: 0.3623572587966919, mean loss: 0.33892994116294045
Epoch: 74, step: 1366, loss: 0.34654098749160767, mean loss: 0.3389300114903785
Epoch: 74, step: 1367, loss: 0.3003982901573181, mean loss: 0.3389296554536276
Epoch: 74, step: 1368, loss: 0.2934931218624115, mean loss: 0.33892923561963734
Epoch: 74, step: 1369, loss: 0.34987515211105347, mean loss: 0.33892933675907233
Epoch: 74, step: 1370, loss: 0.3013951778411865, mean loss: 0.33892898994950615
Epoch: 74, step: 1371, loss: 0.32742026448249817, mean loss: 0.3389288836117242
Epoch: 74, step: 1372, loss: 0.40659093856811523, mean loss: 0.3389295087866307
Epoch: 74, step: 1373, loss: 0.290047824382782, mean loss: 0.3389290571402812
Epoch: 74, step: 1374, loss: 0.323263555765152, mean loss: 0.3389289123989282
Epoch: 74, step: 1375, loss: 0.31204870343208313, mean loss: 0.33892866404161276
Epoch: 74, step: 1376, loss: 0.3251381814479828, mean loss: 0.3389285366268447
Epoch: 74, step: 1377, loss: 0.30656808614730835, mean loss: 0.33892823764084695
Epoch: 74, step: 1378, loss: 0.33677902817726135, mean loss: 0.3389282177839664
Epoch: 74, step: 1379, loss: 0.32222408056259155, mean loss: 0.3389280634532703
Epoch: 74, step: 1380, loss: 0.33653724193573, mean loss: 0.3389280413645066
Epoch: 74, step: 1381, loss: 0.376002699136734, mean loss: 0.33892838389354235
Epoch: 74, step: 1382, loss: 0.3325144648551941, mean loss: 0.33892832463653666
Epoch: 74, step: 1383, loss: 0.3468208611011505, mean loss: 0.3389283975535402
Epoch: 74, step: 1384, loss: 0.32331663370132446, mean loss: 0.33892825332202114
Epoch: 74, step: 1385, loss: 0.32827574014663696, mean loss: 0.33892815490815986
Epoch: 74, step: 1386, loss: 0.32594335079193115, mean loss: 0.33892803494840157
Epoch: 74, step: 1387, loss: 0.34934717416763306, mean loss: 0.3389281312044455
Epoch: 74, step: 1388, loss: 0.36829009652137756, mean loss: 0.3389284024591484
Epoch: 74, step: 1389, loss: 0.31995782256126404, mean loss: 0.33892822720482124
Epoch: 74, step: 1390, loss: 0.3218693137168884, mean loss: 0.3389280696123384
Epoch: 74, step: 1391, loss: 0.32215186953544617, mean loss: 0.3389279146330309
Epoch: 74, step: 1392, loss: 0.3524080514907837, mean loss: 0.3389280391620044
Epoch: 74, step: 1393, loss: 0.33730804920196533, mean loss: 0.33892802419673923
Epoch: 74, step: 1394, loss: 0.34152737259864807, mean loss: 0.33892804820897376
Epoch: 74, step: 1395, loss: 0.3389017581939697, mean loss: 0.33892804796611437
Epoch: 74, step: 1396, loss: 0.3014768064022064, mean loss: 0.3389277020058032
Epoch: 74, step: 1397, loss: 0.3391434848308563, mean loss: 0.3389277039991044
Epoch: 74, step: 1398, loss: 0.4213433265686035, mean loss: 0.3389284653091831
Epoch: 74, step: 1399, loss: 0.3191213309764862, mean loss: 0.3389282823434876
Epoch: 74, step: 1400, loss: 0.32348576188087463, mean loss: 0.3389281396966337
Epoch: 74, step: 1401, loss: 0.30230507254600525, mean loss: 0.33892780140230766
Epoch: 74, step: 1402, loss: 0.3576618731021881, mean loss: 0.33892797445093825
Epoch: 74, step: 1403, loss: 0.31377094984054565, mean loss: 0.33892774207494886
Epoch: 74, step: 1404, loss: 0.35396134853363037, mean loss: 0.3389278809394195
Epoch: 74, step: 1405, loss: 0.3120943605899811, mean loss: 0.33892763308218105
Epoch: 74, step: 1406, loss: 0.3385065197944641, mean loss: 0.3389276291924561
Epoch: 74, step: 1407, loss: 0.3096814751625061, mean loss: 0.33892735905506943
Epoch: 74, step: 1408, loss: 0.3621045649051666, mean loss: 0.33892757313354216
Epoch: 74, step: 1409, loss: 0.37250789999961853, mean loss: 0.33892788329856965
Epoch: 74, step: 1410, loss: 0.30512022972106934, mean loss: 0.3389275710367209
Epoch: 74, step: 1411, loss: 0.3107331097126007, mean loss: 0.3389273106231054
Epoch: 74, step: 1412, loss: 0.3740343749523163, mean loss: 0.3389276348808738
Epoch: 74, step: 1413, loss: 0.34079766273498535, mean loss: 0.33892765215276677
Epoch: 74, step: 1414, loss: 0.3011039197444916, mean loss: 0.3389273028096148
Epoch: 74, step: 1415, loss: 0.3256421685218811, mean loss: 0.3389271801081381
Epoch: 74, step: 1416, loss: 0.29768991470336914, mean loss: 0.3389267992443456
Epoch: 74, step: 1417, loss: 0.31050345301628113, mean loss: 0.33892653673121936
Epoch: 74, step: 1418, loss: 0.34497562050819397, mean loss: 0.33892659259899843
Epoch: 74, step: 1419, loss: 0.31390345096588135, mean loss: 0.33892636149384464
Epoch: 74, step: 1420, loss: 0.30956336855888367, mean loss: 0.33892609030981724
Epoch: 74, step: 1421, loss: 0.3105274438858032, mean loss: 0.3389258280345035
Epoch: 74, step: 1422, loss: 0.30764880776405334, mean loss: 0.33892553917867485
Epoch: 74, step: 1423, loss: 0.3287379741668701, mean loss: 0.33892544509329425
Epoch: 74, step: 1424, loss: 0.30373236536979675, mean loss: 0.33892512007708897
Epoch: 74, step: 1425, loss: 0.3112487494945526, mean loss: 0.3389248644817861
Epoch: 74, step: 1426, loss: 0.32565927505493164, mean loss: 0.33892474197327205
Epoch: 74, step: 1427, loss: 0.33383312821388245, mean loss: 0.33892469495234784
Epoch: 74, step: 1428, loss: 0.318293035030365, mean loss: 0.33892450442125005
Epoch: 74, step: 1429, loss: 0.3177869915962219, mean loss: 0.3389243092204593
Epoch: 74, step: 1430, loss: 0.3434293270111084, mean loss: 0.338924350823032
Epoch: 74, step: 1431, loss: 0.3169286251068115, mean loss: 0.33892414770056495
Epoch: 74, step: 1432, loss: 0.32317936420440674, mean loss: 0.3389240023046014
Epoch: 74, step: 1433, loss: 0.3242063522338867, mean loss: 0.33892386639500616
Epoch: 74, step: 1434, loss: 0.34813588857650757, mean loss: 0.33892395146229876
Epoch: 74, step: 1435, loss: 0.3244516849517822, mean loss: 0.3389238178211571
Epoch: 74, step: 1436, loss: 0.34143882989883423, mean loss: 0.3389238410452997
Epoch: 74, step: 1437, loss: 0.33777153491973877, mean loss: 0.3389238304047644
Epoch: 74, step: 1438, loss: 0.3279649019241333, mean loss: 0.3389237292096171
Epoch: 74, step: 1439, loss: 0.3094938397407532, mean loss: 0.3389234574554483
Epoch: 74, step: 1440, loss: 0.30573245882987976, mean loss: 0.33892315097421033
Epoch: 74, step: 1441, loss: 0.3470245599746704, mean loss: 0.3389232257808457
Epoch: 74, step: 1442, loss: 0.31196385622024536, mean loss: 0.33892297684623357
Epoch: 74, step: 1443, loss: 0.319730281829834, mean loss: 0.33892279962836636
Valid: 74, mean loss: 0.18488613764444986
Epoch: 75, step: 0, loss: 0.32993847131729126, mean loss: 0.33892271667134555
Epoch: 75, step: 1, loss: 0.3449782133102417, mean loss: 0.3389227725844094
Epoch: 75, step: 2, loss: 0.3161744475364685, mean loss: 0.33892256254105835
Epoch: 75, step: 3, loss: 0.31223514676094055, mean loss: 0.3389223161289611
Epoch: 75, step: 4, loss: 0.3056953549385071, mean loss: 0.33892200933831257
Epoch: 75, step: 5, loss: 0.3077273368835449, mean loss: 0.33892172131481935
Epoch: 75, step: 6, loss: 0.3619806468486786, mean loss: 0.33892193421819156
Epoch: 75, step: 7, loss: 0.3983766436576843, mean loss: 0.3389224831592618
Epoch: 75, step: 8, loss: 0.33973428606987, mean loss: 0.3389224906545107
Epoch: 75, step: 9, loss: 0.3301998972892761, mean loss: 0.33892241012091856
Epoch: 75, step: 10, loss: 0.3103695213794708, mean loss: 0.33892214650144553
Epoch: 75, step: 11, loss: 0.30061718821525574, mean loss: 0.33892179284757257
Epoch: 75, step: 12, loss: 0.31563547253608704, mean loss: 0.3389215778565714
Epoch: 75, step: 13, loss: 0.3643791675567627, mean loss: 0.3389218128916518
Epoch: 75, step: 14, loss: 0.2986728847026825, mean loss: 0.3389214413001992
Epoch: 75, step: 15, loss: 0.3303402364253998, mean loss: 0.33892136207640144
Epoch: 75, step: 16, loss: 0.2808929979801178, mean loss: 0.33892082634919246
Epoch: 75, step: 17, loss: 0.3184612989425659, mean loss: 0.33892063746528206
Epoch: 75, step: 18, loss: 0.3128666281700134, mean loss: 0.3389203969349107
Epoch: 75, step: 19, loss: 0.3414193391799927, mean loss: 0.3389204200049093
Epoch: 75, step: 20, loss: 0.33225777745246887, mean loss: 0.33892035849659097
Epoch: 75, step: 21, loss: 0.3194330930709839, mean loss: 0.3389201785953204
Epoch: 75, step: 22, loss: 0.30858516693115234, mean loss: 0.33891989855311644
Epoch: 75, step: 23, loss: 0.3176468312740326, mean loss: 0.33891970216942235
Epoch: 75, step: 24, loss: 0.3039495348930359, mean loss: 0.33891937934304545
Epoch: 75, step: 25, loss: 0.33333098888397217, mean loss: 0.3389193277544106
Epoch: 75, step: 26, loss: 0.3015187978744507, mean loss: 0.33891898249856595
Epoch: 75, step: 27, loss: 0.2922750413417816, mean loss: 0.3389185519179113
Epoch: 75, step: 28, loss: 0.36871337890625, mean loss: 0.3389188269580851
Epoch: 75, step: 29, loss: 0.3381138741970062, mean loss: 0.3389188195275233
Epoch: 75, step: 30, loss: 0.3604068458080292, mean loss: 0.33891901788280737
Epoch: 75, step: 31, loss: 0.29633209109306335, mean loss: 0.3389186247678756
Epoch: 75, step: 32, loss: 0.3585163354873657, mean loss: 0.3389188056703773
Epoch: 75, step: 33, loss: 0.3420734107494354, mean loss: 0.3389188347896296
Epoch: 75, step: 34, loss: 0.32362115383148193, mean loss: 0.3389186935824393
Epoch: 75, step: 35, loss: 0.33022820949554443, mean loss: 0.3389186133645608
Epoch: 75, step: 36, loss: 0.3319642245769501, mean loss: 0.3389185491723754
Epoch: 75, step: 37, loss: 0.3427469730377197, mean loss: 0.3389185845101504
Epoch: 75, step: 38, loss: 0.35830143094062805, mean loss: 0.3389187634193745
Epoch: 75, step: 39, loss: 0.33850717544555664, mean loss: 0.3389187596203347
Epoch: 75, step: 40, loss: 0.33775678277015686, mean loss: 0.33891874889515355
Epoch: 75, step: 41, loss: 0.3748604655265808, mean loss: 0.33891908063830606
Epoch: 75, step: 42, loss: 0.3426229953765869, mean loss: 0.33891911482523773
Epoch: 75, step: 43, loss: 0.3215485215187073, mean loss: 0.3389189544970857
Epoch: 75, step: 44, loss: 0.35770976543426514, mean loss: 0.33891912793204754
Epoch: 75, step: 45, loss: 0.354621946811676, mean loss: 0.338919272864199
Epoch: 75, step: 46, loss: 0.3220941424369812, mean loss: 0.33891911757489307
Epoch: 75, step: 47, loss: 0.3140769898891449, mean loss: 0.3389188882939863
Epoch: 75, step: 48, loss: 0.33428046107292175, mean loss: 0.33891884548392603
Epoch: 75, step: 49, loss: 0.33358117938041687, mean loss: 0.33891879622074095
Epoch: 75, step: 50, loss: 0.31546545028686523, mean loss: 0.3389185797636161
Epoch: 75, step: 51, loss: 0.333985835313797, mean loss: 0.33891853423843477
Epoch: 75, step: 52, loss: 0.3197534680366516, mean loss: 0.3389183573622412
Epoch: 75, step: 53, loss: 0.31808391213417053, mean loss: 0.33891816508096656
Epoch: 75, step: 54, loss: 0.31888097524642944, mean loss: 0.3389179801592755
Epoch: 75, step: 55, loss: 0.34247368574142456, mean loss: 0.33891801297430724
Epoch: 75, step: 56, loss: 0.3464300036430359, mean loss: 0.33891808230061443
Epoch: 75, step: 57, loss: 0.3284272849559784, mean loss: 0.3389179854845294
Epoch: 75, step: 58, loss: 0.3222309350967407, mean loss: 0.33891783148670374
Epoch: 75, step: 59, loss: 0.30960598587989807, mean loss: 0.3389175609824069
Epoch: 75, step: 60, loss: 0.34349146485328674, mean loss: 0.33891760319227826
Epoch: 75, step: 61, loss: 0.3136647045612335, mean loss: 0.3389173701502651
Epoch: 75, step: 62, loss: 0.33955010771751404, mean loss: 0.33891737598932054
Epoch: 75, step: 63, loss: 0.3396207094192505, mean loss: 0.3389173824797918
Epoch: 75, step: 64, loss: 0.3552837669849396, mean loss: 0.338917533509963
Epoch: 75, step: 65, loss: 0.3099820613861084, mean loss: 0.3389172664938129
Epoch: 75, step: 66, loss: 0.3111231327056885, mean loss: 0.33891701001228447
Epoch: 75, step: 67, loss: 0.31788012385368347, mean loss: 0.33891681588776285
Epoch: 75, step: 68, loss: 0.31417152285575867, mean loss: 0.3389165875448508
Epoch: 75, step: 69, loss: 0.3707596957683563, mean loss: 0.33891688138178194
Epoch: 75, step: 70, loss: 0.3222590982913971, mean loss: 0.3389167276710744
Epoch: 75, step: 71, loss: 0.28804779052734375, mean loss: 0.3389162582791914
Epoch: 75, step: 72, loss: 0.3617118000984192, mean loss: 0.3389164686225594
Epoch: 75, step: 73, loss: 0.35382503271102905, mean loss: 0.33891660618843394
Epoch: 75, step: 74, loss: 0.3492128551006317, mean loss: 0.33891670119419093
Epoch: 75, step: 75, loss: 0.32140660285949707, mean loss: 0.33891653962614693
Epoch: 75, step: 76, loss: 0.3594033122062683, mean loss: 0.33891672865862227
Epoch: 75, step: 77, loss: 0.3162274956703186, mean loss: 0.3389165193058663
Epoch: 75, step: 78, loss: 0.36810430884361267, mean loss: 0.33891678861809044
Epoch: 75, step: 79, loss: 0.30277013778686523, mean loss: 0.33891645510036733
Epoch: 75, step: 80, loss: 0.34974992275238037, mean loss: 0.338916555057626
Epoch: 75, step: 81, loss: 0.3309800326824188, mean loss: 0.3389164818303154
Epoch: 75, step: 82, loss: 0.328529417514801, mean loss: 0.33891638599365914
Epoch: 75, step: 83, loss: 0.31497591733932495, mean loss: 0.33891616510802425
Epoch: 75, step: 84, loss: 0.31066736578941345, mean loss: 0.33891590447417896
Epoch: 75, step: 85, loss: 0.35380327701568604, mean loss: 0.3389160418293036
Epoch: 75, step: 86, loss: 0.300331175327301, mean loss: 0.3389156858376579
Epoch: 75, step: 87, loss: 0.3136223256587982, mean loss: 0.3389154524782438
Epoch: 75, step: 88, loss: 0.3337402939796448, mean loss: 0.33891540473208415
Epoch: 75, step: 89, loss: 0.33023735880851746, mean loss: 0.33891532466892405
Epoch: 75, step: 90, loss: 0.31435921788215637, mean loss: 0.338915098117764
Epoch: 75, step: 91, loss: 0.3155387341976166, mean loss: 0.3389148824527341
Epoch: 75, step: 92, loss: 0.31479281187057495, mean loss: 0.3389146599100369
Epoch: 75, step: 93, loss: 0.3668016791343689, mean loss: 0.33891491718460215
Epoch: 75, step: 94, loss: 0.3428436517715454, mean loss: 0.33891495342921296
Epoch: 75, step: 95, loss: 0.343704491853714, mean loss: 0.3389149976147772
Epoch: 75, step: 96, loss: 0.34964197874069214, mean loss: 0.3389150965749064
Epoch: 75, step: 97, loss: 0.37022367119789124, mean loss: 0.33891538540472455
Epoch: 75, step: 98, loss: 0.3583383560180664, mean loss: 0.3389155645850732
Epoch: 75, step: 99, loss: 0.33654454350471497, mean loss: 0.338915542712185
Epoch: 75, step: 100, loss: 0.3301450312137604, mean loss: 0.3389154618041537
Epoch: 75, step: 101, loss: 0.3027604818344116, mean loss: 0.3389151282772818
Epoch: 75, step: 102, loss: 0.35356053709983826, mean loss: 0.3389152633787903
Epoch: 75, step: 103, loss: 0.3407251238822937, mean loss: 0.3389152800743043
Epoch: 75, step: 104, loss: 0.3060411810874939, mean loss: 0.3389149768216962
Epoch: 75, step: 105, loss: 0.3261384963989258, mean loss: 0.33891485896400914
Epoch: 75, step: 106, loss: 0.2951464354991913, mean loss: 0.3389144552223369
Epoch: 75, step: 107, loss: 0.3376915752887726, mean loss: 0.33891444394198916
Epoch: 75, step: 108, loss: 0.3498852849006653, mean loss: 0.338914545140607
Epoch: 75, step: 109, loss: 0.356499046087265, mean loss: 0.33891470734428697
Epoch: 75, step: 110, loss: 0.4009639322757721, mean loss: 0.3389152796960311
Epoch: 75, step: 111, loss: 0.32489168643951416, mean loss: 0.3389151503414093
Epoch: 75, step: 112, loss: 0.32019904255867004, mean loss: 0.33891497770429213
Epoch: 75, step: 113, loss: 0.34865254163742065, mean loss: 0.3389150675226176
Epoch: 75, step: 114, loss: 0.3787915110588074, mean loss: 0.3389154353355912
Epoch: 75, step: 115, loss: 0.2958703637123108, mean loss: 0.33891503829943764
Epoch: 75, step: 116, loss: 0.35347962379455566, mean loss: 0.3389151726380146
Epoch: 75, step: 117, loss: 0.3578977882862091, mean loss: 0.33891534772532156
Epoch: 75, step: 118, loss: 0.32622963190078735, mean loss: 0.3389152307189313
Epoch: 75, step: 119, loss: 0.31345775723457336, mean loss: 0.33891499591471175
Epoch: 75, step: 120, loss: 0.3164196014404297, mean loss: 0.33891478843281736
Epoch: 75, step: 121, loss: 0.36492982506752014, mean loss: 0.3389150283752334
Epoch: 75, step: 122, loss: 0.3186173439025879, mean loss: 0.338914841166943
Epoch: 75, step: 123, loss: 0.3272831439971924, mean loss: 0.33891473388721555
Epoch: 75, step: 124, loss: 0.319715291261673, mean loss: 0.3389145568114247
Epoch: 75, step: 125, loss: 0.31028348207473755, mean loss: 0.33891429275045465
Epoch: 75, step: 126, loss: 0.3183675706386566, mean loss: 0.33891410325224747
Epoch: 75, step: 127, loss: 0.3289514183998108, mean loss: 0.3389140113692942
Epoch: 75, step: 128, loss: 0.3438575863838196, mean loss: 0.3389140569620325
Epoch: 75, step: 129, loss: 0.34665587544441223, mean loss: 0.3389141283612622
Epoch: 75, step: 130, loss: 0.29266825318336487, mean loss: 0.3389137018607672
Epoch: 75, step: 131, loss: 0.31412646174430847, mean loss: 0.338913473263673
Epoch: 75, step: 132, loss: 0.36107128858566284, mean loss: 0.33891367760935487
Epoch: 75, step: 133, loss: 0.31868690252304077, mean loss: 0.33891349107399615
Epoch: 75, step: 134, loss: 0.3036412000656128, mean loss: 0.3389131657888852
Epoch: 75, step: 135, loss: 0.31824061274528503, mean loss: 0.33891297514598945
Epoch: 75, step: 136, loss: 0.3214176595211029, mean loss: 0.3389128138051591
Epoch: 75, step: 137, loss: 0.3309999406337738, mean loss: 0.3389127408337545
Epoch: 75, step: 138, loss: 0.3153747320175171, mean loss: 0.3389125237715461
Epoch: 75, step: 139, loss: 0.3341326415538788, mean loss: 0.3389124796929569
Epoch: 75, step: 140, loss: 0.3273552656173706, mean loss: 0.33891237311690103
Epoch: 75, step: 141, loss: 0.33364740014076233, mean loss: 0.3389123245658509
Epoch: 75, step: 142, loss: 0.35715198516845703, mean loss: 0.33891249276168284
Epoch: 75, step: 143, loss: 0.32486483454704285, mean loss: 0.33891236322332
Epoch: 75, step: 144, loss: 0.34799930453300476, mean loss: 0.33891244701640694
Epoch: 75, step: 145, loss: 0.3223338723182678, mean loss: 0.3389122941423987
Epoch: 75, step: 146, loss: 0.2928389608860016, mean loss: 0.3389118692958538
Epoch: 75, step: 147, loss: 0.3280009329319, mean loss: 0.3389117686860098
Epoch: 75, step: 148, loss: 0.31880006194114685, mean loss: 0.338911583237488
Epoch: 75, step: 149, loss: 0.3639953136444092, mean loss: 0.33891181453053
Epoch: 75, step: 150, loss: 0.30416208505630493, mean loss: 0.33891149411182037
Epoch: 75, step: 151, loss: 0.44299018383026123, mean loss: 0.3389124537869736
Epoch: 75, step: 152, loss: 0.31658849120140076, mean loss: 0.33891224794700064
Epoch: 75, step: 153, loss: 0.3246246874332428, mean loss: 0.33891211620856304
Epoch: 75, step: 154, loss: 0.35058829188346863, mean loss: 0.3389122238677367
Epoch: 75, step: 155, loss: 0.34350359439849854, mean loss: 0.33891226620168347
Epoch: 75, step: 156, loss: 0.3188355267047882, mean loss: 0.33891208108924725
Epoch: 75, step: 157, loss: 0.32710155844688416, mean loss: 0.33891197219435115
Epoch: 75, step: 158, loss: 0.35654863715171814, mean loss: 0.3389121348057062
Epoch: 75, step: 159, loss: 0.3346230089664459, mean loss: 0.3389120952600134
Epoch: 75, step: 160, loss: 0.3024481236934662, mean loss: 0.3389117590656987
Epoch: 75, step: 161, loss: 0.31704574823379517, mean loss: 0.33891155746503826
Epoch: 75, step: 162, loss: 0.3198295831680298, mean loss: 0.3389113815343126
Epoch: 75, step: 163, loss: 0.29383957386016846, mean loss: 0.33891096598806986
Epoch: 75, step: 164, loss: 0.3078838586807251, mean loss: 0.33891067993167096
Epoch: 75, step: 165, loss: 0.4024566411972046, mean loss: 0.338911265792321
Epoch: 75, step: 166, loss: 0.3112007677555084, mean loss: 0.338911010318324
Epoch: 75, step: 167, loss: 0.3222236633300781, mean loss: 0.33891085647251706
Epoch: 75, step: 168, loss: 0.34042689204216003, mean loss: 0.33891087044918844
Epoch: 75, step: 169, loss: 0.30347150564193726, mean loss: 0.3389105437287606
Epoch: 75, step: 170, loss: 0.3131418824195862, mean loss: 0.33891030616608203
Epoch: 75, step: 171, loss: 0.30091339349746704, mean loss: 0.3389099558737239
Epoch: 75, step: 172, loss: 0.34565261006355286, mean loss: 0.3389100180334705
Epoch: 75, step: 173, loss: 0.30727291107177734, mean loss: 0.33890972637734124
Epoch: 75, step: 174, loss: 0.31631389260292053, mean loss: 0.33890951807281233
Epoch: 75, step: 175, loss: 0.29954853653907776, mean loss: 0.33890915521852627
Epoch: 75, step: 176, loss: 0.30959904193878174, mean loss: 0.33890888502195665
Epoch: 75, step: 177, loss: 0.30280178785324097, mean loss: 0.33890855217016025
Epoch: 75, step: 178, loss: 0.355663001537323, mean loss: 0.33890870661894174
Epoch: 75, step: 179, loss: 0.3502325415611267, mean loss: 0.33890881100532577
Epoch: 75, step: 180, loss: 0.33528733253479004, mean loss: 0.33890877762179805
Epoch: 75, step: 181, loss: 0.30569422245025635, mean loss: 0.33890847144607145
Epoch: 75, step: 182, loss: 0.29560914635658264, mean loss: 0.33890807231141357
Epoch: 75, step: 183, loss: 0.328485906124115, mean loss: 0.3389079762404152
Epoch: 75, step: 184, loss: 0.4324720799922943, mean loss: 0.33890883870161953
Epoch: 75, step: 185, loss: 0.2909017503261566, mean loss: 0.3389083961828763
Epoch: 75, step: 186, loss: 0.3690223693847656, mean loss: 0.338908673764275
Epoch: 75, step: 187, loss: 0.3453420102596283, mean loss: 0.33890873306425745
Epoch: 75, step: 188, loss: 0.30151039361953735, mean loss: 0.3389083883441527
Epoch: 75, step: 189, loss: 0.3648326098918915, mean loss: 0.3389086272990937
Epoch: 75, step: 190, loss: 0.3292235732078552, mean loss: 0.33890853802851745
Epoch: 75, step: 191, loss: 0.3094891309738159, mean loss: 0.3389082668619148
Epoch: 75, step: 192, loss: 0.30456486344337463, mean loss: 0.3389079503124285
Epoch: 75, step: 193, loss: 0.3363485634326935, mean loss: 0.3389079267223048
Epoch: 75, step: 194, loss: 0.32866665720939636, mean loss: 0.33890783232837407
Epoch: 75, step: 195, loss: 0.391567200422287, mean loss: 0.33890831768606555
Epoch: 75, step: 196, loss: 0.3645027279853821, mean loss: 0.3389085535857706
Epoch: 75, step: 197, loss: 0.34978485107421875, mean loss: 0.3389086538299916
Epoch: 75, step: 198, loss: 0.37795114517211914, mean loss: 0.338909013671938
Epoch: 75, step: 199, loss: 0.32105812430381775, mean loss: 0.338908849147612
Epoch: 75, step: 200, loss: 0.301413357257843, mean loss: 0.3389085035702266
Epoch: 75, step: 201, loss: 0.3075198829174042, mean loss: 0.3389082142795163
Epoch: 75, step: 202, loss: 0.3643887937068939, mean loss: 0.33890844911707313
Epoch: 75, step: 203, loss: 0.3329349756240845, mean loss: 0.3389083940640475
Epoch: 75, step: 204, loss: 0.3389432430267334, mean loss: 0.3389083943852213
Epoch: 75, step: 205, loss: 0.3217911422252655, mean loss: 0.3389082366312523
Epoch: 75, step: 206, loss: 0.3632534146308899, mean loss: 0.33890846099629784
Epoch: 75, step: 207, loss: 0.32030391693115234, mean loss: 0.3389082895384877
Epoch: 75, step: 208, loss: 0.3445507287979126, mean loss: 0.3389083415382228
Epoch: 75, step: 209, loss: 0.31552132964134216, mean loss: 0.33890812600959047
Epoch: 75, step: 210, loss: 0.359371155500412, mean loss: 0.3389083145898219
Epoch: 75, step: 211, loss: 0.3712935745716095, mean loss: 0.3389086130384726
Epoch: 75, step: 212, loss: 0.35042500495910645, mean loss: 0.33890871916761767
Epoch: 75, step: 213, loss: 0.33450034260749817, mean loss: 0.3389086785426609
Epoch: 75, step: 214, loss: 0.3211696147918701, mean loss: 0.3389085150715854
Epoch: 75, step: 215, loss: 0.30845552682876587, mean loss: 0.33890823444026613
Epoch: 75, step: 216, loss: 0.3129664361476898, mean loss: 0.338907995382807
Epoch: 75, step: 217, loss: 0.3254227340221405, mean loss: 0.3389078711152997
Epoch: 75, step: 218, loss: 0.3184974491596222, mean loss: 0.3389076830337476
Epoch: 75, step: 219, loss: 0.3165484368801117, mean loss: 0.33890747699572554
Epoch: 75, step: 220, loss: 0.31309154629707336, mean loss: 0.3389072391069234
Epoch: 75, step: 221, loss: 0.3420989513397217, mean loss: 0.3389072685176625
Epoch: 75, step: 222, loss: 0.32052215933799744, mean loss: 0.3389070991055639
Epoch: 75, step: 223, loss: 0.28576549887657166, mean loss: 0.3389066094295454
Epoch: 75, step: 224, loss: 0.31911501288414, mean loss: 0.33890642706053786
Epoch: 75, step: 225, loss: 0.4084533751010895, mean loss: 0.3389070678926706
Epoch: 75, step: 226, loss: 0.2947014272212982, mean loss: 0.33890666056877267
Epoch: 75, step: 227, loss: 0.3597036302089691, mean loss: 0.3389068521964599
Epoch: 75, step: 228, loss: 0.337770015001297, mean loss: 0.3389068417214975
Epoch: 75, step: 229, loss: 0.3134354054927826, mean loss: 0.3389066070266092
Epoch: 75, step: 230, loss: 0.3355315029621124, mean loss: 0.33890657592854445
Epoch: 75, step: 231, loss: 0.35412493348121643, mean loss: 0.33890671614854917
Epoch: 75, step: 232, loss: 0.29662173986434937, mean loss: 0.33890632654376274
Epoch: 75, step: 233, loss: 0.3807418942451477, mean loss: 0.33890671200424244
Epoch: 75, step: 234, loss: 0.31085801124572754, mean loss: 0.33890645357423593
Epoch: 75, step: 235, loss: 0.3141078054904938, mean loss: 0.3389062250910775
Epoch: 75, step: 236, loss: 0.3316677510738373, mean loss: 0.3389061583997739
Epoch: 75, step: 237, loss: 0.3589177429676056, mean loss: 0.33890634277376797
Epoch: 75, step: 238, loss: 0.33301666378974915, mean loss: 0.33890628851051713
Epoch: 75, step: 239, loss: 0.30449000000953674, mean loss: 0.33890597142659873
Epoch: 75, step: 240, loss: 0.29156336188316345, mean loss: 0.3389055352540046
Epoch: 75, step: 241, loss: 0.305859237909317, mean loss: 0.3389052307976896
Epoch: 75, step: 242, loss: 0.31822720170021057, mean loss: 0.3389050402922761
Epoch: 75, step: 243, loss: 0.3005216419696808, mean loss: 0.33890468667164
Epoch: 75, step: 244, loss: 0.3100779950618744, mean loss: 0.33890442109799207
Epoch: 75, step: 245, loss: 0.3614772856235504, mean loss: 0.33890462905466046
Epoch: 75, step: 246, loss: 0.3173450827598572, mean loss: 0.3389044304352026
Epoch: 75, step: 247, loss: 0.3452547788619995, mean loss: 0.3389044889378781
Epoch: 75, step: 248, loss: 0.36847877502441406, mean loss: 0.338904761388901
Epoch: 75, step: 249, loss: 0.3435271978378296, mean loss: 0.3389048039723782
Epoch: 75, step: 250, loss: 0.3441993296146393, mean loss: 0.3389048527469233
Epoch: 75, step: 251, loss: 0.3414839804172516, mean loss: 0.33890487650629825
Epoch: 75, step: 252, loss: 0.3764008581638336, mean loss: 0.33890522192265393
Epoch: 75, step: 253, loss: 0.32475653290748596, mean loss: 0.33890509158485876
Epoch: 75, step: 254, loss: 0.3505105674266815, mean loss: 0.33890519849357637
Epoch: 75, step: 255, loss: 0.3523361384868622, mean loss: 0.3389053222171844
Epoch: 75, step: 256, loss: 0.3411857485771179, mean loss: 0.3389053432239031
Epoch: 75, step: 257, loss: 0.30910101532936096, mean loss: 0.3389050686763995
Epoch: 75, step: 258, loss: 0.3502616286277771, mean loss: 0.33890517328826913
Epoch: 75, step: 259, loss: 0.3529651165008545, mean loss: 0.33890530280137904
Epoch: 75, step: 260, loss: 0.3614731729030609, mean loss: 0.3389055106833081
Epoch: 75, step: 261, loss: 0.32812637090682983, mean loss: 0.33890541139313496
Epoch: 75, step: 262, loss: 0.3436853587627411, mean loss: 0.33890545542238404
Epoch: 75, step: 263, loss: 0.3641587495803833, mean loss: 0.33890568803443
Epoch: 75, step: 264, loss: 0.3551684319972992, mean loss: 0.33890583783173084
Epoch: 75, step: 265, loss: 0.35244476795196533, mean loss: 0.33890596253863836
Epoch: 75, step: 266, loss: 0.31390902400016785, mean loss: 0.3389057322942866
Epoch: 75, step: 267, loss: 0.3259008228778839, mean loss: 0.3389056125084435
Epoch: 75, step: 268, loss: 0.33746176958084106, mean loss: 0.33890559920959273
Epoch: 75, step: 269, loss: 0.2869429588317871, mean loss: 0.3389051206000286
Epoch: 75, step: 270, loss: 0.34285977482795715, mean loss: 0.3389051570246192
Epoch: 75, step: 271, loss: 0.37528321146965027, mean loss: 0.33890549208388354
Epoch: 75, step: 272, loss: 0.30159956216812134, mean loss: 0.3389051484816075
Epoch: 75, step: 273, loss: 0.3471962511539459, mean loss: 0.33890522484521823
Epoch: 75, step: 274, loss: 0.32061195373535156, mean loss: 0.33890505636010554
Epoch: 75, step: 275, loss: 0.335195392370224, mean loss: 0.3389050221935863
Epoch: 75, step: 276, loss: 0.3278348743915558, mean loss: 0.33890492023693064
Epoch: 75, step: 277, loss: 0.32036590576171875, mean loss: 0.33890474949318444
Epoch: 75, step: 278, loss: 0.3200720250606537, mean loss: 0.3389045760459761
Epoch: 75, step: 279, loss: 0.2911866009235382, mean loss: 0.3389041365730058
Epoch: 75, step: 280, loss: 0.3373619019985199, mean loss: 0.3389041223694658
Epoch: 75, step: 281, loss: 0.3256778120994568, mean loss: 0.33890400056004744
Epoch: 75, step: 282, loss: 0.34152308106422424, mean loss: 0.3389040246805866
Epoch: 75, step: 283, loss: 0.2932616174221039, mean loss: 0.3389036043386646
Epoch: 75, step: 284, loss: 0.33095353841781616, mean loss: 0.3389035311235251
Epoch: 75, step: 285, loss: 0.3252050578594208, mean loss: 0.33890340497030774
Epoch: 75, step: 286, loss: 0.3133484721183777, mean loss: 0.33890316962967904
Epoch: 75, step: 287, loss: 0.32457441091537476, mean loss: 0.3389030376744104
Epoch: 75, step: 288, loss: 0.3524664640426636, mean loss: 0.3389031625804908
Epoch: 75, step: 289, loss: 0.34443366527557373, mean loss: 0.3389032135106197
Epoch: 75, step: 290, loss: 0.29680225253105164, mean loss: 0.33890282580849906
Epoch: 75, step: 291, loss: 0.29986223578453064, mean loss: 0.33890246629223614
Epoch: 75, step: 292, loss: 0.31942683458328247, mean loss: 0.3389022869470508
Epoch: 75, step: 293, loss: 0.3024055063724518, mean loss: 0.33890195086236313
Epoch: 75, step: 294, loss: 0.3407250940799713, mean loss: 0.33890196765082686
Epoch: 75, step: 295, loss: 0.35004058480262756, mean loss: 0.3389020702201402
Epoch: 75, step: 296, loss: 0.3720689117908478, mean loss: 0.3389023756322747
Epoch: 75, step: 297, loss: 0.34286725521087646, mean loss: 0.33890241214196715
Epoch: 75, step: 298, loss: 0.34557095170021057, mean loss: 0.33890247354713254
Epoch: 75, step: 299, loss: 0.3660590350627899, mean loss: 0.33890272360755164
Epoch: 75, step: 300, loss: 0.3392369747161865, mean loss: 0.338902726685342
Epoch: 75, step: 301, loss: 0.3487410545349121, mean loss: 0.3389028172760111
Epoch: 75, step: 302, loss: 0.30286356806755066, mean loss: 0.33890248543205465
Epoch: 75, step: 303, loss: 0.3588723838329315, mean loss: 0.33890266931016594
Epoch: 75, step: 304, loss: 0.3547685146331787, mean loss: 0.33890281539778
Epoch: 75, step: 305, loss: 0.31889498233795166, mean loss: 0.3389026311737679
Epoch: 75, step: 306, loss: 0.33479613065719604, mean loss: 0.3389025933631248
Epoch: 75, step: 307, loss: 0.3595403730869293, mean loss: 0.33890278338393104
Epoch: 75, step: 308, loss: 0.32896527647972107, mean loss: 0.3389026918859253
Epoch: 75, step: 309, loss: 0.33218103647232056, mean loss: 0.33890262999792775
Epoch: 75, step: 310, loss: 0.3675009608268738, mean loss: 0.33890289330763695
Epoch: 75, step: 311, loss: 0.39230045676231384, mean loss: 0.33890338494358374
Epoch: 75, step: 312, loss: 0.3244008421897888, mean loss: 0.33890325141865807
Epoch: 75, step: 313, loss: 0.3326035141944885, mean loss: 0.33890319341750513
Epoch: 75, step: 314, loss: 0.3714069724082947, mean loss: 0.3389034926743204
Epoch: 75, step: 315, loss: 0.36526021361351013, mean loss: 0.33890373533397405
Epoch: 75, step: 316, loss: 0.29978734254837036, mean loss: 0.33890337520256936
Epoch: 75, step: 317, loss: 0.32071271538734436, mean loss: 0.33890320772885585
Epoch: 75, step: 318, loss: 0.3115409314632416, mean loss: 0.33890295581826685
Epoch: 75, step: 319, loss: 0.37577590346336365, mean loss: 0.3389032952856545
Epoch: 75, step: 320, loss: 0.3514375686645508, mean loss: 0.33890341068022256
Epoch: 75, step: 321, loss: 0.34233126044273376, mean loss: 0.3389034422378238
Epoch: 75, step: 322, loss: 0.33982235193252563, mean loss: 0.33890345069744743
Epoch: 75, step: 323, loss: 0.32798564434051514, mean loss: 0.3389033501873727
Epoch: 75, step: 324, loss: 0.2984342873096466, mean loss: 0.33890297762983185
Epoch: 75, step: 325, loss: 0.33143359422683716, mean loss: 0.3389029088674416
Epoch: 75, step: 326, loss: 0.3002067506313324, mean loss: 0.3389025526377912
Epoch: 75, step: 327, loss: 0.29707854986190796, mean loss: 0.3389021676173289
Epoch: 75, step: 328, loss: 0.3054570257663727, mean loss: 0.33890185973322934
Epoch: 75, step: 329, loss: 0.347200483083725, mean loss: 0.3389019361267058
Epoch: 75, step: 330, loss: 0.3542361259460449, mean loss: 0.33890207728521327
Epoch: 75, step: 331, loss: 0.333997905254364, mean loss: 0.33890203214039377
Epoch: 75, step: 332, loss: 0.299955278635025, mean loss: 0.33890167362361245
Epoch: 75, step: 333, loss: 0.33949998021125793, mean loss: 0.33890167913115693
Epoch: 75, step: 334, loss: 0.36107781529426575, mean loss: 0.3389018832655166
Epoch: 75, step: 335, loss: 0.3188161551952362, mean loss: 0.33890169837535067
Epoch: 75, step: 336, loss: 0.31088557839393616, mean loss: 0.3389014404878908
Epoch: 75, step: 337, loss: 0.32952576875686646, mean loss: 0.3389013541859363
Epoch: 75, step: 338, loss: 0.2939491868019104, mean loss: 0.3389009404103365
Epoch: 75, step: 339, loss: 0.35569438338279724, mean loss: 0.3389010949891562
Epoch: 75, step: 340, loss: 0.36694303154945374, mean loss: 0.3389013531047531
Epoch: 75, step: 341, loss: 0.3156510293483734, mean loss: 0.3389011390961399
Epoch: 75, step: 342, loss: 0.35335054993629456, mean loss: 0.3389012720951443
Epoch: 75, step: 343, loss: 0.33494868874549866, mean loss: 0.3389012357140892
Epoch: 75, step: 344, loss: 0.39367496967315674, mean loss: 0.33890173986737704
Epoch: 75, step: 345, loss: 0.3370376527309418, mean loss: 0.33890172270993785
Epoch: 75, step: 346, loss: 0.3309057354927063, mean loss: 0.33890164911391385
Epoch: 75, step: 347, loss: 0.3204253911972046, mean loss: 0.3389014790577884
Epoch: 75, step: 348, loss: 0.32470428943634033, mean loss: 0.3389013483875602
Epoch: 75, step: 349, loss: 0.33120042085647583, mean loss: 0.338901277509258
Epoch: 75, step: 350, loss: 0.31682372093200684, mean loss: 0.3389010743122642
Epoch: 75, step: 351, loss: 0.3598521649837494, mean loss: 0.3389012671397379
Epoch: 75, step: 352, loss: 0.3724671006202698, mean loss: 0.33890157606662885
Epoch: 75, step: 353, loss: 0.34723567962646484, mean loss: 0.33890165276977424
Epoch: 75, step: 354, loss: 0.3224221467971802, mean loss: 0.3389015011015954
Epoch: 75, step: 355, loss: 0.347262978553772, mean loss: 0.33890157805526067
Epoch: 75, step: 356, loss: 0.358463317155838, mean loss: 0.3389017580872798
Epoch: 75, step: 357, loss: 0.325588583946228, mean loss: 0.3389016355636355
Epoch: 75, step: 358, loss: 0.34414908289909363, mean loss: 0.3389016838564353
Epoch: 75, step: 359, loss: 0.3456065356731415, mean loss: 0.33890174556131125
Epoch: 75, step: 360, loss: 0.3170662224292755, mean loss: 0.3389015446104353
Epoch: 75, step: 361, loss: 0.3136137127876282, mean loss: 0.3389013118903324
Epoch: 75, step: 362, loss: 0.29438647627830505, mean loss: 0.33890090223078306
Epoch: 75, step: 363, loss: 0.32168686389923096, mean loss: 0.3389007438154999
Epoch: 75, step: 364, loss: 0.31640416383743286, mean loss: 0.3389005367885825
Epoch: 75, step: 365, loss: 0.3172101378440857, mean loss: 0.33890033718245965
Epoch: 75, step: 366, loss: 0.3420393764972687, mean loss: 0.3389003660692359
Epoch: 75, step: 367, loss: 0.37013232707977295, mean loss: 0.3389006534763936
Epoch: 75, step: 368, loss: 0.3311944603919983, mean loss: 0.338900582562029
Epoch: 75, step: 369, loss: 0.3478955626487732, mean loss: 0.33890066533538027
Epoch: 75, step: 370, loss: 0.30675289034843445, mean loss: 0.3389003695087569
Epoch: 75, step: 371, loss: 0.37339693307876587, mean loss: 0.33890068694621617
Epoch: 75, step: 372, loss: 0.32534274458885193, mean loss: 0.3389005621871467
Epoch: 75, step: 373, loss: 0.29583966732025146, mean loss: 0.3389001659479831
Epoch: 75, step: 374, loss: 0.3205517828464508, mean loss: 0.3388999971107795
Epoch: 75, step: 375, loss: 0.3793000876903534, mean loss: 0.3389003688588249
Epoch: 75, step: 376, loss: 0.33675748109817505, mean loss: 0.3389003491408739
Epoch: 75, step: 377, loss: 0.3174700438976288, mean loss: 0.33890015195004186
Epoch: 75, step: 378, loss: 0.3128693997859955, mean loss: 0.33889991243042755
Epoch: 75, step: 379, loss: 0.3342646062374115, mean loss: 0.33889986977946884
Epoch: 75, step: 380, loss: 0.31019991636276245, mean loss: 0.33889960570430006
Epoch: 75, step: 381, loss: 0.34506163001060486, mean loss: 0.3388996624020449
Epoch: 75, step: 382, loss: 0.3305171728134155, mean loss: 0.338899585274163
Epoch: 75, step: 383, loss: 0.3269885778427124, mean loss: 0.33889947568114626
Epoch: 75, step: 384, loss: 0.32926928997039795, mean loss: 0.3388993870747543
Epoch: 75, step: 385, loss: 0.3010956943035126, mean loss: 0.33889903924989395
Epoch: 75, step: 386, loss: 0.3567909598350525, mean loss: 0.338899203868667
Epoch: 75, step: 387, loss: 0.3122808039188385, mean loss: 0.33889895896214606
Epoch: 75, step: 388, loss: 0.28426092863082886, mean loss: 0.3388984562615017
Epoch: 75, step: 389, loss: 0.3096563518047333, mean loss: 0.3388981872201506
Epoch: 75, step: 390, loss: 0.3391667604446411, mean loss: 0.33889818969113
Epoch: 75, step: 391, loss: 0.31275686621665955, mean loss: 0.33889794918287297
Epoch: 75, step: 392, loss: 0.33351823687553406, mean loss: 0.3388978996883121
Epoch: 75, step: 393, loss: 0.3254089057445526, mean loss: 0.33889777558768147
Epoch: 75, step: 394, loss: 0.31759631633758545, mean loss: 0.33889757961308054
Epoch: 75, step: 395, loss: 0.3426751494407654, mean loss: 0.33889761436661175
Epoch: 75, step: 396, loss: 0.34095969796180725, mean loss: 0.3388976333375456
Epoch: 75, step: 397, loss: 0.31626227498054504, mean loss: 0.3388974250967467
Epoch: 75, step: 398, loss: 0.3022410273551941, mean loss: 0.3388970878682741
Epoch: 75, step: 399, loss: 0.33686360716819763, mean loss: 0.33889706916099993
Epoch: 75, step: 400, loss: 0.3040718734264374, mean loss: 0.3388967487849617
Epoch: 75, step: 401, loss: 0.32608136534690857, mean loss: 0.3388966308903191
Epoch: 75, step: 402, loss: 0.32264599204063416, mean loss: 0.3388964813945476
Epoch: 75, step: 403, loss: 0.30936309695243835, mean loss: 0.3388962097082762
Epoch: 75, step: 404, loss: 0.3654313385486603, mean loss: 0.3388964538104688
Epoch: 75, step: 405, loss: 0.3658282160758972, mean loss: 0.33889670155909596
Epoch: 75, step: 406, loss: 0.33020684123039246, mean loss: 0.3388966216207265
Epoch: 75, step: 407, loss: 0.3408406674861908, mean loss: 0.3388966395039169
Epoch: 75, step: 408, loss: 0.32009488344192505, mean loss: 0.338896466549
Epoch: 75, step: 409, loss: 0.29102444648742676, mean loss: 0.33889602618454356
Epoch: 75, step: 410, loss: 0.312515527009964, mean loss: 0.33889578351821564
Epoch: 75, step: 411, loss: 0.3023892641067505, mean loss: 0.3388954477087428
Epoch: 75, step: 412, loss: 0.3354949951171875, mean loss: 0.3388954164295711
Epoch: 75, step: 413, loss: 0.3305092453956604, mean loss: 0.3388953392898188
Epoch: 75, step: 414, loss: 0.2998602092266083, mean loss: 0.33889498023053477
Epoch: 75, step: 415, loss: 0.34613654017448425, mean loss: 0.3388950468404169
Epoch: 75, step: 416, loss: 0.3309978246688843, mean loss: 0.33889497420023945
Epoch: 75, step: 417, loss: 0.34833818674087524, mean loss: 0.3388950610599365
Epoch: 75, step: 418, loss: 0.34447237849235535, mean loss: 0.33889511236023756
Epoch: 75, step: 419, loss: 0.328379362821579, mean loss: 0.3388950156370078
Epoch: 75, step: 420, loss: 0.33151280879974365, mean loss: 0.3388949477365393
Epoch: 75, step: 421, loss: 0.3372901976108551, mean loss: 0.338894932976416
Epoch: 75, step: 422, loss: 0.3628585934638977, mean loss: 0.3388951533866373
Epoch: 75, step: 423, loss: 0.3436304032802582, mean loss: 0.3388951969395777
Epoch: 75, step: 424, loss: 0.32437455654144287, mean loss: 0.3388950633857456
Epoch: 75, step: 425, loss: 0.3321690559387207, mean loss: 0.33889500152374896
Epoch: 75, step: 426, loss: 0.30610570311546326, mean loss: 0.3388946999491777
Epoch: 75, step: 427, loss: 0.3738724887371063, mean loss: 0.33889502164909663
Epoch: 75, step: 428, loss: 0.3143687844276428, mean loss: 0.33889479607691975
Epoch: 75, step: 429, loss: 0.3108590543270111, mean loss: 0.3388945382295754
Epoch: 75, step: 430, loss: 0.3154233396053314, mean loss: 0.33889432236474726
Epoch: 75, step: 431, loss: 0.3141111433506012, mean loss: 0.3388940944357198
Epoch: 75, step: 432, loss: 0.3084504008293152, mean loss: 0.3388938144499417
Epoch: 75, step: 433, loss: 0.30229783058166504, mean loss: 0.33889347788563
Epoch: 75, step: 434, loss: 0.37988585233688354, mean loss: 0.33889385487900336
Epoch: 75, step: 435, loss: 0.3341413736343384, mean loss: 0.3388938111723998
Epoch: 75, step: 436, loss: 0.3487972021102905, mean loss: 0.33889390224895094
Epoch: 75, step: 437, loss: 0.33463427424430847, mean loss: 0.33889386307563524
Epoch: 75, step: 438, loss: 0.37819504737854004, mean loss: 0.3388942245023938
Epoch: 75, step: 439, loss: 0.3259979784488678, mean loss: 0.3388941059053177
Epoch: 75, step: 440, loss: 0.29145175218582153, mean loss: 0.3388936696176827
Epoch: 75, step: 441, loss: 0.3018982410430908, mean loss: 0.3388933294048066
Epoch: 75, step: 442, loss: 0.33725202083587646, mean loss: 0.33889331431134245
Epoch: 75, step: 443, loss: 0.35852140188217163, mean loss: 0.3388934948094625
Epoch: 75, step: 444, loss: 0.33999496698379517, mean loss: 0.338893504938408
Epoch: 75, step: 445, loss: 0.29558658599853516, mean loss: 0.3388931066992181
Epoch: 75, step: 446, loss: 0.35713884234428406, mean loss: 0.3388932744807261
Epoch: 75, step: 447, loss: 0.35236895084381104, mean loss: 0.33889339839727045
Epoch: 75, step: 448, loss: 0.341655969619751, mean loss: 0.33889342380045784
Epoch: 75, step: 449, loss: 0.346895307302475, mean loss: 0.3388934973809958
Epoch: 75, step: 450, loss: 0.34500375390052795, mean loss: 0.338893553566746
Epoch: 75, step: 451, loss: 0.3359825611114502, mean loss: 0.33889352679949153
Epoch: 75, step: 452, loss: 0.3345394432544708, mean loss: 0.33889348676304615
Epoch: 75, step: 453, loss: 0.3546368479728699, mean loss: 0.33889363152426144
Epoch: 75, step: 454, loss: 0.37700992822647095, mean loss: 0.33889398200282983
Epoch: 75, step: 455, loss: 0.32604047656059265, mean loss: 0.33889386381619696
Epoch: 75, step: 456, loss: 0.30649369955062866, mean loss: 0.33889356590282804
Epoch: 75, step: 457, loss: 0.35157668590545654, mean loss: 0.3388936825206401
Epoch: 75, step: 458, loss: 0.3238755464553833, mean loss: 0.33889354443426506
Epoch: 75, step: 459, loss: 0.31239819526672363, mean loss: 0.3388933008212716
Epoch: 75, step: 460, loss: 0.3034193515777588, mean loss: 0.3388929746570285
Epoch: 75, step: 461, loss: 0.3140823543071747, mean loss: 0.33889274653856477
Epoch: 75, step: 462, loss: 0.35852065682411194, mean loss: 0.3388929270035233
Epoch: 75, step: 463, loss: 0.3349675238132477, mean loss: 0.33889289091250796
Epoch: 75, step: 464, loss: 0.3333437740802765, mean loss: 0.3388928398931834
Epoch: 75, step: 465, loss: 0.3737681210041046, mean loss: 0.33889316053824814
Epoch: 75, step: 466, loss: 0.34244781732559204, mean loss: 0.3388931932196385
Epoch: 75, step: 467, loss: 0.3159058690071106, mean loss: 0.33889298187692546
Epoch: 75, step: 468, loss: 0.3359925448894501, mean loss: 0.3388929552108994
Epoch: 75, step: 469, loss: 0.35376328229904175, mean loss: 0.3388930919243966
Epoch: 75, step: 470, loss: 0.377403199672699, mean loss: 0.3388934459719621
Epoch: 75, step: 471, loss: 0.339450478553772, mean loss: 0.3388934510930648
Epoch: 75, step: 472, loss: 0.2987232506275177, mean loss: 0.33889308179001654
Epoch: 75, step: 473, loss: 0.3359200954437256, mean loss: 0.3388930544582429
Epoch: 75, step: 474, loss: 0.37171831727027893, mean loss: 0.33889335623036715
Epoch: 75, step: 475, loss: 0.2815278172492981, mean loss: 0.33889282885724276
Epoch: 75, step: 476, loss: 0.329476922750473, mean loss: 0.3388927422956892
Epoch: 75, step: 477, loss: 0.3046576976776123, mean loss: 0.3388924275717136
Epoch: 75, step: 478, loss: 0.3256274163722992, mean loss: 0.3388923056271177
Epoch: 75, step: 479, loss: 0.3218023180961609, mean loss: 0.33889214852114663
Epoch: 75, step: 480, loss: 0.3127422630786896, mean loss: 0.33889190813095493
Epoch: 75, step: 481, loss: 0.3202517628669739, mean loss: 0.3388917367777415
Epoch: 75, step: 482, loss: 0.34475237131118774, mean loss: 0.3388917906522856
Epoch: 75, step: 483, loss: 0.3440760672092438, mean loss: 0.33889183830889463
Epoch: 75, step: 484, loss: 0.35025638341903687, mean loss: 0.338891942776837
Epoch: 75, step: 485, loss: 0.3173253834247589, mean loss: 0.33889174452927434
Epoch: 75, step: 486, loss: 0.3582685589790344, mean loss: 0.33889192264627777
Epoch: 75, step: 487, loss: 0.3192414343357086, mean loss: 0.3388917420152494
Epoch: 75, step: 488, loss: 0.3298594653606415, mean loss: 0.3388916589896066
Epoch: 75, step: 489, loss: 0.3148643374443054, mean loss: 0.3388914381299546
Epoch: 75, step: 490, loss: 0.3375309109687805, mean loss: 0.33889142562407487
Epoch: 75, step: 491, loss: 0.28479504585266113, mean loss: 0.3388909283781398
Epoch: 75, step: 492, loss: 0.3262963891029358, mean loss: 0.33889081261205856
Epoch: 75, step: 493, loss: 0.34186291694641113, mean loss: 0.3388908399307005
Epoch: 75, step: 494, loss: 0.3259102404117584, mean loss: 0.33889072061823655
Epoch: 75, step: 495, loss: 0.3316788375377655, mean loss: 0.3388906543301094
Epoch: 75, step: 496, loss: 0.30724039673805237, mean loss: 0.3388903634189851
Epoch: 75, step: 497, loss: 0.33349746465682983, mean loss: 0.3388903138509897
Epoch: 75, step: 498, loss: 0.3001599907875061, mean loss: 0.3388899578704838
Epoch: 75, step: 499, loss: 0.3855046331882477, mean loss: 0.3388903863141908
Epoch: 75, step: 500, loss: 0.33833691477775574, mean loss: 0.33889038122718296
Epoch: 75, step: 501, loss: 0.3611319959163666, mean loss: 0.3388905856500308
Epoch: 75, step: 502, loss: 0.3168778121471405, mean loss: 0.3388903833323235
Epoch: 75, step: 503, loss: 0.3022763133049011, mean loss: 0.3388900468183164
Epoch: 75, step: 504, loss: 0.339839369058609, mean loss: 0.3388900555433037
Epoch: 75, step: 505, loss: 0.37712711095809937, mean loss: 0.3388904069674477
Epoch: 75, step: 506, loss: 0.3285609483718872, mean loss: 0.3388903120336788
Epoch: 75, step: 507, loss: 0.35569852590560913, mean loss: 0.33889046650958016
Epoch: 75, step: 508, loss: 0.29533401131629944, mean loss: 0.33889006620762724
Epoch: 75, step: 509, loss: 0.32598164677619934, mean loss: 0.33888994757497004
Epoch: 75, step: 510, loss: 0.32084977626800537, mean loss: 0.3388897817813342
Epoch: 75, step: 511, loss: 0.37404677271842957, mean loss: 0.33889010487980625
Epoch: 75, step: 512, loss: 0.33423787355422974, mean loss: 0.33889006212543565
Epoch: 75, step: 513, loss: 0.32709696888923645, mean loss: 0.33888995374698033
Epoch: 75, step: 514, loss: 0.31334903836250305, mean loss: 0.3388897190282799
Epoch: 75, step: 515, loss: 0.3552802801132202, mean loss: 0.33888986965466833
Epoch: 75, step: 516, loss: 0.32532522082328796, mean loss: 0.3388897449990646
Epoch: 75, step: 517, loss: 0.3569159209728241, mean loss: 0.338889910653423
Epoch: 75, step: 518, loss: 0.3108035922050476, mean loss: 0.33888965255218656
Epoch: 75, step: 519, loss: 0.35225775837898254, mean loss: 0.3388897753982243
Epoch: 75, step: 520, loss: 0.28399595618247986, mean loss: 0.3388892709568093
Epoch: 75, step: 521, loss: 0.30408790707588196, mean loss: 0.3388889511559981
Epoch: 75, step: 522, loss: 0.32559460401535034, mean loss: 0.33888882899113276
Epoch: 75, step: 523, loss: 0.30833008885383606, mean loss: 0.3388885481823026
Epoch: 75, step: 524, loss: 0.3620982766151428, mean loss: 0.33888876145800606
Epoch: 75, step: 525, loss: 0.3385457694530487, mean loss: 0.3388887583062592
Epoch: 75, step: 526, loss: 0.32925212383270264, mean loss: 0.3388886697562259
Epoch: 75, step: 527, loss: 0.34636130928993225, mean loss: 0.3388887384209035
Epoch: 75, step: 528, loss: 0.3406764566898346, mean loss: 0.3388887548477591
Epoch: 75, step: 529, loss: 0.34050771594047546, mean loss: 0.3388887697238143
Epoch: 75, step: 530, loss: 0.2968570291996002, mean loss: 0.33888838351271156
Epoch: 75, step: 531, loss: 0.3729393184185028, mean loss: 0.3388886963888409
Epoch: 75, step: 532, loss: 0.36818644404411316, mean loss: 0.33888896558795933
Epoch: 75, step: 533, loss: 0.3371583819389343, mean loss: 0.3388889496868287
Epoch: 75, step: 534, loss: 0.3255458474159241, mean loss: 0.3388888270874602
Epoch: 75, step: 535, loss: 0.3538390100002289, mean loss: 0.3388889644517782
Epoch: 75, step: 536, loss: 0.3847019374370575, mean loss: 0.33888938538374974
Epoch: 75, step: 537, loss: 0.369590163230896, mean loss: 0.3388896674614969
Epoch: 75, step: 538, loss: 0.3192098140716553, mean loss: 0.3388894866453061
Epoch: 75, step: 539, loss: 0.33130061626434326, mean loss: 0.3388894169202934
Epoch: 75, step: 540, loss: 0.3167564868927002, mean loss: 0.33888921356925816
Epoch: 75, step: 541, loss: 0.3482726812362671, mean loss: 0.3388892997810851
Epoch: 75, step: 542, loss: 0.3526421785354614, mean loss: 0.33888942613628253
Epoch: 75, step: 543, loss: 0.3383261263370514, mean loss: 0.3388894209609876
Epoch: 75, step: 544, loss: 0.3322717249393463, mean loss: 0.3388893601617224
Epoch: 75, step: 545, loss: 0.3618685305118561, mean loss: 0.33888957127807345
Epoch: 75, step: 546, loss: 0.3349854052066803, mean loss: 0.33888953540968875
Epoch: 75, step: 547, loss: 0.3307475447654724, mean loss: 0.33888946060821656
Epoch: 75, step: 548, loss: 0.39859575033187866, mean loss: 0.33889000913222433
Epoch: 75, step: 549, loss: 0.3482725918292999, mean loss: 0.3388900953295849
Epoch: 75, step: 550, loss: 0.31493085622787476, mean loss: 0.33888987521916697
Epoch: 75, step: 551, loss: 0.3196234107017517, mean loss: 0.3388896982222857
Epoch: 75, step: 552, loss: 0.3361375033855438, mean loss: 0.3388896729386937
Epoch: 75, step: 553, loss: 0.3308689296245575, mean loss: 0.33888959925519735
Epoch: 75, step: 554, loss: 0.35597851872444153, mean loss: 0.3388897562431122
Epoch: 75, step: 555, loss: 0.33574190735816956, mean loss: 0.3388897273255616
Epoch: 75, step: 556, loss: 0.3018980026245117, mean loss: 0.33888938750612235
Epoch: 75, step: 557, loss: 0.310939222574234, mean loss: 0.3388891307480988
Epoch: 75, step: 558, loss: 0.38170820474624634, mean loss: 0.33888952409246165
Epoch: 75, step: 559, loss: 0.3774980902671814, mean loss: 0.3388898787550207
Epoch: 75, step: 560, loss: 0.31689003109931946, mean loss: 0.33888967666384334
Epoch: 75, step: 561, loss: 0.33908718824386597, mean loss: 0.33888967847817325
Epoch: 75, step: 562, loss: 0.35206082463264465, mean loss: 0.3388897994664443
Epoch: 75, step: 563, loss: 0.32885250449180603, mean loss: 0.3388897072661304
Epoch: 75, step: 564, loss: 0.32236170768737793, mean loss: 0.3388895554450715
Epoch: 75, step: 565, loss: 0.3194136619567871, mean loss: 0.3388893765472201
Epoch: 75, step: 566, loss: 0.3545840084552765, mean loss: 0.33888952071057454
Epoch: 75, step: 567, loss: 0.32375267148017883, mean loss: 0.33888938167202115
Epoch: 75, step: 568, loss: 0.3083999752998352, mean loss: 0.3388891016161157
Epoch: 75, step: 569, loss: 0.3355824053287506, mean loss: 0.338889071243228
Epoch: 75, step: 570, loss: 0.360319048166275, mean loss: 0.33888926808147624
Epoch: 75, step: 571, loss: 0.3474794328212738, mean loss: 0.33888934698298206
Epoch: 75, step: 572, loss: 0.3151487112045288, mean loss: 0.33888912892491646
Epoch: 75, step: 573, loss: 0.3427075147628784, mean loss: 0.3388891639965207
Epoch: 75, step: 574, loss: 0.3312492072582245, mean loss: 0.3388890938247022
Epoch: 75, step: 575, loss: 0.33400487899780273, mean loss: 0.3388890489643581
Epoch: 75, step: 576, loss: 0.32728567719459534, mean loss: 0.3388889423911446
Epoch: 75, step: 577, loss: 0.33298182487487793, mean loss: 0.3388888881366807
Epoch: 75, step: 578, loss: 0.34531688690185547, mean loss: 0.33888894717468404
Epoch: 75, step: 579, loss: 0.34917396306991577, mean loss: 0.3388890416366228
Epoch: 75, step: 580, loss: 0.3180161118507385, mean loss: 0.3388888499325625
Epoch: 75, step: 581, loss: 0.3242436349391937, mean loss: 0.33888871542718063
Epoch: 75, step: 582, loss: 0.3222827911376953, mean loss: 0.3388885629155462
Epoch: 75, step: 583, loss: 0.32592135667800903, mean loss: 0.33888844382361133
Epoch: 75, step: 584, loss: 0.3383024036884308, mean loss: 0.33888843844141786
Epoch: 75, step: 585, loss: 0.32515400648117065, mean loss: 0.338888312305533
Epoch: 75, step: 586, loss: 0.3599832355976105, mean loss: 0.33888850603778103
Epoch: 75, step: 587, loss: 0.3442706763744354, mean loss: 0.33888855546627944
Epoch: 75, step: 588, loss: 0.3506048321723938, mean loss: 0.33888866306462917
Epoch: 75, step: 589, loss: 0.35670819878578186, mean loss: 0.33888882671175674
Epoch: 75, step: 590, loss: 0.3322840929031372, mean loss: 0.338888766057214
Epoch: 75, step: 591, loss: 0.3512430489063263, mean loss: 0.3388888795116721
Epoch: 75, step: 592, loss: 0.3833940625190735, mean loss: 0.33888928821730985
Epoch: 75, step: 593, loss: 0.32668110728263855, mean loss: 0.33888917610662483
Epoch: 75, step: 594, loss: 0.28373268246650696, mean loss: 0.33888866959582414
Epoch: 75, step: 595, loss: 0.3307057321071625, mean loss: 0.33888859445130565
Epoch: 75, step: 596, loss: 0.35655543208122253, mean loss: 0.33888875668568885
Epoch: 75, step: 597, loss: 0.35356706380844116, mean loss: 0.33888889147519025
Epoch: 75, step: 598, loss: 0.36752232909202576, mean loss: 0.33888915441091616
Epoch: 75, step: 599, loss: 0.30748724937438965, mean loss: 0.338888866055498
Epoch: 75, step: 600, loss: 0.3851783573627472, mean loss: 0.33888929111579413
Epoch: 75, step: 601, loss: 0.33903613686561584, mean loss: 0.3388892924642152
Epoch: 75, step: 602, loss: 0.340585321187973, mean loss: 0.33888930803797096
Epoch: 75, step: 603, loss: 0.3052721321582794, mean loss: 0.3388889993516428
Epoch: 75, step: 604, loss: 0.3415583074092865, mean loss: 0.3388890238620698
Epoch: 75, step: 605, loss: 0.29537448287010193, mean loss: 0.3388886243015223
Epoch: 75, step: 606, loss: 0.3285382390022278, mean loss: 0.33888852926277085
Epoch: 75, step: 607, loss: 0.34950628876686096, mean loss: 0.3388886267556961
Epoch: 75, step: 608, loss: 0.3331119418144226, mean loss: 0.33888857371430425
Epoch: 75, step: 609, loss: 0.2831275761127472, mean loss: 0.33888806172277364
Epoch: 75, step: 610, loss: 0.33502185344696045, mean loss: 0.33888802622398767
Epoch: 75, step: 611, loss: 0.32663652300834656, mean loss: 0.338887913734058
Epoch: 75, step: 612, loss: 0.28948715329170227, mean loss: 0.33888746015404053
Epoch: 75, step: 613, loss: 0.3355467617511749, mean loss: 0.33888742948123074
Epoch: 75, step: 614, loss: 0.32535216212272644, mean loss: 0.33888730520755533
Epoch: 75, step: 615, loss: 0.3174721300601959, mean loss: 0.3388871085865341
Epoch: 75, step: 616, loss: 0.32871192693710327, mean loss: 0.33888701516510633
Epoch: 75, step: 617, loss: 0.36371251940727234, mean loss: 0.33888724309349505
Epoch: 75, step: 618, loss: 0.311085969209671, mean loss: 0.3388869878462573
Epoch: 75, step: 619, loss: 0.3466292917728424, mean loss: 0.3388870589287392
Epoch: 75, step: 620, loss: 0.33579134941101074, mean loss: 0.3388870305071353
Epoch: 75, step: 621, loss: 0.3298742473125458, mean loss: 0.33888694776183875
Epoch: 75, step: 622, loss: 0.3897903263568878, mean loss: 0.33888741509544684
Epoch: 75, step: 623, loss: 0.35115453600883484, mean loss: 0.3388875277163652
Epoch: 75, step: 624, loss: 0.3685818910598755, mean loss: 0.33888780032929466
Epoch: 75, step: 625, loss: 0.3311308026313782, mean loss: 0.3388877291158314
Epoch: 75, step: 626, loss: 0.33895421028137207, mean loss: 0.3388877297261591
Epoch: 75, step: 627, loss: 0.3868120610713959, mean loss: 0.3388881696895418
Epoch: 75, step: 628, loss: 0.3423655927181244, mean loss: 0.3388882016132997
Epoch: 75, step: 629, loss: 0.34231191873550415, mean loss: 0.3388882330437332
Epoch: 75, step: 630, loss: 0.33381155133247375, mean loss: 0.3388881864391697
Epoch: 75, step: 631, loss: 0.31868916749954224, mean loss: 0.3388880010113896
Epoch: 75, step: 632, loss: 0.309565931558609, mean loss: 0.33888773183612175
Epoch: 75, step: 633, loss: 0.3022438883781433, mean loss: 0.3388873954503886
Epoch: 75, step: 634, loss: 0.3351493179798126, mean loss: 0.33888736113563694
Epoch: 75, step: 635, loss: 0.31059730052948, mean loss: 0.33888710144131545
Epoch: 75, step: 636, loss: 0.35509318113327026, mean loss: 0.33888725020692945
Epoch: 75, step: 637, loss: 0.323113352060318, mean loss: 0.33888710540990596
Epoch: 75, step: 638, loss: 0.3589685559272766, mean loss: 0.33888728974655785
Epoch: 75, step: 639, loss: 0.2941361665725708, mean loss: 0.33888687895967357
Epoch: 75, step: 640, loss: 0.332815021276474, mean loss: 0.33888682322438857
Epoch: 75, step: 641, loss: 0.36279693245887756, mean loss: 0.33888704269997405
Epoch: 75, step: 642, loss: 0.3711397647857666, mean loss: 0.33888733875132276
Epoch: 75, step: 643, loss: 0.328774094581604, mean loss: 0.3388872459215738
Epoch: 75, step: 644, loss: 0.3213634192943573, mean loss: 0.33888708507135923
Epoch: 75, step: 645, loss: 0.3107457756996155, mean loss: 0.3388868267662414
Epoch: 75, step: 646, loss: 0.33358079195022583, mean loss: 0.33888677806334166
Epoch: 75, step: 647, loss: 0.31634849309921265, mean loss: 0.3388865711913939
Epoch: 75, step: 648, loss: 0.31284669041633606, mean loss: 0.3388863321815749
Epoch: 75, step: 649, loss: 0.32727643847465515, mean loss: 0.33888622561990706
Epoch: 75, step: 650, loss: 0.383811354637146, mean loss: 0.33888663796241897
Epoch: 75, step: 651, loss: 0.35044652223587036, mean loss: 0.33888674406312636
Epoch: 75, step: 652, loss: 0.35268324613571167, mean loss: 0.33888687069114093
Epoch: 75, step: 653, loss: 0.3226386606693268, mean loss: 0.33888672156205873
Epoch: 75, step: 654, loss: 0.3093739449977875, mean loss: 0.33888645069081313
Epoch: 75, step: 655, loss: 0.35022735595703125, mean loss: 0.33888655477783236
Epoch: 75, step: 656, loss: 0.30820411443710327, mean loss: 0.3388862731764636
Epoch: 75, step: 657, loss: 0.3416908383369446, mean loss: 0.3388862989163373
Epoch: 75, step: 658, loss: 0.29041630029678345, mean loss: 0.3388858540701234
Epoch: 75, step: 659, loss: 0.2917531430721283, mean loss: 0.33888542150118983
Epoch: 75, step: 660, loss: 0.2981601357460022, mean loss: 0.3388850477409843
Epoch: 75, step: 661, loss: 0.33533740043640137, mean loss: 0.33888501518241065
Epoch: 75, step: 662, loss: 0.3620864748954773, mean loss: 0.33888522811211813
Epoch: 75, step: 663, loss: 0.3611927032470703, mean loss: 0.33888543283546835
Epoch: 75, step: 664, loss: 0.33724698424339294, mean loss: 0.33888541779900166
Epoch: 75, step: 665, loss: 0.3090277314186096, mean loss: 0.33888514378980267
Epoch: 75, step: 666, loss: 0.3102273643016815, mean loss: 0.3388848807947722
Epoch: 75, step: 667, loss: 0.3091577887535095, mean loss: 0.3388846079890674
Epoch: 75, step: 668, loss: 0.31537264585494995, mean loss: 0.3388843922216277
Epoch: 75, step: 669, loss: 0.3131362497806549, mean loss: 0.3388841559351044
Epoch: 75, step: 670, loss: 0.30567654967308044, mean loss: 0.33888385119708914
Epoch: 75, step: 671, loss: 0.2837870121002197, mean loss: 0.3388833455916208
Epoch: 75, step: 672, loss: 0.3161854147911072, mean loss: 0.33888313730212893
Epoch: 75, step: 673, loss: 0.33927541971206665, mean loss: 0.3388831409019088
Epoch: 75, step: 674, loss: 0.3291308581829071, mean loss: 0.3388830514108997
Epoch: 75, step: 675, loss: 0.34885963797569275, mean loss: 0.3388831429593743
Epoch: 75, step: 676, loss: 0.3339601457118988, mean loss: 0.33888309778472964
Epoch: 75, step: 677, loss: 0.35358506441116333, mean loss: 0.33888323269238646
Epoch: 75, step: 678, loss: 0.3218037784099579, mean loss: 0.3388830759699511
Epoch: 75, step: 679, loss: 0.29768964648246765, mean loss: 0.33888269797922355
Epoch: 75, step: 680, loss: 0.34852778911590576, mean loss: 0.33888278648172526
Epoch: 75, step: 681, loss: 0.333863228559494, mean loss: 0.33888274042312916
Epoch: 75, step: 682, loss: 0.33879172801971436, mean loss: 0.33888273958802273
Epoch: 75, step: 683, loss: 0.27086612582206726, mean loss: 0.33888211549078123
Epoch: 75, step: 684, loss: 0.38596951961517334, mean loss: 0.33888254754477143
Epoch: 75, step: 685, loss: 0.32874831557273865, mean loss: 0.33888245455822297
Epoch: 75, step: 686, loss: 0.29871484637260437, mean loss: 0.33888208600410014
Epoch: 75, step: 687, loss: 0.3197121322154999, mean loss: 0.33888191011360036
Epoch: 75, step: 688, loss: 0.31516292691230774, mean loss: 0.3388816924862875
Epoch: 75, step: 689, loss: 0.30271461606025696, mean loss: 0.338881360647803
Epoch: 75, step: 690, loss: 0.33693841099739075, mean loss: 0.33888134282110494
Epoch: 75, step: 691, loss: 0.35374316573143005, mean loss: 0.33888147917811196
Epoch: 75, step: 692, loss: 0.3518916666507721, mean loss: 0.3388815985452958
Epoch: 75, step: 693, loss: 0.34212082624435425, mean loss: 0.33888162826461704
Epoch: 75, step: 694, loss: 0.36071059107780457, mean loss: 0.33888182853951787
Epoch: 75, step: 695, loss: 0.3629166781902313, mean loss: 0.3388820490508178
Epoch: 75, step: 696, loss: 0.31271347403526306, mean loss: 0.3388818089655401
Epoch: 75, step: 697, loss: 0.337078720331192, mean loss: 0.338881792423139
Epoch: 75, step: 698, loss: 0.31435492634773254, mean loss: 0.33888156740395464
Epoch: 75, step: 699, loss: 0.3030426502227783, mean loss: 0.3388812386065493
Epoch: 75, step: 700, loss: 0.3214002251625061, mean loss: 0.3388810782317505
Epoch: 75, step: 701, loss: 0.34954556822776794, mean loss: 0.33888117606931306
Epoch: 75, step: 702, loss: 0.3229559659957886, mean loss: 0.3388810299704894
Epoch: 75, step: 703, loss: 0.3229671120643616, mean loss: 0.33888088397660016
Epoch: 75, step: 704, loss: 0.3054385185241699, mean loss: 0.33888057717998116
Epoch: 75, step: 705, loss: 0.32194802165031433, mean loss: 0.33888042184398565
Epoch: 75, step: 706, loss: 0.31187155842781067, mean loss: 0.3388801740721598
Epoch: 75, step: 707, loss: 0.34834951162338257, mean loss: 0.3388802609404406
Epoch: 75, step: 708, loss: 0.32871121168136597, mean loss: 0.3388801676541132
Epoch: 75, step: 709, loss: 0.3275285065174103, mean loss: 0.3388800635199867
Epoch: 75, step: 710, loss: 0.34910646080970764, mean loss: 0.33888015733067817
Epoch: 75, step: 711, loss: 0.30352839827537537, mean loss: 0.33887983303831537
Epoch: 75, step: 712, loss: 0.32515737414360046, mean loss: 0.3388797071592102
Epoch: 75, step: 713, loss: 0.37469038367271423, mean loss: 0.33888003565533464
Epoch: 75, step: 714, loss: 0.3716105818748474, mean loss: 0.3388803358942579
Epoch: 75, step: 715, loss: 0.3386375606060028, mean loss: 0.3388803336672886
Epoch: 75, step: 716, loss: 0.332634299993515, mean loss: 0.33888027637316315
Epoch: 75, step: 717, loss: 0.3180316090583801, mean loss: 0.33888008513256695
Epoch: 75, step: 718, loss: 0.3154316246509552, mean loss: 0.33887987004656833
Epoch: 75, step: 719, loss: 0.31664741039276123, mean loss: 0.3388796661164669
Epoch: 75, step: 720, loss: 0.33621710538864136, mean loss: 0.3388796416940095
Epoch: 75, step: 721, loss: 0.33778253197669983, mean loss: 0.33887963163081386
Epoch: 75, step: 722, loss: 0.31153935194015503, mean loss: 0.3388793808554757
Epoch: 75, step: 723, loss: 0.306869775056839, mean loss: 0.33887908725401367
Epoch: 75, step: 724, loss: 0.3658723831176758, mean loss: 0.33887933484214355
Epoch: 75, step: 725, loss: 0.3092874586582184, mean loss: 0.3388790634217834
Epoch: 75, step: 726, loss: 0.3145444393157959, mean loss: 0.33887884022363884
Epoch: 75, step: 727, loss: 0.3728359639644623, mean loss: 0.3388791516768778
Epoch: 75, step: 728, loss: 0.3194107115268707, mean loss: 0.3388789731148425
Epoch: 75, step: 729, loss: 0.3214643597602844, mean loss: 0.338878813391708
Epoch: 75, step: 730, loss: 0.3308781683444977, mean loss: 0.3388787400121641
Epoch: 75, step: 731, loss: 0.3060430586338043, mean loss: 0.3388784388557937
Epoch: 75, step: 732, loss: 0.28993797302246094, mean loss: 0.33887798999658747
Epoch: 75, step: 733, loss: 0.36279037594795227, mean loss: 0.33887820930786605
Epoch: 75, step: 734, loss: 0.30069249868392944, mean loss: 0.3388778590927001
Epoch: 75, step: 735, loss: 0.3293279707431793, mean loss: 0.33887777150797255
Epoch: 75, step: 736, loss: 0.3741686940193176, mean loss: 0.3388780951680376
Epoch: 75, step: 737, loss: 0.3346445858478546, mean loss: 0.3388780563420382
Epoch: 75, step: 738, loss: 0.3192312717437744, mean loss: 0.33887787616077647
Epoch: 75, step: 739, loss: 0.36103835701942444, mean loss: 0.33887807939335957
Epoch: 75, step: 740, loss: 0.3165840804576874, mean loss: 0.3388778749381644
Epoch: 75, step: 741, loss: 0.3565395176410675, mean loss: 0.33887803690917284
Epoch: 75, step: 742, loss: 0.3664330542087555, mean loss: 0.33887828960780825
Epoch: 75, step: 743, loss: 0.3435323238372803, mean loss: 0.33887833228814124
Epoch: 75, step: 744, loss: 0.39271271228790283, mean loss: 0.33887882597771896
Epoch: 75, step: 745, loss: 0.35250529646873474, mean loss: 0.338878950938474
Epoch: 75, step: 746, loss: 0.3969508707523346, mean loss: 0.3388794834787531
Epoch: 75, step: 747, loss: 0.31267839670181274, mean loss: 0.33887924320761764
Epoch: 75, step: 748, loss: 0.3220250606536865, mean loss: 0.33887908865156896
Epoch: 75, step: 749, loss: 0.3079718351364136, mean loss: 0.3388788052287949
Epoch: 75, step: 750, loss: 0.32337939739227295, mean loss: 0.33887866309889386
Epoch: 75, step: 751, loss: 0.3371853232383728, mean loss: 0.33887864757107355
Epoch: 75, step: 752, loss: 0.3022843897342682, mean loss: 0.33887831200710156
Epoch: 75, step: 753, loss: 0.3098212480545044, mean loss: 0.33887804556053425
Epoch: 75, step: 754, loss: 0.3135205805301666, mean loss: 0.33887781304056697
Epoch: 75, step: 755, loss: 0.3007214367389679, mean loss: 0.338877463161823
Epoch: 75, step: 756, loss: 0.32733598351478577, mean loss: 0.3388773573320308
Epoch: 75, step: 757, loss: 0.3223608136177063, mean loss: 0.33887720588469344
Epoch: 75, step: 758, loss: 0.3234333395957947, mean loss: 0.33887706427449815
Epoch: 75, step: 759, loss: 0.3296920955181122, mean loss: 0.33887698005508904
Epoch: 75, step: 760, loss: 0.3689051866531372, mean loss: 0.33887725538913693
Epoch: 75, step: 761, loss: 0.3475019335746765, mean loss: 0.3388773344696433
Epoch: 75, step: 762, loss: 0.36296626925468445, mean loss: 0.3388775553413852
Epoch: 75, step: 763, loss: 0.3194543421268463, mean loss: 0.3388773772513352
Epoch: 75, step: 764, loss: 0.3277018070220947, mean loss: 0.3388772747842722
Epoch: 75, step: 765, loss: 0.3405410945415497, mean loss: 0.33887729003943656
Epoch: 75, step: 766, loss: 0.33392396569252014, mean loss: 0.3388772446240098
Epoch: 75, step: 767, loss: 0.3913741111755371, mean loss: 0.3388777259463642
Epoch: 75, step: 768, loss: 0.3457679748535156, mean loss: 0.33887778911966654
Epoch: 75, step: 769, loss: 0.36006951332092285, mean loss: 0.3388779834143782
Epoch: 75, step: 770, loss: 0.30166754126548767, mean loss: 0.33887764225639716
Epoch: 75, step: 771, loss: 0.32104796171188354, mean loss: 0.33887747878932456
Epoch: 75, step: 772, loss: 0.33909645676612854, mean loss: 0.3388774807969523
Epoch: 75, step: 773, loss: 0.29124486446380615, mean loss: 0.3388770440969474
Epoch: 75, step: 774, loss: 0.31490856409072876, mean loss: 0.3388768243538348
Epoch: 75, step: 775, loss: 0.3919465243816376, mean loss: 0.3388773108925787
Epoch: 75, step: 776, loss: 0.3776629567146301, mean loss: 0.33887766647300194
Epoch: 75, step: 777, loss: 0.31376394629478455, mean loss: 0.33887743623665567
Epoch: 75, step: 778, loss: 0.3041200339794159, mean loss: 0.3388771175923496
Epoch: 75, step: 779, loss: 0.35546809434890747, mean loss: 0.33887726969151316
Epoch: 75, step: 780, loss: 0.2991468608379364, mean loss: 0.3388769054630146
Epoch: 75, step: 781, loss: 0.34673115611076355, mean loss: 0.33887697746619244
Epoch: 75, step: 782, loss: 0.3192759156227112, mean loss: 0.3388767977767647
Epoch: 75, step: 783, loss: 0.3130880892276764, mean loss: 0.338876561365297
Epoch: 75, step: 784, loss: 0.3309398889541626, mean loss: 0.33887648860852554
Epoch: 75, step: 785, loss: 0.3734140992164612, mean loss: 0.3388768052175368
Epoch: 75, step: 786, loss: 0.36882877349853516, mean loss: 0.3388770797870848
Epoch: 75, step: 787, loss: 0.33768537640571594, mean loss: 0.33887706886284585
Epoch: 75, step: 788, loss: 0.2907460331916809, mean loss: 0.33887662765396437
Epoch: 75, step: 789, loss: 0.3112252354621887, mean loss: 0.338876374180757
Epoch: 75, step: 790, loss: 0.3331969082355499, mean loss: 0.33887632211902924
Epoch: 75, step: 791, loss: 0.3232859671115875, mean loss: 0.33887617920887075
Epoch: 75, step: 792, loss: 0.3619261384010315, mean loss: 0.3388763904961137
Epoch: 75, step: 793, loss: 0.3216538727283478, mean loss: 0.3388762326275071
Epoch: 75, step: 794, loss: 0.40365853905677795, mean loss: 0.33887682644304795
Epoch: 75, step: 795, loss: 0.3106081485748291, mean loss: 0.33887656732559296
Epoch: 75, step: 796, loss: 0.32592982053756714, mean loss: 0.3388764486537066
Epoch: 75, step: 797, loss: 0.3804985582828522, mean loss: 0.33887683016491327
Epoch: 75, step: 798, loss: 0.3137396574020386, mean loss: 0.3388765997579181
Epoch: 75, step: 799, loss: 0.3243911862373352, mean loss: 0.3388764669860252
Epoch: 75, step: 800, loss: 0.38129672408103943, mean loss: 0.3388768558024164
Epoch: 75, step: 801, loss: 0.34543880820274353, mean loss: 0.338876915947532
Epoch: 75, step: 802, loss: 0.349465548992157, mean loss: 0.338877012999245
Epoch: 75, step: 803, loss: 0.3176896870136261, mean loss: 0.3388768188053934
Epoch: 75, step: 804, loss: 0.35650745034217834, mean loss: 0.33887698039864333
Epoch: 75, step: 805, loss: 0.32201385498046875, mean loss: 0.3388768258413741
Epoch: 75, step: 806, loss: 0.36523666977882385, mean loss: 0.3388770674376414
Epoch: 75, step: 807, loss: 0.33240512013435364, mean loss: 0.3388770081207508
Epoch: 75, step: 808, loss: 0.32851582765579224, mean loss: 0.33887691315901103
Epoch: 75, step: 809, loss: 0.28832465410232544, mean loss: 0.3388764498443831
Epoch: 75, step: 810, loss: 0.32992368936538696, mean loss: 0.3388763677925232
Epoch: 75, step: 811, loss: 0.3806475102901459, mean loss: 0.33887675062064937
Epoch: 75, step: 812, loss: 0.3079693615436554, mean loss: 0.3388764673602764
Epoch: 75, step: 813, loss: 0.31875744462013245, mean loss: 0.3388762829749295
Epoch: 75, step: 814, loss: 0.32701534032821655, mean loss: 0.33887617427362676
Epoch: 75, step: 815, loss: 0.3162052035331726, mean loss: 0.33887596650418195
Epoch: 75, step: 816, loss: 0.3759401738643646, mean loss: 0.3388763061781774
Epoch: 75, step: 817, loss: 0.29571786522865295, mean loss: 0.33887591065735634
Epoch: 75, step: 818, loss: 0.3697710335254669, mean loss: 0.3388761937897427
Epoch: 75, step: 819, loss: 0.28047841787338257, mean loss: 0.33887565861950886
Epoch: 75, step: 820, loss: 0.30720794200897217, mean loss: 0.33887536841215543
Epoch: 75, step: 821, loss: 0.3127583861351013, mean loss: 0.33887512907469575
Epoch: 75, step: 822, loss: 0.3242685794830322, mean loss: 0.33887499522069986
Epoch: 75, step: 823, loss: 0.31842130422592163, mean loss: 0.3388748077853878
Epoch: 75, step: 824, loss: 0.3408641815185547, mean loss: 0.33887482601561675
Epoch: 75, step: 825, loss: 0.3348017930984497, mean loss: 0.3388747886914876
Epoch: 75, step: 826, loss: 0.3283211886882782, mean loss: 0.3388746919821489
Epoch: 75, step: 827, loss: 0.3240516185760498, mean loss: 0.33887455615015893
Epoch: 75, step: 828, loss: 0.32290202379226685, mean loss: 0.33887440978638433
Epoch: 75, step: 829, loss: 0.3291166126728058, mean loss: 0.338874320371951
Epoch: 75, step: 830, loss: 0.29775065183639526, mean loss: 0.3388739435434739
Epoch: 75, step: 831, loss: 0.2986685335636139, mean loss: 0.3388735751326505
Epoch: 75, step: 832, loss: 0.3059394061565399, mean loss: 0.33887327335253836
Epoch: 75, step: 833, loss: 0.35170283913612366, mean loss: 0.338873390910456
Epoch: 75, step: 834, loss: 0.3496893644332886, mean loss: 0.33887349001682443
Epoch: 75, step: 835, loss: 0.3195146918296814, mean loss: 0.3388733126344924
Epoch: 75, step: 836, loss: 0.34847041964530945, mean loss: 0.3388734005708202
Epoch: 75, step: 837, loss: 0.31721898913383484, mean loss: 0.33887320215769706
Epoch: 75, step: 838, loss: 0.32957905530929565, mean loss: 0.3388731169988918
Epoch: 75, step: 839, loss: 0.3233299255371094, mean loss: 0.33887297458372356
Epoch: 75, step: 840, loss: 0.2972620725631714, mean loss: 0.3388725933255161
Epoch: 75, step: 841, loss: 0.31702226400375366, mean loss: 0.33887239312459144
Epoch: 75, step: 842, loss: 0.3389337658882141, mean loss: 0.3388723936869066
Epoch: 75, step: 843, loss: 0.32555294036865234, mean loss: 0.3388722716513085
Epoch: 75, step: 844, loss: 0.3150612711906433, mean loss: 0.33887205349197497
Epoch: 75, step: 845, loss: 0.33372706174850464, mean loss: 0.3388720063533557
Epoch: 75, step: 846, loss: 0.31507226824760437, mean loss: 0.33887178830120485
Epoch: 75, step: 847, loss: 0.3252103626728058, mean loss: 0.33887166313697253
Epoch: 75, step: 848, loss: 0.33522704243659973, mean loss: 0.33887162974573026
Epoch: 75, step: 849, loss: 0.29311659932136536, mean loss: 0.33887121055168146
Epoch: 75, step: 850, loss: 0.3541956841945648, mean loss: 0.3388713509486878
Epoch: 75, step: 851, loss: 0.33102449774742126, mean loss: 0.3388712790594581
Epoch: 75, step: 852, loss: 0.32126763463020325, mean loss: 0.3388711177845098
Epoch: 75, step: 853, loss: 0.28126904368400574, mean loss: 0.3388705900706917
Epoch: 75, step: 854, loss: 0.3804610073566437, mean loss: 0.3388709710923333
Epoch: 75, step: 855, loss: 0.32453933358192444, mean loss: 0.3388708397973288
Epoch: 75, step: 856, loss: 0.38349440693855286, mean loss: 0.33887124859902856
Epoch: 75, step: 857, loss: 0.2938520908355713, mean loss: 0.33887083617705527
Epoch: 75, step: 858, loss: 0.3259429633617401, mean loss: 0.3388707177454755
Epoch: 75, step: 859, loss: 0.335721492767334, mean loss: 0.3388706888958513
Epoch: 75, step: 860, loss: 0.3183838129043579, mean loss: 0.33887050122006973
Epoch: 75, step: 861, loss: 0.34419089555740356, mean loss: 0.3388705499585899
Epoch: 75, step: 862, loss: 0.3416174352169037, mean loss: 0.3388705751217428
Epoch: 75, step: 863, loss: 0.3217290937900543, mean loss: 0.33887041809670404
Epoch: 75, step: 864, loss: 0.32625311613082886, mean loss: 0.33887030251660083
Epoch: 75, step: 865, loss: 0.3289255201816559, mean loss: 0.33887021141880175
Epoch: 75, step: 866, loss: 0.32848241925239563, mean loss: 0.3388701162637442
Epoch: 75, step: 867, loss: 0.31468668580055237, mean loss: 0.33886989473884255
Epoch: 75, step: 868, loss: 0.27450594305992126, mean loss: 0.3388693051579938
Epoch: 75, step: 869, loss: 0.4720458984375, mean loss: 0.33887052505900395
Epoch: 75, step: 870, loss: 0.29269739985466003, mean loss: 0.338870102115867
Epoch: 75, step: 871, loss: 0.32459527254104614, mean loss: 0.33886997136045743
Epoch: 75, step: 872, loss: 0.3252272605895996, mean loss: 0.3388698463963109
Epoch: 75, step: 873, loss: 0.31914785504341125, mean loss: 0.3388696657489832
Epoch: 75, step: 874, loss: 0.3115159571170807, mean loss: 0.33886941519978575
Epoch: 75, step: 875, loss: 0.35340163111686707, mean loss: 0.33886954830794064
Epoch: 75, step: 876, loss: 0.33193182945251465, mean loss: 0.33886948476233253
Epoch: 75, step: 877, loss: 0.35509973764419556, mean loss: 0.3388696334209715
Epoch: 75, step: 878, loss: 0.32486075162887573, mean loss: 0.338869505109833
Epoch: 75, step: 879, loss: 0.36968597769737244, mean loss: 0.33886978736365775
Epoch: 75, step: 880, loss: 0.3114285171031952, mean loss: 0.3388695360262432
Epoch: 75, step: 881, loss: 0.3224620819091797, mean loss: 0.3388693857500611
Epoch: 75, step: 882, loss: 0.35192906856536865, mean loss: 0.3388695053628471
Epoch: 75, step: 883, loss: 0.3393257260322571, mean loss: 0.3388695095413043
Epoch: 75, step: 884, loss: 0.2953035831451416, mean loss: 0.3388691105311253
Epoch: 75, step: 885, loss: 0.32875943183898926, mean loss: 0.3388690179397794
Epoch: 75, step: 886, loss: 0.2967151403427124, mean loss: 0.3388686318692985
Epoch: 75, step: 887, loss: 0.3258170783519745, mean loss: 0.33886851233644216
Epoch: 75, step: 888, loss: 0.3126547634601593, mean loss: 0.3388682722596132
Epoch: 75, step: 889, loss: 0.3259320855140686, mean loss: 0.3388681537855153
Epoch: 75, step: 890, loss: 0.30923259258270264, mean loss: 0.33886788237522325
Epoch: 75, step: 891, loss: 0.30828964710235596, mean loss: 0.3388676023342379
Epoch: 75, step: 892, loss: 0.3065316677093506, mean loss: 0.3388673061986374
Epoch: 75, step: 893, loss: 0.3427642583847046, mean loss: 0.33886734188697365
Epoch: 75, step: 894, loss: 0.3502437174320221, mean loss: 0.3388674460710072
Epoch: 75, step: 895, loss: 0.3121757507324219, mean loss: 0.3388672016326089
Epoch: 75, step: 896, loss: 0.3450385630130768, mean loss: 0.3388672581484599
Epoch: 75, step: 897, loss: 0.32472267746925354, mean loss: 0.33886712861696044
Epoch: 75, step: 898, loss: 0.34826239943504333, mean loss: 0.3388672146550269
Epoch: 75, step: 899, loss: 0.3894856870174408, mean loss: 0.3388676781941511
Epoch: 75, step: 900, loss: 0.341490775346756, mean loss: 0.3388677022149673
Epoch: 75, step: 901, loss: 0.3141612708568573, mean loss: 0.3388674759697396
Epoch: 75, step: 902, loss: 0.37241119146347046, mean loss: 0.3388677831381827
Epoch: 75, step: 903, loss: 0.3484213054180145, mean loss: 0.33886787062144597
Epoch: 75, step: 904, loss: 0.34316372871398926, mean loss: 0.3388679099590046
Epoch: 75, step: 905, loss: 0.296597421169281, mean loss: 0.3388675228878841
Epoch: 75, step: 906, loss: 0.3133127689361572, mean loss: 0.33886728888499096
Epoch: 75, step: 907, loss: 0.3354349434375763, mean loss: 0.3388672574555586
Epoch: 75, step: 908, loss: 0.34110817313194275, mean loss: 0.33886727797507327
Epoch: 75, step: 909, loss: 0.3211457431316376, mean loss: 0.3388671157048156
Epoch: 75, step: 910, loss: 0.3376680910587311, mean loss: 0.33886710472584236
Epoch: 75, step: 911, loss: 0.3046615421772003, mean loss: 0.33886679152250804
Epoch: 75, step: 912, loss: 0.3045004606246948, mean loss: 0.33886647684997917
Epoch: 75, step: 913, loss: 0.33669090270996094, mean loss: 0.3388664569296929
Epoch: 75, step: 914, loss: 0.3097478449344635, mean loss: 0.33886619031236015
Epoch: 75, step: 915, loss: 0.32534879446029663, mean loss: 0.33886606654481827
Epoch: 75, step: 916, loss: 0.3342643976211548, mean loss: 0.33886602441155217
Epoch: 75, step: 917, loss: 0.33571457862854004, mean loss: 0.3388659955569148
Epoch: 75, step: 918, loss: 0.3181856870651245, mean loss: 0.33886580620974543
Epoch: 75, step: 919, loss: 0.3428248167037964, mean loss: 0.33886584245778145
Epoch: 75, step: 920, loss: 0.35323768854141235, mean loss: 0.3388659740427888
Epoch: 75, step: 921, loss: 0.2950047254562378, mean loss: 0.33886557246390736
Epoch: 75, step: 922, loss: 0.32551467418670654, mean loss: 0.33886545022867964
Epoch: 75, step: 923, loss: 0.3206973075866699, mean loss: 0.3388652838903049
Epoch: 75, step: 924, loss: 0.29250529408454895, mean loss: 0.33886485944544514
Epoch: 75, step: 925, loss: 0.35670241713523865, mean loss: 0.33886502275416003
Epoch: 75, step: 926, loss: 0.3538658916950226, mean loss: 0.33886516009079787
Epoch: 75, step: 927, loss: 0.33598268032073975, mean loss: 0.33886513370122956
Epoch: 75, step: 928, loss: 0.3321956396102905, mean loss: 0.33886507264149185
Epoch: 75, step: 929, loss: 0.34315869212150574, mean loss: 0.33886511194955266
Epoch: 75, step: 930, loss: 0.2789570689201355, mean loss: 0.3388645634967963
Epoch: 75, step: 931, loss: 0.2945040762424469, mean loss: 0.33886415738423536
Epoch: 75, step: 932, loss: 0.33963248133659363, mean loss: 0.3388641644180434
Epoch: 75, step: 933, loss: 0.38075751066207886, mean loss: 0.3388645479373345
Epoch: 75, step: 934, loss: 0.28861770033836365, mean loss: 0.3388640879487997
Epoch: 75, step: 935, loss: 0.3313116431236267, mean loss: 0.33886401881001005
Epoch: 75, step: 936, loss: 0.3499520421028137, mean loss: 0.3388641203142924
Epoch: 75, step: 937, loss: 0.3318779766559601, mean loss: 0.33886405636087275
Epoch: 75, step: 938, loss: 0.32431110739707947, mean loss: 0.33886392313968833
Epoch: 75, step: 939, loss: 0.2923620343208313, mean loss: 0.3388634974541444
Epoch: 75, step: 940, loss: 0.41149142384529114, mean loss: 0.33886416229542554
Epoch: 75, step: 941, loss: 0.30361759662628174, mean loss: 0.33886383964877254
Epoch: 75, step: 942, loss: 0.35323894023895264, mean loss: 0.3388639712370719
Epoch: 75, step: 943, loss: 0.3588969111442566, mean loss: 0.338864154615014
Epoch: 75, step: 944, loss: 0.3204773962497711, mean loss: 0.3388639863074634
Epoch: 75, step: 945, loss: 0.32112613320350647, mean loss: 0.33886382394130715
Epoch: 75, step: 946, loss: 0.3333551287651062, mean loss: 0.33886377351708336
Epoch: 75, step: 947, loss: 0.333146870136261, mean loss: 0.3388637211874903
Epoch: 75, step: 948, loss: 0.2981358766555786, mean loss: 0.3388633483891623
Epoch: 75, step: 949, loss: 0.38005027174949646, mean loss: 0.3388637253861725
Epoch: 75, step: 950, loss: 0.31358861923217773, mean loss: 0.338863494037204
Epoch: 75, step: 951, loss: 0.3321262001991272, mean loss: 0.3388634323697394
Epoch: 75, step: 952, loss: 0.338326632976532, mean loss: 0.33886342745637876
Epoch: 75, step: 953, loss: 0.3171093165874481, mean loss: 0.3388632283413727
Epoch: 75, step: 954, loss: 0.28645116090774536, mean loss: 0.3388627486190037
Epoch: 75, step: 955, loss: 0.3439963757991791, mean loss: 0.33886279560614563
Epoch: 75, step: 956, loss: 0.3768801689147949, mean loss: 0.3388631435689609
Epoch: 75, step: 957, loss: 0.31151607632637024, mean loss: 0.3388628932708844
Epoch: 75, step: 958, loss: 0.31947898864746094, mean loss: 0.338862715858455
Epoch: 75, step: 959, loss: 0.3228623569011688, mean loss: 0.3388625694154845
Epoch: 75, step: 960, loss: 0.2815323770046234, mean loss: 0.33886204470682896
Epoch: 75, step: 961, loss: 0.33433103561401367, mean loss: 0.3388620032376165
Epoch: 75, step: 962, loss: 0.3616480827331543, mean loss: 0.33886221178103465
Epoch: 75, step: 963, loss: 0.30310311913490295, mean loss: 0.3388618845086243
Epoch: 75, step: 964, loss: 0.3849826157093048, mean loss: 0.3388623066083928
Epoch: 75, step: 965, loss: 0.3389168679714203, mean loss: 0.3388623071077372
Epoch: 75, step: 966, loss: 0.3252323865890503, mean loss: 0.3388621823681496
Epoch: 75, step: 967, loss: 0.3334682881832123, mean loss: 0.3388621330042536
Epoch: 75, step: 968, loss: 0.32919400930404663, mean loss: 0.33886204452423
Epoch: 75, step: 969, loss: 0.32454365491867065, mean loss: 0.33886191348744404
Epoch: 75, step: 970, loss: 0.3287172317504883, mean loss: 0.3388618206477909
Epoch: 75, step: 971, loss: 0.3364282548427582, mean loss: 0.33886179837707375
Epoch: 75, step: 972, loss: 0.3576744496822357, mean loss: 0.3388619705390104
Epoch: 75, step: 973, loss: 0.3397832214832306, mean loss: 0.3388619789696613
Epoch: 75, step: 974, loss: 0.33371007442474365, mean loss: 0.3388619318234289
Epoch: 75, step: 975, loss: 0.34014588594436646, mean loss: 0.3388619435730731
Epoch: 75, step: 976, loss: 0.33318251371383667, mean loss: 0.3388618916002896
Epoch: 75, step: 977, loss: 0.32061752676963806, mean loss: 0.33886172464660425
Epoch: 75, step: 978, loss: 0.35326868295669556, mean loss: 0.3388618564830807
Epoch: 75, step: 979, loss: 0.33863356709480286, mean loss: 0.338861854394049
Epoch: 75, step: 980, loss: 0.3562677502632141, mean loss: 0.33886201367055513
Epoch: 75, step: 981, loss: 0.3301135301589966, mean loss: 0.3388619336163512
Epoch: 75, step: 982, loss: 0.30079227685928345, mean loss: 0.3388615852578988
Epoch: 75, step: 983, loss: 0.29415011405944824, mean loss: 0.33886117612690797
Epoch: 75, step: 984, loss: 0.3077815771102905, mean loss: 0.3388608917365615
Epoch: 75, step: 985, loss: 0.32613274455070496, mean loss: 0.3388607752701597
Epoch: 75, step: 986, loss: 0.31984615325927734, mean loss: 0.33886060128220125
Epoch: 75, step: 987, loss: 0.3257300555706024, mean loss: 0.3388604811359298
Epoch: 75, step: 988, loss: 0.34560057520866394, mean loss: 0.33886054280813904
Epoch: 75, step: 989, loss: 0.31207284331321716, mean loss: 0.3388602977015465
Epoch: 75, step: 990, loss: 0.3486195504665375, mean loss: 0.3388603869975797
Epoch: 75, step: 991, loss: 0.33917397260665894, mean loss: 0.3388603898668255
Epoch: 75, step: 992, loss: 0.34188416600227356, mean loss: 0.33886041753352086
Epoch: 75, step: 993, loss: 0.3089594542980194, mean loss: 0.33886014395067793
Epoch: 75, step: 994, loss: 0.34466731548309326, mean loss: 0.33886019708368065
Epoch: 75, step: 995, loss: 0.2937256395816803, mean loss: 0.3388597841265962
Epoch: 75, step: 996, loss: 0.35444176197052, mean loss: 0.33885992669206316
Epoch: 75, step: 997, loss: 0.3328498303890228, mean loss: 0.3388598717038996
Epoch: 75, step: 998, loss: 0.2901724874973297, mean loss: 0.3388594262525761
Epoch: 75, step: 999, loss: 0.3280036449432373, mean loss: 0.3388593269316126
Epoch: 75, step: 1000, loss: 0.3463813364505768, mean loss: 0.3388593957508322
Epoch: 75, step: 1001, loss: 0.3715389370918274, mean loss: 0.3388596947347606
Epoch: 75, step: 1002, loss: 0.33698520064353943, mean loss: 0.3388596775852396
Epoch: 75, step: 1003, loss: 0.359673410654068, mean loss: 0.33885986800583784
Epoch: 75, step: 1004, loss: 0.34395596385002136, mean loss: 0.33885991462855264
Epoch: 75, step: 1005, loss: 0.302395224571228, mean loss: 0.33885958102664554
Epoch: 75, step: 1006, loss: 0.3117050528526306, mean loss: 0.33885933260222467
Epoch: 75, step: 1007, loss: 0.3139986991882324, mean loss: 0.33885910516568374
Epoch: 75, step: 1008, loss: 0.36704978346824646, mean loss: 0.3388593630646518
Epoch: 75, step: 1009, loss: 0.3535923957824707, mean loss: 0.33885949784676433
Epoch: 75, step: 1010, loss: 0.32876452803611755, mean loss: 0.338859405495859
Epoch: 75, step: 1011, loss: 0.30624496936798096, mean loss: 0.3388591071348728
Epoch: 75, step: 1012, loss: 0.3083781898021698, mean loss: 0.33885882829413716
Epoch: 75, step: 1013, loss: 0.3040607273578644, mean loss: 0.33885850996253336
Epoch: 75, step: 1014, loss: 0.35041531920433044, mean loss: 0.3388586156827844
Epoch: 75, step: 1015, loss: 0.36091598868370056, mean loss: 0.33885881745903856
Epoch: 75, step: 1016, loss: 0.3313122093677521, mean loss: 0.338858748424871
Epoch: 75, step: 1017, loss: 0.34125447273254395, mean loss: 0.33885877034005707
Epoch: 75, step: 1018, loss: 0.3862835466861725, mean loss: 0.3388592041601281
Epoch: 75, step: 1019, loss: 0.3910036087036133, mean loss: 0.3388596811488268
Epoch: 75, step: 1020, loss: 0.32598164677619934, mean loss: 0.33885956334863865
Epoch: 75, step: 1021, loss: 0.35618120431900024, mean loss: 0.33885972179470597
Epoch: 75, step: 1022, loss: 0.334071546792984, mean loss: 0.3388596779962829
Epoch: 75, step: 1023, loss: 0.34130197763442993, mean loss: 0.3388597003362964
Epoch: 75, step: 1024, loss: 0.3071877360343933, mean loss: 0.33885941063161495
Epoch: 75, step: 1025, loss: 0.3144606947898865, mean loss: 0.33885918745765964
Epoch: 75, step: 1026, loss: 0.35074323415756226, mean loss: 0.3388592961595055
Epoch: 75, step: 1027, loss: 0.33531367778778076, mean loss: 0.3388592637284872
Epoch: 75, step: 1028, loss: 0.3324449956417084, mean loss: 0.3388592050590757
Epoch: 75, step: 1029, loss: 0.3275769352912903, mean loss: 0.33885910186443774
Epoch: 75, step: 1030, loss: 0.30772846937179565, mean loss: 0.33885881712696625
Epoch: 75, step: 1031, loss: 0.3338761031627655, mean loss: 0.33885877155280714
Epoch: 75, step: 1032, loss: 0.3561422824859619, mean loss: 0.3388589296341818
Epoch: 75, step: 1033, loss: 0.3455331325531006, mean loss: 0.33885899067834846
Epoch: 75, step: 1034, loss: 0.36375999450683594, mean loss: 0.33885921842796046
Epoch: 75, step: 1035, loss: 0.31935974955558777, mean loss: 0.33885904008350964
Epoch: 75, step: 1036, loss: 0.307788223028183, mean loss: 0.33885875590873754
Epoch: 75, step: 1037, loss: 0.3371211290359497, mean loss: 0.33885874001648714
Epoch: 75, step: 1038, loss: 0.314654678106308, mean loss: 0.3388585186493454
Epoch: 75, step: 1039, loss: 0.32135048508644104, mean loss: 0.3388583585246558
Epoch: 75, step: 1040, loss: 0.3717244565486908, mean loss: 0.3388586591081334
Epoch: 75, step: 1041, loss: 0.3287090063095093, mean loss: 0.33885856628330124
Epoch: 75, step: 1042, loss: 0.32886844873428345, mean loss: 0.33885847491835286
Epoch: 75, step: 1043, loss: 0.34702739119529724, mean loss: 0.3388585496267619
Epoch: 75, step: 1044, loss: 0.3158622086048126, mean loss: 0.3388583393168161
Epoch: 75, step: 1045, loss: 0.35438477993011475, mean loss: 0.3388584813104932
Epoch: 75, step: 1046, loss: 0.374463826417923, mean loss: 0.33885880692843523
Epoch: 75, step: 1047, loss: 0.35344281792640686, mean loss: 0.3388589403008883
Epoch: 75, step: 1048, loss: 0.31902748346328735, mean loss: 0.33885875894159984
Epoch: 75, step: 1049, loss: 0.3078734874725342, mean loss: 0.33885847558292154
Epoch: 75, step: 1050, loss: 0.316510945558548, mean loss: 0.3388582712178035
Epoch: 75, step: 1051, loss: 0.32367971539497375, mean loss: 0.33885813241324736
Epoch: 75, step: 1052, loss: 0.3336862325668335, mean loss: 0.33885808511779275
Epoch: 75, step: 1053, loss: 0.35838091373443604, mean loss: 0.33885826364650334
Epoch: 75, step: 1054, loss: 0.3374113440513611, mean loss: 0.33885825041510476
Epoch: 75, step: 1055, loss: 0.30188727378845215, mean loss: 0.33885791233601786
Epoch: 75, step: 1056, loss: 0.32969436049461365, mean loss: 0.33885782854118224
Epoch: 75, step: 1057, loss: 0.33895471692085266, mean loss: 0.33885782942715653
Epoch: 75, step: 1058, loss: 0.3538573980331421, mean loss: 0.3388579665861339
Epoch: 75, step: 1059, loss: 0.3141166567802429, mean loss: 0.33885774034884597
Epoch: 75, step: 1060, loss: 0.3313564658164978, mean loss: 0.3388576717569848
Epoch: 75, step: 1061, loss: 0.33870357275009155, mean loss: 0.3388576703479121
Epoch: 75, step: 1062, loss: 0.33860456943511963, mean loss: 0.3388576680335927
Epoch: 75, step: 1063, loss: 0.3092893362045288, mean loss: 0.3388573976673677
Epoch: 75, step: 1064, loss: 0.3256997764110565, mean loss: 0.33885727735811655
Epoch: 75, step: 1065, loss: 0.3250128924846649, mean loss: 0.3388571507704671
Epoch: 75, step: 1066, loss: 0.3380590081214905, mean loss: 0.3388571434726291
Epoch: 75, step: 1067, loss: 0.33925101161003113, mean loss: 0.33885714707393966
Epoch: 75, step: 1068, loss: 0.31743499636650085, mean loss: 0.33885695120353115
Epoch: 75, step: 1069, loss: 0.31379014253616333, mean loss: 0.3388567220108031
Epoch: 75, step: 1070, loss: 0.31148648262023926, mean loss: 0.3388564717594623
Epoch: 75, step: 1071, loss: 0.3167547285556793, mean loss: 0.3388562696808389
Epoch: 75, step: 1072, loss: 0.30580800771713257, mean loss: 0.3388559675197757
Epoch: 75, step: 1073, loss: 0.2921980619430542, mean loss: 0.3388555409293102
Epoch: 75, step: 1074, loss: 0.322645902633667, mean loss: 0.3388553927269029
Epoch: 75, step: 1075, loss: 0.3422190546989441, mean loss: 0.3388554234801026
Epoch: 75, step: 1076, loss: 0.31122922897338867, mean loss: 0.3388551709023714
Epoch: 75, step: 1077, loss: 0.3394213616847992, mean loss: 0.33885517607883087
Epoch: 75, step: 1078, loss: 0.32527437806129456, mean loss: 0.3388550519160755
Epoch: 75, step: 1079, loss: 0.29737240076065063, mean loss: 0.33885467266345937
Epoch: 75, step: 1080, loss: 0.315961092710495, mean loss: 0.33885446336221003
Epoch: 75, step: 1081, loss: 0.3205791115760803, mean loss: 0.3388542962839724
Epoch: 75, step: 1082, loss: 0.290332555770874, mean loss: 0.33885385268907636
Epoch: 75, step: 1083, loss: 0.31635114550590515, mean loss: 0.33885364696696724
Epoch: 75, step: 1084, loss: 0.3135114908218384, mean loss: 0.33885341528843593
Epoch: 75, step: 1085, loss: 0.3544090688228607, mean loss: 0.3388535574972518
Epoch: 75, step: 1086, loss: 0.3768327832221985, mean loss: 0.33885390469779414
Epoch: 75, step: 1087, loss: 0.3793724477291107, mean loss: 0.33885427510901867
Epoch: 75, step: 1088, loss: 0.34630224108695984, mean loss: 0.33885434319599245
Epoch: 75, step: 1089, loss: 0.3288891315460205, mean loss: 0.33885425209797937
Epoch: 75, step: 1090, loss: 0.3052522838115692, mean loss: 0.33885394492491866
Epoch: 75, step: 1091, loss: 0.32418668270111084, mean loss: 0.3388538108450753
Epoch: 75, step: 1092, loss: 0.35052162408828735, mean loss: 0.33885391750467186
Epoch: 75, step: 1093, loss: 0.31925269961357117, mean loss: 0.338853738324663
Epoch: 75, step: 1094, loss: 0.32643213868141174, mean loss: 0.33885362477651504
Epoch: 75, step: 1095, loss: 0.31169047951698303, mean loss: 0.3388533764754322
Epoch: 75, step: 1096, loss: 0.33851075172424316, mean loss: 0.33885337334349297
Epoch: 75, step: 1097, loss: 0.3269561529159546, mean loss: 0.3388532645917751
Epoch: 75, step: 1098, loss: 0.2967005670070648, mean loss: 0.3388528792802313
Epoch: 75, step: 1099, loss: 0.32672983407974243, mean loss: 0.33885276846628976
Epoch: 75, step: 1100, loss: 0.33028674125671387, mean loss: 0.3388526901669396
Epoch: 75, step: 1101, loss: 0.3010641634464264, mean loss: 0.338852344757105
Epoch: 75, step: 1102, loss: 0.33530041575431824, mean loss: 0.338852312290637
Epoch: 75, step: 1103, loss: 0.3444453179836273, mean loss: 0.3388523634131343
Epoch: 75, step: 1104, loss: 0.3130652904510498, mean loss: 0.33885212771026
Epoch: 75, step: 1105, loss: 0.3025456964969635, mean loss: 0.33885179585980196
Epoch: 75, step: 1106, loss: 0.320511132478714, mean loss: 0.3388516282227826
Epoch: 75, step: 1107, loss: 0.288109689950943, mean loss: 0.33885116443642077
Epoch: 75, step: 1108, loss: 0.3240013122558594, mean loss: 0.3388510287085357
Epoch: 75, step: 1109, loss: 0.3197323977947235, mean loss: 0.3388508539655422
Epoch: 75, step: 1110, loss: 0.3494585454463959, mean loss: 0.33885095091823875
Epoch: 75, step: 1111, loss: 0.3294650912284851, mean loss: 0.3388508651336841
Epoch: 75, step: 1112, loss: 0.29471102356910706, mean loss: 0.33885046170957944
Epoch: 75, step: 1113, loss: 0.3436550498008728, mean loss: 0.33885050562158425
Epoch: 75, step: 1114, loss: 0.37504109740257263, mean loss: 0.33885083638602953
Epoch: 75, step: 1115, loss: 0.3242672085762024, mean loss: 0.33885070309996707
Epoch: 75, step: 1116, loss: 0.3414700925350189, mean loss: 0.3388507270394777
Epoch: 75, step: 1117, loss: 0.33321112394332886, mean loss: 0.3388506754976556
Epoch: 75, step: 1118, loss: 0.3116540014743805, mean loss: 0.33885042694234047
Epoch: 75, step: 1119, loss: 0.33062565326690674, mean loss: 0.33885035177533557
Epoch: 75, step: 1120, loss: 0.33702054619789124, mean loss: 0.3388503350527176
Epoch: 75, step: 1121, loss: 0.32081079483032227, mean loss: 0.338850170190622
Epoch: 75, step: 1122, loss: 0.30979764461517334, mean loss: 0.3388499046840505
Epoch: 75, step: 1123, loss: 0.42753496766090393, mean loss: 0.33885071515582066
Epoch: 75, step: 1124, loss: 0.3290103077888489, mean loss: 0.338850625227492
Epoch: 75, step: 1125, loss: 0.36365869641304016, mean loss: 0.33885085193843073
Epoch: 75, step: 1126, loss: 0.31116798520088196, mean loss: 0.33885059895820885
Epoch: 75, step: 1127, loss: 0.33115363121032715, mean loss: 0.3388505286200162
Epoch: 75, step: 1128, loss: 0.32130804657936096, mean loss: 0.33885036831075593
Epoch: 75, step: 1129, loss: 0.32738742232322693, mean loss: 0.3388502635593533
Epoch: 75, step: 1130, loss: 0.35440680384635925, mean loss: 0.3388504057177937
Epoch: 75, step: 1131, loss: 0.3076958656311035, mean loss: 0.3388501210246501
Epoch: 75, step: 1132, loss: 0.3115886449813843, mean loss: 0.33884987190897164
Epoch: 75, step: 1133, loss: 0.37556809186935425, mean loss: 0.33885020743741767
Epoch: 75, step: 1134, loss: 0.3623270094394684, mean loss: 0.338850421964781
Epoch: 75, step: 1135, loss: 0.3744485676288605, mean loss: 0.33885074725212394
Epoch: 75, step: 1136, loss: 0.30819809436798096, mean loss: 0.3388504671580709
Epoch: 75, step: 1137, loss: 0.3338764011859894, mean loss: 0.3388504217070761
Epoch: 75, step: 1138, loss: 0.3685273230075836, mean loss: 0.3388506928800702
Epoch: 75, step: 1139, loss: 0.33254706859588623, mean loss: 0.3388506352811641
Epoch: 75, step: 1140, loss: 0.3233325183391571, mean loss: 0.3388504934868005
Epoch: 75, step: 1141, loss: 0.31498396396636963, mean loss: 0.33885027541211693
Epoch: 75, step: 1142, loss: 0.3142002522945404, mean loss: 0.33885005018050673
Epoch: 75, step: 1143, loss: 0.33708715438842773, mean loss: 0.33885003407276404
Epoch: 75, step: 1144, loss: 0.3429349958896637, mean loss: 0.3388500713970988
Epoch: 75, step: 1145, loss: 0.33353158831596375, mean loss: 0.3388500228025126
Epoch: 75, step: 1146, loss: 0.30402132868766785, mean loss: 0.33884970457822033
Epoch: 75, step: 1147, loss: 0.32121968269348145, mean loss: 0.33884954349695906
Epoch: 75, step: 1148, loss: 0.334023654460907, mean loss: 0.3388494994043768
Epoch: 75, step: 1149, loss: 0.33186542987823486, mean loss: 0.33884943559378267
Epoch: 75, step: 1150, loss: 0.31627997756004333, mean loss: 0.3388492293877358
Epoch: 75, step: 1151, loss: 0.37789395451545715, mean loss: 0.3388495861169425
Epoch: 75, step: 1152, loss: 0.31711581349372864, mean loss: 0.338849387549771
Epoch: 75, step: 1153, loss: 0.3661244213581085, mean loss: 0.338849636741521
Epoch: 75, step: 1154, loss: 0.35797953605651855, mean loss: 0.3388498115156228
Epoch: 75, step: 1155, loss: 0.32018938660621643, mean loss: 0.33884964103227877
Epoch: 75, step: 1156, loss: 0.36534494161605835, mean loss: 0.3388498830935502
Epoch: 75, step: 1157, loss: 0.3133058547973633, mean loss: 0.33884964972524184
Epoch: 75, step: 1158, loss: 0.32555484771728516, mean loss: 0.33884952826604703
Epoch: 75, step: 1159, loss: 0.31626543402671814, mean loss: 0.33884932194324197
Epoch: 75, step: 1160, loss: 0.31923797726631165, mean loss: 0.3388491427803924
Epoch: 75, step: 1161, loss: 0.33607161045074463, mean loss: 0.3388491174059946
Epoch: 75, step: 1162, loss: 0.36619144678115845, mean loss: 0.33884936719203534
Epoch: 75, step: 1163, loss: 0.351847767829895, mean loss: 0.33884948593793024
Epoch: 75, step: 1164, loss: 0.33587297797203064, mean loss: 0.3388494587465178
Epoch: 75, step: 1165, loss: 0.32777300477027893, mean loss: 0.3388493575602684
Epoch: 75, step: 1166, loss: 0.3048647344112396, mean loss: 0.33884904710485125
Epoch: 75, step: 1167, loss: 0.3213886320590973, mean loss: 0.3388488876023935
Epoch: 75, step: 1168, loss: 0.3184138536453247, mean loss: 0.33884870092823044
Epoch: 75, step: 1169, loss: 0.3504314124584198, mean loss: 0.3388488067354062
Epoch: 75, step: 1170, loss: 0.349032998085022, mean loss: 0.33884889976635824
Epoch: 75, step: 1171, loss: 0.314505010843277, mean loss: 0.3388486773908748
Epoch: 75, step: 1172, loss: 0.3411879241466522, mean loss: 0.33884869875912776
Epoch: 75, step: 1173, loss: 0.3046432435512543, mean loss: 0.33884838630635167
Epoch: 75, step: 1174, loss: 0.3586730360984802, mean loss: 0.33884856739472613
Epoch: 75, step: 1175, loss: 0.302518367767334, mean loss: 0.33884823553934573
Epoch: 75, step: 1176, loss: 0.30582892894744873, mean loss: 0.33884793392981505
Epoch: 75, step: 1177, loss: 0.3733460605144501, mean loss: 0.3388482490445101
Epoch: 75, step: 1178, loss: 0.336479514837265, mean loss: 0.3388482274080848
Epoch: 75, step: 1179, loss: 0.3352002203464508, mean loss: 0.33884819408686573
Epoch: 75, step: 1180, loss: 0.3223988115787506, mean loss: 0.33884804383812384
Epoch: 75, step: 1181, loss: 0.3102680742740631, mean loss: 0.3388477827909237
Epoch: 75, step: 1182, loss: 0.3207339644432068, mean loss: 0.338847617342239
Epoch: 75, step: 1183, loss: 0.3337252736091614, mean loss: 0.33884757055600784
Epoch: 75, step: 1184, loss: 0.3069688379764557, mean loss: 0.3388472793861437
Epoch: 75, step: 1185, loss: 0.2977781891822815, mean loss: 0.3388469042780001
Epoch: 75, step: 1186, loss: 0.31780457496643066, mean loss: 0.33884671208779205
Epoch: 75, step: 1187, loss: 0.35200852155685425, mean loss: 0.33884683230013923
Epoch: 75, step: 1188, loss: 0.3910180926322937, mean loss: 0.3388473087978726
Epoch: 75, step: 1189, loss: 0.3225193917751312, mean loss: 0.33884715967085627
Epoch: 75, step: 1190, loss: 0.32666081190109253, mean loss: 0.3388470483708611
Epoch: 75, step: 1191, loss: 0.3108426332473755, mean loss: 0.3388467926040916
Epoch: 75, step: 1192, loss: 0.28374338150024414, mean loss: 0.3388462893444211
Epoch: 75, step: 1193, loss: 0.32701364159584045, mean loss: 0.33884618127778965
Epoch: 75, step: 1194, loss: 0.2900314927101135, mean loss: 0.3388457354611901
Epoch: 75, step: 1195, loss: 0.3169616460800171, mean loss: 0.33884553559919167
Epoch: 75, step: 1196, loss: 0.36872464418411255, mean loss: 0.33884580847523926
Epoch: 75, step: 1197, loss: 0.3251427412033081, mean loss: 0.33884568333078663
Epoch: 75, step: 1198, loss: 0.3381829261779785, mean loss: 0.3388456772781546
Epoch: 75, step: 1199, loss: 0.3314759433269501, mean loss: 0.33884560997464824
Epoch: 75, step: 1200, loss: 0.3065769374370575, mean loss: 0.33884531528626605
Epoch: 75, step: 1201, loss: 0.3299564719200134, mean loss: 0.33884523411109696
Epoch: 75, step: 1202, loss: 0.35024750232696533, mean loss: 0.3388453382385475
Epoch: 75, step: 1203, loss: 0.3838712275028229, mean loss: 0.338845749418863
Epoch: 75, step: 1204, loss: 0.36771640181541443, mean loss: 0.3388460130657503
Epoch: 75, step: 1205, loss: 0.34117960929870605, mean loss: 0.3388460343759637
Epoch: 75, step: 1206, loss: 0.33709144592285156, mean loss: 0.33884601835334915
Epoch: 75, step: 1207, loss: 0.2972874343395233, mean loss: 0.33884563885062774
Epoch: 75, step: 1208, loss: 0.3164544403553009, mean loss: 0.3388454343816024
Epoch: 75, step: 1209, loss: 0.33642682433128357, mean loss: 0.33884541229585635
Epoch: 75, step: 1210, loss: 0.31697073578834534, mean loss: 0.3388452125471872
Epoch: 75, step: 1211, loss: 0.29382485151290894, mean loss: 0.3388448014473896
Epoch: 75, step: 1212, loss: 0.3379809558391571, mean loss: 0.3388447935593251
Epoch: 75, step: 1213, loss: 0.3371407389640808, mean loss: 0.3388447779991721
Epoch: 75, step: 1214, loss: 0.3128117024898529, mean loss: 0.33884454028675365
Epoch: 75, step: 1215, loss: 0.296928346157074, mean loss: 0.33884415754638575
Epoch: 75, step: 1216, loss: 0.2944752871990204, mean loss: 0.33884375241412
Epoch: 75, step: 1217, loss: 0.3272990882396698, mean loss: 0.33884364700072517
Epoch: 75, step: 1218, loss: 0.3143573999404907, mean loss: 0.33884342342082524
Epoch: 75, step: 1219, loss: 0.36202648282051086, mean loss: 0.3388436350995999
Epoch: 75, step: 1220, loss: 0.33000698685646057, mean loss: 0.3388435544150897
Epoch: 75, step: 1221, loss: 0.3753126859664917, mean loss: 0.33884388739961835
Epoch: 75, step: 1222, loss: 0.34405598044395447, mean loss: 0.33884393498864573
Epoch: 75, step: 1223, loss: 0.33016690611839294, mean loss: 0.3388438557637373
Epoch: 75, step: 1224, loss: 0.28333157300949097, mean loss: 0.3388433489179692
Epoch: 75, step: 1225, loss: 0.3276931941509247, mean loss: 0.33884324711424435
Epoch: 75, step: 1226, loss: 0.307833731174469, mean loss: 0.3388429639921289
Epoch: 75, step: 1227, loss: 0.31033065915107727, mean loss: 0.3388427036723491
Epoch: 75, step: 1228, loss: 0.3223501741886139, mean loss: 0.33884255309552025
Epoch: 75, step: 1229, loss: 0.34705138206481934, mean loss: 0.3388426280414617
Epoch: 75, step: 1230, loss: 0.3335120379924774, mean loss: 0.33884257937405204
Epoch: 75, step: 1231, loss: 0.3376302719116211, mean loss: 0.3388425683059855
Epoch: 75, step: 1232, loss: 0.3569898009300232, mean loss: 0.33884273398420695
Epoch: 75, step: 1233, loss: 0.3166707754135132, mean loss: 0.33884253156341915
Epoch: 75, step: 1234, loss: 0.3301079273223877, mean loss: 0.3388424518208324
Epoch: 75, step: 1235, loss: 0.303970605134964, mean loss: 0.3388421334611453
Epoch: 75, step: 1236, loss: 0.384748637676239, mean loss: 0.3388425525570144
Epoch: 75, step: 1237, loss: 0.2962837815284729, mean loss: 0.338842164027271
Epoch: 75, step: 1238, loss: 0.34596025943756104, mean loss: 0.3388422290095642
Epoch: 75, step: 1239, loss: 0.3386296033859253, mean loss: 0.3388422270684867
Epoch: 75, step: 1240, loss: 0.33791327476501465, mean loss: 0.33884221858807934
Epoch: 75, step: 1241, loss: 0.315935879945755, mean loss: 0.3388420094779787
Epoch: 75, step: 1242, loss: 0.32900354266166687, mean loss: 0.338841919664236
Epoch: 75, step: 1243, loss: 0.3139277696609497, mean loss: 0.3388416922291414
Epoch: 75, step: 1244, loss: 0.2933028042316437, mean loss: 0.3388412765197252
Epoch: 75, step: 1245, loss: 0.362946093082428, mean loss: 0.33884149656259815
Epoch: 75, step: 1246, loss: 0.30323484539985657, mean loss: 0.3388411715272146
Epoch: 75, step: 1247, loss: 0.33315762877464294, mean loss: 0.33884111964545727
Epoch: 75, step: 1248, loss: 0.3538362681865692, mean loss: 0.3388412565262005
Epoch: 75, step: 1249, loss: 0.3049381673336029, mean loss: 0.3388409470502608
Epoch: 75, step: 1250, loss: 0.32207563519477844, mean loss: 0.3388407940136673
Epoch: 75, step: 1251, loss: 0.35541337728500366, mean loss: 0.3388409452896209
Epoch: 75, step: 1252, loss: 0.31508466601371765, mean loss: 0.3388407284422568
Epoch: 75, step: 1253, loss: 0.33659011125564575, mean loss: 0.3388407078988062
Epoch: 75, step: 1254, loss: 0.295249342918396, mean loss: 0.3388403100040047
Epoch: 75, step: 1255, loss: 0.3058299124240875, mean loss: 0.3388400086932816
Epoch: 75, step: 1256, loss: 0.34751105308532715, mean loss: 0.33884008783970215
Epoch: 75, step: 1257, loss: 0.34079408645629883, mean loss: 0.3388401056749914
Epoch: 75, step: 1258, loss: 0.36499103903770447, mean loss: 0.33884034436768995
Epoch: 75, step: 1259, loss: 0.3221292793750763, mean loss: 0.33884019183880176
Epoch: 75, step: 1260, loss: 0.32050690054893494, mean loss: 0.33884002450470213
Epoch: 75, step: 1261, loss: 0.32859766483306885, mean loss: 0.3388399310201028
Epoch: 75, step: 1262, loss: 0.3426949977874756, mean loss: 0.3388399662059481
Epoch: 75, step: 1263, loss: 0.3564976751804352, mean loss: 0.3388401273693683
Epoch: 75, step: 1264, loss: 0.3271319270133972, mean loss: 0.33884002050859746
Epoch: 75, step: 1265, loss: 0.3204331398010254, mean loss: 0.3388398525104894
Epoch: 75, step: 1266, loss: 0.3864014744758606, mean loss: 0.33884028659759563
Epoch: 75, step: 1267, loss: 0.3262515962123871, mean loss: 0.33884017170373626
Epoch: 75, step: 1268, loss: 0.38368576765060425, mean loss: 0.33884058099464837
Epoch: 75, step: 1269, loss: 0.29775404930114746, mean loss: 0.33884020601489395
Epoch: 75, step: 1270, loss: 0.3113139867782593, mean loss: 0.33883995479678664
Epoch: 75, step: 1271, loss: 0.3272232711315155, mean loss: 0.3388398487780623
Epoch: 75, step: 1272, loss: 0.3330644965171814, mean loss: 0.33883979607025777
Epoch: 75, step: 1273, loss: 0.34141626954078674, mean loss: 0.33883981958380543
Epoch: 75, step: 1274, loss: 0.38367098569869995, mean loss: 0.33884022872061687
Epoch: 75, step: 1275, loss: 0.3308483362197876, mean loss: 0.3388401557859186
Epoch: 75, step: 1276, loss: 0.3344223201274872, mean loss: 0.3388401154687383
Epoch: 75, step: 1277, loss: 0.37267643213272095, mean loss: 0.3388404242562382
Epoch: 75, step: 1278, loss: 0.3365921676158905, mean loss: 0.33884040373901647
Epoch: 75, step: 1279, loss: 0.36199283599853516, mean loss: 0.3388406150223917
Epoch: 75, step: 1280, loss: 0.30618467926979065, mean loss: 0.3388403170151117
Epoch: 75, step: 1281, loss: 0.3360719084739685, mean loss: 0.33884029175176056
Epoch: 75, step: 1282, loss: 0.31898263096809387, mean loss: 0.33884011054061663
Epoch: 75, step: 1283, loss: 0.33918818831443787, mean loss: 0.3388401137169724
Epoch: 75, step: 1284, loss: 0.32102862000465393, mean loss: 0.3388399511810988
Epoch: 75, step: 1285, loss: 0.31762558221817017, mean loss: 0.33883975759460994
Epoch: 75, step: 1286, loss: 0.31745100021362305, mean loss: 0.33883956241856367
Epoch: 75, step: 1287, loss: 0.3097097873687744, mean loss: 0.33883929660684114
Epoch: 75, step: 1288, loss: 0.34113213419914246, mean loss: 0.33883931752899205
Epoch: 75, step: 1289, loss: 0.30114680528640747, mean loss: 0.33883897358782733
Epoch: 75, step: 1290, loss: 0.3154715299606323, mean loss: 0.33883876036371563
Epoch: 75, step: 1291, loss: 0.3060920834541321, mean loss: 0.33883846155835656
Epoch: 75, step: 1292, loss: 0.3325343430042267, mean loss: 0.33883840403535276
Epoch: 75, step: 1293, loss: 0.3647032678127289, mean loss: 0.33883864004155545
Epoch: 75, step: 1294, loss: 0.3233202397823334, mean loss: 0.33883849844385244
Epoch: 75, step: 1295, loss: 0.3428421914577484, mean loss: 0.3388385349752315
Epoch: 75, step: 1296, loss: 0.2959924340248108, mean loss: 0.3388381440329525
Epoch: 75, step: 1297, loss: 0.36177000403404236, mean loss: 0.3388383532690699
Epoch: 75, step: 1298, loss: 0.3227541744709015, mean loss: 0.3388382065142747
Epoch: 75, step: 1299, loss: 0.3245002329349518, mean loss: 0.3388380756933479
Epoch: 75, step: 1300, loss: 0.32668137550354004, mean loss: 0.33883796477556255
Epoch: 75, step: 1301, loss: 0.3163798153400421, mean loss: 0.33883775986917913
Epoch: 75, step: 1302, loss: 0.303035169839859, mean loss: 0.33883743321215304
Epoch: 75, step: 1303, loss: 0.3302931785583496, mean loss: 0.3388373552564703
Epoch: 75, step: 1304, loss: 0.31251260638237, mean loss: 0.3388371150781128
Epoch: 75, step: 1305, loss: 0.3455604016780853, mean loss: 0.3388371764186106
Epoch: 75, step: 1306, loss: 0.3604726493358612, mean loss: 0.3388373738099535
Epoch: 75, step: 1307, loss: 0.3408523499965668, mean loss: 0.33883739219343084
Epoch: 75, step: 1308, loss: 0.33597585558891296, mean loss: 0.33883736608666404
Epoch: 75, step: 1309, loss: 0.29346486926078796, mean loss: 0.33883695214179743
Epoch: 75, step: 1310, loss: 0.38966190814971924, mean loss: 0.33883741582661014
Epoch: 75, step: 1311, loss: 0.3133990168571472, mean loss: 0.3388371837498396
Epoch: 75, step: 1312, loss: 0.3377473056316376, mean loss: 0.33883717380687556
Epoch: 75, step: 1313, loss: 0.32231658697128296, mean loss: 0.33883702309084623
Epoch: 75, step: 1314, loss: 0.332261860370636, mean loss: 0.33883696310669514
Epoch: 75, step: 1315, loss: 0.37472379207611084, mean loss: 0.33883729049347233
Epoch: 75, step: 1316, loss: 0.33378732204437256, mean loss: 0.33883724442426366
Epoch: 75, step: 1317, loss: 0.3590681850910187, mean loss: 0.33883742898282765
Epoch: 75, step: 1318, loss: 0.3580692410469055, mean loss: 0.3388376044251512
Epoch: 75, step: 1319, loss: 0.3429039418697357, mean loss: 0.3388376415200011
Epoch: 75, step: 1320, loss: 0.3731086254119873, mean loss: 0.33883795415155793
Epoch: 75, step: 1321, loss: 0.3223852813243866, mean loss: 0.33883780406605657
Epoch: 75, step: 1322, loss: 0.3067142963409424, mean loss: 0.33883751102985316
Epoch: 75, step: 1323, loss: 0.301352858543396, mean loss: 0.33883716909147754
Epoch: 75, step: 1324, loss: 0.31078729033470154, mean loss: 0.33883691322029164
Epoch: 75, step: 1325, loss: 0.32415086030960083, mean loss: 0.33883677925523853
Epoch: 75, step: 1326, loss: 0.3316637873649597, mean loss: 0.33883671382435115
Epoch: 75, step: 1327, loss: 0.380536824464798, mean loss: 0.33883709420263625
Epoch: 75, step: 1328, loss: 0.3144760727882385, mean loss: 0.33883687198934037
Epoch: 75, step: 1329, loss: 0.293308824300766, mean loss: 0.33883645670111917
Epoch: 75, step: 1330, loss: 0.3463549315929413, mean loss: 0.33883652528094504
Epoch: 75, step: 1331, loss: 0.3274993896484375, mean loss: 0.3388364218701194
Epoch: 75, step: 1332, loss: 0.3633697032928467, mean loss: 0.3388366456465501
Epoch: 75, step: 1333, loss: 0.3279179036617279, mean loss: 0.33883654605388736
Epoch: 75, step: 1334, loss: 0.3322945535182953, mean loss: 0.33883648638322983
Epoch: 75, step: 1335, loss: 0.33938243985176086, mean loss: 0.33883649136292143
Epoch: 75, step: 1336, loss: 0.32283255457878113, mean loss: 0.3388363453908793
Epoch: 75, step: 1337, loss: 0.2987196147441864, mean loss: 0.33883597948917876
Epoch: 75, step: 1338, loss: 0.34858641028404236, mean loss: 0.3388360684213178
Epoch: 75, step: 1339, loss: 0.3629280626773834, mean loss: 0.3388362881585876
Epoch: 75, step: 1340, loss: 0.315132737159729, mean loss: 0.3388360719661869
Epoch: 75, step: 1341, loss: 0.3193264603614807, mean loss: 0.3388358940269702
Epoch: 75, step: 1342, loss: 0.3318291902542114, mean loss: 0.3388358301222633
Epoch: 75, step: 1343, loss: 0.30969178676605225, mean loss: 0.33883556431616946
Epoch: 75, step: 1344, loss: 0.33311110734939575, mean loss: 0.33883551210715884
Epoch: 75, step: 1345, loss: 0.3206362724304199, mean loss: 0.3388353461253658
Epoch: 75, step: 1346, loss: 0.33699068427085876, mean loss: 0.338835329301724
Epoch: 75, step: 1347, loss: 0.3406723439693451, mean loss: 0.33883534605546933
Epoch: 75, step: 1348, loss: 0.31469908356666565, mean loss: 0.3388351259325089
Epoch: 75, step: 1349, loss: 0.34377002716064453, mean loss: 0.33883517093844806
Epoch: 75, step: 1350, loss: 0.32457324862480164, mean loss: 0.33883504087194327
Epoch: 75, step: 1351, loss: 0.31497159600257874, mean loss: 0.33883482324303665
Epoch: 75, step: 1352, loss: 0.3761674463748932, mean loss: 0.3388351637045209
Epoch: 75, step: 1353, loss: 0.3196100890636444, mean loss: 0.3388349883796386
Epoch: 75, step: 1354, loss: 0.3295440077781677, mean loss: 0.338834903650437
Epoch: 75, step: 1355, loss: 0.3339085280895233, mean loss: 0.33883485872470964
Epoch: 75, step: 1356, loss: 0.3156323730945587, mean loss: 0.3388346471332414
Epoch: 75, step: 1357, loss: 0.29885637760162354, mean loss: 0.33883428256093906
Epoch: 75, step: 1358, loss: 0.328431636095047, mean loss: 0.3388341876973486
Epoch: 75, step: 1359, loss: 0.40269920229911804, mean loss: 0.33883477008850854
Epoch: 75, step: 1360, loss: 0.3225921094417572, mean loss: 0.3388346219714875
Epoch: 75, step: 1361, loss: 0.3091451823711395, mean loss: 0.3388343512355936
Epoch: 75, step: 1362, loss: 0.29261550307273865, mean loss: 0.3388339297730386
Epoch: 75, step: 1363, loss: 0.3331774175167084, mean loss: 0.33883387819264527
Epoch: 75, step: 1364, loss: 0.2895992696285248, mean loss: 0.3388334292380238
Epoch: 75, step: 1365, loss: 0.3412114977836609, mean loss: 0.3388334509226712
Epoch: 75, step: 1366, loss: 0.31024104356765747, mean loss: 0.338833190202424
Epoch: 75, step: 1367, loss: 0.3248665928840637, mean loss: 0.3388330628489816
Epoch: 75, step: 1368, loss: 0.31656667590141296, mean loss: 0.3388328598163384
Epoch: 75, step: 1369, loss: 0.3271331489086151, mean loss: 0.33883275313528705
Epoch: 75, step: 1370, loss: 0.3169088661670685, mean loss: 0.33883255322932315
Epoch: 75, step: 1371, loss: 0.30744925141334534, mean loss: 0.33883226707331415
Epoch: 75, step: 1372, loss: 0.3125893771648407, mean loss: 0.33883202779026445
Epoch: 75, step: 1373, loss: 0.3626772165298462, mean loss: 0.33883224520905775
Epoch: 75, step: 1374, loss: 0.3040078580379486, mean loss: 0.3388319276855823
Epoch: 75, step: 1375, loss: 0.3348202109336853, mean loss: 0.33883189110769146
Epoch: 75, step: 1376, loss: 0.34600624442100525, mean loss: 0.33883195652116294
Epoch: 75, step: 1377, loss: 0.3313087821006775, mean loss: 0.33883188792787694
Epoch: 75, step: 1378, loss: 0.3678157925605774, mean loss: 0.3388321521890813
Epoch: 75, step: 1379, loss: 0.3224324584007263, mean loss: 0.3388320026659797
Epoch: 75, step: 1380, loss: 0.3544054329395294, mean loss: 0.3388321446543849
Epoch: 75, step: 1381, loss: 0.3249720335006714, mean loss: 0.33883201828806087
Epoch: 75, step: 1382, loss: 0.3418688476085663, mean loss: 0.33883204597539
Epoch: 75, step: 1383, loss: 0.3228325843811035, mean loss: 0.33883190010669817
Epoch: 75, step: 1384, loss: 0.3632774353027344, mean loss: 0.33883212297705595
Epoch: 75, step: 1385, loss: 0.32394441962242126, mean loss: 0.33883198724685015
Epoch: 75, step: 1386, loss: 0.3611829876899719, mean loss: 0.3388321910175836
Epoch: 75, step: 1387, loss: 0.3667694628238678, mean loss: 0.3388324457151969
Epoch: 75, step: 1388, loss: 0.3466581404209137, mean loss: 0.33883251705958606
Epoch: 75, step: 1389, loss: 0.31756478548049927, mean loss: 0.33883232317015605
Epoch: 75, step: 1390, loss: 0.3005354106426239, mean loss: 0.33883197403565524
Epoch: 75, step: 1391, loss: 0.2984669804573059, mean loss: 0.3388316060508106
Epoch: 75, step: 1392, loss: 0.3323018252849579, mean loss: 0.33883154652303066
Epoch: 75, step: 1393, loss: 0.38022497296333313, mean loss: 0.3388319238766365
Epoch: 75, step: 1394, loss: 0.3213958740234375, mean loss: 0.33883176492636663
Epoch: 75, step: 1395, loss: 0.3316109776496887, mean loss: 0.33883169910092836
Epoch: 75, step: 1396, loss: 0.3291592597961426, mean loss: 0.33883161092678227
Epoch: 75, step: 1397, loss: 0.33128228783607483, mean loss: 0.3388315421076325
Epoch: 75, step: 1398, loss: 0.36725735664367676, mean loss: 0.33883180123319
Epoch: 75, step: 1399, loss: 0.32812076807022095, mean loss: 0.3388317035938722
Epoch: 75, step: 1400, loss: 0.3280904293060303, mean loss: 0.3388316056797758
Epoch: 75, step: 1401, loss: 0.30614474415779114, mean loss: 0.3388313077192872
Epoch: 75, step: 1402, loss: 0.32324808835983276, mean loss: 0.33883116567012395
Epoch: 75, step: 1403, loss: 0.3150620460510254, mean loss: 0.33883094900419
Epoch: 75, step: 1404, loss: 0.3742939233779907, mean loss: 0.33883127226178417
Epoch: 75, step: 1405, loss: 0.3408614993095398, mean loss: 0.3388312907678554
Epoch: 75, step: 1406, loss: 0.33635368943214417, mean loss: 0.33883126818405185
Epoch: 75, step: 1407, loss: 0.35209769010543823, mean loss: 0.338831389108888
Epoch: 75, step: 1408, loss: 0.3617125451564789, mean loss: 0.33883159767113946
Epoch: 75, step: 1409, loss: 0.3234415352344513, mean loss: 0.3388314573916532
Epoch: 75, step: 1410, loss: 0.3127591609954834, mean loss: 0.33883121974641806
Epoch: 75, step: 1411, loss: 0.38384032249450684, mean loss: 0.33883162999418265
Epoch: 75, step: 1412, loss: 0.292337566614151, mean loss: 0.3388312062152013
Epoch: 75, step: 1413, loss: 0.35985618829727173, mean loss: 0.3388313978496516
Epoch: 75, step: 1414, loss: 0.3169611096382141, mean loss: 0.33883119851238497
Epoch: 75, step: 1415, loss: 0.36967015266418457, mean loss: 0.3388314795922106
Epoch: 75, step: 1416, loss: 0.3063797056674957, mean loss: 0.3388311838151303
Epoch: 75, step: 1417, loss: 0.32234638929367065, mean loss: 0.33883103356818334
Epoch: 75, step: 1418, loss: 0.32562020421028137, mean loss: 0.33883091316215197
Epoch: 75, step: 1419, loss: 0.31844618916511536, mean loss: 0.33883072737356285
Epoch: 75, step: 1420, loss: 0.3074134588241577, mean loss: 0.3388304410357738
Epoch: 75, step: 1421, loss: 0.37183380126953125, mean loss: 0.3388307418265016
Epoch: 75, step: 1422, loss: 0.32488760352134705, mean loss: 0.3388306147506988
Epoch: 75, step: 1423, loss: 0.3143976628780365, mean loss: 0.33883039207423904
Epoch: 75, step: 1424, loss: 0.311440646648407, mean loss: 0.338830142452499
Epoch: 75, step: 1425, loss: 0.2921072542667389, mean loss: 0.3388297166383056
Epoch: 75, step: 1426, loss: 0.32617977261543274, mean loss: 0.3388296013526965
Epoch: 75, step: 1427, loss: 0.33010825514793396, mean loss: 0.33882952187119497
Epoch: 75, step: 1428, loss: 0.37083637714385986, mean loss: 0.3388298135612247
Epoch: 75, step: 1429, loss: 0.32520684599876404, mean loss: 0.3388296894113335
Epoch: 75, step: 1430, loss: 0.35945454239845276, mean loss: 0.33882987736964054
Epoch: 75, step: 1431, loss: 0.35321927070617676, mean loss: 0.33883000850179285
Epoch: 75, step: 1432, loss: 0.3990461826324463, mean loss: 0.3388305572535278
Epoch: 75, step: 1433, loss: 0.35189422965049744, mean loss: 0.338830676302067
Epoch: 75, step: 1434, loss: 0.37847012281417847, mean loss: 0.33883103753090477
Epoch: 75, step: 1435, loss: 0.3636232316493988, mean loss: 0.3388312634567096
Epoch: 75, step: 1436, loss: 0.384292870759964, mean loss: 0.33883167773454936
Epoch: 75, step: 1437, loss: 0.33985546231269836, mean loss: 0.3388316870639027
Epoch: 75, step: 1438, loss: 0.32743069529533386, mean loss: 0.3388315831720159
Epoch: 75, step: 1439, loss: 0.32352474331855774, mean loss: 0.33883144368923973
Epoch: 75, step: 1440, loss: 0.3465592861175537, mean loss: 0.33883151410815726
Epoch: 75, step: 1441, loss: 0.36627742648124695, mean loss: 0.33883176420303773
Epoch: 75, step: 1442, loss: 0.36329054832458496, mean loss: 0.3388319870763337
Epoch: 75, step: 1443, loss: 0.32728567719459534, mean loss: 0.33883188186502483
Valid: 75, mean loss: 0.18497634927431744
Epoch: 76, step: 0, loss: 0.34923285245895386, mean loss: 0.33883197663900627
Epoch: 76, step: 1, loss: 0.3054746985435486, mean loss: 0.3388316726891758
Epoch: 76, step: 2, loss: 0.3201683759689331, mean loss: 0.3388315026317098
Epoch: 76, step: 3, loss: 0.3657560348510742, mean loss: 0.3388317479622144
Epoch: 76, step: 4, loss: 0.32853472232818604, mean loss: 0.33883165413880245
Epoch: 76, step: 5, loss: 0.33244508504867554, mean loss: 0.338831595946829
Epoch: 76, step: 6, loss: 0.3338930308818817, mean loss: 0.33883155094892403
Epoch: 76, step: 7, loss: 0.40222418308258057, mean loss: 0.3388321285478027
Epoch: 76, step: 8, loss: 0.35143953561782837, mean loss: 0.33883224341853124
Epoch: 76, step: 9, loss: 0.3436819016933441, mean loss: 0.3388322876051511
Epoch: 76, step: 10, loss: 0.35469284653663635, mean loss: 0.3388324321139109
Epoch: 76, step: 11, loss: 0.3316178023815155, mean loss: 0.33883236638055936
Epoch: 76, step: 12, loss: 0.3357841670513153, mean loss: 0.3388323386083049
Epoch: 76, step: 13, loss: 0.36776164174079895, mean loss: 0.33883260218183153
Epoch: 76, step: 14, loss: 0.3308064937591553, mean loss: 0.3388325290569997
Epoch: 76, step: 15, loss: 0.2883114516735077, mean loss: 0.33883206877021593
Epoch: 76, step: 16, loss: 0.30937865376472473, mean loss: 0.3388318004288651
Epoch: 76, step: 17, loss: 0.3200679421424866, mean loss: 0.33883162947846074
Epoch: 76, step: 18, loss: 0.3050478398799896, mean loss: 0.33883132168995644
Epoch: 76, step: 19, loss: 0.35060805082321167, mean loss: 0.3388314289813191
Epoch: 76, step: 20, loss: 0.31944191455841064, mean loss: 0.3388312523356268
Epoch: 76, step: 21, loss: 0.32976818084716797, mean loss: 0.3388311697684248
Epoch: 76, step: 22, loss: 0.3313502073287964, mean loss: 0.33883110161531466
Epoch: 76, step: 23, loss: 0.30279549956321716, mean loss: 0.3388307733265415
Epoch: 76, step: 24, loss: 0.37527939677238464, mean loss: 0.3388311053749654
Epoch: 76, step: 25, loss: 0.3545149266719818, mean loss: 0.3388312482539059
Epoch: 76, step: 26, loss: 0.3564856946468353, mean loss: 0.3388314090836915
Epoch: 76, step: 27, loss: 0.3213512599468231, mean loss: 0.3388312498431827
Epoch: 76, step: 28, loss: 0.3713393211364746, mean loss: 0.33883154598222687
Epoch: 76, step: 29, loss: 0.31965169310569763, mean loss: 0.3388313712609552
Epoch: 76, step: 30, loss: 0.3193081319332123, mean loss: 0.33883119341318174
Epoch: 76, step: 31, loss: 0.3559645712375641, mean loss: 0.3388313494889891
Epoch: 76, step: 32, loss: 0.32389453053474426, mean loss: 0.3388312134238848
Epoch: 76, step: 33, loss: 0.317343145608902, mean loss: 0.3388310176827726
Epoch: 76, step: 34, loss: 0.30817481875419617, mean loss: 0.33883073842900885
Epoch: 76, step: 35, loss: 0.33080339431762695, mean loss: 0.3388306653069091
Epoch: 76, step: 36, loss: 0.35754990577697754, mean loss: 0.3388308358213011
Epoch: 76, step: 37, loss: 0.3156575560569763, mean loss: 0.33883062473679026
Epoch: 76, step: 38, loss: 0.3319891095161438, mean loss: 0.3388305624182599
Epoch: 76, step: 39, loss: 0.32262977957725525, mean loss: 0.3388304148486428
Epoch: 76, step: 40, loss: 0.31329992413520813, mean loss: 0.33883018229874334
Epoch: 76, step: 41, loss: 0.3550843596458435, mean loss: 0.33883033035202287
Epoch: 76, step: 42, loss: 0.3416155278682709, mean loss: 0.3388303557211241
Epoch: 76, step: 43, loss: 0.39646607637405396, mean loss: 0.3388308806939868
Epoch: 76, step: 44, loss: 0.32724452018737793, mean loss: 0.3388307751610053
Epoch: 76, step: 45, loss: 0.31500864028930664, mean loss: 0.33883055818191
Epoch: 76, step: 46, loss: 0.33610981702804565, mean loss: 0.3388305334008154
Epoch: 76, step: 47, loss: 0.3146948516368866, mean loss: 0.3388303135698463
Epoch: 76, step: 48, loss: 0.32347387075424194, mean loss: 0.338830173702616
Epoch: 76, step: 49, loss: 0.36790594458580017, mean loss: 0.33883043852374356
Epoch: 76, step: 50, loss: 0.3365657925605774, mean loss: 0.33883041789761337
Epoch: 76, step: 51, loss: 0.32830002903938293, mean loss: 0.3388303219889386
Epoch: 76, step: 52, loss: 0.29856061935424805, mean loss: 0.3388299552238846
Epoch: 76, step: 53, loss: 0.3351035416126251, mean loss: 0.3388299212850732
Epoch: 76, step: 54, loss: 0.299212247133255, mean loss: 0.33882956046508256
Epoch: 76, step: 55, loss: 0.31718704104423523, mean loss: 0.3388293633565268
Epoch: 76, step: 56, loss: 0.391408771276474, mean loss: 0.3388298422174472
Epoch: 76, step: 57, loss: 0.33800819516181946, mean loss: 0.33882983473445916
Epoch: 76, step: 58, loss: 0.3336000442504883, mean loss: 0.33882978710561035
Epoch: 76, step: 59, loss: 0.3290652334690094, mean loss: 0.33882969817848896
Epoch: 76, step: 60, loss: 0.3174613416194916, mean loss: 0.33882950357572444
Epoch: 76, step: 61, loss: 0.33445030450820923, mean loss: 0.33882946369448785
Epoch: 76, step: 62, loss: 0.31624463200569153, mean loss: 0.33882925801696556
Epoch: 76, step: 63, loss: 0.332792192697525, mean loss: 0.3388292030385913
Epoch: 76, step: 64, loss: 0.3198160231113434, mean loss: 0.3388290298908536
Epoch: 76, step: 65, loss: 0.2837812900543213, mean loss: 0.3388285285909735
Epoch: 76, step: 66, loss: 0.34770146012306213, mean loss: 0.3388286093928197
Epoch: 76, step: 67, loss: 0.33341506123542786, mean loss: 0.33882856009449025
Epoch: 76, step: 68, loss: 0.3707066774368286, mean loss: 0.33882885038905775
Epoch: 76, step: 69, loss: 0.296688050031662, mean loss: 0.3388284666419913
Epoch: 76, step: 70, loss: 0.37855619192123413, mean loss: 0.3388288284115608
Epoch: 76, step: 71, loss: 0.3303883671760559, mean loss: 0.33882875155152914
Epoch: 76, step: 72, loss: 0.3129425048828125, mean loss: 0.33882851582985885
Epoch: 76, step: 73, loss: 0.3260144293308258, mean loss: 0.33882839914510315
Epoch: 76, step: 74, loss: 0.3051966428756714, mean loss: 0.3388280928979486
Epoch: 76, step: 75, loss: 0.37316668033599854, mean loss: 0.3388284055785845
Epoch: 76, step: 76, loss: 0.3737035095691681, mean loss: 0.3388287231417463
Epoch: 76, step: 77, loss: 0.3274625539779663, mean loss: 0.3388286196454599
Epoch: 76, step: 78, loss: 0.29799434542655945, mean loss: 0.3388282478264947
Epoch: 76, step: 79, loss: 0.3118760287761688, mean loss: 0.33882800241366096
Epoch: 76, step: 80, loss: 0.31754374504089355, mean loss: 0.33882780861209144
Epoch: 76, step: 81, loss: 0.34991487860679626, mean loss: 0.3388279095633233
Epoch: 76, step: 82, loss: 0.3177781403064728, mean loss: 0.33882771790035104
Epoch: 76, step: 83, loss: 0.31013134121894836, mean loss: 0.3388274566156451
Epoch: 76, step: 84, loss: 0.32042428851127625, mean loss: 0.33882728905363413
Epoch: 76, step: 85, loss: 0.33489990234375, mean loss: 0.338827253294855
Epoch: 76, step: 86, loss: 0.3486899435520172, mean loss: 0.33882734309363916
Epoch: 76, step: 87, loss: 0.31770020723342896, mean loss: 0.3388271507349836
Epoch: 76, step: 88, loss: 0.3308894634246826, mean loss: 0.3388270784644701
Epoch: 76, step: 89, loss: 0.3490823805332184, mean loss: 0.33882717183539407
Epoch: 76, step: 90, loss: 0.35073959827423096, mean loss: 0.3388272802928661
Epoch: 76, step: 91, loss: 0.32077834010124207, mean loss: 0.3388271159665961
Epoch: 76, step: 92, loss: 0.3169091045856476, mean loss: 0.33882691641624985
Epoch: 76, step: 93, loss: 0.33935344219207764, mean loss: 0.33882692120990754
Epoch: 76, step: 94, loss: 0.29682162404060364, mean loss: 0.33882653878383695
Epoch: 76, step: 95, loss: 0.3624880611896515, mean loss: 0.3388267542019215
Epoch: 76, step: 96, loss: 0.3057304918766022, mean loss: 0.3388264528912786
Epoch: 76, step: 97, loss: 0.37419870495796204, mean loss: 0.3388267749197565
Epoch: 76, step: 98, loss: 0.32185235619544983, mean loss: 0.33882662038629763
Epoch: 76, step: 99, loss: 0.32427847385406494, mean loss: 0.3388264879425908
Epoch: 76, step: 100, loss: 0.3259557783603668, mean loss: 0.33882637077103467
Epoch: 76, step: 101, loss: 0.34971871972084045, mean loss: 0.338826469931213
Epoch: 76, step: 102, loss: 0.3137466013431549, mean loss: 0.3388262416148404
Epoch: 76, step: 103, loss: 0.328120619058609, mean loss: 0.338826144156329
Epoch: 76, step: 104, loss: 0.3345020115375519, mean loss: 0.338826104791996
Epoch: 76, step: 105, loss: 0.3481602072715759, mean loss: 0.3388261897633431
Epoch: 76, step: 106, loss: 0.33083680272102356, mean loss: 0.33882611703403664
Epoch: 76, step: 107, loss: 0.43639615178108215, mean loss: 0.338827005229379
Epoch: 76, step: 108, loss: 0.2877733111381531, mean loss: 0.33882654048381816
Epoch: 76, step: 109, loss: 0.3529273271560669, mean loss: 0.33882666884315576
Epoch: 76, step: 110, loss: 0.32270628213882446, mean loss: 0.33882652210075254
Epoch: 76, step: 111, loss: 0.4210887551307678, mean loss: 0.33882727091950643
Epoch: 76, step: 112, loss: 0.3450305759906769, mean loss: 0.3388273273865961
Epoch: 76, step: 113, loss: 0.31902366876602173, mean loss: 0.33882714712062895
Epoch: 76, step: 114, loss: 0.37528592348098755, mean loss: 0.3388274789894459
Epoch: 76, step: 115, loss: 0.3742062747478485, mean loss: 0.33882780102472493
Epoch: 76, step: 116, loss: 0.3428223431110382, mean loss: 0.3388278373846897
Epoch: 76, step: 117, loss: 0.3487401306629181, mean loss: 0.3388279276096381
Epoch: 76, step: 118, loss: 0.3483210802078247, mean loss: 0.3388280140186438
Epoch: 76, step: 119, loss: 0.32836592197418213, mean loss: 0.3388279187909801
Epoch: 76, step: 120, loss: 0.32610905170440674, mean loss: 0.3388278030228366
Epoch: 76, step: 121, loss: 0.331417053937912, mean loss: 0.33882773557022083
Epoch: 76, step: 122, loss: 0.33722034096717834, mean loss: 0.3388277209398532
Epoch: 76, step: 123, loss: 0.3189375400543213, mean loss: 0.33882753990278247
Epoch: 76, step: 124, loss: 0.33101195096969604, mean loss: 0.33882746876725806
Epoch: 76, step: 125, loss: 0.3764954209327698, mean loss: 0.3388278116083627
Epoch: 76, step: 126, loss: 0.30292990803718567, mean loss: 0.3388274848806222
Epoch: 76, step: 127, loss: 0.3470357060432434, mean loss: 0.3388275595877465
Epoch: 76, step: 128, loss: 0.31374219059944153, mean loss: 0.3388273312753405
Epoch: 76, step: 129, loss: 0.31361672282218933, mean loss: 0.3388271018251662
Epoch: 76, step: 130, loss: 0.3059491813182831, mean loss: 0.3388268025949454
Epoch: 76, step: 131, loss: 0.3650551736354828, mean loss: 0.3388270413037721
Epoch: 76, step: 132, loss: 0.36388498544692993, mean loss: 0.33882726935827073
Epoch: 76, step: 133, loss: 0.3418576121330261, mean loss: 0.3388272969374292
Epoch: 76, step: 134, loss: 0.3096626400947571, mean loss: 0.33882703151221744
Epoch: 76, step: 135, loss: 0.3057733178138733, mean loss: 0.33882673069574765
Epoch: 76, step: 136, loss: 0.3150128722190857, mean loss: 0.3388265139716691
Epoch: 76, step: 137, loss: 0.3171192705631256, mean loss: 0.33882631642117483
Epoch: 76, step: 138, loss: 0.3417492210865021, mean loss: 0.3388263430213283
Epoch: 76, step: 139, loss: 0.2999221682548523, mean loss: 0.3388259889736529
Epoch: 76, step: 140, loss: 0.3099426329135895, mean loss: 0.3388257261228902
Epoch: 76, step: 141, loss: 0.30688807368278503, mean loss: 0.33882543547938293
Epoch: 76, step: 142, loss: 0.31859347224235535, mean loss: 0.338825251363307
Epoch: 76, step: 143, loss: 0.3173866868019104, mean loss: 0.33882505626862364
Epoch: 76, step: 144, loss: 0.37183988094329834, mean loss: 0.3388253567065626
Epoch: 76, step: 145, loss: 0.3245689570903778, mean loss: 0.3388252269731964
Epoch: 76, step: 146, loss: 0.3622768819332123, mean loss: 0.3388254403815279
Epoch: 76, step: 147, loss: 0.2976802885532379, mean loss: 0.33882506596708617
Epoch: 76, step: 148, loss: 0.3500639796257019, mean loss: 0.3388251682385107
Epoch: 76, step: 149, loss: 0.3639375865459442, mean loss: 0.3388253967534279
Epoch: 76, step: 150, loss: 0.32099631428718567, mean loss: 0.338825234515997
Epoch: 76, step: 151, loss: 0.35588935017585754, mean loss: 0.33882538979112675
Epoch: 76, step: 152, loss: 0.3439687490463257, mean loss: 0.3388254365927615
Epoch: 76, step: 153, loss: 0.3347870707511902, mean loss: 0.33882539984627075
Epoch: 76, step: 154, loss: 0.3264865577220917, mean loss: 0.3388252875718904
Epoch: 76, step: 155, loss: 0.32272177934646606, mean loss: 0.33882514104315314
Epoch: 76, step: 156, loss: 0.34744855761528015, mean loss: 0.33882521950846806
Epoch: 76, step: 157, loss: 0.3549710810184479, mean loss: 0.33882536641991196
Epoch: 76, step: 158, loss: 0.34773483872413635, mean loss: 0.3388254474866008
Epoch: 76, step: 159, loss: 0.3104417622089386, mean loss: 0.3388251892277087
Epoch: 76, step: 160, loss: 0.30013278126716614, mean loss: 0.33882483717449946
Epoch: 76, step: 161, loss: 0.3459409177303314, mean loss: 0.33882490192147013
Epoch: 76, step: 162, loss: 0.2906464636325836, mean loss: 0.3388244635650571
Epoch: 76, step: 163, loss: 0.36229974031448364, mean loss: 0.338824677155303
Epoch: 76, step: 164, loss: 0.36151227355003357, mean loss: 0.33882488357694635
Epoch: 76, step: 165, loss: 0.34822994470596313, mean loss: 0.33882496914751437
Epoch: 76, step: 166, loss: 0.30480730533599854, mean loss: 0.33882465964561
Epoch: 76, step: 167, loss: 0.3189838230609894, mean loss: 0.3388244791299558
Epoch: 76, step: 168, loss: 0.3130268454551697, mean loss: 0.33882424442037934
Epoch: 76, step: 169, loss: 0.326811283826828, mean loss: 0.33882413512619847
Epoch: 76, step: 170, loss: 0.3510092794895172, mean loss: 0.33882424598590244
Epoch: 76, step: 171, loss: 0.36562809348106384, mean loss: 0.3388244898434618
Epoch: 76, step: 172, loss: 0.3213333785533905, mean loss: 0.3388243307132882
Epoch: 76, step: 173, loss: 0.35928890109062195, mean loss: 0.3388245168936261
Epoch: 76, step: 174, loss: 0.3273322284221649, mean loss: 0.3388244123412878
Epoch: 76, step: 175, loss: 0.33586031198501587, mean loss: 0.3388243853753093
Epoch: 76, step: 176, loss: 0.32672175765037537, mean loss: 0.33882427527234693
Epoch: 76, step: 177, loss: 0.3170511722564697, mean loss: 0.3388240771945917
Epoch: 76, step: 178, loss: 0.3113381564617157, mean loss: 0.3388238271475521
Epoch: 76, step: 179, loss: 0.299367755651474, mean loss: 0.33882346820799847
Epoch: 76, step: 180, loss: 0.3401239812374115, mean loss: 0.3388234800389107
Epoch: 76, step: 181, loss: 0.3154503107070923, mean loss: 0.33882326741251356
Epoch: 76, step: 182, loss: 0.30766451358795166, mean loss: 0.33882298396300775
Epoch: 76, step: 183, loss: 0.31405478715896606, mean loss: 0.33882275865010475
Epoch: 76, step: 184, loss: 0.3134026527404785, mean loss: 0.3388225274089772
Epoch: 76, step: 185, loss: 0.3492315709590912, mean loss: 0.33882262209690184
Epoch: 76, step: 186, loss: 0.343102365732193, mean loss: 0.3388226610280826
Epoch: 76, step: 187, loss: 0.3806397318840027, mean loss: 0.3388230414184226
Epoch: 76, step: 188, loss: 0.29328495264053345, mean loss: 0.33882262718349065
Epoch: 76, step: 189, loss: 0.30032020807266235, mean loss: 0.33882227695135947
Epoch: 76, step: 190, loss: 0.3001616895198822, mean loss: 0.3388219252836701
Epoch: 76, step: 191, loss: 0.31865355372428894, mean loss: 0.3388217418281
Epoch: 76, step: 192, loss: 0.33783623576164246, mean loss: 0.33882173286381984
Epoch: 76, step: 193, loss: 0.330794095993042, mean loss: 0.3388216598441463
Epoch: 76, step: 194, loss: 0.31638166308403015, mean loss: 0.3388214557309857
Epoch: 76, step: 195, loss: 0.301564484834671, mean loss: 0.33882111684640415
Epoch: 76, step: 196, loss: 0.35332271456718445, mean loss: 0.3388212487498589
Epoch: 76, step: 197, loss: 0.31560230255126953, mean loss: 0.3388210375571737
Epoch: 76, step: 198, loss: 0.31458860635757446, mean loss: 0.33882081714813267
Epoch: 76, step: 199, loss: 0.328950434923172, mean loss: 0.3388207273716808
Epoch: 76, step: 200, loss: 0.30060040950775146, mean loss: 0.33882037974043006
Epoch: 76, step: 201, loss: 0.3034173846244812, mean loss: 0.33882005773694546
Epoch: 76, step: 202, loss: 0.3162030875682831, mean loss: 0.33881985202901194
Epoch: 76, step: 203, loss: 0.3296666145324707, mean loss: 0.33881976877840714
Epoch: 76, step: 204, loss: 0.3247888386249542, mean loss: 0.3388196411653306
Epoch: 76, step: 205, loss: 0.3541867434978485, mean loss: 0.3388197809297902
Epoch: 76, step: 206, loss: 0.3242156505584717, mean loss: 0.3388196481058016
Epoch: 76, step: 207, loss: 0.3324635624885559, mean loss: 0.33881959029797987
Epoch: 76, step: 208, loss: 0.30157366394996643, mean loss: 0.33881925155391335
Epoch: 76, step: 209, loss: 0.40029025077819824, mean loss: 0.3388198106149682
Epoch: 76, step: 210, loss: 0.34681078791618347, mean loss: 0.33881988328994705
Epoch: 76, step: 211, loss: 0.3020484149456024, mean loss: 0.33881954887010324
Epoch: 76, step: 212, loss: 0.3139323890209198, mean loss: 0.33881932253471897
Epoch: 76, step: 213, loss: 0.33364197611808777, mean loss: 0.33881927544995555
Epoch: 76, step: 214, loss: 0.3719756305217743, mean loss: 0.33881957698375514
Epoch: 76, step: 215, loss: 0.33851197361946106, mean loss: 0.3388195741863437
Epoch: 76, step: 216, loss: 0.35423123836517334, mean loss: 0.33881971434207325
Epoch: 76, step: 217, loss: 0.32002344727516174, mean loss: 0.3388195434078681
Epoch: 76, step: 218, loss: 0.3402087986469269, mean loss: 0.3388195560417107
Epoch: 76, step: 219, loss: 0.28445860743522644, mean loss: 0.33881906168948084
Epoch: 76, step: 220, loss: 0.3335701823234558, mean loss: 0.33881901395720815
Epoch: 76, step: 221, loss: 0.3014533221721649, mean loss: 0.338818674164074
Epoch: 76, step: 222, loss: 0.3153717815876007, mean loss: 0.3388184609465399
Epoch: 76, step: 223, loss: 0.328792542219162, mean loss: 0.33881836977530166
Epoch: 76, step: 224, loss: 0.319071501493454, mean loss: 0.33881819020771187
Epoch: 76, step: 225, loss: 0.32731616497039795, mean loss: 0.3388180856153209
Epoch: 76, step: 226, loss: 0.3473822772502899, mean loss: 0.33881816349213967
Epoch: 76, step: 227, loss: 0.3570336699485779, mean loss: 0.33881832912981524
Epoch: 76, step: 228, loss: 0.33117905259132385, mean loss: 0.33881825966479623
Epoch: 76, step: 229, loss: 0.2954799234867096, mean loss: 0.3388178655867762
Epoch: 76, step: 230, loss: 0.39056286215782166, mean loss: 0.33881833610277134
Epoch: 76, step: 231, loss: 0.3110012710094452, mean loss: 0.33881808316517503
Epoch: 76, step: 232, loss: 0.33436763286590576, mean loss: 0.33881804269807464
Epoch: 76, step: 233, loss: 0.32730716466903687, mean loss: 0.33881793803279586
Epoch: 76, step: 234, loss: 0.34460029006004333, mean loss: 0.3388179906096699
Epoch: 76, step: 235, loss: 0.34784355759620667, mean loss: 0.33881807267519987
Epoch: 76, step: 236, loss: 0.327412873506546, mean loss: 0.33881796897365896
Epoch: 76, step: 237, loss: 0.3413371443748474, mean loss: 0.33881799187900163
Epoch: 76, step: 238, loss: 0.3075905740261078, mean loss: 0.3388177079495048
Epoch: 76, step: 239, loss: 0.3403712809085846, mean loss: 0.3388177220749499
Epoch: 76, step: 240, loss: 0.3429059088230133, mean loss: 0.3388177592453527
Epoch: 76, step: 241, loss: 0.3271710276603699, mean loss: 0.33881765335249736
Epoch: 76, step: 242, loss: 0.34130391478538513, mean loss: 0.3388176759575455
Epoch: 76, step: 243, loss: 0.2944764494895935, mean loss: 0.33881727281150714
Epoch: 76, step: 244, loss: 0.3090125620365143, mean loss: 0.3388170018324931
Epoch: 76, step: 245, loss: 0.324838787317276, mean loss: 0.3388168747462624
Epoch: 76, step: 246, loss: 0.33602577447891235, mean loss: 0.3388168493705474
Epoch: 76, step: 247, loss: 0.31699755787849426, mean loss: 0.338816650998925
Epoch: 76, step: 248, loss: 0.28823256492614746, mean loss: 0.3388161911143317
Epoch: 76, step: 249, loss: 0.339141845703125, mean loss: 0.3388161940749895
Epoch: 76, step: 250, loss: 0.35859742760658264, mean loss: 0.33881637391255964
Epoch: 76, step: 251, loss: 0.32068926095962524, mean loss: 0.33881620911463106
Epoch: 76, step: 252, loss: 0.3322232663631439, mean loss: 0.3388161491771532
Epoch: 76, step: 253, loss: 0.3272424638271332, mean loss: 0.33881604395991877
Epoch: 76, step: 254, loss: 0.3122563362121582, mean loss: 0.3388158025058351
Epoch: 76, step: 255, loss: 0.360360711812973, mean loss: 0.33881599836864695
Epoch: 76, step: 256, loss: 0.3271665573120117, mean loss: 0.3388158924656001
Epoch: 76, step: 257, loss: 0.3149542808532715, mean loss: 0.33881567554580216
Epoch: 76, step: 258, loss: 0.3030967712402344, mean loss: 0.338815350837346
Epoch: 76, step: 259, loss: 0.34799712896347046, mean loss: 0.33881543430502103
Epoch: 76, step: 260, loss: 0.3203471899032593, mean loss: 0.33881526641952125
Epoch: 76, step: 261, loss: 0.31667882204055786, mean loss: 0.33881506519009397
Epoch: 76, step: 262, loss: 0.32454633712768555, mean loss: 0.3388149354826384
Epoch: 76, step: 263, loss: 0.35800933837890625, mean loss: 0.33881510996452063
Epoch: 76, step: 264, loss: 0.35598886013031006, mean loss: 0.33881526607674933
Epoch: 76, step: 265, loss: 0.38374048471450806, mean loss: 0.33881567445070293
Epoch: 76, step: 266, loss: 0.35049110651016235, mean loss: 0.3388157805803814
Epoch: 76, step: 267, loss: 0.3417263329029083, mean loss: 0.3388158070370618
Epoch: 76, step: 268, loss: 0.3358331322669983, mean loss: 0.3388157799250408
Epoch: 76, step: 269, loss: 0.3210727870464325, mean loss: 0.33881561864563203
Epoch: 76, step: 270, loss: 0.3375225365161896, mean loss: 0.33881560689194273
Epoch: 76, step: 271, loss: 0.3646918833255768, mean loss: 0.3388158420966078
Epoch: 76, step: 272, loss: 0.30202773213386536, mean loss: 0.3388155077109223
Epoch: 76, step: 273, loss: 0.3507150709629059, mean loss: 0.3388156158710711
Epoch: 76, step: 274, loss: 0.37555837631225586, mean loss: 0.33881594983848073
Epoch: 76, step: 275, loss: 0.34035634994506836, mean loss: 0.3388159638395724
Epoch: 76, step: 276, loss: 0.339955598115921, mean loss: 0.3388159741979065
Epoch: 76, step: 277, loss: 0.34356382489204407, mean loss: 0.3388160173515548
Epoch: 76, step: 278, loss: 0.3619247078895569, mean loss: 0.3388162273866433
Epoch: 76, step: 279, loss: 0.3145608901977539, mean loss: 0.3388160069316772
Epoch: 76, step: 280, loss: 0.3298671245574951, mean loss: 0.3388159255966863
Epoch: 76, step: 281, loss: 0.34005671739578247, mean loss: 0.3388159368739462
Epoch: 76, step: 282, loss: 0.33960238099098206, mean loss: 0.3388159440216837
Epoch: 76, step: 283, loss: 0.3417157530784607, mean loss: 0.3388159703768756
Epoch: 76, step: 284, loss: 0.34285447001457214, mean loss: 0.3388160070808322
Epoch: 76, step: 285, loss: 0.2962592840194702, mean loss: 0.3388156203070154
Epoch: 76, step: 286, loss: 0.3384607434272766, mean loss: 0.3388156170817709
Epoch: 76, step: 287, loss: 0.31744539737701416, mean loss: 0.33881542286354616
Epoch: 76, step: 288, loss: 0.3012888431549072, mean loss: 0.33881508181513603
Epoch: 76, step: 289, loss: 0.37305712699890137, mean loss: 0.3388153930102683
Epoch: 76, step: 290, loss: 0.3347541093826294, mean loss: 0.33881535610125185
Epoch: 76, step: 291, loss: 0.3096482455730438, mean loss: 0.3388150910324514
Epoch: 76, step: 292, loss: 0.32137641310691833, mean loss: 0.33881493255232265
Epoch: 76, step: 293, loss: 0.3384486734867096, mean loss: 0.3388149292238446
Epoch: 76, step: 294, loss: 0.3661157488822937, mean loss: 0.33881517732515104
Epoch: 76, step: 295, loss: 0.30628082156181335, mean loss: 0.33881488166579293
Epoch: 76, step: 296, loss: 0.3410862386226654, mean loss: 0.33881490230679906
Epoch: 76, step: 297, loss: 0.33536896109580994, mean loss: 0.33881487099201735
Epoch: 76, step: 298, loss: 0.33026182651519775, mean loss: 0.3388147932674508
Epoch: 76, step: 299, loss: 0.2969164252281189, mean loss: 0.33881441252549266
Epoch: 76, step: 300, loss: 0.33627238869667053, mean loss: 0.3388143894256351
Epoch: 76, step: 301, loss: 0.309461385011673, mean loss: 0.3388141226916837
Epoch: 76, step: 302, loss: 0.3239802122116089, mean loss: 0.3388139878955468
Epoch: 76, step: 303, loss: 0.3248128592967987, mean loss: 0.33881386066807695
Epoch: 76, step: 304, loss: 0.34283947944641113, mean loss: 0.33881389724831645
Epoch: 76, step: 305, loss: 0.31698670983314514, mean loss: 0.338813698909494
Epoch: 76, step: 306, loss: 0.3215014636516571, mean loss: 0.3388135415984722
Epoch: 76, step: 307, loss: 0.31586509943008423, mean loss: 0.3388133330748455
Epoch: 76, step: 308, loss: 0.3404461145401001, mean loss: 0.33881334791116496
Epoch: 76, step: 309, loss: 0.34814688563346863, mean loss: 0.3388134327198745
Epoch: 76, step: 310, loss: 0.3481241464614868, mean loss: 0.3388135173204264
Epoch: 76, step: 311, loss: 0.31989046931266785, mean loss: 0.33881334538025043
Epoch: 76, step: 312, loss: 0.30594030022621155, mean loss: 0.3388130466891617
Epoch: 76, step: 313, loss: 0.3653836250305176, mean loss: 0.3388132881125779
Epoch: 76, step: 314, loss: 0.3153093457221985, mean loss: 0.3388130745549189
Epoch: 76, step: 315, loss: 0.32281622290611267, mean loss: 0.33881292920827477
Epoch: 76, step: 316, loss: 0.39010581374168396, mean loss: 0.33881339524878445
Epoch: 76, step: 317, loss: 0.31479576230049133, mean loss: 0.33881317702966296
Epoch: 76, step: 318, loss: 0.2763601839542389, mean loss: 0.3388126096001628
Epoch: 76, step: 319, loss: 0.33071181178092957, mean loss: 0.33881253599936856
Epoch: 76, step: 320, loss: 0.3172147572040558, mean loss: 0.3388123397718776
Epoch: 76, step: 321, loss: 0.36358627676963806, mean loss: 0.3388125648544371
Epoch: 76, step: 322, loss: 0.34957587718963623, mean loss: 0.33881266264316884
Epoch: 76, step: 323, loss: 0.4126470983028412, mean loss: 0.33881333345063025
Epoch: 76, step: 324, loss: 0.33576950430870056, mean loss: 0.33881330579680274
Epoch: 76, step: 325, loss: 0.3315029740333557, mean loss: 0.33881323938150554
Epoch: 76, step: 326, loss: 0.3364562392234802, mean loss: 0.3388132179680528
Epoch: 76, step: 327, loss: 0.31425830721855164, mean loss: 0.33881299488760774
Epoch: 76, step: 328, loss: 0.326910138130188, mean loss: 0.33881288675158205
Epoch: 76, step: 329, loss: 0.32728320360183716, mean loss: 0.3388127820067454
Epoch: 76, step: 330, loss: 0.298738032579422, mean loss: 0.33881241793906947
Epoch: 76, step: 331, loss: 0.31470170617103577, mean loss: 0.3388121989021153
Epoch: 76, step: 332, loss: 0.29456788301467896, mean loss: 0.33881179696241953
Epoch: 76, step: 333, loss: 0.34143704175949097, mean loss: 0.33881182081137023
Epoch: 76, step: 334, loss: 0.3858168423175812, mean loss: 0.3388122478230755
Epoch: 76, step: 335, loss: 0.3530848026275635, mean loss: 0.33881237747927834
Epoch: 76, step: 336, loss: 0.3238368034362793, mean loss: 0.3388122414378721
Epoch: 76, step: 337, loss: 0.3507043421268463, mean loss: 0.3388123494673473
Epoch: 76, step: 338, loss: 0.35874876379966736, mean loss: 0.3388125305708268
Epoch: 76, step: 339, loss: 0.3239279091358185, mean loss: 0.3388123953593389
Epoch: 76, step: 340, loss: 0.3124190866947174, mean loss: 0.3388121556054336
Epoch: 76, step: 341, loss: 0.31944769620895386, mean loss: 0.33881197970241783
Epoch: 76, step: 342, loss: 0.32200005650520325, mean loss: 0.338811826987536
Epoch: 76, step: 343, loss: 0.326216459274292, mean loss: 0.33881171257572257
Epoch: 76, step: 344, loss: 0.3568924367427826, mean loss: 0.33881187681305935
Epoch: 76, step: 345, loss: 0.3188193440437317, mean loss: 0.3388116952113447
Epoch: 76, step: 346, loss: 0.4030371606349945, mean loss: 0.33881227859659346
Epoch: 76, step: 347, loss: 0.29876846075057983, mean loss: 0.33881191486609674
Epoch: 76, step: 348, loss: 0.3281481862068176, mean loss: 0.3388118180050006
Epoch: 76, step: 349, loss: 0.34586700797080994, mean loss: 0.3388118820883291
Epoch: 76, step: 350, loss: 0.3341991603374481, mean loss: 0.33881184019067934
Epoch: 76, step: 351, loss: 0.31905367970466614, mean loss: 0.33881166072766083
Epoch: 76, step: 352, loss: 0.3707718253135681, mean loss: 0.33881195101862777
Epoch: 76, step: 353, loss: 0.2768886685371399, mean loss: 0.3388113885807771
Epoch: 76, step: 354, loss: 0.2967592775821686, mean loss: 0.33881100663261227
Epoch: 76, step: 355, loss: 0.35361796617507935, mean loss: 0.33881114111907495
Epoch: 76, step: 356, loss: 0.3667367696762085, mean loss: 0.33881139475554106
Epoch: 76, step: 357, loss: 0.30735984444618225, mean loss: 0.3388111090972396
Epoch: 76, step: 358, loss: 0.3752804696559906, mean loss: 0.3388114403267298
Epoch: 76, step: 359, loss: 0.34552231431007385, mean loss: 0.33881150127704934
Epoch: 76, step: 360, loss: 0.3225170969963074, mean loss: 0.3388113532873642
Epoch: 76, step: 361, loss: 0.3269346356391907, mean loss: 0.3388112454211476
Epoch: 76, step: 362, loss: 0.3521004319190979, mean loss: 0.3388113661145322
Epoch: 76, step: 363, loss: 0.28872907161712646, mean loss: 0.33881091126752294
Epoch: 76, step: 364, loss: 0.30597934126853943, mean loss: 0.33881061309416743
Epoch: 76, step: 365, loss: 0.3124275803565979, mean loss: 0.3388103734880214
Epoch: 76, step: 366, loss: 0.3304852843284607, mean loss: 0.3388102978816863
Epoch: 76, step: 367, loss: 0.3639238178730011, mean loss: 0.33881052595419425
Epoch: 76, step: 368, loss: 0.3082214891910553, mean loss: 0.3388102481574149
Epoch: 76, step: 369, loss: 0.33166906237602234, mean loss: 0.3388101833047551
Epoch: 76, step: 370, loss: 0.3160819411277771, mean loss: 0.3388099769001583
Epoch: 76, step: 371, loss: 0.34332409501075745, mean loss: 0.33881001789436543
Epoch: 76, step: 372, loss: 0.38898688554763794, mean loss: 0.33881047356304195
Epoch: 76, step: 373, loss: 0.3340511918067932, mean loss: 0.33881043034320724
Epoch: 76, step: 374, loss: 0.3556150496006012, mean loss: 0.33881058294738325
Epoch: 76, step: 375, loss: 0.34843966364860535, mean loss: 0.3388106703890896
Epoch: 76, step: 376, loss: 0.3223990499973297, mean loss: 0.33881052135647644
Epoch: 76, step: 377, loss: 0.315024733543396, mean loss: 0.33881030536159973
Epoch: 76, step: 378, loss: 0.3843846619129181, mean loss: 0.33881071921117295
Epoch: 76, step: 379, loss: 0.3394709527492523, mean loss: 0.3388107252065376
Epoch: 76, step: 380, loss: 0.3278357684612274, mean loss: 0.3388106255474525
Epoch: 76, step: 381, loss: 0.3120133876800537, mean loss: 0.3388103822149255
Epoch: 76, step: 382, loss: 0.3396257162094116, mean loss: 0.33881038961850496
Epoch: 76, step: 383, loss: 0.354340523481369, mean loss: 0.3388105306374453
Epoch: 76, step: 384, loss: 0.336692214012146, mean loss: 0.33881051140257873
Epoch: 76, step: 385, loss: 0.3269709050655365, mean loss: 0.3388104038968461
Epoch: 76, step: 386, loss: 0.31827741861343384, mean loss: 0.3388102174553783
Epoch: 76, step: 387, loss: 0.3698231279850006, mean loss: 0.3388104990530114
Epoch: 76, step: 388, loss: 0.34788474440574646, mean loss: 0.33881058144652976
Epoch: 76, step: 389, loss: 0.29614078998565674, mean loss: 0.3388101940113012
Epoch: 76, step: 390, loss: 0.295243501663208, mean loss: 0.3388097984359405
Epoch: 76, step: 391, loss: 0.34606385231018066, mean loss: 0.33880986430045235
Epoch: 76, step: 392, loss: 0.382976770401001, mean loss: 0.33881026531833097
Epoch: 76, step: 393, loss: 0.4383188486099243, mean loss: 0.33881116880834616
Epoch: 76, step: 394, loss: 0.3499162793159485, mean loss: 0.3388112696364861
Epoch: 76, step: 395, loss: 0.30298954248428345, mean loss: 0.3388109443983605
Epoch: 76, step: 396, loss: 0.3056512176990509, mean loss: 0.33881064333221167
Epoch: 76, step: 397, loss: 0.32501110434532166, mean loss: 0.33881051804359347
Epoch: 76, step: 398, loss: 0.33368200063705444, mean loss: 0.338810471481239
Epoch: 76, step: 399, loss: 0.3521720767021179, mean loss: 0.3388105927915711
Epoch: 76, step: 400, loss: 0.32558783888816833, mean loss: 0.33881047274296333
Epoch: 76, step: 401, loss: 0.3381636142730713, mean loss: 0.33881046687022653
Epoch: 76, step: 402, loss: 0.3514256179332733, mean loss: 0.33881058140036413
Epoch: 76, step: 403, loss: 0.4010099470615387, mean loss: 0.33881114608937946
Epoch: 76, step: 404, loss: 0.35203689336776733, mean loss: 0.3388112661608034
Epoch: 76, step: 405, loss: 0.3009882867336273, mean loss: 0.3388109227837773
Epoch: 76, step: 406, loss: 0.3434404730796814, mean loss: 0.3388109648129036
Epoch: 76, step: 407, loss: 0.3540208637714386, mean loss: 0.3388111028939095
Epoch: 76, step: 408, loss: 0.3164944052696228, mean loss: 0.3388109002966346
Epoch: 76, step: 409, loss: 0.37456709146499634, mean loss: 0.33881122489847537
Epoch: 76, step: 410, loss: 0.337116003036499, mean loss: 0.33881120950905264
Epoch: 76, step: 411, loss: 0.3357670307159424, mean loss: 0.33881118187389164
Epoch: 76, step: 412, loss: 0.34410974383354187, mean loss: 0.3388112299739848
Epoch: 76, step: 413, loss: 0.3312121331691742, mean loss: 0.3388111609903721
Epoch: 76, step: 414, loss: 0.35199233889579773, mean loss: 0.33881128064630495
Epoch: 76, step: 415, loss: 0.3219374120235443, mean loss: 0.33881112747030073
Epoch: 76, step: 416, loss: 0.3312165141105652, mean loss: 0.3388110585292657
Epoch: 76, step: 417, loss: 0.3348148763179779, mean loss: 0.3388110222537604
Epoch: 76, step: 418, loss: 0.3367648720741272, mean loss: 0.33881100367991823
Epoch: 76, step: 419, loss: 0.33782434463500977, mean loss: 0.33881099472364357
Epoch: 76, step: 420, loss: 0.33802393078804016, mean loss: 0.3388109875792335
Epoch: 76, step: 421, loss: 0.3327639102935791, mean loss: 0.33881093268863854
Epoch: 76, step: 422, loss: 0.2991935908794403, mean loss: 0.3388105730769417
Epoch: 76, step: 423, loss: 0.3121596574783325, mean loss: 0.33881033116535575
Epoch: 76, step: 424, loss: 0.32589423656463623, mean loss: 0.3388102139264355
Epoch: 76, step: 425, loss: 0.31143081188201904, mean loss: 0.33880996540685626
Epoch: 76, step: 426, loss: 0.2874208092689514, mean loss: 0.33880949895782575
Epoch: 76, step: 427, loss: 0.34824368357658386, mean loss: 0.33880958458924404
Epoch: 76, step: 428, loss: 0.3246670961380005, mean loss: 0.3388094562230522
Epoch: 76, step: 429, loss: 0.35416120290756226, mean loss: 0.33880959556397366
Epoch: 76, step: 430, loss: 0.32153749465942383, mean loss: 0.3388094387942809
Epoch: 76, step: 431, loss: 0.30746540427207947, mean loss: 0.33880915430369746
Epoch: 76, step: 432, loss: 0.341814786195755, mean loss: 0.3388091815837277
Epoch: 76, step: 433, loss: 0.398831844329834, mean loss: 0.3388097263627466
Epoch: 76, step: 434, loss: 0.3391891121864319, mean loss: 0.33880972980610535
Epoch: 76, step: 435, loss: 0.317665696144104, mean loss: 0.338809537901643
Epoch: 76, step: 436, loss: 0.31294897198677063, mean loss: 0.3388093031917936
Epoch: 76, step: 437, loss: 0.3421678841114044, mean loss: 0.33880933367391336
Epoch: 76, step: 438, loss: 0.3335202932357788, mean loss: 0.33880928567158597
Epoch: 76, step: 439, loss: 0.3362922966480255, mean loss: 0.33880926282807855
Epoch: 76, step: 440, loss: 0.3730415999889374, mean loss: 0.33880957350863544
Epoch: 76, step: 441, loss: 0.3272463381290436, mean loss: 0.33880946856576266
Epoch: 76, step: 442, loss: 0.3334192931652069, mean loss: 0.33880941964732947
Epoch: 76, step: 443, loss: 0.32866328954696655, mean loss: 0.3388093275671565
Epoch: 76, step: 444, loss: 0.31446409225463867, mean loss: 0.33880910662645175
Epoch: 76, step: 445, loss: 0.32515957951545715, mean loss: 0.3388089827538035
Epoch: 76, step: 446, loss: 0.3794231712818146, mean loss: 0.3388093513337105
Epoch: 76, step: 447, loss: 0.3127431273460388, mean loss: 0.33880911478093
Epoch: 76, step: 448, loss: 0.3311503231525421, mean loss: 0.3388090452774985
Epoch: 76, step: 449, loss: 0.3615334630012512, mean loss: 0.3388092514994137
Epoch: 76, step: 450, loss: 0.31176379323005676, mean loss: 0.33880900606669656
Epoch: 76, step: 451, loss: 0.3359493613243103, mean loss: 0.3388089801161653
Epoch: 76, step: 452, loss: 0.34364262223243713, mean loss: 0.33880902397981055
Epoch: 76, step: 453, loss: 0.3445412814617157, mean loss: 0.3388090759976102
Epoch: 76, step: 454, loss: 0.37761813402175903, mean loss: 0.3388094281701165
Epoch: 76, step: 455, loss: 0.3217322826385498, mean loss: 0.3388092732050935
Epoch: 76, step: 456, loss: 0.34841418266296387, mean loss: 0.3388093603631906
Epoch: 76, step: 457, loss: 0.36826080083847046, mean loss: 0.3388096276127911
Epoch: 76, step: 458, loss: 0.36700648069381714, mean loss: 0.33880988347563584
Epoch: 76, step: 459, loss: 0.3473927974700928, mean loss: 0.33880996135769087
Epoch: 76, step: 460, loss: 0.31485244631767273, mean loss: 0.33880974396723634
Epoch: 76, step: 461, loss: 0.34599074721336365, mean loss: 0.33880980912705744
Epoch: 76, step: 462, loss: 0.27173563838005066, mean loss: 0.3388092005071808
Epoch: 76, step: 463, loss: 0.31843066215515137, mean loss: 0.3388090155973888
Epoch: 76, step: 464, loss: 0.3460792601108551, mean loss: 0.3388090815651819
Epoch: 76, step: 465, loss: 0.3207039535045624, mean loss: 0.3388089172867311
Epoch: 76, step: 466, loss: 0.3586927056312561, mean loss: 0.33880909770237333
Epoch: 76, step: 467, loss: 0.3368802070617676, mean loss: 0.3388090802007343
Epoch: 76, step: 468, loss: 0.3199123442173004, mean loss: 0.33880890874422753
Epoch: 76, step: 469, loss: 0.3022921681404114, mean loss: 0.3388085774184377
Epoch: 76, step: 470, loss: 0.37353530526161194, mean loss: 0.338808892500122
Epoch: 76, step: 471, loss: 0.36489808559417725, mean loss: 0.338809129209793
Epoch: 76, step: 472, loss: 0.34200653433799744, mean loss: 0.33880915821988333
Epoch: 76, step: 473, loss: 0.3180467486381531, mean loss: 0.338808969844032
Epoch: 76, step: 474, loss: 0.3527402877807617, mean loss: 0.3388090962407326
Epoch: 76, step: 475, loss: 0.3104444742202759, mean loss: 0.3388088388952234
Epoch: 76, step: 476, loss: 0.3279045522212982, mean loss: 0.33880873996410615
Epoch: 76, step: 477, loss: 0.32626551389694214, mean loss: 0.3388086261644467
Epoch: 76, step: 478, loss: 0.32320863008499146, mean loss: 0.3388084846332229
Epoch: 76, step: 479, loss: 0.3225000500679016, mean loss: 0.3388083366760215
Epoch: 76, step: 480, loss: 0.34916630387306213, mean loss: 0.338808430647146
Epoch: 76, step: 481, loss: 0.3406691253185272, mean loss: 0.33880844752786987
Epoch: 76, step: 482, loss: 0.3301026225090027, mean loss: 0.33880836854699387
Epoch: 76, step: 483, loss: 0.3354017436504364, mean loss: 0.3388083376417348
Epoch: 76, step: 484, loss: 0.32069718837738037, mean loss: 0.33880817333697594
Epoch: 76, step: 485, loss: 0.34354034066200256, mean loss: 0.33880821626691626
Epoch: 76, step: 486, loss: 0.33197444677352905, mean loss: 0.3388081542719285
Epoch: 76, step: 487, loss: 0.31123441457748413, mean loss: 0.3388079041291415
Epoch: 76, step: 488, loss: 0.3149099051952362, mean loss: 0.33880768733381766
Epoch: 76, step: 489, loss: 0.36139073967933655, mean loss: 0.3388078921984905
Epoch: 76, step: 490, loss: 0.3297716975212097, mean loss: 0.3388078102263884
Epoch: 76, step: 491, loss: 0.3526611924171448, mean loss: 0.33880793589660674
Epoch: 76, step: 492, loss: 0.3425704836845398, mean loss: 0.3388079700280489
Epoch: 76, step: 493, loss: 0.3477630317211151, mean loss: 0.3388080512619401
Epoch: 76, step: 494, loss: 0.389676034450531, mean loss: 0.33880851269558143
Epoch: 76, step: 495, loss: 0.3399020731449127, mean loss: 0.33880852261539685
Epoch: 76, step: 496, loss: 0.35449862480163574, mean loss: 0.33880866494086725
Epoch: 76, step: 497, loss: 0.32815486192703247, mean loss: 0.3388085683007209
Epoch: 76, step: 498, loss: 0.3247080147266388, mean loss: 0.3388084403964225
Epoch: 76, step: 499, loss: 0.351832777261734, mean loss: 0.3388085585374267
Epoch: 76, step: 500, loss: 0.3030189275741577, mean loss: 0.3388082339002009
Epoch: 76, step: 501, loss: 0.3157941699028015, mean loss: 0.33880802514828245
Epoch: 76, step: 502, loss: 0.3386920988559723, mean loss: 0.3388080240967682
Epoch: 76, step: 503, loss: 0.30254194140434265, mean loss: 0.33880769514674014
Epoch: 76, step: 504, loss: 0.31755533814430237, mean loss: 0.3388075023798488
Epoch: 76, step: 505, loss: 0.3226982057094574, mean loss: 0.3388073562637792
Epoch: 76, step: 506, loss: 0.31683069467544556, mean loss: 0.3388071569307882
Epoch: 76, step: 507, loss: 0.4139236509799957, mean loss: 0.338807838247173
Epoch: 76, step: 508, loss: 0.33742842078208923, mean loss: 0.3388078257357904
Epoch: 76, step: 509, loss: 0.3050171732902527, mean loss: 0.3388075192557312
Epoch: 76, step: 510, loss: 0.3028600811958313, mean loss: 0.3388071932166576
Epoch: 76, step: 511, loss: 0.321035772562027, mean loss: 0.3388070320334054
Epoch: 76, step: 512, loss: 0.3212786614894867, mean loss: 0.33880687305601126
Epoch: 76, step: 513, loss: 0.3654840588569641, mean loss: 0.3388071150083939
Epoch: 76, step: 514, loss: 0.3137919306755066, mean loss: 0.3388068881318184
Epoch: 76, step: 515, loss: 0.3070353865623474, mean loss: 0.33880659998106955
Epoch: 76, step: 516, loss: 0.3340344727039337, mean loss: 0.33880655670078663
Epoch: 76, step: 517, loss: 0.34761929512023926, mean loss: 0.33880663662622257
Epoch: 76, step: 518, loss: 0.385810911655426, mean loss: 0.3388070629185875
Epoch: 76, step: 519, loss: 0.34683167934417725, mean loss: 0.33880713569498255
Epoch: 76, step: 520, loss: 0.28809380531311035, mean loss: 0.33880667577270096
Epoch: 76, step: 521, loss: 0.3434256911277771, mean loss: 0.33880671766245263
Epoch: 76, step: 522, loss: 0.3370503783226013, mean loss: 0.3388067017343931
Epoch: 76, step: 523, loss: 0.34821617603302, mean loss: 0.3388067870671669
Epoch: 76, step: 524, loss: 0.3111829161643982, mean loss: 0.3388065365536871
Epoch: 76, step: 525, loss: 0.3242894411087036, mean loss: 0.33880640490323416
Epoch: 76, step: 526, loss: 0.32843002676963806, mean loss: 0.3388063108043493
Epoch: 76, step: 527, loss: 0.32568901777267456, mean loss: 0.3388061918503716
Epoch: 76, step: 528, loss: 0.3597377836704254, mean loss: 0.33880638166648086
Epoch: 76, step: 529, loss: 0.30739086866378784, mean loss: 0.3388060967805331
Epoch: 76, step: 530, loss: 0.31638431549072266, mean loss: 0.3388058934544729
Epoch: 76, step: 531, loss: 0.3423285484313965, mean loss: 0.33880592539845866
Epoch: 76, step: 532, loss: 0.31972524523735046, mean loss: 0.3388057523734384
Epoch: 76, step: 533, loss: 0.3573547601699829, mean loss: 0.33880592057568903
Epoch: 76, step: 534, loss: 0.31496623158454895, mean loss: 0.338805704399545
Epoch: 76, step: 535, loss: 0.31490135192871094, mean loss: 0.3388054876390039
Epoch: 76, step: 536, loss: 0.32499921321868896, mean loss: 0.33880536244722637
Epoch: 76, step: 537, loss: 0.33262792229652405, mean loss: 0.3388053064322815
Epoch: 76, step: 538, loss: 0.3166521489620209, mean loss: 0.3388051055567389
Epoch: 76, step: 539, loss: 0.31712815165519714, mean loss: 0.3388049090009928
Epoch: 76, step: 540, loss: 0.3150741457939148, mean loss: 0.33880469382428513
Epoch: 76, step: 541, loss: 0.30323946475982666, mean loss: 0.3388043713424736
Epoch: 76, step: 542, loss: 0.29080313444137573, mean loss: 0.3388039361031716
Epoch: 76, step: 543, loss: 0.33244019746780396, mean loss: 0.33880387840207415
Epoch: 76, step: 544, loss: 0.33840957283973694, mean loss: 0.3388038748268712
Epoch: 76, step: 545, loss: 0.36315879225730896, mean loss: 0.3388040956530334
Epoch: 76, step: 546, loss: 0.3399258852005005, mean loss: 0.3388041058242128
Epoch: 76, step: 547, loss: 0.3676706850528717, mean loss: 0.3388043675528896
Epoch: 76, step: 548, loss: 0.37373489141464233, mean loss: 0.33880468425951527
Epoch: 76, step: 549, loss: 0.3700842261314392, mean loss: 0.3388049678609974
Epoch: 76, step: 550, loss: 0.37482282519340515, mean loss: 0.3388052944202914
Epoch: 76, step: 551, loss: 0.32944801449775696, mean loss: 0.33880520958240135
Epoch: 76, step: 552, loss: 0.3318583071231842, mean loss: 0.33880514659879835
Epoch: 76, step: 553, loss: 0.3213950991630554, mean loss: 0.33880498875325776
Epoch: 76, step: 554, loss: 0.3567960560321808, mean loss: 0.33880515186504734
Epoch: 76, step: 555, loss: 0.34276846051216125, mean loss: 0.33880518779712937
Epoch: 76, step: 556, loss: 0.3131019175052643, mean loss: 0.3388049547686864
Epoch: 76, step: 557, loss: 0.346116840839386, mean loss: 0.33880502105838256
Epoch: 76, step: 558, loss: 0.29495155811309814, mean loss: 0.3388046234856697
Epoch: 76, step: 559, loss: 0.34690338373184204, mean loss: 0.33880469690785064
Epoch: 76, step: 560, loss: 0.31457290053367615, mean loss: 0.3388044772279053
Epoch: 76, step: 561, loss: 0.3308819830417633, mean loss: 0.33880440540502904
Epoch: 76, step: 562, loss: 0.3099924921989441, mean loss: 0.33880414420752386
Epoch: 76, step: 563, loss: 0.38075315952301025, mean loss: 0.3388045244973969
Epoch: 76, step: 564, loss: 0.38221338391304016, mean loss: 0.33880491801795654
Epoch: 76, step: 565, loss: 0.3345303237438202, mean loss: 0.3388048792672152
Epoch: 76, step: 566, loss: 0.31723275780677795, mean loss: 0.3388046837099139
Epoch: 76, step: 567, loss: 0.3324911296367645, mean loss: 0.3388046264763031
Epoch: 76, step: 568, loss: 0.31497377157211304, mean loss: 0.33880441044686954
Epoch: 76, step: 569, loss: 0.33572623133659363, mean loss: 0.3388043825430757
Epoch: 76, step: 570, loss: 0.3468344509601593, mean loss: 0.3388044553352474
Epoch: 76, step: 571, loss: 0.30490562319755554, mean loss: 0.33880414804680203
Epoch: 76, step: 572, loss: 0.3333129286766052, mean loss: 0.3388040982700734
Epoch: 76, step: 573, loss: 0.32923373579978943, mean loss: 0.33880401151757183
Epoch: 76, step: 574, loss: 0.39208984375, mean loss: 0.3388044945334823
Epoch: 76, step: 575, loss: 0.31694284081459045, mean loss: 0.3388042963676582
Epoch: 76, step: 576, loss: 0.3341728746891022, mean loss: 0.3388042543863339
Epoch: 76, step: 577, loss: 0.35908088088035583, mean loss: 0.3388044381812841
Epoch: 76, step: 578, loss: 0.3365470767021179, mean loss: 0.33880441771989817
Epoch: 76, step: 579, loss: 0.3370444178581238, mean loss: 0.3388044017668883
Epoch: 76, step: 580, loss: 0.3168356716632843, mean loss: 0.338804202639491
Epoch: 76, step: 581, loss: 0.3175235390663147, mean loss: 0.3388040097505657
Epoch: 76, step: 582, loss: 0.31278249621391296, mean loss: 0.33880377389249344
Epoch: 76, step: 583, loss: 0.32669246196746826, mean loss: 0.33880366411698837
Epoch: 76, step: 584, loss: 0.34835290908813477, mean loss: 0.3388037506694358
Epoch: 76, step: 585, loss: 0.3390007019042969, mean loss: 0.33880375245454625
Epoch: 76, step: 586, loss: 0.3083648979663849, mean loss: 0.3388034765678554
Epoch: 76, step: 587, loss: 0.3898402452468872, mean loss: 0.33880393914234586
Epoch: 76, step: 588, loss: 0.30817604064941406, mean loss: 0.33880366154726105
Epoch: 76, step: 589, loss: 0.31595200300216675, mean loss: 0.33880345443378246
Epoch: 76, step: 590, loss: 0.3307923376560211, mean loss: 0.3388033818265701
Epoch: 76, step: 591, loss: 0.3087773621082306, mean loss: 0.3388031096939958
Epoch: 76, step: 592, loss: 0.3336159586906433, mean loss: 0.3388030626821049
Epoch: 76, step: 593, loss: 0.31381794810295105, mean loss: 0.33880283624049295
Epoch: 76, step: 594, loss: 0.3427157402038574, mean loss: 0.338802871703058
Epoch: 76, step: 595, loss: 0.36753880977630615, mean loss: 0.3388031321338906
Epoch: 76, step: 596, loss: 0.39880505204200745, mean loss: 0.33880367592015237
Epoch: 76, step: 597, loss: 0.32157692313194275, mean loss: 0.3388035197987046
Epoch: 76, step: 598, loss: 0.33880308270454407, mean loss: 0.3388035197947434
Epoch: 76, step: 599, loss: 0.368704617023468, mean loss: 0.33880379077546935
Epoch: 76, step: 600, loss: 0.33029693365097046, mean loss: 0.33880371368219714
Epoch: 76, step: 601, loss: 0.3038060665130615, mean loss: 0.3388033965193895
Epoch: 76, step: 602, loss: 0.303745299577713, mean loss: 0.33880307881164085
Epoch: 76, step: 603, loss: 0.38688144087791443, mean loss: 0.33880351450927076
Epoch: 76, step: 604, loss: 0.3331080675125122, mean loss: 0.338803462896234
Epoch: 76, step: 605, loss: 0.34939339756965637, mean loss: 0.3388035588630185
Epoch: 76, step: 606, loss: 0.29749032855033875, mean loss: 0.33880318448281066
Epoch: 76, step: 607, loss: 0.31992512941360474, mean loss: 0.3388030134115562
Epoch: 76, step: 608, loss: 0.32448694109916687, mean loss: 0.338802883681759
Epoch: 76, step: 609, loss: 0.3256404995918274, mean loss: 0.33880276440756785
Epoch: 76, step: 610, loss: 0.35134947299957275, mean loss: 0.3388028781016333
Epoch: 76, step: 611, loss: 0.33533400297164917, mean loss: 0.33880284666813504
Epoch: 76, step: 612, loss: 0.32097455859184265, mean loss: 0.33880268511709544
Epoch: 76, step: 613, loss: 0.297759085893631, mean loss: 0.3388023132038746
Epoch: 76, step: 614, loss: 0.3111204504966736, mean loss: 0.3388020623692104
Epoch: 76, step: 615, loss: 0.32894429564476013, mean loss: 0.3388019730454815
Epoch: 76, step: 616, loss: 0.32407209277153015, mean loss: 0.3388018395755032
Epoch: 76, step: 617, loss: 0.35993310809135437, mean loss: 0.33880203104782625
Epoch: 76, step: 618, loss: 0.33194103837013245, mean loss: 0.3388019688803183
Epoch: 76, step: 619, loss: 0.31862473487854004, mean loss: 0.33880178605590094
Epoch: 76, step: 620, loss: 0.3067166805267334, mean loss: 0.338801495337779
Epoch: 76, step: 621, loss: 0.33876165747642517, mean loss: 0.3388014949768176
Epoch: 76, step: 622, loss: 0.39104163646698, mean loss: 0.33880196830798986
Epoch: 76, step: 623, loss: 0.31791573762893677, mean loss: 0.3388017790662651
Epoch: 76, step: 624, loss: 0.31724119186401367, mean loss: 0.3388015837162374
Epoch: 76, step: 625, loss: 0.3258271813392639, mean loss: 0.3388014661625328
Epoch: 76, step: 626, loss: 0.3464725911617279, mean loss: 0.3388015356656179
Epoch: 76, step: 627, loss: 0.33821552991867065, mean loss: 0.3388015303562482
Epoch: 76, step: 628, loss: 0.29163315892219543, mean loss: 0.33880110300199096
Epoch: 76, step: 629, loss: 0.3037661612033844, mean loss: 0.33880078558174886
Epoch: 76, step: 630, loss: 0.31519076228141785, mean loss: 0.338800571674403
Epoch: 76, step: 631, loss: 0.312856525182724, mean loss: 0.33880033662288367
Epoch: 76, step: 632, loss: 0.3099241554737091, mean loss: 0.33880007500876885
Epoch: 76, step: 633, loss: 0.3221849203109741, mean loss: 0.33879992447918234
Epoch: 76, step: 634, loss: 0.3336063325405121, mean loss: 0.33879987742682693
Epoch: 76, step: 635, loss: 0.363749623298645, mean loss: 0.33880010346185024
Epoch: 76, step: 636, loss: 0.3199107348918915, mean loss: 0.33879993233304573
Epoch: 76, step: 637, loss: 0.3509328365325928, mean loss: 0.3388000422504616
Epoch: 76, step: 638, loss: 0.3446315824985504, mean loss: 0.3388000950805192
Epoch: 76, step: 639, loss: 0.3257817327976227, mean loss: 0.3387999771434787
Epoch: 76, step: 640, loss: 0.3313557505607605, mean loss: 0.33879990970472723
Epoch: 76, step: 641, loss: 0.3218501806259155, mean loss: 0.33879975615510066
Epoch: 76, step: 642, loss: 0.33771246671676636, mean loss: 0.33879974630530457
Epoch: 76, step: 643, loss: 0.29751893877983093, mean loss: 0.33879937234429863
Epoch: 76, step: 644, loss: 0.32189056277275085, mean loss: 0.33879921916952965
Epoch: 76, step: 645, loss: 0.32762694358825684, mean loss: 0.33879911796221396
Epoch: 76, step: 646, loss: 0.2848218083381653, mean loss: 0.33879862899744667
Epoch: 76, step: 647, loss: 0.35014060139656067, mean loss: 0.338798731740149
Epoch: 76, step: 648, loss: 0.3311518132686615, mean loss: 0.338798662470191
Epoch: 76, step: 649, loss: 0.36328643560409546, mean loss: 0.3387988842917858
Epoch: 76, step: 650, loss: 0.340962678194046, mean loss: 0.3387989038922559
Epoch: 76, step: 651, loss: 0.33024105429649353, mean loss: 0.33879882637269365
Epoch: 76, step: 652, loss: 0.3069639205932617, mean loss: 0.33879853800520376
Epoch: 76, step: 653, loss: 0.3270622193813324, mean loss: 0.33879843169604396
Epoch: 76, step: 654, loss: 0.3292087912559509, mean loss: 0.338798344832572
Epoch: 76, step: 655, loss: 0.3355301320552826, mean loss: 0.3387983152291954
Epoch: 76, step: 656, loss: 0.32967013120651245, mean loss: 0.33879823254711805
Epoch: 76, step: 657, loss: 0.30773958563804626, mean loss: 0.33879795122389106
Epoch: 76, step: 658, loss: 0.4075930416584015, mean loss: 0.33879857435089333
Epoch: 76, step: 659, loss: 0.3207336962223053, mean loss: 0.3387984107256793
Epoch: 76, step: 660, loss: 0.36831989884376526, mean loss: 0.3387986781183528
Epoch: 76, step: 661, loss: 0.33860069513320923, mean loss: 0.3387986763251261
Epoch: 76, step: 662, loss: 0.3235126733779907, mean loss: 0.3387985378737331
Epoch: 76, step: 663, loss: 0.30912795662879944, mean loss: 0.3387982691379418
Epoch: 76, step: 664, loss: 0.36995670199394226, mean loss: 0.3387985513471173
Epoch: 76, step: 665, loss: 0.35924673080444336, mean loss: 0.33879873654935855
Epoch: 76, step: 666, loss: 0.3701149821281433, mean loss: 0.3387990201827427
Epoch: 76, step: 667, loss: 0.30615586042404175, mean loss: 0.33879872453408355
Epoch: 76, step: 668, loss: 0.3076629340648651, mean loss: 0.33879844254020175
Epoch: 76, step: 669, loss: 0.3447885811328888, mean loss: 0.3387984967918238
Epoch: 76, step: 670, loss: 0.3736222982406616, mean loss: 0.338798812181956
Epoch: 76, step: 671, loss: 0.3437190353870392, mean loss: 0.3387988567427371
Epoch: 76, step: 672, loss: 0.3134573698043823, mean loss: 0.3387986272356237
Epoch: 76, step: 673, loss: 0.3134201169013977, mean loss: 0.33879839739528667
Epoch: 76, step: 674, loss: 0.3052414059638977, mean loss: 0.3387980934893336
Epoch: 76, step: 675, loss: 0.3225599229335785, mean loss: 0.33879794643109634
Epoch: 76, step: 676, loss: 0.3113201856613159, mean loss: 0.33879769758567047
Epoch: 76, step: 677, loss: 0.3516966998577118, mean loss: 0.33879781440118073
Epoch: 76, step: 678, loss: 0.3270401358604431, mean loss: 0.33879770792265235
Epoch: 76, step: 679, loss: 0.3560180068016052, mean loss: 0.33879786386971894
Epoch: 76, step: 680, loss: 0.3099764287471771, mean loss: 0.3387976028650993
Epoch: 76, step: 681, loss: 0.35268405079841614, mean loss: 0.3387977286185263
Epoch: 76, step: 682, loss: 0.35025519132614136, mean loss: 0.33879783237451633
Epoch: 76, step: 683, loss: 0.3132135570049286, mean loss: 0.33879760069165177
Epoch: 76, step: 684, loss: 0.3209763169288635, mean loss: 0.33879743930937206
Epoch: 76, step: 685, loss: 0.2956809401512146, mean loss: 0.3387970488674708
Epoch: 76, step: 686, loss: 0.310916930437088, mean loss: 0.33879679640105803
Epoch: 76, step: 687, loss: 0.33513376116752625, mean loss: 0.33879676323100555
Epoch: 76, step: 688, loss: 0.3579566776752472, mean loss: 0.3387969367290944
Epoch: 76, step: 689, loss: 0.34089383482933044, mean loss: 0.3387969557168889
Epoch: 76, step: 690, loss: 0.3426632285118103, mean loss: 0.33879699072637676
Epoch: 76, step: 691, loss: 0.3862048387527466, mean loss: 0.33879742000530777
Epoch: 76, step: 692, loss: 0.30052629113197327, mean loss: 0.33879707346267374
Epoch: 76, step: 693, loss: 0.3253992795944214, mean loss: 0.3387969521476022
Epoch: 76, step: 694, loss: 0.30117473006248474, mean loss: 0.3387966114869471
Epoch: 76, step: 695, loss: 0.31515929102897644, mean loss: 0.3387963974583302
Epoch: 76, step: 696, loss: 0.35920462012290955, mean loss: 0.3387965822467934
Epoch: 76, step: 697, loss: 0.3420015573501587, mean loss: 0.33879661126632493
Epoch: 76, step: 698, loss: 0.3601330518722534, mean loss: 0.3387968044559395
Epoch: 76, step: 699, loss: 0.3153232932090759, mean loss: 0.33879659191826206
Epoch: 76, step: 700, loss: 0.2960455119609833, mean loss: 0.3387962048379963
Epoch: 76, step: 701, loss: 0.3182027041912079, mean loss: 0.338796018380355
Epoch: 76, step: 702, loss: 0.3515820801258087, mean loss: 0.33879613414684706
Epoch: 76, step: 703, loss: 0.3302823007106781, mean loss: 0.3387960570623056
Epoch: 76, step: 704, loss: 0.32618558406829834, mean loss: 0.33879594288768206
Epoch: 76, step: 705, loss: 0.30429911613464355, mean loss: 0.3387956305578789
Epoch: 76, step: 706, loss: 0.34309321641921997, mean loss: 0.3387956694673126
Epoch: 76, step: 707, loss: 0.3686390221118927, mean loss: 0.33879593966027105
Epoch: 76, step: 708, loss: 0.3446405827999115, mean loss: 0.33879599257547605
Epoch: 76, step: 709, loss: 0.34927573800086975, mean loss: 0.33879608745429823
Epoch: 76, step: 710, loss: 0.3818581998348236, mean loss: 0.3387964773154397
Epoch: 76, step: 711, loss: 0.32727187871932983, mean loss: 0.33879637297888404
Epoch: 76, step: 712, loss: 0.3582041263580322, mean loss: 0.33879654868303477
Epoch: 76, step: 713, loss: 0.324093759059906, mean loss: 0.3387964155755222
Epoch: 76, step: 714, loss: 0.32021939754486084, mean loss: 0.3387962473953103
Epoch: 76, step: 715, loss: 0.29150035977363586, mean loss: 0.3387958192232333
Epoch: 76, step: 716, loss: 0.3441236913204193, mean loss: 0.3387958674562938
Epoch: 76, step: 717, loss: 0.32982373237609863, mean loss: 0.33879578623256906
Epoch: 76, step: 718, loss: 0.3808504045009613, mean loss: 0.33879616694482806
Epoch: 76, step: 719, loss: 0.32810741662979126, mean loss: 0.3387960701825316
Epoch: 76, step: 720, loss: 0.3560970425605774, mean loss: 0.33879622680202537
Epoch: 76, step: 721, loss: 0.3077813386917114, mean loss: 0.33879594603791596
Epoch: 76, step: 722, loss: 0.34614160656929016, mean loss: 0.3387960125343405
Epoch: 76, step: 723, loss: 0.3596019744873047, mean loss: 0.33879620087813195
Epoch: 76, step: 724, loss: 0.33124175667762756, mean loss: 0.3387961324929361
Epoch: 76, step: 725, loss: 0.345226526260376, mean loss: 0.33879619070234834
Epoch: 76, step: 726, loss: 0.30951353907585144, mean loss: 0.33879592563141003
Epoch: 76, step: 727, loss: 0.31959810853004456, mean loss: 0.3387957518514739
Epoch: 76, step: 728, loss: 0.3089866042137146, mean loss: 0.33879548201950016
Epoch: 76, step: 729, loss: 0.3357592821121216, mean loss: 0.33879545453611126
Epoch: 76, step: 730, loss: 0.2922137975692749, mean loss: 0.3387950328872589
Epoch: 76, step: 731, loss: 0.37777644395828247, mean loss: 0.33879538573684675
Epoch: 76, step: 732, loss: 0.3497447669506073, mean loss: 0.33879548484689875
Epoch: 76, step: 733, loss: 0.31163159012794495, mean loss: 0.3387952389708445
Epoch: 76, step: 734, loss: 0.3273131847381592, mean loss: 0.3387951350411001
Epoch: 76, step: 735, loss: 0.32333996891975403, mean loss: 0.3387949951500237
Epoch: 76, step: 736, loss: 0.313016414642334, mean loss: 0.3387947618195822
Epoch: 76, step: 737, loss: 0.33105581998825073, mean loss: 0.3387946917724991
Epoch: 76, step: 738, loss: 0.32671061158180237, mean loss: 0.3387945823974804
Epoch: 76, step: 739, loss: 0.31356871128082275, mean loss: 0.3387943540759939
Epoch: 76, step: 740, loss: 0.3188193738460541, mean loss: 0.3387941732823999
Epoch: 76, step: 741, loss: 0.33239245414733887, mean loss: 0.3387941153409491
Epoch: 76, step: 742, loss: 0.32621338963508606, mean loss: 0.3387940014748318
Epoch: 76, step: 743, loss: 0.43514522910118103, mean loss: 0.3387948735263453
Epoch: 76, step: 744, loss: 0.3141408860683441, mean loss: 0.33879465039112405
Epoch: 76, step: 745, loss: 0.3316795229911804, mean loss: 0.3387945859950031
Epoch: 76, step: 746, loss: 0.3322237730026245, mean loss: 0.3387945265257885
Epoch: 76, step: 747, loss: 0.33249399065971375, mean loss: 0.33879446950323605
Epoch: 76, step: 748, loss: 0.31522491574287415, mean loss: 0.338794256190594
Epoch: 76, step: 749, loss: 0.3608589768409729, mean loss: 0.33879445588216683
Epoch: 76, step: 750, loss: 0.3333779573440552, mean loss: 0.3387944068618624
Epoch: 76, step: 751, loss: 0.2990401089191437, mean loss: 0.3387940470814365
Epoch: 76, step: 752, loss: 0.36457908153533936, mean loss: 0.3387942804365
Epoch: 76, step: 753, loss: 0.398966908454895, mean loss: 0.3387948249950261
Epoch: 76, step: 754, loss: 0.30329596996307373, mean loss: 0.3387945037355122
Epoch: 76, step: 755, loss: 0.35129889845848083, mean loss: 0.3387946168974554
Epoch: 76, step: 756, loss: 0.3178686201572418, mean loss: 0.33879442752363303
Epoch: 76, step: 757, loss: 0.33145299553871155, mean loss: 0.338794361086537
Epoch: 76, step: 758, loss: 0.34838810563087463, mean loss: 0.33879444790539753
Epoch: 76, step: 759, loss: 0.3494909107685089, mean loss: 0.33879454470246245
Epoch: 76, step: 760, loss: 0.3306500315666199, mean loss: 0.3387944709997962
Epoch: 76, step: 761, loss: 0.29516008496284485, mean loss: 0.33879407613991497
Epoch: 76, step: 762, loss: 0.31395816802978516, mean loss: 0.3387938513948028
Epoch: 76, step: 763, loss: 0.32043808698654175, mean loss: 0.3387936852913134
Epoch: 76, step: 764, loss: 0.3300863206386566, mean loss: 0.3387936064980508
Epoch: 76, step: 765, loss: 0.33973944187164307, mean loss: 0.3387936150568724
Epoch: 76, step: 766, loss: 0.3501351475715637, mean loss: 0.3387937176849593
Epoch: 76, step: 767, loss: 0.3780480921268463, mean loss: 0.3387940728895927
Epoch: 76, step: 768, loss: 0.3003528416156769, mean loss: 0.3387937250460695
Epoch: 76, step: 769, loss: 0.365915447473526, mean loss: 0.33879397046042814
Epoch: 76, step: 770, loss: 0.28904634714126587, mean loss: 0.3387935203167977
Epoch: 76, step: 771, loss: 0.3426101803779602, mean loss: 0.33879355485170726
Epoch: 76, step: 772, loss: 0.32796597480773926, mean loss: 0.33879345687963014
Epoch: 76, step: 773, loss: 0.3383902311325073, mean loss: 0.3387934532311227
Epoch: 76, step: 774, loss: 0.34081557393074036, mean loss: 0.3387934715277115
Epoch: 76, step: 775, loss: 0.31986886262893677, mean loss: 0.3387933002952748
Epoch: 76, step: 776, loss: 0.3079303503036499, mean loss: 0.33879302104563
Epoch: 76, step: 777, loss: 0.37316203117370605, mean loss: 0.33879333201548334
Epoch: 76, step: 778, loss: 0.33252501487731934, mean loss: 0.33879327530043635
Epoch: 76, step: 779, loss: 0.3202565014362335, mean loss: 0.338793107583254
Epoch: 76, step: 780, loss: 0.30664509534835815, mean loss: 0.33879281671682343
Epoch: 76, step: 781, loss: 0.35723352432250977, mean loss: 0.3387929835617975
Epoch: 76, step: 782, loss: 0.3491894602775574, mean loss: 0.33879307762457594
Epoch: 76, step: 783, loss: 0.33794069290161133, mean loss: 0.3387930699126412
Epoch: 76, step: 784, loss: 0.33369505405426025, mean loss: 0.33879302378885595
Epoch: 76, step: 785, loss: 0.31371018290519714, mean loss: 0.33879279685643143
Epoch: 76, step: 786, loss: 0.36866191029548645, mean loss: 0.3387930670893384
Epoch: 76, step: 787, loss: 0.33183059096336365, mean loss: 0.3387930040987463
Epoch: 76, step: 788, loss: 0.31014931201934814, mean loss: 0.33879274495720413
Epoch: 76, step: 789, loss: 0.2943613827228546, mean loss: 0.33879234298711136
Epoch: 76, step: 790, loss: 0.3387545049190521, mean loss: 0.33879234264479385
Epoch: 76, step: 791, loss: 0.31862202286720276, mean loss: 0.3387921601674129
Epoch: 76, step: 792, loss: 0.3324655592441559, mean loss: 0.33879210293227063
Epoch: 76, step: 793, loss: 0.4011608958244324, mean loss: 0.3387926671617021
Epoch: 76, step: 794, loss: 0.3181961178779602, mean loss: 0.3387924808333539
Epoch: 76, step: 795, loss: 0.35635215044021606, mean loss: 0.3387926396868875
Epoch: 76, step: 796, loss: 0.3532462418079376, mean loss: 0.33879277044020184
Epoch: 76, step: 797, loss: 0.3852221369743347, mean loss: 0.3387931904558206
Epoch: 76, step: 798, loss: 0.3211980164051056, mean loss: 0.3387930312854159
Epoch: 76, step: 799, loss: 0.3611656427383423, mean loss: 0.33879323367189956
Epoch: 76, step: 800, loss: 0.3668498396873474, mean loss: 0.33879348747447785
Epoch: 76, step: 801, loss: 0.3123023509979248, mean loss: 0.33879324783544545
Epoch: 76, step: 802, loss: 0.3022969365119934, mean loss: 0.33879291769250786
Epoch: 76, step: 803, loss: 0.31746095418930054, mean loss: 0.33879272472688654
Epoch: 76, step: 804, loss: 0.3350638449192047, mean loss: 0.33879269099632536
Epoch: 76, step: 805, loss: 0.31163468956947327, mean loss: 0.33879244533371633
Epoch: 76, step: 806, loss: 0.29027801752090454, mean loss: 0.33879200649166324
Epoch: 76, step: 807, loss: 0.3186488747596741, mean loss: 0.3387918242866219
Epoch: 76, step: 808, loss: 0.35811859369277954, mean loss: 0.3387919991056626
Epoch: 76, step: 809, loss: 0.35812485218048096, mean loss: 0.3387921739781509
Epoch: 76, step: 810, loss: 0.3226431906223297, mean loss: 0.33879202790621066
Epoch: 76, step: 811, loss: 0.3177676498889923, mean loss: 0.3387918377367217
Epoch: 76, step: 812, loss: 0.3159755766391754, mean loss: 0.338791631361177
Epoch: 76, step: 813, loss: 0.3303300142288208, mean loss: 0.33879155482562884
Epoch: 76, step: 814, loss: 0.3183228671550751, mean loss: 0.3387913696874884
Epoch: 76, step: 815, loss: 0.33592382073402405, mean loss: 0.33879134375090236
Epoch: 76, step: 816, loss: 0.3554919958114624, mean loss: 0.33879149480463794
Epoch: 76, step: 817, loss: 0.4032718539237976, mean loss: 0.3387920780100713
Epoch: 76, step: 818, loss: 0.3456774055957794, mean loss: 0.33879214028522286
Epoch: 76, step: 819, loss: 0.3117070198059082, mean loss: 0.33879189531289483
Epoch: 76, step: 820, loss: 0.3260480761528015, mean loss: 0.33879178005201516
Epoch: 76, step: 821, loss: 0.34977445006370544, mean loss: 0.33879187938336486
Epoch: 76, step: 822, loss: 0.35659223794937134, mean loss: 0.33879204037496785
Epoch: 76, step: 823, loss: 0.31863194704055786, mean loss: 0.33879185804288864
Epoch: 76, step: 824, loss: 0.29758504033088684, mean loss: 0.3387914853632252
Epoch: 76, step: 825, loss: 0.33648887276649475, mean loss: 0.3387914645382944
Epoch: 76, step: 826, loss: 0.30507373809814453, mean loss: 0.3387911595964341
Epoch: 76, step: 827, loss: 0.33454397320747375, mean loss: 0.3387911211853862
Epoch: 76, step: 828, loss: 0.3178066611289978, mean loss: 0.3387909314061448
Epoch: 76, step: 829, loss: 0.37275785207748413, mean loss: 0.3387912385933739
Epoch: 76, step: 830, loss: 0.3537295162677765, mean loss: 0.3387913736897128
Epoch: 76, step: 831, loss: 0.3358539044857025, mean loss: 0.33879134712455217
Epoch: 76, step: 832, loss: 0.2979792356491089, mean loss: 0.338790978041366
Epoch: 76, step: 833, loss: 0.3191114664077759, mean loss: 0.33879080007186363
Epoch: 76, step: 834, loss: 0.34512507915496826, mean loss: 0.3387908573547029
Epoch: 76, step: 835, loss: 0.3178475499153137, mean loss: 0.3387906679596275
Epoch: 76, step: 836, loss: 0.341408371925354, mean loss: 0.3387906916319036
Epoch: 76, step: 837, loss: 0.30618229508399963, mean loss: 0.33879039675211714
Epoch: 76, step: 838, loss: 0.3282637894153595, mean loss: 0.33879030156020395
Epoch: 76, step: 839, loss: 0.3362601399421692, mean loss: 0.33879027868020667
Epoch: 76, step: 840, loss: 0.33398646116256714, mean loss: 0.3387902352401604
Epoch: 76, step: 841, loss: 0.32814013957977295, mean loss: 0.33879013893415727
Epoch: 76, step: 842, loss: 0.3538514971733093, mean loss: 0.3387902751288116
Epoch: 76, step: 843, loss: 0.44271180033683777, mean loss: 0.3387912148467304
Epoch: 76, step: 844, loss: 0.32350024580955505, mean loss: 0.33879107657828567
Epoch: 76, step: 845, loss: 0.33896082639694214, mean loss: 0.33879107811323295
Epoch: 76, step: 846, loss: 0.3466813564300537, mean loss: 0.33879114945971067
Epoch: 76, step: 847, loss: 0.39631202816963196, mean loss: 0.33879166957760987
Epoch: 76, step: 848, loss: 0.3374793231487274, mean loss: 0.33879165771115877
Epoch: 76, step: 849, loss: 0.3961733877658844, mean loss: 0.33879217656145855
Epoch: 76, step: 850, loss: 0.3456965684890747, mean loss: 0.338792238990971
Epoch: 76, step: 851, loss: 0.3458918333053589, mean loss: 0.338792303184923
Epoch: 76, step: 852, loss: 0.3218589723110199, mean loss: 0.3387921500765125
Epoch: 76, step: 853, loss: 0.3654177486896515, mean loss: 0.33879239081864715
Epoch: 76, step: 854, loss: 0.3276459872722626, mean loss: 0.33879229003651035
Epoch: 76, step: 855, loss: 0.32868120074272156, mean loss: 0.33879219861617316
Epoch: 76, step: 856, loss: 0.35911184549331665, mean loss: 0.33879238233645487
Epoch: 76, step: 857, loss: 0.3506958782672882, mean loss: 0.33879248996105416
Epoch: 76, step: 858, loss: 0.32858291268348694, mean loss: 0.3387923976527327
Epoch: 76, step: 859, loss: 0.387616366147995, mean loss: 0.33879283908313756
Epoch: 76, step: 860, loss: 0.3237168490886688, mean loss: 0.3387927027783593
Epoch: 76, step: 861, loss: 0.3218498229980469, mean loss: 0.33879254959607463
Epoch: 76, step: 862, loss: 0.3324945867061615, mean loss: 0.3387924926560718
Epoch: 76, step: 863, loss: 0.3136783540248871, mean loss: 0.33879226560071746
Epoch: 76, step: 864, loss: 0.34953054785728455, mean loss: 0.338792362683977
Epoch: 76, step: 865, loss: 0.310527503490448, mean loss: 0.33879210714777597
Epoch: 76, step: 866, loss: 0.35449522733688354, mean loss: 0.33879224911485145
Epoch: 76, step: 867, loss: 0.3260272741317749, mean loss: 0.3387921337116856
Epoch: 76, step: 868, loss: 0.3272131681442261, mean loss: 0.3387920290317152
Epoch: 76, step: 869, loss: 0.3076953589916229, mean loss: 0.3387917479039191
Epoch: 76, step: 870, loss: 0.31569230556488037, mean loss: 0.3387915390765237
Epoch: 76, step: 871, loss: 0.3211233615875244, mean loss: 0.33879137935119025
Epoch: 76, step: 872, loss: 0.28871920704841614, mean loss: 0.3387909266886492
Epoch: 76, step: 873, loss: 0.3156820237636566, mean loss: 0.33879071778139247
Epoch: 76, step: 874, loss: 0.2999263107776642, mean loss: 0.3387903664456635
Epoch: 76, step: 875, loss: 0.33237653970718384, mean loss: 0.3387903084649481
Epoch: 76, step: 876, loss: 0.3512606620788574, mean loss: 0.3387904211953846
Epoch: 76, step: 877, loss: 0.33465462923049927, mean loss: 0.33879038380868065
Epoch: 76, step: 878, loss: 0.35540077090263367, mean loss: 0.3387905339617871
Epoch: 76, step: 879, loss: 0.33738183975219727, mean loss: 0.338790521227713
Epoch: 76, step: 880, loss: 0.36499127745628357, mean loss: 0.3387907580707072
Epoch: 76, step: 881, loss: 0.32247719168663025, mean loss: 0.33879061060477345
Epoch: 76, step: 882, loss: 0.3108917772769928, mean loss: 0.33879035841648913
Epoch: 76, step: 883, loss: 0.3494979441165924, mean loss: 0.33879045520559947
Epoch: 76, step: 884, loss: 0.3498428463935852, mean loss: 0.338790555110608
Epoch: 76, step: 885, loss: 0.3082795739173889, mean loss: 0.33879027931759353
Epoch: 76, step: 886, loss: 0.335834801197052, mean loss: 0.33879025260285606
Epoch: 76, step: 887, loss: 0.3543129563331604, mean loss: 0.33879039291220353
Epoch: 76, step: 888, loss: 0.326127827167511, mean loss: 0.3387902784566094
Epoch: 76, step: 889, loss: 0.3642140030860901, mean loss: 0.3387905082568935
Epoch: 76, step: 890, loss: 0.34420183300971985, mean loss: 0.33879055716840206
Epoch: 76, step: 891, loss: 0.31050246953964233, mean loss: 0.3387903014822996
Epoch: 76, step: 892, loss: 0.34089747071266174, mean loss: 0.33879032052809105
Epoch: 76, step: 893, loss: 0.31947895884513855, mean loss: 0.3387901459826213
Epoch: 76, step: 894, loss: 0.3089001774787903, mean loss: 0.3387898758250051
Epoch: 76, step: 895, loss: 0.30031710863113403, mean loss: 0.3387895280957282
Epoch: 76, step: 896, loss: 0.35683369636535645, mean loss: 0.338789691183266
Epoch: 76, step: 897, loss: 0.34513500332832336, mean loss: 0.33878974853320676
Epoch: 76, step: 898, loss: 0.33577924966812134, mean loss: 0.33878972132408497
Epoch: 76, step: 899, loss: 0.3129175305366516, mean loss: 0.33878948749133503
Epoch: 76, step: 900, loss: 0.3420284390449524, mean loss: 0.33878951676470076
Epoch: 76, step: 901, loss: 0.3338986933231354, mean loss: 0.3387894725622584
Epoch: 76, step: 902, loss: 0.3047892153263092, mean loss: 0.3387891652764103
Epoch: 76, step: 903, loss: 0.30755090713500977, mean loss: 0.3387888829553729
Epoch: 76, step: 904, loss: 0.33384236693382263, mean loss: 0.3387888382508024
Epoch: 76, step: 905, loss: 0.3117792308330536, mean loss: 0.33878859415132284
Epoch: 76, step: 906, loss: 0.35502395033836365, mean loss: 0.3387887408771201
Epoch: 76, step: 907, loss: 0.31040096282958984, mean loss: 0.3387884843270528
Epoch: 76, step: 908, loss: 0.3400470018386841, mean loss: 0.33878849570060354
Epoch: 76, step: 909, loss: 0.386292427778244, mean loss: 0.33878892500213875
Epoch: 76, step: 910, loss: 0.31398501992225647, mean loss: 0.3387887008468355
Epoch: 76, step: 911, loss: 0.33543720841407776, mean loss: 0.33878867055934603
Epoch: 76, step: 912, loss: 0.3250507712364197, mean loss: 0.33878854641085726
Epoch: 76, step: 913, loss: 0.3497951626777649, mean loss: 0.3387886458760226
Epoch: 76, step: 914, loss: 0.31595975160598755, mean loss: 0.3387884395765416
Epoch: 76, step: 915, loss: 0.33863797783851624, mean loss: 0.33878843821686566
Epoch: 76, step: 916, loss: 0.3211838901042938, mean loss: 0.33878827913147774
Epoch: 76, step: 917, loss: 0.3300146162509918, mean loss: 0.3387881998480482
Epoch: 76, step: 918, loss: 0.34648674726486206, mean loss: 0.33878826941554063
Epoch: 76, step: 919, loss: 0.307710736989975, mean loss: 0.33878798858769754
Epoch: 76, step: 920, loss: 0.32349684834480286, mean loss: 0.3387878504126626
Epoch: 76, step: 921, loss: 0.3510980010032654, mean loss: 0.3387879616496332
Epoch: 76, step: 922, loss: 0.34436097741127014, mean loss: 0.3387880120080577
Epoch: 76, step: 923, loss: 0.39853763580322266, mean loss: 0.338788551907792
Epoch: 76, step: 924, loss: 0.3505406975746155, mean loss: 0.33878865809964037
Epoch: 76, step: 925, loss: 0.29789048433303833, mean loss: 0.33878828854896026
Epoch: 76, step: 926, loss: 0.33137384057044983, mean loss: 0.33878822155355964
Epoch: 76, step: 927, loss: 0.29514333605766296, mean loss: 0.33878782719106965
Epoch: 76, step: 928, loss: 0.3332732319831848, mean loss: 0.33878777736324167
Epoch: 76, step: 929, loss: 0.3715241551399231, mean loss: 0.3387880731542836
Epoch: 76, step: 930, loss: 0.3250558078289032, mean loss: 0.3387879490768919
Epoch: 76, step: 931, loss: 0.32135337591171265, mean loss: 0.33878779154885363
Epoch: 76, step: 932, loss: 0.37740787863731384, mean loss: 0.3387881404929621
Epoch: 76, step: 933, loss: 0.3397235870361328, mean loss: 0.3387881489449267
Epoch: 76, step: 934, loss: 0.3116709887981415, mean loss: 0.33878790393765207
Epoch: 76, step: 935, loss: 0.3469257354736328, mean loss: 0.3387879774634159
Epoch: 76, step: 936, loss: 0.34548497200012207, mean loss: 0.33878803797059
Epoch: 76, step: 937, loss: 0.3404853343963623, mean loss: 0.3387880533054812
Epoch: 76, step: 938, loss: 0.3265054225921631, mean loss: 0.33878794233423254
Epoch: 76, step: 939, loss: 0.31285229325294495, mean loss: 0.3387877080126587
Epoch: 76, step: 940, loss: 0.341056764125824, mean loss: 0.33878772851278166
Epoch: 76, step: 941, loss: 0.3270856738090515, mean loss: 0.3387876227897932
Epoch: 76, step: 942, loss: 0.4102949798107147, mean loss: 0.338788268821911
Epoch: 76, step: 943, loss: 0.3104044795036316, mean loss: 0.33878801239131945
Epoch: 76, step: 944, loss: 0.28783026337623596, mean loss: 0.3387875520226377
Epoch: 76, step: 945, loss: 0.3353370726108551, mean loss: 0.3387875208501794
Epoch: 76, step: 946, loss: 0.35282087326049805, mean loss: 0.3387876476297045
Epoch: 76, step: 947, loss: 0.34309107065200806, mean loss: 0.33878768650715746
Epoch: 76, step: 948, loss: 0.3871675133705139, mean loss: 0.3387881235702677
Epoch: 76, step: 949, loss: 0.3161678910255432, mean loss: 0.33878791922104784
Epoch: 76, step: 950, loss: 0.33238717913627625, mean loss: 0.3387878613978392
Epoch: 76, step: 951, loss: 0.3321056365966797, mean loss: 0.3387878010322903
Epoch: 76, step: 952, loss: 0.32174569368362427, mean loss: 0.33878764707954223
Epoch: 76, step: 953, loss: 0.35573580861091614, mean loss: 0.3387878001822318
Epoch: 76, step: 954, loss: 0.34119537472724915, mean loss: 0.33878782193106916
Epoch: 76, step: 955, loss: 0.3245569169521332, mean loss: 0.3387876933772753
Epoch: 76, step: 956, loss: 0.32278522849082947, mean loss: 0.3387875488215361
Epoch: 76, step: 957, loss: 0.3413924276828766, mean loss: 0.33878757235208534
Epoch: 76, step: 958, loss: 0.3258359432220459, mean loss: 0.3387874553577028
Epoch: 76, step: 959, loss: 0.3314478397369385, mean loss: 0.338787389058241
Epoch: 76, step: 960, loss: 0.29888108372688293, mean loss: 0.33878702858395954
Epoch: 76, step: 961, loss: 0.3623860776424408, mean loss: 0.338787241752614
Epoch: 76, step: 962, loss: 0.3265576958656311, mean loss: 0.33878713128493004
Epoch: 76, step: 963, loss: 0.31268370151519775, mean loss: 0.3387868954986294
Epoch: 76, step: 964, loss: 0.2884085178375244, mean loss: 0.3387864404463964
Epoch: 76, step: 965, loss: 0.3760140836238861, mean loss: 0.3387867767090933
Epoch: 76, step: 966, loss: 0.33561235666275024, mean loss: 0.3387867480360613
Epoch: 76, step: 967, loss: 0.35063907504081726, mean loss: 0.33878685509154766
Epoch: 76, step: 968, loss: 0.2983289062976837, mean loss: 0.33878648966066965
Epoch: 76, step: 969, loss: 0.31730613112449646, mean loss: 0.33878629564402735
Epoch: 76, step: 970, loss: 0.3199980556964874, mean loss: 0.3387861259448904
Epoch: 76, step: 971, loss: 0.3299337327480316, mean loss: 0.33878604598902856
Epoch: 76, step: 972, loss: 0.3184172213077545, mean loss: 0.33878586201705785
Epoch: 76, step: 973, loss: 0.3069271445274353, mean loss: 0.33878557427055334
Epoch: 76, step: 974, loss: 0.3292354643344879, mean loss: 0.33878548801516867
Epoch: 76, step: 975, loss: 0.35703033208847046, mean loss: 0.33878565279880374
Epoch: 76, step: 976, loss: 0.3882240951061249, mean loss: 0.3387860993124941
Epoch: 76, step: 977, loss: 0.30381283164024353, mean loss: 0.33878578344692384
Epoch: 76, step: 978, loss: 0.33873507380485535, mean loss: 0.3387857829889373
Epoch: 76, step: 979, loss: 0.35794806480407715, mean loss: 0.33878595605242684
Epoch: 76, step: 980, loss: 0.32871925830841064, mean loss: 0.3387858651362133
Epoch: 76, step: 981, loss: 0.33401966094970703, mean loss: 0.3387858220911815
Epoch: 76, step: 982, loss: 0.34501948952674866, mean loss: 0.33878587838880936
Epoch: 76, step: 983, loss: 0.3581097424030304, mean loss: 0.33878605290531844
Epoch: 76, step: 984, loss: 0.32367366552352905, mean loss: 0.33878591642447436
Epoch: 76, step: 985, loss: 0.38803189992904663, mean loss: 0.33878636116378175
Epoch: 76, step: 986, loss: 0.39081454277038574, mean loss: 0.3387868310248108
Epoch: 76, step: 987, loss: 0.3225153386592865, mean loss: 0.3387866840800038
Epoch: 76, step: 988, loss: 0.34053486585617065, mean loss: 0.33878669986736415
Epoch: 76, step: 989, loss: 0.31305134296417236, mean loss: 0.3387864674603627
Epoch: 76, step: 990, loss: 0.36480164527893066, mean loss: 0.3387867023922073
Epoch: 76, step: 991, loss: 0.3095187246799469, mean loss: 0.3387864380881173
Epoch: 76, step: 992, loss: 0.3548128008842468, mean loss: 0.33878658281267005
Epoch: 76, step: 993, loss: 0.32275012135505676, mean loss: 0.33878643799823005
Epoch: 76, step: 994, loss: 0.35960033535957336, mean loss: 0.33878662595276604
Epoch: 76, step: 995, loss: 0.3374204933643341, mean loss: 0.3387866136163692
Epoch: 76, step: 996, loss: 0.2993417978286743, mean loss: 0.3387862574265588
Epoch: 76, step: 997, loss: 0.35357415676116943, mean loss: 0.33878639096125507
Epoch: 76, step: 998, loss: 0.34813427925109863, mean loss: 0.33878647537190215
Epoch: 76, step: 999, loss: 0.34131869673728943, mean loss: 0.33878649823744217
Epoch: 76, step: 1000, loss: 0.3291822075843811, mean loss: 0.3387864115130695
Epoch: 76, step: 1001, loss: 0.3203686773777008, mean loss: 0.3387862452069805
Epoch: 76, step: 1002, loss: 0.322947233915329, mean loss: 0.33878610218720306
Epoch: 76, step: 1003, loss: 0.31042563915252686, mean loss: 0.3387858461061629
Epoch: 76, step: 1004, loss: 0.33636674284935, mean loss: 0.3387858242630469
Epoch: 76, step: 1005, loss: 0.3220753073692322, mean loss: 0.3387856733780185
Epoch: 76, step: 1006, loss: 0.3765830099582672, mean loss: 0.3387860146601431
Epoch: 76, step: 1007, loss: 0.33892351388931274, mean loss: 0.3387860159016487
Epoch: 76, step: 1008, loss: 0.3377627730369568, mean loss: 0.3387860066626857
Epoch: 76, step: 1009, loss: 0.3293618857860565, mean loss: 0.33878592157211673
Epoch: 76, step: 1010, loss: 0.3100183308124542, mean loss: 0.3387856618313307
Epoch: 76, step: 1011, loss: 0.3090853989124298, mean loss: 0.33878539367192695
Epoch: 76, step: 1012, loss: 0.33521512150764465, mean loss: 0.3387853614367439
Epoch: 76, step: 1013, loss: 0.3202628493309021, mean loss: 0.33878519420266506
Epoch: 76, step: 1014, loss: 0.34867653250694275, mean loss: 0.3387852835077175
Epoch: 76, step: 1015, loss: 0.3317359685897827, mean loss: 0.3387852198627652
Epoch: 76, step: 1016, loss: 0.3333217203617096, mean loss: 0.33878517053584056
Epoch: 76, step: 1017, loss: 0.3412887454032898, mean loss: 0.3387851931390336
Epoch: 76, step: 1018, loss: 0.35088837146759033, mean loss: 0.33878530240998445
Epoch: 76, step: 1019, loss: 0.3372420370578766, mean loss: 0.33878528847706985
Epoch: 76, step: 1020, loss: 0.29360148310661316, mean loss: 0.33878488055213535
Epoch: 76, step: 1021, loss: 0.3617551624774933, mean loss: 0.33878508792878453
Epoch: 76, step: 1022, loss: 0.31018710136413574, mean loss: 0.33878482974731744
Epoch: 76, step: 1023, loss: 0.3307952284812927, mean loss: 0.33878475761817123
Epoch: 76, step: 1024, loss: 0.28754091262817383, mean loss: 0.3387842949991624
Epoch: 76, step: 1025, loss: 0.3431550860404968, mean loss: 0.3387843344574186
Epoch: 76, step: 1026, loss: 0.34393343329429626, mean loss: 0.33878438094159624
Epoch: 76, step: 1027, loss: 0.3603252172470093, mean loss: 0.338784575402618
Epoch: 76, step: 1028, loss: 0.35701918601989746, mean loss: 0.3387847400150292
Epoch: 76, step: 1029, loss: 0.28912249207496643, mean loss: 0.3387842916945935
Epoch: 76, step: 1030, loss: 0.2956027388572693, mean loss: 0.33878390188143315
Epoch: 76, step: 1031, loss: 0.34699955582618713, mean loss: 0.33878397604599897
Epoch: 76, step: 1032, loss: 0.313746839761734, mean loss: 0.3387837500321488
Epoch: 76, step: 1033, loss: 0.3335835039615631, mean loss: 0.3387837030891992
Epoch: 76, step: 1034, loss: 0.3200254738330841, mean loss: 0.33878353375900794
Epoch: 76, step: 1035, loss: 0.35079073905944824, mean loss: 0.3387836421468514
Epoch: 76, step: 1036, loss: 0.3367791473865509, mean loss: 0.3387836240526407
Epoch: 76, step: 1037, loss: 0.34269848465919495, mean loss: 0.33878365939105853
Epoch: 76, step: 1038, loss: 0.31706199049949646, mean loss: 0.3387834633170319
Epoch: 76, step: 1039, loss: 0.31554320454597473, mean loss: 0.33878325353711086
Epoch: 76, step: 1040, loss: 0.3144208490848541, mean loss: 0.33878303363004353
Epoch: 76, step: 1041, loss: 0.41293051838874817, mean loss: 0.3387837029157363
Epoch: 76, step: 1042, loss: 0.3325188159942627, mean loss: 0.33878364636680075
Epoch: 76, step: 1043, loss: 0.3886825144290924, mean loss: 0.3387840967663753
Epoch: 76, step: 1044, loss: 0.3139059543609619, mean loss: 0.3387838722121108
Epoch: 76, step: 1045, loss: 0.30693426728248596, mean loss: 0.3387835847348572
Epoch: 76, step: 1046, loss: 0.31459033489227295, mean loss: 0.33878336636648937
Epoch: 76, step: 1047, loss: 0.35193416476249695, mean loss: 0.33878348506457584
Epoch: 76, step: 1048, loss: 0.2957189381122589, mean loss: 0.33878309637082304
Epoch: 76, step: 1049, loss: 0.30769288539886475, mean loss: 0.33878281575805547
Epoch: 76, step: 1050, loss: 0.3451676070690155, mean loss: 0.3387828733851263
Epoch: 76, step: 1051, loss: 0.32295548915863037, mean loss: 0.3387827305335412
Epoch: 76, step: 1052, loss: 0.3339974284172058, mean loss: 0.3387826873437245
Epoch: 76, step: 1053, loss: 0.3411619961261749, mean loss: 0.33878270881801814
Epoch: 76, step: 1054, loss: 0.3271494209766388, mean loss: 0.33878260382349795
Epoch: 76, step: 1055, loss: 0.4014779031276703, mean loss: 0.33878316966554944
Epoch: 76, step: 1056, loss: 0.2828376889228821, mean loss: 0.3387826647469951
Epoch: 76, step: 1057, loss: 0.35050931572914124, mean loss: 0.3387827705812849
Epoch: 76, step: 1058, loss: 0.3028775155544281, mean loss: 0.33878244653541045
Epoch: 76, step: 1059, loss: 0.3000134527683258, mean loss: 0.338782096647376
Epoch: 76, step: 1060, loss: 0.3319517970085144, mean loss: 0.3387820350048541
Epoch: 76, step: 1061, loss: 0.30310046672821045, mean loss: 0.33878171298647713
Epoch: 76, step: 1062, loss: 0.3225725293159485, mean loss: 0.33878156670344745
Epoch: 76, step: 1063, loss: 0.3423430919647217, mean loss: 0.33878159884485654
Epoch: 76, step: 1064, loss: 0.3354353904724121, mean loss: 0.33878156864687287
Epoch: 76, step: 1065, loss: 0.3476707637310028, mean loss: 0.3387816488670252
Epoch: 76, step: 1066, loss: 0.3143625557422638, mean loss: 0.3387814284999757
Epoch: 76, step: 1067, loss: 0.3087517321109772, mean loss: 0.3387811575031849
Epoch: 76, step: 1068, loss: 0.3387470841407776, mean loss: 0.3387811571956996
Epoch: 76, step: 1069, loss: 0.2852379083633423, mean loss: 0.3387806740144334
Epoch: 76, step: 1070, loss: 0.33076027035713196, mean loss: 0.33878060163791707
Epoch: 76, step: 1071, loss: 0.3086254894733429, mean loss: 0.33878032951916015
Epoch: 76, step: 1072, loss: 0.329605370759964, mean loss: 0.33878024672537616
Epoch: 76, step: 1073, loss: 0.3471592962741852, mean loss: 0.3387803223362837
Epoch: 76, step: 1074, loss: 0.3178454637527466, mean loss: 0.33878013342591107
Epoch: 76, step: 1075, loss: 0.3322906792163849, mean loss: 0.33878007486739986
Epoch: 76, step: 1076, loss: 0.3562108278274536, mean loss: 0.33878023215485403
Epoch: 76, step: 1077, loss: 0.3048425614833832, mean loss: 0.33877992591899225
Epoch: 76, step: 1078, loss: 0.2923392653465271, mean loss: 0.33877950686644387
Epoch: 76, step: 1079, loss: 0.3253049850463867, mean loss: 0.3387793852815722
Epoch: 76, step: 1080, loss: 0.3593549430370331, mean loss: 0.3387795709396616
Epoch: 76, step: 1081, loss: 0.307315468788147, mean loss: 0.33877928703424093
Epoch: 76, step: 1082, loss: 0.33676275610923767, mean loss: 0.3387792688389372
Epoch: 76, step: 1083, loss: 0.3263740539550781, mean loss: 0.33877915690680016
Epoch: 76, step: 1084, loss: 0.3423864543437958, mean loss: 0.33877918945511726
Epoch: 76, step: 1085, loss: 0.3371858298778534, mean loss: 0.33877917507850824
Epoch: 76, step: 1086, loss: 0.32249608635902405, mean loss: 0.33877902816032907
Epoch: 76, step: 1087, loss: 0.3908980190753937, mean loss: 0.3387794984125208
Epoch: 76, step: 1088, loss: 0.3342618942260742, mean loss: 0.3387794576520597
Epoch: 76, step: 1089, loss: 0.32658126950263977, mean loss: 0.33877934759388123
Epoch: 76, step: 1090, loss: 0.34230124950408936, mean loss: 0.338779379369962
Epoch: 76, step: 1091, loss: 0.35026952624320984, mean loss: 0.33877948303796585
Epoch: 76, step: 1092, loss: 0.32900795340538025, mean loss: 0.33877939487670533
Epoch: 76, step: 1093, loss: 0.37423986196517944, mean loss: 0.3387797148072985
Epoch: 76, step: 1094, loss: 0.34452757239341736, mean loss: 0.33877976666501636
Epoch: 76, step: 1095, loss: 0.3171382546424866, mean loss: 0.3387795714149981
Epoch: 76, step: 1096, loss: 0.308971643447876, mean loss: 0.33877930248988947
Epoch: 76, step: 1097, loss: 0.33259662985801697, mean loss: 0.33877924671073867
Epoch: 76, step: 1098, loss: 0.361992746591568, mean loss: 0.3387794561375846
Epoch: 76, step: 1099, loss: 0.32062384486198425, mean loss: 0.3387792923433217
Epoch: 76, step: 1100, loss: 0.3150288760662079, mean loss: 0.33877907807640595
Epoch: 76, step: 1101, loss: 0.37732481956481934, mean loss: 0.3387794258177903
Epoch: 76, step: 1102, loss: 0.3607610762119293, mean loss: 0.33877962412401774
Epoch: 76, step: 1103, loss: 0.3246996998786926, mean loss: 0.3387794971039159
Epoch: 76, step: 1104, loss: 0.34902697801589966, mean loss: 0.33877958954932286
Epoch: 76, step: 1105, loss: 0.3215186297893524, mean loss: 0.3387794338347558
Epoch: 76, step: 1106, loss: 0.3165839612483978, mean loss: 0.3387792336067688
Epoch: 76, step: 1107, loss: 0.3485380709171295, mean loss: 0.33877932164160185
Epoch: 76, step: 1108, loss: 0.34137552976608276, mean loss: 0.3387793450618803
Epoch: 76, step: 1109, loss: 0.38619139790534973, mean loss: 0.33877977276004945
Epoch: 76, step: 1110, loss: 0.3334304094314575, mean loss: 0.3387797245045506
Epoch: 76, step: 1111, loss: 0.3048563301563263, mean loss: 0.33877941849139526
Epoch: 76, step: 1112, loss: 0.3623868525028229, mean loss: 0.338779631445327
Epoch: 76, step: 1113, loss: 0.3785439729690552, mean loss: 0.33877999014151067
Epoch: 76, step: 1114, loss: 0.3150321841239929, mean loss: 0.3387797759251997
Epoch: 76, step: 1115, loss: 0.35467520356178284, mean loss: 0.33877991930809376
Epoch: 76, step: 1116, loss: 0.33671531081199646, mean loss: 0.33877990068469604
Epoch: 76, step: 1117, loss: 0.3239344656467438, mean loss: 0.33877976677555643
Epoch: 76, step: 1118, loss: 0.3162626326084137, mean loss: 0.3387795636678093
Epoch: 76, step: 1119, loss: 0.3279116749763489, mean loss: 0.3387794656387946
Epoch: 76, step: 1120, loss: 0.32365551590919495, mean loss: 0.3387793292210818
Epoch: 76, step: 1121, loss: 0.32980090379714966, mean loss: 0.3387792482366012
Epoch: 76, step: 1122, loss: 0.31979119777679443, mean loss: 0.3387790769678697
Epoch: 76, step: 1123, loss: 0.30926769971847534, mean loss: 0.3387788107830621
Epoch: 76, step: 1124, loss: 0.2946951687335968, mean loss: 0.3387784131638714
Epoch: 76, step: 1125, loss: 0.33623772859573364, mean loss: 0.33877839024798284
Epoch: 76, step: 1126, loss: 0.33213385939598083, mean loss: 0.33877833031769583
Epoch: 76, step: 1127, loss: 0.3036700487136841, mean loss: 0.3387780136617177
Epoch: 76, step: 1128, loss: 0.3188735544681549, mean loss: 0.33877783413686324
Epoch: 76, step: 1129, loss: 0.3800244629383087, mean loss: 0.33877820615039933
Epoch: 76, step: 1130, loss: 0.3349013328552246, mean loss: 0.3387781711842366
Epoch: 76, step: 1131, loss: 0.2932875454425812, mean loss: 0.3387777609004444
Epoch: 76, step: 1132, loss: 0.33345553278923035, mean loss: 0.3387777128992529
Epoch: 76, step: 1133, loss: 0.32039907574653625, mean loss: 0.3387775471437635
Epoch: 76, step: 1134, loss: 0.3253558874130249, mean loss: 0.33877742609595707
Epoch: 76, step: 1135, loss: 0.3785581886768341, mean loss: 0.33877778486906834
Epoch: 76, step: 1136, loss: 0.34133344888687134, mean loss: 0.3387778079177784
Epoch: 76, step: 1137, loss: 0.31644853949546814, mean loss: 0.3387776065391198
Epoch: 76, step: 1138, loss: 0.31613555550575256, mean loss: 0.33877740234144266
Epoch: 76, step: 1139, loss: 0.33499449491500854, mean loss: 0.33877736822554294
Epoch: 76, step: 1140, loss: 0.3253158926963806, mean loss: 0.3387772468252135
Epoch: 76, step: 1141, loss: 0.34256264567375183, mean loss: 0.3387772809629662
Epoch: 76, step: 1142, loss: 0.3186037540435791, mean loss: 0.3387770990342738
Epoch: 76, step: 1143, loss: 0.33437836170196533, mean loss: 0.33877705936598385
Epoch: 76, step: 1144, loss: 0.38135579228401184, mean loss: 0.3387774433421485
Epoch: 76, step: 1145, loss: 0.3202791213989258, mean loss: 0.33877727652528544
Epoch: 76, step: 1146, loss: 0.3095695674419403, mean loss: 0.3387770131341258
Epoch: 76, step: 1147, loss: 0.3356732428073883, mean loss: 0.33877698514499827
Epoch: 76, step: 1148, loss: 0.35728833079338074, mean loss: 0.3387771520747923
Epoch: 76, step: 1149, loss: 0.3276541531085968, mean loss: 0.3387770517718096
Epoch: 76, step: 1150, loss: 0.35839930176734924, mean loss: 0.33877722871621646
Epoch: 76, step: 1151, loss: 0.3569965958595276, mean loss: 0.3387773930085908
Epoch: 76, step: 1152, loss: 0.3292112648487091, mean loss: 0.3387773067472117
Epoch: 76, step: 1153, loss: 0.34676486253738403, mean loss: 0.33877737877335995
Epoch: 76, step: 1154, loss: 0.35176175832748413, mean loss: 0.33877749585628725
Epoch: 76, step: 1155, loss: 0.3620528280735016, mean loss: 0.33877770573304306
Epoch: 76, step: 1156, loss: 0.3314913511276245, mean loss: 0.3387776400316102
Epoch: 76, step: 1157, loss: 0.31790870428085327, mean loss: 0.3387774518570439
Epoch: 76, step: 1158, loss: 0.3182586431503296, mean loss: 0.3387772668412309
Epoch: 76, step: 1159, loss: 0.34239661693573, mean loss: 0.3387772994762133
Epoch: 76, step: 1160, loss: 0.3251911401748657, mean loss: 0.33877717697353715
Epoch: 76, step: 1161, loss: 0.3357343077659607, mean loss: 0.33877714953706656
Epoch: 76, step: 1162, loss: 0.3285943865776062, mean loss: 0.33877705772353844
Epoch: 76, step: 1163, loss: 0.3141457140445709, mean loss: 0.33877683563546834
Epoch: 76, step: 1164, loss: 0.35278305411338806, mean loss: 0.3387769619211483
Epoch: 76, step: 1165, loss: 0.3263596296310425, mean loss: 0.33877684996251256
Epoch: 76, step: 1166, loss: 0.3448435366153717, mean loss: 0.3387769046612048
Epoch: 76, step: 1167, loss: 0.3580563962459564, mean loss: 0.33877707848812694
Epoch: 76, step: 1168, loss: 0.35996440052986145, mean loss: 0.33877726951462556
Epoch: 76, step: 1169, loss: 0.3647150993347168, mean loss: 0.33877750336995327
Epoch: 76, step: 1170, loss: 0.3512232303619385, mean loss: 0.3387776155795461
Epoch: 76, step: 1171, loss: 0.34035155177116394, mean loss: 0.33877762976989007
Epoch: 76, step: 1172, loss: 0.2974586486816406, mean loss: 0.338777257248265
Epoch: 76, step: 1173, loss: 0.32068294286727905, mean loss: 0.33877709411591156
Epoch: 76, step: 1174, loss: 0.34734946489334106, mean loss: 0.33877717140087427
Epoch: 76, step: 1175, loss: 0.34500908851623535, mean loss: 0.3387772275847646
Epoch: 76, step: 1176, loss: 0.35506489872932434, mean loss: 0.3387773744250486
Epoch: 76, step: 1177, loss: 0.35807034373283386, mean loss: 0.33877754835780594
Epoch: 76, step: 1178, loss: 0.29952555894851685, mean loss: 0.3387771944908044
Epoch: 76, step: 1179, loss: 0.33661341667175293, mean loss: 0.3387771749839545
Epoch: 76, step: 1180, loss: 0.3634939193725586, mean loss: 0.3387773978078841
Epoch: 76, step: 1181, loss: 0.432869553565979, mean loss: 0.33877824605045803
Epoch: 76, step: 1182, loss: 0.35525935888290405, mean loss: 0.3387783946266643
Epoch: 76, step: 1183, loss: 0.3429499566555023, mean loss: 0.3387784322326973
Epoch: 76, step: 1184, loss: 0.331440269947052, mean loss: 0.3387783660808138
Epoch: 76, step: 1185, loss: 0.3114864230155945, mean loss: 0.33877812005229974
Epoch: 76, step: 1186, loss: 0.29811277985572815, mean loss: 0.33877775347000805
Epoch: 76, step: 1187, loss: 0.31537556648254395, mean loss: 0.33877754251025805
Epoch: 76, step: 1188, loss: 0.3844393491744995, mean loss: 0.3387779541263386
Epoch: 76, step: 1189, loss: 0.333227276802063, mean loss: 0.3387779040904855
Epoch: 76, step: 1190, loss: 0.3005305826663971, mean loss: 0.33877755931812853
Epoch: 76, step: 1191, loss: 0.3222135603427887, mean loss: 0.33877741000682315
Epoch: 76, step: 1192, loss: 0.34750691056251526, mean loss: 0.3387774886956335
Epoch: 76, step: 1193, loss: 0.32402947545051575, mean loss: 0.33877735575639495
Epoch: 76, step: 1194, loss: 0.325960248708725, mean loss: 0.338777240223471
Epoch: 76, step: 1195, loss: 0.32600221037864685, mean loss: 0.3387771250708674
Epoch: 76, step: 1196, loss: 0.3922525644302368, mean loss: 0.33877760708778953
Epoch: 76, step: 1197, loss: 0.3444238007068634, mean loss: 0.3387776579809916
Epoch: 76, step: 1198, loss: 0.35934871435165405, mean loss: 0.33877784340103945
Epoch: 76, step: 1199, loss: 0.30656304955482483, mean loss: 0.33877755303117857
Epoch: 76, step: 1200, loss: 0.3477080464363098, mean loss: 0.3387776335259589
Epoch: 76, step: 1201, loss: 0.3696642816066742, mean loss: 0.3387779119194844
Epoch: 76, step: 1202, loss: 0.32437431812286377, mean loss: 0.33877778209539006
Epoch: 76, step: 1203, loss: 0.3471403419971466, mean loss: 0.33877785746907774
Epoch: 76, step: 1204, loss: 0.30999234318733215, mean loss: 0.33877759802091434
Epoch: 76, step: 1205, loss: 0.320883184671402, mean loss: 0.338777436737333
Epoch: 76, step: 1206, loss: 0.3247475326061249, mean loss: 0.33877731028597946
Epoch: 76, step: 1207, loss: 0.29941031336784363, mean loss: 0.33877695547491776
Epoch: 76, step: 1208, loss: 0.33137965202331543, mean loss: 0.33877688880431445
Epoch: 76, step: 1209, loss: 0.33428385853767395, mean loss: 0.3387768483097828
Epoch: 76, step: 1210, loss: 0.29894474148750305, mean loss: 0.3387764893164357
Epoch: 76, step: 1211, loss: 0.36702796816825867, mean loss: 0.3387767439351932
Epoch: 76, step: 1212, loss: 0.36305004358291626, mean loss: 0.3387769626983145
Epoch: 76, step: 1213, loss: 0.329385906457901, mean loss: 0.3387768780621797
Epoch: 76, step: 1214, loss: 0.3325496017932892, mean loss: 0.33877682193986186
Epoch: 76, step: 1215, loss: 0.31903642416000366, mean loss: 0.33877664403433033
Epoch: 76, step: 1216, loss: 0.35185444355010986, mean loss: 0.33877676189375405
Epoch: 76, step: 1217, loss: 0.31972506642341614, mean loss: 0.3387765901980792
Epoch: 76, step: 1218, loss: 0.33553779125213623, mean loss: 0.33877656100998094
Epoch: 76, step: 1219, loss: 0.281049519777298, mean loss: 0.3387760407778225
Epoch: 76, step: 1220, loss: 0.35258007049560547, mean loss: 0.3387761651776757
Epoch: 76, step: 1221, loss: 0.32821840047836304, mean loss: 0.33877607003353516
Epoch: 76, step: 1222, loss: 0.33645743131637573, mean loss: 0.3387760491386861
Epoch: 76, step: 1223, loss: 0.3249650001525879, mean loss: 0.3387759246789411
Epoch: 76, step: 1224, loss: 0.3242563307285309, mean loss: 0.3387757938352464
Epoch: 76, step: 1225, loss: 0.32143938541412354, mean loss: 0.3387756376091635
Epoch: 76, step: 1226, loss: 0.29158589243888855, mean loss: 0.3387752123652244
Epoch: 76, step: 1227, loss: 0.3842710852622986, mean loss: 0.3387756223413706
Epoch: 76, step: 1228, loss: 0.3651053011417389, mean loss: 0.3387758596033965
Epoch: 76, step: 1229, loss: 0.29675209522247314, mean loss: 0.33877548092222454
Epoch: 76, step: 1230, loss: 0.3400735557079315, mean loss: 0.33877549261922646
Epoch: 76, step: 1231, loss: 0.347988486289978, mean loss: 0.33877557563711924
Epoch: 76, step: 1232, loss: 0.31060782074928284, mean loss: 0.33877532182096914
Epoch: 76, step: 1233, loss: 0.33653634786605835, mean loss: 0.338775301646034
Epoch: 76, step: 1234, loss: 0.30728527903556824, mean loss: 0.3387750178984546
Epoch: 76, step: 1235, loss: 0.31875449419021606, mean loss: 0.33877483750087206
Epoch: 76, step: 1236, loss: 0.34163615107536316, mean loss: 0.338774863282885
Epoch: 76, step: 1237, loss: 0.3321705162525177, mean loss: 0.3387748037746131
Epoch: 76, step: 1238, loss: 0.34415704011917114, mean loss: 0.3387748522706561
Epoch: 76, step: 1239, loss: 0.2967257499694824, mean loss: 0.33877447339530203
Epoch: 76, step: 1240, loss: 0.3355715870857239, mean loss: 0.3387744445365706
Epoch: 76, step: 1241, loss: 0.33075931668281555, mean loss: 0.338774372319103
Epoch: 76, step: 1242, loss: 0.35516172647476196, mean loss: 0.3387745199702167
Epoch: 76, step: 1243, loss: 0.3273525536060333, mean loss: 0.3387744170584932
Epoch: 76, step: 1244, loss: 0.34153714776039124, mean loss: 0.3387744419504258
Epoch: 76, step: 1245, loss: 0.3036653697490692, mean loss: 0.3387741256239801
Epoch: 76, step: 1246, loss: 0.3620483875274658, mean loss: 0.33877433531901757
Epoch: 76, step: 1247, loss: 0.35669881105422974, mean loss: 0.3387744968124201
Epoch: 76, step: 1248, loss: 0.3300810754299164, mean loss: 0.3387744184883692
Epoch: 76, step: 1249, loss: 0.34221747517585754, mean loss: 0.33877444950857466
Epoch: 76, step: 1250, loss: 0.3603852689266205, mean loss: 0.3387746442094118
Epoch: 76, step: 1251, loss: 0.3977923095226288, mean loss: 0.338775175919251
Epoch: 76, step: 1252, loss: 0.31058645248413086, mean loss: 0.33877492195992387
Epoch: 76, step: 1253, loss: 0.32383981347084045, mean loss: 0.3387747874069726
Epoch: 76, step: 1254, loss: 0.4028978645801544, mean loss: 0.33877536509755696
Epoch: 76, step: 1255, loss: 0.3684709072113037, mean loss: 0.3387756326249634
Epoch: 76, step: 1256, loss: 0.30602747201919556, mean loss: 0.33877533759914735
Epoch: 76, step: 1257, loss: 0.3732322156429291, mean loss: 0.33877564801587895
Epoch: 76, step: 1258, loss: 0.3227432370185852, mean loss: 0.3387755035836474
Epoch: 76, step: 1259, loss: 0.33503296971321106, mean loss: 0.338775469868341
Epoch: 76, step: 1260, loss: 0.3353833854198456, mean loss: 0.3387754393103981
Epoch: 76, step: 1261, loss: 0.32520484924316406, mean loss: 0.3387753170594381
Epoch: 76, step: 1262, loss: 0.32740849256515503, mean loss: 0.3387752146620713
Epoch: 76, step: 1263, loss: 0.3407047986984253, mean loss: 0.3387752320444585
Epoch: 76, step: 1264, loss: 0.39787712693214417, mean loss: 0.3387757644507939
Epoch: 76, step: 1265, loss: 0.3815978765487671, mean loss: 0.3387761502008353
Epoch: 76, step: 1266, loss: 0.30785590410232544, mean loss: 0.33877587166766204
Epoch: 76, step: 1267, loss: 0.30463463068008423, mean loss: 0.3387755641221626
Epoch: 76, step: 1268, loss: 0.34757423400878906, mean loss: 0.3387756433801764
Epoch: 76, step: 1269, loss: 0.35314324498176575, mean loss: 0.33877577280170523
Epoch: 76, step: 1270, loss: 0.3285589814186096, mean loss: 0.3387756807709762
Epoch: 76, step: 1271, loss: 0.30633750557899475, mean loss: 0.3387753885772817
Epoch: 76, step: 1272, loss: 0.3237832188606262, mean loss: 0.338775253533372
Epoch: 76, step: 1273, loss: 0.30058255791664124, mean loss: 0.33877490951082057
Epoch: 76, step: 1274, loss: 0.39887362718582153, mean loss: 0.3387754508480482
Epoch: 76, step: 1275, loss: 0.30998408794403076, mean loss: 0.33877519151312746
Epoch: 76, step: 1276, loss: 0.3432592451572418, mean loss: 0.3387752319023659
Epoch: 76, step: 1277, loss: 0.33499810099601746, mean loss: 0.33877519788090255
Epoch: 76, step: 1278, loss: 0.2953418493270874, mean loss: 0.3387748066705357
Epoch: 76, step: 1279, loss: 0.35109585523605347, mean loss: 0.33877491764697837
Epoch: 76, step: 1280, loss: 0.3037826418876648, mean loss: 0.3387746024722361
Epoch: 76, step: 1281, loss: 0.33850613236427307, mean loss: 0.3387746000541529
Epoch: 76, step: 1282, loss: 0.34256869554519653, mean loss: 0.33877463422688103
Epoch: 76, step: 1283, loss: 0.2981991171836853, mean loss: 0.3387742687738688
Epoch: 76, step: 1284, loss: 0.3191203474998474, mean loss: 0.3387740917577624
Epoch: 76, step: 1285, loss: 0.31485968828201294, mean loss: 0.33877387637089873
Epoch: 76, step: 1286, loss: 0.2980078160762787, mean loss: 0.33877350921163424
Epoch: 76, step: 1287, loss: 0.32819339632987976, mean loss: 0.33877341392277266
Epoch: 76, step: 1288, loss: 0.3158336579799652, mean loss: 0.3387732073197272
Epoch: 76, step: 1289, loss: 0.3400857448577881, mean loss: 0.33877321914076886
Epoch: 76, step: 1290, loss: 0.3322482407093048, mean loss: 0.3387731603757089
Epoch: 76, step: 1291, loss: 0.28726279735565186, mean loss: 0.33877269646884073
Epoch: 76, step: 1292, loss: 0.3383265733718872, mean loss: 0.338772692451053
Epoch: 76, step: 1293, loss: 0.3017275929450989, mean loss: 0.33877235882563195
Epoch: 76, step: 1294, loss: 0.3308676779270172, mean loss: 0.33877228763730266
Epoch: 76, step: 1295, loss: 0.3437308967113495, mean loss: 0.33877233229336423
Epoch: 76, step: 1296, loss: 0.30487948656082153, mean loss: 0.33877202706515364
Epoch: 76, step: 1297, loss: 0.30370888113975525, mean loss: 0.33877171130043465
Epoch: 76, step: 1298, loss: 0.3560762405395508, mean loss: 0.33877186713672547
Epoch: 76, step: 1299, loss: 0.3313482403755188, mean loss: 0.3387718002837054
Epoch: 76, step: 1300, loss: 0.350155234336853, mean loss: 0.3387719027956065
Epoch: 76, step: 1301, loss: 0.31199169158935547, mean loss: 0.338771661632384
Epoch: 76, step: 1302, loss: 0.3668941557407379, mean loss: 0.33877191488095537
Epoch: 76, step: 1303, loss: 0.29762569069862366, mean loss: 0.3387715443544787
Epoch: 76, step: 1304, loss: 0.3298289477825165, mean loss: 0.3387714638260942
Epoch: 76, step: 1305, loss: 0.31707099080085754, mean loss: 0.3387712684143605
Epoch: 76, step: 1306, loss: 0.33159947395324707, mean loss: 0.33877120383327197
Epoch: 76, step: 1307, loss: 0.31065401434898376, mean loss: 0.33877095064386986
Epoch: 76, step: 1308, loss: 0.35328876972198486, mean loss: 0.3387710813726127
Epoch: 76, step: 1309, loss: 0.32639995217323303, mean loss: 0.3387709699751916
Epoch: 76, step: 1310, loss: 0.32376629114151, mean loss: 0.3387708348648514
Epoch: 76, step: 1311, loss: 0.3192264437675476, mean loss: 0.33877065887804203
Epoch: 76, step: 1312, loss: 0.31921854615211487, mean loss: 0.3387704828232888
Epoch: 76, step: 1313, loss: 0.36170390248298645, mean loss: 0.3387706893227725
Epoch: 76, step: 1314, loss: 0.3178499937057495, mean loss: 0.33877050094816424
Epoch: 76, step: 1315, loss: 0.31929758191108704, mean loss: 0.33877032561123793
Epoch: 76, step: 1316, loss: 0.3383817970752716, mean loss: 0.33877032211290337
Epoch: 76, step: 1317, loss: 0.34987515211105347, mean loss: 0.3387704221005679
Epoch: 76, step: 1318, loss: 0.29558053612709045, mean loss: 0.33877003322321025
Epoch: 76, step: 1319, loss: 0.33294567465782166, mean loss: 0.33876998078174797
Epoch: 76, step: 1320, loss: 0.31779369711875916, mean loss: 0.33876979191681605
Epoch: 76, step: 1321, loss: 0.30153170228004456, mean loss: 0.3387694566378861
Epoch: 76, step: 1322, loss: 0.3418356776237488, mean loss: 0.33876948424483494
Epoch: 76, step: 1323, loss: 0.32819443941116333, mean loss: 0.33876938903248904
Epoch: 76, step: 1324, loss: 0.36371996998786926, mean loss: 0.33876961367285635
Epoch: 76, step: 1325, loss: 0.3050476908683777, mean loss: 0.33876931006321553
Epoch: 76, step: 1326, loss: 0.3313881754875183, mean loss: 0.3387692436090144
Epoch: 76, step: 1327, loss: 0.3290765583515167, mean loss: 0.33876915634412985
Epoch: 76, step: 1328, loss: 0.3221980631351471, mean loss: 0.3387690071531185
Epoch: 76, step: 1329, loss: 0.31887635588645935, mean loss: 0.3387688280594398
Epoch: 76, step: 1330, loss: 0.3563196659088135, mean loss: 0.33876898606833333
Epoch: 76, step: 1331, loss: 0.3088168501853943, mean loss: 0.3387687164138996
Epoch: 76, step: 1332, loss: 0.32402679324150085, mean loss: 0.3387685836958466
Epoch: 76, step: 1333, loss: 0.3563310503959656, mean loss: 0.3387687418051635
Epoch: 76, step: 1334, loss: 0.31606951355934143, mean loss: 0.3387685374530515
Epoch: 76, step: 1335, loss: 0.3439037799835205, mean loss: 0.33876858368317875
Epoch: 76, step: 1336, loss: 0.324451208114624, mean loss: 0.33876845479186907
Epoch: 76, step: 1337, loss: 0.33515051007270813, mean loss: 0.33876842222183323
Epoch: 76, step: 1338, loss: 0.31623512506484985, mean loss: 0.3387682193708375
Epoch: 76, step: 1339, loss: 0.3433121144771576, mean loss: 0.3387682602758743
Epoch: 76, step: 1340, loss: 0.34201350808143616, mean loss: 0.3387682894899699
Epoch: 76, step: 1341, loss: 0.3476749658584595, mean loss: 0.33876836966817747
Epoch: 76, step: 1342, loss: 0.34437358379364014, mean loss: 0.33876842012605396
Epoch: 76, step: 1343, loss: 0.3177817165851593, mean loss: 0.3387682312064268
Epoch: 76, step: 1344, loss: 0.3481806814670563, mean loss: 0.3387683159353402
Epoch: 76, step: 1345, loss: 0.32218942046165466, mean loss: 0.3387681666969256
Epoch: 76, step: 1346, loss: 0.38656988739967346, mean loss: 0.33876859699029505
Epoch: 76, step: 1347, loss: 0.2973800003528595, mean loss: 0.33876822442884474
Epoch: 76, step: 1348, loss: 0.31097540259361267, mean loss: 0.3387679742526695
Epoch: 76, step: 1349, loss: 0.3922899663448334, mean loss: 0.3387684560247913
Epoch: 76, step: 1350, loss: 0.3483293652534485, mean loss: 0.33876854208545315
Epoch: 76, step: 1351, loss: 0.3443715274333954, mean loss: 0.3387685925191803
Epoch: 76, step: 1352, loss: 0.36211562156677246, mean loss: 0.3387688026691308
Epoch: 76, step: 1353, loss: 0.36122065782546997, mean loss: 0.33876900475967386
Epoch: 76, step: 1354, loss: 0.338932067155838, mean loss: 0.3387690062273954
Epoch: 76, step: 1355, loss: 0.3395635783672333, mean loss: 0.33876901337925985
Epoch: 76, step: 1356, loss: 0.33278632164001465, mean loss: 0.3387689595301339
Epoch: 76, step: 1357, loss: 0.3641795814037323, mean loss: 0.3387691882444854
Epoch: 76, step: 1358, loss: 0.3334278166294098, mean loss: 0.3387691401686313
Epoch: 76, step: 1359, loss: 0.31178539991378784, mean loss: 0.3387688972994254
Epoch: 76, step: 1360, loss: 0.3205545246601105, mean loss: 0.338768733361055
Epoch: 76, step: 1361, loss: 0.3186570107936859, mean loss: 0.33876855234722525
Epoch: 76, step: 1362, loss: 0.3009900748729706, mean loss: 0.3387682123283473
Epoch: 76, step: 1363, loss: 0.31786322593688965, mean loss: 0.33876802417820157
Epoch: 76, step: 1364, loss: 0.3471692204475403, mean loss: 0.3387680997904046
Epoch: 76, step: 1365, loss: 0.35491958260536194, mean loss: 0.3387682451552036
Epoch: 76, step: 1366, loss: 0.3120666742324829, mean loss: 0.338768004840825
Epoch: 76, step: 1367, loss: 0.3249112367630005, mean loss: 0.33876788013090997
Epoch: 76, step: 1368, loss: 0.3231363296508789, mean loss: 0.33876773944934724
Epoch: 76, step: 1369, loss: 0.3283764719963074, mean loss: 0.3387676459303717
Epoch: 76, step: 1370, loss: 0.3552778959274292, mean loss: 0.3387677945174211
Epoch: 76, step: 1371, loss: 0.32217937707901, mean loss: 0.3387676452282329
Epoch: 76, step: 1372, loss: 0.28777286410331726, mean loss: 0.33876718629952596
Epoch: 76, step: 1373, loss: 0.3075876533985138, mean loss: 0.33876690570112694
Epoch: 76, step: 1374, loss: 0.31179019808769226, mean loss: 0.3387666629279953
Epoch: 76, step: 1375, loss: 0.3022141754627228, mean loss: 0.3387663339819238
Epoch: 76, step: 1376, loss: 0.34346824884414673, mean loss: 0.33876637629539164
Epoch: 76, step: 1377, loss: 0.36696189641952515, mean loss: 0.33876663003020674
Epoch: 76, step: 1378, loss: 0.30023834109306335, mean loss: 0.3387662833127051
Epoch: 76, step: 1379, loss: 0.32461339235305786, mean loss: 0.33876615595146037
Epoch: 76, step: 1380, loss: 0.2961655557155609, mean loss: 0.33876577259397794
Epoch: 76, step: 1381, loss: 0.3634369373321533, mean loss: 0.33876599460471113
Epoch: 76, step: 1382, loss: 0.3024851083755493, mean loss: 0.3387656681234219
Epoch: 76, step: 1383, loss: 0.3489329218864441, mean loss: 0.3387657596147991
Epoch: 76, step: 1384, loss: 0.3047467768192291, mean loss: 0.3387654534932395
Epoch: 76, step: 1385, loss: 0.3407219648361206, mean loss: 0.33876547109884864
Epoch: 76, step: 1386, loss: 0.340581476688385, mean loss: 0.33876548743997387
Epoch: 76, step: 1387, loss: 0.30433619022369385, mean loss: 0.33876517763454234
Epoch: 76, step: 1388, loss: 0.3329504132270813, mean loss: 0.3387651253119702
Epoch: 76, step: 1389, loss: 0.3273768424987793, mean loss: 0.33876502283853444
Epoch: 76, step: 1390, loss: 0.3381027579307556, mean loss: 0.33876501687943145
Epoch: 76, step: 1391, loss: 0.3181326389312744, mean loss: 0.3387648312296155
Epoch: 76, step: 1392, loss: 0.30328431725502014, mean loss: 0.338764511979375
Epoch: 76, step: 1393, loss: 0.3399815559387207, mean loss: 0.33876452293012055
Epoch: 76, step: 1394, loss: 0.3497287631034851, mean loss: 0.3387646215835201
Epoch: 76, step: 1395, loss: 0.3516477346420288, mean loss: 0.33876473750139896
Epoch: 76, step: 1396, loss: 0.3040892779827118, mean loss: 0.33876442550619
Epoch: 76, step: 1397, loss: 0.2961258888244629, mean loss: 0.33876404186601183
Epoch: 76, step: 1398, loss: 0.35962164402008057, mean loss: 0.3387642295305715
Epoch: 76, step: 1399, loss: 0.30289554595947266, mean loss: 0.33876390680794527
Epoch: 76, step: 1400, loss: 0.32227256894111633, mean loss: 0.3387637584311594
Epoch: 76, step: 1401, loss: 0.30036434531211853, mean loss: 0.338763412944924
Epoch: 76, step: 1402, loss: 0.33231544494628906, mean loss: 0.3387633549319502
Epoch: 76, step: 1403, loss: 0.31665244698524475, mean loss: 0.33876315599982415
Epoch: 76, step: 1404, loss: 0.34959903359413147, mean loss: 0.3387632534894785
Epoch: 76, step: 1405, loss: 0.3280409276485443, mean loss: 0.3387631570223094
Epoch: 76, step: 1406, loss: 0.3568800389766693, mean loss: 0.33876332001573234
Epoch: 76, step: 1407, loss: 0.3431360423564911, mean loss: 0.3387633593557563
Epoch: 76, step: 1408, loss: 0.3368212580680847, mean loss: 0.33876334188343177
Epoch: 76, step: 1409, loss: 0.40426814556121826, mean loss: 0.33876393119918896
Epoch: 76, step: 1410, loss: 0.28829389810562134, mean loss: 0.33876347714824123
Epoch: 76, step: 1411, loss: 0.32641810178756714, mean loss: 0.3387633660847326
Epoch: 76, step: 1412, loss: 0.29207369685173035, mean loss: 0.3387629460511834
Epoch: 76, step: 1413, loss: 0.3669457733631134, mean loss: 0.33876319958963597
Epoch: 76, step: 1414, loss: 0.34729456901550293, mean loss: 0.33876327633888187
Epoch: 76, step: 1415, loss: 0.33339089155197144, mean loss: 0.3387632280086841
Epoch: 76, step: 1416, loss: 0.3193320631980896, mean loss: 0.33876305320668687
Epoch: 76, step: 1417, loss: 0.33038821816444397, mean loss: 0.3387629778676768
Epoch: 76, step: 1418, loss: 0.3462190330028534, mean loss: 0.33876304494084986
Epoch: 76, step: 1419, loss: 0.3543274700641632, mean loss: 0.3387631849540297
Epoch: 76, step: 1420, loss: 0.317082941532135, mean loss: 0.3387629899264273
Epoch: 76, step: 1421, loss: 0.34839770197868347, mean loss: 0.33876307659602095
Epoch: 76, step: 1422, loss: 0.31542351841926575, mean loss: 0.3387628666456024
Epoch: 76, step: 1423, loss: 0.30272603034973145, mean loss: 0.3387625424800485
Epoch: 76, step: 1424, loss: 0.3288070261478424, mean loss: 0.33876245292705864
Epoch: 76, step: 1425, loss: 0.3277497887611389, mean loss: 0.33876235386558373
Epoch: 76, step: 1426, loss: 0.3566020131111145, mean loss: 0.3387625143360234
Epoch: 76, step: 1427, loss: 0.3196765184402466, mean loss: 0.3387623426561409
Epoch: 76, step: 1428, loss: 0.3763722777366638, mean loss: 0.338762680957123
Epoch: 76, step: 1429, loss: 0.32960543036460876, mean loss: 0.3387625985884883
Epoch: 76, step: 1430, loss: 0.33844122290611267, mean loss: 0.3387625956977693
Epoch: 76, step: 1431, loss: 0.3178521990776062, mean loss: 0.3387624076140406
Epoch: 76, step: 1432, loss: 0.33155694603919983, mean loss: 0.3387623428033192
Epoch: 76, step: 1433, loss: 0.32549697160720825, mean loss: 0.33876222348680696
Epoch: 76, step: 1434, loss: 0.32550227642059326, mean loss: 0.3387621042201553
Epoch: 76, step: 1435, loss: 0.3180588483810425, mean loss: 0.33876191800630534
Epoch: 76, step: 1436, loss: 0.3566738963127136, mean loss: 0.3387620791127741
Epoch: 76, step: 1437, loss: 0.3594845235347748, mean loss: 0.3387622654958615
Epoch: 76, step: 1438, loss: 0.3573349118232727, mean loss: 0.3387624325415999
Epoch: 76, step: 1439, loss: 0.2994564175605774, mean loss: 0.3387620790193756
Epoch: 76, step: 1440, loss: 0.37893104553222656, mean loss: 0.3387624402998227
Epoch: 76, step: 1441, loss: 0.32787489891052246, mean loss: 0.33876234237794955
Epoch: 76, step: 1442, loss: 0.3201126754283905, mean loss: 0.3387621746455083
Epoch: 76, step: 1443, loss: 0.31023356318473816, mean loss: 0.33876191806555844
Valid: 76, mean loss: 0.18584854404131573
Epoch: 77, step: 0, loss: 0.3342415690422058, mean loss: 0.3387618774109161
Epoch: 77, step: 1, loss: 0.3065863847732544, mean loss: 0.3387615880369379
Epoch: 77, step: 2, loss: 0.3653898239135742, mean loss: 0.3387618275188733
Epoch: 77, step: 3, loss: 0.316729336977005, mean loss: 0.3387616293707103
Epoch: 77, step: 4, loss: 0.3603431284427643, mean loss: 0.3387618234611573
Epoch: 77, step: 5, loss: 0.33556467294692993, mean loss: 0.33876179470825235
Epoch: 77, step: 6, loss: 0.3048671782016754, mean loss: 0.33876148988684396
Epoch: 77, step: 7, loss: 0.35134389996528625, mean loss: 0.3387616030420841
Epoch: 77, step: 8, loss: 0.31499427556991577, mean loss: 0.3387613893013584
Epoch: 77, step: 9, loss: 0.3460068106651306, mean loss: 0.33876145445919725
Epoch: 77, step: 10, loss: 0.34725892543792725, mean loss: 0.33876153087599037
Epoch: 77, step: 11, loss: 0.3344273269176483, mean loss: 0.3387614918993361
Epoch: 77, step: 12, loss: 0.32941651344299316, mean loss: 0.33876140786251574
Epoch: 77, step: 13, loss: 0.33218052983283997, mean loss: 0.3387613486830223
Epoch: 77, step: 14, loss: 0.3416447341442108, mean loss: 0.3387613746120482
Epoch: 77, step: 15, loss: 0.31905362010002136, mean loss: 0.3387611973904149
Epoch: 77, step: 16, loss: 0.3288874924182892, mean loss: 0.33876110860209624
Epoch: 77, step: 17, loss: 0.35586410760879517, mean loss: 0.3387612623977458
Epoch: 77, step: 18, loss: 0.370802640914917, mean loss: 0.33876155052150164
Epoch: 77, step: 19, loss: 0.36082831025123596, mean loss: 0.33876174894931016
Epoch: 77, step: 20, loss: 0.32403799891471863, mean loss: 0.3387616165522017
Epoch: 77, step: 21, loss: 0.3393387198448181, mean loss: 0.33876162174151286
Epoch: 77, step: 22, loss: 0.3213004767894745, mean loss: 0.3387614647323595
Epoch: 77, step: 23, loss: 0.3077707886695862, mean loss: 0.338761186069301
Epoch: 77, step: 24, loss: 0.32326120138168335, mean loss: 0.338761046697243
Epoch: 77, step: 25, loss: 0.3738212585449219, mean loss: 0.3387613619472281
Epoch: 77, step: 26, loss: 0.35846325755119324, mean loss: 0.338761539098652
Epoch: 77, step: 27, loss: 0.35992780327796936, mean loss: 0.3387617294153706
Epoch: 77, step: 28, loss: 0.339828222990036, mean loss: 0.33876173900467416
Epoch: 77, step: 29, loss: 0.338121235370636, mean loss: 0.3387617332456816
Epoch: 77, step: 30, loss: 0.3410535454750061, mean loss: 0.3387617538519829
Epoch: 77, step: 31, loss: 0.35750412940979004, mean loss: 0.33876192236821706
Epoch: 77, step: 32, loss: 0.30318212509155273, mean loss: 0.33876160246642445
Epoch: 77, step: 33, loss: 0.34381887316703796, mean loss: 0.3387616479364816
Epoch: 77, step: 34, loss: 0.354109525680542, mean loss: 0.33876178592842343
Epoch: 77, step: 35, loss: 0.3231215476989746, mean loss: 0.33876164530914854
Epoch: 77, step: 36, loss: 0.2925170063972473, mean loss: 0.3387612295335683
Epoch: 77, step: 37, loss: 0.33520787954330444, mean loss: 0.3387611975864517
Epoch: 77, step: 38, loss: 0.3311506509780884, mean loss: 0.33876112916289797
Epoch: 77, step: 39, loss: 0.3424849510192871, mean loss: 0.33876116264207456
Epoch: 77, step: 40, loss: 0.31437939405441284, mean loss: 0.33876094343873203
Epoch: 77, step: 41, loss: 0.3438599705696106, mean loss: 0.3387609892809251
Epoch: 77, step: 42, loss: 0.33095425367355347, mean loss: 0.3387609190960341
Epoch: 77, step: 43, loss: 0.32258713245391846, mean loss: 0.33876077369015595
Epoch: 77, step: 44, loss: 0.30250224471092224, mean loss: 0.3387604477209833
Epoch: 77, step: 45, loss: 0.3240012228488922, mean loss: 0.33876031503471044
Epoch: 77, step: 46, loss: 0.3312491178512573, mean loss: 0.3387602475092267
Epoch: 77, step: 47, loss: 0.3066559135913849, mean loss: 0.33875995889462424
Epoch: 77, step: 48, loss: 0.3578934669494629, mean loss: 0.33876013090131313
Epoch: 77, step: 49, loss: 0.31344860792160034, mean loss: 0.33875990335746137
Epoch: 77, step: 50, loss: 0.3335731029510498, mean loss: 0.338759856729926
Epoch: 77, step: 51, loss: 0.3564639985561371, mean loss: 0.3387600158825853
Epoch: 77, step: 52, loss: 0.30176085233688354, mean loss: 0.3387596832789271
Epoch: 77, step: 53, loss: 0.33851927518844604, mean loss: 0.3387596811178001
Epoch: 77, step: 54, loss: 0.3293691873550415, mean loss: 0.33875959670355593
Epoch: 77, step: 55, loss: 0.3169632852077484, mean loss: 0.3387594007710877
Epoch: 77, step: 56, loss: 0.3301735520362854, mean loss: 0.33875932359145056
Epoch: 77, step: 57, loss: 0.32764461636543274, mean loss: 0.3387592236803776
Epoch: 77, step: 58, loss: 0.30676281452178955, mean loss: 0.33875893606444946
Epoch: 77, step: 59, loss: 0.3239111006259918, mean loss: 0.3387588025983607
Epoch: 77, step: 60, loss: 0.3682950437068939, mean loss: 0.3387590680950493
Epoch: 77, step: 61, loss: 0.3103569746017456, mean loss: 0.3387588127953325
Epoch: 77, step: 62, loss: 0.3101106584072113, mean loss: 0.33875855528614707
Epoch: 77, step: 63, loss: 0.29863154888153076, mean loss: 0.3387581946004389
Epoch: 77, step: 64, loss: 0.32026463747024536, mean loss: 0.33875802837070007
Epoch: 77, step: 65, loss: 0.35109129548072815, mean loss: 0.33875813922754217
Epoch: 77, step: 66, loss: 0.27687177062034607, mean loss: 0.33875758297057745
Epoch: 77, step: 67, loss: 0.3161717653274536, mean loss: 0.33875737996294064
Epoch: 77, step: 68, loss: 0.3231096565723419, mean loss: 0.3387572393180968
Epoch: 77, step: 69, loss: 0.3182106614112854, mean loss: 0.33875705464303607
Epoch: 77, step: 70, loss: 0.3582841157913208, mean loss: 0.33875723015298265
Epoch: 77, step: 71, loss: 0.32202228903770447, mean loss: 0.3387570797400659
Epoch: 77, step: 72, loss: 0.341761976480484, mean loss: 0.33875710674770326
Epoch: 77, step: 73, loss: 0.3547130823135376, mean loss: 0.3387572501567339
Epoch: 77, step: 74, loss: 0.3554712235927582, mean loss: 0.3387574003771435
Epoch: 77, step: 75, loss: 0.3374980688095093, mean loss: 0.33875738905873354
Epoch: 77, step: 76, loss: 0.33189627528190613, mean loss: 0.338757327394115
Epoch: 77, step: 77, loss: 0.3496462106704712, mean loss: 0.33875742525764274
Epoch: 77, step: 78, loss: 0.3306978940963745, mean loss: 0.3387573528234874
Epoch: 77, step: 79, loss: 0.34065622091293335, mean loss: 0.3387573698892034
Epoch: 77, step: 80, loss: 0.3202550709247589, mean loss: 0.3387572036048029
Epoch: 77, step: 81, loss: 0.4108009338378906, mean loss: 0.3387578510724962
Epoch: 77, step: 82, loss: 0.3379186689853668, mean loss: 0.33875784353071003
Epoch: 77, step: 83, loss: 0.32343828678131104, mean loss: 0.33875770585405507
Epoch: 77, step: 84, loss: 0.32858386635780334, mean loss: 0.33875761442271507
Epoch: 77, step: 85, loss: 0.37415629625320435, mean loss: 0.33875793254448505
Epoch: 77, step: 86, loss: 0.33368104696273804, mean loss: 0.33875788691981124
Epoch: 77, step: 87, loss: 0.3252578377723694, mean loss: 0.3387577655994084
Epoch: 77, step: 88, loss: 0.30915066599845886, mean loss: 0.33875749953274953
Epoch: 77, step: 89, loss: 0.30458784103393555, mean loss: 0.33875719246703573
Epoch: 77, step: 90, loss: 0.32767945528030396, mean loss: 0.3387570929178199
Epoch: 77, step: 91, loss: 0.31651562452316284, mean loss: 0.3387568930484059
Epoch: 77, step: 92, loss: 0.3744847774505615, mean loss: 0.3387572141084647
Epoch: 77, step: 93, loss: 0.35642093420028687, mean loss: 0.3387573728378198
Epoch: 77, step: 94, loss: 0.3463737666606903, mean loss: 0.338757441279485
Epoch: 77, step: 95, loss: 0.34756097197532654, mean loss: 0.33875752038816814
Epoch: 77, step: 96, loss: 0.325774610042572, mean loss: 0.3387574037245536
Epoch: 77, step: 97, loss: 0.3384709358215332, mean loss: 0.3387574011503942
Epoch: 77, step: 98, loss: 0.3444347083568573, mean loss: 0.3387574521654023
Epoch: 77, step: 99, loss: 0.33684343099594116, mean loss: 0.3387574349665923
Epoch: 77, step: 100, loss: 0.3604932427406311, mean loss: 0.3387576302761716
Epoch: 77, step: 101, loss: 0.32587966322898865, mean loss: 0.33875751456076997
Epoch: 77, step: 102, loss: 0.3174948990345001, mean loss: 0.338757323506547
Epoch: 77, step: 103, loss: 0.3439304828643799, mean loss: 0.33875736998930733
Epoch: 77, step: 104, loss: 0.31730079650878906, mean loss: 0.33875717719574905
Epoch: 77, step: 105, loss: 0.30977684259414673, mean loss: 0.33875691680134684
Epoch: 77, step: 106, loss: 0.3521670997142792, mean loss: 0.3387570372935784
Epoch: 77, step: 107, loss: 0.3455663025379181, mean loss: 0.33875709847515945
Epoch: 77, step: 108, loss: 0.32826662063598633, mean loss: 0.3387570042185502
Epoch: 77, step: 109, loss: 0.3384575843811035, mean loss: 0.3387570015282967
Epoch: 77, step: 110, loss: 0.34694111347198486, mean loss: 0.3387570750609604
Epoch: 77, step: 111, loss: 0.30925294756889343, mean loss: 0.33875680997446006
Epoch: 77, step: 112, loss: 0.305622935295105, mean loss: 0.3387565122783506
Epoch: 77, step: 113, loss: 0.3694535195827484, mean loss: 0.33875678807759324
Epoch: 77, step: 114, loss: 0.36913490295410156, mean loss: 0.3387570610092741
Epoch: 77, step: 115, loss: 0.33347925543785095, mean loss: 0.33875701359134147
Epoch: 77, step: 116, loss: 0.3294476568698883, mean loss: 0.33875692995307977
Epoch: 77, step: 117, loss: 0.3895602524280548, mean loss: 0.338757386382405
Epoch: 77, step: 118, loss: 0.3213014006614685, mean loss: 0.3387572295550202
Epoch: 77, step: 119, loss: 0.3645265996456146, mean loss: 0.33875746106910803
Epoch: 77, step: 120, loss: 0.34546926617622375, mean loss: 0.3387575213679617
Epoch: 77, step: 121, loss: 0.3411412537097931, mean loss: 0.3387575427832195
Epoch: 77, step: 122, loss: 0.32358574867248535, mean loss: 0.3387574064822779
Epoch: 77, step: 123, loss: 0.391304612159729, mean loss: 0.33875787855362405
Epoch: 77, step: 124, loss: 0.3499510586261749, mean loss: 0.3387579791095346
Epoch: 77, step: 125, loss: 0.35354459285736084, mean loss: 0.338758111946498
Epoch: 77, step: 126, loss: 0.3402235805988312, mean loss: 0.338758125111558
Epoch: 77, step: 127, loss: 0.32608577609062195, mean loss: 0.33875801127034
Epoch: 77, step: 128, loss: 0.33723294734954834, mean loss: 0.3387579975701512
Epoch: 77, step: 129, loss: 0.33629947900772095, mean loss: 0.3387579754846074
Epoch: 77, step: 130, loss: 0.3225434720516205, mean loss: 0.33875782982660263
Epoch: 77, step: 131, loss: 0.3339422047138214, mean loss: 0.3387577865673041
Epoch: 77, step: 132, loss: 0.31626570224761963, mean loss: 0.33875758452021215
Epoch: 77, step: 133, loss: 0.3233224153518677, mean loss: 0.3387574458668537
Epoch: 77, step: 134, loss: 0.34723222255706787, mean loss: 0.3387575219946682
Epoch: 77, step: 135, loss: 0.3253484070301056, mean loss: 0.3387574015434181
Epoch: 77, step: 136, loss: 0.3749028444290161, mean loss: 0.3387577262273874
Epoch: 77, step: 137, loss: 0.3143494427204132, mean loss: 0.33875750697686635
Epoch: 77, step: 138, loss: 0.30883052945137024, mean loss: 0.3387572381563868
Epoch: 77, step: 139, loss: 0.3286969065666199, mean loss: 0.3387571477897981
Epoch: 77, step: 140, loss: 0.3214479982852936, mean loss: 0.33875699231234385
Epoch: 77, step: 141, loss: 0.35016629099845886, mean loss: 0.3387570947941429
Epoch: 77, step: 142, loss: 0.37619075179100037, mean loss: 0.33875743103164185
Epoch: 77, step: 143, loss: 0.2959088683128357, mean loss: 0.3387570461597028
Epoch: 77, step: 144, loss: 0.3436545133590698, mean loss: 0.33875709014906086
Epoch: 77, step: 145, loss: 0.3338119089603424, mean loss: 0.3387570457315317
Epoch: 77, step: 146, loss: 0.33841878175735474, mean loss: 0.338757042693278
Epoch: 77, step: 147, loss: 0.3653491139411926, mean loss: 0.3387572815384965
Epoch: 77, step: 148, loss: 0.32522380352020264, mean loss: 0.338757159984314
Epoch: 77, step: 149, loss: 0.33677470684051514, mean loss: 0.338757142178595
Epoch: 77, step: 150, loss: 0.3077770173549652, mean loss: 0.33875686392816323
Epoch: 77, step: 151, loss: 0.3392757177352905, mean loss: 0.3387568685882477
Epoch: 77, step: 152, loss: 0.32447749376296997, mean loss: 0.33875674033922154
Epoch: 77, step: 153, loss: 0.3101344406604767, mean loss: 0.33875648327270863
Epoch: 77, step: 154, loss: 0.34164395928382874, mean loss: 0.33875650920587025
Epoch: 77, step: 155, loss: 0.29920104146003723, mean loss: 0.3387561539512742
Epoch: 77, step: 156, loss: 0.33572131395339966, mean loss: 0.3387561266950885
Epoch: 77, step: 157, loss: 0.3471330404281616, mean loss: 0.3387562019282691
Epoch: 77, step: 158, loss: 0.3260924518108368, mean loss: 0.3387560881959717
Epoch: 77, step: 159, loss: 0.3379378914833069, mean loss: 0.33875608084786746
Epoch: 77, step: 160, loss: 0.3240511417388916, mean loss: 0.3387559487861596
Epoch: 77, step: 161, loss: 0.3179677724838257, mean loss: 0.33875576209396113
Epoch: 77, step: 162, loss: 0.3379846513271332, mean loss: 0.33875575516891543
Epoch: 77, step: 163, loss: 0.31451311707496643, mean loss: 0.33875553745717163
Epoch: 77, step: 164, loss: 0.32078760862350464, mean loss: 0.338755376097093
Epoch: 77, step: 165, loss: 0.32871004939079285, mean loss: 0.33875528588635334
Epoch: 77, step: 166, loss: 0.313480406999588, mean loss: 0.338755058910655
Epoch: 77, step: 167, loss: 0.3323632776737213, mean loss: 0.3387550015111324
Epoch: 77, step: 168, loss: 0.3542313575744629, mean loss: 0.33875514049077504
Epoch: 77, step: 169, loss: 0.3840496838092804, mean loss: 0.3387555472378729
Epoch: 77, step: 170, loss: 0.3259503245353699, mean loss: 0.3387554322474123
Epoch: 77, step: 171, loss: 0.3233526051044464, mean loss: 0.338755293931795
Epoch: 77, step: 172, loss: 0.3452378213405609, mean loss: 0.3387553521436233
Epoch: 77, step: 173, loss: 0.32902106642723083, mean loss: 0.33875526473242634
Epoch: 77, step: 174, loss: 0.3356546461582184, mean loss: 0.338755236889978
Epoch: 77, step: 175, loss: 0.3678000271320343, mean loss: 0.3387554976994877
Epoch: 77, step: 176, loss: 0.3732384741306305, mean loss: 0.3387558073387499
Epoch: 77, step: 177, loss: 0.30011364817619324, mean loss: 0.33875546035529747
Epoch: 77, step: 178, loss: 0.36573731899261475, mean loss: 0.33875570263405724
Epoch: 77, step: 179, loss: 0.29481205344200134, mean loss: 0.3387553080534848
Epoch: 77, step: 180, loss: 0.33837440609931946, mean loss: 0.33875530463330544
Epoch: 77, step: 181, loss: 0.3272152841091156, mean loss: 0.3387552010145524
Epoch: 77, step: 182, loss: 0.3645496964454651, mean loss: 0.3387554326232785
Epoch: 77, step: 183, loss: 0.3012065887451172, mean loss: 0.338755095475307
Epoch: 77, step: 184, loss: 0.34064799547195435, mean loss: 0.3387551124713473
Epoch: 77, step: 185, loss: 0.324645072221756, mean loss: 0.33875498578073504
Epoch: 77, step: 186, loss: 0.36948785185813904, mean loss: 0.3387552617211712
Epoch: 77, step: 187, loss: 0.31798818707466125, mean loss: 0.33875507526201803
Epoch: 77, step: 188, loss: 0.34931477904319763, mean loss: 0.33875517007247063
Epoch: 77, step: 189, loss: 0.3295557498931885, mean loss: 0.3387550874760855
Epoch: 77, step: 190, loss: 0.3243735730648041, mean loss: 0.33875495835376973
Epoch: 77, step: 191, loss: 0.30667299032211304, mean loss: 0.33875467031311585
Epoch: 77, step: 192, loss: 0.3302893340587616, mean loss: 0.33875459430970184
Epoch: 77, step: 193, loss: 0.2893276512622833, mean loss: 0.33875415054910274
Epoch: 77, step: 194, loss: 0.32400256395339966, mean loss: 0.33875401810890454
Epoch: 77, step: 195, loss: 0.3298782408237457, mean loss: 0.3387539384226185
Epoch: 77, step: 196, loss: 0.3252428472042084, mean loss: 0.338753817121804
Epoch: 77, step: 197, loss: 0.34432920813560486, mean loss: 0.33875386717648787
Epoch: 77, step: 198, loss: 0.287259966135025, mean loss: 0.3387534048792625
Epoch: 77, step: 199, loss: 0.418892502784729, mean loss: 0.3387541243382518
Epoch: 77, step: 200, loss: 0.30988258123397827, mean loss: 0.3387538651426122
Epoch: 77, step: 201, loss: 0.3348323404788971, mean loss: 0.33875382993725567
Epoch: 77, step: 202, loss: 0.32075390219688416, mean loss: 0.338753668344957
Epoch: 77, step: 203, loss: 0.3278685510158539, mean loss: 0.33875357062593475
Epoch: 77, step: 204, loss: 0.33601054549217224, mean loss: 0.33875354600118157
Epoch: 77, step: 205, loss: 0.3250262439250946, mean loss: 0.3387534227692115
Epoch: 77, step: 206, loss: 0.32452988624572754, mean loss: 0.33875329508361945
Epoch: 77, step: 207, loss: 0.31488242745399475, mean loss: 0.3387530807952462
Epoch: 77, step: 208, loss: 0.2992967963218689, mean loss: 0.3387527266000302
Epoch: 77, step: 209, loss: 0.32399776577949524, mean loss: 0.3387525941473756
Epoch: 77, step: 210, loss: 0.34473273158073425, mean loss: 0.338752647829522
Epoch: 77, step: 211, loss: 0.3689737021923065, mean loss: 0.3387529191136725
Epoch: 77, step: 212, loss: 0.3426288068294525, mean loss: 0.33875295390588905
Epoch: 77, step: 213, loss: 0.3262091279029846, mean loss: 0.3387528413062409
Epoch: 77, step: 214, loss: 0.34062984585762024, mean loss: 0.3387528581550201
Epoch: 77, step: 215, loss: 0.3221387267112732, mean loss: 0.3387527090209545
Epoch: 77, step: 216, loss: 0.4297112822532654, mean loss: 0.3387535254885568
Epoch: 77, step: 217, loss: 0.32801562547683716, mean loss: 0.3387534291032633
Epoch: 77, step: 218, loss: 0.3402736783027649, mean loss: 0.338753442749167
Epoch: 77, step: 219, loss: 0.31553253531455994, mean loss: 0.33875323431792836
Epoch: 77, step: 220, loss: 0.3564833402633667, mean loss: 0.33875339346221606
Epoch: 77, step: 221, loss: 0.41413450241088867, mean loss: 0.33875407007211594
Epoch: 77, step: 222, loss: 0.3353774845600128, mean loss: 0.3387540397646462
Epoch: 77, step: 223, loss: 0.31960341334342957, mean loss: 0.33875386787448697
Epoch: 77, step: 224, loss: 0.33224353194236755, mean loss: 0.3387538094402295
Epoch: 77, step: 225, loss: 0.3053775727748871, mean loss: 0.33875350987072594
Epoch: 77, step: 226, loss: 0.36487507820129395, mean loss: 0.33875374432361227
Epoch: 77, step: 227, loss: 0.3260470926761627, mean loss: 0.3387536302766922
Epoch: 77, step: 228, loss: 0.3857363164424896, mean loss: 0.3387540519599736
Epoch: 77, step: 229, loss: 0.34849774837493896, mean loss: 0.3387541394116997
Epoch: 77, step: 230, loss: 0.314598947763443, mean loss: 0.3387539226157165
Epoch: 77, step: 231, loss: 0.34200039505958557, mean loss: 0.33875395175296696
Epoch: 77, step: 232, loss: 0.36544060707092285, mean loss: 0.3387541912648661
Epoch: 77, step: 233, loss: 0.32601243257522583, mean loss: 0.3387540769090056
Epoch: 77, step: 234, loss: 0.35080426931381226, mean loss: 0.33875418505716537
Epoch: 77, step: 235, loss: 0.3181164860725403, mean loss: 0.3387539998394476
Epoch: 77, step: 236, loss: 0.310026079416275, mean loss: 0.3387537420165136
Epoch: 77, step: 237, loss: 0.3587439954280853, mean loss: 0.3387539214203638
Epoch: 77, step: 238, loss: 0.3121018707752228, mean loss: 0.33875368223192076
Epoch: 77, step: 239, loss: 0.3203498423099518, mean loss: 0.3387535170684078
Epoch: 77, step: 240, loss: 0.3250468969345093, mean loss: 0.3387533940607515
Epoch: 77, step: 241, loss: 0.3099539875984192, mean loss: 0.33875313560785314
Epoch: 77, step: 242, loss: 0.2663824260234833, mean loss: 0.3387524861412811
Epoch: 77, step: 243, loss: 0.34077173471450806, mean loss: 0.3387525042621851
Epoch: 77, step: 244, loss: 0.33657780289649963, mean loss: 0.33875248474641
Epoch: 77, step: 245, loss: 0.37147068977355957, mean loss: 0.33875277835702283
Epoch: 77, step: 246, loss: 0.34967583417892456, mean loss: 0.33875287637879176
Epoch: 77, step: 247, loss: 0.33345574140548706, mean loss: 0.33875282884357
Epoch: 77, step: 248, loss: 0.38414767384529114, mean loss: 0.3387532362023916
Epoch: 77, step: 249, loss: 0.30871349573135376, mean loss: 0.3387529666377864
Epoch: 77, step: 250, loss: 0.38146862387657166, mean loss: 0.33875334994755446
Epoch: 77, step: 251, loss: 0.3006576597690582, mean loss: 0.3387530080982169
Epoch: 77, step: 252, loss: 0.33386000990867615, mean loss: 0.33875296419159195
Epoch: 77, step: 253, loss: 0.3464711010456085, mean loss: 0.3387530334485763
Epoch: 77, step: 254, loss: 0.42428940534591675, mean loss: 0.3387538009832972
Epoch: 77, step: 255, loss: 0.3293387293815613, mean loss: 0.33875371650076247
Epoch: 77, step: 256, loss: 0.3325726389884949, mean loss: 0.33875366103773125
Epoch: 77, step: 257, loss: 0.3086110055446625, mean loss: 0.3387533905690245
Epoch: 77, step: 258, loss: 0.33228227496147156, mean loss: 0.338753332504513
Epoch: 77, step: 259, loss: 0.33044174313545227, mean loss: 0.3387532579263297
Epoch: 77, step: 260, loss: 0.32474014163017273, mean loss: 0.33875313219064523
Epoch: 77, step: 261, loss: 0.32753872871398926, mean loss: 0.33875303156791325
Epoch: 77, step: 262, loss: 0.3593560755252838, mean loss: 0.3387532164298163
Epoch: 77, step: 263, loss: 0.3247837424278259, mean loss: 0.3387530910890956
Epoch: 77, step: 264, loss: 0.30867111682891846, mean loss: 0.3387528211818319
Epoch: 77, step: 265, loss: 0.30419501662254333, mean loss: 0.3387525111184465
Epoch: 77, step: 266, loss: 0.3247930407524109, mean loss: 0.3387523858708545
Epoch: 77, step: 267, loss: 0.31417936086654663, mean loss: 0.33875216539797726
Epoch: 77, step: 268, loss: 0.31564608216285706, mean loss: 0.3387519580885823
Epoch: 77, step: 269, loss: 0.37148505449295044, mean loss: 0.33875225176957785
Epoch: 77, step: 270, loss: 0.35813283920288086, mean loss: 0.3387524256504438
Epoch: 77, step: 271, loss: 0.34433799982070923, mean loss: 0.33875247576325707
Epoch: 77, step: 272, loss: 0.301417738199234, mean loss: 0.3387521408054013
Epoch: 77, step: 273, loss: 0.3432677090167999, mean loss: 0.3387521813175777
Epoch: 77, step: 274, loss: 0.3534408509731293, mean loss: 0.3387523130982552
Epoch: 77, step: 275, loss: 0.3198320269584656, mean loss: 0.3387521433547852
Epoch: 77, step: 276, loss: 0.3279535174369812, mean loss: 0.3387520464757118
Epoch: 77, step: 277, loss: 0.3366328775882721, mean loss: 0.3387520274639155
Epoch: 77, step: 278, loss: 0.3467741310596466, mean loss: 0.338752099432333
Epoch: 77, step: 279, loss: 0.3500850796699524, mean loss: 0.33875220110259024
Epoch: 77, step: 280, loss: 0.3441706895828247, mean loss: 0.3387522497124143
Epoch: 77, step: 281, loss: 0.36533474922180176, mean loss: 0.3387524881846446
Epoch: 77, step: 282, loss: 0.29190847277641296, mean loss: 0.3387520679496471
Epoch: 77, step: 283, loss: 0.3503885269165039, mean loss: 0.33875217233872207
Epoch: 77, step: 284, loss: 0.3565409481525421, mean loss: 0.33875233191795484
Epoch: 77, step: 285, loss: 0.30936190485954285, mean loss: 0.3387520682652012
Epoch: 77, step: 286, loss: 0.3853442072868347, mean loss: 0.338752486225632
Epoch: 77, step: 287, loss: 0.3298981785774231, mean loss: 0.33875240679770446
Epoch: 77, step: 288, loss: 0.3268284499645233, mean loss: 0.33875229983432337
Epoch: 77, step: 289, loss: 0.3503929078578949, mean loss: 0.33875240425499853
Epoch: 77, step: 290, loss: 0.3273150622844696, mean loss: 0.3387523016586174
Epoch: 77, step: 291, loss: 0.35176971554756165, mean loss: 0.3387524184276692
Epoch: 77, step: 292, loss: 0.29983919858932495, mean loss: 0.3387520693707013
Epoch: 77, step: 293, loss: 0.3582266569137573, mean loss: 0.33875224405888005
Epoch: 77, step: 294, loss: 0.3278124928474426, mean loss: 0.338752145929558
Epoch: 77, step: 295, loss: 0.3233698904514313, mean loss: 0.3387520079523103
Epoch: 77, step: 296, loss: 0.31214094161987305, mean loss: 0.33875176925592665
Epoch: 77, step: 297, loss: 0.3050985634326935, mean loss: 0.3387514673955511
Epoch: 77, step: 298, loss: 0.3160727620124817, mean loss: 0.33875126397537314
Epoch: 77, step: 299, loss: 0.3542609214782715, mean loss: 0.33875140309041246
Epoch: 77, step: 300, loss: 0.33391281962394714, mean loss: 0.3387513596907635
Epoch: 77, step: 301, loss: 0.29281365871429443, mean loss: 0.33875094765649155
Epoch: 77, step: 302, loss: 0.3408537209033966, mean loss: 0.3387509665169668
Epoch: 77, step: 303, loss: 0.3667801022529602, mean loss: 0.33875121791738777
Epoch: 77, step: 304, loss: 0.3215220868587494, mean loss: 0.3387510633863315
Epoch: 77, step: 305, loss: 0.3331986367702484, mean loss: 0.33875101358610354
Epoch: 77, step: 306, loss: 0.34208154678344727, mean loss: 0.33875104345769597
Epoch: 77, step: 307, loss: 0.33245736360549927, mean loss: 0.33875098701011175
Epoch: 77, step: 308, loss: 0.3277854025363922, mean loss: 0.3387508886614165
Epoch: 77, step: 309, loss: 0.2951592803001404, mean loss: 0.3387504976982749
Epoch: 77, step: 310, loss: 0.3364728093147278, mean loss: 0.3387504772703932
Epoch: 77, step: 311, loss: 0.3327594995498657, mean loss: 0.3387504235396513
Epoch: 77, step: 312, loss: 0.3268404006958008, mean loss: 0.3387503167242609
Epoch: 77, step: 313, loss: 0.31258127093315125, mean loss: 0.3387500820285085
Epoch: 77, step: 314, loss: 0.3155131936073303, mean loss: 0.33874987363152886
Epoch: 77, step: 315, loss: 0.2905377447605133, mean loss: 0.33874944125126566
Epoch: 77, step: 316, loss: 0.3188619315624237, mean loss: 0.33874926289594803
Epoch: 77, step: 317, loss: 0.3978080451488495, mean loss: 0.338749792542624
Epoch: 77, step: 318, loss: 0.3446301817893982, mean loss: 0.33874984527823027
Epoch: 77, step: 319, loss: 0.32528528571128845, mean loss: 0.33874972452851215
Epoch: 77, step: 320, loss: 0.3375197649002075, mean loss: 0.3387497134983744
Epoch: 77, step: 321, loss: 0.32571446895599365, mean loss: 0.3387495966008357
Epoch: 77, step: 322, loss: 0.29445555806159973, mean loss: 0.338749199384072
Epoch: 77, step: 323, loss: 0.35427945852279663, mean loss: 0.33874933865391865
Epoch: 77, step: 324, loss: 0.34803396463394165, mean loss: 0.33874942191439933
Epoch: 77, step: 325, loss: 0.3432835042476654, mean loss: 0.3387494625737097
Epoch: 77, step: 326, loss: 0.28182563185691833, mean loss: 0.33874895211475153
Epoch: 77, step: 327, loss: 0.32639551162719727, mean loss: 0.3387488413374596
Epoch: 77, step: 328, loss: 0.37264031171798706, mean loss: 0.33874914525049865
Epoch: 77, step: 329, loss: 0.33595603704452515, mean loss: 0.3387491202042442
Epoch: 77, step: 330, loss: 0.2963695526123047, mean loss: 0.3387487401831931
Epoch: 77, step: 331, loss: 0.3070562183856964, mean loss: 0.3387484559963047
Epoch: 77, step: 332, loss: 0.3053176999092102, mean loss: 0.338748156225355
Epoch: 77, step: 333, loss: 0.3364478051662445, mean loss: 0.33874813559847367
Epoch: 77, step: 334, loss: 0.3409585654735565, mean loss: 0.3387481554188683
Epoch: 77, step: 335, loss: 0.3201709985733032, mean loss: 0.338747988843451
Epoch: 77, step: 336, loss: 0.32551905512809753, mean loss: 0.33874787022490166
Epoch: 77, step: 337, loss: 0.3047344386577606, mean loss: 0.3387475652428206
Epoch: 77, step: 338, loss: 0.297977089881897, mean loss: 0.3387471996768558
Epoch: 77, step: 339, loss: 0.3086950182914734, mean loss: 0.3387469302182321
Epoch: 77, step: 340, loss: 0.3529600203037262, mean loss: 0.3387470576567466
Epoch: 77, step: 341, loss: 0.34619253873825073, mean loss: 0.3387471244144
Epoch: 77, step: 342, loss: 0.33639031648635864, mean loss: 0.3387471032829843
Epoch: 77, step: 343, loss: 0.2857397496700287, mean loss: 0.3387466280171089
Epoch: 77, step: 344, loss: 0.32426726818084717, mean loss: 0.3387464981958019
Epoch: 77, step: 345, loss: 0.3582266569137573, mean loss: 0.338746672852487
Epoch: 77, step: 346, loss: 0.45204493403434753, mean loss: 0.33874768866152616
Epoch: 77, step: 347, loss: 0.30145344138145447, mean loss: 0.33874735429193
Epoch: 77, step: 348, loss: 0.3545825481414795, mean loss: 0.3387474962644938
Epoch: 77, step: 349, loss: 0.3560878336429596, mean loss: 0.33874765173023086
Epoch: 77, step: 350, loss: 0.3768603205680847, mean loss: 0.33874799342837086
Epoch: 77, step: 351, loss: 0.3154418170452118, mean loss: 0.33874778447932674
Epoch: 77, step: 352, loss: 0.3026212155818939, mean loss: 0.3387474605933216
Epoch: 77, step: 353, loss: 0.3116569221019745, mean loss: 0.3387472177203366
Epoch: 77, step: 354, loss: 0.3543227016925812, mean loss: 0.33874735735692496
Epoch: 77, step: 355, loss: 0.3451729714870453, mean loss: 0.3387474149630188
Epoch: 77, step: 356, loss: 0.34705227613449097, mean loss: 0.33874748941603033
Epoch: 77, step: 357, loss: 0.33565616607666016, mean loss: 0.3387474617025907
Epoch: 77, step: 358, loss: 0.3204074501991272, mean loss: 0.3387472972874876
Epoch: 77, step: 359, loss: 0.327025443315506, mean loss: 0.33874719220399013
Epoch: 77, step: 360, loss: 0.33442258834838867, mean loss: 0.3387471534353427
Epoch: 77, step: 361, loss: 0.31635916233062744, mean loss: 0.3387469527361844
Epoch: 77, step: 362, loss: 0.29947629570961, mean loss: 0.33874660069400614
Epoch: 77, step: 363, loss: 0.3132303059101105, mean loss: 0.3387463719549895
Epoch: 77, step: 364, loss: 0.35411345958709717, mean loss: 0.33874650971092285
Epoch: 77, step: 365, loss: 0.3344976603984833, mean loss: 0.3387464716230971
Epoch: 77, step: 366, loss: 0.31491705775260925, mean loss: 0.3387462580117496
Epoch: 77, step: 367, loss: 0.31246957182884216, mean loss: 0.33874602246470437
Epoch: 77, step: 368, loss: 0.3102323114871979, mean loss: 0.33874576686701907
Epoch: 77, step: 369, loss: 0.3395281136035919, mean loss: 0.33874577387993376
Epoch: 77, step: 370, loss: 0.3194534182548523, mean loss: 0.3387456009458305
Epoch: 77, step: 371, loss: 0.34471628069877625, mean loss: 0.3387456544657279
Epoch: 77, step: 372, loss: 0.31696224212646484, mean loss: 0.338745459205625
Epoch: 77, step: 373, loss: 0.3251219093799591, mean loss: 0.3387453370892249
Epoch: 77, step: 374, loss: 0.32666853070259094, mean loss: 0.3387452288382242
Epoch: 77, step: 375, loss: 0.364949494600296, mean loss: 0.3387454637192411
Epoch: 77, step: 376, loss: 0.3528991937637329, mean loss: 0.3387455905845666
Epoch: 77, step: 377, loss: 0.33324187994003296, mean loss: 0.33874554125313366
Epoch: 77, step: 378, loss: 0.35035160183906555, mean loss: 0.3387456452808532
Epoch: 77, step: 379, loss: 0.32312455773353577, mean loss: 0.3387455052668031
Epoch: 77, step: 380, loss: 0.30057471990585327, mean loss: 0.33874516313964087
Epoch: 77, step: 381, loss: 0.32131341099739075, mean loss: 0.33874500689914483
Epoch: 77, step: 382, loss: 0.304902046918869, mean loss: 0.33874470356799263
Epoch: 77, step: 383, loss: 0.3178994953632355, mean loss: 0.3387445167360975
Epoch: 77, step: 384, loss: 0.3359822630882263, mean loss: 0.3387444919787311
Epoch: 77, step: 385, loss: 0.3643378019332886, mean loss: 0.3387447213629062
Epoch: 77, step: 386, loss: 0.31819626688957214, mean loss: 0.33874453719571396
Epoch: 77, step: 387, loss: 0.3531927466392517, mean loss: 0.33874466668780406
Epoch: 77, step: 388, loss: 0.33989933133125305, mean loss: 0.3387446770363942
Epoch: 77, step: 389, loss: 0.33407077193260193, mean loss: 0.3387446351472664
Epoch: 77, step: 390, loss: 0.3309491276741028, mean loss: 0.33874456528190217
Epoch: 77, step: 391, loss: 0.2928173840045929, mean loss: 0.3387441536742549
Epoch: 77, step: 392, loss: 0.3298359811306, mean loss: 0.33874407383832816
Epoch: 77, step: 393, loss: 0.34715673327445984, mean loss: 0.33874414923274154
Epoch: 77, step: 394, loss: 0.344813734292984, mean loss: 0.33874420362799046
Epoch: 77, step: 395, loss: 0.3281526267528534, mean loss: 0.338744108707779
Epoch: 77, step: 396, loss: 0.302987277507782, mean loss: 0.33874378826299517
Epoch: 77, step: 397, loss: 0.32895082235336304, mean loss: 0.3387437005013951
Epoch: 77, step: 398, loss: 0.35928478837013245, mean loss: 0.3387438845827654
Epoch: 77, step: 399, loss: 0.33066800236701965, mean loss: 0.3387438122104474
Epoch: 77, step: 400, loss: 0.3384856581687927, mean loss: 0.33874380989701114
Epoch: 77, step: 401, loss: 0.30083295702934265, mean loss: 0.3387434701635864
Epoch: 77, step: 402, loss: 0.33675071597099304, mean loss: 0.3387434523059259
Epoch: 77, step: 403, loss: 0.34907788038253784, mean loss: 0.33874354491496667
Epoch: 77, step: 404, loss: 0.30596408247947693, mean loss: 0.33874325117376036
Epoch: 77, step: 405, loss: 0.3331337869167328, mean loss: 0.3387432009070412
Epoch: 77, step: 406, loss: 0.3847906291484833, mean loss: 0.33874361353689236
Epoch: 77, step: 407, loss: 0.35467469692230225, mean loss: 0.33874375629365233
Epoch: 77, step: 408, loss: 0.3550410270690918, mean loss: 0.3387439023304703
Epoch: 77, step: 409, loss: 0.3286087214946747, mean loss: 0.33874381151181016
Epoch: 77, step: 410, loss: 0.3447648584842682, mean loss: 0.3387438654643274
Epoch: 77, step: 411, loss: 0.42780306935310364, mean loss: 0.3387446634858676
Epoch: 77, step: 412, loss: 0.32222405076026917, mean loss: 0.33874451545302986
Epoch: 77, step: 413, loss: 0.32194650173187256, mean loss: 0.3387443649358911
Epoch: 77, step: 414, loss: 0.28667470812797546, mean loss: 0.33874389837444735
Epoch: 77, step: 415, loss: 0.3285503685474396, mean loss: 0.33874380703784807
Epoch: 77, step: 416, loss: 0.3124500513076782, mean loss: 0.33874357144127326
Epoch: 77, step: 417, loss: 0.31613487005233765, mean loss: 0.33874336886523443
Epoch: 77, step: 418, loss: 0.2968107759952545, mean loss: 0.3387429931487214
Epoch: 77, step: 419, loss: 0.3301906883716583, mean loss: 0.33874291652065913
Epoch: 77, step: 420, loss: 0.3010200262069702, mean loss: 0.3387425785291861
Epoch: 77, step: 421, loss: 0.35895365476608276, mean loss: 0.33874275961579337
Epoch: 77, step: 422, loss: 0.3428923785686493, mean loss: 0.3387427967950943
Epoch: 77, step: 423, loss: 0.3300946056842804, mean loss: 0.33874271931067407
Epoch: 77, step: 424, loss: 0.33235758543014526, mean loss: 0.3387426621028768
Epoch: 77, step: 425, loss: 0.33787715435028076, mean loss: 0.3387426543484038
Epoch: 77, step: 426, loss: 0.3173069655895233, mean loss: 0.33874246229815286
Epoch: 77, step: 427, loss: 0.3458517789840698, mean loss: 0.3387425259925756
Epoch: 77, step: 428, loss: 0.3306601047515869, mean loss: 0.3387424535804767
Epoch: 77, step: 429, loss: 0.30463042855262756, mean loss: 0.3387421479664626
Epoch: 77, step: 430, loss: 0.2908634841442108, mean loss: 0.33874171901920613
Epoch: 77, step: 431, loss: 0.329719215631485, mean loss: 0.3387416381868877
Epoch: 77, step: 432, loss: 0.34725743532180786, mean loss: 0.33874171447895757
Epoch: 77, step: 433, loss: 0.3772801160812378, mean loss: 0.33874205973707516
Epoch: 77, step: 434, loss: 0.3253959119319916, mean loss: 0.3387419401725785
Epoch: 77, step: 435, loss: 0.310406357049942, mean loss: 0.338741686324095
Epoch: 77, step: 436, loss: 0.32214125990867615, mean loss: 0.3387415376080689
Epoch: 77, step: 437, loss: 0.35803869366645813, mean loss: 0.3387417104813785
Epoch: 77, step: 438, loss: 0.3615001440048218, mean loss: 0.3387419143606687
Epoch: 77, step: 439, loss: 0.3734886944293976, mean loss: 0.3387422256336474
Epoch: 77, step: 440, loss: 0.3250890076160431, mean loss: 0.33874210332476695
Epoch: 77, step: 441, loss: 0.35483846068382263, mean loss: 0.338742247518598
Epoch: 77, step: 442, loss: 0.3194151818752289, mean loss: 0.33874207438509885
Epoch: 77, step: 443, loss: 0.3592270612716675, mean loss: 0.3387422578897112
Epoch: 77, step: 444, loss: 0.2920152246952057, mean loss: 0.33874183931246976
Epoch: 77, step: 445, loss: 0.34661248326301575, mean loss: 0.33874190981647345
Epoch: 77, step: 446, loss: 0.3038979172706604, mean loss: 0.33874159769220646
Epoch: 77, step: 447, loss: 0.3503291606903076, mean loss: 0.338741701489933
Epoch: 77, step: 448, loss: 0.3682933449745178, mean loss: 0.3387419662018429
Epoch: 77, step: 449, loss: 0.3565916121006012, mean loss: 0.3387421260904641
Epoch: 77, step: 450, loss: 0.3574002683162689, mean loss: 0.3387422932197131
Epoch: 77, step: 451, loss: 0.3554249107837677, mean loss: 0.3387424426519736
Epoch: 77, step: 452, loss: 0.3389524817466736, mean loss: 0.33874244453335317
Epoch: 77, step: 453, loss: 0.3544371724128723, mean loss: 0.33874258511420874
Epoch: 77, step: 454, loss: 0.326172798871994, mean loss: 0.33874247252509665
Epoch: 77, step: 455, loss: 0.3417477011680603, mean loss: 0.3387424994430559
Epoch: 77, step: 456, loss: 0.2984420359134674, mean loss: 0.3387421384733436
Epoch: 77, step: 457, loss: 0.3268766701221466, mean loss: 0.3387420321957488
Epoch: 77, step: 458, loss: 0.33029672503471375, mean loss: 0.3387419565528102
Epoch: 77, step: 459, loss: 0.32909300923347473, mean loss: 0.33874187012987994
Epoch: 77, step: 460, loss: 0.37992390990257263, mean loss: 0.3387422389826218
Epoch: 77, step: 461, loss: 0.31265121698379517, mean loss: 0.33874200529680004
Epoch: 77, step: 462, loss: 0.2911270260810852, mean loss: 0.338741578834169
Epoch: 77, step: 463, loss: 0.3210444450378418, mean loss: 0.3387414203315556
Epoch: 77, step: 464, loss: 0.32135528326034546, mean loss: 0.33874126461574794
Epoch: 77, step: 465, loss: 0.30195778608322144, mean loss: 0.3387409351740931
Epoch: 77, step: 466, loss: 0.33091962337493896, mean loss: 0.33874086512517637
Epoch: 77, step: 467, loss: 0.318035751581192, mean loss: 0.3387406796885358
Epoch: 77, step: 468, loss: 0.32413333654403687, mean loss: 0.3387405488651826
Epoch: 77, step: 469, loss: 0.31552571058273315, mean loss: 0.33874034095497213
Epoch: 77, step: 470, loss: 0.3162168562412262, mean loss: 0.33874013923827473
Epoch: 77, step: 471, loss: 0.3175341486930847, mean loss: 0.33873994932254353
Epoch: 77, step: 472, loss: 0.39059895277023315, mean loss: 0.33874041375509784
Epoch: 77, step: 473, loss: 0.3545699417591095, mean loss: 0.33874055551798943
Epoch: 77, step: 474, loss: 0.3662559688091278, mean loss: 0.33874080193276684
Epoch: 77, step: 475, loss: 0.3921312689781189, mean loss: 0.3387412800677705
Epoch: 77, step: 476, loss: 0.31788888573646545, mean loss: 0.33874109332712365
Epoch: 77, step: 477, loss: 0.34042492508888245, mean loss: 0.33874110840630406
Epoch: 77, step: 478, loss: 0.29596778750419617, mean loss: 0.33874072536278266
Epoch: 77, step: 479, loss: 0.33068904280662537, mean loss: 0.3387406532590237
Epoch: 77, step: 480, loss: 0.32862260937690735, mean loss: 0.33874056265156877
Epoch: 77, step: 481, loss: 0.3414539396762848, mean loss: 0.3387405869497422
Epoch: 77, step: 482, loss: 0.3250958323478699, mean loss: 0.3387404647626515
Epoch: 77, step: 483, loss: 0.31781941652297974, mean loss: 0.3387402774189285
Epoch: 77, step: 484, loss: 0.36157533526420593, mean loss: 0.33874048190038636
Epoch: 77, step: 485, loss: 0.3263106644153595, mean loss: 0.3387403705958975
Epoch: 77, step: 486, loss: 0.32185113430023193, mean loss: 0.33874021936029153
Epoch: 77, step: 487, loss: 0.32653215527534485, mean loss: 0.3387401100434814
Epoch: 77, step: 488, loss: 0.3479633033275604, mean loss: 0.3387401926315997
Epoch: 77, step: 489, loss: 0.362077921628952, mean loss: 0.33874040160497854
Epoch: 77, step: 490, loss: 0.3167421519756317, mean loss: 0.33874020462748383
Epoch: 77, step: 491, loss: 0.31198620796203613, mean loss: 0.3387399650680581
Epoch: 77, step: 492, loss: 0.3230888545513153, mean loss: 0.33873982492684773
Epoch: 77, step: 493, loss: 0.3774697482585907, mean loss: 0.33874017171436344
Epoch: 77, step: 494, loss: 0.3643229603767395, mean loss: 0.3387404007804582
Epoch: 77, step: 495, loss: 0.31458207964897156, mean loss: 0.3387401844708603
Epoch: 77, step: 496, loss: 0.40384814143180847, mean loss: 0.33874076743148135
Epoch: 77, step: 497, loss: 0.37318283319473267, mean loss: 0.33874107581449947
Epoch: 77, step: 498, loss: 0.34548795223236084, mean loss: 0.3387411362232885
Epoch: 77, step: 499, loss: 0.33422693610191345, mean loss: 0.3387410958053374
Epoch: 77, step: 500, loss: 0.32313287258148193, mean loss: 0.33874095605815346
Epoch: 77, step: 501, loss: 0.30669668316841125, mean loss: 0.33874066915446566
Epoch: 77, step: 502, loss: 0.41431924700737, mean loss: 0.33874134583009624
Epoch: 77, step: 503, loss: 0.30868589878082275, mean loss: 0.3387410767378869
Epoch: 77, step: 504, loss: 0.3575518727302551, mean loss: 0.33874124515306053
Epoch: 77, step: 505, loss: 0.3212917745113373, mean loss: 0.33874108892738464
Epoch: 77, step: 506, loss: 0.37627145648002625, mean loss: 0.3387414249349727
Epoch: 77, step: 507, loss: 0.3317401707172394, mean loss: 0.3387413622536393
Epoch: 77, step: 508, loss: 0.3350183069705963, mean loss: 0.3387413289219
Epoch: 77, step: 509, loss: 0.3829894959926605, mean loss: 0.33874172506298644
Epoch: 77, step: 510, loss: 0.3650515675544739, mean loss: 0.3387419606053144
Epoch: 77, step: 511, loss: 0.3225036561489105, mean loss: 0.3387418152310579
Epoch: 77, step: 512, loss: 0.3268410861492157, mean loss: 0.338741708690122
Epoch: 77, step: 513, loss: 0.3167993128299713, mean loss: 0.33874151225321075
Epoch: 77, step: 514, loss: 0.3228273391723633, mean loss: 0.3387413697845834
Epoch: 77, step: 515, loss: 0.3441064953804016, mean loss: 0.3387414178144265
Epoch: 77, step: 516, loss: 0.3553520441055298, mean loss: 0.3387415665152572
Epoch: 77, step: 517, loss: 0.3473881781101227, mean loss: 0.3387416439203348
Epoch: 77, step: 518, loss: 0.34246790409088135, mean loss: 0.3387416772777803
Epoch: 77, step: 519, loss: 0.3189442753791809, mean loss: 0.33874150005321363
Epoch: 77, step: 520, loss: 0.30847665667533875, mean loss: 0.3387412291274746
Epoch: 77, step: 521, loss: 0.31748276948928833, mean loss: 0.33874103882705714
Epoch: 77, step: 522, loss: 0.3712526559829712, mean loss: 0.33874132986032296
Epoch: 77, step: 523, loss: 0.32672011852264404, mean loss: 0.33874122225137016
Epoch: 77, step: 524, loss: 0.3105795979499817, mean loss: 0.33874097016231786
Epoch: 77, step: 525, loss: 0.3023836314678192, mean loss: 0.33874064471216214
Epoch: 77, step: 526, loss: 0.3038751184940338, mean loss: 0.3387403326186544
Epoch: 77, step: 527, loss: 0.3122366666793823, mean loss: 0.3387400953772034
Epoch: 77, step: 528, loss: 0.29740265011787415, mean loss: 0.33873972535791125
Epoch: 77, step: 529, loss: 0.3121301531791687, mean loss: 0.3387394871727291
Epoch: 77, step: 530, loss: 0.2918700873851776, mean loss: 0.33873906764337613
Epoch: 77, step: 531, loss: 0.39459696412086487, mean loss: 0.3387395676245476
Epoch: 77, step: 532, loss: 0.35400936007499695, mean loss: 0.33873970430245465
Epoch: 77, step: 533, loss: 0.3260234296321869, mean loss: 0.33873959048176877
Epoch: 77, step: 534, loss: 0.32950595021247864, mean loss: 0.3387395078341468
Epoch: 77, step: 535, loss: 0.32654067873954773, mean loss: 0.33873939864696145
Epoch: 77, step: 536, loss: 0.32644355297088623, mean loss: 0.3387392885924018
Epoch: 77, step: 537, loss: 0.33824893832206726, mean loss: 0.3387392842035374
Epoch: 77, step: 538, loss: 0.3186594843864441, mean loss: 0.33873910448153804
Epoch: 77, step: 539, loss: 0.33712294697761536, mean loss: 0.33873909001643077
Epoch: 77, step: 540, loss: 0.3308945298194885, mean loss: 0.33873901980583015
Epoch: 77, step: 541, loss: 0.3455222249031067, mean loss: 0.3387390805165175
Epoch: 77, step: 542, loss: 0.32335910201072693, mean loss: 0.3387389428646706
Epoch: 77, step: 543, loss: 0.3229929208755493, mean loss: 0.33873880193797107
Epoch: 77, step: 544, loss: 0.29701370000839233, mean loss: 0.33873842850217384
Epoch: 77, step: 545, loss: 0.304007351398468, mean loss: 0.3387381176650329
Epoch: 77, step: 546, loss: 0.36369049549102783, mean loss: 0.33873834098250577
Epoch: 77, step: 547, loss: 0.3773234188556671, mean loss: 0.3387386863061067
Epoch: 77, step: 548, loss: 0.3037279546260834, mean loss: 0.3387383729745184
Epoch: 77, step: 549, loss: 0.29102641344070435, mean loss: 0.3387379459760082
Epoch: 77, step: 550, loss: 0.33695870637893677, mean loss: 0.3387379300528337
Epoch: 77, step: 551, loss: 0.33368271589279175, mean loss: 0.33873788481196954
Epoch: 77, step: 552, loss: 0.3315792977809906, mean loss: 0.3387378207478657
Epoch: 77, step: 553, loss: 0.3647158145904541, mean loss: 0.33873805322977796
Epoch: 77, step: 554, loss: 0.3038587272167206, mean loss: 0.3387377410909772
Epoch: 77, step: 555, loss: 0.28560659289360046, mean loss: 0.3387372656189322
Epoch: 77, step: 556, loss: 0.3269163966178894, mean loss: 0.3387371598346107
Epoch: 77, step: 557, loss: 0.33852890133857727, mean loss: 0.3387371579709333
Epoch: 77, step: 558, loss: 0.31732460856437683, mean loss: 0.33873696635460887
Epoch: 77, step: 559, loss: 0.3656134009361267, mean loss: 0.3387372068639207
Epoch: 77, step: 560, loss: 0.3518645763397217, mean loss: 0.3387373243358397
Epoch: 77, step: 561, loss: 0.3298458158969879, mean loss: 0.33873724476976863
Epoch: 77, step: 562, loss: 0.3409420847892761, mean loss: 0.3387372644997041
Epoch: 77, step: 563, loss: 0.35666143894195557, mean loss: 0.33873742489213055
Epoch: 77, step: 564, loss: 0.32260847091674805, mean loss: 0.33873728056532076
Epoch: 77, step: 565, loss: 0.3271912932395935, mean loss: 0.33873717724922175
Epoch: 77, step: 566, loss: 0.3367657959461212, mean loss: 0.338737159609015
Epoch: 77, step: 567, loss: 0.32829445600509644, mean loss: 0.33873706616701993
Epoch: 77, step: 568, loss: 0.3128935396671295, mean loss: 0.3387368349195231
Epoch: 77, step: 569, loss: 0.3113009035587311, mean loss: 0.33873658942540763
Epoch: 77, step: 570, loss: 0.32809552550315857, mean loss: 0.33873649421102736
Epoch: 77, step: 571, loss: 0.32087552547454834, mean loss: 0.33873633439563067
Epoch: 77, step: 572, loss: 0.27280640602111816, mean loss: 0.33873574447671106
Epoch: 77, step: 573, loss: 0.33807021379470825, mean loss: 0.3387357385218187
Epoch: 77, step: 574, loss: 0.29866620898246765, mean loss: 0.33873537999950326
Epoch: 77, step: 575, loss: 0.3090338110923767, mean loss: 0.33873511424694513
Epoch: 77, step: 576, loss: 0.34043195843696594, mean loss: 0.3387351294291953
Epoch: 77, step: 577, loss: 0.327310711145401, mean loss: 0.3387350272118995
Epoch: 77, step: 578, loss: 0.31301620602607727, mean loss: 0.33873479710085436
Epoch: 77, step: 579, loss: 0.3301211893558502, mean loss: 0.33873472003400384
Epoch: 77, step: 580, loss: 0.3841968774795532, mean loss: 0.3387351267850479
Epoch: 77, step: 581, loss: 0.34047091007232666, mean loss: 0.33873514231500484
Epoch: 77, step: 582, loss: 0.3233257532119751, mean loss: 0.3387350044492874
Epoch: 77, step: 583, loss: 0.3248017728328705, mean loss: 0.3387348797916664
Epoch: 77, step: 584, loss: 0.32463622093200684, mean loss: 0.338734753655132
Epoch: 77, step: 585, loss: 0.3166846036911011, mean loss: 0.3387345563807215
Epoch: 77, step: 586, loss: 0.3504185378551483, mean loss: 0.33873466091198046
Epoch: 77, step: 587, loss: 0.3105132579803467, mean loss: 0.338734408430205
Epoch: 77, step: 588, loss: 0.31980353593826294, mean loss: 0.33873423906734423
Epoch: 77, step: 589, loss: 0.3602442443370819, mean loss: 0.33873443150239646
Epoch: 77, step: 590, loss: 0.3877950608730316, mean loss: 0.33873487040978845
Epoch: 77, step: 591, loss: 0.40989819169044495, mean loss: 0.33873550704712324
Epoch: 77, step: 592, loss: 0.37388283014297485, mean loss: 0.3387358214773314
Epoch: 77, step: 593, loss: 0.3423822224140167, mean loss: 0.33873585409797635
Epoch: 77, step: 594, loss: 0.3624912202358246, mean loss: 0.3387360666112041
Epoch: 77, step: 595, loss: 0.3055986762046814, mean loss: 0.3387357701699387
Epoch: 77, step: 596, loss: 0.3332236707210541, mean loss: 0.3387357208601078
Epoch: 77, step: 597, loss: 0.35772475600242615, mean loss: 0.33873589072963656
Epoch: 77, step: 598, loss: 0.3278484046459198, mean loss: 0.3387357933347151
Epoch: 77, step: 599, loss: 0.36719968914985657, mean loss: 0.3387360479586087
Epoch: 77, step: 600, loss: 0.309787780046463, mean loss: 0.3387357890040791
Epoch: 77, step: 601, loss: 0.36479657888412476, mean loss: 0.33873602212680815
Epoch: 77, step: 602, loss: 0.32890141010284424, mean loss: 0.3387359341536079
Epoch: 77, step: 603, loss: 0.37473541498184204, mean loss: 0.3387362561755847
Epoch: 77, step: 604, loss: 0.3254113793373108, mean loss: 0.338736136983177
Epoch: 77, step: 605, loss: 0.30395394563674927, mean loss: 0.3387358258556447
Epoch: 77, step: 606, loss: 0.32571977376937866, mean loss: 0.3387357094277894
Epoch: 77, step: 607, loss: 0.34084269404411316, mean loss: 0.33873572827447995
Epoch: 77, step: 608, loss: 0.3091651499271393, mean loss: 0.33873546377204833
Epoch: 77, step: 609, loss: 0.3939034640789032, mean loss: 0.33873595723347255
Epoch: 77, step: 610, loss: 0.3832635283470154, mean loss: 0.3387363555158464
Epoch: 77, step: 611, loss: 0.3336247205734253, mean loss: 0.3387363097946036
Epoch: 77, step: 612, loss: 0.3193044066429138, mean loss: 0.33873613598664887
Epoch: 77, step: 613, loss: 0.3507709801197052, mean loss: 0.33873624363091404
Epoch: 77, step: 614, loss: 0.30299922823905945, mean loss: 0.33873592398819075
Epoch: 77, step: 615, loss: 0.31923604011535645, mean loss: 0.3387357495768649
Epoch: 77, step: 616, loss: 0.32991570234298706, mean loss: 0.33873567068909394
Epoch: 77, step: 617, loss: 0.3795692026615143, mean loss: 0.3387360359068101
Epoch: 77, step: 618, loss: 0.37015941739082336, mean loss: 0.338736316957026
Epoch: 77, step: 619, loss: 0.3252575099468231, mean loss: 0.33873619640387226
Epoch: 77, step: 620, loss: 0.3697785437107086, mean loss: 0.33873647404115825
Epoch: 77, step: 621, loss: 0.35852259397506714, mean loss: 0.33873665100314676
Epoch: 77, step: 622, loss: 0.3018973171710968, mean loss: 0.3387363215245281
Epoch: 77, step: 623, loss: 0.3351053297519684, mean loss: 0.3387362890504486
Epoch: 77, step: 624, loss: 0.3040052354335785, mean loss: 0.33873597843313563
Epoch: 77, step: 625, loss: 0.32439741492271423, mean loss: 0.338735850197284
Epoch: 77, step: 626, loss: 0.3060176968574524, mean loss: 0.3387355575875864
Epoch: 77, step: 627, loss: 0.3187722861766815, mean loss: 0.33873537905078116
Epoch: 77, step: 628, loss: 0.3407478928565979, mean loss: 0.33873539704906236
Epoch: 77, step: 629, loss: 0.29900923371315, mean loss: 0.3387350417738532
Epoch: 77, step: 630, loss: 0.3028702139854431, mean loss: 0.3387347210338378
Epoch: 77, step: 631, loss: 0.29458296298980713, mean loss: 0.33873432618713734
Epoch: 77, step: 632, loss: 0.3225272297859192, mean loss: 0.33873418124927773
Epoch: 77, step: 633, loss: 0.32634615898132324, mean loss: 0.33873407046586956
Epoch: 77, step: 634, loss: 0.307872474193573, mean loss: 0.3387337944797462
Epoch: 77, step: 635, loss: 0.4254540205001831, mean loss: 0.33873456998613144
Epoch: 77, step: 636, loss: 0.32646575570106506, mean loss: 0.338734460271718
Epoch: 77, step: 637, loss: 0.3289051949977875, mean loss: 0.33873437237386533
Epoch: 77, step: 638, loss: 0.32000312209129333, mean loss: 0.3387342048718284
Epoch: 77, step: 639, loss: 0.3899785578250885, mean loss: 0.3387346631144238
Epoch: 77, step: 640, loss: 0.3426327705383301, mean loss: 0.3387346979721747
Epoch: 77, step: 641, loss: 0.3642217814922333, mean loss: 0.338734925881354
Epoch: 77, step: 642, loss: 0.351615846157074, mean loss: 0.3387350410633722
Epoch: 77, step: 643, loss: 0.3321326673030853, mean loss: 0.33873498202504904
Epoch: 77, step: 644, loss: 0.2997020184993744, mean loss: 0.3387346329960189
Epoch: 77, step: 645, loss: 0.316621333360672, mean loss: 0.3387344352627747
Epoch: 77, step: 646, loss: 0.3215372562408447, mean loss: 0.3387342814899932
Epoch: 77, step: 647, loss: 0.2985210418701172, mean loss: 0.3387339219166928
Epoch: 77, step: 648, loss: 0.3003285527229309, mean loss: 0.338733578511834
Epoch: 77, step: 649, loss: 0.33585354685783386, mean loss: 0.3387335527600175
Epoch: 77, step: 650, loss: 0.2982047498226166, mean loss: 0.3387331903747768
Epoch: 77, step: 651, loss: 0.36782726645469666, mean loss: 0.338733450514942
Epoch: 77, step: 652, loss: 0.3509291112422943, mean loss: 0.3387335595595744
Epoch: 77, step: 653, loss: 0.3519476354122162, mean loss: 0.3387336777090697
Epoch: 77, step: 654, loss: 0.3537306785583496, mean loss: 0.3387338117988281
Epoch: 77, step: 655, loss: 0.30428001284599304, mean loss: 0.33873350374655037
Epoch: 77, step: 656, loss: 0.301514208316803, mean loss: 0.33873317097087485
Epoch: 77, step: 657, loss: 0.3118014633655548, mean loss: 0.33873293017810974
Epoch: 77, step: 658, loss: 0.30037668347358704, mean loss: 0.33873258724314764
Epoch: 77, step: 659, loss: 0.3118387460708618, mean loss: 0.3387323467932409
Epoch: 77, step: 660, loss: 0.3357751667499542, mean loss: 0.33873232035420214
Epoch: 77, step: 661, loss: 0.30990272760391235, mean loss: 0.33873206260192007
Epoch: 77, step: 662, loss: 0.33222895860671997, mean loss: 0.33873200446114354
Epoch: 77, step: 663, loss: 0.33153384923934937, mean loss: 0.3387319401068609
Epoch: 77, step: 664, loss: 0.34278950095176697, mean loss: 0.33873197638269475
Epoch: 77, step: 665, loss: 0.36660251021385193, mean loss: 0.33873222555155624
Epoch: 77, step: 666, loss: 0.33358117938041687, mean loss: 0.3387321795004528
Epoch: 77, step: 667, loss: 0.3088734447956085, mean loss: 0.3387319125613999
Epoch: 77, step: 668, loss: 0.35019364953041077, mean loss: 0.3387320150291665
Epoch: 77, step: 669, loss: 0.32501843571662903, mean loss: 0.33873189243105717
Epoch: 77, step: 670, loss: 0.3340933918952942, mean loss: 0.3387318509636693
Epoch: 77, step: 671, loss: 0.3153665065765381, mean loss: 0.3387316420834227
Epoch: 77, step: 672, loss: 0.3036508560180664, mean loss: 0.3387313284729055
Epoch: 77, step: 673, loss: 0.3744564354419708, mean loss: 0.33873164784058146
Epoch: 77, step: 674, loss: 0.33232855796813965, mean loss: 0.3387315906001188
Epoch: 77, step: 675, loss: 0.330938458442688, mean loss: 0.3387315209339871
Epoch: 77, step: 676, loss: 0.32124486565589905, mean loss: 0.33873136461471587
Epoch: 77, step: 677, loss: 0.295886367559433, mean loss: 0.33873098161186377
Epoch: 77, step: 678, loss: 0.2998652756214142, mean loss: 0.3387306341840612
Epoch: 77, step: 679, loss: 0.32175999879837036, mean loss: 0.3387304824817389
Epoch: 77, step: 680, loss: 0.32374289631843567, mean loss: 0.3387303485073031
Epoch: 77, step: 681, loss: 0.3537733852863312, mean loss: 0.33873048297621144
Epoch: 77, step: 682, loss: 0.3170822858810425, mean loss: 0.33873028946585493
Epoch: 77, step: 683, loss: 0.29710906744003296, mean loss: 0.33872991742260883
Epoch: 77, step: 684, loss: 0.3557640612125397, mean loss: 0.338730069685834
Epoch: 77, step: 685, loss: 0.330759197473526, mean loss: 0.3387299984371774
Epoch: 77, step: 686, loss: 0.3344085216522217, mean loss: 0.3387299598094519
Epoch: 77, step: 687, loss: 0.3203083276748657, mean loss: 0.33872979514829016
Epoch: 77, step: 688, loss: 0.3311813771724701, mean loss: 0.33872972767760384
Epoch: 77, step: 689, loss: 0.3178926110267639, mean loss: 0.33872954142904155
Epoch: 77, step: 690, loss: 0.3332240879535675, mean loss: 0.33872949222004367
Epoch: 77, step: 691, loss: 0.29874712228775024, mean loss: 0.3387291348517032
Epoch: 77, step: 692, loss: 0.3058754801750183, mean loss: 0.3387288412034995
Epoch: 77, step: 693, loss: 0.3030390441417694, mean loss: 0.3387285222085132
Epoch: 77, step: 694, loss: 0.3515753149986267, mean loss: 0.33872863703196976
Epoch: 77, step: 695, loss: 0.3124871850013733, mean loss: 0.33872840249037284
Epoch: 77, step: 696, loss: 0.33701208233833313, mean loss: 0.3387283871503348
Epoch: 77, step: 697, loss: 0.3012256622314453, mean loss: 0.3387280519634042
Epoch: 77, step: 698, loss: 0.3470081090927124, mean loss: 0.33872812596715024
Epoch: 77, step: 699, loss: 0.31858929991722107, mean loss: 0.3387279459762124
Epoch: 77, step: 700, loss: 0.32361865043640137, mean loss: 0.3387278109379554
Epoch: 77, step: 701, loss: 0.2994149625301361, mean loss: 0.3387274595853018
Epoch: 77, step: 702, loss: 0.38184309005737305, mean loss: 0.3387278449213027
Epoch: 77, step: 703, loss: 0.3590523302555084, mean loss: 0.3387280265650783
Epoch: 77, step: 704, loss: 0.3296840786933899, mean loss: 0.3387279457383253
Epoch: 77, step: 705, loss: 0.39871564507484436, mean loss: 0.33872848185017523
Epoch: 77, step: 706, loss: 0.2960946559906006, mean loss: 0.33872810083381294
Epoch: 77, step: 707, loss: 0.3193500339984894, mean loss: 0.33872792765454973
Epoch: 77, step: 708, loss: 0.33299368619918823, mean loss: 0.33872787640883756
Epoch: 77, step: 709, loss: 0.3320370316505432, mean loss: 0.33872781661469686
Epoch: 77, step: 710, loss: 0.29908815026283264, mean loss: 0.3387274623696513
Epoch: 77, step: 711, loss: 0.31685054302215576, mean loss: 0.33872726686545696
Epoch: 77, step: 712, loss: 0.33407503366470337, mean loss: 0.3387272252909116
Epoch: 77, step: 713, loss: 0.31415796279907227, mean loss: 0.338727005730381
Epoch: 77, step: 714, loss: 0.348798543214798, mean loss: 0.3387270957327713
Epoch: 77, step: 715, loss: 0.3829163610935211, mean loss: 0.33872749061825674
Epoch: 77, step: 716, loss: 0.27409735321998596, mean loss: 0.3387269130735769
Epoch: 77, step: 717, loss: 0.3089579939842224, mean loss: 0.338726647056392
Epoch: 77, step: 718, loss: 0.3655813932418823, mean loss: 0.33872688703017545
Epoch: 77, step: 719, loss: 0.3002074360847473, mean loss: 0.3387265428237653
Epoch: 77, step: 720, loss: 0.3397897779941559, mean loss: 0.3387265523246559
Epoch: 77, step: 721, loss: 0.3705139756202698, mean loss: 0.33872683636918544
Epoch: 77, step: 722, loss: 0.3162539005279541, mean loss: 0.3387266355583997
Epoch: 77, step: 723, loss: 0.31597885489463806, mean loss: 0.3387264322935071
Epoch: 77, step: 724, loss: 0.3554919362068176, mean loss: 0.3387265821018753
Epoch: 77, step: 725, loss: 0.31922435760498047, mean loss: 0.33872640784106345
Epoch: 77, step: 726, loss: 0.31267592310905457, mean loss: 0.3387261750707938
Epoch: 77, step: 727, loss: 0.3294943571090698, mean loss: 0.3387260925819811
Epoch: 77, step: 728, loss: 0.3478355407714844, mean loss: 0.3387261739766592
Epoch: 77, step: 729, loss: 0.34376654028892517, mean loss: 0.33872621901290284
Epoch: 77, step: 730, loss: 0.31482329964637756, mean loss: 0.3387260054395206
Epoch: 77, step: 731, loss: 0.3717607259750366, mean loss: 0.33872630060321374
Epoch: 77, step: 732, loss: 0.3257547914981842, mean loss: 0.3387261847044181
Epoch: 77, step: 733, loss: 0.3269438147544861, mean loss: 0.3387260794313713
Epoch: 77, step: 734, loss: 0.3027079105377197, mean loss: 0.3387257576193318
Epoch: 77, step: 735, loss: 0.3029833137989044, mean loss: 0.3387254382736703
Epoch: 77, step: 736, loss: 0.33593109250068665, mean loss: 0.338725413307436
Epoch: 77, step: 737, loss: 0.31127381324768066, mean loss: 0.3387251680418135
Epoch: 77, step: 738, loss: 0.30253687500953674, mean loss: 0.33872484472131864
Epoch: 77, step: 739, loss: 0.3139741122722626, mean loss: 0.3387246235904805
Epoch: 77, step: 740, loss: 0.35215047001838684, mean loss: 0.33872474354014886
Epoch: 77, step: 741, loss: 0.3486699163913727, mean loss: 0.33872483239186735
Epoch: 77, step: 742, loss: 0.33985933661460876, mean loss: 0.3387248425276137
Epoch: 77, step: 743, loss: 0.32526925206184387, mean loss: 0.33872472231542716
Epoch: 77, step: 744, loss: 0.3492059111595154, mean loss: 0.338724815953486
Epoch: 77, step: 745, loss: 0.32493746280670166, mean loss: 0.338724692779534
Epoch: 77, step: 746, loss: 0.31427299976348877, mean loss: 0.33872447433406994
Epoch: 77, step: 747, loss: 0.3749108612537384, mean loss: 0.3387247976115403
Epoch: 77, step: 748, loss: 0.32808294892311096, mean loss: 0.3387247025415573
Epoch: 77, step: 749, loss: 0.32650187611579895, mean loss: 0.33872459334873245
Epoch: 77, step: 750, loss: 0.3845667243003845, mean loss: 0.33872500287651947
Epoch: 77, step: 751, loss: 0.30890655517578125, mean loss: 0.3387247364976763
Epoch: 77, step: 752, loss: 0.32689791917800903, mean loss: 0.338724630845437
Epoch: 77, step: 753, loss: 0.35130345821380615, mean loss: 0.33872474321458684
Epoch: 77, step: 754, loss: 0.40026962757110596, mean loss: 0.33872529300228554
Epoch: 77, step: 755, loss: 0.35217249393463135, mean loss: 0.3387254131266418
Epoch: 77, step: 756, loss: 0.32028138637542725, mean loss: 0.3387252483669227
Epoch: 77, step: 757, loss: 0.29696124792099, mean loss: 0.3387248752941872
Epoch: 77, step: 758, loss: 0.2930224537849426, mean loss: 0.3387244670436623
Epoch: 77, step: 759, loss: 0.3508002460002899, mean loss: 0.33872457491319957
Epoch: 77, step: 760, loss: 0.32502949237823486, mean loss: 0.33872445257997164
Epoch: 77, step: 761, loss: 0.31858381628990173, mean loss: 0.33872427267254607
Epoch: 77, step: 762, loss: 0.347581684589386, mean loss: 0.3387243517911954
Epoch: 77, step: 763, loss: 0.31375476717948914, mean loss: 0.3387241287528878
Epoch: 77, step: 764, loss: 0.3254719376564026, mean loss: 0.3387240103800787
Epoch: 77, step: 765, loss: 0.3607192635536194, mean loss: 0.33872420684695953
Epoch: 77, step: 766, loss: 0.33426812291145325, mean loss: 0.33872416704450375
Epoch: 77, step: 767, loss: 0.3039482533931732, mean loss: 0.33872385642324493
Epoch: 77, step: 768, loss: 0.28892964124679565, mean loss: 0.33872341166128117
Epoch: 77, step: 769, loss: 0.3176543414592743, mean loss: 0.33872322347401274
Epoch: 77, step: 770, loss: 0.32250136137008667, mean loss: 0.3387230785829177
Epoch: 77, step: 771, loss: 0.2999374568462372, mean loss: 0.33872273215900084
Epoch: 77, step: 772, loss: 0.337137371301651, mean loss: 0.3387227179990625
Epoch: 77, step: 773, loss: 0.2950942814350128, mean loss: 0.33872232832724025
Epoch: 77, step: 774, loss: 0.34034377336502075, mean loss: 0.3387223428092123
Epoch: 77, step: 775, loss: 0.34511393308639526, mean loss: 0.33872239989533176
Epoch: 77, step: 776, loss: 0.3339858055114746, mean loss: 0.33872235759109043
Epoch: 77, step: 777, loss: 0.32563817501068115, mean loss: 0.33872224073255675
Epoch: 77, step: 778, loss: 0.3070793151855469, mean loss: 0.33872195812316697
Epoch: 77, step: 779, loss: 0.3409455120563507, mean loss: 0.33872197798200104
Epoch: 77, step: 780, loss: 0.2951781153678894, mean loss: 0.33872158908987365
Epoch: 77, step: 781, loss: 0.31047162413597107, mean loss: 0.3387213367904635
Epoch: 77, step: 782, loss: 0.35084420442581177, mean loss: 0.33872144505838675
Epoch: 77, step: 783, loss: 0.3548223376274109, mean loss: 0.3387215888523046
Epoch: 77, step: 784, loss: 0.3389425277709961, mean loss: 0.33872159082544917
Epoch: 77, step: 785, loss: 0.3024899661540985, mean loss: 0.33872126725368545
Epoch: 77, step: 786, loss: 0.33980047702789307, mean loss: 0.33872127689163833
Epoch: 77, step: 787, loss: 0.3267313838005066, mean loss: 0.3387211698160767
Epoch: 77, step: 788, loss: 0.3335668444633484, mean loss: 0.338721123785862
Epoch: 77, step: 789, loss: 0.3035135567188263, mean loss: 0.3387208093708245
Epoch: 77, step: 790, loss: 0.322455495595932, mean loss: 0.3387206641175737
Epoch: 77, step: 791, loss: 0.3375459313392639, mean loss: 0.33872065362701487
Epoch: 77, step: 792, loss: 0.3243812322616577, mean loss: 0.3387205255747438
Epoch: 77, step: 793, loss: 0.3289148509502411, mean loss: 0.3387204380100046
Epoch: 77, step: 794, loss: 0.37518033385276794, mean loss: 0.33872076359420794
Epoch: 77, step: 795, loss: 0.32869574427604675, mean loss: 0.33872067407231804
Epoch: 77, step: 796, loss: 0.33493882417678833, mean loss: 0.3387206403012782
Epoch: 77, step: 797, loss: 0.3500997722148895, mean loss: 0.33872074191337176
Epoch: 77, step: 798, loss: 0.3335469365119934, mean loss: 0.33872069571331814
Epoch: 77, step: 799, loss: 0.32063063979148865, mean loss: 0.3387205341776543
Epoch: 77, step: 800, loss: 0.3185226023197174, mean loss: 0.3387203538212634
Epoch: 77, step: 801, loss: 0.32831132411956787, mean loss: 0.33872026087519946
Epoch: 77, step: 802, loss: 0.3841862678527832, mean loss: 0.3387206668543137
Epoch: 77, step: 803, loss: 0.31304916739463806, mean loss: 0.33872043762812376
Epoch: 77, step: 804, loss: 0.3559736907482147, mean loss: 0.3387205916846551
Epoch: 77, step: 805, loss: 0.3056325316429138, mean loss: 0.3387202962397202
Epoch: 77, step: 806, loss: 0.327450156211853, mean loss: 0.33872019560897754
Epoch: 77, step: 807, loss: 0.36603793501853943, mean loss: 0.33872043952607644
Epoch: 77, step: 808, loss: 0.31435537338256836, mean loss: 0.3387202219750158
Epoch: 77, step: 809, loss: 0.35690611600875854, mean loss: 0.3387203843519692
Epoch: 77, step: 810, loss: 0.3907569646835327, mean loss: 0.33872084896844196
Epoch: 77, step: 811, loss: 0.3508765399456024, mean loss: 0.33872095750139714
Epoch: 77, step: 812, loss: 0.3554157018661499, mean loss: 0.3387211065602838
Epoch: 77, step: 813, loss: 0.3258541226387024, mean loss: 0.33872099167855024
Epoch: 77, step: 814, loss: 0.3442840576171875, mean loss: 0.3387210413474514
Epoch: 77, step: 815, loss: 0.32168594002723694, mean loss: 0.33872088925376437
Epoch: 77, step: 816, loss: 0.3743521571159363, mean loss: 0.3387212073758827
Epoch: 77, step: 817, loss: 0.3462183177471161, mean loss: 0.33872127431078236
Epoch: 77, step: 818, loss: 0.3287554979324341, mean loss: 0.33872118533619705
Epoch: 77, step: 819, loss: 0.3005833327770233, mean loss: 0.33872084484397724
Epoch: 77, step: 820, loss: 0.2996755540370941, mean loss: 0.33872049625332107
Epoch: 77, step: 821, loss: 0.3051750361919403, mean loss: 0.33872019676702464
Epoch: 77, step: 822, loss: 0.33323991298675537, mean loss: 0.33872014784072474
Epoch: 77, step: 823, loss: 0.2880100607872009, mean loss: 0.3387196951205961
Epoch: 77, step: 824, loss: 0.3315848708152771, mean loss: 0.338719631424201
Epoch: 77, step: 825, loss: 0.31001415848731995, mean loss: 0.33871937515736883
Epoch: 77, step: 826, loss: 0.3176574110984802, mean loss: 0.33871918712930066
Epoch: 77, step: 827, loss: 0.34339621663093567, mean loss: 0.33871922888252787
Epoch: 77, step: 828, loss: 0.3263247609138489, mean loss: 0.33871911823443007
Epoch: 77, step: 829, loss: 0.3222503960132599, mean loss: 0.33871897121589534
Epoch: 77, step: 830, loss: 0.3378850519657135, mean loss: 0.33871896377145067
Epoch: 77, step: 831, loss: 0.312883585691452, mean loss: 0.33871873313961637
Epoch: 77, step: 832, loss: 0.3530709147453308, mean loss: 0.3387188612600724
Epoch: 77, step: 833, loss: 0.34269124269485474, mean loss: 0.33871889672079825
Epoch: 77, step: 834, loss: 0.315211683511734, mean loss: 0.33871868687805873
Epoch: 77, step: 835, loss: 0.3412665128707886, mean loss: 0.3387187096216315
Epoch: 77, step: 836, loss: 0.3286469876766205, mean loss: 0.338718619715611
Epoch: 77, step: 837, loss: 0.34752944111824036, mean loss: 0.33871869836540125
Epoch: 77, step: 838, loss: 0.37344345450401306, mean loss: 0.3387190083331424
Epoch: 77, step: 839, loss: 0.32359325885772705, mean loss: 0.33871887331556216
Epoch: 77, step: 840, loss: 0.3863741457462311, mean loss: 0.3387192986989221
Epoch: 77, step: 841, loss: 0.33549797534942627, mean loss: 0.33871926994480844
Epoch: 77, step: 842, loss: 0.3017210364341736, mean loss: 0.3387189396948463
Epoch: 77, step: 843, loss: 0.34077906608581543, mean loss: 0.338718958083578
Epoch: 77, step: 844, loss: 0.3506595492362976, mean loss: 0.33871906466459567
Epoch: 77, step: 845, loss: 0.3177007734775543, mean loss: 0.33871887705823345
Epoch: 77, step: 846, loss: 0.2877369523048401, mean loss: 0.33871842200468094
Epoch: 77, step: 847, loss: 0.33228951692581177, mean loss: 0.33871836462218713
Epoch: 77, step: 848, loss: 0.38077840209007263, mean loss: 0.3387187400342159
Epoch: 77, step: 849, loss: 0.32576924562454224, mean loss: 0.3387186244529452
Epoch: 77, step: 850, loss: 0.31419289112091064, mean loss: 0.33871840554940863
Epoch: 77, step: 851, loss: 0.3588992953300476, mean loss: 0.3387185856715952
Epoch: 77, step: 852, loss: 0.3234735131263733, mean loss: 0.3387184496046862
Epoch: 77, step: 853, loss: 0.30584755539894104, mean loss: 0.3387181562245769
Epoch: 77, step: 854, loss: 0.30751100182533264, mean loss: 0.33871787769620476
Epoch: 77, step: 855, loss: 0.3510603606700897, mean loss: 0.33871798785366947
Epoch: 77, step: 856, loss: 0.3437362313270569, mean loss: 0.3387180326414197
Epoch: 77, step: 857, loss: 0.31151270866394043, mean loss: 0.3387177898364648
Epoch: 77, step: 858, loss: 0.3195039629936218, mean loss: 0.3387176183563998
Epoch: 77, step: 859, loss: 0.34389421343803406, mean loss: 0.33871766455619884
Epoch: 77, step: 860, loss: 0.3321313261985779, mean loss: 0.338717605775323
Epoch: 77, step: 861, loss: 0.32220378518104553, mean loss: 0.33871745839629047
Epoch: 77, step: 862, loss: 0.3083828091621399, mean loss: 0.3387171876744831
Epoch: 77, step: 863, loss: 0.3378170430660248, mean loss: 0.3387171796412074
Epoch: 77, step: 864, loss: 0.37141919136047363, mean loss: 0.3387174714853501
Epoch: 77, step: 865, loss: 0.30673766136169434, mean loss: 0.338717186088933
Epoch: 77, step: 866, loss: 0.33678483963012695, mean loss: 0.3387171688443079
Epoch: 77, step: 867, loss: 0.3811459243297577, mean loss: 0.33871754748316246
Epoch: 77, step: 868, loss: 0.34147122502326965, mean loss: 0.3387175720570627
Epoch: 77, step: 869, loss: 0.3164181113243103, mean loss: 0.33871737305778793
Epoch: 77, step: 870, loss: 0.32779332995414734, mean loss: 0.3387172755730424
Epoch: 77, step: 871, loss: 0.33087578415870667, mean loss: 0.33871720559721324
Epoch: 77, step: 872, loss: 0.3478870689868927, mean loss: 0.3387172874264258
Epoch: 77, step: 873, loss: 0.32870590686798096, mean loss: 0.33871719808855427
Epoch: 77, step: 874, loss: 0.3294404447078705, mean loss: 0.33871711530696375
Epoch: 77, step: 875, loss: 0.3136373460292816, mean loss: 0.3387168915083373
Epoch: 77, step: 876, loss: 0.298829048871994, mean loss: 0.33871653557345455
Epoch: 77, step: 877, loss: 0.3247372508049011, mean loss: 0.3387164108319204
Epoch: 77, step: 878, loss: 0.3318830728530884, mean loss: 0.33871634985645055
Epoch: 77, step: 879, loss: 0.3235247731208801, mean loss: 0.33871621429967486
Epoch: 77, step: 880, loss: 0.3508263826370239, mean loss: 0.33871632235960525
Epoch: 77, step: 881, loss: 0.3721202313899994, mean loss: 0.3387166204225037
Epoch: 77, step: 882, loss: 0.34766656160354614, mean loss: 0.3387167002820676
Epoch: 77, step: 883, loss: 0.3169514238834381, mean loss: 0.3387165060740906
Epoch: 77, step: 884, loss: 0.29283687472343445, mean loss: 0.3387160967013483
Epoch: 77, step: 885, loss: 0.30578118562698364, mean loss: 0.33871580283380476
Epoch: 77, step: 886, loss: 0.3534589409828186, mean loss: 0.33871593438087727
Epoch: 77, step: 887, loss: 0.344079852104187, mean loss: 0.3387159822405236
Epoch: 77, step: 888, loss: 0.3715943396091461, mean loss: 0.33871627559560424
Epoch: 77, step: 889, loss: 0.32796531915664673, mean loss: 0.3387161796717259
Epoch: 77, step: 890, loss: 0.3623824119567871, mean loss: 0.3387163908284304
Epoch: 77, step: 891, loss: 0.35379305481910706, mean loss: 0.3387165253454182
Epoch: 77, step: 892, loss: 0.3226706385612488, mean loss: 0.33871638218210964
Epoch: 77, step: 893, loss: 0.30901038646698, mean loss: 0.33871611714405075
Epoch: 77, step: 894, loss: 0.3572234809398651, mean loss: 0.3387162822660032
Epoch: 77, step: 895, loss: 0.3537474274635315, mean loss: 0.33871641637207717
Epoch: 77, step: 896, loss: 0.3113458752632141, mean loss: 0.33871617217757205
Epoch: 77, step: 897, loss: 0.32962486147880554, mean loss: 0.3387160910674361
Epoch: 77, step: 898, loss: 0.3500354290008545, mean loss: 0.33871619205450804
Epoch: 77, step: 899, loss: 0.3389381170272827, mean loss: 0.3387161940344254
Epoch: 77, step: 900, loss: 0.31011155247688293, mean loss: 0.33871593883862955
Epoch: 77, step: 901, loss: 0.3355119824409485, mean loss: 0.3387159102548451
Epoch: 77, step: 902, loss: 0.3332456052303314, mean loss: 0.3387158614524879
Epoch: 77, step: 903, loss: 0.34054750204086304, mean loss: 0.33871587779299916
Epoch: 77, step: 904, loss: 0.3460678458213806, mean loss: 0.3387159433811093
Epoch: 77, step: 905, loss: 0.37091249227523804, mean loss: 0.3387162306092294
Epoch: 77, step: 906, loss: 0.3180169463157654, mean loss: 0.33871604595082094
Epoch: 77, step: 907, loss: 0.33752012252807617, mean loss: 0.3387160352820779
Epoch: 77, step: 908, loss: 0.32653141021728516, mean loss: 0.33871592658492217
Epoch: 77, step: 909, loss: 0.3078360855579376, mean loss: 0.3387156511130937
Epoch: 77, step: 910, loss: 0.2896733582019806, mean loss: 0.33871521362218915
Epoch: 77, step: 911, loss: 0.3600253760814667, mean loss: 0.33871540372176506
Epoch: 77, step: 912, loss: 0.29962414503097534, mean loss: 0.3387150550071355
Epoch: 77, step: 913, loss: 0.34395092725753784, mean loss: 0.33871510171345875
Epoch: 77, step: 914, loss: 0.3253735303878784, mean loss: 0.3387149827017345
Epoch: 77, step: 915, loss: 0.3558462858200073, mean loss: 0.33871513551789734
Epoch: 77, step: 916, loss: 0.3500177562236786, mean loss: 0.33871523633963324
Epoch: 77, step: 917, loss: 0.30587100982666016, mean loss: 0.3387149433648905
Epoch: 77, step: 918, loss: 0.33893024921417236, mean loss: 0.33871494528542934
Epoch: 77, step: 919, loss: 0.31965845823287964, mean loss: 0.33871477530213595
Epoch: 77, step: 920, loss: 0.33851855993270874, mean loss: 0.33871477355191637
Epoch: 77, step: 921, loss: 0.32656431198120117, mean loss: 0.3387146651720968
Epoch: 77, step: 922, loss: 0.33634045720100403, mean loss: 0.33871464399479956
Epoch: 77, step: 923, loss: 0.33359602093696594, mean loss: 0.3387145983384643
Epoch: 77, step: 924, loss: 0.3500535488128662, mean loss: 0.3387146994770519
Epoch: 77, step: 925, loss: 0.31895095109939575, mean loss: 0.33871452319444334
Epoch: 77, step: 926, loss: 0.35420867800712585, mean loss: 0.33871466139321077
Epoch: 77, step: 927, loss: 0.3468330502510071, mean loss: 0.3387147338038289
Epoch: 77, step: 928, loss: 0.3895167112350464, mean loss: 0.338715186919569
Epoch: 77, step: 929, loss: 0.3202754259109497, mean loss: 0.33871502245212387
Epoch: 77, step: 930, loss: 0.31393349170684814, mean loss: 0.3387148014232996
Epoch: 77, step: 931, loss: 0.33218124508857727, mean loss: 0.33871474315041045
Epoch: 77, step: 932, loss: 0.31394678354263306, mean loss: 0.338714522246569
Epoch: 77, step: 933, loss: 0.29962027072906494, mean loss: 0.33871417357055966
Epoch: 77, step: 934, loss: 0.3412075340747833, mean loss: 0.3387141958082852
Epoch: 77, step: 935, loss: 0.34892934560775757, mean loss: 0.3387142869141127
Epoch: 77, step: 936, loss: 0.35557106137275696, mean loss: 0.3387144372532383
Epoch: 77, step: 937, loss: 0.32051989436149597, mean loss: 0.3387142749845148
Epoch: 77, step: 938, loss: 0.3251793384552002, mean loss: 0.33871415427374457
Epoch: 77, step: 939, loss: 0.2899353802204132, mean loss: 0.3387137192461506
Epoch: 77, step: 940, loss: 0.3507969081401825, mean loss: 0.33871382700764757
Epoch: 77, step: 941, loss: 0.31024181842803955, mean loss: 0.3387135730880134
Epoch: 77, step: 942, loss: 0.34920766949653625, mean loss: 0.33871366667583847
Epoch: 77, step: 943, loss: 0.37883228063583374, mean loss: 0.33871402445607923
Epoch: 77, step: 944, loss: 0.3363199532032013, mean loss: 0.3387140031057965
Epoch: 77, step: 945, loss: 0.3272130489349365, mean loss: 0.33871390054141665
Epoch: 77, step: 946, loss: 0.321691632270813, mean loss: 0.3387137487398536
Epoch: 77, step: 947, loss: 0.31912049651145935, mean loss: 0.33871357401227076
Epoch: 77, step: 948, loss: 0.3470713496208191, mean loss: 0.33871364854409886
Epoch: 77, step: 949, loss: 0.3069416582584381, mean loss: 0.33871336521471646
Epoch: 77, step: 950, loss: 0.34006810188293457, mean loss: 0.3387133772955863
Epoch: 77, step: 951, loss: 0.35966938734054565, mean loss: 0.3387135641692268
Epoch: 77, step: 952, loss: 0.325641006231308, mean loss: 0.338713447596716
Epoch: 77, step: 953, loss: 0.3110654652118683, mean loss: 0.3387132010523135
Epoch: 77, step: 954, loss: 0.33122366666793823, mean loss: 0.33871313426674166
Epoch: 77, step: 955, loss: 0.35412654280662537, mean loss: 0.3387132717097483
Epoch: 77, step: 956, loss: 0.36048611998558044, mean loss: 0.3387134658588256
Epoch: 77, step: 957, loss: 0.29370352625846863, mean loss: 0.33871306450755495
Epoch: 77, step: 958, loss: 0.31580668687820435, mean loss: 0.3387128602544084
Epoch: 77, step: 959, loss: 0.3017198443412781, mean loss: 0.3387125303955084
Epoch: 77, step: 960, loss: 0.3265736699104309, mean loss: 0.3387124221568216
Epoch: 77, step: 961, loss: 0.2939329147338867, mean loss: 0.3387120228745441
Epoch: 77, step: 962, loss: 0.31849098205566406, mean loss: 0.33871184257262243
Epoch: 77, step: 963, loss: 0.3544637858867645, mean loss: 0.3387119830243604
Epoch: 77, step: 964, loss: 0.3180420398712158, mean loss: 0.3387117987230653
Epoch: 77, step: 965, loss: 0.33995264768600464, mean loss: 0.33871180978686116
Epoch: 77, step: 966, loss: 0.31956005096435547, mean loss: 0.3387116390253363
Epoch: 77, step: 967, loss: 0.32547304034233093, mean loss: 0.3387115209879715
Epoch: 77, step: 968, loss: 0.32748931646347046, mean loss: 0.3387114209299767
Epoch: 77, step: 969, loss: 0.33711692690849304, mean loss: 0.3387114067134783
Epoch: 77, step: 970, loss: 0.36795398592948914, mean loss: 0.3387116674378002
Epoch: 77, step: 971, loss: 0.3265974223613739, mean loss: 0.33871155942919573
Epoch: 77, step: 972, loss: 0.3468036353588104, mean loss: 0.3387116315761624
Epoch: 77, step: 973, loss: 0.3373337686061859, mean loss: 0.3387116192915832
Epoch: 77, step: 974, loss: 0.29084399342536926, mean loss: 0.338711192523167
Epoch: 77, step: 975, loss: 0.3589102327823639, mean loss: 0.338711372608045
Epoch: 77, step: 976, loss: 0.3000401258468628, mean loss: 0.33871102783697776
Epoch: 77, step: 977, loss: 0.37992504239082336, mean loss: 0.33871139527465544
Epoch: 77, step: 978, loss: 0.33482423424720764, mean loss: 0.33871136061953383
Epoch: 77, step: 979, loss: 0.3404809832572937, mean loss: 0.33871137639607113
Epoch: 77, step: 980, loss: 0.38101208209991455, mean loss: 0.33871175351190264
Epoch: 77, step: 981, loss: 0.38336610794067383, mean loss: 0.3387121516072439
Epoch: 77, step: 982, loss: 0.30412566661834717, mean loss: 0.33871184327010695
Epoch: 77, step: 983, loss: 0.3135864734649658, mean loss: 0.33871161928043214
Epoch: 77, step: 984, loss: 0.31051984429359436, mean loss: 0.3387113679563614
Epoch: 77, step: 985, loss: 0.3289991021156311, mean loss: 0.3387112813742137
Epoch: 77, step: 986, loss: 0.3407411575317383, mean loss: 0.3387112994698335
Epoch: 77, step: 987, loss: 0.36231622099876404, mean loss: 0.3387115098973896
Epoch: 77, step: 988, loss: 0.3571067154407501, mean loss: 0.3387116738811433
Epoch: 77, step: 989, loss: 0.3171231746673584, mean loss: 0.33871148143254187
Epoch: 77, step: 990, loss: 0.34124132990837097, mean loss: 0.33871150398443195
Epoch: 77, step: 991, loss: 0.31449785828590393, mean loss: 0.3387112881380627
Epoch: 77, step: 992, loss: 0.33861279487609863, mean loss: 0.3387112872600775
Epoch: 77, step: 993, loss: 0.31071195006370544, mean loss: 0.3387110376715767
Epoch: 77, step: 994, loss: 0.33299538493156433, mean loss: 0.33871098672221056
Epoch: 77, step: 995, loss: 0.327849417924881, mean loss: 0.3387108899029779
Epoch: 77, step: 996, loss: 0.297299861907959, mean loss: 0.3387105207713828
Epoch: 77, step: 997, loss: 0.3565268814563751, mean loss: 0.33871067958229223
Epoch: 77, step: 998, loss: 0.3601001501083374, mean loss: 0.3387108702413751
Epoch: 77, step: 999, loss: 0.3251872956752777, mean loss: 0.3387107496975151
Epoch: 77, step: 1000, loss: 0.3192606270313263, mean loss: 0.3387105763282662
Epoch: 77, step: 1001, loss: 0.3354019522666931, mean loss: 0.33871054683700974
Epoch: 77, step: 1002, loss: 0.35328906774520874, mean loss: 0.3387106767807745
Epoch: 77, step: 1003, loss: 0.32656171917915344, mean loss: 0.33871056849357395
Epoch: 77, step: 1004, loss: 0.3418563902378082, mean loss: 0.3387105965329502
Epoch: 77, step: 1005, loss: 0.3468565046787262, mean loss: 0.3387106691385097
Epoch: 77, step: 1006, loss: 0.34895041584968567, mean loss: 0.3387107604059166
Epoch: 77, step: 1007, loss: 0.3254691958427429, mean loss: 0.33871064238419957
Epoch: 77, step: 1008, loss: 0.35929688811302185, mean loss: 0.33871082586723145
Epoch: 77, step: 1009, loss: 0.32188937067985535, mean loss: 0.3387106759407159
Epoch: 77, step: 1010, loss: 0.31552645564079285, mean loss: 0.33871046930589477
Epoch: 77, step: 1011, loss: 0.3225032687187195, mean loss: 0.33871032485669167
Epoch: 77, step: 1012, loss: 0.4158175587654114, mean loss: 0.33871101208081544
Epoch: 77, step: 1013, loss: 0.34145134687423706, mean loss: 0.33871103650404133
Epoch: 77, step: 1014, loss: 0.36122211813926697, mean loss: 0.3387112371322031
Epoch: 77, step: 1015, loss: 0.3621699810028076, mean loss: 0.33871144620446314
Epoch: 77, step: 1016, loss: 0.32582888007164, mean loss: 0.3387113313916996
Epoch: 77, step: 1017, loss: 0.31592613458633423, mean loss: 0.33871112832593836
Epoch: 77, step: 1018, loss: 0.33640703558921814, mean loss: 0.3387111077916336
Epoch: 77, step: 1019, loss: 0.3318345844745636, mean loss: 0.3387110465079166
Epoch: 77, step: 1020, loss: 0.34400975704193115, mean loss: 0.33871109372971286
Epoch: 77, step: 1021, loss: 0.33215972781181335, mean loss: 0.3387110353448459
Epoch: 77, step: 1022, loss: 0.3074679374694824, mean loss: 0.3387107569131603
Epoch: 77, step: 1023, loss: 0.3206653296947479, mean loss: 0.3387105960976752
Epoch: 77, step: 1024, loss: 0.290264755487442, mean loss: 0.3387101643665869
Epoch: 77, step: 1025, loss: 0.3180362582206726, mean loss: 0.33870998013016235
Epoch: 77, step: 1026, loss: 0.3134273588657379, mean loss: 0.33870975482497795
Epoch: 77, step: 1027, loss: 0.30456453561782837, mean loss: 0.3387094505437773
Epoch: 77, step: 1028, loss: 0.2967546582221985, mean loss: 0.3387090766717943
Epoch: 77, step: 1029, loss: 0.30590683221817017, mean loss: 0.33870878436356877
Epoch: 77, step: 1030, loss: 0.30514904856681824, mean loss: 0.3387084853078314
Epoch: 77, step: 1031, loss: 0.31248271465301514, mean loss: 0.3387082516082176
Epoch: 77, step: 1032, loss: 0.3644384741783142, mean loss: 0.3387084808899258
Epoch: 77, step: 1033, loss: 0.3602355718612671, mean loss: 0.33870867271586874
Epoch: 77, step: 1034, loss: 0.3329211473464966, mean loss: 0.3387086211442179
Epoch: 77, step: 1035, loss: 0.3496643900871277, mean loss: 0.33870871876833525
Epoch: 77, step: 1036, loss: 0.4058211147785187, mean loss: 0.33870931678478444
Epoch: 77, step: 1037, loss: 0.3441299498081207, mean loss: 0.338709365085829
Epoch: 77, step: 1038, loss: 0.35346993803977966, mean loss: 0.3387094966100875
Epoch: 77, step: 1039, loss: 0.34892258048057556, mean loss: 0.33870958761308023
Epoch: 77, step: 1040, loss: 0.3262997567653656, mean loss: 0.33870947703710746
Epoch: 77, step: 1041, loss: 0.3331300616264343, mean loss: 0.3387094273229899
Epoch: 77, step: 1042, loss: 0.388876348733902, mean loss: 0.33870987431999977
Epoch: 77, step: 1043, loss: 0.30426186323165894, mean loss: 0.33870956738426766
Epoch: 77, step: 1044, loss: 0.3607882857322693, mean loss: 0.3387097641064291
Epoch: 77, step: 1045, loss: 0.3434213697910309, mean loss: 0.3387098060866284
Epoch: 77, step: 1046, loss: 0.34286147356033325, mean loss: 0.33870984307747326
Epoch: 77, step: 1047, loss: 0.33763694763183594, mean loss: 0.3387098335181924
Epoch: 77, step: 1048, loss: 0.32795852422714233, mean loss: 0.3387097377270603
Epoch: 77, step: 1049, loss: 0.3316108286380768, mean loss: 0.338709674478347
Epoch: 77, step: 1050, loss: 0.3318978250026703, mean loss: 0.33870961378777176
Epoch: 77, step: 1051, loss: 0.3478505313396454, mean loss: 0.338709695228591
Epoch: 77, step: 1052, loss: 0.34584107995033264, mean loss: 0.33870975876495224
Epoch: 77, step: 1053, loss: 0.3241412341594696, mean loss: 0.338709628969291
Epoch: 77, step: 1054, loss: 0.38096508383750916, mean loss: 0.3387100054333455
Epoch: 77, step: 1055, loss: 0.3395337164402008, mean loss: 0.3387100127719205
Epoch: 77, step: 1056, loss: 0.33901920914649963, mean loss: 0.3387100155265766
Epoch: 77, step: 1057, loss: 0.34274372458457947, mean loss: 0.33871005146290445
Epoch: 77, step: 1058, loss: 0.35170453786849976, mean loss: 0.33871016722979713
Epoch: 77, step: 1059, loss: 0.3276457190513611, mean loss: 0.33871006865834663
Epoch: 77, step: 1060, loss: 0.3368408977985382, mean loss: 0.3387100520063421
Epoch: 77, step: 1061, loss: 0.3504977226257324, mean loss: 0.3387101570189979
Epoch: 77, step: 1062, loss: 0.34829431772232056, mean loss: 0.3387102424005153
Epoch: 77, step: 1063, loss: 0.3369205594062805, mean loss: 0.33871022645707555
Epoch: 77, step: 1064, loss: 0.3139450252056122, mean loss: 0.33871000583757094
Epoch: 77, step: 1065, loss: 0.3492308259010315, mean loss: 0.3387100995609132
Epoch: 77, step: 1066, loss: 0.33457332849502563, mean loss: 0.3387100627093603
Epoch: 77, step: 1067, loss: 0.3077794313430786, mean loss: 0.3387097871728067
Epoch: 77, step: 1068, loss: 0.34961020946502686, mean loss: 0.33870988427519044
Epoch: 77, step: 1069, loss: 0.3011209964752197, mean loss: 0.33870954943145726
Epoch: 77, step: 1070, loss: 0.3245953917503357, mean loss: 0.33870942370293944
Epoch: 77, step: 1071, loss: 0.3643794059753418, mean loss: 0.33870965236837924
Epoch: 77, step: 1072, loss: 0.32914379239082336, mean loss: 0.33870956715748696
Epoch: 77, step: 1073, loss: 0.35691922903060913, mean loss: 0.3387097293643056
Epoch: 77, step: 1074, loss: 0.33246108889579773, mean loss: 0.3387096737035762
Epoch: 77, step: 1075, loss: 0.34015727043151855, mean loss: 0.3387096865981526
Epoch: 77, step: 1076, loss: 0.3472706079483032, mean loss: 0.33870976285452237
Epoch: 77, step: 1077, loss: 0.32661813497543335, mean loss: 0.3387096551493589
Epoch: 77, step: 1078, loss: 0.3350144922733307, mean loss: 0.338709622235298
Epoch: 77, step: 1079, loss: 0.3379131853580475, mean loss: 0.33870961514122955
Epoch: 77, step: 1080, loss: 0.29916244745254517, mean loss: 0.3387092628875559
Epoch: 77, step: 1081, loss: 0.3286619186401367, mean loss: 0.3387091733948664
Epoch: 77, step: 1082, loss: 0.34934285283088684, mean loss: 0.3387092681092578
Epoch: 77, step: 1083, loss: 0.3617955148220062, mean loss: 0.3387094737370787
Epoch: 77, step: 1084, loss: 0.3627086579799652, mean loss: 0.3387096874944758
Epoch: 77, step: 1085, loss: 0.34810367226600647, mean loss: 0.33870977116464673
Epoch: 77, step: 1086, loss: 0.34467488527297974, mean loss: 0.33870982429414226
Epoch: 77, step: 1087, loss: 0.33970996737480164, mean loss: 0.33870983320203957
Epoch: 77, step: 1088, loss: 0.30975034832954407, mean loss: 0.33870957527312384
Epoch: 77, step: 1089, loss: 0.34932008385658264, mean loss: 0.33870966977523986
Epoch: 77, step: 1090, loss: 0.29831814765930176, mean loss: 0.3387093100327937
Epoch: 77, step: 1091, loss: 0.32464495301246643, mean loss: 0.3387091847713311
Epoch: 77, step: 1092, loss: 0.3372690975666046, mean loss: 0.3387091719455885
Epoch: 77, step: 1093, loss: 0.3583138585090637, mean loss: 0.3387093465478094
Epoch: 77, step: 1094, loss: 0.3330306112766266, mean loss: 0.33870929597260857
Epoch: 77, step: 1095, loss: 0.32523736357688904, mean loss: 0.3387091759917351
Epoch: 77, step: 1096, loss: 0.32991012930870056, mean loss: 0.33870909762822543
Epoch: 77, step: 1097, loss: 0.3746598958969116, mean loss: 0.3387094177999144
Epoch: 77, step: 1098, loss: 0.3818044364452362, mean loss: 0.3387098015933958
Epoch: 77, step: 1099, loss: 0.30773425102233887, mean loss: 0.3387095257353293
Epoch: 77, step: 1100, loss: 0.3159245550632477, mean loss: 0.33870932282168087
Epoch: 77, step: 1101, loss: 0.34640511870384216, mean loss: 0.3387093913566874
Epoch: 77, step: 1102, loss: 0.3167440593242645, mean loss: 0.33870919574589015
Epoch: 77, step: 1103, loss: 0.359447717666626, mean loss: 0.33870938042976717
Epoch: 77, step: 1104, loss: 0.2861914038658142, mean loss: 0.33870891274276477
Epoch: 77, step: 1105, loss: 0.3350948095321655, mean loss: 0.33870888055846987
Epoch: 77, step: 1106, loss: 0.31167545914649963, mean loss: 0.3387086398227166
Epoch: 77, step: 1107, loss: 0.32147762179374695, mean loss: 0.3387084863798689
Epoch: 77, step: 1108, loss: 0.3474295735359192, mean loss: 0.3387085640407784
Epoch: 77, step: 1109, loss: 0.4008704125881195, mean loss: 0.3387091175844617
Epoch: 77, step: 1110, loss: 0.2977447807788849, mean loss: 0.3387087528052846
Epoch: 77, step: 1111, loss: 0.3053573668003082, mean loss: 0.33870845582054726
Epoch: 77, step: 1112, loss: 0.309932678937912, mean loss: 0.3387081995826074
Epoch: 77, step: 1113, loss: 0.3252069652080536, mean loss: 0.3387080793600435
Epoch: 77, step: 1114, loss: 0.3376007676124573, mean loss: 0.33870806950000637
Epoch: 77, step: 1115, loss: 0.3249509632587433, mean loss: 0.3387079470011974
Epoch: 77, step: 1116, loss: 0.350523978471756, mean loss: 0.33870805221495875
Epoch: 77, step: 1117, loss: 0.32177093625068665, mean loss: 0.3387079014027496
Epoch: 77, step: 1118, loss: 0.343972384929657, mean loss: 0.3387079482785768
Epoch: 77, step: 1119, loss: 0.32553017139434814, mean loss: 0.33870783094252876
Epoch: 77, step: 1120, loss: 0.33588626980781555, mean loss: 0.33870780581933174
Epoch: 77, step: 1121, loss: 0.33804672956466675, mean loss: 0.33870779993315725
Epoch: 77, step: 1122, loss: 0.374664306640625, mean loss: 0.3387081200844043
Epoch: 77, step: 1123, loss: 0.3353356122970581, mean loss: 0.33870809005637714
Epoch: 77, step: 1124, loss: 0.3322884142398834, mean loss: 0.3387080328975815
Epoch: 77, step: 1125, loss: 0.30838456749916077, mean loss: 0.3387077629092862
Epoch: 77, step: 1126, loss: 0.33699098229408264, mean loss: 0.33870774762387806
Epoch: 77, step: 1127, loss: 0.3124278485774994, mean loss: 0.33870751364208523
Epoch: 77, step: 1128, loss: 0.3627980947494507, mean loss: 0.33870772812948347
Epoch: 77, step: 1129, loss: 0.31754153966903687, mean loss: 0.3387075396807178
Epoch: 77, step: 1130, loss: 0.319955050945282, mean loss: 0.33870737272331314
Epoch: 77, step: 1131, loss: 0.3605343699455261, mean loss: 0.3387075670519921
Epoch: 77, step: 1132, loss: 0.32210102677345276, mean loss: 0.3387074192030567
Epoch: 77, step: 1133, loss: 0.36495494842529297, mean loss: 0.338707652884163
Epoch: 77, step: 1134, loss: 0.35280343890190125, mean loss: 0.3387077783774815
Epoch: 77, step: 1135, loss: 0.37711191177368164, mean loss: 0.33870812028244746
Epoch: 77, step: 1136, loss: 0.3923744559288025, mean loss: 0.33870859805975123
Epoch: 77, step: 1137, loss: 0.31573086977005005, mean loss: 0.338708393496887
Epoch: 77, step: 1138, loss: 0.3824692964553833, mean loss: 0.33870878308178604
Epoch: 77, step: 1139, loss: 0.3731471300125122, mean loss: 0.33870908966916347
Epoch: 77, step: 1140, loss: 0.3156064450740814, mean loss: 0.33870888399970506
Epoch: 77, step: 1141, loss: 0.34104445576667786, mean loss: 0.3387089047917621
Epoch: 77, step: 1142, loss: 0.38241827487945557, mean loss: 0.33870929390402926
Epoch: 77, step: 1143, loss: 0.3677796423435211, mean loss: 0.33870955269358555
Epoch: 77, step: 1144, loss: 0.2808496356010437, mean loss: 0.3387090376186112
Epoch: 77, step: 1145, loss: 0.30027297139167786, mean loss: 0.33870869545981486
Epoch: 77, step: 1146, loss: 0.3222378194332123, mean loss: 0.33870854883698115
Epoch: 77, step: 1147, loss: 0.33906450867652893, mean loss: 0.3387085520056879
Epoch: 77, step: 1148, loss: 0.3267129957675934, mean loss: 0.3387084452238062
Epoch: 77, step: 1149, loss: 0.3837158977985382, mean loss: 0.33870884586697747
Epoch: 77, step: 1150, loss: 0.3369593024253845, mean loss: 0.3387088302931924
Epoch: 77, step: 1151, loss: 0.36771059036254883, mean loss: 0.33870908845377695
Epoch: 77, step: 1152, loss: 0.31229129433631897, mean loss: 0.33870885329658484
Epoch: 77, step: 1153, loss: 0.34995391964912415, mean loss: 0.3387089533933105
Epoch: 77, step: 1154, loss: 0.3436669707298279, mean loss: 0.3387089975261655
Epoch: 77, step: 1155, loss: 0.35256117582321167, mean loss: 0.3387091208276173
Epoch: 77, step: 1156, loss: 0.33308106660842896, mean loss: 0.3387090707314473
Epoch: 77, step: 1157, loss: 0.33945977687835693, mean loss: 0.33870907741353784
Epoch: 77, step: 1158, loss: 0.30820930004119873, mean loss: 0.3387088059351951
Epoch: 77, step: 1159, loss: 0.30567020177841187, mean loss: 0.3387085118613873
Epoch: 77, step: 1160, loss: 0.31010571122169495, mean loss: 0.3387082572725557
Epoch: 77, step: 1161, loss: 0.3052925765514374, mean loss: 0.3387079598477162
Epoch: 77, step: 1162, loss: 0.35823988914489746, mean loss: 0.3387081336951167
Epoch: 77, step: 1163, loss: 0.3618635833263397, mean loss: 0.33870833979246817
Epoch: 77, step: 1164, loss: 0.31473585963249207, mean loss: 0.3387081264249554
Epoch: 77, step: 1165, loss: 0.31884658336639404, mean loss: 0.33870794964848944
Epoch: 77, step: 1166, loss: 0.31775400042533875, mean loss: 0.3387077631507882
Epoch: 77, step: 1167, loss: 0.32354047894477844, mean loss: 0.338707628157693
Epoch: 77, step: 1168, loss: 0.32122546434402466, mean loss: 0.33870747256290307
Epoch: 77, step: 1169, loss: 0.3392944633960724, mean loss: 0.33870747778719357
Epoch: 77, step: 1170, loss: 0.3152144253253937, mean loss: 0.3387072686980021
Epoch: 77, step: 1171, loss: 0.3454654812812805, mean loss: 0.33870732884585353
Epoch: 77, step: 1172, loss: 0.3653707206249237, mean loss: 0.33870756614697917
Epoch: 77, step: 1173, loss: 0.29290565848350525, mean loss: 0.3387071585188873
Epoch: 77, step: 1174, loss: 0.32181233167648315, mean loss: 0.3387070081595444
Epoch: 77, step: 1175, loss: 0.29296666383743286, mean loss: 0.33870660108660006
Epoch: 77, step: 1176, loss: 0.3164081871509552, mean loss: 0.3387064026403407
Epoch: 77, step: 1177, loss: 0.32766324281692505, mean loss: 0.33870630436185944
Epoch: 77, step: 1178, loss: 0.35113659501075745, mean loss: 0.33870641498411197
Epoch: 77, step: 1179, loss: 0.3178369104862213, mean loss: 0.33870622925948846
Epoch: 77, step: 1180, loss: 0.3398691713809967, mean loss: 0.338706239608803
Epoch: 77, step: 1181, loss: 0.3212536573410034, mean loss: 0.33870608429526494
Epoch: 77, step: 1182, loss: 0.31889116764068604, mean loss: 0.3387059079604752
Epoch: 77, step: 1183, loss: 0.30018094182014465, mean loss: 0.3387055651262626
Epoch: 77, step: 1184, loss: 0.3289298415184021, mean loss: 0.3387054781327356
Epoch: 77, step: 1185, loss: 0.30782967805862427, mean loss: 0.338705203373449
Epoch: 77, step: 1186, loss: 0.3010900020599365, mean loss: 0.3387048686441826
Epoch: 77, step: 1187, loss: 0.3751998245716095, mean loss: 0.3387051934017458
Epoch: 77, step: 1188, loss: 0.3263320326805115, mean loss: 0.33870508329771454
Epoch: 77, step: 1189, loss: 0.40890154242515564, mean loss: 0.3387057079436339
Epoch: 77, step: 1190, loss: 0.37466099858283997, mean loss: 0.3387060278903378
Epoch: 77, step: 1191, loss: 0.34195730090141296, mean loss: 0.33870605682140215
Epoch: 77, step: 1192, loss: 0.3340306878089905, mean loss: 0.3387060152185599
Epoch: 77, step: 1193, loss: 0.3346071243286133, mean loss: 0.3387059787457183
Epoch: 77, step: 1194, loss: 0.322040855884552, mean loss: 0.33870583045707264
Epoch: 77, step: 1195, loss: 0.34272241592407227, mean loss: 0.3387058661969063
Epoch: 77, step: 1196, loss: 0.3401368260383606, mean loss: 0.33870587892956494
Epoch: 77, step: 1197, loss: 0.3093234598636627, mean loss: 0.3387056174875787
Epoch: 77, step: 1198, loss: 0.32145556807518005, mean loss: 0.338705463999636
Epoch: 77, step: 1199, loss: 0.3364565968513489, mean loss: 0.3387054439897849
Epoch: 77, step: 1200, loss: 0.30517876148223877, mean loss: 0.3387051456804975
Epoch: 77, step: 1201, loss: 0.31106969714164734, mean loss: 0.33870489979164137
Epoch: 77, step: 1202, loss: 0.3017338812351227, mean loss: 0.33870457084164934
Epoch: 77, step: 1203, loss: 0.3164832293987274, mean loss: 0.33870437312880997
Epoch: 77, step: 1204, loss: 0.3009725511074066, mean loss: 0.33870403741553584
Epoch: 77, step: 1205, loss: 0.30008143186569214, mean loss: 0.3387036937797052
Epoch: 77, step: 1206, loss: 0.3573647737503052, mean loss: 0.3387038598109341
Epoch: 77, step: 1207, loss: 0.3132421374320984, mean loss: 0.3387036332750932
Epoch: 77, step: 1208, loss: 0.3188009560108185, mean loss: 0.3387034562002846
Epoch: 77, step: 1209, loss: 0.35571181774139404, mean loss: 0.33870360752291967
Epoch: 77, step: 1210, loss: 0.33002111315727234, mean loss: 0.33870353027584127
Epoch: 77, step: 1211, loss: 0.3390740156173706, mean loss: 0.3387035335719742
Epoch: 77, step: 1212, loss: 0.3361356854438782, mean loss: 0.3387035107265535
Epoch: 77, step: 1213, loss: 0.3063214123249054, mean loss: 0.33870322263471886
Epoch: 77, step: 1214, loss: 0.3369271755218506, mean loss: 0.3387032068340097
Epoch: 77, step: 1215, loss: 0.2983308732509613, mean loss: 0.3387028476623291
Epoch: 77, step: 1216, loss: 0.3182229995727539, mean loss: 0.3387026654653798
Epoch: 77, step: 1217, loss: 0.3200721740722656, mean loss: 0.3387024997225245
Epoch: 77, step: 1218, loss: 0.32914161682128906, mean loss: 0.3387024146665858
Epoch: 77, step: 1219, loss: 0.33327630162239075, mean loss: 0.3387023663949944
Epoch: 77, step: 1220, loss: 0.337375670671463, mean loss: 0.3387023545925967
Epoch: 77, step: 1221, loss: 0.3131309747695923, mean loss: 0.3387021271094562
Epoch: 77, step: 1222, loss: 0.3265342712402344, mean loss: 0.33870201886510404
Epoch: 77, step: 1223, loss: 0.3051215410232544, mean loss: 0.3387017201382969
Epoch: 77, step: 1224, loss: 0.3442080318927765, mean loss: 0.3387017691211704
Epoch: 77, step: 1225, loss: 0.3036142885684967, mean loss: 0.33870145699385035
Epoch: 77, step: 1226, loss: 0.33966249227523804, mean loss: 0.3387014655428454
Epoch: 77, step: 1227, loss: 0.3431653678417206, mean loss: 0.3387015052516262
Epoch: 77, step: 1228, loss: 0.31623736023902893, mean loss: 0.338701305422908
Epoch: 77, step: 1229, loss: 0.292881041765213, mean loss: 0.3387008978345889
Epoch: 77, step: 1230, loss: 0.32393568754196167, mean loss: 0.3387007664937097
Epoch: 77, step: 1231, loss: 0.301064670085907, mean loss: 0.338700431712564
Epoch: 77, step: 1232, loss: 0.2906006872653961, mean loss: 0.3387000038588316
Epoch: 77, step: 1233, loss: 0.3085573613643646, mean loss: 0.3386997357383348
Epoch: 77, step: 1234, loss: 0.33594462275505066, mean loss: 0.33869971123166814
Epoch: 77, step: 1235, loss: 0.417384535074234, mean loss: 0.33870041112514143
Epoch: 77, step: 1236, loss: 0.3257162868976593, mean loss: 0.33870029563370957
Epoch: 77, step: 1237, loss: 0.3158484995365143, mean loss: 0.33870009237293275
Epoch: 77, step: 1238, loss: 0.3019343614578247, mean loss: 0.3386997653542369
Epoch: 77, step: 1239, loss: 0.32106930017471313, mean loss: 0.33869960853862885
Epoch: 77, step: 1240, loss: 0.3664475679397583, mean loss: 0.3386998553429178
Epoch: 77, step: 1241, loss: 0.36304154992103577, mean loss: 0.3387000718482507
Epoch: 77, step: 1242, loss: 0.3392065167427063, mean loss: 0.33870007635274585
Epoch: 77, step: 1243, loss: 0.33011704683303833, mean loss: 0.338700000013007
Epoch: 77, step: 1244, loss: 0.3192139267921448, mean loss: 0.3386998267002499
Epoch: 77, step: 1245, loss: 0.3295868933200836, mean loss: 0.3386997456488475
Epoch: 77, step: 1246, loss: 0.34213516116142273, mean loss: 0.3386997762035281
Epoch: 77, step: 1247, loss: 0.3412165641784668, mean loss: 0.3386997985877109
Epoch: 77, step: 1248, loss: 0.33308565616607666, mean loss: 0.33869974865626107
Epoch: 77, step: 1249, loss: 0.32132259011268616, mean loss: 0.338699594107456
Epoch: 77, step: 1250, loss: 0.32360291481018066, mean loss: 0.3386994598419494
Epoch: 77, step: 1251, loss: 0.3640739619731903, mean loss: 0.33869968551343754
Epoch: 77, step: 1252, loss: 0.38456040620803833, mean loss: 0.33870009337819057
Epoch: 77, step: 1253, loss: 0.30392077565193176, mean loss: 0.33869978406923373
Epoch: 77, step: 1254, loss: 0.3438519239425659, mean loss: 0.33869982988924807
Epoch: 77, step: 1255, loss: 0.3058801293373108, mean loss: 0.3386995380132871
Epoch: 77, step: 1256, loss: 0.39997169375419617, mean loss: 0.33870008292107084
Epoch: 77, step: 1257, loss: 0.35493919253349304, mean loss: 0.338700227338032
Epoch: 77, step: 1258, loss: 0.3589364290237427, mean loss: 0.3387004073001625
Epoch: 77, step: 1259, loss: 0.2938563823699951, mean loss: 0.33870000850227433
Epoch: 77, step: 1260, loss: 0.3103383183479309, mean loss: 0.3386997562840229
Epoch: 77, step: 1261, loss: 0.3654674291610718, mean loss: 0.3386999943246887
Epoch: 77, step: 1262, loss: 0.31713566184043884, mean loss: 0.33869980255820836
Epoch: 77, step: 1263, loss: 0.35714074969291687, mean loss: 0.3386999665477073
Epoch: 77, step: 1264, loss: 0.29678574204444885, mean loss: 0.3386995938211059
Epoch: 77, step: 1265, loss: 0.34147194027900696, mean loss: 0.33869961847426594
Epoch: 77, step: 1266, loss: 0.3773103356361389, mean loss: 0.3386999618179782
Epoch: 77, step: 1267, loss: 0.3317492604255676, mean loss: 0.33869990000979194
Epoch: 77, step: 1268, loss: 0.3472774922847748, mean loss: 0.3386999762842104
Epoch: 77, step: 1269, loss: 0.3303575813770294, mean loss: 0.33869990210189427
Epoch: 77, step: 1270, loss: 0.38459476828575134, mean loss: 0.33870031020499125
Epoch: 77, step: 1271, loss: 0.3471791446208954, mean loss: 0.3387003855992151
Epoch: 77, step: 1272, loss: 0.3302655816078186, mean loss: 0.3387003105971789
Epoch: 77, step: 1273, loss: 0.3543199896812439, mean loss: 0.33870044948568423
Epoch: 77, step: 1274, loss: 0.3147084712982178, mean loss: 0.3387002361534933
Epoch: 77, step: 1275, loss: 0.3233514130115509, mean loss: 0.338700099675837
Epoch: 77, step: 1276, loss: 0.33418136835098267, mean loss: 0.3387000594968362
Epoch: 77, step: 1277, loss: 0.31252941489219666, mean loss: 0.33869982679855754
Epoch: 77, step: 1278, loss: 0.32037925720214844, mean loss: 0.3386996639012668
Epoch: 77, step: 1279, loss: 0.3388596773147583, mean loss: 0.33869966532401297
Epoch: 77, step: 1280, loss: 0.32104071974754333, mean loss: 0.3386995083123424
Epoch: 77, step: 1281, loss: 0.3230932354927063, mean loss: 0.33869936955291485
Epoch: 77, step: 1282, loss: 0.3320198953151703, mean loss: 0.3386993101645015
Epoch: 77, step: 1283, loss: 0.3312718868255615, mean loss: 0.3386992441265246
Epoch: 77, step: 1284, loss: 0.32086238265037537, mean loss: 0.3386990855385837
Epoch: 77, step: 1285, loss: 0.3321235477924347, mean loss: 0.33869902707584787
Epoch: 77, step: 1286, loss: 0.31725406646728516, mean loss: 0.338698836411606
Epoch: 77, step: 1287, loss: 0.33202946186065674, mean loss: 0.33869877711562685
Epoch: 77, step: 1288, loss: 0.37648463249206543, mean loss: 0.3386991130585785
Epoch: 77, step: 1289, loss: 0.29063090682029724, mean loss: 0.33869868570206224
Epoch: 77, step: 1290, loss: 0.3124381899833679, mean loss: 0.3386984522318525
Epoch: 77, step: 1291, loss: 0.3151973485946655, mean loss: 0.3386982432960094
Epoch: 77, step: 1292, loss: 0.3037099242210388, mean loss: 0.33869793223619415
Epoch: 77, step: 1293, loss: 0.3289353847503662, mean loss: 0.3386978454441075
Epoch: 77, step: 1294, loss: 0.3027932643890381, mean loss: 0.33869752624404126
Epoch: 77, step: 1295, loss: 0.3016919493675232, mean loss: 0.3386971972587911
Epoch: 77, step: 1296, loss: 0.31843850016593933, mean loss: 0.3386970171574701
Epoch: 77, step: 1297, loss: 0.3267859220504761, mean loss: 0.33869691126789175
Epoch: 77, step: 1298, loss: 0.3420172929763794, mean loss: 0.3386969407858068
Epoch: 77, step: 1299, loss: 0.31324055790901184, mean loss: 0.3386967144827089
Epoch: 77, step: 1300, loss: 0.30653586983680725, mean loss: 0.33869642858057936
Epoch: 77, step: 1301, loss: 0.32818803191185, mean loss: 0.3386963351643053
Epoch: 77, step: 1302, loss: 0.3304768204689026, mean loss: 0.338696262096107
Epoch: 77, step: 1303, loss: 0.3314144015312195, mean loss: 0.3386961973638543
Epoch: 77, step: 1304, loss: 0.35477688908576965, mean loss: 0.33869634031223084
Epoch: 77, step: 1305, loss: 0.42426806688308716, mean loss: 0.33869710099036987
Epoch: 77, step: 1306, loss: 0.3371802866458893, mean loss: 0.3386970875069764
Epoch: 77, step: 1307, loss: 0.3412415683269501, mean loss: 0.3386971101253879
Epoch: 77, step: 1308, loss: 0.335652619600296, mean loss: 0.3386970830625282
Epoch: 77, step: 1309, loss: 0.33586522936820984, mean loss: 0.3386970578900479
Epoch: 77, step: 1310, loss: 0.32243552803993225, mean loss: 0.338696913341831
Epoch: 77, step: 1311, loss: 0.33270856738090515, mean loss: 0.3386968601120891
Epoch: 77, step: 1312, loss: 0.3454405665397644, mean loss: 0.3386969200556134
Epoch: 77, step: 1313, loss: 0.38786301016807556, mean loss: 0.33869735707975623
Epoch: 77, step: 1314, loss: 0.32364076375961304, mean loss: 0.33869722324694
Epoch: 77, step: 1315, loss: 0.35674557089805603, mean loss: 0.33869738367099295
Epoch: 77, step: 1316, loss: 0.31284984946250916, mean loss: 0.3386971539253442
Epoch: 77, step: 1317, loss: 0.3155565857887268, mean loss: 0.338696948242375
Epoch: 77, step: 1318, loss: 0.35790586471557617, mean loss: 0.3386971189776757
Epoch: 77, step: 1319, loss: 0.3226531744003296, mean loss: 0.33869697637497564
Epoch: 77, step: 1320, loss: 0.3225955069065094, mean loss: 0.3386968332622516
Epoch: 77, step: 1321, loss: 0.30006787180900574, mean loss: 0.33869648992422424
Epoch: 77, step: 1322, loss: 0.3267250955104828, mean loss: 0.3386963835222332
Epoch: 77, step: 1323, loss: 0.37355169653892517, mean loss: 0.33869669331419333
Epoch: 77, step: 1324, loss: 0.3237515091896057, mean loss: 0.33869656048346153
Epoch: 77, step: 1325, loss: 0.35651683807373047, mean loss: 0.33869671886621916
Epoch: 77, step: 1326, loss: 0.332565039396286, mean loss: 0.33869666436966783
Epoch: 77, step: 1327, loss: 0.3518071174621582, mean loss: 0.3386967808904568
Epoch: 77, step: 1328, loss: 0.2924833297729492, mean loss: 0.3386963701662896
Epoch: 77, step: 1329, loss: 0.3293420374393463, mean loss: 0.3386962870299672
Epoch: 77, step: 1330, loss: 0.29353344440460205, mean loss: 0.33869588565026576
Epoch: 77, step: 1331, loss: 0.32381534576416016, mean loss: 0.33869575340231084
Epoch: 77, step: 1332, loss: 0.34673479199409485, mean loss: 0.3386958248470953
Epoch: 77, step: 1333, loss: 0.31296202540397644, mean loss: 0.33869559614693495
Epoch: 77, step: 1334, loss: 0.3391491174697876, mean loss: 0.33869560017741157
Epoch: 77, step: 1335, loss: 0.3441697359085083, mean loss: 0.3386956488260175
Epoch: 77, step: 1336, loss: 0.29750990867614746, mean loss: 0.338695282811886
Epoch: 77, step: 1337, loss: 0.3051908016204834, mean loss: 0.3386949850630884
Epoch: 77, step: 1338, loss: 0.3692152202129364, mean loss: 0.33869525628897335
Epoch: 77, step: 1339, loss: 0.3499056100845337, mean loss: 0.33869535591176764
Epoch: 77, step: 1340, loss: 0.30697736144065857, mean loss: 0.3386950740466976
Epoch: 77, step: 1341, loss: 0.33501946926116943, mean loss: 0.33869504138336526
Epoch: 77, step: 1342, loss: 0.35118624567985535, mean loss: 0.338695152385705
Epoch: 77, step: 1343, loss: 0.3244028687477112, mean loss: 0.33869502537931007
Epoch: 77, step: 1344, loss: 0.3318227231502533, mean loss: 0.33869496431009277
Epoch: 77, step: 1345, loss: 0.34188342094421387, mean loss: 0.33869499264336655
Epoch: 77, step: 1346, loss: 0.36548835039138794, mean loss: 0.3386952307324744
Epoch: 77, step: 1347, loss: 0.3134380280971527, mean loss: 0.3386950062958262
Epoch: 77, step: 1348, loss: 0.33925244212150574, mean loss: 0.3386950112491822
Epoch: 77, step: 1349, loss: 0.34154537320137024, mean loss: 0.3386950365771777
Epoch: 77, step: 1350, loss: 0.35668590664863586, mean loss: 0.3386951964406035
Epoch: 77, step: 1351, loss: 0.30790281295776367, mean loss: 0.3386949228278126
Epoch: 77, step: 1352, loss: 0.3421548902988434, mean loss: 0.3386949535718745
Epoch: 77, step: 1353, loss: 0.3341638743877411, mean loss: 0.33869491331064594
Epoch: 77, step: 1354, loss: 0.37004172801971436, mean loss: 0.3386951918425378
Epoch: 77, step: 1355, loss: 0.3052824139595032, mean loss: 0.3386948949561833
Epoch: 77, step: 1356, loss: 0.34457939863204956, mean loss: 0.33869494724196836
Epoch: 77, step: 1357, loss: 0.31985652446746826, mean loss: 0.33869477985776303
Epoch: 77, step: 1358, loss: 0.3256931006908417, mean loss: 0.3386946643355442
Epoch: 77, step: 1359, loss: 0.3305031359195709, mean loss: 0.3386945915530121
Epoch: 77, step: 1360, loss: 0.30134037137031555, mean loss: 0.33869425966005723
Epoch: 77, step: 1361, loss: 0.3542080819606781, mean loss: 0.33869439749943797
Epoch: 77, step: 1362, loss: 0.322945773601532, mean loss: 0.33869425757510235
Epoch: 77, step: 1363, loss: 0.34813234210014343, mean loss: 0.3386943414304272
Epoch: 77, step: 1364, loss: 0.3124014437198639, mean loss: 0.3386941078258346
Epoch: 77, step: 1365, loss: 0.3301861882209778, mean loss: 0.33869403223616557
Epoch: 77, step: 1366, loss: 0.3355579674243927, mean loss: 0.3386940043736556
Epoch: 77, step: 1367, loss: 0.3501127064228058, mean loss: 0.3386941058227303
Epoch: 77, step: 1368, loss: 0.3295290470123291, mean loss: 0.3386940243967967
Epoch: 77, step: 1369, loss: 0.32550719380378723, mean loss: 0.33869390724092513
Epoch: 77, step: 1370, loss: 0.31510546803474426, mean loss: 0.3386936976758152
Epoch: 77, step: 1371, loss: 0.29602450132369995, mean loss: 0.33869331859624563
Epoch: 77, step: 1372, loss: 0.3268740773200989, mean loss: 0.3386932135932581
Epoch: 77, step: 1373, loss: 0.30338820815086365, mean loss: 0.33869289994384316
Epoch: 77, step: 1374, loss: 0.3232579529285431, mean loss: 0.3386927628211029
Epoch: 77, step: 1375, loss: 0.33355003595352173, mean loss: 0.3386927171339661
Epoch: 77, step: 1376, loss: 0.36198902130126953, mean loss: 0.33869292409264923
Epoch: 77, step: 1377, loss: 0.39041224122047424, mean loss: 0.33869338355036405
Epoch: 77, step: 1378, loss: 0.3306361734867096, mean loss: 0.3386933119733471
Epoch: 77, step: 1379, loss: 0.3203776776790619, mean loss: 0.3386931492660565
Epoch: 77, step: 1380, loss: 0.3936016261577606, mean loss: 0.33869363704223726
Epoch: 77, step: 1381, loss: 0.33810552954673767, mean loss: 0.3386936318178658
Epoch: 77, step: 1382, loss: 0.31385883688926697, mean loss: 0.3386934112033654
Epoch: 77, step: 1383, loss: 0.33992886543273926, mean loss: 0.3386934221781569
Epoch: 77, step: 1384, loss: 0.3151938021183014, mean loss: 0.3386932134281008
Epoch: 77, step: 1385, loss: 0.29577547311782837, mean loss: 0.33869283218784724
Epoch: 77, step: 1386, loss: 0.3579610288143158, mean loss: 0.3386930033466003
Epoch: 77, step: 1387, loss: 0.34554368257522583, mean loss: 0.3386930642004166
Epoch: 77, step: 1388, loss: 0.3157649338245392, mean loss: 0.3386928605342115
Epoch: 77, step: 1389, loss: 0.341560423374176, mean loss: 0.3386928860059985
Epoch: 77, step: 1390, loss: 0.3653358817100525, mean loss: 0.33869312266643875
Epoch: 77, step: 1391, loss: 0.31173744797706604, mean loss: 0.3386928832307069
Epoch: 77, step: 1392, loss: 0.34745684266090393, mean loss: 0.3386929610765195
Epoch: 77, step: 1393, loss: 0.30387312173843384, mean loss: 0.33869265179227037
Epoch: 77, step: 1394, loss: 0.33939477801322937, mean loss: 0.33869265802879117
Epoch: 77, step: 1395, loss: 0.3156919777393341, mean loss: 0.33869245373084217
Epoch: 77, step: 1396, loss: 0.3485138714313507, mean loss: 0.33869254096642154
Epoch: 77, step: 1397, loss: 0.3734879493713379, mean loss: 0.33869285002268434
Epoch: 77, step: 1398, loss: 0.31448718905448914, mean loss: 0.33869263502751645
Epoch: 77, step: 1399, loss: 0.34399983286857605, mean loss: 0.33869268216573584
Epoch: 77, step: 1400, loss: 0.36240923404693604, mean loss: 0.33869289281288506
Epoch: 77, step: 1401, loss: 0.3213575780391693, mean loss: 0.338692738844373
Epoch: 77, step: 1402, loss: 0.38317838311195374, mean loss: 0.3386931339527233
Epoch: 77, step: 1403, loss: 0.3662486672401428, mean loss: 0.33869337869065574
Epoch: 77, step: 1404, loss: 0.33085760474205017, mean loss: 0.3386933090968626
Epoch: 77, step: 1405, loss: 0.35666343569755554, mean loss: 0.33869346869796574
Epoch: 77, step: 1406, loss: 0.3600670397281647, mean loss: 0.3386936585249654
Epoch: 77, step: 1407, loss: 0.3277669847011566, mean loss: 0.33869356148178603
Epoch: 77, step: 1408, loss: 0.3167424499988556, mean loss: 0.3386933665288878
Epoch: 77, step: 1409, loss: 0.35929253697395325, mean loss: 0.33869354947326025
Epoch: 77, step: 1410, loss: 0.3290329575538635, mean loss: 0.33869346367683295
Epoch: 77, step: 1411, loss: 0.3158552348613739, mean loss: 0.33869326085064455
Epoch: 77, step: 1412, loss: 0.2805249094963074, mean loss: 0.33869274426241397
Epoch: 77, step: 1413, loss: 0.31932950019836426, mean loss: 0.338692572300601
Epoch: 77, step: 1414, loss: 0.33115696907043457, mean loss: 0.33869250537873186
Epoch: 77, step: 1415, loss: 0.29908666014671326, mean loss: 0.3386921536519261
Epoch: 77, step: 1416, loss: 0.3152782917022705, mean loss: 0.338691945722776
Epoch: 77, step: 1417, loss: 0.3313823342323303, mean loss: 0.33869188080961427
Epoch: 77, step: 1418, loss: 0.2925123870372772, mean loss: 0.33869147071527045
Epoch: 77, step: 1419, loss: 0.36338916420936584, mean loss: 0.33869169003977223
Epoch: 77, step: 1420, loss: 0.32767772674560547, mean loss: 0.3386915922326405
Epoch: 77, step: 1421, loss: 0.33093738555908203, mean loss: 0.33869152337368774
Epoch: 77, step: 1422, loss: 0.3366323411464691, mean loss: 0.3386915050878877
Epoch: 77, step: 1423, loss: 0.3242871165275574, mean loss: 0.33869137717622144
Epoch: 77, step: 1424, loss: 0.37924501299858093, mean loss: 0.3386917372912687
Epoch: 77, step: 1425, loss: 0.292287141084671, mean loss: 0.33869132522353107
Epoch: 77, step: 1426, loss: 0.3314850628376007, mean loss: 0.3386912612332777
Epoch: 77, step: 1427, loss: 0.3215361535549164, mean loss: 0.3386911089005037
Epoch: 77, step: 1428, loss: 0.3120626211166382, mean loss: 0.33869087244874435
Epoch: 77, step: 1429, loss: 0.3030531108379364, mean loss: 0.33869055600056014
Epoch: 77, step: 1430, loss: 0.3227199614048004, mean loss: 0.3386904141897236
Epoch: 77, step: 1431, loss: 0.3650607764720917, mean loss: 0.33869064834318025
Epoch: 77, step: 1432, loss: 0.32787778973579407, mean loss: 0.33869055233214673
Epoch: 77, step: 1433, loss: 0.3240445554256439, mean loss: 0.3386904222865348
Epoch: 77, step: 1434, loss: 0.3420765995979309, mean loss: 0.338690452353016
Epoch: 77, step: 1435, loss: 0.3380107581615448, mean loss: 0.3386904463179418
Epoch: 77, step: 1436, loss: 0.32354992628097534, mean loss: 0.3386903118849115
Epoch: 77, step: 1437, loss: 0.32548755407333374, mean loss: 0.33869019465835803
Epoch: 77, step: 1438, loss: 0.32383695244789124, mean loss: 0.3386900627784162
Epoch: 77, step: 1439, loss: 0.3496732711791992, mean loss: 0.338690160295982
Epoch: 77, step: 1440, loss: 0.32032346725463867, mean loss: 0.3386899972234781
Epoch: 77, step: 1441, loss: 0.35886234045028687, mean loss: 0.3386901763262325
Epoch: 77, step: 1442, loss: 0.31140926480293274, mean loss: 0.338689934111287
Epoch: 77, step: 1443, loss: 0.3641437590122223, mean loss: 0.3386901601023455
Valid: 77, mean loss: 0.18511075278123218
Epoch: 78, step: 0, loss: 0.34870657324790955, mean loss: 0.3386902490319944
Epoch: 78, step: 1, loss: 0.36096811294555664, mean loss: 0.3386904468218617
Epoch: 78, step: 2, loss: 0.3300323188304901, mean loss: 0.3386903699529667
Epoch: 78, step: 3, loss: 0.316417396068573, mean loss: 0.33869017221002584
Epoch: 78, step: 4, loss: 0.3255646824836731, mean loss: 0.3386900556809126
Epoch: 78, step: 5, loss: 0.35392212867736816, mean loss: 0.3386901909112345
Epoch: 78, step: 6, loss: 0.32032260298728943, mean loss: 0.3386900278452633
Epoch: 78, step: 7, loss: 0.3814784586429596, mean loss: 0.33869040771414466
Epoch: 78, step: 8, loss: 0.3103429973125458, mean loss: 0.3386901560525791
Epoch: 78, step: 9, loss: 0.3450726568698883, mean loss: 0.3386902127143999
Epoch: 78, step: 10, loss: 0.39183881878852844, mean loss: 0.33869068454670265
Epoch: 78, step: 11, loss: 0.31175658106803894, mean loss: 0.338690445438508
Epoch: 78, step: 12, loss: 0.3044430911540985, mean loss: 0.3386901414094407
Epoch: 78, step: 13, loss: 0.34445488452911377, mean loss: 0.338690192585187
Epoch: 78, step: 14, loss: 0.2959912419319153, mean loss: 0.3386898135342522
Epoch: 78, step: 15, loss: 0.3216385245323181, mean loss: 0.3386896621663717
Epoch: 78, step: 16, loss: 0.3203921616077423, mean loss: 0.3386894997370509
Epoch: 78, step: 17, loss: 0.34163594245910645, mean loss: 0.3386895258927786
Epoch: 78, step: 18, loss: 0.3125288784503937, mean loss: 0.338689293665391
Epoch: 78, step: 19, loss: 0.35882240533828735, mean loss: 0.33868947238491376
Epoch: 78, step: 20, loss: 0.29905012249946594, mean loss: 0.3386891205136819
Epoch: 78, step: 21, loss: 0.30844756960868835, mean loss: 0.33868885206736926
Epoch: 78, step: 22, loss: 0.3427126407623291, mean loss: 0.3386888877851687
Epoch: 78, step: 23, loss: 0.3428070843219757, mean loss: 0.33868892434066983
Epoch: 78, step: 24, loss: 0.32883042097091675, mean loss: 0.33868883683165246
Epoch: 78, step: 25, loss: 0.3712741434574127, mean loss: 0.3386891260725996
Epoch: 78, step: 26, loss: 0.28176766633987427, mean loss: 0.3386886208181616
Epoch: 78, step: 27, loss: 0.3047535717487335, mean loss: 0.3386883196016777
Epoch: 78, step: 28, loss: 0.32337918877601624, mean loss: 0.33868818371498377
Epoch: 78, step: 29, loss: 0.30447256565093994, mean loss: 0.3386878800134867
Epoch: 78, step: 30, loss: 0.3266414403915405, mean loss: 0.3386877730889452
Epoch: 78, step: 31, loss: 0.3535080552101135, mean loss: 0.33868790463302423
Epoch: 78, step: 32, loss: 0.3358648419380188, mean loss: 0.3386878795758841
Epoch: 78, step: 33, loss: 0.3452177345752716, mean loss: 0.33868793753351994
Epoch: 78, step: 34, loss: 0.33910709619522095, mean loss: 0.3386879412538521
Epoch: 78, step: 35, loss: 0.3020024001598358, mean loss: 0.33868761564639394
Epoch: 78, step: 36, loss: 0.35523971915245056, mean loss: 0.33868776255551275
Epoch: 78, step: 37, loss: 0.29483336210250854, mean loss: 0.33868737332678767
Epoch: 78, step: 38, loss: 0.30591556429862976, mean loss: 0.3386870824639301
Epoch: 78, step: 39, loss: 0.3169674575328827, mean loss: 0.3386868896953192
Epoch: 78, step: 40, loss: 0.3192266821861267, mean loss: 0.33868671698129266
Epoch: 78, step: 41, loss: 0.3553730547428131, mean loss: 0.338686865075243
Epoch: 78, step: 42, loss: 0.3197901248931885, mean loss: 0.3386866973651016
Epoch: 78, step: 43, loss: 0.3272518217563629, mean loss: 0.33868659588052985
Epoch: 78, step: 44, loss: 0.3509470224380493, mean loss: 0.3386867046909043
Epoch: 78, step: 45, loss: 0.33298903703689575, mean loss: 0.3386866541249761
Epoch: 78, step: 46, loss: 0.34619492292404175, mean loss: 0.3386867207591209
Epoch: 78, step: 47, loss: 0.31753018498420715, mean loss: 0.3386865330014374
Epoch: 78, step: 48, loss: 0.3595931828022003, mean loss: 0.3386867185398139
Epoch: 78, step: 49, loss: 0.3375425338745117, mean loss: 0.33868670838571063
Epoch: 78, step: 50, loss: 0.33185237646102905, mean loss: 0.33868664773475243
Epoch: 78, step: 51, loss: 0.3289843797683716, mean loss: 0.3386865616331944
Epoch: 78, step: 52, loss: 0.31194043159484863, mean loss: 0.3386863242801302
Epoch: 78, step: 53, loss: 0.34955456852912903, mean loss: 0.33868642072728644
Epoch: 78, step: 54, loss: 0.33211028575897217, mean loss: 0.3386863623697566
Epoch: 78, step: 55, loss: 0.3577761650085449, mean loss: 0.33868653177379815
Epoch: 78, step: 56, loss: 0.3384484052658081, mean loss: 0.33868652966066815
Epoch: 78, step: 57, loss: 0.3305582106113434, mean loss: 0.33868645753076265
Epoch: 78, step: 58, loss: 0.3420526087284088, mean loss: 0.33868648740139295
Epoch: 78, step: 59, loss: 0.29495444893836975, mean loss: 0.3386860993344631
Epoch: 78, step: 60, loss: 0.33398759365081787, mean loss: 0.33868605764149473
Epoch: 78, step: 61, loss: 0.37012234330177307, mean loss: 0.33868633659410674
Epoch: 78, step: 62, loss: 0.35470396280288696, mean loss: 0.3386864787266433
Epoch: 78, step: 63, loss: 0.3311326503753662, mean loss: 0.33868641169828073
Epoch: 78, step: 64, loss: 0.3071294128894806, mean loss: 0.3386861316819643
Epoch: 78, step: 65, loss: 0.37935227155685425, mean loss: 0.33868649252368177
Epoch: 78, step: 66, loss: 0.32125091552734375, mean loss: 0.3386863378144386
Epoch: 78, step: 67, loss: 0.40457454323768616, mean loss: 0.33868692244802706
Epoch: 78, step: 68, loss: 0.335997998714447, mean loss: 0.3386868985891107
Epoch: 78, step: 69, loss: 0.3352218568325043, mean loss: 0.3386868678439442
Epoch: 78, step: 70, loss: 0.33527672290802, mean loss: 0.33868683758614326
Epoch: 78, step: 71, loss: 0.3461487591266632, mean loss: 0.3386869037942773
Epoch: 78, step: 72, loss: 0.3101232051849365, mean loss: 0.33868665035655393
Epoch: 78, step: 73, loss: 0.31379958987236023, mean loss: 0.33868642954257344
Epoch: 78, step: 74, loss: 0.3367863595485687, mean loss: 0.338686412684082
Epoch: 78, step: 75, loss: 0.3376774191856384, mean loss: 0.3386864037318027
Epoch: 78, step: 76, loss: 0.37360429763793945, mean loss: 0.33868671353753166
Epoch: 78, step: 77, loss: 0.38266676664352417, mean loss: 0.3386871037429536
Epoch: 78, step: 78, loss: 0.3425382375717163, mean loss: 0.3386871379111699
Epoch: 78, step: 79, loss: 0.3262495696544647, mean loss: 0.3386870275629527
Epoch: 78, step: 80, loss: 0.33362236618995667, mean loss: 0.3386869826288158
Epoch: 78, step: 81, loss: 0.3397301733493805, mean loss: 0.33868699188401674
Epoch: 78, step: 82, loss: 0.33661186695098877, mean loss: 0.33868697347364607
Epoch: 78, step: 83, loss: 0.32379233837127686, mean loss: 0.3386868413306042
Epoch: 78, step: 84, loss: 0.32809513807296753, mean loss: 0.33868674736338317
Epoch: 78, step: 85, loss: 0.34287676215171814, mean loss: 0.33868678453592693
Epoch: 78, step: 86, loss: 0.3227737545967102, mean loss: 0.33868664336159127
Epoch: 78, step: 87, loss: 0.36657604575157166, mean loss: 0.3386868907835429
Epoch: 78, step: 88, loss: 0.32612213492393494, mean loss: 0.3386867793157964
Epoch: 78, step: 89, loss: 0.3334237039089203, mean loss: 0.3386867326250403
Epoch: 78, step: 90, loss: 0.3147202432155609, mean loss: 0.3386865200110271
Epoch: 78, step: 91, loss: 0.3743163049221039, mean loss: 0.33868683609087624
Epoch: 78, step: 92, loss: 0.34725067019462585, mean loss: 0.338686912061904
Epoch: 78, step: 93, loss: 0.32665786147117615, mean loss: 0.33868680535137946
Epoch: 78, step: 94, loss: 0.32342904806137085, mean loss: 0.33868666999997926
Epoch: 78, step: 95, loss: 0.3765168786048889, mean loss: 0.3386870055883744
Epoch: 78, step: 96, loss: 0.34981536865234375, mean loss: 0.3386871043062115
Epoch: 78, step: 97, loss: 0.31978869438171387, mean loss: 0.3386869366630826
Epoch: 78, step: 98, loss: 0.2927229404449463, mean loss: 0.3386865289314363
Epoch: 78, step: 99, loss: 0.28878408670425415, mean loss: 0.3386860862670444
Epoch: 78, step: 100, loss: 0.33108875155448914, mean loss: 0.3386860188747572
Epoch: 78, step: 101, loss: 0.3505067527294159, mean loss: 0.3386861237298484
Epoch: 78, step: 102, loss: 0.3527350127696991, mean loss: 0.3386862483485475
Epoch: 78, step: 103, loss: 0.30688074231147766, mean loss: 0.33868596622477126
Epoch: 78, step: 104, loss: 0.321585476398468, mean loss: 0.33868581453996655
Epoch: 78, step: 105, loss: 0.3179449141025543, mean loss: 0.33868563056561507
Epoch: 78, step: 106, loss: 0.32198861241340637, mean loss: 0.33868548246231317
Epoch: 78, step: 107, loss: 0.37432023882865906, mean loss: 0.338685798541401
Epoch: 78, step: 108, loss: 0.3531464636325836, mean loss: 0.3386859268058753
Epoch: 78, step: 109, loss: 0.3263775408267975, mean loss: 0.3386858176328432
Epoch: 78, step: 110, loss: 0.2996124029159546, mean loss: 0.3386854710621939
Epoch: 78, step: 111, loss: 0.32599201798439026, mean loss: 0.3386853584756875
Epoch: 78, step: 112, loss: 0.3315800130367279, mean loss: 0.3386852954543079
Epoch: 78, step: 113, loss: 0.32687851786613464, mean loss: 0.33868519073416187
Epoch: 78, step: 114, loss: 0.3014718294143677, mean loss: 0.33868486067339465
Epoch: 78, step: 115, loss: 0.3173940181732178, mean loss: 0.33868467183773904
Epoch: 78, step: 116, loss: 0.33217886090278625, mean loss: 0.33868461413602163
Epoch: 78, step: 117, loss: 0.32112735509872437, mean loss: 0.3386844584175379
Epoch: 78, step: 118, loss: 0.37878409028053284, mean loss: 0.33868481406522055
Epoch: 78, step: 119, loss: 0.35577183961868286, mean loss: 0.3386849656104309
Epoch: 78, step: 120, loss: 0.3109376132488251, mean loss: 0.33868471952072715
Epoch: 78, step: 121, loss: 0.3090718388557434, mean loss: 0.3386844568880874
Epoch: 78, step: 122, loss: 0.3152145445346832, mean loss: 0.3386842487384501
Epoch: 78, step: 123, loss: 0.3111945688724518, mean loss: 0.3386840049405159
Epoch: 78, step: 124, loss: 0.3276679515838623, mean loss: 0.33868390724322567
Epoch: 78, step: 125, loss: 0.35508692264556885, mean loss: 0.3386840527141936
Epoch: 78, step: 126, loss: 0.3211430609226227, mean loss: 0.3386838971524044
Epoch: 78, step: 127, loss: 0.3019416034221649, mean loss: 0.33868357130730214
Epoch: 78, step: 128, loss: 0.2930728495121002, mean loss: 0.33868316681708127
Epoch: 78, step: 129, loss: 0.34594014286994934, mean loss: 0.3386832311736558
Epoch: 78, step: 130, loss: 0.344839870929718, mean loss: 0.3386832857717044
Epoch: 78, step: 131, loss: 0.3294789493083954, mean loss: 0.33868320414692643
Epoch: 78, step: 132, loss: 0.32709234952926636, mean loss: 0.33868310135922974
Epoch: 78, step: 133, loss: 0.3055359721183777, mean loss: 0.33868280741310025
Epoch: 78, step: 134, loss: 0.32857638597488403, mean loss: 0.3386827177909463
Epoch: 78, step: 135, loss: 0.29055580496788025, mean loss: 0.3386822910128459
Epoch: 78, step: 136, loss: 0.3195813298225403, mean loss: 0.3386821216315338
Epoch: 78, step: 137, loss: 0.3460685908794403, mean loss: 0.33868218713183745
Epoch: 78, step: 138, loss: 0.338329553604126, mean loss: 0.3386821840048498
Epoch: 78, step: 139, loss: 0.32416102290153503, mean loss: 0.33868205523918893
Epoch: 78, step: 140, loss: 0.31062015891075134, mean loss: 0.3386818064039506
Epoch: 78, step: 141, loss: 0.364338219165802, mean loss: 0.33868203390685697
Epoch: 78, step: 142, loss: 0.31026512384414673, mean loss: 0.33868178192804904
Epoch: 78, step: 143, loss: 0.3597029149532318, mean loss: 0.3386819683252703
Epoch: 78, step: 144, loss: 0.3433937132358551, mean loss: 0.3386820101045774
Epoch: 78, step: 145, loss: 0.29133856296539307, mean loss: 0.33868159031129197
Epoch: 78, step: 146, loss: 0.3482515513896942, mean loss: 0.33868167516717007
Epoch: 78, step: 147, loss: 0.30431315302848816, mean loss: 0.3386813704276583
Epoch: 78, step: 148, loss: 0.31676724553108215, mean loss: 0.3386811761207724
Epoch: 78, step: 149, loss: 0.3074116110801697, mean loss: 0.3386808988640733
Epoch: 78, step: 150, loss: 0.32216590642929077, mean loss: 0.33868075243249735
Epoch: 78, step: 151, loss: 0.32028356194496155, mean loss: 0.3386805893136996
Epoch: 78, step: 152, loss: 0.360132098197937, mean loss: 0.33868077951194303
Epoch: 78, step: 153, loss: 0.30304521322250366, mean loss: 0.3386804635545876
Epoch: 78, step: 154, loss: 0.3773704469203949, mean loss: 0.3386808065904283
Epoch: 78, step: 155, loss: 0.3398740589618683, mean loss: 0.3386808171700323
Epoch: 78, step: 156, loss: 0.3476528525352478, mean loss: 0.33868089671711016
Epoch: 78, step: 157, loss: 0.32501694560050964, mean loss: 0.33868077557205195
Epoch: 78, step: 158, loss: 0.3338528275489807, mean loss: 0.33868073276767907
Epoch: 78, step: 159, loss: 0.36003100872039795, mean loss: 0.33868092205659983
Epoch: 78, step: 160, loss: 0.33918824791908264, mean loss: 0.33868092655444865
Epoch: 78, step: 161, loss: 0.31673577427864075, mean loss: 0.3386807319948774
Epoch: 78, step: 162, loss: 0.32490184903144836, mean loss: 0.3386806098362448
Epoch: 78, step: 163, loss: 0.3808741569519043, mean loss: 0.33868098390577844
Epoch: 78, step: 164, loss: 0.3452696204185486, mean loss: 0.3386810423172301
Epoch: 78, step: 165, loss: 0.3924657106399536, mean loss: 0.3386815191401199
Epoch: 78, step: 166, loss: 0.3263046443462372, mean loss: 0.33868140941507985
Epoch: 78, step: 167, loss: 0.33385196328163147, mean loss: 0.3386813666008411
Epoch: 78, step: 168, loss: 0.35446396470069885, mean loss: 0.3386815065162505
Epoch: 78, step: 169, loss: 0.3154242932796478, mean loss: 0.33868130033893773
Epoch: 78, step: 170, loss: 0.325039267539978, mean loss: 0.33868117940214704
Epoch: 78, step: 171, loss: 0.33008888363838196, mean loss: 0.33868110323201334
Epoch: 78, step: 172, loss: 0.29480013251304626, mean loss: 0.33868071423355833
Epoch: 78, step: 173, loss: 0.3193392753601074, mean loss: 0.3386805427760217
Epoch: 78, step: 174, loss: 0.31823620200157166, mean loss: 0.33868036154311265
Epoch: 78, step: 175, loss: 0.33973199129104614, mean loss: 0.33868037086541025
Epoch: 78, step: 176, loss: 0.33239948749542236, mean loss: 0.3386803151882624
Epoch: 78, step: 177, loss: 0.32449451088905334, mean loss: 0.338680189438734
Epoch: 78, step: 178, loss: 0.30463045835494995, mean loss: 0.33867988760884965
Epoch: 78, step: 179, loss: 0.33390143513679504, mean loss: 0.3386798452511885
Epoch: 78, step: 180, loss: 0.315367192029953, mean loss: 0.33867963860254674
Epoch: 78, step: 181, loss: 0.31915104389190674, mean loss: 0.33867946549819167
Epoch: 78, step: 182, loss: 0.3555099368095398, mean loss: 0.338679614684659
Epoch: 78, step: 183, loss: 0.31299078464508057, mean loss: 0.3386793869791027
Epoch: 78, step: 184, loss: 0.29124385118484497, mean loss: 0.338678966514671
Epoch: 78, step: 185, loss: 0.315582811832428, mean loss: 0.3386787617941948
Epoch: 78, step: 186, loss: 0.3331546485424042, mean loss: 0.33867871282980716
Epoch: 78, step: 187, loss: 0.3219553232192993, mean loss: 0.3386785645990891
Epoch: 78, step: 188, loss: 0.3590700626373291, mean loss: 0.3386787453411322
Epoch: 78, step: 189, loss: 0.33287835121154785, mean loss: 0.33867869392922556
Epoch: 78, step: 190, loss: 0.3163889944553375, mean loss: 0.33867849636579017
Epoch: 78, step: 191, loss: 0.34464943408966064, mean loss: 0.3386785492883751
Epoch: 78, step: 192, loss: 0.33424651622772217, mean loss: 0.33867851000600807
Epoch: 78, step: 193, loss: 0.336978554725647, mean loss: 0.33867849493895547
Epoch: 78, step: 194, loss: 0.30634382367134094, mean loss: 0.3386782083526661
Epoch: 78, step: 195, loss: 0.35148605704307556, mean loss: 0.3386783218692461
Epoch: 78, step: 196, loss: 0.31722474098205566, mean loss: 0.3386781317268103
Epoch: 78, step: 197, loss: 0.3139561116695404, mean loss: 0.33867791261823943
Epoch: 78, step: 198, loss: 0.3292798697948456, mean loss: 0.3386778293251478
Epoch: 78, step: 199, loss: 0.35435643792152405, mean loss: 0.3386779682804849
Epoch: 78, step: 200, loss: 0.33271524310112, mean loss: 0.3386779154349062
Epoch: 78, step: 201, loss: 0.3327796757221222, mean loss: 0.33867786316130327
Epoch: 78, step: 202, loss: 0.305919885635376, mean loss: 0.33867757284378186
Epoch: 78, step: 203, loss: 0.29279664158821106, mean loss: 0.3386771662277085
Epoch: 78, step: 204, loss: 0.3160252571105957, mean loss: 0.33867696547875986
Epoch: 78, step: 205, loss: 0.3019160032272339, mean loss: 0.3386766396934548
Epoch: 78, step: 206, loss: 0.32760000228881836, mean loss: 0.33867654153025406
Epoch: 78, step: 207, loss: 0.3353261649608612, mean loss: 0.338676511838863
Epoch: 78, step: 208, loss: 0.3587203323841095, mean loss: 0.3386766894677439
Epoch: 78, step: 209, loss: 0.3263239860534668, mean loss: 0.3386765799987216
Epoch: 78, step: 210, loss: 0.2939321994781494, mean loss: 0.33867618347983675
Epoch: 78, step: 211, loss: 0.34039828181266785, mean loss: 0.3386761987407131
Epoch: 78, step: 212, loss: 0.32483914494514465, mean loss: 0.338676076120714
Epoch: 78, step: 213, loss: 0.34380680322647095, mean loss: 0.338676121587342
Epoch: 78, step: 214, loss: 0.333786278963089, mean loss: 0.3386760782557282
Epoch: 78, step: 215, loss: 0.35271474719047546, mean loss: 0.3386762026590755
Epoch: 78, step: 216, loss: 0.31832394003868103, mean loss: 0.33867602230955873
Epoch: 78, step: 217, loss: 0.3384893536567688, mean loss: 0.338676020655428
Epoch: 78, step: 218, loss: 0.314383864402771, mean loss: 0.3386758053967573
Epoch: 78, step: 219, loss: 0.30991604924201965, mean loss: 0.3386755505518617
Epoch: 78, step: 220, loss: 0.3317835330963135, mean loss: 0.33867548948111076
Epoch: 78, step: 221, loss: 0.3327614665031433, mean loss: 0.33867543707691616
Epoch: 78, step: 222, loss: 0.3215109705924988, mean loss: 0.338675284983819
Epoch: 78, step: 223, loss: 0.31370416283607483, mean loss: 0.33867506371847067
Epoch: 78, step: 224, loss: 0.31683605909347534, mean loss: 0.33867487020805814
Epoch: 78, step: 225, loss: 0.33527058362960815, mean loss: 0.3386748400437226
Epoch: 78, step: 226, loss: 0.33737269043922424, mean loss: 0.338674828505878
Epoch: 78, step: 227, loss: 0.37553876638412476, mean loss: 0.3386751551400963
Epoch: 78, step: 228, loss: 0.36471158266067505, mean loss: 0.3386753858347341
Epoch: 78, step: 229, loss: 0.30906689167022705, mean loss: 0.338675123492279
Epoch: 78, step: 230, loss: 0.32872873544692993, mean loss: 0.33867503536430044
Epoch: 78, step: 231, loss: 0.3175453543663025, mean loss: 0.33867484815065396
Epoch: 78, step: 232, loss: 0.3624192178249359, mean loss: 0.33867505852915636
Epoch: 78, step: 233, loss: 0.35448595881462097, mean loss: 0.3386751986147471
Epoch: 78, step: 234, loss: 0.30956360697746277, mean loss: 0.33867494068646303
Epoch: 78, step: 235, loss: 0.3028097152709961, mean loss: 0.338674622923896
Epoch: 78, step: 236, loss: 0.34099727869033813, mean loss: 0.3386746435022281
Epoch: 78, step: 237, loss: 0.3523942232131958, mean loss: 0.33867476505427657
Epoch: 78, step: 238, loss: 0.33974745869636536, mean loss: 0.33867477455799005
Epoch: 78, step: 239, loss: 0.32414036989212036, mean loss: 0.3386746457890778
Epoch: 78, step: 240, loss: 0.35365617275238037, mean loss: 0.3386747785181358
Epoch: 78, step: 241, loss: 0.37246769666671753, mean loss: 0.3386750779043377
Epoch: 78, step: 242, loss: 0.32149022817611694, mean loss: 0.338674925657607
Epoch: 78, step: 243, loss: 0.3201856017112732, mean loss: 0.33867476185552375
Epoch: 78, step: 244, loss: 0.34759604930877686, mean loss: 0.33867484089100003
Epoch: 78, step: 245, loss: 0.33818820118904114, mean loss: 0.3386748365797994
Epoch: 78, step: 246, loss: 0.3376297652721405, mean loss: 0.338674827321467
Epoch: 78, step: 247, loss: 0.3614000976085663, mean loss: 0.33867502864384724
Epoch: 78, step: 248, loss: 0.3243996798992157, mean loss: 0.3386749021801488
Epoch: 78, step: 249, loss: 0.34420421719551086, mean loss: 0.3386749511632906
Epoch: 78, step: 250, loss: 0.3211763799190521, mean loss: 0.33867479614817547
Epoch: 78, step: 251, loss: 0.3184463381767273, mean loss: 0.3386746169513188
Epoch: 78, step: 252, loss: 0.3172045946121216, mean loss: 0.3386744267575611
Epoch: 78, step: 253, loss: 0.34947794675827026, mean loss: 0.33867452246048263
Epoch: 78, step: 254, loss: 0.3125348687171936, mean loss: 0.3386742909045573
Epoch: 78, step: 255, loss: 0.31524986028671265, mean loss: 0.3386740834030459
Epoch: 78, step: 256, loss: 0.31735289096832275, mean loss: 0.33867389453440117
Epoch: 78, step: 257, loss: 0.3648624122142792, mean loss: 0.33867412651701856
Epoch: 78, step: 258, loss: 0.34977439045906067, mean loss: 0.3386742248442895
Epoch: 78, step: 259, loss: 0.32017919421195984, mean loss: 0.3386740610148717
Epoch: 78, step: 260, loss: 0.29767677187919617, mean loss: 0.3386736978631339
Epoch: 78, step: 261, loss: 0.30595263838768005, mean loss: 0.3386734080243517
Epoch: 78, step: 262, loss: 0.33723658323287964, mean loss: 0.338673395297262
Epoch: 78, step: 263, loss: 0.30517926812171936, mean loss: 0.3386730986160051
Epoch: 78, step: 264, loss: 0.329291969537735, mean loss: 0.3386730155214226
Epoch: 78, step: 265, loss: 0.35421666502952576, mean loss: 0.33867315320011937
Epoch: 78, step: 266, loss: 0.3014407157897949, mean loss: 0.3386728234147589
Epoch: 78, step: 267, loss: 0.3539818227291107, mean loss: 0.33867295901262706
Epoch: 78, step: 268, loss: 0.3034365177154541, mean loss: 0.3386726469122799
Epoch: 78, step: 269, loss: 0.30023548007011414, mean loss: 0.3386723064651059
Epoch: 78, step: 270, loss: 0.32242655754089355, mean loss: 0.33867216257389904
Epoch: 78, step: 271, loss: 0.3332129716873169, mean loss: 0.33867211422139704
Epoch: 78, step: 272, loss: 0.29410722851753235, mean loss: 0.33867171951004055
Epoch: 78, step: 273, loss: 0.36482733488082886, mean loss: 0.33867195116837023
Epoch: 78, step: 274, loss: 0.29804834723472595, mean loss: 0.33867159137133435
Epoch: 78, step: 275, loss: 0.31469470262527466, mean loss: 0.3386713790135851
Epoch: 78, step: 276, loss: 0.30792176723480225, mean loss: 0.338671106673809
Epoch: 78, step: 277, loss: 0.3476954996585846, mean loss: 0.33867118659935136
Epoch: 78, step: 278, loss: 0.35524460673332214, mean loss: 0.3386713333823941
Epoch: 78, step: 279, loss: 0.3075419068336487, mean loss: 0.3386710576860416
Epoch: 78, step: 280, loss: 0.4444410800933838, mean loss: 0.33867199442514523
Epoch: 78, step: 281, loss: 0.38093769550323486, mean loss: 0.33867236874277706
Epoch: 78, step: 282, loss: 0.3167012631893158, mean loss: 0.33867217416184847
Epoch: 78, step: 283, loss: 0.3275527358055115, mean loss: 0.33867207568653623
Epoch: 78, step: 284, loss: 0.3244496285915375, mean loss: 0.33867194973165704
Epoch: 78, step: 285, loss: 0.36391380429267883, mean loss: 0.3386721732731169
Epoch: 78, step: 286, loss: 0.311269611120224, mean loss: 0.33867193059861433
Epoch: 78, step: 287, loss: 0.3655086159706116, mean loss: 0.33867216825966084
Epoch: 78, step: 288, loss: 0.3305170238018036, mean loss: 0.33867209603975085
Epoch: 78, step: 289, loss: 0.31496521830558777, mean loss: 0.33867188609945814
Epoch: 78, step: 290, loss: 0.3225693702697754, mean loss: 0.33867174350214996
Epoch: 78, step: 291, loss: 0.3729517161846161, mean loss: 0.33867204706890885
Epoch: 78, step: 292, loss: 0.2907086908817291, mean loss: 0.3386716223325246
Epoch: 78, step: 293, loss: 0.33707720041275024, mean loss: 0.33867160821334996
Epoch: 78, step: 294, loss: 0.32104671001434326, mean loss: 0.33867145213997335
Epoch: 78, step: 295, loss: 0.34404563903808594, mean loss: 0.33867149972947197
Epoch: 78, step: 296, loss: 0.3669312000274658, mean loss: 0.3386717499725477
Epoch: 78, step: 297, loss: 0.35124024748802185, mean loss: 0.33867186126713295
Epoch: 78, step: 298, loss: 0.3413248360157013, mean loss: 0.33867188475913024
Epoch: 78, step: 299, loss: 0.30798450112342834, mean loss: 0.33867161302584264
Epoch: 78, step: 300, loss: 0.31074240803718567, mean loss: 0.33867136571810275
Epoch: 78, step: 301, loss: 0.3091680407524109, mean loss: 0.3386711044741464
Epoch: 78, step: 302, loss: 0.3785735070705414, mean loss: 0.33867145779599167
Epoch: 78, step: 303, loss: 0.33899930119514465, mean loss: 0.3386714606989048
Epoch: 78, step: 304, loss: 0.3438766598701477, mean loss: 0.33867150678831015
Epoch: 78, step: 305, loss: 0.3978154957294464, mean loss: 0.3386720304737742
Epoch: 78, step: 306, loss: 0.3393383026123047, mean loss: 0.33867203637317245
Epoch: 78, step: 307, loss: 0.3449520468711853, mean loss: 0.3386720919780113
Epoch: 78, step: 308, loss: 0.3437734842300415, mean loss: 0.3386721371466591
Epoch: 78, step: 309, loss: 0.32655030488967896, mean loss: 0.3386720298187186
Epoch: 78, step: 310, loss: 0.3027055859565735, mean loss: 0.3386717113709718
Epoch: 78, step: 311, loss: 0.33541154861450195, mean loss: 0.33867168250566904
Epoch: 78, step: 312, loss: 0.2876286804676056, mean loss: 0.33867123057772147
Epoch: 78, step: 313, loss: 0.34966593980789185, mean loss: 0.338671327922552
Epoch: 78, step: 314, loss: 0.34750571846961975, mean loss: 0.3386714061396852
Epoch: 78, step: 315, loss: 0.35124820470809937, mean loss: 0.33867151749002844
Epoch: 78, step: 316, loss: 0.3291792869567871, mean loss: 0.3386714334500588
Epoch: 78, step: 317, loss: 0.35731804370880127, mean loss: 0.33867159853735634
Epoch: 78, step: 318, loss: 0.3546537458896637, mean loss: 0.3386717400336455
Epoch: 78, step: 319, loss: 0.35259145498275757, mean loss: 0.3386718632693115
Epoch: 78, step: 320, loss: 0.3047238290309906, mean loss: 0.33867156271922216
Epoch: 78, step: 321, loss: 0.3620142638683319, mean loss: 0.3386717693759244
Epoch: 78, step: 322, loss: 0.41799989342689514, mean loss: 0.33867247167439773
Epoch: 78, step: 323, loss: 0.31373122334480286, mean loss: 0.33867225086940883
Epoch: 78, step: 324, loss: 0.32150956988334656, mean loss: 0.3386720989294584
Epoch: 78, step: 325, loss: 0.31499332189559937, mean loss: 0.3386718893048454
Epoch: 78, step: 326, loss: 0.38261324167251587, mean loss: 0.3386722783075133
Epoch: 78, step: 327, loss: 0.31330636143684387, mean loss: 0.3386720537508838
Epoch: 78, step: 328, loss: 0.37387093901634216, mean loss: 0.3386723653529877
Epoch: 78, step: 329, loss: 0.3909075856208801, mean loss: 0.33867282776707625
Epoch: 78, step: 330, loss: 0.33626747131347656, mean loss: 0.3386728064737638
Epoch: 78, step: 331, loss: 0.35215720534324646, mean loss: 0.3386729258427563
Epoch: 78, step: 332, loss: 0.33822017908096313, mean loss: 0.33867292183490644
Epoch: 78, step: 333, loss: 0.30783817172050476, mean loss: 0.33867264887888326
Epoch: 78, step: 334, loss: 0.3374394178390503, mean loss: 0.33867263796214614
Epoch: 78, step: 335, loss: 0.30966848134994507, mean loss: 0.3386723812154868
Epoch: 78, step: 336, loss: 0.3445517122745514, mean loss: 0.33867243325924273
Epoch: 78, step: 337, loss: 0.4036962687969208, mean loss: 0.3386730088442258
Epoch: 78, step: 338, loss: 0.3419834077358246, mean loss: 0.3386730381473115
Epoch: 78, step: 339, loss: 0.3544933497905731, mean loss: 0.33867317818476894
Epoch: 78, step: 340, loss: 0.35306990146636963, mean loss: 0.3386733056198488
Epoch: 78, step: 341, loss: 0.30590763688087463, mean loss: 0.33867301559144636
Epoch: 78, step: 342, loss: 0.3391200602054596, mean loss: 0.33867301954846885
Epoch: 78, step: 343, loss: 0.35795846581459045, mean loss: 0.3386731902523906
Epoch: 78, step: 344, loss: 0.3513709306716919, mean loss: 0.3386733026446512
Epoch: 78, step: 345, loss: 0.33076176047325134, mean loss: 0.33867323261737003
Epoch: 78, step: 346, loss: 0.3302246332168579, mean loss: 0.33867315783710644
Epoch: 78, step: 347, loss: 0.33737048506736755, mean loss: 0.3386731463069881
Epoch: 78, step: 348, loss: 0.30063310265541077, mean loss: 0.33867280961282137
Epoch: 78, step: 349, loss: 0.3014887869358063, mean loss: 0.33867248049824844
Epoch: 78, step: 350, loss: 0.29696568846702576, mean loss: 0.3386721113560586
Epoch: 78, step: 351, loss: 0.3423374891281128, mean loss: 0.33867214379762356
Epoch: 78, step: 352, loss: 0.3459102213382721, mean loss: 0.3386722078599109
Epoch: 78, step: 353, loss: 0.30304154753685, mean loss: 0.33867189250526236
Epoch: 78, step: 354, loss: 0.3366837203502655, mean loss: 0.33867187490879413
Epoch: 78, step: 355, loss: 0.3848801255226135, mean loss: 0.338672283874796
Epoch: 78, step: 356, loss: 0.3646480441093445, mean loss: 0.33867251377115964
Epoch: 78, step: 357, loss: 0.34932610392570496, mean loss: 0.3386726080590626
Epoch: 78, step: 358, loss: 0.3085705041885376, mean loss: 0.33867234164754423
Epoch: 78, step: 359, loss: 0.3329348564147949, mean loss: 0.33867229086974376
Epoch: 78, step: 360, loss: 0.32784074544906616, mean loss: 0.33867219500942125
Epoch: 78, step: 361, loss: 0.37072890996932983, mean loss: 0.3386724787122281
Epoch: 78, step: 362, loss: 0.3281797170639038, mean loss: 0.33867238585182147
Epoch: 78, step: 363, loss: 0.3524208664894104, mean loss: 0.3386725075240987
Epoch: 78, step: 364, loss: 0.3081471025943756, mean loss: 0.3386722373806
Epoch: 78, step: 365, loss: 0.2917076349258423, mean loss: 0.3386718217572929
Epoch: 78, step: 366, loss: 0.299614816904068, mean loss: 0.33867147611702303
Epoch: 78, step: 367, loss: 0.3258196711540222, mean loss: 0.33867136238423573
Epoch: 78, step: 368, loss: 0.3310658931732178, mean loss: 0.3386712950797941
Epoch: 78, step: 369, loss: 0.3008766174316406, mean loss: 0.3386709606195399
Epoch: 78, step: 370, loss: 0.33874014019966125, mean loss: 0.3386709612317323
Epoch: 78, step: 371, loss: 0.3003673851490021, mean loss: 0.33867062227403094
Epoch: 78, step: 372, loss: 0.31311094760894775, mean loss: 0.33867039609222777
Epoch: 78, step: 373, loss: 0.3391485810279846, mean loss: 0.3386704003237282
Epoch: 78, step: 374, loss: 0.3439170718193054, mean loss: 0.3386704467515733
Epoch: 78, step: 375, loss: 0.37070316076278687, mean loss: 0.3386707302068509
Epoch: 78, step: 376, loss: 0.3160804212093353, mean loss: 0.3386705303085331
Epoch: 78, step: 377, loss: 0.36838939785957336, mean loss: 0.33867079328408883
Epoch: 78, step: 378, loss: 0.3423742949962616, mean loss: 0.3386708260552502
Epoch: 78, step: 379, loss: 0.34459537267684937, mean loss: 0.33867087847929916
Epoch: 78, step: 380, loss: 0.3232250511646271, mean loss: 0.3386707418062853
Epoch: 78, step: 381, loss: 0.3361809253692627, mean loss: 0.33867071977524105
Epoch: 78, step: 382, loss: 0.3178274929523468, mean loss: 0.338670535346388
Epoch: 78, step: 383, loss: 0.2961215078830719, mean loss: 0.3386701588596298
Epoch: 78, step: 384, loss: 0.34799638390541077, mean loss: 0.3386702413801802
Epoch: 78, step: 385, loss: 0.3683190941810608, mean loss: 0.33867050371762025
Epoch: 78, step: 386, loss: 0.35640037059783936, mean loss: 0.33867066059271983
Epoch: 78, step: 387, loss: 0.3114314079284668, mean loss: 0.3386704195800436
Epoch: 78, step: 388, loss: 0.3239428997039795, mean loss: 0.3386702892722258
Epoch: 78, step: 389, loss: 0.40390607714653015, mean loss: 0.3386708664677088
Epoch: 78, step: 390, loss: 0.29884541034698486, mean loss: 0.3386705141017645
Epoch: 78, step: 391, loss: 0.3241153955459595, mean loss: 0.3386703853227569
Epoch: 78, step: 392, loss: 0.3456515371799469, mean loss: 0.3386704470891967
Epoch: 78, step: 393, loss: 0.38800427317619324, mean loss: 0.33867088357129893
Epoch: 78, step: 394, loss: 0.342178612947464, mean loss: 0.3386709146057365
Epoch: 78, step: 395, loss: 0.3275264799594879, mean loss: 0.3386708160068526
Epoch: 78, step: 396, loss: 0.355162650346756, mean loss: 0.33867096191484386
Epoch: 78, step: 397, loss: 0.35316577553749084, mean loss: 0.3386710901534851
Epoch: 78, step: 398, loss: 0.36021074652671814, mean loss: 0.3386712807176345
Epoch: 78, step: 399, loss: 0.3251475989818573, mean loss: 0.3386711610729168
Epoch: 78, step: 400, loss: 0.3436495065689087, mean loss: 0.3386712051162094
Epoch: 78, step: 401, loss: 0.3520973324775696, mean loss: 0.3386713238957568
Epoch: 78, step: 402, loss: 0.3610754907131195, mean loss: 0.3386715221013287
Epoch: 78, step: 403, loss: 0.3270418643951416, mean loss: 0.3386714192167813
Epoch: 78, step: 404, loss: 0.32614725828170776, mean loss: 0.33867130841977733
Epoch: 78, step: 405, loss: 0.36720168590545654, mean loss: 0.3386715608161174
Epoch: 78, step: 406, loss: 0.33322787284851074, mean loss: 0.33867151265850837
Epoch: 78, step: 407, loss: 0.3193238079547882, mean loss: 0.33867134150046957
Epoch: 78, step: 408, loss: 0.3470025658607483, mean loss: 0.3386714152013777
Epoch: 78, step: 409, loss: 0.3223066031932831, mean loss: 0.33867127043383993
Epoch: 78, step: 410, loss: 0.3365156650543213, mean loss: 0.3386712513649424
Epoch: 78, step: 411, loss: 0.32539352774620056, mean loss: 0.3386711339086987
Epoch: 78, step: 412, loss: 0.34462061524391174, mean loss: 0.3386711865380174
Epoch: 78, step: 413, loss: 0.3379383981227875, mean loss: 0.338671180055803
Epoch: 78, step: 414, loss: 0.33442962169647217, mean loss: 0.3386711425354941
Epoch: 78, step: 415, loss: 0.3143920600414276, mean loss: 0.3386709277675858
Epoch: 78, step: 416, loss: 0.31414058804512024, mean loss: 0.3386707107790258
Epoch: 78, step: 417, loss: 0.3118530809879303, mean loss: 0.3386704735598326
Epoch: 78, step: 418, loss: 0.3200055956840515, mean loss: 0.338670308458437
Epoch: 78, step: 419, loss: 0.3246595561504364, mean loss: 0.33867018452650915
Epoch: 78, step: 420, loss: 0.3172885477542877, mean loss: 0.3386699953971913
Epoch: 78, step: 421, loss: 0.3509109318256378, mean loss: 0.33867010367232026
Epoch: 78, step: 422, loss: 0.347612202167511, mean loss: 0.33867018276743766
Epoch: 78, step: 423, loss: 0.31511178612709045, mean loss: 0.3386699743893185
Epoch: 78, step: 424, loss: 0.34857282042503357, mean loss: 0.33867006198094074
Epoch: 78, step: 425, loss: 0.3325973153114319, mean loss: 0.3386700082673896
Epoch: 78, step: 426, loss: 0.29188889265060425, mean loss: 0.3386695944912584
Epoch: 78, step: 427, loss: 0.3600071370601654, mean loss: 0.3386697832188594
Epoch: 78, step: 428, loss: 0.3126896321773529, mean loss: 0.3386695534300636
Epoch: 78, step: 429, loss: 0.3321630656719208, mean loss: 0.33866949588210093
Epoch: 78, step: 430, loss: 0.32462775707244873, mean loss: 0.3386693716881665
Epoch: 78, step: 431, loss: 0.32516223192214966, mean loss: 0.33866925222361755
Epoch: 78, step: 432, loss: 0.28275933861732483, mean loss: 0.3386687577300642
Epoch: 78, step: 433, loss: 0.3035828173160553, mean loss: 0.3386684474162615
Epoch: 78, step: 434, loss: 0.33112770318984985, mean loss: 0.3386683807235552
Epoch: 78, step: 435, loss: 0.37396040558815, mean loss: 0.3386686928545283
Epoch: 78, step: 436, loss: 0.2916404604911804, mean loss: 0.3386682769294528
Epoch: 78, step: 437, loss: 0.30728021264076233, mean loss: 0.33866799933093605
Epoch: 78, step: 438, loss: 0.31896108388900757, mean loss: 0.33866782504296267
Epoch: 78, step: 439, loss: 0.39519745111465454, mean loss: 0.33866832498659216
Epoch: 78, step: 440, loss: 0.3346385359764099, mean loss: 0.3386682893477658
Epoch: 78, step: 441, loss: 0.33400508761405945, mean loss: 0.33866824810750074
Epoch: 78, step: 442, loss: 0.3341215252876282, mean loss: 0.3386682078977035
Epoch: 78, step: 443, loss: 0.4060969352722168, mean loss: 0.3386688042110448
Epoch: 78, step: 444, loss: 0.34410926699638367, mean loss: 0.3386688523239483
Epoch: 78, step: 445, loss: 0.3406648635864258, mean loss: 0.33866886997558043
Epoch: 78, step: 446, loss: 0.3364998400211334, mean loss: 0.3386688507940352
Epoch: 78, step: 447, loss: 0.3408011794090271, mean loss: 0.33866886965084997
Epoch: 78, step: 448, loss: 0.33354419469833374, mean loss: 0.3386688243322292
Epoch: 78, step: 449, loss: 0.3848221004009247, mean loss: 0.3386692324721283
Epoch: 78, step: 450, loss: 0.30190151929855347, mean loss: 0.3386689073329547
Epoch: 78, step: 451, loss: 0.32055747509002686, mean loss: 0.3386687471738496
Epoch: 78, step: 452, loss: 0.3357049524784088, mean loss: 0.3386687209652924
Epoch: 78, step: 453, loss: 0.32159796357154846, mean loss: 0.33866857001152806
Epoch: 78, step: 454, loss: 0.33551040291786194, mean loss: 0.3386685420846479
Epoch: 78, step: 455, loss: 0.37006378173828125, mean loss: 0.33866881970242924
Epoch: 78, step: 456, loss: 0.33765846490859985, mean loss: 0.338668810768273
Epoch: 78, step: 457, loss: 0.3816831111907959, mean loss: 0.3386691911228616
Epoch: 78, step: 458, loss: 0.36219149827957153, mean loss: 0.3386693991173718
Epoch: 78, step: 459, loss: 0.30359452962875366, mean loss: 0.3386690889728038
Epoch: 78, step: 460, loss: 0.3380292057991028, mean loss: 0.33866908331477746
Epoch: 78, step: 461, loss: 0.32000166177749634, mean loss: 0.33866891825366424
Epoch: 78, step: 462, loss: 0.3359471261501312, mean loss: 0.3386688941872413
Epoch: 78, step: 463, loss: 0.34213387966156006, mean loss: 0.33866892482480115
Epoch: 78, step: 464, loss: 0.37687888741493225, mean loss: 0.33866926267604913
Epoch: 78, step: 465, loss: 0.3367067873477936, mean loss: 0.33866924532405945
Epoch: 78, step: 466, loss: 0.2964201867580414, mean loss: 0.3386688717658621
Epoch: 78, step: 467, loss: 0.378291517496109, mean loss: 0.3386692220987156
Epoch: 78, step: 468, loss: 0.35627955198287964, mean loss: 0.3386693778031734
Epoch: 78, step: 469, loss: 0.33573195338249207, mean loss: 0.3386693518317103
Epoch: 78, step: 470, loss: 0.31020647287368774, mean loss: 0.3386691001772099
Epoch: 78, step: 471, loss: 0.3194473683834076, mean loss: 0.3386689302298005
Epoch: 78, step: 472, loss: 0.31683504581451416, mean loss: 0.3386687371889587
Epoch: 78, step: 473, loss: 0.35286813974380493, mean loss: 0.33866886272962454
Epoch: 78, step: 474, loss: 0.30634453892707825, mean loss: 0.3386685769442726
Epoch: 78, step: 475, loss: 0.33427977561950684, mean loss: 0.33866853814240777
Epoch: 78, step: 476, loss: 0.335903137922287, mean loss: 0.338668513693423
Epoch: 78, step: 477, loss: 0.29003390669822693, mean loss: 0.3386680837172317
Epoch: 78, step: 478, loss: 0.39175304770469666, mean loss: 0.33866855303466314
Epoch: 78, step: 479, loss: 0.36842766404151917, mean loss: 0.33866881612886185
Epoch: 78, step: 480, loss: 0.3344459533691406, mean loss: 0.3386687787957281
Epoch: 78, step: 481, loss: 0.3495800197124481, mean loss: 0.3386688752580662
Epoch: 78, step: 482, loss: 0.31504133343696594, mean loss: 0.3386686663773535
Epoch: 78, step: 483, loss: 0.30279430747032166, mean loss: 0.3386683492307172
Epoch: 78, step: 484, loss: 0.33495500683784485, mean loss: 0.33866831640326955
Epoch: 78, step: 485, loss: 0.30386078357696533, mean loss: 0.338668008693331
Epoch: 78, step: 486, loss: 0.3194746971130371, mean loss: 0.338667839019699
Epoch: 78, step: 487, loss: 0.36804622411727905, mean loss: 0.3386680987296097
Epoch: 78, step: 488, loss: 0.3532097637653351, mean loss: 0.3386682272792604
Epoch: 78, step: 489, loss: 0.29815566539764404, mean loss: 0.338667869147669
Epoch: 78, step: 490, loss: 0.3708275556564331, mean loss: 0.33866815343721673
Epoch: 78, step: 491, loss: 0.3212287127971649, mean loss: 0.33866799927505276
Epoch: 78, step: 492, loss: 0.3063533306121826, mean loss: 0.3386677136205231
Epoch: 78, step: 493, loss: 0.2950180470943451, mean loss: 0.33866732777052816
Epoch: 78, step: 494, loss: 0.3321129381656647, mean loss: 0.33866726983219686
Epoch: 78, step: 495, loss: 0.3405955731868744, mean loss: 0.33866728687752035
Epoch: 78, step: 496, loss: 0.3022419512271881, mean loss: 0.33866696489698794
Epoch: 78, step: 497, loss: 0.31395044922828674, mean loss: 0.3386667464181082
Epoch: 78, step: 498, loss: 0.32737264037132263, mean loss: 0.3386666465860016
Epoch: 78, step: 499, loss: 0.35778194665908813, mean loss: 0.3386668155505746
Epoch: 78, step: 500, loss: 0.32028448581695557, mean loss: 0.33866665306633276
Epoch: 78, step: 501, loss: 0.3163685202598572, mean loss: 0.338666455971447
Epoch: 78, step: 502, loss: 0.34040191769599915, mean loss: 0.33866647131118915
Epoch: 78, step: 503, loss: 0.33588629961013794, mean loss: 0.3386664467374752
Epoch: 78, step: 504, loss: 0.3463291823863983, mean loss: 0.3386665144671803
Epoch: 78, step: 505, loss: 0.3325006365776062, mean loss: 0.33866645996844524
Epoch: 78, step: 506, loss: 0.29645708203315735, mean loss: 0.338666086893043
Epoch: 78, step: 507, loss: 0.31019705533981323, mean loss: 0.33866583526646044
Epoch: 78, step: 508, loss: 0.3345077335834503, mean loss: 0.3386657985149585
Epoch: 78, step: 509, loss: 0.2956039011478424, mean loss: 0.3386654179144974
Epoch: 78, step: 510, loss: 0.3198093771934509, mean loss: 0.33866525125778224
Epoch: 78, step: 511, loss: 0.3099440932273865, mean loss: 0.3386649974117274
Epoch: 78, step: 512, loss: 0.33001503348350525, mean loss: 0.33866492096147394
Epoch: 78, step: 513, loss: 0.35127711296081543, mean loss: 0.33866503242977153
Epoch: 78, step: 514, loss: 0.30613550543785095, mean loss: 0.33866474493185295
Epoch: 78, step: 515, loss: 0.3262653946876526, mean loss: 0.3386646353466173
Epoch: 78, step: 516, loss: 0.30638056993484497, mean loss: 0.3386643500231464
Epoch: 78, step: 517, loss: 0.28337186574935913, mean loss: 0.3386638613577971
Epoch: 78, step: 518, loss: 0.3533729910850525, mean loss: 0.33866399135337577
Epoch: 78, step: 519, loss: 0.3536766767501831, mean loss: 0.33866412403053037
Epoch: 78, step: 520, loss: 0.28914472460746765, mean loss: 0.338663686398303
Epoch: 78, step: 521, loss: 0.3437296152114868, mean loss: 0.33866373116851717
Epoch: 78, step: 522, loss: 0.315496027469635, mean loss: 0.3386635264254329
Epoch: 78, step: 523, loss: 0.3102395832538605, mean loss: 0.33866327523289186
Epoch: 78, step: 524, loss: 0.323274701833725, mean loss: 0.3386631392397726
Epoch: 78, step: 525, loss: 0.3583522140979767, mean loss: 0.3386633132360862
Epoch: 78, step: 526, loss: 0.3311518728733063, mean loss: 0.33866324685656396
Epoch: 78, step: 527, loss: 0.31955206394195557, mean loss: 0.3386630779701826
Epoch: 78, step: 528, loss: 0.3295208811759949, mean loss: 0.33866299718089304
Epoch: 78, step: 529, loss: 0.374224454164505, mean loss: 0.33866331143353073
Epoch: 78, step: 530, loss: 0.317085862159729, mean loss: 0.3386631207576979
Epoch: 78, step: 531, loss: 0.343851238489151, mean loss: 0.3386631666037066
Epoch: 78, step: 532, loss: 0.3110556900501251, mean loss: 0.33866292264597625
Epoch: 78, step: 533, loss: 0.3360036015510559, mean loss: 0.33866289914668235
Epoch: 78, step: 534, loss: 0.3550787568092346, mean loss: 0.33866304420538024
Epoch: 78, step: 535, loss: 0.3527648448944092, mean loss: 0.33866316881481656
Epoch: 78, step: 536, loss: 0.37698543071746826, mean loss: 0.3386635074434331
Epoch: 78, step: 537, loss: 0.3170955181121826, mean loss: 0.33866331686298484
Epoch: 78, step: 538, loss: 0.30331751704216003, mean loss: 0.3386630045409251
Epoch: 78, step: 539, loss: 0.3418618440628052, mean loss: 0.3386630328062162
Epoch: 78, step: 540, loss: 0.35520556569099426, mean loss: 0.33866317897652964
Epoch: 78, step: 541, loss: 0.30338194966316223, mean loss: 0.3386628672332908
Epoch: 78, step: 542, loss: 0.3318912088871002, mean loss: 0.3386628073997733
Epoch: 78, step: 543, loss: 0.3655661344528198, mean loss: 0.3386630451120714
Epoch: 78, step: 544, loss: 0.31242692470550537, mean loss: 0.33866281329712306
Epoch: 78, step: 545, loss: 0.35436490178108215, mean loss: 0.33866295203511526
Epoch: 78, step: 546, loss: 0.3508606255054474, mean loss: 0.3386630598084078
Epoch: 78, step: 547, loss: 0.34159162640571594, mean loss: 0.33866308568370906
Epoch: 78, step: 548, loss: 0.34764227271080017, mean loss: 0.33866316501846516
Epoch: 78, step: 549, loss: 0.31595855951309204, mean loss: 0.3386629644158472
Epoch: 78, step: 550, loss: 0.33523261547088623, mean loss: 0.33866293410785975
Epoch: 78, step: 551, loss: 0.32144445180892944, mean loss: 0.33866278197962346
Epoch: 78, step: 552, loss: 0.35323846340179443, mean loss: 0.33866291075712424
Epoch: 78, step: 553, loss: 0.35117366909980774, mean loss: 0.338663021289861
Epoch: 78, step: 554, loss: 0.2874574363231659, mean loss: 0.33866256889175017
Epoch: 78, step: 555, loss: 0.3118111491203308, mean loss: 0.3386623316632474
Epoch: 78, step: 556, loss: 0.30323272943496704, mean loss: 0.3386620186504791
Epoch: 78, step: 557, loss: 0.3133576810359955, mean loss: 0.338661795094179
Epoch: 78, step: 558, loss: 0.3706749379634857, mean loss: 0.33866207791828046
Epoch: 78, step: 559, loss: 0.30799075961112976, mean loss: 0.3386618069510893
Epoch: 78, step: 560, loss: 0.35072076320648193, mean loss: 0.3386619134855592
Epoch: 78, step: 561, loss: 0.29904741048812866, mean loss: 0.33866156351556964
Epoch: 78, step: 562, loss: 0.3446562886238098, mean loss: 0.33866161647484444
Epoch: 78, step: 563, loss: 0.3486756682395935, mean loss: 0.3386617049413253
Epoch: 78, step: 564, loss: 0.32886531949043274, mean loss: 0.33866161839852427
Epoch: 78, step: 565, loss: 0.30902814865112305, mean loss: 0.338661356614131
Epoch: 78, step: 566, loss: 0.32223832607269287, mean loss: 0.33866121153307427
Epoch: 78, step: 567, loss: 0.35220953822135925, mean loss: 0.338661331217939
Epoch: 78, step: 568, loss: 0.3488028347492218, mean loss: 0.3386614208064014
Epoch: 78, step: 569, loss: 0.33053237199783325, mean loss: 0.33866134899628486
Epoch: 78, step: 570, loss: 0.3264033794403076, mean loss: 0.3386612407132044
Epoch: 78, step: 571, loss: 0.34470266103744507, mean loss: 0.3386612940807561
Epoch: 78, step: 572, loss: 0.3207583427429199, mean loss: 0.338661135934461
Epoch: 78, step: 573, loss: 0.28914451599121094, mean loss: 0.3386606985316737
Epoch: 78, step: 574, loss: 0.31114283204078674, mean loss: 0.3386604554560115
Epoch: 78, step: 575, loss: 0.3009812831878662, mean loss: 0.33866012262465445
Epoch: 78, step: 576, loss: 0.3094629943370819, mean loss: 0.3386598647199977
Epoch: 78, step: 577, loss: 0.33058714866638184, mean loss: 0.33865979341255087
Epoch: 78, step: 578, loss: 0.3386143147945404, mean loss: 0.3386597930108353
Epoch: 78, step: 579, loss: 0.3032134473323822, mean loss: 0.33865947991376366
Epoch: 78, step: 580, loss: 0.31407272815704346, mean loss: 0.3386592627412503
Epoch: 78, step: 581, loss: 0.3080606162548065, mean loss: 0.33865899246861186
Epoch: 78, step: 582, loss: 0.3143637478351593, mean loss: 0.338658777874745
Epoch: 78, step: 583, loss: 0.315206378698349, mean loss: 0.3386585707273526
Epoch: 78, step: 584, loss: 0.3218075633049011, mean loss: 0.338658421889215
Epoch: 78, step: 585, loss: 0.32933393120765686, mean loss: 0.33865833953048513
Epoch: 78, step: 586, loss: 0.3267552852630615, mean loss: 0.33865823439747506
Epoch: 78, step: 587, loss: 0.3524729311466217, mean loss: 0.33865835641387454
Epoch: 78, step: 588, loss: 0.3525451123714447, mean loss: 0.3386584790656437
Epoch: 78, step: 589, loss: 0.3215460479259491, mean loss: 0.33865832792513095
Epoch: 78, step: 590, loss: 0.3381548523902893, mean loss: 0.3386583234783707
Epoch: 78, step: 591, loss: 0.3348088264465332, mean loss: 0.33865828947942145
Epoch: 78, step: 592, loss: 0.32145100831985474, mean loss: 0.3386581375052006
Epoch: 78, step: 593, loss: 0.3381563127040863, mean loss: 0.33865813307313725
Epoch: 78, step: 594, loss: 0.35535451769828796, mean loss: 0.33865828053252967
Epoch: 78, step: 595, loss: 0.3249855935573578, mean loss: 0.3386581597789442
Epoch: 78, step: 596, loss: 0.3221907615661621, mean loss: 0.3386580143444865
Epoch: 78, step: 597, loss: 0.33931073546409607, mean loss: 0.33865802010904644
Epoch: 78, step: 598, loss: 0.3416271507740021, mean loss: 0.338658046330935
Epoch: 78, step: 599, loss: 0.3032519221305847, mean loss: 0.3386577336443782
Epoch: 78, step: 600, loss: 0.35381603240966797, mean loss: 0.3386578675125859
Epoch: 78, step: 601, loss: 0.28189846873283386, mean loss: 0.3386573662550239
Epoch: 78, step: 602, loss: 0.31840428709983826, mean loss: 0.338657187396198
Epoch: 78, step: 603, loss: 0.3452165424823761, mean loss: 0.3386572453226091
Epoch: 78, step: 604, loss: 0.32850247621536255, mean loss: 0.33865715564547966
Epoch: 78, step: 605, loss: 0.38873329758644104, mean loss: 0.3386575978657762
Epoch: 78, step: 606, loss: 0.3185041546821594, mean loss: 0.33865741989314146
Epoch: 78, step: 607, loss: 0.3204520046710968, mean loss: 0.3386572591247273
Epoch: 78, step: 608, loss: 0.3115566074848175, mean loss: 0.3386570198063564
Epoch: 78, step: 609, loss: 0.3395252227783203, mean loss: 0.33865702747314935
Epoch: 78, step: 610, loss: 0.33350521326065063, mean loss: 0.3386569819797042
Epoch: 78, step: 611, loss: 0.30375540256500244, mean loss: 0.3386566737816591
Epoch: 78, step: 612, loss: 0.344584196805954, mean loss: 0.33865672612412917
Epoch: 78, step: 613, loss: 0.30394965410232544, mean loss: 0.3386564196490923
Epoch: 78, step: 614, loss: 0.31223395466804504, mean loss: 0.33865618633196265
Epoch: 78, step: 615, loss: 0.35437101125717163, mean loss: 0.3386563250966642
Epoch: 78, step: 616, loss: 0.307849258184433, mean loss: 0.3386560530671813
Epoch: 78, step: 617, loss: 0.3488115072250366, mean loss: 0.33865614274006567
Epoch: 78, step: 618, loss: 0.295287549495697, mean loss: 0.3386557597978114
Epoch: 78, step: 619, loss: 0.3280486464500427, mean loss: 0.3386556661384204
Epoch: 78, step: 620, loss: 0.34897932410240173, mean loss: 0.3386557572941334
Epoch: 78, step: 621, loss: 0.3655175268650055, mean loss: 0.3386559944757744
Epoch: 78, step: 622, loss: 0.33383357524871826, mean loss: 0.33865595189558606
Epoch: 78, step: 623, loss: 0.3332058787345886, mean loss: 0.3386559037738692
Epoch: 78, step: 624, loss: 0.3205476999282837, mean loss: 0.3386557438879121
Epoch: 78, step: 625, loss: 0.3595837354660034, mean loss: 0.3386559286694867
Epoch: 78, step: 626, loss: 0.2980034351348877, mean loss: 0.3386555697355959
Epoch: 78, step: 627, loss: 0.31896960735321045, mean loss: 0.33865539592346117
Epoch: 78, step: 628, loss: 0.32990193367004395, mean loss: 0.33865531863770304
Epoch: 78, step: 629, loss: 0.37390729784965515, mean loss: 0.3386556298804783
Epoch: 78, step: 630, loss: 0.3162885904312134, mean loss: 0.3386554324016949
Epoch: 78, step: 631, loss: 0.3025597929954529, mean loss: 0.33865511371579815
Epoch: 78, step: 632, loss: 0.34829655289649963, mean loss: 0.3386551988386444
Epoch: 78, step: 633, loss: 0.34892863035202026, mean loss: 0.3386552895404571
Epoch: 78, step: 634, loss: 0.32532674074172974, mean loss: 0.33865517186674104
Epoch: 78, step: 635, loss: 0.297269344329834, mean loss: 0.3386548064870439
Epoch: 78, step: 636, loss: 0.3101913332939148, mean loss: 0.33865455519610643
Epoch: 78, step: 637, loss: 0.30625206232070923, mean loss: 0.3386542691318981
Epoch: 78, step: 638, loss: 0.30935147404670715, mean loss: 0.33865401043554083
Epoch: 78, step: 639, loss: 0.3396257162094116, mean loss: 0.3386540190140578
Epoch: 78, step: 640, loss: 0.3205442428588867, mean loss: 0.3386538591368041
Epoch: 78, step: 641, loss: 0.35330983996391296, mean loss: 0.338653988522019
Epoch: 78, step: 642, loss: 0.3707841634750366, mean loss: 0.33865427216955774
Epoch: 78, step: 643, loss: 0.4032481908798218, mean loss: 0.33865484240437105
Epoch: 78, step: 644, loss: 0.3416273593902588, mean loss: 0.3386548686455055
Epoch: 78, step: 645, loss: 0.3306945562362671, mean loss: 0.3386547983731454
Epoch: 78, step: 646, loss: 0.3683132827281952, mean loss: 0.33865506019117303
Epoch: 78, step: 647, loss: 0.34839797019958496, mean loss: 0.33865514619850007
Epoch: 78, step: 648, loss: 0.35656481981277466, mean loss: 0.33865530429803675
Epoch: 78, step: 649, loss: 0.29412901401519775, mean loss: 0.33865491124097313
Epoch: 78, step: 650, loss: 0.3195330798625946, mean loss: 0.3386547424439658
Epoch: 78, step: 651, loss: 0.3148728609085083, mean loss: 0.33865453251245264
Epoch: 78, step: 652, loss: 0.32712262868881226, mean loss: 0.3386544307169473
Epoch: 78, step: 653, loss: 0.3422921299934387, mean loss: 0.3386544628277048
Epoch: 78, step: 654, loss: 0.29555124044418335, mean loss: 0.3386540823496059
Epoch: 78, step: 655, loss: 0.2894364297389984, mean loss: 0.33865364790242164
Epoch: 78, step: 656, loss: 0.30792298913002014, mean loss: 0.33865337664344
Epoch: 78, step: 657, loss: 0.3076573610305786, mean loss: 0.33865310304457324
Epoch: 78, step: 658, loss: 0.3339990973472595, mean loss: 0.3386530619644725
Epoch: 78, step: 659, loss: 0.3378855884075165, mean loss: 0.33865305519017636
Epoch: 78, step: 660, loss: 0.4101763367652893, mean loss: 0.3386536865026279
Epoch: 78, step: 661, loss: 0.3368425667285919, mean loss: 0.3386536705166112
Epoch: 78, step: 662, loss: 0.31807446479797363, mean loss: 0.3386534888739463
Epoch: 78, step: 663, loss: 0.30921101570129395, mean loss: 0.3386532290018134
Epoch: 78, step: 664, loss: 0.37387019395828247, mean loss: 0.33865353983939034
Epoch: 78, step: 665, loss: 0.29367178678512573, mean loss: 0.33865314281779196
Epoch: 78, step: 666, loss: 0.3640271723270416, mean loss: 0.3386533667741332
Epoch: 78, step: 667, loss: 0.36791738867759705, mean loss: 0.3386536250620582
Epoch: 78, step: 668, loss: 0.33166131377220154, mean loss: 0.3386535633475871
Epoch: 78, step: 669, loss: 0.3413425087928772, mean loss: 0.3386535870801377
Epoch: 78, step: 670, loss: 0.33034253120422363, mean loss: 0.3386535137276592
Epoch: 78, step: 671, loss: 0.30680719017982483, mean loss: 0.33865323265793923
Epoch: 78, step: 672, loss: 0.32908740639686584, mean loss: 0.3386531482324835
Epoch: 78, step: 673, loss: 0.34324178099632263, mean loss: 0.33865318873018674
Epoch: 78, step: 674, loss: 0.33209994435310364, mean loss: 0.33865313089400384
Epoch: 78, step: 675, loss: 0.34163039922714233, mean loss: 0.33865315716989197
Epoch: 78, step: 676, loss: 0.3592613935470581, mean loss: 0.3386533390463217
Epoch: 78, step: 677, loss: 0.3335414528846741, mean loss: 0.3386532939321556
Epoch: 78, step: 678, loss: 0.3330494165420532, mean loss: 0.3386532444764329
Epoch: 78, step: 679, loss: 0.33805951476097107, mean loss: 0.33865323923665497
Epoch: 78, step: 680, loss: 0.3758571445941925, mean loss: 0.3386535675653142
Epoch: 78, step: 681, loss: 0.3040454387664795, mean loss: 0.3386532621473711
Epoch: 78, step: 682, loss: 0.3342362940311432, mean loss: 0.33865322316781754
Epoch: 78, step: 683, loss: 0.31240278482437134, mean loss: 0.33865299151087286
Epoch: 78, step: 684, loss: 0.3201668858528137, mean loss: 0.3386528283746651
Epoch: 78, step: 685, loss: 0.33273231983184814, mean loss: 0.33865277612781514
Epoch: 78, step: 686, loss: 0.33051228523254395, mean loss: 0.338652704290869
Epoch: 78, step: 687, loss: 0.299115926027298, mean loss: 0.3386523553958967
Epoch: 78, step: 688, loss: 0.3799314498901367, mean loss: 0.3386527196628419
Epoch: 78, step: 689, loss: 0.3634035885334015, mean loss: 0.33865293807470254
Epoch: 78, step: 690, loss: 0.3436148166656494, mean loss: 0.3386529818599764
Epoch: 78, step: 691, loss: 0.3636869788169861, mean loss: 0.3386532027663771
Epoch: 78, step: 692, loss: 0.3197002410888672, mean loss: 0.33865303552206494
Epoch: 78, step: 693, loss: 0.3089946210384369, mean loss: 0.33865277381323833
Epoch: 78, step: 694, loss: 0.33241045475006104, mean loss: 0.3386527187308743
Epoch: 78, step: 695, loss: 0.34503173828125, mean loss: 0.33865277501898977
Epoch: 78, step: 696, loss: 0.30549103021621704, mean loss: 0.33865248240417095
Epoch: 78, step: 697, loss: 0.332803338766098, mean loss: 0.338652430792562
Epoch: 78, step: 698, loss: 0.31554117798805237, mean loss: 0.33865222686554464
Epoch: 78, step: 699, loss: 0.36409640312194824, mean loss: 0.3386524513756235
Epoch: 78, step: 700, loss: 0.32457613945007324, mean loss: 0.33865232717250593
Epoch: 78, step: 701, loss: 0.2855442762374878, mean loss: 0.33865185857481295
Epoch: 78, step: 702, loss: 0.2850039601325989, mean loss: 0.3386513852179643
Epoch: 78, step: 703, loss: 0.3087894320487976, mean loss: 0.33865112173634176
Epoch: 78, step: 704, loss: 0.30900833010673523, mean loss: 0.33865086019075974
Epoch: 78, step: 705, loss: 0.3316437602043152, mean loss: 0.33865079836595263
Epoch: 78, step: 706, loss: 0.31166014075279236, mean loss: 0.3386505602249984
Epoch: 78, step: 707, loss: 0.33369579911231995, mean loss: 0.3386505165090895
Epoch: 78, step: 708, loss: 0.33111414313316345, mean loss: 0.33865045001617544
Epoch: 78, step: 709, loss: 0.36525362730026245, mean loss: 0.33865068473214377
Epoch: 78, step: 710, loss: 0.3236069083213806, mean loss: 0.33865055200426103
Epoch: 78, step: 711, loss: 0.3727203905582428, mean loss: 0.33865085259219296
Epoch: 78, step: 712, loss: 0.30012592673301697, mean loss: 0.3386505127013653
Epoch: 78, step: 713, loss: 0.3843519389629364, mean loss: 0.3386509159041802
Epoch: 78, step: 714, loss: 0.3626459836959839, mean loss: 0.3386511275998386
Epoch: 78, step: 715, loss: 0.34941554069519043, mean loss: 0.3386512225676642
Epoch: 78, step: 716, loss: 0.31019705533981323, mean loss: 0.33865097153618423
Epoch: 78, step: 717, loss: 0.3539935350418091, mean loss: 0.3386511068918393
Epoch: 78, step: 718, loss: 0.28824400901794434, mean loss: 0.3386506621926494
Epoch: 78, step: 719, loss: 0.29880431294441223, mean loss: 0.3386503106651135
Epoch: 78, step: 720, loss: 0.3386441767215729, mean loss: 0.3386503106109998
Epoch: 78, step: 721, loss: 0.32914814352989197, mean loss: 0.33865022678363527
Epoch: 78, step: 722, loss: 0.3317146897315979, mean loss: 0.3386501655994171
Epoch: 78, step: 723, loss: 0.32684382796287537, mean loss: 0.33865006144668025
Epoch: 78, step: 724, loss: 0.3247923254966736, mean loss: 0.3386499391980679
Epoch: 78, step: 725, loss: 0.32905080914497375, mean loss: 0.3386498545182919
Epoch: 78, step: 726, loss: 0.3143729269504547, mean loss: 0.33864964035860834
Epoch: 78, step: 727, loss: 0.28840193152427673, mean loss: 0.3386491971007675
Epoch: 78, step: 728, loss: 0.34780609607696533, mean loss: 0.338649277877216
Epoch: 78, step: 729, loss: 0.2911401391029358, mean loss: 0.3386488587849384
Epoch: 78, step: 730, loss: 0.36738091707229614, mean loss: 0.33864911223675503
Epoch: 78, step: 731, loss: 0.3332535922527313, mean loss: 0.3386490646421043
Epoch: 78, step: 732, loss: 0.2796649634838104, mean loss: 0.33864854433953157
Epoch: 78, step: 733, loss: 0.32843834161758423, mean loss: 0.3386484542754672
Epoch: 78, step: 734, loss: 0.3053430914878845, mean loss: 0.33864816049189006
Epoch: 78, step: 735, loss: 0.3100427985191345, mean loss: 0.3386479081688185
Epoch: 78, step: 736, loss: 0.3850775957107544, mean loss: 0.33864831771364595
Epoch: 78, step: 737, loss: 0.3608979880809784, mean loss: 0.3386485139707719
Epoch: 78, step: 738, loss: 0.35135066509246826, mean loss: 0.3386486260113389
Epoch: 78, step: 739, loss: 0.3008574843406677, mean loss: 0.33864829267381574
Epoch: 78, step: 740, loss: 0.30651387572288513, mean loss: 0.3386480092340466
Epoch: 78, step: 741, loss: 0.3230448365211487, mean loss: 0.33864787160837656
Epoch: 78, step: 742, loss: 0.29352423548698425, mean loss: 0.3386474736049709
Epoch: 78, step: 743, loss: 0.3254401981830597, mean loss: 0.33864735711404315
Epoch: 78, step: 744, loss: 0.3176230788230896, mean loss: 0.338647171677153
Epoch: 78, step: 745, loss: 0.31752896308898926, mean loss: 0.33864698541342825
Epoch: 78, step: 746, loss: 0.30465778708457947, mean loss: 0.3386466856295324
Epoch: 78, step: 747, loss: 0.3358406722545624, mean loss: 0.3386466608807815
Epoch: 78, step: 748, loss: 0.3389984369277954, mean loss: 0.3386466639833829
Epoch: 78, step: 749, loss: 0.30103057622909546, mean loss: 0.33864633221918966
Epoch: 78, step: 750, loss: 0.3453918695449829, mean loss: 0.33864639171256455
Epoch: 78, step: 751, loss: 0.3143578767776489, mean loss: 0.3386461774979052
Epoch: 78, step: 752, loss: 0.3566683828830719, mean loss: 0.3386463364449034
Epoch: 78, step: 753, loss: 0.3370510935783386, mean loss: 0.338646322375769
Epoch: 78, step: 754, loss: 0.3849073648452759, mean loss: 0.33864673036824144
Epoch: 78, step: 755, loss: 0.3361029624938965, mean loss: 0.338646707934052
Epoch: 78, step: 756, loss: 0.3853469789028168, mean loss: 0.338647119792971
Epoch: 78, step: 757, loss: 0.34008195996284485, mean loss: 0.33864713244699846
Epoch: 78, step: 758, loss: 0.30727049708366394, mean loss: 0.338646855735131
Epoch: 78, step: 759, loss: 0.33250173926353455, mean loss: 0.3386468015415682
Epoch: 78, step: 760, loss: 0.34473279118537903, mean loss: 0.33864685521322024
Epoch: 78, step: 761, loss: 0.36325499415397644, mean loss: 0.33864707222769136
Epoch: 78, step: 762, loss: 0.3279014527797699, mean loss: 0.3386469774649642
Epoch: 78, step: 763, loss: 0.37133538722991943, mean loss: 0.3386472657327141
Epoch: 78, step: 764, loss: 0.3372335433959961, mean loss: 0.338647253265697
Epoch: 78, step: 765, loss: 0.3269463777542114, mean loss: 0.33864715008155344
Epoch: 78, step: 766, loss: 0.4345718026161194, mean loss: 0.3386479959854197
Epoch: 78, step: 767, loss: 0.37178072333335876, mean loss: 0.3386482881611459
Epoch: 78, step: 768, loss: 0.33621659874916077, mean loss: 0.33864826671786574
Epoch: 78, step: 769, loss: 0.35941648483276367, mean loss: 0.338648449855889
Epoch: 78, step: 770, loss: 0.3130526840686798, mean loss: 0.3386482241496397
Epoch: 78, step: 771, loss: 0.3135926127433777, mean loss: 0.3386480032084788
Epoch: 78, step: 772, loss: 0.30862313508987427, mean loss: 0.3386477384505923
Epoch: 78, step: 773, loss: 0.34023165702819824, mean loss: 0.3386477524173893
Epoch: 78, step: 774, loss: 0.28846797347068787, mean loss: 0.33864730994224274
Epoch: 78, step: 775, loss: 0.3193499743938446, mean loss: 0.3386471397837394
Epoch: 78, step: 776, loss: 0.29737356305122375, mean loss: 0.3386467758481017
Epoch: 78, step: 777, loss: 0.35576263070106506, mean loss: 0.33864692676825736
Epoch: 78, step: 778, loss: 0.38766011595726013, mean loss: 0.338647358941408
Epoch: 78, step: 779, loss: 0.30059635639190674, mean loss: 0.3386470234301522
Epoch: 78, step: 780, loss: 0.33788615465164185, mean loss: 0.33864701672132
Epoch: 78, step: 781, loss: 0.32962697744369507, mean loss: 0.33864693718934624
Epoch: 78, step: 782, loss: 0.3214319944381714, mean loss: 0.33864678540216864
Epoch: 78, step: 783, loss: 0.30027082562446594, mean loss: 0.33864644703756597
Epoch: 78, step: 784, loss: 0.3298400938510895, mean loss: 0.3386463693917705
Epoch: 78, step: 785, loss: 0.3292451798915863, mean loss: 0.33864628650202194
Epoch: 78, step: 786, loss: 0.32626238465309143, mean loss: 0.33864617731483243
Epoch: 78, step: 787, loss: 0.3185887336730957, mean loss: 0.33864600047262083
Epoch: 78, step: 788, loss: 0.3466191291809082, mean loss: 0.33864607076937986
Epoch: 78, step: 789, loss: 0.30041858553886414, mean loss: 0.33864573373172197
Epoch: 78, step: 790, loss: 0.31181177496910095, mean loss: 0.33864549714867653
Epoch: 78, step: 791, loss: 0.32688429951667786, mean loss: 0.3386453934563572
Epoch: 78, step: 792, loss: 0.3747808039188385, mean loss: 0.33864571204053584
Epoch: 78, step: 793, loss: 0.3121531307697296, mean loss: 0.33864547847344123
Epoch: 78, step: 794, loss: 0.32203638553619385, mean loss: 0.3386453320436411
Epoch: 78, step: 795, loss: 0.2933499217033386, mean loss: 0.3386449327118153
Epoch: 78, step: 796, loss: 0.3513602912425995, mean loss: 0.3386450448115299
Epoch: 78, step: 797, loss: 0.3343771696090698, mean loss: 0.33864500718589996
Epoch: 78, step: 798, loss: 0.3139130175113678, mean loss: 0.338644789150357
Epoch: 78, step: 799, loss: 0.3413800299167633, mean loss: 0.33864481326384144
Epoch: 78, step: 800, loss: 0.31739452481269836, mean loss: 0.33864462592604333
Epoch: 78, step: 801, loss: 0.35715433955192566, mean loss: 0.33864478910210716
Epoch: 78, step: 802, loss: 0.34831348061561584, mean loss: 0.3386448743376298
Epoch: 78, step: 803, loss: 0.3437647819519043, mean loss: 0.33864491947239844
Epoch: 78, step: 804, loss: 0.30142807960510254, mean loss: 0.3386445913886174
Epoch: 78, step: 805, loss: 0.33406323194503784, mean loss: 0.3386445510021557
Epoch: 78, step: 806, loss: 0.34829241037368774, mean loss: 0.338644636051031
Epoch: 78, step: 807, loss: 0.3397274613380432, mean loss: 0.3386446455963879
Epoch: 78, step: 808, loss: 0.3103799521923065, mean loss: 0.3386443964387341
Epoch: 78, step: 809, loss: 0.31044894456863403, mean loss: 0.33864414789364616
Epoch: 78, step: 810, loss: 0.30765238404273987, mean loss: 0.3386438747012601
Epoch: 78, step: 811, loss: 0.38431814312934875, mean loss: 0.33864427731636915
Epoch: 78, step: 812, loss: 0.31634852290153503, mean loss: 0.3386440807827677
Epoch: 78, step: 813, loss: 0.2943805456161499, mean loss: 0.3386436906100409
Epoch: 78, step: 814, loss: 0.3344587981700897, mean loss: 0.3386436537215164
Epoch: 78, step: 815, loss: 0.32498228549957275, mean loss: 0.3386435333018684
Epoch: 78, step: 816, loss: 0.31259745359420776, mean loss: 0.3386433037178288
Epoch: 78, step: 817, loss: 0.3777807056903839, mean loss: 0.338643648692725
Epoch: 78, step: 818, loss: 0.31745126843452454, mean loss: 0.3386434618950744
Epoch: 78, step: 819, loss: 0.3304160535335541, mean loss: 0.33864338937622623
Epoch: 78, step: 820, loss: 0.27882203459739685, mean loss: 0.33864286209748723
Epoch: 78, step: 821, loss: 0.31728431582450867, mean loss: 0.33864267384016467
Epoch: 78, step: 822, loss: 0.33690622448921204, mean loss: 0.3386426585349833
Epoch: 78, step: 823, loss: 0.3007342517375946, mean loss: 0.33864232441068143
Epoch: 78, step: 824, loss: 0.3571849763393402, mean loss: 0.33864248784398154
Epoch: 78, step: 825, loss: 0.38872766494750977, mean loss: 0.33864292928642814
Epoch: 78, step: 826, loss: 0.3181508183479309, mean loss: 0.33864274867395194
Epoch: 78, step: 827, loss: 0.3517599403858185, mean loss: 0.33864286428466683
Epoch: 78, step: 828, loss: 0.3265543580055237, mean loss: 0.338642757741394
Epoch: 78, step: 829, loss: 0.33492520451545715, mean loss: 0.33864272497665143
Epoch: 78, step: 830, loss: 0.31054049730300903, mean loss: 0.33864247729919117
Epoch: 78, step: 831, loss: 0.32636478543281555, mean loss: 0.33864236909137313
Epoch: 78, step: 832, loss: 0.330172061920166, mean loss: 0.3386422944400959
Epoch: 78, step: 833, loss: 0.3066428005695343, mean loss: 0.33864201242174796
Epoch: 78, step: 834, loss: 0.3119841516017914, mean loss: 0.3386417774824192
Epoch: 78, step: 835, loss: 0.35846665501594543, mean loss: 0.3386419522002034
Epoch: 78, step: 836, loss: 0.344857394695282, mean loss: 0.33864200697677227
Epoch: 78, step: 837, loss: 0.33713364601135254, mean loss: 0.33864199368373477
Epoch: 78, step: 838, loss: 0.3073250651359558, mean loss: 0.33864171769314205
Epoch: 78, step: 839, loss: 0.38113781809806824, mean loss: 0.33864209220051306
Epoch: 78, step: 840, loss: 0.36224663257598877, mean loss: 0.33864230021951647
Epoch: 78, step: 841, loss: 0.3571345806121826, mean loss: 0.3386424631844282
Epoch: 78, step: 842, loss: 0.3450675904750824, mean loss: 0.3386425198059509
Epoch: 78, step: 843, loss: 0.322258323431015, mean loss: 0.33864237542126713
Epoch: 78, step: 844, loss: 0.35031989216804504, mean loss: 0.33864247832773053
Epoch: 78, step: 845, loss: 0.33279794454574585, mean loss: 0.3386424268240577
Epoch: 78, step: 846, loss: 0.37153059244155884, mean loss: 0.338642716641254
Epoch: 78, step: 847, loss: 0.2992200255393982, mean loss: 0.33864236924355307
Epoch: 78, step: 848, loss: 0.3024912476539612, mean loss: 0.33864205067814046
Epoch: 78, step: 849, loss: 0.31819069385528564, mean loss: 0.338641870461394
Epoch: 78, step: 850, loss: 0.3514135479927063, mean loss: 0.3386419830040438
Epoch: 78, step: 851, loss: 0.3277398943901062, mean loss: 0.3386418869368571
Epoch: 78, step: 852, loss: 0.32932037115097046, mean loss: 0.33864180479810935
Epoch: 78, step: 853, loss: 0.32115450501441956, mean loss: 0.3386416507059765
Epoch: 78, step: 854, loss: 0.30760109424591064, mean loss: 0.3386413771895697
Epoch: 78, step: 855, loss: 0.3051178753376007, mean loss: 0.338641081797089
Epoch: 78, step: 856, loss: 0.34246256947517395, mean loss: 0.33864111546984743
Epoch: 78, step: 857, loss: 0.3199421465396881, mean loss: 0.3386409507067059
Epoch: 78, step: 858, loss: 0.30259671807289124, mean loss: 0.3386406331111905
Epoch: 78, step: 859, loss: 0.38509654998779297, mean loss: 0.33864104244327453
Epoch: 78, step: 860, loss: 0.3318450152873993, mean loss: 0.3386409825626902
Epoch: 78, step: 861, loss: 0.3355734050273895, mean loss: 0.3386409555341465
Epoch: 78, step: 862, loss: 0.30445539951324463, mean loss: 0.33864065432655127
Epoch: 78, step: 863, loss: 0.35751938819885254, mean loss: 0.33864082066487045
Epoch: 78, step: 864, loss: 0.30252155661582947, mean loss: 0.3386405024250575
Epoch: 78, step: 865, loss: 0.3293451964855194, mean loss: 0.3386404205266457
Epoch: 78, step: 866, loss: 0.32830458879470825, mean loss: 0.3386403294612466
Epoch: 78, step: 867, loss: 0.35602179169654846, mean loss: 0.33864048260188306
Epoch: 78, step: 868, loss: 0.37340664863586426, mean loss: 0.3386407889090172
Epoch: 78, step: 869, loss: 0.3636236786842346, mean loss: 0.3386410090187049
Epoch: 78, step: 870, loss: 0.34372079372406006, mean loss: 0.33864105377333437
Epoch: 78, step: 871, loss: 0.35008278489112854, mean loss: 0.33864115457798544
Epoch: 78, step: 872, loss: 0.3211689889431, mean loss: 0.3386410006449813
Epoch: 78, step: 873, loss: 0.3446156978607178, mean loss: 0.33864105328270283
Epoch: 78, step: 874, loss: 0.32564061880111694, mean loss: 0.33864093874849366
Epoch: 78, step: 875, loss: 0.34748828411102295, mean loss: 0.33864101669317914
Epoch: 78, step: 876, loss: 0.33034199476242065, mean loss: 0.3386409435798407
Epoch: 78, step: 877, loss: 0.3105992376804352, mean loss: 0.3386406965381184
Epoch: 78, step: 878, loss: 0.30685871839523315, mean loss: 0.33864041654782545
Epoch: 78, step: 879, loss: 0.3530927300453186, mean loss: 0.3386405438675229
Epoch: 78, step: 880, loss: 0.30985546112060547, mean loss: 0.3386402902835039
Epoch: 78, step: 881, loss: 0.33222073316574097, mean loss: 0.338640233730505
Epoch: 78, step: 882, loss: 0.3010129928588867, mean loss: 0.3386399022567714
Epoch: 78, step: 883, loss: 0.3383093476295471, mean loss: 0.3386398993448063
Epoch: 78, step: 884, loss: 0.30148324370384216, mean loss: 0.33863957202241723
Epoch: 78, step: 885, loss: 0.2994062602519989, mean loss: 0.338639226409283
Epoch: 78, step: 886, loss: 0.3664698004722595, mean loss: 0.33863947157153834
Epoch: 78, step: 887, loss: 0.34437263011932373, mean loss: 0.33863952207504916
Epoch: 78, step: 888, loss: 0.30324432253837585, mean loss: 0.33863921028075966
Epoch: 78, step: 889, loss: 0.30456626415252686, mean loss: 0.33863891013676883
Epoch: 78, step: 890, loss: 0.3030361533164978, mean loss: 0.3386385965196444
Epoch: 78, step: 891, loss: 0.3457542061805725, mean loss: 0.3386386591989867
Epoch: 78, step: 892, loss: 0.3462758958339691, mean loss: 0.33863872647259724
Epoch: 78, step: 893, loss: 0.34195777773857117, mean loss: 0.33863875570864244
Epoch: 78, step: 894, loss: 0.3296606242656708, mean loss: 0.3386386766249756
Epoch: 78, step: 895, loss: 0.31952109932899475, mean loss: 0.3386385082297137
Epoch: 78, step: 896, loss: 0.3370114266872406, mean loss: 0.3386384938978554
Epoch: 78, step: 897, loss: 0.3038548529148102, mean loss: 0.33863818751504043
Epoch: 78, step: 898, loss: 0.34388989210128784, mean loss: 0.3386382337729311
Epoch: 78, step: 899, loss: 0.3278350234031677, mean loss: 0.3386381386172889
Epoch: 78, step: 900, loss: 0.29369333386421204, mean loss: 0.33863774274291975
Epoch: 78, step: 901, loss: 0.3185279071331024, mean loss: 0.3386375656168112
Epoch: 78, step: 902, loss: 0.303832471370697, mean loss: 0.3386372590585318
Epoch: 78, step: 903, loss: 0.3472515046596527, mean loss: 0.3386373349309036
Epoch: 78, step: 904, loss: 0.3882591128349304, mean loss: 0.338637771984709
Epoch: 78, step: 905, loss: 0.34646353125572205, mean loss: 0.33863784091105326
Epoch: 78, step: 906, loss: 0.349618524312973, mean loss: 0.3386379376239308
Epoch: 78, step: 907, loss: 0.3116946816444397, mean loss: 0.33863770032204615
Epoch: 78, step: 908, loss: 0.32575079798698425, mean loss: 0.3386375868220564
Epoch: 78, step: 909, loss: 0.3829704225063324, mean loss: 0.33863797727524275
Epoch: 78, step: 910, loss: 0.2942763566970825, mean loss: 0.33863758657197984
Epoch: 78, step: 911, loss: 0.2984195649623871, mean loss: 0.33863723236549065
Epoch: 78, step: 912, loss: 0.32921478152275085, mean loss: 0.3386371493812039
Epoch: 78, step: 913, loss: 0.32719144225120544, mean loss: 0.3386370485788231
Epoch: 78, step: 914, loss: 0.32484740018844604, mean loss: 0.3386369271344134
Epoch: 78, step: 915, loss: 0.35324397683143616, mean loss: 0.3386370557764828
Epoch: 78, step: 916, loss: 0.3131406009197235, mean loss: 0.3386368312350526
Epoch: 78, step: 917, loss: 0.33019644021987915, mean loss: 0.3386367569031194
Epoch: 78, step: 918, loss: 0.3242654800415039, mean loss: 0.33863663034080943
Epoch: 78, step: 919, loss: 0.30849018692970276, mean loss: 0.33863636485501075
Epoch: 78, step: 920, loss: 0.3452087640762329, mean loss: 0.33863642273458433
Epoch: 78, step: 921, loss: 0.33407148718833923, mean loss: 0.3386363825340141
Epoch: 78, step: 922, loss: 0.37126389145851135, mean loss: 0.3386366698618194
Epoch: 78, step: 923, loss: 0.3309355676174164, mean loss: 0.338636602044159
Epoch: 78, step: 924, loss: 0.3290470242500305, mean loss: 0.33863651759689645
Epoch: 78, step: 925, loss: 0.3092764616012573, mean loss: 0.3386362590501098
Epoch: 78, step: 926, loss: 0.3298428952693939, mean loss: 0.33863618161579123
Epoch: 78, step: 927, loss: 0.315046101808548, mean loss: 0.3386359738834928
Epoch: 78, step: 928, loss: 0.30031344294548035, mean loss: 0.3386356364214157
Epoch: 78, step: 929, loss: 0.293401300907135, mean loss: 0.33863523809860074
Epoch: 78, step: 930, loss: 0.3630269169807434, mean loss: 0.3386354528840404
Epoch: 78, step: 931, loss: 0.36408916115760803, mean loss: 0.3386356770194026
Epoch: 78, step: 932, loss: 0.3986758589744568, mean loss: 0.3386362057050184
Epoch: 78, step: 933, loss: 0.29090556502342224, mean loss: 0.3386357854151369
Epoch: 78, step: 934, loss: 0.32859134674072266, mean loss: 0.3386356969700897
Epoch: 78, step: 935, loss: 0.34364035725593567, mean loss: 0.33863574103761124
Epoch: 78, step: 936, loss: 0.3256366550922394, mean loss: 0.33863562657780316
Epoch: 78, step: 937, loss: 0.3476529121398926, mean loss: 0.33863570597628484
Epoch: 78, step: 938, loss: 0.3003043532371521, mean loss: 0.338635368466245
Epoch: 78, step: 939, loss: 0.36195966601371765, mean loss: 0.33863557383638504
Epoch: 78, step: 940, loss: 0.3048979938030243, mean loss: 0.3386352767800421
Epoch: 78, step: 941, loss: 0.389675110578537, mean loss: 0.3386357261772087
Epoch: 78, step: 942, loss: 0.3505870997905731, mean loss: 0.33863583140612014
Epoch: 78, step: 943, loss: 0.296785831451416, mean loss: 0.3386354629303862
Epoch: 78, step: 944, loss: 0.3068602681159973, mean loss: 0.3386351831625211
Epoch: 78, step: 945, loss: 0.3579990565776825, mean loss: 0.3386353536521707
Epoch: 78, step: 946, loss: 0.28386396169662476, mean loss: 0.3386348714204909
Epoch: 78, step: 947, loss: 0.33943378925323486, mean loss: 0.3386348784544567
Epoch: 78, step: 948, loss: 0.32328009605407715, mean loss: 0.33863474326650805
Epoch: 78, step: 949, loss: 0.3915270268917084, mean loss: 0.3386352089413828
Epoch: 78, step: 950, loss: 0.30152711272239685, mean loss: 0.33863488223671556
Epoch: 78, step: 951, loss: 0.35358676314353943, mean loss: 0.33863501387392597
Epoch: 78, step: 952, loss: 0.3413187265396118, mean loss: 0.338635037501277
Epoch: 78, step: 953, loss: 0.3451912999153137, mean loss: 0.33863509522196805
Epoch: 78, step: 954, loss: 0.3073791265487671, mean loss: 0.33863482004990897
Epoch: 78, step: 955, loss: 0.30664607882499695, mean loss: 0.3386345384291284
Epoch: 78, step: 956, loss: 0.3160773813724518, mean loss: 0.33863433984337576
Epoch: 78, step: 957, loss: 0.2987086772918701, mean loss: 0.3386339883541377
Epoch: 78, step: 958, loss: 0.33162739872932434, mean loss: 0.3386339266715253
Epoch: 78, step: 959, loss: 0.3337002992630005, mean loss: 0.3386338832386479
Epoch: 78, step: 960, loss: 0.3415796756744385, mean loss: 0.3386339091715173
Epoch: 78, step: 961, loss: 0.3091314435005188, mean loss: 0.33863364945299634
Epoch: 78, step: 962, loss: 0.33601710200309753, mean loss: 0.3386336264189944
Epoch: 78, step: 963, loss: 0.3062536418437958, mean loss: 0.3386333413738821
Epoch: 78, step: 964, loss: 0.3753160238265991, mean loss: 0.338633664293347
Epoch: 78, step: 965, loss: 0.3153562843799591, mean loss: 0.33863345938322614
Epoch: 78, step: 966, loss: 0.31624940037727356, mean loss: 0.33863326233871865
Epoch: 78, step: 967, loss: 0.3628886044025421, mean loss: 0.33863347585405373
Epoch: 78, step: 968, loss: 0.3055288791656494, mean loss: 0.33863318444291574
Epoch: 78, step: 969, loss: 0.33334973454475403, mean loss: 0.3386331379344925
Epoch: 78, step: 970, loss: 0.33660975098609924, mean loss: 0.33863312012345803
Epoch: 78, step: 971, loss: 0.3319624364376068, mean loss: 0.3386330614047185
Epoch: 78, step: 972, loss: 0.2933235466480255, mean loss: 0.3386326625709105
Epoch: 78, step: 973, loss: 0.3077594041824341, mean loss: 0.3386323908136232
Epoch: 78, step: 974, loss: 0.31317511200904846, mean loss: 0.3386321667316669
Epoch: 78, step: 975, loss: 0.34147974848747253, mean loss: 0.33863219179664256
Epoch: 78, step: 976, loss: 0.3331359624862671, mean loss: 0.3386321434181751
Epoch: 78, step: 977, loss: 0.33044955134391785, mean loss: 0.3386320713946554
Epoch: 78, step: 978, loss: 0.30851981043815613, mean loss: 0.3386318063476005
Epoch: 78, step: 979, loss: 0.3274610638618469, mean loss: 0.338631708023986
Epoch: 78, step: 980, loss: 0.3260349929332733, mean loss: 0.33863159715009755
Epoch: 78, step: 981, loss: 0.3743435740470886, mean loss: 0.33863191147735383
Epoch: 78, step: 982, loss: 0.3827000558376312, mean loss: 0.33863229934994427
Epoch: 78, step: 983, loss: 0.30990490317344666, mean loss: 0.33863204650354783
Epoch: 78, step: 984, loss: 0.34768375754356384, mean loss: 0.3386321261721805
Epoch: 78, step: 985, loss: 0.3530702292919159, mean loss: 0.33863225324802343
Epoch: 78, step: 986, loss: 0.30413132905960083, mean loss: 0.33863194959349213
Epoch: 78, step: 987, loss: 0.34149205684661865, mean loss: 0.33863197476606083
Epoch: 78, step: 988, loss: 0.33293256163597107, mean loss: 0.3386319246044434
Epoch: 78, step: 989, loss: 0.31913426518440247, mean loss: 0.33863175300335013
Epoch: 78, step: 990, loss: 0.335785835981369, mean loss: 0.33863172795633484
Epoch: 78, step: 991, loss: 0.36415207386016846, mean loss: 0.33863195255981565
Epoch: 78, step: 992, loss: 0.2930140793323517, mean loss: 0.3386315510823835
Epoch: 78, step: 993, loss: 0.3167532682418823, mean loss: 0.3386313585359343
Epoch: 78, step: 994, loss: 0.3655955195426941, mean loss: 0.338631595840105
Epoch: 78, step: 995, loss: 0.3235761821269989, mean loss: 0.3386314633427125
Epoch: 78, step: 996, loss: 0.31095486879348755, mean loss: 0.3386312197728971
Epoch: 78, step: 997, loss: 0.32534873485565186, mean loss: 0.33863110288048387
Epoch: 78, step: 998, loss: 0.28811919689178467, mean loss: 0.33863065835472955
Epoch: 78, step: 999, loss: 0.34012570977211, mean loss: 0.33863067151168724
Epoch: 78, step: 1000, loss: 0.3002508878707886, mean loss: 0.3386303337595937
Epoch: 78, step: 1001, loss: 0.32901298999786377, mean loss: 0.3386302491252082
Epoch: 78, step: 1002, loss: 0.3479560613632202, mean loss: 0.33863033119334074
Epoch: 78, step: 1003, loss: 0.34098079800605774, mean loss: 0.3386303518775149
Epoch: 78, step: 1004, loss: 0.34063616394996643, mean loss: 0.3386303695285623
Epoch: 78, step: 1005, loss: 0.28954017162323, mean loss: 0.33862993754104137
Epoch: 78, step: 1006, loss: 0.320020854473114, mean loss: 0.3386297737849095
Epoch: 78, step: 1007, loss: 0.3102421462535858, mean loss: 0.3386295239817809
Epoch: 78, step: 1008, loss: 0.31594744324684143, mean loss: 0.3386293243876139
Epoch: 78, step: 1009, loss: 0.29615452885627747, mean loss: 0.3386289506279517
Epoch: 78, step: 1010, loss: 0.37497422099113464, mean loss: 0.3386292704476534
Epoch: 78, step: 1011, loss: 0.3718889057636261, mean loss: 0.3386295631127771
Epoch: 78, step: 1012, loss: 0.3272540271282196, mean loss: 0.3386294630156678
Epoch: 78, step: 1013, loss: 0.30997347831726074, mean loss: 0.3386292108643849
Epoch: 78, step: 1014, loss: 0.31171560287475586, mean loss: 0.3386289740468007
Epoch: 78, step: 1015, loss: 0.34224992990493774, mean loss: 0.3386290059079497
Epoch: 78, step: 1016, loss: 0.3586750626564026, mean loss: 0.338629182293635
Epoch: 78, step: 1017, loss: 0.3282582461833954, mean loss: 0.3386290910403476
Epoch: 78, step: 1018, loss: 0.32865145802497864, mean loss: 0.33862900324848466
Epoch: 78, step: 1019, loss: 0.3301446735858917, mean loss: 0.3386289285966557
Epoch: 78, step: 1020, loss: 0.36333099007606506, mean loss: 0.3386291459429772
Epoch: 78, step: 1021, loss: 0.3748818635940552, mean loss: 0.3386294649173877
Epoch: 78, step: 1022, loss: 0.32145559787750244, mean loss: 0.338629313812139
Epoch: 78, step: 1023, loss: 0.3475870192050934, mean loss: 0.33862939262632735
Epoch: 78, step: 1024, loss: 0.35353919863700867, mean loss: 0.3386295238087975
Epoch: 78, step: 1025, loss: 0.39887747168540955, mean loss: 0.33863005388981143
Epoch: 78, step: 1026, loss: 0.3054220676422119, mean loss: 0.3386297617177331
Epoch: 78, step: 1027, loss: 0.3155411183834076, mean loss: 0.33862955857992444
Epoch: 78, step: 1028, loss: 0.34988901019096375, mean loss: 0.33862965764162206
Epoch: 78, step: 1029, loss: 0.29550376534461975, mean loss: 0.3386292782193675
Epoch: 78, step: 1030, loss: 0.3189676105976105, mean loss: 0.33862910523723944
Epoch: 78, step: 1031, loss: 0.3263355493545532, mean loss: 0.33862899708025146
Epoch: 78, step: 1032, loss: 0.2851797640323639, mean loss: 0.3386285268454998
Epoch: 78, step: 1033, loss: 0.35927796363830566, mean loss: 0.3386287085131647
Epoch: 78, step: 1034, loss: 0.32416194677352905, mean loss: 0.33862858123997425
Epoch: 78, step: 1035, loss: 0.3200256824493408, mean loss: 0.3386284175800278
Epoch: 78, step: 1036, loss: 0.32809072732925415, mean loss: 0.3386283248749785
Epoch: 78, step: 1037, loss: 0.34043413400650024, mean loss: 0.3386283407613965
Epoch: 78, step: 1038, loss: 0.3247237503528595, mean loss: 0.33862821843828494
Epoch: 78, step: 1039, loss: 0.33126017451286316, mean loss: 0.33862815361982546
Epoch: 78, step: 1040, loss: 0.32735005021095276, mean loss: 0.3386280544045025
Epoch: 78, step: 1041, loss: 0.3282710313796997, mean loss: 0.33862796329287603
Epoch: 78, step: 1042, loss: 0.34509649872779846, mean loss: 0.33862802019664057
Epoch: 78, step: 1043, loss: 0.30579662322998047, mean loss: 0.33862773138108615
Epoch: 78, step: 1044, loss: 0.31929630041122437, mean loss: 0.3386275613253056
Epoch: 78, step: 1045, loss: 0.31135088205337524, mean loss: 0.33862732137844453
Epoch: 78, step: 1046, loss: 0.3624235987663269, mean loss: 0.3386275307071454
Epoch: 78, step: 1047, loss: 0.3732551336288452, mean loss: 0.33862783531308244
Epoch: 78, step: 1048, loss: 0.343525767326355, mean loss: 0.33862787839796044
Epoch: 78, step: 1049, loss: 0.35681581497192383, mean loss: 0.33862803838755046
Epoch: 78, step: 1050, loss: 0.35408496856689453, mean loss: 0.3386281743527359
Epoch: 78, step: 1051, loss: 0.32452306151390076, mean loss: 0.3386280502797543
Epoch: 78, step: 1052, loss: 0.3213513195514679, mean loss: 0.33862789830956713
Epoch: 78, step: 1053, loss: 0.3460797369480133, mean loss: 0.33862796385711597
Epoch: 78, step: 1054, loss: 0.320382297039032, mean loss: 0.33862780336676246
Epoch: 78, step: 1055, loss: 0.33168497681617737, mean loss: 0.33862774229763865
Epoch: 78, step: 1056, loss: 0.3345347046852112, mean loss: 0.3386277062955838
Epoch: 78, step: 1057, loss: 0.3311915695667267, mean loss: 0.33862764088845276
Epoch: 78, step: 1058, loss: 0.3148445188999176, mean loss: 0.33862743169755827
Epoch: 78, step: 1059, loss: 0.3475019931793213, mean loss: 0.33862750975548217
Epoch: 78, step: 1060, loss: 0.31451883912086487, mean loss: 0.3386272977048666
Epoch: 78, step: 1061, loss: 0.3212214410305023, mean loss: 0.3386271446109771
Epoch: 78, step: 1062, loss: 0.31916293501853943, mean loss: 0.33862697341427017
Epoch: 78, step: 1063, loss: 0.3258002698421478, mean loss: 0.33862686059848446
Epoch: 78, step: 1064, loss: 0.3170328140258789, mean loss: 0.3386266706722193
Epoch: 78, step: 1065, loss: 0.2968480587005615, mean loss: 0.3386263032197402
Epoch: 78, step: 1066, loss: 0.3057538866996765, mean loss: 0.3386260141018366
Epoch: 78, step: 1067, loss: 0.33413586020469666, mean loss: 0.3386259746105974
Epoch: 78, step: 1068, loss: 0.3421132564544678, mean loss: 0.33862600528123216
Epoch: 78, step: 1069, loss: 0.3360297381877899, mean loss: 0.33862598244727066
Epoch: 78, step: 1070, loss: 0.3142545819282532, mean loss: 0.3386257681046366
Epoch: 78, step: 1071, loss: 0.33733463287353516, mean loss: 0.3386257567494052
Epoch: 78, step: 1072, loss: 0.301937460899353, mean loss: 0.3386254340872896
Epoch: 78, step: 1073, loss: 0.3115547001361847, mean loss: 0.33862519601072416
Epoch: 78, step: 1074, loss: 0.28512006998062134, mean loss: 0.3386247254581106
Epoch: 78, step: 1075, loss: 0.3769473433494568, mean loss: 0.3386250624846865
Epoch: 78, step: 1076, loss: 0.4149143397808075, mean loss: 0.33862573340147667
Epoch: 78, step: 1077, loss: 0.3303440511226654, mean loss: 0.3386256605698675
Epoch: 78, step: 1078, loss: 0.3569127321243286, mean loss: 0.3386258213904702
Epoch: 78, step: 1079, loss: 0.33609041571617126, mean loss: 0.33862579909374096
Epoch: 78, step: 1080, loss: 0.37974873185157776, mean loss: 0.33862616073166063
Epoch: 78, step: 1081, loss: 0.29145345091819763, mean loss: 0.33862574589523053
Epoch: 78, step: 1082, loss: 0.35382139682769775, mean loss: 0.3386258795244873
Epoch: 78, step: 1083, loss: 0.3487406373023987, mean loss: 0.3386259684720213
Epoch: 78, step: 1084, loss: 0.3332041800022125, mean loss: 0.338625920794115
Epoch: 78, step: 1085, loss: 0.3349222242832184, mean loss: 0.3386258882249834
Epoch: 78, step: 1086, loss: 0.3060356676578522, mean loss: 0.33862560163944744
Epoch: 78, step: 1087, loss: 0.32062047719955444, mean loss: 0.3386254433108822
Epoch: 78, step: 1088, loss: 0.3187614977359772, mean loss: 0.3386252686382573
Epoch: 78, step: 1089, loss: 0.3291793167591095, mean loss: 0.33862518557647614
Epoch: 78, step: 1090, loss: 0.35236939787864685, mean loss: 0.33862530643340305
Epoch: 78, step: 1091, loss: 0.31550920009613037, mean loss: 0.33862510316842526
Epoch: 78, step: 1092, loss: 0.29038578271865845, mean loss: 0.33862467899326193
Epoch: 78, step: 1093, loss: 0.38422712683677673, mean loss: 0.33862507997850577
Epoch: 78, step: 1094, loss: 0.31210073828697205, mean loss: 0.3386248467503217
Epoch: 78, step: 1095, loss: 0.31296977400779724, mean loss: 0.33862462116759146
Epoch: 78, step: 1096, loss: 0.3396928608417511, mean loss: 0.33862463056044356
Epoch: 78, step: 1097, loss: 0.31828150153160095, mean loss: 0.33862445168829874
Epoch: 78, step: 1098, loss: 0.34147611260414124, mean loss: 0.3386244767620334
Epoch: 78, step: 1099, loss: 0.3353593051433563, mean loss: 0.33862444805268493
Epoch: 78, step: 1100, loss: 0.30497607588768005, mean loss: 0.3386241521986042
Epoch: 78, step: 1101, loss: 0.33978545665740967, mean loss: 0.3386241624093104
Epoch: 78, step: 1102, loss: 0.347295880317688, mean loss: 0.3386242386542474
Epoch: 78, step: 1103, loss: 0.3281172215938568, mean loss: 0.3386241462734967
Epoch: 78, step: 1104, loss: 0.33794617652893066, mean loss: 0.3386241403126419
Epoch: 78, step: 1105, loss: 0.3251594305038452, mean loss: 0.3386240219290778
Epoch: 78, step: 1106, loss: 0.3339460790157318, mean loss: 0.3386239808003277
Epoch: 78, step: 1107, loss: 0.362500935792923, mean loss: 0.33862419072607935
Epoch: 78, step: 1108, loss: 0.3288143277168274, mean loss: 0.33862410447870145
Epoch: 78, step: 1109, loss: 0.31014108657836914, mean loss: 0.33862385406093226
Epoch: 78, step: 1110, loss: 0.2918572425842285, mean loss: 0.33862344290058416
Epoch: 78, step: 1111, loss: 0.30880510807037354, mean loss: 0.338623180747549
Epoch: 78, step: 1112, loss: 0.32261526584625244, mean loss: 0.33862304001244065
Epoch: 78, step: 1113, loss: 0.32925915718078613, mean loss: 0.3386229576896967
Epoch: 78, step: 1114, loss: 0.32411274313926697, mean loss: 0.3386228301240066
Epoch: 78, step: 1115, loss: 0.3425617516040802, mean loss: 0.33862286475249664
Epoch: 78, step: 1116, loss: 0.33979201316833496, mean loss: 0.33862287503081484
Epoch: 78, step: 1117, loss: 0.3082517087459564, mean loss: 0.3386226080315508
Epoch: 78, step: 1118, loss: 0.3560502231121063, mean loss: 0.33862276124000684
Epoch: 78, step: 1119, loss: 0.3267037868499756, mean loss: 0.33862265645965667
Epoch: 78, step: 1120, loss: 0.2976745367050171, mean loss: 0.3386222964856801
Epoch: 78, step: 1121, loss: 0.31309273838996887, mean loss: 0.3386220720578965
Epoch: 78, step: 1122, loss: 0.3459564745426178, mean loss: 0.338622136533326
Epoch: 78, step: 1123, loss: 0.3619157671928406, mean loss: 0.33862234130169566
Epoch: 78, step: 1124, loss: 0.349600613117218, mean loss: 0.3386224378080365
Epoch: 78, step: 1125, loss: 0.3298700749874115, mean loss: 0.3386223608695986
Epoch: 78, step: 1126, loss: 0.3271884024143219, mean loss: 0.338622260359235
Epoch: 78, step: 1127, loss: 0.3572320342063904, mean loss: 0.33862242394726105
Epoch: 78, step: 1128, loss: 0.3298979699611664, mean loss: 0.33862234725618073
Epoch: 78, step: 1129, loss: 0.3121465742588043, mean loss: 0.3386221145266841
Epoch: 78, step: 1130, loss: 0.3184305727481842, mean loss: 0.33862193703890886
Epoch: 78, step: 1131, loss: 0.3082438111305237, mean loss: 0.33862167001132626
Epoch: 78, step: 1132, loss: 0.33584240078926086, mean loss: 0.3386216455814118
Epoch: 78, step: 1133, loss: 0.33926087617874146, mean loss: 0.3386216512002311
Epoch: 78, step: 1134, loss: 0.33942097425460815, mean loss: 0.3386216582261969
Epoch: 78, step: 1135, loss: 0.3632432520389557, mean loss: 0.3386218746455223
Epoch: 78, step: 1136, loss: 0.3471815288066864, mean loss: 0.33862194988266214
Epoch: 78, step: 1137, loss: 0.3447454869747162, mean loss: 0.3386220037064917
Epoch: 78, step: 1138, loss: 0.34148839116096497, mean loss: 0.338622028900851
Epoch: 78, step: 1139, loss: 0.33049118518829346, mean loss: 0.33862195743472834
Epoch: 78, step: 1140, loss: 0.32569074630737305, mean loss: 0.33862184377673277
Epoch: 78, step: 1141, loss: 0.3206997215747833, mean loss: 0.33862168625285033
Epoch: 78, step: 1142, loss: 0.3484414219856262, mean loss: 0.33862177256122855
Epoch: 78, step: 1143, loss: 0.3066962659358978, mean loss: 0.3386214919615711
Epoch: 78, step: 1144, loss: 0.32589834928512573, mean loss: 0.3386213801363105
Epoch: 78, step: 1145, loss: 0.34049397706985474, mean loss: 0.33862139659464985
Epoch: 78, step: 1146, loss: 0.3259812295436859, mean loss: 0.33862128550062504
Epoch: 78, step: 1147, loss: 0.3518573045730591, mean loss: 0.33862140183055184
Epoch: 78, step: 1148, loss: 0.36458316445350647, mean loss: 0.3386216300036442
Epoch: 78, step: 1149, loss: 0.33355972170829773, mean loss: 0.33862158551586674
Epoch: 78, step: 1150, loss: 0.3698978126049042, mean loss: 0.338621860391965
Epoch: 78, step: 1151, loss: 0.326149582862854, mean loss: 0.3386217507783328
Epoch: 78, step: 1152, loss: 0.348877489566803, mean loss: 0.33862184091094066
Epoch: 78, step: 1153, loss: 0.29347386956214905, mean loss: 0.33862144413127226
Epoch: 78, step: 1154, loss: 0.3521415591239929, mean loss: 0.33862156295077706
Epoch: 78, step: 1155, loss: 0.3107159733772278, mean loss: 0.33862131770883963
Epoch: 78, step: 1156, loss: 0.33095479011535645, mean loss: 0.33862125033389484
Epoch: 78, step: 1157, loss: 0.31871262192726135, mean loss: 0.33862107537450997
Epoch: 78, step: 1158, loss: 0.3273976147174835, mean loss: 0.3386209767422749
Epoch: 78, step: 1159, loss: 0.3429900109767914, mean loss: 0.3386210151371905
Epoch: 78, step: 1160, loss: 0.3540434241294861, mean loss: 0.33862115066757453
Epoch: 78, step: 1161, loss: 0.3183174431324005, mean loss: 0.3386209722424595
Epoch: 78, step: 1162, loss: 0.3858114778995514, mean loss: 0.33862138693999155
Epoch: 78, step: 1163, loss: 0.34171637892723083, mean loss: 0.3386214141377137
Epoch: 78, step: 1164, loss: 0.3665638267993927, mean loss: 0.3386216596838411
Epoch: 78, step: 1165, loss: 0.3183058202266693, mean loss: 0.33862148115838847
Epoch: 78, step: 1166, loss: 0.33401232957839966, mean loss: 0.33862144065582184
Epoch: 78, step: 1167, loss: 0.34834712743759155, mean loss: 0.3386215261187988
Epoch: 78, step: 1168, loss: 0.3205380439758301, mean loss: 0.3386213672143767
Epoch: 78, step: 1169, loss: 0.33864641189575195, mean loss: 0.3386213674344491
Epoch: 78, step: 1170, loss: 0.28665271401405334, mean loss: 0.33862091077993717
Epoch: 78, step: 1171, loss: 0.3079589307308197, mean loss: 0.3386206413519729
Epoch: 78, step: 1172, loss: 0.3152959644794464, mean loss: 0.33862043639896666
Epoch: 78, step: 1173, loss: 0.3275783061981201, mean loss: 0.3386203393730612
Epoch: 78, step: 1174, loss: 0.3150654435157776, mean loss: 0.3386201324007672
Epoch: 78, step: 1175, loss: 0.3039901554584503, mean loss: 0.338619828116561
Epoch: 78, step: 1176, loss: 0.322200745344162, mean loss: 0.33861968384780566
Epoch: 78, step: 1177, loss: 0.30825474858283997, mean loss: 0.33861941704405146
Epoch: 78, step: 1178, loss: 0.34889963269233704, mean loss: 0.3386195073711345
Epoch: 78, step: 1179, loss: 0.3175382614135742, mean loss: 0.3386193221424595
Epoch: 78, step: 1180, loss: 0.32369130849838257, mean loss: 0.33861919097981863
Epoch: 78, step: 1181, loss: 0.3198005259037018, mean loss: 0.3386190256340345
Epoch: 78, step: 1182, loss: 0.3089185357093811, mean loss: 0.338618764679943
Epoch: 78, step: 1183, loss: 0.3851681053638458, mean loss: 0.3386191736676133
Epoch: 78, step: 1184, loss: 0.39019909501075745, mean loss: 0.33861962685054153
Epoch: 78, step: 1185, loss: 0.304796427488327, mean loss: 0.3386193296813823
Epoch: 78, step: 1186, loss: 0.3037542998790741, mean loss: 0.33861902336143745
Epoch: 78, step: 1187, loss: 0.3181852698326111, mean loss: 0.3386188438345219
Epoch: 78, step: 1188, loss: 0.3598327338695526, mean loss: 0.338619030213925
Epoch: 78, step: 1189, loss: 0.3290294110774994, mean loss: 0.33861894596290903
Epoch: 78, step: 1190, loss: 0.3687168061733246, mean loss: 0.3386192103897842
Epoch: 78, step: 1191, loss: 0.30498212575912476, mean loss: 0.3386189148713994
Epoch: 78, step: 1192, loss: 0.34118011593818665, mean loss: 0.3386189373726168
Epoch: 78, step: 1193, loss: 0.32264167070388794, mean loss: 0.3386187970069124
Epoch: 78, step: 1194, loss: 0.2975403666496277, mean loss: 0.33861843612214554
Epoch: 78, step: 1195, loss: 0.34920406341552734, mean loss: 0.3386185291188361
Epoch: 78, step: 1196, loss: 0.34634333848953247, mean loss: 0.3386185969821167
Epoch: 78, step: 1197, loss: 0.3270432651042938, mean loss: 0.33861849529247534
Epoch: 78, step: 1198, loss: 0.3686046600341797, mean loss: 0.33861875871952724
Epoch: 78, step: 1199, loss: 0.3095431923866272, mean loss: 0.3386185032942836
Epoch: 78, step: 1200, loss: 0.32645145058631897, mean loss: 0.3386183964091738
Epoch: 78, step: 1201, loss: 0.3341323137283325, mean loss: 0.33861835700018633
Epoch: 78, step: 1202, loss: 0.37065625190734863, mean loss: 0.33861863844170176
Epoch: 78, step: 1203, loss: 0.3517402112483978, mean loss: 0.3386187537090408
Epoch: 78, step: 1204, loss: 0.37231773138046265, mean loss: 0.3386190497373767
Epoch: 78, step: 1205, loss: 0.3301916718482971, mean loss: 0.33861897570780936
Epoch: 78, step: 1206, loss: 0.33024367690086365, mean loss: 0.33861890213637247
Epoch: 78, step: 1207, loss: 0.30795153975486755, mean loss: 0.3386186327463305
Epoch: 78, step: 1208, loss: 0.3497743010520935, mean loss: 0.338618730739745
Epoch: 78, step: 1209, loss: 0.29291027784347534, mean loss: 0.3386183292319281
Epoch: 78, step: 1210, loss: 0.3689638376235962, mean loss: 0.33861859578769693
Epoch: 78, step: 1211, loss: 0.389665424823761, mean loss: 0.33861904418048916
Epoch: 78, step: 1212, loss: 0.33638641238212585, mean loss: 0.3386190245693354
Epoch: 78, step: 1213, loss: 0.3123570680618286, mean loss: 0.338618793889676
Epoch: 78, step: 1214, loss: 0.35229066014289856, mean loss: 0.3386189139795005
Epoch: 78, step: 1215, loss: 0.28792253136634827, mean loss: 0.3386184686806581
Epoch: 78, step: 1216, loss: 0.34557652473449707, mean loss: 0.3386185297971901
Epoch: 78, step: 1217, loss: 0.3112914562225342, mean loss: 0.33861828977019337
Epoch: 78, step: 1218, loss: 0.3095810115337372, mean loss: 0.33861803472387636
Epoch: 78, step: 1219, loss: 0.3569106459617615, mean loss: 0.3386181953939677
Epoch: 78, step: 1220, loss: 0.3072921931743622, mean loss: 0.33861792024968324
Epoch: 78, step: 1221, loss: 0.3143424093723297, mean loss: 0.33861770703353905
Epoch: 78, step: 1222, loss: 0.36893507838249207, mean loss: 0.33861797331408316
Epoch: 78, step: 1223, loss: 0.3401850461959839, mean loss: 0.33861798707772217
Epoch: 78, step: 1224, loss: 0.36253437399864197, mean loss: 0.33861819713408164
Epoch: 78, step: 1225, loss: 0.3185945153236389, mean loss: 0.33861802126868956
Epoch: 78, step: 1226, loss: 0.34981095790863037, mean loss: 0.33861811957393234
Epoch: 78, step: 1227, loss: 0.3602651357650757, mean loss: 0.33861830969351947
Epoch: 78, step: 1228, loss: 0.3185173273086548, mean loss: 0.3386181331538581
Epoch: 78, step: 1229, loss: 0.34695953130722046, mean loss: 0.3386182064126991
Epoch: 78, step: 1230, loss: 0.3283730745315552, mean loss: 0.33861811643499007
Epoch: 78, step: 1231, loss: 0.33507096767425537, mean loss: 0.33861808528248566
Epoch: 78, step: 1232, loss: 0.3119131624698639, mean loss: 0.33861785075104217
Epoch: 78, step: 1233, loss: 0.31811198592185974, mean loss: 0.33861767066335285
Epoch: 78, step: 1234, loss: 0.2997920513153076, mean loss: 0.33861732968994224
Epoch: 78, step: 1235, loss: 0.3380688428878784, mean loss: 0.33861732487307705
Epoch: 78, step: 1236, loss: 0.3014684319496155, mean loss: 0.3386169986307027
Epoch: 78, step: 1237, loss: 0.3509480655193329, mean loss: 0.3386171069214456
Epoch: 78, step: 1238, loss: 0.34079328179359436, mean loss: 0.3386171260323243
Epoch: 78, step: 1239, loss: 0.3255033493041992, mean loss: 0.33861701086988993
Epoch: 78, step: 1240, loss: 0.3366934359073639, mean loss: 0.33861699397760675
Epoch: 78, step: 1241, loss: 0.2838766574859619, mean loss: 0.33861651326790576
Epoch: 78, step: 1242, loss: 0.3241080343723297, mean loss: 0.3386163858608463
Epoch: 78, step: 1243, loss: 0.31468701362609863, mean loss: 0.33861617572550406
Epoch: 78, step: 1244, loss: 0.3349818289279938, mean loss: 0.33861614381083477
Epoch: 78, step: 1245, loss: 0.3038327693939209, mean loss: 0.33861583836663645
Epoch: 78, step: 1246, loss: 0.30898773670196533, mean loss: 0.33861557819486054
Epoch: 78, step: 1247, loss: 0.36378830671310425, mean loss: 0.3386157992409487
Epoch: 78, step: 1248, loss: 0.3442835807800293, mean loss: 0.3386158490102828
Epoch: 78, step: 1249, loss: 0.30749520659446716, mean loss: 0.33861557573933204
Epoch: 78, step: 1250, loss: 0.3333587348461151, mean loss: 0.3386155295793179
Epoch: 78, step: 1251, loss: 0.34343430399894714, mean loss: 0.3386155718923243
Epoch: 78, step: 1252, loss: 0.3559185266494751, mean loss: 0.3386157238258955
Epoch: 78, step: 1253, loss: 0.32748737931251526, mean loss: 0.3386156261111236
Epoch: 78, step: 1254, loss: 0.32512474060058594, mean loss: 0.33861550765260323
Epoch: 78, step: 1255, loss: 0.3467090427875519, mean loss: 0.33861557871834447
Epoch: 78, step: 1256, loss: 0.3532477915287018, mean loss: 0.3386157071961853
Epoch: 78, step: 1257, loss: 0.3062472939491272, mean loss: 0.3386154229885003
Epoch: 78, step: 1258, loss: 0.3282715082168579, mean loss: 0.33861533216556633
Epoch: 78, step: 1259, loss: 0.33046409487724304, mean loss: 0.3386152605956818
Epoch: 78, step: 1260, loss: 0.31411662697792053, mean loss: 0.33861504549349275
Epoch: 78, step: 1261, loss: 0.33355721831321716, mean loss: 0.33861500108529585
Epoch: 78, step: 1262, loss: 0.3391891419887543, mean loss: 0.33861500612626255
Epoch: 78, step: 1263, loss: 0.3278184235095978, mean loss: 0.3386149113329194
Epoch: 78, step: 1264, loss: 0.3456366956233978, mean loss: 0.33861497298322
Epoch: 78, step: 1265, loss: 0.3012084364891052, mean loss: 0.3386146445618562
Epoch: 78, step: 1266, loss: 0.3405291438102722, mean loss: 0.3386146613706012
Epoch: 78, step: 1267, loss: 0.4011182487010956, mean loss: 0.3386152101290501
Epoch: 78, step: 1268, loss: 0.35457077622413635, mean loss: 0.338615350211807
Epoch: 78, step: 1269, loss: 0.384431928396225, mean loss: 0.3386157524574057
Epoch: 78, step: 1270, loss: 0.33425450325012207, mean loss: 0.33861571416825437
Epoch: 78, step: 1271, loss: 0.2947692573070526, mean loss: 0.33861532922604987
Epoch: 78, step: 1272, loss: 0.35927000641822815, mean loss: 0.33861551055853917
Epoch: 78, step: 1273, loss: 0.3102240562438965, mean loss: 0.3386152613051696
Epoch: 78, step: 1274, loss: 0.3437695801258087, mean loss: 0.3386153065554073
Epoch: 78, step: 1275, loss: 0.33249631524086, mean loss: 0.3386152528366929
Epoch: 78, step: 1276, loss: 0.3467874526977539, mean loss: 0.3386153245799253
Epoch: 78, step: 1277, loss: 0.29851034283638, mean loss: 0.3386149725038851
Epoch: 78, step: 1278, loss: 0.31345176696777344, mean loss: 0.33861475160155313
Epoch: 78, step: 1279, loss: 0.33615145087242126, mean loss: 0.33861472997695935
Epoch: 78, step: 1280, loss: 0.3206078112125397, mean loss: 0.3386145719008946
Epoch: 78, step: 1281, loss: 0.3747391998767853, mean loss: 0.3386148890228285
Epoch: 78, step: 1282, loss: 0.3205699622631073, mean loss: 0.3386147306158868
Epoch: 78, step: 1283, loss: 0.3147136867046356, mean loss: 0.3386145208030079
Epoch: 78, step: 1284, loss: 0.29611268639564514, mean loss: 0.3386141477082599
Epoch: 78, step: 1285, loss: 0.3323996961116791, mean loss: 0.3386140931562875
Epoch: 78, step: 1286, loss: 0.34191569685935974, mean loss: 0.338614122138316
Epoch: 78, step: 1287, loss: 0.3987244665622711, mean loss: 0.33861464979232253
Epoch: 78, step: 1288, loss: 0.3918016850948334, mean loss: 0.338615116668801
Epoch: 78, step: 1289, loss: 0.30600684881210327, mean loss: 0.3386148304355198
Epoch: 78, step: 1290, loss: 0.3632808327674866, mean loss: 0.3386150469502037
Epoch: 78, step: 1291, loss: 0.3223799467086792, mean loss: 0.3386149044420383
Epoch: 78, step: 1292, loss: 0.33379319310188293, mean loss: 0.33861486211848035
Epoch: 78, step: 1293, loss: 0.3444538116455078, mean loss: 0.3386149133706048
Epoch: 78, step: 1294, loss: 0.3155879080295563, mean loss: 0.3386147112499017
Epoch: 78, step: 1295, loss: 0.33188095688819885, mean loss: 0.33861465214455133
Epoch: 78, step: 1296, loss: 0.3034743666648865, mean loss: 0.33861434370433435
Epoch: 78, step: 1297, loss: 0.3599911332130432, mean loss: 0.3386145313352438
Epoch: 78, step: 1298, loss: 0.3658217489719391, mean loss: 0.3386147701395871
Epoch: 78, step: 1299, loss: 0.33129626512527466, mean loss: 0.3386147059038586
Epoch: 78, step: 1300, loss: 0.32004326581954956, mean loss: 0.3386145429006893
Epoch: 78, step: 1301, loss: 0.31272828578948975, mean loss: 0.3386143156967194
Epoch: 78, step: 1302, loss: 0.4174758493900299, mean loss: 0.3386150078592129
Epoch: 78, step: 1303, loss: 0.3800433874130249, mean loss: 0.33861537147018356
Epoch: 78, step: 1304, loss: 0.3035733997821808, mean loss: 0.338615063914502
Epoch: 78, step: 1305, loss: 0.3911493718624115, mean loss: 0.33861552499252645
Epoch: 78, step: 1306, loss: 0.31880807876586914, mean loss: 0.33861535114997715
Epoch: 78, step: 1307, loss: 0.32873302698135376, mean loss: 0.33861526441727424
Epoch: 78, step: 1308, loss: 0.2973879873752594, mean loss: 0.33861490258723026
Epoch: 78, step: 1309, loss: 0.3121740520000458, mean loss: 0.33861467053188116
Epoch: 78, step: 1310, loss: 0.31283339858055115, mean loss: 0.33861444426724047
Epoch: 78, step: 1311, loss: 0.32447609305381775, mean loss: 0.33861432018566345
Epoch: 78, step: 1312, loss: 0.39204245805740356, mean loss: 0.33861478907976034
Epoch: 78, step: 1313, loss: 0.3290722370147705, mean loss: 0.33861470533349397
Epoch: 78, step: 1314, loss: 0.3585492968559265, mean loss: 0.3386148802796665
Epoch: 78, step: 1315, loss: 0.3507925868034363, mean loss: 0.3386149871504016
Epoch: 78, step: 1316, loss: 0.3310735523700714, mean loss: 0.33861492096785695
Epoch: 78, step: 1317, loss: 0.32732659578323364, mean loss: 0.33861482190401154
Epoch: 78, step: 1318, loss: 0.3230806291103363, mean loss: 0.3386146855805673
Epoch: 78, step: 1319, loss: 0.33438560366630554, mean loss: 0.33861464846773104
Epoch: 78, step: 1320, loss: 0.3281624913215637, mean loss: 0.3386145567443262
Epoch: 78, step: 1321, loss: 0.3434124290943146, mean loss: 0.33861459884791495
Epoch: 78, step: 1322, loss: 0.3332822024822235, mean loss: 0.33861455205403695
Epoch: 78, step: 1323, loss: 0.3181966543197632, mean loss: 0.33861437288051616
Epoch: 78, step: 1324, loss: 0.3732496201992035, mean loss: 0.33861467681311636
Epoch: 78, step: 1325, loss: 0.3254474997520447, mean loss: 0.3386145612689943
Epoch: 78, step: 1326, loss: 0.2970709800720215, mean loss: 0.33861419672050586
Epoch: 78, step: 1327, loss: 0.3374720513820648, mean loss: 0.3386141866981705
Epoch: 78, step: 1328, loss: 0.3369915783405304, mean loss: 0.3386141724598929
Epoch: 78, step: 1329, loss: 0.309943825006485, mean loss: 0.3386139208817576
Epoch: 78, step: 1330, loss: 0.3447277247905731, mean loss: 0.3386139745290283
Epoch: 78, step: 1331, loss: 0.3143758177757263, mean loss: 0.33861376184645525
Epoch: 78, step: 1332, loss: 0.33260679244995117, mean loss: 0.33861370913755867
Epoch: 78, step: 1333, loss: 0.31996071338653564, mean loss: 0.3386135454659746
Epoch: 78, step: 1334, loss: 0.30485522747039795, mean loss: 0.33861324925463276
Epoch: 78, step: 1335, loss: 0.33282262086868286, mean loss: 0.3386131984453847
Epoch: 78, step: 1336, loss: 0.35585689544677734, mean loss: 0.3386133497470281
Epoch: 78, step: 1337, loss: 0.3410334885120392, mean loss: 0.33861337098190364
Epoch: 78, step: 1338, loss: 0.3241546154022217, mean loss: 0.33861324411844207
Epoch: 78, step: 1339, loss: 0.29149141907691956, mean loss: 0.33861283066755027
Epoch: 78, step: 1340, loss: 0.3201919198036194, mean loss: 0.3386126690423332
Epoch: 78, step: 1341, loss: 0.3238687217235565, mean loss: 0.3386125396799583
Epoch: 78, step: 1342, loss: 0.3314042091369629, mean loss: 0.33861247643511916
Epoch: 78, step: 1343, loss: 0.31110596656799316, mean loss: 0.3386122350991373
Epoch: 78, step: 1344, loss: 0.30500826239585876, mean loss: 0.33861194026796343
Epoch: 78, step: 1345, loss: 0.38330376148223877, mean loss: 0.33861233237715305
Epoch: 78, step: 1346, loss: 0.3919003903865814, mean loss: 0.33861279990238147
Epoch: 78, step: 1347, loss: 0.28631284832954407, mean loss: 0.3386123410503761
Epoch: 78, step: 1348, loss: 0.33897170424461365, mean loss: 0.3386123442032103
Epoch: 78, step: 1349, loss: 0.33648815751075745, mean loss: 0.3386123255670511
Epoch: 78, step: 1350, loss: 0.34296077489852905, mean loss: 0.3386123637170325
Epoch: 78, step: 1351, loss: 0.3734072744846344, mean loss: 0.3386126689783917
Epoch: 78, step: 1352, loss: 0.31709733605384827, mean loss: 0.33861248022256485
Epoch: 78, step: 1353, loss: 0.33636176586151123, mean loss: 0.33861246047703153
Epoch: 78, step: 1354, loss: 0.3378245234489441, mean loss: 0.33861245356451497
Epoch: 78, step: 1355, loss: 0.3460034728050232, mean loss: 0.33861251840484236
Epoch: 78, step: 1356, loss: 0.35373520851135254, mean loss: 0.33861265107282
Epoch: 78, step: 1357, loss: 0.3836454451084137, mean loss: 0.3386130461319834
Epoch: 78, step: 1358, loss: 0.32355543971061707, mean loss: 0.338612914037288
Epoch: 78, step: 1359, loss: 0.3397234380245209, mean loss: 0.33861292377941016
Epoch: 78, step: 1360, loss: 0.3415006101131439, mean loss: 0.3386129491115475
Epoch: 78, step: 1361, loss: 0.32230356335639954, mean loss: 0.33861280603923005
Epoch: 78, step: 1362, loss: 0.342629998922348, mean loss: 0.33861284127930974
Epoch: 78, step: 1363, loss: 0.3000633716583252, mean loss: 0.338612503114202
Epoch: 78, step: 1364, loss: 0.3652653992176056, mean loss: 0.33861273691768895
Epoch: 78, step: 1365, loss: 0.34066200256347656, mean loss: 0.33861275489401876
Epoch: 78, step: 1366, loss: 0.30293288826942444, mean loss: 0.3386124419099871
Epoch: 78, step: 1367, loss: 0.34293147921562195, mean loss: 0.3386124797962793
Epoch: 78, step: 1368, loss: 0.3406124711036682, mean loss: 0.3386124973399088
Epoch: 78, step: 1369, loss: 0.3490857183933258, mean loss: 0.33861258920865717
Epoch: 78, step: 1370, loss: 0.36994585394859314, mean loss: 0.3386128640546239
Epoch: 78, step: 1371, loss: 0.3167078197002411, mean loss: 0.33861267191185385
Epoch: 78, step: 1372, loss: 0.2911069095134735, mean loss: 0.3386122552129161
Epoch: 78, step: 1373, loss: 0.35004279017448425, mean loss: 0.3386123554754897
Epoch: 78, step: 1374, loss: 0.3180076479911804, mean loss: 0.33861217474353916
Epoch: 78, step: 1375, loss: 0.2867056131362915, mean loss: 0.3386117194547734
Epoch: 78, step: 1376, loss: 0.32357239723205566, mean loss: 0.3386115875413085
Epoch: 78, step: 1377, loss: 0.3312133252620697, mean loss: 0.3386115226499632
Epoch: 78, step: 1378, loss: 0.32001522183418274, mean loss: 0.3386113595402561
Epoch: 78, step: 1379, loss: 0.31908920407295227, mean loss: 0.33861118831130244
Epoch: 78, step: 1380, loss: 0.32330289483070374, mean loss: 0.3386110540433375
Epoch: 78, step: 1381, loss: 0.3478725850582123, mean loss: 0.33861113527486186
Epoch: 78, step: 1382, loss: 0.3035805821418762, mean loss: 0.3386108280297351
Epoch: 78, step: 1383, loss: 0.3351045846939087, mean loss: 0.3386107972775307
Epoch: 78, step: 1384, loss: 0.30375006794929504, mean loss: 0.3386104915272537
Epoch: 78, step: 1385, loss: 0.3176886737346649, mean loss: 0.3386103080315092
Epoch: 78, step: 1386, loss: 0.3297034502029419, mean loss: 0.3386102299141969
Epoch: 78, step: 1387, loss: 0.3282523453235626, mean loss: 0.3386101390714975
Epoch: 78, step: 1388, loss: 0.3442951738834381, mean loss: 0.3386101889310393
Epoch: 78, step: 1389, loss: 0.32276976108551025, mean loss: 0.3386100500067278
Epoch: 78, step: 1390, loss: 0.33863088488578796, mean loss: 0.338610050189453
Epoch: 78, step: 1391, loss: 0.2793188989162445, mean loss: 0.33860953020110607
Epoch: 78, step: 1392, loss: 0.3126051723957062, mean loss: 0.33860930214271706
Epoch: 78, step: 1393, loss: 0.33185815811157227, mean loss: 0.33860924293565875
Epoch: 78, step: 1394, loss: 0.3171815872192383, mean loss: 0.33860905501827326
Epoch: 78, step: 1395, loss: 0.345048725605011, mean loss: 0.3386091114927408
Epoch: 78, step: 1396, loss: 0.417194128036499, mean loss: 0.3386098006596768
Epoch: 78, step: 1397, loss: 0.3178554177284241, mean loss: 0.338609618651583
Epoch: 78, step: 1398, loss: 0.29811960458755493, mean loss: 0.3386092635725776
Epoch: 78, step: 1399, loss: 0.31848645210266113, mean loss: 0.3386090871062219
Epoch: 78, step: 1400, loss: 0.3221222758293152, mean loss: 0.33860894252692225
Epoch: 78, step: 1401, loss: 0.3631352186203003, mean loss: 0.3386091576055487
Epoch: 78, step: 1402, loss: 0.3363446891307831, mean loss: 0.3386091377478868
Epoch: 78, step: 1403, loss: 0.3116492033004761, mean loss: 0.3386089013318914
Epoch: 78, step: 1404, loss: 0.34436628222465515, mean loss: 0.3386089518188465
Epoch: 78, step: 1405, loss: 0.3233829140663147, mean loss: 0.33860881830161754
Epoch: 78, step: 1406, loss: 0.37749210000038147, mean loss: 0.3386091592663901
Epoch: 78, step: 1407, loss: 0.3415420651435852, mean loss: 0.33860918498461073
Epoch: 78, step: 1408, loss: 0.32529133558273315, mean loss: 0.3386090682033706
Epoch: 78, step: 1409, loss: 0.3348177373409271, mean loss: 0.3386090349583305
Epoch: 78, step: 1410, loss: 0.34683412313461304, mean loss: 0.3386091070810226
Epoch: 78, step: 1411, loss: 0.37778857350349426, mean loss: 0.33860945062795555
Epoch: 78, step: 1412, loss: 0.351167768239975, mean loss: 0.338609560745169
Epoch: 78, step: 1413, loss: 0.285030335187912, mean loss: 0.33860909094153224
Epoch: 78, step: 1414, loss: 0.323822021484375, mean loss: 0.33860896128385204
Epoch: 78, step: 1415, loss: 0.3178134858608246, mean loss: 0.33860877894417557
Epoch: 78, step: 1416, loss: 0.3082563877105713, mean loss: 0.33860851280952087
Epoch: 78, step: 1417, loss: 0.3778008818626404, mean loss: 0.3386088564515117
Epoch: 78, step: 1418, loss: 0.3253554403781891, mean loss: 0.33860874024546284
Epoch: 78, step: 1419, loss: 0.35817956924438477, mean loss: 0.33860891184112973
Epoch: 78, step: 1420, loss: 0.31754443049430847, mean loss: 0.33860872715084234
Epoch: 78, step: 1421, loss: 0.32221540808677673, mean loss: 0.33860858341788197
Epoch: 78, step: 1422, loss: 0.3231710195541382, mean loss: 0.33860844806595647
Epoch: 78, step: 1423, loss: 0.3323076665401459, mean loss: 0.3386083928230799
Epoch: 78, step: 1424, loss: 0.37005090713500977, mean loss: 0.3386086684967721
Epoch: 78, step: 1425, loss: 0.3732629716396332, mean loss: 0.33860897232730697
Epoch: 78, step: 1426, loss: 0.32775232195854187, mean loss: 0.338608877142794
Epoch: 78, step: 1427, loss: 0.35022181272506714, mean loss: 0.3386089789570635
Epoch: 78, step: 1428, loss: 0.35571369528770447, mean loss: 0.33860912891819245
Epoch: 78, step: 1429, loss: 0.3309714198112488, mean loss: 0.33860906195716156
Epoch: 78, step: 1430, loss: 0.2960270345211029, mean loss: 0.3386086886369137
Epoch: 78, step: 1431, loss: 0.33872637152671814, mean loss: 0.3386086896686405
Epoch: 78, step: 1432, loss: 0.31481289863586426, mean loss: 0.3386084810525792
Epoch: 78, step: 1433, loss: 0.31883054971694946, mean loss: 0.33860830766233724
Epoch: 78, step: 1434, loss: 0.3298896849155426, mean loss: 0.3386082312281122
Epoch: 78, step: 1435, loss: 0.31451842188835144, mean loss: 0.33860802003996704
Epoch: 78, step: 1436, loss: 0.32641467452049255, mean loss: 0.3386079131454951
Epoch: 78, step: 1437, loss: 0.33234140276908875, mean loss: 0.33860785820983824
Epoch: 78, step: 1438, loss: 0.34713923931121826, mean loss: 0.33860793299993475
Epoch: 78, step: 1439, loss: 0.32114899158477783, mean loss: 0.33860777994799024
Epoch: 78, step: 1440, loss: 0.33584851026535034, mean loss: 0.3386077557593594
Epoch: 78, step: 1441, loss: 0.34860682487487793, mean loss: 0.3386078434135936
Epoch: 78, step: 1442, loss: 0.28415337204933167, mean loss: 0.33860736605684266
Epoch: 78, step: 1443, loss: 0.3595963716506958, mean loss: 0.33860755004826587
Valid: 78, mean loss: 0.18509584665298462
Epoch: 79, step: 0, loss: 0.30552247166633606, mean loss: 0.3386072600241735
Epoch: 79, step: 1, loss: 0.2993444502353668, mean loss: 0.33860691584904956
Epoch: 79, step: 2, loss: 0.2853591740131378, mean loss: 0.33860644908705273
Epoch: 79, step: 3, loss: 0.32285940647125244, mean loss: 0.3386063110519667
Epoch: 79, step: 4, loss: 0.354192852973938, mean loss: 0.3386064476789416
Epoch: 79, step: 5, loss: 0.3232657015323639, mean loss: 0.3386063132077179
Epoch: 79, step: 6, loss: 0.3297041654586792, mean loss: 0.33860623517551547
Epoch: 79, step: 7, loss: 0.33140262961387634, mean loss: 0.3386061720325194
Epoch: 79, step: 8, loss: 0.3450280427932739, mean loss: 0.3386062283227483
Epoch: 79, step: 9, loss: 0.33653295040130615, mean loss: 0.33860621014980924
Epoch: 79, step: 10, loss: 0.3561479449272156, mean loss: 0.33860636390733445
Epoch: 79, step: 11, loss: 0.3299804925918579, mean loss: 0.33860628830016004
Epoch: 79, step: 12, loss: 0.37316766381263733, mean loss: 0.33860659123361997
Epoch: 79, step: 13, loss: 0.3452232778072357, mean loss: 0.33860664922894446
Epoch: 79, step: 14, loss: 0.3047320544719696, mean loss: 0.3386063523203824
Epoch: 79, step: 15, loss: 0.323358416557312, mean loss: 0.33860621867441454
Epoch: 79, step: 16, loss: 0.32575613260269165, mean loss: 0.33860610604624214
Epoch: 79, step: 17, loss: 0.2998126447200775, mean loss: 0.33860576603308346
Epoch: 79, step: 18, loss: 0.32381778955459595, mean loss: 0.33860563642200076
Epoch: 79, step: 19, loss: 0.41726821660995483, mean loss: 0.3386063258640512
Epoch: 79, step: 20, loss: 0.34842532873153687, mean loss: 0.3386064119224302
Epoch: 79, step: 21, loss: 0.3450455069541931, mean loss: 0.3386064683572058
Epoch: 79, step: 22, loss: 0.34157562255859375, mean loss: 0.33860649437981954
Epoch: 79, step: 23, loss: 0.3184666633605957, mean loss: 0.3386063178694688
Epoch: 79, step: 24, loss: 0.31755879521369934, mean loss: 0.3386061334055057
Epoch: 79, step: 25, loss: 0.3511739671230316, mean loss: 0.3386062435511098
Epoch: 79, step: 26, loss: 0.31678998470306396, mean loss: 0.33860605235316715
Epoch: 79, step: 27, loss: 0.3191397488117218, mean loss: 0.33860588175175493
Epoch: 79, step: 28, loss: 0.3227805495262146, mean loss: 0.3386057430607929
Epoch: 79, step: 29, loss: 0.32896316051483154, mean loss: 0.3386056585553107
Epoch: 79, step: 30, loss: 0.3343895971775055, mean loss: 0.33860562160699575
Epoch: 79, step: 31, loss: 0.34120965003967285, mean loss: 0.3386056444277308
Epoch: 79, step: 32, loss: 0.361285537481308, mean loss: 0.33860584318412207
Epoch: 79, step: 33, loss: 0.34425434470176697, mean loss: 0.3386058926846174
Epoch: 79, step: 34, loss: 0.33352717757225037, mean loss: 0.33860584817782036
Epoch: 79, step: 35, loss: 0.3342326283454895, mean loss: 0.33860580985389443
Epoch: 79, step: 36, loss: 0.3763144910335541, mean loss: 0.33860614030424785
Epoch: 79, step: 37, loss: 0.35157132148742676, mean loss: 0.3386062539202913
Epoch: 79, step: 38, loss: 0.3161415159702301, mean loss: 0.33860605705977387
Epoch: 79, step: 39, loss: 0.32910946011543274, mean loss: 0.3386059738409707
Epoch: 79, step: 40, loss: 0.3400394320487976, mean loss: 0.33860598640227363
Epoch: 79, step: 41, loss: 0.3130994737148285, mean loss: 0.3386057628922867
Epoch: 79, step: 42, loss: 0.2944639027118683, mean loss: 0.33860537608675756
Epoch: 79, step: 43, loss: 0.31039029359817505, mean loss: 0.33860512884628713
Epoch: 79, step: 44, loss: 0.33110055327415466, mean loss: 0.33860506308647453
Epoch: 79, step: 45, loss: 0.35337886214256287, mean loss: 0.33860519254266225
Epoch: 79, step: 46, loss: 0.3944736123085022, mean loss: 0.3386056820883258
Epoch: 79, step: 47, loss: 0.30018895864486694, mean loss: 0.3386053454656746
Epoch: 79, step: 48, loss: 0.34110745787620544, mean loss: 0.33860536738998925
Epoch: 79, step: 49, loss: 0.35885196924209595, mean loss: 0.3386055447956799
Epoch: 79, step: 50, loss: 0.3466557562351227, mean loss: 0.33860561533298866
Epoch: 79, step: 51, loss: 0.347507119178772, mean loss: 0.3386056933287815
Epoch: 79, step: 52, loss: 0.3466033935546875, mean loss: 0.3386057634047501
Epoch: 79, step: 53, loss: 0.33779680728912354, mean loss: 0.3386057563167267
Epoch: 79, step: 54, loss: 0.32997655868530273, mean loss: 0.3386056807088933
Epoch: 79, step: 55, loss: 0.3518078625202179, mean loss: 0.3386057963835666
Epoch: 79, step: 56, loss: 0.3700832426548004, mean loss: 0.33860607217975414
Epoch: 79, step: 57, loss: 0.35402339696884155, mean loss: 0.3386062072606659
Epoch: 79, step: 58, loss: 0.3410528898239136, mean loss: 0.3386062286974081
Epoch: 79, step: 59, loss: 0.3189261257648468, mean loss: 0.33860605627062834
Epoch: 79, step: 60, loss: 0.32894328236579895, mean loss: 0.3386059716111936
Epoch: 79, step: 61, loss: 0.30259573459625244, mean loss: 0.3386056561138394
Epoch: 79, step: 62, loss: 0.36509254574775696, mean loss: 0.3386058881720284
Epoch: 79, step: 63, loss: 0.35133999586105347, mean loss: 0.33860599973771693
Epoch: 79, step: 64, loss: 0.32039204239845276, mean loss: 0.3386058401635294
Epoch: 79, step: 65, loss: 0.3253116011619568, mean loss: 0.33860572369247577
Epoch: 79, step: 66, loss: 0.33314722776412964, mean loss: 0.3386056758709192
Epoch: 79, step: 67, loss: 0.34628111124038696, mean loss: 0.3386057431143606
Epoch: 79, step: 68, loss: 0.3345962166786194, mean loss: 0.33860570798775463
Epoch: 79, step: 69, loss: 0.32983696460723877, mean loss: 0.3386056311673371
Epoch: 79, step: 70, loss: 0.348834753036499, mean loss: 0.33860572078092194
Epoch: 79, step: 71, loss: 0.3252682685852051, mean loss: 0.3386056039374188
Epoch: 79, step: 72, loss: 0.35973143577575684, mean loss: 0.33860578900984023
Epoch: 79, step: 73, loss: 0.34781140089035034, mean loss: 0.33860586965470996
Epoch: 79, step: 74, loss: 0.33140113949775696, mean loss: 0.33860580653892336
Epoch: 79, step: 75, loss: 0.35426008701324463, mean loss: 0.33860594367432595
Epoch: 79, step: 76, loss: 0.3169848322868347, mean loss: 0.3386057542696551
Epoch: 79, step: 77, loss: 0.334499329328537, mean loss: 0.3386057182969784
Epoch: 79, step: 78, loss: 0.3223171830177307, mean loss: 0.33860557560909543
Epoch: 79, step: 79, loss: 0.3373701274394989, mean loss: 0.33860556478664044
Epoch: 79, step: 80, loss: 0.3235173225402832, mean loss: 0.3386054326156632
Epoch: 79, step: 81, loss: 0.32307663559913635, mean loss: 0.33860529658667693
Epoch: 79, step: 82, loss: 0.34268438816070557, mean loss: 0.33860533231834566
Epoch: 79, step: 83, loss: 0.33020663261413574, mean loss: 0.33860525874879677
Epoch: 79, step: 84, loss: 0.34515535831451416, mean loss: 0.3386053161247795
Epoch: 79, step: 85, loss: 0.30418258905410767, mean loss: 0.33860501459951653
Epoch: 79, step: 86, loss: 0.3705502450466156, mean loss: 0.338605294420741
Epoch: 79, step: 87, loss: 0.3576357662677765, mean loss: 0.3386054611148989
Epoch: 79, step: 88, loss: 0.31230735778808594, mean loss: 0.3386052307631858
Epoch: 79, step: 89, loss: 0.3081150949001312, mean loss: 0.33860496369474286
Epoch: 79, step: 90, loss: 0.35441339015960693, mean loss: 0.3386051021623076
Epoch: 79, step: 91, loss: 0.34948402643203735, mean loss: 0.33860519745104234
Epoch: 79, step: 92, loss: 0.3136349022388458, mean loss: 0.33860497873759815
Epoch: 79, step: 93, loss: 0.3431381583213806, mean loss: 0.33860501844312135
Epoch: 79, step: 94, loss: 0.37989333271980286, mean loss: 0.33860538007886315
Epoch: 79, step: 95, loss: 0.32419440150260925, mean loss: 0.3386052538572101
Epoch: 79, step: 96, loss: 0.3208388388156891, mean loss: 0.3386050982476085
Epoch: 79, step: 97, loss: 0.3917224109172821, mean loss: 0.3386055634788579
Epoch: 79, step: 98, loss: 0.341277152299881, mean loss: 0.3386055868779279
Epoch: 79, step: 99, loss: 0.30334657430648804, mean loss: 0.3386052780651076
Epoch: 79, step: 100, loss: 0.3400646448135376, mean loss: 0.33860529084672514
Epoch: 79, step: 101, loss: 0.36493149399757385, mean loss: 0.33860552141831646
Epoch: 79, step: 102, loss: 0.3667142689228058, mean loss: 0.338605767599729
Epoch: 79, step: 103, loss: 0.3121684491634369, mean loss: 0.3386055360590175
Epoch: 79, step: 104, loss: 0.35649198293685913, mean loss: 0.3386056927089582
Epoch: 79, step: 105, loss: 0.3332615792751312, mean loss: 0.33860564590549147
Epoch: 79, step: 106, loss: 0.3419877588748932, mean loss: 0.338605675525601
Epoch: 79, step: 107, loss: 0.3256462812423706, mean loss: 0.33860556202988984
Epoch: 79, step: 108, loss: 0.29916420578956604, mean loss: 0.33860521661362464
Epoch: 79, step: 109, loss: 0.34381577372550964, mean loss: 0.33860526224581344
Epoch: 79, step: 110, loss: 0.36371880769729614, mean loss: 0.3386054821793037
Epoch: 79, step: 111, loss: 0.3592764437198639, mean loss: 0.33860566320499413
Epoch: 79, step: 112, loss: 0.3060505986213684, mean loss: 0.33860537810691477
Epoch: 79, step: 113, loss: 0.3646422326564789, mean loss: 0.33860560612035334
Epoch: 79, step: 114, loss: 0.3136662542819977, mean loss: 0.33860538772002546
Epoch: 79, step: 115, loss: 0.3556770980358124, mean loss: 0.3386055372200808
Epoch: 79, step: 116, loss: 0.3016393482685089, mean loss: 0.33860521350331224
Epoch: 79, step: 117, loss: 0.34583622217178345, mean loss: 0.3386052768254541
Epoch: 79, step: 118, loss: 0.31573498249053955, mean loss: 0.33860507655141114
Epoch: 79, step: 119, loss: 0.30113133788108826, mean loss: 0.33860474839859783
Epoch: 79, step: 120, loss: 0.34377413988113403, mean loss: 0.33860479366591206
Epoch: 79, step: 121, loss: 0.3265668451786041, mean loss: 0.33860468825295836
Epoch: 79, step: 122, loss: 0.31659480929374695, mean loss: 0.33860449552028155
Epoch: 79, step: 123, loss: 0.315973162651062, mean loss: 0.33860429734748937
Epoch: 79, step: 124, loss: 0.2979103922843933, mean loss: 0.33860394101168617
Epoch: 79, step: 125, loss: 0.32528871297836304, mean loss: 0.33860382441803605
Epoch: 79, step: 126, loss: 0.32525917887687683, mean loss: 0.3386037075678172
Epoch: 79, step: 127, loss: 0.32140037417411804, mean loss: 0.3386035569309447
Epoch: 79, step: 128, loss: 0.31003665924072266, mean loss: 0.33860330679393064
Epoch: 79, step: 129, loss: 0.34098806977272034, mean loss: 0.3386033276751714
Epoch: 79, step: 130, loss: 0.30884850025177, mean loss: 0.3386030671409885
Epoch: 79, step: 131, loss: 0.3563690483570099, mean loss: 0.33860322269910365
Epoch: 79, step: 132, loss: 0.3551217019557953, mean loss: 0.33860336733288254
Epoch: 79, step: 133, loss: 0.31122225522994995, mean loss: 0.33860312758932154
Epoch: 79, step: 134, loss: 0.3358229100704193, mean loss: 0.3386031032465041
Epoch: 79, step: 135, loss: 0.35437315702438354, mean loss: 0.33860324132353437
Epoch: 79, step: 136, loss: 0.3461052179336548, mean loss: 0.3386033070076212
Epoch: 79, step: 137, loss: 0.36296606063842773, mean loss: 0.33860352031556623
Epoch: 79, step: 138, loss: 0.3035627603530884, mean loss: 0.33860321351908623
Epoch: 79, step: 139, loss: 0.367641419172287, mean loss: 0.3386034677584717
Epoch: 79, step: 140, loss: 0.3815052807331085, mean loss: 0.3386038433751748
Epoch: 79, step: 141, loss: 0.3523902893066406, mean loss: 0.3386039640780932
Epoch: 79, step: 142, loss: 0.3287715017795563, mean loss: 0.3386038779937964
Epoch: 79, step: 143, loss: 0.29570120573043823, mean loss: 0.3386035023794358
Epoch: 79, step: 144, loss: 0.33229461312294006, mean loss: 0.33860344714537854
Epoch: 79, step: 145, loss: 0.30731961131095886, mean loss: 0.3386031732591234
Epoch: 79, step: 146, loss: 0.3319057524204254, mean loss: 0.33860311462451537
Epoch: 79, step: 147, loss: 0.33631017804145813, mean loss: 0.33860309455048027
Epoch: 79, step: 148, loss: 0.3045833110809326, mean loss: 0.338602796719152
Epoch: 79, step: 149, loss: 0.3287768065929413, mean loss: 0.3386027106967917
Epoch: 79, step: 150, loss: 0.2990635335445404, mean loss: 0.33860236455115933
Epoch: 79, step: 151, loss: 0.290839284658432, mean loss: 0.3386019464130505
Epoch: 79, step: 152, loss: 0.3158434331417084, mean loss: 0.3386017471771886
Epoch: 79, step: 153, loss: 0.40763065218925476, mean loss: 0.3386023514747025
Epoch: 79, step: 154, loss: 0.38117197155952454, mean loss: 0.3386027241372905
Epoch: 79, step: 155, loss: 0.3282875120639801, mean loss: 0.3386026338367436
Epoch: 79, step: 156, loss: 0.3126169741153717, mean loss: 0.33860240635729616
Epoch: 79, step: 157, loss: 0.32656100392341614, mean loss: 0.33860230094732685
Epoch: 79, step: 158, loss: 0.37459316849708557, mean loss: 0.33860261600722574
Epoch: 79, step: 159, loss: 0.29510971903800964, mean loss: 0.3386022352787604
Epoch: 79, step: 160, loss: 0.34564536809921265, mean loss: 0.3386022969324524
Epoch: 79, step: 161, loss: 0.30418938398361206, mean loss: 0.3386019956936969
Epoch: 79, step: 162, loss: 0.34744325280189514, mean loss: 0.33860207308633083
Epoch: 79, step: 163, loss: 0.33125582337379456, mean loss: 0.33860200878092367
Epoch: 79, step: 164, loss: 0.2946600317955017, mean loss: 0.33860162413813355
Epoch: 79, step: 165, loss: 0.3295896649360657, mean loss: 0.3386015452533171
Epoch: 79, step: 166, loss: 0.3492618799209595, mean loss: 0.3386016385661211
Epoch: 79, step: 167, loss: 0.32766684889793396, mean loss: 0.33860154285177574
Epoch: 79, step: 168, loss: 0.35571154952049255, mean loss: 0.3386016926176882
Epoch: 79, step: 169, loss: 0.3467852473258972, mean loss: 0.33860176424868366
Epoch: 79, step: 170, loss: 0.3388565182685852, mean loss: 0.3386017664785367
Epoch: 79, step: 171, loss: 0.3678702116012573, mean loss: 0.33860202266197204
Epoch: 79, step: 172, loss: 0.33797451853752136, mean loss: 0.3386020171695465
Epoch: 79, step: 173, loss: 0.306758314371109, mean loss: 0.3386017384500472
Epoch: 79, step: 174, loss: 0.31631189584732056, mean loss: 0.3386015433546642
Epoch: 79, step: 175, loss: 0.3218258023262024, mean loss: 0.33860139652361504
Epoch: 79, step: 176, loss: 0.31289079785346985, mean loss: 0.33860117149146124
Epoch: 79, step: 177, loss: 0.30407819151878357, mean loss: 0.3386008693315371
Epoch: 79, step: 178, loss: 0.3781188130378723, mean loss: 0.33860121520649844
Epoch: 79, step: 179, loss: 0.305957555770874, mean loss: 0.3386009295001947
Epoch: 79, step: 180, loss: 0.3726610243320465, mean loss: 0.3386012276009223
Epoch: 79, step: 181, loss: 0.32779204845428467, mean loss: 0.3386011329976635
Epoch: 79, step: 182, loss: 0.36774948239326477, mean loss: 0.3386013881053521
Epoch: 79, step: 183, loss: 0.33753034472465515, mean loss: 0.33860137873161344
Epoch: 79, step: 184, loss: 0.29483893513679504, mean loss: 0.3386009957274073
Epoch: 79, step: 185, loss: 0.3415749669075012, mean loss: 0.33860102175505585
Epoch: 79, step: 186, loss: 0.32455986738204956, mean loss: 0.3386008988705318
Epoch: 79, step: 187, loss: 0.3175116181373596, mean loss: 0.3386007143042578
Epoch: 79, step: 188, loss: 0.37455734610557556, mean loss: 0.3386010289818214
Epoch: 79, step: 189, loss: 0.29296472668647766, mean loss: 0.3386006295952821
Epoch: 79, step: 190, loss: 0.34244871139526367, mean loss: 0.33860066327151234
Epoch: 79, step: 191, loss: 0.33816686272621155, mean loss: 0.33860065947516915
Epoch: 79, step: 192, loss: 0.30964455008506775, mean loss: 0.3386004060721518
Epoch: 79, step: 193, loss: 0.3260774314403534, mean loss: 0.338600296481055
Epoch: 79, step: 194, loss: 0.3672332167625427, mean loss: 0.3386005470513684
Epoch: 79, step: 195, loss: 0.36129626631736755, mean loss: 0.33860074566274534
Epoch: 79, step: 196, loss: 0.33022987842559814, mean loss: 0.3386006724095076
Epoch: 79, step: 197, loss: 0.3340562880039215, mean loss: 0.33860063264206786
Epoch: 79, step: 198, loss: 0.34310582280158997, mean loss: 0.3386006720661778
Epoch: 79, step: 199, loss: 0.33084699511528015, mean loss: 0.3386006042157372
Epoch: 79, step: 200, loss: 0.3413088321685791, mean loss: 0.3386006279145388
Epoch: 79, step: 201, loss: 0.3335769772529602, mean loss: 0.3386005839546282
Epoch: 79, step: 202, loss: 0.32456913590431213, mean loss: 0.3386004611722443
Epoch: 79, step: 203, loss: 0.30801281332969666, mean loss: 0.3386001935169429
Epoch: 79, step: 204, loss: 0.33338335156440735, mean loss: 0.3386001478676928
Epoch: 79, step: 205, loss: 0.3038085699081421, mean loss: 0.3385998434314915
Epoch: 79, step: 206, loss: 0.3221927285194397, mean loss: 0.33859969986582633
Epoch: 79, step: 207, loss: 0.34424832463264465, mean loss: 0.33859974929203446
Epoch: 79, step: 208, loss: 0.31655746698379517, mean loss: 0.3385995564208588
Epoch: 79, step: 209, loss: 0.3307037651538849, mean loss: 0.33859948733285794
Epoch: 79, step: 210, loss: 0.3185119330883026, mean loss: 0.33859931156873563
Epoch: 79, step: 211, loss: 0.3414386808872223, mean loss: 0.3385993364127203
Epoch: 79, step: 212, loss: 0.31662020087242126, mean loss: 0.33859914410081327
Epoch: 79, step: 213, loss: 0.29940545558929443, mean loss: 0.33859880116889873
Epoch: 79, step: 214, loss: 0.3100888133049011, mean loss: 0.33859855171804204
Epoch: 79, step: 215, loss: 0.35849425196647644, mean loss: 0.33859872579584493
Epoch: 79, step: 216, loss: 0.3388500213623047, mean loss: 0.338598727994541
Epoch: 79, step: 217, loss: 0.3063373267650604, mean loss: 0.33859844572774456
Epoch: 79, step: 218, loss: 0.3367461562156677, mean loss: 0.3385984295215281
Epoch: 79, step: 219, loss: 0.31795233488082886, mean loss: 0.33859824888445733
Epoch: 79, step: 220, loss: 0.3280884027481079, mean loss: 0.33859815693238393
Epoch: 79, step: 221, loss: 0.33354610204696655, mean loss: 0.33859811273165524
Epoch: 79, step: 222, loss: 0.3338428735733032, mean loss: 0.338598071128149
Epoch: 79, step: 223, loss: 0.3498850464820862, mean loss: 0.33859816987683977
Epoch: 79, step: 224, loss: 0.31311357021331787, mean loss: 0.33859794691641365
Epoch: 79, step: 225, loss: 0.34884151816368103, mean loss: 0.33859803653489146
Epoch: 79, step: 226, loss: 0.3040837049484253, mean loss: 0.33859773458016074
Epoch: 79, step: 227, loss: 0.33479318022727966, mean loss: 0.33859770129563566
Epoch: 79, step: 228, loss: 0.3280847370624542, mean loss: 0.33859760932271904
Epoch: 79, step: 229, loss: 0.357072651386261, mean loss: 0.33859777095064814
Epoch: 79, step: 230, loss: 0.3134109079837799, mean loss: 0.33859755060663627
Epoch: 79, step: 231, loss: 0.3466191589832306, mean loss: 0.3385976207820254
Epoch: 79, step: 232, loss: 0.33055058121681213, mean loss: 0.3385975503847726
Epoch: 79, step: 233, loss: 0.3196704387664795, mean loss: 0.3385973848077311
Epoch: 79, step: 234, loss: 0.2948984205722809, mean loss: 0.3385970025263738
Epoch: 79, step: 235, loss: 0.37411853671073914, mean loss: 0.33859731326832726
Epoch: 79, step: 236, loss: 0.35803940892219543, mean loss: 0.33859748334605816
Epoch: 79, step: 237, loss: 0.3425115644931793, mean loss: 0.3385975175857939
Epoch: 79, step: 238, loss: 0.3094661235809326, mean loss: 0.3385972627513976
Epoch: 79, step: 239, loss: 0.298000693321228, mean loss: 0.33859690762552347
Epoch: 79, step: 240, loss: 0.35204601287841797, mean loss: 0.33859702527298846
Epoch: 79, step: 241, loss: 0.31256869435310364, mean loss: 0.3385967975894135
Epoch: 79, step: 242, loss: 0.31037023663520813, mean loss: 0.33859655067891786
Epoch: 79, step: 243, loss: 0.38108429312705994, mean loss: 0.3385969223351674
Epoch: 79, step: 244, loss: 0.34331777691841125, mean loss: 0.3385969636298953
Epoch: 79, step: 245, loss: 0.34822311997413635, mean loss: 0.3385970478320291
Epoch: 79, step: 246, loss: 0.3084295094013214, mean loss: 0.33859678395215864
Epoch: 79, step: 247, loss: 0.3184337615966797, mean loss: 0.3385966075847961
Epoch: 79, step: 248, loss: 0.33224013447761536, mean loss: 0.3385965519847689
Epoch: 79, step: 249, loss: 0.32712894678115845, mean loss: 0.3385964516785813
Epoch: 79, step: 250, loss: 0.306735098361969, mean loss: 0.3385961729924152
Epoch: 79, step: 251, loss: 0.34561285376548767, mean loss: 0.33859623436566383
Epoch: 79, step: 252, loss: 0.3247671127319336, mean loss: 0.33859611340666274
Epoch: 79, step: 253, loss: 0.34798383712768555, mean loss: 0.33859619551742737
Epoch: 79, step: 254, loss: 0.3776074945926666, mean loss: 0.33859653673108836
Epoch: 79, step: 255, loss: 0.321804404258728, mean loss: 0.33859638985941226
Epoch: 79, step: 256, loss: 0.32420405745506287, mean loss: 0.33859626397858694
Epoch: 79, step: 257, loss: 0.3198621869087219, mean loss: 0.33859610012464086
Epoch: 79, step: 258, loss: 0.3083370327949524, mean loss: 0.3385958354719332
Epoch: 79, step: 259, loss: 0.3204866051673889, mean loss: 0.3385956770858579
Epoch: 79, step: 260, loss: 0.3062138855457306, mean loss: 0.33859539387227405
Epoch: 79, step: 261, loss: 0.3303588330745697, mean loss: 0.338595321835324
Epoch: 79, step: 262, loss: 0.2923326790332794, mean loss: 0.3385949172258486
Epoch: 79, step: 263, loss: 0.3249928057193756, mean loss: 0.3385947982638799
Epoch: 79, step: 264, loss: 0.3198152184486389, mean loss: 0.3385946340220085
Epoch: 79, step: 265, loss: 0.3251979649066925, mean loss: 0.3385945168588566
Epoch: 79, step: 266, loss: 0.3292785882949829, mean loss: 0.3385944353853203
Epoch: 79, step: 267, loss: 0.3461054861545563, mean loss: 0.3385945010735136
Epoch: 79, step: 268, loss: 0.3355821371078491, mean loss: 0.3385944747289951
Epoch: 79, step: 269, loss: 0.34113389253616333, mean loss: 0.33859449693718613
Epoch: 79, step: 270, loss: 0.32444220781326294, mean loss: 0.3385943731710259
Epoch: 79, step: 271, loss: 0.3953372538089752, mean loss: 0.33859486940078626
Epoch: 79, step: 272, loss: 0.3256995379924774, mean loss: 0.3385947566290838
Epoch: 79, step: 273, loss: 0.3288099765777588, mean loss: 0.3385946710603907
Epoch: 79, step: 274, loss: 0.32568106055259705, mean loss: 0.3385945581308098
Epoch: 79, step: 275, loss: 0.3608326315879822, mean loss: 0.33859475260115973
Epoch: 79, step: 276, loss: 0.34999778866767883, mean loss: 0.3385948523190164
Epoch: 79, step: 277, loss: 0.3460052013397217, mean loss: 0.33859491712085127
Epoch: 79, step: 278, loss: 0.37459561228752136, mean loss: 0.33859523193607727
Epoch: 79, step: 279, loss: 0.2990463078022003, mean loss: 0.33859488609568295
Epoch: 79, step: 280, loss: 0.316936731338501, mean loss: 0.3385946967049613
Epoch: 79, step: 281, loss: 0.3528546988964081, mean loss: 0.33859482140111014
Epoch: 79, step: 282, loss: 0.31934237480163574, mean loss: 0.33859465305015746
Epoch: 79, step: 283, loss: 0.3072364926338196, mean loss: 0.3385943788444875
Epoch: 79, step: 284, loss: 0.3121911883354187, mean loss: 0.33859414796866
Epoch: 79, step: 285, loss: 0.31492137908935547, mean loss: 0.3385939409701038
Epoch: 79, step: 286, loss: 0.3577328622341156, mean loss: 0.3385941083224928
Epoch: 79, step: 287, loss: 0.33086681365966797, mean loss: 0.33859404075494826
Epoch: 79, step: 288, loss: 0.34747761487960815, mean loss: 0.33859411843233317
Epoch: 79, step: 289, loss: 0.3412984013557434, mean loss: 0.33859414207819755
Epoch: 79, step: 290, loss: 0.35188284516334534, mean loss: 0.3385942582717069
Epoch: 79, step: 291, loss: 0.32131779193878174, mean loss: 0.33859410721138994
Epoch: 79, step: 292, loss: 0.33124256134033203, mean loss: 0.338594042932207
Epoch: 79, step: 293, loss: 0.3629254996776581, mean loss: 0.33859425567555534
Epoch: 79, step: 294, loss: 0.29627448320388794, mean loss: 0.33859388565367504
Epoch: 79, step: 295, loss: 0.32872289419174194, mean loss: 0.3385937993476608
Epoch: 79, step: 296, loss: 0.3240578770637512, mean loss: 0.33859367225540754
Epoch: 79, step: 297, loss: 0.327543169260025, mean loss: 0.3385935756381432
Epoch: 79, step: 298, loss: 0.3728688657283783, mean loss: 0.33859387531281065
Epoch: 79, step: 299, loss: 0.32495877146720886, mean loss: 0.3385937560998303
Epoch: 79, step: 300, loss: 0.3741467595100403, mean loss: 0.3385940669403263
Epoch: 79, step: 301, loss: 0.3141278624534607, mean loss: 0.3385938530337666
Epoch: 79, step: 302, loss: 0.3231019973754883, mean loss: 0.3385937175905851
Epoch: 79, step: 303, loss: 0.3552361726760864, mean loss: 0.3385938630920284
Epoch: 79, step: 304, loss: 0.3333709239959717, mean loss: 0.3385938174293825
Epoch: 79, step: 305, loss: 0.3314613997936249, mean loss: 0.3385937550732632
Epoch: 79, step: 306, loss: 0.3366403877735138, mean loss: 0.33859373799583653
Epoch: 79, step: 307, loss: 0.32891398668289185, mean loss: 0.33859365337079006
Epoch: 79, step: 308, loss: 0.33324965834617615, mean loss: 0.338593606651421
Epoch: 79, step: 309, loss: 0.33593428134918213, mean loss: 0.33859358340272533
Epoch: 79, step: 310, loss: 0.3536234498023987, mean loss: 0.33859371479760764
Epoch: 79, step: 311, loss: 0.300641268491745, mean loss: 0.3385933830106518
Epoch: 79, step: 312, loss: 0.30340445041656494, mean loss: 0.3385930753855078
Epoch: 79, step: 313, loss: 0.31910738348960876, mean loss: 0.338592905041143
Epoch: 79, step: 314, loss: 0.332387775182724, mean loss: 0.33859285079622986
Epoch: 79, step: 315, loss: 0.2875376343727112, mean loss: 0.33859240447816197
Epoch: 79, step: 316, loss: 0.3310188353061676, mean loss: 0.33859233827158314
Epoch: 79, step: 317, loss: 0.34321504831314087, mean loss: 0.33859237868200714
Epoch: 79, step: 318, loss: 0.3069111406803131, mean loss: 0.33859210173600424
Epoch: 79, step: 319, loss: 0.3443402647972107, mean loss: 0.33859215198394177
Epoch: 79, step: 320, loss: 0.3124145567417145, mean loss: 0.33859192315280773
Epoch: 79, step: 321, loss: 0.3416881561279297, mean loss: 0.33859195021825444
Epoch: 79, step: 322, loss: 0.3536032438278198, mean loss: 0.3385920814370029
Epoch: 79, step: 323, loss: 0.33230435848236084, mean loss: 0.3385920264743897
Epoch: 79, step: 324, loss: 0.3200068473815918, mean loss: 0.33859186401795055
Epoch: 79, step: 325, loss: 0.31917908787727356, mean loss: 0.338591694328818
Epoch: 79, step: 326, loss: 0.3435814678668976, mean loss: 0.3385917379445758
Epoch: 79, step: 327, loss: 0.3273521065711975, mean loss: 0.33859163969948497
Epoch: 79, step: 328, loss: 0.3423721492290497, mean loss: 0.3385916727444527
Epoch: 79, step: 329, loss: 0.3417547047138214, mean loss: 0.33859170039188347
Epoch: 79, step: 330, loss: 0.3145831823348999, mean loss: 0.3385914905400557
Epoch: 79, step: 331, loss: 0.2852833569049835, mean loss: 0.33859102459245033
Epoch: 79, step: 332, loss: 0.3233812749385834, mean loss: 0.33859089165055195
Epoch: 79, step: 333, loss: 0.31478795409202576, mean loss: 0.3385906836011021
Epoch: 79, step: 334, loss: 0.3351806104183197, mean loss: 0.338590653795636
Epoch: 79, step: 335, loss: 0.3603037893772125, mean loss: 0.3385908435758652
Epoch: 79, step: 336, loss: 0.3121034801006317, mean loss: 0.33859061206927527
Epoch: 79, step: 337, loss: 0.297319620847702, mean loss: 0.3385902513530061
Epoch: 79, step: 338, loss: 0.3415694236755371, mean loss: 0.3385902773913081
Epoch: 79, step: 339, loss: 0.3136219382286072, mean loss: 0.338590059167116
Epoch: 79, step: 340, loss: 0.2858656644821167, mean loss: 0.33858959835801694
Epoch: 79, step: 341, loss: 0.33059918880462646, mean loss: 0.33858952852276764
Epoch: 79, step: 342, loss: 0.38012710213661194, mean loss: 0.33858989155315256
Epoch: 79, step: 343, loss: 0.2743176817893982, mean loss: 0.33858932983134027
Epoch: 79, step: 344, loss: 0.311776340007782, mean loss: 0.3385890954950749
Epoch: 79, step: 345, loss: 0.38729310035705566, mean loss: 0.3385895211475269
Epoch: 79, step: 346, loss: 0.32819753885269165, mean loss: 0.33858943032678024
Epoch: 79, step: 347, loss: 0.3204188644886017, mean loss: 0.3385892715264775
Epoch: 79, step: 348, loss: 0.3250269591808319, mean loss: 0.33858915300069775
Epoch: 79, step: 349, loss: 0.3190629780292511, mean loss: 0.33858898235613294
Epoch: 79, step: 350, loss: 0.3501362204551697, mean loss: 0.3385890832697119
Epoch: 79, step: 351, loss: 0.3398943543434143, mean loss: 0.3385890946766322
Epoch: 79, step: 352, loss: 0.3544418513774872, mean loss: 0.33858923321456136
Epoch: 79, step: 353, loss: 0.324693888425827, mean loss: 0.33858911178360107
Epoch: 79, step: 354, loss: 0.31807947158813477, mean loss: 0.33858893255209743
Epoch: 79, step: 355, loss: 0.323477566242218, mean loss: 0.33858880049667317
Epoch: 79, step: 356, loss: 0.3370358347892761, mean loss: 0.3385887869257128
Epoch: 79, step: 357, loss: 0.32770615816116333, mean loss: 0.33858869182610285
Epoch: 79, step: 358, loss: 0.35366395115852356, mean loss: 0.3385888235625413
Epoch: 79, step: 359, loss: 0.3116092085838318, mean loss: 0.3385885878009367
Epoch: 79, step: 360, loss: 0.3113998770713806, mean loss: 0.33858835021422323
Epoch: 79, step: 361, loss: 0.3181364834308624, mean loss: 0.33858817149852755
Epoch: 79, step: 362, loss: 0.3408328890800476, mean loss: 0.3385881911134978
Epoch: 79, step: 363, loss: 0.3283850848674774, mean loss: 0.3385881019566799
Epoch: 79, step: 364, loss: 0.3446106016635895, mean loss: 0.3385881545820476
Epoch: 79, step: 365, loss: 0.3051997721195221, mean loss: 0.33858786283266834
Epoch: 79, step: 366, loss: 0.34591615200042725, mean loss: 0.33858792686707123
Epoch: 79, step: 367, loss: 0.3068758249282837, mean loss: 0.33858764976995875
Epoch: 79, step: 368, loss: 0.32285773754119873, mean loss: 0.33858751232479095
Epoch: 79, step: 369, loss: 0.32842811942100525, mean loss: 0.33858742355460325
Epoch: 79, step: 370, loss: 0.33974358439445496, mean loss: 0.3385874336567539
Epoch: 79, step: 371, loss: 0.3227621614933014, mean loss: 0.3385872953819727
Epoch: 79, step: 372, loss: 0.3400537073612213, mean loss: 0.33858730819477123
Epoch: 79, step: 373, loss: 0.3611568510532379, mean loss: 0.3385875053947962
Epoch: 79, step: 374, loss: 0.3322267532348633, mean loss: 0.3385874498185919
Epoch: 79, step: 375, loss: 0.33061519265174866, mean loss: 0.338587380162691
Epoch: 79, step: 376, loss: 0.3553905487060547, mean loss: 0.33858752697551847
Epoch: 79, step: 377, loss: 0.3052571415901184, mean loss: 0.3385872357634561
Epoch: 79, step: 378, loss: 0.28833362460136414, mean loss: 0.338586796694729
Epoch: 79, step: 379, loss: 0.2994001805782318, mean loss: 0.33858645432197343
Epoch: 79, step: 380, loss: 0.31415125727653503, mean loss: 0.33858624083396444
Epoch: 79, step: 381, loss: 0.33066466450691223, mean loss: 0.33858617162450483
Epoch: 79, step: 382, loss: 0.34539806842803955, mean loss: 0.33858623113836395
Epoch: 79, step: 383, loss: 0.3097987771034241, mean loss: 0.3385859796316888
Epoch: 79, step: 384, loss: 0.3557511568069458, mean loss: 0.3385861295969798
Epoch: 79, step: 385, loss: 0.3286742568016052, mean loss: 0.3385860430016661
Epoch: 79, step: 386, loss: 0.3432438373565674, mean loss: 0.33858608369424237
Epoch: 79, step: 387, loss: 0.3524121642112732, mean loss: 0.33858620448401483
Epoch: 79, step: 388, loss: 0.329545795917511, mean loss: 0.33858612550433925
Epoch: 79, step: 389, loss: 0.33254194259643555, mean loss: 0.338586072701036
Epoch: 79, step: 390, loss: 0.3128168284893036, mean loss: 0.3385858475772518
Epoch: 79, step: 391, loss: 0.332528293132782, mean loss: 0.33858579465805655
Epoch: 79, step: 392, loss: 0.3302759826183319, mean loss: 0.33858572206362453
Epoch: 79, step: 393, loss: 0.32404372096061707, mean loss: 0.3385855950259631
Epoch: 79, step: 394, loss: 0.33430540561676025, mean loss: 0.338585557634926
Epoch: 79, step: 395, loss: 0.33648455142974854, mean loss: 0.3385855392810385
Epoch: 79, step: 396, loss: 0.3380209803581238, mean loss: 0.33858553434922994
Epoch: 79, step: 397, loss: 0.36901360750198364, mean loss: 0.33858580015695183
Epoch: 79, step: 398, loss: 0.3115704357624054, mean loss: 0.33858556416337776
Epoch: 79, step: 399, loss: 0.330407053232193, mean loss: 0.33858549272035976
Epoch: 79, step: 400, loss: 0.3082011640071869, mean loss: 0.33858522730172796
Epoch: 79, step: 401, loss: 0.38830000162124634, mean loss: 0.3385856615753379
Epoch: 79, step: 402, loss: 0.323100209236145, mean loss: 0.33858552630640354
Epoch: 79, step: 403, loss: 0.33765578269958496, mean loss: 0.33858551818495347
Epoch: 79, step: 404, loss: 0.3486466109752655, mean loss: 0.33858560606934296
Epoch: 79, step: 405, loss: 0.334191232919693, mean loss: 0.3385855676845039
Epoch: 79, step: 406, loss: 0.31376883387565613, mean loss: 0.3385853509122861
Epoch: 79, step: 407, loss: 0.3361855745315552, mean loss: 0.33858532995061125
Epoch: 79, step: 408, loss: 0.31553196907043457, mean loss: 0.33858512858483514
Epoch: 79, step: 409, loss: 0.35082849860191345, mean loss: 0.3385852355269068
Epoch: 79, step: 410, loss: 0.3423357605934143, mean loss: 0.33858526828630364
Epoch: 79, step: 411, loss: 0.31539538502693176, mean loss: 0.33858506573334385
Epoch: 79, step: 412, loss: 0.3023729622364044, mean loss: 0.33858474944004496
Epoch: 79, step: 413, loss: 0.32495737075805664, mean loss: 0.3385846304132419
Epoch: 79, step: 414, loss: 0.3316027522087097, mean loss: 0.33858456943134635
Epoch: 79, step: 415, loss: 0.33221060037612915, mean loss: 0.33858451375960463
Epoch: 79, step: 416, loss: 0.3140413463115692, mean loss: 0.338584299395692
Epoch: 79, step: 417, loss: 0.33607032895088196, mean loss: 0.33858427743846764
Epoch: 79, step: 418, loss: 0.31139886379241943, mean loss: 0.33858404000090575
Epoch: 79, step: 419, loss: 0.3400026857852936, mean loss: 0.3385840523912581
Epoch: 79, step: 420, loss: 0.3329991400241852, mean loss: 0.33858400361345287
Epoch: 79, step: 421, loss: 0.3435874581336975, mean loss: 0.3385840473125089
Epoch: 79, step: 422, loss: 0.3372567594051361, mean loss: 0.33858403572037354
Epoch: 79, step: 423, loss: 0.32764363288879395, mean loss: 0.33858394017100385
Epoch: 79, step: 424, loss: 0.35426250100135803, mean loss: 0.3385840771004702
Epoch: 79, step: 425, loss: 0.3396581709384918, mean loss: 0.3385840864810386
Epoch: 79, step: 426, loss: 0.3116351366043091, mean loss: 0.33858385112519745
Epoch: 79, step: 427, loss: 0.35846075415611267, mean loss: 0.33858402471653953
Epoch: 79, step: 428, loss: 0.3110300302505493, mean loss: 0.33858378408080775
Epoch: 79, step: 429, loss: 0.39150434732437134, mean loss: 0.3385842462449148
Epoch: 79, step: 430, loss: 0.31011533737182617, mean loss: 0.33858399762335567
Epoch: 79, step: 431, loss: 0.33173859119415283, mean loss: 0.33858393784232355
Epoch: 79, step: 432, loss: 0.30298474431037903, mean loss: 0.3385836269567728
Epoch: 79, step: 433, loss: 0.37834206223487854, mean loss: 0.33858397416169184
Epoch: 79, step: 434, loss: 0.32886800169944763, mean loss: 0.3385838893141884
Epoch: 79, step: 435, loss: 0.29719078540802, mean loss: 0.33858352784024764
Epoch: 79, step: 436, loss: 0.3216381072998047, mean loss: 0.33858337986210946
Epoch: 79, step: 437, loss: 0.3159603178501129, mean loss: 0.3385831823049373
Epoch: 79, step: 438, loss: 0.3162813186645508, mean loss: 0.3385829875543488
Epoch: 79, step: 439, loss: 0.3553965389728546, mean loss: 0.33858313437707593
Epoch: 79, step: 440, loss: 0.3059937059879303, mean loss: 0.3385828497954995
Epoch: 79, step: 441, loss: 0.3481253981590271, mean loss: 0.3385829331234337
Epoch: 79, step: 442, loss: 0.32990700006484985, mean loss: 0.33858285736366406
Epoch: 79, step: 443, loss: 0.3617284595966339, mean loss: 0.3385830594733587
Epoch: 79, step: 444, loss: 0.3060857057571411, mean loss: 0.3385827757057203
Epoch: 79, step: 445, loss: 0.29108160734176636, mean loss: 0.33858236092804994
Epoch: 79, step: 446, loss: 0.31200116872787476, mean loss: 0.33858212882452315
Epoch: 79, step: 447, loss: 0.3406052887439728, mean loss: 0.33858214649033924
Epoch: 79, step: 448, loss: 0.30825233459472656, mean loss: 0.33858188165897585
Epoch: 79, step: 449, loss: 0.3053654432296753, mean loss: 0.3385815916249362
Epoch: 79, step: 450, loss: 0.38399365544319153, mean loss: 0.3385819881433451
Epoch: 79, step: 451, loss: 0.3079695701599121, mean loss: 0.3385817208513468
Epoch: 79, step: 452, loss: 0.3242732584476471, mean loss: 0.3385815959182521
Epoch: 79, step: 453, loss: 0.3162786662578583, mean loss: 0.3385814011838623
Epoch: 79, step: 454, loss: 0.39163699746131897, mean loss: 0.3385818644260961
Epoch: 79, step: 455, loss: 0.28787490725517273, mean loss: 0.3385814216943079
Epoch: 79, step: 456, loss: 0.3432399332523346, mean loss: 0.33858146236827574
Epoch: 79, step: 457, loss: 0.35637542605400085, mean loss: 0.3385816177279391
Epoch: 79, step: 458, loss: 0.31672683358192444, mean loss: 0.338581426914789
Epoch: 79, step: 459, loss: 0.3294702172279358, mean loss: 0.3385813473659163
Epoch: 79, step: 460, loss: 0.31007763743400574, mean loss: 0.3385810985056359
Epoch: 79, step: 461, loss: 0.30776700377464294, mean loss: 0.3385808294761895
Epoch: 79, step: 462, loss: 0.32017281651496887, mean loss: 0.33858066876225834
Epoch: 79, step: 463, loss: 0.33045873045921326, mean loss: 0.33858059785307115
Epoch: 79, step: 464, loss: 0.3823930323123932, mean loss: 0.3385809803574535
Epoch: 79, step: 465, loss: 0.3990025222301483, mean loss: 0.33858150786301366
Epoch: 79, step: 466, loss: 0.3352714478969574, mean loss: 0.33858147896504553
Epoch: 79, step: 467, loss: 0.3318011164665222, mean loss: 0.338581419770653
Epoch: 79, step: 468, loss: 0.40053513646125793, mean loss: 0.3385819606385799
Epoch: 79, step: 469, loss: 0.3438963294029236, mean loss: 0.3385820070336419
Epoch: 79, step: 470, loss: 0.3645416796207428, mean loss: 0.33858223366264645
Epoch: 79, step: 471, loss: 0.2967298924922943, mean loss: 0.3385818682931841
Epoch: 79, step: 472, loss: 0.30017349123954773, mean loss: 0.33858153299233423
Epoch: 79, step: 473, loss: 0.3265190124511719, mean loss: 0.33858142768879396
Epoch: 79, step: 474, loss: 0.3168996274471283, mean loss: 0.3385812384123997
Epoch: 79, step: 475, loss: 0.3176449239253998, mean loss: 0.3385810556454948
Epoch: 79, step: 476, loss: 0.33790141344070435, mean loss: 0.3385810497125013
Epoch: 79, step: 477, loss: 0.35952067375183105, mean loss: 0.338581232505106
Epoch: 79, step: 478, loss: 0.3270041048526764, mean loss: 0.33858113144336577
Epoch: 79, step: 479, loss: 0.3156144320964813, mean loss: 0.33858093095889225
Epoch: 79, step: 480, loss: 0.32543468475341797, mean loss: 0.338580816201643
Epoch: 79, step: 481, loss: 0.3201577067375183, mean loss: 0.3385806553825866
Epoch: 79, step: 482, loss: 0.28702491521835327, mean loss: 0.33858020534601013
Epoch: 79, step: 483, loss: 0.3039332628250122, mean loss: 0.33857990291110684
Epoch: 79, step: 484, loss: 0.30952441692352295, mean loss: 0.3385796492865227
Epoch: 79, step: 485, loss: 0.37830623984336853, mean loss: 0.33857999605587513
Epoch: 79, step: 486, loss: 0.3560624122619629, mean loss: 0.338580148656769
Epoch: 79, step: 487, loss: 0.34701406955718994, mean loss: 0.33858022227431817
Epoch: 79, step: 488, loss: 0.29206886887550354, mean loss: 0.338579816292095
Epoch: 79, step: 489, loss: 0.34141257405281067, mean loss: 0.3385798410180849
Epoch: 79, step: 490, loss: 0.3147248923778534, mean loss: 0.33857963279976167
Epoch: 79, step: 491, loss: 0.3137478530406952, mean loss: 0.3385794160570433
Epoch: 79, step: 492, loss: 0.33113545179367065, mean loss: 0.33857935108340936
Epoch: 79, step: 493, loss: 0.3059883117675781, mean loss: 0.3385790666194195
Epoch: 79, step: 494, loss: 0.3450666666030884, mean loss: 0.33857912324456885
Epoch: 79, step: 495, loss: 0.35190972685813904, mean loss: 0.3385792395958904
Epoch: 79, step: 496, loss: 0.34006360173225403, mean loss: 0.33857925255149196
Epoch: 79, step: 497, loss: 0.3079809248447418, mean loss: 0.33857898548978765
Epoch: 79, step: 498, loss: 0.39814651012420654, mean loss: 0.3385795053896317
Epoch: 79, step: 499, loss: 0.3372194468975067, mean loss: 0.33857949351927064
Epoch: 79, step: 500, loss: 0.36997467279434204, mean loss: 0.3385797675287077
Epoch: 79, step: 501, loss: 0.29783201217651367, mean loss: 0.3385794118953806
Epoch: 79, step: 502, loss: 0.38385462760925293, mean loss: 0.33857980703947954
Epoch: 79, step: 503, loss: 0.313172310590744, mean loss: 0.33857958529487797
Epoch: 79, step: 504, loss: 0.35188183188438416, mean loss: 0.33857970138957594
Epoch: 79, step: 505, loss: 0.3161478340625763, mean loss: 0.33857950561827393
Epoch: 79, step: 506, loss: 0.32866111397743225, mean loss: 0.33857941905751326
Epoch: 79, step: 507, loss: 0.3480023741722107, mean loss: 0.338579501293734
Epoch: 79, step: 508, loss: 0.3025191128253937, mean loss: 0.3385791865894667
Epoch: 79, step: 509, loss: 0.31613925099372864, mean loss: 0.33857899075458636
Epoch: 79, step: 510, loss: 0.3170323669910431, mean loss: 0.33857880271734164
Epoch: 79, step: 511, loss: 0.34175992012023926, mean loss: 0.33857883047869014
Epoch: 79, step: 512, loss: 0.33067983388900757, mean loss: 0.3385787615454017
Epoch: 79, step: 513, loss: 0.33998432755470276, mean loss: 0.3385787738114459
Epoch: 79, step: 514, loss: 0.30152925848960876, mean loss: 0.3385784504918543
Epoch: 79, step: 515, loss: 0.29517674446105957, mean loss: 0.33857807174197624
Epoch: 79, step: 516, loss: 0.3506908714771271, mean loss: 0.33857817744476554
Epoch: 79, step: 517, loss: 0.3377922773361206, mean loss: 0.33857817058663936
Epoch: 79, step: 518, loss: 0.28892746567726135, mean loss: 0.3385777373155114
Epoch: 79, step: 519, loss: 0.3200763463973999, mean loss: 0.3385775758666744
Epoch: 79, step: 520, loss: 0.37734174728393555, mean loss: 0.33857791413182464
Epoch: 79, step: 521, loss: 0.31134092807769775, mean loss: 0.33857767645764136
Epoch: 79, step: 522, loss: 0.36379751563072205, mean loss: 0.3385778965279663
Epoch: 79, step: 523, loss: 0.2849522829055786, mean loss: 0.3385774285906747
Epoch: 79, step: 524, loss: 0.34967073798179626, mean loss: 0.3385775253900865
Epoch: 79, step: 525, loss: 0.3258123993873596, mean loss: 0.3385774140034964
Epoch: 79, step: 526, loss: 0.3104718029499054, mean loss: 0.33857716876025623
Epoch: 79, step: 527, loss: 0.33362001180648804, mean loss: 0.3385771255055971
Epoch: 79, step: 528, loss: 0.3194500207901001, mean loss: 0.3385769586096963
Epoch: 79, step: 529, loss: 0.3429296016693115, mean loss: 0.33857699658888635
Epoch: 79, step: 530, loss: 0.37351834774017334, mean loss: 0.33857730146861575
Epoch: 79, step: 531, loss: 0.31987258791923523, mean loss: 0.3385771382626131
Epoch: 79, step: 532, loss: 0.3330584764480591, mean loss: 0.33857709011053244
Epoch: 79, step: 533, loss: 0.32067498564720154, mean loss: 0.33857693391033644
Epoch: 79, step: 534, loss: 0.36648696660995483, mean loss: 0.3385771774300047
Epoch: 79, step: 535, loss: 0.3177189230918884, mean loss: 0.3385769954398611
Epoch: 79, step: 536, loss: 0.30691230297088623, mean loss: 0.33857671916498416
Epoch: 79, step: 537, loss: 0.3786640167236328, mean loss: 0.33857706892415457
Epoch: 79, step: 538, loss: 0.34014859795570374, mean loss: 0.3385770826355277
Epoch: 79, step: 539, loss: 0.3761359453201294, mean loss: 0.3385774103285434
Epoch: 79, step: 540, loss: 0.28572824597358704, mean loss: 0.33857694923495035
Epoch: 79, step: 541, loss: 0.3178694248199463, mean loss: 0.33857676856939684
Epoch: 79, step: 542, loss: 0.3461092412471771, mean loss: 0.3385768342868841
Epoch: 79, step: 543, loss: 0.33207187056541443, mean loss: 0.3385767775344524
Epoch: 79, step: 544, loss: 0.32442405819892883, mean loss: 0.3385766540604002
Epoch: 79, step: 545, loss: 0.36840489506721497, mean loss: 0.3385769142917782
Epoch: 79, step: 546, loss: 0.3286462724208832, mean loss: 0.33857682765435054
Epoch: 79, step: 547, loss: 0.37584948539733887, mean loss: 0.338577152827593
Epoch: 79, step: 548, loss: 0.2860582172870636, mean loss: 0.33857669464713025
Epoch: 79, step: 549, loss: 0.33548709750175476, mean loss: 0.33857666769340994
Epoch: 79, step: 550, loss: 0.32626888155937195, mean loss: 0.33857656032092237
Epoch: 79, step: 551, loss: 0.35506829619407654, mean loss: 0.33857670419271524
Epoch: 79, step: 552, loss: 0.33852100372314453, mean loss: 0.3385767037067957
Epoch: 79, step: 553, loss: 0.3572688102722168, mean loss: 0.33857686677149573
Epoch: 79, step: 554, loss: 0.317401260137558, mean loss: 0.3385766820430485
Epoch: 79, step: 555, loss: 0.3279629945755005, mean loss: 0.3385765894538285
Epoch: 79, step: 556, loss: 0.282025009393692, mean loss: 0.3385760961266011
Epoch: 79, step: 557, loss: 0.33351388573646545, mean loss: 0.3385760519668371
Epoch: 79, step: 558, loss: 0.35762038826942444, mean loss: 0.3385762180970443
Epoch: 79, step: 559, loss: 0.33875569701194763, mean loss: 0.33857621966268614
Epoch: 79, step: 560, loss: 0.3547488749027252, mean loss: 0.33857636073978375
Epoch: 79, step: 561, loss: 0.3214874863624573, mean loss: 0.33857621167163554
Epoch: 79, step: 562, loss: 0.3297358751296997, mean loss: 0.3385761345570712
Epoch: 79, step: 563, loss: 0.32242608070373535, mean loss: 0.33857599368081637
Epoch: 79, step: 564, loss: 0.3202706277370453, mean loss: 0.33857583400525576
Epoch: 79, step: 565, loss: 0.3297746479511261, mean loss: 0.3385757572342115
Epoch: 79, step: 566, loss: 0.3384760618209839, mean loss: 0.3385757563645953
Epoch: 79, step: 567, loss: 0.3985790014266968, mean loss: 0.33857627975216953
Epoch: 79, step: 568, loss: 0.31722790002822876, mean loss: 0.3385760935392538
Epoch: 79, step: 569, loss: 0.355075478553772, mean loss: 0.3385762374551777
Epoch: 79, step: 570, loss: 0.3637722134590149, mean loss: 0.3385764572252197
Epoch: 79, step: 571, loss: 0.37002572417259216, mean loss: 0.33857673153673795
Epoch: 79, step: 572, loss: 0.3266574442386627, mean loss: 0.3385766275734474
Epoch: 79, step: 573, loss: 0.3829583525657654, mean loss: 0.33857701467964013
Epoch: 79, step: 574, loss: 0.3074887692928314, mean loss: 0.33857674352417366
Epoch: 79, step: 575, loss: 0.3187863826751709, mean loss: 0.3385765709117391
Epoch: 79, step: 576, loss: 0.3480859696865082, mean loss: 0.33857665385242774
Epoch: 79, step: 577, loss: 0.3341609835624695, mean loss: 0.33857661533942085
Epoch: 79, step: 578, loss: 0.3363393545150757, mean loss: 0.33857659582643995
Epoch: 79, step: 579, loss: 0.32523268461227417, mean loss: 0.338576479444295
Epoch: 79, step: 580, loss: 0.30914872884750366, mean loss: 0.33857622278529814
Epoch: 79, step: 581, loss: 0.34833890199661255, mean loss: 0.3385763079313779
Epoch: 79, step: 582, loss: 0.3014506697654724, mean loss: 0.33857598413962875
Epoch: 79, step: 583, loss: 0.3714832365512848, mean loss: 0.33857627113816713
Epoch: 79, step: 584, loss: 0.3352491855621338, mean loss: 0.338576242121452
Epoch: 79, step: 585, loss: 0.33226555585861206, mean loss: 0.3385761870841575
Epoch: 79, step: 586, loss: 0.35186007618904114, mean loss: 0.33857630293573215
Epoch: 79, step: 587, loss: 0.2971211075782776, mean loss: 0.33857594139945785
Epoch: 79, step: 588, loss: 0.3394985795021057, mean loss: 0.3385759494458373
Epoch: 79, step: 589, loss: 0.30489590764045715, mean loss: 0.33857565572283477
Epoch: 79, step: 590, loss: 0.3443412482738495, mean loss: 0.338575706004019
Epoch: 79, step: 591, loss: 0.2985354959964752, mean loss: 0.3385753568202013
Epoch: 79, step: 592, loss: 0.2884010970592499, mean loss: 0.33857491926288624
Epoch: 79, step: 593, loss: 0.3875732719898224, mean loss: 0.3385753465616804
Epoch: 79, step: 594, loss: 0.37592098116874695, mean loss: 0.3385756722380468
Epoch: 79, step: 595, loss: 0.31932494044303894, mean loss: 0.3385755043615661
Epoch: 79, step: 596, loss: 0.3509881794452667, mean loss: 0.3385756126056609
Epoch: 79, step: 597, loss: 0.3365970849990845, mean loss: 0.3385755953521631
Epoch: 79, step: 598, loss: 0.3015653192996979, mean loss: 0.3385752726115827
Epoch: 79, step: 599, loss: 0.33733034133911133, mean loss: 0.33857526175550756
Epoch: 79, step: 600, loss: 0.3453935384750366, mean loss: 0.3385753212118652
Epoch: 79, step: 601, loss: 0.32684674859046936, mean loss: 0.3385752189379101
Epoch: 79, step: 602, loss: 0.3499751687049866, mean loss: 0.33857531834538457
Epoch: 79, step: 603, loss: 0.3375706076622009, mean loss: 0.3385753095843915
Epoch: 79, step: 604, loss: 0.2883700728416443, mean loss: 0.3385748718027473
Epoch: 79, step: 605, loss: 0.2987437844276428, mean loss: 0.33857452448505687
Epoch: 79, step: 606, loss: 0.3401641249656677, mean loss: 0.3385745383458774
Epoch: 79, step: 607, loss: 0.3268144726753235, mean loss: 0.3385744358026659
Epoch: 79, step: 608, loss: 0.3794431984424591, mean loss: 0.3385747921593179
Epoch: 79, step: 609, loss: 0.32554787397384644, mean loss: 0.33857467857162465
Epoch: 79, step: 610, loss: 0.3098828196525574, mean loss: 0.33857442839628726
Epoch: 79, step: 611, loss: 0.34852197766304016, mean loss: 0.3385745151320335
Epoch: 79, step: 612, loss: 0.3252581059932709, mean loss: 0.3385743990231727
Epoch: 79, step: 613, loss: 0.34148117899894714, mean loss: 0.33857442436784074
Epoch: 79, step: 614, loss: 0.3307989537715912, mean loss: 0.33857435657289087
Epoch: 79, step: 615, loss: 0.3559630215167999, mean loss: 0.33857450818472906
Epoch: 79, step: 616, loss: 0.30085259675979614, mean loss: 0.3385741792901023
Epoch: 79, step: 617, loss: 0.3667525351047516, mean loss: 0.3385744249730135
Epoch: 79, step: 618, loss: 0.3116571307182312, mean loss: 0.33857419028715746
Epoch: 79, step: 619, loss: 0.3284209966659546, mean loss: 0.3385741017645096
Epoch: 79, step: 620, loss: 0.33023130893707275, mean loss: 0.33857402902683703
Epoch: 79, step: 621, loss: 0.3390636146068573, mean loss: 0.3385740332953123
Epoch: 79, step: 622, loss: 0.3343234956264496, mean loss: 0.3385739962371194
Epoch: 79, step: 623, loss: 0.3206474781036377, mean loss: 0.33857383994663875
Epoch: 79, step: 624, loss: 0.3275547921657562, mean loss: 0.33857374387905625
Epoch: 79, step: 625, loss: 0.31827253103256226, mean loss: 0.3385735668881333
Epoch: 79, step: 626, loss: 0.32445114850997925, mean loss: 0.33857344376652027
Epoch: 79, step: 627, loss: 0.3100489675998688, mean loss: 0.33857319508751893
Epoch: 79, step: 628, loss: 0.2991997003555298, mean loss: 0.33857285182877056
Epoch: 79, step: 629, loss: 0.34101590514183044, mean loss: 0.3385728731271622
Epoch: 79, step: 630, loss: 0.32135429978370667, mean loss: 0.3385727230179854
Epoch: 79, step: 631, loss: 0.32573992013931274, mean loss: 0.33857261114433335
Epoch: 79, step: 632, loss: 0.31611499190330505, mean loss: 0.33857241536528165
Epoch: 79, step: 633, loss: 0.3175855576992035, mean loss: 0.3385722324095004
Epoch: 79, step: 634, loss: 0.2935473918914795, mean loss: 0.3385718399027616
Epoch: 79, step: 635, loss: 0.36730411648750305, mean loss: 0.33857209037591685
Epoch: 79, step: 636, loss: 0.324861079454422, mean loss: 0.3385719708514434
Epoch: 79, step: 637, loss: 0.33204907178878784, mean loss: 0.33857191398916797
Epoch: 79, step: 638, loss: 0.3158276081085205, mean loss: 0.33857171572123546
Epoch: 79, step: 639, loss: 0.3674611449241638, mean loss: 0.33857196755558466
Epoch: 79, step: 640, loss: 0.37068599462509155, mean loss: 0.338572247496893
Epoch: 79, step: 641, loss: 0.2930148243904114, mean loss: 0.3385718503715674
Epoch: 79, step: 642, loss: 0.32516616582870483, mean loss: 0.33857173351486064
Epoch: 79, step: 643, loss: 0.3763924837112427, mean loss: 0.33857206319364547
Epoch: 79, step: 644, loss: 0.3958794176578522, mean loss: 0.33857256273038644
Epoch: 79, step: 645, loss: 0.317710280418396, mean loss: 0.3385723808796315
Epoch: 79, step: 646, loss: 0.3289298713207245, mean loss: 0.33857229682927054
Epoch: 79, step: 647, loss: 0.39176198840141296, mean loss: 0.33857276046104395
Epoch: 79, step: 648, loss: 0.3351544141769409, mean loss: 0.33857273066504234
Epoch: 79, step: 649, loss: 0.30918750166893005, mean loss: 0.33857247453104483
Epoch: 79, step: 650, loss: 0.35391557216644287, mean loss: 0.3385726082667621
Epoch: 79, step: 651, loss: 0.3802741765975952, mean loss: 0.33857297174880946
Epoch: 79, step: 652, loss: 0.32796066999435425, mean loss: 0.33857287924994905
Epoch: 79, step: 653, loss: 0.35277342796325684, mean loss: 0.3385730030235803
Epoch: 79, step: 654, loss: 0.32239317893981934, mean loss: 0.3385728619995843
Epoch: 79, step: 655, loss: 0.31136831641197205, mean loss: 0.33857262488573997
Epoch: 79, step: 656, loss: 0.3866787254810333, mean loss: 0.33857304417313416
Epoch: 79, step: 657, loss: 0.32987141609191895, mean loss: 0.33857296833137773
Epoch: 79, step: 658, loss: 0.33555763959884644, mean loss: 0.33857294205056776
Epoch: 79, step: 659, loss: 0.3236909806728363, mean loss: 0.3385728123444478
Epoch: 79, step: 660, loss: 0.3494808077812195, mean loss: 0.338572907414002
Epoch: 79, step: 661, loss: 0.35678836703300476, mean loss: 0.33857306617099286
Epoch: 79, step: 662, loss: 0.31705811619758606, mean loss: 0.33857287865890046
Epoch: 79, step: 663, loss: 0.2880493402481079, mean loss: 0.3385724383282537
Epoch: 79, step: 664, loss: 0.3720552623271942, mean loss: 0.3385727301404568
Epoch: 79, step: 665, loss: 0.329062283039093, mean loss: 0.338572647254965
Epoch: 79, step: 666, loss: 0.38071882724761963, mean loss: 0.3385730145643433
Epoch: 79, step: 667, loss: 0.2825518846511841, mean loss: 0.3385725263372472
Epoch: 79, step: 668, loss: 0.3379126787185669, mean loss: 0.33857252058669063
Epoch: 79, step: 669, loss: 0.3403993248939514, mean loss: 0.33857253650710883
Epoch: 79, step: 670, loss: 0.29719409346580505, mean loss: 0.33857217590122773
Epoch: 79, step: 671, loss: 0.3332632780075073, mean loss: 0.338572129635516
Epoch: 79, step: 672, loss: 0.33453088998794556, mean loss: 0.33857209441743435
Epoch: 79, step: 673, loss: 0.3937602937221527, mean loss: 0.3385725753603477
Epoch: 79, step: 674, loss: 0.35411536693573, mean loss: 0.33857271080833135
Epoch: 79, step: 675, loss: 0.3464987874031067, mean loss: 0.3385727798796904
Epoch: 79, step: 676, loss: 0.33602312207221985, mean loss: 0.3385727576610312
Epoch: 79, step: 677, loss: 0.3465912938117981, mean loss: 0.3385728275369061
Epoch: 79, step: 678, loss: 0.35493263602256775, mean loss: 0.33857297009983134
Epoch: 79, step: 679, loss: 0.3144069314002991, mean loss: 0.33857275951355525
Epoch: 79, step: 680, loss: 0.31297439336776733, mean loss: 0.33857253644771923
Epoch: 79, step: 681, loss: 0.4139060974121094, mean loss: 0.33857319290357385
Epoch: 79, step: 682, loss: 0.33754655718803406, mean loss: 0.33857318395755903
Epoch: 79, step: 683, loss: 0.4159271717071533, mean loss: 0.338573858007644
Epoch: 79, step: 684, loss: 0.3457525968551636, mean loss: 0.33857392056146324
Epoch: 79, step: 685, loss: 0.3240284323692322, mean loss: 0.33857379381665054
Epoch: 79, step: 686, loss: 0.3399730324745178, mean loss: 0.3385738060090702
Epoch: 79, step: 687, loss: 0.3109913468360901, mean loss: 0.33857356566837826
Epoch: 79, step: 688, loss: 0.33992302417755127, mean loss: 0.3385735774268282
Epoch: 79, step: 689, loss: 0.3404003977775574, mean loss: 0.3385735933446118
Epoch: 79, step: 690, loss: 0.34095802903175354, mean loss: 0.3385736141209298
Epoch: 79, step: 691, loss: 0.39387544989585876, mean loss: 0.33857409597855365
Epoch: 79, step: 692, loss: 0.3336700201034546, mean loss: 0.3385740532485841
Epoch: 79, step: 693, loss: 0.32343167066574097, mean loss: 0.3385739213118185
Epoch: 79, step: 694, loss: 0.3020137548446655, mean loss: 0.33857360276299986
Epoch: 79, step: 695, loss: 0.31680232286453247, mean loss: 0.33857341307143834
Epoch: 79, step: 696, loss: 0.30887657403945923, mean loss: 0.33857315432731705
Epoch: 79, step: 697, loss: 0.33495596051216125, mean loss: 0.3385731228115224
Epoch: 79, step: 698, loss: 0.31752970814704895, mean loss: 0.33857293946658956
Epoch: 79, step: 699, loss: 0.3424619138240814, mean loss: 0.3385729733497564
Epoch: 79, step: 700, loss: 0.3173021972179413, mean loss: 0.33857278802712093
Epoch: 79, step: 701, loss: 0.32201945781707764, mean loss: 0.338572643806711
Epoch: 79, step: 702, loss: 0.38380786776542664, mean loss: 0.3385730379138557
Epoch: 79, step: 703, loss: 0.34311237931251526, mean loss: 0.338573077462047
Epoch: 79, step: 704, loss: 0.35384973883628845, mean loss: 0.33857321055603795
Epoch: 79, step: 705, loss: 0.3274146616458893, mean loss: 0.33857311334089174
Epoch: 79, step: 706, loss: 0.33597898483276367, mean loss: 0.33857309074060676
Epoch: 79, step: 707, loss: 0.3252982497215271, mean loss: 0.3385729750899846
Epoch: 79, step: 708, loss: 0.3838198184967041, mean loss: 0.33857336927775655
Epoch: 79, step: 709, loss: 0.31967779994010925, mean loss: 0.33857320466212976
Epoch: 79, step: 710, loss: 0.3410780429840088, mean loss: 0.33857322648375
Epoch: 79, step: 711, loss: 0.3450978398323059, mean loss: 0.3385732833243026
Epoch: 79, step: 712, loss: 0.33900198340415955, mean loss: 0.3385732870589817
Epoch: 79, step: 713, loss: 0.3188943564891815, mean loss: 0.3385731156247926
Epoch: 79, step: 714, loss: 0.32281213998794556, mean loss: 0.33857297832329997
Epoch: 79, step: 715, loss: 0.3232346773147583, mean loss: 0.3385728447050948
Epoch: 79, step: 716, loss: 0.31045541167259216, mean loss: 0.33857259976478454
Epoch: 79, step: 717, loss: 0.32806646823883057, mean loss: 0.33857250824317603
Epoch: 79, step: 718, loss: 0.32170650362968445, mean loss: 0.33857236132036045
Epoch: 79, step: 719, loss: 0.30427369475364685, mean loss: 0.33857206254107747
Epoch: 79, step: 720, loss: 0.3280543386936188, mean loss: 0.33857197092087965
Epoch: 79, step: 721, loss: 0.3617423474788666, mean loss: 0.33857217275694435
Epoch: 79, step: 722, loss: 0.3340096175670624, mean loss: 0.33857213301308603
Epoch: 79, step: 723, loss: 0.31430381536483765, mean loss: 0.33857192161659083
Epoch: 79, step: 724, loss: 0.3782356083393097, mean loss: 0.33857226711607885
Epoch: 79, step: 725, loss: 0.3489377498626709, mean loss: 0.3385723574061674
Epoch: 79, step: 726, loss: 0.2985825836658478, mean loss: 0.3385720090722934
Epoch: 79, step: 727, loss: 0.34911006689071655, mean loss: 0.33857210086402384
Epoch: 79, step: 728, loss: 0.3178879916667938, mean loss: 0.3385719206967036
Epoch: 79, step: 729, loss: 0.3169926404953003, mean loss: 0.3385717327337034
Epoch: 79, step: 730, loss: 0.3349817991256714, mean loss: 0.3385717014644114
Epoch: 79, step: 731, loss: 0.31727561354637146, mean loss: 0.33857151597134544
Epoch: 79, step: 732, loss: 0.30038702487945557, mean loss: 0.33857118337990144
Epoch: 79, step: 733, loss: 0.3192601799964905, mean loss: 0.3385710151802378
Epoch: 79, step: 734, loss: 0.338819295167923, mean loss: 0.33857101734274825
Epoch: 79, step: 735, loss: 0.2808007597923279, mean loss: 0.3385705141701047
Epoch: 79, step: 736, loss: 0.30247366428375244, mean loss: 0.33857019977321684
Epoch: 79, step: 737, loss: 0.2964637577533722, mean loss: 0.33856983303708693
Epoch: 79, step: 738, loss: 0.3083244562149048, mean loss: 0.33856956961003626
Epoch: 79, step: 739, loss: 0.3008061647415161, mean loss: 0.33856924070635674
Epoch: 79, step: 740, loss: 0.30701547861099243, mean loss: 0.33856896588849794
Epoch: 79, step: 741, loss: 0.31839442253112793, mean loss: 0.3385687901796077
Epoch: 79, step: 742, loss: 0.371914267539978, mean loss: 0.33856908059737273
Epoch: 79, step: 743, loss: 0.3601711392402649, mean loss: 0.33856926873583854
Epoch: 79, step: 744, loss: 0.3163169026374817, mean loss: 0.3385690749353482
Epoch: 79, step: 745, loss: 0.3078589141368866, mean loss: 0.33856880747649193
Epoch: 79, step: 746, loss: 0.3519324064254761, mean loss: 0.3385689238608309
Epoch: 79, step: 747, loss: 0.3239850401878357, mean loss: 0.3385687968500694
Epoch: 79, step: 748, loss: 0.33239462971687317, mean loss: 0.3385687430798353
Epoch: 79, step: 749, loss: 0.35441797971725464, mean loss: 0.33856888110812716
Epoch: 79, step: 750, loss: 0.32559195160865784, mean loss: 0.33856876809525127
Epoch: 79, step: 751, loss: 0.3239921033382416, mean loss: 0.3385686411517814
Epoch: 79, step: 752, loss: 0.3569672703742981, mean loss: 0.3385688013781112
Epoch: 79, step: 753, loss: 0.34546974301338196, mean loss: 0.3385688614751384
Epoch: 79, step: 754, loss: 0.3295503854751587, mean loss: 0.3385687829381928
Epoch: 79, step: 755, loss: 0.33811745047569275, mean loss: 0.33856877900782095
Epoch: 79, step: 756, loss: 0.35000523924827576, mean loss: 0.33856887859992635
Epoch: 79, step: 757, loss: 0.34789907932281494, mean loss: 0.3385689598493884
Epoch: 79, step: 758, loss: 0.29789549112319946, mean loss: 0.33856860565886526
Epoch: 79, step: 759, loss: 0.353090763092041, mean loss: 0.33856873211883803
Epoch: 79, step: 760, loss: 0.35630616545677185, mean loss: 0.3385688865763155
Epoch: 79, step: 761, loss: 0.3037016689777374, mean loss: 0.33856858295540954
Epoch: 79, step: 762, loss: 0.313545286655426, mean loss: 0.33856836505647014
Epoch: 79, step: 763, loss: 0.3407132625579834, mean loss: 0.33856838373373854
Epoch: 79, step: 764, loss: 0.33934083580970764, mean loss: 0.3385683904600129
Epoch: 79, step: 765, loss: 0.3144152760505676, mean loss: 0.33856818014397516
Epoch: 79, step: 766, loss: 0.3299448788166046, mean loss: 0.33856810505623514
Epoch: 79, step: 767, loss: 0.4004114270210266, mean loss: 0.33856864355473715
Epoch: 79, step: 768, loss: 0.3093491792678833, mean loss: 0.33856838912951803
Epoch: 79, step: 769, loss: 0.36061590909957886, mean loss: 0.3385685811041621
Epoch: 79, step: 770, loss: 0.32446542382240295, mean loss: 0.33856845830463506
Epoch: 79, step: 771, loss: 0.37623873353004456, mean loss: 0.33856878630577764
Epoch: 79, step: 772, loss: 0.3073549270629883, mean loss: 0.33856851452405345
Epoch: 79, step: 773, loss: 0.345581591129303, mean loss: 0.33856857558697556
Epoch: 79, step: 774, loss: 0.3678445816040039, mean loss: 0.3385688304912082
Epoch: 79, step: 775, loss: 0.3795354664325714, mean loss: 0.3385691871818704
Epoch: 79, step: 776, loss: 0.34096986055374146, mean loss: 0.3385692080840094
Epoch: 79, step: 777, loss: 0.3107633590698242, mean loss: 0.33856896598665964
Epoch: 79, step: 778, loss: 0.34194445610046387, mean loss: 0.3385689953758035
Epoch: 79, step: 779, loss: 0.3048548996448517, mean loss: 0.3385687018421985
Epoch: 79, step: 780, loss: 0.4406099319458008, mean loss: 0.3385695902619736
Epoch: 79, step: 781, loss: 0.34924036264419556, mean loss: 0.33856968316601493
Epoch: 79, step: 782, loss: 0.3543234169483185, mean loss: 0.33856982032317096
Epoch: 79, step: 783, loss: 0.3111693263053894, mean loss: 0.3385695817675901
Epoch: 79, step: 784, loss: 0.3194020390510559, mean loss: 0.33856941489160336
Epoch: 79, step: 785, loss: 0.3423936665058136, mean loss: 0.3385694481859184
Epoch: 79, step: 786, loss: 0.2886025011539459, mean loss: 0.33856901317249344
Epoch: 79, step: 787, loss: 0.3097979426383972, mean loss: 0.33856876269305225
Epoch: 79, step: 788, loss: 0.3378121852874756, mean loss: 0.3385687561063861
Epoch: 79, step: 789, loss: 0.32218605279922485, mean loss: 0.3385686134819079
Epoch: 79, step: 790, loss: 0.3099626898765564, mean loss: 0.33856836444673155
Epoch: 79, step: 791, loss: 0.37002766132354736, mean loss: 0.33856863832019396
Epoch: 79, step: 792, loss: 0.3251028060913086, mean loss: 0.338568521092463
Epoch: 79, step: 793, loss: 0.34230735898017883, mean loss: 0.33856855364089067
Epoch: 79, step: 794, loss: 0.3267563283443451, mean loss: 0.33856845081053927
Epoch: 79, step: 795, loss: 0.33329397439956665, mean loss: 0.33856840489442036
Epoch: 79, step: 796, loss: 0.3071243166923523, mean loss: 0.33856813116527423
Epoch: 79, step: 797, loss: 0.34183087944984436, mean loss: 0.3385681595681181
Epoch: 79, step: 798, loss: 0.2904336452484131, mean loss: 0.3385677405516713
Epoch: 79, step: 799, loss: 0.3802257776260376, mean loss: 0.3385681031864869
Epoch: 79, step: 800, loss: 0.3013409376144409, mean loss: 0.3385677791253992
Epoch: 79, step: 801, loss: 0.3223194479942322, mean loss: 0.338567637685514
Epoch: 79, step: 802, loss: 0.2949032187461853, mean loss: 0.33856725759499323
Epoch: 79, step: 803, loss: 0.28321194648742676, mean loss: 0.3385667757416584
Epoch: 79, step: 804, loss: 0.34964248538017273, mean loss: 0.33856687215194065
Epoch: 79, step: 805, loss: 0.32615524530410767, mean loss: 0.33856676411389425
Epoch: 79, step: 806, loss: 0.33315104246139526, mean loss: 0.33856671697270146
Epoch: 79, step: 807, loss: 0.2942467927932739, mean loss: 0.33856633119292207
Epoch: 79, step: 808, loss: 0.3486490845680237, mean loss: 0.33856641895680223
Epoch: 79, step: 809, loss: 0.3279231786727905, mean loss: 0.33856632631505057
Epoch: 79, step: 810, loss: 0.366780549287796, mean loss: 0.3385665718974313
Epoch: 79, step: 811, loss: 0.29118967056274414, mean loss: 0.33856615952275915
Epoch: 79, step: 812, loss: 0.3333032429218292, mean loss: 0.3385661137140516
Epoch: 79, step: 813, loss: 0.320458322763443, mean loss: 0.33856595610424267
Epoch: 79, step: 814, loss: 0.3645836412906647, mean loss: 0.33856618255962373
Epoch: 79, step: 815, loss: 0.3445435166358948, mean loss: 0.33856623458530066
Epoch: 79, step: 816, loss: 0.3508763313293457, mean loss: 0.3385663417293107
Epoch: 79, step: 817, loss: 0.33167168498039246, mean loss: 0.33856628172046127
Epoch: 79, step: 818, loss: 0.337663471698761, mean loss: 0.33856627386276494
Epoch: 79, step: 819, loss: 0.34188199043273926, mean loss: 0.338566302721181
Epoch: 79, step: 820, loss: 0.3808256685733795, mean loss: 0.3385666705233503
Epoch: 79, step: 821, loss: 0.3769702613353729, mean loss: 0.33856700476407525
Epoch: 79, step: 822, loss: 0.3089974522590637, mean loss: 0.33856674741150905
Epoch: 79, step: 823, loss: 0.3166773021221161, mean loss: 0.3385665569028468
Epoch: 79, step: 824, loss: 0.33023762702941895, mean loss: 0.33856648441496706
Epoch: 79, step: 825, loss: 0.31766006350517273, mean loss: 0.33856630246494956
Epoch: 79, step: 826, loss: 0.31408414244651794, mean loss: 0.3385660893968833
Epoch: 79, step: 827, loss: 0.33029502630233765, mean loss: 0.3385660174145059
Epoch: 79, step: 828, loss: 0.29700759053230286, mean loss: 0.3385656557381047
Epoch: 79, step: 829, loss: 0.35144051909446716, mean loss: 0.3385657677850244
Epoch: 79, step: 830, loss: 0.33139920234680176, mean loss: 0.338565705416627
Epoch: 79, step: 831, loss: 0.3281799256801605, mean loss: 0.3385656150331921
Epoch: 79, step: 832, loss: 0.3230690360069275, mean loss: 0.33856548017361604
Epoch: 79, step: 833, loss: 0.31884071230888367, mean loss: 0.3385653085195575
Epoch: 79, step: 834, loss: 0.3310428559780121, mean loss: 0.33856524305626384
Epoch: 79, step: 835, loss: 0.34344640374183655, mean loss: 0.3385652855336438
Epoch: 79, step: 836, loss: 0.31978946924209595, mean loss: 0.33856512214206674
Epoch: 79, step: 837, loss: 0.33376938104629517, mean loss: 0.338565080408761
Epoch: 79, step: 838, loss: 0.3354915678501129, mean loss: 0.33856505366279604
Epoch: 79, step: 839, loss: 0.32280439138412476, mean loss: 0.3385649165133801
Epoch: 79, step: 840, loss: 0.3194151520729065, mean loss: 0.3385647498734187
Epoch: 79, step: 841, loss: 0.36624398827552795, mean loss: 0.3385649907341925
Epoch: 79, step: 842, loss: 0.3599080741405487, mean loss: 0.3385651764570356
Epoch: 79, step: 843, loss: 0.3677806258201599, mean loss: 0.338565430681273
Epoch: 79, step: 844, loss: 0.33533743023872375, mean loss: 0.3385654025924081
Epoch: 79, step: 845, loss: 0.34513890743255615, mean loss: 0.33856545979211605
Epoch: 79, step: 846, loss: 0.3351234793663025, mean loss: 0.33856542984179777
Epoch: 79, step: 847, loss: 0.3113875985145569, mean loss: 0.3385651933565438
Epoch: 79, step: 848, loss: 0.31455233693122864, mean loss: 0.33856498441282895
Epoch: 79, step: 849, loss: 0.35506385564804077, mean loss: 0.33856512797365274
Epoch: 79, step: 850, loss: 0.321556031703949, mean loss: 0.3385649799745205
Epoch: 79, step: 851, loss: 0.3239316940307617, mean loss: 0.33856485264883884
Epoch: 79, step: 852, loss: 0.2998029589653015, mean loss: 0.33856451538066734
Epoch: 79, step: 853, loss: 0.34868186712265015, mean loss: 0.33856460341122285
Epoch: 79, step: 854, loss: 0.34396928548812866, mean loss: 0.33856465043667355
Epoch: 79, step: 855, loss: 0.308569073677063, mean loss: 0.3385643894512495
Epoch: 79, step: 856, loss: 0.32800668478012085, mean loss: 0.3385642975916037
Epoch: 79, step: 857, loss: 0.3397879898548126, mean loss: 0.3385643082385164
Epoch: 79, step: 858, loss: 0.33156201243400574, mean loss: 0.33856424731455237
Epoch: 79, step: 859, loss: 0.3212944567203522, mean loss: 0.33856409705883966
Epoch: 79, step: 860, loss: 0.295282244682312, mean loss: 0.33856372048861094
Epoch: 79, step: 861, loss: 0.31634896993637085, mean loss: 0.3385635272126661
Epoch: 79, step: 862, loss: 0.3455481231212616, mean loss: 0.33856358798051606
Epoch: 79, step: 863, loss: 0.32657715678215027, mean loss: 0.3385634836962704
Epoch: 79, step: 864, loss: 0.40311282873153687, mean loss: 0.3385640452830413
Epoch: 79, step: 865, loss: 0.31985679268836975, mean loss: 0.33856388252919506
Epoch: 79, step: 866, loss: 0.3171628415584564, mean loss: 0.338563696340902
Epoch: 79, step: 867, loss: 0.3111942410469055, mean loss: 0.33856345822968875
Epoch: 79, step: 868, loss: 0.3220062851905823, mean loss: 0.33856331418538027
Epoch: 79, step: 869, loss: 0.31387707591056824, mean loss: 0.33856309942159313
Epoch: 79, step: 870, loss: 0.33093011379241943, mean loss: 0.3385630330172013
Epoch: 79, step: 871, loss: 0.36086156964302063, mean loss: 0.3385632270052361
Epoch: 79, step: 872, loss: 0.32415199279785156, mean loss: 0.3385631016345569
Epoch: 79, step: 873, loss: 0.3496001660823822, mean loss: 0.3385631976507765
Epoch: 79, step: 874, loss: 0.4009265899658203, mean loss: 0.33856374017230584
Epoch: 79, step: 875, loss: 0.3790685534477234, mean loss: 0.33856409253514663
Epoch: 79, step: 876, loss: 0.3019373416900635, mean loss: 0.3385637739114409
Epoch: 79, step: 877, loss: 0.33017632365226746, mean loss: 0.3385637009479054
Epoch: 79, step: 878, loss: 0.3478497266769409, mean loss: 0.3385637817275646
Epoch: 79, step: 879, loss: 0.29954883456230164, mean loss: 0.33856344233730085
Epoch: 79, step: 880, loss: 0.313494473695755, mean loss: 0.338563224264729
Epoch: 79, step: 881, loss: 0.32897263765335083, mean loss: 0.33856314083785477
Epoch: 79, step: 882, loss: 0.33264464139938354, mean loss: 0.33856308935428725
Epoch: 79, step: 883, loss: 0.39382606744766235, mean loss: 0.338563570069128
Epoch: 79, step: 884, loss: 0.35003745555877686, mean loss: 0.3385636698758928
Epoch: 79, step: 885, loss: 0.3209506571292877, mean loss: 0.3385635166686352
Epoch: 79, step: 886, loss: 0.3236512839794159, mean loss: 0.33856338695531274
Epoch: 79, step: 887, loss: 0.3379226326942444, mean loss: 0.3385633813817918
Epoch: 79, step: 888, loss: 0.3272450566291809, mean loss: 0.3385632829316135
Epoch: 79, step: 889, loss: 0.31564056873321533, mean loss: 0.33856308354471476
Epoch: 79, step: 890, loss: 0.3135649859905243, mean loss: 0.3385628661075584
Epoch: 79, step: 891, loss: 0.3134096562862396, mean loss: 0.3385626473231156
Epoch: 79, step: 892, loss: 0.31377267837524414, mean loss: 0.33856243170004374
Epoch: 79, step: 893, loss: 0.30421364307403564, mean loss: 0.33856213293698706
Epoch: 79, step: 894, loss: 0.32174941897392273, mean loss: 0.33856198670259785
Epoch: 79, step: 895, loss: 0.36852410435676575, mean loss: 0.33856224730620266
Epoch: 79, step: 896, loss: 0.3155648112297058, mean loss: 0.3385620472815353
Epoch: 79, step: 897, loss: 0.3255176246166229, mean loss: 0.3385619338261222
Epoch: 79, step: 898, loss: 0.35561004281044006, mean loss: 0.3385620821027822
Epoch: 79, step: 899, loss: 0.3628078103065491, mean loss: 0.33856229297921037
Epoch: 79, step: 900, loss: 0.2888355255126953, mean loss: 0.3385618604860381
Epoch: 79, step: 901, loss: 0.3240043818950653, mean loss: 0.3385617338750465
Epoch: 79, step: 902, loss: 0.3209563195705414, mean loss: 0.3385615807565266
Epoch: 79, step: 903, loss: 0.31915685534477234, mean loss: 0.33856141199043327
Epoch: 79, step: 904, loss: 0.32715001702308655, mean loss: 0.3385613127445147
Epoch: 79, step: 905, loss: 0.33275094628334045, mean loss: 0.3385612622116794
Epoch: 79, step: 906, loss: 0.3367364704608917, mean loss: 0.3385612463415791
Epoch: 79, step: 907, loss: 0.3411524295806885, mean loss: 0.3385612688767426
Epoch: 79, step: 908, loss: 0.3891974687576294, mean loss: 0.338561709248964
Epoch: 79, step: 909, loss: 0.3397768437862396, mean loss: 0.3385617198166378
Epoch: 79, step: 910, loss: 0.31757867336273193, mean loss: 0.3385615373347359
Epoch: 79, step: 911, loss: 0.3097597360610962, mean loss: 0.33856128685815334
Epoch: 79, step: 912, loss: 0.303358256816864, mean loss: 0.33856098071556545
Epoch: 79, step: 913, loss: 0.3132059872150421, mean loss: 0.33856076021818743
Epoch: 79, step: 914, loss: 0.2940029501914978, mean loss: 0.33856037272864453
Epoch: 79, step: 915, loss: 0.3294049799442291, mean loss: 0.3385602931109947
Epoch: 79, step: 916, loss: 0.3343330919742584, mean loss: 0.33856025635048637
Epoch: 79, step: 917, loss: 0.34632566571235657, mean loss: 0.3385603238793084
Epoch: 79, step: 918, loss: 0.3625926077365875, mean loss: 0.3385605328647761
Epoch: 79, step: 919, loss: 0.35498589277267456, mean loss: 0.33856067569896087
Epoch: 79, step: 920, loss: 0.38220903277397156, mean loss: 0.3385610552597935
Epoch: 79, step: 921, loss: 0.344959557056427, mean loss: 0.33856111089990726
Epoch: 79, step: 922, loss: 0.32562685012817383, mean loss: 0.3385609984270964
Epoch: 79, step: 923, loss: 0.3417476415634155, mean loss: 0.33856102613703676
Epoch: 79, step: 924, loss: 0.30214226245880127, mean loss: 0.338560709454889
Epoch: 79, step: 925, loss: 0.3337203562259674, mean loss: 0.33856066736559287
Epoch: 79, step: 926, loss: 0.32184338569641113, mean loss: 0.33856052200171827
Epoch: 79, step: 927, loss: 0.31610679626464844, mean loss: 0.33856032675872033
Epoch: 79, step: 928, loss: 0.29377833008766174, mean loss: 0.3385599373669837
Epoch: 79, step: 929, loss: 0.30537116527557373, mean loss: 0.338559648784022
Epoch: 79, step: 930, loss: 0.3337753415107727, mean loss: 0.3385596071838822
Epoch: 79, step: 931, loss: 0.329684853553772, mean loss: 0.3385595300174796
Epoch: 79, step: 932, loss: 0.37453046441078186, mean loss: 0.33855984278373613
Epoch: 79, step: 933, loss: 0.3085286617279053, mean loss: 0.3385595816657372
Epoch: 79, step: 934, loss: 0.3158645033836365, mean loss: 0.3385593843361054
Epoch: 79, step: 935, loss: 0.36884593963623047, mean loss: 0.3385596476699775
Epoch: 79, step: 936, loss: 0.34144482016563416, mean loss: 0.3385596727555982
Epoch: 79, step: 937, loss: 0.38456279039382935, mean loss: 0.33856007273401506
Epoch: 79, step: 938, loss: 0.31357723474502563, mean loss: 0.33855985552027784
Epoch: 79, step: 939, loss: 0.38583406805992126, mean loss: 0.3385602665432011
Epoch: 79, step: 940, loss: 0.308944970369339, mean loss: 0.3385600090569497
Epoch: 79, step: 941, loss: 0.36830809712409973, mean loss: 0.33856026769549386
Epoch: 79, step: 942, loss: 0.33278489112854004, mean loss: 0.33856021748312404
Epoch: 79, step: 943, loss: 0.3124856650829315, mean loss: 0.33855999078731114
Epoch: 79, step: 944, loss: 0.31610843539237976, mean loss: 0.338559795592039
Epoch: 79, step: 945, loss: 0.32761505246162415, mean loss: 0.3385597004385629
Epoch: 79, step: 946, loss: 0.35474473237991333, mean loss: 0.33855984114982884
Epoch: 79, step: 947, loss: 0.35753899812698364, mean loss: 0.3385600061515413
Epoch: 79, step: 948, loss: 0.2935028374195099, mean loss: 0.3385596144352298
Epoch: 79, step: 949, loss: 0.31389105319976807, mean loss: 0.3385593999744885
Epoch: 79, step: 950, loss: 0.3134826719760895, mean loss: 0.33855918196716844
Epoch: 79, step: 951, loss: 0.2998916208744049, mean loss: 0.3385588458093539
Epoch: 79, step: 952, loss: 0.31648457050323486, mean loss: 0.3385586539075265
Epoch: 79, step: 953, loss: 0.32143548130989075, mean loss: 0.3385585050492061
Epoch: 79, step: 954, loss: 0.3457068204879761, mean loss: 0.33855856719171934
Epoch: 79, step: 955, loss: 0.3482533097267151, mean loss: 0.3385586514703769
Epoch: 79, step: 956, loss: 0.32345089316368103, mean loss: 0.3385585201362527
Epoch: 79, step: 957, loss: 0.3856954574584961, mean loss: 0.3385589299015162
Epoch: 79, step: 958, loss: 0.2976621091365814, mean loss: 0.33855857438518844
Epoch: 79, step: 959, loss: 0.3337358832359314, mean loss: 0.33855853246186746
Epoch: 79, step: 960, loss: 0.33637210726737976, mean loss: 0.3385585134555895
Epoch: 79, step: 961, loss: 0.34229347109794617, mean loss: 0.33855854592275375
Epoch: 79, step: 962, loss: 0.36377254128456116, mean loss: 0.3385587651005575
Epoch: 79, step: 963, loss: 0.32814255356788635, mean loss: 0.3385586745562987
Epoch: 79, step: 964, loss: 0.33443328738212585, mean loss: 0.33855863869615166
Epoch: 79, step: 965, loss: 0.3343640863895416, mean loss: 0.3385586022351
Epoch: 79, step: 966, loss: 0.3427591025829315, mean loss: 0.3385586387475375
Epoch: 79, step: 967, loss: 0.3190642297267914, mean loss: 0.33855846929577105
Epoch: 79, step: 968, loss: 0.34872516989707947, mean loss: 0.3385585576672831
Epoch: 79, step: 969, loss: 0.3190862834453583, mean loss: 0.338558388410862
Epoch: 79, step: 970, loss: 0.34692543745040894, mean loss: 0.33855846113808685
Epoch: 79, step: 971, loss: 0.3019166886806488, mean loss: 0.338558142646914
Epoch: 79, step: 972, loss: 0.3483535349369049, mean loss: 0.33855822778796074
Epoch: 79, step: 973, loss: 0.3300289213657379, mean loss: 0.3385581536523117
Epoch: 79, step: 974, loss: 0.27496016025543213, mean loss: 0.33855760087142844
Epoch: 79, step: 975, loss: 0.32418566942214966, mean loss: 0.3385574759545956
Epoch: 79, step: 976, loss: 0.32544800639152527, mean loss: 0.33855736201172093
Epoch: 79, step: 977, loss: 0.3227311074733734, mean loss: 0.3385572244567073
Epoch: 79, step: 978, loss: 0.32711195945739746, mean loss: 0.3385571249802395
Epoch: 79, step: 979, loss: 0.36304375529289246, mean loss: 0.33855733780382374
Epoch: 79, step: 980, loss: 0.3303183615207672, mean loss: 0.33855726619604426
Epoch: 79, step: 981, loss: 0.2974413335323334, mean loss: 0.33855690884642353
Epoch: 79, step: 982, loss: 0.319315642118454, mean loss: 0.3385567416168567
Epoch: 79, step: 983, loss: 0.31147921085357666, mean loss: 0.33855650628285044
Epoch: 79, step: 984, loss: 0.3371178209781647, mean loss: 0.33855649377917585
Epoch: 79, step: 985, loss: 0.3132142722606659, mean loss: 0.33855627353077483
Epoch: 79, step: 986, loss: 0.31602081656455994, mean loss: 0.33855607767757295
Epoch: 79, step: 987, loss: 0.3117680549621582, mean loss: 0.3385558448678087
Epoch: 79, step: 988, loss: 0.2993800938129425, mean loss: 0.33855550440154136
Epoch: 79, step: 989, loss: 0.3406442403793335, mean loss: 0.338555522554045
Epoch: 79, step: 990, loss: 0.31714266538619995, mean loss: 0.33855533646370484
Epoch: 79, step: 991, loss: 0.2990599274635315, mean loss: 0.3385549932283223
Epoch: 79, step: 992, loss: 0.3413538932800293, mean loss: 0.3385550175519894
Epoch: 79, step: 993, loss: 0.32898324728012085, mean loss: 0.3385549343698371
Epoch: 79, step: 994, loss: 0.33360546827316284, mean loss: 0.33855489135755684
Epoch: 79, step: 995, loss: 0.3427944779396057, mean loss: 0.33855492820046024
Epoch: 79, step: 996, loss: 0.3455846309661865, mean loss: 0.3385549892895321
Epoch: 79, step: 997, loss: 0.30946826934814453, mean loss: 0.3385547365241816
Epoch: 79, step: 998, loss: 0.3385329842567444, mean loss: 0.33855473633515476
Epoch: 79, step: 999, loss: 0.33035603165626526, mean loss: 0.3385546650891549
Epoch: 79, step: 1000, loss: 0.3105921149253845, mean loss: 0.33855442209924236
Epoch: 79, step: 1001, loss: 0.3252655863761902, mean loss: 0.3385543066224725
Epoch: 79, step: 1002, loss: 0.3073901832103729, mean loss: 0.3385540358161272
Epoch: 79, step: 1003, loss: 0.3093656301498413, mean loss: 0.3385537821803463
Epoch: 79, step: 1004, loss: 0.3042480945587158, mean loss: 0.33855348407998553
Epoch: 79, step: 1005, loss: 0.36247095465660095, mean loss: 0.33855369190979884
Epoch: 79, step: 1006, loss: 0.32874077558517456, mean loss: 0.33855360664163303
Epoch: 79, step: 1007, loss: 0.3448299765586853, mean loss: 0.3385536611789268
Epoch: 79, step: 1008, loss: 0.33671125769615173, mean loss: 0.33855364516985975
Epoch: 79, step: 1009, loss: 0.33081766963005066, mean loss: 0.3385535779507754
Epoch: 79, step: 1010, loss: 0.43115296959877014, mean loss: 0.33855438255417675
Epoch: 79, step: 1011, loss: 0.31686845421791077, mean loss: 0.3385541941250761
Epoch: 79, step: 1012, loss: 0.36374518275260925, mean loss: 0.33855441300775496
Epoch: 79, step: 1013, loss: 0.34972065687179565, mean loss: 0.3385545100295976
Epoch: 79, step: 1014, loss: 0.3446768820285797, mean loss: 0.3385545632255208
Epoch: 79, step: 1015, loss: 0.31356093287467957, mean loss: 0.33855434606333445
Epoch: 79, step: 1016, loss: 0.36816802620887756, mean loss: 0.33855460336551746
Epoch: 79, step: 1017, loss: 0.33825773000717163, mean loss: 0.3385546007861184
Epoch: 79, step: 1018, loss: 0.31823620200157166, mean loss: 0.3385544242502238
Epoch: 79, step: 1019, loss: 0.35676053166389465, mean loss: 0.3385545824321538
Epoch: 79, step: 1020, loss: 0.3563121259212494, mean loss: 0.33855473671544084
Epoch: 79, step: 1021, loss: 0.32012686133384705, mean loss: 0.33855457660948435
Epoch: 79, step: 1022, loss: 0.33856379985809326, mean loss: 0.3385545766896175
Epoch: 79, step: 1023, loss: 0.3911697268486023, mean loss: 0.3385550338151619
Epoch: 79, step: 1024, loss: 0.36449071764945984, mean loss: 0.33855525914494905
Epoch: 79, step: 1025, loss: 0.31747180223464966, mean loss: 0.33855507597300666
Epoch: 79, step: 1026, loss: 0.33298012614250183, mean loss: 0.3385550275385625
Epoch: 79, step: 1027, loss: 0.3557654619216919, mean loss: 0.3385551770592949
Epoch: 79, step: 1028, loss: 0.3152652084827423, mean loss: 0.33855497472257123
Epoch: 79, step: 1029, loss: 0.35265734791755676, mean loss: 0.3385550972389752
Epoch: 79, step: 1030, loss: 0.3152601718902588, mean loss: 0.33855489486270485
Epoch: 79, step: 1031, loss: 0.34380584955215454, mean loss: 0.3385549404803395
Epoch: 79, step: 1032, loss: 0.3297806978225708, mean loss: 0.3385548642548258
Epoch: 79, step: 1033, loss: 0.3345894515514374, mean loss: 0.3385548298059273
Epoch: 79, step: 1034, loss: 0.3237091302871704, mean loss: 0.3385547008373707
Epoch: 79, step: 1035, loss: 0.3394707441329956, mean loss: 0.3385547087952143
Epoch: 79, step: 1036, loss: 0.3248198330402374, mean loss: 0.3385545894787535
Epoch: 79, step: 1037, loss: 0.337705135345459, mean loss: 0.3385545820995109
Epoch: 79, step: 1038, loss: 0.3057122826576233, mean loss: 0.33855429679959825
Epoch: 79, step: 1039, loss: 0.34013888239860535, mean loss: 0.33855431056471863
Epoch: 79, step: 1040, loss: 0.35165542364120483, mean loss: 0.33855442437165484
Epoch: 79, step: 1041, loss: 0.3152444660663605, mean loss: 0.33855422188413503
Epoch: 79, step: 1042, loss: 0.3485102951526642, mean loss: 0.338554308369192
Epoch: 79, step: 1043, loss: 0.331447035074234, mean loss: 0.33855424663123773
Epoch: 79, step: 1044, loss: 0.3185478448867798, mean loss: 0.33855407284537986
Epoch: 79, step: 1045, loss: 0.33859604597091675, mean loss: 0.33855407320997677
Epoch: 79, step: 1046, loss: 0.3555173873901367, mean loss: 0.3385542205594567
Epoch: 79, step: 1047, loss: 0.3183397054672241, mean loss: 0.33855404497039543
Epoch: 79, step: 1048, loss: 0.31165483593940735, mean loss: 0.3385538113181997
Epoch: 79, step: 1049, loss: 0.3206162452697754, mean loss: 0.33855365551007605
Epoch: 79, step: 1050, loss: 0.34723156690597534, mean loss: 0.33855373088693286
Epoch: 79, step: 1051, loss: 0.402288019657135, mean loss: 0.33855428448196423
Epoch: 79, step: 1052, loss: 0.3016594648361206, mean loss: 0.3385539640169237
Epoch: 79, step: 1053, loss: 0.321012943983078, mean loss: 0.3385538116585459
Epoch: 79, step: 1054, loss: 0.3302830159664154, mean loss: 0.33855373982041637
Epoch: 79, step: 1055, loss: 0.31889140605926514, mean loss: 0.3385535690396277
Epoch: 79, step: 1056, loss: 0.3696174919605255, mean loss: 0.3385538388486566
Epoch: 79, step: 1057, loss: 0.31330156326293945, mean loss: 0.338553619519218
Epoch: 79, step: 1058, loss: 0.3205829858779907, mean loss: 0.3385534634360665
Epoch: 79, step: 1059, loss: 0.32870158553123474, mean loss: 0.33855337786875567
Epoch: 79, step: 1060, loss: 0.308297336101532, mean loss: 0.3385531150857948
Epoch: 79, step: 1061, loss: 0.2972885072231293, mean loss: 0.33855275669318885
Epoch: 79, step: 1062, loss: 0.3181607127189636, mean loss: 0.33855257958513707
Epoch: 79, step: 1063, loss: 0.3422758877277374, mean loss: 0.3385526119223626
Epoch: 79, step: 1064, loss: 0.32318195700645447, mean loss: 0.3385524784281692
Epoch: 79, step: 1065, loss: 0.32492125034332275, mean loss: 0.33855236004193234
Epoch: 79, step: 1066, loss: 0.31231939792633057, mean loss: 0.33855213221251923
Epoch: 79, step: 1067, loss: 0.334250807762146, mean loss: 0.3385520948564742
Epoch: 79, step: 1068, loss: 0.3138010799884796, mean loss: 0.3385518799012884
Epoch: 79, step: 1069, loss: 0.31410959362983704, mean loss: 0.33855166762916195
Epoch: 79, step: 1070, loss: 0.34820041060447693, mean loss: 0.3385517514241629
Epoch: 79, step: 1071, loss: 0.3554779887199402, mean loss: 0.3385518984196582
Epoch: 79, step: 1072, loss: 0.34294065833091736, mean loss: 0.3385519365334057
Epoch: 79, step: 1073, loss: 0.3015470802783966, mean loss: 0.338551615171215
Epoch: 79, step: 1074, loss: 0.32983478903770447, mean loss: 0.3385515394721231
Epoch: 79, step: 1075, loss: 0.3451905846595764, mean loss: 0.33855159712674643
Epoch: 79, step: 1076, loss: 0.31755927205085754, mean loss: 0.33855141482732676
Epoch: 79, step: 1077, loss: 0.3370439410209656, mean loss: 0.33855140173638937
Epoch: 79, step: 1078, loss: 0.3146861791610718, mean loss: 0.3385511944920441
Epoch: 79, step: 1079, loss: 0.29781651496887207, mean loss: 0.3385508407572885
Epoch: 79, step: 1080, loss: 0.33351999521255493, mean loss: 0.3385507970704475
Epoch: 79, step: 1081, loss: 0.3450978994369507, mean loss: 0.3385508539236611
Epoch: 79, step: 1082, loss: 0.3034110367298126, mean loss: 0.3385505487819249
Epoch: 79, step: 1083, loss: 0.3461001217365265, mean loss: 0.3385506143391753
Epoch: 79, step: 1084, loss: 0.3323844373226166, mean loss: 0.3385505607952063
Epoch: 79, step: 1085, loss: 0.3816550672054291, mean loss: 0.3385509350897341
Epoch: 79, step: 1086, loss: 0.31961289048194885, mean loss: 0.33855077064416905
Epoch: 79, step: 1087, loss: 0.32835519313812256, mean loss: 0.3385506821132262
Epoch: 79, step: 1088, loss: 0.3086932301521301, mean loss: 0.33855042285518805
Epoch: 79, step: 1089, loss: 0.35544291138648987, mean loss: 0.33855056953466406
Epoch: 79, step: 1090, loss: 0.31745824217796326, mean loss: 0.3385503863890811
Epoch: 79, step: 1091, loss: 0.3549550771713257, mean loss: 0.33855052883047787
Epoch: 79, step: 1092, loss: 0.37366029620170593, mean loss: 0.33855083368479955
Epoch: 79, step: 1093, loss: 0.3577680289745331, mean loss: 0.33855100054418386
Epoch: 79, step: 1094, loss: 0.3169218897819519, mean loss: 0.3385508127442102
Epoch: 79, step: 1095, loss: 0.33974114060401917, mean loss: 0.33855082307942935
Epoch: 79, step: 1096, loss: 0.38233861327171326, mean loss: 0.3385512032708821
Epoch: 79, step: 1097, loss: 0.3266368806362152, mean loss: 0.3385510998245953
Epoch: 79, step: 1098, loss: 0.3479311764240265, mean loss: 0.3385511812665454
Epoch: 79, step: 1099, loss: 0.34161075949668884, mean loss: 0.3385512078309184
Epoch: 79, step: 1100, loss: 0.3567049205303192, mean loss: 0.33855136544669845
Epoch: 79, step: 1101, loss: 0.3118077218532562, mean loss: 0.3385511332526719
Epoch: 79, step: 1102, loss: 0.32833629846572876, mean loss: 0.3385510445660642
Epoch: 79, step: 1103, loss: 0.36460721492767334, mean loss: 0.3385512707873731
Epoch: 79, step: 1104, loss: 0.3266943395137787, mean loss: 0.33855116784564426
Epoch: 79, step: 1105, loss: 0.3284941017627716, mean loss: 0.3385510805310805
Epoch: 79, step: 1106, loss: 0.29880115389823914, mean loss: 0.3385507354287075
Epoch: 79, step: 1107, loss: 0.3321804404258728, mean loss: 0.3385506801233265
Epoch: 79, step: 1108, loss: 0.28323718905448914, mean loss: 0.3385501999089664
Epoch: 79, step: 1109, loss: 0.34977635741233826, mean loss: 0.3385502973700945
Epoch: 79, step: 1110, loss: 0.32632920145988464, mean loss: 0.33855019127221964
Epoch: 79, step: 1111, loss: 0.30694466829299927, mean loss: 0.3385499168901401
Epoch: 79, step: 1112, loss: 0.30967479944229126, mean loss: 0.33854966621414284
Epoch: 79, step: 1113, loss: 0.3543134927749634, mean loss: 0.3385498030647945
Epoch: 79, step: 1114, loss: 0.3421704173088074, mean loss: 0.33854983449619314
Epoch: 79, step: 1115, loss: 0.2880589962005615, mean loss: 0.33854939617722746
Epoch: 79, step: 1116, loss: 0.34138062596321106, mean loss: 0.33854942075536837
Epoch: 79, step: 1117, loss: 0.3401522934436798, mean loss: 0.3385494346699185
Epoch: 79, step: 1118, loss: 0.3256296217441559, mean loss: 0.33854932251389674
Epoch: 79, step: 1119, loss: 0.31436920166015625, mean loss: 0.338549112609726
Epoch: 79, step: 1120, loss: 0.30191540718078613, mean loss: 0.3385487946005293
Epoch: 79, step: 1121, loss: 0.30493584275245667, mean loss: 0.33854850281636767
Epoch: 79, step: 1122, loss: 0.3341509997844696, mean loss: 0.33854846464326693
Epoch: 79, step: 1123, loss: 0.3079518973827362, mean loss: 0.33854819904806505
Epoch: 79, step: 1124, loss: 0.3453097641468048, mean loss: 0.33854825774169706
Epoch: 79, step: 1125, loss: 0.3419848680496216, mean loss: 0.33854828757286587
Epoch: 79, step: 1126, loss: 0.34471872448921204, mean loss: 0.3385483411342915
Epoch: 79, step: 1127, loss: 0.28005871176719666, mean loss: 0.338547833429443
Epoch: 79, step: 1128, loss: 0.2968716025352478, mean loss: 0.33854747167230664
Epoch: 79, step: 1129, loss: 0.3470038175582886, mean loss: 0.3385475450742639
Epoch: 79, step: 1130, loss: 0.3691762089729309, mean loss: 0.3385478109319279
Epoch: 79, step: 1131, loss: 0.3544943034648895, mean loss: 0.3385479493467301
Epoch: 79, step: 1132, loss: 0.3276638984680176, mean loss: 0.33854785487450245
Epoch: 79, step: 1133, loss: 0.35825490951538086, mean loss: 0.3385480259278367
Epoch: 79, step: 1134, loss: 0.3612961769104004, mean loss: 0.3385482233755716
Epoch: 79, step: 1135, loss: 0.3406323790550232, mean loss: 0.3385482414653164
Epoch: 79, step: 1136, loss: 0.3325091004371643, mean loss: 0.33854818904813233
Epoch: 79, step: 1137, loss: 0.31582093238830566, mean loss: 0.338547991786891
Epoch: 79, step: 1138, loss: 0.3049612045288086, mean loss: 0.33854770027287584
Epoch: 79, step: 1139, loss: 0.33350682258605957, mean loss: 0.3385476565213336
Epoch: 79, step: 1140, loss: 0.313340425491333, mean loss: 0.33854743774084955
Epoch: 79, step: 1141, loss: 0.3064058721065521, mean loss: 0.3385471587777914
Epoch: 79, step: 1142, loss: 0.32927432656288147, mean loss: 0.33854707829772984
Epoch: 79, step: 1143, loss: 0.32949763536453247, mean loss: 0.33854699975717323
Epoch: 79, step: 1144, loss: 0.32916024327278137, mean loss: 0.3385469182897629
Epoch: 79, step: 1145, loss: 0.3488878011703491, mean loss: 0.338547008037232
Epoch: 79, step: 1146, loss: 0.3245300352573395, mean loss: 0.33854688638640895
Epoch: 79, step: 1147, loss: 0.36318814754486084, mean loss: 0.3385471002416922
Epoch: 79, step: 1148, loss: 0.3039209544658661, mean loss: 0.3385467997327247
Epoch: 79, step: 1149, loss: 0.33345383405685425, mean loss: 0.3385467555329289
Epoch: 79, step: 1150, loss: 0.29867246747016907, mean loss: 0.3385464094830616
Epoch: 79, step: 1151, loss: 0.31123456358909607, mean loss: 0.3385461724586761
Epoch: 79, step: 1152, loss: 0.31249281764030457, mean loss: 0.3385459463579999
Epoch: 79, step: 1153, loss: 0.31700563430786133, mean loss: 0.33854575942480497
Epoch: 79, step: 1154, loss: 0.3318590819835663, mean loss: 0.33854570139634527
Epoch: 79, step: 1155, loss: 0.31437915563583374, mean loss: 0.338545491675558
Epoch: 79, step: 1156, loss: 0.30505236983299255, mean loss: 0.3385452010199138
Epoch: 79, step: 1157, loss: 0.3455774188041687, mean loss: 0.3385452620454599
Epoch: 79, step: 1158, loss: 0.29497605562210083, mean loss: 0.33854488395541416
Epoch: 79, step: 1159, loss: 0.2947149872779846, mean loss: 0.33854450360642013
Epoch: 79, step: 1160, loss: 0.36812612414360046, mean loss: 0.3385447603088728
Epoch: 79, step: 1161, loss: 0.33985570073127747, mean loss: 0.3385447716848115
Epoch: 79, step: 1162, loss: 0.3710145950317383, mean loss: 0.3385450534455292
Epoch: 79, step: 1163, loss: 0.29531827569007874, mean loss: 0.33854467834332724
Epoch: 79, step: 1164, loss: 0.27860549092292786, mean loss: 0.33854415822299316
Epoch: 79, step: 1165, loss: 0.31940850615501404, mean loss: 0.33854399217544046
Epoch: 79, step: 1166, loss: 0.3228566348552704, mean loss: 0.33854385605127396
Epoch: 79, step: 1167, loss: 0.3218899965286255, mean loss: 0.3385437115417158
Epoch: 79, step: 1168, loss: 0.3680463135242462, mean loss: 0.33854396754069177
Epoch: 79, step: 1169, loss: 0.32230469584465027, mean loss: 0.33854382663105764
Epoch: 79, step: 1170, loss: 0.32056963443756104, mean loss: 0.3385436706687142
Epoch: 79, step: 1171, loss: 0.3479110896587372, mean loss: 0.3385437519492483
Epoch: 79, step: 1172, loss: 0.3199998736381531, mean loss: 0.33854359104652193
Epoch: 79, step: 1173, loss: 0.31727975606918335, mean loss: 0.3385434065447
Epoch: 79, step: 1174, loss: 0.36413219571113586, mean loss: 0.3385436285713129
Epoch: 79, step: 1175, loss: 0.32292479276657104, mean loss: 0.3385434930523128
Epoch: 79, step: 1176, loss: 0.31304270029067993, mean loss: 0.33854327179305915
Epoch: 79, step: 1177, loss: 0.3461173176765442, mean loss: 0.3385433375091808
Epoch: 79, step: 1178, loss: 0.33987024426460266, mean loss: 0.3385433490219721
Epoch: 79, step: 1179, loss: 0.349104106426239, mean loss: 0.3385434406506717
Epoch: 79, step: 1180, loss: 0.3020724058151245, mean loss: 0.3385431242183957
Epoch: 79, step: 1181, loss: 0.3458993434906006, mean loss: 0.3385431880423322
Epoch: 79, step: 1182, loss: 0.2981267273426056, mean loss: 0.33854283738459007
Epoch: 79, step: 1183, loss: 0.29751670360565186, mean loss: 0.3385424814403442
Epoch: 79, step: 1184, loss: 0.30732402205467224, mean loss: 0.33854221059019207
Epoch: 79, step: 1185, loss: 0.347549170255661, mean loss: 0.3385422887335495
Epoch: 79, step: 1186, loss: 0.38810306787490845, mean loss: 0.33854271871350095
Epoch: 79, step: 1187, loss: 0.3208274245262146, mean loss: 0.3385425650202907
Epoch: 79, step: 1188, loss: 0.32618555426597595, mean loss: 0.33854245781506137
Epoch: 79, step: 1189, loss: 0.33525145053863525, mean loss: 0.33854242926364747
Epoch: 79, step: 1190, loss: 0.3288658559322357, mean loss: 0.3385423453144397
Epoch: 79, step: 1191, loss: 0.3223220705986023, mean loss: 0.3385422045965066
Epoch: 79, step: 1192, loss: 0.3321300148963928, mean loss: 0.3385421489684565
Epoch: 79, step: 1193, loss: 0.2870168089866638, mean loss: 0.338541701971493
Epoch: 79, step: 1194, loss: 0.36068597435951233, mean loss: 0.3385418940776809
Epoch: 79, step: 1195, loss: 0.3337576985359192, mean loss: 0.33854185257414543
Epoch: 79, step: 1196, loss: 0.30469441413879395, mean loss: 0.33854155894564236
Epoch: 79, step: 1197, loss: 0.3241959810256958, mean loss: 0.33854143449799656
Epoch: 79, step: 1198, loss: 0.35372957587242126, mean loss: 0.33854156625372306
Epoch: 79, step: 1199, loss: 0.3497152626514435, mean loss: 0.3385416631836686
Epoch: 79, step: 1200, loss: 0.3203269839286804, mean loss: 0.3385415051757463
Epoch: 79, step: 1201, loss: 0.3200969099998474, mean loss: 0.3385413451747472
Epoch: 79, step: 1202, loss: 0.32800108194351196, mean loss: 0.33854125374210786
Epoch: 79, step: 1203, loss: 0.33355003595352173, mean loss: 0.33854121044563157
Epoch: 79, step: 1204, loss: 0.34997454285621643, mean loss: 0.33854130962357426
Epoch: 79, step: 1205, loss: 0.33804571628570557, mean loss: 0.3385413053246088
Epoch: 79, step: 1206, loss: 0.31882962584495544, mean loss: 0.3385411343394724
Epoch: 79, step: 1207, loss: 0.29739469289779663, mean loss: 0.33854077742575117
Epoch: 79, step: 1208, loss: 0.32470691204071045, mean loss: 0.3385406574286537
Epoch: 79, step: 1209, loss: 0.3771217167377472, mean loss: 0.338540992083853
Epoch: 79, step: 1210, loss: 0.2871636152267456, mean loss: 0.3385405464362357
Epoch: 79, step: 1211, loss: 0.3203197717666626, mean loss: 0.3385403883905183
Epoch: 79, step: 1212, loss: 0.3620958626270294, mean loss: 0.33854059270727216
Epoch: 79, step: 1213, loss: 0.3895640969276428, mean loss: 0.33854103527388
Epoch: 79, step: 1214, loss: 0.2973116338253021, mean loss: 0.3385406776622586
Epoch: 79, step: 1215, loss: 0.37841275334358215, mean loss: 0.33854102349783854
Epoch: 79, step: 1216, loss: 0.2963743209838867, mean loss: 0.3385406577626897
Epoch: 79, step: 1217, loss: 0.353530615568161, mean loss: 0.33854078777776253
Epoch: 79, step: 1218, loss: 0.34126144647598267, mean loss: 0.33854081137513187
Epoch: 79, step: 1219, loss: 0.3554324209690094, mean loss: 0.33854095788159866
Epoch: 79, step: 1220, loss: 0.3662508428096771, mean loss: 0.338541198216429
Epoch: 79, step: 1221, loss: 0.33627909421920776, mean loss: 0.3385411785967999
Epoch: 79, step: 1222, loss: 0.3018980324268341, mean loss: 0.3385408607870516
Epoch: 79, step: 1223, loss: 0.3119502067565918, mean loss: 0.33854063016559427
Epoch: 79, step: 1224, loss: 0.3122977316379547, mean loss: 0.33854040256220375
Epoch: 79, step: 1225, loss: 0.34606027603149414, mean loss: 0.3385404677811372
Epoch: 79, step: 1226, loss: 0.31722143292427063, mean loss: 0.3385402828853855
Epoch: 79, step: 1227, loss: 0.3832746744155884, mean loss: 0.3385406708545065
Epoch: 79, step: 1228, loss: 0.31453317403793335, mean loss: 0.3385404626458701
Epoch: 79, step: 1229, loss: 0.3039071559906006, mean loss: 0.3385401622859005
Epoch: 79, step: 1230, loss: 0.3342064321041107, mean loss: 0.3385401247016239
Epoch: 79, step: 1231, loss: 0.33805859088897705, mean loss: 0.338540120525558
Epoch: 79, step: 1232, loss: 0.3011910021305084, mean loss: 0.3385397966209331
Epoch: 79, step: 1233, loss: 0.34499475359916687, mean loss: 0.33853985260009345
Epoch: 79, step: 1234, loss: 0.31075912714004517, mean loss: 0.33853961168009916
Epoch: 79, step: 1235, loss: 0.355861634016037, mean loss: 0.3385397618988304
Epoch: 79, step: 1236, loss: 0.3765672743320465, mean loss: 0.3385400916752861
Epoch: 79, step: 1237, loss: 0.3547362983226776, mean loss: 0.33854023212836765
Epoch: 79, step: 1238, loss: 0.3011918365955353, mean loss: 0.33853990824686453
Epoch: 79, step: 1239, loss: 0.3223212659358978, mean loss: 0.3385397676016608
Epoch: 79, step: 1240, loss: 0.3489629626274109, mean loss: 0.33853985798898467
Epoch: 79, step: 1241, loss: 0.30923596024513245, mean loss: 0.3385396038751625
Epoch: 79, step: 1242, loss: 0.319643497467041, mean loss: 0.33853944001572556
Epoch: 79, step: 1243, loss: 0.32253941893577576, mean loss: 0.33853930127117926
Epoch: 79, step: 1244, loss: 0.32128775119781494, mean loss: 0.3385391516752681
Epoch: 79, step: 1245, loss: 0.31632211804389954, mean loss: 0.3385389590230974
Epoch: 79, step: 1246, loss: 0.296021431684494, mean loss: 0.3385385903409842
Epoch: 79, step: 1247, loss: 0.31158503890037537, mean loss: 0.3385383566207574
Epoch: 79, step: 1248, loss: 0.3449443280696869, mean loss: 0.33853841216787595
Epoch: 79, step: 1249, loss: 0.3229457437992096, mean loss: 0.33853827696273253
Epoch: 79, step: 1250, loss: 0.2857140898704529, mean loss: 0.33853781892439727
Epoch: 79, step: 1251, loss: 0.3376915752887726, mean loss: 0.3385378115866854
Epoch: 79, step: 1252, loss: 0.3053440749645233, mean loss: 0.3385375237689065
Epoch: 79, step: 1253, loss: 0.3062058687210083, mean loss: 0.338537243428535
Epoch: 79, step: 1254, loss: 0.32349467277526855, mean loss: 0.33853711299898304
Epoch: 79, step: 1255, loss: 0.32904407382011414, mean loss: 0.3385370306884432
Epoch: 79, step: 1256, loss: 0.32302436232566833, mean loss: 0.3385368961851496
Epoch: 79, step: 1257, loss: 0.3634760081768036, mean loss: 0.3385371124189748
Epoch: 79, step: 1258, loss: 0.3450865149497986, mean loss: 0.3385371692048813
Epoch: 79, step: 1259, loss: 0.36853840947151184, mean loss: 0.3385374293252277
Epoch: 79, step: 1260, loss: 0.32091277837753296, mean loss: 0.33853727651519316
Epoch: 79, step: 1261, loss: 0.32501497864723206, mean loss: 0.3385371592745798
Epoch: 79, step: 1262, loss: 0.32330530881881714, mean loss: 0.33853702721300083
Epoch: 79, step: 1263, loss: 0.3141528367996216, mean loss: 0.33853681580160483
Epoch: 79, step: 1264, loss: 0.3329937756061554, mean loss: 0.3385367677437573
Epoch: 79, step: 1265, loss: 0.3336845338344574, mean loss: 0.33853672567552623
Epoch: 79, step: 1266, loss: 0.3726624846458435, mean loss: 0.338537021538812
Epoch: 79, step: 1267, loss: 0.3227153420448303, mean loss: 0.33853688436930607
Epoch: 79, step: 1268, loss: 0.37689757347106934, mean loss: 0.3385372169427952
Epoch: 79, step: 1269, loss: 0.32828304171562195, mean loss: 0.3385371280435249
Epoch: 79, step: 1270, loss: 0.32999876141548157, mean loss: 0.3385370540202159
Epoch: 79, step: 1271, loss: 0.3255035877227783, mean loss: 0.3385369410276517
Epoch: 79, step: 1272, loss: 0.38397902250289917, mean loss: 0.3385373349806246
Epoch: 79, step: 1273, loss: 0.2874850630760193, mean loss: 0.3385368923948257
Epoch: 79, step: 1274, loss: 0.2993508279323578, mean loss: 0.33853655268329774
Epoch: 79, step: 1275, loss: 0.3381728231906891, mean loss: 0.33853654953008416
Epoch: 79, step: 1276, loss: 0.3085486590862274, mean loss: 0.3385362895638029
Epoch: 79, step: 1277, loss: 0.2965192198753357, mean loss: 0.33853592531921933
Epoch: 79, step: 1278, loss: 0.33985769748687744, mean loss: 0.3385359367775191
Epoch: 79, step: 1279, loss: 0.3283578157424927, mean loss: 0.3385358485452552
Epoch: 79, step: 1280, loss: 0.3630583584308624, mean loss: 0.33853606112455153
Epoch: 79, step: 1281, loss: 0.3339631259441376, mean loss: 0.3385360214833027
Epoch: 79, step: 1282, loss: 0.37305495142936707, mean loss: 0.3385363207137914
Epoch: 79, step: 1283, loss: 0.3431323766708374, mean loss: 0.33853636055477576
Epoch: 79, step: 1284, loss: 0.365066260099411, mean loss: 0.33853659052763957
Epoch: 79, step: 1285, loss: 0.30886903405189514, mean loss: 0.3385363333584116
Epoch: 79, step: 1286, loss: 0.3167617619037628, mean loss: 0.3385361446101001
Epoch: 79, step: 1287, loss: 0.3624671399593353, mean loss: 0.33853635204912225
Epoch: 79, step: 1288, loss: 0.38127219676971436, mean loss: 0.338536722489418
Epoch: 79, step: 1289, loss: 0.33320438861846924, mean loss: 0.33853667626840084
Epoch: 79, step: 1290, loss: 0.30255094170570374, mean loss: 0.33853636434441425
Epoch: 79, step: 1291, loss: 0.36938661336898804, mean loss: 0.3385366317517458
Epoch: 79, step: 1292, loss: 0.3865387439727783, mean loss: 0.3385370478263605
Epoch: 79, step: 1293, loss: 0.35770249366760254, mean loss: 0.3385372139479332
Epoch: 79, step: 1294, loss: 0.34200942516326904, mean loss: 0.3385372440439817
Epoch: 79, step: 1295, loss: 0.34880879521369934, mean loss: 0.3385373330738258
Epoch: 79, step: 1296, loss: 0.33377012610435486, mean loss: 0.3385372917538725
Epoch: 79, step: 1297, loss: 0.3236621916294098, mean loss: 0.33853716282447655
Epoch: 79, step: 1298, loss: 0.33851855993270874, mean loss: 0.338537162663238
Epoch: 79, step: 1299, loss: 0.3044847846031189, mean loss: 0.33853686752059087
Epoch: 79, step: 1300, loss: 0.31798839569091797, mean loss: 0.3385366894220805
Epoch: 79, step: 1301, loss: 0.3677886128425598, mean loss: 0.3385369429532859
Epoch: 79, step: 1302, loss: 0.3276582956314087, mean loss: 0.33853684866708716
Epoch: 79, step: 1303, loss: 0.2861131429672241, mean loss: 0.33853639431013016
Epoch: 79, step: 1304, loss: 0.3398389220237732, mean loss: 0.3385364055990574
Epoch: 79, step: 1305, loss: 0.3324986398220062, mean loss: 0.3385363532705679
Epoch: 79, step: 1306, loss: 0.4036843478679657, mean loss: 0.3385369178944258
Epoch: 79, step: 1307, loss: 0.4170632064342499, mean loss: 0.3385375984592228
Epoch: 79, step: 1308, loss: 0.3946009874343872, mean loss: 0.3385380843403077
Epoch: 79, step: 1309, loss: 0.36200618743896484, mean loss: 0.3385382877280939
Epoch: 79, step: 1310, loss: 0.30660831928253174, mean loss: 0.3385380110074196
Epoch: 79, step: 1311, loss: 0.3459969758987427, mean loss: 0.3385380756498858
Epoch: 79, step: 1312, loss: 0.3402864933013916, mean loss: 0.338538090802263
Epoch: 79, step: 1313, loss: 0.3435666263103485, mean loss: 0.3385381343808704
Epoch: 79, step: 1314, loss: 0.3773983120918274, mean loss: 0.3385384711504426
Epoch: 79, step: 1315, loss: 0.33032503724098206, mean loss: 0.33853839997190416
Epoch: 79, step: 1316, loss: 0.3418845236301422, mean loss: 0.33853842896953534
Epoch: 79, step: 1317, loss: 0.3205035924911499, mean loss: 0.3385382726803307
Epoch: 79, step: 1318, loss: 0.31296539306640625, mean loss: 0.3385380510686524
Epoch: 79, step: 1319, loss: 0.33243051171302795, mean loss: 0.3385379981418668
Epoch: 79, step: 1320, loss: 0.35845237970352173, mean loss: 0.33853817071465087
Epoch: 79, step: 1321, loss: 0.3188495635986328, mean loss: 0.3385380000998472
Epoch: 79, step: 1322, loss: 0.3115094006061554, mean loss: 0.33853776588118417
Epoch: 79, step: 1323, loss: 0.2991630434989929, mean loss: 0.3385374246790838
Epoch: 79, step: 1324, loss: 0.36573517322540283, mean loss: 0.33853766035943794
Epoch: 79, step: 1325, loss: 0.364204078912735, mean loss: 0.3385378827682225
Epoch: 79, step: 1326, loss: 0.2910712957382202, mean loss: 0.33853747145667057
Epoch: 79, step: 1327, loss: 0.3727364242076874, mean loss: 0.3385377677978091
Epoch: 79, step: 1328, loss: 0.3398159444332123, mean loss: 0.33853777887338327
Epoch: 79, step: 1329, loss: 0.32114192843437195, mean loss: 0.33853762813728255
Epoch: 79, step: 1330, loss: 0.3321232199668884, mean loss: 0.3385375725565277
Epoch: 79, step: 1331, loss: 0.3390044867992401, mean loss: 0.3385375766022979
Epoch: 79, step: 1332, loss: 0.3288966417312622, mean loss: 0.33853749306518316
Epoch: 79, step: 1333, loss: 0.3483218848705292, mean loss: 0.338537577844594
Epoch: 79, step: 1334, loss: 0.3349078893661499, mean loss: 0.3385375463944854
Epoch: 79, step: 1335, loss: 0.3324356973171234, mean loss: 0.33853749352434126
Epoch: 79, step: 1336, loss: 0.3253357410430908, mean loss: 0.3385373791372923
Epoch: 79, step: 1337, loss: 0.34550049901008606, mean loss: 0.33853743946896675
Epoch: 79, step: 1338, loss: 0.2986780107021332, mean loss: 0.3385370941115282
Epoch: 79, step: 1339, loss: 0.35729631781578064, mean loss: 0.33853725664725726
Epoch: 79, step: 1340, loss: 0.325050413608551, mean loss: 0.33853713979408107
Epoch: 79, step: 1341, loss: 0.3218333423137665, mean loss: 0.3385369950697098
Epoch: 79, step: 1342, loss: 0.30561476945877075, mean loss: 0.33853670982875633
Epoch: 79, step: 1343, loss: 0.35163214802742004, mean loss: 0.33853682328775997
Epoch: 79, step: 1344, loss: 0.2969694435596466, mean loss: 0.33853646315069885
Epoch: 79, step: 1345, loss: 0.29947206377983093, mean loss: 0.33853612470222827
Epoch: 79, step: 1346, loss: 0.35865533351898193, mean loss: 0.3385362990107181
Epoch: 79, step: 1347, loss: 0.3030063211917877, mean loss: 0.3385359911893134
Epoch: 79, step: 1348, loss: 0.3159443736076355, mean loss: 0.33853579546379825
Epoch: 79, step: 1349, loss: 0.29999932646751404, mean loss: 0.3385354616008125
Epoch: 79, step: 1350, loss: 0.30663028359413147, mean loss: 0.3385351851908044
Epoch: 79, step: 1351, loss: 0.3340534567832947, mean loss: 0.33853514636375714
Epoch: 79, step: 1352, loss: 0.35499095916748047, mean loss: 0.3385352889259625
Epoch: 79, step: 1353, loss: 0.3159279525279999, mean loss: 0.3385350930727493
Epoch: 79, step: 1354, loss: 0.32614588737487793, mean loss: 0.3385349857427799
Epoch: 79, step: 1355, loss: 0.36366522312164307, mean loss: 0.3385352034487659
Epoch: 79, step: 1356, loss: 0.3164745569229126, mean loss: 0.33853501233663574
Epoch: 79, step: 1357, loss: 0.3629603981971741, mean loss: 0.33853522393275004
Epoch: 79, step: 1358, loss: 0.336581826210022, mean loss: 0.3385352070106924
Epoch: 79, step: 1359, loss: 0.2790028154850006, mean loss: 0.3385346912929655
Epoch: 79, step: 1360, loss: 0.2978156805038452, mean loss: 0.338534338555015
Epoch: 79, step: 1361, loss: 0.3240906596183777, mean loss: 0.3385342134343534
Epoch: 79, step: 1362, loss: 0.35860806703567505, mean loss: 0.33853438732579044
Epoch: 79, step: 1363, loss: 0.3313966393470764, mean loss: 0.33853432549498674
Epoch: 79, step: 1364, loss: 0.3144111633300781, mean loss: 0.3385341165296957
Epoch: 79, step: 1365, loss: 0.34090498089790344, mean loss: 0.338534137066973
Epoch: 79, step: 1366, loss: 0.3199601471424103, mean loss: 0.3385339761738056
Epoch: 79, step: 1367, loss: 0.3082367479801178, mean loss: 0.3385337137328975
Epoch: 79, step: 1368, loss: 0.36195066571235657, mean loss: 0.3385339165736613
Epoch: 79, step: 1369, loss: 0.33118733763694763, mean loss: 0.3385338529371651
Epoch: 79, step: 1370, loss: 0.31186527013778687, mean loss: 0.338533621934343
Epoch: 79, step: 1371, loss: 0.3184070289134979, mean loss: 0.338533447599638
Epoch: 79, step: 1372, loss: 0.3206220865249634, mean loss: 0.33853329245441305
Epoch: 79, step: 1373, loss: 0.3061312437057495, mean loss: 0.33853301179569717
Epoch: 79, step: 1374, loss: 0.3304294943809509, mean loss: 0.3385329416055956
Epoch: 79, step: 1375, loss: 0.3265036940574646, mean loss: 0.33853283741296536
Epoch: 79, step: 1376, loss: 0.3325745463371277, mean loss: 0.338532785805029
Epoch: 79, step: 1377, loss: 0.3192608654499054, mean loss: 0.33853261888209557
Epoch: 79, step: 1378, loss: 0.34462979435920715, mean loss: 0.33853267169206896
Epoch: 79, step: 1379, loss: 0.32152295112609863, mean loss: 0.3385325243656367
Epoch: 79, step: 1380, loss: 0.3294124901294708, mean loss: 0.3385324453748935
Epoch: 79, step: 1381, loss: 0.3403976559638977, mean loss: 0.33853246152977745
Epoch: 79, step: 1382, loss: 0.3510597348213196, mean loss: 0.33853257002953313
Epoch: 79, step: 1383, loss: 0.34537994861602783, mean loss: 0.3385326293347348
Epoch: 79, step: 1384, loss: 0.32597246766090393, mean loss: 0.3385325205520145
Epoch: 79, step: 1385, loss: 0.30017146468162537, mean loss: 0.3385321883123523
Epoch: 79, step: 1386, loss: 0.2934721112251282, mean loss: 0.33853179805679784
Epoch: 79, step: 1387, loss: 0.2896614670753479, mean loss: 0.33853137480512646
Epoch: 79, step: 1388, loss: 0.3397705852985382, mean loss: 0.33853138553747386
Epoch: 79, step: 1389, loss: 0.3197774887084961, mean loss: 0.338531223118261
Epoch: 79, step: 1390, loss: 0.41220805048942566, mean loss: 0.338531861195178
Epoch: 79, step: 1391, loss: 0.3910442888736725, mean loss: 0.33853231597423084
Epoch: 79, step: 1392, loss: 0.32353487610816956, mean loss: 0.3385321860914063
Epoch: 79, step: 1393, loss: 0.3624028265476227, mean loss: 0.33853239281731307
Epoch: 79, step: 1394, loss: 0.3109028935432434, mean loss: 0.338532153540791
Epoch: 79, step: 1395, loss: 0.3376716673374176, mean loss: 0.3385321460888875
Epoch: 79, step: 1396, loss: 0.3281225264072418, mean loss: 0.3385320559412367
Epoch: 79, step: 1397, loss: 0.30021175742149353, mean loss: 0.3385317240890577
Epoch: 79, step: 1398, loss: 0.3201359510421753, mean loss: 0.33853156478381374
Epoch: 79, step: 1399, loss: 0.3287854492664337, mean loss: 0.3385314803843237
Epoch: 79, step: 1400, loss: 0.33230385184288025, mean loss: 0.3385314264547226
Epoch: 79, step: 1401, loss: 0.30684712529182434, mean loss: 0.3385311520795069
Epoch: 79, step: 1402, loss: 0.30134132504463196, mean loss: 0.3385308300311082
Epoch: 79, step: 1403, loss: 0.3321553170681, mean loss: 0.33853077482230176
Epoch: 79, step: 1404, loss: 0.3349166214466095, mean loss: 0.3385307435257822
Epoch: 79, step: 1405, loss: 0.30168092250823975, mean loss: 0.3385304244299836
Epoch: 79, step: 1406, loss: 0.32732632756233215, mean loss: 0.338530327410536
Epoch: 79, step: 1407, loss: 0.3232209384441376, mean loss: 0.3385301948433495
Epoch: 79, step: 1408, loss: 0.36071211099624634, mean loss: 0.3385303869195166
Epoch: 79, step: 1409, loss: 0.29646462202072144, mean loss: 0.3385300226696084
Epoch: 79, step: 1410, loss: 0.345673531293869, mean loss: 0.33853008452513
Epoch: 79, step: 1411, loss: 0.3185783326625824, mean loss: 0.3385299117647405
Epoch: 79, step: 1412, loss: 0.3651657700538635, mean loss: 0.33853014240019746
Epoch: 79, step: 1413, loss: 0.302411288022995, mean loss: 0.3385298296557661
Epoch: 79, step: 1414, loss: 0.35170838236808777, mean loss: 0.3385299437646812
Epoch: 79, step: 1415, loss: 0.34984317421913147, mean loss: 0.3385300417215133
Epoch: 79, step: 1416, loss: 0.3204694092273712, mean loss: 0.33852988534292333
Epoch: 79, step: 1417, loss: 0.32846927642822266, mean loss: 0.33852979823355905
Epoch: 79, step: 1418, loss: 0.312136173248291, mean loss: 0.33852956970743253
Epoch: 79, step: 1419, loss: 0.3501870632171631, mean loss: 0.3385296706416078
Epoch: 79, step: 1420, loss: 0.32598981261253357, mean loss: 0.33852956206858836
Epoch: 79, step: 1421, loss: 0.32400667667388916, mean loss: 0.33852943632714355
Epoch: 79, step: 1422, loss: 0.3718472123146057, mean loss: 0.3385297247952341
Epoch: 79, step: 1423, loss: 0.3468230962753296, mean loss: 0.33852979659931615
Epoch: 79, step: 1424, loss: 0.3204159140586853, mean loss: 0.3385296397705221
Epoch: 79, step: 1425, loss: 0.34186145663261414, mean loss: 0.3385296686169218
Epoch: 79, step: 1426, loss: 0.32496798038482666, mean loss: 0.3385295512027574
Epoch: 79, step: 1427, loss: 0.37186262011528015, mean loss: 0.33852983979076223
Epoch: 79, step: 1428, loss: 0.34026527404785156, mean loss: 0.3385298548155166
Epoch: 79, step: 1429, loss: 0.3290767967700958, mean loss: 0.33852977297510967
Epoch: 79, step: 1430, loss: 0.34262269735336304, mean loss: 0.33852980840953684
Epoch: 79, step: 1431, loss: 0.3646339774131775, mean loss: 0.3385300344040048
Epoch: 79, step: 1432, loss: 0.3644784390926361, mean loss: 0.33853025904801254
Epoch: 79, step: 1433, loss: 0.3104685842990875, mean loss: 0.3385300161108231
Epoch: 79, step: 1434, loss: 0.3788914382457733, mean loss: 0.33853036552708765
Epoch: 79, step: 1435, loss: 0.3283240497112274, mean loss: 0.3385302771698969
Epoch: 79, step: 1436, loss: 0.3328818380832672, mean loss: 0.33853022827116613
Epoch: 79, step: 1437, loss: 0.3416264057159424, mean loss: 0.33853025507464835
Epoch: 79, step: 1438, loss: 0.3510281443595886, mean loss: 0.33853036326743097
Epoch: 79, step: 1439, loss: 0.3467724323272705, mean loss: 0.33853043461745225
Epoch: 79, step: 1440, loss: 0.29739874601364136, mean loss: 0.3385300785513442
Epoch: 79, step: 1441, loss: 0.3167386054992676, mean loss: 0.3385298899099805
Epoch: 79, step: 1442, loss: 0.30855685472488403, mean loss: 0.33852963044586476
Epoch: 79, step: 1443, loss: 0.35902294516563416, mean loss: 0.3385298078464423
Valid: 79, mean loss: 0.18574700752894083
